Coverage Report

Created: 2026-02-26 06:47

next uncovered line (L), next uncovered region (R), next uncovered branch (B)
/src/libxml2/entities.c
Line
Count
Source
1
/*
2
 * entities.c : implementation for the XML entities handling
3
 *
4
 * See Copyright for the status of this software.
5
 *
6
 * daniel@veillard.com
7
 */
8
9
/* To avoid EBCDIC trouble when parsing on zOS */
10
#if defined(__MVS__)
11
#pragma convert("ISO8859-1")
12
#endif
13
14
#define IN_LIBXML
15
#include "libxml.h"
16
17
#include <string.h>
18
#include <stdlib.h>
19
20
#include <libxml/xmlmemory.h>
21
#include <libxml/hash.h>
22
#include <libxml/entities.h>
23
#include <libxml/parser.h>
24
#include <libxml/parserInternals.h>
25
#include <libxml/xmlerror.h>
26
#include <libxml/dict.h>
27
#include <libxml/xmlsave.h>
28
29
#include "private/entities.h"
30
#include "private/error.h"
31
32
#ifndef SIZE_MAX
33
  #define SIZE_MAX ((size_t) -1)
34
#endif
35
36
/*
37
 * The XML predefined entities.
38
 */
39
40
static xmlEntity xmlEntityLt = {
41
    NULL, XML_ENTITY_DECL, BAD_CAST "lt",
42
    NULL, NULL, NULL, NULL, NULL, NULL,
43
    BAD_CAST "<", BAD_CAST "<", 1,
44
    XML_INTERNAL_PREDEFINED_ENTITY,
45
    NULL, NULL, NULL, NULL, 0, 0, 0
46
};
47
static xmlEntity xmlEntityGt = {
48
    NULL, XML_ENTITY_DECL, BAD_CAST "gt",
49
    NULL, NULL, NULL, NULL, NULL, NULL,
50
    BAD_CAST ">", BAD_CAST ">", 1,
51
    XML_INTERNAL_PREDEFINED_ENTITY,
52
    NULL, NULL, NULL, NULL, 0, 0, 0
53
};
54
static xmlEntity xmlEntityAmp = {
55
    NULL, XML_ENTITY_DECL, BAD_CAST "amp",
56
    NULL, NULL, NULL, NULL, NULL, NULL,
57
    BAD_CAST "&", BAD_CAST "&", 1,
58
    XML_INTERNAL_PREDEFINED_ENTITY,
59
    NULL, NULL, NULL, NULL, 0, 0, 0
60
};
61
static xmlEntity xmlEntityQuot = {
62
    NULL, XML_ENTITY_DECL, BAD_CAST "quot",
63
    NULL, NULL, NULL, NULL, NULL, NULL,
64
    BAD_CAST "\"", BAD_CAST "\"", 1,
65
    XML_INTERNAL_PREDEFINED_ENTITY,
66
    NULL, NULL, NULL, NULL, 0, 0, 0
67
};
68
static xmlEntity xmlEntityApos = {
69
    NULL, XML_ENTITY_DECL, BAD_CAST "apos",
70
    NULL, NULL, NULL, NULL, NULL, NULL,
71
    BAD_CAST "'", BAD_CAST "'", 1,
72
    XML_INTERNAL_PREDEFINED_ENTITY,
73
    NULL, NULL, NULL, NULL, 0, 0, 0
74
};
75
76
/*
77
 * xmlFreeEntity:
78
 * @entity:  an entity
79
 *
80
 * Frees the entity.
81
 */
82
void
83
xmlFreeEntity(xmlEntityPtr entity)
84
84.9k
{
85
84.9k
    xmlDictPtr dict = NULL;
86
87
84.9k
    if (entity == NULL)
88
0
        return;
89
90
84.9k
    if (entity->doc != NULL)
91
84.8k
        dict = entity->doc->dict;
92
93
94
84.9k
    if ((entity->children) &&
95
1.24k
        (entity == (xmlEntityPtr) entity->children->parent))
96
1.24k
        xmlFreeNodeList(entity->children);
97
84.9k
    if ((entity->name != NULL) &&
98
84.9k
        ((dict == NULL) || (!xmlDictOwns(dict, entity->name))))
99
20.6k
        xmlFree((char *) entity->name);
100
84.9k
    if (entity->ExternalID != NULL)
101
6.83k
        xmlFree((char *) entity->ExternalID);
102
84.9k
    if (entity->SystemID != NULL)
103
30.1k
        xmlFree((char *) entity->SystemID);
104
84.9k
    if (entity->URI != NULL)
105
28.4k
        xmlFree((char *) entity->URI);
106
84.9k
    if (entity->content != NULL)
107
53.6k
        xmlFree((char *) entity->content);
108
84.9k
    if (entity->orig != NULL)
109
42.8k
        xmlFree((char *) entity->orig);
110
84.9k
    xmlFree(entity);
111
84.9k
}
112
113
/*
114
 * xmlCreateEntity:
115
 *
116
 * internal routine doing the entity node structures allocations
117
 */
118
static xmlEntityPtr
119
xmlCreateEntity(xmlDocPtr doc, const xmlChar *name, int type,
120
          const xmlChar *ExternalID, const xmlChar *SystemID,
121
73.4k
          const xmlChar *content) {
122
73.4k
    xmlEntityPtr ret;
123
124
73.4k
    ret = (xmlEntityPtr) xmlMalloc(sizeof(xmlEntity));
125
73.4k
    if (ret == NULL)
126
11
  return(NULL);
127
73.4k
    memset(ret, 0, sizeof(xmlEntity));
128
73.4k
    ret->doc = doc;
129
73.4k
    ret->type = XML_ENTITY_DECL;
130
131
    /*
132
     * fill the structure.
133
     */
134
73.4k
    ret->etype = (xmlEntityType) type;
135
73.4k
    if ((doc == NULL) || (doc->dict == NULL))
136
9.12k
  ret->name = xmlStrdup(name);
137
64.2k
    else
138
64.2k
        ret->name = xmlDictLookup(doc->dict, name, -1);
139
73.4k
    if (ret->name == NULL)
140
2
        goto error;
141
73.4k
    if (ExternalID != NULL) {
142
6.83k
        ret->ExternalID = xmlStrdup(ExternalID);
143
6.83k
        if (ret->ExternalID == NULL)
144
1
            goto error;
145
6.83k
    }
146
73.4k
    if (SystemID != NULL) {
147
28.5k
        ret->SystemID = xmlStrdup(SystemID);
148
28.5k
        if (ret->SystemID == NULL)
149
4
            goto error;
150
28.5k
    }
151
73.4k
    if (content != NULL) {
152
42.8k
        ret->length = xmlStrlen(content);
153
42.8k
  ret->content = xmlStrndup(content, ret->length);
154
42.8k
        if (ret->content == NULL)
155
5
            goto error;
156
42.8k
     } else {
157
30.5k
        ret->length = 0;
158
30.5k
        ret->content = NULL;
159
30.5k
    }
160
73.4k
    ret->URI = NULL; /* to be computed by the layer knowing
161
      the defining entity */
162
73.4k
    ret->orig = NULL;
163
164
73.4k
    return(ret);
165
166
12
error:
167
12
    xmlFreeEntity(ret);
168
12
    return(NULL);
169
73.4k
}
170
171
/**
172
 * xmlAddEntity:
173
 * @doc:  the document
174
 * @extSubset:  add to the external or internal subset
175
 * @name:  the entity name
176
 * @type:  the entity type XML_xxx_yyy_ENTITY
177
 * @ExternalID:  the entity external ID if available
178
 * @SystemID:  the entity system ID if available
179
 * @content:  the entity content
180
 * @out:  pointer to resulting entity (optional)
181
 *
182
 * Register a new entity for this document.
183
 *
184
 * Available since 2.13.0.
185
 *
186
 * Returns an xmlParserErrors error code.
187
 */
188
int
189
xmlAddEntity(xmlDocPtr doc, int extSubset, const xmlChar *name, int type,
190
    const xmlChar *ExternalID, const xmlChar *SystemID,
191
82.3k
    const xmlChar *content, xmlEntityPtr *out) {
192
82.3k
    xmlDtdPtr dtd;
193
82.3k
    xmlDictPtr dict = NULL;
194
82.3k
    xmlEntitiesTablePtr table = NULL;
195
82.3k
    xmlEntityPtr ret, predef;
196
82.3k
    int res;
197
198
82.3k
    if (out != NULL)
199
82.3k
        *out = NULL;
200
82.3k
    if ((doc == NULL) || (name == NULL))
201
0
  return(XML_ERR_ARGUMENT);
202
82.3k
    dict = doc->dict;
203
204
82.3k
    if (extSubset)
205
6.66k
        dtd = doc->extSubset;
206
75.6k
    else
207
75.6k
        dtd = doc->intSubset;
208
82.3k
    if (dtd == NULL)
209
0
        return(XML_DTD_NO_DTD);
210
211
82.3k
    switch (type) {
212
33.9k
        case XML_INTERNAL_GENERAL_ENTITY:
213
43.2k
        case XML_EXTERNAL_GENERAL_PARSED_ENTITY:
214
43.6k
        case XML_EXTERNAL_GENERAL_UNPARSED_ENTITY:
215
43.6k
            predef = xmlGetPredefinedEntity(name);
216
43.6k
            if (predef != NULL) {
217
12.1k
                int valid = 0;
218
219
                /* 4.6 Predefined Entities */
220
12.1k
                if ((type == XML_INTERNAL_GENERAL_ENTITY) &&
221
11.2k
                    (content != NULL)) {
222
10.8k
                    int c = predef->content[0];
223
224
10.8k
                    if (((content[0] == c) && (content[1] == 0)) &&
225
1.20k
                        ((c == '>') || (c == '\'') || (c == '"'))) {
226
976
                        valid = 1;
227
9.87k
                    } else if ((content[0] == '&') && (content[1] == '#')) {
228
5.64k
                        if (content[2] == 'x') {
229
4.70k
                            xmlChar *hex = BAD_CAST "0123456789ABCDEF";
230
4.70k
                            xmlChar ref[] = "00;";
231
232
4.70k
                            ref[0] = hex[c / 16 % 16];
233
4.70k
                            ref[1] = hex[c % 16];
234
4.70k
                            if (xmlStrcasecmp(&content[3], ref) == 0)
235
1.87k
                                valid = 1;
236
4.70k
                        } else {
237
937
                            xmlChar ref[] = "00;";
238
239
937
                            ref[0] = '0' + c / 10 % 10;
240
937
                            ref[1] = '0' + c % 10;
241
937
                            if (xmlStrEqual(&content[2], ref))
242
446
                                valid = 1;
243
937
                        }
244
5.64k
                    }
245
10.8k
                }
246
12.1k
                if (!valid)
247
8.88k
                    return(XML_ERR_REDECL_PREDEF_ENTITY);
248
12.1k
            }
249
34.7k
      if (dtd->entities == NULL) {
250
18.9k
    dtd->entities = xmlHashCreateDict(0, dict);
251
18.9k
                if (dtd->entities == NULL)
252
7
                    return(XML_ERR_NO_MEMORY);
253
18.9k
            }
254
34.7k
      table = dtd->entities;
255
34.7k
      break;
256
17.1k
        case XML_INTERNAL_PARAMETER_ENTITY:
257
38.7k
        case XML_EXTERNAL_PARAMETER_ENTITY:
258
38.7k
      if (dtd->pentities == NULL) {
259
17.8k
    dtd->pentities = xmlHashCreateDict(0, dict);
260
17.8k
                if (dtd->pentities == NULL)
261
3
                    return(XML_ERR_NO_MEMORY);
262
17.8k
            }
263
38.7k
      table = dtd->pentities;
264
38.7k
      break;
265
0
        default:
266
0
      return(XML_ERR_ARGUMENT);
267
82.3k
    }
268
73.4k
    ret = xmlCreateEntity(dtd->doc, name, type, ExternalID, SystemID, content);
269
73.4k
    if (ret == NULL)
270
23
        return(XML_ERR_NO_MEMORY);
271
272
73.4k
    res = xmlHashAdd(table, name, ret);
273
73.4k
    if (res < 0) {
274
12
        xmlFreeEntity(ret);
275
12
        return(XML_ERR_NO_MEMORY);
276
73.3k
    } else if (res == 0) {
277
  /*
278
   * entity was already defined at another level.
279
   */
280
11.0k
        xmlFreeEntity(ret);
281
11.0k
  return(XML_WAR_ENTITY_REDEFINED);
282
11.0k
    }
283
284
    /*
285
     * Link it to the DTD
286
     */
287
62.3k
    ret->parent = dtd;
288
62.3k
    ret->doc = dtd->doc;
289
62.3k
    if (dtd->last == NULL) {
290
27.2k
  dtd->children = dtd->last = (xmlNodePtr) ret;
291
35.1k
    } else {
292
35.1k
  dtd->last->next = (xmlNodePtr) ret;
293
35.1k
  ret->prev = dtd->last;
294
35.1k
  dtd->last = (xmlNodePtr) ret;
295
35.1k
    }
296
297
62.3k
    if (out != NULL)
298
62.3k
        *out = ret;
299
62.3k
    return(0);
300
73.4k
}
301
302
/**
303
 * xmlGetPredefinedEntity:
304
 * @name:  the entity name
305
 *
306
 * Check whether this name is an predefined entity.
307
 *
308
 * Returns NULL if not, otherwise the entity
309
 */
310
xmlEntityPtr
311
3.18M
xmlGetPredefinedEntity(const xmlChar *name) {
312
3.18M
    if (name == NULL) return(NULL);
313
3.18M
    switch (name[0]) {
314
12.6k
        case 'l':
315
12.6k
      if (xmlStrEqual(name, BAD_CAST "lt"))
316
8.16k
          return(&xmlEntityLt);
317
4.47k
      break;
318
35.8k
        case 'g':
319
35.8k
      if (xmlStrEqual(name, BAD_CAST "gt"))
320
34.2k
          return(&xmlEntityGt);
321
1.58k
      break;
322
1.72M
        case 'a':
323
1.72M
      if (xmlStrEqual(name, BAD_CAST "amp"))
324
63.6k
          return(&xmlEntityAmp);
325
1.65M
      if (xmlStrEqual(name, BAD_CAST "apos"))
326
3.20k
          return(&xmlEntityApos);
327
1.65M
      break;
328
1.65M
        case 'q':
329
344k
      if (xmlStrEqual(name, BAD_CAST "quot"))
330
5.10k
          return(&xmlEntityQuot);
331
339k
      break;
332
1.06M
  default:
333
1.06M
      break;
334
3.18M
    }
335
3.06M
    return(NULL);
336
3.18M
}
337
338
/**
339
 * xmlAddDtdEntity:
340
 * @doc:  the document
341
 * @name:  the entity name
342
 * @type:  the entity type XML_xxx_yyy_ENTITY
343
 * @ExternalID:  the entity external ID if available
344
 * @SystemID:  the entity system ID if available
345
 * @content:  the entity content
346
 *
347
 * Register a new entity for this document DTD external subset.
348
 *
349
 * Returns a pointer to the entity or NULL in case of error
350
 */
351
xmlEntityPtr
352
xmlAddDtdEntity(xmlDocPtr doc, const xmlChar *name, int type,
353
          const xmlChar *ExternalID, const xmlChar *SystemID,
354
0
    const xmlChar *content) {
355
0
    xmlEntityPtr ret;
356
357
0
    xmlAddEntity(doc, 1, name, type, ExternalID, SystemID, content, &ret);
358
0
    return(ret);
359
0
}
360
361
/**
362
 * xmlAddDocEntity:
363
 * @doc:  the document
364
 * @name:  the entity name
365
 * @type:  the entity type XML_xxx_yyy_ENTITY
366
 * @ExternalID:  the entity external ID if available
367
 * @SystemID:  the entity system ID if available
368
 * @content:  the entity content
369
 *
370
 * Register a new entity for this document.
371
 *
372
 * Returns a pointer to the entity or NULL in case of error
373
 */
374
xmlEntityPtr
375
xmlAddDocEntity(xmlDocPtr doc, const xmlChar *name, int type,
376
          const xmlChar *ExternalID, const xmlChar *SystemID,
377
0
          const xmlChar *content) {
378
0
    xmlEntityPtr ret;
379
380
0
    xmlAddEntity(doc, 0, name, type, ExternalID, SystemID, content, &ret);
381
0
    return(ret);
382
0
}
383
384
/**
385
 * xmlNewEntity:
386
 * @doc:  the document
387
 * @name:  the entity name
388
 * @type:  the entity type XML_xxx_yyy_ENTITY
389
 * @ExternalID:  the entity external ID if available
390
 * @SystemID:  the entity system ID if available
391
 * @content:  the entity content
392
 *
393
 * Create a new entity, this differs from xmlAddDocEntity() that if
394
 * the document is NULL or has no internal subset defined, then an
395
 * unlinked entity structure will be returned, it is then the responsibility
396
 * of the caller to link it to the document later or free it when not needed
397
 * anymore.
398
 *
399
 * Returns a pointer to the entity or NULL in case of error
400
 */
401
xmlEntityPtr
402
xmlNewEntity(xmlDocPtr doc, const xmlChar *name, int type,
403
       const xmlChar *ExternalID, const xmlChar *SystemID,
404
0
       const xmlChar *content) {
405
0
    if ((doc != NULL) && (doc->intSubset != NULL)) {
406
0
  return(xmlAddDocEntity(doc, name, type, ExternalID, SystemID, content));
407
0
    }
408
0
    if (name == NULL)
409
0
        return(NULL);
410
0
    return(xmlCreateEntity(doc, name, type, ExternalID, SystemID, content));
411
0
}
412
413
/**
414
 * xmlGetEntityFromTable:
415
 * @table:  an entity table
416
 * @name:  the entity name
417
 * @parameter:  look for parameter entities
418
 *
419
 * Do an entity lookup in the table.
420
 * returns the corresponding parameter entity, if found.
421
 *
422
 * Returns A pointer to the entity structure or NULL if not found.
423
 */
424
static xmlEntityPtr
425
1.48M
xmlGetEntityFromTable(xmlEntitiesTablePtr table, const xmlChar *name) {
426
1.48M
    return((xmlEntityPtr) xmlHashLookup(table, name));
427
1.48M
}
428
429
/**
430
 * xmlGetParameterEntity:
431
 * @doc:  the document referencing the entity
432
 * @name:  the entity name
433
 *
434
 * Do an entity lookup in the internal and external subsets and
435
 * returns the corresponding parameter entity, if found.
436
 *
437
 * Returns A pointer to the entity structure or NULL if not found.
438
 */
439
xmlEntityPtr
440
90.7k
xmlGetParameterEntity(xmlDocPtr doc, const xmlChar *name) {
441
90.7k
    xmlEntitiesTablePtr table;
442
90.7k
    xmlEntityPtr ret;
443
444
90.7k
    if (doc == NULL)
445
1.00k
  return(NULL);
446
89.7k
    if ((doc->intSubset != NULL) && (doc->intSubset->pentities != NULL)) {
447
87.1k
  table = (xmlEntitiesTablePtr) doc->intSubset->pentities;
448
87.1k
  ret = xmlGetEntityFromTable(table, name);
449
87.1k
  if (ret != NULL)
450
60.6k
      return(ret);
451
87.1k
    }
452
29.1k
    if ((doc->extSubset != NULL) && (doc->extSubset->pentities != NULL)) {
453
5.92k
  table = (xmlEntitiesTablePtr) doc->extSubset->pentities;
454
5.92k
  return(xmlGetEntityFromTable(table, name));
455
5.92k
    }
456
23.1k
    return(NULL);
457
29.1k
}
458
459
/**
460
 * xmlGetDtdEntity:
461
 * @doc:  the document referencing the entity
462
 * @name:  the entity name
463
 *
464
 * Do an entity lookup in the DTD entity hash table and
465
 * returns the corresponding entity, if found.
466
 * Note: the first argument is the document node, not the DTD node.
467
 *
468
 * Returns A pointer to the entity structure or NULL if not found.
469
 */
470
xmlEntityPtr
471
0
xmlGetDtdEntity(xmlDocPtr doc, const xmlChar *name) {
472
0
    xmlEntitiesTablePtr table;
473
474
0
    if (doc == NULL)
475
0
  return(NULL);
476
0
    if ((doc->extSubset != NULL) && (doc->extSubset->entities != NULL)) {
477
0
  table = (xmlEntitiesTablePtr) doc->extSubset->entities;
478
0
  return(xmlGetEntityFromTable(table, name));
479
0
    }
480
0
    return(NULL);
481
0
}
482
483
/**
484
 * xmlGetDocEntity:
485
 * @doc:  the document referencing the entity
486
 * @name:  the entity name
487
 *
488
 * Do an entity lookup in the document entity hash table and
489
 * returns the corresponding entity, otherwise a lookup is done
490
 * in the predefined entities too.
491
 *
492
 * Returns A pointer to the entity structure or NULL if not found.
493
 */
494
xmlEntityPtr
495
1.43M
xmlGetDocEntity(const xmlDoc *doc, const xmlChar *name) {
496
1.43M
    xmlEntityPtr cur;
497
1.43M
    xmlEntitiesTablePtr table;
498
499
1.43M
    if (doc != NULL) {
500
1.43M
  if ((doc->intSubset != NULL) && (doc->intSubset->entities != NULL)) {
501
1.34M
      table = (xmlEntitiesTablePtr) doc->intSubset->entities;
502
1.34M
      cur = xmlGetEntityFromTable(table, name);
503
1.34M
      if (cur != NULL)
504
1.10M
    return(cur);
505
1.34M
  }
506
325k
  if (doc->standalone != 1) {
507
324k
      if ((doc->extSubset != NULL) &&
508
43.9k
    (doc->extSubset->entities != NULL)) {
509
42.2k
    table = (xmlEntitiesTablePtr) doc->extSubset->entities;
510
42.2k
    cur = xmlGetEntityFromTable(table, name);
511
42.2k
    if (cur != NULL)
512
254
        return(cur);
513
42.2k
      }
514
324k
  }
515
325k
    }
516
326k
    return(xmlGetPredefinedEntity(name));
517
1.43M
}
518
519
/*
520
 * xmlSerializeHexCharRef:
521
 * @buf:  a char buffer
522
 * @val:  a codepoint
523
 *
524
 * Serializes a hex char ref like &#xA0;
525
 *
526
 * Writes at most 9 bytes. Does not include a terminating zero byte.
527
 *
528
 * Returns the number of bytes written.
529
 */
530
int
531
1.81k
xmlSerializeHexCharRef(char *buf, int val) {
532
1.81k
    char *out = buf;
533
1.81k
    int shift = 0, bits;
534
535
1.81k
    *out++ = '&';
536
1.81k
    *out++ = '#';
537
1.81k
    *out++ = 'x';
538
539
1.81k
    bits = val;
540
1.81k
    if (bits & 0xFF0000) {
541
286
        shift = 16;
542
286
        bits &= 0xFF0000;
543
1.52k
    } else if (bits & 0x00FF00) {
544
1.12k
        shift = 8;
545
1.12k
        bits &= 0x00FF00;
546
1.12k
    }
547
1.81k
    if (bits & 0xF0F0F0) {
548
1.49k
        shift += 4;
549
1.49k
    }
550
551
6.71k
    do {
552
6.71k
        int d = (val >> shift) & 0x0F;
553
554
6.71k
        if (d < 10)
555
1.39k
            *out++ = '0' + d;
556
5.31k
        else
557
5.31k
            *out++ = 'A' + (d - 10);
558
559
6.71k
  shift -= 4;
560
6.71k
    } while (shift >= 0);
561
562
1.81k
    *out++ = ';';
563
564
1.81k
    return(out - buf);
565
1.81k
}
566
567
/*
568
 * xmlSerializeDecCharRef:
569
 * @buf:  a char buffer
570
 * @val:  a codepoint
571
 *
572
 * Serializes a decimal char ref like &#38;
573
 *
574
 * Writes at most 10 bytes. Does not include a terminating zero byte.
575
 *
576
 * Returns the number of bytes written.
577
 */
578
int
579
55.3M
xmlSerializeDecCharRef(char *buf, int val) {
580
55.3M
    char *out = buf;
581
55.3M
    int len, i;
582
583
55.3M
    *out++ = '&';
584
55.3M
    *out++ = '#';
585
586
55.3M
    if (val < 100) {
587
793
        len = (val < 10) ? 1 : 2;
588
55.3M
    } else if (val < 10000) {
589
55.2M
        len = (val < 1000) ? 3 : 4;
590
55.2M
    } else if (val < 1000000) {
591
11.5k
        len = (val < 100000) ? 5 : 6;
592
11.5k
    } else {
593
219
        len = 7;
594
219
    }
595
596
223M
    for (i = len - 1; i >= 0; i--) {
597
168M
        out[i] = '0' + val % 10;
598
168M
        val /= 10;
599
168M
    }
600
601
55.3M
    out[len] = ';';
602
603
55.3M
    return(len + 3);
604
55.3M
}
605
606
static const char xmlEscapeSafe[128] = {
607
    0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 0, 0, 0, 0,
608
    0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
609
    1, 1, 0, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1,
610
    1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 0, 1,
611
    1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
612
    1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
613
    1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
614
    1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1
615
};
616
617
/*
618
 * xmlEscapeText:
619
 * @text:  input text
620
 * @flags:  XML_ESCAPE flags
621
 *
622
 * Escapes certain characters with char refs.
623
 *
624
 * XML_ESCAPE_ATTR: for attribute content.
625
 * XML_ESCAPE_NON_ASCII: escape non-ASCII chars.
626
 * XML_ESCAPE_HTML: for HTML content.
627
 * XML_ESCAPE_QUOT: escape double quotes.
628
 * XML_ESCAPE_ALLOW_INVALID: allow invalid characters.
629
 *
630
 * Returns an escaped string or NULL if a memory allocation failed.
631
 */
632
xmlChar *
633
22.3k
xmlEscapeText(const xmlChar *text, int flags) {
634
22.3k
    const xmlChar *cur;
635
22.3k
    xmlChar *buffer;
636
22.3k
    xmlChar *out;
637
22.3k
    const xmlChar *unescaped;
638
22.3k
    size_t size = 50;
639
640
22.3k
    buffer = xmlMalloc(size + 1);
641
22.3k
    if (buffer == NULL)
642
59
        return(NULL);
643
22.3k
    out = buffer;
644
645
22.3k
    cur = text;
646
22.3k
    unescaped = cur;
647
648
496k
    while (*cur != '\0') {
649
473k
        char buf[12];
650
473k
  const xmlChar *end;
651
473k
        const xmlChar *repl;
652
473k
        size_t used;
653
473k
        size_t replSize;
654
473k
        size_t unescapedSize;
655
473k
        size_t totalSize;
656
473k
        int chunkSize = 1;
657
473k
        int c;
658
659
        /* accelerator */
660
69.7M
  while (1) {
661
69.7M
            c = *cur;
662
663
69.7M
            if (c < 0x80) {
664
42.4M
                if (!xmlEscapeSafe[*cur])
665
473k
                    break;
666
42.4M
            } else {
667
27.3M
               if (flags & XML_ESCAPE_NON_ASCII)
668
0
                   break;
669
27.3M
            }
670
69.3M
            cur += 1;
671
69.3M
        }
672
673
473k
        if (c == 0) {
674
19.9k
            chunkSize = 0;
675
19.9k
            repl = BAD_CAST "";
676
19.9k
            replSize = 0;
677
453k
        } else if (c == '<') {
678
      /*
679
       * Special handling of server side include in HTML attributes
680
       */
681
12.6k
      if ((flags & XML_ESCAPE_HTML) && (flags & XML_ESCAPE_ATTR) &&
682
12.2k
          (cur[1] == '!') && (cur[2] == '-') && (cur[3] == '-') &&
683
1.29k
          ((end = xmlStrstr(cur, BAD_CAST "-->")) != NULL)) {
684
655
                chunkSize = (end - cur) + 3;
685
655
                repl = cur;
686
655
                replSize = chunkSize;
687
11.9k
      } else {
688
11.9k
                repl = BAD_CAST "&lt;";
689
11.9k
                replSize = 4;
690
11.9k
            }
691
441k
  } else if (c == '>') {
692
394k
            repl = BAD_CAST "&gt;";
693
394k
            replSize = 4;
694
394k
  } else if (c == '&') {
695
      /*
696
       * Special handling of &{...} construct from HTML 4, see
697
       * http://www.w3.org/TR/html401/appendix/notes.html#h-B.7.1
698
       */
699
6.70k
      if ((flags & XML_ESCAPE_HTML) && (flags & XML_ESCAPE_ATTR) &&
700
6.58k
                (cur[1] == '{') && (end = xmlStrchr(cur, '}'))) {
701
1.60k
                chunkSize = (end - cur) + 1;
702
1.60k
                repl = cur;
703
1.60k
                replSize = chunkSize;
704
5.10k
      } else {
705
5.10k
                repl = BAD_CAST "&amp;";
706
5.10k
                replSize = 5;
707
5.10k
            }
708
39.6k
  } else if ((flags & XML_ESCAPE_QUOT) && (c == '"')) {
709
0
            repl = BAD_CAST "&quot;";
710
0
            replSize = 6;
711
39.6k
  } else if (((flags & XML_ESCAPE_HTML) == 0) && (c == '\r')) {
712
0
      repl = BAD_CAST "&#13;";
713
0
            replSize = 5;
714
39.6k
  } else if ((flags & XML_ESCAPE_NON_ASCII) && (c >= 0x80)) {
715
0
            int val;
716
717
0
            chunkSize = 4;
718
0
            val = xmlGetUTF8Char(cur, &chunkSize);
719
0
            if (val < 0) {
720
0
                val = 0xFFFD;
721
0
                chunkSize = 1;
722
0
            } else if (((flags & XML_ESCAPE_ALLOW_INVALID) == 0) &&
723
0
                       (!IS_CHAR(val))) {
724
0
                val = 0xFFFD;
725
0
            }
726
727
0
            replSize = xmlSerializeHexCharRef(buf, val);
728
0
            repl = BAD_CAST buf;
729
39.6k
  } else if ((flags & (XML_ESCAPE_ALLOW_INVALID | XML_ESCAPE_HTML)) ||
730
0
                   (c >= 0x20) ||
731
39.6k
             (c == '\n') || (c == '\t') || (c == '\r')) {
732
      /* default case, just copy */
733
39.6k
            cur += 1;
734
39.6k
            if (*cur != 0)
735
38.5k
                continue;
736
737
1.05k
            chunkSize = 0;
738
1.05k
            repl = BAD_CAST "";
739
1.05k
            replSize = 0;
740
1.05k
  } else {
741
            /* ignore */
742
0
            repl = BAD_CAST "";
743
0
            replSize = 0;
744
0
        }
745
746
435k
        used = out - buffer;
747
435k
        unescapedSize = cur - unescaped;
748
435k
        totalSize = unescapedSize + replSize;
749
750
435k
  cur += chunkSize;
751
752
435k
        if (totalSize > size - used) {
753
6.79k
            xmlChar *tmp;
754
6.79k
            int newSize;
755
756
6.79k
            if ((size > (SIZE_MAX - 1) / 2) ||
757
6.79k
                (totalSize > (SIZE_MAX - 1) / 2 - size)) {
758
0
                xmlFree(buffer);
759
0
                return(NULL);
760
0
            }
761
6.79k
            newSize = size + totalSize;
762
6.79k
            if (*cur != 0)
763
4.43k
                newSize *= 2;
764
6.79k
            tmp = xmlRealloc(buffer, newSize + 1);
765
6.79k
            if (tmp == NULL) {
766
7
                xmlFree(buffer);
767
7
                return(NULL);
768
7
            }
769
6.78k
            buffer = tmp;
770
6.78k
            size = newSize;
771
6.78k
            out = buffer + used;
772
6.78k
        }
773
774
435k
        memcpy(out, unescaped, unescapedSize);
775
435k
        out += unescapedSize;
776
435k
        memcpy(out, repl, replSize);
777
435k
        out += replSize;
778
779
435k
        unescaped = cur;
780
435k
    }
781
782
22.3k
    *out = 0;
783
22.3k
    return(buffer);
784
22.3k
}
785
786
/**
787
 * xmlEncodeEntitiesInternal:
788
 * @doc:  the document containing the string
789
 * @input:  A string to convert to XML.
790
 * @flags:  XML_ESCAPE flags
791
 *
792
 * Do a global encoding of a string, replacing the predefined entities
793
 * and non ASCII values with their entities and CharRef counterparts.
794
 * Contrary to xmlEncodeEntities, this routine is reentrant, and result
795
 * must be deallocated.
796
 *
797
 * Returns A newly allocated string with the substitution done.
798
 */
799
xmlChar *
800
xmlEncodeEntitiesInternal(xmlDocPtr doc, const xmlChar *input,
801
22.3k
                          unsigned flags) {
802
22.3k
    if (input == NULL)
803
0
        return(NULL);
804
805
22.3k
    if ((doc != NULL) && (doc->type == XML_HTML_DOCUMENT_NODE))
806
22.3k
        flags |= XML_ESCAPE_HTML;
807
0
    else if ((doc == NULL) || (doc->encoding == NULL))
808
0
        flags |= XML_ESCAPE_NON_ASCII;
809
810
22.3k
    return(xmlEscapeText(input, flags));
811
22.3k
}
812
813
/**
814
 * xmlEncodeEntitiesReentrant:
815
 * @doc:  the document containing the string
816
 * @input:  A string to convert to XML.
817
 *
818
 * Do a global encoding of a string, replacing the predefined entities
819
 * and non ASCII values with their entities and CharRef counterparts.
820
 * Contrary to xmlEncodeEntities, this routine is reentrant, and result
821
 * must be deallocated.
822
 *
823
 * This escapes '<', '>', '&' and '\r'. If the document has no encoding,
824
 * non-ASCII codepoints are escaped. There is some special handling for
825
 * HTML documents.
826
 *
827
 * Returns A newly allocated string with the substitution done.
828
 */
829
xmlChar *
830
14.0k
xmlEncodeEntitiesReentrant(xmlDocPtr doc, const xmlChar *input) {
831
14.0k
    return xmlEncodeEntitiesInternal(doc, input, 0);
832
14.0k
}
833
834
/**
835
 * xmlEncodeSpecialChars:
836
 * @doc:  unused
837
 * @input:  A string to convert to XML.
838
 *
839
 * Do a global encoding of a string, replacing the predefined entities
840
 * this routine is reentrant, and result must be deallocated.
841
 *
842
 * This escapes '<', '>', '&', '"' and '\r' chars.
843
 *
844
 * Returns A newly allocated string with the substitution done.
845
 */
846
xmlChar *
847
xmlEncodeSpecialChars(const xmlDoc *doc ATTRIBUTE_UNUSED,
848
0
                      const xmlChar *input) {
849
0
    if (input == NULL)
850
0
        return(NULL);
851
852
0
    return(xmlEscapeText(input, XML_ESCAPE_QUOT | XML_ESCAPE_ALLOW_INVALID));
853
0
}
854
855
/**
856
 * xmlCreateEntitiesTable:
857
 *
858
 * create and initialize an empty entities hash table.
859
 * This really doesn't make sense and should be deprecated
860
 *
861
 * Returns the xmlEntitiesTablePtr just created or NULL in case of error.
862
 */
863
xmlEntitiesTablePtr
864
0
xmlCreateEntitiesTable(void) {
865
0
    return((xmlEntitiesTablePtr) xmlHashCreate(0));
866
0
}
867
868
/**
869
 * xmlFreeEntityWrapper:
870
 * @entity:  An entity
871
 * @name:  its name
872
 *
873
 * Deallocate the memory used by an entities in the hash table.
874
 */
875
static void
876
73.9k
xmlFreeEntityWrapper(void *entity, const xmlChar *name ATTRIBUTE_UNUSED) {
877
73.9k
    if (entity != NULL)
878
73.9k
  xmlFreeEntity((xmlEntityPtr) entity);
879
73.9k
}
880
881
/**
882
 * xmlFreeEntitiesTable:
883
 * @table:  An entity table
884
 *
885
 * Deallocate the memory used by an entities hash table.
886
 */
887
void
888
41.2k
xmlFreeEntitiesTable(xmlEntitiesTablePtr table) {
889
41.2k
    xmlHashFree(table, xmlFreeEntityWrapper);
890
41.2k
}
891
892
/**
893
 * xmlCopyEntity:
894
 * @ent:  An entity
895
 *
896
 * Build a copy of an entity
897
 *
898
 * Returns the new xmlEntitiesPtr or NULL in case of error.
899
 */
900
static void *
901
11.5k
xmlCopyEntity(void *payload, const xmlChar *name ATTRIBUTE_UNUSED) {
902
11.5k
    xmlEntityPtr ent = (xmlEntityPtr) payload;
903
11.5k
    xmlEntityPtr cur;
904
905
11.5k
    cur = (xmlEntityPtr) xmlMalloc(sizeof(xmlEntity));
906
11.5k
    if (cur == NULL)
907
2
  return(NULL);
908
11.5k
    memset(cur, 0, sizeof(xmlEntity));
909
11.5k
    cur->type = XML_ENTITY_DECL;
910
911
11.5k
    cur->etype = ent->etype;
912
11.5k
    if (ent->name != NULL) {
913
11.5k
  cur->name = xmlStrdup(ent->name);
914
11.5k
        if (cur->name == NULL)
915
2
            goto error;
916
11.5k
    }
917
11.5k
    if (ent->ExternalID != NULL) {
918
0
  cur->ExternalID = xmlStrdup(ent->ExternalID);
919
0
        if (cur->ExternalID == NULL)
920
0
            goto error;
921
0
    }
922
11.5k
    if (ent->SystemID != NULL) {
923
1.61k
  cur->SystemID = xmlStrdup(ent->SystemID);
924
1.61k
        if (cur->SystemID == NULL)
925
2
            goto error;
926
1.61k
    }
927
11.5k
    if (ent->content != NULL) {
928
9.95k
  cur->content = xmlStrdup(ent->content);
929
9.95k
        if (cur->content == NULL)
930
1
            goto error;
931
9.95k
    }
932
11.5k
    if (ent->orig != NULL) {
933
9.94k
  cur->orig = xmlStrdup(ent->orig);
934
9.94k
        if (cur->orig == NULL)
935
2
            goto error;
936
9.94k
    }
937
11.5k
    if (ent->URI != NULL) {
938
1.59k
  cur->URI = xmlStrdup(ent->URI);
939
1.59k
        if (cur->URI == NULL)
940
2
            goto error;
941
1.59k
    }
942
11.5k
    return(cur);
943
944
9
error:
945
9
    xmlFreeEntity(cur);
946
9
    return(NULL);
947
11.5k
}
948
949
/**
950
 * xmlCopyEntitiesTable:
951
 * @table:  An entity table
952
 *
953
 * Build a copy of an entity table.
954
 *
955
 * Returns the new xmlEntitiesTablePtr or NULL in case of error.
956
 */
957
xmlEntitiesTablePtr
958
4.42k
xmlCopyEntitiesTable(xmlEntitiesTablePtr table) {
959
4.42k
    return(xmlHashCopySafe(table, xmlCopyEntity, xmlFreeEntityWrapper));
960
4.42k
}
961
962
#ifdef LIBXML_OUTPUT_ENABLED
963
964
/**
965
 * xmlDumpEntityDecl:
966
 * @buf:  An XML buffer.
967
 * @ent:  An entity table
968
 *
969
 * This will dump the content of the entity table as an XML DTD definition
970
 */
971
void
972
0
xmlDumpEntityDecl(xmlBufferPtr buf, xmlEntityPtr ent) {
973
0
    xmlSaveCtxtPtr save;
974
975
0
    if ((buf == NULL) || (ent == NULL))
976
0
        return;
977
978
0
    save = xmlSaveToBuffer(buf, NULL, 0);
979
0
    xmlSaveTree(save, (xmlNodePtr) ent);
980
0
    if (xmlSaveFinish(save) != XML_ERR_OK)
981
0
        xmlFree(xmlBufferDetach(buf));
982
0
}
983
984
/**
985
 * xmlDumpEntityDeclScan:
986
 * @ent:  An entity table
987
 * @buf:  An XML buffer.
988
 *
989
 * When using the hash table scan function, arguments need to be reversed
990
 */
991
static void
992
xmlDumpEntityDeclScan(void *ent, void *save,
993
0
                      const xmlChar *name ATTRIBUTE_UNUSED) {
994
0
    xmlSaveTree(save, ent);
995
0
}
996
997
/**
998
 * xmlDumpEntitiesTable:
999
 * @buf:  An XML buffer.
1000
 * @table:  An entity table
1001
 *
1002
 * This will dump the content of the entity table as an XML DTD definition
1003
 */
1004
void
1005
0
xmlDumpEntitiesTable(xmlBufferPtr buf, xmlEntitiesTablePtr table) {
1006
0
    xmlSaveCtxtPtr save;
1007
1008
0
    if ((buf == NULL) || (table == NULL))
1009
0
        return;
1010
1011
0
    save = xmlSaveToBuffer(buf, NULL, 0);
1012
0
    xmlHashScan(table, xmlDumpEntityDeclScan, save);
1013
0
    if (xmlSaveFinish(save) != XML_ERR_OK)
1014
0
        xmlFree(xmlBufferDetach(buf));
1015
0
}
1016
#endif /* LIBXML_OUTPUT_ENABLED */