Coverage Report

Created: 2026-04-27 06:55

next uncovered line (L), next uncovered region (R), next uncovered branch (B)
/src/libxml2/entities.c
Line
Count
Source
1
/*
2
 * entities.c : implementation for the XML entities handling
3
 *
4
 * See Copyright for the status of this software.
5
 *
6
 * daniel@veillard.com
7
 */
8
9
/* To avoid EBCDIC trouble when parsing on zOS */
10
#if defined(__MVS__)
11
#pragma convert("ISO8859-1")
12
#endif
13
14
#define IN_LIBXML
15
#include "libxml.h"
16
17
#include <string.h>
18
#include <stdlib.h>
19
20
#include <libxml/xmlmemory.h>
21
#include <libxml/hash.h>
22
#include <libxml/entities.h>
23
#include <libxml/parser.h>
24
#include <libxml/parserInternals.h>
25
#include <libxml/xmlerror.h>
26
#include <libxml/dict.h>
27
#include <libxml/xmlsave.h>
28
29
#include "private/entities.h"
30
#include "private/error.h"
31
32
#ifndef SIZE_MAX
33
  #define SIZE_MAX ((size_t) -1)
34
#endif
35
36
/*
37
 * The XML predefined entities.
38
 */
39
40
static xmlEntity xmlEntityLt = {
41
    NULL, XML_ENTITY_DECL, BAD_CAST "lt",
42
    NULL, NULL, NULL, NULL, NULL, NULL,
43
    BAD_CAST "<", BAD_CAST "<", 1,
44
    XML_INTERNAL_PREDEFINED_ENTITY,
45
    NULL, NULL, NULL, NULL, 0, 0, 0
46
};
47
static xmlEntity xmlEntityGt = {
48
    NULL, XML_ENTITY_DECL, BAD_CAST "gt",
49
    NULL, NULL, NULL, NULL, NULL, NULL,
50
    BAD_CAST ">", BAD_CAST ">", 1,
51
    XML_INTERNAL_PREDEFINED_ENTITY,
52
    NULL, NULL, NULL, NULL, 0, 0, 0
53
};
54
static xmlEntity xmlEntityAmp = {
55
    NULL, XML_ENTITY_DECL, BAD_CAST "amp",
56
    NULL, NULL, NULL, NULL, NULL, NULL,
57
    BAD_CAST "&", BAD_CAST "&", 1,
58
    XML_INTERNAL_PREDEFINED_ENTITY,
59
    NULL, NULL, NULL, NULL, 0, 0, 0
60
};
61
static xmlEntity xmlEntityQuot = {
62
    NULL, XML_ENTITY_DECL, BAD_CAST "quot",
63
    NULL, NULL, NULL, NULL, NULL, NULL,
64
    BAD_CAST "\"", BAD_CAST "\"", 1,
65
    XML_INTERNAL_PREDEFINED_ENTITY,
66
    NULL, NULL, NULL, NULL, 0, 0, 0
67
};
68
static xmlEntity xmlEntityApos = {
69
    NULL, XML_ENTITY_DECL, BAD_CAST "apos",
70
    NULL, NULL, NULL, NULL, NULL, NULL,
71
    BAD_CAST "'", BAD_CAST "'", 1,
72
    XML_INTERNAL_PREDEFINED_ENTITY,
73
    NULL, NULL, NULL, NULL, 0, 0, 0
74
};
75
76
/*
77
 * xmlFreeEntity:
78
 * @entity:  an entity
79
 *
80
 * Frees the entity.
81
 */
82
void
83
xmlFreeEntity(xmlEntityPtr entity)
84
91.9k
{
85
91.9k
    xmlDictPtr dict = NULL;
86
87
91.9k
    if (entity == NULL)
88
0
        return;
89
90
91.9k
    if (entity->doc != NULL)
91
91.8k
        dict = entity->doc->dict;
92
93
94
91.9k
    if ((entity->children) &&
95
1.81k
        (entity == (xmlEntityPtr) entity->children->parent))
96
1.81k
        xmlFreeNodeList(entity->children);
97
91.9k
    if ((entity->name != NULL) &&
98
91.9k
        ((dict == NULL) || (!xmlDictOwns(dict, entity->name))))
99
25.0k
        xmlFree((char *) entity->name);
100
91.9k
    if (entity->ExternalID != NULL)
101
8.36k
        xmlFree((char *) entity->ExternalID);
102
91.9k
    if (entity->SystemID != NULL)
103
32.8k
        xmlFree((char *) entity->SystemID);
104
91.9k
    if (entity->URI != NULL)
105
31.5k
        xmlFree((char *) entity->URI);
106
91.9k
    if (entity->content != NULL)
107
57.2k
        xmlFree((char *) entity->content);
108
91.9k
    if (entity->orig != NULL)
109
44.1k
        xmlFree((char *) entity->orig);
110
91.9k
    xmlFree(entity);
111
91.9k
}
112
113
/*
114
 * xmlCreateEntity:
115
 *
116
 * internal routine doing the entity node structures allocations
117
 */
118
static xmlEntityPtr
119
xmlCreateEntity(xmlDocPtr doc, const xmlChar *name, int type,
120
          const xmlChar *ExternalID, const xmlChar *SystemID,
121
76.7k
          const xmlChar *content) {
122
76.7k
    xmlEntityPtr ret;
123
124
76.7k
    ret = (xmlEntityPtr) xmlMalloc(sizeof(xmlEntity));
125
76.7k
    if (ret == NULL)
126
6
  return(NULL);
127
76.7k
    memset(ret, 0, sizeof(xmlEntity));
128
76.7k
    ret->doc = doc;
129
76.7k
    ret->type = XML_ENTITY_DECL;
130
131
    /*
132
     * fill the structure.
133
     */
134
76.7k
    ret->etype = (xmlEntityType) type;
135
76.7k
    if ((doc == NULL) || (doc->dict == NULL))
136
9.80k
  ret->name = xmlStrdup(name);
137
66.9k
    else
138
66.9k
        ret->name = xmlDictLookup(doc->dict, name, -1);
139
76.7k
    if (ret->name == NULL)
140
2
        goto error;
141
76.7k
    if (ExternalID != NULL) {
142
8.36k
        ret->ExternalID = xmlStrdup(ExternalID);
143
8.36k
        if (ret->ExternalID == NULL)
144
1
            goto error;
145
8.36k
    }
146
76.7k
    if (SystemID != NULL) {
147
31.5k
        ret->SystemID = xmlStrdup(SystemID);
148
31.5k
        if (ret->SystemID == NULL)
149
7
            goto error;
150
31.5k
    }
151
76.7k
    if (content != NULL) {
152
42.6k
        ret->length = xmlStrlen(content);
153
42.6k
  ret->content = xmlStrndup(content, ret->length);
154
42.6k
        if (ret->content == NULL)
155
5
            goto error;
156
42.6k
     } else {
157
34.1k
        ret->length = 0;
158
34.1k
        ret->content = NULL;
159
34.1k
    }
160
76.7k
    ret->URI = NULL; /* to be computed by the layer knowing
161
      the defining entity */
162
76.7k
    ret->orig = NULL;
163
164
76.7k
    return(ret);
165
166
15
error:
167
15
    xmlFreeEntity(ret);
168
15
    return(NULL);
169
76.7k
}
170
171
/**
172
 * xmlAddEntity:
173
 * @doc:  the document
174
 * @extSubset:  add to the external or internal subset
175
 * @name:  the entity name
176
 * @type:  the entity type XML_xxx_yyy_ENTITY
177
 * @ExternalID:  the entity external ID if available
178
 * @SystemID:  the entity system ID if available
179
 * @content:  the entity content
180
 * @out:  pointer to resulting entity (optional)
181
 *
182
 * Register a new entity for this document.
183
 *
184
 * Available since 2.13.0.
185
 *
186
 * Returns an xmlParserErrors error code.
187
 */
188
int
189
xmlAddEntity(xmlDocPtr doc, int extSubset, const xmlChar *name, int type,
190
    const xmlChar *ExternalID, const xmlChar *SystemID,
191
90.2k
    const xmlChar *content, xmlEntityPtr *out) {
192
90.2k
    xmlDtdPtr dtd;
193
90.2k
    xmlDictPtr dict = NULL;
194
90.2k
    xmlEntitiesTablePtr table = NULL;
195
90.2k
    xmlEntityPtr ret, predef;
196
90.2k
    int res;
197
198
90.2k
    if (out != NULL)
199
90.2k
        *out = NULL;
200
90.2k
    if ((doc == NULL) || (name == NULL))
201
0
  return(XML_ERR_ARGUMENT);
202
90.2k
    dict = doc->dict;
203
204
90.2k
    if (extSubset)
205
7.20k
        dtd = doc->extSubset;
206
83.0k
    else
207
83.0k
        dtd = doc->intSubset;
208
90.2k
    if (dtd == NULL)
209
0
        return(XML_DTD_NO_DTD);
210
211
90.2k
    switch (type) {
212
38.2k
        case XML_INTERNAL_GENERAL_ENTITY:
213
49.5k
        case XML_EXTERNAL_GENERAL_PARSED_ENTITY:
214
49.7k
        case XML_EXTERNAL_GENERAL_UNPARSED_ENTITY:
215
49.7k
            predef = xmlGetPredefinedEntity(name);
216
49.7k
            if (predef != NULL) {
217
17.9k
                int valid = 0;
218
219
                /* 4.6 Predefined Entities */
220
17.9k
                if ((type == XML_INTERNAL_GENERAL_ENTITY) &&
221
16.4k
                    (content != NULL)) {
222
16.0k
                    int c = predef->content[0];
223
224
16.0k
                    if (((content[0] == c) && (content[1] == 0)) &&
225
1.04k
                        ((c == '>') || (c == '\'') || (c == '"'))) {
226
1.01k
                        valid = 1;
227
15.0k
                    } else if ((content[0] == '&') && (content[1] == '#')) {
228
8.47k
                        if (content[2] == 'x') {
229
7.45k
                            xmlChar *hex = BAD_CAST "0123456789ABCDEF";
230
7.45k
                            xmlChar ref[] = "00;";
231
232
7.45k
                            ref[0] = hex[c / 16 % 16];
233
7.45k
                            ref[1] = hex[c % 16];
234
7.45k
                            if (xmlStrcasecmp(&content[3], ref) == 0)
235
3.01k
                                valid = 1;
236
7.45k
                        } else {
237
1.01k
                            xmlChar ref[] = "00;";
238
239
1.01k
                            ref[0] = '0' + c / 10 % 10;
240
1.01k
                            ref[1] = '0' + c % 10;
241
1.01k
                            if (xmlStrEqual(&content[2], ref))
242
492
                                valid = 1;
243
1.01k
                        }
244
8.47k
                    }
245
16.0k
                }
246
17.9k
                if (!valid)
247
13.4k
                    return(XML_ERR_REDECL_PREDEF_ENTITY);
248
17.9k
            }
249
36.3k
      if (dtd->entities == NULL) {
250
20.0k
    dtd->entities = xmlHashCreateDict(0, dict);
251
20.0k
                if (dtd->entities == NULL)
252
4
                    return(XML_ERR_NO_MEMORY);
253
20.0k
            }
254
36.3k
      table = dtd->entities;
255
36.3k
      break;
256
16.9k
        case XML_INTERNAL_PARAMETER_ENTITY:
257
40.4k
        case XML_EXTERNAL_PARAMETER_ENTITY:
258
40.4k
      if (dtd->pentities == NULL) {
259
20.1k
    dtd->pentities = xmlHashCreateDict(0, dict);
260
20.1k
                if (dtd->pentities == NULL)
261
4
                    return(XML_ERR_NO_MEMORY);
262
20.1k
            }
263
40.4k
      table = dtd->pentities;
264
40.4k
      break;
265
0
        default:
266
0
      return(XML_ERR_ARGUMENT);
267
90.2k
    }
268
76.7k
    ret = xmlCreateEntity(dtd->doc, name, type, ExternalID, SystemID, content);
269
76.7k
    if (ret == NULL)
270
21
        return(XML_ERR_NO_MEMORY);
271
272
76.7k
    res = xmlHashAdd(table, name, ret);
273
76.7k
    if (res < 0) {
274
7
        xmlFreeEntity(ret);
275
7
        return(XML_ERR_NO_MEMORY);
276
76.7k
    } else if (res == 0) {
277
  /*
278
   * entity was already defined at another level.
279
   */
280
13.7k
        xmlFreeEntity(ret);
281
13.7k
  return(XML_WAR_ENTITY_REDEFINED);
282
13.7k
    }
283
284
    /*
285
     * Link it to the DTD
286
     */
287
63.0k
    ret->parent = dtd;
288
63.0k
    ret->doc = dtd->doc;
289
63.0k
    if (dtd->last == NULL) {
290
29.6k
  dtd->children = dtd->last = (xmlNodePtr) ret;
291
33.3k
    } else {
292
33.3k
  dtd->last->next = (xmlNodePtr) ret;
293
33.3k
  ret->prev = dtd->last;
294
33.3k
  dtd->last = (xmlNodePtr) ret;
295
33.3k
    }
296
297
63.0k
    if (out != NULL)
298
63.0k
        *out = ret;
299
63.0k
    return(0);
300
76.7k
}
301
302
/**
303
 * xmlGetPredefinedEntity:
304
 * @name:  the entity name
305
 *
306
 * Check whether this name is an predefined entity.
307
 *
308
 * Returns NULL if not, otherwise the entity
309
 */
310
xmlEntityPtr
311
1.42M
xmlGetPredefinedEntity(const xmlChar *name) {
312
1.42M
    if (name == NULL) return(NULL);
313
1.42M
    switch (name[0]) {
314
16.8k
        case 'l':
315
16.8k
      if (xmlStrEqual(name, BAD_CAST "lt"))
316
13.1k
          return(&xmlEntityLt);
317
3.62k
      break;
318
36.9k
        case 'g':
319
36.9k
      if (xmlStrEqual(name, BAD_CAST "gt"))
320
34.1k
          return(&xmlEntityGt);
321
2.83k
      break;
322
546k
        case 'a':
323
546k
      if (xmlStrEqual(name, BAD_CAST "amp"))
324
59.4k
          return(&xmlEntityAmp);
325
487k
      if (xmlStrEqual(name, BAD_CAST "apos"))
326
3.78k
          return(&xmlEntityApos);
327
483k
      break;
328
483k
        case 'q':
329
267k
      if (xmlStrEqual(name, BAD_CAST "quot"))
330
7.26k
          return(&xmlEntityQuot);
331
260k
      break;
332
556k
  default:
333
556k
      break;
334
1.42M
    }
335
1.30M
    return(NULL);
336
1.42M
}
337
338
/**
339
 * xmlAddDtdEntity:
340
 * @doc:  the document
341
 * @name:  the entity name
342
 * @type:  the entity type XML_xxx_yyy_ENTITY
343
 * @ExternalID:  the entity external ID if available
344
 * @SystemID:  the entity system ID if available
345
 * @content:  the entity content
346
 *
347
 * Register a new entity for this document DTD external subset.
348
 *
349
 * Returns a pointer to the entity or NULL in case of error
350
 */
351
xmlEntityPtr
352
xmlAddDtdEntity(xmlDocPtr doc, const xmlChar *name, int type,
353
          const xmlChar *ExternalID, const xmlChar *SystemID,
354
0
    const xmlChar *content) {
355
0
    xmlEntityPtr ret;
356
357
0
    xmlAddEntity(doc, 1, name, type, ExternalID, SystemID, content, &ret);
358
0
    return(ret);
359
0
}
360
361
/**
362
 * xmlAddDocEntity:
363
 * @doc:  the document
364
 * @name:  the entity name
365
 * @type:  the entity type XML_xxx_yyy_ENTITY
366
 * @ExternalID:  the entity external ID if available
367
 * @SystemID:  the entity system ID if available
368
 * @content:  the entity content
369
 *
370
 * Register a new entity for this document.
371
 *
372
 * Returns a pointer to the entity or NULL in case of error
373
 */
374
xmlEntityPtr
375
xmlAddDocEntity(xmlDocPtr doc, const xmlChar *name, int type,
376
          const xmlChar *ExternalID, const xmlChar *SystemID,
377
0
          const xmlChar *content) {
378
0
    xmlEntityPtr ret;
379
380
0
    xmlAddEntity(doc, 0, name, type, ExternalID, SystemID, content, &ret);
381
0
    return(ret);
382
0
}
383
384
/**
385
 * xmlNewEntity:
386
 * @doc:  the document
387
 * @name:  the entity name
388
 * @type:  the entity type XML_xxx_yyy_ENTITY
389
 * @ExternalID:  the entity external ID if available
390
 * @SystemID:  the entity system ID if available
391
 * @content:  the entity content
392
 *
393
 * Create a new entity, this differs from xmlAddDocEntity() that if
394
 * the document is NULL or has no internal subset defined, then an
395
 * unlinked entity structure will be returned, it is then the responsibility
396
 * of the caller to link it to the document later or free it when not needed
397
 * anymore.
398
 *
399
 * Returns a pointer to the entity or NULL in case of error
400
 */
401
xmlEntityPtr
402
xmlNewEntity(xmlDocPtr doc, const xmlChar *name, int type,
403
       const xmlChar *ExternalID, const xmlChar *SystemID,
404
0
       const xmlChar *content) {
405
0
    if ((doc != NULL) && (doc->intSubset != NULL)) {
406
0
  return(xmlAddDocEntity(doc, name, type, ExternalID, SystemID, content));
407
0
    }
408
0
    if (name == NULL)
409
0
        return(NULL);
410
0
    return(xmlCreateEntity(doc, name, type, ExternalID, SystemID, content));
411
0
}
412
413
/**
414
 * xmlGetEntityFromTable:
415
 * @table:  an entity table
416
 * @name:  the entity name
417
 * @parameter:  look for parameter entities
418
 *
419
 * Do an entity lookup in the table.
420
 * returns the corresponding parameter entity, if found.
421
 *
422
 * Returns A pointer to the entity structure or NULL if not found.
423
 */
424
static xmlEntityPtr
425
648k
xmlGetEntityFromTable(xmlEntitiesTablePtr table, const xmlChar *name) {
426
648k
    return((xmlEntityPtr) xmlHashLookup(table, name));
427
648k
}
428
429
/**
430
 * xmlGetParameterEntity:
431
 * @doc:  the document referencing the entity
432
 * @name:  the entity name
433
 *
434
 * Do an entity lookup in the internal and external subsets and
435
 * returns the corresponding parameter entity, if found.
436
 *
437
 * Returns A pointer to the entity structure or NULL if not found.
438
 */
439
xmlEntityPtr
440
90.3k
xmlGetParameterEntity(xmlDocPtr doc, const xmlChar *name) {
441
90.3k
    xmlEntitiesTablePtr table;
442
90.3k
    xmlEntityPtr ret;
443
444
90.3k
    if (doc == NULL)
445
1.03k
  return(NULL);
446
89.3k
    if ((doc->intSubset != NULL) && (doc->intSubset->pentities != NULL)) {
447
86.2k
  table = (xmlEntitiesTablePtr) doc->intSubset->pentities;
448
86.2k
  ret = xmlGetEntityFromTable(table, name);
449
86.2k
  if (ret != NULL)
450
65.6k
      return(ret);
451
86.2k
    }
452
23.6k
    if ((doc->extSubset != NULL) && (doc->extSubset->pentities != NULL)) {
453
6.88k
  table = (xmlEntitiesTablePtr) doc->extSubset->pentities;
454
6.88k
  return(xmlGetEntityFromTable(table, name));
455
6.88k
    }
456
16.7k
    return(NULL);
457
23.6k
}
458
459
/**
460
 * xmlGetDtdEntity:
461
 * @doc:  the document referencing the entity
462
 * @name:  the entity name
463
 *
464
 * Do an entity lookup in the DTD entity hash table and
465
 * returns the corresponding entity, if found.
466
 * Note: the first argument is the document node, not the DTD node.
467
 *
468
 * Returns A pointer to the entity structure or NULL if not found.
469
 */
470
xmlEntityPtr
471
0
xmlGetDtdEntity(xmlDocPtr doc, const xmlChar *name) {
472
0
    xmlEntitiesTablePtr table;
473
474
0
    if (doc == NULL)
475
0
  return(NULL);
476
0
    if ((doc->extSubset != NULL) && (doc->extSubset->entities != NULL)) {
477
0
  table = (xmlEntitiesTablePtr) doc->extSubset->entities;
478
0
  return(xmlGetEntityFromTable(table, name));
479
0
    }
480
0
    return(NULL);
481
0
}
482
483
/**
484
 * xmlGetDocEntity:
485
 * @doc:  the document referencing the entity
486
 * @name:  the entity name
487
 *
488
 * Do an entity lookup in the document entity hash table and
489
 * returns the corresponding entity, otherwise a lookup is done
490
 * in the predefined entities too.
491
 *
492
 * Returns A pointer to the entity structure or NULL if not found.
493
 */
494
xmlEntityPtr
495
642k
xmlGetDocEntity(const xmlDoc *doc, const xmlChar *name) {
496
642k
    xmlEntityPtr cur;
497
642k
    xmlEntitiesTablePtr table;
498
499
642k
    if (doc != NULL) {
500
618k
  if ((doc->intSubset != NULL) && (doc->intSubset->entities != NULL)) {
501
520k
      table = (xmlEntitiesTablePtr) doc->intSubset->entities;
502
520k
      cur = xmlGetEntityFromTable(table, name);
503
520k
      if (cur != NULL)
504
443k
    return(cur);
505
520k
  }
506
175k
  if (doc->standalone != 1) {
507
175k
      if ((doc->extSubset != NULL) &&
508
37.0k
    (doc->extSubset->entities != NULL)) {
509
35.3k
    table = (xmlEntitiesTablePtr) doc->extSubset->entities;
510
35.3k
    cur = xmlGetEntityFromTable(table, name);
511
35.3k
    if (cur != NULL)
512
312
        return(cur);
513
35.3k
      }
514
175k
  }
515
175k
    }
516
198k
    return(xmlGetPredefinedEntity(name));
517
642k
}
518
519
/*
520
 * xmlSerializeHexCharRef:
521
 * @buf:  a char buffer
522
 * @val:  a codepoint
523
 *
524
 * Serializes a hex char ref like &#xA0;
525
 *
526
 * Writes at most 9 bytes. Does not include a terminating zero byte.
527
 *
528
 * Returns the number of bytes written.
529
 */
530
int
531
1.84k
xmlSerializeHexCharRef(char *buf, int val) {
532
1.84k
    char *out = buf;
533
1.84k
    int shift = 0, bits;
534
535
1.84k
    *out++ = '&';
536
1.84k
    *out++ = '#';
537
1.84k
    *out++ = 'x';
538
539
1.84k
    bits = val;
540
1.84k
    if (bits & 0xFF0000) {
541
72
        shift = 16;
542
72
        bits &= 0xFF0000;
543
1.77k
    } else if (bits & 0x00FF00) {
544
671
        shift = 8;
545
671
        bits &= 0x00FF00;
546
671
    }
547
1.84k
    if (bits & 0xF0F0F0) {
548
1.74k
        shift += 4;
549
1.74k
    }
550
551
5.21k
    do {
552
5.21k
        int d = (val >> shift) & 0x0F;
553
554
5.21k
        if (d < 10)
555
2.30k
            *out++ = '0' + d;
556
2.91k
        else
557
2.91k
            *out++ = 'A' + (d - 10);
558
559
5.21k
  shift -= 4;
560
5.21k
    } while (shift >= 0);
561
562
1.84k
    *out++ = ';';
563
564
1.84k
    return(out - buf);
565
1.84k
}
566
567
/*
568
 * xmlSerializeDecCharRef:
569
 * @buf:  a char buffer
570
 * @val:  a codepoint
571
 *
572
 * Serializes a decimal char ref like &#38;
573
 *
574
 * Writes at most 10 bytes. Does not include a terminating zero byte.
575
 *
576
 * Returns the number of bytes written.
577
 */
578
int
579
49.8M
xmlSerializeDecCharRef(char *buf, int val) {
580
49.8M
    char *out = buf;
581
49.8M
    int len, i;
582
583
49.8M
    *out++ = '&';
584
49.8M
    *out++ = '#';
585
586
49.8M
    if (val < 100) {
587
229
        len = (val < 10) ? 1 : 2;
588
49.8M
    } else if (val < 10000) {
589
49.8M
        len = (val < 1000) ? 3 : 4;
590
49.8M
    } else if (val < 1000000) {
591
10.2k
        len = (val < 100000) ? 5 : 6;
592
10.2k
    } else {
593
231
        len = 7;
594
231
    }
595
596
208M
    for (i = len - 1; i >= 0; i--) {
597
158M
        out[i] = '0' + val % 10;
598
158M
        val /= 10;
599
158M
    }
600
601
49.8M
    out[len] = ';';
602
603
49.8M
    return(len + 3);
604
49.8M
}
605
606
static const char xmlEscapeSafe[128] = {
607
    0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 0, 0, 0, 0,
608
    0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
609
    1, 1, 0, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1,
610
    1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 0, 1,
611
    1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
612
    1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
613
    1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
614
    1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1
615
};
616
617
/*
618
 * xmlEscapeText:
619
 * @text:  input text
620
 * @flags:  XML_ESCAPE flags
621
 *
622
 * Escapes certain characters with char refs.
623
 *
624
 * XML_ESCAPE_ATTR: for attribute content.
625
 * XML_ESCAPE_NON_ASCII: escape non-ASCII chars.
626
 * XML_ESCAPE_HTML: for HTML content.
627
 * XML_ESCAPE_QUOT: escape double quotes.
628
 * XML_ESCAPE_ALLOW_INVALID: allow invalid characters.
629
 *
630
 * Returns an escaped string or NULL if a memory allocation failed.
631
 */
632
xmlChar *
633
20.9k
xmlEscapeText(const xmlChar *text, int flags) {
634
20.9k
    const xmlChar *cur;
635
20.9k
    xmlChar *buffer;
636
20.9k
    xmlChar *out;
637
20.9k
    const xmlChar *unescaped;
638
20.9k
    size_t size = 50;
639
640
20.9k
    buffer = xmlMalloc(size + 1);
641
20.9k
    if (buffer == NULL)
642
53
        return(NULL);
643
20.8k
    out = buffer;
644
645
20.8k
    cur = text;
646
20.8k
    unescaped = cur;
647
648
2.31M
    while (*cur != '\0') {
649
2.29M
        char buf[12];
650
2.29M
  const xmlChar *end;
651
2.29M
        const xmlChar *repl;
652
2.29M
        size_t used;
653
2.29M
        size_t replSize;
654
2.29M
        size_t unescapedSize;
655
2.29M
        size_t totalSize;
656
2.29M
        int chunkSize = 1;
657
2.29M
        int c;
658
659
        /* accelerator */
660
111M
  while (1) {
661
111M
            c = *cur;
662
663
111M
            if (c < 0x80) {
664
55.0M
                if (!xmlEscapeSafe[*cur])
665
2.29M
                    break;
666
56.1M
            } else {
667
56.1M
               if (flags & XML_ESCAPE_NON_ASCII)
668
0
                   break;
669
56.1M
            }
670
108M
            cur += 1;
671
108M
        }
672
673
2.29M
        if (c == 0) {
674
18.9k
            chunkSize = 0;
675
18.9k
            repl = BAD_CAST "";
676
18.9k
            replSize = 0;
677
2.27M
        } else if (c == '<') {
678
      /*
679
       * Special handling of server side include in HTML attributes
680
       */
681
19.6k
      if ((flags & XML_ESCAPE_HTML) && (flags & XML_ESCAPE_ATTR) &&
682
17.6k
          (cur[1] == '!') && (cur[2] == '-') && (cur[3] == '-') &&
683
1.68k
          ((end = xmlStrstr(cur, BAD_CAST "-->")) != NULL)) {
684
1.26k
                chunkSize = (end - cur) + 3;
685
1.26k
                repl = cur;
686
1.26k
                replSize = chunkSize;
687
18.3k
      } else {
688
18.3k
                repl = BAD_CAST "&lt;";
689
18.3k
                replSize = 4;
690
18.3k
            }
691
2.25M
  } else if (c == '>') {
692
2.20M
            repl = BAD_CAST "&gt;";
693
2.20M
            replSize = 4;
694
2.20M
  } else if (c == '&') {
695
      /*
696
       * Special handling of &{...} construct from HTML 4, see
697
       * http://www.w3.org/TR/html401/appendix/notes.html#h-B.7.1
698
       */
699
10.5k
      if ((flags & XML_ESCAPE_HTML) && (flags & XML_ESCAPE_ATTR) &&
700
10.3k
                (cur[1] == '{') && (end = xmlStrchr(cur, '}'))) {
701
1.17k
                chunkSize = (end - cur) + 1;
702
1.17k
                repl = cur;
703
1.17k
                replSize = chunkSize;
704
9.33k
      } else {
705
9.33k
                repl = BAD_CAST "&amp;";
706
9.33k
                replSize = 5;
707
9.33k
            }
708
45.3k
  } else if ((flags & XML_ESCAPE_QUOT) && (c == '"')) {
709
0
            repl = BAD_CAST "&quot;";
710
0
            replSize = 6;
711
45.3k
  } else if (((flags & XML_ESCAPE_HTML) == 0) && (c == '\r')) {
712
0
      repl = BAD_CAST "&#13;";
713
0
            replSize = 5;
714
45.3k
  } else if ((flags & XML_ESCAPE_NON_ASCII) && (c >= 0x80)) {
715
0
            int val;
716
717
0
            chunkSize = 4;
718
0
            val = xmlGetUTF8Char(cur, &chunkSize);
719
0
            if (val < 0) {
720
0
                val = 0xFFFD;
721
0
                chunkSize = 1;
722
0
            } else if (((flags & XML_ESCAPE_ALLOW_INVALID) == 0) &&
723
0
                       (!IS_CHAR(val))) {
724
0
                val = 0xFFFD;
725
0
            }
726
727
0
            replSize = xmlSerializeHexCharRef(buf, val);
728
0
            repl = BAD_CAST buf;
729
45.3k
  } else if ((flags & (XML_ESCAPE_ALLOW_INVALID | XML_ESCAPE_HTML)) ||
730
0
                   (c >= 0x20) ||
731
45.3k
             (c == '\n') || (c == '\t') || (c == '\r')) {
732
      /* default case, just copy */
733
45.3k
            cur += 1;
734
45.3k
            if (*cur != 0)
735
44.5k
                continue;
736
737
807
            chunkSize = 0;
738
807
            repl = BAD_CAST "";
739
807
            replSize = 0;
740
807
  } else {
741
            /* ignore */
742
0
            repl = BAD_CAST "";
743
0
            replSize = 0;
744
0
        }
745
746
2.25M
        used = out - buffer;
747
2.25M
        unescapedSize = cur - unescaped;
748
2.25M
        totalSize = unescapedSize + replSize;
749
750
2.25M
  cur += chunkSize;
751
752
2.25M
        if (totalSize > size - used) {
753
6.99k
            xmlChar *tmp;
754
6.99k
            int newSize;
755
756
6.99k
            if ((size > (SIZE_MAX - 1) / 2) ||
757
6.99k
                (totalSize > (SIZE_MAX - 1) / 2 - size)) {
758
0
                xmlFree(buffer);
759
0
                return(NULL);
760
0
            }
761
6.99k
            newSize = size + totalSize;
762
6.99k
            if (*cur != 0)
763
4.76k
                newSize *= 2;
764
6.99k
            tmp = xmlRealloc(buffer, newSize + 1);
765
6.99k
            if (tmp == NULL) {
766
6
                xmlFree(buffer);
767
6
                return(NULL);
768
6
            }
769
6.98k
            buffer = tmp;
770
6.98k
            size = newSize;
771
6.98k
            out = buffer + used;
772
6.98k
        }
773
774
2.25M
        memcpy(out, unescaped, unescapedSize);
775
2.25M
        out += unescapedSize;
776
2.25M
        memcpy(out, repl, replSize);
777
2.25M
        out += replSize;
778
779
2.25M
        unescaped = cur;
780
2.25M
    }
781
782
20.8k
    *out = 0;
783
20.8k
    return(buffer);
784
20.8k
}
785
786
/**
787
 * xmlEncodeEntitiesInternal:
788
 * @doc:  the document containing the string
789
 * @input:  A string to convert to XML.
790
 * @flags:  XML_ESCAPE flags
791
 *
792
 * Do a global encoding of a string, replacing the predefined entities
793
 * and non ASCII values with their entities and CharRef counterparts.
794
 * Contrary to xmlEncodeEntities, this routine is reentrant, and result
795
 * must be deallocated.
796
 *
797
 * Returns A newly allocated string with the substitution done.
798
 */
799
xmlChar *
800
xmlEncodeEntitiesInternal(xmlDocPtr doc, const xmlChar *input,
801
20.9k
                          unsigned flags) {
802
20.9k
    if (input == NULL)
803
0
        return(NULL);
804
805
20.9k
    if ((doc != NULL) && (doc->type == XML_HTML_DOCUMENT_NODE))
806
20.9k
        flags |= XML_ESCAPE_HTML;
807
0
    else if ((doc == NULL) || (doc->encoding == NULL))
808
0
        flags |= XML_ESCAPE_NON_ASCII;
809
810
20.9k
    return(xmlEscapeText(input, flags));
811
20.9k
}
812
813
/**
814
 * xmlEncodeEntitiesReentrant:
815
 * @doc:  the document containing the string
816
 * @input:  A string to convert to XML.
817
 *
818
 * Do a global encoding of a string, replacing the predefined entities
819
 * and non ASCII values with their entities and CharRef counterparts.
820
 * Contrary to xmlEncodeEntities, this routine is reentrant, and result
821
 * must be deallocated.
822
 *
823
 * This escapes '<', '>', '&' and '\r'. If the document has no encoding,
824
 * non-ASCII codepoints are escaped. There is some special handling for
825
 * HTML documents.
826
 *
827
 * Returns A newly allocated string with the substitution done.
828
 */
829
xmlChar *
830
14.1k
xmlEncodeEntitiesReentrant(xmlDocPtr doc, const xmlChar *input) {
831
14.1k
    return xmlEncodeEntitiesInternal(doc, input, 0);
832
14.1k
}
833
834
/**
835
 * xmlEncodeSpecialChars:
836
 * @doc:  unused
837
 * @input:  A string to convert to XML.
838
 *
839
 * Do a global encoding of a string, replacing the predefined entities
840
 * this routine is reentrant, and result must be deallocated.
841
 *
842
 * This escapes '<', '>', '&', '"' and '\r' chars.
843
 *
844
 * Returns A newly allocated string with the substitution done.
845
 */
846
xmlChar *
847
xmlEncodeSpecialChars(const xmlDoc *doc ATTRIBUTE_UNUSED,
848
0
                      const xmlChar *input) {
849
0
    if (input == NULL)
850
0
        return(NULL);
851
852
0
    return(xmlEscapeText(input, XML_ESCAPE_QUOT | XML_ESCAPE_ALLOW_INVALID));
853
0
}
854
855
/**
856
 * xmlCreateEntitiesTable:
857
 *
858
 * create and initialize an empty entities hash table.
859
 * This really doesn't make sense and should be deprecated
860
 *
861
 * Returns the xmlEntitiesTablePtr just created or NULL in case of error.
862
 */
863
xmlEntitiesTablePtr
864
0
xmlCreateEntitiesTable(void) {
865
0
    return((xmlEntitiesTablePtr) xmlHashCreate(0));
866
0
}
867
868
/**
869
 * xmlFreeEntityWrapper:
870
 * @entity:  An entity
871
 * @name:  its name
872
 *
873
 * Deallocate the memory used by an entities in the hash table.
874
 */
875
static void
876
78.2k
xmlFreeEntityWrapper(void *entity, const xmlChar *name ATTRIBUTE_UNUSED) {
877
78.2k
    if (entity != NULL)
878
78.2k
  xmlFreeEntity((xmlEntityPtr) entity);
879
78.2k
}
880
881
/**
882
 * xmlFreeEntitiesTable:
883
 * @table:  An entity table
884
 *
885
 * Deallocate the memory used by an entities hash table.
886
 */
887
void
888
45.8k
xmlFreeEntitiesTable(xmlEntitiesTablePtr table) {
889
45.8k
    xmlHashFree(table, xmlFreeEntityWrapper);
890
45.8k
}
891
892
/**
893
 * xmlCopyEntity:
894
 * @ent:  An entity
895
 *
896
 * Build a copy of an entity
897
 *
898
 * Returns the new xmlEntitiesPtr or NULL in case of error.
899
 */
900
static void *
901
15.2k
xmlCopyEntity(void *payload, const xmlChar *name ATTRIBUTE_UNUSED) {
902
15.2k
    xmlEntityPtr ent = (xmlEntityPtr) payload;
903
15.2k
    xmlEntityPtr cur;
904
905
15.2k
    cur = (xmlEntityPtr) xmlMalloc(sizeof(xmlEntity));
906
15.2k
    if (cur == NULL)
907
4
  return(NULL);
908
15.2k
    memset(cur, 0, sizeof(xmlEntity));
909
15.2k
    cur->type = XML_ENTITY_DECL;
910
911
15.2k
    cur->etype = ent->etype;
912
15.2k
    if (ent->name != NULL) {
913
15.2k
  cur->name = xmlStrdup(ent->name);
914
15.2k
        if (cur->name == NULL)
915
4
            goto error;
916
15.2k
    }
917
15.2k
    if (ent->ExternalID != NULL) {
918
0
  cur->ExternalID = xmlStrdup(ent->ExternalID);
919
0
        if (cur->ExternalID == NULL)
920
0
            goto error;
921
0
    }
922
15.2k
    if (ent->SystemID != NULL) {
923
1.34k
  cur->SystemID = xmlStrdup(ent->SystemID);
924
1.34k
        if (cur->SystemID == NULL)
925
1
            goto error;
926
1.34k
    }
927
15.2k
    if (ent->content != NULL) {
928
13.8k
  cur->content = xmlStrdup(ent->content);
929
13.8k
        if (cur->content == NULL)
930
3
            goto error;
931
13.8k
    }
932
15.2k
    if (ent->orig != NULL) {
933
13.8k
  cur->orig = xmlStrdup(ent->orig);
934
13.8k
        if (cur->orig == NULL)
935
1
            goto error;
936
13.8k
    }
937
15.2k
    if (ent->URI != NULL) {
938
1.32k
  cur->URI = xmlStrdup(ent->URI);
939
1.32k
        if (cur->URI == NULL)
940
1
            goto error;
941
1.32k
    }
942
15.2k
    return(cur);
943
944
10
error:
945
10
    xmlFreeEntity(cur);
946
10
    return(NULL);
947
15.2k
}
948
949
/**
950
 * xmlCopyEntitiesTable:
951
 * @table:  An entity table
952
 *
953
 * Build a copy of an entity table.
954
 *
955
 * Returns the new xmlEntitiesTablePtr or NULL in case of error.
956
 */
957
xmlEntitiesTablePtr
958
5.67k
xmlCopyEntitiesTable(xmlEntitiesTablePtr table) {
959
5.67k
    return(xmlHashCopySafe(table, xmlCopyEntity, xmlFreeEntityWrapper));
960
5.67k
}
961
962
#ifdef LIBXML_OUTPUT_ENABLED
963
964
/**
965
 * xmlDumpEntityDecl:
966
 * @buf:  An XML buffer.
967
 * @ent:  An entity table
968
 *
969
 * This will dump the content of the entity table as an XML DTD definition
970
 */
971
void
972
0
xmlDumpEntityDecl(xmlBufferPtr buf, xmlEntityPtr ent) {
973
0
    xmlSaveCtxtPtr save;
974
975
0
    if ((buf == NULL) || (ent == NULL))
976
0
        return;
977
978
0
    save = xmlSaveToBuffer(buf, NULL, 0);
979
0
    xmlSaveTree(save, (xmlNodePtr) ent);
980
0
    if (xmlSaveFinish(save) != XML_ERR_OK)
981
0
        xmlFree(xmlBufferDetach(buf));
982
0
}
983
984
/**
985
 * xmlDumpEntityDeclScan:
986
 * @ent:  An entity table
987
 * @buf:  An XML buffer.
988
 *
989
 * When using the hash table scan function, arguments need to be reversed
990
 */
991
static void
992
xmlDumpEntityDeclScan(void *ent, void *save,
993
0
                      const xmlChar *name ATTRIBUTE_UNUSED) {
994
0
    xmlSaveTree(save, ent);
995
0
}
996
997
/**
998
 * xmlDumpEntitiesTable:
999
 * @buf:  An XML buffer.
1000
 * @table:  An entity table
1001
 *
1002
 * This will dump the content of the entity table as an XML DTD definition
1003
 */
1004
void
1005
0
xmlDumpEntitiesTable(xmlBufferPtr buf, xmlEntitiesTablePtr table) {
1006
0
    xmlSaveCtxtPtr save;
1007
1008
0
    if ((buf == NULL) || (table == NULL))
1009
0
        return;
1010
1011
0
    save = xmlSaveToBuffer(buf, NULL, 0);
1012
0
    xmlHashScan(table, xmlDumpEntityDeclScan, save);
1013
0
    if (xmlSaveFinish(save) != XML_ERR_OK)
1014
0
        xmlFree(xmlBufferDetach(buf));
1015
0
}
1016
#endif /* LIBXML_OUTPUT_ENABLED */