Coverage Report

Created: 2025-08-28 06:07

/src/libxml2/entities.c
Line
Count
Source (jump to first uncovered line)
1
/*
2
 * entities.c : implementation for the XML entities handling
3
 *
4
 * See Copyright for the status of this software.
5
 *
6
 * daniel@veillard.com
7
 */
8
9
/* To avoid EBCDIC trouble when parsing on zOS */
10
#if defined(__MVS__)
11
#pragma convert("ISO8859-1")
12
#endif
13
14
#define IN_LIBXML
15
#include "libxml.h"
16
17
#include <string.h>
18
#include <stdlib.h>
19
20
#include <libxml/xmlmemory.h>
21
#include <libxml/hash.h>
22
#include <libxml/entities.h>
23
#include <libxml/parser.h>
24
#include <libxml/parserInternals.h>
25
#include <libxml/xmlerror.h>
26
#include <libxml/dict.h>
27
#include <libxml/xmlsave.h>
28
29
#include "private/entities.h"
30
#include "private/error.h"
31
32
#ifndef SIZE_MAX
33
  #define SIZE_MAX ((size_t) -1)
34
#endif
35
36
/*
37
 * The XML predefined entities.
38
 */
39
40
static xmlEntity xmlEntityLt = {
41
    NULL, XML_ENTITY_DECL, BAD_CAST "lt",
42
    NULL, NULL, NULL, NULL, NULL, NULL,
43
    BAD_CAST "<", BAD_CAST "<", 1,
44
    XML_INTERNAL_PREDEFINED_ENTITY,
45
    NULL, NULL, NULL, NULL, 0, 0, 0
46
};
47
static xmlEntity xmlEntityGt = {
48
    NULL, XML_ENTITY_DECL, BAD_CAST "gt",
49
    NULL, NULL, NULL, NULL, NULL, NULL,
50
    BAD_CAST ">", BAD_CAST ">", 1,
51
    XML_INTERNAL_PREDEFINED_ENTITY,
52
    NULL, NULL, NULL, NULL, 0, 0, 0
53
};
54
static xmlEntity xmlEntityAmp = {
55
    NULL, XML_ENTITY_DECL, BAD_CAST "amp",
56
    NULL, NULL, NULL, NULL, NULL, NULL,
57
    BAD_CAST "&", BAD_CAST "&", 1,
58
    XML_INTERNAL_PREDEFINED_ENTITY,
59
    NULL, NULL, NULL, NULL, 0, 0, 0
60
};
61
static xmlEntity xmlEntityQuot = {
62
    NULL, XML_ENTITY_DECL, BAD_CAST "quot",
63
    NULL, NULL, NULL, NULL, NULL, NULL,
64
    BAD_CAST "\"", BAD_CAST "\"", 1,
65
    XML_INTERNAL_PREDEFINED_ENTITY,
66
    NULL, NULL, NULL, NULL, 0, 0, 0
67
};
68
static xmlEntity xmlEntityApos = {
69
    NULL, XML_ENTITY_DECL, BAD_CAST "apos",
70
    NULL, NULL, NULL, NULL, NULL, NULL,
71
    BAD_CAST "'", BAD_CAST "'", 1,
72
    XML_INTERNAL_PREDEFINED_ENTITY,
73
    NULL, NULL, NULL, NULL, 0, 0, 0
74
};
75
76
/*
77
 * xmlFreeEntity:
78
 * @entity:  an entity
79
 *
80
 * Frees the entity.
81
 */
82
void
83
xmlFreeEntity(xmlEntityPtr entity)
84
130k
{
85
130k
    xmlDictPtr dict = NULL;
86
87
130k
    if (entity == NULL)
88
0
        return;
89
90
130k
    if (entity->doc != NULL)
91
130k
        dict = entity->doc->dict;
92
93
94
130k
    if ((entity->children) &&
95
130k
        (entity == (xmlEntityPtr) entity->children->parent))
96
2.29k
        xmlFreeNodeList(entity->children);
97
130k
    if ((entity->name != NULL) &&
98
130k
        ((dict == NULL) || (!xmlDictOwns(dict, entity->name))))
99
13.6k
        xmlFree((char *) entity->name);
100
130k
    if (entity->ExternalID != NULL)
101
18.0k
        xmlFree((char *) entity->ExternalID);
102
130k
    if (entity->SystemID != NULL)
103
55.2k
        xmlFree((char *) entity->SystemID);
104
130k
    if (entity->URI != NULL)
105
53.6k
        xmlFree((char *) entity->URI);
106
130k
    if (entity->content != NULL)
107
73.4k
        xmlFree((char *) entity->content);
108
130k
    if (entity->orig != NULL)
109
46.3k
        xmlFree((char *) entity->orig);
110
130k
    xmlFree(entity);
111
130k
}
112
113
/*
114
 * xmlCreateEntity:
115
 *
116
 * internal routine doing the entity node structures allocations
117
 */
118
static xmlEntityPtr
119
xmlCreateEntity(xmlDocPtr doc, const xmlChar *name, int type,
120
          const xmlChar *ExternalID, const xmlChar *SystemID,
121
130k
          const xmlChar *content) {
122
130k
    xmlEntityPtr ret;
123
124
130k
    ret = (xmlEntityPtr) xmlMalloc(sizeof(xmlEntity));
125
130k
    if (ret == NULL)
126
10
  return(NULL);
127
130k
    memset(ret, 0, sizeof(xmlEntity));
128
130k
    ret->doc = doc;
129
130k
    ret->type = XML_ENTITY_DECL;
130
131
    /*
132
     * fill the structure.
133
     */
134
130k
    ret->etype = (xmlEntityType) type;
135
130k
    if ((doc == NULL) || (doc->dict == NULL))
136
13.7k
  ret->name = xmlStrdup(name);
137
116k
    else
138
116k
        ret->name = xmlDictLookup(doc->dict, name, -1);
139
130k
    if (ret->name == NULL)
140
2
        goto error;
141
130k
    if (ExternalID != NULL) {
142
18.0k
        ret->ExternalID = xmlStrdup(ExternalID);
143
18.0k
        if (ret->ExternalID == NULL)
144
2
            goto error;
145
18.0k
    }
146
130k
    if (SystemID != NULL) {
147
55.2k
        ret->SystemID = xmlStrdup(SystemID);
148
55.2k
        if (ret->SystemID == NULL)
149
6
            goto error;
150
55.2k
    }
151
130k
    if (content != NULL) {
152
72.9k
        ret->length = xmlStrlen(content);
153
72.9k
  ret->content = xmlStrndup(content, ret->length);
154
72.9k
        if (ret->content == NULL)
155
3
            goto error;
156
72.9k
     } else {
157
57.2k
        ret->length = 0;
158
57.2k
        ret->content = NULL;
159
57.2k
    }
160
130k
    ret->URI = NULL; /* to be computed by the layer knowing
161
      the defining entity */
162
130k
    ret->orig = NULL;
163
164
130k
    return(ret);
165
166
13
error:
167
13
    xmlFreeEntity(ret);
168
13
    return(NULL);
169
130k
}
170
171
/**
172
 * xmlAddEntity:
173
 * @doc:  the document
174
 * @extSubset:  add to the external or internal subset
175
 * @name:  the entity name
176
 * @type:  the entity type XML_xxx_yyy_ENTITY
177
 * @ExternalID:  the entity external ID if available
178
 * @SystemID:  the entity system ID if available
179
 * @content:  the entity content
180
 * @out:  pointer to resulting entity (optional)
181
 *
182
 * Register a new entity for this document.
183
 *
184
 * Available since 2.13.0.
185
 *
186
 * Returns an xmlParserErrors error code.
187
 */
188
int
189
xmlAddEntity(xmlDocPtr doc, int extSubset, const xmlChar *name, int type,
190
    const xmlChar *ExternalID, const xmlChar *SystemID,
191
134k
    const xmlChar *content, xmlEntityPtr *out) {
192
134k
    xmlDtdPtr dtd;
193
134k
    xmlDictPtr dict = NULL;
194
134k
    xmlEntitiesTablePtr table = NULL;
195
134k
    xmlEntityPtr ret, predef;
196
134k
    int res;
197
198
134k
    if (out != NULL)
199
134k
        *out = NULL;
200
134k
    if ((doc == NULL) || (name == NULL))
201
0
  return(XML_ERR_ARGUMENT);
202
134k
    dict = doc->dict;
203
204
134k
    if (extSubset)
205
3.90k
        dtd = doc->extSubset;
206
130k
    else
207
130k
        dtd = doc->intSubset;
208
134k
    if (dtd == NULL)
209
0
        return(XML_DTD_NO_DTD);
210
211
134k
    switch (type) {
212
50.6k
        case XML_INTERNAL_GENERAL_ENTITY:
213
69.8k
        case XML_EXTERNAL_GENERAL_PARSED_ENTITY:
214
70.0k
        case XML_EXTERNAL_GENERAL_UNPARSED_ENTITY:
215
70.0k
            predef = xmlGetPredefinedEntity(name);
216
70.0k
            if (predef != NULL) {
217
5.84k
                int valid = 0;
218
219
                /* 4.6 Predefined Entities */
220
5.84k
                if ((type == XML_INTERNAL_GENERAL_ENTITY) &&
221
5.84k
                    (content != NULL)) {
222
5.16k
                    int c = predef->content[0];
223
224
5.16k
                    if (((content[0] == c) && (content[1] == 0)) &&
225
5.16k
                        ((c == '>') || (c == '\'') || (c == '"'))) {
226
1.43k
                        valid = 1;
227
3.72k
                    } else if ((content[0] == '&') && (content[1] == '#')) {
228
1.20k
                        if (content[2] == 'x') {
229
214
                            xmlChar *hex = BAD_CAST "0123456789ABCDEF";
230
214
                            xmlChar ref[] = "00;";
231
232
214
                            ref[0] = hex[c / 16 % 16];
233
214
                            ref[1] = hex[c % 16];
234
214
                            if (xmlStrcasecmp(&content[3], ref) == 0)
235
0
                                valid = 1;
236
986
                        } else {
237
986
                            xmlChar ref[] = "00;";
238
239
986
                            ref[0] = '0' + c / 10 % 10;
240
986
                            ref[1] = '0' + c % 10;
241
986
                            if (xmlStrEqual(&content[2], ref))
242
587
                                valid = 1;
243
986
                        }
244
1.20k
                    }
245
5.16k
                }
246
5.84k
                if (!valid)
247
3.82k
                    return(XML_ERR_REDECL_PREDEF_ENTITY);
248
5.84k
            }
249
66.2k
      if (dtd->entities == NULL) {
250
35.9k
    dtd->entities = xmlHashCreateDict(0, dict);
251
35.9k
                if (dtd->entities == NULL)
252
3
                    return(XML_ERR_NO_MEMORY);
253
35.9k
            }
254
66.2k
      table = dtd->entities;
255
66.2k
      break;
256
26.8k
        case XML_INTERNAL_PARAMETER_ENTITY:
257
64.0k
        case XML_EXTERNAL_PARAMETER_ENTITY:
258
64.0k
      if (dtd->pentities == NULL) {
259
30.6k
    dtd->pentities = xmlHashCreateDict(0, dict);
260
30.6k
                if (dtd->pentities == NULL)
261
2
                    return(XML_ERR_NO_MEMORY);
262
30.6k
            }
263
64.0k
      table = dtd->pentities;
264
64.0k
      break;
265
0
        default:
266
0
      return(XML_ERR_ARGUMENT);
267
134k
    }
268
130k
    ret = xmlCreateEntity(dtd->doc, name, type, ExternalID, SystemID, content);
269
130k
    if (ret == NULL)
270
23
        return(XML_ERR_NO_MEMORY);
271
272
130k
    res = xmlHashAdd(table, name, ret);
273
130k
    if (res < 0) {
274
9
        xmlFreeEntity(ret);
275
9
        return(XML_ERR_NO_MEMORY);
276
130k
    } else if (res == 0) {
277
  /*
278
   * entity was already defined at another level.
279
   */
280
26.5k
        xmlFreeEntity(ret);
281
26.5k
  return(XML_WAR_ENTITY_REDEFINED);
282
26.5k
    }
283
284
    /*
285
     * Link it to the DTD
286
     */
287
103k
    ret->parent = dtd;
288
103k
    ret->doc = dtd->doc;
289
103k
    if (dtd->last == NULL) {
290
52.5k
  dtd->children = dtd->last = (xmlNodePtr) ret;
291
52.5k
    } else {
292
51.2k
  dtd->last->next = (xmlNodePtr) ret;
293
51.2k
  ret->prev = dtd->last;
294
51.2k
  dtd->last = (xmlNodePtr) ret;
295
51.2k
    }
296
297
103k
    if (out != NULL)
298
103k
        *out = ret;
299
103k
    return(0);
300
130k
}
301
302
/**
303
 * xmlGetPredefinedEntity:
304
 * @name:  the entity name
305
 *
306
 * Check whether this name is an predefined entity.
307
 *
308
 * Returns NULL if not, otherwise the entity
309
 */
310
xmlEntityPtr
311
3.73M
xmlGetPredefinedEntity(const xmlChar *name) {
312
3.73M
    if (name == NULL) return(NULL);
313
3.73M
    switch (name[0]) {
314
17.1k
        case 'l':
315
17.1k
      if (xmlStrEqual(name, BAD_CAST "lt"))
316
13.4k
          return(&xmlEntityLt);
317
3.72k
      break;
318
64.6k
        case 'g':
319
64.6k
      if (xmlStrEqual(name, BAD_CAST "gt"))
320
62.0k
          return(&xmlEntityGt);
321
2.63k
      break;
322
1.28M
        case 'a':
323
1.28M
      if (xmlStrEqual(name, BAD_CAST "amp"))
324
88.3k
          return(&xmlEntityAmp);
325
1.19M
      if (xmlStrEqual(name, BAD_CAST "apos"))
326
1.31k
          return(&xmlEntityApos);
327
1.19M
      break;
328
1.19M
        case 'q':
329
604k
      if (xmlStrEqual(name, BAD_CAST "quot"))
330
1.92k
          return(&xmlEntityQuot);
331
602k
      break;
332
1.76M
  default:
333
1.76M
      break;
334
3.73M
    }
335
3.57M
    return(NULL);
336
3.73M
}
337
338
/**
339
 * xmlAddDtdEntity:
340
 * @doc:  the document
341
 * @name:  the entity name
342
 * @type:  the entity type XML_xxx_yyy_ENTITY
343
 * @ExternalID:  the entity external ID if available
344
 * @SystemID:  the entity system ID if available
345
 * @content:  the entity content
346
 *
347
 * Register a new entity for this document DTD external subset.
348
 *
349
 * Returns a pointer to the entity or NULL in case of error
350
 */
351
xmlEntityPtr
352
xmlAddDtdEntity(xmlDocPtr doc, const xmlChar *name, int type,
353
          const xmlChar *ExternalID, const xmlChar *SystemID,
354
0
    const xmlChar *content) {
355
0
    xmlEntityPtr ret;
356
357
0
    xmlAddEntity(doc, 1, name, type, ExternalID, SystemID, content, &ret);
358
0
    return(ret);
359
0
}
360
361
/**
362
 * xmlAddDocEntity:
363
 * @doc:  the document
364
 * @name:  the entity name
365
 * @type:  the entity type XML_xxx_yyy_ENTITY
366
 * @ExternalID:  the entity external ID if available
367
 * @SystemID:  the entity system ID if available
368
 * @content:  the entity content
369
 *
370
 * Register a new entity for this document.
371
 *
372
 * Returns a pointer to the entity or NULL in case of error
373
 */
374
xmlEntityPtr
375
xmlAddDocEntity(xmlDocPtr doc, const xmlChar *name, int type,
376
          const xmlChar *ExternalID, const xmlChar *SystemID,
377
0
          const xmlChar *content) {
378
0
    xmlEntityPtr ret;
379
380
0
    xmlAddEntity(doc, 0, name, type, ExternalID, SystemID, content, &ret);
381
0
    return(ret);
382
0
}
383
384
/**
385
 * xmlNewEntity:
386
 * @doc:  the document
387
 * @name:  the entity name
388
 * @type:  the entity type XML_xxx_yyy_ENTITY
389
 * @ExternalID:  the entity external ID if available
390
 * @SystemID:  the entity system ID if available
391
 * @content:  the entity content
392
 *
393
 * Create a new entity, this differs from xmlAddDocEntity() that if
394
 * the document is NULL or has no internal subset defined, then an
395
 * unlinked entity structure will be returned, it is then the responsibility
396
 * of the caller to link it to the document later or free it when not needed
397
 * anymore.
398
 *
399
 * Returns a pointer to the entity or NULL in case of error
400
 */
401
xmlEntityPtr
402
xmlNewEntity(xmlDocPtr doc, const xmlChar *name, int type,
403
       const xmlChar *ExternalID, const xmlChar *SystemID,
404
0
       const xmlChar *content) {
405
0
    if ((doc != NULL) && (doc->intSubset != NULL)) {
406
0
  return(xmlAddDocEntity(doc, name, type, ExternalID, SystemID, content));
407
0
    }
408
0
    if (name == NULL)
409
0
        return(NULL);
410
0
    return(xmlCreateEntity(doc, name, type, ExternalID, SystemID, content));
411
0
}
412
413
/**
414
 * xmlGetEntityFromTable:
415
 * @table:  an entity table
416
 * @name:  the entity name
417
 * @parameter:  look for parameter entities
418
 *
419
 * Do an entity lookup in the table.
420
 * returns the corresponding parameter entity, if found.
421
 *
422
 * Returns A pointer to the entity structure or NULL if not found.
423
 */
424
static xmlEntityPtr
425
1.29M
xmlGetEntityFromTable(xmlEntitiesTablePtr table, const xmlChar *name) {
426
1.29M
    return((xmlEntityPtr) xmlHashLookup(table, name));
427
1.29M
}
428
429
/**
430
 * xmlGetParameterEntity:
431
 * @doc:  the document referencing the entity
432
 * @name:  the entity name
433
 *
434
 * Do an entity lookup in the internal and external subsets and
435
 * returns the corresponding parameter entity, if found.
436
 *
437
 * Returns A pointer to the entity structure or NULL if not found.
438
 */
439
xmlEntityPtr
440
150k
xmlGetParameterEntity(xmlDocPtr doc, const xmlChar *name) {
441
150k
    xmlEntitiesTablePtr table;
442
150k
    xmlEntityPtr ret;
443
444
150k
    if (doc == NULL)
445
318
  return(NULL);
446
149k
    if ((doc->intSubset != NULL) && (doc->intSubset->pentities != NULL)) {
447
146k
  table = (xmlEntitiesTablePtr) doc->intSubset->pentities;
448
146k
  ret = xmlGetEntityFromTable(table, name);
449
146k
  if (ret != NULL)
450
80.3k
      return(ret);
451
146k
    }
452
69.3k
    if ((doc->extSubset != NULL) && (doc->extSubset->pentities != NULL)) {
453
3.59k
  table = (xmlEntitiesTablePtr) doc->extSubset->pentities;
454
3.59k
  return(xmlGetEntityFromTable(table, name));
455
3.59k
    }
456
65.7k
    return(NULL);
457
69.3k
}
458
459
/**
460
 * xmlGetDtdEntity:
461
 * @doc:  the document referencing the entity
462
 * @name:  the entity name
463
 *
464
 * Do an entity lookup in the DTD entity hash table and
465
 * returns the corresponding entity, if found.
466
 * Note: the first argument is the document node, not the DTD node.
467
 *
468
 * Returns A pointer to the entity structure or NULL if not found.
469
 */
470
xmlEntityPtr
471
0
xmlGetDtdEntity(xmlDocPtr doc, const xmlChar *name) {
472
0
    xmlEntitiesTablePtr table;
473
474
0
    if (doc == NULL)
475
0
  return(NULL);
476
0
    if ((doc->extSubset != NULL) && (doc->extSubset->entities != NULL)) {
477
0
  table = (xmlEntitiesTablePtr) doc->extSubset->entities;
478
0
  return(xmlGetEntityFromTable(table, name));
479
0
    }
480
0
    return(NULL);
481
0
}
482
483
/**
484
 * xmlGetDocEntity:
485
 * @doc:  the document referencing the entity
486
 * @name:  the entity name
487
 *
488
 * Do an entity lookup in the document entity hash table and
489
 * returns the corresponding entity, otherwise a lookup is done
490
 * in the predefined entities too.
491
 *
492
 * Returns A pointer to the entity structure or NULL if not found.
493
 */
494
xmlEntityPtr
495
2.05M
xmlGetDocEntity(const xmlDoc *doc, const xmlChar *name) {
496
2.05M
    xmlEntityPtr cur;
497
2.05M
    xmlEntitiesTablePtr table;
498
499
2.05M
    if (doc != NULL) {
500
2.04M
  if ((doc->intSubset != NULL) && (doc->intSubset->entities != NULL)) {
501
1.03M
      table = (xmlEntitiesTablePtr) doc->intSubset->entities;
502
1.03M
      cur = xmlGetEntityFromTable(table, name);
503
1.03M
      if (cur != NULL)
504
642k
    return(cur);
505
1.03M
  }
506
1.40M
  if (doc->standalone != 1) {
507
1.40M
      if ((doc->extSubset != NULL) &&
508
1.40M
    (doc->extSubset->entities != NULL)) {
509
111k
    table = (xmlEntitiesTablePtr) doc->extSubset->entities;
510
111k
    cur = xmlGetEntityFromTable(table, name);
511
111k
    if (cur != NULL)
512
248
        return(cur);
513
111k
      }
514
1.40M
  }
515
1.40M
    }
516
1.40M
    return(xmlGetPredefinedEntity(name));
517
2.05M
}
518
519
/*
520
 * xmlSerializeHexCharRef:
521
 * @buf:  a char buffer
522
 * @val:  a codepoint
523
 *
524
 * Serializes a hex char ref like &#xA0;
525
 *
526
 * Writes at most 9 bytes. Does not include a terminating zero byte.
527
 *
528
 * Returns the number of bytes written.
529
 */
530
int
531
15.4k
xmlSerializeHexCharRef(char *buf, int val) {
532
15.4k
    char *out = buf;
533
15.4k
    int shift = 0, bits;
534
535
15.4k
    *out++ = '&';
536
15.4k
    *out++ = '#';
537
15.4k
    *out++ = 'x';
538
539
15.4k
    bits = val;
540
15.4k
    if (bits & 0xFF0000) {
541
19
        shift = 16;
542
19
        bits &= 0xFF0000;
543
15.4k
    } else if (bits & 0x00FF00) {
544
468
        shift = 8;
545
468
        bits &= 0x00FF00;
546
468
    }
547
15.4k
    if (bits & 0xF0F0F0) {
548
14.9k
        shift += 4;
549
14.9k
    }
550
551
31.4k
    do {
552
31.4k
        int d = (val >> shift) & 0x0F;
553
554
31.4k
        if (d < 10)
555
17.9k
            *out++ = '0' + d;
556
13.5k
        else
557
13.5k
            *out++ = 'A' + (d - 10);
558
559
31.4k
  shift -= 4;
560
31.4k
    } while (shift >= 0);
561
562
15.4k
    *out++ = ';';
563
564
15.4k
    return(out - buf);
565
15.4k
}
566
567
/*
568
 * xmlSerializeDecCharRef:
569
 * @buf:  a char buffer
570
 * @val:  a codepoint
571
 *
572
 * Serializes a decimal char ref like &#38;
573
 *
574
 * Writes at most 10 bytes. Does not include a terminating zero byte.
575
 *
576
 * Returns the number of bytes written.
577
 */
578
int
579
70.0M
xmlSerializeDecCharRef(char *buf, int val) {
580
70.0M
    char *out = buf;
581
70.0M
    int len, i;
582
583
70.0M
    *out++ = '&';
584
70.0M
    *out++ = '#';
585
586
70.0M
    if (val < 100) {
587
1.15k
        len = (val < 10) ? 1 : 2;
588
70.0M
    } else if (val < 10000) {
589
70.0M
        len = (val < 1000) ? 3 : 4;
590
70.0M
    } else if (val < 1000000) {
591
7.33k
        len = (val < 100000) ? 5 : 6;
592
7.33k
    } else {
593
116
        len = 7;
594
116
    }
595
596
281M
    for (i = len - 1; i >= 0; i--) {
597
211M
        out[i] = '0' + val % 10;
598
211M
        val /= 10;
599
211M
    }
600
601
70.0M
    out[len] = ';';
602
603
70.0M
    return(len + 3);
604
70.0M
}
605
606
static const char xmlEscapeSafe[128] = {
607
    0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 0, 0, 0, 0,
608
    0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
609
    1, 1, 0, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1,
610
    1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 0, 1,
611
    1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
612
    1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
613
    1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
614
    1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1
615
};
616
617
/*
618
 * xmlEscapeText:
619
 * @text:  input text
620
 * @flags:  XML_ESCAPE flags
621
 *
622
 * Escapes certain characters with char refs.
623
 *
624
 * XML_ESCAPE_ATTR: for attribute content.
625
 * XML_ESCAPE_NON_ASCII: escape non-ASCII chars.
626
 * XML_ESCAPE_HTML: for HTML content.
627
 * XML_ESCAPE_QUOT: escape double quotes.
628
 * XML_ESCAPE_ALLOW_INVALID: allow invalid characters.
629
 *
630
 * Returns an escaped string or NULL if a memory allocation failed.
631
 */
632
xmlChar *
633
64.8k
xmlEscapeText(const xmlChar *text, int flags) {
634
64.8k
    const xmlChar *cur;
635
64.8k
    xmlChar *buffer;
636
64.8k
    xmlChar *out;
637
64.8k
    const xmlChar *unescaped;
638
64.8k
    size_t size = 50;
639
640
64.8k
    buffer = xmlMalloc(size + 1);
641
64.8k
    if (buffer == NULL)
642
61
        return(NULL);
643
64.7k
    out = buffer;
644
645
64.7k
    cur = text;
646
64.7k
    unescaped = cur;
647
648
455k
    while (*cur != '\0') {
649
390k
        char buf[12];
650
390k
  const xmlChar *end;
651
390k
        const xmlChar *repl;
652
390k
        size_t used;
653
390k
        size_t replSize;
654
390k
        size_t unescapedSize;
655
390k
        size_t totalSize;
656
390k
        int chunkSize = 1;
657
390k
        int c;
658
659
        /* accelerator */
660
153M
  while (1) {
661
153M
            c = *cur;
662
663
153M
            if (c < 0x80) {
664
21.2M
                if (!xmlEscapeSafe[*cur])
665
390k
                    break;
666
132M
            } else {
667
132M
               if (flags & XML_ESCAPE_NON_ASCII)
668
0
                   break;
669
132M
            }
670
153M
            cur += 1;
671
153M
        }
672
673
390k
        if (c == 0) {
674
58.8k
            chunkSize = 0;
675
58.8k
            repl = BAD_CAST "";
676
58.8k
            replSize = 0;
677
331k
        } else if (c == '<') {
678
      /*
679
       * Special handling of server side include in HTML attributes
680
       */
681
71.9k
      if ((flags & XML_ESCAPE_HTML) && (flags & XML_ESCAPE_ATTR) &&
682
71.9k
          (cur[1] == '!') && (cur[2] == '-') && (cur[3] == '-') &&
683
71.9k
          ((end = xmlStrstr(cur, BAD_CAST "-->")) != NULL)) {
684
6.49k
                chunkSize = (end - cur) + 3;
685
6.49k
                repl = cur;
686
6.49k
                replSize = chunkSize;
687
65.4k
      } else {
688
65.4k
                repl = BAD_CAST "&lt;";
689
65.4k
                replSize = 4;
690
65.4k
            }
691
259k
  } else if (c == '>') {
692
94.2k
            repl = BAD_CAST "&gt;";
693
94.2k
            replSize = 4;
694
165k
  } else if (c == '&') {
695
      /*
696
       * Special handling of &{...} construct from HTML 4, see
697
       * http://www.w3.org/TR/html401/appendix/notes.html#h-B.7.1
698
       */
699
13.4k
      if ((flags & XML_ESCAPE_HTML) && (flags & XML_ESCAPE_ATTR) &&
700
13.4k
                (cur[1] == '{') && (end = xmlStrchr(cur, '}'))) {
701
3.11k
                chunkSize = (end - cur) + 1;
702
3.11k
                repl = cur;
703
3.11k
                replSize = chunkSize;
704
10.3k
      } else {
705
10.3k
                repl = BAD_CAST "&amp;";
706
10.3k
                replSize = 5;
707
10.3k
            }
708
152k
  } else if ((flags & XML_ESCAPE_QUOT) && (c == '"')) {
709
0
            repl = BAD_CAST "&quot;";
710
0
            replSize = 6;
711
152k
  } else if (((flags & XML_ESCAPE_HTML) == 0) && (c == '\r')) {
712
0
      repl = BAD_CAST "&#13;";
713
0
            replSize = 5;
714
152k
  } else if ((flags & XML_ESCAPE_NON_ASCII) && (c >= 0x80)) {
715
0
            int val;
716
717
0
            chunkSize = 4;
718
0
            val = xmlGetUTF8Char(cur, &chunkSize);
719
0
            if (val < 0) {
720
0
                val = 0xFFFD;
721
0
                chunkSize = 1;
722
0
            } else if (((flags & XML_ESCAPE_ALLOW_INVALID) == 0) &&
723
0
                       (!IS_CHAR(val))) {
724
0
                val = 0xFFFD;
725
0
            }
726
727
0
            replSize = xmlSerializeHexCharRef(buf, val);
728
0
            repl = BAD_CAST buf;
729
152k
  } else if ((flags & (XML_ESCAPE_ALLOW_INVALID | XML_ESCAPE_HTML)) ||
730
152k
                   (c >= 0x20) ||
731
152k
             (c == '\n') || (c == '\t') || (c == '\r')) {
732
      /* default case, just copy */
733
152k
            cur += 1;
734
152k
            if (*cur != 0)
735
150k
                continue;
736
737
1.17k
            chunkSize = 0;
738
1.17k
            repl = BAD_CAST "";
739
1.17k
            replSize = 0;
740
1.17k
  } else {
741
            /* ignore */
742
0
            repl = BAD_CAST "";
743
0
            replSize = 0;
744
0
        }
745
746
239k
        used = out - buffer;
747
239k
        unescapedSize = cur - unescaped;
748
239k
        totalSize = unescapedSize + replSize;
749
750
239k
  cur += chunkSize;
751
752
239k
        if (totalSize > size - used) {
753
20.4k
            xmlChar *tmp;
754
20.4k
            int newSize;
755
756
20.4k
            if ((size > (SIZE_MAX - 1) / 2) ||
757
20.4k
                (totalSize > (SIZE_MAX - 1) / 2 - size)) {
758
0
                xmlFree(buffer);
759
0
                return(NULL);
760
0
            }
761
20.4k
            newSize = size + totalSize;
762
20.4k
            if (*cur != 0)
763
10.7k
                newSize *= 2;
764
20.4k
            tmp = xmlRealloc(buffer, newSize + 1);
765
20.4k
            if (tmp == NULL) {
766
6
                xmlFree(buffer);
767
6
                return(NULL);
768
6
            }
769
20.4k
            buffer = tmp;
770
20.4k
            size = newSize;
771
20.4k
            out = buffer + used;
772
20.4k
        }
773
774
239k
        memcpy(out, unescaped, unescapedSize);
775
239k
        out += unescapedSize;
776
239k
        memcpy(out, repl, replSize);
777
239k
        out += replSize;
778
779
239k
        unescaped = cur;
780
239k
    }
781
782
64.7k
    *out = 0;
783
64.7k
    return(buffer);
784
64.7k
}
785
786
/**
787
 * xmlEncodeEntitiesInternal:
788
 * @doc:  the document containing the string
789
 * @input:  A string to convert to XML.
790
 * @flags:  XML_ESCAPE flags
791
 *
792
 * Do a global encoding of a string, replacing the predefined entities
793
 * and non ASCII values with their entities and CharRef counterparts.
794
 * Contrary to xmlEncodeEntities, this routine is reentrant, and result
795
 * must be deallocated.
796
 *
797
 * Returns A newly allocated string with the substitution done.
798
 */
799
xmlChar *
800
xmlEncodeEntitiesInternal(xmlDocPtr doc, const xmlChar *input,
801
64.8k
                          unsigned flags) {
802
64.8k
    if (input == NULL)
803
0
        return(NULL);
804
805
64.8k
    if ((doc != NULL) && (doc->type == XML_HTML_DOCUMENT_NODE))
806
64.8k
        flags |= XML_ESCAPE_HTML;
807
0
    else if ((doc == NULL) || (doc->encoding == NULL))
808
0
        flags |= XML_ESCAPE_NON_ASCII;
809
810
64.8k
    return(xmlEscapeText(input, flags));
811
64.8k
}
812
813
/**
814
 * xmlEncodeEntitiesReentrant:
815
 * @doc:  the document containing the string
816
 * @input:  A string to convert to XML.
817
 *
818
 * Do a global encoding of a string, replacing the predefined entities
819
 * and non ASCII values with their entities and CharRef counterparts.
820
 * Contrary to xmlEncodeEntities, this routine is reentrant, and result
821
 * must be deallocated.
822
 *
823
 * This escapes '<', '>', '&' and '\r'. If the document has no encoding,
824
 * non-ASCII codepoints are escaped. There is some special handling for
825
 * HTML documents.
826
 *
827
 * Returns A newly allocated string with the substitution done.
828
 */
829
xmlChar *
830
42.9k
xmlEncodeEntitiesReentrant(xmlDocPtr doc, const xmlChar *input) {
831
42.9k
    return xmlEncodeEntitiesInternal(doc, input, 0);
832
42.9k
}
833
834
/**
835
 * xmlEncodeSpecialChars:
836
 * @doc:  unused
837
 * @input:  A string to convert to XML.
838
 *
839
 * Do a global encoding of a string, replacing the predefined entities
840
 * this routine is reentrant, and result must be deallocated.
841
 *
842
 * This escapes '<', '>', '&', '"' and '\r' chars.
843
 *
844
 * Returns A newly allocated string with the substitution done.
845
 */
846
xmlChar *
847
xmlEncodeSpecialChars(const xmlDoc *doc ATTRIBUTE_UNUSED,
848
0
                      const xmlChar *input) {
849
0
    if (input == NULL)
850
0
        return(NULL);
851
852
0
    return(xmlEscapeText(input, XML_ESCAPE_QUOT | XML_ESCAPE_ALLOW_INVALID));
853
0
}
854
855
/**
856
 * xmlCreateEntitiesTable:
857
 *
858
 * create and initialize an empty entities hash table.
859
 * This really doesn't make sense and should be deprecated
860
 *
861
 * Returns the xmlEntitiesTablePtr just created or NULL in case of error.
862
 */
863
xmlEntitiesTablePtr
864
0
xmlCreateEntitiesTable(void) {
865
0
    return((xmlEntitiesTablePtr) xmlHashCreate(0));
866
0
}
867
868
/**
869
 * xmlFreeEntityWrapper:
870
 * @entity:  An entity
871
 * @name:  its name
872
 *
873
 * Deallocate the memory used by an entities in the hash table.
874
 */
875
static void
876
103k
xmlFreeEntityWrapper(void *entity, const xmlChar *name ATTRIBUTE_UNUSED) {
877
103k
    if (entity != NULL)
878
103k
  xmlFreeEntity((xmlEntityPtr) entity);
879
103k
}
880
881
/**
882
 * xmlFreeEntitiesTable:
883
 * @table:  An entity table
884
 *
885
 * Deallocate the memory used by an entities hash table.
886
 */
887
void
888
66.5k
xmlFreeEntitiesTable(xmlEntitiesTablePtr table) {
889
66.5k
    xmlHashFree(table, xmlFreeEntityWrapper);
890
66.5k
}
891
892
/**
893
 * xmlCopyEntity:
894
 * @ent:  An entity
895
 *
896
 * Build a copy of an entity
897
 *
898
 * Returns the new xmlEntitiesPtr or NULL in case of error.
899
 */
900
static void *
901
0
xmlCopyEntity(void *payload, const xmlChar *name ATTRIBUTE_UNUSED) {
902
0
    xmlEntityPtr ent = (xmlEntityPtr) payload;
903
0
    xmlEntityPtr cur;
904
905
0
    cur = (xmlEntityPtr) xmlMalloc(sizeof(xmlEntity));
906
0
    if (cur == NULL)
907
0
  return(NULL);
908
0
    memset(cur, 0, sizeof(xmlEntity));
909
0
    cur->type = XML_ENTITY_DECL;
910
911
0
    cur->etype = ent->etype;
912
0
    if (ent->name != NULL) {
913
0
  cur->name = xmlStrdup(ent->name);
914
0
        if (cur->name == NULL)
915
0
            goto error;
916
0
    }
917
0
    if (ent->ExternalID != NULL) {
918
0
  cur->ExternalID = xmlStrdup(ent->ExternalID);
919
0
        if (cur->ExternalID == NULL)
920
0
            goto error;
921
0
    }
922
0
    if (ent->SystemID != NULL) {
923
0
  cur->SystemID = xmlStrdup(ent->SystemID);
924
0
        if (cur->SystemID == NULL)
925
0
            goto error;
926
0
    }
927
0
    if (ent->content != NULL) {
928
0
  cur->content = xmlStrdup(ent->content);
929
0
        if (cur->content == NULL)
930
0
            goto error;
931
0
    }
932
0
    if (ent->orig != NULL) {
933
0
  cur->orig = xmlStrdup(ent->orig);
934
0
        if (cur->orig == NULL)
935
0
            goto error;
936
0
    }
937
0
    if (ent->URI != NULL) {
938
0
  cur->URI = xmlStrdup(ent->URI);
939
0
        if (cur->URI == NULL)
940
0
            goto error;
941
0
    }
942
0
    return(cur);
943
944
0
error:
945
0
    xmlFreeEntity(cur);
946
0
    return(NULL);
947
0
}
948
949
/**
950
 * xmlCopyEntitiesTable:
951
 * @table:  An entity table
952
 *
953
 * Build a copy of an entity table.
954
 *
955
 * Returns the new xmlEntitiesTablePtr or NULL in case of error.
956
 */
957
xmlEntitiesTablePtr
958
0
xmlCopyEntitiesTable(xmlEntitiesTablePtr table) {
959
0
    return(xmlHashCopySafe(table, xmlCopyEntity, xmlFreeEntityWrapper));
960
0
}
961
962
#ifdef LIBXML_OUTPUT_ENABLED
963
964
/**
965
 * xmlDumpEntityDecl:
966
 * @buf:  An XML buffer.
967
 * @ent:  An entity table
968
 *
969
 * This will dump the content of the entity table as an XML DTD definition
970
 */
971
void
972
0
xmlDumpEntityDecl(xmlBufferPtr buf, xmlEntityPtr ent) {
973
0
    xmlSaveCtxtPtr save;
974
975
0
    if ((buf == NULL) || (ent == NULL))
976
0
        return;
977
978
0
    save = xmlSaveToBuffer(buf, NULL, 0);
979
0
    xmlSaveTree(save, (xmlNodePtr) ent);
980
0
    if (xmlSaveFinish(save) != XML_ERR_OK)
981
0
        xmlFree(xmlBufferDetach(buf));
982
0
}
983
984
/**
985
 * xmlDumpEntityDeclScan:
986
 * @ent:  An entity table
987
 * @buf:  An XML buffer.
988
 *
989
 * When using the hash table scan function, arguments need to be reversed
990
 */
991
static void
992
xmlDumpEntityDeclScan(void *ent, void *save,
993
0
                      const xmlChar *name ATTRIBUTE_UNUSED) {
994
0
    xmlSaveTree(save, ent);
995
0
}
996
997
/**
998
 * xmlDumpEntitiesTable:
999
 * @buf:  An XML buffer.
1000
 * @table:  An entity table
1001
 *
1002
 * This will dump the content of the entity table as an XML DTD definition
1003
 */
1004
void
1005
0
xmlDumpEntitiesTable(xmlBufferPtr buf, xmlEntitiesTablePtr table) {
1006
0
    xmlSaveCtxtPtr save;
1007
1008
0
    if ((buf == NULL) || (table == NULL))
1009
0
        return;
1010
1011
0
    save = xmlSaveToBuffer(buf, NULL, 0);
1012
0
    xmlHashScan(table, xmlDumpEntityDeclScan, save);
1013
0
    if (xmlSaveFinish(save) != XML_ERR_OK)
1014
0
        xmlFree(xmlBufferDetach(buf));
1015
0
}
1016
#endif /* LIBXML_OUTPUT_ENABLED */