Coverage Report

Created: 2025-10-13 06:56

next uncovered line (L), next uncovered region (R), next uncovered branch (B)
/src/libxml2/entities.c
Line
Count
Source
1
/*
2
 * entities.c : implementation for the XML entities handling
3
 *
4
 * See Copyright for the status of this software.
5
 *
6
 * daniel@veillard.com
7
 */
8
9
/* To avoid EBCDIC trouble when parsing on zOS */
10
#if defined(__MVS__)
11
#pragma convert("ISO8859-1")
12
#endif
13
14
#define IN_LIBXML
15
#include "libxml.h"
16
17
#include <string.h>
18
#include <stdlib.h>
19
20
#include <libxml/xmlmemory.h>
21
#include <libxml/hash.h>
22
#include <libxml/entities.h>
23
#include <libxml/parser.h>
24
#include <libxml/parserInternals.h>
25
#include <libxml/xmlerror.h>
26
#include <libxml/dict.h>
27
#include <libxml/xmlsave.h>
28
29
#include "private/entities.h"
30
#include "private/error.h"
31
32
#ifndef SIZE_MAX
33
  #define SIZE_MAX ((size_t) -1)
34
#endif
35
36
/*
37
 * The XML predefined entities.
38
 */
39
40
static xmlEntity xmlEntityLt = {
41
    NULL, XML_ENTITY_DECL, BAD_CAST "lt",
42
    NULL, NULL, NULL, NULL, NULL, NULL,
43
    BAD_CAST "<", BAD_CAST "<", 1,
44
    XML_INTERNAL_PREDEFINED_ENTITY,
45
    NULL, NULL, NULL, NULL, 0, 0, 0
46
};
47
static xmlEntity xmlEntityGt = {
48
    NULL, XML_ENTITY_DECL, BAD_CAST "gt",
49
    NULL, NULL, NULL, NULL, NULL, NULL,
50
    BAD_CAST ">", BAD_CAST ">", 1,
51
    XML_INTERNAL_PREDEFINED_ENTITY,
52
    NULL, NULL, NULL, NULL, 0, 0, 0
53
};
54
static xmlEntity xmlEntityAmp = {
55
    NULL, XML_ENTITY_DECL, BAD_CAST "amp",
56
    NULL, NULL, NULL, NULL, NULL, NULL,
57
    BAD_CAST "&", BAD_CAST "&", 1,
58
    XML_INTERNAL_PREDEFINED_ENTITY,
59
    NULL, NULL, NULL, NULL, 0, 0, 0
60
};
61
static xmlEntity xmlEntityQuot = {
62
    NULL, XML_ENTITY_DECL, BAD_CAST "quot",
63
    NULL, NULL, NULL, NULL, NULL, NULL,
64
    BAD_CAST "\"", BAD_CAST "\"", 1,
65
    XML_INTERNAL_PREDEFINED_ENTITY,
66
    NULL, NULL, NULL, NULL, 0, 0, 0
67
};
68
static xmlEntity xmlEntityApos = {
69
    NULL, XML_ENTITY_DECL, BAD_CAST "apos",
70
    NULL, NULL, NULL, NULL, NULL, NULL,
71
    BAD_CAST "'", BAD_CAST "'", 1,
72
    XML_INTERNAL_PREDEFINED_ENTITY,
73
    NULL, NULL, NULL, NULL, 0, 0, 0
74
};
75
76
/*
77
 * xmlFreeEntity:
78
 * @entity:  an entity
79
 *
80
 * Frees the entity.
81
 */
82
void
83
xmlFreeEntity(xmlEntityPtr entity)
84
109k
{
85
109k
    xmlDictPtr dict = NULL;
86
87
109k
    if (entity == NULL)
88
0
        return;
89
90
109k
    if (entity->doc != NULL)
91
109k
        dict = entity->doc->dict;
92
93
94
109k
    if ((entity->children) &&
95
2.03k
        (entity == (xmlEntityPtr) entity->children->parent))
96
2.03k
        xmlFreeNodeList(entity->children);
97
109k
    if ((entity->name != NULL) &&
98
109k
        ((dict == NULL) || (!xmlDictOwns(dict, entity->name))))
99
11.9k
        xmlFree((char *) entity->name);
100
109k
    if (entity->ExternalID != NULL)
101
12.0k
        xmlFree((char *) entity->ExternalID);
102
109k
    if (entity->SystemID != NULL)
103
39.1k
        xmlFree((char *) entity->SystemID);
104
109k
    if (entity->URI != NULL)
105
36.6k
        xmlFree((char *) entity->URI);
106
109k
    if (entity->content != NULL)
107
69.9k
        xmlFree((char *) entity->content);
108
109k
    if (entity->orig != NULL)
109
46.2k
        xmlFree((char *) entity->orig);
110
109k
    xmlFree(entity);
111
109k
}
112
113
/*
114
 * xmlCreateEntity:
115
 *
116
 * internal routine doing the entity node structures allocations
117
 */
118
static xmlEntityPtr
119
xmlCreateEntity(xmlDocPtr doc, const xmlChar *name, int type,
120
          const xmlChar *ExternalID, const xmlChar *SystemID,
121
109k
          const xmlChar *content) {
122
109k
    xmlEntityPtr ret;
123
124
109k
    ret = (xmlEntityPtr) xmlMalloc(sizeof(xmlEntity));
125
109k
    if (ret == NULL)
126
7
  return(NULL);
127
109k
    memset(ret, 0, sizeof(xmlEntity));
128
109k
    ret->doc = doc;
129
109k
    ret->type = XML_ENTITY_DECL;
130
131
    /*
132
     * fill the structure.
133
     */
134
109k
    ret->etype = (xmlEntityType) type;
135
109k
    if ((doc == NULL) || (doc->dict == NULL))
136
11.9k
  ret->name = xmlStrdup(name);
137
97.8k
    else
138
97.8k
        ret->name = xmlDictLookup(doc->dict, name, -1);
139
109k
    if (ret->name == NULL)
140
3
        goto error;
141
109k
    if (ExternalID != NULL) {
142
12.0k
        ret->ExternalID = xmlStrdup(ExternalID);
143
12.0k
        if (ret->ExternalID == NULL)
144
1
            goto error;
145
12.0k
    }
146
109k
    if (SystemID != NULL) {
147
39.1k
        ret->SystemID = xmlStrdup(SystemID);
148
39.1k
        if (ret->SystemID == NULL)
149
2
            goto error;
150
39.1k
    }
151
109k
    if (content != NULL) {
152
69.2k
        ret->length = xmlStrlen(content);
153
69.2k
  ret->content = xmlStrndup(content, ret->length);
154
69.2k
        if (ret->content == NULL)
155
4
            goto error;
156
69.2k
     } else {
157
40.5k
        ret->length = 0;
158
40.5k
        ret->content = NULL;
159
40.5k
    }
160
109k
    ret->URI = NULL; /* to be computed by the layer knowing
161
      the defining entity */
162
109k
    ret->orig = NULL;
163
164
109k
    return(ret);
165
166
10
error:
167
10
    xmlFreeEntity(ret);
168
10
    return(NULL);
169
109k
}
170
171
/**
172
 * xmlAddEntity:
173
 * @doc:  the document
174
 * @extSubset:  add to the external or internal subset
175
 * @name:  the entity name
176
 * @type:  the entity type XML_xxx_yyy_ENTITY
177
 * @ExternalID:  the entity external ID if available
178
 * @SystemID:  the entity system ID if available
179
 * @content:  the entity content
180
 * @out:  pointer to resulting entity (optional)
181
 *
182
 * Register a new entity for this document.
183
 *
184
 * Available since 2.13.0.
185
 *
186
 * Returns an xmlParserErrors error code.
187
 */
188
int
189
xmlAddEntity(xmlDocPtr doc, int extSubset, const xmlChar *name, int type,
190
    const xmlChar *ExternalID, const xmlChar *SystemID,
191
117k
    const xmlChar *content, xmlEntityPtr *out) {
192
117k
    xmlDtdPtr dtd;
193
117k
    xmlDictPtr dict = NULL;
194
117k
    xmlEntitiesTablePtr table = NULL;
195
117k
    xmlEntityPtr ret, predef;
196
117k
    int res;
197
198
117k
    if (out != NULL)
199
117k
        *out = NULL;
200
117k
    if ((doc == NULL) || (name == NULL))
201
0
  return(XML_ERR_ARGUMENT);
202
117k
    dict = doc->dict;
203
204
117k
    if (extSubset)
205
14.6k
        dtd = doc->extSubset;
206
103k
    else
207
103k
        dtd = doc->intSubset;
208
117k
    if (dtd == NULL)
209
0
        return(XML_DTD_NO_DTD);
210
211
117k
    switch (type) {
212
46.4k
        case XML_INTERNAL_GENERAL_ENTITY:
213
59.9k
        case XML_EXTERNAL_GENERAL_PARSED_ENTITY:
214
60.1k
        case XML_EXTERNAL_GENERAL_UNPARSED_ENTITY:
215
60.1k
            predef = xmlGetPredefinedEntity(name);
216
60.1k
            if (predef != NULL) {
217
11.1k
                int valid = 0;
218
219
                /* 4.6 Predefined Entities */
220
11.1k
                if ((type == XML_INTERNAL_GENERAL_ENTITY) &&
221
10.4k
                    (content != NULL)) {
222
10.0k
                    int c = predef->content[0];
223
224
10.0k
                    if (((content[0] == c) && (content[1] == 0)) &&
225
2.03k
                        ((c == '>') || (c == '\'') || (c == '"'))) {
226
1.77k
                        valid = 1;
227
8.30k
                    } else if ((content[0] == '&') && (content[1] == '#')) {
228
3.69k
                        if (content[2] == 'x') {
229
2.43k
                            xmlChar *hex = BAD_CAST "0123456789ABCDEF";
230
2.43k
                            xmlChar ref[] = "00;";
231
232
2.43k
                            ref[0] = hex[c / 16 % 16];
233
2.43k
                            ref[1] = hex[c % 16];
234
2.43k
                            if (xmlStrcasecmp(&content[3], ref) == 0)
235
707
                                valid = 1;
236
2.43k
                        } else {
237
1.25k
                            xmlChar ref[] = "00;";
238
239
1.25k
                            ref[0] = '0' + c / 10 % 10;
240
1.25k
                            ref[1] = '0' + c % 10;
241
1.25k
                            if (xmlStrEqual(&content[2], ref))
242
746
                                valid = 1;
243
1.25k
                        }
244
3.69k
                    }
245
10.0k
                }
246
11.1k
                if (!valid)
247
7.90k
                    return(XML_ERR_REDECL_PREDEF_ENTITY);
248
11.1k
            }
249
52.2k
      if (dtd->entities == NULL) {
250
28.0k
    dtd->entities = xmlHashCreateDict(0, dict);
251
28.0k
                if (dtd->entities == NULL)
252
1
                    return(XML_ERR_NO_MEMORY);
253
28.0k
            }
254
52.2k
      table = dtd->entities;
255
52.2k
      break;
256
30.5k
        case XML_INTERNAL_PARAMETER_ENTITY:
257
57.5k
        case XML_EXTERNAL_PARAMETER_ENTITY:
258
57.5k
      if (dtd->pentities == NULL) {
259
23.5k
    dtd->pentities = xmlHashCreateDict(0, dict);
260
23.5k
                if (dtd->pentities == NULL)
261
6
                    return(XML_ERR_NO_MEMORY);
262
23.5k
            }
263
57.5k
      table = dtd->pentities;
264
57.5k
      break;
265
0
        default:
266
0
      return(XML_ERR_ARGUMENT);
267
117k
    }
268
109k
    ret = xmlCreateEntity(dtd->doc, name, type, ExternalID, SystemID, content);
269
109k
    if (ret == NULL)
270
17
        return(XML_ERR_NO_MEMORY);
271
272
109k
    res = xmlHashAdd(table, name, ret);
273
109k
    if (res < 0) {
274
4
        xmlFreeEntity(ret);
275
4
        return(XML_ERR_NO_MEMORY);
276
109k
    } else if (res == 0) {
277
  /*
278
   * entity was already defined at another level.
279
   */
280
23.7k
        xmlFreeEntity(ret);
281
23.7k
  return(XML_WAR_ENTITY_REDEFINED);
282
23.7k
    }
283
284
    /*
285
     * Link it to the DTD
286
     */
287
86.0k
    ret->parent = dtd;
288
86.0k
    ret->doc = dtd->doc;
289
86.0k
    if (dtd->last == NULL) {
290
36.3k
  dtd->children = dtd->last = (xmlNodePtr) ret;
291
49.7k
    } else {
292
49.7k
  dtd->last->next = (xmlNodePtr) ret;
293
49.7k
  ret->prev = dtd->last;
294
49.7k
  dtd->last = (xmlNodePtr) ret;
295
49.7k
    }
296
297
86.0k
    if (out != NULL)
298
86.0k
        *out = ret;
299
86.0k
    return(0);
300
109k
}
301
302
/**
303
 * xmlGetPredefinedEntity:
304
 * @name:  the entity name
305
 *
306
 * Check whether this name is an predefined entity.
307
 *
308
 * Returns NULL if not, otherwise the entity
309
 */
310
xmlEntityPtr
311
3.69M
xmlGetPredefinedEntity(const xmlChar *name) {
312
3.69M
    if (name == NULL) return(NULL);
313
3.69M
    switch (name[0]) {
314
28.2k
        case 'l':
315
28.2k
      if (xmlStrEqual(name, BAD_CAST "lt"))
316
15.7k
          return(&xmlEntityLt);
317
12.5k
      break;
318
40.4k
        case 'g':
319
40.4k
      if (xmlStrEqual(name, BAD_CAST "gt"))
320
37.8k
          return(&xmlEntityGt);
321
2.56k
      break;
322
1.24M
        case 'a':
323
1.24M
      if (xmlStrEqual(name, BAD_CAST "amp"))
324
59.8k
          return(&xmlEntityAmp);
325
1.18M
      if (xmlStrEqual(name, BAD_CAST "apos"))
326
2.69k
          return(&xmlEntityApos);
327
1.18M
      break;
328
1.18M
        case 'q':
329
492k
      if (xmlStrEqual(name, BAD_CAST "quot"))
330
4.98k
          return(&xmlEntityQuot);
331
487k
      break;
332
1.88M
  default:
333
1.88M
      break;
334
3.69M
    }
335
3.56M
    return(NULL);
336
3.69M
}
337
338
/**
339
 * xmlAddDtdEntity:
340
 * @doc:  the document
341
 * @name:  the entity name
342
 * @type:  the entity type XML_xxx_yyy_ENTITY
343
 * @ExternalID:  the entity external ID if available
344
 * @SystemID:  the entity system ID if available
345
 * @content:  the entity content
346
 *
347
 * Register a new entity for this document DTD external subset.
348
 *
349
 * Returns a pointer to the entity or NULL in case of error
350
 */
351
xmlEntityPtr
352
xmlAddDtdEntity(xmlDocPtr doc, const xmlChar *name, int type,
353
          const xmlChar *ExternalID, const xmlChar *SystemID,
354
0
    const xmlChar *content) {
355
0
    xmlEntityPtr ret;
356
357
0
    xmlAddEntity(doc, 1, name, type, ExternalID, SystemID, content, &ret);
358
0
    return(ret);
359
0
}
360
361
/**
362
 * xmlAddDocEntity:
363
 * @doc:  the document
364
 * @name:  the entity name
365
 * @type:  the entity type XML_xxx_yyy_ENTITY
366
 * @ExternalID:  the entity external ID if available
367
 * @SystemID:  the entity system ID if available
368
 * @content:  the entity content
369
 *
370
 * Register a new entity for this document.
371
 *
372
 * Returns a pointer to the entity or NULL in case of error
373
 */
374
xmlEntityPtr
375
xmlAddDocEntity(xmlDocPtr doc, const xmlChar *name, int type,
376
          const xmlChar *ExternalID, const xmlChar *SystemID,
377
0
          const xmlChar *content) {
378
0
    xmlEntityPtr ret;
379
380
0
    xmlAddEntity(doc, 0, name, type, ExternalID, SystemID, content, &ret);
381
0
    return(ret);
382
0
}
383
384
/**
385
 * xmlNewEntity:
386
 * @doc:  the document
387
 * @name:  the entity name
388
 * @type:  the entity type XML_xxx_yyy_ENTITY
389
 * @ExternalID:  the entity external ID if available
390
 * @SystemID:  the entity system ID if available
391
 * @content:  the entity content
392
 *
393
 * Create a new entity, this differs from xmlAddDocEntity() that if
394
 * the document is NULL or has no internal subset defined, then an
395
 * unlinked entity structure will be returned, it is then the responsibility
396
 * of the caller to link it to the document later or free it when not needed
397
 * anymore.
398
 *
399
 * Returns a pointer to the entity or NULL in case of error
400
 */
401
xmlEntityPtr
402
xmlNewEntity(xmlDocPtr doc, const xmlChar *name, int type,
403
       const xmlChar *ExternalID, const xmlChar *SystemID,
404
0
       const xmlChar *content) {
405
0
    if ((doc != NULL) && (doc->intSubset != NULL)) {
406
0
  return(xmlAddDocEntity(doc, name, type, ExternalID, SystemID, content));
407
0
    }
408
0
    if (name == NULL)
409
0
        return(NULL);
410
0
    return(xmlCreateEntity(doc, name, type, ExternalID, SystemID, content));
411
0
}
412
413
/**
414
 * xmlGetEntityFromTable:
415
 * @table:  an entity table
416
 * @name:  the entity name
417
 * @parameter:  look for parameter entities
418
 *
419
 * Do an entity lookup in the table.
420
 * returns the corresponding parameter entity, if found.
421
 *
422
 * Returns A pointer to the entity structure or NULL if not found.
423
 */
424
static xmlEntityPtr
425
1.42M
xmlGetEntityFromTable(xmlEntitiesTablePtr table, const xmlChar *name) {
426
1.42M
    return((xmlEntityPtr) xmlHashLookup(table, name));
427
1.42M
}
428
429
/**
430
 * xmlGetParameterEntity:
431
 * @doc:  the document referencing the entity
432
 * @name:  the entity name
433
 *
434
 * Do an entity lookup in the internal and external subsets and
435
 * returns the corresponding parameter entity, if found.
436
 *
437
 * Returns A pointer to the entity structure or NULL if not found.
438
 */
439
xmlEntityPtr
440
101k
xmlGetParameterEntity(xmlDocPtr doc, const xmlChar *name) {
441
101k
    xmlEntitiesTablePtr table;
442
101k
    xmlEntityPtr ret;
443
444
101k
    if (doc == NULL)
445
1.01k
  return(NULL);
446
100k
    if ((doc->intSubset != NULL) && (doc->intSubset->pentities != NULL)) {
447
87.9k
  table = (xmlEntitiesTablePtr) doc->intSubset->pentities;
448
87.9k
  ret = xmlGetEntityFromTable(table, name);
449
87.9k
  if (ret != NULL)
450
59.3k
      return(ret);
451
87.9k
    }
452
41.3k
    if ((doc->extSubset != NULL) && (doc->extSubset->pentities != NULL)) {
453
15.3k
  table = (xmlEntitiesTablePtr) doc->extSubset->pentities;
454
15.3k
  return(xmlGetEntityFromTable(table, name));
455
15.3k
    }
456
25.9k
    return(NULL);
457
41.3k
}
458
459
/**
460
 * xmlGetDtdEntity:
461
 * @doc:  the document referencing the entity
462
 * @name:  the entity name
463
 *
464
 * Do an entity lookup in the DTD entity hash table and
465
 * returns the corresponding entity, if found.
466
 * Note: the first argument is the document node, not the DTD node.
467
 *
468
 * Returns A pointer to the entity structure or NULL if not found.
469
 */
470
xmlEntityPtr
471
0
xmlGetDtdEntity(xmlDocPtr doc, const xmlChar *name) {
472
0
    xmlEntitiesTablePtr table;
473
474
0
    if (doc == NULL)
475
0
  return(NULL);
476
0
    if ((doc->extSubset != NULL) && (doc->extSubset->entities != NULL)) {
477
0
  table = (xmlEntitiesTablePtr) doc->extSubset->entities;
478
0
  return(xmlGetEntityFromTable(table, name));
479
0
    }
480
0
    return(NULL);
481
0
}
482
483
/**
484
 * xmlGetDocEntity:
485
 * @doc:  the document referencing the entity
486
 * @name:  the entity name
487
 *
488
 * Do an entity lookup in the document entity hash table and
489
 * returns the corresponding entity, otherwise a lookup is done
490
 * in the predefined entities too.
491
 *
492
 * Returns A pointer to the entity structure or NULL if not found.
493
 */
494
xmlEntityPtr
495
2.23M
xmlGetDocEntity(const xmlDoc *doc, const xmlChar *name) {
496
2.23M
    xmlEntityPtr cur;
497
2.23M
    xmlEntitiesTablePtr table;
498
499
2.23M
    if (doc != NULL) {
500
2.23M
  if ((doc->intSubset != NULL) && (doc->intSubset->entities != NULL)) {
501
1.25M
      table = (xmlEntitiesTablePtr) doc->intSubset->entities;
502
1.25M
      cur = xmlGetEntityFromTable(table, name);
503
1.25M
      if (cur != NULL)
504
1.13M
    return(cur);
505
1.25M
  }
506
1.10M
  if (doc->standalone != 1) {
507
1.10M
      if ((doc->extSubset != NULL) &&
508
65.7k
    (doc->extSubset->entities != NULL)) {
509
64.3k
    table = (xmlEntitiesTablePtr) doc->extSubset->entities;
510
64.3k
    cur = xmlGetEntityFromTable(table, name);
511
64.3k
    if (cur != NULL)
512
2.66k
        return(cur);
513
64.3k
      }
514
1.10M
  }
515
1.10M
    }
516
1.09M
    return(xmlGetPredefinedEntity(name));
517
2.23M
}
518
519
/*
520
 * xmlSerializeHexCharRef:
521
 * @buf:  a char buffer
522
 * @val:  a codepoint
523
 *
524
 * Serializes a hex char ref like &#xA0;
525
 *
526
 * Writes at most 9 bytes. Does not include a terminating zero byte.
527
 *
528
 * Returns the number of bytes written.
529
 */
530
int
531
1.60k
xmlSerializeHexCharRef(char *buf, int val) {
532
1.60k
    char *out = buf;
533
1.60k
    int shift = 0, bits;
534
535
1.60k
    *out++ = '&';
536
1.60k
    *out++ = '#';
537
1.60k
    *out++ = 'x';
538
539
1.60k
    bits = val;
540
1.60k
    if (bits & 0xFF0000) {
541
433
        shift = 16;
542
433
        bits &= 0xFF0000;
543
1.16k
    } else if (bits & 0x00FF00) {
544
532
        shift = 8;
545
532
        bits &= 0x00FF00;
546
532
    }
547
1.60k
    if (bits & 0xF0F0F0) {
548
675
        shift += 4;
549
675
    }
550
551
5.07k
    do {
552
5.07k
        int d = (val >> shift) & 0x0F;
553
554
5.07k
        if (d < 10)
555
3.31k
            *out++ = '0' + d;
556
1.75k
        else
557
1.75k
            *out++ = 'A' + (d - 10);
558
559
5.07k
  shift -= 4;
560
5.07k
    } while (shift >= 0);
561
562
1.60k
    *out++ = ';';
563
564
1.60k
    return(out - buf);
565
1.60k
}
566
567
/*
568
 * xmlSerializeDecCharRef:
569
 * @buf:  a char buffer
570
 * @val:  a codepoint
571
 *
572
 * Serializes a decimal char ref like &#38;
573
 *
574
 * Writes at most 10 bytes. Does not include a terminating zero byte.
575
 *
576
 * Returns the number of bytes written.
577
 */
578
int
579
148M
xmlSerializeDecCharRef(char *buf, int val) {
580
148M
    char *out = buf;
581
148M
    int len, i;
582
583
148M
    *out++ = '&';
584
148M
    *out++ = '#';
585
586
148M
    if (val < 100) {
587
1.53k
        len = (val < 10) ? 1 : 2;
588
148M
    } else if (val < 10000) {
589
148M
        len = (val < 1000) ? 3 : 4;
590
148M
    } else if (val < 1000000) {
591
7.59k
        len = (val < 100000) ? 5 : 6;
592
7.59k
    } else {
593
385
        len = 7;
594
385
    }
595
596
599M
    for (i = len - 1; i >= 0; i--) {
597
451M
        out[i] = '0' + val % 10;
598
451M
        val /= 10;
599
451M
    }
600
601
148M
    out[len] = ';';
602
603
148M
    return(len + 3);
604
148M
}
605
606
static const char xmlEscapeSafe[128] = {
607
    0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 0, 0, 0, 0,
608
    0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
609
    1, 1, 0, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1,
610
    1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 0, 1,
611
    1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
612
    1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
613
    1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
614
    1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1
615
};
616
617
/*
618
 * xmlEscapeText:
619
 * @text:  input text
620
 * @flags:  XML_ESCAPE flags
621
 *
622
 * Escapes certain characters with char refs.
623
 *
624
 * XML_ESCAPE_ATTR: for attribute content.
625
 * XML_ESCAPE_NON_ASCII: escape non-ASCII chars.
626
 * XML_ESCAPE_HTML: for HTML content.
627
 * XML_ESCAPE_QUOT: escape double quotes.
628
 * XML_ESCAPE_ALLOW_INVALID: allow invalid characters.
629
 *
630
 * Returns an escaped string or NULL if a memory allocation failed.
631
 */
632
xmlChar *
633
53.4k
xmlEscapeText(const xmlChar *text, int flags) {
634
53.4k
    const xmlChar *cur;
635
53.4k
    xmlChar *buffer;
636
53.4k
    xmlChar *out;
637
53.4k
    const xmlChar *unescaped;
638
53.4k
    size_t size = 50;
639
640
53.4k
    buffer = xmlMalloc(size + 1);
641
53.4k
    if (buffer == NULL)
642
68
        return(NULL);
643
53.3k
    out = buffer;
644
645
53.3k
    cur = text;
646
53.3k
    unescaped = cur;
647
648
197k
    while (*cur != '\0') {
649
144k
        char buf[12];
650
144k
  const xmlChar *end;
651
144k
        const xmlChar *repl;
652
144k
        size_t used;
653
144k
        size_t replSize;
654
144k
        size_t unescapedSize;
655
144k
        size_t totalSize;
656
144k
        int chunkSize = 1;
657
144k
        int c;
658
659
        /* accelerator */
660
171M
  while (1) {
661
171M
            c = *cur;
662
663
171M
            if (c < 0x80) {
664
5.61M
                if (!xmlEscapeSafe[*cur])
665
144k
                    break;
666
165M
            } else {
667
165M
               if (flags & XML_ESCAPE_NON_ASCII)
668
0
                   break;
669
165M
            }
670
171M
            cur += 1;
671
171M
        }
672
673
144k
        if (c == 0) {
674
49.8k
            chunkSize = 0;
675
49.8k
            repl = BAD_CAST "";
676
49.8k
            replSize = 0;
677
94.6k
        } else if (c == '<') {
678
      /*
679
       * Special handling of server side include in HTML attributes
680
       */
681
12.2k
      if ((flags & XML_ESCAPE_HTML) && (flags & XML_ESCAPE_ATTR) &&
682
11.4k
          (cur[1] == '!') && (cur[2] == '-') && (cur[3] == '-') &&
683
1.08k
          ((end = xmlStrstr(cur, BAD_CAST "-->")) != NULL)) {
684
845
                chunkSize = (end - cur) + 3;
685
845
                repl = cur;
686
845
                replSize = chunkSize;
687
11.4k
      } else {
688
11.4k
                repl = BAD_CAST "&lt;";
689
11.4k
                replSize = 4;
690
11.4k
            }
691
82.4k
  } else if (c == '>') {
692
30.0k
            repl = BAD_CAST "&gt;";
693
30.0k
            replSize = 4;
694
52.3k
  } else if (c == '&') {
695
      /*
696
       * Special handling of &{...} construct from HTML 4, see
697
       * http://www.w3.org/TR/html401/appendix/notes.html#h-B.7.1
698
       */
699
4.87k
      if ((flags & XML_ESCAPE_HTML) && (flags & XML_ESCAPE_ATTR) &&
700
4.39k
                (cur[1] == '{') && (end = xmlStrchr(cur, '}'))) {
701
1.92k
                chunkSize = (end - cur) + 1;
702
1.92k
                repl = cur;
703
1.92k
                replSize = chunkSize;
704
2.94k
      } else {
705
2.94k
                repl = BAD_CAST "&amp;";
706
2.94k
                replSize = 5;
707
2.94k
            }
708
47.5k
  } else if ((flags & XML_ESCAPE_QUOT) && (c == '"')) {
709
0
            repl = BAD_CAST "&quot;";
710
0
            replSize = 6;
711
47.5k
  } else if (((flags & XML_ESCAPE_HTML) == 0) && (c == '\r')) {
712
0
      repl = BAD_CAST "&#13;";
713
0
            replSize = 5;
714
47.5k
  } else if ((flags & XML_ESCAPE_NON_ASCII) && (c >= 0x80)) {
715
0
            int val;
716
717
0
            chunkSize = 4;
718
0
            val = xmlGetUTF8Char(cur, &chunkSize);
719
0
            if (val < 0) {
720
0
                val = 0xFFFD;
721
0
                chunkSize = 1;
722
0
            } else if (((flags & XML_ESCAPE_ALLOW_INVALID) == 0) &&
723
0
                       (!IS_CHAR(val))) {
724
0
                val = 0xFFFD;
725
0
            }
726
727
0
            replSize = xmlSerializeHexCharRef(buf, val);
728
0
            repl = BAD_CAST buf;
729
47.5k
  } else if ((flags & (XML_ESCAPE_ALLOW_INVALID | XML_ESCAPE_HTML)) ||
730
0
                   (c >= 0x20) ||
731
47.5k
             (c == '\n') || (c == '\t') || (c == '\r')) {
732
      /* default case, just copy */
733
47.5k
            cur += 1;
734
47.5k
            if (*cur != 0)
735
46.6k
                continue;
736
737
861
            chunkSize = 0;
738
861
            repl = BAD_CAST "";
739
861
            replSize = 0;
740
861
  } else {
741
            /* ignore */
742
0
            repl = BAD_CAST "";
743
0
            replSize = 0;
744
0
        }
745
746
97.9k
        used = out - buffer;
747
97.9k
        unescapedSize = cur - unescaped;
748
97.9k
        totalSize = unescapedSize + replSize;
749
750
97.9k
  cur += chunkSize;
751
752
97.9k
        if (totalSize > size - used) {
753
9.70k
            xmlChar *tmp;
754
9.70k
            int newSize;
755
756
9.70k
            if ((size > (SIZE_MAX - 1) / 2) ||
757
9.70k
                (totalSize > (SIZE_MAX - 1) / 2 - size)) {
758
0
                xmlFree(buffer);
759
0
                return(NULL);
760
0
            }
761
9.70k
            newSize = size + totalSize;
762
9.70k
            if (*cur != 0)
763
5.87k
                newSize *= 2;
764
9.70k
            tmp = xmlRealloc(buffer, newSize + 1);
765
9.70k
            if (tmp == NULL) {
766
5
                xmlFree(buffer);
767
5
                return(NULL);
768
5
            }
769
9.70k
            buffer = tmp;
770
9.70k
            size = newSize;
771
9.70k
            out = buffer + used;
772
9.70k
        }
773
774
97.9k
        memcpy(out, unescaped, unescapedSize);
775
97.9k
        out += unescapedSize;
776
97.9k
        memcpy(out, repl, replSize);
777
97.9k
        out += replSize;
778
779
97.9k
        unescaped = cur;
780
97.9k
    }
781
782
53.3k
    *out = 0;
783
53.3k
    return(buffer);
784
53.3k
}
785
786
/**
787
 * xmlEncodeEntitiesInternal:
788
 * @doc:  the document containing the string
789
 * @input:  A string to convert to XML.
790
 * @flags:  XML_ESCAPE flags
791
 *
792
 * Do a global encoding of a string, replacing the predefined entities
793
 * and non ASCII values with their entities and CharRef counterparts.
794
 * Contrary to xmlEncodeEntities, this routine is reentrant, and result
795
 * must be deallocated.
796
 *
797
 * Returns A newly allocated string with the substitution done.
798
 */
799
xmlChar *
800
xmlEncodeEntitiesInternal(xmlDocPtr doc, const xmlChar *input,
801
53.4k
                          unsigned flags) {
802
53.4k
    if (input == NULL)
803
0
        return(NULL);
804
805
53.4k
    if ((doc != NULL) && (doc->type == XML_HTML_DOCUMENT_NODE))
806
53.4k
        flags |= XML_ESCAPE_HTML;
807
0
    else if ((doc == NULL) || (doc->encoding == NULL))
808
0
        flags |= XML_ESCAPE_NON_ASCII;
809
810
53.4k
    return(xmlEscapeText(input, flags));
811
53.4k
}
812
813
/**
814
 * xmlEncodeEntitiesReentrant:
815
 * @doc:  the document containing the string
816
 * @input:  A string to convert to XML.
817
 *
818
 * Do a global encoding of a string, replacing the predefined entities
819
 * and non ASCII values with their entities and CharRef counterparts.
820
 * Contrary to xmlEncodeEntities, this routine is reentrant, and result
821
 * must be deallocated.
822
 *
823
 * This escapes '<', '>', '&' and '\r'. If the document has no encoding,
824
 * non-ASCII codepoints are escaped. There is some special handling for
825
 * HTML documents.
826
 *
827
 * Returns A newly allocated string with the substitution done.
828
 */
829
xmlChar *
830
35.7k
xmlEncodeEntitiesReentrant(xmlDocPtr doc, const xmlChar *input) {
831
35.7k
    return xmlEncodeEntitiesInternal(doc, input, 0);
832
35.7k
}
833
834
/**
835
 * xmlEncodeSpecialChars:
836
 * @doc:  unused
837
 * @input:  A string to convert to XML.
838
 *
839
 * Do a global encoding of a string, replacing the predefined entities
840
 * this routine is reentrant, and result must be deallocated.
841
 *
842
 * This escapes '<', '>', '&', '"' and '\r' chars.
843
 *
844
 * Returns A newly allocated string with the substitution done.
845
 */
846
xmlChar *
847
xmlEncodeSpecialChars(const xmlDoc *doc ATTRIBUTE_UNUSED,
848
0
                      const xmlChar *input) {
849
0
    if (input == NULL)
850
0
        return(NULL);
851
852
0
    return(xmlEscapeText(input, XML_ESCAPE_QUOT | XML_ESCAPE_ALLOW_INVALID));
853
0
}
854
855
/**
856
 * xmlCreateEntitiesTable:
857
 *
858
 * create and initialize an empty entities hash table.
859
 * This really doesn't make sense and should be deprecated
860
 *
861
 * Returns the xmlEntitiesTablePtr just created or NULL in case of error.
862
 */
863
xmlEntitiesTablePtr
864
0
xmlCreateEntitiesTable(void) {
865
0
    return((xmlEntitiesTablePtr) xmlHashCreate(0));
866
0
}
867
868
/**
869
 * xmlFreeEntityWrapper:
870
 * @entity:  An entity
871
 * @name:  its name
872
 *
873
 * Deallocate the memory used by an entities in the hash table.
874
 */
875
static void
876
86.0k
xmlFreeEntityWrapper(void *entity, const xmlChar *name ATTRIBUTE_UNUSED) {
877
86.0k
    if (entity != NULL)
878
86.0k
  xmlFreeEntity((xmlEntityPtr) entity);
879
86.0k
}
880
881
/**
882
 * xmlFreeEntitiesTable:
883
 * @table:  An entity table
884
 *
885
 * Deallocate the memory used by an entities hash table.
886
 */
887
void
888
51.5k
xmlFreeEntitiesTable(xmlEntitiesTablePtr table) {
889
51.5k
    xmlHashFree(table, xmlFreeEntityWrapper);
890
51.5k
}
891
892
/**
893
 * xmlCopyEntity:
894
 * @ent:  An entity
895
 *
896
 * Build a copy of an entity
897
 *
898
 * Returns the new xmlEntitiesPtr or NULL in case of error.
899
 */
900
static void *
901
0
xmlCopyEntity(void *payload, const xmlChar *name ATTRIBUTE_UNUSED) {
902
0
    xmlEntityPtr ent = (xmlEntityPtr) payload;
903
0
    xmlEntityPtr cur;
904
905
0
    cur = (xmlEntityPtr) xmlMalloc(sizeof(xmlEntity));
906
0
    if (cur == NULL)
907
0
  return(NULL);
908
0
    memset(cur, 0, sizeof(xmlEntity));
909
0
    cur->type = XML_ENTITY_DECL;
910
911
0
    cur->etype = ent->etype;
912
0
    if (ent->name != NULL) {
913
0
  cur->name = xmlStrdup(ent->name);
914
0
        if (cur->name == NULL)
915
0
            goto error;
916
0
    }
917
0
    if (ent->ExternalID != NULL) {
918
0
  cur->ExternalID = xmlStrdup(ent->ExternalID);
919
0
        if (cur->ExternalID == NULL)
920
0
            goto error;
921
0
    }
922
0
    if (ent->SystemID != NULL) {
923
0
  cur->SystemID = xmlStrdup(ent->SystemID);
924
0
        if (cur->SystemID == NULL)
925
0
            goto error;
926
0
    }
927
0
    if (ent->content != NULL) {
928
0
  cur->content = xmlStrdup(ent->content);
929
0
        if (cur->content == NULL)
930
0
            goto error;
931
0
    }
932
0
    if (ent->orig != NULL) {
933
0
  cur->orig = xmlStrdup(ent->orig);
934
0
        if (cur->orig == NULL)
935
0
            goto error;
936
0
    }
937
0
    if (ent->URI != NULL) {
938
0
  cur->URI = xmlStrdup(ent->URI);
939
0
        if (cur->URI == NULL)
940
0
            goto error;
941
0
    }
942
0
    return(cur);
943
944
0
error:
945
0
    xmlFreeEntity(cur);
946
0
    return(NULL);
947
0
}
948
949
/**
950
 * xmlCopyEntitiesTable:
951
 * @table:  An entity table
952
 *
953
 * Build a copy of an entity table.
954
 *
955
 * Returns the new xmlEntitiesTablePtr or NULL in case of error.
956
 */
957
xmlEntitiesTablePtr
958
0
xmlCopyEntitiesTable(xmlEntitiesTablePtr table) {
959
0
    return(xmlHashCopySafe(table, xmlCopyEntity, xmlFreeEntityWrapper));
960
0
}
961
962
#ifdef LIBXML_OUTPUT_ENABLED
963
964
/**
965
 * xmlDumpEntityDecl:
966
 * @buf:  An XML buffer.
967
 * @ent:  An entity table
968
 *
969
 * This will dump the content of the entity table as an XML DTD definition
970
 */
971
void
972
0
xmlDumpEntityDecl(xmlBufferPtr buf, xmlEntityPtr ent) {
973
0
    xmlSaveCtxtPtr save;
974
975
0
    if ((buf == NULL) || (ent == NULL))
976
0
        return;
977
978
0
    save = xmlSaveToBuffer(buf, NULL, 0);
979
0
    xmlSaveTree(save, (xmlNodePtr) ent);
980
0
    if (xmlSaveFinish(save) != XML_ERR_OK)
981
0
        xmlFree(xmlBufferDetach(buf));
982
0
}
983
984
/**
985
 * xmlDumpEntityDeclScan:
986
 * @ent:  An entity table
987
 * @buf:  An XML buffer.
988
 *
989
 * When using the hash table scan function, arguments need to be reversed
990
 */
991
static void
992
xmlDumpEntityDeclScan(void *ent, void *save,
993
0
                      const xmlChar *name ATTRIBUTE_UNUSED) {
994
0
    xmlSaveTree(save, ent);
995
0
}
996
997
/**
998
 * xmlDumpEntitiesTable:
999
 * @buf:  An XML buffer.
1000
 * @table:  An entity table
1001
 *
1002
 * This will dump the content of the entity table as an XML DTD definition
1003
 */
1004
void
1005
0
xmlDumpEntitiesTable(xmlBufferPtr buf, xmlEntitiesTablePtr table) {
1006
0
    xmlSaveCtxtPtr save;
1007
1008
0
    if ((buf == NULL) || (table == NULL))
1009
0
        return;
1010
1011
0
    save = xmlSaveToBuffer(buf, NULL, 0);
1012
0
    xmlHashScan(table, xmlDumpEntityDeclScan, save);
1013
0
    if (xmlSaveFinish(save) != XML_ERR_OK)
1014
0
        xmlFree(xmlBufferDetach(buf));
1015
0
}
1016
#endif /* LIBXML_OUTPUT_ENABLED */