Coverage Report

Created: 2026-03-21 06:11

next uncovered line (L), next uncovered region (R), next uncovered branch (B)
/src/libxml2/entities.c
Line
Count
Source
1
/*
2
 * entities.c : implementation for the XML entities handling
3
 *
4
 * See Copyright for the status of this software.
5
 *
6
 * daniel@veillard.com
7
 */
8
9
/* To avoid EBCDIC trouble when parsing on zOS */
10
#if defined(__MVS__)
11
#pragma convert("ISO8859-1")
12
#endif
13
14
#define IN_LIBXML
15
#include "libxml.h"
16
17
#include <string.h>
18
#include <stdlib.h>
19
20
#include <libxml/xmlmemory.h>
21
#include <libxml/hash.h>
22
#include <libxml/entities.h>
23
#include <libxml/parser.h>
24
#include <libxml/parserInternals.h>
25
#include <libxml/xmlerror.h>
26
#include <libxml/dict.h>
27
#include <libxml/xmlsave.h>
28
29
#include "private/entities.h"
30
#include "private/error.h"
31
32
#ifndef SIZE_MAX
33
  #define SIZE_MAX ((size_t) -1)
34
#endif
35
36
/*
37
 * The XML predefined entities.
38
 */
39
40
static xmlEntity xmlEntityLt = {
41
    NULL, XML_ENTITY_DECL, BAD_CAST "lt",
42
    NULL, NULL, NULL, NULL, NULL, NULL,
43
    BAD_CAST "<", BAD_CAST "<", 1,
44
    XML_INTERNAL_PREDEFINED_ENTITY,
45
    NULL, NULL, NULL, NULL, 0, 0, 0
46
};
47
static xmlEntity xmlEntityGt = {
48
    NULL, XML_ENTITY_DECL, BAD_CAST "gt",
49
    NULL, NULL, NULL, NULL, NULL, NULL,
50
    BAD_CAST ">", BAD_CAST ">", 1,
51
    XML_INTERNAL_PREDEFINED_ENTITY,
52
    NULL, NULL, NULL, NULL, 0, 0, 0
53
};
54
static xmlEntity xmlEntityAmp = {
55
    NULL, XML_ENTITY_DECL, BAD_CAST "amp",
56
    NULL, NULL, NULL, NULL, NULL, NULL,
57
    BAD_CAST "&", BAD_CAST "&", 1,
58
    XML_INTERNAL_PREDEFINED_ENTITY,
59
    NULL, NULL, NULL, NULL, 0, 0, 0
60
};
61
static xmlEntity xmlEntityQuot = {
62
    NULL, XML_ENTITY_DECL, BAD_CAST "quot",
63
    NULL, NULL, NULL, NULL, NULL, NULL,
64
    BAD_CAST "\"", BAD_CAST "\"", 1,
65
    XML_INTERNAL_PREDEFINED_ENTITY,
66
    NULL, NULL, NULL, NULL, 0, 0, 0
67
};
68
static xmlEntity xmlEntityApos = {
69
    NULL, XML_ENTITY_DECL, BAD_CAST "apos",
70
    NULL, NULL, NULL, NULL, NULL, NULL,
71
    BAD_CAST "'", BAD_CAST "'", 1,
72
    XML_INTERNAL_PREDEFINED_ENTITY,
73
    NULL, NULL, NULL, NULL, 0, 0, 0
74
};
75
76
/*
77
 * xmlFreeEntity:
78
 * @entity:  an entity
79
 *
80
 * Frees the entity.
81
 */
82
void
83
xmlFreeEntity(xmlEntityPtr entity)
84
71.5k
{
85
71.5k
    xmlDictPtr dict = NULL;
86
87
71.5k
    if (entity == NULL)
88
0
        return;
89
90
71.5k
    if (entity->doc != NULL)
91
71.4k
        dict = entity->doc->dict;
92
93
94
71.5k
    if ((entity->children) &&
95
1.39k
        (entity == (xmlEntityPtr) entity->children->parent))
96
1.39k
        xmlFreeNodeList(entity->children);
97
71.5k
    if ((entity->name != NULL) &&
98
71.5k
        ((dict == NULL) || (!xmlDictOwns(dict, entity->name))))
99
21.2k
        xmlFree((char *) entity->name);
100
71.5k
    if (entity->ExternalID != NULL)
101
6.78k
        xmlFree((char *) entity->ExternalID);
102
71.5k
    if (entity->SystemID != NULL)
103
26.7k
        xmlFree((char *) entity->SystemID);
104
71.5k
    if (entity->URI != NULL)
105
25.0k
        xmlFree((char *) entity->URI);
106
71.5k
    if (entity->content != NULL)
107
44.4k
        xmlFree((char *) entity->content);
108
71.5k
    if (entity->orig != NULL)
109
41.1k
        xmlFree((char *) entity->orig);
110
71.5k
    xmlFree(entity);
111
71.5k
}
112
113
/*
114
 * xmlCreateEntity:
115
 *
116
 * internal routine doing the entity node structures allocations
117
 */
118
static xmlEntityPtr
119
xmlCreateEntity(xmlDocPtr doc, const xmlChar *name, int type,
120
          const xmlChar *ExternalID, const xmlChar *SystemID,
121
59.5k
          const xmlChar *content) {
122
59.5k
    xmlEntityPtr ret;
123
124
59.5k
    ret = (xmlEntityPtr) xmlMalloc(sizeof(xmlEntity));
125
59.5k
    if (ret == NULL)
126
9
  return(NULL);
127
59.5k
    memset(ret, 0, sizeof(xmlEntity));
128
59.5k
    ret->doc = doc;
129
59.5k
    ret->type = XML_ENTITY_DECL;
130
131
    /*
132
     * fill the structure.
133
     */
134
59.5k
    ret->etype = (xmlEntityType) type;
135
59.5k
    if ((doc == NULL) || (doc->dict == NULL))
136
9.29k
  ret->name = xmlStrdup(name);
137
50.2k
    else
138
50.2k
        ret->name = xmlDictLookup(doc->dict, name, -1);
139
59.5k
    if (ret->name == NULL)
140
1
        goto error;
141
59.5k
    if (ExternalID != NULL) {
142
6.78k
        ret->ExternalID = xmlStrdup(ExternalID);
143
6.78k
        if (ret->ExternalID == NULL)
144
1
            goto error;
145
6.78k
    }
146
59.5k
    if (SystemID != NULL) {
147
25.2k
        ret->SystemID = xmlStrdup(SystemID);
148
25.2k
        if (ret->SystemID == NULL)
149
5
            goto error;
150
25.2k
    }
151
59.5k
    if (content != NULL) {
152
33.2k
        ret->length = xmlStrlen(content);
153
33.2k
  ret->content = xmlStrndup(content, ret->length);
154
33.2k
        if (ret->content == NULL)
155
4
            goto error;
156
33.2k
     } else {
157
26.3k
        ret->length = 0;
158
26.3k
        ret->content = NULL;
159
26.3k
    }
160
59.5k
    ret->URI = NULL; /* to be computed by the layer knowing
161
      the defining entity */
162
59.5k
    ret->orig = NULL;
163
164
59.5k
    return(ret);
165
166
11
error:
167
11
    xmlFreeEntity(ret);
168
11
    return(NULL);
169
59.5k
}
170
171
/**
172
 * xmlAddEntity:
173
 * @doc:  the document
174
 * @extSubset:  add to the external or internal subset
175
 * @name:  the entity name
176
 * @type:  the entity type XML_xxx_yyy_ENTITY
177
 * @ExternalID:  the entity external ID if available
178
 * @SystemID:  the entity system ID if available
179
 * @content:  the entity content
180
 * @out:  pointer to resulting entity (optional)
181
 *
182
 * Register a new entity for this document.
183
 *
184
 * Available since 2.13.0.
185
 *
186
 * Returns an xmlParserErrors error code.
187
 */
188
int
189
xmlAddEntity(xmlDocPtr doc, int extSubset, const xmlChar *name, int type,
190
    const xmlChar *ExternalID, const xmlChar *SystemID,
191
61.2k
    const xmlChar *content, xmlEntityPtr *out) {
192
61.2k
    xmlDtdPtr dtd;
193
61.2k
    xmlDictPtr dict = NULL;
194
61.2k
    xmlEntitiesTablePtr table = NULL;
195
61.2k
    xmlEntityPtr ret, predef;
196
61.2k
    int res;
197
198
61.2k
    if (out != NULL)
199
61.2k
        *out = NULL;
200
61.2k
    if ((doc == NULL) || (name == NULL))
201
0
  return(XML_ERR_ARGUMENT);
202
61.2k
    dict = doc->dict;
203
204
61.2k
    if (extSubset)
205
9.42k
        dtd = doc->extSubset;
206
51.8k
    else
207
51.8k
        dtd = doc->intSubset;
208
61.2k
    if (dtd == NULL)
209
0
        return(XML_DTD_NO_DTD);
210
211
61.2k
    switch (type) {
212
20.4k
        case XML_INTERNAL_GENERAL_ENTITY:
213
27.8k
        case XML_EXTERNAL_GENERAL_PARSED_ENTITY:
214
28.0k
        case XML_EXTERNAL_GENERAL_UNPARSED_ENTITY:
215
28.0k
            predef = xmlGetPredefinedEntity(name);
216
28.0k
            if (predef != NULL) {
217
2.85k
                int valid = 0;
218
219
                /* 4.6 Predefined Entities */
220
2.85k
                if ((type == XML_INTERNAL_GENERAL_ENTITY) &&
221
2.67k
                    (content != NULL)) {
222
2.57k
                    int c = predef->content[0];
223
224
2.57k
                    if (((content[0] == c) && (content[1] == 0)) &&
225
1.16k
                        ((c == '>') || (c == '\'') || (c == '"'))) {
226
939
                        valid = 1;
227
1.63k
                    } else if ((content[0] == '&') && (content[1] == '#')) {
228
515
                        if (content[2] == 'x') {
229
36
                            xmlChar *hex = BAD_CAST "0123456789ABCDEF";
230
36
                            xmlChar ref[] = "00;";
231
232
36
                            ref[0] = hex[c / 16 % 16];
233
36
                            ref[1] = hex[c % 16];
234
36
                            if (xmlStrcasecmp(&content[3], ref) == 0)
235
0
                                valid = 1;
236
479
                        } else {
237
479
                            xmlChar ref[] = "00;";
238
239
479
                            ref[0] = '0' + c / 10 % 10;
240
479
                            ref[1] = '0' + c % 10;
241
479
                            if (xmlStrEqual(&content[2], ref))
242
223
                                valid = 1;
243
479
                        }
244
515
                    }
245
2.57k
                }
246
2.85k
                if (!valid)
247
1.69k
                    return(XML_ERR_REDECL_PREDEF_ENTITY);
248
2.85k
            }
249
26.3k
      if (dtd->entities == NULL) {
250
18.0k
    dtd->entities = xmlHashCreateDict(0, dict);
251
18.0k
                if (dtd->entities == NULL)
252
3
                    return(XML_ERR_NO_MEMORY);
253
18.0k
            }
254
26.3k
      table = dtd->entities;
255
26.3k
      break;
256
14.8k
        case XML_INTERNAL_PARAMETER_ENTITY:
257
33.2k
        case XML_EXTERNAL_PARAMETER_ENTITY:
258
33.2k
      if (dtd->pentities == NULL) {
259
17.0k
    dtd->pentities = xmlHashCreateDict(0, dict);
260
17.0k
                if (dtd->pentities == NULL)
261
1
                    return(XML_ERR_NO_MEMORY);
262
17.0k
            }
263
33.2k
      table = dtd->pentities;
264
33.2k
      break;
265
0
        default:
266
0
      return(XML_ERR_ARGUMENT);
267
61.2k
    }
268
59.5k
    ret = xmlCreateEntity(dtd->doc, name, type, ExternalID, SystemID, content);
269
59.5k
    if (ret == NULL)
270
20
        return(XML_ERR_NO_MEMORY);
271
272
59.5k
    res = xmlHashAdd(table, name, ret);
273
59.5k
    if (res < 0) {
274
9
        xmlFreeEntity(ret);
275
9
        return(XML_ERR_NO_MEMORY);
276
59.5k
    } else if (res == 0) {
277
  /*
278
   * entity was already defined at another level.
279
   */
280
1.78k
        xmlFreeEntity(ret);
281
1.78k
  return(XML_WAR_ENTITY_REDEFINED);
282
1.78k
    }
283
284
    /*
285
     * Link it to the DTD
286
     */
287
57.7k
    ret->parent = dtd;
288
57.7k
    ret->doc = dtd->doc;
289
57.7k
    if (dtd->last == NULL) {
290
27.2k
  dtd->children = dtd->last = (xmlNodePtr) ret;
291
30.5k
    } else {
292
30.5k
  dtd->last->next = (xmlNodePtr) ret;
293
30.5k
  ret->prev = dtd->last;
294
30.5k
  dtd->last = (xmlNodePtr) ret;
295
30.5k
    }
296
297
57.7k
    if (out != NULL)
298
57.7k
        *out = ret;
299
57.7k
    return(0);
300
59.5k
}
301
302
/**
303
 * xmlGetPredefinedEntity:
304
 * @name:  the entity name
305
 *
306
 * Check whether this name is an predefined entity.
307
 *
308
 * Returns NULL if not, otherwise the entity
309
 */
310
xmlEntityPtr
311
1.20M
xmlGetPredefinedEntity(const xmlChar *name) {
312
1.20M
    if (name == NULL) return(NULL);
313
1.20M
    switch (name[0]) {
314
9.69k
        case 'l':
315
9.69k
      if (xmlStrEqual(name, BAD_CAST "lt"))
316
7.15k
          return(&xmlEntityLt);
317
2.53k
      break;
318
48.9k
        case 'g':
319
48.9k
      if (xmlStrEqual(name, BAD_CAST "gt"))
320
36.3k
          return(&xmlEntityGt);
321
12.5k
      break;
322
429k
        case 'a':
323
429k
      if (xmlStrEqual(name, BAD_CAST "amp"))
324
53.9k
          return(&xmlEntityAmp);
325
375k
      if (xmlStrEqual(name, BAD_CAST "apos"))
326
1.26k
          return(&xmlEntityApos);
327
374k
      break;
328
374k
        case 'q':
329
354k
      if (xmlStrEqual(name, BAD_CAST "quot"))
330
1.00k
          return(&xmlEntityQuot);
331
353k
      break;
332
365k
  default:
333
365k
      break;
334
1.20M
    }
335
1.10M
    return(NULL);
336
1.20M
}
337
338
/**
339
 * xmlAddDtdEntity:
340
 * @doc:  the document
341
 * @name:  the entity name
342
 * @type:  the entity type XML_xxx_yyy_ENTITY
343
 * @ExternalID:  the entity external ID if available
344
 * @SystemID:  the entity system ID if available
345
 * @content:  the entity content
346
 *
347
 * Register a new entity for this document DTD external subset.
348
 *
349
 * Returns a pointer to the entity or NULL in case of error
350
 */
351
xmlEntityPtr
352
xmlAddDtdEntity(xmlDocPtr doc, const xmlChar *name, int type,
353
          const xmlChar *ExternalID, const xmlChar *SystemID,
354
0
    const xmlChar *content) {
355
0
    xmlEntityPtr ret;
356
357
0
    xmlAddEntity(doc, 1, name, type, ExternalID, SystemID, content, &ret);
358
0
    return(ret);
359
0
}
360
361
/**
362
 * xmlAddDocEntity:
363
 * @doc:  the document
364
 * @name:  the entity name
365
 * @type:  the entity type XML_xxx_yyy_ENTITY
366
 * @ExternalID:  the entity external ID if available
367
 * @SystemID:  the entity system ID if available
368
 * @content:  the entity content
369
 *
370
 * Register a new entity for this document.
371
 *
372
 * Returns a pointer to the entity or NULL in case of error
373
 */
374
xmlEntityPtr
375
xmlAddDocEntity(xmlDocPtr doc, const xmlChar *name, int type,
376
          const xmlChar *ExternalID, const xmlChar *SystemID,
377
0
          const xmlChar *content) {
378
0
    xmlEntityPtr ret;
379
380
0
    xmlAddEntity(doc, 0, name, type, ExternalID, SystemID, content, &ret);
381
0
    return(ret);
382
0
}
383
384
/**
385
 * xmlNewEntity:
386
 * @doc:  the document
387
 * @name:  the entity name
388
 * @type:  the entity type XML_xxx_yyy_ENTITY
389
 * @ExternalID:  the entity external ID if available
390
 * @SystemID:  the entity system ID if available
391
 * @content:  the entity content
392
 *
393
 * Create a new entity, this differs from xmlAddDocEntity() that if
394
 * the document is NULL or has no internal subset defined, then an
395
 * unlinked entity structure will be returned, it is then the responsibility
396
 * of the caller to link it to the document later or free it when not needed
397
 * anymore.
398
 *
399
 * Returns a pointer to the entity or NULL in case of error
400
 */
401
xmlEntityPtr
402
xmlNewEntity(xmlDocPtr doc, const xmlChar *name, int type,
403
       const xmlChar *ExternalID, const xmlChar *SystemID,
404
0
       const xmlChar *content) {
405
0
    if ((doc != NULL) && (doc->intSubset != NULL)) {
406
0
  return(xmlAddDocEntity(doc, name, type, ExternalID, SystemID, content));
407
0
    }
408
0
    if (name == NULL)
409
0
        return(NULL);
410
0
    return(xmlCreateEntity(doc, name, type, ExternalID, SystemID, content));
411
0
}
412
413
/**
414
 * xmlGetEntityFromTable:
415
 * @table:  an entity table
416
 * @name:  the entity name
417
 * @parameter:  look for parameter entities
418
 *
419
 * Do an entity lookup in the table.
420
 * returns the corresponding parameter entity, if found.
421
 *
422
 * Returns A pointer to the entity structure or NULL if not found.
423
 */
424
static xmlEntityPtr
425
547k
xmlGetEntityFromTable(xmlEntitiesTablePtr table, const xmlChar *name) {
426
547k
    return((xmlEntityPtr) xmlHashLookup(table, name));
427
547k
}
428
429
/**
430
 * xmlGetParameterEntity:
431
 * @doc:  the document referencing the entity
432
 * @name:  the entity name
433
 *
434
 * Do an entity lookup in the internal and external subsets and
435
 * returns the corresponding parameter entity, if found.
436
 *
437
 * Returns A pointer to the entity structure or NULL if not found.
438
 */
439
xmlEntityPtr
440
68.6k
xmlGetParameterEntity(xmlDocPtr doc, const xmlChar *name) {
441
68.6k
    xmlEntitiesTablePtr table;
442
68.6k
    xmlEntityPtr ret;
443
444
68.6k
    if (doc == NULL)
445
934
  return(NULL);
446
67.7k
    if ((doc->intSubset != NULL) && (doc->intSubset->pentities != NULL)) {
447
64.5k
  table = (xmlEntitiesTablePtr) doc->intSubset->pentities;
448
64.5k
  ret = xmlGetEntityFromTable(table, name);
449
64.5k
  if (ret != NULL)
450
45.3k
      return(ret);
451
64.5k
    }
452
22.3k
    if ((doc->extSubset != NULL) && (doc->extSubset->pentities != NULL)) {
453
8.83k
  table = (xmlEntitiesTablePtr) doc->extSubset->pentities;
454
8.83k
  return(xmlGetEntityFromTable(table, name));
455
8.83k
    }
456
13.5k
    return(NULL);
457
22.3k
}
458
459
/**
460
 * xmlGetDtdEntity:
461
 * @doc:  the document referencing the entity
462
 * @name:  the entity name
463
 *
464
 * Do an entity lookup in the DTD entity hash table and
465
 * returns the corresponding entity, if found.
466
 * Note: the first argument is the document node, not the DTD node.
467
 *
468
 * Returns A pointer to the entity structure or NULL if not found.
469
 */
470
xmlEntityPtr
471
0
xmlGetDtdEntity(xmlDocPtr doc, const xmlChar *name) {
472
0
    xmlEntitiesTablePtr table;
473
474
0
    if (doc == NULL)
475
0
  return(NULL);
476
0
    if ((doc->extSubset != NULL) && (doc->extSubset->entities != NULL)) {
477
0
  table = (xmlEntitiesTablePtr) doc->extSubset->entities;
478
0
  return(xmlGetEntityFromTable(table, name));
479
0
    }
480
0
    return(NULL);
481
0
}
482
483
/**
484
 * xmlGetDocEntity:
485
 * @doc:  the document referencing the entity
486
 * @name:  the entity name
487
 *
488
 * Do an entity lookup in the document entity hash table and
489
 * returns the corresponding entity, otherwise a lookup is done
490
 * in the predefined entities too.
491
 *
492
 * Returns A pointer to the entity structure or NULL if not found.
493
 */
494
xmlEntityPtr
495
505k
xmlGetDocEntity(const xmlDoc *doc, const xmlChar *name) {
496
505k
    xmlEntityPtr cur;
497
505k
    xmlEntitiesTablePtr table;
498
499
505k
    if (doc != NULL) {
500
485k
  if ((doc->intSubset != NULL) && (doc->intSubset->entities != NULL)) {
501
420k
      table = (xmlEntitiesTablePtr) doc->intSubset->entities;
502
420k
      cur = xmlGetEntityFromTable(table, name);
503
420k
      if (cur != NULL)
504
357k
    return(cur);
505
420k
  }
506
127k
  if (doc->standalone != 1) {
507
127k
      if ((doc->extSubset != NULL) &&
508
55.1k
    (doc->extSubset->entities != NULL)) {
509
53.9k
    table = (xmlEntitiesTablePtr) doc->extSubset->entities;
510
53.9k
    cur = xmlGetEntityFromTable(table, name);
511
53.9k
    if (cur != NULL)
512
52
        return(cur);
513
53.9k
      }
514
127k
  }
515
127k
    }
516
148k
    return(xmlGetPredefinedEntity(name));
517
505k
}
518
519
/*
520
 * xmlSerializeHexCharRef:
521
 * @buf:  a char buffer
522
 * @val:  a codepoint
523
 *
524
 * Serializes a hex char ref like &#xA0;
525
 *
526
 * Writes at most 9 bytes. Does not include a terminating zero byte.
527
 *
528
 * Returns the number of bytes written.
529
 */
530
int
531
834
xmlSerializeHexCharRef(char *buf, int val) {
532
834
    char *out = buf;
533
834
    int shift = 0, bits;
534
535
834
    *out++ = '&';
536
834
    *out++ = '#';
537
834
    *out++ = 'x';
538
539
834
    bits = val;
540
834
    if (bits & 0xFF0000) {
541
79
        shift = 16;
542
79
        bits &= 0xFF0000;
543
755
    } else if (bits & 0x00FF00) {
544
408
        shift = 8;
545
408
        bits &= 0x00FF00;
546
408
    }
547
834
    if (bits & 0xF0F0F0) {
548
702
        shift += 4;
549
702
    }
550
551
2.66k
    do {
552
2.66k
        int d = (val >> shift) & 0x0F;
553
554
2.66k
        if (d < 10)
555
797
            *out++ = '0' + d;
556
1.87k
        else
557
1.87k
            *out++ = 'A' + (d - 10);
558
559
2.66k
  shift -= 4;
560
2.66k
    } while (shift >= 0);
561
562
834
    *out++ = ';';
563
564
834
    return(out - buf);
565
834
}
566
567
/*
568
 * xmlSerializeDecCharRef:
569
 * @buf:  a char buffer
570
 * @val:  a codepoint
571
 *
572
 * Serializes a decimal char ref like &#38;
573
 *
574
 * Writes at most 10 bytes. Does not include a terminating zero byte.
575
 *
576
 * Returns the number of bytes written.
577
 */
578
int
579
84.9M
xmlSerializeDecCharRef(char *buf, int val) {
580
84.9M
    char *out = buf;
581
84.9M
    int len, i;
582
583
84.9M
    *out++ = '&';
584
84.9M
    *out++ = '#';
585
586
84.9M
    if (val < 100) {
587
761
        len = (val < 10) ? 1 : 2;
588
84.9M
    } else if (val < 10000) {
589
84.9M
        len = (val < 1000) ? 3 : 4;
590
84.9M
    } else if (val < 1000000) {
591
5.38k
        len = (val < 100000) ? 5 : 6;
592
5.38k
    } else {
593
206
        len = 7;
594
206
    }
595
596
346M
    for (i = len - 1; i >= 0; i--) {
597
261M
        out[i] = '0' + val % 10;
598
261M
        val /= 10;
599
261M
    }
600
601
84.9M
    out[len] = ';';
602
603
84.9M
    return(len + 3);
604
84.9M
}
605
606
static const char xmlEscapeSafe[128] = {
607
    0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 0, 0, 0, 0,
608
    0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
609
    1, 1, 0, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1,
610
    1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 0, 1,
611
    1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
612
    1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
613
    1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
614
    1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1
615
};
616
617
/*
618
 * xmlEscapeText:
619
 * @text:  input text
620
 * @flags:  XML_ESCAPE flags
621
 *
622
 * Escapes certain characters with char refs.
623
 *
624
 * XML_ESCAPE_ATTR: for attribute content.
625
 * XML_ESCAPE_NON_ASCII: escape non-ASCII chars.
626
 * XML_ESCAPE_HTML: for HTML content.
627
 * XML_ESCAPE_QUOT: escape double quotes.
628
 * XML_ESCAPE_ALLOW_INVALID: allow invalid characters.
629
 *
630
 * Returns an escaped string or NULL if a memory allocation failed.
631
 */
632
xmlChar *
633
19.0k
xmlEscapeText(const xmlChar *text, int flags) {
634
19.0k
    const xmlChar *cur;
635
19.0k
    xmlChar *buffer;
636
19.0k
    xmlChar *out;
637
19.0k
    const xmlChar *unescaped;
638
19.0k
    size_t size = 50;
639
640
19.0k
    buffer = xmlMalloc(size + 1);
641
19.0k
    if (buffer == NULL)
642
54
        return(NULL);
643
18.9k
    out = buffer;
644
645
18.9k
    cur = text;
646
18.9k
    unescaped = cur;
647
648
245k
    while (*cur != '\0') {
649
226k
        char buf[12];
650
226k
  const xmlChar *end;
651
226k
        const xmlChar *repl;
652
226k
        size_t used;
653
226k
        size_t replSize;
654
226k
        size_t unescapedSize;
655
226k
        size_t totalSize;
656
226k
        int chunkSize = 1;
657
226k
        int c;
658
659
        /* accelerator */
660
79.6M
  while (1) {
661
79.6M
            c = *cur;
662
663
79.6M
            if (c < 0x80) {
664
24.4M
                if (!xmlEscapeSafe[*cur])
665
226k
                    break;
666
55.2M
            } else {
667
55.2M
               if (flags & XML_ESCAPE_NON_ASCII)
668
0
                   break;
669
55.2M
            }
670
79.4M
            cur += 1;
671
79.4M
        }
672
673
226k
        if (c == 0) {
674
17.4k
            chunkSize = 0;
675
17.4k
            repl = BAD_CAST "";
676
17.4k
            replSize = 0;
677
208k
        } else if (c == '<') {
678
      /*
679
       * Special handling of server side include in HTML attributes
680
       */
681
10.6k
      if ((flags & XML_ESCAPE_HTML) && (flags & XML_ESCAPE_ATTR) &&
682
10.3k
          (cur[1] == '!') && (cur[2] == '-') && (cur[3] == '-') &&
683
1.23k
          ((end = xmlStrstr(cur, BAD_CAST "-->")) != NULL)) {
684
752
                chunkSize = (end - cur) + 3;
685
752
                repl = cur;
686
752
                replSize = chunkSize;
687
9.93k
      } else {
688
9.93k
                repl = BAD_CAST "&lt;";
689
9.93k
                replSize = 4;
690
9.93k
            }
691
198k
  } else if (c == '>') {
692
162k
            repl = BAD_CAST "&gt;";
693
162k
            replSize = 4;
694
162k
  } else if (c == '&') {
695
      /*
696
       * Special handling of &{...} construct from HTML 4, see
697
       * http://www.w3.org/TR/html401/appendix/notes.html#h-B.7.1
698
       */
699
5.65k
      if ((flags & XML_ESCAPE_HTML) && (flags & XML_ESCAPE_ATTR) &&
700
5.52k
                (cur[1] == '{') && (end = xmlStrchr(cur, '}'))) {
701
835
                chunkSize = (end - cur) + 1;
702
835
                repl = cur;
703
835
                replSize = chunkSize;
704
4.82k
      } else {
705
4.82k
                repl = BAD_CAST "&amp;";
706
4.82k
                replSize = 5;
707
4.82k
            }
708
29.7k
  } else if ((flags & XML_ESCAPE_QUOT) && (c == '"')) {
709
0
            repl = BAD_CAST "&quot;";
710
0
            replSize = 6;
711
29.7k
  } else if (((flags & XML_ESCAPE_HTML) == 0) && (c == '\r')) {
712
0
      repl = BAD_CAST "&#13;";
713
0
            replSize = 5;
714
29.7k
  } else if ((flags & XML_ESCAPE_NON_ASCII) && (c >= 0x80)) {
715
0
            int val;
716
717
0
            chunkSize = 4;
718
0
            val = xmlGetUTF8Char(cur, &chunkSize);
719
0
            if (val < 0) {
720
0
                val = 0xFFFD;
721
0
                chunkSize = 1;
722
0
            } else if (((flags & XML_ESCAPE_ALLOW_INVALID) == 0) &&
723
0
                       (!IS_CHAR(val))) {
724
0
                val = 0xFFFD;
725
0
            }
726
727
0
            replSize = xmlSerializeHexCharRef(buf, val);
728
0
            repl = BAD_CAST buf;
729
29.7k
  } else if ((flags & (XML_ESCAPE_ALLOW_INVALID | XML_ESCAPE_HTML)) ||
730
0
                   (c >= 0x20) ||
731
29.7k
             (c == '\n') || (c == '\t') || (c == '\r')) {
732
      /* default case, just copy */
733
29.7k
            cur += 1;
734
29.7k
            if (*cur != 0)
735
29.2k
                continue;
736
737
537
            chunkSize = 0;
738
537
            repl = BAD_CAST "";
739
537
            replSize = 0;
740
537
  } else {
741
            /* ignore */
742
0
            repl = BAD_CAST "";
743
0
            replSize = 0;
744
0
        }
745
746
197k
        used = out - buffer;
747
197k
        unescapedSize = cur - unescaped;
748
197k
        totalSize = unescapedSize + replSize;
749
750
197k
  cur += chunkSize;
751
752
197k
        if (totalSize > size - used) {
753
4.59k
            xmlChar *tmp;
754
4.59k
            int newSize;
755
756
4.59k
            if ((size > (SIZE_MAX - 1) / 2) ||
757
4.59k
                (totalSize > (SIZE_MAX - 1) / 2 - size)) {
758
0
                xmlFree(buffer);
759
0
                return(NULL);
760
0
            }
761
4.59k
            newSize = size + totalSize;
762
4.59k
            if (*cur != 0)
763
2.83k
                newSize *= 2;
764
4.59k
            tmp = xmlRealloc(buffer, newSize + 1);
765
4.59k
            if (tmp == NULL) {
766
3
                xmlFree(buffer);
767
3
                return(NULL);
768
3
            }
769
4.59k
            buffer = tmp;
770
4.59k
            size = newSize;
771
4.59k
            out = buffer + used;
772
4.59k
        }
773
774
197k
        memcpy(out, unescaped, unescapedSize);
775
197k
        out += unescapedSize;
776
197k
        memcpy(out, repl, replSize);
777
197k
        out += replSize;
778
779
197k
        unescaped = cur;
780
197k
    }
781
782
18.9k
    *out = 0;
783
18.9k
    return(buffer);
784
18.9k
}
785
786
/**
787
 * xmlEncodeEntitiesInternal:
788
 * @doc:  the document containing the string
789
 * @input:  A string to convert to XML.
790
 * @flags:  XML_ESCAPE flags
791
 *
792
 * Do a global encoding of a string, replacing the predefined entities
793
 * and non ASCII values with their entities and CharRef counterparts.
794
 * Contrary to xmlEncodeEntities, this routine is reentrant, and result
795
 * must be deallocated.
796
 *
797
 * Returns A newly allocated string with the substitution done.
798
 */
799
xmlChar *
800
xmlEncodeEntitiesInternal(xmlDocPtr doc, const xmlChar *input,
801
19.0k
                          unsigned flags) {
802
19.0k
    if (input == NULL)
803
0
        return(NULL);
804
805
19.0k
    if ((doc != NULL) && (doc->type == XML_HTML_DOCUMENT_NODE))
806
19.0k
        flags |= XML_ESCAPE_HTML;
807
0
    else if ((doc == NULL) || (doc->encoding == NULL))
808
0
        flags |= XML_ESCAPE_NON_ASCII;
809
810
19.0k
    return(xmlEscapeText(input, flags));
811
19.0k
}
812
813
/**
814
 * xmlEncodeEntitiesReentrant:
815
 * @doc:  the document containing the string
816
 * @input:  A string to convert to XML.
817
 *
818
 * Do a global encoding of a string, replacing the predefined entities
819
 * and non ASCII values with their entities and CharRef counterparts.
820
 * Contrary to xmlEncodeEntities, this routine is reentrant, and result
821
 * must be deallocated.
822
 *
823
 * This escapes '<', '>', '&' and '\r'. If the document has no encoding,
824
 * non-ASCII codepoints are escaped. There is some special handling for
825
 * HTML documents.
826
 *
827
 * Returns A newly allocated string with the substitution done.
828
 */
829
xmlChar *
830
13.7k
xmlEncodeEntitiesReentrant(xmlDocPtr doc, const xmlChar *input) {
831
13.7k
    return xmlEncodeEntitiesInternal(doc, input, 0);
832
13.7k
}
833
834
/**
835
 * xmlEncodeSpecialChars:
836
 * @doc:  unused
837
 * @input:  A string to convert to XML.
838
 *
839
 * Do a global encoding of a string, replacing the predefined entities
840
 * this routine is reentrant, and result must be deallocated.
841
 *
842
 * This escapes '<', '>', '&', '"' and '\r' chars.
843
 *
844
 * Returns A newly allocated string with the substitution done.
845
 */
846
xmlChar *
847
xmlEncodeSpecialChars(const xmlDoc *doc ATTRIBUTE_UNUSED,
848
0
                      const xmlChar *input) {
849
0
    if (input == NULL)
850
0
        return(NULL);
851
852
0
    return(xmlEscapeText(input, XML_ESCAPE_QUOT | XML_ESCAPE_ALLOW_INVALID));
853
0
}
854
855
/**
856
 * xmlCreateEntitiesTable:
857
 *
858
 * create and initialize an empty entities hash table.
859
 * This really doesn't make sense and should be deprecated
860
 *
861
 * Returns the xmlEntitiesTablePtr just created or NULL in case of error.
862
 */
863
xmlEntitiesTablePtr
864
0
xmlCreateEntitiesTable(void) {
865
0
    return((xmlEntitiesTablePtr) xmlHashCreate(0));
866
0
}
867
868
/**
869
 * xmlFreeEntityWrapper:
870
 * @entity:  An entity
871
 * @name:  its name
872
 *
873
 * Deallocate the memory used by an entities in the hash table.
874
 */
875
static void
876
69.7k
xmlFreeEntityWrapper(void *entity, const xmlChar *name ATTRIBUTE_UNUSED) {
877
69.7k
    if (entity != NULL)
878
69.7k
  xmlFreeEntity((xmlEntityPtr) entity);
879
69.7k
}
880
881
/**
882
 * xmlFreeEntitiesTable:
883
 * @table:  An entity table
884
 *
885
 * Deallocate the memory used by an entities hash table.
886
 */
887
void
888
39.6k
xmlFreeEntitiesTable(xmlEntitiesTablePtr table) {
889
39.6k
    xmlHashFree(table, xmlFreeEntityWrapper);
890
39.6k
}
891
892
/**
893
 * xmlCopyEntity:
894
 * @ent:  An entity
895
 *
896
 * Build a copy of an entity
897
 *
898
 * Returns the new xmlEntitiesPtr or NULL in case of error.
899
 */
900
static void *
901
11.9k
xmlCopyEntity(void *payload, const xmlChar *name ATTRIBUTE_UNUSED) {
902
11.9k
    xmlEntityPtr ent = (xmlEntityPtr) payload;
903
11.9k
    xmlEntityPtr cur;
904
905
11.9k
    cur = (xmlEntityPtr) xmlMalloc(sizeof(xmlEntity));
906
11.9k
    if (cur == NULL)
907
2
  return(NULL);
908
11.9k
    memset(cur, 0, sizeof(xmlEntity));
909
11.9k
    cur->type = XML_ENTITY_DECL;
910
911
11.9k
    cur->etype = ent->etype;
912
11.9k
    if (ent->name != NULL) {
913
11.9k
  cur->name = xmlStrdup(ent->name);
914
11.9k
        if (cur->name == NULL)
915
1
            goto error;
916
11.9k
    }
917
11.9k
    if (ent->ExternalID != NULL) {
918
0
  cur->ExternalID = xmlStrdup(ent->ExternalID);
919
0
        if (cur->ExternalID == NULL)
920
0
            goto error;
921
0
    }
922
11.9k
    if (ent->SystemID != NULL) {
923
1.50k
  cur->SystemID = xmlStrdup(ent->SystemID);
924
1.50k
        if (cur->SystemID == NULL)
925
1
            goto error;
926
1.50k
    }
927
11.9k
    if (ent->content != NULL) {
928
10.4k
  cur->content = xmlStrdup(ent->content);
929
10.4k
        if (cur->content == NULL)
930
4
            goto error;
931
10.4k
    }
932
11.9k
    if (ent->orig != NULL) {
933
10.4k
  cur->orig = xmlStrdup(ent->orig);
934
10.4k
        if (cur->orig == NULL)
935
3
            goto error;
936
10.4k
    }
937
11.9k
    if (ent->URI != NULL) {
938
809
  cur->URI = xmlStrdup(ent->URI);
939
809
        if (cur->URI == NULL)
940
1
            goto error;
941
809
    }
942
11.9k
    return(cur);
943
944
10
error:
945
10
    xmlFreeEntity(cur);
946
10
    return(NULL);
947
11.9k
}
948
949
/**
950
 * xmlCopyEntitiesTable:
951
 * @table:  An entity table
952
 *
953
 * Build a copy of an entity table.
954
 *
955
 * Returns the new xmlEntitiesTablePtr or NULL in case of error.
956
 */
957
xmlEntitiesTablePtr
958
4.63k
xmlCopyEntitiesTable(xmlEntitiesTablePtr table) {
959
4.63k
    return(xmlHashCopySafe(table, xmlCopyEntity, xmlFreeEntityWrapper));
960
4.63k
}
961
962
#ifdef LIBXML_OUTPUT_ENABLED
963
964
/**
965
 * xmlDumpEntityDecl:
966
 * @buf:  An XML buffer.
967
 * @ent:  An entity table
968
 *
969
 * This will dump the content of the entity table as an XML DTD definition
970
 */
971
void
972
0
xmlDumpEntityDecl(xmlBufferPtr buf, xmlEntityPtr ent) {
973
0
    xmlSaveCtxtPtr save;
974
975
0
    if ((buf == NULL) || (ent == NULL))
976
0
        return;
977
978
0
    save = xmlSaveToBuffer(buf, NULL, 0);
979
0
    xmlSaveTree(save, (xmlNodePtr) ent);
980
0
    if (xmlSaveFinish(save) != XML_ERR_OK)
981
0
        xmlFree(xmlBufferDetach(buf));
982
0
}
983
984
/**
985
 * xmlDumpEntityDeclScan:
986
 * @ent:  An entity table
987
 * @buf:  An XML buffer.
988
 *
989
 * When using the hash table scan function, arguments need to be reversed
990
 */
991
static void
992
xmlDumpEntityDeclScan(void *ent, void *save,
993
0
                      const xmlChar *name ATTRIBUTE_UNUSED) {
994
0
    xmlSaveTree(save, ent);
995
0
}
996
997
/**
998
 * xmlDumpEntitiesTable:
999
 * @buf:  An XML buffer.
1000
 * @table:  An entity table
1001
 *
1002
 * This will dump the content of the entity table as an XML DTD definition
1003
 */
1004
void
1005
0
xmlDumpEntitiesTable(xmlBufferPtr buf, xmlEntitiesTablePtr table) {
1006
0
    xmlSaveCtxtPtr save;
1007
1008
0
    if ((buf == NULL) || (table == NULL))
1009
0
        return;
1010
1011
0
    save = xmlSaveToBuffer(buf, NULL, 0);
1012
0
    xmlHashScan(table, xmlDumpEntityDeclScan, save);
1013
0
    if (xmlSaveFinish(save) != XML_ERR_OK)
1014
0
        xmlFree(xmlBufferDetach(buf));
1015
0
}
1016
#endif /* LIBXML_OUTPUT_ENABLED */