Coverage Report

Created: 2025-12-03 06:14

next uncovered line (L), next uncovered region (R), next uncovered branch (B)
/src/libxml2/entities.c
Line
Count
Source
1
/*
2
 * entities.c : implementation for the XML entities handling
3
 *
4
 * See Copyright for the status of this software.
5
 *
6
 * daniel@veillard.com
7
 */
8
9
/* To avoid EBCDIC trouble when parsing on zOS */
10
#if defined(__MVS__)
11
#pragma convert("ISO8859-1")
12
#endif
13
14
#define IN_LIBXML
15
#include "libxml.h"
16
17
#include <string.h>
18
#include <stdlib.h>
19
20
#include <libxml/xmlmemory.h>
21
#include <libxml/hash.h>
22
#include <libxml/entities.h>
23
#include <libxml/parser.h>
24
#include <libxml/parserInternals.h>
25
#include <libxml/xmlerror.h>
26
#include <libxml/dict.h>
27
#include <libxml/xmlsave.h>
28
29
#include "private/entities.h"
30
#include "private/error.h"
31
32
#ifndef SIZE_MAX
33
  #define SIZE_MAX ((size_t) -1)
34
#endif
35
36
/*
37
 * The XML predefined entities.
38
 */
39
40
static xmlEntity xmlEntityLt = {
41
    NULL, XML_ENTITY_DECL, BAD_CAST "lt",
42
    NULL, NULL, NULL, NULL, NULL, NULL,
43
    BAD_CAST "<", BAD_CAST "<", 1,
44
    XML_INTERNAL_PREDEFINED_ENTITY,
45
    NULL, NULL, NULL, NULL, 0, 0, 0
46
};
47
static xmlEntity xmlEntityGt = {
48
    NULL, XML_ENTITY_DECL, BAD_CAST "gt",
49
    NULL, NULL, NULL, NULL, NULL, NULL,
50
    BAD_CAST ">", BAD_CAST ">", 1,
51
    XML_INTERNAL_PREDEFINED_ENTITY,
52
    NULL, NULL, NULL, NULL, 0, 0, 0
53
};
54
static xmlEntity xmlEntityAmp = {
55
    NULL, XML_ENTITY_DECL, BAD_CAST "amp",
56
    NULL, NULL, NULL, NULL, NULL, NULL,
57
    BAD_CAST "&", BAD_CAST "&", 1,
58
    XML_INTERNAL_PREDEFINED_ENTITY,
59
    NULL, NULL, NULL, NULL, 0, 0, 0
60
};
61
static xmlEntity xmlEntityQuot = {
62
    NULL, XML_ENTITY_DECL, BAD_CAST "quot",
63
    NULL, NULL, NULL, NULL, NULL, NULL,
64
    BAD_CAST "\"", BAD_CAST "\"", 1,
65
    XML_INTERNAL_PREDEFINED_ENTITY,
66
    NULL, NULL, NULL, NULL, 0, 0, 0
67
};
68
static xmlEntity xmlEntityApos = {
69
    NULL, XML_ENTITY_DECL, BAD_CAST "apos",
70
    NULL, NULL, NULL, NULL, NULL, NULL,
71
    BAD_CAST "'", BAD_CAST "'", 1,
72
    XML_INTERNAL_PREDEFINED_ENTITY,
73
    NULL, NULL, NULL, NULL, 0, 0, 0
74
};
75
76
/*
77
 * xmlFreeEntity:
78
 * @entity:  an entity
79
 *
80
 * Frees the entity.
81
 */
82
void
83
xmlFreeEntity(xmlEntityPtr entity)
84
99.4k
{
85
99.4k
    xmlDictPtr dict = NULL;
86
87
99.4k
    if (entity == NULL)
88
0
        return;
89
90
99.4k
    if (entity->doc != NULL)
91
99.4k
        dict = entity->doc->dict;
92
93
94
99.4k
    if ((entity->children) &&
95
2.07k
        (entity == (xmlEntityPtr) entity->children->parent))
96
2.07k
        xmlFreeNodeList(entity->children);
97
99.4k
    if ((entity->name != NULL) &&
98
99.4k
        ((dict == NULL) || (!xmlDictOwns(dict, entity->name))))
99
13.4k
        xmlFree((char *) entity->name);
100
99.4k
    if (entity->ExternalID != NULL)
101
11.9k
        xmlFree((char *) entity->ExternalID);
102
99.4k
    if (entity->SystemID != NULL)
103
40.8k
        xmlFree((char *) entity->SystemID);
104
99.4k
    if (entity->URI != NULL)
105
37.7k
        xmlFree((char *) entity->URI);
106
99.4k
    if (entity->content != NULL)
107
57.6k
        xmlFree((char *) entity->content);
108
99.4k
    if (entity->orig != NULL)
109
54.8k
        xmlFree((char *) entity->orig);
110
99.4k
    xmlFree(entity);
111
99.4k
}
112
113
/*
114
 * xmlCreateEntity:
115
 *
116
 * internal routine doing the entity node structures allocations
117
 */
118
static xmlEntityPtr
119
xmlCreateEntity(xmlDocPtr doc, const xmlChar *name, int type,
120
          const xmlChar *ExternalID, const xmlChar *SystemID,
121
99.5k
          const xmlChar *content) {
122
99.5k
    xmlEntityPtr ret;
123
124
99.5k
    ret = (xmlEntityPtr) xmlMalloc(sizeof(xmlEntity));
125
99.5k
    if (ret == NULL)
126
5
  return(NULL);
127
99.4k
    memset(ret, 0, sizeof(xmlEntity));
128
99.4k
    ret->doc = doc;
129
99.4k
    ret->type = XML_ENTITY_DECL;
130
131
    /*
132
     * fill the structure.
133
     */
134
99.4k
    ret->etype = (xmlEntityType) type;
135
99.4k
    if ((doc == NULL) || (doc->dict == NULL))
136
13.4k
  ret->name = xmlStrdup(name);
137
86.0k
    else
138
86.0k
        ret->name = xmlDictLookup(doc->dict, name, -1);
139
99.4k
    if (ret->name == NULL)
140
1
        goto error;
141
99.4k
    if (ExternalID != NULL) {
142
11.9k
        ret->ExternalID = xmlStrdup(ExternalID);
143
11.9k
        if (ret->ExternalID == NULL)
144
3
            goto error;
145
11.9k
    }
146
99.4k
    if (SystemID != NULL) {
147
40.8k
        ret->SystemID = xmlStrdup(SystemID);
148
40.8k
        if (ret->SystemID == NULL)
149
2
            goto error;
150
40.8k
    }
151
99.4k
    if (content != NULL) {
152
57.3k
        ret->length = xmlStrlen(content);
153
57.3k
  ret->content = xmlStrndup(content, ret->length);
154
57.3k
        if (ret->content == NULL)
155
5
            goto error;
156
57.3k
     } else {
157
42.1k
        ret->length = 0;
158
42.1k
        ret->content = NULL;
159
42.1k
    }
160
99.4k
    ret->URI = NULL; /* to be computed by the layer knowing
161
      the defining entity */
162
99.4k
    ret->orig = NULL;
163
164
99.4k
    return(ret);
165
166
11
error:
167
11
    xmlFreeEntity(ret);
168
11
    return(NULL);
169
99.4k
}
170
171
/**
172
 * xmlAddEntity:
173
 * @doc:  the document
174
 * @extSubset:  add to the external or internal subset
175
 * @name:  the entity name
176
 * @type:  the entity type XML_xxx_yyy_ENTITY
177
 * @ExternalID:  the entity external ID if available
178
 * @SystemID:  the entity system ID if available
179
 * @content:  the entity content
180
 * @out:  pointer to resulting entity (optional)
181
 *
182
 * Register a new entity for this document.
183
 *
184
 * Available since 2.13.0.
185
 *
186
 * Returns an xmlParserErrors error code.
187
 */
188
int
189
xmlAddEntity(xmlDocPtr doc, int extSubset, const xmlChar *name, int type,
190
    const xmlChar *ExternalID, const xmlChar *SystemID,
191
102k
    const xmlChar *content, xmlEntityPtr *out) {
192
102k
    xmlDtdPtr dtd;
193
102k
    xmlDictPtr dict = NULL;
194
102k
    xmlEntitiesTablePtr table = NULL;
195
102k
    xmlEntityPtr ret, predef;
196
102k
    int res;
197
198
102k
    if (out != NULL)
199
102k
        *out = NULL;
200
102k
    if ((doc == NULL) || (name == NULL))
201
0
  return(XML_ERR_ARGUMENT);
202
102k
    dict = doc->dict;
203
204
102k
    if (extSubset)
205
10.9k
        dtd = doc->extSubset;
206
91.1k
    else
207
91.1k
        dtd = doc->intSubset;
208
102k
    if (dtd == NULL)
209
0
        return(XML_DTD_NO_DTD);
210
211
102k
    switch (type) {
212
29.6k
        case XML_INTERNAL_GENERAL_ENTITY:
213
42.8k
        case XML_EXTERNAL_GENERAL_PARSED_ENTITY:
214
43.0k
        case XML_EXTERNAL_GENERAL_UNPARSED_ENTITY:
215
43.0k
            predef = xmlGetPredefinedEntity(name);
216
43.0k
            if (predef != NULL) {
217
3.29k
                int valid = 0;
218
219
                /* 4.6 Predefined Entities */
220
3.29k
                if ((type == XML_INTERNAL_GENERAL_ENTITY) &&
221
2.85k
                    (content != NULL)) {
222
2.61k
                    int c = predef->content[0];
223
224
2.61k
                    if (((content[0] == c) && (content[1] == 0)) &&
225
672
                        ((c == '>') || (c == '\'') || (c == '"'))) {
226
444
                        valid = 1;
227
2.17k
                    } else if ((content[0] == '&') && (content[1] == '#')) {
228
1.30k
                        if (content[2] == 'x') {
229
231
                            xmlChar *hex = BAD_CAST "0123456789ABCDEF";
230
231
                            xmlChar ref[] = "00;";
231
232
231
                            ref[0] = hex[c / 16 % 16];
233
231
                            ref[1] = hex[c % 16];
234
231
                            if (xmlStrcasecmp(&content[3], ref) == 0)
235
0
                                valid = 1;
236
1.06k
                        } else {
237
1.06k
                            xmlChar ref[] = "00;";
238
239
1.06k
                            ref[0] = '0' + c / 10 % 10;
240
1.06k
                            ref[1] = '0' + c % 10;
241
1.06k
                            if (xmlStrEqual(&content[2], ref))
242
215
                                valid = 1;
243
1.06k
                        }
244
1.30k
                    }
245
2.61k
                }
246
3.29k
                if (!valid)
247
2.63k
                    return(XML_ERR_REDECL_PREDEF_ENTITY);
248
3.29k
            }
249
40.4k
      if (dtd->entities == NULL) {
250
27.8k
    dtd->entities = xmlHashCreateDict(0, dict);
251
27.8k
                if (dtd->entities == NULL)
252
3
                    return(XML_ERR_NO_MEMORY);
253
27.8k
            }
254
40.4k
      table = dtd->entities;
255
40.4k
      break;
256
30.2k
        case XML_INTERNAL_PARAMETER_ENTITY:
257
59.0k
        case XML_EXTERNAL_PARAMETER_ENTITY:
258
59.0k
      if (dtd->pentities == NULL) {
259
24.6k
    dtd->pentities = xmlHashCreateDict(0, dict);
260
24.6k
                if (dtd->pentities == NULL)
261
1
                    return(XML_ERR_NO_MEMORY);
262
24.6k
            }
263
59.0k
      table = dtd->pentities;
264
59.0k
      break;
265
0
        default:
266
0
      return(XML_ERR_ARGUMENT);
267
102k
    }
268
99.5k
    ret = xmlCreateEntity(dtd->doc, name, type, ExternalID, SystemID, content);
269
99.5k
    if (ret == NULL)
270
16
        return(XML_ERR_NO_MEMORY);
271
272
99.4k
    res = xmlHashAdd(table, name, ret);
273
99.4k
    if (res < 0) {
274
3
        xmlFreeEntity(ret);
275
3
        return(XML_ERR_NO_MEMORY);
276
99.4k
    } else if (res == 0) {
277
  /*
278
   * entity was already defined at another level.
279
   */
280
2.55k
        xmlFreeEntity(ret);
281
2.55k
  return(XML_WAR_ENTITY_REDEFINED);
282
2.55k
    }
283
284
    /*
285
     * Link it to the DTD
286
     */
287
96.9k
    ret->parent = dtd;
288
96.9k
    ret->doc = dtd->doc;
289
96.9k
    if (dtd->last == NULL) {
290
39.4k
  dtd->children = dtd->last = (xmlNodePtr) ret;
291
57.4k
    } else {
292
57.4k
  dtd->last->next = (xmlNodePtr) ret;
293
57.4k
  ret->prev = dtd->last;
294
57.4k
  dtd->last = (xmlNodePtr) ret;
295
57.4k
    }
296
297
96.9k
    if (out != NULL)
298
96.9k
        *out = ret;
299
96.9k
    return(0);
300
99.4k
}
301
302
/**
303
 * xmlGetPredefinedEntity:
304
 * @name:  the entity name
305
 *
306
 * Check whether this name is an predefined entity.
307
 *
308
 * Returns NULL if not, otherwise the entity
309
 */
310
xmlEntityPtr
311
2.12M
xmlGetPredefinedEntity(const xmlChar *name) {
312
2.12M
    if (name == NULL) return(NULL);
313
2.12M
    switch (name[0]) {
314
20.2k
        case 'l':
315
20.2k
      if (xmlStrEqual(name, BAD_CAST "lt"))
316
13.2k
          return(&xmlEntityLt);
317
7.03k
      break;
318
39.9k
        case 'g':
319
39.9k
      if (xmlStrEqual(name, BAD_CAST "gt"))
320
35.5k
          return(&xmlEntityGt);
321
4.46k
      break;
322
930k
        case 'a':
323
930k
      if (xmlStrEqual(name, BAD_CAST "amp"))
324
105k
          return(&xmlEntityAmp);
325
824k
      if (xmlStrEqual(name, BAD_CAST "apos"))
326
529
          return(&xmlEntityApos);
327
824k
      break;
328
824k
        case 'q':
329
571k
      if (xmlStrEqual(name, BAD_CAST "quot"))
330
415
          return(&xmlEntityQuot);
331
571k
      break;
332
571k
  default:
333
559k
      break;
334
2.12M
    }
335
1.96M
    return(NULL);
336
2.12M
}
337
338
/**
339
 * xmlAddDtdEntity:
340
 * @doc:  the document
341
 * @name:  the entity name
342
 * @type:  the entity type XML_xxx_yyy_ENTITY
343
 * @ExternalID:  the entity external ID if available
344
 * @SystemID:  the entity system ID if available
345
 * @content:  the entity content
346
 *
347
 * Register a new entity for this document DTD external subset.
348
 *
349
 * Returns a pointer to the entity or NULL in case of error
350
 */
351
xmlEntityPtr
352
xmlAddDtdEntity(xmlDocPtr doc, const xmlChar *name, int type,
353
          const xmlChar *ExternalID, const xmlChar *SystemID,
354
0
    const xmlChar *content) {
355
0
    xmlEntityPtr ret;
356
357
0
    xmlAddEntity(doc, 1, name, type, ExternalID, SystemID, content, &ret);
358
0
    return(ret);
359
0
}
360
361
/**
362
 * xmlAddDocEntity:
363
 * @doc:  the document
364
 * @name:  the entity name
365
 * @type:  the entity type XML_xxx_yyy_ENTITY
366
 * @ExternalID:  the entity external ID if available
367
 * @SystemID:  the entity system ID if available
368
 * @content:  the entity content
369
 *
370
 * Register a new entity for this document.
371
 *
372
 * Returns a pointer to the entity or NULL in case of error
373
 */
374
xmlEntityPtr
375
xmlAddDocEntity(xmlDocPtr doc, const xmlChar *name, int type,
376
          const xmlChar *ExternalID, const xmlChar *SystemID,
377
0
          const xmlChar *content) {
378
0
    xmlEntityPtr ret;
379
380
0
    xmlAddEntity(doc, 0, name, type, ExternalID, SystemID, content, &ret);
381
0
    return(ret);
382
0
}
383
384
/**
385
 * xmlNewEntity:
386
 * @doc:  the document
387
 * @name:  the entity name
388
 * @type:  the entity type XML_xxx_yyy_ENTITY
389
 * @ExternalID:  the entity external ID if available
390
 * @SystemID:  the entity system ID if available
391
 * @content:  the entity content
392
 *
393
 * Create a new entity, this differs from xmlAddDocEntity() that if
394
 * the document is NULL or has no internal subset defined, then an
395
 * unlinked entity structure will be returned, it is then the responsibility
396
 * of the caller to link it to the document later or free it when not needed
397
 * anymore.
398
 *
399
 * Returns a pointer to the entity or NULL in case of error
400
 */
401
xmlEntityPtr
402
xmlNewEntity(xmlDocPtr doc, const xmlChar *name, int type,
403
       const xmlChar *ExternalID, const xmlChar *SystemID,
404
0
       const xmlChar *content) {
405
0
    if ((doc != NULL) && (doc->intSubset != NULL)) {
406
0
  return(xmlAddDocEntity(doc, name, type, ExternalID, SystemID, content));
407
0
    }
408
0
    if (name == NULL)
409
0
        return(NULL);
410
0
    return(xmlCreateEntity(doc, name, type, ExternalID, SystemID, content));
411
0
}
412
413
/**
414
 * xmlGetEntityFromTable:
415
 * @table:  an entity table
416
 * @name:  the entity name
417
 * @parameter:  look for parameter entities
418
 *
419
 * Do an entity lookup in the table.
420
 * returns the corresponding parameter entity, if found.
421
 *
422
 * Returns A pointer to the entity structure or NULL if not found.
423
 */
424
static xmlEntityPtr
425
1.00M
xmlGetEntityFromTable(xmlEntitiesTablePtr table, const xmlChar *name) {
426
1.00M
    return((xmlEntityPtr) xmlHashLookup(table, name));
427
1.00M
}
428
429
/**
430
 * xmlGetParameterEntity:
431
 * @doc:  the document referencing the entity
432
 * @name:  the entity name
433
 *
434
 * Do an entity lookup in the internal and external subsets and
435
 * returns the corresponding parameter entity, if found.
436
 *
437
 * Returns A pointer to the entity structure or NULL if not found.
438
 */
439
xmlEntityPtr
440
92.5k
xmlGetParameterEntity(xmlDocPtr doc, const xmlChar *name) {
441
92.5k
    xmlEntitiesTablePtr table;
442
92.5k
    xmlEntityPtr ret;
443
444
92.5k
    if (doc == NULL)
445
916
  return(NULL);
446
91.6k
    if ((doc->intSubset != NULL) && (doc->intSubset->pentities != NULL)) {
447
85.8k
  table = (xmlEntitiesTablePtr) doc->intSubset->pentities;
448
85.8k
  ret = xmlGetEntityFromTable(table, name);
449
85.8k
  if (ret != NULL)
450
63.2k
      return(ret);
451
85.8k
    }
452
28.4k
    if ((doc->extSubset != NULL) && (doc->extSubset->pentities != NULL)) {
453
9.76k
  table = (xmlEntitiesTablePtr) doc->extSubset->pentities;
454
9.76k
  return(xmlGetEntityFromTable(table, name));
455
9.76k
    }
456
18.6k
    return(NULL);
457
28.4k
}
458
459
/**
460
 * xmlGetDtdEntity:
461
 * @doc:  the document referencing the entity
462
 * @name:  the entity name
463
 *
464
 * Do an entity lookup in the DTD entity hash table and
465
 * returns the corresponding entity, if found.
466
 * Note: the first argument is the document node, not the DTD node.
467
 *
468
 * Returns A pointer to the entity structure or NULL if not found.
469
 */
470
xmlEntityPtr
471
0
xmlGetDtdEntity(xmlDocPtr doc, const xmlChar *name) {
472
0
    xmlEntitiesTablePtr table;
473
474
0
    if (doc == NULL)
475
0
  return(NULL);
476
0
    if ((doc->extSubset != NULL) && (doc->extSubset->entities != NULL)) {
477
0
  table = (xmlEntitiesTablePtr) doc->extSubset->entities;
478
0
  return(xmlGetEntityFromTable(table, name));
479
0
    }
480
0
    return(NULL);
481
0
}
482
483
/**
484
 * xmlGetDocEntity:
485
 * @doc:  the document referencing the entity
486
 * @name:  the entity name
487
 *
488
 * Do an entity lookup in the document entity hash table and
489
 * returns the corresponding entity, otherwise a lookup is done
490
 * in the predefined entities too.
491
 *
492
 * Returns A pointer to the entity structure or NULL if not found.
493
 */
494
xmlEntityPtr
495
916k
xmlGetDocEntity(const xmlDoc *doc, const xmlChar *name) {
496
916k
    xmlEntityPtr cur;
497
916k
    xmlEntitiesTablePtr table;
498
499
916k
    if (doc != NULL) {
500
911k
  if ((doc->intSubset != NULL) && (doc->intSubset->entities != NULL)) {
501
843k
      table = (xmlEntitiesTablePtr) doc->intSubset->entities;
502
843k
      cur = xmlGetEntityFromTable(table, name);
503
843k
      if (cur != NULL)
504
732k
    return(cur);
505
843k
  }
506
179k
  if (doc->standalone != 1) {
507
179k
      if ((doc->extSubset != NULL) &&
508
65.8k
    (doc->extSubset->entities != NULL)) {
509
63.8k
    table = (xmlEntitiesTablePtr) doc->extSubset->entities;
510
63.8k
    cur = xmlGetEntityFromTable(table, name);
511
63.8k
    if (cur != NULL)
512
212
        return(cur);
513
63.8k
      }
514
179k
  }
515
179k
    }
516
184k
    return(xmlGetPredefinedEntity(name));
517
916k
}
518
519
/*
520
 * xmlSerializeHexCharRef:
521
 * @buf:  a char buffer
522
 * @val:  a codepoint
523
 *
524
 * Serializes a hex char ref like &#xA0;
525
 *
526
 * Writes at most 9 bytes. Does not include a terminating zero byte.
527
 *
528
 * Returns the number of bytes written.
529
 */
530
int
531
3.82k
xmlSerializeHexCharRef(char *buf, int val) {
532
3.82k
    char *out = buf;
533
3.82k
    int shift = 0, bits;
534
535
3.82k
    *out++ = '&';
536
3.82k
    *out++ = '#';
537
3.82k
    *out++ = 'x';
538
539
3.82k
    bits = val;
540
3.82k
    if (bits & 0xFF0000) {
541
57
        shift = 16;
542
57
        bits &= 0xFF0000;
543
3.77k
    } else if (bits & 0x00FF00) {
544
1.29k
        shift = 8;
545
1.29k
        bits &= 0x00FF00;
546
1.29k
    }
547
3.82k
    if (bits & 0xF0F0F0) {
548
2.50k
        shift += 4;
549
2.50k
    }
550
551
9.15k
    do {
552
9.15k
        int d = (val >> shift) & 0x0F;
553
554
9.15k
        if (d < 10)
555
5.47k
            *out++ = '0' + d;
556
3.68k
        else
557
3.68k
            *out++ = 'A' + (d - 10);
558
559
9.15k
  shift -= 4;
560
9.15k
    } while (shift >= 0);
561
562
3.82k
    *out++ = ';';
563
564
3.82k
    return(out - buf);
565
3.82k
}
566
567
/*
568
 * xmlSerializeDecCharRef:
569
 * @buf:  a char buffer
570
 * @val:  a codepoint
571
 *
572
 * Serializes a decimal char ref like &#38;
573
 *
574
 * Writes at most 10 bytes. Does not include a terminating zero byte.
575
 *
576
 * Returns the number of bytes written.
577
 */
578
int
579
95.9M
xmlSerializeDecCharRef(char *buf, int val) {
580
95.9M
    char *out = buf;
581
95.9M
    int len, i;
582
583
95.9M
    *out++ = '&';
584
95.9M
    *out++ = '#';
585
586
95.9M
    if (val < 100) {
587
389
        len = (val < 10) ? 1 : 2;
588
95.9M
    } else if (val < 10000) {
589
95.9M
        len = (val < 1000) ? 3 : 4;
590
95.9M
    } else if (val < 1000000) {
591
4.49k
        len = (val < 100000) ? 5 : 6;
592
4.49k
    } else {
593
185
        len = 7;
594
185
    }
595
596
392M
    for (i = len - 1; i >= 0; i--) {
597
296M
        out[i] = '0' + val % 10;
598
296M
        val /= 10;
599
296M
    }
600
601
95.9M
    out[len] = ';';
602
603
95.9M
    return(len + 3);
604
95.9M
}
605
606
static const char xmlEscapeSafe[128] = {
607
    0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 0, 0, 0, 0,
608
    0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
609
    1, 1, 0, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1,
610
    1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 0, 1,
611
    1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
612
    1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
613
    1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
614
    1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1
615
};
616
617
/*
618
 * xmlEscapeText:
619
 * @text:  input text
620
 * @flags:  XML_ESCAPE flags
621
 *
622
 * Escapes certain characters with char refs.
623
 *
624
 * XML_ESCAPE_ATTR: for attribute content.
625
 * XML_ESCAPE_NON_ASCII: escape non-ASCII chars.
626
 * XML_ESCAPE_HTML: for HTML content.
627
 * XML_ESCAPE_QUOT: escape double quotes.
628
 * XML_ESCAPE_ALLOW_INVALID: allow invalid characters.
629
 *
630
 * Returns an escaped string or NULL if a memory allocation failed.
631
 */
632
xmlChar *
633
76.3k
xmlEscapeText(const xmlChar *text, int flags) {
634
76.3k
    const xmlChar *cur;
635
76.3k
    xmlChar *buffer;
636
76.3k
    xmlChar *out;
637
76.3k
    const xmlChar *unescaped;
638
76.3k
    size_t size = 50;
639
640
76.3k
    buffer = xmlMalloc(size + 1);
641
76.3k
    if (buffer == NULL)
642
64
        return(NULL);
643
76.3k
    out = buffer;
644
645
76.3k
    cur = text;
646
76.3k
    unescaped = cur;
647
648
254k
    while (*cur != '\0') {
649
177k
        char buf[12];
650
177k
  const xmlChar *end;
651
177k
        const xmlChar *repl;
652
177k
        size_t used;
653
177k
        size_t replSize;
654
177k
        size_t unescapedSize;
655
177k
        size_t totalSize;
656
177k
        int chunkSize = 1;
657
177k
        int c;
658
659
        /* accelerator */
660
127M
  while (1) {
661
127M
            c = *cur;
662
663
127M
            if (c < 0x80) {
664
7.22M
                if (!xmlEscapeSafe[*cur])
665
177k
                    break;
666
120M
            } else {
667
120M
               if (flags & XML_ESCAPE_NON_ASCII)
668
0
                   break;
669
120M
            }
670
127M
            cur += 1;
671
127M
        }
672
673
177k
        if (c == 0) {
674
72.5k
            chunkSize = 0;
675
72.5k
            repl = BAD_CAST "";
676
72.5k
            replSize = 0;
677
105k
        } else if (c == '<') {
678
      /*
679
       * Special handling of server side include in HTML attributes
680
       */
681
6.49k
      if ((flags & XML_ESCAPE_HTML) && (flags & XML_ESCAPE_ATTR) &&
682
6.13k
          (cur[1] == '!') && (cur[2] == '-') && (cur[3] == '-') &&
683
587
          ((end = xmlStrstr(cur, BAD_CAST "-->")) != NULL)) {
684
496
                chunkSize = (end - cur) + 3;
685
496
                repl = cur;
686
496
                replSize = chunkSize;
687
6.00k
      } else {
688
6.00k
                repl = BAD_CAST "&lt;";
689
6.00k
                replSize = 4;
690
6.00k
            }
691
98.7k
  } else if (c == '>') {
692
35.3k
            repl = BAD_CAST "&gt;";
693
35.3k
            replSize = 4;
694
63.3k
  } else if (c == '&') {
695
      /*
696
       * Special handling of &{...} construct from HTML 4, see
697
       * http://www.w3.org/TR/html401/appendix/notes.html#h-B.7.1
698
       */
699
4.38k
      if ((flags & XML_ESCAPE_HTML) && (flags & XML_ESCAPE_ATTR) &&
700
4.02k
                (cur[1] == '{') && (end = xmlStrchr(cur, '}'))) {
701
1.76k
                chunkSize = (end - cur) + 1;
702
1.76k
                repl = cur;
703
1.76k
                replSize = chunkSize;
704
2.61k
      } else {
705
2.61k
                repl = BAD_CAST "&amp;";
706
2.61k
                replSize = 5;
707
2.61k
            }
708
58.9k
  } else if ((flags & XML_ESCAPE_QUOT) && (c == '"')) {
709
0
            repl = BAD_CAST "&quot;";
710
0
            replSize = 6;
711
58.9k
  } else if (((flags & XML_ESCAPE_HTML) == 0) && (c == '\r')) {
712
0
      repl = BAD_CAST "&#13;";
713
0
            replSize = 5;
714
58.9k
  } else if ((flags & XML_ESCAPE_NON_ASCII) && (c >= 0x80)) {
715
0
            int val;
716
717
0
            chunkSize = 4;
718
0
            val = xmlGetUTF8Char(cur, &chunkSize);
719
0
            if (val < 0) {
720
0
                val = 0xFFFD;
721
0
                chunkSize = 1;
722
0
            } else if (((flags & XML_ESCAPE_ALLOW_INVALID) == 0) &&
723
0
                       (!IS_CHAR(val))) {
724
0
                val = 0xFFFD;
725
0
            }
726
727
0
            replSize = xmlSerializeHexCharRef(buf, val);
728
0
            repl = BAD_CAST buf;
729
58.9k
  } else if ((flags & (XML_ESCAPE_ALLOW_INVALID | XML_ESCAPE_HTML)) ||
730
0
                   (c >= 0x20) ||
731
58.9k
             (c == '\n') || (c == '\t') || (c == '\r')) {
732
      /* default case, just copy */
733
58.9k
            cur += 1;
734
58.9k
            if (*cur != 0)
735
58.4k
                continue;
736
737
464
            chunkSize = 0;
738
464
            repl = BAD_CAST "";
739
464
            replSize = 0;
740
464
  } else {
741
            /* ignore */
742
0
            repl = BAD_CAST "";
743
0
            replSize = 0;
744
0
        }
745
746
119k
        used = out - buffer;
747
119k
        unescapedSize = cur - unescaped;
748
119k
        totalSize = unescapedSize + replSize;
749
750
119k
  cur += chunkSize;
751
752
119k
        if (totalSize > size - used) {
753
16.7k
            xmlChar *tmp;
754
16.7k
            int newSize;
755
756
16.7k
            if ((size > (SIZE_MAX - 1) / 2) ||
757
16.7k
                (totalSize > (SIZE_MAX - 1) / 2 - size)) {
758
0
                xmlFree(buffer);
759
0
                return(NULL);
760
0
            }
761
16.7k
            newSize = size + totalSize;
762
16.7k
            if (*cur != 0)
763
10.3k
                newSize *= 2;
764
16.7k
            tmp = xmlRealloc(buffer, newSize + 1);
765
16.7k
            if (tmp == NULL) {
766
6
                xmlFree(buffer);
767
6
                return(NULL);
768
6
            }
769
16.7k
            buffer = tmp;
770
16.7k
            size = newSize;
771
16.7k
            out = buffer + used;
772
16.7k
        }
773
774
119k
        memcpy(out, unescaped, unescapedSize);
775
119k
        out += unescapedSize;
776
119k
        memcpy(out, repl, replSize);
777
119k
        out += replSize;
778
779
119k
        unescaped = cur;
780
119k
    }
781
782
76.3k
    *out = 0;
783
76.3k
    return(buffer);
784
76.3k
}
785
786
/**
787
 * xmlEncodeEntitiesInternal:
788
 * @doc:  the document containing the string
789
 * @input:  A string to convert to XML.
790
 * @flags:  XML_ESCAPE flags
791
 *
792
 * Do a global encoding of a string, replacing the predefined entities
793
 * and non ASCII values with their entities and CharRef counterparts.
794
 * Contrary to xmlEncodeEntities, this routine is reentrant, and result
795
 * must be deallocated.
796
 *
797
 * Returns A newly allocated string with the substitution done.
798
 */
799
xmlChar *
800
xmlEncodeEntitiesInternal(xmlDocPtr doc, const xmlChar *input,
801
76.3k
                          unsigned flags) {
802
76.3k
    if (input == NULL)
803
0
        return(NULL);
804
805
76.3k
    if ((doc != NULL) && (doc->type == XML_HTML_DOCUMENT_NODE))
806
76.3k
        flags |= XML_ESCAPE_HTML;
807
0
    else if ((doc == NULL) || (doc->encoding == NULL))
808
0
        flags |= XML_ESCAPE_NON_ASCII;
809
810
76.3k
    return(xmlEscapeText(input, flags));
811
76.3k
}
812
813
/**
814
 * xmlEncodeEntitiesReentrant:
815
 * @doc:  the document containing the string
816
 * @input:  A string to convert to XML.
817
 *
818
 * Do a global encoding of a string, replacing the predefined entities
819
 * and non ASCII values with their entities and CharRef counterparts.
820
 * Contrary to xmlEncodeEntities, this routine is reentrant, and result
821
 * must be deallocated.
822
 *
823
 * This escapes '<', '>', '&' and '\r'. If the document has no encoding,
824
 * non-ASCII codepoints are escaped. There is some special handling for
825
 * HTML documents.
826
 *
827
 * Returns A newly allocated string with the substitution done.
828
 */
829
xmlChar *
830
42.8k
xmlEncodeEntitiesReentrant(xmlDocPtr doc, const xmlChar *input) {
831
42.8k
    return xmlEncodeEntitiesInternal(doc, input, 0);
832
42.8k
}
833
834
/**
835
 * xmlEncodeSpecialChars:
836
 * @doc:  unused
837
 * @input:  A string to convert to XML.
838
 *
839
 * Do a global encoding of a string, replacing the predefined entities
840
 * this routine is reentrant, and result must be deallocated.
841
 *
842
 * This escapes '<', '>', '&', '"' and '\r' chars.
843
 *
844
 * Returns A newly allocated string with the substitution done.
845
 */
846
xmlChar *
847
xmlEncodeSpecialChars(const xmlDoc *doc ATTRIBUTE_UNUSED,
848
0
                      const xmlChar *input) {
849
0
    if (input == NULL)
850
0
        return(NULL);
851
852
0
    return(xmlEscapeText(input, XML_ESCAPE_QUOT | XML_ESCAPE_ALLOW_INVALID));
853
0
}
854
855
/**
856
 * xmlCreateEntitiesTable:
857
 *
858
 * create and initialize an empty entities hash table.
859
 * This really doesn't make sense and should be deprecated
860
 *
861
 * Returns the xmlEntitiesTablePtr just created or NULL in case of error.
862
 */
863
xmlEntitiesTablePtr
864
0
xmlCreateEntitiesTable(void) {
865
0
    return((xmlEntitiesTablePtr) xmlHashCreate(0));
866
0
}
867
868
/**
869
 * xmlFreeEntityWrapper:
870
 * @entity:  An entity
871
 * @name:  its name
872
 *
873
 * Deallocate the memory used by an entities in the hash table.
874
 */
875
static void
876
96.9k
xmlFreeEntityWrapper(void *entity, const xmlChar *name ATTRIBUTE_UNUSED) {
877
96.9k
    if (entity != NULL)
878
96.9k
  xmlFreeEntity((xmlEntityPtr) entity);
879
96.9k
}
880
881
/**
882
 * xmlFreeEntitiesTable:
883
 * @table:  An entity table
884
 *
885
 * Deallocate the memory used by an entities hash table.
886
 */
887
void
888
52.4k
xmlFreeEntitiesTable(xmlEntitiesTablePtr table) {
889
52.4k
    xmlHashFree(table, xmlFreeEntityWrapper);
890
52.4k
}
891
892
/**
893
 * xmlCopyEntity:
894
 * @ent:  An entity
895
 *
896
 * Build a copy of an entity
897
 *
898
 * Returns the new xmlEntitiesPtr or NULL in case of error.
899
 */
900
static void *
901
0
xmlCopyEntity(void *payload, const xmlChar *name ATTRIBUTE_UNUSED) {
902
0
    xmlEntityPtr ent = (xmlEntityPtr) payload;
903
0
    xmlEntityPtr cur;
904
905
0
    cur = (xmlEntityPtr) xmlMalloc(sizeof(xmlEntity));
906
0
    if (cur == NULL)
907
0
  return(NULL);
908
0
    memset(cur, 0, sizeof(xmlEntity));
909
0
    cur->type = XML_ENTITY_DECL;
910
911
0
    cur->etype = ent->etype;
912
0
    if (ent->name != NULL) {
913
0
  cur->name = xmlStrdup(ent->name);
914
0
        if (cur->name == NULL)
915
0
            goto error;
916
0
    }
917
0
    if (ent->ExternalID != NULL) {
918
0
  cur->ExternalID = xmlStrdup(ent->ExternalID);
919
0
        if (cur->ExternalID == NULL)
920
0
            goto error;
921
0
    }
922
0
    if (ent->SystemID != NULL) {
923
0
  cur->SystemID = xmlStrdup(ent->SystemID);
924
0
        if (cur->SystemID == NULL)
925
0
            goto error;
926
0
    }
927
0
    if (ent->content != NULL) {
928
0
  cur->content = xmlStrdup(ent->content);
929
0
        if (cur->content == NULL)
930
0
            goto error;
931
0
    }
932
0
    if (ent->orig != NULL) {
933
0
  cur->orig = xmlStrdup(ent->orig);
934
0
        if (cur->orig == NULL)
935
0
            goto error;
936
0
    }
937
0
    if (ent->URI != NULL) {
938
0
  cur->URI = xmlStrdup(ent->URI);
939
0
        if (cur->URI == NULL)
940
0
            goto error;
941
0
    }
942
0
    return(cur);
943
944
0
error:
945
0
    xmlFreeEntity(cur);
946
0
    return(NULL);
947
0
}
948
949
/**
950
 * xmlCopyEntitiesTable:
951
 * @table:  An entity table
952
 *
953
 * Build a copy of an entity table.
954
 *
955
 * Returns the new xmlEntitiesTablePtr or NULL in case of error.
956
 */
957
xmlEntitiesTablePtr
958
0
xmlCopyEntitiesTable(xmlEntitiesTablePtr table) {
959
0
    return(xmlHashCopySafe(table, xmlCopyEntity, xmlFreeEntityWrapper));
960
0
}
961
962
#ifdef LIBXML_OUTPUT_ENABLED
963
964
/**
965
 * xmlDumpEntityDecl:
966
 * @buf:  An XML buffer.
967
 * @ent:  An entity table
968
 *
969
 * This will dump the content of the entity table as an XML DTD definition
970
 */
971
void
972
0
xmlDumpEntityDecl(xmlBufferPtr buf, xmlEntityPtr ent) {
973
0
    xmlSaveCtxtPtr save;
974
975
0
    if ((buf == NULL) || (ent == NULL))
976
0
        return;
977
978
0
    save = xmlSaveToBuffer(buf, NULL, 0);
979
0
    xmlSaveTree(save, (xmlNodePtr) ent);
980
0
    if (xmlSaveFinish(save) != XML_ERR_OK)
981
0
        xmlFree(xmlBufferDetach(buf));
982
0
}
983
984
/**
985
 * xmlDumpEntityDeclScan:
986
 * @ent:  An entity table
987
 * @buf:  An XML buffer.
988
 *
989
 * When using the hash table scan function, arguments need to be reversed
990
 */
991
static void
992
xmlDumpEntityDeclScan(void *ent, void *save,
993
0
                      const xmlChar *name ATTRIBUTE_UNUSED) {
994
0
    xmlSaveTree(save, ent);
995
0
}
996
997
/**
998
 * xmlDumpEntitiesTable:
999
 * @buf:  An XML buffer.
1000
 * @table:  An entity table
1001
 *
1002
 * This will dump the content of the entity table as an XML DTD definition
1003
 */
1004
void
1005
0
xmlDumpEntitiesTable(xmlBufferPtr buf, xmlEntitiesTablePtr table) {
1006
0
    xmlSaveCtxtPtr save;
1007
1008
0
    if ((buf == NULL) || (table == NULL))
1009
0
        return;
1010
1011
0
    save = xmlSaveToBuffer(buf, NULL, 0);
1012
0
    xmlHashScan(table, xmlDumpEntityDeclScan, save);
1013
0
    if (xmlSaveFinish(save) != XML_ERR_OK)
1014
0
        xmlFree(xmlBufferDetach(buf));
1015
0
}
1016
#endif /* LIBXML_OUTPUT_ENABLED */