Coverage Report

Created: 2025-11-24 06:51

next uncovered line (L), next uncovered region (R), next uncovered branch (B)
/src/libxml2/entities.c
Line
Count
Source
1
/*
2
 * entities.c : implementation for the XML entities handling
3
 *
4
 * See Copyright for the status of this software.
5
 *
6
 * daniel@veillard.com
7
 */
8
9
/* To avoid EBCDIC trouble when parsing on zOS */
10
#if defined(__MVS__)
11
#pragma convert("ISO8859-1")
12
#endif
13
14
#define IN_LIBXML
15
#include "libxml.h"
16
17
#include <string.h>
18
#include <stdlib.h>
19
20
#include <libxml/xmlmemory.h>
21
#include <libxml/hash.h>
22
#include <libxml/entities.h>
23
#include <libxml/parser.h>
24
#include <libxml/parserInternals.h>
25
#include <libxml/xmlerror.h>
26
#include <libxml/dict.h>
27
#include <libxml/xmlsave.h>
28
29
#include "private/entities.h"
30
#include "private/error.h"
31
32
#ifndef SIZE_MAX
33
  #define SIZE_MAX ((size_t) -1)
34
#endif
35
36
/*
37
 * The XML predefined entities.
38
 */
39
40
static xmlEntity xmlEntityLt = {
41
    NULL, XML_ENTITY_DECL, BAD_CAST "lt",
42
    NULL, NULL, NULL, NULL, NULL, NULL,
43
    BAD_CAST "<", BAD_CAST "<", 1,
44
    XML_INTERNAL_PREDEFINED_ENTITY,
45
    NULL, NULL, NULL, NULL, 0, 0, 0
46
};
47
static xmlEntity xmlEntityGt = {
48
    NULL, XML_ENTITY_DECL, BAD_CAST "gt",
49
    NULL, NULL, NULL, NULL, NULL, NULL,
50
    BAD_CAST ">", BAD_CAST ">", 1,
51
    XML_INTERNAL_PREDEFINED_ENTITY,
52
    NULL, NULL, NULL, NULL, 0, 0, 0
53
};
54
static xmlEntity xmlEntityAmp = {
55
    NULL, XML_ENTITY_DECL, BAD_CAST "amp",
56
    NULL, NULL, NULL, NULL, NULL, NULL,
57
    BAD_CAST "&", BAD_CAST "&", 1,
58
    XML_INTERNAL_PREDEFINED_ENTITY,
59
    NULL, NULL, NULL, NULL, 0, 0, 0
60
};
61
static xmlEntity xmlEntityQuot = {
62
    NULL, XML_ENTITY_DECL, BAD_CAST "quot",
63
    NULL, NULL, NULL, NULL, NULL, NULL,
64
    BAD_CAST "\"", BAD_CAST "\"", 1,
65
    XML_INTERNAL_PREDEFINED_ENTITY,
66
    NULL, NULL, NULL, NULL, 0, 0, 0
67
};
68
static xmlEntity xmlEntityApos = {
69
    NULL, XML_ENTITY_DECL, BAD_CAST "apos",
70
    NULL, NULL, NULL, NULL, NULL, NULL,
71
    BAD_CAST "'", BAD_CAST "'", 1,
72
    XML_INTERNAL_PREDEFINED_ENTITY,
73
    NULL, NULL, NULL, NULL, 0, 0, 0
74
};
75
76
/*
77
 * xmlFreeEntity:
78
 * @entity:  an entity
79
 *
80
 * Frees the entity.
81
 */
82
void
83
xmlFreeEntity(xmlEntityPtr entity)
84
151k
{
85
151k
    xmlDictPtr dict = NULL;
86
87
151k
    if (entity == NULL)
88
0
        return;
89
90
151k
    if (entity->doc != NULL)
91
151k
        dict = entity->doc->dict;
92
93
94
151k
    if ((entity->children) &&
95
2.16k
        (entity == (xmlEntityPtr) entity->children->parent))
96
2.16k
        xmlFreeNodeList(entity->children);
97
151k
    if ((entity->name != NULL) &&
98
151k
        ((dict == NULL) || (!xmlDictOwns(dict, entity->name))))
99
15.5k
        xmlFree((char *) entity->name);
100
151k
    if (entity->ExternalID != NULL)
101
14.1k
        xmlFree((char *) entity->ExternalID);
102
151k
    if (entity->SystemID != NULL)
103
73.0k
        xmlFree((char *) entity->SystemID);
104
151k
    if (entity->URI != NULL)
105
67.5k
        xmlFree((char *) entity->URI);
106
151k
    if (entity->content != NULL)
107
80.2k
        xmlFree((char *) entity->content);
108
151k
    if (entity->orig != NULL)
109
75.1k
        xmlFree((char *) entity->orig);
110
151k
    xmlFree(entity);
111
151k
}
112
113
/*
114
 * xmlCreateEntity:
115
 *
116
 * internal routine doing the entity node structures allocations
117
 */
118
static xmlEntityPtr
119
xmlCreateEntity(xmlDocPtr doc, const xmlChar *name, int type,
120
          const xmlChar *ExternalID, const xmlChar *SystemID,
121
151k
          const xmlChar *content) {
122
151k
    xmlEntityPtr ret;
123
124
151k
    ret = (xmlEntityPtr) xmlMalloc(sizeof(xmlEntity));
125
151k
    if (ret == NULL)
126
8
  return(NULL);
127
151k
    memset(ret, 0, sizeof(xmlEntity));
128
151k
    ret->doc = doc;
129
151k
    ret->type = XML_ENTITY_DECL;
130
131
    /*
132
     * fill the structure.
133
     */
134
151k
    ret->etype = (xmlEntityType) type;
135
151k
    if ((doc == NULL) || (doc->dict == NULL))
136
15.5k
  ret->name = xmlStrdup(name);
137
135k
    else
138
135k
        ret->name = xmlDictLookup(doc->dict, name, -1);
139
151k
    if (ret->name == NULL)
140
1
        goto error;
141
151k
    if (ExternalID != NULL) {
142
14.1k
        ret->ExternalID = xmlStrdup(ExternalID);
143
14.1k
        if (ret->ExternalID == NULL)
144
2
            goto error;
145
14.1k
    }
146
151k
    if (SystemID != NULL) {
147
73.0k
        ret->SystemID = xmlStrdup(SystemID);
148
73.0k
        if (ret->SystemID == NULL)
149
3
            goto error;
150
73.0k
    }
151
151k
    if (content != NULL) {
152
77.5k
        ret->length = xmlStrlen(content);
153
77.5k
  ret->content = xmlStrndup(content, ret->length);
154
77.5k
        if (ret->content == NULL)
155
6
            goto error;
156
77.5k
     } else {
157
73.8k
        ret->length = 0;
158
73.8k
        ret->content = NULL;
159
73.8k
    }
160
151k
    ret->URI = NULL; /* to be computed by the layer knowing
161
      the defining entity */
162
151k
    ret->orig = NULL;
163
164
151k
    return(ret);
165
166
12
error:
167
12
    xmlFreeEntity(ret);
168
12
    return(NULL);
169
151k
}
170
171
/**
172
 * xmlAddEntity:
173
 * @doc:  the document
174
 * @extSubset:  add to the external or internal subset
175
 * @name:  the entity name
176
 * @type:  the entity type XML_xxx_yyy_ENTITY
177
 * @ExternalID:  the entity external ID if available
178
 * @SystemID:  the entity system ID if available
179
 * @content:  the entity content
180
 * @out:  pointer to resulting entity (optional)
181
 *
182
 * Register a new entity for this document.
183
 *
184
 * Available since 2.13.0.
185
 *
186
 * Returns an xmlParserErrors error code.
187
 */
188
int
189
xmlAddEntity(xmlDocPtr doc, int extSubset, const xmlChar *name, int type,
190
    const xmlChar *ExternalID, const xmlChar *SystemID,
191
154k
    const xmlChar *content, xmlEntityPtr *out) {
192
154k
    xmlDtdPtr dtd;
193
154k
    xmlDictPtr dict = NULL;
194
154k
    xmlEntitiesTablePtr table = NULL;
195
154k
    xmlEntityPtr ret, predef;
196
154k
    int res;
197
198
154k
    if (out != NULL)
199
154k
        *out = NULL;
200
154k
    if ((doc == NULL) || (name == NULL))
201
0
  return(XML_ERR_ARGUMENT);
202
154k
    dict = doc->dict;
203
204
154k
    if (extSubset)
205
8.49k
        dtd = doc->extSubset;
206
145k
    else
207
145k
        dtd = doc->intSubset;
208
154k
    if (dtd == NULL)
209
0
        return(XML_DTD_NO_DTD);
210
211
154k
    switch (type) {
212
62.5k
        case XML_INTERNAL_GENERAL_ENTITY:
213
77.4k
        case XML_EXTERNAL_GENERAL_PARSED_ENTITY:
214
77.7k
        case XML_EXTERNAL_GENERAL_UNPARSED_ENTITY:
215
77.7k
            predef = xmlGetPredefinedEntity(name);
216
77.7k
            if (predef != NULL) {
217
3.56k
                int valid = 0;
218
219
                /* 4.6 Predefined Entities */
220
3.56k
                if ((type == XML_INTERNAL_GENERAL_ENTITY) &&
221
3.10k
                    (content != NULL)) {
222
2.84k
                    int c = predef->content[0];
223
224
2.84k
                    if (((content[0] == c) && (content[1] == 0)) &&
225
1.01k
                        ((c == '>') || (c == '\'') || (c == '"'))) {
226
788
                        valid = 1;
227
2.05k
                    } else if ((content[0] == '&') && (content[1] == '#')) {
228
753
                        if (content[2] == 'x') {
229
302
                            xmlChar *hex = BAD_CAST "0123456789ABCDEF";
230
302
                            xmlChar ref[] = "00;";
231
232
302
                            ref[0] = hex[c / 16 % 16];
233
302
                            ref[1] = hex[c % 16];
234
302
                            if (xmlStrcasecmp(&content[3], ref) == 0)
235
0
                                valid = 1;
236
451
                        } else {
237
451
                            xmlChar ref[] = "00;";
238
239
451
                            ref[0] = '0' + c / 10 % 10;
240
451
                            ref[1] = '0' + c % 10;
241
451
                            if (xmlStrEqual(&content[2], ref))
242
186
                                valid = 1;
243
451
                        }
244
753
                    }
245
2.84k
                }
246
3.56k
                if (!valid)
247
2.59k
                    return(XML_ERR_REDECL_PREDEF_ENTITY);
248
3.56k
            }
249
75.1k
      if (dtd->entities == NULL) {
250
38.8k
    dtd->entities = xmlHashCreateDict(0, dict);
251
38.8k
                if (dtd->entities == NULL)
252
4
                    return(XML_ERR_NO_MEMORY);
253
38.8k
            }
254
75.1k
      table = dtd->entities;
255
75.1k
      break;
256
17.4k
        case XML_INTERNAL_PARAMETER_ENTITY:
257
76.3k
        case XML_EXTERNAL_PARAMETER_ENTITY:
258
76.3k
      if (dtd->pentities == NULL) {
259
43.5k
    dtd->pentities = xmlHashCreateDict(0, dict);
260
43.5k
                if (dtd->pentities == NULL)
261
3
                    return(XML_ERR_NO_MEMORY);
262
43.5k
            }
263
76.3k
      table = dtd->pentities;
264
76.3k
      break;
265
0
        default:
266
0
      return(XML_ERR_ARGUMENT);
267
154k
    }
268
151k
    ret = xmlCreateEntity(dtd->doc, name, type, ExternalID, SystemID, content);
269
151k
    if (ret == NULL)
270
20
        return(XML_ERR_NO_MEMORY);
271
272
151k
    res = xmlHashAdd(table, name, ret);
273
151k
    if (res < 0) {
274
4
        xmlFreeEntity(ret);
275
4
        return(XML_ERR_NO_MEMORY);
276
151k
    } else if (res == 0) {
277
  /*
278
   * entity was already defined at another level.
279
   */
280
6.04k
        xmlFreeEntity(ret);
281
6.04k
  return(XML_WAR_ENTITY_REDEFINED);
282
6.04k
    }
283
284
    /*
285
     * Link it to the DTD
286
     */
287
145k
    ret->parent = dtd;
288
145k
    ret->doc = dtd->doc;
289
145k
    if (dtd->last == NULL) {
290
54.0k
  dtd->children = dtd->last = (xmlNodePtr) ret;
291
91.2k
    } else {
292
91.2k
  dtd->last->next = (xmlNodePtr) ret;
293
91.2k
  ret->prev = dtd->last;
294
91.2k
  dtd->last = (xmlNodePtr) ret;
295
91.2k
    }
296
297
145k
    if (out != NULL)
298
145k
        *out = ret;
299
145k
    return(0);
300
151k
}
301
302
/**
303
 * xmlGetPredefinedEntity:
304
 * @name:  the entity name
305
 *
306
 * Check whether this name is an predefined entity.
307
 *
308
 * Returns NULL if not, otherwise the entity
309
 */
310
xmlEntityPtr
311
3.39M
xmlGetPredefinedEntity(const xmlChar *name) {
312
3.39M
    if (name == NULL) return(NULL);
313
3.39M
    switch (name[0]) {
314
15.6k
        case 'l':
315
15.6k
      if (xmlStrEqual(name, BAD_CAST "lt"))
316
9.27k
          return(&xmlEntityLt);
317
6.41k
      break;
318
51.7k
        case 'g':
319
51.7k
      if (xmlStrEqual(name, BAD_CAST "gt"))
320
50.1k
          return(&xmlEntityGt);
321
1.60k
      break;
322
1.70M
        case 'a':
323
1.70M
      if (xmlStrEqual(name, BAD_CAST "amp"))
324
59.9k
          return(&xmlEntityAmp);
325
1.64M
      if (xmlStrEqual(name, BAD_CAST "apos"))
326
597
          return(&xmlEntityApos);
327
1.64M
      break;
328
1.64M
        case 'q':
329
453k
      if (xmlStrEqual(name, BAD_CAST "quot"))
330
720
          return(&xmlEntityQuot);
331
452k
      break;
332
1.16M
  default:
333
1.16M
      break;
334
3.39M
    }
335
3.27M
    return(NULL);
336
3.39M
}
337
338
/**
339
 * xmlAddDtdEntity:
340
 * @doc:  the document
341
 * @name:  the entity name
342
 * @type:  the entity type XML_xxx_yyy_ENTITY
343
 * @ExternalID:  the entity external ID if available
344
 * @SystemID:  the entity system ID if available
345
 * @content:  the entity content
346
 *
347
 * Register a new entity for this document DTD external subset.
348
 *
349
 * Returns a pointer to the entity or NULL in case of error
350
 */
351
xmlEntityPtr
352
xmlAddDtdEntity(xmlDocPtr doc, const xmlChar *name, int type,
353
          const xmlChar *ExternalID, const xmlChar *SystemID,
354
0
    const xmlChar *content) {
355
0
    xmlEntityPtr ret;
356
357
0
    xmlAddEntity(doc, 1, name, type, ExternalID, SystemID, content, &ret);
358
0
    return(ret);
359
0
}
360
361
/**
362
 * xmlAddDocEntity:
363
 * @doc:  the document
364
 * @name:  the entity name
365
 * @type:  the entity type XML_xxx_yyy_ENTITY
366
 * @ExternalID:  the entity external ID if available
367
 * @SystemID:  the entity system ID if available
368
 * @content:  the entity content
369
 *
370
 * Register a new entity for this document.
371
 *
372
 * Returns a pointer to the entity or NULL in case of error
373
 */
374
xmlEntityPtr
375
xmlAddDocEntity(xmlDocPtr doc, const xmlChar *name, int type,
376
          const xmlChar *ExternalID, const xmlChar *SystemID,
377
0
          const xmlChar *content) {
378
0
    xmlEntityPtr ret;
379
380
0
    xmlAddEntity(doc, 0, name, type, ExternalID, SystemID, content, &ret);
381
0
    return(ret);
382
0
}
383
384
/**
385
 * xmlNewEntity:
386
 * @doc:  the document
387
 * @name:  the entity name
388
 * @type:  the entity type XML_xxx_yyy_ENTITY
389
 * @ExternalID:  the entity external ID if available
390
 * @SystemID:  the entity system ID if available
391
 * @content:  the entity content
392
 *
393
 * Create a new entity, this differs from xmlAddDocEntity() that if
394
 * the document is NULL or has no internal subset defined, then an
395
 * unlinked entity structure will be returned, it is then the responsibility
396
 * of the caller to link it to the document later or free it when not needed
397
 * anymore.
398
 *
399
 * Returns a pointer to the entity or NULL in case of error
400
 */
401
xmlEntityPtr
402
xmlNewEntity(xmlDocPtr doc, const xmlChar *name, int type,
403
       const xmlChar *ExternalID, const xmlChar *SystemID,
404
0
       const xmlChar *content) {
405
0
    if ((doc != NULL) && (doc->intSubset != NULL)) {
406
0
  return(xmlAddDocEntity(doc, name, type, ExternalID, SystemID, content));
407
0
    }
408
0
    if (name == NULL)
409
0
        return(NULL);
410
0
    return(xmlCreateEntity(doc, name, type, ExternalID, SystemID, content));
411
0
}
412
413
/**
414
 * xmlGetEntityFromTable:
415
 * @table:  an entity table
416
 * @name:  the entity name
417
 * @parameter:  look for parameter entities
418
 *
419
 * Do an entity lookup in the table.
420
 * returns the corresponding parameter entity, if found.
421
 *
422
 * Returns A pointer to the entity structure or NULL if not found.
423
 */
424
static xmlEntityPtr
425
1.69M
xmlGetEntityFromTable(xmlEntitiesTablePtr table, const xmlChar *name) {
426
1.69M
    return((xmlEntityPtr) xmlHashLookup(table, name));
427
1.69M
}
428
429
/**
430
 * xmlGetParameterEntity:
431
 * @doc:  the document referencing the entity
432
 * @name:  the entity name
433
 *
434
 * Do an entity lookup in the internal and external subsets and
435
 * returns the corresponding parameter entity, if found.
436
 *
437
 * Returns A pointer to the entity structure or NULL if not found.
438
 */
439
xmlEntityPtr
440
116k
xmlGetParameterEntity(xmlDocPtr doc, const xmlChar *name) {
441
116k
    xmlEntitiesTablePtr table;
442
116k
    xmlEntityPtr ret;
443
444
116k
    if (doc == NULL)
445
303
  return(NULL);
446
116k
    if ((doc->intSubset != NULL) && (doc->intSubset->pentities != NULL)) {
447
110k
  table = (xmlEntitiesTablePtr) doc->intSubset->pentities;
448
110k
  ret = xmlGetEntityFromTable(table, name);
449
110k
  if (ret != NULL)
450
80.3k
      return(ret);
451
110k
    }
452
36.1k
    if ((doc->extSubset != NULL) && (doc->extSubset->pentities != NULL)) {
453
9.02k
  table = (xmlEntitiesTablePtr) doc->extSubset->pentities;
454
9.02k
  return(xmlGetEntityFromTable(table, name));
455
9.02k
    }
456
27.1k
    return(NULL);
457
36.1k
}
458
459
/**
460
 * xmlGetDtdEntity:
461
 * @doc:  the document referencing the entity
462
 * @name:  the entity name
463
 *
464
 * Do an entity lookup in the DTD entity hash table and
465
 * returns the corresponding entity, if found.
466
 * Note: the first argument is the document node, not the DTD node.
467
 *
468
 * Returns A pointer to the entity structure or NULL if not found.
469
 */
470
xmlEntityPtr
471
0
xmlGetDtdEntity(xmlDocPtr doc, const xmlChar *name) {
472
0
    xmlEntitiesTablePtr table;
473
474
0
    if (doc == NULL)
475
0
  return(NULL);
476
0
    if ((doc->extSubset != NULL) && (doc->extSubset->entities != NULL)) {
477
0
  table = (xmlEntitiesTablePtr) doc->extSubset->entities;
478
0
  return(xmlGetEntityFromTable(table, name));
479
0
    }
480
0
    return(NULL);
481
0
}
482
483
/**
484
 * xmlGetDocEntity:
485
 * @doc:  the document referencing the entity
486
 * @name:  the entity name
487
 *
488
 * Do an entity lookup in the document entity hash table and
489
 * returns the corresponding entity, otherwise a lookup is done
490
 * in the predefined entities too.
491
 *
492
 * Returns A pointer to the entity structure or NULL if not found.
493
 */
494
xmlEntityPtr
495
1.58M
xmlGetDocEntity(const xmlDoc *doc, const xmlChar *name) {
496
1.58M
    xmlEntityPtr cur;
497
1.58M
    xmlEntitiesTablePtr table;
498
499
1.58M
    if (doc != NULL) {
500
1.58M
  if ((doc->intSubset != NULL) && (doc->intSubset->entities != NULL)) {
501
1.51M
      table = (xmlEntitiesTablePtr) doc->intSubset->entities;
502
1.51M
      cur = xmlGetEntityFromTable(table, name);
503
1.51M
      if (cur != NULL)
504
1.36M
    return(cur);
505
1.51M
  }
506
212k
  if (doc->standalone != 1) {
507
212k
      if ((doc->extSubset != NULL) &&
508
66.9k
    (doc->extSubset->entities != NULL)) {
509
65.1k
    table = (xmlEntitiesTablePtr) doc->extSubset->entities;
510
65.1k
    cur = xmlGetEntityFromTable(table, name);
511
65.1k
    if (cur != NULL)
512
234
        return(cur);
513
65.1k
      }
514
212k
  }
515
212k
    }
516
216k
    return(xmlGetPredefinedEntity(name));
517
1.58M
}
518
519
/*
520
 * xmlSerializeHexCharRef:
521
 * @buf:  a char buffer
522
 * @val:  a codepoint
523
 *
524
 * Serializes a hex char ref like &#xA0;
525
 *
526
 * Writes at most 9 bytes. Does not include a terminating zero byte.
527
 *
528
 * Returns the number of bytes written.
529
 */
530
int
531
16.5k
xmlSerializeHexCharRef(char *buf, int val) {
532
16.5k
    char *out = buf;
533
16.5k
    int shift = 0, bits;
534
535
16.5k
    *out++ = '&';
536
16.5k
    *out++ = '#';
537
16.5k
    *out++ = 'x';
538
539
16.5k
    bits = val;
540
16.5k
    if (bits & 0xFF0000) {
541
79
        shift = 16;
542
79
        bits &= 0xFF0000;
543
16.4k
    } else if (bits & 0x00FF00) {
544
1.73k
        shift = 8;
545
1.73k
        bits &= 0x00FF00;
546
1.73k
    }
547
16.5k
    if (bits & 0xF0F0F0) {
548
14.7k
        shift += 4;
549
14.7k
    }
550
551
35.0k
    do {
552
35.0k
        int d = (val >> shift) & 0x0F;
553
554
35.0k
        if (d < 10)
555
18.3k
            *out++ = '0' + d;
556
16.7k
        else
557
16.7k
            *out++ = 'A' + (d - 10);
558
559
35.0k
  shift -= 4;
560
35.0k
    } while (shift >= 0);
561
562
16.5k
    *out++ = ';';
563
564
16.5k
    return(out - buf);
565
16.5k
}
566
567
/*
568
 * xmlSerializeDecCharRef:
569
 * @buf:  a char buffer
570
 * @val:  a codepoint
571
 *
572
 * Serializes a decimal char ref like &#38;
573
 *
574
 * Writes at most 10 bytes. Does not include a terminating zero byte.
575
 *
576
 * Returns the number of bytes written.
577
 */
578
int
579
113M
xmlSerializeDecCharRef(char *buf, int val) {
580
113M
    char *out = buf;
581
113M
    int len, i;
582
583
113M
    *out++ = '&';
584
113M
    *out++ = '#';
585
586
113M
    if (val < 100) {
587
384
        len = (val < 10) ? 1 : 2;
588
113M
    } else if (val < 10000) {
589
113M
        len = (val < 1000) ? 3 : 4;
590
113M
    } else if (val < 1000000) {
591
7.28k
        len = (val < 100000) ? 5 : 6;
592
7.28k
    } else {
593
225
        len = 7;
594
225
    }
595
596
462M
    for (i = len - 1; i >= 0; i--) {
597
349M
        out[i] = '0' + val % 10;
598
349M
        val /= 10;
599
349M
    }
600
601
113M
    out[len] = ';';
602
603
113M
    return(len + 3);
604
113M
}
605
606
static const char xmlEscapeSafe[128] = {
607
    0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 0, 0, 0, 0,
608
    0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
609
    1, 1, 0, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1,
610
    1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 0, 1,
611
    1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
612
    1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
613
    1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
614
    1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1
615
};
616
617
/*
618
 * xmlEscapeText:
619
 * @text:  input text
620
 * @flags:  XML_ESCAPE flags
621
 *
622
 * Escapes certain characters with char refs.
623
 *
624
 * XML_ESCAPE_ATTR: for attribute content.
625
 * XML_ESCAPE_NON_ASCII: escape non-ASCII chars.
626
 * XML_ESCAPE_HTML: for HTML content.
627
 * XML_ESCAPE_QUOT: escape double quotes.
628
 * XML_ESCAPE_ALLOW_INVALID: allow invalid characters.
629
 *
630
 * Returns an escaped string or NULL if a memory allocation failed.
631
 */
632
xmlChar *
633
113k
xmlEscapeText(const xmlChar *text, int flags) {
634
113k
    const xmlChar *cur;
635
113k
    xmlChar *buffer;
636
113k
    xmlChar *out;
637
113k
    const xmlChar *unescaped;
638
113k
    size_t size = 50;
639
640
113k
    buffer = xmlMalloc(size + 1);
641
113k
    if (buffer == NULL)
642
44
        return(NULL);
643
113k
    out = buffer;
644
645
113k
    cur = text;
646
113k
    unescaped = cur;
647
648
424k
    while (*cur != '\0') {
649
311k
        char buf[12];
650
311k
  const xmlChar *end;
651
311k
        const xmlChar *repl;
652
311k
        size_t used;
653
311k
        size_t replSize;
654
311k
        size_t unescapedSize;
655
311k
        size_t totalSize;
656
311k
        int chunkSize = 1;
657
311k
        int c;
658
659
        /* accelerator */
660
75.4M
  while (1) {
661
75.4M
            c = *cur;
662
663
75.4M
            if (c < 0x80) {
664
6.77M
                if (!xmlEscapeSafe[*cur])
665
311k
                    break;
666
68.7M
            } else {
667
68.7M
               if (flags & XML_ESCAPE_NON_ASCII)
668
0
                   break;
669
68.7M
            }
670
75.1M
            cur += 1;
671
75.1M
        }
672
673
311k
        if (c == 0) {
674
110k
            chunkSize = 0;
675
110k
            repl = BAD_CAST "";
676
110k
            replSize = 0;
677
201k
        } else if (c == '<') {
678
      /*
679
       * Special handling of server side include in HTML attributes
680
       */
681
6.64k
      if ((flags & XML_ESCAPE_HTML) && (flags & XML_ESCAPE_ATTR) &&
682
5.45k
          (cur[1] == '!') && (cur[2] == '-') && (cur[3] == '-') &&
683
568
          ((end = xmlStrstr(cur, BAD_CAST "-->")) != NULL)) {
684
514
                chunkSize = (end - cur) + 3;
685
514
                repl = cur;
686
514
                replSize = chunkSize;
687
6.13k
      } else {
688
6.13k
                repl = BAD_CAST "&lt;";
689
6.13k
                replSize = 4;
690
6.13k
            }
691
194k
  } else if (c == '>') {
692
120k
            repl = BAD_CAST "&gt;";
693
120k
            replSize = 4;
694
120k
  } else if (c == '&') {
695
      /*
696
       * Special handling of &{...} construct from HTML 4, see
697
       * http://www.w3.org/TR/html401/appendix/notes.html#h-B.7.1
698
       */
699
4.18k
      if ((flags & XML_ESCAPE_HTML) && (flags & XML_ESCAPE_ATTR) &&
700
2.98k
                (cur[1] == '{') && (end = xmlStrchr(cur, '}'))) {
701
1.25k
                chunkSize = (end - cur) + 1;
702
1.25k
                repl = cur;
703
1.25k
                replSize = chunkSize;
704
2.93k
      } else {
705
2.93k
                repl = BAD_CAST "&amp;";
706
2.93k
                replSize = 5;
707
2.93k
            }
708
70.5k
  } else if ((flags & XML_ESCAPE_QUOT) && (c == '"')) {
709
0
            repl = BAD_CAST "&quot;";
710
0
            replSize = 6;
711
70.5k
  } else if (((flags & XML_ESCAPE_HTML) == 0) && (c == '\r')) {
712
0
      repl = BAD_CAST "&#13;";
713
0
            replSize = 5;
714
70.5k
  } else if ((flags & XML_ESCAPE_NON_ASCII) && (c >= 0x80)) {
715
0
            int val;
716
717
0
            chunkSize = 4;
718
0
            val = xmlGetUTF8Char(cur, &chunkSize);
719
0
            if (val < 0) {
720
0
                val = 0xFFFD;
721
0
                chunkSize = 1;
722
0
            } else if (((flags & XML_ESCAPE_ALLOW_INVALID) == 0) &&
723
0
                       (!IS_CHAR(val))) {
724
0
                val = 0xFFFD;
725
0
            }
726
727
0
            replSize = xmlSerializeHexCharRef(buf, val);
728
0
            repl = BAD_CAST buf;
729
70.5k
  } else if ((flags & (XML_ESCAPE_ALLOW_INVALID | XML_ESCAPE_HTML)) ||
730
0
                   (c >= 0x20) ||
731
70.5k
             (c == '\n') || (c == '\t') || (c == '\r')) {
732
      /* default case, just copy */
733
70.5k
            cur += 1;
734
70.5k
            if (*cur != 0)
735
69.6k
                continue;
736
737
859
            chunkSize = 0;
738
859
            repl = BAD_CAST "";
739
859
            replSize = 0;
740
859
  } else {
741
            /* ignore */
742
0
            repl = BAD_CAST "";
743
0
            replSize = 0;
744
0
        }
745
746
241k
        used = out - buffer;
747
241k
        unescapedSize = cur - unescaped;
748
241k
        totalSize = unescapedSize + replSize;
749
750
241k
  cur += chunkSize;
751
752
241k
        if (totalSize > size - used) {
753
18.7k
            xmlChar *tmp;
754
18.7k
            int newSize;
755
756
18.7k
            if ((size > (SIZE_MAX - 1) / 2) ||
757
18.7k
                (totalSize > (SIZE_MAX - 1) / 2 - size)) {
758
0
                xmlFree(buffer);
759
0
                return(NULL);
760
0
            }
761
18.7k
            newSize = size + totalSize;
762
18.7k
            if (*cur != 0)
763
11.5k
                newSize *= 2;
764
18.7k
            tmp = xmlRealloc(buffer, newSize + 1);
765
18.7k
            if (tmp == NULL) {
766
1
                xmlFree(buffer);
767
1
                return(NULL);
768
1
            }
769
18.7k
            buffer = tmp;
770
18.7k
            size = newSize;
771
18.7k
            out = buffer + used;
772
18.7k
        }
773
774
241k
        memcpy(out, unescaped, unescapedSize);
775
241k
        out += unescapedSize;
776
241k
        memcpy(out, repl, replSize);
777
241k
        out += replSize;
778
779
241k
        unescaped = cur;
780
241k
    }
781
782
113k
    *out = 0;
783
113k
    return(buffer);
784
113k
}
785
786
/**
787
 * xmlEncodeEntitiesInternal:
788
 * @doc:  the document containing the string
789
 * @input:  A string to convert to XML.
790
 * @flags:  XML_ESCAPE flags
791
 *
792
 * Do a global encoding of a string, replacing the predefined entities
793
 * and non ASCII values with their entities and CharRef counterparts.
794
 * Contrary to xmlEncodeEntities, this routine is reentrant, and result
795
 * must be deallocated.
796
 *
797
 * Returns A newly allocated string with the substitution done.
798
 */
799
xmlChar *
800
xmlEncodeEntitiesInternal(xmlDocPtr doc, const xmlChar *input,
801
113k
                          unsigned flags) {
802
113k
    if (input == NULL)
803
0
        return(NULL);
804
805
113k
    if ((doc != NULL) && (doc->type == XML_HTML_DOCUMENT_NODE))
806
113k
        flags |= XML_ESCAPE_HTML;
807
0
    else if ((doc == NULL) || (doc->encoding == NULL))
808
0
        flags |= XML_ESCAPE_NON_ASCII;
809
810
113k
    return(xmlEscapeText(input, flags));
811
113k
}
812
813
/**
814
 * xmlEncodeEntitiesReentrant:
815
 * @doc:  the document containing the string
816
 * @input:  A string to convert to XML.
817
 *
818
 * Do a global encoding of a string, replacing the predefined entities
819
 * and non ASCII values with their entities and CharRef counterparts.
820
 * Contrary to xmlEncodeEntities, this routine is reentrant, and result
821
 * must be deallocated.
822
 *
823
 * This escapes '<', '>', '&' and '\r'. If the document has no encoding,
824
 * non-ASCII codepoints are escaped. There is some special handling for
825
 * HTML documents.
826
 *
827
 * Returns A newly allocated string with the substitution done.
828
 */
829
xmlChar *
830
57.7k
xmlEncodeEntitiesReentrant(xmlDocPtr doc, const xmlChar *input) {
831
57.7k
    return xmlEncodeEntitiesInternal(doc, input, 0);
832
57.7k
}
833
834
/**
835
 * xmlEncodeSpecialChars:
836
 * @doc:  unused
837
 * @input:  A string to convert to XML.
838
 *
839
 * Do a global encoding of a string, replacing the predefined entities
840
 * this routine is reentrant, and result must be deallocated.
841
 *
842
 * This escapes '<', '>', '&', '"' and '\r' chars.
843
 *
844
 * Returns A newly allocated string with the substitution done.
845
 */
846
xmlChar *
847
xmlEncodeSpecialChars(const xmlDoc *doc ATTRIBUTE_UNUSED,
848
0
                      const xmlChar *input) {
849
0
    if (input == NULL)
850
0
        return(NULL);
851
852
0
    return(xmlEscapeText(input, XML_ESCAPE_QUOT | XML_ESCAPE_ALLOW_INVALID));
853
0
}
854
855
/**
856
 * xmlCreateEntitiesTable:
857
 *
858
 * create and initialize an empty entities hash table.
859
 * This really doesn't make sense and should be deprecated
860
 *
861
 * Returns the xmlEntitiesTablePtr just created or NULL in case of error.
862
 */
863
xmlEntitiesTablePtr
864
0
xmlCreateEntitiesTable(void) {
865
0
    return((xmlEntitiesTablePtr) xmlHashCreate(0));
866
0
}
867
868
/**
869
 * xmlFreeEntityWrapper:
870
 * @entity:  An entity
871
 * @name:  its name
872
 *
873
 * Deallocate the memory used by an entities in the hash table.
874
 */
875
static void
876
145k
xmlFreeEntityWrapper(void *entity, const xmlChar *name ATTRIBUTE_UNUSED) {
877
145k
    if (entity != NULL)
878
145k
  xmlFreeEntity((xmlEntityPtr) entity);
879
145k
}
880
881
/**
882
 * xmlFreeEntitiesTable:
883
 * @table:  An entity table
884
 *
885
 * Deallocate the memory used by an entities hash table.
886
 */
887
void
888
82.3k
xmlFreeEntitiesTable(xmlEntitiesTablePtr table) {
889
82.3k
    xmlHashFree(table, xmlFreeEntityWrapper);
890
82.3k
}
891
892
/**
893
 * xmlCopyEntity:
894
 * @ent:  An entity
895
 *
896
 * Build a copy of an entity
897
 *
898
 * Returns the new xmlEntitiesPtr or NULL in case of error.
899
 */
900
static void *
901
0
xmlCopyEntity(void *payload, const xmlChar *name ATTRIBUTE_UNUSED) {
902
0
    xmlEntityPtr ent = (xmlEntityPtr) payload;
903
0
    xmlEntityPtr cur;
904
905
0
    cur = (xmlEntityPtr) xmlMalloc(sizeof(xmlEntity));
906
0
    if (cur == NULL)
907
0
  return(NULL);
908
0
    memset(cur, 0, sizeof(xmlEntity));
909
0
    cur->type = XML_ENTITY_DECL;
910
911
0
    cur->etype = ent->etype;
912
0
    if (ent->name != NULL) {
913
0
  cur->name = xmlStrdup(ent->name);
914
0
        if (cur->name == NULL)
915
0
            goto error;
916
0
    }
917
0
    if (ent->ExternalID != NULL) {
918
0
  cur->ExternalID = xmlStrdup(ent->ExternalID);
919
0
        if (cur->ExternalID == NULL)
920
0
            goto error;
921
0
    }
922
0
    if (ent->SystemID != NULL) {
923
0
  cur->SystemID = xmlStrdup(ent->SystemID);
924
0
        if (cur->SystemID == NULL)
925
0
            goto error;
926
0
    }
927
0
    if (ent->content != NULL) {
928
0
  cur->content = xmlStrdup(ent->content);
929
0
        if (cur->content == NULL)
930
0
            goto error;
931
0
    }
932
0
    if (ent->orig != NULL) {
933
0
  cur->orig = xmlStrdup(ent->orig);
934
0
        if (cur->orig == NULL)
935
0
            goto error;
936
0
    }
937
0
    if (ent->URI != NULL) {
938
0
  cur->URI = xmlStrdup(ent->URI);
939
0
        if (cur->URI == NULL)
940
0
            goto error;
941
0
    }
942
0
    return(cur);
943
944
0
error:
945
0
    xmlFreeEntity(cur);
946
0
    return(NULL);
947
0
}
948
949
/**
950
 * xmlCopyEntitiesTable:
951
 * @table:  An entity table
952
 *
953
 * Build a copy of an entity table.
954
 *
955
 * Returns the new xmlEntitiesTablePtr or NULL in case of error.
956
 */
957
xmlEntitiesTablePtr
958
0
xmlCopyEntitiesTable(xmlEntitiesTablePtr table) {
959
0
    return(xmlHashCopySafe(table, xmlCopyEntity, xmlFreeEntityWrapper));
960
0
}
961
962
#ifdef LIBXML_OUTPUT_ENABLED
963
964
/**
965
 * xmlDumpEntityDecl:
966
 * @buf:  An XML buffer.
967
 * @ent:  An entity table
968
 *
969
 * This will dump the content of the entity table as an XML DTD definition
970
 */
971
void
972
0
xmlDumpEntityDecl(xmlBufferPtr buf, xmlEntityPtr ent) {
973
0
    xmlSaveCtxtPtr save;
974
975
0
    if ((buf == NULL) || (ent == NULL))
976
0
        return;
977
978
0
    save = xmlSaveToBuffer(buf, NULL, 0);
979
0
    xmlSaveTree(save, (xmlNodePtr) ent);
980
0
    if (xmlSaveFinish(save) != XML_ERR_OK)
981
0
        xmlFree(xmlBufferDetach(buf));
982
0
}
983
984
/**
985
 * xmlDumpEntityDeclScan:
986
 * @ent:  An entity table
987
 * @buf:  An XML buffer.
988
 *
989
 * When using the hash table scan function, arguments need to be reversed
990
 */
991
static void
992
xmlDumpEntityDeclScan(void *ent, void *save,
993
0
                      const xmlChar *name ATTRIBUTE_UNUSED) {
994
0
    xmlSaveTree(save, ent);
995
0
}
996
997
/**
998
 * xmlDumpEntitiesTable:
999
 * @buf:  An XML buffer.
1000
 * @table:  An entity table
1001
 *
1002
 * This will dump the content of the entity table as an XML DTD definition
1003
 */
1004
void
1005
0
xmlDumpEntitiesTable(xmlBufferPtr buf, xmlEntitiesTablePtr table) {
1006
0
    xmlSaveCtxtPtr save;
1007
1008
0
    if ((buf == NULL) || (table == NULL))
1009
0
        return;
1010
1011
0
    save = xmlSaveToBuffer(buf, NULL, 0);
1012
0
    xmlHashScan(table, xmlDumpEntityDeclScan, save);
1013
0
    if (xmlSaveFinish(save) != XML_ERR_OK)
1014
0
        xmlFree(xmlBufferDetach(buf));
1015
0
}
1016
#endif /* LIBXML_OUTPUT_ENABLED */