Coverage Report

Created: 2026-01-09 07:04

next uncovered line (L), next uncovered region (R), next uncovered branch (B)
/src/libxml2/entities.c
Line
Count
Source
1
/*
2
 * entities.c : implementation for the XML entities handling
3
 *
4
 * See Copyright for the status of this software.
5
 *
6
 * daniel@veillard.com
7
 */
8
9
/* To avoid EBCDIC trouble when parsing on zOS */
10
#if defined(__MVS__)
11
#pragma convert("ISO8859-1")
12
#endif
13
14
#define IN_LIBXML
15
#include "libxml.h"
16
17
#include <string.h>
18
#include <stdlib.h>
19
20
#include <libxml/xmlmemory.h>
21
#include <libxml/hash.h>
22
#include <libxml/entities.h>
23
#include <libxml/parser.h>
24
#include <libxml/parserInternals.h>
25
#include <libxml/xmlerror.h>
26
#include <libxml/dict.h>
27
#include <libxml/xmlsave.h>
28
29
#include "private/entities.h"
30
#include "private/error.h"
31
32
#ifndef SIZE_MAX
33
  #define SIZE_MAX ((size_t) -1)
34
#endif
35
36
/*
37
 * The XML predefined entities.
38
 */
39
40
static xmlEntity xmlEntityLt = {
41
    NULL, XML_ENTITY_DECL, BAD_CAST "lt",
42
    NULL, NULL, NULL, NULL, NULL, NULL,
43
    BAD_CAST "<", BAD_CAST "<", 1,
44
    XML_INTERNAL_PREDEFINED_ENTITY,
45
    NULL, NULL, NULL, NULL, 0, 0, 0
46
};
47
static xmlEntity xmlEntityGt = {
48
    NULL, XML_ENTITY_DECL, BAD_CAST "gt",
49
    NULL, NULL, NULL, NULL, NULL, NULL,
50
    BAD_CAST ">", BAD_CAST ">", 1,
51
    XML_INTERNAL_PREDEFINED_ENTITY,
52
    NULL, NULL, NULL, NULL, 0, 0, 0
53
};
54
static xmlEntity xmlEntityAmp = {
55
    NULL, XML_ENTITY_DECL, BAD_CAST "amp",
56
    NULL, NULL, NULL, NULL, NULL, NULL,
57
    BAD_CAST "&", BAD_CAST "&", 1,
58
    XML_INTERNAL_PREDEFINED_ENTITY,
59
    NULL, NULL, NULL, NULL, 0, 0, 0
60
};
61
static xmlEntity xmlEntityQuot = {
62
    NULL, XML_ENTITY_DECL, BAD_CAST "quot",
63
    NULL, NULL, NULL, NULL, NULL, NULL,
64
    BAD_CAST "\"", BAD_CAST "\"", 1,
65
    XML_INTERNAL_PREDEFINED_ENTITY,
66
    NULL, NULL, NULL, NULL, 0, 0, 0
67
};
68
static xmlEntity xmlEntityApos = {
69
    NULL, XML_ENTITY_DECL, BAD_CAST "apos",
70
    NULL, NULL, NULL, NULL, NULL, NULL,
71
    BAD_CAST "'", BAD_CAST "'", 1,
72
    XML_INTERNAL_PREDEFINED_ENTITY,
73
    NULL, NULL, NULL, NULL, 0, 0, 0
74
};
75
76
/*
77
 * xmlFreeEntity:
78
 * @entity:  an entity
79
 *
80
 * Frees the entity.
81
 */
82
void
83
xmlFreeEntity(xmlEntityPtr entity)
84
116k
{
85
116k
    xmlDictPtr dict = NULL;
86
87
116k
    if (entity == NULL)
88
0
        return;
89
90
116k
    if (entity->doc != NULL)
91
116k
        dict = entity->doc->dict;
92
93
94
116k
    if ((entity->children) &&
95
2.96k
        (entity == (xmlEntityPtr) entity->children->parent))
96
2.96k
        xmlFreeNodeList(entity->children);
97
116k
    if ((entity->name != NULL) &&
98
116k
        ((dict == NULL) || (!xmlDictOwns(dict, entity->name))))
99
32.5k
        xmlFree((char *) entity->name);
100
116k
    if (entity->ExternalID != NULL)
101
14.3k
        xmlFree((char *) entity->ExternalID);
102
116k
    if (entity->SystemID != NULL)
103
48.5k
        xmlFree((char *) entity->SystemID);
104
116k
    if (entity->URI != NULL)
105
45.9k
        xmlFree((char *) entity->URI);
106
116k
    if (entity->content != NULL)
107
65.9k
        xmlFree((char *) entity->content);
108
116k
    if (entity->orig != NULL)
109
60.2k
        xmlFree((char *) entity->orig);
110
116k
    xmlFree(entity);
111
116k
}
112
113
/*
114
 * xmlCreateEntity:
115
 *
116
 * internal routine doing the entity node structures allocations
117
 */
118
static xmlEntityPtr
119
xmlCreateEntity(xmlDocPtr doc, const xmlChar *name, int type,
120
          const xmlChar *ExternalID, const xmlChar *SystemID,
121
96.7k
          const xmlChar *content) {
122
96.7k
    xmlEntityPtr ret;
123
124
96.7k
    ret = (xmlEntityPtr) xmlMalloc(sizeof(xmlEntity));
125
96.7k
    if (ret == NULL)
126
9
  return(NULL);
127
96.7k
    memset(ret, 0, sizeof(xmlEntity));
128
96.7k
    ret->doc = doc;
129
96.7k
    ret->type = XML_ENTITY_DECL;
130
131
    /*
132
     * fill the structure.
133
     */
134
96.7k
    ret->etype = (xmlEntityType) type;
135
96.7k
    if ((doc == NULL) || (doc->dict == NULL))
136
12.3k
  ret->name = xmlStrdup(name);
137
84.3k
    else
138
84.3k
        ret->name = xmlDictLookup(doc->dict, name, -1);
139
96.7k
    if (ret->name == NULL)
140
3
        goto error;
141
96.7k
    if (ExternalID != NULL) {
142
14.3k
        ret->ExternalID = xmlStrdup(ExternalID);
143
14.3k
        if (ret->ExternalID == NULL)
144
1
            goto error;
145
14.3k
    }
146
96.7k
    if (SystemID != NULL) {
147
47.7k
        ret->SystemID = xmlStrdup(SystemID);
148
47.7k
        if (ret->SystemID == NULL)
149
5
            goto error;
150
47.7k
    }
151
96.7k
    if (content != NULL) {
152
45.7k
        ret->length = xmlStrlen(content);
153
45.7k
  ret->content = xmlStrndup(content, ret->length);
154
45.7k
        if (ret->content == NULL)
155
5
            goto error;
156
50.9k
     } else {
157
50.9k
        ret->length = 0;
158
50.9k
        ret->content = NULL;
159
50.9k
    }
160
96.7k
    ret->URI = NULL; /* to be computed by the layer knowing
161
      the defining entity */
162
96.7k
    ret->orig = NULL;
163
164
96.7k
    return(ret);
165
166
14
error:
167
14
    xmlFreeEntity(ret);
168
14
    return(NULL);
169
96.7k
}
170
171
/**
172
 * xmlAddEntity:
173
 * @doc:  the document
174
 * @extSubset:  add to the external or internal subset
175
 * @name:  the entity name
176
 * @type:  the entity type XML_xxx_yyy_ENTITY
177
 * @ExternalID:  the entity external ID if available
178
 * @SystemID:  the entity system ID if available
179
 * @content:  the entity content
180
 * @out:  pointer to resulting entity (optional)
181
 *
182
 * Register a new entity for this document.
183
 *
184
 * Available since 2.13.0.
185
 *
186
 * Returns an xmlParserErrors error code.
187
 */
188
int
189
xmlAddEntity(xmlDocPtr doc, int extSubset, const xmlChar *name, int type,
190
    const xmlChar *ExternalID, const xmlChar *SystemID,
191
99.3k
    const xmlChar *content, xmlEntityPtr *out) {
192
99.3k
    xmlDtdPtr dtd;
193
99.3k
    xmlDictPtr dict = NULL;
194
99.3k
    xmlEntitiesTablePtr table = NULL;
195
99.3k
    xmlEntityPtr ret, predef;
196
99.3k
    int res;
197
198
99.3k
    if (out != NULL)
199
99.3k
        *out = NULL;
200
99.3k
    if ((doc == NULL) || (name == NULL))
201
0
  return(XML_ERR_ARGUMENT);
202
99.3k
    dict = doc->dict;
203
204
99.3k
    if (extSubset)
205
13.2k
        dtd = doc->extSubset;
206
86.0k
    else
207
86.0k
        dtd = doc->intSubset;
208
99.3k
    if (dtd == NULL)
209
0
        return(XML_DTD_NO_DTD);
210
211
99.3k
    switch (type) {
212
25.0k
        case XML_INTERNAL_GENERAL_ENTITY:
213
42.1k
        case XML_EXTERNAL_GENERAL_PARSED_ENTITY:
214
42.4k
        case XML_EXTERNAL_GENERAL_UNPARSED_ENTITY:
215
42.4k
            predef = xmlGetPredefinedEntity(name);
216
42.4k
            if (predef != NULL) {
217
3.95k
                int valid = 0;
218
219
                /* 4.6 Predefined Entities */
220
3.95k
                if ((type == XML_INTERNAL_GENERAL_ENTITY) &&
221
3.67k
                    (content != NULL)) {
222
3.36k
                    int c = predef->content[0];
223
224
3.36k
                    if (((content[0] == c) && (content[1] == 0)) &&
225
1.32k
                        ((c == '>') || (c == '\'') || (c == '"'))) {
226
1.10k
                        valid = 1;
227
2.25k
                    } else if ((content[0] == '&') && (content[1] == '#')) {
228
830
                        if (content[2] == 'x') {
229
302
                            xmlChar *hex = BAD_CAST "0123456789ABCDEF";
230
302
                            xmlChar ref[] = "00;";
231
232
302
                            ref[0] = hex[c / 16 % 16];
233
302
                            ref[1] = hex[c % 16];
234
302
                            if (xmlStrcasecmp(&content[3], ref) == 0)
235
0
                                valid = 1;
236
528
                        } else {
237
528
                            xmlChar ref[] = "00;";
238
239
528
                            ref[0] = '0' + c / 10 % 10;
240
528
                            ref[1] = '0' + c % 10;
241
528
                            if (xmlStrEqual(&content[2], ref))
242
227
                                valid = 1;
243
528
                        }
244
830
                    }
245
3.36k
                }
246
3.95k
                if (!valid)
247
2.62k
                    return(XML_ERR_REDECL_PREDEF_ENTITY);
248
3.95k
            }
249
39.7k
      if (dtd->entities == NULL) {
250
29.7k
    dtd->entities = xmlHashCreateDict(0, dict);
251
29.7k
                if (dtd->entities == NULL)
252
6
                    return(XML_ERR_NO_MEMORY);
253
29.7k
            }
254
39.7k
      table = dtd->entities;
255
39.7k
      break;
256
23.5k
        case XML_INTERNAL_PARAMETER_ENTITY:
257
56.9k
        case XML_EXTERNAL_PARAMETER_ENTITY:
258
56.9k
      if (dtd->pentities == NULL) {
259
27.0k
    dtd->pentities = xmlHashCreateDict(0, dict);
260
27.0k
                if (dtd->pentities == NULL)
261
2
                    return(XML_ERR_NO_MEMORY);
262
27.0k
            }
263
56.9k
      table = dtd->pentities;
264
56.9k
      break;
265
0
        default:
266
0
      return(XML_ERR_ARGUMENT);
267
99.3k
    }
268
96.7k
    ret = xmlCreateEntity(dtd->doc, name, type, ExternalID, SystemID, content);
269
96.7k
    if (ret == NULL)
270
23
        return(XML_ERR_NO_MEMORY);
271
272
96.7k
    res = xmlHashAdd(table, name, ret);
273
96.7k
    if (res < 0) {
274
4
        xmlFreeEntity(ret);
275
4
        return(XML_ERR_NO_MEMORY);
276
96.6k
    } else if (res == 0) {
277
  /*
278
   * entity was already defined at another level.
279
   */
280
3.94k
        xmlFreeEntity(ret);
281
3.94k
  return(XML_WAR_ENTITY_REDEFINED);
282
3.94k
    }
283
284
    /*
285
     * Link it to the DTD
286
     */
287
92.7k
    ret->parent = dtd;
288
92.7k
    ret->doc = dtd->doc;
289
92.7k
    if (dtd->last == NULL) {
290
42.1k
  dtd->children = dtd->last = (xmlNodePtr) ret;
291
50.5k
    } else {
292
50.5k
  dtd->last->next = (xmlNodePtr) ret;
293
50.5k
  ret->prev = dtd->last;
294
50.5k
  dtd->last = (xmlNodePtr) ret;
295
50.5k
    }
296
297
92.7k
    if (out != NULL)
298
92.7k
        *out = ret;
299
92.7k
    return(0);
300
96.7k
}
301
302
/**
303
 * xmlGetPredefinedEntity:
304
 * @name:  the entity name
305
 *
306
 * Check whether this name is an predefined entity.
307
 *
308
 * Returns NULL if not, otherwise the entity
309
 */
310
xmlEntityPtr
311
1.31M
xmlGetPredefinedEntity(const xmlChar *name) {
312
1.31M
    if (name == NULL) return(NULL);
313
1.31M
    switch (name[0]) {
314
17.1k
        case 'l':
315
17.1k
      if (xmlStrEqual(name, BAD_CAST "lt"))
316
11.5k
          return(&xmlEntityLt);
317
5.63k
      break;
318
55.5k
        case 'g':
319
55.5k
      if (xmlStrEqual(name, BAD_CAST "gt"))
320
53.5k
          return(&xmlEntityGt);
321
1.95k
      break;
322
467k
        case 'a':
323
467k
      if (xmlStrEqual(name, BAD_CAST "amp"))
324
76.5k
          return(&xmlEntityAmp);
325
390k
      if (xmlStrEqual(name, BAD_CAST "apos"))
326
1.66k
          return(&xmlEntityApos);
327
389k
      break;
328
415k
        case 'q':
329
415k
      if (xmlStrEqual(name, BAD_CAST "quot"))
330
851
          return(&xmlEntityQuot);
331
414k
      break;
332
414k
  default:
333
357k
      break;
334
1.31M
    }
335
1.16M
    return(NULL);
336
1.31M
}
337
338
/**
339
 * xmlAddDtdEntity:
340
 * @doc:  the document
341
 * @name:  the entity name
342
 * @type:  the entity type XML_xxx_yyy_ENTITY
343
 * @ExternalID:  the entity external ID if available
344
 * @SystemID:  the entity system ID if available
345
 * @content:  the entity content
346
 *
347
 * Register a new entity for this document DTD external subset.
348
 *
349
 * Returns a pointer to the entity or NULL in case of error
350
 */
351
xmlEntityPtr
352
xmlAddDtdEntity(xmlDocPtr doc, const xmlChar *name, int type,
353
          const xmlChar *ExternalID, const xmlChar *SystemID,
354
0
    const xmlChar *content) {
355
0
    xmlEntityPtr ret;
356
357
0
    xmlAddEntity(doc, 1, name, type, ExternalID, SystemID, content, &ret);
358
0
    return(ret);
359
0
}
360
361
/**
362
 * xmlAddDocEntity:
363
 * @doc:  the document
364
 * @name:  the entity name
365
 * @type:  the entity type XML_xxx_yyy_ENTITY
366
 * @ExternalID:  the entity external ID if available
367
 * @SystemID:  the entity system ID if available
368
 * @content:  the entity content
369
 *
370
 * Register a new entity for this document.
371
 *
372
 * Returns a pointer to the entity or NULL in case of error
373
 */
374
xmlEntityPtr
375
xmlAddDocEntity(xmlDocPtr doc, const xmlChar *name, int type,
376
          const xmlChar *ExternalID, const xmlChar *SystemID,
377
0
          const xmlChar *content) {
378
0
    xmlEntityPtr ret;
379
380
0
    xmlAddEntity(doc, 0, name, type, ExternalID, SystemID, content, &ret);
381
0
    return(ret);
382
0
}
383
384
/**
385
 * xmlNewEntity:
386
 * @doc:  the document
387
 * @name:  the entity name
388
 * @type:  the entity type XML_xxx_yyy_ENTITY
389
 * @ExternalID:  the entity external ID if available
390
 * @SystemID:  the entity system ID if available
391
 * @content:  the entity content
392
 *
393
 * Create a new entity, this differs from xmlAddDocEntity() that if
394
 * the document is NULL or has no internal subset defined, then an
395
 * unlinked entity structure will be returned, it is then the responsibility
396
 * of the caller to link it to the document later or free it when not needed
397
 * anymore.
398
 *
399
 * Returns a pointer to the entity or NULL in case of error
400
 */
401
xmlEntityPtr
402
xmlNewEntity(xmlDocPtr doc, const xmlChar *name, int type,
403
       const xmlChar *ExternalID, const xmlChar *SystemID,
404
0
       const xmlChar *content) {
405
0
    if ((doc != NULL) && (doc->intSubset != NULL)) {
406
0
  return(xmlAddDocEntity(doc, name, type, ExternalID, SystemID, content));
407
0
    }
408
0
    if (name == NULL)
409
0
        return(NULL);
410
0
    return(xmlCreateEntity(doc, name, type, ExternalID, SystemID, content));
411
0
}
412
413
/**
414
 * xmlGetEntityFromTable:
415
 * @table:  an entity table
416
 * @name:  the entity name
417
 * @parameter:  look for parameter entities
418
 *
419
 * Do an entity lookup in the table.
420
 * returns the corresponding parameter entity, if found.
421
 *
422
 * Returns A pointer to the entity structure or NULL if not found.
423
 */
424
static xmlEntityPtr
425
624k
xmlGetEntityFromTable(xmlEntitiesTablePtr table, const xmlChar *name) {
426
624k
    return((xmlEntityPtr) xmlHashLookup(table, name));
427
624k
}
428
429
/**
430
 * xmlGetParameterEntity:
431
 * @doc:  the document referencing the entity
432
 * @name:  the entity name
433
 *
434
 * Do an entity lookup in the internal and external subsets and
435
 * returns the corresponding parameter entity, if found.
436
 *
437
 * Returns A pointer to the entity structure or NULL if not found.
438
 */
439
xmlEntityPtr
440
106k
xmlGetParameterEntity(xmlDocPtr doc, const xmlChar *name) {
441
106k
    xmlEntitiesTablePtr table;
442
106k
    xmlEntityPtr ret;
443
444
106k
    if (doc == NULL)
445
460
  return(NULL);
446
106k
    if ((doc->intSubset != NULL) && (doc->intSubset->pentities != NULL)) {
447
101k
  table = (xmlEntitiesTablePtr) doc->intSubset->pentities;
448
101k
  ret = xmlGetEntityFromTable(table, name);
449
101k
  if (ret != NULL)
450
70.3k
      return(ret);
451
101k
    }
452
35.7k
    if ((doc->extSubset != NULL) && (doc->extSubset->pentities != NULL)) {
453
12.4k
  table = (xmlEntitiesTablePtr) doc->extSubset->pentities;
454
12.4k
  return(xmlGetEntityFromTable(table, name));
455
12.4k
    }
456
23.2k
    return(NULL);
457
35.7k
}
458
459
/**
460
 * xmlGetDtdEntity:
461
 * @doc:  the document referencing the entity
462
 * @name:  the entity name
463
 *
464
 * Do an entity lookup in the DTD entity hash table and
465
 * returns the corresponding entity, if found.
466
 * Note: the first argument is the document node, not the DTD node.
467
 *
468
 * Returns A pointer to the entity structure or NULL if not found.
469
 */
470
xmlEntityPtr
471
0
xmlGetDtdEntity(xmlDocPtr doc, const xmlChar *name) {
472
0
    xmlEntitiesTablePtr table;
473
474
0
    if (doc == NULL)
475
0
  return(NULL);
476
0
    if ((doc->extSubset != NULL) && (doc->extSubset->entities != NULL)) {
477
0
  table = (xmlEntitiesTablePtr) doc->extSubset->entities;
478
0
  return(xmlGetEntityFromTable(table, name));
479
0
    }
480
0
    return(NULL);
481
0
}
482
483
/**
484
 * xmlGetDocEntity:
485
 * @doc:  the document referencing the entity
486
 * @name:  the entity name
487
 *
488
 * Do an entity lookup in the document entity hash table and
489
 * returns the corresponding entity, otherwise a lookup is done
490
 * in the predefined entities too.
491
 *
492
 * Returns A pointer to the entity structure or NULL if not found.
493
 */
494
xmlEntityPtr
495
531k
xmlGetDocEntity(const xmlDoc *doc, const xmlChar *name) {
496
531k
    xmlEntityPtr cur;
497
531k
    xmlEntitiesTablePtr table;
498
499
531k
    if (doc != NULL) {
500
528k
  if ((doc->intSubset != NULL) && (doc->intSubset->entities != NULL)) {
501
454k
      table = (xmlEntitiesTablePtr) doc->intSubset->entities;
502
454k
      cur = xmlGetEntityFromTable(table, name);
503
454k
      if (cur != NULL)
504
359k
    return(cur);
505
454k
  }
506
168k
  if (doc->standalone != 1) {
507
168k
      if ((doc->extSubset != NULL) &&
508
58.5k
    (doc->extSubset->entities != NULL)) {
509
56.2k
    table = (xmlEntitiesTablePtr) doc->extSubset->entities;
510
56.2k
    cur = xmlGetEntityFromTable(table, name);
511
56.2k
    if (cur != NULL)
512
347
        return(cur);
513
56.2k
      }
514
168k
  }
515
168k
    }
516
171k
    return(xmlGetPredefinedEntity(name));
517
531k
}
518
519
/*
520
 * xmlSerializeHexCharRef:
521
 * @buf:  a char buffer
522
 * @val:  a codepoint
523
 *
524
 * Serializes a hex char ref like &#xA0;
525
 *
526
 * Writes at most 9 bytes. Does not include a terminating zero byte.
527
 *
528
 * Returns the number of bytes written.
529
 */
530
int
531
2.86k
xmlSerializeHexCharRef(char *buf, int val) {
532
2.86k
    char *out = buf;
533
2.86k
    int shift = 0, bits;
534
535
2.86k
    *out++ = '&';
536
2.86k
    *out++ = '#';
537
2.86k
    *out++ = 'x';
538
539
2.86k
    bits = val;
540
2.86k
    if (bits & 0xFF0000) {
541
109
        shift = 16;
542
109
        bits &= 0xFF0000;
543
2.75k
    } else if (bits & 0x00FF00) {
544
610
        shift = 8;
545
610
        bits &= 0x00FF00;
546
610
    }
547
2.86k
    if (bits & 0xF0F0F0) {
548
2.49k
        shift += 4;
549
2.49k
    }
550
551
7.01k
    do {
552
7.01k
        int d = (val >> shift) & 0x0F;
553
554
7.01k
        if (d < 10)
555
3.10k
            *out++ = '0' + d;
556
3.91k
        else
557
3.91k
            *out++ = 'A' + (d - 10);
558
559
7.01k
  shift -= 4;
560
7.01k
    } while (shift >= 0);
561
562
2.86k
    *out++ = ';';
563
564
2.86k
    return(out - buf);
565
2.86k
}
566
567
/*
568
 * xmlSerializeDecCharRef:
569
 * @buf:  a char buffer
570
 * @val:  a codepoint
571
 *
572
 * Serializes a decimal char ref like &#38;
573
 *
574
 * Writes at most 10 bytes. Does not include a terminating zero byte.
575
 *
576
 * Returns the number of bytes written.
577
 */
578
int
579
144M
xmlSerializeDecCharRef(char *buf, int val) {
580
144M
    char *out = buf;
581
144M
    int len, i;
582
583
144M
    *out++ = '&';
584
144M
    *out++ = '#';
585
586
144M
    if (val < 100) {
587
470
        len = (val < 10) ? 1 : 2;
588
144M
    } else if (val < 10000) {
589
144M
        len = (val < 1000) ? 3 : 4;
590
144M
    } else if (val < 1000000) {
591
8.28k
        len = (val < 100000) ? 5 : 6;
592
8.28k
    } else {
593
326
        len = 7;
594
326
    }
595
596
585M
    for (i = len - 1; i >= 0; i--) {
597
441M
        out[i] = '0' + val % 10;
598
441M
        val /= 10;
599
441M
    }
600
601
144M
    out[len] = ';';
602
603
144M
    return(len + 3);
604
144M
}
605
606
static const char xmlEscapeSafe[128] = {
607
    0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 0, 0, 0, 0,
608
    0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
609
    1, 1, 0, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1,
610
    1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 0, 1,
611
    1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
612
    1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
613
    1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
614
    1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1
615
};
616
617
/*
618
 * xmlEscapeText:
619
 * @text:  input text
620
 * @flags:  XML_ESCAPE flags
621
 *
622
 * Escapes certain characters with char refs.
623
 *
624
 * XML_ESCAPE_ATTR: for attribute content.
625
 * XML_ESCAPE_NON_ASCII: escape non-ASCII chars.
626
 * XML_ESCAPE_HTML: for HTML content.
627
 * XML_ESCAPE_QUOT: escape double quotes.
628
 * XML_ESCAPE_ALLOW_INVALID: allow invalid characters.
629
 *
630
 * Returns an escaped string or NULL if a memory allocation failed.
631
 */
632
xmlChar *
633
47.1k
xmlEscapeText(const xmlChar *text, int flags) {
634
47.1k
    const xmlChar *cur;
635
47.1k
    xmlChar *buffer;
636
47.1k
    xmlChar *out;
637
47.1k
    const xmlChar *unescaped;
638
47.1k
    size_t size = 50;
639
640
47.1k
    buffer = xmlMalloc(size + 1);
641
47.1k
    if (buffer == NULL)
642
59
        return(NULL);
643
47.0k
    out = buffer;
644
645
47.0k
    cur = text;
646
47.0k
    unescaped = cur;
647
648
250k
    while (*cur != '\0') {
649
203k
        char buf[12];
650
203k
  const xmlChar *end;
651
203k
        const xmlChar *repl;
652
203k
        size_t used;
653
203k
        size_t replSize;
654
203k
        size_t unescapedSize;
655
203k
        size_t totalSize;
656
203k
        int chunkSize = 1;
657
203k
        int c;
658
659
        /* accelerator */
660
136M
  while (1) {
661
136M
            c = *cur;
662
663
136M
            if (c < 0x80) {
664
41.3M
                if (!xmlEscapeSafe[*cur])
665
203k
                    break;
666
95.6M
            } else {
667
95.6M
               if (flags & XML_ESCAPE_NON_ASCII)
668
0
                   break;
669
95.6M
            }
670
136M
            cur += 1;
671
136M
        }
672
673
203k
        if (c == 0) {
674
44.4k
            chunkSize = 0;
675
44.4k
            repl = BAD_CAST "";
676
44.4k
            replSize = 0;
677
158k
        } else if (c == '<') {
678
      /*
679
       * Special handling of server side include in HTML attributes
680
       */
681
31.5k
      if ((flags & XML_ESCAPE_HTML) && (flags & XML_ESCAPE_ATTR) &&
682
30.9k
          (cur[1] == '!') && (cur[2] == '-') && (cur[3] == '-') &&
683
2.96k
          ((end = xmlStrstr(cur, BAD_CAST "-->")) != NULL)) {
684
2.66k
                chunkSize = (end - cur) + 3;
685
2.66k
                repl = cur;
686
2.66k
                replSize = chunkSize;
687
28.8k
      } else {
688
28.8k
                repl = BAD_CAST "&lt;";
689
28.8k
                replSize = 4;
690
28.8k
            }
691
127k
  } else if (c == '>') {
692
44.6k
            repl = BAD_CAST "&gt;";
693
44.6k
            replSize = 4;
694
82.7k
  } else if (c == '&') {
695
      /*
696
       * Special handling of &{...} construct from HTML 4, see
697
       * http://www.w3.org/TR/html401/appendix/notes.html#h-B.7.1
698
       */
699
9.03k
      if ((flags & XML_ESCAPE_HTML) && (flags & XML_ESCAPE_ATTR) &&
700
8.43k
                (cur[1] == '{') && (end = xmlStrchr(cur, '}'))) {
701
1.63k
                chunkSize = (end - cur) + 1;
702
1.63k
                repl = cur;
703
1.63k
                replSize = chunkSize;
704
7.39k
      } else {
705
7.39k
                repl = BAD_CAST "&amp;";
706
7.39k
                replSize = 5;
707
7.39k
            }
708
73.7k
  } else if ((flags & XML_ESCAPE_QUOT) && (c == '"')) {
709
0
            repl = BAD_CAST "&quot;";
710
0
            replSize = 6;
711
73.7k
  } else if (((flags & XML_ESCAPE_HTML) == 0) && (c == '\r')) {
712
0
      repl = BAD_CAST "&#13;";
713
0
            replSize = 5;
714
73.7k
  } else if ((flags & XML_ESCAPE_NON_ASCII) && (c >= 0x80)) {
715
0
            int val;
716
717
0
            chunkSize = 4;
718
0
            val = xmlGetUTF8Char(cur, &chunkSize);
719
0
            if (val < 0) {
720
0
                val = 0xFFFD;
721
0
                chunkSize = 1;
722
0
            } else if (((flags & XML_ESCAPE_ALLOW_INVALID) == 0) &&
723
0
                       (!IS_CHAR(val))) {
724
0
                val = 0xFFFD;
725
0
            }
726
727
0
            replSize = xmlSerializeHexCharRef(buf, val);
728
0
            repl = BAD_CAST buf;
729
73.7k
  } else if ((flags & (XML_ESCAPE_ALLOW_INVALID | XML_ESCAPE_HTML)) ||
730
0
                   (c >= 0x20) ||
731
73.7k
             (c == '\n') || (c == '\t') || (c == '\r')) {
732
      /* default case, just copy */
733
73.7k
            cur += 1;
734
73.7k
            if (*cur != 0)
735
72.9k
                continue;
736
737
746
            chunkSize = 0;
738
746
            repl = BAD_CAST "";
739
746
            replSize = 0;
740
746
  } else {
741
            /* ignore */
742
0
            repl = BAD_CAST "";
743
0
            replSize = 0;
744
0
        }
745
746
130k
        used = out - buffer;
747
130k
        unescapedSize = cur - unescaped;
748
130k
        totalSize = unescapedSize + replSize;
749
750
130k
  cur += chunkSize;
751
752
130k
        if (totalSize > size - used) {
753
9.54k
            xmlChar *tmp;
754
9.54k
            int newSize;
755
756
9.54k
            if ((size > (SIZE_MAX - 1) / 2) ||
757
9.54k
                (totalSize > (SIZE_MAX - 1) / 2 - size)) {
758
0
                xmlFree(buffer);
759
0
                return(NULL);
760
0
            }
761
9.54k
            newSize = size + totalSize;
762
9.54k
            if (*cur != 0)
763
5.16k
                newSize *= 2;
764
9.54k
            tmp = xmlRealloc(buffer, newSize + 1);
765
9.54k
            if (tmp == NULL) {
766
1
                xmlFree(buffer);
767
1
                return(NULL);
768
1
            }
769
9.53k
            buffer = tmp;
770
9.53k
            size = newSize;
771
9.53k
            out = buffer + used;
772
9.53k
        }
773
774
130k
        memcpy(out, unescaped, unescapedSize);
775
130k
        out += unescapedSize;
776
130k
        memcpy(out, repl, replSize);
777
130k
        out += replSize;
778
779
130k
        unescaped = cur;
780
130k
    }
781
782
47.0k
    *out = 0;
783
47.0k
    return(buffer);
784
47.0k
}
785
786
/**
787
 * xmlEncodeEntitiesInternal:
788
 * @doc:  the document containing the string
789
 * @input:  A string to convert to XML.
790
 * @flags:  XML_ESCAPE flags
791
 *
792
 * Do a global encoding of a string, replacing the predefined entities
793
 * and non ASCII values with their entities and CharRef counterparts.
794
 * Contrary to xmlEncodeEntities, this routine is reentrant, and result
795
 * must be deallocated.
796
 *
797
 * Returns A newly allocated string with the substitution done.
798
 */
799
xmlChar *
800
xmlEncodeEntitiesInternal(xmlDocPtr doc, const xmlChar *input,
801
47.1k
                          unsigned flags) {
802
47.1k
    if (input == NULL)
803
0
        return(NULL);
804
805
47.1k
    if ((doc != NULL) && (doc->type == XML_HTML_DOCUMENT_NODE))
806
47.1k
        flags |= XML_ESCAPE_HTML;
807
0
    else if ((doc == NULL) || (doc->encoding == NULL))
808
0
        flags |= XML_ESCAPE_NON_ASCII;
809
810
47.1k
    return(xmlEscapeText(input, flags));
811
47.1k
}
812
813
/**
814
 * xmlEncodeEntitiesReentrant:
815
 * @doc:  the document containing the string
816
 * @input:  A string to convert to XML.
817
 *
818
 * Do a global encoding of a string, replacing the predefined entities
819
 * and non ASCII values with their entities and CharRef counterparts.
820
 * Contrary to xmlEncodeEntities, this routine is reentrant, and result
821
 * must be deallocated.
822
 *
823
 * This escapes '<', '>', '&' and '\r'. If the document has no encoding,
824
 * non-ASCII codepoints are escaped. There is some special handling for
825
 * HTML documents.
826
 *
827
 * Returns A newly allocated string with the substitution done.
828
 */
829
xmlChar *
830
35.1k
xmlEncodeEntitiesReentrant(xmlDocPtr doc, const xmlChar *input) {
831
35.1k
    return xmlEncodeEntitiesInternal(doc, input, 0);
832
35.1k
}
833
834
/**
835
 * xmlEncodeSpecialChars:
836
 * @doc:  unused
837
 * @input:  A string to convert to XML.
838
 *
839
 * Do a global encoding of a string, replacing the predefined entities
840
 * this routine is reentrant, and result must be deallocated.
841
 *
842
 * This escapes '<', '>', '&', '"' and '\r' chars.
843
 *
844
 * Returns A newly allocated string with the substitution done.
845
 */
846
xmlChar *
847
xmlEncodeSpecialChars(const xmlDoc *doc ATTRIBUTE_UNUSED,
848
0
                      const xmlChar *input) {
849
0
    if (input == NULL)
850
0
        return(NULL);
851
852
0
    return(xmlEscapeText(input, XML_ESCAPE_QUOT | XML_ESCAPE_ALLOW_INVALID));
853
0
}
854
855
/**
856
 * xmlCreateEntitiesTable:
857
 *
858
 * create and initialize an empty entities hash table.
859
 * This really doesn't make sense and should be deprecated
860
 *
861
 * Returns the xmlEntitiesTablePtr just created or NULL in case of error.
862
 */
863
xmlEntitiesTablePtr
864
0
xmlCreateEntitiesTable(void) {
865
0
    return((xmlEntitiesTablePtr) xmlHashCreate(0));
866
0
}
867
868
/**
869
 * xmlFreeEntityWrapper:
870
 * @entity:  An entity
871
 * @name:  its name
872
 *
873
 * Deallocate the memory used by an entities in the hash table.
874
 */
875
static void
876
112k
xmlFreeEntityWrapper(void *entity, const xmlChar *name ATTRIBUTE_UNUSED) {
877
112k
    if (entity != NULL)
878
112k
  xmlFreeEntity((xmlEntityPtr) entity);
879
112k
}
880
881
/**
882
 * xmlFreeEntitiesTable:
883
 * @table:  An entity table
884
 *
885
 * Deallocate the memory used by an entities hash table.
886
 */
887
void
888
64.2k
xmlFreeEntitiesTable(xmlEntitiesTablePtr table) {
889
64.2k
    xmlHashFree(table, xmlFreeEntityWrapper);
890
64.2k
}
891
892
/**
893
 * xmlCopyEntity:
894
 * @ent:  An entity
895
 *
896
 * Build a copy of an entity
897
 *
898
 * Returns the new xmlEntitiesPtr or NULL in case of error.
899
 */
900
static void *
901
20.2k
xmlCopyEntity(void *payload, const xmlChar *name ATTRIBUTE_UNUSED) {
902
20.2k
    xmlEntityPtr ent = (xmlEntityPtr) payload;
903
20.2k
    xmlEntityPtr cur;
904
905
20.2k
    cur = (xmlEntityPtr) xmlMalloc(sizeof(xmlEntity));
906
20.2k
    if (cur == NULL)
907
2
  return(NULL);
908
20.2k
    memset(cur, 0, sizeof(xmlEntity));
909
20.2k
    cur->type = XML_ENTITY_DECL;
910
911
20.2k
    cur->etype = ent->etype;
912
20.2k
    if (ent->name != NULL) {
913
20.2k
  cur->name = xmlStrdup(ent->name);
914
20.2k
        if (cur->name == NULL)
915
3
            goto error;
916
20.2k
    }
917
20.2k
    if (ent->ExternalID != NULL) {
918
0
  cur->ExternalID = xmlStrdup(ent->ExternalID);
919
0
        if (cur->ExternalID == NULL)
920
0
            goto error;
921
0
    }
922
20.2k
    if (ent->SystemID != NULL) {
923
805
  cur->SystemID = xmlStrdup(ent->SystemID);
924
805
        if (cur->SystemID == NULL)
925
1
            goto error;
926
805
    }
927
20.2k
    if (ent->content != NULL) {
928
19.4k
  cur->content = xmlStrdup(ent->content);
929
19.4k
        if (cur->content == NULL)
930
3
            goto error;
931
19.4k
    }
932
20.2k
    if (ent->orig != NULL) {
933
19.4k
  cur->orig = xmlStrdup(ent->orig);
934
19.4k
        if (cur->orig == NULL)
935
4
            goto error;
936
19.4k
    }
937
20.2k
    if (ent->URI != NULL) {
938
47
  cur->URI = xmlStrdup(ent->URI);
939
47
        if (cur->URI == NULL)
940
1
            goto error;
941
47
    }
942
20.2k
    return(cur);
943
944
12
error:
945
12
    xmlFreeEntity(cur);
946
12
    return(NULL);
947
20.2k
}
948
949
/**
950
 * xmlCopyEntitiesTable:
951
 * @table:  An entity table
952
 *
953
 * Build a copy of an entity table.
954
 *
955
 * Returns the new xmlEntitiesTablePtr or NULL in case of error.
956
 */
957
xmlEntitiesTablePtr
958
7.51k
xmlCopyEntitiesTable(xmlEntitiesTablePtr table) {
959
7.51k
    return(xmlHashCopySafe(table, xmlCopyEntity, xmlFreeEntityWrapper));
960
7.51k
}
961
962
#ifdef LIBXML_OUTPUT_ENABLED
963
964
/**
965
 * xmlDumpEntityDecl:
966
 * @buf:  An XML buffer.
967
 * @ent:  An entity table
968
 *
969
 * This will dump the content of the entity table as an XML DTD definition
970
 */
971
void
972
0
xmlDumpEntityDecl(xmlBufferPtr buf, xmlEntityPtr ent) {
973
0
    xmlSaveCtxtPtr save;
974
975
0
    if ((buf == NULL) || (ent == NULL))
976
0
        return;
977
978
0
    save = xmlSaveToBuffer(buf, NULL, 0);
979
0
    xmlSaveTree(save, (xmlNodePtr) ent);
980
0
    if (xmlSaveFinish(save) != XML_ERR_OK)
981
0
        xmlFree(xmlBufferDetach(buf));
982
0
}
983
984
/**
985
 * xmlDumpEntityDeclScan:
986
 * @ent:  An entity table
987
 * @buf:  An XML buffer.
988
 *
989
 * When using the hash table scan function, arguments need to be reversed
990
 */
991
static void
992
xmlDumpEntityDeclScan(void *ent, void *save,
993
0
                      const xmlChar *name ATTRIBUTE_UNUSED) {
994
0
    xmlSaveTree(save, ent);
995
0
}
996
997
/**
998
 * xmlDumpEntitiesTable:
999
 * @buf:  An XML buffer.
1000
 * @table:  An entity table
1001
 *
1002
 * This will dump the content of the entity table as an XML DTD definition
1003
 */
1004
void
1005
0
xmlDumpEntitiesTable(xmlBufferPtr buf, xmlEntitiesTablePtr table) {
1006
0
    xmlSaveCtxtPtr save;
1007
1008
0
    if ((buf == NULL) || (table == NULL))
1009
0
        return;
1010
1011
0
    save = xmlSaveToBuffer(buf, NULL, 0);
1012
0
    xmlHashScan(table, xmlDumpEntityDeclScan, save);
1013
0
    if (xmlSaveFinish(save) != XML_ERR_OK)
1014
0
        xmlFree(xmlBufferDetach(buf));
1015
0
}
1016
#endif /* LIBXML_OUTPUT_ENABLED */