Coverage Report

Created: 2025-10-28 06:46

next uncovered line (L), next uncovered region (R), next uncovered branch (B)
/src/libxml2/entities.c
Line
Count
Source
1
/*
2
 * entities.c : implementation for the XML entities handling
3
 *
4
 * See Copyright for the status of this software.
5
 *
6
 * daniel@veillard.com
7
 */
8
9
/* To avoid EBCDIC trouble when parsing on zOS */
10
#if defined(__MVS__)
11
#pragma convert("ISO8859-1")
12
#endif
13
14
#define IN_LIBXML
15
#include "libxml.h"
16
17
#include <string.h>
18
#include <stdlib.h>
19
20
#include <libxml/xmlmemory.h>
21
#include <libxml/hash.h>
22
#include <libxml/entities.h>
23
#include <libxml/parser.h>
24
#include <libxml/parserInternals.h>
25
#include <libxml/xmlerror.h>
26
#include <libxml/dict.h>
27
#include <libxml/xmlsave.h>
28
29
#include "private/entities.h"
30
#include "private/error.h"
31
32
#ifndef SIZE_MAX
33
  #define SIZE_MAX ((size_t) -1)
34
#endif
35
36
/*
37
 * The XML predefined entities.
38
 */
39
40
static xmlEntity xmlEntityLt = {
41
    NULL, XML_ENTITY_DECL, BAD_CAST "lt",
42
    NULL, NULL, NULL, NULL, NULL, NULL,
43
    BAD_CAST "<", BAD_CAST "<", 1,
44
    XML_INTERNAL_PREDEFINED_ENTITY,
45
    NULL, NULL, NULL, NULL, 0, 0, 0
46
};
47
static xmlEntity xmlEntityGt = {
48
    NULL, XML_ENTITY_DECL, BAD_CAST "gt",
49
    NULL, NULL, NULL, NULL, NULL, NULL,
50
    BAD_CAST ">", BAD_CAST ">", 1,
51
    XML_INTERNAL_PREDEFINED_ENTITY,
52
    NULL, NULL, NULL, NULL, 0, 0, 0
53
};
54
static xmlEntity xmlEntityAmp = {
55
    NULL, XML_ENTITY_DECL, BAD_CAST "amp",
56
    NULL, NULL, NULL, NULL, NULL, NULL,
57
    BAD_CAST "&", BAD_CAST "&", 1,
58
    XML_INTERNAL_PREDEFINED_ENTITY,
59
    NULL, NULL, NULL, NULL, 0, 0, 0
60
};
61
static xmlEntity xmlEntityQuot = {
62
    NULL, XML_ENTITY_DECL, BAD_CAST "quot",
63
    NULL, NULL, NULL, NULL, NULL, NULL,
64
    BAD_CAST "\"", BAD_CAST "\"", 1,
65
    XML_INTERNAL_PREDEFINED_ENTITY,
66
    NULL, NULL, NULL, NULL, 0, 0, 0
67
};
68
static xmlEntity xmlEntityApos = {
69
    NULL, XML_ENTITY_DECL, BAD_CAST "apos",
70
    NULL, NULL, NULL, NULL, NULL, NULL,
71
    BAD_CAST "'", BAD_CAST "'", 1,
72
    XML_INTERNAL_PREDEFINED_ENTITY,
73
    NULL, NULL, NULL, NULL, 0, 0, 0
74
};
75
76
/*
77
 * xmlFreeEntity:
78
 * @entity:  an entity
79
 *
80
 * Frees the entity.
81
 */
82
void
83
xmlFreeEntity(xmlEntityPtr entity)
84
100k
{
85
100k
    xmlDictPtr dict = NULL;
86
87
100k
    if (entity == NULL)
88
0
        return;
89
90
100k
    if (entity->doc != NULL)
91
100k
        dict = entity->doc->dict;
92
93
94
100k
    if ((entity->children) &&
95
1.97k
        (entity == (xmlEntityPtr) entity->children->parent))
96
1.97k
        xmlFreeNodeList(entity->children);
97
100k
    if ((entity->name != NULL) &&
98
100k
        ((dict == NULL) || (!xmlDictOwns(dict, entity->name))))
99
13.2k
        xmlFree((char *) entity->name);
100
100k
    if (entity->ExternalID != NULL)
101
9.19k
        xmlFree((char *) entity->ExternalID);
102
100k
    if (entity->SystemID != NULL)
103
49.9k
        xmlFree((char *) entity->SystemID);
104
100k
    if (entity->URI != NULL)
105
47.9k
        xmlFree((char *) entity->URI);
106
100k
    if (entity->content != NULL)
107
48.9k
        xmlFree((char *) entity->content);
108
100k
    if (entity->orig != NULL)
109
46.2k
        xmlFree((char *) entity->orig);
110
100k
    xmlFree(entity);
111
100k
}
112
113
/*
114
 * xmlCreateEntity:
115
 *
116
 * internal routine doing the entity node structures allocations
117
 */
118
static xmlEntityPtr
119
xmlCreateEntity(xmlDocPtr doc, const xmlChar *name, int type,
120
          const xmlChar *ExternalID, const xmlChar *SystemID,
121
100k
          const xmlChar *content) {
122
100k
    xmlEntityPtr ret;
123
124
100k
    ret = (xmlEntityPtr) xmlMalloc(sizeof(xmlEntity));
125
100k
    if (ret == NULL)
126
8
  return(NULL);
127
100k
    memset(ret, 0, sizeof(xmlEntity));
128
100k
    ret->doc = doc;
129
100k
    ret->type = XML_ENTITY_DECL;
130
131
    /*
132
     * fill the structure.
133
     */
134
100k
    ret->etype = (xmlEntityType) type;
135
100k
    if ((doc == NULL) || (doc->dict == NULL))
136
13.2k
  ret->name = xmlStrdup(name);
137
87.1k
    else
138
87.1k
        ret->name = xmlDictLookup(doc->dict, name, -1);
139
100k
    if (ret->name == NULL)
140
3
        goto error;
141
100k
    if (ExternalID != NULL) {
142
9.19k
        ret->ExternalID = xmlStrdup(ExternalID);
143
9.19k
        if (ret->ExternalID == NULL)
144
3
            goto error;
145
9.19k
    }
146
100k
    if (SystemID != NULL) {
147
49.9k
        ret->SystemID = xmlStrdup(SystemID);
148
49.9k
        if (ret->SystemID == NULL)
149
9
            goto error;
150
49.9k
    }
151
100k
    if (content != NULL) {
152
48.5k
        ret->length = xmlStrlen(content);
153
48.5k
  ret->content = xmlStrndup(content, ret->length);
154
48.5k
        if (ret->content == NULL)
155
4
            goto error;
156
51.9k
     } else {
157
51.9k
        ret->length = 0;
158
51.9k
        ret->content = NULL;
159
51.9k
    }
160
100k
    ret->URI = NULL; /* to be computed by the layer knowing
161
      the defining entity */
162
100k
    ret->orig = NULL;
163
164
100k
    return(ret);
165
166
19
error:
167
19
    xmlFreeEntity(ret);
168
19
    return(NULL);
169
100k
}
170
171
/**
172
 * xmlAddEntity:
173
 * @doc:  the document
174
 * @extSubset:  add to the external or internal subset
175
 * @name:  the entity name
176
 * @type:  the entity type XML_xxx_yyy_ENTITY
177
 * @ExternalID:  the entity external ID if available
178
 * @SystemID:  the entity system ID if available
179
 * @content:  the entity content
180
 * @out:  pointer to resulting entity (optional)
181
 *
182
 * Register a new entity for this document.
183
 *
184
 * Available since 2.13.0.
185
 *
186
 * Returns an xmlParserErrors error code.
187
 */
188
int
189
xmlAddEntity(xmlDocPtr doc, int extSubset, const xmlChar *name, int type,
190
    const xmlChar *ExternalID, const xmlChar *SystemID,
191
104k
    const xmlChar *content, xmlEntityPtr *out) {
192
104k
    xmlDtdPtr dtd;
193
104k
    xmlDictPtr dict = NULL;
194
104k
    xmlEntitiesTablePtr table = NULL;
195
104k
    xmlEntityPtr ret, predef;
196
104k
    int res;
197
198
104k
    if (out != NULL)
199
104k
        *out = NULL;
200
104k
    if ((doc == NULL) || (name == NULL))
201
0
  return(XML_ERR_ARGUMENT);
202
104k
    dict = doc->dict;
203
204
104k
    if (extSubset)
205
12.3k
        dtd = doc->extSubset;
206
91.8k
    else
207
91.8k
        dtd = doc->intSubset;
208
104k
    if (dtd == NULL)
209
0
        return(XML_DTD_NO_DTD);
210
211
104k
    switch (type) {
212
30.6k
        case XML_INTERNAL_GENERAL_ENTITY:
213
41.1k
        case XML_EXTERNAL_GENERAL_PARSED_ENTITY:
214
41.3k
        case XML_EXTERNAL_GENERAL_UNPARSED_ENTITY:
215
41.3k
            predef = xmlGetPredefinedEntity(name);
216
41.3k
            if (predef != NULL) {
217
4.81k
                int valid = 0;
218
219
                /* 4.6 Predefined Entities */
220
4.81k
                if ((type == XML_INTERNAL_GENERAL_ENTITY) &&
221
4.44k
                    (content != NULL)) {
222
4.18k
                    int c = predef->content[0];
223
224
4.18k
                    if (((content[0] == c) && (content[1] == 0)) &&
225
774
                        ((c == '>') || (c == '\'') || (c == '"'))) {
226
699
                        valid = 1;
227
3.48k
                    } else if ((content[0] == '&') && (content[1] == '#')) {
228
1.41k
                        if (content[2] == 'x') {
229
224
                            xmlChar *hex = BAD_CAST "0123456789ABCDEF";
230
224
                            xmlChar ref[] = "00;";
231
232
224
                            ref[0] = hex[c / 16 % 16];
233
224
                            ref[1] = hex[c % 16];
234
224
                            if (xmlStrcasecmp(&content[3], ref) == 0)
235
0
                                valid = 1;
236
1.18k
                        } else {
237
1.18k
                            xmlChar ref[] = "00;";
238
239
1.18k
                            ref[0] = '0' + c / 10 % 10;
240
1.18k
                            ref[1] = '0' + c % 10;
241
1.18k
                            if (xmlStrEqual(&content[2], ref))
242
420
                                valid = 1;
243
1.18k
                        }
244
1.41k
                    }
245
4.18k
                }
246
4.81k
                if (!valid)
247
3.69k
                    return(XML_ERR_REDECL_PREDEF_ENTITY);
248
4.81k
            }
249
37.6k
      if (dtd->entities == NULL) {
250
24.2k
    dtd->entities = xmlHashCreateDict(0, dict);
251
24.2k
                if (dtd->entities == NULL)
252
6
                    return(XML_ERR_NO_MEMORY);
253
24.2k
            }
254
37.6k
      table = dtd->entities;
255
37.6k
      break;
256
22.2k
        case XML_INTERNAL_PARAMETER_ENTITY:
257
62.8k
        case XML_EXTERNAL_PARAMETER_ENTITY:
258
62.8k
      if (dtd->pentities == NULL) {
259
30.6k
    dtd->pentities = xmlHashCreateDict(0, dict);
260
30.6k
                if (dtd->pentities == NULL)
261
3
                    return(XML_ERR_NO_MEMORY);
262
30.6k
            }
263
62.8k
      table = dtd->pentities;
264
62.8k
      break;
265
0
        default:
266
0
      return(XML_ERR_ARGUMENT);
267
104k
    }
268
100k
    ret = xmlCreateEntity(dtd->doc, name, type, ExternalID, SystemID, content);
269
100k
    if (ret == NULL)
270
27
        return(XML_ERR_NO_MEMORY);
271
272
100k
    res = xmlHashAdd(table, name, ret);
273
100k
    if (res < 0) {
274
6
        xmlFreeEntity(ret);
275
6
        return(XML_ERR_NO_MEMORY);
276
100k
    } else if (res == 0) {
277
  /*
278
   * entity was already defined at another level.
279
   */
280
2.70k
        xmlFreeEntity(ret);
281
2.70k
  return(XML_WAR_ENTITY_REDEFINED);
282
2.70k
    }
283
284
    /*
285
     * Link it to the DTD
286
     */
287
97.7k
    ret->parent = dtd;
288
97.7k
    ret->doc = dtd->doc;
289
97.7k
    if (dtd->last == NULL) {
290
34.4k
  dtd->children = dtd->last = (xmlNodePtr) ret;
291
63.2k
    } else {
292
63.2k
  dtd->last->next = (xmlNodePtr) ret;
293
63.2k
  ret->prev = dtd->last;
294
63.2k
  dtd->last = (xmlNodePtr) ret;
295
63.2k
    }
296
297
97.7k
    if (out != NULL)
298
97.7k
        *out = ret;
299
97.7k
    return(0);
300
100k
}
301
302
/**
303
 * xmlGetPredefinedEntity:
304
 * @name:  the entity name
305
 *
306
 * Check whether this name is an predefined entity.
307
 *
308
 * Returns NULL if not, otherwise the entity
309
 */
310
xmlEntityPtr
311
2.22M
xmlGetPredefinedEntity(const xmlChar *name) {
312
2.22M
    if (name == NULL) return(NULL);
313
2.22M
    switch (name[0]) {
314
16.4k
        case 'l':
315
16.4k
      if (xmlStrEqual(name, BAD_CAST "lt"))
316
13.7k
          return(&xmlEntityLt);
317
2.61k
      break;
318
24.7k
        case 'g':
319
24.7k
      if (xmlStrEqual(name, BAD_CAST "gt"))
320
22.2k
          return(&xmlEntityGt);
321
2.53k
      break;
322
1.07M
        case 'a':
323
1.07M
      if (xmlStrEqual(name, BAD_CAST "amp"))
324
35.2k
          return(&xmlEntityAmp);
325
1.03M
      if (xmlStrEqual(name, BAD_CAST "apos"))
326
1.22k
          return(&xmlEntityApos);
327
1.03M
      break;
328
1.03M
        case 'q':
329
426k
      if (xmlStrEqual(name, BAD_CAST "quot"))
330
621
          return(&xmlEntityQuot);
331
425k
      break;
332
684k
  default:
333
684k
      break;
334
2.22M
    }
335
2.15M
    return(NULL);
336
2.22M
}
337
338
/**
339
 * xmlAddDtdEntity:
340
 * @doc:  the document
341
 * @name:  the entity name
342
 * @type:  the entity type XML_xxx_yyy_ENTITY
343
 * @ExternalID:  the entity external ID if available
344
 * @SystemID:  the entity system ID if available
345
 * @content:  the entity content
346
 *
347
 * Register a new entity for this document DTD external subset.
348
 *
349
 * Returns a pointer to the entity or NULL in case of error
350
 */
351
xmlEntityPtr
352
xmlAddDtdEntity(xmlDocPtr doc, const xmlChar *name, int type,
353
          const xmlChar *ExternalID, const xmlChar *SystemID,
354
0
    const xmlChar *content) {
355
0
    xmlEntityPtr ret;
356
357
0
    xmlAddEntity(doc, 1, name, type, ExternalID, SystemID, content, &ret);
358
0
    return(ret);
359
0
}
360
361
/**
362
 * xmlAddDocEntity:
363
 * @doc:  the document
364
 * @name:  the entity name
365
 * @type:  the entity type XML_xxx_yyy_ENTITY
366
 * @ExternalID:  the entity external ID if available
367
 * @SystemID:  the entity system ID if available
368
 * @content:  the entity content
369
 *
370
 * Register a new entity for this document.
371
 *
372
 * Returns a pointer to the entity or NULL in case of error
373
 */
374
xmlEntityPtr
375
xmlAddDocEntity(xmlDocPtr doc, const xmlChar *name, int type,
376
          const xmlChar *ExternalID, const xmlChar *SystemID,
377
0
          const xmlChar *content) {
378
0
    xmlEntityPtr ret;
379
380
0
    xmlAddEntity(doc, 0, name, type, ExternalID, SystemID, content, &ret);
381
0
    return(ret);
382
0
}
383
384
/**
385
 * xmlNewEntity:
386
 * @doc:  the document
387
 * @name:  the entity name
388
 * @type:  the entity type XML_xxx_yyy_ENTITY
389
 * @ExternalID:  the entity external ID if available
390
 * @SystemID:  the entity system ID if available
391
 * @content:  the entity content
392
 *
393
 * Create a new entity, this differs from xmlAddDocEntity() that if
394
 * the document is NULL or has no internal subset defined, then an
395
 * unlinked entity structure will be returned, it is then the responsibility
396
 * of the caller to link it to the document later or free it when not needed
397
 * anymore.
398
 *
399
 * Returns a pointer to the entity or NULL in case of error
400
 */
401
xmlEntityPtr
402
xmlNewEntity(xmlDocPtr doc, const xmlChar *name, int type,
403
       const xmlChar *ExternalID, const xmlChar *SystemID,
404
0
       const xmlChar *content) {
405
0
    if ((doc != NULL) && (doc->intSubset != NULL)) {
406
0
  return(xmlAddDocEntity(doc, name, type, ExternalID, SystemID, content));
407
0
    }
408
0
    if (name == NULL)
409
0
        return(NULL);
410
0
    return(xmlCreateEntity(doc, name, type, ExternalID, SystemID, content));
411
0
}
412
413
/**
414
 * xmlGetEntityFromTable:
415
 * @table:  an entity table
416
 * @name:  the entity name
417
 * @parameter:  look for parameter entities
418
 *
419
 * Do an entity lookup in the table.
420
 * returns the corresponding parameter entity, if found.
421
 *
422
 * Returns A pointer to the entity structure or NULL if not found.
423
 */
424
static xmlEntityPtr
425
1.12M
xmlGetEntityFromTable(xmlEntitiesTablePtr table, const xmlChar *name) {
426
1.12M
    return((xmlEntityPtr) xmlHashLookup(table, name));
427
1.12M
}
428
429
/**
430
 * xmlGetParameterEntity:
431
 * @doc:  the document referencing the entity
432
 * @name:  the entity name
433
 *
434
 * Do an entity lookup in the internal and external subsets and
435
 * returns the corresponding parameter entity, if found.
436
 *
437
 * Returns A pointer to the entity structure or NULL if not found.
438
 */
439
xmlEntityPtr
440
101k
xmlGetParameterEntity(xmlDocPtr doc, const xmlChar *name) {
441
101k
    xmlEntitiesTablePtr table;
442
101k
    xmlEntityPtr ret;
443
444
101k
    if (doc == NULL)
445
244
  return(NULL);
446
101k
    if ((doc->intSubset != NULL) && (doc->intSubset->pentities != NULL)) {
447
91.2k
  table = (xmlEntitiesTablePtr) doc->intSubset->pentities;
448
91.2k
  ret = xmlGetEntityFromTable(table, name);
449
91.2k
  if (ret != NULL)
450
62.5k
      return(ret);
451
91.2k
    }
452
39.0k
    if ((doc->extSubset != NULL) && (doc->extSubset->pentities != NULL)) {
453
15.2k
  table = (xmlEntitiesTablePtr) doc->extSubset->pentities;
454
15.2k
  return(xmlGetEntityFromTable(table, name));
455
15.2k
    }
456
23.8k
    return(NULL);
457
39.0k
}
458
459
/**
460
 * xmlGetDtdEntity:
461
 * @doc:  the document referencing the entity
462
 * @name:  the entity name
463
 *
464
 * Do an entity lookup in the DTD entity hash table and
465
 * returns the corresponding entity, if found.
466
 * Note: the first argument is the document node, not the DTD node.
467
 *
468
 * Returns A pointer to the entity structure or NULL if not found.
469
 */
470
xmlEntityPtr
471
0
xmlGetDtdEntity(xmlDocPtr doc, const xmlChar *name) {
472
0
    xmlEntitiesTablePtr table;
473
474
0
    if (doc == NULL)
475
0
  return(NULL);
476
0
    if ((doc->extSubset != NULL) && (doc->extSubset->entities != NULL)) {
477
0
  table = (xmlEntitiesTablePtr) doc->extSubset->entities;
478
0
  return(xmlGetEntityFromTable(table, name));
479
0
    }
480
0
    return(NULL);
481
0
}
482
483
/**
484
 * xmlGetDocEntity:
485
 * @doc:  the document referencing the entity
486
 * @name:  the entity name
487
 *
488
 * Do an entity lookup in the document entity hash table and
489
 * returns the corresponding entity, otherwise a lookup is done
490
 * in the predefined entities too.
491
 *
492
 * Returns A pointer to the entity structure or NULL if not found.
493
 */
494
xmlEntityPtr
495
1.02M
xmlGetDocEntity(const xmlDoc *doc, const xmlChar *name) {
496
1.02M
    xmlEntityPtr cur;
497
1.02M
    xmlEntitiesTablePtr table;
498
499
1.02M
    if (doc != NULL) {
500
1.02M
  if ((doc->intSubset != NULL) && (doc->intSubset->entities != NULL)) {
501
952k
      table = (xmlEntitiesTablePtr) doc->intSubset->entities;
502
952k
      cur = xmlGetEntityFromTable(table, name);
503
952k
      if (cur != NULL)
504
844k
    return(cur);
505
952k
  }
506
182k
  if (doc->standalone != 1) {
507
182k
      if ((doc->extSubset != NULL) &&
508
64.1k
    (doc->extSubset->entities != NULL)) {
509
61.6k
    table = (xmlEntitiesTablePtr) doc->extSubset->entities;
510
61.6k
    cur = xmlGetEntityFromTable(table, name);
511
61.6k
    if (cur != NULL)
512
479
        return(cur);
513
61.6k
      }
514
182k
  }
515
182k
    }
516
182k
    return(xmlGetPredefinedEntity(name));
517
1.02M
}
518
519
/*
520
 * xmlSerializeHexCharRef:
521
 * @buf:  a char buffer
522
 * @val:  a codepoint
523
 *
524
 * Serializes a hex char ref like &#xA0;
525
 *
526
 * Writes at most 9 bytes. Does not include a terminating zero byte.
527
 *
528
 * Returns the number of bytes written.
529
 */
530
int
531
1.89k
xmlSerializeHexCharRef(char *buf, int val) {
532
1.89k
    char *out = buf;
533
1.89k
    int shift = 0, bits;
534
535
1.89k
    *out++ = '&';
536
1.89k
    *out++ = '#';
537
1.89k
    *out++ = 'x';
538
539
1.89k
    bits = val;
540
1.89k
    if (bits & 0xFF0000) {
541
86
        shift = 16;
542
86
        bits &= 0xFF0000;
543
1.81k
    } else if (bits & 0x00FF00) {
544
1.15k
        shift = 8;
545
1.15k
        bits &= 0x00FF00;
546
1.15k
    }
547
1.89k
    if (bits & 0xF0F0F0) {
548
683
        shift += 4;
549
683
    }
550
551
5.22k
    do {
552
5.22k
        int d = (val >> shift) & 0x0F;
553
554
5.22k
        if (d < 10)
555
3.15k
            *out++ = '0' + d;
556
2.07k
        else
557
2.07k
            *out++ = 'A' + (d - 10);
558
559
5.22k
  shift -= 4;
560
5.22k
    } while (shift >= 0);
561
562
1.89k
    *out++ = ';';
563
564
1.89k
    return(out - buf);
565
1.89k
}
566
567
/*
568
 * xmlSerializeDecCharRef:
569
 * @buf:  a char buffer
570
 * @val:  a codepoint
571
 *
572
 * Serializes a decimal char ref like &#38;
573
 *
574
 * Writes at most 10 bytes. Does not include a terminating zero byte.
575
 *
576
 * Returns the number of bytes written.
577
 */
578
int
579
91.1M
xmlSerializeDecCharRef(char *buf, int val) {
580
91.1M
    char *out = buf;
581
91.1M
    int len, i;
582
583
91.1M
    *out++ = '&';
584
91.1M
    *out++ = '#';
585
586
91.1M
    if (val < 100) {
587
2.45k
        len = (val < 10) ? 1 : 2;
588
91.1M
    } else if (val < 10000) {
589
91.1M
        len = (val < 1000) ? 3 : 4;
590
91.1M
    } else if (val < 1000000) {
591
4.18k
        len = (val < 100000) ? 5 : 6;
592
4.18k
    } else {
593
330
        len = 7;
594
330
    }
595
596
373M
    for (i = len - 1; i >= 0; i--) {
597
282M
        out[i] = '0' + val % 10;
598
282M
        val /= 10;
599
282M
    }
600
601
91.1M
    out[len] = ';';
602
603
91.1M
    return(len + 3);
604
91.1M
}
605
606
static const char xmlEscapeSafe[128] = {
607
    0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 0, 0, 0, 0,
608
    0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
609
    1, 1, 0, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1,
610
    1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 0, 1,
611
    1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
612
    1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
613
    1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
614
    1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1
615
};
616
617
/*
618
 * xmlEscapeText:
619
 * @text:  input text
620
 * @flags:  XML_ESCAPE flags
621
 *
622
 * Escapes certain characters with char refs.
623
 *
624
 * XML_ESCAPE_ATTR: for attribute content.
625
 * XML_ESCAPE_NON_ASCII: escape non-ASCII chars.
626
 * XML_ESCAPE_HTML: for HTML content.
627
 * XML_ESCAPE_QUOT: escape double quotes.
628
 * XML_ESCAPE_ALLOW_INVALID: allow invalid characters.
629
 *
630
 * Returns an escaped string or NULL if a memory allocation failed.
631
 */
632
xmlChar *
633
59.8k
xmlEscapeText(const xmlChar *text, int flags) {
634
59.8k
    const xmlChar *cur;
635
59.8k
    xmlChar *buffer;
636
59.8k
    xmlChar *out;
637
59.8k
    const xmlChar *unescaped;
638
59.8k
    size_t size = 50;
639
640
59.8k
    buffer = xmlMalloc(size + 1);
641
59.8k
    if (buffer == NULL)
642
67
        return(NULL);
643
59.7k
    out = buffer;
644
645
59.7k
    cur = text;
646
59.7k
    unescaped = cur;
647
648
323k
    while (*cur != '\0') {
649
264k
        char buf[12];
650
264k
  const xmlChar *end;
651
264k
        const xmlChar *repl;
652
264k
        size_t used;
653
264k
        size_t replSize;
654
264k
        size_t unescapedSize;
655
264k
        size_t totalSize;
656
264k
        int chunkSize = 1;
657
264k
        int c;
658
659
        /* accelerator */
660
111M
  while (1) {
661
111M
            c = *cur;
662
663
111M
            if (c < 0x80) {
664
15.5M
                if (!xmlEscapeSafe[*cur])
665
264k
                    break;
666
95.6M
            } else {
667
95.6M
               if (flags & XML_ESCAPE_NON_ASCII)
668
0
                   break;
669
95.6M
            }
670
110M
            cur += 1;
671
110M
        }
672
673
264k
        if (c == 0) {
674
57.0k
            chunkSize = 0;
675
57.0k
            repl = BAD_CAST "";
676
57.0k
            replSize = 0;
677
207k
        } else if (c == '<') {
678
      /*
679
       * Special handling of server side include in HTML attributes
680
       */
681
38.9k
      if ((flags & XML_ESCAPE_HTML) && (flags & XML_ESCAPE_ATTR) &&
682
37.3k
          (cur[1] == '!') && (cur[2] == '-') && (cur[3] == '-') &&
683
3.66k
          ((end = xmlStrstr(cur, BAD_CAST "-->")) != NULL)) {
684
3.19k
                chunkSize = (end - cur) + 3;
685
3.19k
                repl = cur;
686
3.19k
                replSize = chunkSize;
687
35.7k
      } else {
688
35.7k
                repl = BAD_CAST "&lt;";
689
35.7k
                replSize = 4;
690
35.7k
            }
691
168k
  } else if (c == '>') {
692
55.0k
            repl = BAD_CAST "&gt;";
693
55.0k
            replSize = 4;
694
113k
  } else if (c == '&') {
695
      /*
696
       * Special handling of &{...} construct from HTML 4, see
697
       * http://www.w3.org/TR/html401/appendix/notes.html#h-B.7.1
698
       */
699
14.1k
      if ((flags & XML_ESCAPE_HTML) && (flags & XML_ESCAPE_ATTR) &&
700
12.5k
                (cur[1] == '{') && (end = xmlStrchr(cur, '}'))) {
701
1.59k
                chunkSize = (end - cur) + 1;
702
1.59k
                repl = cur;
703
1.59k
                replSize = chunkSize;
704
12.5k
      } else {
705
12.5k
                repl = BAD_CAST "&amp;";
706
12.5k
                replSize = 5;
707
12.5k
            }
708
98.9k
  } else if ((flags & XML_ESCAPE_QUOT) && (c == '"')) {
709
0
            repl = BAD_CAST "&quot;";
710
0
            replSize = 6;
711
98.9k
  } else if (((flags & XML_ESCAPE_HTML) == 0) && (c == '\r')) {
712
0
      repl = BAD_CAST "&#13;";
713
0
            replSize = 5;
714
98.9k
  } else if ((flags & XML_ESCAPE_NON_ASCII) && (c >= 0x80)) {
715
0
            int val;
716
717
0
            chunkSize = 4;
718
0
            val = xmlGetUTF8Char(cur, &chunkSize);
719
0
            if (val < 0) {
720
0
                val = 0xFFFD;
721
0
                chunkSize = 1;
722
0
            } else if (((flags & XML_ESCAPE_ALLOW_INVALID) == 0) &&
723
0
                       (!IS_CHAR(val))) {
724
0
                val = 0xFFFD;
725
0
            }
726
727
0
            replSize = xmlSerializeHexCharRef(buf, val);
728
0
            repl = BAD_CAST buf;
729
98.9k
  } else if ((flags & (XML_ESCAPE_ALLOW_INVALID | XML_ESCAPE_HTML)) ||
730
0
                   (c >= 0x20) ||
731
98.9k
             (c == '\n') || (c == '\t') || (c == '\r')) {
732
      /* default case, just copy */
733
98.9k
            cur += 1;
734
98.9k
            if (*cur != 0)
735
98.5k
                continue;
736
737
440
            chunkSize = 0;
738
440
            repl = BAD_CAST "";
739
440
            replSize = 0;
740
440
  } else {
741
            /* ignore */
742
0
            repl = BAD_CAST "";
743
0
            replSize = 0;
744
0
        }
745
746
165k
        used = out - buffer;
747
165k
        unescapedSize = cur - unescaped;
748
165k
        totalSize = unescapedSize + replSize;
749
750
165k
  cur += chunkSize;
751
752
165k
        if (totalSize > size - used) {
753
22.4k
            xmlChar *tmp;
754
22.4k
            int newSize;
755
756
22.4k
            if ((size > (SIZE_MAX - 1) / 2) ||
757
22.4k
                (totalSize > (SIZE_MAX - 1) / 2 - size)) {
758
0
                xmlFree(buffer);
759
0
                return(NULL);
760
0
            }
761
22.4k
            newSize = size + totalSize;
762
22.4k
            if (*cur != 0)
763
6.04k
                newSize *= 2;
764
22.4k
            tmp = xmlRealloc(buffer, newSize + 1);
765
22.4k
            if (tmp == NULL) {
766
6
                xmlFree(buffer);
767
6
                return(NULL);
768
6
            }
769
22.4k
            buffer = tmp;
770
22.4k
            size = newSize;
771
22.4k
            out = buffer + used;
772
22.4k
        }
773
774
165k
        memcpy(out, unescaped, unescapedSize);
775
165k
        out += unescapedSize;
776
165k
        memcpy(out, repl, replSize);
777
165k
        out += replSize;
778
779
165k
        unescaped = cur;
780
165k
    }
781
782
59.7k
    *out = 0;
783
59.7k
    return(buffer);
784
59.7k
}
785
786
/**
787
 * xmlEncodeEntitiesInternal:
788
 * @doc:  the document containing the string
789
 * @input:  A string to convert to XML.
790
 * @flags:  XML_ESCAPE flags
791
 *
792
 * Do a global encoding of a string, replacing the predefined entities
793
 * and non ASCII values with their entities and CharRef counterparts.
794
 * Contrary to xmlEncodeEntities, this routine is reentrant, and result
795
 * must be deallocated.
796
 *
797
 * Returns A newly allocated string with the substitution done.
798
 */
799
xmlChar *
800
xmlEncodeEntitiesInternal(xmlDocPtr doc, const xmlChar *input,
801
59.8k
                          unsigned flags) {
802
59.8k
    if (input == NULL)
803
0
        return(NULL);
804
805
59.8k
    if ((doc != NULL) && (doc->type == XML_HTML_DOCUMENT_NODE))
806
59.8k
        flags |= XML_ESCAPE_HTML;
807
0
    else if ((doc == NULL) || (doc->encoding == NULL))
808
0
        flags |= XML_ESCAPE_NON_ASCII;
809
810
59.8k
    return(xmlEscapeText(input, flags));
811
59.8k
}
812
813
/**
814
 * xmlEncodeEntitiesReentrant:
815
 * @doc:  the document containing the string
816
 * @input:  A string to convert to XML.
817
 *
818
 * Do a global encoding of a string, replacing the predefined entities
819
 * and non ASCII values with their entities and CharRef counterparts.
820
 * Contrary to xmlEncodeEntities, this routine is reentrant, and result
821
 * must be deallocated.
822
 *
823
 * This escapes '<', '>', '&' and '\r'. If the document has no encoding,
824
 * non-ASCII codepoints are escaped. There is some special handling for
825
 * HTML documents.
826
 *
827
 * Returns A newly allocated string with the substitution done.
828
 */
829
xmlChar *
830
37.2k
xmlEncodeEntitiesReentrant(xmlDocPtr doc, const xmlChar *input) {
831
37.2k
    return xmlEncodeEntitiesInternal(doc, input, 0);
832
37.2k
}
833
834
/**
835
 * xmlEncodeSpecialChars:
836
 * @doc:  unused
837
 * @input:  A string to convert to XML.
838
 *
839
 * Do a global encoding of a string, replacing the predefined entities
840
 * this routine is reentrant, and result must be deallocated.
841
 *
842
 * This escapes '<', '>', '&', '"' and '\r' chars.
843
 *
844
 * Returns A newly allocated string with the substitution done.
845
 */
846
xmlChar *
847
xmlEncodeSpecialChars(const xmlDoc *doc ATTRIBUTE_UNUSED,
848
0
                      const xmlChar *input) {
849
0
    if (input == NULL)
850
0
        return(NULL);
851
852
0
    return(xmlEscapeText(input, XML_ESCAPE_QUOT | XML_ESCAPE_ALLOW_INVALID));
853
0
}
854
855
/**
856
 * xmlCreateEntitiesTable:
857
 *
858
 * create and initialize an empty entities hash table.
859
 * This really doesn't make sense and should be deprecated
860
 *
861
 * Returns the xmlEntitiesTablePtr just created or NULL in case of error.
862
 */
863
xmlEntitiesTablePtr
864
0
xmlCreateEntitiesTable(void) {
865
0
    return((xmlEntitiesTablePtr) xmlHashCreate(0));
866
0
}
867
868
/**
869
 * xmlFreeEntityWrapper:
870
 * @entity:  An entity
871
 * @name:  its name
872
 *
873
 * Deallocate the memory used by an entities in the hash table.
874
 */
875
static void
876
97.7k
xmlFreeEntityWrapper(void *entity, const xmlChar *name ATTRIBUTE_UNUSED) {
877
97.7k
    if (entity != NULL)
878
97.7k
  xmlFreeEntity((xmlEntityPtr) entity);
879
97.7k
}
880
881
/**
882
 * xmlFreeEntitiesTable:
883
 * @table:  An entity table
884
 *
885
 * Deallocate the memory used by an entities hash table.
886
 */
887
void
888
54.9k
xmlFreeEntitiesTable(xmlEntitiesTablePtr table) {
889
54.9k
    xmlHashFree(table, xmlFreeEntityWrapper);
890
54.9k
}
891
892
/**
893
 * xmlCopyEntity:
894
 * @ent:  An entity
895
 *
896
 * Build a copy of an entity
897
 *
898
 * Returns the new xmlEntitiesPtr or NULL in case of error.
899
 */
900
static void *
901
0
xmlCopyEntity(void *payload, const xmlChar *name ATTRIBUTE_UNUSED) {
902
0
    xmlEntityPtr ent = (xmlEntityPtr) payload;
903
0
    xmlEntityPtr cur;
904
905
0
    cur = (xmlEntityPtr) xmlMalloc(sizeof(xmlEntity));
906
0
    if (cur == NULL)
907
0
  return(NULL);
908
0
    memset(cur, 0, sizeof(xmlEntity));
909
0
    cur->type = XML_ENTITY_DECL;
910
911
0
    cur->etype = ent->etype;
912
0
    if (ent->name != NULL) {
913
0
  cur->name = xmlStrdup(ent->name);
914
0
        if (cur->name == NULL)
915
0
            goto error;
916
0
    }
917
0
    if (ent->ExternalID != NULL) {
918
0
  cur->ExternalID = xmlStrdup(ent->ExternalID);
919
0
        if (cur->ExternalID == NULL)
920
0
            goto error;
921
0
    }
922
0
    if (ent->SystemID != NULL) {
923
0
  cur->SystemID = xmlStrdup(ent->SystemID);
924
0
        if (cur->SystemID == NULL)
925
0
            goto error;
926
0
    }
927
0
    if (ent->content != NULL) {
928
0
  cur->content = xmlStrdup(ent->content);
929
0
        if (cur->content == NULL)
930
0
            goto error;
931
0
    }
932
0
    if (ent->orig != NULL) {
933
0
  cur->orig = xmlStrdup(ent->orig);
934
0
        if (cur->orig == NULL)
935
0
            goto error;
936
0
    }
937
0
    if (ent->URI != NULL) {
938
0
  cur->URI = xmlStrdup(ent->URI);
939
0
        if (cur->URI == NULL)
940
0
            goto error;
941
0
    }
942
0
    return(cur);
943
944
0
error:
945
0
    xmlFreeEntity(cur);
946
0
    return(NULL);
947
0
}
948
949
/**
950
 * xmlCopyEntitiesTable:
951
 * @table:  An entity table
952
 *
953
 * Build a copy of an entity table.
954
 *
955
 * Returns the new xmlEntitiesTablePtr or NULL in case of error.
956
 */
957
xmlEntitiesTablePtr
958
0
xmlCopyEntitiesTable(xmlEntitiesTablePtr table) {
959
0
    return(xmlHashCopySafe(table, xmlCopyEntity, xmlFreeEntityWrapper));
960
0
}
961
962
#ifdef LIBXML_OUTPUT_ENABLED
963
964
/**
965
 * xmlDumpEntityDecl:
966
 * @buf:  An XML buffer.
967
 * @ent:  An entity table
968
 *
969
 * This will dump the content of the entity table as an XML DTD definition
970
 */
971
void
972
0
xmlDumpEntityDecl(xmlBufferPtr buf, xmlEntityPtr ent) {
973
0
    xmlSaveCtxtPtr save;
974
975
0
    if ((buf == NULL) || (ent == NULL))
976
0
        return;
977
978
0
    save = xmlSaveToBuffer(buf, NULL, 0);
979
0
    xmlSaveTree(save, (xmlNodePtr) ent);
980
0
    if (xmlSaveFinish(save) != XML_ERR_OK)
981
0
        xmlFree(xmlBufferDetach(buf));
982
0
}
983
984
/**
985
 * xmlDumpEntityDeclScan:
986
 * @ent:  An entity table
987
 * @buf:  An XML buffer.
988
 *
989
 * When using the hash table scan function, arguments need to be reversed
990
 */
991
static void
992
xmlDumpEntityDeclScan(void *ent, void *save,
993
0
                      const xmlChar *name ATTRIBUTE_UNUSED) {
994
0
    xmlSaveTree(save, ent);
995
0
}
996
997
/**
998
 * xmlDumpEntitiesTable:
999
 * @buf:  An XML buffer.
1000
 * @table:  An entity table
1001
 *
1002
 * This will dump the content of the entity table as an XML DTD definition
1003
 */
1004
void
1005
0
xmlDumpEntitiesTable(xmlBufferPtr buf, xmlEntitiesTablePtr table) {
1006
0
    xmlSaveCtxtPtr save;
1007
1008
0
    if ((buf == NULL) || (table == NULL))
1009
0
        return;
1010
1011
0
    save = xmlSaveToBuffer(buf, NULL, 0);
1012
0
    xmlHashScan(table, xmlDumpEntityDeclScan, save);
1013
0
    if (xmlSaveFinish(save) != XML_ERR_OK)
1014
0
        xmlFree(xmlBufferDetach(buf));
1015
0
}
1016
#endif /* LIBXML_OUTPUT_ENABLED */