Coverage Report

Created: 2025-07-18 06:31

/src/libxml2/entities.c
Line
Count
Source (jump to first uncovered line)
1
/*
2
 * entities.c : implementation for the XML entities handling
3
 *
4
 * See Copyright for the status of this software.
5
 *
6
 * daniel@veillard.com
7
 */
8
9
/* To avoid EBCDIC trouble when parsing on zOS */
10
#if defined(__MVS__)
11
#pragma convert("ISO8859-1")
12
#endif
13
14
#define IN_LIBXML
15
#include "libxml.h"
16
17
#include <string.h>
18
#include <stdlib.h>
19
20
#include <libxml/xmlmemory.h>
21
#include <libxml/hash.h>
22
#include <libxml/entities.h>
23
#include <libxml/parser.h>
24
#include <libxml/parserInternals.h>
25
#include <libxml/xmlerror.h>
26
#include <libxml/dict.h>
27
#include <libxml/xmlsave.h>
28
29
#include "private/entities.h"
30
#include "private/error.h"
31
32
#ifndef SIZE_MAX
33
  #define SIZE_MAX ((size_t) -1)
34
#endif
35
36
/*
37
 * The XML predefined entities.
38
 */
39
40
static xmlEntity xmlEntityLt = {
41
    NULL, XML_ENTITY_DECL, BAD_CAST "lt",
42
    NULL, NULL, NULL, NULL, NULL, NULL,
43
    BAD_CAST "<", BAD_CAST "<", 1,
44
    XML_INTERNAL_PREDEFINED_ENTITY,
45
    NULL, NULL, NULL, NULL, 0, 0, 0
46
};
47
static xmlEntity xmlEntityGt = {
48
    NULL, XML_ENTITY_DECL, BAD_CAST "gt",
49
    NULL, NULL, NULL, NULL, NULL, NULL,
50
    BAD_CAST ">", BAD_CAST ">", 1,
51
    XML_INTERNAL_PREDEFINED_ENTITY,
52
    NULL, NULL, NULL, NULL, 0, 0, 0
53
};
54
static xmlEntity xmlEntityAmp = {
55
    NULL, XML_ENTITY_DECL, BAD_CAST "amp",
56
    NULL, NULL, NULL, NULL, NULL, NULL,
57
    BAD_CAST "&", BAD_CAST "&", 1,
58
    XML_INTERNAL_PREDEFINED_ENTITY,
59
    NULL, NULL, NULL, NULL, 0, 0, 0
60
};
61
static xmlEntity xmlEntityQuot = {
62
    NULL, XML_ENTITY_DECL, BAD_CAST "quot",
63
    NULL, NULL, NULL, NULL, NULL, NULL,
64
    BAD_CAST "\"", BAD_CAST "\"", 1,
65
    XML_INTERNAL_PREDEFINED_ENTITY,
66
    NULL, NULL, NULL, NULL, 0, 0, 0
67
};
68
static xmlEntity xmlEntityApos = {
69
    NULL, XML_ENTITY_DECL, BAD_CAST "apos",
70
    NULL, NULL, NULL, NULL, NULL, NULL,
71
    BAD_CAST "'", BAD_CAST "'", 1,
72
    XML_INTERNAL_PREDEFINED_ENTITY,
73
    NULL, NULL, NULL, NULL, 0, 0, 0
74
};
75
76
/*
77
 * xmlFreeEntity:
78
 * @entity:  an entity
79
 *
80
 * Frees the entity.
81
 */
82
void
83
xmlFreeEntity(xmlEntityPtr entity)
84
145k
{
85
145k
    xmlDictPtr dict = NULL;
86
87
145k
    if (entity == NULL)
88
0
        return;
89
90
145k
    if (entity->doc != NULL)
91
145k
        dict = entity->doc->dict;
92
93
94
145k
    if ((entity->children) &&
95
145k
        (entity == (xmlEntityPtr) entity->children->parent))
96
2.48k
        xmlFreeNodeList(entity->children);
97
145k
    if ((entity->name != NULL) &&
98
145k
        ((dict == NULL) || (!xmlDictOwns(dict, entity->name))))
99
20.4k
        xmlFree((char *) entity->name);
100
145k
    if (entity->ExternalID != NULL)
101
14.2k
        xmlFree((char *) entity->ExternalID);
102
145k
    if (entity->SystemID != NULL)
103
57.1k
        xmlFree((char *) entity->SystemID);
104
145k
    if (entity->URI != NULL)
105
54.4k
        xmlFree((char *) entity->URI);
106
145k
    if (entity->content != NULL)
107
86.7k
        xmlFree((char *) entity->content);
108
145k
    if (entity->orig != NULL)
109
67.0k
        xmlFree((char *) entity->orig);
110
145k
    xmlFree(entity);
111
145k
}
112
113
/*
114
 * xmlCreateEntity:
115
 *
116
 * internal routine doing the entity node structures allocations
117
 */
118
static xmlEntityPtr
119
xmlCreateEntity(xmlDocPtr doc, const xmlChar *name, int type,
120
          const xmlChar *ExternalID, const xmlChar *SystemID,
121
145k
          const xmlChar *content) {
122
145k
    xmlEntityPtr ret;
123
124
145k
    ret = (xmlEntityPtr) xmlMalloc(sizeof(xmlEntity));
125
145k
    if (ret == NULL)
126
11
  return(NULL);
127
145k
    memset(ret, 0, sizeof(xmlEntity));
128
145k
    ret->doc = doc;
129
145k
    ret->type = XML_ENTITY_DECL;
130
131
    /*
132
     * fill the structure.
133
     */
134
145k
    ret->etype = (xmlEntityType) type;
135
145k
    if ((doc == NULL) || (doc->dict == NULL))
136
20.4k
  ret->name = xmlStrdup(name);
137
125k
    else
138
125k
        ret->name = xmlDictLookup(doc->dict, name, -1);
139
145k
    if (ret->name == NULL)
140
1
        goto error;
141
145k
    if (ExternalID != NULL) {
142
14.2k
        ret->ExternalID = xmlStrdup(ExternalID);
143
14.2k
        if (ret->ExternalID == NULL)
144
1
            goto error;
145
14.2k
    }
146
145k
    if (SystemID != NULL) {
147
57.1k
        ret->SystemID = xmlStrdup(SystemID);
148
57.1k
        if (ret->SystemID == NULL)
149
6
            goto error;
150
57.1k
    }
151
145k
    if (content != NULL) {
152
86.4k
        ret->length = xmlStrlen(content);
153
86.4k
  ret->content = xmlStrndup(content, ret->length);
154
86.4k
        if (ret->content == NULL)
155
2
            goto error;
156
86.4k
     } else {
157
59.3k
        ret->length = 0;
158
59.3k
        ret->content = NULL;
159
59.3k
    }
160
145k
    ret->URI = NULL; /* to be computed by the layer knowing
161
      the defining entity */
162
145k
    ret->orig = NULL;
163
164
145k
    return(ret);
165
166
10
error:
167
10
    xmlFreeEntity(ret);
168
10
    return(NULL);
169
145k
}
170
171
/**
172
 * xmlAddEntity:
173
 * @doc:  the document
174
 * @extSubset:  add to the external or internal subset
175
 * @name:  the entity name
176
 * @type:  the entity type XML_xxx_yyy_ENTITY
177
 * @ExternalID:  the entity external ID if available
178
 * @SystemID:  the entity system ID if available
179
 * @content:  the entity content
180
 * @out:  pointer to resulting entity (optional)
181
 *
182
 * Register a new entity for this document.
183
 *
184
 * Available since 2.13.0.
185
 *
186
 * Returns an xmlParserErrors error code.
187
 */
188
int
189
xmlAddEntity(xmlDocPtr doc, int extSubset, const xmlChar *name, int type,
190
    const xmlChar *ExternalID, const xmlChar *SystemID,
191
157k
    const xmlChar *content, xmlEntityPtr *out) {
192
157k
    xmlDtdPtr dtd;
193
157k
    xmlDictPtr dict = NULL;
194
157k
    xmlEntitiesTablePtr table = NULL;
195
157k
    xmlEntityPtr ret, predef;
196
157k
    int res;
197
198
157k
    if (out != NULL)
199
157k
        *out = NULL;
200
157k
    if ((doc == NULL) || (name == NULL))
201
0
  return(XML_ERR_ARGUMENT);
202
157k
    dict = doc->dict;
203
204
157k
    if (extSubset)
205
9.70k
        dtd = doc->extSubset;
206
147k
    else
207
147k
        dtd = doc->intSubset;
208
157k
    if (dtd == NULL)
209
0
        return(XML_DTD_NO_DTD);
210
211
157k
    switch (type) {
212
61.0k
        case XML_INTERNAL_GENERAL_ENTITY:
213
77.4k
        case XML_EXTERNAL_GENERAL_PARSED_ENTITY:
214
77.7k
        case XML_EXTERNAL_GENERAL_UNPARSED_ENTITY:
215
77.7k
            predef = xmlGetPredefinedEntity(name);
216
77.7k
            if (predef != NULL) {
217
18.6k
                int valid = 0;
218
219
                /* 4.6 Predefined Entities */
220
18.6k
                if ((type == XML_INTERNAL_GENERAL_ENTITY) &&
221
18.6k
                    (content != NULL)) {
222
17.3k
                    int c = predef->content[0];
223
224
17.3k
                    if (((content[0] == c) && (content[1] == 0)) &&
225
17.3k
                        ((c == '>') || (c == '\'') || (c == '"'))) {
226
4.98k
                        valid = 1;
227
12.3k
                    } else if ((content[0] == '&') && (content[1] == '#')) {
228
5.70k
                        if (content[2] == 'x') {
229
4.78k
                            xmlChar *hex = BAD_CAST "0123456789ABCDEF";
230
4.78k
                            xmlChar ref[] = "00;";
231
232
4.78k
                            ref[0] = hex[c / 16 % 16];
233
4.78k
                            ref[1] = hex[c % 16];
234
4.78k
                            if (xmlStrcasecmp(&content[3], ref) == 0)
235
1.85k
                                valid = 1;
236
4.78k
                        } else {
237
914
                            xmlChar ref[] = "00;";
238
239
914
                            ref[0] = '0' + c / 10 % 10;
240
914
                            ref[1] = '0' + c % 10;
241
914
                            if (xmlStrEqual(&content[2], ref))
242
306
                                valid = 1;
243
914
                        }
244
5.70k
                    }
245
17.3k
                }
246
18.6k
                if (!valid)
247
11.5k
                    return(XML_ERR_REDECL_PREDEF_ENTITY);
248
18.6k
            }
249
66.2k
      if (dtd->entities == NULL) {
250
35.1k
    dtd->entities = xmlHashCreateDict(0, dict);
251
35.1k
                if (dtd->entities == NULL)
252
2
                    return(XML_ERR_NO_MEMORY);
253
35.1k
            }
254
66.2k
      table = dtd->entities;
255
66.2k
      break;
256
36.6k
        case XML_INTERNAL_PARAMETER_ENTITY:
257
79.5k
        case XML_EXTERNAL_PARAMETER_ENTITY:
258
79.5k
      if (dtd->pentities == NULL) {
259
35.1k
    dtd->pentities = xmlHashCreateDict(0, dict);
260
35.1k
                if (dtd->pentities == NULL)
261
1
                    return(XML_ERR_NO_MEMORY);
262
35.1k
            }
263
79.5k
      table = dtd->pentities;
264
79.5k
      break;
265
0
        default:
266
0
      return(XML_ERR_ARGUMENT);
267
157k
    }
268
145k
    ret = xmlCreateEntity(dtd->doc, name, type, ExternalID, SystemID, content);
269
145k
    if (ret == NULL)
270
21
        return(XML_ERR_NO_MEMORY);
271
272
145k
    res = xmlHashAdd(table, name, ret);
273
145k
    if (res < 0) {
274
6
        xmlFreeEntity(ret);
275
6
        return(XML_ERR_NO_MEMORY);
276
145k
    } else if (res == 0) {
277
  /*
278
   * entity was already defined at another level.
279
   */
280
19.6k
        xmlFreeEntity(ret);
281
19.6k
  return(XML_WAR_ENTITY_REDEFINED);
282
19.6k
    }
283
284
    /*
285
     * Link it to the DTD
286
     */
287
126k
    ret->parent = dtd;
288
126k
    ret->doc = dtd->doc;
289
126k
    if (dtd->last == NULL) {
290
50.3k
  dtd->children = dtd->last = (xmlNodePtr) ret;
291
75.7k
    } else {
292
75.7k
  dtd->last->next = (xmlNodePtr) ret;
293
75.7k
  ret->prev = dtd->last;
294
75.7k
  dtd->last = (xmlNodePtr) ret;
295
75.7k
    }
296
297
126k
    if (out != NULL)
298
126k
        *out = ret;
299
126k
    return(0);
300
145k
}
301
302
/**
303
 * xmlGetPredefinedEntity:
304
 * @name:  the entity name
305
 *
306
 * Check whether this name is an predefined entity.
307
 *
308
 * Returns NULL if not, otherwise the entity
309
 */
310
xmlEntityPtr
311
3.50M
xmlGetPredefinedEntity(const xmlChar *name) {
312
3.50M
    if (name == NULL) return(NULL);
313
3.50M
    switch (name[0]) {
314
24.7k
        case 'l':
315
24.7k
      if (xmlStrEqual(name, BAD_CAST "lt"))
316
18.3k
          return(&xmlEntityLt);
317
6.39k
      break;
318
68.1k
        case 'g':
319
68.1k
      if (xmlStrEqual(name, BAD_CAST "gt"))
320
62.9k
          return(&xmlEntityGt);
321
5.24k
      break;
322
689k
        case 'a':
323
689k
      if (xmlStrEqual(name, BAD_CAST "amp"))
324
78.8k
          return(&xmlEntityAmp);
325
610k
      if (xmlStrEqual(name, BAD_CAST "apos"))
326
4.19k
          return(&xmlEntityApos);
327
606k
      break;
328
1.49M
        case 'q':
329
1.49M
      if (xmlStrEqual(name, BAD_CAST "quot"))
330
6.30k
          return(&xmlEntityQuot);
331
1.48M
      break;
332
1.48M
  default:
333
1.23M
      break;
334
3.50M
    }
335
3.33M
    return(NULL);
336
3.50M
}
337
338
/**
339
 * xmlAddDtdEntity:
340
 * @doc:  the document
341
 * @name:  the entity name
342
 * @type:  the entity type XML_xxx_yyy_ENTITY
343
 * @ExternalID:  the entity external ID if available
344
 * @SystemID:  the entity system ID if available
345
 * @content:  the entity content
346
 *
347
 * Register a new entity for this document DTD external subset.
348
 *
349
 * Returns a pointer to the entity or NULL in case of error
350
 */
351
xmlEntityPtr
352
xmlAddDtdEntity(xmlDocPtr doc, const xmlChar *name, int type,
353
          const xmlChar *ExternalID, const xmlChar *SystemID,
354
0
    const xmlChar *content) {
355
0
    xmlEntityPtr ret;
356
357
0
    xmlAddEntity(doc, 1, name, type, ExternalID, SystemID, content, &ret);
358
0
    return(ret);
359
0
}
360
361
/**
362
 * xmlAddDocEntity:
363
 * @doc:  the document
364
 * @name:  the entity name
365
 * @type:  the entity type XML_xxx_yyy_ENTITY
366
 * @ExternalID:  the entity external ID if available
367
 * @SystemID:  the entity system ID if available
368
 * @content:  the entity content
369
 *
370
 * Register a new entity for this document.
371
 *
372
 * Returns a pointer to the entity or NULL in case of error
373
 */
374
xmlEntityPtr
375
xmlAddDocEntity(xmlDocPtr doc, const xmlChar *name, int type,
376
          const xmlChar *ExternalID, const xmlChar *SystemID,
377
0
          const xmlChar *content) {
378
0
    xmlEntityPtr ret;
379
380
0
    xmlAddEntity(doc, 0, name, type, ExternalID, SystemID, content, &ret);
381
0
    return(ret);
382
0
}
383
384
/**
385
 * xmlNewEntity:
386
 * @doc:  the document
387
 * @name:  the entity name
388
 * @type:  the entity type XML_xxx_yyy_ENTITY
389
 * @ExternalID:  the entity external ID if available
390
 * @SystemID:  the entity system ID if available
391
 * @content:  the entity content
392
 *
393
 * Create a new entity, this differs from xmlAddDocEntity() that if
394
 * the document is NULL or has no internal subset defined, then an
395
 * unlinked entity structure will be returned, it is then the responsibility
396
 * of the caller to link it to the document later or free it when not needed
397
 * anymore.
398
 *
399
 * Returns a pointer to the entity or NULL in case of error
400
 */
401
xmlEntityPtr
402
xmlNewEntity(xmlDocPtr doc, const xmlChar *name, int type,
403
       const xmlChar *ExternalID, const xmlChar *SystemID,
404
0
       const xmlChar *content) {
405
0
    if ((doc != NULL) && (doc->intSubset != NULL)) {
406
0
  return(xmlAddDocEntity(doc, name, type, ExternalID, SystemID, content));
407
0
    }
408
0
    if (name == NULL)
409
0
        return(NULL);
410
0
    return(xmlCreateEntity(doc, name, type, ExternalID, SystemID, content));
411
0
}
412
413
/**
414
 * xmlGetEntityFromTable:
415
 * @table:  an entity table
416
 * @name:  the entity name
417
 * @parameter:  look for parameter entities
418
 *
419
 * Do an entity lookup in the table.
420
 * returns the corresponding parameter entity, if found.
421
 *
422
 * Returns A pointer to the entity structure or NULL if not found.
423
 */
424
static xmlEntityPtr
425
1.87M
xmlGetEntityFromTable(xmlEntitiesTablePtr table, const xmlChar *name) {
426
1.87M
    return((xmlEntityPtr) xmlHashLookup(table, name));
427
1.87M
}
428
429
/**
430
 * xmlGetParameterEntity:
431
 * @doc:  the document referencing the entity
432
 * @name:  the entity name
433
 *
434
 * Do an entity lookup in the internal and external subsets and
435
 * returns the corresponding parameter entity, if found.
436
 *
437
 * Returns A pointer to the entity structure or NULL if not found.
438
 */
439
xmlEntityPtr
440
141k
xmlGetParameterEntity(xmlDocPtr doc, const xmlChar *name) {
441
141k
    xmlEntitiesTablePtr table;
442
141k
    xmlEntityPtr ret;
443
444
141k
    if (doc == NULL)
445
906
  return(NULL);
446
141k
    if ((doc->intSubset != NULL) && (doc->intSubset->pentities != NULL)) {
447
138k
  table = (xmlEntitiesTablePtr) doc->intSubset->pentities;
448
138k
  ret = xmlGetEntityFromTable(table, name);
449
138k
  if (ret != NULL)
450
91.4k
      return(ret);
451
138k
    }
452
49.6k
    if ((doc->extSubset != NULL) && (doc->extSubset->pentities != NULL)) {
453
11.7k
  table = (xmlEntitiesTablePtr) doc->extSubset->pentities;
454
11.7k
  return(xmlGetEntityFromTable(table, name));
455
11.7k
    }
456
37.9k
    return(NULL);
457
49.6k
}
458
459
/**
460
 * xmlGetDtdEntity:
461
 * @doc:  the document referencing the entity
462
 * @name:  the entity name
463
 *
464
 * Do an entity lookup in the DTD entity hash table and
465
 * returns the corresponding entity, if found.
466
 * Note: the first argument is the document node, not the DTD node.
467
 *
468
 * Returns A pointer to the entity structure or NULL if not found.
469
 */
470
xmlEntityPtr
471
0
xmlGetDtdEntity(xmlDocPtr doc, const xmlChar *name) {
472
0
    xmlEntitiesTablePtr table;
473
474
0
    if (doc == NULL)
475
0
  return(NULL);
476
0
    if ((doc->extSubset != NULL) && (doc->extSubset->entities != NULL)) {
477
0
  table = (xmlEntitiesTablePtr) doc->extSubset->entities;
478
0
  return(xmlGetEntityFromTable(table, name));
479
0
    }
480
0
    return(NULL);
481
0
}
482
483
/**
484
 * xmlGetDocEntity:
485
 * @doc:  the document referencing the entity
486
 * @name:  the entity name
487
 *
488
 * Do an entity lookup in the document entity hash table and
489
 * returns the corresponding entity, otherwise a lookup is done
490
 * in the predefined entities too.
491
 *
492
 * Returns A pointer to the entity structure or NULL if not found.
493
 */
494
xmlEntityPtr
495
1.59M
xmlGetDocEntity(const xmlDoc *doc, const xmlChar *name) {
496
1.59M
    xmlEntityPtr cur;
497
1.59M
    xmlEntitiesTablePtr table;
498
499
1.59M
    if (doc != NULL) {
500
1.59M
  if ((doc->intSubset != NULL) && (doc->intSubset->entities != NULL)) {
501
1.49M
      table = (xmlEntitiesTablePtr) doc->intSubset->entities;
502
1.49M
      cur = xmlGetEntityFromTable(table, name);
503
1.49M
      if (cur != NULL)
504
1.14M
    return(cur);
505
1.49M
  }
506
447k
  if (doc->standalone != 1) {
507
447k
      if ((doc->extSubset != NULL) &&
508
447k
    (doc->extSubset->entities != NULL)) {
509
222k
    table = (xmlEntitiesTablePtr) doc->extSubset->entities;
510
222k
    cur = xmlGetEntityFromTable(table, name);
511
222k
    if (cur != NULL)
512
300
        return(cur);
513
222k
      }
514
447k
  }
515
447k
    }
516
449k
    return(xmlGetPredefinedEntity(name));
517
1.59M
}
518
519
/*
520
 * xmlSerializeHexCharRef:
521
 * @buf:  a char buffer
522
 * @val:  a codepoint
523
 *
524
 * Serializes a hex char ref like &#xA0;
525
 *
526
 * Writes at most 9 bytes. Does not include a terminating zero byte.
527
 *
528
 * Returns the number of bytes written.
529
 */
530
int
531
1.90k
xmlSerializeHexCharRef(char *buf, int val) {
532
1.90k
    char *out = buf;
533
1.90k
    int shift = 0, bits;
534
535
1.90k
    *out++ = '&';
536
1.90k
    *out++ = '#';
537
1.90k
    *out++ = 'x';
538
539
1.90k
    bits = val;
540
1.90k
    if (bits & 0xFF0000) {
541
267
        shift = 16;
542
267
        bits &= 0xFF0000;
543
1.63k
    } else if (bits & 0x00FF00) {
544
599
        shift = 8;
545
599
        bits &= 0x00FF00;
546
599
    }
547
1.90k
    if (bits & 0xF0F0F0) {
548
1.04k
        shift += 4;
549
1.04k
    }
550
551
5.21k
    do {
552
5.21k
        int d = (val >> shift) & 0x0F;
553
554
5.21k
        if (d < 10)
555
3.07k
            *out++ = '0' + d;
556
2.14k
        else
557
2.14k
            *out++ = 'A' + (d - 10);
558
559
5.21k
  shift -= 4;
560
5.21k
    } while (shift >= 0);
561
562
1.90k
    *out++ = ';';
563
564
1.90k
    return(out - buf);
565
1.90k
}
566
567
/*
568
 * xmlSerializeDecCharRef:
569
 * @buf:  a char buffer
570
 * @val:  a codepoint
571
 *
572
 * Serializes a decimal char ref like &#38;
573
 *
574
 * Writes at most 10 bytes. Does not include a terminating zero byte.
575
 *
576
 * Returns the number of bytes written.
577
 */
578
int
579
47.9M
xmlSerializeDecCharRef(char *buf, int val) {
580
47.9M
    char *out = buf;
581
47.9M
    int len, i;
582
583
47.9M
    *out++ = '&';
584
47.9M
    *out++ = '#';
585
586
47.9M
    if (val < 100) {
587
110
        len = (val < 10) ? 1 : 2;
588
47.9M
    } else if (val < 10000) {
589
47.9M
        len = (val < 1000) ? 3 : 4;
590
47.9M
    } else if (val < 1000000) {
591
12.1k
        len = (val < 100000) ? 5 : 6;
592
12.1k
    } else {
593
99
        len = 7;
594
99
    }
595
596
191M
    for (i = len - 1; i >= 0; i--) {
597
143M
        out[i] = '0' + val % 10;
598
143M
        val /= 10;
599
143M
    }
600
601
47.9M
    out[len] = ';';
602
603
47.9M
    return(len + 3);
604
47.9M
}
605
606
static const char xmlEscapeSafe[128] = {
607
    0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 0, 0, 0, 0,
608
    0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
609
    1, 1, 0, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1,
610
    1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 0, 1,
611
    1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
612
    1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
613
    1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
614
    1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1
615
};
616
617
/*
618
 * xmlEscapeText:
619
 * @text:  input text
620
 * @flags:  XML_ESCAPE flags
621
 *
622
 * Escapes certain characters with char refs.
623
 *
624
 * XML_ESCAPE_ATTR: for attribute content.
625
 * XML_ESCAPE_NON_ASCII: escape non-ASCII chars.
626
 * XML_ESCAPE_HTML: for HTML content.
627
 * XML_ESCAPE_QUOT: escape double quotes.
628
 * XML_ESCAPE_ALLOW_INVALID: allow invalid characters.
629
 *
630
 * Returns an escaped string or NULL if a memory allocation failed.
631
 */
632
xmlChar *
633
65.5k
xmlEscapeText(const xmlChar *text, int flags) {
634
65.5k
    const xmlChar *cur;
635
65.5k
    xmlChar *buffer;
636
65.5k
    xmlChar *out;
637
65.5k
    const xmlChar *unescaped;
638
65.5k
    size_t size = 50;
639
640
65.5k
    buffer = xmlMalloc(size + 1);
641
65.5k
    if (buffer == NULL)
642
33
        return(NULL);
643
65.5k
    out = buffer;
644
645
65.5k
    cur = text;
646
65.5k
    unescaped = cur;
647
648
191k
    while (*cur != '\0') {
649
125k
        char buf[12];
650
125k
  const xmlChar *end;
651
125k
        const xmlChar *repl;
652
125k
        size_t used;
653
125k
        size_t replSize;
654
125k
        size_t unescapedSize;
655
125k
        size_t totalSize;
656
125k
        int chunkSize = 1;
657
125k
        int c;
658
659
        /* accelerator */
660
126M
  while (1) {
661
126M
            c = *cur;
662
663
126M
            if (c < 0x80) {
664
20.9M
                if (!xmlEscapeSafe[*cur])
665
125k
                    break;
666
105M
            } else {
667
105M
               if (flags & XML_ESCAPE_NON_ASCII)
668
0
                   break;
669
105M
            }
670
126M
            cur += 1;
671
126M
        }
672
673
125k
        if (c == 0) {
674
63.5k
            chunkSize = 0;
675
63.5k
            repl = BAD_CAST "";
676
63.5k
            replSize = 0;
677
63.5k
        } else if (c == '<') {
678
      /*
679
       * Special handling of server side include in HTML attributes
680
       */
681
8.94k
      if ((flags & XML_ESCAPE_HTML) && (flags & XML_ESCAPE_ATTR) &&
682
8.94k
          (cur[1] == '!') && (cur[2] == '-') && (cur[3] == '-') &&
683
8.94k
          ((end = xmlStrstr(cur, BAD_CAST "-->")) != NULL)) {
684
456
                chunkSize = (end - cur) + 3;
685
456
                repl = cur;
686
456
                replSize = chunkSize;
687
8.49k
      } else {
688
8.49k
                repl = BAD_CAST "&lt;";
689
8.49k
                replSize = 4;
690
8.49k
            }
691
52.9k
  } else if (c == '>') {
692
24.0k
            repl = BAD_CAST "&gt;";
693
24.0k
            replSize = 4;
694
28.9k
  } else if (c == '&') {
695
      /*
696
       * Special handling of &{...} construct from HTML 4, see
697
       * http://www.w3.org/TR/html401/appendix/notes.html#h-B.7.1
698
       */
699
7.79k
      if ((flags & XML_ESCAPE_HTML) && (flags & XML_ESCAPE_ATTR) &&
700
7.79k
                (cur[1] == '{') && (end = xmlStrchr(cur, '}'))) {
701
832
                chunkSize = (end - cur) + 1;
702
832
                repl = cur;
703
832
                replSize = chunkSize;
704
6.95k
      } else {
705
6.95k
                repl = BAD_CAST "&amp;";
706
6.95k
                replSize = 5;
707
6.95k
            }
708
21.2k
  } else if ((flags & XML_ESCAPE_QUOT) && (c == '"')) {
709
0
            repl = BAD_CAST "&quot;";
710
0
            replSize = 6;
711
21.2k
  } else if (((flags & XML_ESCAPE_HTML) == 0) && (c == '\r')) {
712
0
      repl = BAD_CAST "&#13;";
713
0
            replSize = 5;
714
21.2k
  } else if ((flags & XML_ESCAPE_NON_ASCII) && (c >= 0x80)) {
715
0
            int val;
716
717
0
            chunkSize = 4;
718
0
            val = xmlGetUTF8Char(cur, &chunkSize);
719
0
            if (val < 0) {
720
0
                val = 0xFFFD;
721
0
                chunkSize = 1;
722
0
            } else if (((flags & XML_ESCAPE_ALLOW_INVALID) == 0) &&
723
0
                       (!IS_CHAR(val))) {
724
0
                val = 0xFFFD;
725
0
            }
726
727
0
            replSize = xmlSerializeHexCharRef(buf, val);
728
0
            repl = BAD_CAST buf;
729
21.2k
  } else if ((flags & (XML_ESCAPE_ALLOW_INVALID | XML_ESCAPE_HTML)) ||
730
21.2k
                   (c >= 0x20) ||
731
21.2k
             (c == '\n') || (c == '\t') || (c == '\r')) {
732
      /* default case, just copy */
733
21.2k
            cur += 1;
734
21.2k
            if (*cur != 0)
735
21.1k
                continue;
736
737
76
            chunkSize = 0;
738
76
            repl = BAD_CAST "";
739
76
            replSize = 0;
740
76
  } else {
741
            /* ignore */
742
0
            repl = BAD_CAST "";
743
0
            replSize = 0;
744
0
        }
745
746
104k
        used = out - buffer;
747
104k
        unescapedSize = cur - unescaped;
748
104k
        totalSize = unescapedSize + replSize;
749
750
104k
  cur += chunkSize;
751
752
104k
        if (totalSize > size - used) {
753
16.5k
            xmlChar *tmp;
754
16.5k
            int newSize;
755
756
16.5k
            if ((size > (SIZE_MAX - 1) / 2) ||
757
16.5k
                (totalSize > (SIZE_MAX - 1) / 2 - size)) {
758
0
                xmlFree(buffer);
759
0
                return(NULL);
760
0
            }
761
16.5k
            newSize = size + totalSize;
762
16.5k
            if (*cur != 0)
763
7.18k
                newSize *= 2;
764
16.5k
            tmp = xmlRealloc(buffer, newSize + 1);
765
16.5k
            if (tmp == NULL) {
766
0
                xmlFree(buffer);
767
0
                return(NULL);
768
0
            }
769
16.5k
            buffer = tmp;
770
16.5k
            size = newSize;
771
16.5k
            out = buffer + used;
772
16.5k
        }
773
774
104k
        memcpy(out, unescaped, unescapedSize);
775
104k
        out += unescapedSize;
776
104k
        memcpy(out, repl, replSize);
777
104k
        out += replSize;
778
779
104k
        unescaped = cur;
780
104k
    }
781
782
65.5k
    *out = 0;
783
65.5k
    return(buffer);
784
65.5k
}
785
786
/**
787
 * xmlEncodeEntitiesInternal:
788
 * @doc:  the document containing the string
789
 * @input:  A string to convert to XML.
790
 * @flags:  XML_ESCAPE flags
791
 *
792
 * Do a global encoding of a string, replacing the predefined entities
793
 * and non ASCII values with their entities and CharRef counterparts.
794
 * Contrary to xmlEncodeEntities, this routine is reentrant, and result
795
 * must be deallocated.
796
 *
797
 * Returns A newly allocated string with the substitution done.
798
 */
799
xmlChar *
800
xmlEncodeEntitiesInternal(xmlDocPtr doc, const xmlChar *input,
801
65.5k
                          unsigned flags) {
802
65.5k
    if (input == NULL)
803
0
        return(NULL);
804
805
65.5k
    if ((doc != NULL) && (doc->type == XML_HTML_DOCUMENT_NODE))
806
65.5k
        flags |= XML_ESCAPE_HTML;
807
0
    else if ((doc == NULL) || (doc->encoding == NULL))
808
0
        flags |= XML_ESCAPE_NON_ASCII;
809
810
65.5k
    return(xmlEscapeText(input, flags));
811
65.5k
}
812
813
/**
814
 * xmlEncodeEntitiesReentrant:
815
 * @doc:  the document containing the string
816
 * @input:  A string to convert to XML.
817
 *
818
 * Do a global encoding of a string, replacing the predefined entities
819
 * and non ASCII values with their entities and CharRef counterparts.
820
 * Contrary to xmlEncodeEntities, this routine is reentrant, and result
821
 * must be deallocated.
822
 *
823
 * This escapes '<', '>', '&' and '\r'. If the document has no encoding,
824
 * non-ASCII codepoints are escaped. There is some special handling for
825
 * HTML documents.
826
 *
827
 * Returns A newly allocated string with the substitution done.
828
 */
829
xmlChar *
830
40.6k
xmlEncodeEntitiesReentrant(xmlDocPtr doc, const xmlChar *input) {
831
40.6k
    return xmlEncodeEntitiesInternal(doc, input, 0);
832
40.6k
}
833
834
/**
835
 * xmlEncodeSpecialChars:
836
 * @doc:  unused
837
 * @input:  A string to convert to XML.
838
 *
839
 * Do a global encoding of a string, replacing the predefined entities
840
 * this routine is reentrant, and result must be deallocated.
841
 *
842
 * This escapes '<', '>', '&', '"' and '\r' chars.
843
 *
844
 * Returns A newly allocated string with the substitution done.
845
 */
846
xmlChar *
847
xmlEncodeSpecialChars(const xmlDoc *doc ATTRIBUTE_UNUSED,
848
0
                      const xmlChar *input) {
849
0
    if (input == NULL)
850
0
        return(NULL);
851
852
0
    return(xmlEscapeText(input, XML_ESCAPE_QUOT | XML_ESCAPE_ALLOW_INVALID));
853
0
}
854
855
/**
856
 * xmlCreateEntitiesTable:
857
 *
858
 * create and initialize an empty entities hash table.
859
 * This really doesn't make sense and should be deprecated
860
 *
861
 * Returns the xmlEntitiesTablePtr just created or NULL in case of error.
862
 */
863
xmlEntitiesTablePtr
864
0
xmlCreateEntitiesTable(void) {
865
0
    return((xmlEntitiesTablePtr) xmlHashCreate(0));
866
0
}
867
868
/**
869
 * xmlFreeEntityWrapper:
870
 * @entity:  An entity
871
 * @name:  its name
872
 *
873
 * Deallocate the memory used by an entities in the hash table.
874
 */
875
static void
876
126k
xmlFreeEntityWrapper(void *entity, const xmlChar *name ATTRIBUTE_UNUSED) {
877
126k
    if (entity != NULL)
878
126k
  xmlFreeEntity((xmlEntityPtr) entity);
879
126k
}
880
881
/**
882
 * xmlFreeEntitiesTable:
883
 * @table:  An entity table
884
 *
885
 * Deallocate the memory used by an entities hash table.
886
 */
887
void
888
70.2k
xmlFreeEntitiesTable(xmlEntitiesTablePtr table) {
889
70.2k
    xmlHashFree(table, xmlFreeEntityWrapper);
890
70.2k
}
891
892
/**
893
 * xmlCopyEntity:
894
 * @ent:  An entity
895
 *
896
 * Build a copy of an entity
897
 *
898
 * Returns the new xmlEntitiesPtr or NULL in case of error.
899
 */
900
static void *
901
0
xmlCopyEntity(void *payload, const xmlChar *name ATTRIBUTE_UNUSED) {
902
0
    xmlEntityPtr ent = (xmlEntityPtr) payload;
903
0
    xmlEntityPtr cur;
904
905
0
    cur = (xmlEntityPtr) xmlMalloc(sizeof(xmlEntity));
906
0
    if (cur == NULL)
907
0
  return(NULL);
908
0
    memset(cur, 0, sizeof(xmlEntity));
909
0
    cur->type = XML_ENTITY_DECL;
910
911
0
    cur->etype = ent->etype;
912
0
    if (ent->name != NULL) {
913
0
  cur->name = xmlStrdup(ent->name);
914
0
        if (cur->name == NULL)
915
0
            goto error;
916
0
    }
917
0
    if (ent->ExternalID != NULL) {
918
0
  cur->ExternalID = xmlStrdup(ent->ExternalID);
919
0
        if (cur->ExternalID == NULL)
920
0
            goto error;
921
0
    }
922
0
    if (ent->SystemID != NULL) {
923
0
  cur->SystemID = xmlStrdup(ent->SystemID);
924
0
        if (cur->SystemID == NULL)
925
0
            goto error;
926
0
    }
927
0
    if (ent->content != NULL) {
928
0
  cur->content = xmlStrdup(ent->content);
929
0
        if (cur->content == NULL)
930
0
            goto error;
931
0
    }
932
0
    if (ent->orig != NULL) {
933
0
  cur->orig = xmlStrdup(ent->orig);
934
0
        if (cur->orig == NULL)
935
0
            goto error;
936
0
    }
937
0
    if (ent->URI != NULL) {
938
0
  cur->URI = xmlStrdup(ent->URI);
939
0
        if (cur->URI == NULL)
940
0
            goto error;
941
0
    }
942
0
    return(cur);
943
944
0
error:
945
0
    xmlFreeEntity(cur);
946
0
    return(NULL);
947
0
}
948
949
/**
950
 * xmlCopyEntitiesTable:
951
 * @table:  An entity table
952
 *
953
 * Build a copy of an entity table.
954
 *
955
 * Returns the new xmlEntitiesTablePtr or NULL in case of error.
956
 */
957
xmlEntitiesTablePtr
958
0
xmlCopyEntitiesTable(xmlEntitiesTablePtr table) {
959
0
    return(xmlHashCopySafe(table, xmlCopyEntity, xmlFreeEntityWrapper));
960
0
}
961
962
#ifdef LIBXML_OUTPUT_ENABLED
963
964
/**
965
 * xmlDumpEntityDecl:
966
 * @buf:  An XML buffer.
967
 * @ent:  An entity table
968
 *
969
 * This will dump the content of the entity table as an XML DTD definition
970
 */
971
void
972
0
xmlDumpEntityDecl(xmlBufferPtr buf, xmlEntityPtr ent) {
973
0
    xmlSaveCtxtPtr save;
974
975
0
    if ((buf == NULL) || (ent == NULL))
976
0
        return;
977
978
0
    save = xmlSaveToBuffer(buf, NULL, 0);
979
0
    xmlSaveTree(save, (xmlNodePtr) ent);
980
0
    if (xmlSaveFinish(save) != XML_ERR_OK)
981
0
        xmlFree(xmlBufferDetach(buf));
982
0
}
983
984
/**
985
 * xmlDumpEntityDeclScan:
986
 * @ent:  An entity table
987
 * @buf:  An XML buffer.
988
 *
989
 * When using the hash table scan function, arguments need to be reversed
990
 */
991
static void
992
xmlDumpEntityDeclScan(void *ent, void *save,
993
0
                      const xmlChar *name ATTRIBUTE_UNUSED) {
994
0
    xmlSaveTree(save, ent);
995
0
}
996
997
/**
998
 * xmlDumpEntitiesTable:
999
 * @buf:  An XML buffer.
1000
 * @table:  An entity table
1001
 *
1002
 * This will dump the content of the entity table as an XML DTD definition
1003
 */
1004
void
1005
0
xmlDumpEntitiesTable(xmlBufferPtr buf, xmlEntitiesTablePtr table) {
1006
0
    xmlSaveCtxtPtr save;
1007
1008
0
    if ((buf == NULL) || (table == NULL))
1009
0
        return;
1010
1011
0
    save = xmlSaveToBuffer(buf, NULL, 0);
1012
0
    xmlHashScan(table, xmlDumpEntityDeclScan, save);
1013
0
    if (xmlSaveFinish(save) != XML_ERR_OK)
1014
0
        xmlFree(xmlBufferDetach(buf));
1015
0
}
1016
#endif /* LIBXML_OUTPUT_ENABLED */