Coverage Report

Created: 2026-01-17 06:39

next uncovered line (L), next uncovered region (R), next uncovered branch (B)
/src/libxml2/entities.c
Line
Count
Source
1
/*
2
 * entities.c : implementation for the XML entities handling
3
 *
4
 * See Copyright for the status of this software.
5
 *
6
 * daniel@veillard.com
7
 */
8
9
/* To avoid EBCDIC trouble when parsing on zOS */
10
#if defined(__MVS__)
11
#pragma convert("ISO8859-1")
12
#endif
13
14
#define IN_LIBXML
15
#include "libxml.h"
16
17
#include <string.h>
18
#include <stdlib.h>
19
20
#include <libxml/xmlmemory.h>
21
#include <libxml/hash.h>
22
#include <libxml/entities.h>
23
#include <libxml/parser.h>
24
#include <libxml/parserInternals.h>
25
#include <libxml/xmlerror.h>
26
#include <libxml/dict.h>
27
#include <libxml/xmlsave.h>
28
29
#include "private/entities.h"
30
#include "private/error.h"
31
32
#ifndef SIZE_MAX
33
  #define SIZE_MAX ((size_t) -1)
34
#endif
35
36
/*
37
 * The XML predefined entities.
38
 */
39
40
static xmlEntity xmlEntityLt = {
41
    NULL, XML_ENTITY_DECL, BAD_CAST "lt",
42
    NULL, NULL, NULL, NULL, NULL, NULL,
43
    BAD_CAST "<", BAD_CAST "<", 1,
44
    XML_INTERNAL_PREDEFINED_ENTITY,
45
    NULL, NULL, NULL, NULL, 0, 0, 0
46
};
47
static xmlEntity xmlEntityGt = {
48
    NULL, XML_ENTITY_DECL, BAD_CAST "gt",
49
    NULL, NULL, NULL, NULL, NULL, NULL,
50
    BAD_CAST ">", BAD_CAST ">", 1,
51
    XML_INTERNAL_PREDEFINED_ENTITY,
52
    NULL, NULL, NULL, NULL, 0, 0, 0
53
};
54
static xmlEntity xmlEntityAmp = {
55
    NULL, XML_ENTITY_DECL, BAD_CAST "amp",
56
    NULL, NULL, NULL, NULL, NULL, NULL,
57
    BAD_CAST "&", BAD_CAST "&", 1,
58
    XML_INTERNAL_PREDEFINED_ENTITY,
59
    NULL, NULL, NULL, NULL, 0, 0, 0
60
};
61
static xmlEntity xmlEntityQuot = {
62
    NULL, XML_ENTITY_DECL, BAD_CAST "quot",
63
    NULL, NULL, NULL, NULL, NULL, NULL,
64
    BAD_CAST "\"", BAD_CAST "\"", 1,
65
    XML_INTERNAL_PREDEFINED_ENTITY,
66
    NULL, NULL, NULL, NULL, 0, 0, 0
67
};
68
static xmlEntity xmlEntityApos = {
69
    NULL, XML_ENTITY_DECL, BAD_CAST "apos",
70
    NULL, NULL, NULL, NULL, NULL, NULL,
71
    BAD_CAST "'", BAD_CAST "'", 1,
72
    XML_INTERNAL_PREDEFINED_ENTITY,
73
    NULL, NULL, NULL, NULL, 0, 0, 0
74
};
75
76
/*
77
 * xmlFreeEntity:
78
 * @entity:  an entity
79
 *
80
 * Frees the entity.
81
 */
82
void
83
xmlFreeEntity(xmlEntityPtr entity)
84
137k
{
85
137k
    xmlDictPtr dict = NULL;
86
87
137k
    if (entity == NULL)
88
0
        return;
89
90
137k
    if (entity->doc != NULL)
91
136k
        dict = entity->doc->dict;
92
93
94
137k
    if ((entity->children) &&
95
1.35k
        (entity == (xmlEntityPtr) entity->children->parent))
96
1.35k
        xmlFreeNodeList(entity->children);
97
137k
    if ((entity->name != NULL) &&
98
137k
        ((dict == NULL) || (!xmlDictOwns(dict, entity->name))))
99
52.6k
        xmlFree((char *) entity->name);
100
137k
    if (entity->ExternalID != NULL)
101
10.2k
        xmlFree((char *) entity->ExternalID);
102
137k
    if (entity->SystemID != NULL)
103
40.4k
        xmlFree((char *) entity->SystemID);
104
137k
    if (entity->URI != NULL)
105
38.1k
        xmlFree((char *) entity->URI);
106
137k
    if (entity->content != NULL)
107
95.7k
        xmlFree((char *) entity->content);
108
137k
    if (entity->orig != NULL)
109
80.9k
        xmlFree((char *) entity->orig);
110
137k
    xmlFree(entity);
111
137k
}
112
113
/*
114
 * xmlCreateEntity:
115
 *
116
 * internal routine doing the entity node structures allocations
117
 */
118
static xmlEntityPtr
119
xmlCreateEntity(xmlDocPtr doc, const xmlChar *name, int type,
120
          const xmlChar *ExternalID, const xmlChar *SystemID,
121
96.7k
          const xmlChar *content) {
122
96.7k
    xmlEntityPtr ret;
123
124
96.7k
    ret = (xmlEntityPtr) xmlMalloc(sizeof(xmlEntity));
125
96.7k
    if (ret == NULL)
126
10
  return(NULL);
127
96.7k
    memset(ret, 0, sizeof(xmlEntity));
128
96.7k
    ret->doc = doc;
129
96.7k
    ret->type = XML_ENTITY_DECL;
130
131
    /*
132
     * fill the structure.
133
     */
134
96.7k
    ret->etype = (xmlEntityType) type;
135
96.7k
    if ((doc == NULL) || (doc->dict == NULL))
136
12.4k
  ret->name = xmlStrdup(name);
137
84.3k
    else
138
84.3k
        ret->name = xmlDictLookup(doc->dict, name, -1);
139
96.7k
    if (ret->name == NULL)
140
1
        goto error;
141
96.7k
    if (ExternalID != NULL) {
142
10.2k
        ret->ExternalID = xmlStrdup(ExternalID);
143
10.2k
        if (ret->ExternalID == NULL)
144
1
            goto error;
145
10.2k
    }
146
96.7k
    if (SystemID != NULL) {
147
39.2k
        ret->SystemID = xmlStrdup(SystemID);
148
39.2k
        if (ret->SystemID == NULL)
149
1
            goto error;
150
39.2k
    }
151
96.7k
    if (content != NULL) {
152
55.8k
        ret->length = xmlStrlen(content);
153
55.8k
  ret->content = xmlStrndup(content, ret->length);
154
55.8k
        if (ret->content == NULL)
155
4
            goto error;
156
55.8k
     } else {
157
40.9k
        ret->length = 0;
158
40.9k
        ret->content = NULL;
159
40.9k
    }
160
96.7k
    ret->URI = NULL; /* to be computed by the layer knowing
161
      the defining entity */
162
96.7k
    ret->orig = NULL;
163
164
96.7k
    return(ret);
165
166
7
error:
167
7
    xmlFreeEntity(ret);
168
7
    return(NULL);
169
96.7k
}
170
171
/**
172
 * xmlAddEntity:
173
 * @doc:  the document
174
 * @extSubset:  add to the external or internal subset
175
 * @name:  the entity name
176
 * @type:  the entity type XML_xxx_yyy_ENTITY
177
 * @ExternalID:  the entity external ID if available
178
 * @SystemID:  the entity system ID if available
179
 * @content:  the entity content
180
 * @out:  pointer to resulting entity (optional)
181
 *
182
 * Register a new entity for this document.
183
 *
184
 * Available since 2.13.0.
185
 *
186
 * Returns an xmlParserErrors error code.
187
 */
188
int
189
xmlAddEntity(xmlDocPtr doc, int extSubset, const xmlChar *name, int type,
190
    const xmlChar *ExternalID, const xmlChar *SystemID,
191
111k
    const xmlChar *content, xmlEntityPtr *out) {
192
111k
    xmlDtdPtr dtd;
193
111k
    xmlDictPtr dict = NULL;
194
111k
    xmlEntitiesTablePtr table = NULL;
195
111k
    xmlEntityPtr ret, predef;
196
111k
    int res;
197
198
111k
    if (out != NULL)
199
111k
        *out = NULL;
200
111k
    if ((doc == NULL) || (name == NULL))
201
0
  return(XML_ERR_ARGUMENT);
202
111k
    dict = doc->dict;
203
204
111k
    if (extSubset)
205
8.10k
        dtd = doc->extSubset;
206
103k
    else
207
103k
        dtd = doc->intSubset;
208
111k
    if (dtd == NULL)
209
0
        return(XML_DTD_NO_DTD);
210
211
111k
    switch (type) {
212
48.2k
        case XML_INTERNAL_GENERAL_ENTITY:
213
61.2k
        case XML_EXTERNAL_GENERAL_PARSED_ENTITY:
214
61.4k
        case XML_EXTERNAL_GENERAL_UNPARSED_ENTITY:
215
61.4k
            predef = xmlGetPredefinedEntity(name);
216
61.4k
            if (predef != NULL) {
217
20.2k
                int valid = 0;
218
219
                /* 4.6 Predefined Entities */
220
20.2k
                if ((type == XML_INTERNAL_GENERAL_ENTITY) &&
221
18.4k
                    (content != NULL)) {
222
18.1k
                    int c = predef->content[0];
223
224
18.1k
                    if (((content[0] == c) && (content[1] == 0)) &&
225
2.00k
                        ((c == '>') || (c == '\'') || (c == '"'))) {
226
1.78k
                        valid = 1;
227
16.4k
                    } else if ((content[0] == '&') && (content[1] == '#')) {
228
9.46k
                        if (content[2] == 'x') {
229
8.66k
                            xmlChar *hex = BAD_CAST "0123456789ABCDEF";
230
8.66k
                            xmlChar ref[] = "00;";
231
232
8.66k
                            ref[0] = hex[c / 16 % 16];
233
8.66k
                            ref[1] = hex[c % 16];
234
8.66k
                            if (xmlStrcasecmp(&content[3], ref) == 0)
235
3.46k
                                valid = 1;
236
8.66k
                        } else {
237
796
                            xmlChar ref[] = "00;";
238
239
796
                            ref[0] = '0' + c / 10 % 10;
240
796
                            ref[1] = '0' + c % 10;
241
796
                            if (xmlStrEqual(&content[2], ref))
242
225
                                valid = 1;
243
796
                        }
244
9.46k
                    }
245
18.1k
                }
246
20.2k
                if (!valid)
247
14.7k
                    return(XML_ERR_REDECL_PREDEF_ENTITY);
248
20.2k
            }
249
46.7k
      if (dtd->entities == NULL) {
250
25.0k
    dtd->entities = xmlHashCreateDict(0, dict);
251
25.0k
                if (dtd->entities == NULL)
252
3
                    return(XML_ERR_NO_MEMORY);
253
25.0k
            }
254
46.7k
      table = dtd->entities;
255
46.7k
      break;
256
21.0k
        case XML_INTERNAL_PARAMETER_ENTITY:
257
50.0k
        case XML_EXTERNAL_PARAMETER_ENTITY:
258
50.0k
      if (dtd->pentities == NULL) {
259
22.8k
    dtd->pentities = xmlHashCreateDict(0, dict);
260
22.8k
                if (dtd->pentities == NULL)
261
1
                    return(XML_ERR_NO_MEMORY);
262
22.8k
            }
263
50.0k
      table = dtd->pentities;
264
50.0k
      break;
265
0
        default:
266
0
      return(XML_ERR_ARGUMENT);
267
111k
    }
268
96.7k
    ret = xmlCreateEntity(dtd->doc, name, type, ExternalID, SystemID, content);
269
96.7k
    if (ret == NULL)
270
17
        return(XML_ERR_NO_MEMORY);
271
272
96.7k
    res = xmlHashAdd(table, name, ret);
273
96.7k
    if (res < 0) {
274
10
        xmlFreeEntity(ret);
275
10
        return(XML_ERR_NO_MEMORY);
276
96.7k
    } else if (res == 0) {
277
  /*
278
   * entity was already defined at another level.
279
   */
280
13.9k
        xmlFreeEntity(ret);
281
13.9k
  return(XML_WAR_ENTITY_REDEFINED);
282
13.9k
    }
283
284
    /*
285
     * Link it to the DTD
286
     */
287
82.8k
    ret->parent = dtd;
288
82.8k
    ret->doc = dtd->doc;
289
82.8k
    if (dtd->last == NULL) {
290
35.4k
  dtd->children = dtd->last = (xmlNodePtr) ret;
291
47.4k
    } else {
292
47.4k
  dtd->last->next = (xmlNodePtr) ret;
293
47.4k
  ret->prev = dtd->last;
294
47.4k
  dtd->last = (xmlNodePtr) ret;
295
47.4k
    }
296
297
82.8k
    if (out != NULL)
298
82.8k
        *out = ret;
299
82.8k
    return(0);
300
96.7k
}
301
302
/**
303
 * xmlGetPredefinedEntity:
304
 * @name:  the entity name
305
 *
306
 * Check whether this name is an predefined entity.
307
 *
308
 * Returns NULL if not, otherwise the entity
309
 */
310
xmlEntityPtr
311
1.94M
xmlGetPredefinedEntity(const xmlChar *name) {
312
1.94M
    if (name == NULL) return(NULL);
313
1.94M
    switch (name[0]) {
314
20.6k
        case 'l':
315
20.6k
      if (xmlStrEqual(name, BAD_CAST "lt"))
316
11.2k
          return(&xmlEntityLt);
317
9.42k
      break;
318
107k
        case 'g':
319
107k
      if (xmlStrEqual(name, BAD_CAST "gt"))
320
105k
          return(&xmlEntityGt);
321
2.03k
      break;
322
707k
        case 'a':
323
707k
      if (xmlStrEqual(name, BAD_CAST "amp"))
324
134k
          return(&xmlEntityAmp);
325
573k
      if (xmlStrEqual(name, BAD_CAST "apos"))
326
5.06k
          return(&xmlEntityApos);
327
567k
      break;
328
586k
        case 'q':
329
586k
      if (xmlStrEqual(name, BAD_CAST "quot"))
330
7.77k
          return(&xmlEntityQuot);
331
578k
      break;
332
578k
  default:
333
524k
      break;
334
1.94M
    }
335
1.68M
    return(NULL);
336
1.94M
}
337
338
/**
339
 * xmlAddDtdEntity:
340
 * @doc:  the document
341
 * @name:  the entity name
342
 * @type:  the entity type XML_xxx_yyy_ENTITY
343
 * @ExternalID:  the entity external ID if available
344
 * @SystemID:  the entity system ID if available
345
 * @content:  the entity content
346
 *
347
 * Register a new entity for this document DTD external subset.
348
 *
349
 * Returns a pointer to the entity or NULL in case of error
350
 */
351
xmlEntityPtr
352
xmlAddDtdEntity(xmlDocPtr doc, const xmlChar *name, int type,
353
          const xmlChar *ExternalID, const xmlChar *SystemID,
354
0
    const xmlChar *content) {
355
0
    xmlEntityPtr ret;
356
357
0
    xmlAddEntity(doc, 1, name, type, ExternalID, SystemID, content, &ret);
358
0
    return(ret);
359
0
}
360
361
/**
362
 * xmlAddDocEntity:
363
 * @doc:  the document
364
 * @name:  the entity name
365
 * @type:  the entity type XML_xxx_yyy_ENTITY
366
 * @ExternalID:  the entity external ID if available
367
 * @SystemID:  the entity system ID if available
368
 * @content:  the entity content
369
 *
370
 * Register a new entity for this document.
371
 *
372
 * Returns a pointer to the entity or NULL in case of error
373
 */
374
xmlEntityPtr
375
xmlAddDocEntity(xmlDocPtr doc, const xmlChar *name, int type,
376
          const xmlChar *ExternalID, const xmlChar *SystemID,
377
0
          const xmlChar *content) {
378
0
    xmlEntityPtr ret;
379
380
0
    xmlAddEntity(doc, 0, name, type, ExternalID, SystemID, content, &ret);
381
0
    return(ret);
382
0
}
383
384
/**
385
 * xmlNewEntity:
386
 * @doc:  the document
387
 * @name:  the entity name
388
 * @type:  the entity type XML_xxx_yyy_ENTITY
389
 * @ExternalID:  the entity external ID if available
390
 * @SystemID:  the entity system ID if available
391
 * @content:  the entity content
392
 *
393
 * Create a new entity, this differs from xmlAddDocEntity() that if
394
 * the document is NULL or has no internal subset defined, then an
395
 * unlinked entity structure will be returned, it is then the responsibility
396
 * of the caller to link it to the document later or free it when not needed
397
 * anymore.
398
 *
399
 * Returns a pointer to the entity or NULL in case of error
400
 */
401
xmlEntityPtr
402
xmlNewEntity(xmlDocPtr doc, const xmlChar *name, int type,
403
       const xmlChar *ExternalID, const xmlChar *SystemID,
404
0
       const xmlChar *content) {
405
0
    if ((doc != NULL) && (doc->intSubset != NULL)) {
406
0
  return(xmlAddDocEntity(doc, name, type, ExternalID, SystemID, content));
407
0
    }
408
0
    if (name == NULL)
409
0
        return(NULL);
410
0
    return(xmlCreateEntity(doc, name, type, ExternalID, SystemID, content));
411
0
}
412
413
/**
414
 * xmlGetEntityFromTable:
415
 * @table:  an entity table
416
 * @name:  the entity name
417
 * @parameter:  look for parameter entities
418
 *
419
 * Do an entity lookup in the table.
420
 * returns the corresponding parameter entity, if found.
421
 *
422
 * Returns A pointer to the entity structure or NULL if not found.
423
 */
424
static xmlEntityPtr
425
905k
xmlGetEntityFromTable(xmlEntitiesTablePtr table, const xmlChar *name) {
426
905k
    return((xmlEntityPtr) xmlHashLookup(table, name));
427
905k
}
428
429
/**
430
 * xmlGetParameterEntity:
431
 * @doc:  the document referencing the entity
432
 * @name:  the entity name
433
 *
434
 * Do an entity lookup in the internal and external subsets and
435
 * returns the corresponding parameter entity, if found.
436
 *
437
 * Returns A pointer to the entity structure or NULL if not found.
438
 */
439
xmlEntityPtr
440
104k
xmlGetParameterEntity(xmlDocPtr doc, const xmlChar *name) {
441
104k
    xmlEntitiesTablePtr table;
442
104k
    xmlEntityPtr ret;
443
444
104k
    if (doc == NULL)
445
332
  return(NULL);
446
103k
    if ((doc->intSubset != NULL) && (doc->intSubset->pentities != NULL)) {
447
100k
  table = (xmlEntitiesTablePtr) doc->intSubset->pentities;
448
100k
  ret = xmlGetEntityFromTable(table, name);
449
100k
  if (ret != NULL)
450
75.4k
      return(ret);
451
100k
    }
452
28.2k
    if ((doc->extSubset != NULL) && (doc->extSubset->pentities != NULL)) {
453
7.92k
  table = (xmlEntitiesTablePtr) doc->extSubset->pentities;
454
7.92k
  return(xmlGetEntityFromTable(table, name));
455
7.92k
    }
456
20.3k
    return(NULL);
457
28.2k
}
458
459
/**
460
 * xmlGetDtdEntity:
461
 * @doc:  the document referencing the entity
462
 * @name:  the entity name
463
 *
464
 * Do an entity lookup in the DTD entity hash table and
465
 * returns the corresponding entity, if found.
466
 * Note: the first argument is the document node, not the DTD node.
467
 *
468
 * Returns A pointer to the entity structure or NULL if not found.
469
 */
470
xmlEntityPtr
471
0
xmlGetDtdEntity(xmlDocPtr doc, const xmlChar *name) {
472
0
    xmlEntitiesTablePtr table;
473
474
0
    if (doc == NULL)
475
0
  return(NULL);
476
0
    if ((doc->extSubset != NULL) && (doc->extSubset->entities != NULL)) {
477
0
  table = (xmlEntitiesTablePtr) doc->extSubset->entities;
478
0
  return(xmlGetEntityFromTable(table, name));
479
0
    }
480
0
    return(NULL);
481
0
}
482
483
/**
484
 * xmlGetDocEntity:
485
 * @doc:  the document referencing the entity
486
 * @name:  the entity name
487
 *
488
 * Do an entity lookup in the document entity hash table and
489
 * returns the corresponding entity, otherwise a lookup is done
490
 * in the predefined entities too.
491
 *
492
 * Returns A pointer to the entity structure or NULL if not found.
493
 */
494
xmlEntityPtr
495
828k
xmlGetDocEntity(const xmlDoc *doc, const xmlChar *name) {
496
828k
    xmlEntityPtr cur;
497
828k
    xmlEntitiesTablePtr table;
498
499
828k
    if (doc != NULL) {
500
827k
  if ((doc->intSubset != NULL) && (doc->intSubset->entities != NULL)) {
501
734k
      table = (xmlEntitiesTablePtr) doc->intSubset->entities;
502
734k
      cur = xmlGetEntityFromTable(table, name);
503
734k
      if (cur != NULL)
504
645k
    return(cur);
505
734k
  }
506
181k
  if (doc->standalone != 1) {
507
180k
      if ((doc->extSubset != NULL) &&
508
65.7k
    (doc->extSubset->entities != NULL)) {
509
63.6k
    table = (xmlEntitiesTablePtr) doc->extSubset->entities;
510
63.6k
    cur = xmlGetEntityFromTable(table, name);
511
63.6k
    if (cur != NULL)
512
276
        return(cur);
513
63.6k
      }
514
180k
  }
515
181k
    }
516
182k
    return(xmlGetPredefinedEntity(name));
517
828k
}
518
519
/*
520
 * xmlSerializeHexCharRef:
521
 * @buf:  a char buffer
522
 * @val:  a codepoint
523
 *
524
 * Serializes a hex char ref like &#xA0;
525
 *
526
 * Writes at most 9 bytes. Does not include a terminating zero byte.
527
 *
528
 * Returns the number of bytes written.
529
 */
530
int
531
3.32k
xmlSerializeHexCharRef(char *buf, int val) {
532
3.32k
    char *out = buf;
533
3.32k
    int shift = 0, bits;
534
535
3.32k
    *out++ = '&';
536
3.32k
    *out++ = '#';
537
3.32k
    *out++ = 'x';
538
539
3.32k
    bits = val;
540
3.32k
    if (bits & 0xFF0000) {
541
93
        shift = 16;
542
93
        bits &= 0xFF0000;
543
3.23k
    } else if (bits & 0x00FF00) {
544
463
        shift = 8;
545
463
        bits &= 0x00FF00;
546
463
    }
547
3.32k
    if (bits & 0xF0F0F0) {
548
3.19k
        shift += 4;
549
3.19k
    }
550
551
7.81k
    do {
552
7.81k
        int d = (val >> shift) & 0x0F;
553
554
7.81k
        if (d < 10)
555
3.11k
            *out++ = '0' + d;
556
4.70k
        else
557
4.70k
            *out++ = 'A' + (d - 10);
558
559
7.81k
  shift -= 4;
560
7.81k
    } while (shift >= 0);
561
562
3.32k
    *out++ = ';';
563
564
3.32k
    return(out - buf);
565
3.32k
}
566
567
/*
568
 * xmlSerializeDecCharRef:
569
 * @buf:  a char buffer
570
 * @val:  a codepoint
571
 *
572
 * Serializes a decimal char ref like &#38;
573
 *
574
 * Writes at most 10 bytes. Does not include a terminating zero byte.
575
 *
576
 * Returns the number of bytes written.
577
 */
578
int
579
54.9M
xmlSerializeDecCharRef(char *buf, int val) {
580
54.9M
    char *out = buf;
581
54.9M
    int len, i;
582
583
54.9M
    *out++ = '&';
584
54.9M
    *out++ = '#';
585
586
54.9M
    if (val < 100) {
587
897
        len = (val < 10) ? 1 : 2;
588
54.9M
    } else if (val < 10000) {
589
54.9M
        len = (val < 1000) ? 3 : 4;
590
54.9M
    } else if (val < 1000000) {
591
4.44k
        len = (val < 100000) ? 5 : 6;
592
4.44k
    } else {
593
295
        len = 7;
594
295
    }
595
596
225M
    for (i = len - 1; i >= 0; i--) {
597
170M
        out[i] = '0' + val % 10;
598
170M
        val /= 10;
599
170M
    }
600
601
54.9M
    out[len] = ';';
602
603
54.9M
    return(len + 3);
604
54.9M
}
605
606
static const char xmlEscapeSafe[128] = {
607
    0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 0, 0, 0, 0,
608
    0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
609
    1, 1, 0, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1,
610
    1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 0, 1,
611
    1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
612
    1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
613
    1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
614
    1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1
615
};
616
617
/*
618
 * xmlEscapeText:
619
 * @text:  input text
620
 * @flags:  XML_ESCAPE flags
621
 *
622
 * Escapes certain characters with char refs.
623
 *
624
 * XML_ESCAPE_ATTR: for attribute content.
625
 * XML_ESCAPE_NON_ASCII: escape non-ASCII chars.
626
 * XML_ESCAPE_HTML: for HTML content.
627
 * XML_ESCAPE_QUOT: escape double quotes.
628
 * XML_ESCAPE_ALLOW_INVALID: allow invalid characters.
629
 *
630
 * Returns an escaped string or NULL if a memory allocation failed.
631
 */
632
xmlChar *
633
38.1k
xmlEscapeText(const xmlChar *text, int flags) {
634
38.1k
    const xmlChar *cur;
635
38.1k
    xmlChar *buffer;
636
38.1k
    xmlChar *out;
637
38.1k
    const xmlChar *unescaped;
638
38.1k
    size_t size = 50;
639
640
38.1k
    buffer = xmlMalloc(size + 1);
641
38.1k
    if (buffer == NULL)
642
65
        return(NULL);
643
38.0k
    out = buffer;
644
645
38.0k
    cur = text;
646
38.0k
    unescaped = cur;
647
648
219k
    while (*cur != '\0') {
649
181k
        char buf[12];
650
181k
  const xmlChar *end;
651
181k
        const xmlChar *repl;
652
181k
        size_t used;
653
181k
        size_t replSize;
654
181k
        size_t unescapedSize;
655
181k
        size_t totalSize;
656
181k
        int chunkSize = 1;
657
181k
        int c;
658
659
        /* accelerator */
660
186M
  while (1) {
661
186M
            c = *cur;
662
663
186M
            if (c < 0x80) {
664
51.0M
                if (!xmlEscapeSafe[*cur])
665
181k
                    break;
666
135M
            } else {
667
135M
               if (flags & XML_ESCAPE_NON_ASCII)
668
0
                   break;
669
135M
            }
670
186M
            cur += 1;
671
186M
        }
672
673
181k
        if (c == 0) {
674
35.9k
            chunkSize = 0;
675
35.9k
            repl = BAD_CAST "";
676
35.9k
            replSize = 0;
677
145k
        } else if (c == '<') {
678
      /*
679
       * Special handling of server side include in HTML attributes
680
       */
681
25.8k
      if ((flags & XML_ESCAPE_HTML) && (flags & XML_ESCAPE_ATTR) &&
682
25.4k
          (cur[1] == '!') && (cur[2] == '-') && (cur[3] == '-') &&
683
2.64k
          ((end = xmlStrstr(cur, BAD_CAST "-->")) != NULL)) {
684
1.59k
                chunkSize = (end - cur) + 3;
685
1.59k
                repl = cur;
686
1.59k
                replSize = chunkSize;
687
24.2k
      } else {
688
24.2k
                repl = BAD_CAST "&lt;";
689
24.2k
                replSize = 4;
690
24.2k
            }
691
119k
  } else if (c == '>') {
692
38.7k
            repl = BAD_CAST "&gt;";
693
38.7k
            replSize = 4;
694
81.1k
  } else if (c == '&') {
695
      /*
696
       * Special handling of &{...} construct from HTML 4, see
697
       * http://www.w3.org/TR/html401/appendix/notes.html#h-B.7.1
698
       */
699
7.81k
      if ((flags & XML_ESCAPE_HTML) && (flags & XML_ESCAPE_ATTR) &&
700
7.43k
                (cur[1] == '{') && (end = xmlStrchr(cur, '}'))) {
701
2.38k
                chunkSize = (end - cur) + 1;
702
2.38k
                repl = cur;
703
2.38k
                replSize = chunkSize;
704
5.43k
      } else {
705
5.43k
                repl = BAD_CAST "&amp;";
706
5.43k
                replSize = 5;
707
5.43k
            }
708
73.3k
  } else if ((flags & XML_ESCAPE_QUOT) && (c == '"')) {
709
0
            repl = BAD_CAST "&quot;";
710
0
            replSize = 6;
711
73.3k
  } else if (((flags & XML_ESCAPE_HTML) == 0) && (c == '\r')) {
712
0
      repl = BAD_CAST "&#13;";
713
0
            replSize = 5;
714
73.3k
  } else if ((flags & XML_ESCAPE_NON_ASCII) && (c >= 0x80)) {
715
0
            int val;
716
717
0
            chunkSize = 4;
718
0
            val = xmlGetUTF8Char(cur, &chunkSize);
719
0
            if (val < 0) {
720
0
                val = 0xFFFD;
721
0
                chunkSize = 1;
722
0
            } else if (((flags & XML_ESCAPE_ALLOW_INVALID) == 0) &&
723
0
                       (!IS_CHAR(val))) {
724
0
                val = 0xFFFD;
725
0
            }
726
727
0
            replSize = xmlSerializeHexCharRef(buf, val);
728
0
            repl = BAD_CAST buf;
729
73.3k
  } else if ((flags & (XML_ESCAPE_ALLOW_INVALID | XML_ESCAPE_HTML)) ||
730
0
                   (c >= 0x20) ||
731
73.3k
             (c == '\n') || (c == '\t') || (c == '\r')) {
732
      /* default case, just copy */
733
73.3k
            cur += 1;
734
73.3k
            if (*cur != 0)
735
72.5k
                continue;
736
737
785
            chunkSize = 0;
738
785
            repl = BAD_CAST "";
739
785
            replSize = 0;
740
785
  } else {
741
            /* ignore */
742
0
            repl = BAD_CAST "";
743
0
            replSize = 0;
744
0
        }
745
746
109k
        used = out - buffer;
747
109k
        unescapedSize = cur - unescaped;
748
109k
        totalSize = unescapedSize + replSize;
749
750
109k
  cur += chunkSize;
751
752
109k
        if (totalSize > size - used) {
753
7.94k
            xmlChar *tmp;
754
7.94k
            int newSize;
755
756
7.94k
            if ((size > (SIZE_MAX - 1) / 2) ||
757
7.94k
                (totalSize > (SIZE_MAX - 1) / 2 - size)) {
758
0
                xmlFree(buffer);
759
0
                return(NULL);
760
0
            }
761
7.94k
            newSize = size + totalSize;
762
7.94k
            if (*cur != 0)
763
4.61k
                newSize *= 2;
764
7.94k
            tmp = xmlRealloc(buffer, newSize + 1);
765
7.94k
            if (tmp == NULL) {
766
5
                xmlFree(buffer);
767
5
                return(NULL);
768
5
            }
769
7.94k
            buffer = tmp;
770
7.94k
            size = newSize;
771
7.94k
            out = buffer + used;
772
7.94k
        }
773
774
109k
        memcpy(out, unescaped, unescapedSize);
775
109k
        out += unescapedSize;
776
109k
        memcpy(out, repl, replSize);
777
109k
        out += replSize;
778
779
109k
        unescaped = cur;
780
109k
    }
781
782
38.0k
    *out = 0;
783
38.0k
    return(buffer);
784
38.0k
}
785
786
/**
787
 * xmlEncodeEntitiesInternal:
788
 * @doc:  the document containing the string
789
 * @input:  A string to convert to XML.
790
 * @flags:  XML_ESCAPE flags
791
 *
792
 * Do a global encoding of a string, replacing the predefined entities
793
 * and non ASCII values with their entities and CharRef counterparts.
794
 * Contrary to xmlEncodeEntities, this routine is reentrant, and result
795
 * must be deallocated.
796
 *
797
 * Returns A newly allocated string with the substitution done.
798
 */
799
xmlChar *
800
xmlEncodeEntitiesInternal(xmlDocPtr doc, const xmlChar *input,
801
38.1k
                          unsigned flags) {
802
38.1k
    if (input == NULL)
803
0
        return(NULL);
804
805
38.1k
    if ((doc != NULL) && (doc->type == XML_HTML_DOCUMENT_NODE))
806
38.1k
        flags |= XML_ESCAPE_HTML;
807
0
    else if ((doc == NULL) || (doc->encoding == NULL))
808
0
        flags |= XML_ESCAPE_NON_ASCII;
809
810
38.1k
    return(xmlEscapeText(input, flags));
811
38.1k
}
812
813
/**
814
 * xmlEncodeEntitiesReentrant:
815
 * @doc:  the document containing the string
816
 * @input:  A string to convert to XML.
817
 *
818
 * Do a global encoding of a string, replacing the predefined entities
819
 * and non ASCII values with their entities and CharRef counterparts.
820
 * Contrary to xmlEncodeEntities, this routine is reentrant, and result
821
 * must be deallocated.
822
 *
823
 * This escapes '<', '>', '&' and '\r'. If the document has no encoding,
824
 * non-ASCII codepoints are escaped. There is some special handling for
825
 * HTML documents.
826
 *
827
 * Returns A newly allocated string with the substitution done.
828
 */
829
xmlChar *
830
27.4k
xmlEncodeEntitiesReentrant(xmlDocPtr doc, const xmlChar *input) {
831
27.4k
    return xmlEncodeEntitiesInternal(doc, input, 0);
832
27.4k
}
833
834
/**
835
 * xmlEncodeSpecialChars:
836
 * @doc:  unused
837
 * @input:  A string to convert to XML.
838
 *
839
 * Do a global encoding of a string, replacing the predefined entities
840
 * this routine is reentrant, and result must be deallocated.
841
 *
842
 * This escapes '<', '>', '&', '"' and '\r' chars.
843
 *
844
 * Returns A newly allocated string with the substitution done.
845
 */
846
xmlChar *
847
xmlEncodeSpecialChars(const xmlDoc *doc ATTRIBUTE_UNUSED,
848
0
                      const xmlChar *input) {
849
0
    if (input == NULL)
850
0
        return(NULL);
851
852
0
    return(xmlEscapeText(input, XML_ESCAPE_QUOT | XML_ESCAPE_ALLOW_INVALID));
853
0
}
854
855
/**
856
 * xmlCreateEntitiesTable:
857
 *
858
 * create and initialize an empty entities hash table.
859
 * This really doesn't make sense and should be deprecated
860
 *
861
 * Returns the xmlEntitiesTablePtr just created or NULL in case of error.
862
 */
863
xmlEntitiesTablePtr
864
0
xmlCreateEntitiesTable(void) {
865
0
    return((xmlEntitiesTablePtr) xmlHashCreate(0));
866
0
}
867
868
/**
869
 * xmlFreeEntityWrapper:
870
 * @entity:  An entity
871
 * @name:  its name
872
 *
873
 * Deallocate the memory used by an entities in the hash table.
874
 */
875
static void
876
123k
xmlFreeEntityWrapper(void *entity, const xmlChar *name ATTRIBUTE_UNUSED) {
877
123k
    if (entity != NULL)
878
123k
  xmlFreeEntity((xmlEntityPtr) entity);
879
123k
}
880
881
/**
882
 * xmlFreeEntitiesTable:
883
 * @table:  An entity table
884
 *
885
 * Deallocate the memory used by an entities hash table.
886
 */
887
void
888
62.2k
xmlFreeEntitiesTable(xmlEntitiesTablePtr table) {
889
62.2k
    xmlHashFree(table, xmlFreeEntityWrapper);
890
62.2k
}
891
892
/**
893
 * xmlCopyEntity:
894
 * @ent:  An entity
895
 *
896
 * Build a copy of an entity
897
 *
898
 * Returns the new xmlEntitiesPtr or NULL in case of error.
899
 */
900
static void *
901
40.2k
xmlCopyEntity(void *payload, const xmlChar *name ATTRIBUTE_UNUSED) {
902
40.2k
    xmlEntityPtr ent = (xmlEntityPtr) payload;
903
40.2k
    xmlEntityPtr cur;
904
905
40.2k
    cur = (xmlEntityPtr) xmlMalloc(sizeof(xmlEntity));
906
40.2k
    if (cur == NULL)
907
3
  return(NULL);
908
40.2k
    memset(cur, 0, sizeof(xmlEntity));
909
40.2k
    cur->type = XML_ENTITY_DECL;
910
911
40.2k
    cur->etype = ent->etype;
912
40.2k
    if (ent->name != NULL) {
913
40.2k
  cur->name = xmlStrdup(ent->name);
914
40.2k
        if (cur->name == NULL)
915
4
            goto error;
916
40.2k
    }
917
40.2k
    if (ent->ExternalID != NULL) {
918
0
  cur->ExternalID = xmlStrdup(ent->ExternalID);
919
0
        if (cur->ExternalID == NULL)
920
0
            goto error;
921
0
    }
922
40.2k
    if (ent->SystemID != NULL) {
923
1.18k
  cur->SystemID = xmlStrdup(ent->SystemID);
924
1.18k
        if (cur->SystemID == NULL)
925
2
            goto error;
926
1.18k
    }
927
40.2k
    if (ent->content != NULL) {
928
39.0k
  cur->content = xmlStrdup(ent->content);
929
39.0k
        if (cur->content == NULL)
930
4
            goto error;
931
39.0k
    }
932
40.2k
    if (ent->orig != NULL) {
933
39.0k
  cur->orig = xmlStrdup(ent->orig);
934
39.0k
        if (cur->orig == NULL)
935
2
            goto error;
936
39.0k
    }
937
40.2k
    if (ent->URI != NULL) {
938
662
  cur->URI = xmlStrdup(ent->URI);
939
662
        if (cur->URI == NULL)
940
2
            goto error;
941
662
    }
942
40.2k
    return(cur);
943
944
14
error:
945
14
    xmlFreeEntity(cur);
946
14
    return(NULL);
947
40.2k
}
948
949
/**
950
 * xmlCopyEntitiesTable:
951
 * @table:  An entity table
952
 *
953
 * Build a copy of an entity table.
954
 *
955
 * Returns the new xmlEntitiesTablePtr or NULL in case of error.
956
 */
957
xmlEntitiesTablePtr
958
14.3k
xmlCopyEntitiesTable(xmlEntitiesTablePtr table) {
959
14.3k
    return(xmlHashCopySafe(table, xmlCopyEntity, xmlFreeEntityWrapper));
960
14.3k
}
961
962
#ifdef LIBXML_OUTPUT_ENABLED
963
964
/**
965
 * xmlDumpEntityDecl:
966
 * @buf:  An XML buffer.
967
 * @ent:  An entity table
968
 *
969
 * This will dump the content of the entity table as an XML DTD definition
970
 */
971
void
972
0
xmlDumpEntityDecl(xmlBufferPtr buf, xmlEntityPtr ent) {
973
0
    xmlSaveCtxtPtr save;
974
975
0
    if ((buf == NULL) || (ent == NULL))
976
0
        return;
977
978
0
    save = xmlSaveToBuffer(buf, NULL, 0);
979
0
    xmlSaveTree(save, (xmlNodePtr) ent);
980
0
    if (xmlSaveFinish(save) != XML_ERR_OK)
981
0
        xmlFree(xmlBufferDetach(buf));
982
0
}
983
984
/**
985
 * xmlDumpEntityDeclScan:
986
 * @ent:  An entity table
987
 * @buf:  An XML buffer.
988
 *
989
 * When using the hash table scan function, arguments need to be reversed
990
 */
991
static void
992
xmlDumpEntityDeclScan(void *ent, void *save,
993
0
                      const xmlChar *name ATTRIBUTE_UNUSED) {
994
0
    xmlSaveTree(save, ent);
995
0
}
996
997
/**
998
 * xmlDumpEntitiesTable:
999
 * @buf:  An XML buffer.
1000
 * @table:  An entity table
1001
 *
1002
 * This will dump the content of the entity table as an XML DTD definition
1003
 */
1004
void
1005
0
xmlDumpEntitiesTable(xmlBufferPtr buf, xmlEntitiesTablePtr table) {
1006
0
    xmlSaveCtxtPtr save;
1007
1008
0
    if ((buf == NULL) || (table == NULL))
1009
0
        return;
1010
1011
0
    save = xmlSaveToBuffer(buf, NULL, 0);
1012
0
    xmlHashScan(table, xmlDumpEntityDeclScan, save);
1013
0
    if (xmlSaveFinish(save) != XML_ERR_OK)
1014
0
        xmlFree(xmlBufferDetach(buf));
1015
0
}
1016
#endif /* LIBXML_OUTPUT_ENABLED */