Coverage Report

Created: 2025-11-11 06:39

next uncovered line (L), next uncovered region (R), next uncovered branch (B)
/src/libxml2/entities.c
Line
Count
Source
1
/*
2
 * entities.c : implementation for the XML entities handling
3
 *
4
 * See Copyright for the status of this software.
5
 *
6
 * daniel@veillard.com
7
 */
8
9
/* To avoid EBCDIC trouble when parsing on zOS */
10
#if defined(__MVS__)
11
#pragma convert("ISO8859-1")
12
#endif
13
14
#define IN_LIBXML
15
#include "libxml.h"
16
17
#include <string.h>
18
#include <stdlib.h>
19
20
#include <libxml/xmlmemory.h>
21
#include <libxml/hash.h>
22
#include <libxml/entities.h>
23
#include <libxml/parser.h>
24
#include <libxml/parserInternals.h>
25
#include <libxml/xmlerror.h>
26
#include <libxml/dict.h>
27
#include <libxml/xmlsave.h>
28
29
#include "private/entities.h"
30
#include "private/error.h"
31
32
#ifndef SIZE_MAX
33
  #define SIZE_MAX ((size_t) -1)
34
#endif
35
36
/*
37
 * The XML predefined entities.
38
 */
39
40
static xmlEntity xmlEntityLt = {
41
    NULL, XML_ENTITY_DECL, BAD_CAST "lt",
42
    NULL, NULL, NULL, NULL, NULL, NULL,
43
    BAD_CAST "<", BAD_CAST "<", 1,
44
    XML_INTERNAL_PREDEFINED_ENTITY,
45
    NULL, NULL, NULL, NULL, 0, 0, 0
46
};
47
static xmlEntity xmlEntityGt = {
48
    NULL, XML_ENTITY_DECL, BAD_CAST "gt",
49
    NULL, NULL, NULL, NULL, NULL, NULL,
50
    BAD_CAST ">", BAD_CAST ">", 1,
51
    XML_INTERNAL_PREDEFINED_ENTITY,
52
    NULL, NULL, NULL, NULL, 0, 0, 0
53
};
54
static xmlEntity xmlEntityAmp = {
55
    NULL, XML_ENTITY_DECL, BAD_CAST "amp",
56
    NULL, NULL, NULL, NULL, NULL, NULL,
57
    BAD_CAST "&", BAD_CAST "&", 1,
58
    XML_INTERNAL_PREDEFINED_ENTITY,
59
    NULL, NULL, NULL, NULL, 0, 0, 0
60
};
61
static xmlEntity xmlEntityQuot = {
62
    NULL, XML_ENTITY_DECL, BAD_CAST "quot",
63
    NULL, NULL, NULL, NULL, NULL, NULL,
64
    BAD_CAST "\"", BAD_CAST "\"", 1,
65
    XML_INTERNAL_PREDEFINED_ENTITY,
66
    NULL, NULL, NULL, NULL, 0, 0, 0
67
};
68
static xmlEntity xmlEntityApos = {
69
    NULL, XML_ENTITY_DECL, BAD_CAST "apos",
70
    NULL, NULL, NULL, NULL, NULL, NULL,
71
    BAD_CAST "'", BAD_CAST "'", 1,
72
    XML_INTERNAL_PREDEFINED_ENTITY,
73
    NULL, NULL, NULL, NULL, 0, 0, 0
74
};
75
76
/*
77
 * xmlFreeEntity:
78
 * @entity:  an entity
79
 *
80
 * Frees the entity.
81
 */
82
void
83
xmlFreeEntity(xmlEntityPtr entity)
84
141k
{
85
141k
    xmlDictPtr dict = NULL;
86
87
141k
    if (entity == NULL)
88
0
        return;
89
90
141k
    if (entity->doc != NULL)
91
141k
        dict = entity->doc->dict;
92
93
94
141k
    if ((entity->children) &&
95
2.38k
        (entity == (xmlEntityPtr) entity->children->parent))
96
2.38k
        xmlFreeNodeList(entity->children);
97
141k
    if ((entity->name != NULL) &&
98
141k
        ((dict == NULL) || (!xmlDictOwns(dict, entity->name))))
99
23.8k
        xmlFree((char *) entity->name);
100
141k
    if (entity->ExternalID != NULL)
101
13.3k
        xmlFree((char *) entity->ExternalID);
102
141k
    if (entity->SystemID != NULL)
103
73.2k
        xmlFree((char *) entity->SystemID);
104
141k
    if (entity->URI != NULL)
105
68.8k
        xmlFree((char *) entity->URI);
106
141k
    if (entity->content != NULL)
107
65.2k
        xmlFree((char *) entity->content);
108
141k
    if (entity->orig != NULL)
109
62.1k
        xmlFree((char *) entity->orig);
110
141k
    xmlFree(entity);
111
141k
}
112
113
/*
114
 * xmlCreateEntity:
115
 *
116
 * internal routine doing the entity node structures allocations
117
 */
118
static xmlEntityPtr
119
xmlCreateEntity(xmlDocPtr doc, const xmlChar *name, int type,
120
          const xmlChar *ExternalID, const xmlChar *SystemID,
121
141k
          const xmlChar *content) {
122
141k
    xmlEntityPtr ret;
123
124
141k
    ret = (xmlEntityPtr) xmlMalloc(sizeof(xmlEntity));
125
141k
    if (ret == NULL)
126
15
  return(NULL);
127
141k
    memset(ret, 0, sizeof(xmlEntity));
128
141k
    ret->doc = doc;
129
141k
    ret->type = XML_ENTITY_DECL;
130
131
    /*
132
     * fill the structure.
133
     */
134
141k
    ret->etype = (xmlEntityType) type;
135
141k
    if ((doc == NULL) || (doc->dict == NULL))
136
23.8k
  ret->name = xmlStrdup(name);
137
117k
    else
138
117k
        ret->name = xmlDictLookup(doc->dict, name, -1);
139
141k
    if (ret->name == NULL)
140
3
        goto error;
141
141k
    if (ExternalID != NULL) {
142
13.3k
        ret->ExternalID = xmlStrdup(ExternalID);
143
13.3k
        if (ret->ExternalID == NULL)
144
4
            goto error;
145
13.3k
    }
146
141k
    if (SystemID != NULL) {
147
73.2k
        ret->SystemID = xmlStrdup(SystemID);
148
73.2k
        if (ret->SystemID == NULL)
149
6
            goto error;
150
73.2k
    }
151
141k
    if (content != NULL) {
152
64.9k
        ret->length = xmlStrlen(content);
153
64.9k
  ret->content = xmlStrndup(content, ret->length);
154
64.9k
        if (ret->content == NULL)
155
1
            goto error;
156
76.7k
     } else {
157
76.7k
        ret->length = 0;
158
76.7k
        ret->content = NULL;
159
76.7k
    }
160
141k
    ret->URI = NULL; /* to be computed by the layer knowing
161
      the defining entity */
162
141k
    ret->orig = NULL;
163
164
141k
    return(ret);
165
166
14
error:
167
14
    xmlFreeEntity(ret);
168
14
    return(NULL);
169
141k
}
170
171
/**
172
 * xmlAddEntity:
173
 * @doc:  the document
174
 * @extSubset:  add to the external or internal subset
175
 * @name:  the entity name
176
 * @type:  the entity type XML_xxx_yyy_ENTITY
177
 * @ExternalID:  the entity external ID if available
178
 * @SystemID:  the entity system ID if available
179
 * @content:  the entity content
180
 * @out:  pointer to resulting entity (optional)
181
 *
182
 * Register a new entity for this document.
183
 *
184
 * Available since 2.13.0.
185
 *
186
 * Returns an xmlParserErrors error code.
187
 */
188
int
189
xmlAddEntity(xmlDocPtr doc, int extSubset, const xmlChar *name, int type,
190
    const xmlChar *ExternalID, const xmlChar *SystemID,
191
144k
    const xmlChar *content, xmlEntityPtr *out) {
192
144k
    xmlDtdPtr dtd;
193
144k
    xmlDictPtr dict = NULL;
194
144k
    xmlEntitiesTablePtr table = NULL;
195
144k
    xmlEntityPtr ret, predef;
196
144k
    int res;
197
198
144k
    if (out != NULL)
199
144k
        *out = NULL;
200
144k
    if ((doc == NULL) || (name == NULL))
201
0
  return(XML_ERR_ARGUMENT);
202
144k
    dict = doc->dict;
203
204
144k
    if (extSubset)
205
11.4k
        dtd = doc->extSubset;
206
133k
    else
207
133k
        dtd = doc->intSubset;
208
144k
    if (dtd == NULL)
209
0
        return(XML_DTD_NO_DTD);
210
211
144k
    switch (type) {
212
37.4k
        case XML_INTERNAL_GENERAL_ENTITY:
213
54.0k
        case XML_EXTERNAL_GENERAL_PARSED_ENTITY:
214
54.2k
        case XML_EXTERNAL_GENERAL_UNPARSED_ENTITY:
215
54.2k
            predef = xmlGetPredefinedEntity(name);
216
54.2k
            if (predef != NULL) {
217
3.83k
                int valid = 0;
218
219
                /* 4.6 Predefined Entities */
220
3.83k
                if ((type == XML_INTERNAL_GENERAL_ENTITY) &&
221
3.54k
                    (content != NULL)) {
222
2.93k
                    int c = predef->content[0];
223
224
2.93k
                    if (((content[0] == c) && (content[1] == 0)) &&
225
864
                        ((c == '>') || (c == '\'') || (c == '"'))) {
226
638
                        valid = 1;
227
2.29k
                    } else if ((content[0] == '&') && (content[1] == '#')) {
228
1.16k
                        if (content[2] == 'x') {
229
223
                            xmlChar *hex = BAD_CAST "0123456789ABCDEF";
230
223
                            xmlChar ref[] = "00;";
231
232
223
                            ref[0] = hex[c / 16 % 16];
233
223
                            ref[1] = hex[c % 16];
234
223
                            if (xmlStrcasecmp(&content[3], ref) == 0)
235
0
                                valid = 1;
236
946
                        } else {
237
946
                            xmlChar ref[] = "00;";
238
239
946
                            ref[0] = '0' + c / 10 % 10;
240
946
                            ref[1] = '0' + c % 10;
241
946
                            if (xmlStrEqual(&content[2], ref))
242
264
                                valid = 1;
243
946
                        }
244
1.16k
                    }
245
2.93k
                }
246
3.83k
                if (!valid)
247
2.93k
                    return(XML_ERR_REDECL_PREDEF_ENTITY);
248
3.83k
            }
249
51.3k
      if (dtd->entities == NULL) {
250
39.4k
    dtd->entities = xmlHashCreateDict(0, dict);
251
39.4k
                if (dtd->entities == NULL)
252
3
                    return(XML_ERR_NO_MEMORY);
253
39.4k
            }
254
51.3k
      table = dtd->entities;
255
51.3k
      break;
256
30.9k
        case XML_INTERNAL_PARAMETER_ENTITY:
257
90.3k
        case XML_EXTERNAL_PARAMETER_ENTITY:
258
90.3k
      if (dtd->pentities == NULL) {
259
43.2k
    dtd->pentities = xmlHashCreateDict(0, dict);
260
43.2k
                if (dtd->pentities == NULL)
261
6
                    return(XML_ERR_NO_MEMORY);
262
43.2k
            }
263
90.3k
      table = dtd->pentities;
264
90.3k
      break;
265
0
        default:
266
0
      return(XML_ERR_ARGUMENT);
267
144k
    }
268
141k
    ret = xmlCreateEntity(dtd->doc, name, type, ExternalID, SystemID, content);
269
141k
    if (ret == NULL)
270
29
        return(XML_ERR_NO_MEMORY);
271
272
141k
    res = xmlHashAdd(table, name, ret);
273
141k
    if (res < 0) {
274
11
        xmlFreeEntity(ret);
275
11
        return(XML_ERR_NO_MEMORY);
276
141k
    } else if (res == 0) {
277
  /*
278
   * entity was already defined at another level.
279
   */
280
5.08k
        xmlFreeEntity(ret);
281
5.08k
  return(XML_WAR_ENTITY_REDEFINED);
282
5.08k
    }
283
284
    /*
285
     * Link it to the DTD
286
     */
287
136k
    ret->parent = dtd;
288
136k
    ret->doc = dtd->doc;
289
136k
    if (dtd->last == NULL) {
290
58.6k
  dtd->children = dtd->last = (xmlNodePtr) ret;
291
77.9k
    } else {
292
77.9k
  dtd->last->next = (xmlNodePtr) ret;
293
77.9k
  ret->prev = dtd->last;
294
77.9k
  dtd->last = (xmlNodePtr) ret;
295
77.9k
    }
296
297
136k
    if (out != NULL)
298
136k
        *out = ret;
299
136k
    return(0);
300
141k
}
301
302
/**
303
 * xmlGetPredefinedEntity:
304
 * @name:  the entity name
305
 *
306
 * Check whether this name is an predefined entity.
307
 *
308
 * Returns NULL if not, otherwise the entity
309
 */
310
xmlEntityPtr
311
2.05M
xmlGetPredefinedEntity(const xmlChar *name) {
312
2.05M
    if (name == NULL) return(NULL);
313
2.05M
    switch (name[0]) {
314
18.3k
        case 'l':
315
18.3k
      if (xmlStrEqual(name, BAD_CAST "lt"))
316
11.6k
          return(&xmlEntityLt);
317
6.69k
      break;
318
56.3k
        case 'g':
319
56.3k
      if (xmlStrEqual(name, BAD_CAST "gt"))
320
50.1k
          return(&xmlEntityGt);
321
6.14k
      break;
322
929k
        case 'a':
323
929k
      if (xmlStrEqual(name, BAD_CAST "amp"))
324
72.9k
          return(&xmlEntityAmp);
325
856k
      if (xmlStrEqual(name, BAD_CAST "apos"))
326
1.07k
          return(&xmlEntityApos);
327
855k
      break;
328
855k
        case 'q':
329
452k
      if (xmlStrEqual(name, BAD_CAST "quot"))
330
521
          return(&xmlEntityQuot);
331
452k
      break;
332
600k
  default:
333
600k
      break;
334
2.05M
    }
335
1.92M
    return(NULL);
336
2.05M
}
337
338
/**
339
 * xmlAddDtdEntity:
340
 * @doc:  the document
341
 * @name:  the entity name
342
 * @type:  the entity type XML_xxx_yyy_ENTITY
343
 * @ExternalID:  the entity external ID if available
344
 * @SystemID:  the entity system ID if available
345
 * @content:  the entity content
346
 *
347
 * Register a new entity for this document DTD external subset.
348
 *
349
 * Returns a pointer to the entity or NULL in case of error
350
 */
351
xmlEntityPtr
352
xmlAddDtdEntity(xmlDocPtr doc, const xmlChar *name, int type,
353
          const xmlChar *ExternalID, const xmlChar *SystemID,
354
0
    const xmlChar *content) {
355
0
    xmlEntityPtr ret;
356
357
0
    xmlAddEntity(doc, 1, name, type, ExternalID, SystemID, content, &ret);
358
0
    return(ret);
359
0
}
360
361
/**
362
 * xmlAddDocEntity:
363
 * @doc:  the document
364
 * @name:  the entity name
365
 * @type:  the entity type XML_xxx_yyy_ENTITY
366
 * @ExternalID:  the entity external ID if available
367
 * @SystemID:  the entity system ID if available
368
 * @content:  the entity content
369
 *
370
 * Register a new entity for this document.
371
 *
372
 * Returns a pointer to the entity or NULL in case of error
373
 */
374
xmlEntityPtr
375
xmlAddDocEntity(xmlDocPtr doc, const xmlChar *name, int type,
376
          const xmlChar *ExternalID, const xmlChar *SystemID,
377
0
          const xmlChar *content) {
378
0
    xmlEntityPtr ret;
379
380
0
    xmlAddEntity(doc, 0, name, type, ExternalID, SystemID, content, &ret);
381
0
    return(ret);
382
0
}
383
384
/**
385
 * xmlNewEntity:
386
 * @doc:  the document
387
 * @name:  the entity name
388
 * @type:  the entity type XML_xxx_yyy_ENTITY
389
 * @ExternalID:  the entity external ID if available
390
 * @SystemID:  the entity system ID if available
391
 * @content:  the entity content
392
 *
393
 * Create a new entity, this differs from xmlAddDocEntity() that if
394
 * the document is NULL or has no internal subset defined, then an
395
 * unlinked entity structure will be returned, it is then the responsibility
396
 * of the caller to link it to the document later or free it when not needed
397
 * anymore.
398
 *
399
 * Returns a pointer to the entity or NULL in case of error
400
 */
401
xmlEntityPtr
402
xmlNewEntity(xmlDocPtr doc, const xmlChar *name, int type,
403
       const xmlChar *ExternalID, const xmlChar *SystemID,
404
0
       const xmlChar *content) {
405
0
    if ((doc != NULL) && (doc->intSubset != NULL)) {
406
0
  return(xmlAddDocEntity(doc, name, type, ExternalID, SystemID, content));
407
0
    }
408
0
    if (name == NULL)
409
0
        return(NULL);
410
0
    return(xmlCreateEntity(doc, name, type, ExternalID, SystemID, content));
411
0
}
412
413
/**
414
 * xmlGetEntityFromTable:
415
 * @table:  an entity table
416
 * @name:  the entity name
417
 * @parameter:  look for parameter entities
418
 *
419
 * Do an entity lookup in the table.
420
 * returns the corresponding parameter entity, if found.
421
 *
422
 * Returns A pointer to the entity structure or NULL if not found.
423
 */
424
static xmlEntityPtr
425
1.05M
xmlGetEntityFromTable(xmlEntitiesTablePtr table, const xmlChar *name) {
426
1.05M
    return((xmlEntityPtr) xmlHashLookup(table, name));
427
1.05M
}
428
429
/**
430
 * xmlGetParameterEntity:
431
 * @doc:  the document referencing the entity
432
 * @name:  the entity name
433
 *
434
 * Do an entity lookup in the internal and external subsets and
435
 * returns the corresponding parameter entity, if found.
436
 *
437
 * Returns A pointer to the entity structure or NULL if not found.
438
 */
439
xmlEntityPtr
440
130k
xmlGetParameterEntity(xmlDocPtr doc, const xmlChar *name) {
441
130k
    xmlEntitiesTablePtr table;
442
130k
    xmlEntityPtr ret;
443
444
130k
    if (doc == NULL)
445
661
  return(NULL);
446
130k
    if ((doc->intSubset != NULL) && (doc->intSubset->pentities != NULL)) {
447
123k
  table = (xmlEntitiesTablePtr) doc->intSubset->pentities;
448
123k
  ret = xmlGetEntityFromTable(table, name);
449
123k
  if (ret != NULL)
450
86.2k
      return(ret);
451
123k
    }
452
43.9k
    if ((doc->extSubset != NULL) && (doc->extSubset->pentities != NULL)) {
453
11.6k
  table = (xmlEntitiesTablePtr) doc->extSubset->pentities;
454
11.6k
  return(xmlGetEntityFromTable(table, name));
455
11.6k
    }
456
32.2k
    return(NULL);
457
43.9k
}
458
459
/**
460
 * xmlGetDtdEntity:
461
 * @doc:  the document referencing the entity
462
 * @name:  the entity name
463
 *
464
 * Do an entity lookup in the DTD entity hash table and
465
 * returns the corresponding entity, if found.
466
 * Note: the first argument is the document node, not the DTD node.
467
 *
468
 * Returns A pointer to the entity structure or NULL if not found.
469
 */
470
xmlEntityPtr
471
0
xmlGetDtdEntity(xmlDocPtr doc, const xmlChar *name) {
472
0
    xmlEntitiesTablePtr table;
473
474
0
    if (doc == NULL)
475
0
  return(NULL);
476
0
    if ((doc->extSubset != NULL) && (doc->extSubset->entities != NULL)) {
477
0
  table = (xmlEntitiesTablePtr) doc->extSubset->entities;
478
0
  return(xmlGetEntityFromTable(table, name));
479
0
    }
480
0
    return(NULL);
481
0
}
482
483
/**
484
 * xmlGetDocEntity:
485
 * @doc:  the document referencing the entity
486
 * @name:  the entity name
487
 *
488
 * Do an entity lookup in the document entity hash table and
489
 * returns the corresponding entity, otherwise a lookup is done
490
 * in the predefined entities too.
491
 *
492
 * Returns A pointer to the entity structure or NULL if not found.
493
 */
494
xmlEntityPtr
495
918k
xmlGetDocEntity(const xmlDoc *doc, const xmlChar *name) {
496
918k
    xmlEntityPtr cur;
497
918k
    xmlEntitiesTablePtr table;
498
499
918k
    if (doc != NULL) {
500
914k
  if ((doc->intSubset != NULL) && (doc->intSubset->entities != NULL)) {
501
861k
      table = (xmlEntitiesTablePtr) doc->intSubset->entities;
502
861k
      cur = xmlGetEntityFromTable(table, name);
503
861k
      if (cur != NULL)
504
760k
    return(cur);
505
861k
  }
506
153k
  if (doc->standalone != 1) {
507
153k
      if ((doc->extSubset != NULL) &&
508
65.4k
    (doc->extSubset->entities != NULL)) {
509
63.7k
    table = (xmlEntitiesTablePtr) doc->extSubset->entities;
510
63.7k
    cur = xmlGetEntityFromTable(table, name);
511
63.7k
    if (cur != NULL)
512
331
        return(cur);
513
63.7k
      }
514
153k
  }
515
153k
    }
516
158k
    return(xmlGetPredefinedEntity(name));
517
918k
}
518
519
/*
520
 * xmlSerializeHexCharRef:
521
 * @buf:  a char buffer
522
 * @val:  a codepoint
523
 *
524
 * Serializes a hex char ref like &#xA0;
525
 *
526
 * Writes at most 9 bytes. Does not include a terminating zero byte.
527
 *
528
 * Returns the number of bytes written.
529
 */
530
int
531
1.58k
xmlSerializeHexCharRef(char *buf, int val) {
532
1.58k
    char *out = buf;
533
1.58k
    int shift = 0, bits;
534
535
1.58k
    *out++ = '&';
536
1.58k
    *out++ = '#';
537
1.58k
    *out++ = 'x';
538
539
1.58k
    bits = val;
540
1.58k
    if (bits & 0xFF0000) {
541
149
        shift = 16;
542
149
        bits &= 0xFF0000;
543
1.43k
    } else if (bits & 0x00FF00) {
544
997
        shift = 8;
545
997
        bits &= 0x00FF00;
546
997
    }
547
1.58k
    if (bits & 0xF0F0F0) {
548
480
        shift += 4;
549
480
    }
550
551
4.65k
    do {
552
4.65k
        int d = (val >> shift) & 0x0F;
553
554
4.65k
        if (d < 10)
555
2.81k
            *out++ = '0' + d;
556
1.83k
        else
557
1.83k
            *out++ = 'A' + (d - 10);
558
559
4.65k
  shift -= 4;
560
4.65k
    } while (shift >= 0);
561
562
1.58k
    *out++ = ';';
563
564
1.58k
    return(out - buf);
565
1.58k
}
566
567
/*
568
 * xmlSerializeDecCharRef:
569
 * @buf:  a char buffer
570
 * @val:  a codepoint
571
 *
572
 * Serializes a decimal char ref like &#38;
573
 *
574
 * Writes at most 10 bytes. Does not include a terminating zero byte.
575
 *
576
 * Returns the number of bytes written.
577
 */
578
int
579
114M
xmlSerializeDecCharRef(char *buf, int val) {
580
114M
    char *out = buf;
581
114M
    int len, i;
582
583
114M
    *out++ = '&';
584
114M
    *out++ = '#';
585
586
114M
    if (val < 100) {
587
1.79k
        len = (val < 10) ? 1 : 2;
588
114M
    } else if (val < 10000) {
589
114M
        len = (val < 1000) ? 3 : 4;
590
114M
    } else if (val < 1000000) {
591
4.54k
        len = (val < 100000) ? 5 : 6;
592
4.54k
    } else {
593
67
        len = 7;
594
67
    }
595
596
466M
    for (i = len - 1; i >= 0; i--) {
597
351M
        out[i] = '0' + val % 10;
598
351M
        val /= 10;
599
351M
    }
600
601
114M
    out[len] = ';';
602
603
114M
    return(len + 3);
604
114M
}
605
606
static const char xmlEscapeSafe[128] = {
607
    0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 0, 0, 0, 0,
608
    0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
609
    1, 1, 0, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1,
610
    1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 0, 1,
611
    1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
612
    1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
613
    1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
614
    1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1
615
};
616
617
/*
618
 * xmlEscapeText:
619
 * @text:  input text
620
 * @flags:  XML_ESCAPE flags
621
 *
622
 * Escapes certain characters with char refs.
623
 *
624
 * XML_ESCAPE_ATTR: for attribute content.
625
 * XML_ESCAPE_NON_ASCII: escape non-ASCII chars.
626
 * XML_ESCAPE_HTML: for HTML content.
627
 * XML_ESCAPE_QUOT: escape double quotes.
628
 * XML_ESCAPE_ALLOW_INVALID: allow invalid characters.
629
 *
630
 * Returns an escaped string or NULL if a memory allocation failed.
631
 */
632
xmlChar *
633
75.8k
xmlEscapeText(const xmlChar *text, int flags) {
634
75.8k
    const xmlChar *cur;
635
75.8k
    xmlChar *buffer;
636
75.8k
    xmlChar *out;
637
75.8k
    const xmlChar *unescaped;
638
75.8k
    size_t size = 50;
639
640
75.8k
    buffer = xmlMalloc(size + 1);
641
75.8k
    if (buffer == NULL)
642
59
        return(NULL);
643
75.8k
    out = buffer;
644
645
75.8k
    cur = text;
646
75.8k
    unescaped = cur;
647
648
263k
    while (*cur != '\0') {
649
188k
        char buf[12];
650
188k
  const xmlChar *end;
651
188k
        const xmlChar *repl;
652
188k
        size_t used;
653
188k
        size_t replSize;
654
188k
        size_t unescapedSize;
655
188k
        size_t totalSize;
656
188k
        int chunkSize = 1;
657
188k
        int c;
658
659
        /* accelerator */
660
182M
  while (1) {
661
182M
            c = *cur;
662
663
182M
            if (c < 0x80) {
664
10.5M
                if (!xmlEscapeSafe[*cur])
665
188k
                    break;
666
171M
            } else {
667
171M
               if (flags & XML_ESCAPE_NON_ASCII)
668
0
                   break;
669
171M
            }
670
182M
            cur += 1;
671
182M
        }
672
673
188k
        if (c == 0) {
674
73.1k
            chunkSize = 0;
675
73.1k
            repl = BAD_CAST "";
676
73.1k
            replSize = 0;
677
115k
        } else if (c == '<') {
678
      /*
679
       * Special handling of server side include in HTML attributes
680
       */
681
10.9k
      if ((flags & XML_ESCAPE_HTML) && (flags & XML_ESCAPE_ATTR) &&
682
10.4k
          (cur[1] == '!') && (cur[2] == '-') && (cur[3] == '-') &&
683
1.07k
          ((end = xmlStrstr(cur, BAD_CAST "-->")) != NULL)) {
684
974
                chunkSize = (end - cur) + 3;
685
974
                repl = cur;
686
974
                replSize = chunkSize;
687
9.99k
      } else {
688
9.99k
                repl = BAD_CAST "&lt;";
689
9.99k
                replSize = 4;
690
9.99k
            }
691
104k
  } else if (c == '>') {
692
38.0k
            repl = BAD_CAST "&gt;";
693
38.0k
            replSize = 4;
694
66.0k
  } else if (c == '&') {
695
      /*
696
       * Special handling of &{...} construct from HTML 4, see
697
       * http://www.w3.org/TR/html401/appendix/notes.html#h-B.7.1
698
       */
699
5.92k
      if ((flags & XML_ESCAPE_HTML) && (flags & XML_ESCAPE_ATTR) &&
700
5.51k
                (cur[1] == '{') && (end = xmlStrchr(cur, '}'))) {
701
2.46k
                chunkSize = (end - cur) + 1;
702
2.46k
                repl = cur;
703
2.46k
                replSize = chunkSize;
704
3.45k
      } else {
705
3.45k
                repl = BAD_CAST "&amp;";
706
3.45k
                replSize = 5;
707
3.45k
            }
708
60.1k
  } else if ((flags & XML_ESCAPE_QUOT) && (c == '"')) {
709
0
            repl = BAD_CAST "&quot;";
710
0
            replSize = 6;
711
60.1k
  } else if (((flags & XML_ESCAPE_HTML) == 0) && (c == '\r')) {
712
0
      repl = BAD_CAST "&#13;";
713
0
            replSize = 5;
714
60.1k
  } else if ((flags & XML_ESCAPE_NON_ASCII) && (c >= 0x80)) {
715
0
            int val;
716
717
0
            chunkSize = 4;
718
0
            val = xmlGetUTF8Char(cur, &chunkSize);
719
0
            if (val < 0) {
720
0
                val = 0xFFFD;
721
0
                chunkSize = 1;
722
0
            } else if (((flags & XML_ESCAPE_ALLOW_INVALID) == 0) &&
723
0
                       (!IS_CHAR(val))) {
724
0
                val = 0xFFFD;
725
0
            }
726
727
0
            replSize = xmlSerializeHexCharRef(buf, val);
728
0
            repl = BAD_CAST buf;
729
60.1k
  } else if ((flags & (XML_ESCAPE_ALLOW_INVALID | XML_ESCAPE_HTML)) ||
730
0
                   (c >= 0x20) ||
731
60.1k
             (c == '\n') || (c == '\t') || (c == '\r')) {
732
      /* default case, just copy */
733
60.1k
            cur += 1;
734
60.1k
            if (*cur != 0)
735
59.3k
                continue;
736
737
763
            chunkSize = 0;
738
763
            repl = BAD_CAST "";
739
763
            replSize = 0;
740
763
  } else {
741
            /* ignore */
742
0
            repl = BAD_CAST "";
743
0
            replSize = 0;
744
0
        }
745
746
128k
        used = out - buffer;
747
128k
        unescapedSize = cur - unescaped;
748
128k
        totalSize = unescapedSize + replSize;
749
750
128k
  cur += chunkSize;
751
752
128k
        if (totalSize > size - used) {
753
15.5k
            xmlChar *tmp;
754
15.5k
            int newSize;
755
756
15.5k
            if ((size > (SIZE_MAX - 1) / 2) ||
757
15.5k
                (totalSize > (SIZE_MAX - 1) / 2 - size)) {
758
0
                xmlFree(buffer);
759
0
                return(NULL);
760
0
            }
761
15.5k
            newSize = size + totalSize;
762
15.5k
            if (*cur != 0)
763
8.64k
                newSize *= 2;
764
15.5k
            tmp = xmlRealloc(buffer, newSize + 1);
765
15.5k
            if (tmp == NULL) {
766
3
                xmlFree(buffer);
767
3
                return(NULL);
768
3
            }
769
15.5k
            buffer = tmp;
770
15.5k
            size = newSize;
771
15.5k
            out = buffer + used;
772
15.5k
        }
773
774
128k
        memcpy(out, unescaped, unescapedSize);
775
128k
        out += unescapedSize;
776
128k
        memcpy(out, repl, replSize);
777
128k
        out += replSize;
778
779
128k
        unescaped = cur;
780
128k
    }
781
782
75.8k
    *out = 0;
783
75.8k
    return(buffer);
784
75.8k
}
785
786
/**
787
 * xmlEncodeEntitiesInternal:
788
 * @doc:  the document containing the string
789
 * @input:  A string to convert to XML.
790
 * @flags:  XML_ESCAPE flags
791
 *
792
 * Do a global encoding of a string, replacing the predefined entities
793
 * and non ASCII values with their entities and CharRef counterparts.
794
 * Contrary to xmlEncodeEntities, this routine is reentrant, and result
795
 * must be deallocated.
796
 *
797
 * Returns A newly allocated string with the substitution done.
798
 */
799
xmlChar *
800
xmlEncodeEntitiesInternal(xmlDocPtr doc, const xmlChar *input,
801
75.8k
                          unsigned flags) {
802
75.8k
    if (input == NULL)
803
0
        return(NULL);
804
805
75.8k
    if ((doc != NULL) && (doc->type == XML_HTML_DOCUMENT_NODE))
806
75.8k
        flags |= XML_ESCAPE_HTML;
807
0
    else if ((doc == NULL) || (doc->encoding == NULL))
808
0
        flags |= XML_ESCAPE_NON_ASCII;
809
810
75.8k
    return(xmlEscapeText(input, flags));
811
75.8k
}
812
813
/**
814
 * xmlEncodeEntitiesReentrant:
815
 * @doc:  the document containing the string
816
 * @input:  A string to convert to XML.
817
 *
818
 * Do a global encoding of a string, replacing the predefined entities
819
 * and non ASCII values with their entities and CharRef counterparts.
820
 * Contrary to xmlEncodeEntities, this routine is reentrant, and result
821
 * must be deallocated.
822
 *
823
 * This escapes '<', '>', '&' and '\r'. If the document has no encoding,
824
 * non-ASCII codepoints are escaped. There is some special handling for
825
 * HTML documents.
826
 *
827
 * Returns A newly allocated string with the substitution done.
828
 */
829
xmlChar *
830
43.4k
xmlEncodeEntitiesReentrant(xmlDocPtr doc, const xmlChar *input) {
831
43.4k
    return xmlEncodeEntitiesInternal(doc, input, 0);
832
43.4k
}
833
834
/**
835
 * xmlEncodeSpecialChars:
836
 * @doc:  unused
837
 * @input:  A string to convert to XML.
838
 *
839
 * Do a global encoding of a string, replacing the predefined entities
840
 * this routine is reentrant, and result must be deallocated.
841
 *
842
 * This escapes '<', '>', '&', '"' and '\r' chars.
843
 *
844
 * Returns A newly allocated string with the substitution done.
845
 */
846
xmlChar *
847
xmlEncodeSpecialChars(const xmlDoc *doc ATTRIBUTE_UNUSED,
848
0
                      const xmlChar *input) {
849
0
    if (input == NULL)
850
0
        return(NULL);
851
852
0
    return(xmlEscapeText(input, XML_ESCAPE_QUOT | XML_ESCAPE_ALLOW_INVALID));
853
0
}
854
855
/**
856
 * xmlCreateEntitiesTable:
857
 *
858
 * create and initialize an empty entities hash table.
859
 * This really doesn't make sense and should be deprecated
860
 *
861
 * Returns the xmlEntitiesTablePtr just created or NULL in case of error.
862
 */
863
xmlEntitiesTablePtr
864
0
xmlCreateEntitiesTable(void) {
865
0
    return((xmlEntitiesTablePtr) xmlHashCreate(0));
866
0
}
867
868
/**
869
 * xmlFreeEntityWrapper:
870
 * @entity:  An entity
871
 * @name:  its name
872
 *
873
 * Deallocate the memory used by an entities in the hash table.
874
 */
875
static void
876
136k
xmlFreeEntityWrapper(void *entity, const xmlChar *name ATTRIBUTE_UNUSED) {
877
136k
    if (entity != NULL)
878
136k
  xmlFreeEntity((xmlEntityPtr) entity);
879
136k
}
880
881
/**
882
 * xmlFreeEntitiesTable:
883
 * @table:  An entity table
884
 *
885
 * Deallocate the memory used by an entities hash table.
886
 */
887
void
888
82.6k
xmlFreeEntitiesTable(xmlEntitiesTablePtr table) {
889
82.6k
    xmlHashFree(table, xmlFreeEntityWrapper);
890
82.6k
}
891
892
/**
893
 * xmlCopyEntity:
894
 * @ent:  An entity
895
 *
896
 * Build a copy of an entity
897
 *
898
 * Returns the new xmlEntitiesPtr or NULL in case of error.
899
 */
900
static void *
901
0
xmlCopyEntity(void *payload, const xmlChar *name ATTRIBUTE_UNUSED) {
902
0
    xmlEntityPtr ent = (xmlEntityPtr) payload;
903
0
    xmlEntityPtr cur;
904
905
0
    cur = (xmlEntityPtr) xmlMalloc(sizeof(xmlEntity));
906
0
    if (cur == NULL)
907
0
  return(NULL);
908
0
    memset(cur, 0, sizeof(xmlEntity));
909
0
    cur->type = XML_ENTITY_DECL;
910
911
0
    cur->etype = ent->etype;
912
0
    if (ent->name != NULL) {
913
0
  cur->name = xmlStrdup(ent->name);
914
0
        if (cur->name == NULL)
915
0
            goto error;
916
0
    }
917
0
    if (ent->ExternalID != NULL) {
918
0
  cur->ExternalID = xmlStrdup(ent->ExternalID);
919
0
        if (cur->ExternalID == NULL)
920
0
            goto error;
921
0
    }
922
0
    if (ent->SystemID != NULL) {
923
0
  cur->SystemID = xmlStrdup(ent->SystemID);
924
0
        if (cur->SystemID == NULL)
925
0
            goto error;
926
0
    }
927
0
    if (ent->content != NULL) {
928
0
  cur->content = xmlStrdup(ent->content);
929
0
        if (cur->content == NULL)
930
0
            goto error;
931
0
    }
932
0
    if (ent->orig != NULL) {
933
0
  cur->orig = xmlStrdup(ent->orig);
934
0
        if (cur->orig == NULL)
935
0
            goto error;
936
0
    }
937
0
    if (ent->URI != NULL) {
938
0
  cur->URI = xmlStrdup(ent->URI);
939
0
        if (cur->URI == NULL)
940
0
            goto error;
941
0
    }
942
0
    return(cur);
943
944
0
error:
945
0
    xmlFreeEntity(cur);
946
0
    return(NULL);
947
0
}
948
949
/**
950
 * xmlCopyEntitiesTable:
951
 * @table:  An entity table
952
 *
953
 * Build a copy of an entity table.
954
 *
955
 * Returns the new xmlEntitiesTablePtr or NULL in case of error.
956
 */
957
xmlEntitiesTablePtr
958
0
xmlCopyEntitiesTable(xmlEntitiesTablePtr table) {
959
0
    return(xmlHashCopySafe(table, xmlCopyEntity, xmlFreeEntityWrapper));
960
0
}
961
962
#ifdef LIBXML_OUTPUT_ENABLED
963
964
/**
965
 * xmlDumpEntityDecl:
966
 * @buf:  An XML buffer.
967
 * @ent:  An entity table
968
 *
969
 * This will dump the content of the entity table as an XML DTD definition
970
 */
971
void
972
0
xmlDumpEntityDecl(xmlBufferPtr buf, xmlEntityPtr ent) {
973
0
    xmlSaveCtxtPtr save;
974
975
0
    if ((buf == NULL) || (ent == NULL))
976
0
        return;
977
978
0
    save = xmlSaveToBuffer(buf, NULL, 0);
979
0
    xmlSaveTree(save, (xmlNodePtr) ent);
980
0
    if (xmlSaveFinish(save) != XML_ERR_OK)
981
0
        xmlFree(xmlBufferDetach(buf));
982
0
}
983
984
/**
985
 * xmlDumpEntityDeclScan:
986
 * @ent:  An entity table
987
 * @buf:  An XML buffer.
988
 *
989
 * When using the hash table scan function, arguments need to be reversed
990
 */
991
static void
992
xmlDumpEntityDeclScan(void *ent, void *save,
993
0
                      const xmlChar *name ATTRIBUTE_UNUSED) {
994
0
    xmlSaveTree(save, ent);
995
0
}
996
997
/**
998
 * xmlDumpEntitiesTable:
999
 * @buf:  An XML buffer.
1000
 * @table:  An entity table
1001
 *
1002
 * This will dump the content of the entity table as an XML DTD definition
1003
 */
1004
void
1005
0
xmlDumpEntitiesTable(xmlBufferPtr buf, xmlEntitiesTablePtr table) {
1006
0
    xmlSaveCtxtPtr save;
1007
1008
0
    if ((buf == NULL) || (table == NULL))
1009
0
        return;
1010
1011
0
    save = xmlSaveToBuffer(buf, NULL, 0);
1012
0
    xmlHashScan(table, xmlDumpEntityDeclScan, save);
1013
0
    if (xmlSaveFinish(save) != XML_ERR_OK)
1014
0
        xmlFree(xmlBufferDetach(buf));
1015
0
}
1016
#endif /* LIBXML_OUTPUT_ENABLED */