Coverage Report

Created: 2025-08-03 06:44

/src/libxml2/entities.c
Line
Count
Source (jump to first uncovered line)
1
/*
2
 * entities.c : implementation for the XML entities handling
3
 *
4
 * See Copyright for the status of this software.
5
 *
6
 * daniel@veillard.com
7
 */
8
9
/* To avoid EBCDIC trouble when parsing on zOS */
10
#if defined(__MVS__)
11
#pragma convert("ISO8859-1")
12
#endif
13
14
#define IN_LIBXML
15
#include "libxml.h"
16
17
#include <string.h>
18
#include <stdlib.h>
19
20
#include <libxml/xmlmemory.h>
21
#include <libxml/hash.h>
22
#include <libxml/entities.h>
23
#include <libxml/parser.h>
24
#include <libxml/parserInternals.h>
25
#include <libxml/xmlerror.h>
26
#include <libxml/dict.h>
27
#include <libxml/xmlsave.h>
28
29
#include "private/entities.h"
30
#include "private/error.h"
31
32
#ifndef SIZE_MAX
33
  #define SIZE_MAX ((size_t) -1)
34
#endif
35
36
/*
37
 * The XML predefined entities.
38
 */
39
40
static xmlEntity xmlEntityLt = {
41
    NULL, XML_ENTITY_DECL, BAD_CAST "lt",
42
    NULL, NULL, NULL, NULL, NULL, NULL,
43
    BAD_CAST "<", BAD_CAST "<", 1,
44
    XML_INTERNAL_PREDEFINED_ENTITY,
45
    NULL, NULL, NULL, NULL, 0, 0, 0
46
};
47
static xmlEntity xmlEntityGt = {
48
    NULL, XML_ENTITY_DECL, BAD_CAST "gt",
49
    NULL, NULL, NULL, NULL, NULL, NULL,
50
    BAD_CAST ">", BAD_CAST ">", 1,
51
    XML_INTERNAL_PREDEFINED_ENTITY,
52
    NULL, NULL, NULL, NULL, 0, 0, 0
53
};
54
static xmlEntity xmlEntityAmp = {
55
    NULL, XML_ENTITY_DECL, BAD_CAST "amp",
56
    NULL, NULL, NULL, NULL, NULL, NULL,
57
    BAD_CAST "&", BAD_CAST "&", 1,
58
    XML_INTERNAL_PREDEFINED_ENTITY,
59
    NULL, NULL, NULL, NULL, 0, 0, 0
60
};
61
static xmlEntity xmlEntityQuot = {
62
    NULL, XML_ENTITY_DECL, BAD_CAST "quot",
63
    NULL, NULL, NULL, NULL, NULL, NULL,
64
    BAD_CAST "\"", BAD_CAST "\"", 1,
65
    XML_INTERNAL_PREDEFINED_ENTITY,
66
    NULL, NULL, NULL, NULL, 0, 0, 0
67
};
68
static xmlEntity xmlEntityApos = {
69
    NULL, XML_ENTITY_DECL, BAD_CAST "apos",
70
    NULL, NULL, NULL, NULL, NULL, NULL,
71
    BAD_CAST "'", BAD_CAST "'", 1,
72
    XML_INTERNAL_PREDEFINED_ENTITY,
73
    NULL, NULL, NULL, NULL, 0, 0, 0
74
};
75
76
/*
77
 * xmlFreeEntity:
78
 * @entity:  an entity
79
 *
80
 * Frees the entity.
81
 */
82
void
83
xmlFreeEntity(xmlEntityPtr entity)
84
153k
{
85
153k
    xmlDictPtr dict = NULL;
86
87
153k
    if (entity == NULL)
88
0
        return;
89
90
153k
    if (entity->doc != NULL)
91
153k
        dict = entity->doc->dict;
92
93
94
153k
    if ((entity->children) &&
95
153k
        (entity == (xmlEntityPtr) entity->children->parent))
96
2.53k
        xmlFreeNodeList(entity->children);
97
153k
    if ((entity->name != NULL) &&
98
153k
        ((dict == NULL) || (!xmlDictOwns(dict, entity->name))))
99
15.2k
        xmlFree((char *) entity->name);
100
153k
    if (entity->ExternalID != NULL)
101
15.1k
        xmlFree((char *) entity->ExternalID);
102
153k
    if (entity->SystemID != NULL)
103
59.2k
        xmlFree((char *) entity->SystemID);
104
153k
    if (entity->URI != NULL)
105
57.4k
        xmlFree((char *) entity->URI);
106
153k
    if (entity->content != NULL)
107
93.7k
        xmlFree((char *) entity->content);
108
153k
    if (entity->orig != NULL)
109
89.9k
        xmlFree((char *) entity->orig);
110
153k
    xmlFree(entity);
111
153k
}
112
113
/*
114
 * xmlCreateEntity:
115
 *
116
 * internal routine doing the entity node structures allocations
117
 */
118
static xmlEntityPtr
119
xmlCreateEntity(xmlDocPtr doc, const xmlChar *name, int type,
120
          const xmlChar *ExternalID, const xmlChar *SystemID,
121
153k
          const xmlChar *content) {
122
153k
    xmlEntityPtr ret;
123
124
153k
    ret = (xmlEntityPtr) xmlMalloc(sizeof(xmlEntity));
125
153k
    if (ret == NULL)
126
11
  return(NULL);
127
153k
    memset(ret, 0, sizeof(xmlEntity));
128
153k
    ret->doc = doc;
129
153k
    ret->type = XML_ENTITY_DECL;
130
131
    /*
132
     * fill the structure.
133
     */
134
153k
    ret->etype = (xmlEntityType) type;
135
153k
    if ((doc == NULL) || (doc->dict == NULL))
136
15.3k
  ret->name = xmlStrdup(name);
137
138k
    else
138
138k
        ret->name = xmlDictLookup(doc->dict, name, -1);
139
153k
    if (ret->name == NULL)
140
1
        goto error;
141
153k
    if (ExternalID != NULL) {
142
15.1k
        ret->ExternalID = xmlStrdup(ExternalID);
143
15.1k
        if (ret->ExternalID == NULL)
144
2
            goto error;
145
15.1k
    }
146
153k
    if (SystemID != NULL) {
147
59.2k
        ret->SystemID = xmlStrdup(SystemID);
148
59.2k
        if (ret->SystemID == NULL)
149
2
            goto error;
150
59.2k
    }
151
153k
    if (content != NULL) {
152
93.0k
        ret->length = xmlStrlen(content);
153
93.0k
  ret->content = xmlStrndup(content, ret->length);
154
93.0k
        if (ret->content == NULL)
155
2
            goto error;
156
93.0k
     } else {
157
60.4k
        ret->length = 0;
158
60.4k
        ret->content = NULL;
159
60.4k
    }
160
153k
    ret->URI = NULL; /* to be computed by the layer knowing
161
      the defining entity */
162
153k
    ret->orig = NULL;
163
164
153k
    return(ret);
165
166
7
error:
167
7
    xmlFreeEntity(ret);
168
7
    return(NULL);
169
153k
}
170
171
/**
172
 * xmlAddEntity:
173
 * @doc:  the document
174
 * @extSubset:  add to the external or internal subset
175
 * @name:  the entity name
176
 * @type:  the entity type XML_xxx_yyy_ENTITY
177
 * @ExternalID:  the entity external ID if available
178
 * @SystemID:  the entity system ID if available
179
 * @content:  the entity content
180
 * @out:  pointer to resulting entity (optional)
181
 *
182
 * Register a new entity for this document.
183
 *
184
 * Available since 2.13.0.
185
 *
186
 * Returns an xmlParserErrors error code.
187
 */
188
int
189
xmlAddEntity(xmlDocPtr doc, int extSubset, const xmlChar *name, int type,
190
    const xmlChar *ExternalID, const xmlChar *SystemID,
191
156k
    const xmlChar *content, xmlEntityPtr *out) {
192
156k
    xmlDtdPtr dtd;
193
156k
    xmlDictPtr dict = NULL;
194
156k
    xmlEntitiesTablePtr table = NULL;
195
156k
    xmlEntityPtr ret, predef;
196
156k
    int res;
197
198
156k
    if (out != NULL)
199
156k
        *out = NULL;
200
156k
    if ((doc == NULL) || (name == NULL))
201
0
  return(XML_ERR_ARGUMENT);
202
156k
    dict = doc->dict;
203
204
156k
    if (extSubset)
205
7.54k
        dtd = doc->extSubset;
206
149k
    else
207
149k
        dtd = doc->intSubset;
208
156k
    if (dtd == NULL)
209
0
        return(XML_DTD_NO_DTD);
210
211
156k
    switch (type) {
212
29.6k
        case XML_INTERNAL_GENERAL_ENTITY:
213
45.4k
        case XML_EXTERNAL_GENERAL_PARSED_ENTITY:
214
45.6k
        case XML_EXTERNAL_GENERAL_UNPARSED_ENTITY:
215
45.6k
            predef = xmlGetPredefinedEntity(name);
216
45.6k
            if (predef != NULL) {
217
3.80k
                int valid = 0;
218
219
                /* 4.6 Predefined Entities */
220
3.80k
                if ((type == XML_INTERNAL_GENERAL_ENTITY) &&
221
3.80k
                    (content != NULL)) {
222
3.05k
                    int c = predef->content[0];
223
224
3.05k
                    if (((content[0] == c) && (content[1] == 0)) &&
225
3.05k
                        ((c == '>') || (c == '\'') || (c == '"'))) {
226
187
                        valid = 1;
227
2.86k
                    } else if ((content[0] == '&') && (content[1] == '#')) {
228
934
                        if (content[2] == 'x') {
229
331
                            xmlChar *hex = BAD_CAST "0123456789ABCDEF";
230
331
                            xmlChar ref[] = "00;";
231
232
331
                            ref[0] = hex[c / 16 % 16];
233
331
                            ref[1] = hex[c % 16];
234
331
                            if (xmlStrcasecmp(&content[3], ref) == 0)
235
0
                                valid = 1;
236
603
                        } else {
237
603
                            xmlChar ref[] = "00;";
238
239
603
                            ref[0] = '0' + c / 10 % 10;
240
603
                            ref[1] = '0' + c % 10;
241
603
                            if (xmlStrEqual(&content[2], ref))
242
267
                                valid = 1;
243
603
                        }
244
934
                    }
245
3.05k
                }
246
3.80k
                if (!valid)
247
3.34k
                    return(XML_ERR_REDECL_PREDEF_ENTITY);
248
3.80k
            }
249
42.3k
      if (dtd->entities == NULL) {
250
30.8k
    dtd->entities = xmlHashCreateDict(0, dict);
251
30.8k
                if (dtd->entities == NULL)
252
5
                    return(XML_ERR_NO_MEMORY);
253
30.8k
            }
254
42.3k
      table = dtd->entities;
255
42.3k
      break;
256
67.1k
        case XML_INTERNAL_PARAMETER_ENTITY:
257
111k
        case XML_EXTERNAL_PARAMETER_ENTITY:
258
111k
      if (dtd->pentities == NULL) {
259
37.8k
    dtd->pentities = xmlHashCreateDict(0, dict);
260
37.8k
                if (dtd->pentities == NULL)
261
2
                    return(XML_ERR_NO_MEMORY);
262
37.8k
            }
263
111k
      table = dtd->pentities;
264
111k
      break;
265
0
        default:
266
0
      return(XML_ERR_ARGUMENT);
267
156k
    }
268
153k
    ret = xmlCreateEntity(dtd->doc, name, type, ExternalID, SystemID, content);
269
153k
    if (ret == NULL)
270
18
        return(XML_ERR_NO_MEMORY);
271
272
153k
    res = xmlHashAdd(table, name, ret);
273
153k
    if (res < 0) {
274
6
        xmlFreeEntity(ret);
275
6
        return(XML_ERR_NO_MEMORY);
276
153k
    } else if (res == 0) {
277
  /*
278
   * entity was already defined at another level.
279
   */
280
3.07k
        xmlFreeEntity(ret);
281
3.07k
  return(XML_WAR_ENTITY_REDEFINED);
282
3.07k
    }
283
284
    /*
285
     * Link it to the DTD
286
     */
287
150k
    ret->parent = dtd;
288
150k
    ret->doc = dtd->doc;
289
150k
    if (dtd->last == NULL) {
290
55.7k
  dtd->children = dtd->last = (xmlNodePtr) ret;
291
94.7k
    } else {
292
94.7k
  dtd->last->next = (xmlNodePtr) ret;
293
94.7k
  ret->prev = dtd->last;
294
94.7k
  dtd->last = (xmlNodePtr) ret;
295
94.7k
    }
296
297
150k
    if (out != NULL)
298
150k
        *out = ret;
299
150k
    return(0);
300
153k
}
301
302
/**
303
 * xmlGetPredefinedEntity:
304
 * @name:  the entity name
305
 *
306
 * Check whether this name is an predefined entity.
307
 *
308
 * Returns NULL if not, otherwise the entity
309
 */
310
xmlEntityPtr
311
2.28M
xmlGetPredefinedEntity(const xmlChar *name) {
312
2.28M
    if (name == NULL) return(NULL);
313
2.28M
    switch (name[0]) {
314
22.2k
        case 'l':
315
22.2k
      if (xmlStrEqual(name, BAD_CAST "lt"))
316
17.2k
          return(&xmlEntityLt);
317
5.01k
      break;
318
53.3k
        case 'g':
319
53.3k
      if (xmlStrEqual(name, BAD_CAST "gt"))
320
44.8k
          return(&xmlEntityGt);
321
8.45k
      break;
322
886k
        case 'a':
323
886k
      if (xmlStrEqual(name, BAD_CAST "amp"))
324
63.0k
          return(&xmlEntityAmp);
325
823k
      if (xmlStrEqual(name, BAD_CAST "apos"))
326
565
          return(&xmlEntityApos);
327
823k
      break;
328
823k
        case 'q':
329
646k
      if (xmlStrEqual(name, BAD_CAST "quot"))
330
837
          return(&xmlEntityQuot);
331
646k
      break;
332
675k
  default:
333
675k
      break;
334
2.28M
    }
335
2.15M
    return(NULL);
336
2.28M
}
337
338
/**
339
 * xmlAddDtdEntity:
340
 * @doc:  the document
341
 * @name:  the entity name
342
 * @type:  the entity type XML_xxx_yyy_ENTITY
343
 * @ExternalID:  the entity external ID if available
344
 * @SystemID:  the entity system ID if available
345
 * @content:  the entity content
346
 *
347
 * Register a new entity for this document DTD external subset.
348
 *
349
 * Returns a pointer to the entity or NULL in case of error
350
 */
351
xmlEntityPtr
352
xmlAddDtdEntity(xmlDocPtr doc, const xmlChar *name, int type,
353
          const xmlChar *ExternalID, const xmlChar *SystemID,
354
0
    const xmlChar *content) {
355
0
    xmlEntityPtr ret;
356
357
0
    xmlAddEntity(doc, 1, name, type, ExternalID, SystemID, content, &ret);
358
0
    return(ret);
359
0
}
360
361
/**
362
 * xmlAddDocEntity:
363
 * @doc:  the document
364
 * @name:  the entity name
365
 * @type:  the entity type XML_xxx_yyy_ENTITY
366
 * @ExternalID:  the entity external ID if available
367
 * @SystemID:  the entity system ID if available
368
 * @content:  the entity content
369
 *
370
 * Register a new entity for this document.
371
 *
372
 * Returns a pointer to the entity or NULL in case of error
373
 */
374
xmlEntityPtr
375
xmlAddDocEntity(xmlDocPtr doc, const xmlChar *name, int type,
376
          const xmlChar *ExternalID, const xmlChar *SystemID,
377
0
          const xmlChar *content) {
378
0
    xmlEntityPtr ret;
379
380
0
    xmlAddEntity(doc, 0, name, type, ExternalID, SystemID, content, &ret);
381
0
    return(ret);
382
0
}
383
384
/**
385
 * xmlNewEntity:
386
 * @doc:  the document
387
 * @name:  the entity name
388
 * @type:  the entity type XML_xxx_yyy_ENTITY
389
 * @ExternalID:  the entity external ID if available
390
 * @SystemID:  the entity system ID if available
391
 * @content:  the entity content
392
 *
393
 * Create a new entity, this differs from xmlAddDocEntity() that if
394
 * the document is NULL or has no internal subset defined, then an
395
 * unlinked entity structure will be returned, it is then the responsibility
396
 * of the caller to link it to the document later or free it when not needed
397
 * anymore.
398
 *
399
 * Returns a pointer to the entity or NULL in case of error
400
 */
401
xmlEntityPtr
402
xmlNewEntity(xmlDocPtr doc, const xmlChar *name, int type,
403
       const xmlChar *ExternalID, const xmlChar *SystemID,
404
0
       const xmlChar *content) {
405
0
    if ((doc != NULL) && (doc->intSubset != NULL)) {
406
0
  return(xmlAddDocEntity(doc, name, type, ExternalID, SystemID, content));
407
0
    }
408
0
    if (name == NULL)
409
0
        return(NULL);
410
0
    return(xmlCreateEntity(doc, name, type, ExternalID, SystemID, content));
411
0
}
412
413
/**
414
 * xmlGetEntityFromTable:
415
 * @table:  an entity table
416
 * @name:  the entity name
417
 * @parameter:  look for parameter entities
418
 *
419
 * Do an entity lookup in the table.
420
 * returns the corresponding parameter entity, if found.
421
 *
422
 * Returns A pointer to the entity structure or NULL if not found.
423
 */
424
static xmlEntityPtr
425
1.01M
xmlGetEntityFromTable(xmlEntitiesTablePtr table, const xmlChar *name) {
426
1.01M
    return((xmlEntityPtr) xmlHashLookup(table, name));
427
1.01M
}
428
429
/**
430
 * xmlGetParameterEntity:
431
 * @doc:  the document referencing the entity
432
 * @name:  the entity name
433
 *
434
 * Do an entity lookup in the internal and external subsets and
435
 * returns the corresponding parameter entity, if found.
436
 *
437
 * Returns A pointer to the entity structure or NULL if not found.
438
 */
439
xmlEntityPtr
440
186k
xmlGetParameterEntity(xmlDocPtr doc, const xmlChar *name) {
441
186k
    xmlEntitiesTablePtr table;
442
186k
    xmlEntityPtr ret;
443
444
186k
    if (doc == NULL)
445
647
  return(NULL);
446
186k
    if ((doc->intSubset != NULL) && (doc->intSubset->pentities != NULL)) {
447
179k
  table = (xmlEntitiesTablePtr) doc->intSubset->pentities;
448
179k
  ret = xmlGetEntityFromTable(table, name);
449
179k
  if (ret != NULL)
450
143k
      return(ret);
451
179k
    }
452
43.2k
    if ((doc->extSubset != NULL) && (doc->extSubset->pentities != NULL)) {
453
8.36k
  table = (xmlEntitiesTablePtr) doc->extSubset->pentities;
454
8.36k
  return(xmlGetEntityFromTable(table, name));
455
8.36k
    }
456
34.8k
    return(NULL);
457
43.2k
}
458
459
/**
460
 * xmlGetDtdEntity:
461
 * @doc:  the document referencing the entity
462
 * @name:  the entity name
463
 *
464
 * Do an entity lookup in the DTD entity hash table and
465
 * returns the corresponding entity, if found.
466
 * Note: the first argument is the document node, not the DTD node.
467
 *
468
 * Returns A pointer to the entity structure or NULL if not found.
469
 */
470
xmlEntityPtr
471
0
xmlGetDtdEntity(xmlDocPtr doc, const xmlChar *name) {
472
0
    xmlEntitiesTablePtr table;
473
474
0
    if (doc == NULL)
475
0
  return(NULL);
476
0
    if ((doc->extSubset != NULL) && (doc->extSubset->entities != NULL)) {
477
0
  table = (xmlEntitiesTablePtr) doc->extSubset->entities;
478
0
  return(xmlGetEntityFromTable(table, name));
479
0
    }
480
0
    return(NULL);
481
0
}
482
483
/**
484
 * xmlGetDocEntity:
485
 * @doc:  the document referencing the entity
486
 * @name:  the entity name
487
 *
488
 * Do an entity lookup in the document entity hash table and
489
 * returns the corresponding entity, otherwise a lookup is done
490
 * in the predefined entities too.
491
 *
492
 * Returns A pointer to the entity structure or NULL if not found.
493
 */
494
xmlEntityPtr
495
930k
xmlGetDocEntity(const xmlDoc *doc, const xmlChar *name) {
496
930k
    xmlEntityPtr cur;
497
930k
    xmlEntitiesTablePtr table;
498
499
930k
    if (doc != NULL) {
500
927k
  if ((doc->intSubset != NULL) && (doc->intSubset->entities != NULL)) {
501
746k
      table = (xmlEntitiesTablePtr) doc->intSubset->entities;
502
746k
      cur = xmlGetEntityFromTable(table, name);
503
746k
      if (cur != NULL)
504
573k
    return(cur);
505
746k
  }
506
354k
  if (doc->standalone != 1) {
507
354k
      if ((doc->extSubset != NULL) &&
508
354k
    (doc->extSubset->entities != NULL)) {
509
84.7k
    table = (xmlEntitiesTablePtr) doc->extSubset->entities;
510
84.7k
    cur = xmlGetEntityFromTable(table, name);
511
84.7k
    if (cur != NULL)
512
324
        return(cur);
513
84.7k
      }
514
354k
  }
515
354k
    }
516
356k
    return(xmlGetPredefinedEntity(name));
517
930k
}
518
519
/*
520
 * xmlSerializeHexCharRef:
521
 * @buf:  a char buffer
522
 * @val:  a codepoint
523
 *
524
 * Serializes a hex char ref like &#xA0;
525
 *
526
 * Writes at most 9 bytes. Does not include a terminating zero byte.
527
 *
528
 * Returns the number of bytes written.
529
 */
530
int
531
1.61k
xmlSerializeHexCharRef(char *buf, int val) {
532
1.61k
    char *out = buf;
533
1.61k
    int shift = 0, bits;
534
535
1.61k
    *out++ = '&';
536
1.61k
    *out++ = '#';
537
1.61k
    *out++ = 'x';
538
539
1.61k
    bits = val;
540
1.61k
    if (bits & 0xFF0000) {
541
39
        shift = 16;
542
39
        bits &= 0xFF0000;
543
1.57k
    } else if (bits & 0x00FF00) {
544
389
        shift = 8;
545
389
        bits &= 0x00FF00;
546
389
    }
547
1.61k
    if (bits & 0xF0F0F0) {
548
1.18k
        shift += 4;
549
1.18k
    }
550
551
3.73k
    do {
552
3.73k
        int d = (val >> shift) & 0x0F;
553
554
3.73k
        if (d < 10)
555
1.74k
            *out++ = '0' + d;
556
1.99k
        else
557
1.99k
            *out++ = 'A' + (d - 10);
558
559
3.73k
  shift -= 4;
560
3.73k
    } while (shift >= 0);
561
562
1.61k
    *out++ = ';';
563
564
1.61k
    return(out - buf);
565
1.61k
}
566
567
/*
568
 * xmlSerializeDecCharRef:
569
 * @buf:  a char buffer
570
 * @val:  a codepoint
571
 *
572
 * Serializes a decimal char ref like &#38;
573
 *
574
 * Writes at most 10 bytes. Does not include a terminating zero byte.
575
 *
576
 * Returns the number of bytes written.
577
 */
578
int
579
50.1M
xmlSerializeDecCharRef(char *buf, int val) {
580
50.1M
    char *out = buf;
581
50.1M
    int len, i;
582
583
50.1M
    *out++ = '&';
584
50.1M
    *out++ = '#';
585
586
50.1M
    if (val < 100) {
587
100
        len = (val < 10) ? 1 : 2;
588
50.1M
    } else if (val < 10000) {
589
50.1M
        len = (val < 1000) ? 3 : 4;
590
50.1M
    } else if (val < 1000000) {
591
3.86k
        len = (val < 100000) ? 5 : 6;
592
3.86k
    } else {
593
251
        len = 7;
594
251
    }
595
596
200M
    for (i = len - 1; i >= 0; i--) {
597
150M
        out[i] = '0' + val % 10;
598
150M
        val /= 10;
599
150M
    }
600
601
50.1M
    out[len] = ';';
602
603
50.1M
    return(len + 3);
604
50.1M
}
605
606
static const char xmlEscapeSafe[128] = {
607
    0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 0, 0, 0, 0,
608
    0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
609
    1, 1, 0, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1,
610
    1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 0, 1,
611
    1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
612
    1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
613
    1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
614
    1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1
615
};
616
617
/*
618
 * xmlEscapeText:
619
 * @text:  input text
620
 * @flags:  XML_ESCAPE flags
621
 *
622
 * Escapes certain characters with char refs.
623
 *
624
 * XML_ESCAPE_ATTR: for attribute content.
625
 * XML_ESCAPE_NON_ASCII: escape non-ASCII chars.
626
 * XML_ESCAPE_HTML: for HTML content.
627
 * XML_ESCAPE_QUOT: escape double quotes.
628
 * XML_ESCAPE_ALLOW_INVALID: allow invalid characters.
629
 *
630
 * Returns an escaped string or NULL if a memory allocation failed.
631
 */
632
xmlChar *
633
99.2k
xmlEscapeText(const xmlChar *text, int flags) {
634
99.2k
    const xmlChar *cur;
635
99.2k
    xmlChar *buffer;
636
99.2k
    xmlChar *out;
637
99.2k
    const xmlChar *unescaped;
638
99.2k
    size_t size = 50;
639
640
99.2k
    buffer = xmlMalloc(size + 1);
641
99.2k
    if (buffer == NULL)
642
66
        return(NULL);
643
99.1k
    out = buffer;
644
645
99.1k
    cur = text;
646
99.1k
    unescaped = cur;
647
648
396k
    while (*cur != '\0') {
649
297k
        char buf[12];
650
297k
  const xmlChar *end;
651
297k
        const xmlChar *repl;
652
297k
        size_t used;
653
297k
        size_t replSize;
654
297k
        size_t unescapedSize;
655
297k
        size_t totalSize;
656
297k
        int chunkSize = 1;
657
297k
        int c;
658
659
        /* accelerator */
660
214M
  while (1) {
661
214M
            c = *cur;
662
663
214M
            if (c < 0x80) {
664
36.6M
                if (!xmlEscapeSafe[*cur])
665
297k
                    break;
666
177M
            } else {
667
177M
               if (flags & XML_ESCAPE_NON_ASCII)
668
0
                   break;
669
177M
            }
670
214M
            cur += 1;
671
214M
        }
672
673
297k
        if (c == 0) {
674
96.3k
            chunkSize = 0;
675
96.3k
            repl = BAD_CAST "";
676
96.3k
            replSize = 0;
677
201k
        } else if (c == '<') {
678
      /*
679
       * Special handling of server side include in HTML attributes
680
       */
681
40.7k
      if ((flags & XML_ESCAPE_HTML) && (flags & XML_ESCAPE_ATTR) &&
682
40.7k
          (cur[1] == '!') && (cur[2] == '-') && (cur[3] == '-') &&
683
40.7k
          ((end = xmlStrstr(cur, BAD_CAST "-->")) != NULL)) {
684
1.97k
                chunkSize = (end - cur) + 3;
685
1.97k
                repl = cur;
686
1.97k
                replSize = chunkSize;
687
38.8k
      } else {
688
38.8k
                repl = BAD_CAST "&lt;";
689
38.8k
                replSize = 4;
690
38.8k
            }
691
160k
  } else if (c == '>') {
692
60.2k
            repl = BAD_CAST "&gt;";
693
60.2k
            replSize = 4;
694
100k
  } else if (c == '&') {
695
      /*
696
       * Special handling of &{...} construct from HTML 4, see
697
       * http://www.w3.org/TR/html401/appendix/notes.html#h-B.7.1
698
       */
699
11.4k
      if ((flags & XML_ESCAPE_HTML) && (flags & XML_ESCAPE_ATTR) &&
700
11.4k
                (cur[1] == '{') && (end = xmlStrchr(cur, '}'))) {
701
3.54k
                chunkSize = (end - cur) + 1;
702
3.54k
                repl = cur;
703
3.54k
                replSize = chunkSize;
704
7.89k
      } else {
705
7.89k
                repl = BAD_CAST "&amp;";
706
7.89k
                replSize = 5;
707
7.89k
            }
708
88.8k
  } else if ((flags & XML_ESCAPE_QUOT) && (c == '"')) {
709
0
            repl = BAD_CAST "&quot;";
710
0
            replSize = 6;
711
88.8k
  } else if (((flags & XML_ESCAPE_HTML) == 0) && (c == '\r')) {
712
0
      repl = BAD_CAST "&#13;";
713
0
            replSize = 5;
714
88.8k
  } else if ((flags & XML_ESCAPE_NON_ASCII) && (c >= 0x80)) {
715
0
            int val;
716
717
0
            chunkSize = 4;
718
0
            val = xmlGetUTF8Char(cur, &chunkSize);
719
0
            if (val < 0) {
720
0
                val = 0xFFFD;
721
0
                chunkSize = 1;
722
0
            } else if (((flags & XML_ESCAPE_ALLOW_INVALID) == 0) &&
723
0
                       (!IS_CHAR(val))) {
724
0
                val = 0xFFFD;
725
0
            }
726
727
0
            replSize = xmlSerializeHexCharRef(buf, val);
728
0
            repl = BAD_CAST buf;
729
88.8k
  } else if ((flags & (XML_ESCAPE_ALLOW_INVALID | XML_ESCAPE_HTML)) ||
730
88.8k
                   (c >= 0x20) ||
731
88.8k
             (c == '\n') || (c == '\t') || (c == '\r')) {
732
      /* default case, just copy */
733
88.8k
            cur += 1;
734
88.8k
            if (*cur != 0)
735
88.3k
                continue;
736
737
462
            chunkSize = 0;
738
462
            repl = BAD_CAST "";
739
462
            replSize = 0;
740
462
  } else {
741
            /* ignore */
742
0
            repl = BAD_CAST "";
743
0
            replSize = 0;
744
0
        }
745
746
209k
        used = out - buffer;
747
209k
        unescapedSize = cur - unescaped;
748
209k
        totalSize = unescapedSize + replSize;
749
750
209k
  cur += chunkSize;
751
752
209k
        if (totalSize > size - used) {
753
33.7k
            xmlChar *tmp;
754
33.7k
            int newSize;
755
756
33.7k
            if ((size > (SIZE_MAX - 1) / 2) ||
757
33.7k
                (totalSize > (SIZE_MAX - 1) / 2 - size)) {
758
0
                xmlFree(buffer);
759
0
                return(NULL);
760
0
            }
761
33.7k
            newSize = size + totalSize;
762
33.7k
            if (*cur != 0)
763
9.68k
                newSize *= 2;
764
33.7k
            tmp = xmlRealloc(buffer, newSize + 1);
765
33.7k
            if (tmp == NULL) {
766
6
                xmlFree(buffer);
767
6
                return(NULL);
768
6
            }
769
33.7k
            buffer = tmp;
770
33.7k
            size = newSize;
771
33.7k
            out = buffer + used;
772
33.7k
        }
773
774
209k
        memcpy(out, unescaped, unescapedSize);
775
209k
        out += unescapedSize;
776
209k
        memcpy(out, repl, replSize);
777
209k
        out += replSize;
778
779
209k
        unescaped = cur;
780
209k
    }
781
782
99.1k
    *out = 0;
783
99.1k
    return(buffer);
784
99.1k
}
785
786
/**
787
 * xmlEncodeEntitiesInternal:
788
 * @doc:  the document containing the string
789
 * @input:  A string to convert to XML.
790
 * @flags:  XML_ESCAPE flags
791
 *
792
 * Do a global encoding of a string, replacing the predefined entities
793
 * and non ASCII values with their entities and CharRef counterparts.
794
 * Contrary to xmlEncodeEntities, this routine is reentrant, and result
795
 * must be deallocated.
796
 *
797
 * Returns A newly allocated string with the substitution done.
798
 */
799
xmlChar *
800
xmlEncodeEntitiesInternal(xmlDocPtr doc, const xmlChar *input,
801
99.2k
                          unsigned flags) {
802
99.2k
    if (input == NULL)
803
0
        return(NULL);
804
805
99.2k
    if ((doc != NULL) && (doc->type == XML_HTML_DOCUMENT_NODE))
806
99.2k
        flags |= XML_ESCAPE_HTML;
807
0
    else if ((doc == NULL) || (doc->encoding == NULL))
808
0
        flags |= XML_ESCAPE_NON_ASCII;
809
810
99.2k
    return(xmlEscapeText(input, flags));
811
99.2k
}
812
813
/**
814
 * xmlEncodeEntitiesReentrant:
815
 * @doc:  the document containing the string
816
 * @input:  A string to convert to XML.
817
 *
818
 * Do a global encoding of a string, replacing the predefined entities
819
 * and non ASCII values with their entities and CharRef counterparts.
820
 * Contrary to xmlEncodeEntities, this routine is reentrant, and result
821
 * must be deallocated.
822
 *
823
 * This escapes '<', '>', '&' and '\r'. If the document has no encoding,
824
 * non-ASCII codepoints are escaped. There is some special handling for
825
 * HTML documents.
826
 *
827
 * Returns A newly allocated string with the substitution done.
828
 */
829
xmlChar *
830
66.6k
xmlEncodeEntitiesReentrant(xmlDocPtr doc, const xmlChar *input) {
831
66.6k
    return xmlEncodeEntitiesInternal(doc, input, 0);
832
66.6k
}
833
834
/**
835
 * xmlEncodeSpecialChars:
836
 * @doc:  unused
837
 * @input:  A string to convert to XML.
838
 *
839
 * Do a global encoding of a string, replacing the predefined entities
840
 * this routine is reentrant, and result must be deallocated.
841
 *
842
 * This escapes '<', '>', '&', '"' and '\r' chars.
843
 *
844
 * Returns A newly allocated string with the substitution done.
845
 */
846
xmlChar *
847
xmlEncodeSpecialChars(const xmlDoc *doc ATTRIBUTE_UNUSED,
848
0
                      const xmlChar *input) {
849
0
    if (input == NULL)
850
0
        return(NULL);
851
852
0
    return(xmlEscapeText(input, XML_ESCAPE_QUOT | XML_ESCAPE_ALLOW_INVALID));
853
0
}
854
855
/**
856
 * xmlCreateEntitiesTable:
857
 *
858
 * create and initialize an empty entities hash table.
859
 * This really doesn't make sense and should be deprecated
860
 *
861
 * Returns the xmlEntitiesTablePtr just created or NULL in case of error.
862
 */
863
xmlEntitiesTablePtr
864
0
xmlCreateEntitiesTable(void) {
865
0
    return((xmlEntitiesTablePtr) xmlHashCreate(0));
866
0
}
867
868
/**
869
 * xmlFreeEntityWrapper:
870
 * @entity:  An entity
871
 * @name:  its name
872
 *
873
 * Deallocate the memory used by an entities in the hash table.
874
 */
875
static void
876
150k
xmlFreeEntityWrapper(void *entity, const xmlChar *name ATTRIBUTE_UNUSED) {
877
150k
    if (entity != NULL)
878
150k
  xmlFreeEntity((xmlEntityPtr) entity);
879
150k
}
880
881
/**
882
 * xmlFreeEntitiesTable:
883
 * @table:  An entity table
884
 *
885
 * Deallocate the memory used by an entities hash table.
886
 */
887
void
888
68.6k
xmlFreeEntitiesTable(xmlEntitiesTablePtr table) {
889
68.6k
    xmlHashFree(table, xmlFreeEntityWrapper);
890
68.6k
}
891
892
/**
893
 * xmlCopyEntity:
894
 * @ent:  An entity
895
 *
896
 * Build a copy of an entity
897
 *
898
 * Returns the new xmlEntitiesPtr or NULL in case of error.
899
 */
900
static void *
901
0
xmlCopyEntity(void *payload, const xmlChar *name ATTRIBUTE_UNUSED) {
902
0
    xmlEntityPtr ent = (xmlEntityPtr) payload;
903
0
    xmlEntityPtr cur;
904
905
0
    cur = (xmlEntityPtr) xmlMalloc(sizeof(xmlEntity));
906
0
    if (cur == NULL)
907
0
  return(NULL);
908
0
    memset(cur, 0, sizeof(xmlEntity));
909
0
    cur->type = XML_ENTITY_DECL;
910
911
0
    cur->etype = ent->etype;
912
0
    if (ent->name != NULL) {
913
0
  cur->name = xmlStrdup(ent->name);
914
0
        if (cur->name == NULL)
915
0
            goto error;
916
0
    }
917
0
    if (ent->ExternalID != NULL) {
918
0
  cur->ExternalID = xmlStrdup(ent->ExternalID);
919
0
        if (cur->ExternalID == NULL)
920
0
            goto error;
921
0
    }
922
0
    if (ent->SystemID != NULL) {
923
0
  cur->SystemID = xmlStrdup(ent->SystemID);
924
0
        if (cur->SystemID == NULL)
925
0
            goto error;
926
0
    }
927
0
    if (ent->content != NULL) {
928
0
  cur->content = xmlStrdup(ent->content);
929
0
        if (cur->content == NULL)
930
0
            goto error;
931
0
    }
932
0
    if (ent->orig != NULL) {
933
0
  cur->orig = xmlStrdup(ent->orig);
934
0
        if (cur->orig == NULL)
935
0
            goto error;
936
0
    }
937
0
    if (ent->URI != NULL) {
938
0
  cur->URI = xmlStrdup(ent->URI);
939
0
        if (cur->URI == NULL)
940
0
            goto error;
941
0
    }
942
0
    return(cur);
943
944
0
error:
945
0
    xmlFreeEntity(cur);
946
0
    return(NULL);
947
0
}
948
949
/**
950
 * xmlCopyEntitiesTable:
951
 * @table:  An entity table
952
 *
953
 * Build a copy of an entity table.
954
 *
955
 * Returns the new xmlEntitiesTablePtr or NULL in case of error.
956
 */
957
xmlEntitiesTablePtr
958
0
xmlCopyEntitiesTable(xmlEntitiesTablePtr table) {
959
0
    return(xmlHashCopySafe(table, xmlCopyEntity, xmlFreeEntityWrapper));
960
0
}
961
962
#ifdef LIBXML_OUTPUT_ENABLED
963
964
/**
965
 * xmlDumpEntityDecl:
966
 * @buf:  An XML buffer.
967
 * @ent:  An entity table
968
 *
969
 * This will dump the content of the entity table as an XML DTD definition
970
 */
971
void
972
0
xmlDumpEntityDecl(xmlBufferPtr buf, xmlEntityPtr ent) {
973
0
    xmlSaveCtxtPtr save;
974
975
0
    if ((buf == NULL) || (ent == NULL))
976
0
        return;
977
978
0
    save = xmlSaveToBuffer(buf, NULL, 0);
979
0
    xmlSaveTree(save, (xmlNodePtr) ent);
980
0
    if (xmlSaveFinish(save) != XML_ERR_OK)
981
0
        xmlFree(xmlBufferDetach(buf));
982
0
}
983
984
/**
985
 * xmlDumpEntityDeclScan:
986
 * @ent:  An entity table
987
 * @buf:  An XML buffer.
988
 *
989
 * When using the hash table scan function, arguments need to be reversed
990
 */
991
static void
992
xmlDumpEntityDeclScan(void *ent, void *save,
993
0
                      const xmlChar *name ATTRIBUTE_UNUSED) {
994
0
    xmlSaveTree(save, ent);
995
0
}
996
997
/**
998
 * xmlDumpEntitiesTable:
999
 * @buf:  An XML buffer.
1000
 * @table:  An entity table
1001
 *
1002
 * This will dump the content of the entity table as an XML DTD definition
1003
 */
1004
void
1005
0
xmlDumpEntitiesTable(xmlBufferPtr buf, xmlEntitiesTablePtr table) {
1006
0
    xmlSaveCtxtPtr save;
1007
1008
0
    if ((buf == NULL) || (table == NULL))
1009
0
        return;
1010
1011
0
    save = xmlSaveToBuffer(buf, NULL, 0);
1012
0
    xmlHashScan(table, xmlDumpEntityDeclScan, save);
1013
0
    if (xmlSaveFinish(save) != XML_ERR_OK)
1014
0
        xmlFree(xmlBufferDetach(buf));
1015
0
}
1016
#endif /* LIBXML_OUTPUT_ENABLED */