Coverage Report

Created: 2025-12-14 06:33

next uncovered line (L), next uncovered region (R), next uncovered branch (B)
/src/libxml2/entities.c
Line
Count
Source
1
/*
2
 * entities.c : implementation for the XML entities handling
3
 *
4
 * See Copyright for the status of this software.
5
 *
6
 * daniel@veillard.com
7
 */
8
9
/* To avoid EBCDIC trouble when parsing on zOS */
10
#if defined(__MVS__)
11
#pragma convert("ISO8859-1")
12
#endif
13
14
#define IN_LIBXML
15
#include "libxml.h"
16
17
#include <string.h>
18
#include <stdlib.h>
19
20
#include <libxml/xmlmemory.h>
21
#include <libxml/hash.h>
22
#include <libxml/entities.h>
23
#include <libxml/parser.h>
24
#include <libxml/parserInternals.h>
25
#include <libxml/xmlerror.h>
26
#include <libxml/dict.h>
27
#include <libxml/xmlsave.h>
28
29
#include "private/entities.h"
30
#include "private/error.h"
31
32
#ifndef SIZE_MAX
33
  #define SIZE_MAX ((size_t) -1)
34
#endif
35
36
/*
37
 * The XML predefined entities.
38
 */
39
40
static xmlEntity xmlEntityLt = {
41
    NULL, XML_ENTITY_DECL, BAD_CAST "lt",
42
    NULL, NULL, NULL, NULL, NULL, NULL,
43
    BAD_CAST "<", BAD_CAST "<", 1,
44
    XML_INTERNAL_PREDEFINED_ENTITY,
45
    NULL, NULL, NULL, NULL, 0, 0, 0
46
};
47
static xmlEntity xmlEntityGt = {
48
    NULL, XML_ENTITY_DECL, BAD_CAST "gt",
49
    NULL, NULL, NULL, NULL, NULL, NULL,
50
    BAD_CAST ">", BAD_CAST ">", 1,
51
    XML_INTERNAL_PREDEFINED_ENTITY,
52
    NULL, NULL, NULL, NULL, 0, 0, 0
53
};
54
static xmlEntity xmlEntityAmp = {
55
    NULL, XML_ENTITY_DECL, BAD_CAST "amp",
56
    NULL, NULL, NULL, NULL, NULL, NULL,
57
    BAD_CAST "&", BAD_CAST "&", 1,
58
    XML_INTERNAL_PREDEFINED_ENTITY,
59
    NULL, NULL, NULL, NULL, 0, 0, 0
60
};
61
static xmlEntity xmlEntityQuot = {
62
    NULL, XML_ENTITY_DECL, BAD_CAST "quot",
63
    NULL, NULL, NULL, NULL, NULL, NULL,
64
    BAD_CAST "\"", BAD_CAST "\"", 1,
65
    XML_INTERNAL_PREDEFINED_ENTITY,
66
    NULL, NULL, NULL, NULL, 0, 0, 0
67
};
68
static xmlEntity xmlEntityApos = {
69
    NULL, XML_ENTITY_DECL, BAD_CAST "apos",
70
    NULL, NULL, NULL, NULL, NULL, NULL,
71
    BAD_CAST "'", BAD_CAST "'", 1,
72
    XML_INTERNAL_PREDEFINED_ENTITY,
73
    NULL, NULL, NULL, NULL, 0, 0, 0
74
};
75
76
/*
77
 * xmlFreeEntity:
78
 * @entity:  an entity
79
 *
80
 * Frees the entity.
81
 */
82
void
83
xmlFreeEntity(xmlEntityPtr entity)
84
123k
{
85
123k
    xmlDictPtr dict = NULL;
86
87
123k
    if (entity == NULL)
88
0
        return;
89
90
123k
    if (entity->doc != NULL)
91
123k
        dict = entity->doc->dict;
92
93
94
123k
    if ((entity->children) &&
95
1.42k
        (entity == (xmlEntityPtr) entity->children->parent))
96
1.42k
        xmlFreeNodeList(entity->children);
97
123k
    if ((entity->name != NULL) &&
98
123k
        ((dict == NULL) || (!xmlDictOwns(dict, entity->name))))
99
19.3k
        xmlFree((char *) entity->name);
100
123k
    if (entity->ExternalID != NULL)
101
12.3k
        xmlFree((char *) entity->ExternalID);
102
123k
    if (entity->SystemID != NULL)
103
40.7k
        xmlFree((char *) entity->SystemID);
104
123k
    if (entity->URI != NULL)
105
38.0k
        xmlFree((char *) entity->URI);
106
123k
    if (entity->content != NULL)
107
81.4k
        xmlFree((char *) entity->content);
108
123k
    if (entity->orig != NULL)
109
68.6k
        xmlFree((char *) entity->orig);
110
123k
    xmlFree(entity);
111
123k
}
112
113
/*
114
 * xmlCreateEntity:
115
 *
116
 * internal routine doing the entity node structures allocations
117
 */
118
static xmlEntityPtr
119
xmlCreateEntity(xmlDocPtr doc, const xmlChar *name, int type,
120
          const xmlChar *ExternalID, const xmlChar *SystemID,
121
123k
          const xmlChar *content) {
122
123k
    xmlEntityPtr ret;
123
124
123k
    ret = (xmlEntityPtr) xmlMalloc(sizeof(xmlEntity));
125
123k
    if (ret == NULL)
126
13
  return(NULL);
127
123k
    memset(ret, 0, sizeof(xmlEntity));
128
123k
    ret->doc = doc;
129
123k
    ret->type = XML_ENTITY_DECL;
130
131
    /*
132
     * fill the structure.
133
     */
134
123k
    ret->etype = (xmlEntityType) type;
135
123k
    if ((doc == NULL) || (doc->dict == NULL))
136
19.3k
  ret->name = xmlStrdup(name);
137
104k
    else
138
104k
        ret->name = xmlDictLookup(doc->dict, name, -1);
139
123k
    if (ret->name == NULL)
140
4
        goto error;
141
123k
    if (ExternalID != NULL) {
142
12.3k
        ret->ExternalID = xmlStrdup(ExternalID);
143
12.3k
        if (ret->ExternalID == NULL)
144
3
            goto error;
145
12.3k
    }
146
123k
    if (SystemID != NULL) {
147
40.7k
        ret->SystemID = xmlStrdup(SystemID);
148
40.7k
        if (ret->SystemID == NULL)
149
3
            goto error;
150
40.7k
    }
151
123k
    if (content != NULL) {
152
81.1k
        ret->length = xmlStrlen(content);
153
81.1k
  ret->content = xmlStrndup(content, ret->length);
154
81.1k
        if (ret->content == NULL)
155
5
            goto error;
156
81.1k
     } else {
157
42.3k
        ret->length = 0;
158
42.3k
        ret->content = NULL;
159
42.3k
    }
160
123k
    ret->URI = NULL; /* to be computed by the layer knowing
161
      the defining entity */
162
123k
    ret->orig = NULL;
163
164
123k
    return(ret);
165
166
15
error:
167
15
    xmlFreeEntity(ret);
168
15
    return(NULL);
169
123k
}
170
171
/**
172
 * xmlAddEntity:
173
 * @doc:  the document
174
 * @extSubset:  add to the external or internal subset
175
 * @name:  the entity name
176
 * @type:  the entity type XML_xxx_yyy_ENTITY
177
 * @ExternalID:  the entity external ID if available
178
 * @SystemID:  the entity system ID if available
179
 * @content:  the entity content
180
 * @out:  pointer to resulting entity (optional)
181
 *
182
 * Register a new entity for this document.
183
 *
184
 * Available since 2.13.0.
185
 *
186
 * Returns an xmlParserErrors error code.
187
 */
188
int
189
xmlAddEntity(xmlDocPtr doc, int extSubset, const xmlChar *name, int type,
190
    const xmlChar *ExternalID, const xmlChar *SystemID,
191
143k
    const xmlChar *content, xmlEntityPtr *out) {
192
143k
    xmlDtdPtr dtd;
193
143k
    xmlDictPtr dict = NULL;
194
143k
    xmlEntitiesTablePtr table = NULL;
195
143k
    xmlEntityPtr ret, predef;
196
143k
    int res;
197
198
143k
    if (out != NULL)
199
143k
        *out = NULL;
200
143k
    if ((doc == NULL) || (name == NULL))
201
0
  return(XML_ERR_ARGUMENT);
202
143k
    dict = doc->dict;
203
204
143k
    if (extSubset)
205
8.00k
        dtd = doc->extSubset;
206
135k
    else
207
135k
        dtd = doc->intSubset;
208
143k
    if (dtd == NULL)
209
0
        return(XML_DTD_NO_DTD);
210
211
143k
    switch (type) {
212
75.5k
        case XML_INTERNAL_GENERAL_ENTITY:
213
91.6k
        case XML_EXTERNAL_GENERAL_PARSED_ENTITY:
214
91.9k
        case XML_EXTERNAL_GENERAL_UNPARSED_ENTITY:
215
91.9k
            predef = xmlGetPredefinedEntity(name);
216
91.9k
            if (predef != NULL) {
217
25.9k
                int valid = 0;
218
219
                /* 4.6 Predefined Entities */
220
25.9k
                if ((type == XML_INTERNAL_GENERAL_ENTITY) &&
221
23.1k
                    (content != NULL)) {
222
22.9k
                    int c = predef->content[0];
223
224
22.9k
                    if (((content[0] == c) && (content[1] == 0)) &&
225
1.21k
                        ((c == '>') || (c == '\'') || (c == '"'))) {
226
989
                        valid = 1;
227
21.9k
                    } else if ((content[0] == '&') && (content[1] == '#')) {
228
13.1k
                        if (content[2] == 'x') {
229
11.0k
                            xmlChar *hex = BAD_CAST "0123456789ABCDEF";
230
11.0k
                            xmlChar ref[] = "00;";
231
232
11.0k
                            ref[0] = hex[c / 16 % 16];
233
11.0k
                            ref[1] = hex[c % 16];
234
11.0k
                            if (xmlStrcasecmp(&content[3], ref) == 0)
235
4.47k
                                valid = 1;
236
11.0k
                        } else {
237
2.08k
                            xmlChar ref[] = "00;";
238
239
2.08k
                            ref[0] = '0' + c / 10 % 10;
240
2.08k
                            ref[1] = '0' + c % 10;
241
2.08k
                            if (xmlStrEqual(&content[2], ref))
242
816
                                valid = 1;
243
2.08k
                        }
244
13.1k
                    }
245
22.9k
                }
246
25.9k
                if (!valid)
247
19.7k
                    return(XML_ERR_REDECL_PREDEF_ENTITY);
248
25.9k
            }
249
72.2k
      if (dtd->entities == NULL) {
250
36.7k
    dtd->entities = xmlHashCreateDict(0, dict);
251
36.7k
                if (dtd->entities == NULL)
252
3
                    return(XML_ERR_NO_MEMORY);
253
36.7k
            }
254
72.2k
      table = dtd->entities;
255
72.2k
      break;
256
22.8k
        case XML_INTERNAL_PARAMETER_ENTITY:
257
51.3k
        case XML_EXTERNAL_PARAMETER_ENTITY:
258
51.3k
      if (dtd->pentities == NULL) {
259
22.5k
    dtd->pentities = xmlHashCreateDict(0, dict);
260
22.5k
                if (dtd->pentities == NULL)
261
3
                    return(XML_ERR_NO_MEMORY);
262
22.5k
            }
263
51.3k
      table = dtd->pentities;
264
51.3k
      break;
265
0
        default:
266
0
      return(XML_ERR_ARGUMENT);
267
143k
    }
268
123k
    ret = xmlCreateEntity(dtd->doc, name, type, ExternalID, SystemID, content);
269
123k
    if (ret == NULL)
270
28
        return(XML_ERR_NO_MEMORY);
271
272
123k
    res = xmlHashAdd(table, name, ret);
273
123k
    if (res < 0) {
274
7
        xmlFreeEntity(ret);
275
7
        return(XML_ERR_NO_MEMORY);
276
123k
    } else if (res == 0) {
277
  /*
278
   * entity was already defined at another level.
279
   */
280
13.7k
        xmlFreeEntity(ret);
281
13.7k
  return(XML_WAR_ENTITY_REDEFINED);
282
13.7k
    }
283
284
    /*
285
     * Link it to the DTD
286
     */
287
109k
    ret->parent = dtd;
288
109k
    ret->doc = dtd->doc;
289
109k
    if (dtd->last == NULL) {
290
42.2k
  dtd->children = dtd->last = (xmlNodePtr) ret;
291
67.4k
    } else {
292
67.4k
  dtd->last->next = (xmlNodePtr) ret;
293
67.4k
  ret->prev = dtd->last;
294
67.4k
  dtd->last = (xmlNodePtr) ret;
295
67.4k
    }
296
297
109k
    if (out != NULL)
298
109k
        *out = ret;
299
109k
    return(0);
300
123k
}
301
302
/**
303
 * xmlGetPredefinedEntity:
304
 * @name:  the entity name
305
 *
306
 * Check whether this name is an predefined entity.
307
 *
308
 * Returns NULL if not, otherwise the entity
309
 */
310
xmlEntityPtr
311
3.02M
xmlGetPredefinedEntity(const xmlChar *name) {
312
3.02M
    if (name == NULL) return(NULL);
313
3.02M
    switch (name[0]) {
314
45.5k
        case 'l':
315
45.5k
      if (xmlStrEqual(name, BAD_CAST "lt"))
316
18.1k
          return(&xmlEntityLt);
317
27.4k
      break;
318
69.9k
        case 'g':
319
69.9k
      if (xmlStrEqual(name, BAD_CAST "gt"))
320
66.0k
          return(&xmlEntityGt);
321
3.86k
      break;
322
1.03M
        case 'a':
323
1.03M
      if (xmlStrEqual(name, BAD_CAST "amp"))
324
98.8k
          return(&xmlEntityAmp);
325
933k
      if (xmlStrEqual(name, BAD_CAST "apos"))
326
8.78k
          return(&xmlEntityApos);
327
924k
      break;
328
924k
        case 'q':
329
797k
      if (xmlStrEqual(name, BAD_CAST "quot"))
330
9.23k
          return(&xmlEntityQuot);
331
787k
      break;
332
1.07M
  default:
333
1.07M
      break;
334
3.02M
    }
335
2.82M
    return(NULL);
336
3.02M
}
337
338
/**
339
 * xmlAddDtdEntity:
340
 * @doc:  the document
341
 * @name:  the entity name
342
 * @type:  the entity type XML_xxx_yyy_ENTITY
343
 * @ExternalID:  the entity external ID if available
344
 * @SystemID:  the entity system ID if available
345
 * @content:  the entity content
346
 *
347
 * Register a new entity for this document DTD external subset.
348
 *
349
 * Returns a pointer to the entity or NULL in case of error
350
 */
351
xmlEntityPtr
352
xmlAddDtdEntity(xmlDocPtr doc, const xmlChar *name, int type,
353
          const xmlChar *ExternalID, const xmlChar *SystemID,
354
0
    const xmlChar *content) {
355
0
    xmlEntityPtr ret;
356
357
0
    xmlAddEntity(doc, 1, name, type, ExternalID, SystemID, content, &ret);
358
0
    return(ret);
359
0
}
360
361
/**
362
 * xmlAddDocEntity:
363
 * @doc:  the document
364
 * @name:  the entity name
365
 * @type:  the entity type XML_xxx_yyy_ENTITY
366
 * @ExternalID:  the entity external ID if available
367
 * @SystemID:  the entity system ID if available
368
 * @content:  the entity content
369
 *
370
 * Register a new entity for this document.
371
 *
372
 * Returns a pointer to the entity or NULL in case of error
373
 */
374
xmlEntityPtr
375
xmlAddDocEntity(xmlDocPtr doc, const xmlChar *name, int type,
376
          const xmlChar *ExternalID, const xmlChar *SystemID,
377
0
          const xmlChar *content) {
378
0
    xmlEntityPtr ret;
379
380
0
    xmlAddEntity(doc, 0, name, type, ExternalID, SystemID, content, &ret);
381
0
    return(ret);
382
0
}
383
384
/**
385
 * xmlNewEntity:
386
 * @doc:  the document
387
 * @name:  the entity name
388
 * @type:  the entity type XML_xxx_yyy_ENTITY
389
 * @ExternalID:  the entity external ID if available
390
 * @SystemID:  the entity system ID if available
391
 * @content:  the entity content
392
 *
393
 * Create a new entity, this differs from xmlAddDocEntity() that if
394
 * the document is NULL or has no internal subset defined, then an
395
 * unlinked entity structure will be returned, it is then the responsibility
396
 * of the caller to link it to the document later or free it when not needed
397
 * anymore.
398
 *
399
 * Returns a pointer to the entity or NULL in case of error
400
 */
401
xmlEntityPtr
402
xmlNewEntity(xmlDocPtr doc, const xmlChar *name, int type,
403
       const xmlChar *ExternalID, const xmlChar *SystemID,
404
0
       const xmlChar *content) {
405
0
    if ((doc != NULL) && (doc->intSubset != NULL)) {
406
0
  return(xmlAddDocEntity(doc, name, type, ExternalID, SystemID, content));
407
0
    }
408
0
    if (name == NULL)
409
0
        return(NULL);
410
0
    return(xmlCreateEntity(doc, name, type, ExternalID, SystemID, content));
411
0
}
412
413
/**
414
 * xmlGetEntityFromTable:
415
 * @table:  an entity table
416
 * @name:  the entity name
417
 * @parameter:  look for parameter entities
418
 *
419
 * Do an entity lookup in the table.
420
 * returns the corresponding parameter entity, if found.
421
 *
422
 * Returns A pointer to the entity structure or NULL if not found.
423
 */
424
static xmlEntityPtr
425
1.22M
xmlGetEntityFromTable(xmlEntitiesTablePtr table, const xmlChar *name) {
426
1.22M
    return((xmlEntityPtr) xmlHashLookup(table, name));
427
1.22M
}
428
429
/**
430
 * xmlGetParameterEntity:
431
 * @doc:  the document referencing the entity
432
 * @name:  the entity name
433
 *
434
 * Do an entity lookup in the internal and external subsets and
435
 * returns the corresponding parameter entity, if found.
436
 *
437
 * Returns A pointer to the entity structure or NULL if not found.
438
 */
439
xmlEntityPtr
440
85.1k
xmlGetParameterEntity(xmlDocPtr doc, const xmlChar *name) {
441
85.1k
    xmlEntitiesTablePtr table;
442
85.1k
    xmlEntityPtr ret;
443
444
85.1k
    if (doc == NULL)
445
494
  return(NULL);
446
84.6k
    if ((doc->intSubset != NULL) && (doc->intSubset->pentities != NULL)) {
447
78.2k
  table = (xmlEntitiesTablePtr) doc->intSubset->pentities;
448
78.2k
  ret = xmlGetEntityFromTable(table, name);
449
78.2k
  if (ret != NULL)
450
61.3k
      return(ret);
451
78.2k
    }
452
23.3k
    if ((doc->extSubset != NULL) && (doc->extSubset->pentities != NULL)) {
453
8.17k
  table = (xmlEntitiesTablePtr) doc->extSubset->pentities;
454
8.17k
  return(xmlGetEntityFromTable(table, name));
455
8.17k
    }
456
15.1k
    return(NULL);
457
23.3k
}
458
459
/**
460
 * xmlGetDtdEntity:
461
 * @doc:  the document referencing the entity
462
 * @name:  the entity name
463
 *
464
 * Do an entity lookup in the DTD entity hash table and
465
 * returns the corresponding entity, if found.
466
 * Note: the first argument is the document node, not the DTD node.
467
 *
468
 * Returns A pointer to the entity structure or NULL if not found.
469
 */
470
xmlEntityPtr
471
0
xmlGetDtdEntity(xmlDocPtr doc, const xmlChar *name) {
472
0
    xmlEntitiesTablePtr table;
473
474
0
    if (doc == NULL)
475
0
  return(NULL);
476
0
    if ((doc->extSubset != NULL) && (doc->extSubset->entities != NULL)) {
477
0
  table = (xmlEntitiesTablePtr) doc->extSubset->entities;
478
0
  return(xmlGetEntityFromTable(table, name));
479
0
    }
480
0
    return(NULL);
481
0
}
482
483
/**
484
 * xmlGetDocEntity:
485
 * @doc:  the document referencing the entity
486
 * @name:  the entity name
487
 *
488
 * Do an entity lookup in the document entity hash table and
489
 * returns the corresponding entity, otherwise a lookup is done
490
 * in the predefined entities too.
491
 *
492
 * Returns A pointer to the entity structure or NULL if not found.
493
 */
494
xmlEntityPtr
495
1.51M
xmlGetDocEntity(const xmlDoc *doc, const xmlChar *name) {
496
1.51M
    xmlEntityPtr cur;
497
1.51M
    xmlEntitiesTablePtr table;
498
499
1.51M
    if (doc != NULL) {
500
1.50M
  if ((doc->intSubset != NULL) && (doc->intSubset->entities != NULL)) {
501
1.05M
      table = (xmlEntitiesTablePtr) doc->intSubset->entities;
502
1.05M
      cur = xmlGetEntityFromTable(table, name);
503
1.05M
      if (cur != NULL)
504
920k
    return(cur);
505
1.05M
  }
506
581k
  if (doc->standalone != 1) {
507
581k
      if ((doc->extSubset != NULL) &&
508
84.9k
    (doc->extSubset->entities != NULL)) {
509
81.8k
    table = (xmlEntitiesTablePtr) doc->extSubset->entities;
510
81.8k
    cur = xmlGetEntityFromTable(table, name);
511
81.8k
    if (cur != NULL)
512
322
        return(cur);
513
81.8k
      }
514
581k
  }
515
581k
    }
516
591k
    return(xmlGetPredefinedEntity(name));
517
1.51M
}
518
519
/*
520
 * xmlSerializeHexCharRef:
521
 * @buf:  a char buffer
522
 * @val:  a codepoint
523
 *
524
 * Serializes a hex char ref like &#xA0;
525
 *
526
 * Writes at most 9 bytes. Does not include a terminating zero byte.
527
 *
528
 * Returns the number of bytes written.
529
 */
530
int
531
724
xmlSerializeHexCharRef(char *buf, int val) {
532
724
    char *out = buf;
533
724
    int shift = 0, bits;
534
535
724
    *out++ = '&';
536
724
    *out++ = '#';
537
724
    *out++ = 'x';
538
539
724
    bits = val;
540
724
    if (bits & 0xFF0000) {
541
53
        shift = 16;
542
53
        bits &= 0xFF0000;
543
671
    } else if (bits & 0x00FF00) {
544
110
        shift = 8;
545
110
        bits &= 0x00FF00;
546
110
    }
547
724
    if (bits & 0xF0F0F0) {
548
590
        shift += 4;
549
590
    }
550
551
1.74k
    do {
552
1.74k
        int d = (val >> shift) & 0x0F;
553
554
1.74k
        if (d < 10)
555
1.12k
            *out++ = '0' + d;
556
621
        else
557
621
            *out++ = 'A' + (d - 10);
558
559
1.74k
  shift -= 4;
560
1.74k
    } while (shift >= 0);
561
562
724
    *out++ = ';';
563
564
724
    return(out - buf);
565
724
}
566
567
/*
568
 * xmlSerializeDecCharRef:
569
 * @buf:  a char buffer
570
 * @val:  a codepoint
571
 *
572
 * Serializes a decimal char ref like &#38;
573
 *
574
 * Writes at most 10 bytes. Does not include a terminating zero byte.
575
 *
576
 * Returns the number of bytes written.
577
 */
578
int
579
112M
xmlSerializeDecCharRef(char *buf, int val) {
580
112M
    char *out = buf;
581
112M
    int len, i;
582
583
112M
    *out++ = '&';
584
112M
    *out++ = '#';
585
586
112M
    if (val < 100) {
587
911
        len = (val < 10) ? 1 : 2;
588
112M
    } else if (val < 10000) {
589
112M
        len = (val < 1000) ? 3 : 4;
590
112M
    } else if (val < 1000000) {
591
6.76k
        len = (val < 100000) ? 5 : 6;
592
6.76k
    } else {
593
120
        len = 7;
594
120
    }
595
596
462M
    for (i = len - 1; i >= 0; i--) {
597
349M
        out[i] = '0' + val % 10;
598
349M
        val /= 10;
599
349M
    }
600
601
112M
    out[len] = ';';
602
603
112M
    return(len + 3);
604
112M
}
605
606
static const char xmlEscapeSafe[128] = {
607
    0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 0, 0, 0, 0,
608
    0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
609
    1, 1, 0, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1,
610
    1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 0, 1,
611
    1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
612
    1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
613
    1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
614
    1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1
615
};
616
617
/*
618
 * xmlEscapeText:
619
 * @text:  input text
620
 * @flags:  XML_ESCAPE flags
621
 *
622
 * Escapes certain characters with char refs.
623
 *
624
 * XML_ESCAPE_ATTR: for attribute content.
625
 * XML_ESCAPE_NON_ASCII: escape non-ASCII chars.
626
 * XML_ESCAPE_HTML: for HTML content.
627
 * XML_ESCAPE_QUOT: escape double quotes.
628
 * XML_ESCAPE_ALLOW_INVALID: allow invalid characters.
629
 *
630
 * Returns an escaped string or NULL if a memory allocation failed.
631
 */
632
xmlChar *
633
63.7k
xmlEscapeText(const xmlChar *text, int flags) {
634
63.7k
    const xmlChar *cur;
635
63.7k
    xmlChar *buffer;
636
63.7k
    xmlChar *out;
637
63.7k
    const xmlChar *unescaped;
638
63.7k
    size_t size = 50;
639
640
63.7k
    buffer = xmlMalloc(size + 1);
641
63.7k
    if (buffer == NULL)
642
53
        return(NULL);
643
63.7k
    out = buffer;
644
645
63.7k
    cur = text;
646
63.7k
    unescaped = cur;
647
648
227k
    while (*cur != '\0') {
649
164k
        char buf[12];
650
164k
  const xmlChar *end;
651
164k
        const xmlChar *repl;
652
164k
        size_t used;
653
164k
        size_t replSize;
654
164k
        size_t unescapedSize;
655
164k
        size_t totalSize;
656
164k
        int chunkSize = 1;
657
164k
        int c;
658
659
        /* accelerator */
660
94.2M
  while (1) {
661
94.2M
            c = *cur;
662
663
94.2M
            if (c < 0x80) {
664
7.60M
                if (!xmlEscapeSafe[*cur])
665
164k
                    break;
666
86.6M
            } else {
667
86.6M
               if (flags & XML_ESCAPE_NON_ASCII)
668
0
                   break;
669
86.6M
            }
670
94.0M
            cur += 1;
671
94.0M
        }
672
673
164k
        if (c == 0) {
674
59.7k
            chunkSize = 0;
675
59.7k
            repl = BAD_CAST "";
676
59.7k
            replSize = 0;
677
104k
        } else if (c == '<') {
678
      /*
679
       * Special handling of server side include in HTML attributes
680
       */
681
7.54k
      if ((flags & XML_ESCAPE_HTML) && (flags & XML_ESCAPE_ATTR) &&
682
7.14k
          (cur[1] == '!') && (cur[2] == '-') && (cur[3] == '-') &&
683
622
          ((end = xmlStrstr(cur, BAD_CAST "-->")) != NULL)) {
684
430
                chunkSize = (end - cur) + 3;
685
430
                repl = cur;
686
430
                replSize = chunkSize;
687
7.11k
      } else {
688
7.11k
                repl = BAD_CAST "&lt;";
689
7.11k
                replSize = 4;
690
7.11k
            }
691
96.8k
  } else if (c == '>') {
692
33.4k
            repl = BAD_CAST "&gt;";
693
33.4k
            replSize = 4;
694
63.3k
  } else if (c == '&') {
695
      /*
696
       * Special handling of &{...} construct from HTML 4, see
697
       * http://www.w3.org/TR/html401/appendix/notes.html#h-B.7.1
698
       */
699
5.17k
      if ((flags & XML_ESCAPE_HTML) && (flags & XML_ESCAPE_ATTR) &&
700
4.78k
                (cur[1] == '{') && (end = xmlStrchr(cur, '}'))) {
701
3.19k
                chunkSize = (end - cur) + 1;
702
3.19k
                repl = cur;
703
3.19k
                replSize = chunkSize;
704
3.19k
      } else {
705
1.97k
                repl = BAD_CAST "&amp;";
706
1.97k
                replSize = 5;
707
1.97k
            }
708
58.2k
  } else if ((flags & XML_ESCAPE_QUOT) && (c == '"')) {
709
0
            repl = BAD_CAST "&quot;";
710
0
            replSize = 6;
711
58.2k
  } else if (((flags & XML_ESCAPE_HTML) == 0) && (c == '\r')) {
712
0
      repl = BAD_CAST "&#13;";
713
0
            replSize = 5;
714
58.2k
  } else if ((flags & XML_ESCAPE_NON_ASCII) && (c >= 0x80)) {
715
0
            int val;
716
717
0
            chunkSize = 4;
718
0
            val = xmlGetUTF8Char(cur, &chunkSize);
719
0
            if (val < 0) {
720
0
                val = 0xFFFD;
721
0
                chunkSize = 1;
722
0
            } else if (((flags & XML_ESCAPE_ALLOW_INVALID) == 0) &&
723
0
                       (!IS_CHAR(val))) {
724
0
                val = 0xFFFD;
725
0
            }
726
727
0
            replSize = xmlSerializeHexCharRef(buf, val);
728
0
            repl = BAD_CAST buf;
729
58.2k
  } else if ((flags & (XML_ESCAPE_ALLOW_INVALID | XML_ESCAPE_HTML)) ||
730
0
                   (c >= 0x20) ||
731
58.2k
             (c == '\n') || (c == '\t') || (c == '\r')) {
732
      /* default case, just copy */
733
58.2k
            cur += 1;
734
58.2k
            if (*cur != 0)
735
57.8k
                continue;
736
737
353
            chunkSize = 0;
738
353
            repl = BAD_CAST "";
739
353
            replSize = 0;
740
353
  } else {
741
            /* ignore */
742
0
            repl = BAD_CAST "";
743
0
            replSize = 0;
744
0
        }
745
746
106k
        used = out - buffer;
747
106k
        unescapedSize = cur - unescaped;
748
106k
        totalSize = unescapedSize + replSize;
749
750
106k
  cur += chunkSize;
751
752
106k
        if (totalSize > size - used) {
753
16.0k
            xmlChar *tmp;
754
16.0k
            int newSize;
755
756
16.0k
            if ((size > (SIZE_MAX - 1) / 2) ||
757
16.0k
                (totalSize > (SIZE_MAX - 1) / 2 - size)) {
758
0
                xmlFree(buffer);
759
0
                return(NULL);
760
0
            }
761
16.0k
            newSize = size + totalSize;
762
16.0k
            if (*cur != 0)
763
9.36k
                newSize *= 2;
764
16.0k
            tmp = xmlRealloc(buffer, newSize + 1);
765
16.0k
            if (tmp == NULL) {
766
4
                xmlFree(buffer);
767
4
                return(NULL);
768
4
            }
769
16.0k
            buffer = tmp;
770
16.0k
            size = newSize;
771
16.0k
            out = buffer + used;
772
16.0k
        }
773
774
106k
        memcpy(out, unescaped, unescapedSize);
775
106k
        out += unescapedSize;
776
106k
        memcpy(out, repl, replSize);
777
106k
        out += replSize;
778
779
106k
        unescaped = cur;
780
106k
    }
781
782
63.7k
    *out = 0;
783
63.7k
    return(buffer);
784
63.7k
}
785
786
/**
787
 * xmlEncodeEntitiesInternal:
788
 * @doc:  the document containing the string
789
 * @input:  A string to convert to XML.
790
 * @flags:  XML_ESCAPE flags
791
 *
792
 * Do a global encoding of a string, replacing the predefined entities
793
 * and non ASCII values with their entities and CharRef counterparts.
794
 * Contrary to xmlEncodeEntities, this routine is reentrant, and result
795
 * must be deallocated.
796
 *
797
 * Returns A newly allocated string with the substitution done.
798
 */
799
xmlChar *
800
xmlEncodeEntitiesInternal(xmlDocPtr doc, const xmlChar *input,
801
63.7k
                          unsigned flags) {
802
63.7k
    if (input == NULL)
803
0
        return(NULL);
804
805
63.7k
    if ((doc != NULL) && (doc->type == XML_HTML_DOCUMENT_NODE))
806
63.7k
        flags |= XML_ESCAPE_HTML;
807
0
    else if ((doc == NULL) || (doc->encoding == NULL))
808
0
        flags |= XML_ESCAPE_NON_ASCII;
809
810
63.7k
    return(xmlEscapeText(input, flags));
811
63.7k
}
812
813
/**
814
 * xmlEncodeEntitiesReentrant:
815
 * @doc:  the document containing the string
816
 * @input:  A string to convert to XML.
817
 *
818
 * Do a global encoding of a string, replacing the predefined entities
819
 * and non ASCII values with their entities and CharRef counterparts.
820
 * Contrary to xmlEncodeEntities, this routine is reentrant, and result
821
 * must be deallocated.
822
 *
823
 * This escapes '<', '>', '&' and '\r'. If the document has no encoding,
824
 * non-ASCII codepoints are escaped. There is some special handling for
825
 * HTML documents.
826
 *
827
 * Returns A newly allocated string with the substitution done.
828
 */
829
xmlChar *
830
38.6k
xmlEncodeEntitiesReentrant(xmlDocPtr doc, const xmlChar *input) {
831
38.6k
    return xmlEncodeEntitiesInternal(doc, input, 0);
832
38.6k
}
833
834
/**
835
 * xmlEncodeSpecialChars:
836
 * @doc:  unused
837
 * @input:  A string to convert to XML.
838
 *
839
 * Do a global encoding of a string, replacing the predefined entities
840
 * this routine is reentrant, and result must be deallocated.
841
 *
842
 * This escapes '<', '>', '&', '"' and '\r' chars.
843
 *
844
 * Returns A newly allocated string with the substitution done.
845
 */
846
xmlChar *
847
xmlEncodeSpecialChars(const xmlDoc *doc ATTRIBUTE_UNUSED,
848
0
                      const xmlChar *input) {
849
0
    if (input == NULL)
850
0
        return(NULL);
851
852
0
    return(xmlEscapeText(input, XML_ESCAPE_QUOT | XML_ESCAPE_ALLOW_INVALID));
853
0
}
854
855
/**
856
 * xmlCreateEntitiesTable:
857
 *
858
 * create and initialize an empty entities hash table.
859
 * This really doesn't make sense and should be deprecated
860
 *
861
 * Returns the xmlEntitiesTablePtr just created or NULL in case of error.
862
 */
863
xmlEntitiesTablePtr
864
0
xmlCreateEntitiesTable(void) {
865
0
    return((xmlEntitiesTablePtr) xmlHashCreate(0));
866
0
}
867
868
/**
869
 * xmlFreeEntityWrapper:
870
 * @entity:  An entity
871
 * @name:  its name
872
 *
873
 * Deallocate the memory used by an entities in the hash table.
874
 */
875
static void
876
109k
xmlFreeEntityWrapper(void *entity, const xmlChar *name ATTRIBUTE_UNUSED) {
877
109k
    if (entity != NULL)
878
109k
  xmlFreeEntity((xmlEntityPtr) entity);
879
109k
}
880
881
/**
882
 * xmlFreeEntitiesTable:
883
 * @table:  An entity table
884
 *
885
 * Deallocate the memory used by an entities hash table.
886
 */
887
void
888
59.3k
xmlFreeEntitiesTable(xmlEntitiesTablePtr table) {
889
59.3k
    xmlHashFree(table, xmlFreeEntityWrapper);
890
59.3k
}
891
892
/**
893
 * xmlCopyEntity:
894
 * @ent:  An entity
895
 *
896
 * Build a copy of an entity
897
 *
898
 * Returns the new xmlEntitiesPtr or NULL in case of error.
899
 */
900
static void *
901
0
xmlCopyEntity(void *payload, const xmlChar *name ATTRIBUTE_UNUSED) {
902
0
    xmlEntityPtr ent = (xmlEntityPtr) payload;
903
0
    xmlEntityPtr cur;
904
905
0
    cur = (xmlEntityPtr) xmlMalloc(sizeof(xmlEntity));
906
0
    if (cur == NULL)
907
0
  return(NULL);
908
0
    memset(cur, 0, sizeof(xmlEntity));
909
0
    cur->type = XML_ENTITY_DECL;
910
911
0
    cur->etype = ent->etype;
912
0
    if (ent->name != NULL) {
913
0
  cur->name = xmlStrdup(ent->name);
914
0
        if (cur->name == NULL)
915
0
            goto error;
916
0
    }
917
0
    if (ent->ExternalID != NULL) {
918
0
  cur->ExternalID = xmlStrdup(ent->ExternalID);
919
0
        if (cur->ExternalID == NULL)
920
0
            goto error;
921
0
    }
922
0
    if (ent->SystemID != NULL) {
923
0
  cur->SystemID = xmlStrdup(ent->SystemID);
924
0
        if (cur->SystemID == NULL)
925
0
            goto error;
926
0
    }
927
0
    if (ent->content != NULL) {
928
0
  cur->content = xmlStrdup(ent->content);
929
0
        if (cur->content == NULL)
930
0
            goto error;
931
0
    }
932
0
    if (ent->orig != NULL) {
933
0
  cur->orig = xmlStrdup(ent->orig);
934
0
        if (cur->orig == NULL)
935
0
            goto error;
936
0
    }
937
0
    if (ent->URI != NULL) {
938
0
  cur->URI = xmlStrdup(ent->URI);
939
0
        if (cur->URI == NULL)
940
0
            goto error;
941
0
    }
942
0
    return(cur);
943
944
0
error:
945
0
    xmlFreeEntity(cur);
946
0
    return(NULL);
947
0
}
948
949
/**
950
 * xmlCopyEntitiesTable:
951
 * @table:  An entity table
952
 *
953
 * Build a copy of an entity table.
954
 *
955
 * Returns the new xmlEntitiesTablePtr or NULL in case of error.
956
 */
957
xmlEntitiesTablePtr
958
0
xmlCopyEntitiesTable(xmlEntitiesTablePtr table) {
959
0
    return(xmlHashCopySafe(table, xmlCopyEntity, xmlFreeEntityWrapper));
960
0
}
961
962
#ifdef LIBXML_OUTPUT_ENABLED
963
964
/**
965
 * xmlDumpEntityDecl:
966
 * @buf:  An XML buffer.
967
 * @ent:  An entity table
968
 *
969
 * This will dump the content of the entity table as an XML DTD definition
970
 */
971
void
972
0
xmlDumpEntityDecl(xmlBufferPtr buf, xmlEntityPtr ent) {
973
0
    xmlSaveCtxtPtr save;
974
975
0
    if ((buf == NULL) || (ent == NULL))
976
0
        return;
977
978
0
    save = xmlSaveToBuffer(buf, NULL, 0);
979
0
    xmlSaveTree(save, (xmlNodePtr) ent);
980
0
    if (xmlSaveFinish(save) != XML_ERR_OK)
981
0
        xmlFree(xmlBufferDetach(buf));
982
0
}
983
984
/**
985
 * xmlDumpEntityDeclScan:
986
 * @ent:  An entity table
987
 * @buf:  An XML buffer.
988
 *
989
 * When using the hash table scan function, arguments need to be reversed
990
 */
991
static void
992
xmlDumpEntityDeclScan(void *ent, void *save,
993
0
                      const xmlChar *name ATTRIBUTE_UNUSED) {
994
0
    xmlSaveTree(save, ent);
995
0
}
996
997
/**
998
 * xmlDumpEntitiesTable:
999
 * @buf:  An XML buffer.
1000
 * @table:  An entity table
1001
 *
1002
 * This will dump the content of the entity table as an XML DTD definition
1003
 */
1004
void
1005
0
xmlDumpEntitiesTable(xmlBufferPtr buf, xmlEntitiesTablePtr table) {
1006
0
    xmlSaveCtxtPtr save;
1007
1008
0
    if ((buf == NULL) || (table == NULL))
1009
0
        return;
1010
1011
0
    save = xmlSaveToBuffer(buf, NULL, 0);
1012
0
    xmlHashScan(table, xmlDumpEntityDeclScan, save);
1013
0
    if (xmlSaveFinish(save) != XML_ERR_OK)
1014
0
        xmlFree(xmlBufferDetach(buf));
1015
0
}
1016
#endif /* LIBXML_OUTPUT_ENABLED */