Coverage Report

Created: 2024-01-17 17:01

/src/libxml2/entities.c
Line
Count
Source (jump to first uncovered line)
1
/*
2
 * entities.c : implementation for the XML entities handling
3
 *
4
 * See Copyright for the status of this software.
5
 *
6
 * daniel@veillard.com
7
 */
8
9
/* To avoid EBCDIC trouble when parsing on zOS */
10
#if defined(__MVS__)
11
#pragma convert("ISO8859-1")
12
#endif
13
14
#define IN_LIBXML
15
#include "libxml.h"
16
17
#include <string.h>
18
#include <stdlib.h>
19
20
#include <libxml/xmlmemory.h>
21
#include <libxml/hash.h>
22
#include <libxml/entities.h>
23
#include <libxml/parser.h>
24
#include <libxml/parserInternals.h>
25
#include <libxml/xmlerror.h>
26
#include <libxml/globals.h>
27
#include <libxml/dict.h>
28
29
#include "private/entities.h"
30
#include "private/error.h"
31
32
/*
33
 * The XML predefined entities.
34
 */
35
36
static xmlEntity xmlEntityLt = {
37
    NULL, XML_ENTITY_DECL, BAD_CAST "lt",
38
    NULL, NULL, NULL, NULL, NULL, NULL,
39
    BAD_CAST "<", BAD_CAST "<", 1,
40
    XML_INTERNAL_PREDEFINED_ENTITY,
41
    NULL, NULL, NULL, NULL, 0, 0, 0
42
};
43
static xmlEntity xmlEntityGt = {
44
    NULL, XML_ENTITY_DECL, BAD_CAST "gt",
45
    NULL, NULL, NULL, NULL, NULL, NULL,
46
    BAD_CAST ">", BAD_CAST ">", 1,
47
    XML_INTERNAL_PREDEFINED_ENTITY,
48
    NULL, NULL, NULL, NULL, 0, 0, 0
49
};
50
static xmlEntity xmlEntityAmp = {
51
    NULL, XML_ENTITY_DECL, BAD_CAST "amp",
52
    NULL, NULL, NULL, NULL, NULL, NULL,
53
    BAD_CAST "&", BAD_CAST "&", 1,
54
    XML_INTERNAL_PREDEFINED_ENTITY,
55
    NULL, NULL, NULL, NULL, 0, 0, 0
56
};
57
static xmlEntity xmlEntityQuot = {
58
    NULL, XML_ENTITY_DECL, BAD_CAST "quot",
59
    NULL, NULL, NULL, NULL, NULL, NULL,
60
    BAD_CAST "\"", BAD_CAST "\"", 1,
61
    XML_INTERNAL_PREDEFINED_ENTITY,
62
    NULL, NULL, NULL, NULL, 0, 0, 0
63
};
64
static xmlEntity xmlEntityApos = {
65
    NULL, XML_ENTITY_DECL, BAD_CAST "apos",
66
    NULL, NULL, NULL, NULL, NULL, NULL,
67
    BAD_CAST "'", BAD_CAST "'", 1,
68
    XML_INTERNAL_PREDEFINED_ENTITY,
69
    NULL, NULL, NULL, NULL, 0, 0, 0
70
};
71
72
/**
73
 * xmlEntitiesErrMemory:
74
 * @extra:  extra information
75
 *
76
 * Handle an out of memory condition
77
 */
78
static void
79
xmlEntitiesErrMemory(const char *extra)
80
0
{
81
0
    __xmlSimpleError(XML_FROM_TREE, XML_ERR_NO_MEMORY, NULL, NULL, extra);
82
0
}
83
84
/**
85
 * xmlEntitiesErr:
86
 * @code:  the error code
87
 * @msg:  the message
88
 *
89
 * Raise an error.
90
 */
91
static void LIBXML_ATTR_FORMAT(2,0)
92
xmlEntitiesErr(xmlParserErrors code, const char *msg)
93
0
{
94
0
    __xmlSimpleError(XML_FROM_TREE, code, NULL, msg, NULL);
95
0
}
96
97
/**
98
 * xmlEntitiesWarn:
99
 * @code:  the error code
100
 * @msg:  the message
101
 *
102
 * Raise a warning.
103
 */
104
static void LIBXML_ATTR_FORMAT(2,0)
105
xmlEntitiesWarn(xmlParserErrors code, const char *msg, const xmlChar *str1)
106
4.32k
{
107
4.32k
    __xmlRaiseError(NULL, NULL, NULL,
108
4.32k
                NULL, NULL, XML_FROM_TREE, code,
109
4.32k
                XML_ERR_WARNING, NULL, 0,
110
4.32k
                (const char *)str1, NULL, NULL, 0, 0,
111
4.32k
                msg, (const char *)str1, NULL);
112
4.32k
}
113
114
/*
115
 * xmlFreeEntity : clean-up an entity record.
116
 */
117
static void
118
xmlFreeEntity(xmlEntityPtr entity)
119
7.84M
{
120
7.84M
    xmlDictPtr dict = NULL;
121
122
7.84M
    if (entity == NULL)
123
0
        return;
124
125
7.84M
    if (entity->doc != NULL)
126
7.84M
        dict = entity->doc->dict;
127
128
129
7.84M
    if ((entity->children) && (entity->owner == 1) &&
130
7.84M
        (entity == (xmlEntityPtr) entity->children->parent))
131
417k
        xmlFreeNodeList(entity->children);
132
7.84M
    if ((entity->name != NULL) &&
133
7.84M
        ((dict == NULL) || (!xmlDictOwns(dict, entity->name))))
134
2.27M
        xmlFree((char *) entity->name);
135
7.84M
    if (entity->ExternalID != NULL)
136
188k
        xmlFree((char *) entity->ExternalID);
137
7.84M
    if (entity->SystemID != NULL)
138
351k
        xmlFree((char *) entity->SystemID);
139
7.84M
    if (entity->URI != NULL)
140
168k
        xmlFree((char *) entity->URI);
141
7.84M
    if (entity->content != NULL)
142
7.48M
        xmlFree((char *) entity->content);
143
7.84M
    if (entity->orig != NULL)
144
7.19M
        xmlFree((char *) entity->orig);
145
7.84M
    xmlFree(entity);
146
7.84M
}
147
148
/*
149
 * xmlCreateEntity:
150
 *
151
 * internal routine doing the entity node structures allocations
152
 */
153
static xmlEntityPtr
154
xmlCreateEntity(xmlDictPtr dict, const xmlChar *name, int type,
155
          const xmlChar *ExternalID, const xmlChar *SystemID,
156
7.84M
          const xmlChar *content) {
157
7.84M
    xmlEntityPtr ret;
158
159
7.84M
    ret = (xmlEntityPtr) xmlMalloc(sizeof(xmlEntity));
160
7.84M
    if (ret == NULL) {
161
0
        xmlEntitiesErrMemory("xmlCreateEntity: malloc failed");
162
0
  return(NULL);
163
0
    }
164
7.84M
    memset(ret, 0, sizeof(xmlEntity));
165
7.84M
    ret->type = XML_ENTITY_DECL;
166
167
    /*
168
     * fill the structure.
169
     */
170
7.84M
    ret->etype = (xmlEntityType) type;
171
7.84M
    if (dict == NULL) {
172
2.27M
  ret->name = xmlStrdup(name);
173
2.27M
  if (ExternalID != NULL)
174
169k
      ret->ExternalID = xmlStrdup(ExternalID);
175
2.27M
  if (SystemID != NULL)
176
197k
      ret->SystemID = xmlStrdup(SystemID);
177
5.57M
    } else {
178
5.57M
        ret->name = xmlDictLookup(dict, name, -1);
179
5.57M
  ret->ExternalID = xmlStrdup(ExternalID);
180
5.57M
  ret->SystemID = xmlStrdup(SystemID);
181
5.57M
    }
182
7.84M
    if (content != NULL) {
183
7.48M
        ret->length = xmlStrlen(content);
184
7.48M
  ret->content = xmlStrndup(content, ret->length);
185
7.48M
     } else {
186
364k
        ret->length = 0;
187
364k
        ret->content = NULL;
188
364k
    }
189
7.84M
    ret->URI = NULL; /* to be computed by the layer knowing
190
      the defining entity */
191
7.84M
    ret->orig = NULL;
192
7.84M
    ret->owner = 0;
193
194
7.84M
    return(ret);
195
7.84M
}
196
197
/*
198
 * xmlAddEntity : register a new entity for an entities table.
199
 */
200
static xmlEntityPtr
201
xmlAddEntity(xmlDtdPtr dtd, const xmlChar *name, int type,
202
    const xmlChar *ExternalID, const xmlChar *SystemID,
203
7.85M
    const xmlChar *content) {
204
7.85M
    xmlDictPtr dict = NULL;
205
7.85M
    xmlEntitiesTablePtr table = NULL;
206
7.85M
    xmlEntityPtr ret, predef;
207
208
7.85M
    if (name == NULL)
209
0
  return(NULL);
210
7.85M
    if (dtd == NULL)
211
0
  return(NULL);
212
7.85M
    if (dtd->doc != NULL)
213
7.85M
        dict = dtd->doc->dict;
214
215
7.85M
    switch (type) {
216
2.79M
        case XML_INTERNAL_GENERAL_ENTITY:
217
3.09M
        case XML_EXTERNAL_GENERAL_PARSED_ENTITY:
218
3.11M
        case XML_EXTERNAL_GENERAL_UNPARSED_ENTITY:
219
3.11M
            predef = xmlGetPredefinedEntity(name);
220
3.11M
            if (predef != NULL) {
221
555k
                int valid = 0;
222
223
                /* 4.6 Predefined Entities */
224
555k
                if ((type == XML_INTERNAL_GENERAL_ENTITY) &&
225
555k
                    (content != NULL)) {
226
554k
                    int c = predef->content[0];
227
228
554k
                    if (((content[0] == c) && (content[1] == 0)) &&
229
554k
                        ((c == '>') || (c == '\'') || (c == '"'))) {
230
313k
                        valid = 1;
231
313k
                    } else if ((content[0] == '&') && (content[1] == '#')) {
232
238k
                        if (content[2] == 'x') {
233
3.56k
                            xmlChar *hex = BAD_CAST "0123456789ABCDEF";
234
3.56k
                            xmlChar ref[] = "00;";
235
236
3.56k
                            ref[0] = hex[c / 16 % 16];
237
3.56k
                            ref[1] = hex[c % 16];
238
3.56k
                            if (xmlStrcasecmp(&content[3], ref) == 0)
239
2.88k
                                valid = 1;
240
235k
                        } else {
241
235k
                            xmlChar ref[] = "00;";
242
243
235k
                            ref[0] = '0' + c / 10 % 10;
244
235k
                            ref[1] = '0' + c % 10;
245
235k
                            if (xmlStrEqual(&content[2], ref))
246
234k
                                valid = 1;
247
235k
                        }
248
238k
                    }
249
554k
                }
250
555k
                if (!valid) {
251
4.32k
                    xmlEntitiesWarn(XML_ERR_ENTITY_PROCESSING,
252
4.32k
                            "xmlAddEntity: invalid redeclaration of predefined"
253
4.32k
                            " entity '%s'", name);
254
4.32k
                    return(NULL);
255
4.32k
                }
256
555k
            }
257
3.10M
      if (dtd->entities == NULL)
258
301k
    dtd->entities = xmlHashCreateDict(0, dict);
259
3.10M
      table = dtd->entities;
260
3.10M
      break;
261
4.68M
        case XML_INTERNAL_PARAMETER_ENTITY:
262
4.74M
        case XML_EXTERNAL_PARAMETER_ENTITY:
263
4.74M
      if (dtd->pentities == NULL)
264
161k
    dtd->pentities = xmlHashCreateDict(0, dict);
265
4.74M
      table = dtd->pentities;
266
4.74M
      break;
267
0
        case XML_INTERNAL_PREDEFINED_ENTITY:
268
0
      return(NULL);
269
7.85M
    }
270
7.84M
    if (table == NULL)
271
0
  return(NULL);
272
7.84M
    ret = xmlCreateEntity(dict, name, type, ExternalID, SystemID, content);
273
7.84M
    if (ret == NULL)
274
0
        return(NULL);
275
7.84M
    ret->doc = dtd->doc;
276
277
7.84M
    if (xmlHashAddEntry(table, name, ret)) {
278
  /*
279
   * entity was already defined at another level.
280
   */
281
255k
        xmlFreeEntity(ret);
282
255k
  return(NULL);
283
255k
    }
284
7.59M
    return(ret);
285
7.84M
}
286
287
/**
288
 * xmlGetPredefinedEntity:
289
 * @name:  the entity name
290
 *
291
 * Check whether this name is an predefined entity.
292
 *
293
 * Returns NULL if not, otherwise the entity
294
 */
295
xmlEntityPtr
296
777M
xmlGetPredefinedEntity(const xmlChar *name) {
297
777M
    if (name == NULL) return(NULL);
298
777M
    switch (name[0]) {
299
651M
        case 'l':
300
651M
      if (xmlStrEqual(name, BAD_CAST "lt"))
301
2.38M
          return(&xmlEntityLt);
302
649M
      break;
303
649M
        case 'g':
304
5.33M
      if (xmlStrEqual(name, BAD_CAST "gt"))
305
1.07M
          return(&xmlEntityGt);
306
4.26M
      break;
307
4.65M
        case 'a':
308
4.65M
      if (xmlStrEqual(name, BAD_CAST "amp"))
309
1.53M
          return(&xmlEntityAmp);
310
3.12M
      if (xmlStrEqual(name, BAD_CAST "apos"))
311
177k
          return(&xmlEntityApos);
312
2.94M
      break;
313
2.94M
        case 'q':
314
284k
      if (xmlStrEqual(name, BAD_CAST "quot"))
315
232k
          return(&xmlEntityQuot);
316
51.7k
      break;
317
115M
  default:
318
115M
      break;
319
777M
    }
320
771M
    return(NULL);
321
777M
}
322
323
/**
324
 * xmlAddDtdEntity:
325
 * @doc:  the document
326
 * @name:  the entity name
327
 * @type:  the entity type XML_xxx_yyy_ENTITY
328
 * @ExternalID:  the entity external ID if available
329
 * @SystemID:  the entity system ID if available
330
 * @content:  the entity content
331
 *
332
 * Register a new entity for this document DTD external subset.
333
 *
334
 * Returns a pointer to the entity or NULL in case of error
335
 */
336
xmlEntityPtr
337
xmlAddDtdEntity(xmlDocPtr doc, const xmlChar *name, int type,
338
          const xmlChar *ExternalID, const xmlChar *SystemID,
339
5.05M
    const xmlChar *content) {
340
5.05M
    xmlEntityPtr ret;
341
5.05M
    xmlDtdPtr dtd;
342
343
5.05M
    if (doc == NULL) {
344
0
  xmlEntitiesErr(XML_DTD_NO_DOC,
345
0
          "xmlAddDtdEntity: document is NULL");
346
0
  return(NULL);
347
0
    }
348
5.05M
    if (doc->extSubset == NULL) {
349
0
  xmlEntitiesErr(XML_DTD_NO_DTD,
350
0
          "xmlAddDtdEntity: document without external subset");
351
0
  return(NULL);
352
0
    }
353
5.05M
    dtd = doc->extSubset;
354
5.05M
    ret = xmlAddEntity(dtd, name, type, ExternalID, SystemID, content);
355
5.05M
    if (ret == NULL) return(NULL);
356
357
    /*
358
     * Link it to the DTD
359
     */
360
4.85M
    ret->parent = dtd;
361
4.85M
    ret->doc = dtd->doc;
362
4.85M
    if (dtd->last == NULL) {
363
5.44k
  dtd->children = dtd->last = (xmlNodePtr) ret;
364
4.84M
    } else {
365
4.84M
        dtd->last->next = (xmlNodePtr) ret;
366
4.84M
  ret->prev = dtd->last;
367
4.84M
  dtd->last = (xmlNodePtr) ret;
368
4.84M
    }
369
4.85M
    return(ret);
370
5.05M
}
371
372
/**
373
 * xmlAddDocEntity:
374
 * @doc:  the document
375
 * @name:  the entity name
376
 * @type:  the entity type XML_xxx_yyy_ENTITY
377
 * @ExternalID:  the entity external ID if available
378
 * @SystemID:  the entity system ID if available
379
 * @content:  the entity content
380
 *
381
 * Register a new entity for this document.
382
 *
383
 * Returns a pointer to the entity or NULL in case of error
384
 */
385
xmlEntityPtr
386
xmlAddDocEntity(xmlDocPtr doc, const xmlChar *name, int type,
387
          const xmlChar *ExternalID, const xmlChar *SystemID,
388
2.79M
          const xmlChar *content) {
389
2.79M
    xmlEntityPtr ret;
390
2.79M
    xmlDtdPtr dtd;
391
392
2.79M
    if (doc == NULL) {
393
0
  xmlEntitiesErr(XML_DTD_NO_DOC,
394
0
          "xmlAddDocEntity: document is NULL");
395
0
  return(NULL);
396
0
    }
397
2.79M
    if (doc->intSubset == NULL) {
398
0
  xmlEntitiesErr(XML_DTD_NO_DTD,
399
0
          "xmlAddDocEntity: document without internal subset");
400
0
  return(NULL);
401
0
    }
402
2.79M
    dtd = doc->intSubset;
403
2.79M
    ret = xmlAddEntity(dtd, name, type, ExternalID, SystemID, content);
404
2.79M
    if (ret == NULL) return(NULL);
405
406
    /*
407
     * Link it to the DTD
408
     */
409
2.74M
    ret->parent = dtd;
410
2.74M
    ret->doc = dtd->doc;
411
2.74M
    if (dtd->last == NULL) {
412
141k
  dtd->children = dtd->last = (xmlNodePtr) ret;
413
2.59M
    } else {
414
2.59M
  dtd->last->next = (xmlNodePtr) ret;
415
2.59M
  ret->prev = dtd->last;
416
2.59M
  dtd->last = (xmlNodePtr) ret;
417
2.59M
    }
418
2.74M
    return(ret);
419
2.79M
}
420
421
/**
422
 * xmlNewEntity:
423
 * @doc:  the document
424
 * @name:  the entity name
425
 * @type:  the entity type XML_xxx_yyy_ENTITY
426
 * @ExternalID:  the entity external ID if available
427
 * @SystemID:  the entity system ID if available
428
 * @content:  the entity content
429
 *
430
 * Create a new entity, this differs from xmlAddDocEntity() that if
431
 * the document is NULL or has no internal subset defined, then an
432
 * unlinked entity structure will be returned, it is then the responsibility
433
 * of the caller to link it to the document later or free it when not needed
434
 * anymore.
435
 *
436
 * Returns a pointer to the entity or NULL in case of error
437
 */
438
xmlEntityPtr
439
xmlNewEntity(xmlDocPtr doc, const xmlChar *name, int type,
440
       const xmlChar *ExternalID, const xmlChar *SystemID,
441
0
       const xmlChar *content) {
442
0
    xmlEntityPtr ret;
443
0
    xmlDictPtr dict;
444
445
0
    if ((doc != NULL) && (doc->intSubset != NULL)) {
446
0
  return(xmlAddDocEntity(doc, name, type, ExternalID, SystemID, content));
447
0
    }
448
0
    if (doc != NULL)
449
0
        dict = doc->dict;
450
0
    else
451
0
        dict = NULL;
452
0
    ret = xmlCreateEntity(dict, name, type, ExternalID, SystemID, content);
453
0
    if (ret == NULL)
454
0
        return(NULL);
455
0
    ret->doc = doc;
456
0
    return(ret);
457
0
}
458
459
/**
460
 * xmlGetEntityFromTable:
461
 * @table:  an entity table
462
 * @name:  the entity name
463
 * @parameter:  look for parameter entities
464
 *
465
 * Do an entity lookup in the table.
466
 * returns the corresponding parameter entity, if found.
467
 *
468
 * Returns A pointer to the entity structure or NULL if not found.
469
 */
470
static xmlEntityPtr
471
733M
xmlGetEntityFromTable(xmlEntitiesTablePtr table, const xmlChar *name) {
472
733M
    return((xmlEntityPtr) xmlHashLookup(table, name));
473
733M
}
474
475
/**
476
 * xmlGetParameterEntity:
477
 * @doc:  the document referencing the entity
478
 * @name:  the entity name
479
 *
480
 * Do an entity lookup in the internal and external subsets and
481
 * returns the corresponding parameter entity, if found.
482
 *
483
 * Returns A pointer to the entity structure or NULL if not found.
484
 */
485
xmlEntityPtr
486
343M
xmlGetParameterEntity(xmlDocPtr doc, const xmlChar *name) {
487
343M
    xmlEntitiesTablePtr table;
488
343M
    xmlEntityPtr ret;
489
490
343M
    if (doc == NULL)
491
2.71k
  return(NULL);
492
343M
    if ((doc->intSubset != NULL) && (doc->intSubset->pentities != NULL)) {
493
324M
  table = (xmlEntitiesTablePtr) doc->intSubset->pentities;
494
324M
  ret = xmlGetEntityFromTable(table, name);
495
324M
  if (ret != NULL)
496
295M
      return(ret);
497
324M
    }
498
48.1M
    if ((doc->extSubset != NULL) && (doc->extSubset->pentities != NULL)) {
499
19.7M
  table = (xmlEntitiesTablePtr) doc->extSubset->pentities;
500
19.7M
  return(xmlGetEntityFromTable(table, name));
501
19.7M
    }
502
28.3M
    return(NULL);
503
48.1M
}
504
505
/**
506
 * xmlGetDtdEntity:
507
 * @doc:  the document referencing the entity
508
 * @name:  the entity name
509
 *
510
 * Do an entity lookup in the DTD entity hash table and
511
 * returns the corresponding entity, if found.
512
 * Note: the first argument is the document node, not the DTD node.
513
 *
514
 * Returns A pointer to the entity structure or NULL if not found.
515
 */
516
xmlEntityPtr
517
0
xmlGetDtdEntity(xmlDocPtr doc, const xmlChar *name) {
518
0
    xmlEntitiesTablePtr table;
519
520
0
    if (doc == NULL)
521
0
  return(NULL);
522
0
    if ((doc->extSubset != NULL) && (doc->extSubset->entities != NULL)) {
523
0
  table = (xmlEntitiesTablePtr) doc->extSubset->entities;
524
0
  return(xmlGetEntityFromTable(table, name));
525
0
    }
526
0
    return(NULL);
527
0
}
528
529
/**
530
 * xmlGetDocEntity:
531
 * @doc:  the document referencing the entity
532
 * @name:  the entity name
533
 *
534
 * Do an entity lookup in the document entity hash table and
535
 * returns the corresponding entity, otherwise a lookup is done
536
 * in the predefined entities too.
537
 *
538
 * Returns A pointer to the entity structure or NULL if not found.
539
 */
540
xmlEntityPtr
541
385M
xmlGetDocEntity(const xmlDoc *doc, const xmlChar *name) {
542
385M
    xmlEntityPtr cur;
543
385M
    xmlEntitiesTablePtr table;
544
545
385M
    if (doc != NULL) {
546
385M
  if ((doc->intSubset != NULL) && (doc->intSubset->entities != NULL)) {
547
378M
      table = (xmlEntitiesTablePtr) doc->intSubset->entities;
548
378M
      cur = xmlGetEntityFromTable(table, name);
549
378M
      if (cur != NULL)
550
262M
    return(cur);
551
378M
  }
552
123M
  if (doc->standalone != 1) {
553
120M
      if ((doc->extSubset != NULL) &&
554
120M
    (doc->extSubset->entities != NULL)) {
555
10.1M
    table = (xmlEntitiesTablePtr) doc->extSubset->entities;
556
10.1M
    cur = xmlGetEntityFromTable(table, name);
557
10.1M
    if (cur != NULL)
558
458k
        return(cur);
559
10.1M
      }
560
120M
  }
561
123M
    }
562
122M
    return(xmlGetPredefinedEntity(name));
563
385M
}
564
565
/*
 * Macro used to grow the current buffer.
 *
 * It doubles buffer_size and reallocates buffer. The expansion site must
 * provide the variables `buffer` (xmlChar *) and `buffer_size` (size_t)
 * and a `mem_error` label, which is jumped to when the doubled size wraps
 * around or the reallocation fails; buffer is left untouched in that
 * case. Pointers into the old buffer are stale afterwards and must be
 * recomputed by the caller.
 *
 * The body is wrapped in do { } while (0) so that the macro followed by
 * a semicolon forms exactly one statement, even as an unbraced if/else
 * branch.
 */
#define growBufferReentrant() do {                                      \
    xmlChar *tmp;                                                       \
    size_t new_size = buffer_size * 2;                                  \
    if (new_size < buffer_size) goto mem_error;                         \
    tmp = (xmlChar *) xmlRealloc(buffer, new_size);                     \
    if (tmp == NULL) goto mem_error;                                    \
    buffer = tmp;                                                       \
    buffer_size = new_size;                                             \
} while (0)
577
578
/**
579
 * xmlEncodeEntitiesInternal:
580
 * @doc:  the document containing the string
581
 * @input:  A string to convert to XML.
582
 * @attr: are we handling an attribute value
583
 *
584
 * Do a global encoding of a string, replacing the predefined entities
585
 * and non ASCII values with their entities and CharRef counterparts.
586
 * Contrary to xmlEncodeEntities, this routine is reentrant, and result
587
 * must be deallocated.
588
 *
589
 * Returns A newly allocated string with the substitution done.
590
 */
591
static xmlChar *
592
19.4k
xmlEncodeEntitiesInternal(xmlDocPtr doc, const xmlChar *input, int attr) {
593
19.4k
    const xmlChar *cur = input;
594
19.4k
    xmlChar *buffer = NULL;
595
19.4k
    xmlChar *out = NULL;
596
19.4k
    size_t buffer_size = 0;
597
19.4k
    int html = 0;
598
599
19.4k
    if (input == NULL) return(NULL);
600
19.4k
    if (doc != NULL)
601
19.4k
        html = (doc->type == XML_HTML_DOCUMENT_NODE);
602
603
    /*
604
     * allocate an translation buffer.
605
     */
606
19.4k
    buffer_size = 1000;
607
19.4k
    buffer = (xmlChar *) xmlMalloc(buffer_size);
608
19.4k
    if (buffer == NULL) {
609
0
        xmlEntitiesErrMemory("xmlEncodeEntities: malloc failed");
610
0
  return(NULL);
611
0
    }
612
19.4k
    out = buffer;
613
614
1.81M
    while (*cur != '\0') {
615
1.79M
        size_t indx = out - buffer;
616
1.79M
        if (indx + 100 > buffer_size) {
617
618
3.14k
      growBufferReentrant();
619
3.14k
      out = &buffer[indx];
620
3.14k
  }
621
622
  /*
623
   * By default one have to encode at least '<', '>', '"' and '&' !
624
   */
625
1.79M
  if (*cur == '<') {
626
53
      const xmlChar *end;
627
628
      /*
629
       * Special handling of server side include in HTML attributes
630
       */
631
53
      if (html && attr &&
632
53
          (cur[1] == '!') && (cur[2] == '-') && (cur[3] == '-') &&
633
53
          ((end = xmlStrstr(cur, BAD_CAST "-->")) != NULL)) {
634
0
          while (cur != end) {
635
0
        *out++ = *cur++;
636
0
        indx = out - buffer;
637
0
        if (indx + 100 > buffer_size) {
638
0
      growBufferReentrant();
639
0
      out = &buffer[indx];
640
0
        }
641
0
    }
642
0
    *out++ = *cur++;
643
0
    *out++ = *cur++;
644
0
    *out++ = *cur++;
645
0
    continue;
646
0
      }
647
53
      *out++ = '&';
648
53
      *out++ = 'l';
649
53
      *out++ = 't';
650
53
      *out++ = ';';
651
1.79M
  } else if (*cur == '>') {
652
139k
      *out++ = '&';
653
139k
      *out++ = 'g';
654
139k
      *out++ = 't';
655
139k
      *out++ = ';';
656
1.65M
  } else if (*cur == '&') {
657
      /*
658
       * Special handling of &{...} construct from HTML 4, see
659
       * http://www.w3.org/TR/html401/appendix/notes.html#h-B.7.1
660
       */
661
430
      if (html && attr && (cur[1] == '{') &&
662
430
          (strchr((const char *) cur, '}'))) {
663
0
          while (*cur != '}') {
664
0
        *out++ = *cur++;
665
0
        indx = out - buffer;
666
0
        if (indx + 100 > buffer_size) {
667
0
      growBufferReentrant();
668
0
      out = &buffer[indx];
669
0
        }
670
0
    }
671
0
    *out++ = *cur++;
672
0
    continue;
673
0
      }
674
430
      *out++ = '&';
675
430
      *out++ = 'a';
676
430
      *out++ = 'm';
677
430
      *out++ = 'p';
678
430
      *out++ = ';';
679
1.65M
  } else if (((*cur >= 0x20) && (*cur < 0x80)) ||
680
1.65M
      (*cur == '\n') || (*cur == '\t') || ((html) && (*cur == '\r'))) {
681
      /*
682
       * default case, just copy !
683
       */
684
1.03M
      *out++ = *cur;
685
1.03M
  } else if (*cur >= 0x80) {
686
615k
      if (((doc != NULL) && (doc->encoding != NULL)) || (html)) {
687
    /*
688
     * Bjørn Reese <br@sseusa.com> provided the patch
689
          xmlChar xc;
690
          xc = (*cur & 0x3F) << 6;
691
          if (cur[1] != 0) {
692
        xc += *(++cur) & 0x3F;
693
        *out++ = xc;
694
          } else
695
     */
696
473k
    *out++ = *cur;
697
473k
      } else {
698
    /*
699
     * We assume we have UTF-8 input.
700
     * It must match either:
701
     *   110xxxxx 10xxxxxx
702
     *   1110xxxx 10xxxxxx 10xxxxxx
703
     *   11110xxx 10xxxxxx 10xxxxxx 10xxxxxx
704
     * That is:
705
     *   cur[0] is 11xxxxxx
706
     *   cur[1] is 10xxxxxx
707
     *   cur[2] is 10xxxxxx if cur[0] is 111xxxxx
708
     *   cur[3] is 10xxxxxx if cur[0] is 1111xxxx
709
     *   cur[0] is not 11111xxx
710
     */
711
142k
    char buf[11], *ptr;
712
142k
    int val = 0, l = 1;
713
714
142k
    if (((cur[0] & 0xC0) != 0xC0) ||
715
142k
        ((cur[1] & 0xC0) != 0x80) ||
716
142k
        (((cur[0] & 0xE0) == 0xE0) && ((cur[2] & 0xC0) != 0x80)) ||
717
142k
        (((cur[0] & 0xF0) == 0xF0) && ((cur[3] & 0xC0) != 0x80)) ||
718
142k
        (((cur[0] & 0xF8) == 0xF8))) {
719
0
        xmlEntitiesErr(XML_CHECK_NOT_UTF8,
720
0
          "xmlEncodeEntities: input not UTF-8");
721
0
        if (doc != NULL)
722
0
      doc->encoding = xmlStrdup(BAD_CAST "ISO-8859-1");
723
0
        snprintf(buf, sizeof(buf), "&#%d;", *cur);
724
0
        buf[sizeof(buf) - 1] = 0;
725
0
        ptr = buf;
726
0
        while (*ptr != 0) *out++ = *ptr++;
727
0
        cur++;
728
0
        continue;
729
142k
    } else if (*cur < 0xE0) {
730
141k
                    val = (cur[0]) & 0x1F;
731
141k
        val <<= 6;
732
141k
        val |= (cur[1]) & 0x3F;
733
141k
        l = 2;
734
141k
    } else if (*cur < 0xF0) {
735
190
                    val = (cur[0]) & 0x0F;
736
190
        val <<= 6;
737
190
        val |= (cur[1]) & 0x3F;
738
190
        val <<= 6;
739
190
        val |= (cur[2]) & 0x3F;
740
190
        l = 3;
741
190
    } else if (*cur < 0xF8) {
742
102
                    val = (cur[0]) & 0x07;
743
102
        val <<= 6;
744
102
        val |= (cur[1]) & 0x3F;
745
102
        val <<= 6;
746
102
        val |= (cur[2]) & 0x3F;
747
102
        val <<= 6;
748
102
        val |= (cur[3]) & 0x3F;
749
102
        l = 4;
750
102
    }
751
142k
    if ((l == 1) || (!IS_CHAR(val))) {
752
0
        xmlEntitiesErr(XML_ERR_INVALID_CHAR,
753
0
      "xmlEncodeEntities: char out of range\n");
754
0
        if (doc != NULL)
755
0
      doc->encoding = xmlStrdup(BAD_CAST "ISO-8859-1");
756
0
        snprintf(buf, sizeof(buf), "&#%d;", *cur);
757
0
        buf[sizeof(buf) - 1] = 0;
758
0
        ptr = buf;
759
0
        while (*ptr != 0) *out++ = *ptr++;
760
0
        cur++;
761
0
        continue;
762
0
    }
763
    /*
764
     * We could do multiple things here. Just save as a char ref
765
     */
766
142k
    snprintf(buf, sizeof(buf), "&#x%X;", val);
767
142k
    buf[sizeof(buf) - 1] = 0;
768
142k
    ptr = buf;
769
1.00M
    while (*ptr != 0) *out++ = *ptr++;
770
142k
    cur += l;
771
142k
    continue;
772
142k
      }
773
615k
  } else if (IS_BYTE_CHAR(*cur)) {
774
0
      char buf[11], *ptr;
775
776
0
      snprintf(buf, sizeof(buf), "&#%d;", *cur);
777
0
      buf[sizeof(buf) - 1] = 0;
778
0
            ptr = buf;
779
0
      while (*ptr != 0) *out++ = *ptr++;
780
0
  }
781
1.65M
  cur++;
782
1.65M
    }
783
19.4k
    *out = 0;
784
19.4k
    return(buffer);
785
786
0
mem_error:
787
0
    xmlEntitiesErrMemory("xmlEncodeEntities: realloc failed");
788
0
    xmlFree(buffer);
789
0
    return(NULL);
790
19.4k
}
791
792
/**
793
 * xmlEncodeAttributeEntities:
794
 * @doc:  the document containing the string
795
 * @input:  A string to convert to XML.
796
 *
797
 * Do a global encoding of a string, replacing the predefined entities
798
 * and non ASCII values with their entities and CharRef counterparts for
799
 * attribute values.
800
 *
801
 * Returns A newly allocated string with the substitution done.
802
 */
803
xmlChar *
804
19.4k
xmlEncodeAttributeEntities(xmlDocPtr doc, const xmlChar *input) {
805
19.4k
    return xmlEncodeEntitiesInternal(doc, input, 1);
806
19.4k
}
807
808
/**
809
 * xmlEncodeEntitiesReentrant:
810
 * @doc:  the document containing the string
811
 * @input:  A string to convert to XML.
812
 *
813
 * Do a global encoding of a string, replacing the predefined entities
814
 * and non ASCII values with their entities and CharRef counterparts.
815
 * Contrary to xmlEncodeEntities, this routine is reentrant, and result
816
 * must be deallocated.
817
 *
818
 * Returns A newly allocated string with the substitution done.
819
 */
820
xmlChar *
821
0
xmlEncodeEntitiesReentrant(xmlDocPtr doc, const xmlChar *input) {
822
0
    return xmlEncodeEntitiesInternal(doc, input, 0);
823
0
}
824
825
/**
826
 * xmlEncodeSpecialChars:
827
 * @doc:  the document containing the string
828
 * @input:  A string to convert to XML.
829
 *
830
 * Do a global encoding of a string, replacing the predefined entities
831
 * this routine is reentrant, and result must be deallocated.
832
 *
833
 * Returns A newly allocated string with the substitution done.
834
 */
835
xmlChar *
836
0
xmlEncodeSpecialChars(const xmlDoc *doc ATTRIBUTE_UNUSED, const xmlChar *input) {
837
0
    const xmlChar *cur = input;
838
0
    xmlChar *buffer = NULL;
839
0
    xmlChar *out = NULL;
840
0
    size_t buffer_size = 0;
841
0
    if (input == NULL) return(NULL);
842
843
    /*
844
     * allocate an translation buffer.
845
     */
846
0
    buffer_size = 1000;
847
0
    buffer = (xmlChar *) xmlMalloc(buffer_size);
848
0
    if (buffer == NULL) {
849
0
        xmlEntitiesErrMemory("xmlEncodeSpecialChars: malloc failed");
850
0
  return(NULL);
851
0
    }
852
0
    out = buffer;
853
854
0
    while (*cur != '\0') {
855
0
        size_t indx = out - buffer;
856
0
        if (indx + 10 > buffer_size) {
857
858
0
      growBufferReentrant();
859
0
      out = &buffer[indx];
860
0
  }
861
862
  /*
863
   * By default one have to encode at least '<', '>', '"' and '&' !
864
   */
865
0
  if (*cur == '<') {
866
0
      *out++ = '&';
867
0
      *out++ = 'l';
868
0
      *out++ = 't';
869
0
      *out++ = ';';
870
0
  } else if (*cur == '>') {
871
0
      *out++ = '&';
872
0
      *out++ = 'g';
873
0
      *out++ = 't';
874
0
      *out++ = ';';
875
0
  } else if (*cur == '&') {
876
0
      *out++ = '&';
877
0
      *out++ = 'a';
878
0
      *out++ = 'm';
879
0
      *out++ = 'p';
880
0
      *out++ = ';';
881
0
  } else if (*cur == '"') {
882
0
      *out++ = '&';
883
0
      *out++ = 'q';
884
0
      *out++ = 'u';
885
0
      *out++ = 'o';
886
0
      *out++ = 't';
887
0
      *out++ = ';';
888
0
  } else if (*cur == '\r') {
889
0
      *out++ = '&';
890
0
      *out++ = '#';
891
0
      *out++ = '1';
892
0
      *out++ = '3';
893
0
      *out++ = ';';
894
0
  } else {
895
      /*
896
       * Works because on UTF-8, all extended sequences cannot
897
       * result in bytes in the ASCII range.
898
       */
899
0
      *out++ = *cur;
900
0
  }
901
0
  cur++;
902
0
    }
903
0
    *out = 0;
904
0
    return(buffer);
905
906
0
mem_error:
907
0
    xmlEntitiesErrMemory("xmlEncodeSpecialChars: realloc failed");
908
0
    xmlFree(buffer);
909
0
    return(NULL);
910
0
}
911
912
/**
913
 * xmlCreateEntitiesTable:
914
 *
915
 * create and initialize an empty entities hash table.
916
 * This really doesn't make sense and should be deprecated
917
 *
918
 * Returns the xmlEntitiesTablePtr just created or NULL in case of error.
919
 */
920
xmlEntitiesTablePtr
921
0
xmlCreateEntitiesTable(void) {
922
0
    return((xmlEntitiesTablePtr) xmlHashCreate(0));
923
0
}
924
925
/**
926
 * xmlFreeEntityWrapper:
927
 * @entity:  An entity
928
 * @name:  its name
929
 *
930
 * Deallocate the memory used by an entities in the hash table.
931
 */
932
static void
933
7.59M
xmlFreeEntityWrapper(void *entity, const xmlChar *name ATTRIBUTE_UNUSED) {
934
7.59M
    if (entity != NULL)
935
7.59M
  xmlFreeEntity((xmlEntityPtr) entity);
936
7.59M
}
937
938
/**
939
 * xmlFreeEntitiesTable:
940
 * @table:  An entity table
941
 *
942
 * Deallocate the memory used by an entities hash table.
943
 */
944
void
945
462k
xmlFreeEntitiesTable(xmlEntitiesTablePtr table) {
946
462k
    xmlHashFree(table, xmlFreeEntityWrapper);
947
462k
}
948
949
#ifdef LIBXML_TREE_ENABLED
950
/**
951
 * xmlCopyEntity:
952
 * @ent:  An entity
953
 *
954
 * Build a copy of an entity
955
 *
956
 * Returns the new xmlEntitiesPtr or NULL in case of error.
957
 */
958
static void *
959
0
xmlCopyEntity(void *payload, const xmlChar *name ATTRIBUTE_UNUSED) {
960
0
    xmlEntityPtr ent = (xmlEntityPtr) payload;
961
0
    xmlEntityPtr cur;
962
963
0
    cur = (xmlEntityPtr) xmlMalloc(sizeof(xmlEntity));
964
0
    if (cur == NULL) {
965
0
        xmlEntitiesErrMemory("xmlCopyEntity:: malloc failed");
966
0
  return(NULL);
967
0
    }
968
0
    memset(cur, 0, sizeof(xmlEntity));
969
0
    cur->type = XML_ENTITY_DECL;
970
971
0
    cur->etype = ent->etype;
972
0
    if (ent->name != NULL)
973
0
  cur->name = xmlStrdup(ent->name);
974
0
    if (ent->ExternalID != NULL)
975
0
  cur->ExternalID = xmlStrdup(ent->ExternalID);
976
0
    if (ent->SystemID != NULL)
977
0
  cur->SystemID = xmlStrdup(ent->SystemID);
978
0
    if (ent->content != NULL)
979
0
  cur->content = xmlStrdup(ent->content);
980
0
    if (ent->orig != NULL)
981
0
  cur->orig = xmlStrdup(ent->orig);
982
0
    if (ent->URI != NULL)
983
0
  cur->URI = xmlStrdup(ent->URI);
984
0
    return(cur);
985
0
}
986
987
/**
988
 * xmlCopyEntitiesTable:
989
 * @table:  An entity table
990
 *
991
 * Build a copy of an entity table.
992
 *
993
 * Returns the new xmlEntitiesTablePtr or NULL in case of error.
994
 */
995
xmlEntitiesTablePtr
996
0
xmlCopyEntitiesTable(xmlEntitiesTablePtr table) {
997
0
    return(xmlHashCopy(table, xmlCopyEntity));
998
0
}
999
#endif /* LIBXML_TREE_ENABLED */
1000
1001
#ifdef LIBXML_OUTPUT_ENABLED
1002
1003
/**
1004
 * xmlDumpEntityContent:
1005
 * @buf:  An XML buffer.
1006
 * @content:  The entity content.
1007
 *
1008
 * This will dump the quoted string value, taking care of the special
1009
 * treatment required by %
1010
 */
1011
static void
1012
2.54k
xmlDumpEntityContent(xmlBufferPtr buf, const xmlChar *content) {
1013
2.54k
    if (xmlStrchr(content, '%')) {
1014
0
        const xmlChar * base, *cur;
1015
1016
0
  xmlBufferCCat(buf, "\"");
1017
0
  base = cur = content;
1018
0
  while (*cur != 0) {
1019
0
      if (*cur == '"') {
1020
0
    if (base != cur)
1021
0
        xmlBufferAdd(buf, base, cur - base);
1022
0
    xmlBufferAdd(buf, BAD_CAST "&quot;", 6);
1023
0
    cur++;
1024
0
    base = cur;
1025
0
      } else if (*cur == '%') {
1026
0
    if (base != cur)
1027
0
        xmlBufferAdd(buf, base, cur - base);
1028
0
    xmlBufferAdd(buf, BAD_CAST "&#x25;", 6);
1029
0
    cur++;
1030
0
    base = cur;
1031
0
      } else {
1032
0
    cur++;
1033
0
      }
1034
0
  }
1035
0
  if (base != cur)
1036
0
      xmlBufferAdd(buf, base, cur - base);
1037
0
  xmlBufferCCat(buf, "\"");
1038
2.54k
    } else {
1039
2.54k
        xmlBufferWriteQuotedString(buf, content);
1040
2.54k
    }
1041
2.54k
}
1042
1043
/**
1044
 * xmlDumpEntityDecl:
1045
 * @buf:  An XML buffer.
1046
 * @ent:  An entity table
1047
 *
1048
 * This will dump the content of the entity table as an XML DTD definition
1049
 */
1050
void
1051
452k
xmlDumpEntityDecl(xmlBufferPtr buf, xmlEntityPtr ent) {
1052
452k
    if ((buf == NULL) || (ent == NULL)) return;
1053
452k
    switch (ent->etype) {
1054
352k
  case XML_INTERNAL_GENERAL_ENTITY:
1055
352k
      xmlBufferWriteChar(buf, "<!ENTITY ");
1056
352k
      xmlBufferWriteCHAR(buf, ent->name);
1057
352k
      xmlBufferWriteChar(buf, " ");
1058
352k
      if (ent->orig != NULL)
1059
349k
    xmlBufferWriteQuotedString(buf, ent->orig);
1060
2.54k
      else
1061
2.54k
    xmlDumpEntityContent(buf, ent->content);
1062
352k
      xmlBufferWriteChar(buf, ">\n");
1063
352k
      break;
1064
13.0k
  case XML_EXTERNAL_GENERAL_PARSED_ENTITY:
1065
13.0k
      xmlBufferWriteChar(buf, "<!ENTITY ");
1066
13.0k
      xmlBufferWriteCHAR(buf, ent->name);
1067
13.0k
      if (ent->ExternalID != NULL) {
1068
2.18k
     xmlBufferWriteChar(buf, " PUBLIC ");
1069
2.18k
     xmlBufferWriteQuotedString(buf, ent->ExternalID);
1070
2.18k
     xmlBufferWriteChar(buf, " ");
1071
2.18k
     xmlBufferWriteQuotedString(buf, ent->SystemID);
1072
10.8k
      } else {
1073
10.8k
     xmlBufferWriteChar(buf, " SYSTEM ");
1074
10.8k
     xmlBufferWriteQuotedString(buf, ent->SystemID);
1075
10.8k
      }
1076
13.0k
      xmlBufferWriteChar(buf, ">\n");
1077
13.0k
      break;
1078
1.49k
  case XML_EXTERNAL_GENERAL_UNPARSED_ENTITY:
1079
1.49k
      xmlBufferWriteChar(buf, "<!ENTITY ");
1080
1.49k
      xmlBufferWriteCHAR(buf, ent->name);
1081
1.49k
      if (ent->ExternalID != NULL) {
1082
377
     xmlBufferWriteChar(buf, " PUBLIC ");
1083
377
     xmlBufferWriteQuotedString(buf, ent->ExternalID);
1084
377
     xmlBufferWriteChar(buf, " ");
1085
377
     xmlBufferWriteQuotedString(buf, ent->SystemID);
1086
1.11k
      } else {
1087
1.11k
     xmlBufferWriteChar(buf, " SYSTEM ");
1088
1.11k
     xmlBufferWriteQuotedString(buf, ent->SystemID);
1089
1.11k
      }
1090
1.49k
      if (ent->content != NULL) { /* Should be true ! */
1091
1.38k
    xmlBufferWriteChar(buf, " NDATA ");
1092
1.38k
    if (ent->orig != NULL)
1093
98
        xmlBufferWriteCHAR(buf, ent->orig);
1094
1.28k
    else
1095
1.28k
        xmlBufferWriteCHAR(buf, ent->content);
1096
1.38k
      }
1097
1.49k
      xmlBufferWriteChar(buf, ">\n");
1098
1.49k
      break;
1099
77.8k
  case XML_INTERNAL_PARAMETER_ENTITY:
1100
77.8k
      xmlBufferWriteChar(buf, "<!ENTITY % ");
1101
77.8k
      xmlBufferWriteCHAR(buf, ent->name);
1102
77.8k
      xmlBufferWriteChar(buf, " ");
1103
77.8k
      if (ent->orig == NULL)
1104
0
    xmlDumpEntityContent(buf, ent->content);
1105
77.8k
      else
1106
77.8k
    xmlBufferWriteQuotedString(buf, ent->orig);
1107
77.8k
      xmlBufferWriteChar(buf, ">\n");
1108
77.8k
      break;
1109
7.88k
  case XML_EXTERNAL_PARAMETER_ENTITY:
1110
7.88k
      xmlBufferWriteChar(buf, "<!ENTITY % ");
1111
7.88k
      xmlBufferWriteCHAR(buf, ent->name);
1112
7.88k
      if (ent->ExternalID != NULL) {
1113
93
     xmlBufferWriteChar(buf, " PUBLIC ");
1114
93
     xmlBufferWriteQuotedString(buf, ent->ExternalID);
1115
93
     xmlBufferWriteChar(buf, " ");
1116
93
     xmlBufferWriteQuotedString(buf, ent->SystemID);
1117
7.79k
      } else {
1118
7.79k
     xmlBufferWriteChar(buf, " SYSTEM ");
1119
7.79k
     xmlBufferWriteQuotedString(buf, ent->SystemID);
1120
7.79k
      }
1121
7.88k
      xmlBufferWriteChar(buf, ">\n");
1122
7.88k
      break;
1123
0
  default:
1124
0
      xmlEntitiesErr(XML_DTD_UNKNOWN_ENTITY,
1125
0
    "xmlDumpEntitiesDecl: internal: unknown type entity type");
1126
452k
    }
1127
452k
}
1128
1129
/**
1130
 * xmlDumpEntityDeclScan:
1131
 * @ent:  An entity table
1132
 * @buf:  An XML buffer.
1133
 *
1134
 * When using the hash table scan function, arguments need to be reversed
1135
 */
1136
static void
1137
xmlDumpEntityDeclScan(void *ent, void *buf,
1138
0
                      const xmlChar *name ATTRIBUTE_UNUSED) {
1139
0
    xmlDumpEntityDecl((xmlBufferPtr) buf, (xmlEntityPtr) ent);
1140
0
}
1141
1142
/**
1143
 * xmlDumpEntitiesTable:
1144
 * @buf:  An XML buffer.
1145
 * @table:  An entity table
1146
 *
1147
 * This will dump the content of the entity table as an XML DTD definition
1148
 */
1149
void
1150
0
xmlDumpEntitiesTable(xmlBufferPtr buf, xmlEntitiesTablePtr table) {
1151
0
    xmlHashScan(table, xmlDumpEntityDeclScan, buf);
1152
0
}
1153
#endif /* LIBXML_OUTPUT_ENABLED */