Coverage Report

Created: 2026-04-01 07:17

next uncovered line (L), next uncovered region (R), next uncovered branch (B)
/src/ghostpdl/expat/lib/xmlparse.c
Line
Count
Source
1
/* c5625880f4bf417c1463deee4eb92d86ff413f802048621c57e25fe483eb59e4 (2.6.4+)
2
                            __  __            _
3
                         ___\ \/ /_ __   __ _| |_
4
                        / _ \\  /| '_ \ / _` | __|
5
                       |  __//  \| |_) | (_| | |_
6
                        \___/_/\_\ .__/ \__,_|\__|
7
                                 |_| XML parser
8
9
   Copyright (c) 1997-2000 Thai Open Source Software Center Ltd
10
   Copyright (c) 2000      Clark Cooper <coopercc@users.sourceforge.net>
11
   Copyright (c) 2000-2006 Fred L. Drake, Jr. <fdrake@users.sourceforge.net>
12
   Copyright (c) 2001-2002 Greg Stein <gstein@users.sourceforge.net>
13
   Copyright (c) 2002-2016 Karl Waclawek <karl@waclawek.net>
14
   Copyright (c) 2005-2009 Steven Solie <steven@solie.ca>
15
   Copyright (c) 2016      Eric Rahm <erahm@mozilla.com>
16
   Copyright (c) 2016-2024 Sebastian Pipping <sebastian@pipping.org>
17
   Copyright (c) 2016      Gaurav <g.gupta@samsung.com>
18
   Copyright (c) 2016      Thomas Beutlich <tc@tbeu.de>
19
   Copyright (c) 2016      Gustavo Grieco <gustavo.grieco@imag.fr>
20
   Copyright (c) 2016      Pascal Cuoq <cuoq@trust-in-soft.com>
21
   Copyright (c) 2016      Ed Schouten <ed@nuxi.nl>
22
   Copyright (c) 2017-2022 Rhodri James <rhodri@wildebeest.org.uk>
23
   Copyright (c) 2017      Václav Slavík <vaclav@slavik.io>
24
   Copyright (c) 2017      Viktor Szakats <commit@vsz.me>
25
   Copyright (c) 2017      Chanho Park <chanho61.park@samsung.com>
26
   Copyright (c) 2017      Rolf Eike Beer <eike@sf-mail.de>
27
   Copyright (c) 2017      Hans Wennborg <hans@chromium.org>
28
   Copyright (c) 2018      Anton Maklakov <antmak.pub@gmail.com>
29
   Copyright (c) 2018      Benjamin Peterson <benjamin@python.org>
30
   Copyright (c) 2018      Marco Maggi <marco.maggi-ipsu@poste.it>
31
   Copyright (c) 2018      Mariusz Zaborski <oshogbo@vexillium.org>
32
   Copyright (c) 2019      David Loffredo <loffredo@steptools.com>
33
   Copyright (c) 2019-2020 Ben Wagner <bungeman@chromium.org>
34
   Copyright (c) 2019      Vadim Zeitlin <vadim@zeitlins.org>
35
   Copyright (c) 2021      Donghee Na <donghee.na@python.org>
36
   Copyright (c) 2022      Samanta Navarro <ferivoz@riseup.net>
37
   Copyright (c) 2022      Jeffrey Walton <noloader@gmail.com>
38
   Copyright (c) 2022      Jann Horn <jannh@google.com>
39
   Copyright (c) 2022      Sean McBride <sean@rogue-research.com>
40
   Copyright (c) 2023      Owain Davies <owaind@bath.edu>
41
   Copyright (c) 2023-2024 Sony Corporation / Snild Dolkow <snild@sony.com>
42
   Copyright (c) 2024      Berkay Eren Ürün <berkay.ueruen@siemens.com>
43
   Copyright (c) 2024      Hanno Böck <hanno@gentoo.org>
44
   Licensed under the MIT license:
45
46
   Permission is  hereby granted,  free of charge,  to any  person obtaining
47
   a  copy  of  this  software   and  associated  documentation  files  (the
48
   "Software"),  to  deal in  the  Software  without restriction,  including
49
   without  limitation the  rights  to use,  copy,  modify, merge,  publish,
50
   distribute, sublicense, and/or sell copies of the Software, and to permit
51
   persons  to whom  the Software  is  furnished to  do so,  subject to  the
52
   following conditions:
53
54
   The above copyright  notice and this permission notice  shall be included
55
   in all copies or substantial portions of the Software.
56
57
   THE  SOFTWARE  IS  PROVIDED  "AS  IS",  WITHOUT  WARRANTY  OF  ANY  KIND,
58
   EXPRESS  OR IMPLIED,  INCLUDING  BUT  NOT LIMITED  TO  THE WARRANTIES  OF
59
   MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN
60
   NO EVENT SHALL THE AUTHORS OR  COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM,
61
   DAMAGES OR  OTHER LIABILITY, WHETHER  IN AN  ACTION OF CONTRACT,  TORT OR
62
   OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE
63
   USE OR OTHER DEALINGS IN THE SOFTWARE.
64
*/
65
66
#define XML_BUILDING_EXPAT 1
67
68
#include "expat_config.h"
69
70
#if ! defined(XML_GE) || (1 - XML_GE - 1 == 2) || (XML_GE < 0) || (XML_GE > 1)
71
#  error XML_GE (for general entities) must be defined, non-empty, either 1 or 0 (0 to disable, 1 to enable; 1 is a common default)
72
#endif
73
74
#if defined(XML_DTD) && XML_GE == 0
75
#  error Either undefine XML_DTD or define XML_GE to 1.
76
#endif
77
78
#if ! defined(XML_CONTEXT_BYTES) || (1 - XML_CONTEXT_BYTES - 1 == 2)           \
79
    || (XML_CONTEXT_BYTES + 0 < 0)
80
#  error XML_CONTEXT_BYTES must be defined, non-empty and >=0 (0 to disable, >=1 to enable; 1024 is a common default)
81
#endif
82
83
#if defined(HAVE_SYSCALL_GETRANDOM)
84
#  if ! defined(_GNU_SOURCE)
85
#    define _GNU_SOURCE 1 /* syscall prototype */
86
#  endif
87
#endif
88
89
#ifdef _WIN32
90
/* force stdlib to define rand_s() */
91
#  if ! defined(_CRT_RAND_S)
92
#    define _CRT_RAND_S
93
#  endif
94
#endif
95
96
#if defined(_MSC_VER) && _MSC_VER < 1700
97
typedef unsigned char bool;
98
#define true (bool)1
99
#define false (bool)0
100
#else
101
#include <stdbool.h>
102
#endif
103
104
#include <stddef.h>
105
#include <string.h> /* memset(), memcpy() */
106
#include <assert.h>
107
#include <limits.h> /* UINT_MAX */
108
#include <stdio.h>  /* fprintf */
109
#include <stdlib.h> /* getenv, rand_s */
110
111
#if !defined(_MSC_VER) || (defined(_MSC_VER) && _MSC_VER >= 1700)
112
#include <stdint.h> /* uintptr_t */
113
#endif
114
#include <math.h>   /* isnan */
115
116
#ifdef _WIN32
117
#  define getpid GetCurrentProcessId
118
#else
119
#  include <sys/time.h>  /* gettimeofday() */
120
#  include <sys/types.h> /* getpid() */
121
#  include <unistd.h>    /* getpid() */
122
#  include <fcntl.h>     /* O_RDONLY */
123
#  include <errno.h>
124
#endif
125
126
#ifdef _WIN32
127
#  include "winconfig.h"
128
#endif
129
130
#include "ascii.h"
131
#include "expat.h"
132
#include "siphash.h"
133
134
#if defined(HAVE_GETRANDOM) || defined(HAVE_SYSCALL_GETRANDOM)
135
#  if defined(HAVE_GETRANDOM)
136
#    include <sys/random.h> /* getrandom */
137
#  else
138
#    include <unistd.h>      /* syscall */
139
#    include <sys/syscall.h> /* SYS_getrandom */
140
#  endif
141
#  if ! defined(GRND_NONBLOCK)
142
#    define GRND_NONBLOCK 0x0001
143
#  endif /* defined(GRND_NONBLOCK) */
144
#endif   /* defined(HAVE_GETRANDOM) || defined(HAVE_SYSCALL_GETRANDOM) */
145
146
#if defined(HAVE_LIBBSD)                                                       \
147
    && (defined(HAVE_ARC4RANDOM_BUF) || defined(HAVE_ARC4RANDOM))
148
#  include <bsd/stdlib.h>
149
#endif
150
151
#if defined(_WIN32) && ! defined(LOAD_LIBRARY_SEARCH_SYSTEM32)
152
#  define LOAD_LIBRARY_SEARCH_SYSTEM32 0x00000800
153
#endif
154
155
#if ! defined(HAVE_GETRANDOM) && ! defined(HAVE_SYSCALL_GETRANDOM)             \
156
    && ! defined(HAVE_ARC4RANDOM_BUF) && ! defined(HAVE_ARC4RANDOM)            \
157
    && ! defined(XML_DEV_URANDOM) && ! defined(_WIN32)                         \
158
    && ! defined(XML_POOR_ENTROPY)
159
#  error You do not have support for any sources of high quality entropy \
160
    enabled.  For end user security, that is probably not what you want. \
161
    \
162
    Your options include: \
163
      * Linux >=3.17 + glibc >=2.25 (getrandom): HAVE_GETRANDOM, \
164
      * Linux >=3.17 + glibc (including <2.25) (syscall SYS_getrandom): HAVE_SYSCALL_GETRANDOM, \
165
      * BSD / macOS >=10.7 / glibc >=2.36 (arc4random_buf): HAVE_ARC4RANDOM_BUF, \
166
      * BSD / macOS (including <10.7) / glibc >=2.36 (arc4random): HAVE_ARC4RANDOM, \
167
      * libbsd (arc4random_buf): HAVE_ARC4RANDOM_BUF + HAVE_LIBBSD, \
168
      * libbsd (arc4random): HAVE_ARC4RANDOM + HAVE_LIBBSD, \
169
      * Linux (including <3.17) / BSD / macOS (including <10.7) / Solaris >=8 (/dev/urandom): XML_DEV_URANDOM, \
170
      * Windows >=Vista (rand_s): _WIN32. \
171
    \
172
    If insist on not using any of these, bypass this error by defining \
173
    XML_POOR_ENTROPY; you have been warned. \
174
    \
175
    If you have reasons to patch this detection code away or need changes \
176
    to the build system, please open a bug.  Thank you!
177
#endif
178
179
#ifdef XML_UNICODE
180
#  define XML_ENCODE_MAX XML_UTF16_ENCODE_MAX
181
#  define XmlConvert XmlUtf16Convert
182
#  define XmlGetInternalEncoding XmlGetUtf16InternalEncoding
183
#  define XmlGetInternalEncodingNS XmlGetUtf16InternalEncodingNS
184
#  define XmlEncode XmlUtf16Encode
185
#  define MUST_CONVERT(enc, s) (! (enc)->isUtf16 || (((uintptr_t)(s)) & 1))
186
typedef unsigned short ICHAR;
187
#else
188
#  define XML_ENCODE_MAX XML_UTF8_ENCODE_MAX
189
121k
#  define XmlConvert XmlUtf8Convert
190
69
#  define XmlGetInternalEncoding XmlGetUtf8InternalEncoding
191
20
#  define XmlGetInternalEncodingNS XmlGetUtf8InternalEncodingNS
192
0
#  define XmlEncode XmlUtf8Encode
193
10.9k
#  define MUST_CONVERT(enc, s) (! (enc)->isUtf8)
194
typedef char ICHAR;
195
#endif
196
197
#ifndef XML_NS
198
199
#  define XmlInitEncodingNS XmlInitEncoding
200
#  define XmlInitUnknownEncodingNS XmlInitUnknownEncoding
201
#  undef XmlGetInternalEncodingNS
202
#  define XmlGetInternalEncodingNS XmlGetInternalEncoding
203
#  define XmlParseXmlDeclNS XmlParseXmlDecl
204
205
#endif
206
207
#ifdef XML_UNICODE
208
209
#  ifdef XML_UNICODE_WCHAR_T
210
#    define XML_T(x) (const wchar_t) x
211
#    define XML_L(x) L##x
212
#  else
213
#    define XML_T(x) (const unsigned short)x
214
#    define XML_L(x) x
215
#  endif
216
217
#else
218
219
7.37k
#  define XML_T(x) x
220
34
#  define XML_L(x) x
221
222
#endif
223
224
/* Round up n to be a multiple of sz, where sz is a power of 2. */
225
0
#define ROUND_UP(n, sz) (((n) + ((sz) - 1)) & ~((sz) - 1))
226
227
/* Do safe (NULL-aware) pointer arithmetic */
228
534
#define EXPAT_SAFE_PTR_DIFF(p, q) (((p) && (q)) ? ((p) - (q)) : 0)
229
230
0
#define EXPAT_MIN(a, b) (((a) < (b)) ? (a) : (b))
231
232
#include "internal.h"
233
#include "xmltok.h"
234
#include "xmlrole.h"
235
236
typedef const XML_Char *KEY;
237
238
typedef struct {
239
  KEY name;
240
} NAMED;
241
242
typedef struct {
243
  NAMED **v;
244
  unsigned char power;
245
  size_t size;
246
  size_t used;
247
  const XML_Memory_Handling_Suite *mem;
248
} HASH_TABLE;
249
250
static size_t keylen(KEY s);
251
252
static void copy_salt_to_sipkey(XML_Parser parser, struct sipkey *key);
253
254
/* For probing (after a collision) we need a step size relative prime
255
   to the hash table size, which is a power of 2. We use double-hashing,
256
   since we can calculate a second hash value cheaply by taking those bits
257
   of the first hash value that were discarded (masked out) when the table
258
   index was calculated: index = hash & mask, where mask = table->size - 1.
259
   We limit the maximum step size to table->size / 4 (mask >> 2) and make
260
   it odd, since odd numbers are always relative prime to a power of 2.
261
*/
262
#define SECOND_HASH(hash, mask, power)                                         \
263
6.63k
  ((((hash) & ~(mask)) >> ((power) - 1)) & ((mask) >> 2))
264
#define PROBE_STEP(hash, mask, power)                                          \
265
6.63k
  ((unsigned char)((SECOND_HASH(hash, mask, power)) | 1))
266
267
typedef struct {
268
  NAMED **p;
269
  NAMED **end;
270
} HASH_TABLE_ITER;
271
272
110
#define INIT_TAG_BUF_SIZE 32 /* must be a multiple of sizeof(XML_Char) */
273
89
#define INIT_DATA_BUF_SIZE 1024
274
89
#define INIT_ATTS_SIZE 16
275
20
#define INIT_ATTS_VERSION 0xFFFFFFFF
276
377
#define INIT_BLOCK_SIZE 1024
277
89
#define INIT_BUFFER_SIZE 1024
278
279
80
#define EXPAND_SPARE 24
280
281
typedef struct binding {
282
  struct prefix *prefix;
283
  struct binding *nextTagBinding;
284
  struct binding *prevPrefixBinding;
285
  const struct attribute_id *attId;
286
  XML_Char *uri;
287
  int uriLen;
288
  int uriAlloc;
289
} BINDING;
290
291
typedef struct prefix {
292
  const XML_Char *name;
293
  BINDING *binding;
294
} PREFIX;
295
296
typedef struct {
297
  const XML_Char *str;
298
  const XML_Char *localPart;
299
  const XML_Char *prefix;
300
  int strLen;
301
  int uriLen;
302
  int prefixLen;
303
} TAG_NAME;
304
305
/* TAG represents an open element.
306
   The name of the element is stored in both the document and API
307
   encodings.  The memory buffer 'buf' is a separately-allocated
308
   memory area which stores the name.  During the XML_Parse()/
309
   XML_ParseBuffer() when the element is open, the memory for the 'raw'
310
   version of the name (in the document encoding) is shared with the
311
   document buffer.  If the element is open across calls to
312
   XML_Parse()/XML_ParseBuffer(), the buffer is re-allocated to
313
   contain the 'raw' name as well.
314
315
   A parser reuses these structures, maintaining a list of allocated
316
   TAG objects in a free list.
317
*/
318
typedef struct tag {
319
  struct tag *parent;  /* parent of this element */
320
  const char *rawName; /* tagName in the original encoding */
321
  int rawNameLength;
322
  TAG_NAME name; /* tagName in the API encoding */
323
  char *buf;     /* buffer for name components */
324
  char *bufEnd;  /* end of the buffer */
325
  BINDING *bindings;
326
} TAG;
327
328
typedef struct {
329
  const XML_Char *name;
330
  const XML_Char *textPtr;
331
  int textLen;   /* length in XML_Chars */
332
  int processed; /* # of processed bytes - when suspended */
333
  const XML_Char *systemId;
334
  const XML_Char *base;
335
  const XML_Char *publicId;
336
  const XML_Char *notation;
337
  XML_Bool open;
338
  XML_Bool is_param;
339
  XML_Bool is_internal; /* true if declared in internal subset outside PE */
340
} ENTITY;
341
342
typedef struct {
343
  enum XML_Content_Type type;
344
  enum XML_Content_Quant quant;
345
  const XML_Char *name;
346
  int firstchild;
347
  int lastchild;
348
  int childcnt;
349
  int nextsib;
350
} CONTENT_SCAFFOLD;
351
352
0
#define INIT_SCAFFOLD_ELEMENTS 32
353
354
typedef struct block {
355
  struct block *next;
356
  int size;
357
  XML_Char s[1];
358
} BLOCK;
359
360
typedef struct {
361
  BLOCK *blocks;
362
  BLOCK *freeBlocks;
363
  const XML_Char *end;
364
  XML_Char *ptr;
365
  XML_Char *start;
366
  const XML_Memory_Handling_Suite *mem;
367
} STRING_POOL;
368
369
/* The XML_Char before the name is used to determine whether
370
   an attribute has been specified. */
371
typedef struct attribute_id {
372
  XML_Char *name;
373
  PREFIX *prefix;
374
  XML_Bool maybeTokenized;
375
  XML_Bool xmlns;
376
} ATTRIBUTE_ID;
377
378
typedef struct {
379
  const ATTRIBUTE_ID *id;
380
  XML_Bool isCdata;
381
  const XML_Char *value;
382
} DEFAULT_ATTRIBUTE;
383
384
typedef struct {
385
  unsigned long version;
386
  unsigned long hash;
387
  const XML_Char *uriName;
388
} NS_ATT;
389
390
typedef struct {
391
  const XML_Char *name;
392
  PREFIX *prefix;
393
  const ATTRIBUTE_ID *idAtt;
394
  int nDefaultAtts;
395
  int allocDefaultAtts;
396
  DEFAULT_ATTRIBUTE *defaultAtts;
397
} ELEMENT_TYPE;
398
399
typedef struct {
400
  HASH_TABLE generalEntities;
401
  HASH_TABLE elementTypes;
402
  HASH_TABLE attributeIds;
403
  HASH_TABLE prefixes;
404
  STRING_POOL pool;
405
  STRING_POOL entityValuePool;
406
  /* false once a parameter entity reference has been skipped */
407
  XML_Bool keepProcessing;
408
  /* true once an internal or external PE reference has been encountered;
409
     this includes the reference to an external subset */
410
  XML_Bool hasParamEntityRefs;
411
  XML_Bool standalone;
412
#ifdef XML_DTD
413
  /* indicates if external PE has been read */
414
  XML_Bool paramEntityRead;
415
  HASH_TABLE paramEntities;
416
#endif /* XML_DTD */
417
  PREFIX defaultPrefix;
418
  /* === scaffolding for building content model === */
419
  XML_Bool in_eldecl;
420
  CONTENT_SCAFFOLD *scaffold;
421
  unsigned contentStringLen;
422
  unsigned scaffSize;
423
  unsigned scaffCount;
424
  int scaffLevel;
425
  int *scaffIndex;
426
} DTD;
427
428
typedef struct open_internal_entity {
429
  const char *internalEventPtr;
430
  const char *internalEventEndPtr;
431
  struct open_internal_entity *next;
432
  ENTITY *entity;
433
  int startTagLevel;
434
  XML_Bool betweenDecl; /* WFC: PE Between Declarations */
435
} OPEN_INTERNAL_ENTITY;
436
437
enum XML_Account {
438
  XML_ACCOUNT_DIRECT,           /* bytes directly passed to the Expat parser */
439
  XML_ACCOUNT_ENTITY_EXPANSION, /* intermediate bytes produced during entity
440
                                   expansion */
441
  XML_ACCOUNT_NONE              /* i.e. do not account, was accounted already */
442
};
443
444
#if XML_GE == 1
445
typedef unsigned long long XmlBigCount;
446
typedef struct accounting {
447
  XmlBigCount countBytesDirect;
448
  XmlBigCount countBytesIndirect;
449
  unsigned long debugLevel;
450
  float maximumAmplificationFactor; // >=1.0
451
  unsigned long long activationThresholdBytes;
452
} ACCOUNTING;
453
454
typedef struct entity_stats {
455
  unsigned int countEverOpened;
456
  unsigned int currentDepth;
457
  unsigned int maximumDepthSeen;
458
  unsigned long debugLevel;
459
} ENTITY_STATS;
460
#endif /* XML_GE == 1 */
461
462
typedef enum XML_Error PTRCALL Processor(XML_Parser parser, const char *start,
463
                                         const char *end, const char **endPtr);
464
465
static Processor prologProcessor;
466
static Processor prologInitProcessor;
467
static Processor contentProcessor;
468
static Processor cdataSectionProcessor;
469
#ifdef XML_DTD
470
static Processor ignoreSectionProcessor;
471
static Processor externalParEntProcessor;
472
static Processor externalParEntInitProcessor;
473
static Processor entityValueProcessor;
474
static Processor entityValueInitProcessor;
475
#endif /* XML_DTD */
476
static Processor epilogProcessor;
477
static Processor errorProcessor;
478
static Processor externalEntityInitProcessor;
479
static Processor externalEntityInitProcessor2;
480
static Processor externalEntityInitProcessor3;
481
static Processor externalEntityContentProcessor;
482
static Processor internalEntityProcessor;
483
484
static enum XML_Error handleUnknownEncoding(XML_Parser parser,
485
                                            const XML_Char *encodingName);
486
static enum XML_Error processXmlDecl(XML_Parser parser, int isGeneralTextEntity,
487
                                     const char *s, const char *next);
488
static enum XML_Error initializeEncoding(XML_Parser parser);
489
static enum XML_Error doProlog(XML_Parser parser, const ENCODING *enc,
490
                               const char *s, const char *end, int tok,
491
                               const char *next, const char **nextPtr,
492
                               XML_Bool haveMore, XML_Bool allowClosingDoctype,
493
                               enum XML_Account account);
494
static enum XML_Error processInternalEntity(XML_Parser parser, ENTITY *entity,
495
                                            XML_Bool betweenDecl);
496
static enum XML_Error doContent(XML_Parser parser, int startTagLevel,
497
                                const ENCODING *enc, const char *start,
498
                                const char *end, const char **endPtr,
499
                                XML_Bool haveMore, enum XML_Account account);
500
static enum XML_Error doCdataSection(XML_Parser parser, const ENCODING *enc,
501
                                     const char **startPtr, const char *end,
502
                                     const char **nextPtr, XML_Bool haveMore,
503
                                     enum XML_Account account);
504
#ifdef XML_DTD
505
static enum XML_Error doIgnoreSection(XML_Parser parser, const ENCODING *enc,
506
                                      const char **startPtr, const char *end,
507
                                      const char **nextPtr, XML_Bool haveMore);
508
#endif /* XML_DTD */
509
510
static void freeBindings(XML_Parser parser, BINDING *bindings);
511
static enum XML_Error storeAtts(XML_Parser parser, const ENCODING *enc,
512
                                const char *attStr, TAG_NAME *tagNamePtr,
513
                                BINDING **bindingsPtr,
514
                                enum XML_Account account);
515
static enum XML_Error addBinding(XML_Parser parser, PREFIX *prefix,
516
                                 const ATTRIBUTE_ID *attId, const XML_Char *uri,
517
                                 BINDING **bindingsPtr);
518
static int defineAttribute(ELEMENT_TYPE *type, ATTRIBUTE_ID *attId,
519
                           XML_Bool isCdata, XML_Bool isId,
520
                           const XML_Char *value, XML_Parser parser);
521
static enum XML_Error storeAttributeValue(XML_Parser parser,
522
                                          const ENCODING *enc, XML_Bool isCdata,
523
                                          const char *ptr, const char *end,
524
                                          STRING_POOL *pool,
525
                                          enum XML_Account account);
526
static enum XML_Error appendAttributeValue(XML_Parser parser,
527
                                           const ENCODING *enc,
528
                                           XML_Bool isCdata, const char *ptr,
529
                                           const char *end, STRING_POOL *pool,
530
                                           enum XML_Account account);
531
static ATTRIBUTE_ID *getAttributeId(XML_Parser parser, const ENCODING *enc,
532
                                    const char *start, const char *end);
533
static int setElementTypePrefix(XML_Parser parser, ELEMENT_TYPE *elementType);
534
#if XML_GE == 1
535
static enum XML_Error storeEntityValue(XML_Parser parser, const ENCODING *enc,
536
                                       const char *start, const char *end,
537
                                       enum XML_Account account);
538
#else
539
static enum XML_Error storeSelfEntityValue(XML_Parser parser, ENTITY *entity);
540
#endif
541
static int reportProcessingInstruction(XML_Parser parser, const ENCODING *enc,
542
                                       const char *start, const char *end);
543
static int reportComment(XML_Parser parser, const ENCODING *enc,
544
                         const char *start, const char *end);
545
static void reportDefault(XML_Parser parser, const ENCODING *enc,
546
                          const char *start, const char *end);
547
548
static const XML_Char *getContext(XML_Parser parser);
549
static XML_Bool setContext(XML_Parser parser, const XML_Char *context);
550
551
static void FASTCALL normalizePublicId(XML_Char *s);
552
553
static DTD *dtdCreate(const XML_Memory_Handling_Suite *ms);
554
/* do not call if m_parentParser != NULL */
555
static void dtdReset(DTD *p, const XML_Memory_Handling_Suite *ms);
556
static void dtdDestroy(DTD *p, XML_Bool isDocEntity,
557
                       const XML_Memory_Handling_Suite *ms);
558
static int dtdCopy(XML_Parser oldParser, DTD *newDtd, const DTD *oldDtd,
559
                   const XML_Memory_Handling_Suite *ms);
560
static int copyEntityTable(XML_Parser oldParser, HASH_TABLE *newTable,
561
                           STRING_POOL *newPool, const HASH_TABLE *oldTable);
562
static NAMED *lookup(XML_Parser parser, HASH_TABLE *table, KEY name,
563
                     size_t createSize);
564
static void FASTCALL hashTableInit(HASH_TABLE *table,
565
                                   const XML_Memory_Handling_Suite *ms);
566
static void FASTCALL hashTableClear(HASH_TABLE *table);
567
static void FASTCALL hashTableDestroy(HASH_TABLE *table);
568
static void FASTCALL hashTableIterInit(HASH_TABLE_ITER *iter,
569
                                       const HASH_TABLE *table);
570
static NAMED *FASTCALL hashTableIterNext(HASH_TABLE_ITER *iter);
571
572
static void FASTCALL poolInit(STRING_POOL *pool,
573
                              const XML_Memory_Handling_Suite *ms);
574
static void FASTCALL poolClear(STRING_POOL *pool);
575
static void FASTCALL poolDestroy(STRING_POOL *pool);
576
static XML_Char *poolAppend(STRING_POOL *pool, const ENCODING *enc,
577
                            const char *ptr, const char *end);
578
static XML_Char *poolStoreString(STRING_POOL *pool, const ENCODING *enc,
579
                                 const char *ptr, const char *end);
580
static XML_Bool FASTCALL poolGrow(STRING_POOL *pool);
581
static const XML_Char *FASTCALL poolCopyString(STRING_POOL *pool,
582
                                               const XML_Char *s);
583
static const XML_Char *poolCopyStringN(STRING_POOL *pool, const XML_Char *s,
584
                                       int n);
585
static const XML_Char *FASTCALL poolAppendString(STRING_POOL *pool,
586
                                                 const XML_Char *s);
587
588
static int FASTCALL nextScaffoldPart(XML_Parser parser);
589
static XML_Content *build_model(XML_Parser parser);
590
static ELEMENT_TYPE *getElementType(XML_Parser parser, const ENCODING *enc,
591
                                    const char *ptr, const char *end);
592
593
static XML_Char *copyString(const XML_Char *s,
594
                            const XML_Memory_Handling_Suite *memsuite);
595
596
static unsigned long generate_hash_secret_salt(XML_Parser parser);
597
static XML_Bool startParsing(XML_Parser parser);
598
599
static XML_Parser parserCreate(const XML_Char *encodingName,
600
                               const XML_Memory_Handling_Suite *memsuite,
601
                               const XML_Char *nameSep, DTD *dtd);
602
603
static void parserInit(XML_Parser parser, const XML_Char *encodingName);
604
605
#if XML_GE == 1
606
static float accountingGetCurrentAmplification(XML_Parser rootParser);
607
static void accountingReportStats(XML_Parser originParser, const char *epilog);
608
static void accountingOnAbort(XML_Parser originParser);
609
static void accountingReportDiff(XML_Parser rootParser,
610
                                 unsigned int levelsAwayFromRootParser,
611
                                 const char *before, const char *after,
612
                                 ptrdiff_t bytesMore, int source_line,
613
                                 enum XML_Account account);
614
static XML_Bool accountingDiffTolerated(XML_Parser originParser, int tok,
615
                                        const char *before, const char *after,
616
                                        int source_line,
617
                                        enum XML_Account account);
618
619
static void entityTrackingReportStats(XML_Parser parser, ENTITY *entity,
620
                                      const char *action, int sourceLine);
621
static void entityTrackingOnOpen(XML_Parser parser, ENTITY *entity,
622
                                 int sourceLine);
623
static void entityTrackingOnClose(XML_Parser parser, ENTITY *entity,
624
                                  int sourceLine);
625
626
static XML_Parser getRootParserOf(XML_Parser parser,
627
                                  unsigned int *outLevelDiff);
628
#endif /* XML_GE == 1 */
629
630
static unsigned long getDebugLevel(const char *variableName,
631
                                   unsigned long defaultDebugLevel);
632
633
848
#define poolStart(pool) ((pool)->start)
634
748
#define poolLength(pool) ((pool)->ptr - (pool)->start)
635
0
#define poolChop(pool) ((void)--(pool->ptr))
636
0
#define poolLastChar(pool) (((pool)->ptr)[-1])
637
23.2k
#define poolDiscard(pool) ((pool)->ptr = (pool)->start)
638
46.3k
#define poolFinish(pool) ((pool)->start = (pool)->ptr)
639
#define poolAppendChar(pool, c)                                                \
640
100k
  (((pool)->ptr == (pool)->end && ! poolGrow(pool))                            \
641
100k
       ? 0                                                                     \
642
100k
       : ((*((pool)->ptr)++ = c), 1))
643
644
#if ! defined(XML_TESTING)
645
const
646
#endif
647
    XML_Bool g_reparseDeferralEnabledDefault
648
    = XML_TRUE; // write ONLY in runtests.c
649
#if defined(XML_TESTING)
650
unsigned int g_bytesScanned = 0; // used for testing only
651
#endif
652
653
struct XML_ParserStruct {
654
  /* The first member must be m_userData so that the XML_GetUserData
655
     macro works. */
656
  void *m_userData;
657
  void *m_handlerArg;
658
659
  // How the four parse buffer pointers below relate in time and space:
660
  //
661
  //   m_buffer <= m_bufferPtr <= m_bufferEnd  <= m_bufferLim
662
  //   |           |              |               |
663
  //   <--parsed-->|              |               |
664
  //               <---parsing--->|               |
665
  //                              <--unoccupied-->|
666
  //   <---------total-malloced/realloced-------->|
667
668
  char *m_buffer; // malloc/realloc base pointer of parse buffer
669
  const XML_Memory_Handling_Suite m_mem;
670
  const char *m_bufferPtr; // first character to be parsed
671
  char *m_bufferEnd;       // past last character to be parsed
672
  const char *m_bufferLim; // allocated end of m_buffer
673
674
  XML_Index m_parseEndByteIndex;
675
  const char *m_parseEndPtr;
676
  size_t m_partialTokenBytesBefore; /* used in heuristic to avoid O(n^2) */
677
  XML_Bool m_reparseDeferralEnabled;
678
  int m_lastBufferRequestSize;
679
  XML_Char *m_dataBuf;
680
  XML_Char *m_dataBufEnd;
681
  XML_StartElementHandler m_startElementHandler;
682
  XML_EndElementHandler m_endElementHandler;
683
  XML_CharacterDataHandler m_characterDataHandler;
684
  XML_ProcessingInstructionHandler m_processingInstructionHandler;
685
  XML_CommentHandler m_commentHandler;
686
  XML_StartCdataSectionHandler m_startCdataSectionHandler;
687
  XML_EndCdataSectionHandler m_endCdataSectionHandler;
688
  XML_DefaultHandler m_defaultHandler;
689
  XML_StartDoctypeDeclHandler m_startDoctypeDeclHandler;
690
  XML_EndDoctypeDeclHandler m_endDoctypeDeclHandler;
691
  XML_UnparsedEntityDeclHandler m_unparsedEntityDeclHandler;
692
  XML_NotationDeclHandler m_notationDeclHandler;
693
  XML_StartNamespaceDeclHandler m_startNamespaceDeclHandler;
694
  XML_EndNamespaceDeclHandler m_endNamespaceDeclHandler;
695
  XML_NotStandaloneHandler m_notStandaloneHandler;
696
  XML_ExternalEntityRefHandler m_externalEntityRefHandler;
697
  XML_Parser m_externalEntityRefHandlerArg;
698
  XML_SkippedEntityHandler m_skippedEntityHandler;
699
  XML_UnknownEncodingHandler m_unknownEncodingHandler;
700
  XML_ElementDeclHandler m_elementDeclHandler;
701
  XML_AttlistDeclHandler m_attlistDeclHandler;
702
  XML_EntityDeclHandler m_entityDeclHandler;
703
  XML_XmlDeclHandler m_xmlDeclHandler;
704
  const ENCODING *m_encoding;
705
  INIT_ENCODING m_initEncoding;
706
  const ENCODING *m_internalEncoding;
707
  const XML_Char *m_protocolEncodingName;
708
  XML_Bool m_ns;
709
  XML_Bool m_ns_triplets;
710
  void *m_unknownEncodingMem;
711
  void *m_unknownEncodingData;
712
  void *m_unknownEncodingHandlerData;
713
  void(XMLCALL *m_unknownEncodingRelease)(void *);
714
  PROLOG_STATE m_prologState;
715
  Processor *m_processor;
716
  enum XML_Error m_errorCode;
717
  const char *m_eventPtr;
718
  const char *m_eventEndPtr;
719
  const char *m_positionPtr;
720
  OPEN_INTERNAL_ENTITY *m_openInternalEntities;
721
  OPEN_INTERNAL_ENTITY *m_freeInternalEntities;
722
  XML_Bool m_defaultExpandInternalEntities;
723
  int m_tagLevel;
724
  ENTITY *m_declEntity;
725
  const XML_Char *m_doctypeName;
726
  const XML_Char *m_doctypeSysid;
727
  const XML_Char *m_doctypePubid;
728
  const XML_Char *m_declAttributeType;
729
  const XML_Char *m_declNotationName;
730
  const XML_Char *m_declNotationPublicId;
731
  ELEMENT_TYPE *m_declElementType;
732
  ATTRIBUTE_ID *m_declAttributeId;
733
  XML_Bool m_declAttributeIsCdata;
734
  XML_Bool m_declAttributeIsId;
735
  DTD *m_dtd;
736
  const XML_Char *m_curBase;
737
  TAG *m_tagStack;
738
  TAG *m_freeTagList;
739
  BINDING *m_inheritedBindings;
740
  BINDING *m_freeBindingList;
741
  int m_attsSize;
742
  int m_nSpecifiedAtts;
743
  int m_idAttIndex;
744
  ATTRIBUTE *m_atts;
745
  NS_ATT *m_nsAtts;
746
  unsigned long m_nsAttsVersion;
747
  unsigned char m_nsAttsPower;
748
#ifdef XML_ATTR_INFO
749
  XML_AttrInfo *m_attInfo;
750
#endif
751
  POSITION m_position;
752
  STRING_POOL m_tempPool;
753
  STRING_POOL m_temp2Pool;
754
  char *m_groupConnector;
755
  unsigned int m_groupSize;
756
  XML_Char m_namespaceSeparator;
757
  XML_Parser m_parentParser;
758
  XML_ParsingStatus m_parsingStatus;
759
#ifdef XML_DTD
760
  XML_Bool m_isParamEntity;
761
  XML_Bool m_useForeignDTD;
762
  enum XML_ParamEntityParsing m_paramEntityParsing;
763
#endif
764
  unsigned long m_hash_secret_salt;
765
#if XML_GE == 1
766
  ACCOUNTING m_accounting;
767
  ENTITY_STATS m_entity_stats;
768
#endif
769
};
770
771
567
#define MALLOC(parser, s) (parser->m_mem.malloc_fcn((s)))
772
20
#define REALLOC(parser, p, s) (parser->m_mem.realloc_fcn((p), (s)))
773
1.01k
#define FREE(parser, p) (parser->m_mem.free_fcn((p)))
774
775
XML_Parser XMLCALL
776
69
XML_ParserCreate(const XML_Char *encodingName) {
777
69
  return XML_ParserCreate_MM(encodingName, NULL, NULL);
778
69
}
779
780
XML_Parser XMLCALL
781
20
XML_ParserCreateNS(const XML_Char *encodingName, XML_Char nsSep) {
782
20
  XML_Char tmp[2] = {nsSep, 0};
783
20
  return XML_ParserCreate_MM(encodingName, NULL, tmp);
784
20
}
785
786
// "xml=http://www.w3.org/XML/1998/namespace"
787
static const XML_Char implicitContext[]
788
    = {ASCII_x,     ASCII_m,     ASCII_l,      ASCII_EQUALS, ASCII_h,
789
       ASCII_t,     ASCII_t,     ASCII_p,      ASCII_COLON,  ASCII_SLASH,
790
       ASCII_SLASH, ASCII_w,     ASCII_w,      ASCII_w,      ASCII_PERIOD,
791
       ASCII_w,     ASCII_3,     ASCII_PERIOD, ASCII_o,      ASCII_r,
792
       ASCII_g,     ASCII_SLASH, ASCII_X,      ASCII_M,      ASCII_L,
793
       ASCII_SLASH, ASCII_1,     ASCII_9,      ASCII_9,      ASCII_8,
794
       ASCII_SLASH, ASCII_n,     ASCII_a,      ASCII_m,      ASCII_e,
795
       ASCII_s,     ASCII_p,     ASCII_a,      ASCII_c,      ASCII_e,
796
       '\0'};
797
798
/* To avoid warnings about unused functions: */
799
#if ! defined(HAVE_ARC4RANDOM_BUF) && ! defined(HAVE_ARC4RANDOM)
800
801
#  if defined(HAVE_GETRANDOM) || defined(HAVE_SYSCALL_GETRANDOM)
802
803
/* Obtain entropy on Linux 3.17+ */
804
static int
805
writeRandomBytes_getrandom_nonblock(void *target, size_t count) {
806
  int success = 0; /* full count bytes written? */
807
  size_t bytesWrittenTotal = 0;
808
  const unsigned int getrandomFlags = GRND_NONBLOCK;
809
810
  do {
811
    void *const currentTarget = (void *)((char *)target + bytesWrittenTotal);
812
    const size_t bytesToWrite = count - bytesWrittenTotal;
813
814
    const int bytesWrittenMore =
815
#    if defined(HAVE_GETRANDOM)
816
        getrandom(currentTarget, bytesToWrite, getrandomFlags);
817
#    else
818
        syscall(SYS_getrandom, currentTarget, bytesToWrite, getrandomFlags);
819
#    endif
820
821
    if (bytesWrittenMore > 0) {
822
      bytesWrittenTotal += bytesWrittenMore;
823
      if (bytesWrittenTotal >= count)
824
        success = 1;
825
    }
826
  } while (! success && (errno == EINTR));
827
828
  return success;
829
}
830
831
#  endif /* defined(HAVE_GETRANDOM) || defined(HAVE_SYSCALL_GETRANDOM) */
832
833
#  if ! defined(_WIN32) && defined(XML_DEV_URANDOM)
834
835
/* Extract entropy from /dev/urandom */
836
static int
837
89
writeRandomBytes_dev_urandom(void *target, size_t count) {
838
89
  int success = 0; /* full count bytes written? */
839
89
  size_t bytesWrittenTotal = 0;
840
841
89
  const int fd = open("/dev/urandom", O_RDONLY);
842
89
  if (fd < 0) {
843
0
    return 0;
844
0
  }
845
846
89
  do {
847
89
    void *const currentTarget = (void *)((char *)target + bytesWrittenTotal);
848
89
    const size_t bytesToWrite = count - bytesWrittenTotal;
849
850
89
    const ssize_t bytesWrittenMore = read(fd, currentTarget, bytesToWrite);
851
852
89
    if (bytesWrittenMore > 0) {
853
89
      bytesWrittenTotal += bytesWrittenMore;
854
89
      if (bytesWrittenTotal >= count)
855
89
        success = 1;
856
89
    }
857
89
  } while (! success && (errno == EINTR));
858
859
89
  close(fd);
860
89
  return success;
861
89
}
862
863
#  endif /* ! defined(_WIN32) && defined(XML_DEV_URANDOM) */
864
865
#endif /* ! defined(HAVE_ARC4RANDOM_BUF) && ! defined(HAVE_ARC4RANDOM) */
866
867
#if defined(HAVE_ARC4RANDOM) && ! defined(HAVE_ARC4RANDOM_BUF)
868
869
static void
870
writeRandomBytes_arc4random(void *target, size_t count) {
871
  size_t bytesWrittenTotal = 0;
872
873
  while (bytesWrittenTotal < count) {
874
    const uint32_t random32 = arc4random();
875
    size_t i = 0;
876
877
    for (; (i < sizeof(random32)) && (bytesWrittenTotal < count);
878
         i++, bytesWrittenTotal++) {
879
      const uint8_t random8 = (uint8_t)(random32 >> (i * 8));
880
      ((uint8_t *)target)[bytesWrittenTotal] = random8;
881
    }
882
  }
883
}
884
885
#endif /* defined(HAVE_ARC4RANDOM) && ! defined(HAVE_ARC4RANDOM_BUF) */
886
887
#ifdef _WIN32
888
889
/* Provide declaration of rand_s() for MinGW-32 (not 64, which has it),
890
   as it didn't declare it in its header prior to version 5.3.0 of its
891
   runtime package (mingwrt, containing stdlib.h).  The upstream fix
892
   was introduced at https://osdn.net/projects/mingw/ticket/39658 . */
893
#  if defined(__MINGW32__) && defined(__MINGW32_VERSION)                       \
894
      && __MINGW32_VERSION < 5003000L && ! defined(__MINGW64_VERSION_MAJOR)
895
__declspec(dllimport) int rand_s(unsigned int *);
896
#  endif
897
898
/* Obtain entropy on Windows using the rand_s() function which
899
 * generates cryptographically secure random numbers.  Internally it
900
 * uses RtlGenRandom API which is present in Windows XP and later.
901
 */
902
static int
903
writeRandomBytes_rand_s(void *target, size_t count) {
904
  size_t bytesWrittenTotal = 0;
905
906
  while (bytesWrittenTotal < count) {
907
    unsigned int random32 = 0;
908
    size_t i = 0;
909
910
    if (rand_s(&random32))
911
      return 0; /* failure */
912
913
    for (; (i < sizeof(random32)) && (bytesWrittenTotal < count);
914
         i++, bytesWrittenTotal++) {
915
      const uint8_t random8 = (uint8_t)(random32 >> (i * 8));
916
      ((uint8_t *)target)[bytesWrittenTotal] = random8;
917
    }
918
  }
919
  return 1; /* success */
920
}
921
922
#endif /* _WIN32 */
923
924
#if ! defined(HAVE_ARC4RANDOM_BUF) && ! defined(HAVE_ARC4RANDOM)
925
926
static unsigned long
927
0
gather_time_entropy(void) {
928
#  ifdef _WIN32
929
  FILETIME ft;
930
  GetSystemTimeAsFileTime(&ft); /* never fails */
931
  return ft.dwHighDateTime ^ ft.dwLowDateTime;
932
#  else
933
0
  struct timeval tv;
934
0
  int gettimeofday_res;
935
936
0
  gettimeofday_res = gettimeofday(&tv, NULL);
937
938
0
#    if defined(NDEBUG)
939
0
  (void)gettimeofday_res;
940
#    else
941
  assert(gettimeofday_res == 0);
942
#    endif /* defined(NDEBUG) */
943
944
  /* Microseconds time is <20 bits entropy */
945
0
  return tv.tv_usec;
946
0
#  endif
947
0
}
948
949
#endif /* ! defined(HAVE_ARC4RANDOM_BUF) && ! defined(HAVE_ARC4RANDOM) */
950
951
static unsigned long
952
89
ENTROPY_DEBUG(const char *label, unsigned long entropy) {
953
89
  if (getDebugLevel("EXPAT_ENTROPY_DEBUG", 0) >= 1u) {
954
0
    fprintf(stderr, "expat: Entropy: %s --> 0x%0*lx (%lu bytes)\n", label,
955
0
            (int)sizeof(entropy) * 2, entropy, (unsigned long)sizeof(entropy));
956
0
  }
957
89
  return entropy;
958
89
}
959
960
static unsigned long
961
89
generate_hash_secret_salt(XML_Parser parser) {
962
89
  unsigned long entropy;
963
89
  (void)parser;
964
965
  /* "Failproof" high quality providers: */
966
#if defined(HAVE_ARC4RANDOM_BUF)
967
  arc4random_buf(&entropy, sizeof(entropy));
968
  return ENTROPY_DEBUG("arc4random_buf", entropy);
969
#elif defined(HAVE_ARC4RANDOM)
970
  writeRandomBytes_arc4random((void *)&entropy, sizeof(entropy));
971
  return ENTROPY_DEBUG("arc4random", entropy);
972
#else
973
  /* Try high quality providers first .. */
974
#  ifdef _WIN32
975
  if (writeRandomBytes_rand_s((void *)&entropy, sizeof(entropy))) {
976
    return ENTROPY_DEBUG("rand_s", entropy);
977
  }
978
#  elif defined(HAVE_GETRANDOM) || defined(HAVE_SYSCALL_GETRANDOM)
979
  if (writeRandomBytes_getrandom_nonblock((void *)&entropy, sizeof(entropy))) {
980
    return ENTROPY_DEBUG("getrandom", entropy);
981
  }
982
#  endif
983
89
#  if ! defined(_WIN32) && defined(XML_DEV_URANDOM)
984
89
  if (writeRandomBytes_dev_urandom((void *)&entropy, sizeof(entropy))) {
985
89
    return ENTROPY_DEBUG("/dev/urandom", entropy);
986
89
  }
987
0
#  endif /* ! defined(_WIN32) && defined(XML_DEV_URANDOM) */
988
  /* .. and self-made low quality for backup: */
989
990
  /* Process ID is 0 bits entropy if attacker has local access */
991
0
  entropy = gather_time_entropy() ^ getpid();
992
993
  /* Factors are 2^31-1 and 2^61-1 (Mersenne primes M31 and M61) */
994
0
  if (sizeof(unsigned long) == 4) {
995
0
    return ENTROPY_DEBUG("fallback(4)", entropy * 2147483647);
996
0
  } else {
997
0
    return ENTROPY_DEBUG("fallback(8)",
998
0
                         entropy * (unsigned long)2305843009213693951ULL);
999
0
  }
1000
0
#endif
1001
0
}
1002
1003
static unsigned long
1004
34.9k
get_hash_secret_salt(XML_Parser parser) {
1005
34.9k
  if (parser->m_parentParser != NULL)
1006
0
    return get_hash_secret_salt(parser->m_parentParser);
1007
34.9k
  return parser->m_hash_secret_salt;
1008
34.9k
}
1009
1010
static enum XML_Error
1011
callProcessor(XML_Parser parser, const char *start, const char *end,
1012
89
              const char **endPtr) {
1013
89
  const size_t have_now = EXPAT_SAFE_PTR_DIFF(end, start);
1014
89
  bool enough;
1015
89
  enum XML_Error ret;
1016
1017
89
  if (parser->m_reparseDeferralEnabled
1018
89
      && ! parser->m_parsingStatus.finalBuffer) {
1019
    // Heuristic: don't try to parse a partial token again until the amount of
1020
    // available data has increased significantly.
1021
0
    const size_t had_before = parser->m_partialTokenBytesBefore;
1022
    // ...but *do* try anyway if we're close to causing a reallocation.
1023
0
    size_t available_buffer
1024
0
        = EXPAT_SAFE_PTR_DIFF(parser->m_bufferPtr, parser->m_buffer);
1025
0
#if XML_CONTEXT_BYTES > 0
1026
0
    available_buffer -= EXPAT_MIN(available_buffer, XML_CONTEXT_BYTES);
1027
0
#endif
1028
0
    available_buffer
1029
0
        += EXPAT_SAFE_PTR_DIFF(parser->m_bufferLim, parser->m_bufferEnd);
1030
    // m_lastBufferRequestSize is never assigned a value < 0, so the cast is ok
1031
0
    enough
1032
0
        = (have_now >= 2 * had_before)
1033
0
          || ((size_t)parser->m_lastBufferRequestSize > available_buffer);
1034
1035
0
    if (! enough) {
1036
0
      *endPtr = start; // callers may expect this to be set
1037
0
      return XML_ERROR_NONE;
1038
0
    }
1039
0
  }
1040
#if defined(XML_TESTING)
1041
  g_bytesScanned += (unsigned)have_now;
1042
#endif
1043
89
  ret = parser->m_processor(parser, start, end, endPtr);
1044
89
  if (ret == XML_ERROR_NONE) {
1045
    // if we consumed nothing, remember what we had on this parse attempt.
1046
72
    if (*endPtr == start) {
1047
0
      parser->m_partialTokenBytesBefore = have_now;
1048
72
    } else {
1049
72
      parser->m_partialTokenBytesBefore = 0;
1050
72
    }
1051
72
  }
1052
89
  return ret;
1053
89
}
1054
1055
static XML_Bool /* only valid for root parser */
1056
89
startParsing(XML_Parser parser) {
1057
  /* hash functions must be initialized before setContext() is called */
1058
89
  if (parser->m_hash_secret_salt == 0)
1059
89
    parser->m_hash_secret_salt = generate_hash_secret_salt(parser);
1060
89
  if (parser->m_ns) {
1061
    /* implicit context only set for root parser, since child
1062
       parsers (i.e. external entity parsers) will inherit it
1063
    */
1064
20
    return setContext(parser, implicitContext);
1065
20
  }
1066
69
  return XML_TRUE;
1067
89
}
1068
1069
XML_Parser XMLCALL
1070
XML_ParserCreate_MM(const XML_Char *encodingName,
1071
                    const XML_Memory_Handling_Suite *memsuite,
1072
89
                    const XML_Char *nameSep) {
1073
89
  return parserCreate(encodingName, memsuite, nameSep, NULL);
1074
89
}
1075
1076
static XML_Parser
1077
parserCreate(const XML_Char *encodingName,
1078
             const XML_Memory_Handling_Suite *memsuite, const XML_Char *nameSep,
1079
89
             DTD *dtd) {
1080
89
  XML_Parser parser;
1081
1082
89
  if (memsuite) {
1083
0
    XML_Memory_Handling_Suite *mtemp;
1084
0
    parser = memsuite->malloc_fcn(sizeof(struct XML_ParserStruct));
1085
0
    if (parser != NULL) {
1086
0
      mtemp = (XML_Memory_Handling_Suite *)&(parser->m_mem);
1087
0
      mtemp->malloc_fcn = memsuite->malloc_fcn;
1088
0
      mtemp->realloc_fcn = memsuite->realloc_fcn;
1089
0
      mtemp->free_fcn = memsuite->free_fcn;
1090
0
    }
1091
89
  } else {
1092
89
    XML_Memory_Handling_Suite *mtemp;
1093
89
    parser = (XML_Parser)malloc(sizeof(struct XML_ParserStruct));
1094
89
    if (parser != NULL) {
1095
89
      mtemp = (XML_Memory_Handling_Suite *)&(parser->m_mem);
1096
89
      mtemp->malloc_fcn = malloc;
1097
89
      mtemp->realloc_fcn = realloc;
1098
89
      mtemp->free_fcn = free;
1099
89
    }
1100
89
  }
1101
1102
89
  if (! parser)
1103
0
    return parser;
1104
1105
89
  parser->m_buffer = NULL;
1106
89
  parser->m_bufferLim = NULL;
1107
1108
89
  parser->m_attsSize = INIT_ATTS_SIZE;
1109
89
  parser->m_atts
1110
89
      = (ATTRIBUTE *)MALLOC(parser, parser->m_attsSize * sizeof(ATTRIBUTE));
1111
89
  if (parser->m_atts == NULL) {
1112
0
    FREE(parser, parser);
1113
0
    return NULL;
1114
0
  }
1115
#ifdef XML_ATTR_INFO
1116
  parser->m_attInfo = (XML_AttrInfo *)MALLOC(
1117
      parser, parser->m_attsSize * sizeof(XML_AttrInfo));
1118
  if (parser->m_attInfo == NULL) {
1119
    FREE(parser, parser->m_atts);
1120
    FREE(parser, parser);
1121
    return NULL;
1122
  }
1123
#endif
1124
89
  parser->m_dataBuf
1125
89
      = (XML_Char *)MALLOC(parser, INIT_DATA_BUF_SIZE * sizeof(XML_Char));
1126
89
  if (parser->m_dataBuf == NULL) {
1127
0
    FREE(parser, parser->m_atts);
1128
#ifdef XML_ATTR_INFO
1129
    FREE(parser, parser->m_attInfo);
1130
#endif
1131
0
    FREE(parser, parser);
1132
0
    return NULL;
1133
0
  }
1134
89
  parser->m_dataBufEnd = parser->m_dataBuf + INIT_DATA_BUF_SIZE;
1135
1136
89
  if (dtd)
1137
0
    parser->m_dtd = dtd;
1138
89
  else {
1139
89
    parser->m_dtd = dtdCreate(&parser->m_mem);
1140
89
    if (parser->m_dtd == NULL) {
1141
0
      FREE(parser, parser->m_dataBuf);
1142
0
      FREE(parser, parser->m_atts);
1143
#ifdef XML_ATTR_INFO
1144
      FREE(parser, parser->m_attInfo);
1145
#endif
1146
0
      FREE(parser, parser);
1147
0
      return NULL;
1148
0
    }
1149
89
  }
1150
1151
89
  parser->m_freeBindingList = NULL;
1152
89
  parser->m_freeTagList = NULL;
1153
89
  parser->m_freeInternalEntities = NULL;
1154
1155
89
  parser->m_groupSize = 0;
1156
89
  parser->m_groupConnector = NULL;
1157
1158
89
  parser->m_unknownEncodingHandler = NULL;
1159
89
  parser->m_unknownEncodingHandlerData = NULL;
1160
1161
89
  parser->m_namespaceSeparator = ASCII_EXCL;
1162
89
  parser->m_ns = XML_FALSE;
1163
89
  parser->m_ns_triplets = XML_FALSE;
1164
1165
89
  parser->m_nsAtts = NULL;
1166
89
  parser->m_nsAttsVersion = 0;
1167
89
  parser->m_nsAttsPower = 0;
1168
1169
89
  parser->m_protocolEncodingName = NULL;
1170
1171
89
  poolInit(&parser->m_tempPool, &(parser->m_mem));
1172
89
  poolInit(&parser->m_temp2Pool, &(parser->m_mem));
1173
89
  parserInit(parser, encodingName);
1174
1175
89
  if (encodingName && ! parser->m_protocolEncodingName) {
1176
0
    if (dtd) {
1177
      // We need to stop the upcoming call to XML_ParserFree from happily
1178
      // destroying parser->m_dtd because the DTD is shared with the parent
1179
      // parser and the only guard that keeps XML_ParserFree from destroying
1180
      // parser->m_dtd is parser->m_isParamEntity but it will be set to
1181
      // XML_TRUE only later in XML_ExternalEntityParserCreate (or not at all).
1182
0
      parser->m_dtd = NULL;
1183
0
    }
1184
0
    XML_ParserFree(parser);
1185
0
    return NULL;
1186
0
  }
1187
1188
89
  if (nameSep) {
1189
20
    parser->m_ns = XML_TRUE;
1190
20
    parser->m_internalEncoding = XmlGetInternalEncodingNS();
1191
20
    parser->m_namespaceSeparator = *nameSep;
1192
69
  } else {
1193
69
    parser->m_internalEncoding = XmlGetInternalEncoding();
1194
69
  }
1195
1196
89
  return parser;
1197
89
}
1198
1199
static void
1200
89
parserInit(XML_Parser parser, const XML_Char *encodingName) {
1201
89
  parser->m_processor = prologInitProcessor;
1202
89
  XmlPrologStateInit(&parser->m_prologState);
1203
89
  if (encodingName != NULL) {
1204
0
    parser->m_protocolEncodingName = copyString(encodingName, &(parser->m_mem));
1205
0
  }
1206
89
  parser->m_curBase = NULL;
1207
89
  XmlInitEncoding(&parser->m_initEncoding, &parser->m_encoding, 0);
1208
89
  parser->m_userData = NULL;
1209
89
  parser->m_handlerArg = NULL;
1210
89
  parser->m_startElementHandler = NULL;
1211
89
  parser->m_endElementHandler = NULL;
1212
89
  parser->m_characterDataHandler = NULL;
1213
89
  parser->m_processingInstructionHandler = NULL;
1214
89
  parser->m_commentHandler = NULL;
1215
89
  parser->m_startCdataSectionHandler = NULL;
1216
89
  parser->m_endCdataSectionHandler = NULL;
1217
89
  parser->m_defaultHandler = NULL;
1218
89
  parser->m_startDoctypeDeclHandler = NULL;
1219
89
  parser->m_endDoctypeDeclHandler = NULL;
1220
89
  parser->m_unparsedEntityDeclHandler = NULL;
1221
89
  parser->m_notationDeclHandler = NULL;
1222
89
  parser->m_startNamespaceDeclHandler = NULL;
1223
89
  parser->m_endNamespaceDeclHandler = NULL;
1224
89
  parser->m_notStandaloneHandler = NULL;
1225
89
  parser->m_externalEntityRefHandler = NULL;
1226
89
  parser->m_externalEntityRefHandlerArg = parser;
1227
89
  parser->m_skippedEntityHandler = NULL;
1228
89
  parser->m_elementDeclHandler = NULL;
1229
89
  parser->m_attlistDeclHandler = NULL;
1230
89
  parser->m_entityDeclHandler = NULL;
1231
89
  parser->m_xmlDeclHandler = NULL;
1232
89
  parser->m_bufferPtr = parser->m_buffer;
1233
89
  parser->m_bufferEnd = parser->m_buffer;
1234
89
  parser->m_parseEndByteIndex = 0;
1235
89
  parser->m_parseEndPtr = NULL;
1236
89
  parser->m_partialTokenBytesBefore = 0;
1237
89
  parser->m_reparseDeferralEnabled = g_reparseDeferralEnabledDefault;
1238
89
  parser->m_lastBufferRequestSize = 0;
1239
89
  parser->m_declElementType = NULL;
1240
89
  parser->m_declAttributeId = NULL;
1241
89
  parser->m_declEntity = NULL;
1242
89
  parser->m_doctypeName = NULL;
1243
89
  parser->m_doctypeSysid = NULL;
1244
89
  parser->m_doctypePubid = NULL;
1245
89
  parser->m_declAttributeType = NULL;
1246
89
  parser->m_declNotationName = NULL;
1247
89
  parser->m_declNotationPublicId = NULL;
1248
89
  parser->m_declAttributeIsCdata = XML_FALSE;
1249
89
  parser->m_declAttributeIsId = XML_FALSE;
1250
89
  memset(&parser->m_position, 0, sizeof(POSITION));
1251
89
  parser->m_errorCode = XML_ERROR_NONE;
1252
89
  parser->m_eventPtr = NULL;
1253
89
  parser->m_eventEndPtr = NULL;
1254
89
  parser->m_positionPtr = NULL;
1255
89
  parser->m_openInternalEntities = NULL;
1256
89
  parser->m_defaultExpandInternalEntities = XML_TRUE;
1257
89
  parser->m_tagLevel = 0;
1258
89
  parser->m_tagStack = NULL;
1259
89
  parser->m_inheritedBindings = NULL;
1260
89
  parser->m_nSpecifiedAtts = 0;
1261
89
  parser->m_unknownEncodingMem = NULL;
1262
89
  parser->m_unknownEncodingRelease = NULL;
1263
89
  parser->m_unknownEncodingData = NULL;
1264
89
  parser->m_parentParser = NULL;
1265
89
  parser->m_parsingStatus.parsing = XML_INITIALIZED;
1266
89
#ifdef XML_DTD
1267
89
  parser->m_isParamEntity = XML_FALSE;
1268
89
  parser->m_useForeignDTD = XML_FALSE;
1269
89
  parser->m_paramEntityParsing = XML_PARAM_ENTITY_PARSING_NEVER;
1270
89
#endif
1271
89
  parser->m_hash_secret_salt = 0;
1272
1273
89
#if XML_GE == 1
1274
89
  memset(&parser->m_accounting, 0, sizeof(ACCOUNTING));
1275
89
  parser->m_accounting.debugLevel = getDebugLevel("EXPAT_ACCOUNTING_DEBUG", 0u);
1276
89
  parser->m_accounting.maximumAmplificationFactor
1277
89
      = EXPAT_BILLION_LAUGHS_ATTACK_PROTECTION_MAXIMUM_AMPLIFICATION_DEFAULT;
1278
89
  parser->m_accounting.activationThresholdBytes
1279
89
      = EXPAT_BILLION_LAUGHS_ATTACK_PROTECTION_ACTIVATION_THRESHOLD_DEFAULT;
1280
1281
89
  memset(&parser->m_entity_stats, 0, sizeof(ENTITY_STATS));
1282
89
  parser->m_entity_stats.debugLevel = getDebugLevel("EXPAT_ENTITY_DEBUG", 0u);
1283
89
#endif
1284
89
}
1285
1286
/* moves list of bindings to m_freeBindingList */
1287
static void FASTCALL
1288
0
moveToFreeBindingList(XML_Parser parser, BINDING *bindings) {
1289
0
  while (bindings) {
1290
0
    BINDING *b = bindings;
1291
0
    bindings = bindings->nextTagBinding;
1292
0
    b->nextTagBinding = parser->m_freeBindingList;
1293
0
    parser->m_freeBindingList = b;
1294
0
  }
1295
0
}
1296
1297
XML_Bool XMLCALL
1298
0
XML_ParserReset(XML_Parser parser, const XML_Char *encodingName) {
1299
0
  TAG *tStk;
1300
0
  OPEN_INTERNAL_ENTITY *openEntityList;
1301
1302
0
  if (parser == NULL)
1303
0
    return XML_FALSE;
1304
1305
0
  if (parser->m_parentParser)
1306
0
    return XML_FALSE;
1307
  /* move m_tagStack to m_freeTagList */
1308
0
  tStk = parser->m_tagStack;
1309
0
  while (tStk) {
1310
0
    TAG *tag = tStk;
1311
0
    tStk = tStk->parent;
1312
0
    tag->parent = parser->m_freeTagList;
1313
0
    moveToFreeBindingList(parser, tag->bindings);
1314
0
    tag->bindings = NULL;
1315
0
    parser->m_freeTagList = tag;
1316
0
  }
1317
  /* move m_openInternalEntities to m_freeInternalEntities */
1318
0
  openEntityList = parser->m_openInternalEntities;
1319
0
  while (openEntityList) {
1320
0
    OPEN_INTERNAL_ENTITY *openEntity = openEntityList;
1321
0
    openEntityList = openEntity->next;
1322
0
    openEntity->next = parser->m_freeInternalEntities;
1323
0
    parser->m_freeInternalEntities = openEntity;
1324
0
  }
1325
0
  moveToFreeBindingList(parser, parser->m_inheritedBindings);
1326
0
  FREE(parser, parser->m_unknownEncodingMem);
1327
0
  if (parser->m_unknownEncodingRelease)
1328
0
    parser->m_unknownEncodingRelease(parser->m_unknownEncodingData);
1329
0
  poolClear(&parser->m_tempPool);
1330
0
  poolClear(&parser->m_temp2Pool);
1331
0
  FREE(parser, (void *)parser->m_protocolEncodingName);
1332
0
  parser->m_protocolEncodingName = NULL;
1333
0
  parserInit(parser, encodingName);
1334
0
  dtdReset(parser->m_dtd, &parser->m_mem);
1335
0
  return XML_TRUE;
1336
0
}
1337
1338
enum XML_Status XMLCALL
1339
0
XML_SetEncoding(XML_Parser parser, const XML_Char *encodingName) {
1340
0
  if (parser == NULL)
1341
0
    return XML_STATUS_ERROR;
1342
  /* Block after XML_Parse()/XML_ParseBuffer() has been called.
1343
     XXX There's no way for the caller to determine which of the
1344
     XXX possible error cases caused the XML_STATUS_ERROR return.
1345
  */
1346
0
  if (parser->m_parsingStatus.parsing == XML_PARSING
1347
0
      || parser->m_parsingStatus.parsing == XML_SUSPENDED)
1348
0
    return XML_STATUS_ERROR;
1349
1350
  /* Get rid of any previous encoding name */
1351
0
  FREE(parser, (void *)parser->m_protocolEncodingName);
1352
1353
0
  if (encodingName == NULL)
1354
    /* No new encoding name */
1355
0
    parser->m_protocolEncodingName = NULL;
1356
0
  else {
1357
    /* Copy the new encoding name into allocated memory */
1358
0
    parser->m_protocolEncodingName = copyString(encodingName, &(parser->m_mem));
1359
0
    if (! parser->m_protocolEncodingName)
1360
0
      return XML_STATUS_ERROR;
1361
0
  }
1362
0
  return XML_STATUS_OK;
1363
0
}
1364
1365
XML_Parser XMLCALL
1366
XML_ExternalEntityParserCreate(XML_Parser oldParser, const XML_Char *context,
1367
0
                               const XML_Char *encodingName) {
1368
0
  XML_Parser parser = oldParser;
1369
0
  DTD *newDtd = NULL;
1370
0
  DTD *oldDtd;
1371
0
  XML_StartElementHandler oldStartElementHandler;
1372
0
  XML_EndElementHandler oldEndElementHandler;
1373
0
  XML_CharacterDataHandler oldCharacterDataHandler;
1374
0
  XML_ProcessingInstructionHandler oldProcessingInstructionHandler;
1375
0
  XML_CommentHandler oldCommentHandler;
1376
0
  XML_StartCdataSectionHandler oldStartCdataSectionHandler;
1377
0
  XML_EndCdataSectionHandler oldEndCdataSectionHandler;
1378
0
  XML_DefaultHandler oldDefaultHandler;
1379
0
  XML_UnparsedEntityDeclHandler oldUnparsedEntityDeclHandler;
1380
0
  XML_NotationDeclHandler oldNotationDeclHandler;
1381
0
  XML_StartNamespaceDeclHandler oldStartNamespaceDeclHandler;
1382
0
  XML_EndNamespaceDeclHandler oldEndNamespaceDeclHandler;
1383
0
  XML_NotStandaloneHandler oldNotStandaloneHandler;
1384
0
  XML_ExternalEntityRefHandler oldExternalEntityRefHandler;
1385
0
  XML_SkippedEntityHandler oldSkippedEntityHandler;
1386
0
  XML_UnknownEncodingHandler oldUnknownEncodingHandler;
1387
0
  XML_ElementDeclHandler oldElementDeclHandler;
1388
0
  XML_AttlistDeclHandler oldAttlistDeclHandler;
1389
0
  XML_EntityDeclHandler oldEntityDeclHandler;
1390
0
  XML_XmlDeclHandler oldXmlDeclHandler;
1391
0
  ELEMENT_TYPE *oldDeclElementType;
1392
1393
0
  void *oldUserData;
1394
0
  void *oldHandlerArg;
1395
0
  XML_Bool oldDefaultExpandInternalEntities;
1396
0
  XML_Parser oldExternalEntityRefHandlerArg;
1397
0
#ifdef XML_DTD
1398
0
  enum XML_ParamEntityParsing oldParamEntityParsing;
1399
0
  int oldInEntityValue;
1400
0
#endif
1401
0
  XML_Bool oldns_triplets;
1402
  /* Note that the new parser shares the same hash secret as the old
1403
     parser, so that dtdCopy and copyEntityTable can lookup values
1404
     from hash tables associated with either parser without us having
1405
     to worry which hash secrets each table has.
1406
  */
1407
0
  unsigned long oldhash_secret_salt;
1408
0
  XML_Bool oldReparseDeferralEnabled;
1409
1410
  /* Validate the oldParser parameter before we pull everything out of it */
1411
0
  if (oldParser == NULL)
1412
0
    return NULL;
1413
1414
  /* Stash the original parser contents on the stack */
1415
0
  oldDtd = parser->m_dtd;
1416
0
  oldStartElementHandler = parser->m_startElementHandler;
1417
0
  oldEndElementHandler = parser->m_endElementHandler;
1418
0
  oldCharacterDataHandler = parser->m_characterDataHandler;
1419
0
  oldProcessingInstructionHandler = parser->m_processingInstructionHandler;
1420
0
  oldCommentHandler = parser->m_commentHandler;
1421
0
  oldStartCdataSectionHandler = parser->m_startCdataSectionHandler;
1422
0
  oldEndCdataSectionHandler = parser->m_endCdataSectionHandler;
1423
0
  oldDefaultHandler = parser->m_defaultHandler;
1424
0
  oldUnparsedEntityDeclHandler = parser->m_unparsedEntityDeclHandler;
1425
0
  oldNotationDeclHandler = parser->m_notationDeclHandler;
1426
0
  oldStartNamespaceDeclHandler = parser->m_startNamespaceDeclHandler;
1427
0
  oldEndNamespaceDeclHandler = parser->m_endNamespaceDeclHandler;
1428
0
  oldNotStandaloneHandler = parser->m_notStandaloneHandler;
1429
0
  oldExternalEntityRefHandler = parser->m_externalEntityRefHandler;
1430
0
  oldSkippedEntityHandler = parser->m_skippedEntityHandler;
1431
0
  oldUnknownEncodingHandler = parser->m_unknownEncodingHandler;
1432
0
  oldElementDeclHandler = parser->m_elementDeclHandler;
1433
0
  oldAttlistDeclHandler = parser->m_attlistDeclHandler;
1434
0
  oldEntityDeclHandler = parser->m_entityDeclHandler;
1435
0
  oldXmlDeclHandler = parser->m_xmlDeclHandler;
1436
0
  oldDeclElementType = parser->m_declElementType;
1437
1438
0
  oldUserData = parser->m_userData;
1439
0
  oldHandlerArg = parser->m_handlerArg;
1440
0
  oldDefaultExpandInternalEntities = parser->m_defaultExpandInternalEntities;
1441
0
  oldExternalEntityRefHandlerArg = parser->m_externalEntityRefHandlerArg;
1442
0
#ifdef XML_DTD
1443
0
  oldParamEntityParsing = parser->m_paramEntityParsing;
1444
0
  oldInEntityValue = parser->m_prologState.inEntityValue;
1445
0
#endif
1446
0
  oldns_triplets = parser->m_ns_triplets;
1447
  /* Note that the new parser shares the same hash secret as the old
1448
     parser, so that dtdCopy and copyEntityTable can lookup values
1449
     from hash tables associated with either parser without us having
1450
     to worry which hash secrets each table has.
1451
  */
1452
0
  oldhash_secret_salt = parser->m_hash_secret_salt;
1453
0
  oldReparseDeferralEnabled = parser->m_reparseDeferralEnabled;
1454
1455
0
#ifdef XML_DTD
1456
0
  if (! context)
1457
0
    newDtd = oldDtd;
1458
0
#endif /* XML_DTD */
1459
1460
  /* Note that the magical uses of the pre-processor to make field
1461
     access look more like C++ require that `parser' be overwritten
1462
     here.  This makes this function more painful to follow than it
1463
     would be otherwise.
1464
  */
1465
0
  if (parser->m_ns) {
1466
0
    XML_Char tmp[2] = {parser->m_namespaceSeparator, 0};
1467
0
    parser = parserCreate(encodingName, &parser->m_mem, tmp, newDtd);
1468
0
  } else {
1469
0
    parser = parserCreate(encodingName, &parser->m_mem, NULL, newDtd);
1470
0
  }
1471
1472
0
  if (! parser)
1473
0
    return NULL;
1474
1475
0
  parser->m_startElementHandler = oldStartElementHandler;
1476
0
  parser->m_endElementHandler = oldEndElementHandler;
1477
0
  parser->m_characterDataHandler = oldCharacterDataHandler;
1478
0
  parser->m_processingInstructionHandler = oldProcessingInstructionHandler;
1479
0
  parser->m_commentHandler = oldCommentHandler;
1480
0
  parser->m_startCdataSectionHandler = oldStartCdataSectionHandler;
1481
0
  parser->m_endCdataSectionHandler = oldEndCdataSectionHandler;
1482
0
  parser->m_defaultHandler = oldDefaultHandler;
1483
0
  parser->m_unparsedEntityDeclHandler = oldUnparsedEntityDeclHandler;
1484
0
  parser->m_notationDeclHandler = oldNotationDeclHandler;
1485
0
  parser->m_startNamespaceDeclHandler = oldStartNamespaceDeclHandler;
1486
0
  parser->m_endNamespaceDeclHandler = oldEndNamespaceDeclHandler;
1487
0
  parser->m_notStandaloneHandler = oldNotStandaloneHandler;
1488
0
  parser->m_externalEntityRefHandler = oldExternalEntityRefHandler;
1489
0
  parser->m_skippedEntityHandler = oldSkippedEntityHandler;
1490
0
  parser->m_unknownEncodingHandler = oldUnknownEncodingHandler;
1491
0
  parser->m_elementDeclHandler = oldElementDeclHandler;
1492
0
  parser->m_attlistDeclHandler = oldAttlistDeclHandler;
1493
0
  parser->m_entityDeclHandler = oldEntityDeclHandler;
1494
0
  parser->m_xmlDeclHandler = oldXmlDeclHandler;
1495
0
  parser->m_declElementType = oldDeclElementType;
1496
0
  parser->m_userData = oldUserData;
1497
0
  if (oldUserData == oldHandlerArg)
1498
0
    parser->m_handlerArg = parser->m_userData;
1499
0
  else
1500
0
    parser->m_handlerArg = parser;
1501
0
  if (oldExternalEntityRefHandlerArg != oldParser)
1502
0
    parser->m_externalEntityRefHandlerArg = oldExternalEntityRefHandlerArg;
1503
0
  parser->m_defaultExpandInternalEntities = oldDefaultExpandInternalEntities;
1504
0
  parser->m_ns_triplets = oldns_triplets;
1505
0
  parser->m_hash_secret_salt = oldhash_secret_salt;
1506
0
  parser->m_reparseDeferralEnabled = oldReparseDeferralEnabled;
1507
0
  parser->m_parentParser = oldParser;
1508
0
#ifdef XML_DTD
1509
0
  parser->m_paramEntityParsing = oldParamEntityParsing;
1510
0
  parser->m_prologState.inEntityValue = oldInEntityValue;
1511
0
  if (context) {
1512
0
#endif /* XML_DTD */
1513
0
    if (! dtdCopy(oldParser, parser->m_dtd, oldDtd, &parser->m_mem)
1514
0
        || ! setContext(parser, context)) {
1515
0
      XML_ParserFree(parser);
1516
0
      return NULL;
1517
0
    }
1518
0
    parser->m_processor = externalEntityInitProcessor;
1519
0
#ifdef XML_DTD
1520
0
  } else {
1521
    /* The DTD instance referenced by parser->m_dtd is shared between the
1522
       document's root parser and external PE parsers, therefore one does not
1523
       need to call setContext. In addition, one also *must* not call
1524
       setContext, because this would overwrite existing prefix->binding
1525
       pointers in parser->m_dtd with ones that get destroyed with the external
1526
       PE parser. This would leave those prefixes with dangling pointers.
1527
    */
1528
0
    parser->m_isParamEntity = XML_TRUE;
1529
0
    XmlPrologStateInitExternalEntity(&parser->m_prologState);
1530
0
    parser->m_processor = externalParEntInitProcessor;
1531
0
  }
1532
0
#endif /* XML_DTD */
1533
0
  return parser;
1534
0
}
1535
1536
static void FASTCALL
1537
288
destroyBindings(BINDING *bindings, XML_Parser parser) {
1538
328
  for (;;) {
1539
328
    BINDING *b = bindings;
1540
328
    if (! b)
1541
288
      break;
1542
40
    bindings = b->nextTagBinding;
1543
40
    FREE(parser, b->uri);
1544
40
    FREE(parser, b);
1545
40
  }
1546
288
}
1547
1548
void XMLCALL
1549
89
XML_ParserFree(XML_Parser parser) {
1550
89
  TAG *tagList;
1551
89
  OPEN_INTERNAL_ENTITY *entityList;
1552
89
  if (parser == NULL)
1553
0
    return;
1554
  /* free m_tagStack and m_freeTagList */
1555
89
  tagList = parser->m_tagStack;
1556
199
  for (;;) {
1557
199
    TAG *p;
1558
199
    if (tagList == NULL) {
1559
163
      if (parser->m_freeTagList == NULL)
1560
89
        break;
1561
74
      tagList = parser->m_freeTagList;
1562
74
      parser->m_freeTagList = NULL;
1563
74
    }
1564
110
    p = tagList;
1565
110
    tagList = tagList->parent;
1566
110
    FREE(parser, p->buf);
1567
110
    destroyBindings(p->bindings, parser);
1568
110
    FREE(parser, p);
1569
110
  }
1570
  /* free m_openInternalEntities and m_freeInternalEntities */
1571
89
  entityList = parser->m_openInternalEntities;
1572
89
  for (;;) {
1573
89
    OPEN_INTERNAL_ENTITY *openEntity;
1574
89
    if (entityList == NULL) {
1575
89
      if (parser->m_freeInternalEntities == NULL)
1576
89
        break;
1577
0
      entityList = parser->m_freeInternalEntities;
1578
0
      parser->m_freeInternalEntities = NULL;
1579
0
    }
1580
0
    openEntity = entityList;
1581
0
    entityList = entityList->next;
1582
0
    FREE(parser, openEntity);
1583
0
  }
1584
1585
89
  destroyBindings(parser->m_freeBindingList, parser);
1586
89
  destroyBindings(parser->m_inheritedBindings, parser);
1587
89
  poolDestroy(&parser->m_tempPool);
1588
89
  poolDestroy(&parser->m_temp2Pool);
1589
89
  FREE(parser, (void *)parser->m_protocolEncodingName);
1590
89
#ifdef XML_DTD
1591
  /* external parameter entity parsers share the DTD structure
1592
     parser->m_dtd with the root parser, so we must not destroy it
1593
  */
1594
89
  if (! parser->m_isParamEntity && parser->m_dtd)
1595
#else
1596
  if (parser->m_dtd)
1597
#endif /* XML_DTD */
1598
89
    dtdDestroy(parser->m_dtd, (XML_Bool)! parser->m_parentParser,
1599
89
               &parser->m_mem);
1600
89
  FREE(parser, (void *)parser->m_atts);
1601
#ifdef XML_ATTR_INFO
1602
  FREE(parser, (void *)parser->m_attInfo);
1603
#endif
1604
89
  FREE(parser, parser->m_groupConnector);
1605
89
  FREE(parser, parser->m_buffer);
1606
89
  FREE(parser, parser->m_dataBuf);
1607
89
  FREE(parser, parser->m_nsAtts);
1608
89
  FREE(parser, parser->m_unknownEncodingMem);
1609
89
  if (parser->m_unknownEncodingRelease)
1610
0
    parser->m_unknownEncodingRelease(parser->m_unknownEncodingData);
1611
89
  FREE(parser, parser);
1612
89
}
1613
1614
void XMLCALL
1615
0
XML_UseParserAsHandlerArg(XML_Parser parser) {
1616
0
  if (parser != NULL)
1617
0
    parser->m_handlerArg = parser;
1618
0
}
1619
1620
enum XML_Error XMLCALL
1621
0
XML_UseForeignDTD(XML_Parser parser, XML_Bool useDTD) {
1622
0
  if (parser == NULL)
1623
0
    return XML_ERROR_INVALID_ARGUMENT;
1624
0
#ifdef XML_DTD
1625
  /* block after XML_Parse()/XML_ParseBuffer() has been called */
1626
0
  if (parser->m_parsingStatus.parsing == XML_PARSING
1627
0
      || parser->m_parsingStatus.parsing == XML_SUSPENDED)
1628
0
    return XML_ERROR_CANT_CHANGE_FEATURE_ONCE_PARSING;
1629
0
  parser->m_useForeignDTD = useDTD;
1630
0
  return XML_ERROR_NONE;
1631
#else
1632
  UNUSED_P(useDTD);
1633
  return XML_ERROR_FEATURE_REQUIRES_XML_DTD;
1634
#endif
1635
0
}
1636
1637
void XMLCALL
1638
0
XML_SetReturnNSTriplet(XML_Parser parser, int do_nst) {
1639
0
  if (parser == NULL)
1640
0
    return;
1641
  /* block after XML_Parse()/XML_ParseBuffer() has been called */
1642
0
  if (parser->m_parsingStatus.parsing == XML_PARSING
1643
0
      || parser->m_parsingStatus.parsing == XML_SUSPENDED)
1644
0
    return;
1645
0
  parser->m_ns_triplets = do_nst ? XML_TRUE : XML_FALSE;
1646
0
}
1647
1648
void XMLCALL
1649
89
XML_SetUserData(XML_Parser parser, void *p) {
1650
89
  if (parser == NULL)
1651
0
    return;
1652
89
  if (parser->m_handlerArg == parser->m_userData)
1653
89
    parser->m_handlerArg = parser->m_userData = p;
1654
0
  else
1655
0
    parser->m_userData = p;
1656
89
}
1657
1658
enum XML_Status XMLCALL
1659
0
XML_SetBase(XML_Parser parser, const XML_Char *p) {
1660
0
  if (parser == NULL)
1661
0
    return XML_STATUS_ERROR;
1662
0
  if (p) {
1663
0
    p = poolCopyString(&parser->m_dtd->pool, p);
1664
0
    if (! p)
1665
0
      return XML_STATUS_ERROR;
1666
0
    parser->m_curBase = p;
1667
0
  } else
1668
0
    parser->m_curBase = NULL;
1669
0
  return XML_STATUS_OK;
1670
0
}
1671
1672
const XML_Char *XMLCALL
1673
0
XML_GetBase(XML_Parser parser) {
1674
0
  if (parser == NULL)
1675
0
    return NULL;
1676
0
  return parser->m_curBase;
1677
0
}
1678
1679
int XMLCALL
1680
0
XML_GetSpecifiedAttributeCount(XML_Parser parser) {
1681
0
  if (parser == NULL)
1682
0
    return -1;
1683
0
  return parser->m_nSpecifiedAtts;
1684
0
}
1685
1686
int XMLCALL
1687
0
XML_GetIdAttributeIndex(XML_Parser parser) {
1688
0
  if (parser == NULL)
1689
0
    return -1;
1690
0
  return parser->m_idAttIndex;
1691
0
}
1692
1693
#ifdef XML_ATTR_INFO
1694
const XML_AttrInfo *XMLCALL
1695
XML_GetAttributeInfo(XML_Parser parser) {
1696
  if (parser == NULL)
1697
    return NULL;
1698
  return parser->m_attInfo;
1699
}
1700
#endif
1701
1702
void XMLCALL
1703
XML_SetElementHandler(XML_Parser parser, XML_StartElementHandler start,
1704
0
                      XML_EndElementHandler end) {
1705
0
  if (parser == NULL)
1706
0
    return;
1707
0
  parser->m_startElementHandler = start;
1708
0
  parser->m_endElementHandler = end;
1709
0
}
1710
1711
void XMLCALL
1712
89
XML_SetStartElementHandler(XML_Parser parser, XML_StartElementHandler start) {
1713
89
  if (parser != NULL)
1714
89
    parser->m_startElementHandler = start;
1715
89
}
1716
1717
void XMLCALL
1718
20
XML_SetEndElementHandler(XML_Parser parser, XML_EndElementHandler end) {
1719
20
  if (parser != NULL)
1720
20
    parser->m_endElementHandler = end;
1721
20
}
1722
1723
void XMLCALL
1724
XML_SetCharacterDataHandler(XML_Parser parser,
1725
20
                            XML_CharacterDataHandler handler) {
1726
20
  if (parser != NULL)
1727
20
    parser->m_characterDataHandler = handler;
1728
20
}
1729
1730
void XMLCALL
1731
XML_SetProcessingInstructionHandler(XML_Parser parser,
1732
0
                                    XML_ProcessingInstructionHandler handler) {
1733
0
  if (parser != NULL)
1734
0
    parser->m_processingInstructionHandler = handler;
1735
0
}
1736
1737
void XMLCALL
1738
0
XML_SetCommentHandler(XML_Parser parser, XML_CommentHandler handler) {
1739
0
  if (parser != NULL)
1740
0
    parser->m_commentHandler = handler;
1741
0
}
1742
1743
void XMLCALL
1744
XML_SetCdataSectionHandler(XML_Parser parser,
1745
                           XML_StartCdataSectionHandler start,
1746
0
                           XML_EndCdataSectionHandler end) {
1747
0
  if (parser == NULL)
1748
0
    return;
1749
0
  parser->m_startCdataSectionHandler = start;
1750
0
  parser->m_endCdataSectionHandler = end;
1751
0
}
1752
1753
void XMLCALL
1754
XML_SetStartCdataSectionHandler(XML_Parser parser,
1755
0
                                XML_StartCdataSectionHandler start) {
1756
0
  if (parser != NULL)
1757
0
    parser->m_startCdataSectionHandler = start;
1758
0
}
1759
1760
void XMLCALL
1761
XML_SetEndCdataSectionHandler(XML_Parser parser,
1762
0
                              XML_EndCdataSectionHandler end) {
1763
0
  if (parser != NULL)
1764
0
    parser->m_endCdataSectionHandler = end;
1765
0
}
1766
1767
void XMLCALL
1768
0
XML_SetDefaultHandler(XML_Parser parser, XML_DefaultHandler handler) {
1769
0
  if (parser == NULL)
1770
0
    return;
1771
0
  parser->m_defaultHandler = handler;
1772
0
  parser->m_defaultExpandInternalEntities = XML_FALSE;
1773
0
}
1774
1775
void XMLCALL
1776
0
XML_SetDefaultHandlerExpand(XML_Parser parser, XML_DefaultHandler handler) {
1777
0
  if (parser == NULL)
1778
0
    return;
1779
0
  parser->m_defaultHandler = handler;
1780
0
  parser->m_defaultExpandInternalEntities = XML_TRUE;
1781
0
}
1782
1783
void XMLCALL
1784
XML_SetDoctypeDeclHandler(XML_Parser parser, XML_StartDoctypeDeclHandler start,
1785
0
                          XML_EndDoctypeDeclHandler end) {
1786
0
  if (parser == NULL)
1787
0
    return;
1788
0
  parser->m_startDoctypeDeclHandler = start;
1789
0
  parser->m_endDoctypeDeclHandler = end;
1790
0
}
1791
1792
void XMLCALL
1793
XML_SetStartDoctypeDeclHandler(XML_Parser parser,
1794
0
                               XML_StartDoctypeDeclHandler start) {
1795
0
  if (parser != NULL)
1796
0
    parser->m_startDoctypeDeclHandler = start;
1797
0
}
1798
1799
void XMLCALL
1800
0
XML_SetEndDoctypeDeclHandler(XML_Parser parser, XML_EndDoctypeDeclHandler end) {
1801
0
  if (parser != NULL)
1802
0
    parser->m_endDoctypeDeclHandler = end;
1803
0
}
1804
1805
void XMLCALL
1806
XML_SetUnparsedEntityDeclHandler(XML_Parser parser,
1807
0
                                 XML_UnparsedEntityDeclHandler handler) {
1808
0
  if (parser != NULL)
1809
0
    parser->m_unparsedEntityDeclHandler = handler;
1810
0
}
1811
1812
void XMLCALL
1813
0
XML_SetNotationDeclHandler(XML_Parser parser, XML_NotationDeclHandler handler) {
1814
0
  if (parser != NULL)
1815
0
    parser->m_notationDeclHandler = handler;
1816
0
}
1817
1818
void XMLCALL
1819
XML_SetNamespaceDeclHandler(XML_Parser parser,
1820
                            XML_StartNamespaceDeclHandler start,
1821
0
                            XML_EndNamespaceDeclHandler end) {
1822
0
  if (parser == NULL)
1823
0
    return;
1824
0
  parser->m_startNamespaceDeclHandler = start;
1825
0
  parser->m_endNamespaceDeclHandler = end;
1826
0
}
1827
1828
void XMLCALL
1829
XML_SetStartNamespaceDeclHandler(XML_Parser parser,
1830
0
                                 XML_StartNamespaceDeclHandler start) {
1831
0
  if (parser != NULL)
1832
0
    parser->m_startNamespaceDeclHandler = start;
1833
0
}
1834
1835
void XMLCALL
1836
XML_SetEndNamespaceDeclHandler(XML_Parser parser,
1837
0
                               XML_EndNamespaceDeclHandler end) {
1838
0
  if (parser != NULL)
1839
0
    parser->m_endNamespaceDeclHandler = end;
1840
0
}
1841
1842
void XMLCALL
1843
XML_SetNotStandaloneHandler(XML_Parser parser,
1844
0
                            XML_NotStandaloneHandler handler) {
1845
0
  if (parser != NULL)
1846
0
    parser->m_notStandaloneHandler = handler;
1847
0
}
1848
1849
void XMLCALL
1850
XML_SetExternalEntityRefHandler(XML_Parser parser,
1851
0
                                XML_ExternalEntityRefHandler handler) {
1852
0
  if (parser != NULL)
1853
0
    parser->m_externalEntityRefHandler = handler;
1854
0
}
1855
1856
void XMLCALL
1857
0
XML_SetExternalEntityRefHandlerArg(XML_Parser parser, void *arg) {
1858
0
  if (parser == NULL)
1859
0
    return;
1860
0
  if (arg)
1861
0
    parser->m_externalEntityRefHandlerArg = (XML_Parser)arg;
1862
0
  else
1863
0
    parser->m_externalEntityRefHandlerArg = parser;
1864
0
}
1865
1866
void XMLCALL
1867
XML_SetSkippedEntityHandler(XML_Parser parser,
1868
0
                            XML_SkippedEntityHandler handler) {
1869
0
  if (parser != NULL)
1870
0
    parser->m_skippedEntityHandler = handler;
1871
0
}
1872
1873
void XMLCALL
1874
XML_SetUnknownEncodingHandler(XML_Parser parser,
1875
0
                              XML_UnknownEncodingHandler handler, void *data) {
1876
0
  if (parser == NULL)
1877
0
    return;
1878
0
  parser->m_unknownEncodingHandler = handler;
1879
0
  parser->m_unknownEncodingHandlerData = data;
1880
0
}
1881
1882
void XMLCALL
1883
0
XML_SetElementDeclHandler(XML_Parser parser, XML_ElementDeclHandler eldecl) {
1884
0
  if (parser != NULL)
1885
0
    parser->m_elementDeclHandler = eldecl;
1886
0
}
1887
1888
void XMLCALL
1889
0
XML_SetAttlistDeclHandler(XML_Parser parser, XML_AttlistDeclHandler attdecl) {
1890
0
  if (parser != NULL)
1891
0
    parser->m_attlistDeclHandler = attdecl;
1892
0
}
1893
1894
void XMLCALL
1895
0
XML_SetEntityDeclHandler(XML_Parser parser, XML_EntityDeclHandler handler) {
1896
0
  if (parser != NULL)
1897
0
    parser->m_entityDeclHandler = handler;
1898
0
}
1899
1900
void XMLCALL
1901
0
XML_SetXmlDeclHandler(XML_Parser parser, XML_XmlDeclHandler handler) {
1902
0
  if (parser != NULL)
1903
0
    parser->m_xmlDeclHandler = handler;
1904
0
}
1905
1906
int XMLCALL
1907
XML_SetParamEntityParsing(XML_Parser parser,
1908
89
                          enum XML_ParamEntityParsing peParsing) {
1909
89
  if (parser == NULL)
1910
0
    return 0;
1911
  /* block after XML_Parse()/XML_ParseBuffer() has been called */
1912
89
  if (parser->m_parsingStatus.parsing == XML_PARSING
1913
89
      || parser->m_parsingStatus.parsing == XML_SUSPENDED)
1914
0
    return 0;
1915
89
#ifdef XML_DTD
1916
89
  parser->m_paramEntityParsing = peParsing;
1917
89
  return 1;
1918
#else
1919
  return peParsing == XML_PARAM_ENTITY_PARSING_NEVER;
1920
#endif
1921
89
}
1922
1923
int XMLCALL
1924
0
XML_SetHashSalt(XML_Parser parser, unsigned long hash_salt) {
1925
0
  if (parser == NULL)
1926
0
    return 0;
1927
0
  if (parser->m_parentParser)
1928
0
    return XML_SetHashSalt(parser->m_parentParser, hash_salt);
1929
  /* block after XML_Parse()/XML_ParseBuffer() has been called */
1930
0
  if (parser->m_parsingStatus.parsing == XML_PARSING
1931
0
      || parser->m_parsingStatus.parsing == XML_SUSPENDED)
1932
0
    return 0;
1933
0
  parser->m_hash_secret_salt = hash_salt;
1934
0
  return 1;
1935
0
}
1936
1937
enum XML_Status XMLCALL
1938
89
XML_Parse(XML_Parser parser, const char *s, int len, int isFinal) {
1939
89
  void *buff;
1940
1941
89
  if ((parser == NULL) || (len < 0) || ((s == NULL) && (len != 0))) {
1942
0
    if (parser != NULL)
1943
0
      parser->m_errorCode = XML_ERROR_INVALID_ARGUMENT;
1944
0
    return XML_STATUS_ERROR;
1945
0
  }
1946
89
  switch (parser->m_parsingStatus.parsing) {
1947
0
  case XML_SUSPENDED:
1948
0
    parser->m_errorCode = XML_ERROR_SUSPENDED;
1949
0
    return XML_STATUS_ERROR;
1950
0
  case XML_FINISHED:
1951
0
    parser->m_errorCode = XML_ERROR_FINISHED;
1952
0
    return XML_STATUS_ERROR;
1953
89
  case XML_INITIALIZED:
1954
89
    if (parser->m_parentParser == NULL && ! startParsing(parser)) {
1955
0
      parser->m_errorCode = XML_ERROR_NO_MEMORY;
1956
0
      return XML_STATUS_ERROR;
1957
0
    }
1958
    /* fall through */
1959
89
  default:
1960
89
    parser->m_parsingStatus.parsing = XML_PARSING;
1961
89
  }
1962
1963
#if XML_CONTEXT_BYTES == 0
1964
  if (parser->m_bufferPtr == parser->m_bufferEnd) {
1965
    const char *end;
1966
    int nLeftOver;
1967
    enum XML_Status result;
1968
    /* Detect overflow (a+b > MAX <==> b > MAX-a) */
1969
    if ((XML_Size)len > ((XML_Size)-1) / 2 - parser->m_parseEndByteIndex) {
1970
      parser->m_errorCode = XML_ERROR_NO_MEMORY;
1971
      parser->m_eventPtr = parser->m_eventEndPtr = NULL;
1972
      parser->m_processor = errorProcessor;
1973
      return XML_STATUS_ERROR;
1974
    }
1975
    // though this isn't a buffer request, we assume that `len` is the app's
1976
    // preferred buffer fill size, and therefore save it here.
1977
    parser->m_lastBufferRequestSize = len;
1978
    parser->m_parseEndByteIndex += len;
1979
    parser->m_positionPtr = s;
1980
    parser->m_parsingStatus.finalBuffer = (XML_Bool)isFinal;
1981
1982
    parser->m_errorCode
1983
        = callProcessor(parser, s, parser->m_parseEndPtr = s + len, &end);
1984
1985
    if (parser->m_errorCode != XML_ERROR_NONE) {
1986
      parser->m_eventEndPtr = parser->m_eventPtr;
1987
      parser->m_processor = errorProcessor;
1988
      return XML_STATUS_ERROR;
1989
    } else {
1990
      switch (parser->m_parsingStatus.parsing) {
1991
      case XML_SUSPENDED:
1992
        result = XML_STATUS_SUSPENDED;
1993
        break;
1994
      case XML_INITIALIZED:
1995
      case XML_PARSING:
1996
        if (isFinal) {
1997
          parser->m_parsingStatus.parsing = XML_FINISHED;
1998
          return XML_STATUS_OK;
1999
        }
2000
      /* fall through */
2001
      default:
2002
        result = XML_STATUS_OK;
2003
      }
2004
    }
2005
2006
    XmlUpdatePosition(parser->m_encoding, parser->m_positionPtr, end,
2007
                      &parser->m_position);
2008
    nLeftOver = s + len - end;
2009
    if (nLeftOver) {
2010
      // Back up and restore the parsing status to avoid XML_ERROR_SUSPENDED
2011
      // (and XML_ERROR_FINISHED) from XML_GetBuffer.
2012
      const enum XML_Parsing originalStatus = parser->m_parsingStatus.parsing;
2013
      parser->m_parsingStatus.parsing = XML_PARSING;
2014
      void *const temp = XML_GetBuffer(parser, nLeftOver);
2015
      parser->m_parsingStatus.parsing = originalStatus;
2016
      // GetBuffer may have overwritten this, but we want to remember what the
2017
      // app requested, not how many bytes were left over after parsing.
2018
      parser->m_lastBufferRequestSize = len;
2019
      if (temp == NULL) {
2020
        // NOTE: parser->m_errorCode has already been set by XML_GetBuffer().
2021
        parser->m_eventPtr = parser->m_eventEndPtr = NULL;
2022
        parser->m_processor = errorProcessor;
2023
        return XML_STATUS_ERROR;
2024
      }
2025
      // Since we know that the buffer was empty and XML_CONTEXT_BYTES is 0, we
2026
      // don't have any data to preserve, and can copy straight into the start
2027
      // of the buffer rather than the GetBuffer return pointer (which may be
2028
      // pointing further into the allocated buffer).
2029
      memcpy(parser->m_buffer, end, nLeftOver);
2030
    }
2031
    parser->m_bufferPtr = parser->m_buffer;
2032
    parser->m_bufferEnd = parser->m_buffer + nLeftOver;
2033
    parser->m_positionPtr = parser->m_bufferPtr;
2034
    parser->m_parseEndPtr = parser->m_bufferEnd;
2035
    parser->m_eventPtr = parser->m_bufferPtr;
2036
    parser->m_eventEndPtr = parser->m_bufferPtr;
2037
    return result;
2038
  }
2039
#endif /* XML_CONTEXT_BYTES == 0 */
2040
89
  buff = XML_GetBuffer(parser, len);
2041
89
  if (buff == NULL)
2042
0
    return XML_STATUS_ERROR;
2043
89
  if (len > 0) {
2044
89
    assert(s != NULL); // make sure s==NULL && len!=0 was rejected above
2045
89
    memcpy(buff, s, len);
2046
89
  }
2047
89
  return XML_ParseBuffer(parser, len, isFinal);
2048
89
}
2049
2050
enum XML_Status XMLCALL
2051
89
XML_ParseBuffer(XML_Parser parser, int len, int isFinal) {
2052
89
  const char *start;
2053
89
  enum XML_Status result = XML_STATUS_OK;
2054
2055
89
  if (parser == NULL)
2056
0
    return XML_STATUS_ERROR;
2057
2058
89
  if (len < 0) {
2059
0
    parser->m_errorCode = XML_ERROR_INVALID_ARGUMENT;
2060
0
    return XML_STATUS_ERROR;
2061
0
  }
2062
2063
89
  switch (parser->m_parsingStatus.parsing) {
2064
0
  case XML_SUSPENDED:
2065
0
    parser->m_errorCode = XML_ERROR_SUSPENDED;
2066
0
    return XML_STATUS_ERROR;
2067
0
  case XML_FINISHED:
2068
0
    parser->m_errorCode = XML_ERROR_FINISHED;
2069
0
    return XML_STATUS_ERROR;
2070
0
  case XML_INITIALIZED:
2071
    /* Has someone called XML_GetBuffer successfully before? */
2072
0
    if (! parser->m_bufferPtr) {
2073
0
      parser->m_errorCode = XML_ERROR_NO_BUFFER;
2074
0
      return XML_STATUS_ERROR;
2075
0
    }
2076
2077
0
    if (parser->m_parentParser == NULL && ! startParsing(parser)) {
2078
0
      parser->m_errorCode = XML_ERROR_NO_MEMORY;
2079
0
      return XML_STATUS_ERROR;
2080
0
    }
2081
    /* fall through */
2082
89
  default:
2083
89
    parser->m_parsingStatus.parsing = XML_PARSING;
2084
89
  }
2085
2086
89
  start = parser->m_bufferPtr;
2087
89
  parser->m_positionPtr = start;
2088
89
  parser->m_bufferEnd += len;
2089
89
  parser->m_parseEndPtr = parser->m_bufferEnd;
2090
89
  parser->m_parseEndByteIndex += len;
2091
89
  parser->m_parsingStatus.finalBuffer = (XML_Bool)isFinal;
2092
2093
89
  parser->m_errorCode = callProcessor(parser, start, parser->m_parseEndPtr,
2094
89
                                      &parser->m_bufferPtr);
2095
2096
89
  if (parser->m_errorCode != XML_ERROR_NONE) {
2097
17
    parser->m_eventEndPtr = parser->m_eventPtr;
2098
17
    parser->m_processor = errorProcessor;
2099
17
    return XML_STATUS_ERROR;
2100
72
  } else {
2101
72
    switch (parser->m_parsingStatus.parsing) {
2102
0
    case XML_SUSPENDED:
2103
0
      result = XML_STATUS_SUSPENDED;
2104
0
      break;
2105
0
    case XML_INITIALIZED:
2106
72
    case XML_PARSING:
2107
72
      if (isFinal) {
2108
72
        parser->m_parsingStatus.parsing = XML_FINISHED;
2109
72
        return result;
2110
72
      }
2111
0
    default:; /* should not happen */
2112
72
    }
2113
72
  }
2114
2115
0
  XmlUpdatePosition(parser->m_encoding, parser->m_positionPtr,
2116
0
                    parser->m_bufferPtr, &parser->m_position);
2117
0
  parser->m_positionPtr = parser->m_bufferPtr;
2118
0
  return result;
2119
89
}
2120
2121
void *XMLCALL
2122
89
XML_GetBuffer(XML_Parser parser, int len) {
2123
89
  if (parser == NULL)
2124
0
    return NULL;
2125
89
  if (len < 0) {
2126
0
    parser->m_errorCode = XML_ERROR_NO_MEMORY;
2127
0
    return NULL;
2128
0
  }
2129
89
  switch (parser->m_parsingStatus.parsing) {
2130
0
  case XML_SUSPENDED:
2131
0
    parser->m_errorCode = XML_ERROR_SUSPENDED;
2132
0
    return NULL;
2133
0
  case XML_FINISHED:
2134
0
    parser->m_errorCode = XML_ERROR_FINISHED;
2135
0
    return NULL;
2136
89
  default:;
2137
89
  }
2138
2139
  // whether or not the request succeeds, `len` seems to be the app's preferred
2140
  // buffer fill size; remember it.
2141
89
  parser->m_lastBufferRequestSize = len;
2142
89
  if (len > EXPAT_SAFE_PTR_DIFF(parser->m_bufferLim, parser->m_bufferEnd)
2143
89
      || parser->m_buffer == NULL) {
2144
89
#if XML_CONTEXT_BYTES > 0
2145
89
    int keep;
2146
89
#endif /* XML_CONTEXT_BYTES > 0 */
2147
    /* Do not invoke signed arithmetic overflow: */
2148
89
    int neededSize = (int)((unsigned)len
2149
89
                           + (unsigned)EXPAT_SAFE_PTR_DIFF(
2150
89
                               parser->m_bufferEnd, parser->m_bufferPtr));
2151
89
    if (neededSize < 0) {
2152
0
      parser->m_errorCode = XML_ERROR_NO_MEMORY;
2153
0
      return NULL;
2154
0
    }
2155
89
#if XML_CONTEXT_BYTES > 0
2156
89
    keep = (int)EXPAT_SAFE_PTR_DIFF(parser->m_bufferPtr, parser->m_buffer);
2157
89
    if (keep > XML_CONTEXT_BYTES)
2158
0
      keep = XML_CONTEXT_BYTES;
2159
    /* Detect and prevent integer overflow */
2160
89
    if (keep > INT_MAX - neededSize) {
2161
0
      parser->m_errorCode = XML_ERROR_NO_MEMORY;
2162
0
      return NULL;
2163
0
    }
2164
89
    neededSize += keep;
2165
89
#endif /* XML_CONTEXT_BYTES > 0 */
2166
89
    if (parser->m_buffer && parser->m_bufferPtr
2167
0
        && neededSize
2168
0
               <= EXPAT_SAFE_PTR_DIFF(parser->m_bufferLim, parser->m_buffer)) {
2169
0
#if XML_CONTEXT_BYTES > 0
2170
0
      if (keep < EXPAT_SAFE_PTR_DIFF(parser->m_bufferPtr, parser->m_buffer)) {
2171
0
        int offset
2172
0
            = (int)EXPAT_SAFE_PTR_DIFF(parser->m_bufferPtr, parser->m_buffer)
2173
0
              - keep;
2174
        /* The buffer pointers cannot be NULL here; we have at least some bytes
2175
         * in the buffer */
2176
0
        memmove(parser->m_buffer, &parser->m_buffer[offset],
2177
0
                parser->m_bufferEnd - parser->m_bufferPtr + keep);
2178
0
        parser->m_bufferEnd -= offset;
2179
0
        parser->m_bufferPtr -= offset;
2180
0
      }
2181
#else
2182
      memmove(parser->m_buffer, parser->m_bufferPtr,
2183
              EXPAT_SAFE_PTR_DIFF(parser->m_bufferEnd, parser->m_bufferPtr));
2184
      parser->m_bufferEnd
2185
          = parser->m_buffer
2186
            + EXPAT_SAFE_PTR_DIFF(parser->m_bufferEnd, parser->m_bufferPtr);
2187
      parser->m_bufferPtr = parser->m_buffer;
2188
#endif /* XML_CONTEXT_BYTES > 0 */
2189
89
    } else {
2190
89
      char *newBuf;
2191
89
      int bufferSize
2192
89
          = (int)EXPAT_SAFE_PTR_DIFF(parser->m_bufferLim, parser->m_buffer);
2193
89
      if (bufferSize == 0)
2194
89
        bufferSize = INIT_BUFFER_SIZE;
2195
216
      do {
2196
        /* Do not invoke signed arithmetic overflow: */
2197
216
        bufferSize = (int)(2U * (unsigned)bufferSize);
2198
216
      } while (bufferSize < neededSize && bufferSize > 0);
2199
89
      if (bufferSize <= 0) {
2200
0
        parser->m_errorCode = XML_ERROR_NO_MEMORY;
2201
0
        return NULL;
2202
0
      }
2203
89
      newBuf = (char *)MALLOC(parser, bufferSize);
2204
89
      if (newBuf == 0) {
2205
0
        parser->m_errorCode = XML_ERROR_NO_MEMORY;
2206
0
        return NULL;
2207
0
      }
2208
89
      parser->m_bufferLim = newBuf + bufferSize;
2209
89
#if XML_CONTEXT_BYTES > 0
2210
89
      if (parser->m_bufferPtr) {
2211
0
        memcpy(newBuf, &parser->m_bufferPtr[-keep],
2212
0
               EXPAT_SAFE_PTR_DIFF(parser->m_bufferEnd, parser->m_bufferPtr)
2213
0
                   + keep);
2214
0
        FREE(parser, parser->m_buffer);
2215
0
        parser->m_buffer = newBuf;
2216
0
        parser->m_bufferEnd
2217
0
            = parser->m_buffer
2218
0
              + EXPAT_SAFE_PTR_DIFF(parser->m_bufferEnd, parser->m_bufferPtr)
2219
0
              + keep;
2220
0
        parser->m_bufferPtr = parser->m_buffer + keep;
2221
89
      } else {
2222
        /* This must be a brand new buffer with no data in it yet */
2223
89
        parser->m_bufferEnd = newBuf;
2224
89
        parser->m_bufferPtr = parser->m_buffer = newBuf;
2225
89
      }
2226
#else
2227
      if (parser->m_bufferPtr) {
2228
        memcpy(newBuf, parser->m_bufferPtr,
2229
               EXPAT_SAFE_PTR_DIFF(parser->m_bufferEnd, parser->m_bufferPtr));
2230
        FREE(parser, parser->m_buffer);
2231
        parser->m_bufferEnd
2232
            = newBuf
2233
              + EXPAT_SAFE_PTR_DIFF(parser->m_bufferEnd, parser->m_bufferPtr);
2234
      } else {
2235
        /* This must be a brand new buffer with no data in it yet */
2236
        parser->m_bufferEnd = newBuf;
2237
      }
2238
      parser->m_bufferPtr = parser->m_buffer = newBuf;
2239
#endif /* XML_CONTEXT_BYTES > 0 */
2240
89
    }
2241
89
    parser->m_eventPtr = parser->m_eventEndPtr = NULL;
2242
89
    parser->m_positionPtr = NULL;
2243
89
  }
2244
89
  return parser->m_bufferEnd;
2245
89
}
2246
2247
enum XML_Status XMLCALL
2248
0
XML_StopParser(XML_Parser parser, XML_Bool resumable) {
2249
0
  if (parser == NULL)
2250
0
    return XML_STATUS_ERROR;
2251
0
  switch (parser->m_parsingStatus.parsing) {
2252
0
  case XML_INITIALIZED:
2253
0
    parser->m_errorCode = XML_ERROR_NOT_STARTED;
2254
0
    return XML_STATUS_ERROR;
2255
0
  case XML_SUSPENDED:
2256
0
    if (resumable) {
2257
0
      parser->m_errorCode = XML_ERROR_SUSPENDED;
2258
0
      return XML_STATUS_ERROR;
2259
0
    }
2260
0
    parser->m_parsingStatus.parsing = XML_FINISHED;
2261
0
    break;
2262
0
  case XML_FINISHED:
2263
0
    parser->m_errorCode = XML_ERROR_FINISHED;
2264
0
    return XML_STATUS_ERROR;
2265
0
  case XML_PARSING:
2266
0
    if (resumable) {
2267
0
#ifdef XML_DTD
2268
0
      if (parser->m_isParamEntity) {
2269
0
        parser->m_errorCode = XML_ERROR_SUSPEND_PE;
2270
0
        return XML_STATUS_ERROR;
2271
0
      }
2272
0
#endif
2273
0
      parser->m_parsingStatus.parsing = XML_SUSPENDED;
2274
0
    } else
2275
0
      parser->m_parsingStatus.parsing = XML_FINISHED;
2276
0
    break;
2277
0
  default:
2278
0
    assert(0);
2279
0
  }
2280
0
  return XML_STATUS_OK;
2281
0
}
2282
2283
enum XML_Status XMLCALL
2284
0
XML_ResumeParser(XML_Parser parser) {
2285
0
  enum XML_Status result = XML_STATUS_OK;
2286
2287
0
  if (parser == NULL)
2288
0
    return XML_STATUS_ERROR;
2289
0
  if (parser->m_parsingStatus.parsing != XML_SUSPENDED) {
2290
0
    parser->m_errorCode = XML_ERROR_NOT_SUSPENDED;
2291
0
    return XML_STATUS_ERROR;
2292
0
  }
2293
0
  parser->m_parsingStatus.parsing = XML_PARSING;
2294
2295
0
  parser->m_errorCode = callProcessor(
2296
0
      parser, parser->m_bufferPtr, parser->m_parseEndPtr, &parser->m_bufferPtr);
2297
2298
0
  if (parser->m_errorCode != XML_ERROR_NONE) {
2299
0
    parser->m_eventEndPtr = parser->m_eventPtr;
2300
0
    parser->m_processor = errorProcessor;
2301
0
    return XML_STATUS_ERROR;
2302
0
  } else {
2303
0
    switch (parser->m_parsingStatus.parsing) {
2304
0
    case XML_SUSPENDED:
2305
0
      result = XML_STATUS_SUSPENDED;
2306
0
      break;
2307
0
    case XML_INITIALIZED:
2308
0
    case XML_PARSING:
2309
0
      if (parser->m_parsingStatus.finalBuffer) {
2310
0
        parser->m_parsingStatus.parsing = XML_FINISHED;
2311
0
        return result;
2312
0
      }
2313
0
    default:;
2314
0
    }
2315
0
  }
2316
2317
0
  XmlUpdatePosition(parser->m_encoding, parser->m_positionPtr,
2318
0
                    parser->m_bufferPtr, &parser->m_position);
2319
0
  parser->m_positionPtr = parser->m_bufferPtr;
2320
0
  return result;
2321
0
}
2322
2323
void XMLCALL
2324
0
XML_GetParsingStatus(XML_Parser parser, XML_ParsingStatus *status) {
2325
0
  if (parser == NULL)
2326
0
    return;
2327
0
  assert(status != NULL);
2328
0
  *status = parser->m_parsingStatus;
2329
0
}
2330
2331
enum XML_Error XMLCALL
2332
34
XML_GetErrorCode(XML_Parser parser) {
2333
34
  if (parser == NULL)
2334
0
    return XML_ERROR_INVALID_ARGUMENT;
2335
34
  return parser->m_errorCode;
2336
34
}
2337
2338
XML_Index XMLCALL
2339
0
XML_GetCurrentByteIndex(XML_Parser parser) {
2340
0
  if (parser == NULL)
2341
0
    return -1;
2342
0
  if (parser->m_eventPtr)
2343
0
    return (XML_Index)(parser->m_parseEndByteIndex
2344
0
                       - (parser->m_parseEndPtr - parser->m_eventPtr));
2345
0
  return -1;
2346
0
}
2347
2348
int XMLCALL
2349
0
XML_GetCurrentByteCount(XML_Parser parser) {
2350
0
  if (parser == NULL)
2351
0
    return 0;
2352
0
  if (parser->m_eventEndPtr && parser->m_eventPtr)
2353
0
    return (int)(parser->m_eventEndPtr - parser->m_eventPtr);
2354
0
  return 0;
2355
0
}
2356
2357
const char *XMLCALL
2358
0
XML_GetInputContext(XML_Parser parser, int *offset, int *size) {
2359
0
#if XML_CONTEXT_BYTES > 0
2360
0
  if (parser == NULL)
2361
0
    return NULL;
2362
0
  if (parser->m_eventPtr && parser->m_buffer) {
2363
0
    if (offset != NULL)
2364
0
      *offset = (int)(parser->m_eventPtr - parser->m_buffer);
2365
0
    if (size != NULL)
2366
0
      *size = (int)(parser->m_bufferEnd - parser->m_buffer);
2367
0
    return parser->m_buffer;
2368
0
  }
2369
#else
2370
  (void)parser;
2371
  (void)offset;
2372
  (void)size;
2373
#endif /* XML_CONTEXT_BYTES > 0 */
2374
0
  return (const char *)0;
2375
0
}
2376
2377
XML_Size XMLCALL
2378
0
XML_GetCurrentLineNumber(XML_Parser parser) {
2379
0
  if (parser == NULL)
2380
0
    return 0;
2381
0
  if (parser->m_eventPtr && parser->m_eventPtr >= parser->m_positionPtr) {
2382
0
    XmlUpdatePosition(parser->m_encoding, parser->m_positionPtr,
2383
0
                      parser->m_eventPtr, &parser->m_position);
2384
0
    parser->m_positionPtr = parser->m_eventPtr;
2385
0
  }
2386
0
  return parser->m_position.lineNumber + 1;
2387
0
}
2388
2389
XML_Size XMLCALL
2390
0
XML_GetCurrentColumnNumber(XML_Parser parser) {
2391
0
  if (parser == NULL)
2392
0
    return 0;
2393
0
  if (parser->m_eventPtr && parser->m_eventPtr >= parser->m_positionPtr) {
2394
0
    XmlUpdatePosition(parser->m_encoding, parser->m_positionPtr,
2395
0
                      parser->m_eventPtr, &parser->m_position);
2396
0
    parser->m_positionPtr = parser->m_eventPtr;
2397
0
  }
2398
0
  return parser->m_position.columnNumber;
2399
0
}
2400
2401
void XMLCALL
2402
0
XML_FreeContentModel(XML_Parser parser, XML_Content *model) {
2403
0
  if (parser != NULL)
2404
0
    FREE(parser, model);
2405
0
}
2406
2407
void *XMLCALL
2408
0
XML_MemMalloc(XML_Parser parser, size_t size) {
2409
0
  if (parser == NULL)
2410
0
    return NULL;
2411
0
  return MALLOC(parser, size);
2412
0
}
2413
2414
void *XMLCALL
2415
0
XML_MemRealloc(XML_Parser parser, void *ptr, size_t size) {
2416
0
  if (parser == NULL)
2417
0
    return NULL;
2418
0
  return REALLOC(parser, ptr, size);
2419
0
}
2420
2421
void XMLCALL
2422
0
XML_MemFree(XML_Parser parser, void *ptr) {
2423
0
  if (parser != NULL)
2424
0
    FREE(parser, ptr);
2425
0
}
2426
2427
void XMLCALL
2428
0
XML_DefaultCurrent(XML_Parser parser) {
2429
0
  if (parser == NULL)
2430
0
    return;
2431
0
  if (parser->m_defaultHandler) {
2432
0
    if (parser->m_openInternalEntities)
2433
0
      reportDefault(parser, parser->m_internalEncoding,
2434
0
                    parser->m_openInternalEntities->internalEventPtr,
2435
0
                    parser->m_openInternalEntities->internalEventEndPtr);
2436
0
    else
2437
0
      reportDefault(parser, parser->m_encoding, parser->m_eventPtr,
2438
0
                    parser->m_eventEndPtr);
2439
0
  }
2440
0
}
2441
2442
const XML_LChar *XMLCALL
2443
34
XML_ErrorString(enum XML_Error code) {
2444
34
  switch (code) {
2445
0
  case XML_ERROR_NONE:
2446
0
    return NULL;
2447
0
  case XML_ERROR_NO_MEMORY:
2448
0
    return XML_L("out of memory");
2449
0
  case XML_ERROR_SYNTAX:
2450
0
    return XML_L("syntax error");
2451
0
  case XML_ERROR_NO_ELEMENTS:
2452
0
    return XML_L("no element found");
2453
34
  case XML_ERROR_INVALID_TOKEN:
2454
34
    return XML_L("not well-formed (invalid token)");
2455
0
  case XML_ERROR_UNCLOSED_TOKEN:
2456
0
    return XML_L("unclosed token");
2457
0
  case XML_ERROR_PARTIAL_CHAR:
2458
0
    return XML_L("partial character");
2459
0
  case XML_ERROR_TAG_MISMATCH:
2460
0
    return XML_L("mismatched tag");
2461
0
  case XML_ERROR_DUPLICATE_ATTRIBUTE:
2462
0
    return XML_L("duplicate attribute");
2463
0
  case XML_ERROR_JUNK_AFTER_DOC_ELEMENT:
2464
0
    return XML_L("junk after document element");
2465
0
  case XML_ERROR_PARAM_ENTITY_REF:
2466
0
    return XML_L("illegal parameter entity reference");
2467
0
  case XML_ERROR_UNDEFINED_ENTITY:
2468
0
    return XML_L("undefined entity");
2469
0
  case XML_ERROR_RECURSIVE_ENTITY_REF:
2470
0
    return XML_L("recursive entity reference");
2471
0
  case XML_ERROR_ASYNC_ENTITY:
2472
0
    return XML_L("asynchronous entity");
2473
0
  case XML_ERROR_BAD_CHAR_REF:
2474
0
    return XML_L("reference to invalid character number");
2475
0
  case XML_ERROR_BINARY_ENTITY_REF:
2476
0
    return XML_L("reference to binary entity");
2477
0
  case XML_ERROR_ATTRIBUTE_EXTERNAL_ENTITY_REF:
2478
0
    return XML_L("reference to external entity in attribute");
2479
0
  case XML_ERROR_MISPLACED_XML_PI:
2480
0
    return XML_L("XML or text declaration not at start of entity");
2481
0
  case XML_ERROR_UNKNOWN_ENCODING:
2482
0
    return XML_L("unknown encoding");
2483
0
  case XML_ERROR_INCORRECT_ENCODING:
2484
0
    return XML_L("encoding specified in XML declaration is incorrect");
2485
0
  case XML_ERROR_UNCLOSED_CDATA_SECTION:
2486
0
    return XML_L("unclosed CDATA section");
2487
0
  case XML_ERROR_EXTERNAL_ENTITY_HANDLING:
2488
0
    return XML_L("error in processing external entity reference");
2489
0
  case XML_ERROR_NOT_STANDALONE:
2490
0
    return XML_L("document is not standalone");
2491
0
  case XML_ERROR_UNEXPECTED_STATE:
2492
0
    return XML_L("unexpected parser state - please send a bug report");
2493
0
  case XML_ERROR_ENTITY_DECLARED_IN_PE:
2494
0
    return XML_L("entity declared in parameter entity");
2495
0
  case XML_ERROR_FEATURE_REQUIRES_XML_DTD:
2496
0
    return XML_L("requested feature requires XML_DTD support in Expat");
2497
0
  case XML_ERROR_CANT_CHANGE_FEATURE_ONCE_PARSING:
2498
0
    return XML_L("cannot change setting once parsing has begun");
2499
  /* Added in 1.95.7. */
2500
0
  case XML_ERROR_UNBOUND_PREFIX:
2501
0
    return XML_L("unbound prefix");
2502
  /* Added in 1.95.8. */
2503
0
  case XML_ERROR_UNDECLARING_PREFIX:
2504
0
    return XML_L("must not undeclare prefix");
2505
0
  case XML_ERROR_INCOMPLETE_PE:
2506
0
    return XML_L("incomplete markup in parameter entity");
2507
0
  case XML_ERROR_XML_DECL:
2508
0
    return XML_L("XML declaration not well-formed");
2509
0
  case XML_ERROR_TEXT_DECL:
2510
0
    return XML_L("text declaration not well-formed");
2511
0
  case XML_ERROR_PUBLICID:
2512
0
    return XML_L("illegal character(s) in public id");
2513
0
  case XML_ERROR_SUSPENDED:
2514
0
    return XML_L("parser suspended");
2515
0
  case XML_ERROR_NOT_SUSPENDED:
2516
0
    return XML_L("parser not suspended");
2517
0
  case XML_ERROR_ABORTED:
2518
0
    return XML_L("parsing aborted");
2519
0
  case XML_ERROR_FINISHED:
2520
0
    return XML_L("parsing finished");
2521
0
  case XML_ERROR_SUSPEND_PE:
2522
0
    return XML_L("cannot suspend in external parameter entity");
2523
  /* Added in 2.0.0. */
2524
0
  case XML_ERROR_RESERVED_PREFIX_XML:
2525
0
    return XML_L(
2526
0
        "reserved prefix (xml) must not be undeclared or bound to another namespace name");
2527
0
  case XML_ERROR_RESERVED_PREFIX_XMLNS:
2528
0
    return XML_L("reserved prefix (xmlns) must not be declared or undeclared");
2529
0
  case XML_ERROR_RESERVED_NAMESPACE_URI:
2530
0
    return XML_L(
2531
0
        "prefix must not be bound to one of the reserved namespace names");
2532
  /* Added in 2.2.5. */
2533
0
  case XML_ERROR_INVALID_ARGUMENT: /* Constant added in 2.2.1, already */
2534
0
    return XML_L("invalid argument");
2535
    /* Added in 2.3.0. */
2536
0
  case XML_ERROR_NO_BUFFER:
2537
0
    return XML_L(
2538
0
        "a successful prior call to function XML_GetBuffer is required");
2539
  /* Added in 2.4.0. */
2540
0
  case XML_ERROR_AMPLIFICATION_LIMIT_BREACH:
2541
0
    return XML_L(
2542
0
        "limit on input amplification factor (from DTD and entities) breached");
2543
  /* Added in 2.6.4. */
2544
0
  case XML_ERROR_NOT_STARTED:
2545
0
    return XML_L("parser not started");
2546
34
  }
2547
0
  return NULL;
2548
34
}
2549
2550
const XML_LChar *XMLCALL
2551
0
XML_ExpatVersion(void) {
2552
  /* V1 is used to string-ize the version number. However, it would
2553
     string-ize the actual version macro *names* unless we get them
2554
     substituted before being passed to V1. CPP is defined to expand
2555
     a macro, then rescan for more expansions. Thus, we use V2 to expand
2556
     the version macros, then CPP will expand the resulting V1() macro
2557
     with the correct numerals. */
2558
  /* ### I'm assuming cpp is portable in this respect... */
2559
2560
0
#define V1(a, b, c) XML_L(#a) XML_L(".") XML_L(#b) XML_L(".") XML_L(#c)
2561
0
#define V2(a, b, c) XML_L("expat_") V1(a, b, c)
2562
2563
0
  return V2(XML_MAJOR_VERSION, XML_MINOR_VERSION, XML_MICRO_VERSION);
2564
2565
0
#undef V1
2566
0
#undef V2
2567
0
}
2568
2569
XML_Expat_Version XMLCALL
2570
0
XML_ExpatVersionInfo(void) {
2571
0
  XML_Expat_Version version;
2572
2573
0
  version.major = XML_MAJOR_VERSION;
2574
0
  version.minor = XML_MINOR_VERSION;
2575
0
  version.micro = XML_MICRO_VERSION;
2576
2577
0
  return version;
2578
0
}
2579
2580
const XML_Feature *XMLCALL
2581
0
XML_GetFeatureList(void) {
2582
0
  static const XML_Feature features[] = {
2583
0
      {XML_FEATURE_SIZEOF_XML_CHAR, XML_L("sizeof(XML_Char)"),
2584
0
       sizeof(XML_Char)},
2585
0
      {XML_FEATURE_SIZEOF_XML_LCHAR, XML_L("sizeof(XML_LChar)"),
2586
0
       sizeof(XML_LChar)},
2587
#ifdef XML_UNICODE
2588
      {XML_FEATURE_UNICODE, XML_L("XML_UNICODE"), 0},
2589
#endif
2590
#ifdef XML_UNICODE_WCHAR_T
2591
      {XML_FEATURE_UNICODE_WCHAR_T, XML_L("XML_UNICODE_WCHAR_T"), 0},
2592
#endif
2593
0
#ifdef XML_DTD
2594
0
      {XML_FEATURE_DTD, XML_L("XML_DTD"), 0},
2595
0
#endif
2596
0
#if XML_CONTEXT_BYTES > 0
2597
0
      {XML_FEATURE_CONTEXT_BYTES, XML_L("XML_CONTEXT_BYTES"),
2598
0
       XML_CONTEXT_BYTES},
2599
0
#endif
2600
#ifdef XML_MIN_SIZE
2601
      {XML_FEATURE_MIN_SIZE, XML_L("XML_MIN_SIZE"), 0},
2602
#endif
2603
0
#ifdef XML_NS
2604
0
      {XML_FEATURE_NS, XML_L("XML_NS"), 0},
2605
0
#endif
2606
#ifdef XML_LARGE_SIZE
2607
      {XML_FEATURE_LARGE_SIZE, XML_L("XML_LARGE_SIZE"), 0},
2608
#endif
2609
#ifdef XML_ATTR_INFO
2610
      {XML_FEATURE_ATTR_INFO, XML_L("XML_ATTR_INFO"), 0},
2611
#endif
2612
0
#if XML_GE == 1
2613
      /* Added in Expat 2.4.0 for XML_DTD defined and
2614
       * added in Expat 2.6.0 for XML_GE == 1. */
2615
0
      {XML_FEATURE_BILLION_LAUGHS_ATTACK_PROTECTION_MAXIMUM_AMPLIFICATION_DEFAULT,
2616
0
       XML_L("XML_BLAP_MAX_AMP"),
2617
0
       (long int)
2618
0
           EXPAT_BILLION_LAUGHS_ATTACK_PROTECTION_MAXIMUM_AMPLIFICATION_DEFAULT},
2619
0
      {XML_FEATURE_BILLION_LAUGHS_ATTACK_PROTECTION_ACTIVATION_THRESHOLD_DEFAULT,
2620
0
       XML_L("XML_BLAP_ACT_THRES"),
2621
0
       EXPAT_BILLION_LAUGHS_ATTACK_PROTECTION_ACTIVATION_THRESHOLD_DEFAULT},
2622
      /* Added in Expat 2.6.0. */
2623
0
      {XML_FEATURE_GE, XML_L("XML_GE"), 0},
2624
0
#endif
2625
0
      {XML_FEATURE_END, NULL, 0}};
2626
2627
0
  return features;
2628
0
}
2629
2630
#if XML_GE == 1
2631
XML_Bool XMLCALL
2632
XML_SetBillionLaughsAttackProtectionMaximumAmplification(
2633
0
    XML_Parser parser, float maximumAmplificationFactor) {
2634
0
  if ((parser == NULL) || (parser->m_parentParser != NULL)
2635
0
#if !defined(_MSC_VER) || (defined(_MSC_VER) && _MSC_VER >= 1700)
2636
0
      || isnan(maximumAmplificationFactor)
2637
0
#endif
2638
0
      || (maximumAmplificationFactor < 1.0f)) {
2639
0
    return XML_FALSE;
2640
0
  }
2641
0
  parser->m_accounting.maximumAmplificationFactor = maximumAmplificationFactor;
2642
0
  return XML_TRUE;
2643
0
}
2644
2645
XML_Bool XMLCALL
2646
XML_SetBillionLaughsAttackProtectionActivationThreshold(
2647
0
    XML_Parser parser, unsigned long long activationThresholdBytes) {
2648
0
  if ((parser == NULL) || (parser->m_parentParser != NULL)) {
2649
0
    return XML_FALSE;
2650
0
  }
2651
0
  parser->m_accounting.activationThresholdBytes = activationThresholdBytes;
2652
0
  return XML_TRUE;
2653
0
}
2654
#endif /* XML_GE == 1 */
2655
2656
XML_Bool XMLCALL
2657
0
XML_SetReparseDeferralEnabled(XML_Parser parser, XML_Bool enabled) {
2658
0
  if (parser != NULL && (enabled == XML_TRUE || enabled == XML_FALSE)) {
2659
0
    parser->m_reparseDeferralEnabled = enabled;
2660
0
    return XML_TRUE;
2661
0
  }
2662
0
  return XML_FALSE;
2663
0
}
2664
2665
/* Initially tag->rawName always points into the parse buffer;
2666
   for those TAG instances opened while the current parse buffer was
2667
   processed, and not yet closed, we need to store tag->rawName in a more
2668
   permanent location, since the parse buffer is about to be discarded.
2669
*/
2670
static XML_Bool
2671
72
storeRawNames(XML_Parser parser) {
2672
72
  TAG *tag = parser->m_tagStack;
2673
72
  while (tag) {
2674
0
    int bufSize;
2675
0
    int nameLen = sizeof(XML_Char) * (tag->name.strLen + 1);
2676
0
    size_t rawNameLen;
2677
0
    char *rawNameBuf = tag->buf + nameLen;
2678
    /* Stop if already stored.  Since m_tagStack is a stack, we can stop
2679
       at the first entry that has already been copied; everything
2680
       below it in the stack is already been accounted for in a
2681
       previous call to this function.
2682
    */
2683
0
    if (tag->rawName == rawNameBuf)
2684
0
      break;
2685
    /* For reuse purposes we need to ensure that the
2686
       size of tag->buf is a multiple of sizeof(XML_Char).
2687
    */
2688
0
    rawNameLen = ROUND_UP(tag->rawNameLength, sizeof(XML_Char));
2689
    /* Detect and prevent integer overflow. */
2690
0
    if (rawNameLen > (size_t)INT_MAX - nameLen)
2691
0
      return XML_FALSE;
2692
0
    bufSize = nameLen + (int)rawNameLen;
2693
0
    if (bufSize > tag->bufEnd - tag->buf) {
2694
0
      char *temp = (char *)REALLOC(parser, tag->buf, bufSize);
2695
0
      if (temp == NULL)
2696
0
        return XML_FALSE;
2697
      /* if tag->name.str points to tag->buf (only when namespace
2698
         processing is off) then we have to update it
2699
      */
2700
0
      if (tag->name.str == (XML_Char *)tag->buf)
2701
0
        tag->name.str = (XML_Char *)temp;
2702
      /* if tag->name.localPart is set (when namespace processing is on)
2703
         then update it as well, since it will always point into tag->buf
2704
      */
2705
0
      if (tag->name.localPart)
2706
0
        tag->name.localPart
2707
0
            = (XML_Char *)temp + (tag->name.localPart - (XML_Char *)tag->buf);
2708
0
      tag->buf = temp;
2709
0
      tag->bufEnd = temp + bufSize;
2710
0
      rawNameBuf = temp + nameLen;
2711
0
    }
2712
0
    memcpy(rawNameBuf, tag->rawName, tag->rawNameLength);
2713
0
    tag->rawName = rawNameBuf;
2714
0
    tag = tag->parent;
2715
0
  }
2716
72
  return XML_TRUE;
2717
72
}
2718
2719
static enum XML_Error PTRCALL
2720
contentProcessor(XML_Parser parser, const char *start, const char *end,
2721
89
                 const char **endPtr) {
2722
89
  enum XML_Error result = doContent(
2723
89
      parser, 0, parser->m_encoding, start, end, endPtr,
2724
89
      (XML_Bool)! parser->m_parsingStatus.finalBuffer, XML_ACCOUNT_DIRECT);
2725
89
  if (result == XML_ERROR_NONE) {
2726
72
    if (! storeRawNames(parser))
2727
0
      return XML_ERROR_NO_MEMORY;
2728
72
  }
2729
89
  return result;
2730
89
}
2731
2732
static enum XML_Error PTRCALL
2733
externalEntityInitProcessor(XML_Parser parser, const char *start,
2734
0
                            const char *end, const char **endPtr) {
2735
0
  enum XML_Error result = initializeEncoding(parser);
2736
0
  if (result != XML_ERROR_NONE)
2737
0
    return result;
2738
0
  parser->m_processor = externalEntityInitProcessor2;
2739
0
  return externalEntityInitProcessor2(parser, start, end, endPtr);
2740
0
}
2741
2742
static enum XML_Error PTRCALL
2743
externalEntityInitProcessor2(XML_Parser parser, const char *start,
2744
0
                             const char *end, const char **endPtr) {
2745
0
  const char *next = start; /* XmlContentTok doesn't always set the last arg */
2746
0
  int tok = XmlContentTok(parser->m_encoding, start, end, &next);
2747
0
  switch (tok) {
2748
0
  case XML_TOK_BOM:
2749
0
#if XML_GE == 1
2750
0
    if (! accountingDiffTolerated(parser, tok, start, next, __LINE__,
2751
0
                                  XML_ACCOUNT_DIRECT)) {
2752
0
      accountingOnAbort(parser);
2753
0
      return XML_ERROR_AMPLIFICATION_LIMIT_BREACH;
2754
0
    }
2755
0
#endif /* XML_GE == 1 */
2756
2757
    /* If we are at the end of the buffer, this would cause the next stage,
2758
       i.e. externalEntityInitProcessor3, to pass control directly to
2759
       doContent (by detecting XML_TOK_NONE) without processing any xml text
2760
       declaration - causing the error XML_ERROR_MISPLACED_XML_PI in doContent.
2761
    */
2762
0
    if (next == end && ! parser->m_parsingStatus.finalBuffer) {
2763
0
      *endPtr = next;
2764
0
      return XML_ERROR_NONE;
2765
0
    }
2766
0
    start = next;
2767
0
    break;
2768
0
  case XML_TOK_PARTIAL:
2769
0
    if (! parser->m_parsingStatus.finalBuffer) {
2770
0
      *endPtr = start;
2771
0
      return XML_ERROR_NONE;
2772
0
    }
2773
0
    parser->m_eventPtr = start;
2774
0
    return XML_ERROR_UNCLOSED_TOKEN;
2775
0
  case XML_TOK_PARTIAL_CHAR:
2776
0
    if (! parser->m_parsingStatus.finalBuffer) {
2777
0
      *endPtr = start;
2778
0
      return XML_ERROR_NONE;
2779
0
    }
2780
0
    parser->m_eventPtr = start;
2781
0
    return XML_ERROR_PARTIAL_CHAR;
2782
0
  }
2783
0
  parser->m_processor = externalEntityInitProcessor3;
2784
0
  return externalEntityInitProcessor3(parser, start, end, endPtr);
2785
0
}
2786
2787
static enum XML_Error PTRCALL
2788
externalEntityInitProcessor3(XML_Parser parser, const char *start,
2789
0
                             const char *end, const char **endPtr) {
2790
0
  int tok;
2791
0
  const char *next = start; /* XmlContentTok doesn't always set the last arg */
2792
0
  parser->m_eventPtr = start;
2793
0
  tok = XmlContentTok(parser->m_encoding, start, end, &next);
2794
  /* Note: These bytes are accounted later in:
2795
           - processXmlDecl
2796
           - externalEntityContentProcessor
2797
  */
2798
0
  parser->m_eventEndPtr = next;
2799
2800
0
  switch (tok) {
2801
0
  case XML_TOK_XML_DECL: {
2802
0
    enum XML_Error result;
2803
0
    result = processXmlDecl(parser, 1, start, next);
2804
0
    if (result != XML_ERROR_NONE)
2805
0
      return result;
2806
0
    switch (parser->m_parsingStatus.parsing) {
2807
0
    case XML_SUSPENDED:
2808
0
      *endPtr = next;
2809
0
      return XML_ERROR_NONE;
2810
0
    case XML_FINISHED:
2811
0
      return XML_ERROR_ABORTED;
2812
0
    default:
2813
0
      start = next;
2814
0
    }
2815
0
  } break;
2816
0
  case XML_TOK_PARTIAL:
2817
0
    if (! parser->m_parsingStatus.finalBuffer) {
2818
0
      *endPtr = start;
2819
0
      return XML_ERROR_NONE;
2820
0
    }
2821
0
    return XML_ERROR_UNCLOSED_TOKEN;
2822
0
  case XML_TOK_PARTIAL_CHAR:
2823
0
    if (! parser->m_parsingStatus.finalBuffer) {
2824
0
      *endPtr = start;
2825
0
      return XML_ERROR_NONE;
2826
0
    }
2827
0
    return XML_ERROR_PARTIAL_CHAR;
2828
0
  }
2829
0
  parser->m_processor = externalEntityContentProcessor;
2830
0
  parser->m_tagLevel = 1;
2831
0
  return externalEntityContentProcessor(parser, start, end, endPtr);
2832
0
}
2833
2834
static enum XML_Error PTRCALL
2835
externalEntityContentProcessor(XML_Parser parser, const char *start,
2836
0
                               const char *end, const char **endPtr) {
2837
0
  enum XML_Error result
2838
0
      = doContent(parser, 1, parser->m_encoding, start, end, endPtr,
2839
0
                  (XML_Bool)! parser->m_parsingStatus.finalBuffer,
2840
0
                  XML_ACCOUNT_ENTITY_EXPANSION);
2841
0
  if (result == XML_ERROR_NONE) {
2842
0
    if (! storeRawNames(parser))
2843
0
      return XML_ERROR_NO_MEMORY;
2844
0
  }
2845
0
  return result;
2846
0
}
2847
2848
static enum XML_Error
2849
doContent(XML_Parser parser, int startTagLevel, const ENCODING *enc,
2850
          const char *s, const char *end, const char **nextPtr,
2851
89
          XML_Bool haveMore, enum XML_Account account) {
2852
  /* save one level of indirection */
2853
89
  DTD *const dtd = parser->m_dtd;
2854
2855
89
  const char **eventPP;
2856
89
  const char **eventEndPP;
2857
89
  if (enc == parser->m_encoding) {
2858
89
    eventPP = &parser->m_eventPtr;
2859
89
    eventEndPP = &parser->m_eventEndPtr;
2860
89
  } else {
2861
0
    eventPP = &(parser->m_openInternalEntities->internalEventPtr);
2862
0
    eventEndPP = &(parser->m_openInternalEntities->internalEventEndPtr);
2863
0
  }
2864
89
  *eventPP = s;
2865
2866
33.0k
  for (;;) {
2867
33.0k
    const char *next = s; /* XmlContentTok doesn't always set the last arg */
2868
33.0k
    int tok = XmlContentTok(enc, s, end, &next);
2869
33.0k
#if XML_GE == 1
2870
33.0k
    const char *accountAfter
2871
33.0k
        = ((tok == XML_TOK_TRAILING_RSQB) || (tok == XML_TOK_TRAILING_CR))
2872
33.0k
              ? (haveMore ? s /* i.e. 0 bytes */ : end)
2873
33.0k
              : next;
2874
33.0k
    if (! accountingDiffTolerated(parser, tok, s, accountAfter, __LINE__,
2875
33.0k
                                  account)) {
2876
0
      accountingOnAbort(parser);
2877
0
      return XML_ERROR_AMPLIFICATION_LIMIT_BREACH;
2878
0
    }
2879
33.0k
#endif
2880
33.0k
    *eventEndPP = next;
2881
33.0k
    switch (tok) {
2882
0
    case XML_TOK_TRAILING_CR:
2883
0
      if (haveMore) {
2884
0
        *nextPtr = s;
2885
0
        return XML_ERROR_NONE;
2886
0
      }
2887
0
      *eventEndPP = end;
2888
0
      if (parser->m_characterDataHandler) {
2889
0
        XML_Char c = 0xA;
2890
0
        parser->m_characterDataHandler(parser->m_handlerArg, &c, 1);
2891
0
      } else if (parser->m_defaultHandler)
2892
0
        reportDefault(parser, enc, s, end);
2893
      /* We are at the end of the final buffer, should we check for
2894
         XML_SUSPENDED, XML_FINISHED?
2895
      */
2896
0
      if (startTagLevel == 0)
2897
0
        return XML_ERROR_NO_ELEMENTS;
2898
0
      if (parser->m_tagLevel != startTagLevel)
2899
0
        return XML_ERROR_ASYNC_ENTITY;
2900
0
      *nextPtr = end;
2901
0
      return XML_ERROR_NONE;
2902
0
    case XML_TOK_NONE:
2903
0
      if (haveMore) {
2904
0
        *nextPtr = s;
2905
0
        return XML_ERROR_NONE;
2906
0
      }
2907
0
      if (startTagLevel > 0) {
2908
0
        if (parser->m_tagLevel != startTagLevel)
2909
0
          return XML_ERROR_ASYNC_ENTITY;
2910
0
        *nextPtr = s;
2911
0
        return XML_ERROR_NONE;
2912
0
      }
2913
0
      return XML_ERROR_NO_ELEMENTS;
2914
15
    case XML_TOK_INVALID:
2915
15
      *eventPP = next;
2916
15
      return XML_ERROR_INVALID_TOKEN;
2917
0
    case XML_TOK_PARTIAL:
2918
0
      if (haveMore) {
2919
0
        *nextPtr = s;
2920
0
        return XML_ERROR_NONE;
2921
0
      }
2922
0
      return XML_ERROR_UNCLOSED_TOKEN;
2923
0
    case XML_TOK_PARTIAL_CHAR:
2924
0
      if (haveMore) {
2925
0
        *nextPtr = s;
2926
0
        return XML_ERROR_NONE;
2927
0
      }
2928
0
      return XML_ERROR_PARTIAL_CHAR;
2929
0
    case XML_TOK_ENTITY_REF: {
2930
0
      const XML_Char *name;
2931
0
      ENTITY *entity;
2932
0
      XML_Char ch = (XML_Char)XmlPredefinedEntityName(
2933
0
          enc, s + enc->minBytesPerChar, next - enc->minBytesPerChar);
2934
0
      if (ch) {
2935
0
#if XML_GE == 1
2936
        /* NOTE: We are replacing 4-6 characters original input for 1 character
2937
         *       so there is no amplification and hence recording without
2938
         *       protection. */
2939
0
        accountingDiffTolerated(parser, tok, (char *)&ch,
2940
0
                                ((char *)&ch) + sizeof(XML_Char), __LINE__,
2941
0
                                XML_ACCOUNT_ENTITY_EXPANSION);
2942
0
#endif /* XML_GE == 1 */
2943
0
        if (parser->m_characterDataHandler)
2944
0
          parser->m_characterDataHandler(parser->m_handlerArg, &ch, 1);
2945
0
        else if (parser->m_defaultHandler)
2946
0
          reportDefault(parser, enc, s, next);
2947
0
        break;
2948
0
      }
2949
0
      name = poolStoreString(&dtd->pool, enc, s + enc->minBytesPerChar,
2950
0
                             next - enc->minBytesPerChar);
2951
0
      if (! name)
2952
0
        return XML_ERROR_NO_MEMORY;
2953
0
      entity = (ENTITY *)lookup(parser, &dtd->generalEntities, name, 0);
2954
0
      poolDiscard(&dtd->pool);
2955
      /* First, determine if a check for an existing declaration is needed;
2956
         if yes, check that the entity exists, and that it is internal,
2957
         otherwise call the skipped entity or default handler.
2958
      */
2959
0
      if (! dtd->hasParamEntityRefs || dtd->standalone) {
2960
0
        if (! entity)
2961
0
          return XML_ERROR_UNDEFINED_ENTITY;
2962
0
        else if (! entity->is_internal)
2963
0
          return XML_ERROR_ENTITY_DECLARED_IN_PE;
2964
0
      } else if (! entity) {
2965
0
        if (parser->m_skippedEntityHandler)
2966
0
          parser->m_skippedEntityHandler(parser->m_handlerArg, name, 0);
2967
0
        else if (parser->m_defaultHandler)
2968
0
          reportDefault(parser, enc, s, next);
2969
0
        break;
2970
0
      }
2971
0
      if (entity->open)
2972
0
        return XML_ERROR_RECURSIVE_ENTITY_REF;
2973
0
      if (entity->notation)
2974
0
        return XML_ERROR_BINARY_ENTITY_REF;
2975
0
      if (entity->textPtr) {
2976
0
        enum XML_Error result;
2977
0
        if (! parser->m_defaultExpandInternalEntities) {
2978
0
          if (parser->m_skippedEntityHandler)
2979
0
            parser->m_skippedEntityHandler(parser->m_handlerArg, entity->name,
2980
0
                                           0);
2981
0
          else if (parser->m_defaultHandler)
2982
0
            reportDefault(parser, enc, s, next);
2983
0
          break;
2984
0
        }
2985
0
        result = processInternalEntity(parser, entity, XML_FALSE);
2986
0
        if (result != XML_ERROR_NONE)
2987
0
          return result;
2988
0
      } else if (parser->m_externalEntityRefHandler) {
2989
0
        const XML_Char *context;
2990
0
        entity->open = XML_TRUE;
2991
0
        context = getContext(parser);
2992
0
        entity->open = XML_FALSE;
2993
0
        if (! context)
2994
0
          return XML_ERROR_NO_MEMORY;
2995
0
        if (! parser->m_externalEntityRefHandler(
2996
0
                parser->m_externalEntityRefHandlerArg, context, entity->base,
2997
0
                entity->systemId, entity->publicId))
2998
0
          return XML_ERROR_EXTERNAL_ENTITY_HANDLING;
2999
0
        poolDiscard(&parser->m_tempPool);
3000
0
      } else if (parser->m_defaultHandler)
3001
0
        reportDefault(parser, enc, s, next);
3002
0
      break;
3003
0
    }
3004
0
    case XML_TOK_START_TAG_NO_ATTS:
3005
      /* fall through */
3006
110
    case XML_TOK_START_TAG_WITH_ATTS: {
3007
110
      TAG *tag;
3008
110
      enum XML_Error result;
3009
110
      XML_Char *toPtr;
3010
110
      if (parser->m_freeTagList) {
3011
0
        tag = parser->m_freeTagList;
3012
0
        parser->m_freeTagList = parser->m_freeTagList->parent;
3013
110
      } else {
3014
110
        tag = (TAG *)MALLOC(parser, sizeof(TAG));
3015
110
        if (! tag)
3016
0
          return XML_ERROR_NO_MEMORY;
3017
110
        tag->buf = (char *)MALLOC(parser, INIT_TAG_BUF_SIZE);
3018
110
        if (! tag->buf) {
3019
0
          FREE(parser, tag);
3020
0
          return XML_ERROR_NO_MEMORY;
3021
0
        }
3022
110
        tag->bufEnd = tag->buf + INIT_TAG_BUF_SIZE;
3023
110
      }
3024
110
      tag->bindings = NULL;
3025
110
      tag->parent = parser->m_tagStack;
3026
110
      parser->m_tagStack = tag;
3027
110
      tag->name.localPart = NULL;
3028
110
      tag->name.prefix = NULL;
3029
110
      tag->rawName = s + enc->minBytesPerChar;
3030
110
      tag->rawNameLength = XmlNameLength(enc, tag->rawName);
3031
110
      ++parser->m_tagLevel;
3032
110
      {
3033
110
        const char *rawNameEnd = tag->rawName + tag->rawNameLength;
3034
110
        const char *fromPtr = tag->rawName;
3035
110
        toPtr = (XML_Char *)tag->buf;
3036
110
        for (;;) {
3037
110
          int bufSize;
3038
110
          int convLen;
3039
110
          const enum XML_Convert_Result convert_res
3040
110
              = XmlConvert(enc, &fromPtr, rawNameEnd, (ICHAR **)&toPtr,
3041
110
                           (ICHAR *)tag->bufEnd - 1);
3042
110
          convLen = (int)(toPtr - (XML_Char *)tag->buf);
3043
110
          if ((fromPtr >= rawNameEnd)
3044
110
              || (convert_res == XML_CONVERT_INPUT_INCOMPLETE)) {
3045
110
            tag->name.strLen = convLen;
3046
110
            break;
3047
110
          }
3048
0
          bufSize = (int)(tag->bufEnd - tag->buf) << 1;
3049
0
          {
3050
0
            char *temp = (char *)REALLOC(parser, tag->buf, bufSize);
3051
0
            if (temp == NULL)
3052
0
              return XML_ERROR_NO_MEMORY;
3053
0
            tag->buf = temp;
3054
0
            tag->bufEnd = temp + bufSize;
3055
0
            toPtr = (XML_Char *)temp + convLen;
3056
0
          }
3057
0
        }
3058
110
      }
3059
110
      tag->name.str = (XML_Char *)tag->buf;
3060
110
      *toPtr = XML_T('\0');
3061
110
      result
3062
110
          = storeAtts(parser, enc, s, &(tag->name), &(tag->bindings), account);
3063
110
      if (result)
3064
0
        return result;
3065
110
      if (parser->m_startElementHandler)
3066
110
        parser->m_startElementHandler(parser->m_handlerArg, tag->name.str,
3067
110
                                      (const XML_Char **)parser->m_atts);
3068
0
      else if (parser->m_defaultHandler)
3069
0
        reportDefault(parser, enc, s, next);
3070
110
      poolClear(&parser->m_tempPool);
3071
110
      break;
3072
110
    }
3073
0
    case XML_TOK_EMPTY_ELEMENT_NO_ATTS:
3074
      /* fall through */
3075
11.0k
    case XML_TOK_EMPTY_ELEMENT_WITH_ATTS: {
3076
11.0k
      const char *rawName = s + enc->minBytesPerChar;
3077
11.0k
      enum XML_Error result;
3078
11.0k
      BINDING *bindings = NULL;
3079
11.0k
      XML_Bool noElmHandlers = XML_TRUE;
3080
11.0k
      TAG_NAME name;
3081
11.0k
      name.str = poolStoreString(&parser->m_tempPool, enc, rawName,
3082
11.0k
                                 rawName + XmlNameLength(enc, rawName));
3083
11.0k
      if (! name.str)
3084
0
        return XML_ERROR_NO_MEMORY;
3085
11.0k
      poolFinish(&parser->m_tempPool);
3086
11.0k
      result = storeAtts(parser, enc, s, &name, &bindings,
3087
11.0k
                         XML_ACCOUNT_NONE /* token spans whole start tag */);
3088
11.0k
      if (result != XML_ERROR_NONE) {
3089
0
        freeBindings(parser, bindings);
3090
0
        return result;
3091
0
      }
3092
11.0k
      poolFinish(&parser->m_tempPool);
3093
11.0k
      if (parser->m_startElementHandler) {
3094
11.0k
        parser->m_startElementHandler(parser->m_handlerArg, name.str,
3095
11.0k
                                      (const XML_Char **)parser->m_atts);
3096
11.0k
        noElmHandlers = XML_FALSE;
3097
11.0k
      }
3098
11.0k
      if (parser->m_endElementHandler) {
3099
10.9k
        if (parser->m_startElementHandler)
3100
10.9k
          *eventPP = *eventEndPP;
3101
10.9k
        parser->m_endElementHandler(parser->m_handlerArg, name.str);
3102
10.9k
        noElmHandlers = XML_FALSE;
3103
10.9k
      }
3104
11.0k
      if (noElmHandlers && parser->m_defaultHandler)
3105
0
        reportDefault(parser, enc, s, next);
3106
11.0k
      poolClear(&parser->m_tempPool);
3107
11.0k
      freeBindings(parser, bindings);
3108
11.0k
    }
3109
11.0k
      if ((parser->m_tagLevel == 0)
3110
0
          && (parser->m_parsingStatus.parsing != XML_FINISHED)) {
3111
0
        if (parser->m_parsingStatus.parsing == XML_SUSPENDED)
3112
0
          parser->m_processor = epilogProcessor;
3113
0
        else
3114
0
          return epilogProcessor(parser, next, end, nextPtr);
3115
0
      }
3116
11.0k
      break;
3117
11.0k
    case XML_TOK_END_TAG:
3118
79
      if (parser->m_tagLevel == startTagLevel)
3119
0
        return XML_ERROR_ASYNC_ENTITY;
3120
79
      else {
3121
79
        int len;
3122
79
        const char *rawName;
3123
79
        TAG *tag = parser->m_tagStack;
3124
79
        rawName = s + enc->minBytesPerChar * 2;
3125
79
        len = XmlNameLength(enc, rawName);
3126
79
        if (len != tag->rawNameLength
3127
79
            || memcmp(tag->rawName, rawName, len) != 0) {
3128
0
          *eventPP = rawName;
3129
0
          return XML_ERROR_TAG_MISMATCH;
3130
0
        }
3131
79
        parser->m_tagStack = tag->parent;
3132
79
        tag->parent = parser->m_freeTagList;
3133
79
        parser->m_freeTagList = tag;
3134
79
        --parser->m_tagLevel;
3135
79
        if (parser->m_endElementHandler) {
3136
10
          const XML_Char *localPart;
3137
10
          const XML_Char *prefix;
3138
10
          XML_Char *uri;
3139
10
          localPart = tag->name.localPart;
3140
10
          if (parser->m_ns && localPart) {
3141
            /* localPart and prefix may have been overwritten in
3142
               tag->name.str, since this points to the binding->uri
3143
               buffer which gets reused; so we have to add them again
3144
            */
3145
10
            uri = (XML_Char *)tag->name.str + tag->name.uriLen;
3146
            /* don't need to check for space - already done in storeAtts() */
3147
85
            while (*localPart)
3148
75
              *uri++ = *localPart++;
3149
10
            prefix = tag->name.prefix;
3150
10
            if (parser->m_ns_triplets && prefix) {
3151
0
              *uri++ = parser->m_namespaceSeparator;
3152
0
              while (*prefix)
3153
0
                *uri++ = *prefix++;
3154
0
            }
3155
10
            *uri = XML_T('\0');
3156
10
          }
3157
10
          parser->m_endElementHandler(parser->m_handlerArg, tag->name.str);
3158
69
        } else if (parser->m_defaultHandler)
3159
0
          reportDefault(parser, enc, s, next);
3160
84
        while (tag->bindings) {
3161
5
          BINDING *b = tag->bindings;
3162
5
          if (parser->m_endNamespaceDeclHandler)
3163
0
            parser->m_endNamespaceDeclHandler(parser->m_handlerArg,
3164
0
                                              b->prefix->name);
3165
5
          tag->bindings = tag->bindings->nextTagBinding;
3166
5
          b->nextTagBinding = parser->m_freeBindingList;
3167
5
          parser->m_freeBindingList = b;
3168
5
          b->prefix->binding = b->prevPrefixBinding;
3169
5
        }
3170
79
        if ((parser->m_tagLevel == 0)
3171
74
            && (parser->m_parsingStatus.parsing != XML_FINISHED)) {
3172
74
          if (parser->m_parsingStatus.parsing == XML_SUSPENDED)
3173
0
            parser->m_processor = epilogProcessor;
3174
74
          else
3175
74
            return epilogProcessor(parser, next, end, nextPtr);
3176
74
        }
3177
79
      }
3178
5
      break;
3179
5
    case XML_TOK_CHAR_REF: {
3180
0
      int n = XmlCharRefNumber(enc, s);
3181
0
      if (n < 0)
3182
0
        return XML_ERROR_BAD_CHAR_REF;
3183
0
      if (parser->m_characterDataHandler) {
3184
0
        XML_Char buf[XML_ENCODE_MAX];
3185
0
        parser->m_characterDataHandler(parser->m_handlerArg, buf,
3186
0
                                       XmlEncode(n, (ICHAR *)buf));
3187
0
      } else if (parser->m_defaultHandler)
3188
0
        reportDefault(parser, enc, s, next);
3189
0
    } break;
3190
0
    case XML_TOK_XML_DECL:
3191
0
      return XML_ERROR_MISPLACED_XML_PI;
3192
10.8k
    case XML_TOK_DATA_NEWLINE:
3193
10.8k
      if (parser->m_characterDataHandler) {
3194
10.7k
        XML_Char c = 0xA;
3195
10.7k
        parser->m_characterDataHandler(parser->m_handlerArg, &c, 1);
3196
10.7k
      } else if (parser->m_defaultHandler)
3197
0
        reportDefault(parser, enc, s, next);
3198
10.8k
      break;
3199
0
    case XML_TOK_CDATA_SECT_OPEN: {
3200
0
      enum XML_Error result;
3201
0
      if (parser->m_startCdataSectionHandler)
3202
0
        parser->m_startCdataSectionHandler(parser->m_handlerArg);
3203
      /* BEGIN disabled code */
3204
      /* Suppose you doing a transformation on a document that involves
3205
         changing only the character data.  You set up a defaultHandler
3206
         and a characterDataHandler.  The defaultHandler simply copies
3207
         characters through.  The characterDataHandler does the
3208
         transformation and writes the characters out escaping them as
3209
         necessary.  This case will fail to work if we leave out the
3210
         following two lines (because & and < inside CDATA sections will
3211
         be incorrectly escaped).
3212
3213
         However, now we have a start/endCdataSectionHandler, so it seems
3214
         easier to let the user deal with this.
3215
      */
3216
0
      else if ((0) && parser->m_characterDataHandler)
3217
0
        parser->m_characterDataHandler(parser->m_handlerArg, parser->m_dataBuf,
3218
0
                                       0);
3219
      /* END disabled code */
3220
0
      else if (parser->m_defaultHandler)
3221
0
        reportDefault(parser, enc, s, next);
3222
0
      result
3223
0
          = doCdataSection(parser, enc, &next, end, nextPtr, haveMore, account);
3224
0
      if (result != XML_ERROR_NONE)
3225
0
        return result;
3226
0
      else if (! next) {
3227
0
        parser->m_processor = cdataSectionProcessor;
3228
0
        return result;
3229
0
      }
3230
0
    } break;
3231
0
    case XML_TOK_TRAILING_RSQB:
3232
0
      if (haveMore) {
3233
0
        *nextPtr = s;
3234
0
        return XML_ERROR_NONE;
3235
0
      }
3236
0
      if (parser->m_characterDataHandler) {
3237
0
        if (MUST_CONVERT(enc, s)) {
3238
0
          ICHAR *dataPtr = (ICHAR *)parser->m_dataBuf;
3239
0
          XmlConvert(enc, &s, end, &dataPtr, (ICHAR *)parser->m_dataBufEnd);
3240
0
          parser->m_characterDataHandler(
3241
0
              parser->m_handlerArg, parser->m_dataBuf,
3242
0
              (int)(dataPtr - (ICHAR *)parser->m_dataBuf));
3243
0
        } else
3244
0
          parser->m_characterDataHandler(
3245
0
              parser->m_handlerArg, (const XML_Char *)s,
3246
0
              (int)((const XML_Char *)end - (const XML_Char *)s));
3247
0
      } else if (parser->m_defaultHandler)
3248
0
        reportDefault(parser, enc, s, end);
3249
      /* We are at the end of the final buffer, should we check for
3250
         XML_SUSPENDED, XML_FINISHED?
3251
      */
3252
0
      if (startTagLevel == 0) {
3253
0
        *eventPP = end;
3254
0
        return XML_ERROR_NO_ELEMENTS;
3255
0
      }
3256
0
      if (parser->m_tagLevel != startTagLevel) {
3257
0
        *eventPP = end;
3258
0
        return XML_ERROR_ASYNC_ENTITY;
3259
0
      }
3260
0
      *nextPtr = end;
3261
0
      return XML_ERROR_NONE;
3262
10.9k
    case XML_TOK_DATA_CHARS: {
3263
10.9k
      XML_CharacterDataHandler charDataHandler = parser->m_characterDataHandler;
3264
10.9k
      if (charDataHandler) {
3265
10.9k
        if (MUST_CONVERT(enc, s)) {
3266
0
          for (;;) {
3267
0
            ICHAR *dataPtr = (ICHAR *)parser->m_dataBuf;
3268
0
            const enum XML_Convert_Result convert_res = XmlConvert(
3269
0
                enc, &s, next, &dataPtr, (ICHAR *)parser->m_dataBufEnd);
3270
0
            *eventEndPP = s;
3271
0
            charDataHandler(parser->m_handlerArg, parser->m_dataBuf,
3272
0
                            (int)(dataPtr - (ICHAR *)parser->m_dataBuf));
3273
0
            if ((convert_res == XML_CONVERT_COMPLETED)
3274
0
                || (convert_res == XML_CONVERT_INPUT_INCOMPLETE))
3275
0
              break;
3276
0
            *eventPP = s;
3277
0
          }
3278
0
        } else
3279
10.9k
          charDataHandler(parser->m_handlerArg, (const XML_Char *)s,
3280
10.9k
                          (int)((const XML_Char *)next - (const XML_Char *)s));
3281
10.9k
      } else if (parser->m_defaultHandler)
3282
0
        reportDefault(parser, enc, s, next);
3283
10.9k
    } break;
3284
0
    case XML_TOK_PI:
3285
0
      if (! reportProcessingInstruction(parser, enc, s, next))
3286
0
        return XML_ERROR_NO_MEMORY;
3287
0
      break;
3288
0
    case XML_TOK_COMMENT:
3289
0
      if (! reportComment(parser, enc, s, next))
3290
0
        return XML_ERROR_NO_MEMORY;
3291
0
      break;
3292
0
    default:
3293
      /* All of the tokens produced by XmlContentTok() have their own
3294
       * explicit cases, so this default is not strictly necessary.
3295
       * However it is a useful safety net, so we retain the code and
3296
       * simply exclude it from the coverage tests.
3297
       *
3298
       * LCOV_EXCL_START
3299
       */
3300
0
      if (parser->m_defaultHandler)
3301
0
        reportDefault(parser, enc, s, next);
3302
0
      break;
3303
      /* LCOV_EXCL_STOP */
3304
33.0k
    }
3305
32.9k
    *eventPP = s = next;
3306
32.9k
    switch (parser->m_parsingStatus.parsing) {
3307
0
    case XML_SUSPENDED:
3308
0
      *nextPtr = next;
3309
0
      return XML_ERROR_NONE;
3310
0
    case XML_FINISHED:
3311
0
      return XML_ERROR_ABORTED;
3312
32.9k
    default:;
3313
32.9k
    }
3314
32.9k
  }
3315
  /* not reached */
3316
89
}
3317
3318
/* This function does not call free() on the allocated memory, merely
3319
 * moving it to the parser's m_freeBindingList where it can be freed or
3320
 * reused as appropriate.
3321
 */
3322
static void
3323
11.0k
freeBindings(XML_Parser parser, BINDING *bindings) {
3324
11.0k
  while (bindings) {
3325
0
    BINDING *b = bindings;
3326
3327
    /* m_startNamespaceDeclHandler will have been called for this
3328
     * binding in addBindings(), so call the end handler now.
3329
     */
3330
0
    if (parser->m_endNamespaceDeclHandler)
3331
0
      parser->m_endNamespaceDeclHandler(parser->m_handlerArg, b->prefix->name);
3332
3333
0
    bindings = bindings->nextTagBinding;
3334
0
    b->nextTagBinding = parser->m_freeBindingList;
3335
0
    parser->m_freeBindingList = b;
3336
0
    b->prefix->binding = b->prevPrefixBinding;
3337
0
  }
3338
11.0k
}
3339
3340
/* Precondition: all arguments must be non-NULL;
3341
   Purpose:
3342
   - normalize attributes
3343
   - check attributes for well-formedness
3344
   - generate namespace aware attribute names (URI, prefix)
3345
   - build list of attributes for startElementHandler
3346
   - default attributes
3347
   - process namespace declarations (check and report them)
3348
   - generate namespace aware element name (URI, prefix)
3349
*/
3350
static enum XML_Error
3351
storeAtts(XML_Parser parser, const ENCODING *enc, const char *attStr,
3352
          TAG_NAME *tagNamePtr, BINDING **bindingsPtr,
3353
11.1k
          enum XML_Account account) {
3354
11.1k
  DTD *const dtd = parser->m_dtd; /* save one level of indirection */
3355
11.1k
  ELEMENT_TYPE *elementType;
3356
11.1k
  int nDefaultAtts;
3357
11.1k
  const XML_Char **appAtts; /* the attribute list for the application */
3358
11.1k
  int attIndex = 0;
3359
11.1k
  int prefixLen;
3360
11.1k
  int i;
3361
11.1k
  int n;
3362
11.1k
  XML_Char *uri;
3363
11.1k
  int nPrefixes = 0;
3364
11.1k
  BINDING *binding;
3365
11.1k
  const XML_Char *localPart;
3366
3367
  /* lookup the element type name */
3368
11.1k
  elementType
3369
11.1k
      = (ELEMENT_TYPE *)lookup(parser, &dtd->elementTypes, tagNamePtr->str, 0);
3370
11.1k
  if (! elementType) {
3371
211
    const XML_Char *name = poolCopyString(&dtd->pool, tagNamePtr->str);
3372
211
    if (! name)
3373
0
      return XML_ERROR_NO_MEMORY;
3374
211
    elementType = (ELEMENT_TYPE *)lookup(parser, &dtd->elementTypes, name,
3375
211
                                         sizeof(ELEMENT_TYPE));
3376
211
    if (! elementType)
3377
0
      return XML_ERROR_NO_MEMORY;
3378
211
    if (parser->m_ns && ! setElementTypePrefix(parser, elementType))
3379
0
      return XML_ERROR_NO_MEMORY;
3380
211
  }
3381
11.1k
  nDefaultAtts = elementType->nDefaultAtts;
3382
3383
  /* get the attributes from the tokenizer */
3384
11.1k
  n = XmlGetAttributes(enc, attStr, parser->m_attsSize, parser->m_atts);
3385
3386
  /* Detect and prevent integer overflow */
3387
11.1k
  if (n > INT_MAX - nDefaultAtts) {
3388
0
    return XML_ERROR_NO_MEMORY;
3389
0
  }
3390
3391
11.1k
  if (n + nDefaultAtts > parser->m_attsSize) {
3392
0
    int oldAttsSize = parser->m_attsSize;
3393
0
    ATTRIBUTE *temp;
3394
#ifdef XML_ATTR_INFO
3395
    XML_AttrInfo *temp2;
3396
#endif
3397
3398
    /* Detect and prevent integer overflow */
3399
0
    if ((nDefaultAtts > INT_MAX - INIT_ATTS_SIZE)
3400
0
        || (n > INT_MAX - (nDefaultAtts + INIT_ATTS_SIZE))) {
3401
0
      return XML_ERROR_NO_MEMORY;
3402
0
    }
3403
3404
0
    parser->m_attsSize = n + nDefaultAtts + INIT_ATTS_SIZE;
3405
3406
    /* Detect and prevent integer overflow.
3407
     * The preprocessor guard addresses the "always false" warning
3408
     * from -Wtype-limits on platforms where
3409
     * sizeof(unsigned int) < sizeof(size_t), e.g. on x86_64. */
3410
#if UINT_MAX >= SIZE_MAX
3411
    if ((unsigned)parser->m_attsSize > (size_t)(-1) / sizeof(ATTRIBUTE)) {
3412
      parser->m_attsSize = oldAttsSize;
3413
      return XML_ERROR_NO_MEMORY;
3414
    }
3415
#endif
3416
3417
0
    temp = (ATTRIBUTE *)REALLOC(parser, (void *)parser->m_atts,
3418
0
                                parser->m_attsSize * sizeof(ATTRIBUTE));
3419
0
    if (temp == NULL) {
3420
0
      parser->m_attsSize = oldAttsSize;
3421
0
      return XML_ERROR_NO_MEMORY;
3422
0
    }
3423
0
    parser->m_atts = temp;
3424
#ifdef XML_ATTR_INFO
3425
    /* Detect and prevent integer overflow.
3426
     * The preprocessor guard addresses the "always false" warning
3427
     * from -Wtype-limits on platforms where
3428
     * sizeof(unsigned int) < sizeof(size_t), e.g. on x86_64. */
3429
#  if UINT_MAX >= SIZE_MAX
3430
    if ((unsigned)parser->m_attsSize > (size_t)(-1) / sizeof(XML_AttrInfo)) {
3431
      parser->m_attsSize = oldAttsSize;
3432
      return XML_ERROR_NO_MEMORY;
3433
    }
3434
#  endif
3435
3436
    temp2 = (XML_AttrInfo *)REALLOC(parser, (void *)parser->m_attInfo,
3437
                                    parser->m_attsSize * sizeof(XML_AttrInfo));
3438
    if (temp2 == NULL) {
3439
      parser->m_attsSize = oldAttsSize;
3440
      return XML_ERROR_NO_MEMORY;
3441
    }
3442
    parser->m_attInfo = temp2;
3443
#endif
3444
0
    if (n > oldAttsSize)
3445
0
      XmlGetAttributes(enc, attStr, n, parser->m_atts);
3446
0
  }
3447
3448
11.1k
  appAtts = (const XML_Char **)parser->m_atts;
3449
34.7k
  for (i = 0; i < n; i++) {
3450
23.6k
    ATTRIBUTE *currAtt = &parser->m_atts[i];
3451
#ifdef XML_ATTR_INFO
3452
    XML_AttrInfo *currAttInfo = &parser->m_attInfo[i];
3453
#endif
3454
    /* add the name and value to the attribute list */
3455
23.6k
    ATTRIBUTE_ID *attId
3456
23.6k
        = getAttributeId(parser, enc, currAtt->name,
3457
23.6k
                         currAtt->name + XmlNameLength(enc, currAtt->name));
3458
23.6k
    if (! attId)
3459
0
      return XML_ERROR_NO_MEMORY;
3460
#ifdef XML_ATTR_INFO
3461
    currAttInfo->nameStart
3462
        = parser->m_parseEndByteIndex - (parser->m_parseEndPtr - currAtt->name);
3463
    currAttInfo->nameEnd
3464
        = currAttInfo->nameStart + XmlNameLength(enc, currAtt->name);
3465
    currAttInfo->valueStart = parser->m_parseEndByteIndex
3466
                              - (parser->m_parseEndPtr - currAtt->valuePtr);
3467
    currAttInfo->valueEnd = parser->m_parseEndByteIndex
3468
                            - (parser->m_parseEndPtr - currAtt->valueEnd);
3469
#endif
3470
    /* Detect duplicate attributes by their QNames. This does not work when
3471
       namespace processing is turned on and different prefixes for the same
3472
       namespace are used. For this case we have a check further down.
3473
    */
3474
23.6k
    if ((attId->name)[-1]) {
3475
0
      if (enc == parser->m_encoding)
3476
0
        parser->m_eventPtr = parser->m_atts[i].name;
3477
0
      return XML_ERROR_DUPLICATE_ATTRIBUTE;
3478
0
    }
3479
23.6k
    (attId->name)[-1] = 1;
3480
23.6k
    appAtts[attIndex++] = attId->name;
3481
23.6k
    if (! parser->m_atts[i].normalized) {
3482
728
      enum XML_Error result;
3483
728
      XML_Bool isCdata = XML_TRUE;
3484
3485
      /* figure out whether declared as other than CDATA */
3486
728
      if (attId->maybeTokenized) {
3487
0
        int j;
3488
0
        for (j = 0; j < nDefaultAtts; j++) {
3489
0
          if (attId == elementType->defaultAtts[j].id) {
3490
0
            isCdata = elementType->defaultAtts[j].isCdata;
3491
0
            break;
3492
0
          }
3493
0
        }
3494
0
      }
3495
3496
      /* normalize the attribute value */
3497
728
      result = storeAttributeValue(
3498
728
          parser, enc, isCdata, parser->m_atts[i].valuePtr,
3499
728
          parser->m_atts[i].valueEnd, &parser->m_tempPool, account);
3500
728
      if (result)
3501
0
        return result;
3502
728
      appAtts[attIndex] = poolStart(&parser->m_tempPool);
3503
728
      poolFinish(&parser->m_tempPool);
3504
22.9k
    } else {
3505
      /* the value did not need normalizing */
3506
22.9k
      appAtts[attIndex] = poolStoreString(&parser->m_tempPool, enc,
3507
22.9k
                                          parser->m_atts[i].valuePtr,
3508
22.9k
                                          parser->m_atts[i].valueEnd);
3509
22.9k
      if (appAtts[attIndex] == 0)
3510
0
        return XML_ERROR_NO_MEMORY;
3511
22.9k
      poolFinish(&parser->m_tempPool);
3512
22.9k
    }
3513
    /* handle prefixed attribute names */
3514
23.6k
    if (attId->prefix) {
3515
40
      if (attId->xmlns) {
3516
        /* deal with namespace declarations here */
3517
20
        enum XML_Error result = addBinding(parser, attId->prefix, attId,
3518
20
                                           appAtts[attIndex], bindingsPtr);
3519
20
        if (result)
3520
0
          return result;
3521
20
        --attIndex;
3522
20
      } else {
3523
        /* deal with other prefixed names later */
3524
20
        attIndex++;
3525
20
        nPrefixes++;
3526
20
        (attId->name)[-1] = 2;
3527
20
      }
3528
40
    } else
3529
23.6k
      attIndex++;
3530
23.6k
  }
3531
3532
  /* set-up for XML_GetSpecifiedAttributeCount and XML_GetIdAttributeIndex */
3533
11.1k
  parser->m_nSpecifiedAtts = attIndex;
3534
11.1k
  if (elementType->idAtt && (elementType->idAtt->name)[-1]) {
3535
0
    for (i = 0; i < attIndex; i += 2)
3536
0
      if (appAtts[i] == elementType->idAtt->name) {
3537
0
        parser->m_idAttIndex = i;
3538
0
        break;
3539
0
      }
3540
0
  } else
3541
11.1k
    parser->m_idAttIndex = -1;
3542
3543
  /* do attribute defaulting */
3544
11.1k
  for (i = 0; i < nDefaultAtts; i++) {
3545
0
    const DEFAULT_ATTRIBUTE *da = elementType->defaultAtts + i;
3546
0
    if (! (da->id->name)[-1] && da->value) {
3547
0
      if (da->id->prefix) {
3548
0
        if (da->id->xmlns) {
3549
0
          enum XML_Error result = addBinding(parser, da->id->prefix, da->id,
3550
0
                                             da->value, bindingsPtr);
3551
0
          if (result)
3552
0
            return result;
3553
0
        } else {
3554
0
          (da->id->name)[-1] = 2;
3555
0
          nPrefixes++;
3556
0
          appAtts[attIndex++] = da->id->name;
3557
0
          appAtts[attIndex++] = da->value;
3558
0
        }
3559
0
      } else {
3560
0
        (da->id->name)[-1] = 1;
3561
0
        appAtts[attIndex++] = da->id->name;
3562
0
        appAtts[attIndex++] = da->value;
3563
0
      }
3564
0
    }
3565
0
  }
3566
11.1k
  appAtts[attIndex] = 0;
3567
3568
  /* expand prefixed attribute names, check for duplicates,
3569
     and clear flags that say whether attributes were specified */
3570
11.1k
  i = 0;
3571
11.1k
  if (nPrefixes) {
3572
20
    int j; /* hash table index */
3573
20
    unsigned long version = parser->m_nsAttsVersion;
3574
20
    unsigned int nsAttsSize;
3575
20
    unsigned char oldNsAttsPower;
3576
3577
    /* Detect and prevent invalid shift */
3578
20
    if (parser->m_nsAttsPower >= sizeof(unsigned int) * 8 /* bits per byte */) {
3579
0
      return XML_ERROR_NO_MEMORY;
3580
0
    }
3581
3582
20
    nsAttsSize = 1u << parser->m_nsAttsPower;
3583
20
    oldNsAttsPower = parser->m_nsAttsPower;
3584
    /* size of hash table must be at least 2 * (# of prefixed attributes) */
3585
20
    if ((nPrefixes << 1)
3586
20
        >> parser->m_nsAttsPower) { /* true for m_nsAttsPower = 0 */
3587
20
      NS_ATT *temp;
3588
      /* hash table size must also be a power of 2 and >= 8 */
3589
40
      while (nPrefixes >> parser->m_nsAttsPower++)
3590
20
        ;
3591
20
      if (parser->m_nsAttsPower < 3)
3592
20
        parser->m_nsAttsPower = 3;
3593
3594
      /* Detect and prevent invalid shift */
3595
20
      if (parser->m_nsAttsPower >= sizeof(nsAttsSize) * 8 /* bits per byte */) {
3596
        /* Restore actual size of memory in m_nsAtts */
3597
0
        parser->m_nsAttsPower = oldNsAttsPower;
3598
0
        return XML_ERROR_NO_MEMORY;
3599
0
      }
3600
3601
20
      nsAttsSize = 1u << parser->m_nsAttsPower;
3602
3603
      /* Detect and prevent integer overflow.
3604
       * The preprocessor guard addresses the "always false" warning
3605
       * from -Wtype-limits on platforms where
3606
       * sizeof(unsigned int) < sizeof(size_t), e.g. on x86_64. */
3607
#if UINT_MAX >= SIZE_MAX
3608
      if (nsAttsSize > (size_t)(-1) / sizeof(NS_ATT)) {
3609
        /* Restore actual size of memory in m_nsAtts */
3610
        parser->m_nsAttsPower = oldNsAttsPower;
3611
        return XML_ERROR_NO_MEMORY;
3612
      }
3613
#endif
3614
3615
20
      temp = (NS_ATT *)REALLOC(parser, parser->m_nsAtts,
3616
20
                               nsAttsSize * sizeof(NS_ATT));
3617
20
      if (! temp) {
3618
        /* Restore actual size of memory in m_nsAtts */
3619
0
        parser->m_nsAttsPower = oldNsAttsPower;
3620
0
        return XML_ERROR_NO_MEMORY;
3621
0
      }
3622
20
      parser->m_nsAtts = temp;
3623
20
      version = 0; /* force re-initialization of m_nsAtts hash table */
3624
20
    }
3625
    /* using a version flag saves us from initializing m_nsAtts every time */
3626
20
    if (! version) { /* initialize version flags when version wraps around */
3627
20
      version = INIT_ATTS_VERSION;
3628
180
      for (j = nsAttsSize; j != 0;)
3629
160
        parser->m_nsAtts[--j].version = version;
3630
20
    }
3631
20
    parser->m_nsAttsVersion = --version;
3632
3633
    /* expand prefixed names and check for duplicates */
3634
60
    for (; i < attIndex; i += 2) {
3635
60
      const XML_Char *s = appAtts[i];
3636
60
      if (s[-1] == 2) { /* prefixed */
3637
20
        ATTRIBUTE_ID *id;
3638
20
        const BINDING *b;
3639
20
        unsigned long uriHash;
3640
20
        struct siphash sip_state;
3641
20
        struct sipkey sip_key;
3642
3643
20
        copy_salt_to_sipkey(parser, &sip_key);
3644
20
        sip24_init(&sip_state, &sip_key);
3645
3646
20
        ((XML_Char *)s)[-1] = 0; /* clear flag */
3647
20
        id = (ATTRIBUTE_ID *)lookup(parser, &dtd->attributeIds, s, 0);
3648
20
        if (! id || ! id->prefix) {
3649
          /* This code is walking through the appAtts array, dealing
3650
           * with (in this case) a prefixed attribute name.  To be in
3651
           * the array, the attribute must have already been bound, so
3652
           * has to have passed through the hash table lookup once
3653
           * already.  That implies that an entry for it already
3654
           * exists, so the lookup above will return a pointer to
3655
           * already allocated memory.  There is no opportunaity for
3656
           * the allocator to fail, so the condition above cannot be
3657
           * fulfilled.
3658
           *
3659
           * Since it is difficult to be certain that the above
3660
           * analysis is complete, we retain the test and merely
3661
           * remove the code from coverage tests.
3662
           */
3663
0
          return XML_ERROR_NO_MEMORY; /* LCOV_EXCL_LINE */
3664
0
        }
3665
20
        b = id->prefix->binding;
3666
20
        if (! b)
3667
0
          return XML_ERROR_UNBOUND_PREFIX;
3668
3669
760
        for (j = 0; j < b->uriLen; j++) {
3670
740
          const XML_Char c = b->uri[j];
3671
740
          if (! poolAppendChar(&parser->m_tempPool, c))
3672
0
            return XML_ERROR_NO_MEMORY;
3673
740
        }
3674
3675
20
        sip24_update(&sip_state, b->uri, b->uriLen * sizeof(XML_Char));
3676
3677
80
        while (*s++ != XML_T(ASCII_COLON))
3678
60
          ;
3679
3680
20
        sip24_update(&sip_state, s, keylen(s) * sizeof(XML_Char));
3681
3682
100
        do { /* copies null terminator */
3683
100
          if (! poolAppendChar(&parser->m_tempPool, *s))
3684
0
            return XML_ERROR_NO_MEMORY;
3685
100
        } while (*s++);
3686
3687
20
        uriHash = (unsigned long)sip24_final(&sip_state);
3688
3689
20
        { /* Check hash table for duplicate of expanded name (uriName).
3690
             Derived from code in lookup(parser, HASH_TABLE *table, ...).
3691
          */
3692
20
          unsigned char step = 0;
3693
20
          unsigned long mask = nsAttsSize - 1;
3694
20
          j = uriHash & mask; /* index into hash table */
3695
20
          while (parser->m_nsAtts[j].version == version) {
3696
            /* for speed we compare stored hash values first */
3697
0
            if (uriHash == parser->m_nsAtts[j].hash) {
3698
0
              const XML_Char *s1 = poolStart(&parser->m_tempPool);
3699
0
              const XML_Char *s2 = parser->m_nsAtts[j].uriName;
3700
              /* s1 is null terminated, but not s2 */
3701
0
              for (; *s1 == *s2 && *s1 != 0; s1++, s2++)
3702
0
                ;
3703
0
              if (*s1 == 0)
3704
0
                return XML_ERROR_DUPLICATE_ATTRIBUTE;
3705
0
            }
3706
0
            if (! step)
3707
0
              step = PROBE_STEP(uriHash, mask, parser->m_nsAttsPower);
3708
0
            j < step ? (j += nsAttsSize - step) : (j -= step);
3709
0
          }
3710
20
        }
3711
3712
20
        if (parser->m_ns_triplets) { /* append namespace separator and prefix */
3713
0
          parser->m_tempPool.ptr[-1] = parser->m_namespaceSeparator;
3714
0
          s = b->prefix->name;
3715
0
          do {
3716
0
            if (! poolAppendChar(&parser->m_tempPool, *s))
3717
0
              return XML_ERROR_NO_MEMORY;
3718
0
          } while (*s++);
3719
0
        }
3720
3721
        /* store expanded name in attribute list */
3722
20
        s = poolStart(&parser->m_tempPool);
3723
20
        poolFinish(&parser->m_tempPool);
3724
20
        appAtts[i] = s;
3725
3726
        /* fill empty slot with new version, uriName and hash value */
3727
20
        parser->m_nsAtts[j].version = version;
3728
20
        parser->m_nsAtts[j].hash = uriHash;
3729
20
        parser->m_nsAtts[j].uriName = s;
3730
3731
20
        if (! --nPrefixes) {
3732
20
          i += 2;
3733
20
          break;
3734
20
        }
3735
20
      } else                     /* not prefixed */
3736
40
        ((XML_Char *)s)[-1] = 0; /* clear flag */
3737
60
    }
3738
20
  }
3739
  /* clear flags for the remaining attributes */
3740
34.7k
  for (; i < attIndex; i += 2)
3741
23.5k
    ((XML_Char *)(appAtts[i]))[-1] = 0;
3742
11.1k
  for (binding = *bindingsPtr; binding; binding = binding->nextTagBinding)
3743
20
    binding->attId->name[-1] = 0;
3744
3745
11.1k
  if (! parser->m_ns)
3746
162
    return XML_ERROR_NONE;
3747
3748
  /* expand the element type name */
3749
10.9k
  if (elementType->prefix) {
3750
0
    binding = elementType->prefix->binding;
3751
0
    if (! binding)
3752
0
      return XML_ERROR_UNBOUND_PREFIX;
3753
0
    localPart = tagNamePtr->str;
3754
0
    while (*localPart++ != XML_T(ASCII_COLON))
3755
0
      ;
3756
10.9k
  } else if (dtd->defaultPrefix.binding) {
3757
10.9k
    binding = dtd->defaultPrefix.binding;
3758
10.9k
    localPart = tagNamePtr->str;
3759
10.9k
  } else
3760
0
    return XML_ERROR_NONE;
3761
10.9k
  prefixLen = 0;
3762
10.9k
  if (parser->m_ns_triplets && binding->prefix->name) {
3763
0
    for (; binding->prefix->name[prefixLen++];)
3764
0
      ; /* prefixLen includes null terminator */
3765
0
  }
3766
10.9k
  tagNamePtr->localPart = localPart;
3767
10.9k
  tagNamePtr->uriLen = binding->uriLen;
3768
10.9k
  tagNamePtr->prefix = binding->prefix->name;
3769
10.9k
  tagNamePtr->prefixLen = prefixLen;
3770
55.2k
  for (i = 0; localPart[i++];)
3771
44.2k
    ; /* i includes null terminator */
3772
3773
  /* Detect and prevent integer overflow */
3774
10.9k
  if (binding->uriLen > INT_MAX - prefixLen
3775
10.9k
      || i > INT_MAX - (binding->uriLen + prefixLen)) {
3776
0
    return XML_ERROR_NO_MEMORY;
3777
0
  }
3778
3779
10.9k
  n = i + binding->uriLen + prefixLen;
3780
10.9k
  if (n > binding->uriAlloc) {
3781
0
    TAG *p;
3782
3783
    /* Detect and prevent integer overflow */
3784
0
    if (n > INT_MAX - EXPAND_SPARE) {
3785
0
      return XML_ERROR_NO_MEMORY;
3786
0
    }
3787
    /* Detect and prevent integer overflow.
3788
     * The preprocessor guard addresses the "always false" warning
3789
     * from -Wtype-limits on platforms where
3790
     * sizeof(unsigned int) < sizeof(size_t), e.g. on x86_64. */
3791
#if UINT_MAX >= SIZE_MAX
3792
    if ((unsigned)(n + EXPAND_SPARE) > (size_t)(-1) / sizeof(XML_Char)) {
3793
      return XML_ERROR_NO_MEMORY;
3794
    }
3795
#endif
3796
3797
0
    uri = (XML_Char *)MALLOC(parser, (n + EXPAND_SPARE) * sizeof(XML_Char));
3798
0
    if (! uri)
3799
0
      return XML_ERROR_NO_MEMORY;
3800
0
    binding->uriAlloc = n + EXPAND_SPARE;
3801
0
    memcpy(uri, binding->uri, binding->uriLen * sizeof(XML_Char));
3802
0
    for (p = parser->m_tagStack; p; p = p->parent)
3803
0
      if (p->name.str == binding->uri)
3804
0
        p->name.str = uri;
3805
0
    FREE(parser, binding->uri);
3806
0
    binding->uri = uri;
3807
0
  }
3808
  /* if m_namespaceSeparator != '\0' then uri includes it already */
3809
10.9k
  uri = binding->uri + binding->uriLen;
3810
10.9k
  memcpy(uri, localPart, i * sizeof(XML_Char));
3811
  /* we always have a namespace separator between localPart and prefix */
3812
10.9k
  if (prefixLen) {
3813
0
    uri += i - 1;
3814
0
    *uri = parser->m_namespaceSeparator; /* replace null terminator */
3815
0
    memcpy(uri + 1, binding->prefix->name, prefixLen * sizeof(XML_Char));
3816
0
  }
3817
10.9k
  tagNamePtr->str = binding->uri;
3818
10.9k
  return XML_ERROR_NONE;
3819
10.9k
}
3820
3821
static XML_Bool
3822
0
is_rfc3986_uri_char(XML_Char candidate) {
3823
  // For the RFC 3986 ANBF grammar see
3824
  // https://datatracker.ietf.org/doc/html/rfc3986#appendix-A
3825
3826
0
  switch (candidate) {
3827
  // From rule "ALPHA" (uppercase half)
3828
0
  case 'A':
3829
0
  case 'B':
3830
0
  case 'C':
3831
0
  case 'D':
3832
0
  case 'E':
3833
0
  case 'F':
3834
0
  case 'G':
3835
0
  case 'H':
3836
0
  case 'I':
3837
0
  case 'J':
3838
0
  case 'K':
3839
0
  case 'L':
3840
0
  case 'M':
3841
0
  case 'N':
3842
0
  case 'O':
3843
0
  case 'P':
3844
0
  case 'Q':
3845
0
  case 'R':
3846
0
  case 'S':
3847
0
  case 'T':
3848
0
  case 'U':
3849
0
  case 'V':
3850
0
  case 'W':
3851
0
  case 'X':
3852
0
  case 'Y':
3853
0
  case 'Z':
3854
3855
  // From rule "ALPHA" (lowercase half)
3856
0
  case 'a':
3857
0
  case 'b':
3858
0
  case 'c':
3859
0
  case 'd':
3860
0
  case 'e':
3861
0
  case 'f':
3862
0
  case 'g':
3863
0
  case 'h':
3864
0
  case 'i':
3865
0
  case 'j':
3866
0
  case 'k':
3867
0
  case 'l':
3868
0
  case 'm':
3869
0
  case 'n':
3870
0
  case 'o':
3871
0
  case 'p':
3872
0
  case 'q':
3873
0
  case 'r':
3874
0
  case 's':
3875
0
  case 't':
3876
0
  case 'u':
3877
0
  case 'v':
3878
0
  case 'w':
3879
0
  case 'x':
3880
0
  case 'y':
3881
0
  case 'z':
3882
3883
  // From rule "DIGIT"
3884
0
  case '0':
3885
0
  case '1':
3886
0
  case '2':
3887
0
  case '3':
3888
0
  case '4':
3889
0
  case '5':
3890
0
  case '6':
3891
0
  case '7':
3892
0
  case '8':
3893
0
  case '9':
3894
3895
  // From rule "pct-encoded"
3896
0
  case '%':
3897
3898
  // From rule "unreserved"
3899
0
  case '-':
3900
0
  case '.':
3901
0
  case '_':
3902
0
  case '~':
3903
3904
  // From rule "gen-delims"
3905
0
  case ':':
3906
0
  case '/':
3907
0
  case '?':
3908
0
  case '#':
3909
0
  case '[':
3910
0
  case ']':
3911
0
  case '@':
3912
3913
  // From rule "sub-delims"
3914
0
  case '!':
3915
0
  case '$':
3916
0
  case '&':
3917
0
  case '\'':
3918
0
  case '(':
3919
0
  case ')':
3920
0
  case '*':
3921
0
  case '+':
3922
0
  case ',':
3923
0
  case ';':
3924
0
  case '=':
3925
0
    return XML_TRUE;
3926
3927
0
  default:
3928
0
    return XML_FALSE;
3929
0
  }
3930
0
}
3931
3932
/* addBinding() overwrites the value of prefix->binding without checking.
3933
   Therefore one must keep track of the old value outside of addBinding().
3934
*/
3935
static enum XML_Error
3936
addBinding(XML_Parser parser, PREFIX *prefix, const ATTRIBUTE_ID *attId,
3937
40
           const XML_Char *uri, BINDING **bindingsPtr) {
3938
  // "http://www.w3.org/XML/1998/namespace"
3939
40
  static const XML_Char xmlNamespace[]
3940
40
      = {ASCII_h,      ASCII_t,     ASCII_t,     ASCII_p,      ASCII_COLON,
3941
40
         ASCII_SLASH,  ASCII_SLASH, ASCII_w,     ASCII_w,      ASCII_w,
3942
40
         ASCII_PERIOD, ASCII_w,     ASCII_3,     ASCII_PERIOD, ASCII_o,
3943
40
         ASCII_r,      ASCII_g,     ASCII_SLASH, ASCII_X,      ASCII_M,
3944
40
         ASCII_L,      ASCII_SLASH, ASCII_1,     ASCII_9,      ASCII_9,
3945
40
         ASCII_8,      ASCII_SLASH, ASCII_n,     ASCII_a,      ASCII_m,
3946
40
         ASCII_e,      ASCII_s,     ASCII_p,     ASCII_a,      ASCII_c,
3947
40
         ASCII_e,      '\0'};
3948
40
  static const int xmlLen = (int)sizeof(xmlNamespace) / sizeof(XML_Char) - 1;
3949
  // "http://www.w3.org/2000/xmlns/"
3950
40
  static const XML_Char xmlnsNamespace[]
3951
40
      = {ASCII_h,     ASCII_t,      ASCII_t, ASCII_p, ASCII_COLON,  ASCII_SLASH,
3952
40
         ASCII_SLASH, ASCII_w,      ASCII_w, ASCII_w, ASCII_PERIOD, ASCII_w,
3953
40
         ASCII_3,     ASCII_PERIOD, ASCII_o, ASCII_r, ASCII_g,      ASCII_SLASH,
3954
40
         ASCII_2,     ASCII_0,      ASCII_0, ASCII_0, ASCII_SLASH,  ASCII_x,
3955
40
         ASCII_m,     ASCII_l,      ASCII_n, ASCII_s, ASCII_SLASH,  '\0'};
3956
40
  static const int xmlnsLen
3957
40
      = (int)sizeof(xmlnsNamespace) / sizeof(XML_Char) - 1;
3958
3959
40
  XML_Bool mustBeXML = XML_FALSE;
3960
40
  XML_Bool isXML = XML_TRUE;
3961
40
  XML_Bool isXMLNS = XML_TRUE;
3962
3963
40
  BINDING *b;
3964
40
  int len;
3965
3966
  /* empty URI is only valid for default namespace per XML NS 1.0 (not 1.1) */
3967
40
  if (*uri == XML_T('\0') && prefix->name)
3968
0
    return XML_ERROR_UNDECLARING_PREFIX;
3969
3970
40
  if (prefix->name && prefix->name[0] == XML_T(ASCII_x)
3971
20
      && prefix->name[1] == XML_T(ASCII_m)
3972
20
      && prefix->name[2] == XML_T(ASCII_l)) {
3973
    /* Not allowed to bind xmlns */
3974
20
    if (prefix->name[3] == XML_T(ASCII_n) && prefix->name[4] == XML_T(ASCII_s)
3975
0
        && prefix->name[5] == XML_T('\0'))
3976
0
      return XML_ERROR_RESERVED_PREFIX_XMLNS;
3977
3978
20
    if (prefix->name[3] == XML_T('\0'))
3979
20
      mustBeXML = XML_TRUE;
3980
20
  }
3981
3982
1.56k
  for (len = 0; uri[len]; len++) {
3983
1.52k
    if (isXML && (len > xmlLen || uri[len] != xmlNamespace[len]))
3984
20
      isXML = XML_FALSE;
3985
3986
1.52k
    if (! mustBeXML && isXMLNS
3987
160
        && (len > xmlnsLen || uri[len] != xmlnsNamespace[len]))
3988
20
      isXMLNS = XML_FALSE;
3989
3990
    // NOTE: While Expat does not validate namespace URIs against RFC 3986
3991
    //       today (and is not REQUIRED to do so with regard to the XML 1.0
3992
    //       namespaces specification) we have to at least make sure, that
3993
    //       the application on top of Expat (that is likely splitting expanded
3994
    //       element names ("qualified names") of form
3995
    //       "[uri sep] local [sep prefix] '\0'" back into 1, 2 or 3 pieces
3996
    //       in its element handler code) cannot be confused by an attacker
3997
    //       putting additional namespace separator characters into namespace
3998
    //       declarations.  That would be ambiguous and not to be expected.
3999
    //
4000
    //       While the HTML API docs of function XML_ParserCreateNS have been
4001
    //       advising against use of a namespace separator character that can
4002
    //       appear in a URI for >20 years now, some widespread applications
4003
    //       are using URI characters (':' (colon) in particular) for a
4004
    //       namespace separator, in practice.  To keep these applications
4005
    //       functional, we only reject namespaces URIs containing the
4006
    //       application-chosen namespace separator if the chosen separator
4007
    //       is a non-URI character with regard to RFC 3986.
4008
1.52k
    if (parser->m_ns && (uri[len] == parser->m_namespaceSeparator)
4009
0
        && ! is_rfc3986_uri_char(uri[len])) {
4010
0
      return XML_ERROR_SYNTAX;
4011
0
    }
4012
1.52k
  }
4013
40
  isXML = isXML && len == xmlLen;
4014
40
  isXMLNS = isXMLNS && len == xmlnsLen;
4015
4016
40
  if (mustBeXML != isXML)
4017
0
    return mustBeXML ? XML_ERROR_RESERVED_PREFIX_XML
4018
0
                     : XML_ERROR_RESERVED_NAMESPACE_URI;
4019
4020
40
  if (isXMLNS)
4021
0
    return XML_ERROR_RESERVED_NAMESPACE_URI;
4022
4023
40
  if (parser->m_namespaceSeparator)
4024
40
    len++;
4025
40
  if (parser->m_freeBindingList) {
4026
0
    b = parser->m_freeBindingList;
4027
0
    if (len > b->uriAlloc) {
4028
0
      XML_Char *temp;
4029
      /* Detect and prevent integer overflow */
4030
0
      if (len > INT_MAX - EXPAND_SPARE) {
4031
0
        return XML_ERROR_NO_MEMORY;
4032
0
      }
4033
4034
      /* Detect and prevent integer overflow.
4035
       * The preprocessor guard addresses the "always false" warning
4036
       * from -Wtype-limits on platforms where
4037
       * sizeof(unsigned int) < sizeof(size_t), e.g. on x86_64. */
4038
#if UINT_MAX >= SIZE_MAX
4039
      if ((unsigned)(len + EXPAND_SPARE) > (size_t)(-1) / sizeof(XML_Char)) {
4040
        return XML_ERROR_NO_MEMORY;
4041
      }
4042
#endif
4043
4044
0
      temp = (XML_Char *)REALLOC(
4045
0
          parser, b->uri, sizeof(XML_Char) * (len + EXPAND_SPARE));
4046
0
      if (temp == NULL)
4047
0
        return XML_ERROR_NO_MEMORY;
4048
0
      b->uri = temp;
4049
0
      b->uriAlloc = len + EXPAND_SPARE;
4050
0
    }
4051
0
    parser->m_freeBindingList = b->nextTagBinding;
4052
40
  } else {
4053
40
    b = (BINDING *)MALLOC(parser, sizeof(BINDING));
4054
40
    if (! b)
4055
0
      return XML_ERROR_NO_MEMORY;
4056
4057
    /* Detect and prevent integer overflow */
4058
40
    if (len > INT_MAX - EXPAND_SPARE) {
4059
0
      return XML_ERROR_NO_MEMORY;
4060
0
    }
4061
    /* Detect and prevent integer overflow.
4062
     * The preprocessor guard addresses the "always false" warning
4063
     * from -Wtype-limits on platforms where
4064
     * sizeof(unsigned int) < sizeof(size_t), e.g. on x86_64. */
4065
#if UINT_MAX >= SIZE_MAX
4066
    if ((unsigned)(len + EXPAND_SPARE) > (size_t)(-1) / sizeof(XML_Char)) {
4067
      return XML_ERROR_NO_MEMORY;
4068
    }
4069
#endif
4070
4071
40
    b->uri
4072
40
        = (XML_Char *)MALLOC(parser, sizeof(XML_Char) * (len + EXPAND_SPARE));
4073
40
    if (! b->uri) {
4074
0
      FREE(parser, b);
4075
0
      return XML_ERROR_NO_MEMORY;
4076
0
    }
4077
40
    b->uriAlloc = len + EXPAND_SPARE;
4078
40
  }
4079
40
  b->uriLen = len;
4080
40
  memcpy(b->uri, uri, len * sizeof(XML_Char));
4081
40
  if (parser->m_namespaceSeparator)
4082
40
    b->uri[len - 1] = parser->m_namespaceSeparator;
4083
40
  b->prefix = prefix;
4084
40
  b->attId = attId;
4085
40
  b->prevPrefixBinding = prefix->binding;
4086
  /* NULL binding when default namespace undeclared */
4087
40
  if (*uri == XML_T('\0') && prefix == &parser->m_dtd->defaultPrefix)
4088
0
    prefix->binding = NULL;
4089
40
  else
4090
40
    prefix->binding = b;
4091
40
  b->nextTagBinding = *bindingsPtr;
4092
40
  *bindingsPtr = b;
4093
  /* if attId == NULL then we are not starting a namespace scope */
4094
40
  if (attId && parser->m_startNamespaceDeclHandler)
4095
0
    parser->m_startNamespaceDeclHandler(parser->m_handlerArg, prefix->name,
4096
0
                                        prefix->binding ? uri : 0);
4097
40
  return XML_ERROR_NONE;
4098
40
}
4099
4100
/* The idea here is to avoid using stack for each CDATA section when
4101
   the whole file is parsed with one call.
4102
*/
4103
static enum XML_Error PTRCALL
4104
cdataSectionProcessor(XML_Parser parser, const char *start, const char *end,
4105
0
                      const char **endPtr) {
4106
0
  enum XML_Error result = doCdataSection(
4107
0
      parser, parser->m_encoding, &start, end, endPtr,
4108
0
      (XML_Bool)! parser->m_parsingStatus.finalBuffer, XML_ACCOUNT_DIRECT);
4109
0
  if (result != XML_ERROR_NONE)
4110
0
    return result;
4111
0
  if (start) {
4112
0
    if (parser->m_parentParser) { /* we are parsing an external entity */
4113
0
      parser->m_processor = externalEntityContentProcessor;
4114
0
      return externalEntityContentProcessor(parser, start, end, endPtr);
4115
0
    } else {
4116
0
      parser->m_processor = contentProcessor;
4117
0
      return contentProcessor(parser, start, end, endPtr);
4118
0
    }
4119
0
  }
4120
0
  return result;
4121
0
}
4122
4123
/* startPtr gets set to non-null if the section is closed, and to null if
4124
   the section is not yet closed.
4125
*/
4126
static enum XML_Error
4127
doCdataSection(XML_Parser parser, const ENCODING *enc, const char **startPtr,
4128
               const char *end, const char **nextPtr, XML_Bool haveMore,
4129
0
               enum XML_Account account) {
4130
0
  const char *s = *startPtr;
4131
0
  const char **eventPP;
4132
0
  const char **eventEndPP;
4133
0
  if (enc == parser->m_encoding) {
4134
0
    eventPP = &parser->m_eventPtr;
4135
0
    *eventPP = s;
4136
0
    eventEndPP = &parser->m_eventEndPtr;
4137
0
  } else {
4138
0
    eventPP = &(parser->m_openInternalEntities->internalEventPtr);
4139
0
    eventEndPP = &(parser->m_openInternalEntities->internalEventEndPtr);
4140
0
  }
4141
0
  *eventPP = s;
4142
0
  *startPtr = NULL;
4143
4144
0
  for (;;) {
4145
0
    const char *next = s; /* in case of XML_TOK_NONE or XML_TOK_PARTIAL */
4146
0
    int tok = XmlCdataSectionTok(enc, s, end, &next);
4147
0
#if XML_GE == 1
4148
0
    if (! accountingDiffTolerated(parser, tok, s, next, __LINE__, account)) {
4149
0
      accountingOnAbort(parser);
4150
0
      return XML_ERROR_AMPLIFICATION_LIMIT_BREACH;
4151
0
    }
4152
#else
4153
    UNUSED_P(account);
4154
#endif
4155
0
    *eventEndPP = next;
4156
0
    switch (tok) {
4157
0
    case XML_TOK_CDATA_SECT_CLOSE:
4158
0
      if (parser->m_endCdataSectionHandler)
4159
0
        parser->m_endCdataSectionHandler(parser->m_handlerArg);
4160
      /* BEGIN disabled code */
4161
      /* see comment under XML_TOK_CDATA_SECT_OPEN */
4162
0
      else if ((0) && parser->m_characterDataHandler)
4163
0
        parser->m_characterDataHandler(parser->m_handlerArg, parser->m_dataBuf,
4164
0
                                       0);
4165
      /* END disabled code */
4166
0
      else if (parser->m_defaultHandler)
4167
0
        reportDefault(parser, enc, s, next);
4168
0
      *startPtr = next;
4169
0
      *nextPtr = next;
4170
0
      if (parser->m_parsingStatus.parsing == XML_FINISHED)
4171
0
        return XML_ERROR_ABORTED;
4172
0
      else
4173
0
        return XML_ERROR_NONE;
4174
0
    case XML_TOK_DATA_NEWLINE:
4175
0
      if (parser->m_characterDataHandler) {
4176
0
        XML_Char c = 0xA;
4177
0
        parser->m_characterDataHandler(parser->m_handlerArg, &c, 1);
4178
0
      } else if (parser->m_defaultHandler)
4179
0
        reportDefault(parser, enc, s, next);
4180
0
      break;
4181
0
    case XML_TOK_DATA_CHARS: {
4182
0
      XML_CharacterDataHandler charDataHandler = parser->m_characterDataHandler;
4183
0
      if (charDataHandler) {
4184
0
        if (MUST_CONVERT(enc, s)) {
4185
0
          for (;;) {
4186
0
            ICHAR *dataPtr = (ICHAR *)parser->m_dataBuf;
4187
0
            const enum XML_Convert_Result convert_res = XmlConvert(
4188
0
                enc, &s, next, &dataPtr, (ICHAR *)parser->m_dataBufEnd);
4189
0
            *eventEndPP = next;
4190
0
            charDataHandler(parser->m_handlerArg, parser->m_dataBuf,
4191
0
                            (int)(dataPtr - (ICHAR *)parser->m_dataBuf));
4192
0
            if ((convert_res == XML_CONVERT_COMPLETED)
4193
0
                || (convert_res == XML_CONVERT_INPUT_INCOMPLETE))
4194
0
              break;
4195
0
            *eventPP = s;
4196
0
          }
4197
0
        } else
4198
0
          charDataHandler(parser->m_handlerArg, (const XML_Char *)s,
4199
0
                          (int)((const XML_Char *)next - (const XML_Char *)s));
4200
0
      } else if (parser->m_defaultHandler)
4201
0
        reportDefault(parser, enc, s, next);
4202
0
    } break;
4203
0
    case XML_TOK_INVALID:
4204
0
      *eventPP = next;
4205
0
      return XML_ERROR_INVALID_TOKEN;
4206
0
    case XML_TOK_PARTIAL_CHAR:
4207
0
      if (haveMore) {
4208
0
        *nextPtr = s;
4209
0
        return XML_ERROR_NONE;
4210
0
      }
4211
0
      return XML_ERROR_PARTIAL_CHAR;
4212
0
    case XML_TOK_PARTIAL:
4213
0
    case XML_TOK_NONE:
4214
0
      if (haveMore) {
4215
0
        *nextPtr = s;
4216
0
        return XML_ERROR_NONE;
4217
0
      }
4218
0
      return XML_ERROR_UNCLOSED_CDATA_SECTION;
4219
0
    default:
4220
      /* Every token returned by XmlCdataSectionTok() has its own
4221
       * explicit case, so this default case will never be executed.
4222
       * We retain it as a safety net and exclude it from the coverage
4223
       * statistics.
4224
       *
4225
       * LCOV_EXCL_START
4226
       */
4227
0
      *eventPP = next;
4228
0
      return XML_ERROR_UNEXPECTED_STATE;
4229
      /* LCOV_EXCL_STOP */
4230
0
    }
4231
4232
0
    *eventPP = s = next;
4233
0
    switch (parser->m_parsingStatus.parsing) {
4234
0
    case XML_SUSPENDED:
4235
0
      *nextPtr = next;
4236
0
      return XML_ERROR_NONE;
4237
0
    case XML_FINISHED:
4238
0
      return XML_ERROR_ABORTED;
4239
0
    default:;
4240
0
    }
4241
0
  }
4242
  /* not reached */
4243
0
}
4244
4245
#ifdef XML_DTD
4246
4247
/* The idea here is to avoid using stack for each IGNORE section when
4248
   the whole file is parsed with one call.
4249
*/
4250
static enum XML_Error PTRCALL
4251
ignoreSectionProcessor(XML_Parser parser, const char *start, const char *end,
4252
0
                       const char **endPtr) {
4253
0
  enum XML_Error result
4254
0
      = doIgnoreSection(parser, parser->m_encoding, &start, end, endPtr,
4255
0
                        (XML_Bool)! parser->m_parsingStatus.finalBuffer);
4256
0
  if (result != XML_ERROR_NONE)
4257
0
    return result;
4258
0
  if (start) {
4259
0
    parser->m_processor = prologProcessor;
4260
0
    return prologProcessor(parser, start, end, endPtr);
4261
0
  }
4262
0
  return result;
4263
0
}
4264
4265
/* startPtr gets set to non-null is the section is closed, and to null
4266
   if the section is not yet closed.
4267
*/
4268
static enum XML_Error
4269
doIgnoreSection(XML_Parser parser, const ENCODING *enc, const char **startPtr,
4270
0
                const char *end, const char **nextPtr, XML_Bool haveMore) {
4271
0
  const char *next = *startPtr; /* in case of XML_TOK_NONE or XML_TOK_PARTIAL */
4272
0
  int tok;
4273
0
  const char *s = *startPtr;
4274
0
  const char **eventPP;
4275
0
  const char **eventEndPP;
4276
0
  if (enc == parser->m_encoding) {
4277
0
    eventPP = &parser->m_eventPtr;
4278
0
    *eventPP = s;
4279
0
    eventEndPP = &parser->m_eventEndPtr;
4280
0
  } else {
4281
    /* It's not entirely clear, but it seems the following two lines
4282
     * of code cannot be executed.  The only occasions on which 'enc'
4283
     * is not 'encoding' are when this function is called
4284
     * from the internal entity processing, and IGNORE sections are an
4285
     * error in internal entities.
4286
     *
4287
     * Since it really isn't clear that this is true, we keep the code
4288
     * and just remove it from our coverage tests.
4289
     *
4290
     * LCOV_EXCL_START
4291
     */
4292
0
    eventPP = &(parser->m_openInternalEntities->internalEventPtr);
4293
0
    eventEndPP = &(parser->m_openInternalEntities->internalEventEndPtr);
4294
    /* LCOV_EXCL_STOP */
4295
0
  }
4296
0
  *eventPP = s;
4297
0
  *startPtr = NULL;
4298
0
  tok = XmlIgnoreSectionTok(enc, s, end, &next);
4299
0
#  if XML_GE == 1
4300
0
  if (! accountingDiffTolerated(parser, tok, s, next, __LINE__,
4301
0
                                XML_ACCOUNT_DIRECT)) {
4302
0
    accountingOnAbort(parser);
4303
0
    return XML_ERROR_AMPLIFICATION_LIMIT_BREACH;
4304
0
  }
4305
0
#  endif
4306
0
  *eventEndPP = next;
4307
0
  switch (tok) {
4308
0
  case XML_TOK_IGNORE_SECT:
4309
0
    if (parser->m_defaultHandler)
4310
0
      reportDefault(parser, enc, s, next);
4311
0
    *startPtr = next;
4312
0
    *nextPtr = next;
4313
0
    if (parser->m_parsingStatus.parsing == XML_FINISHED)
4314
0
      return XML_ERROR_ABORTED;
4315
0
    else
4316
0
      return XML_ERROR_NONE;
4317
0
  case XML_TOK_INVALID:
4318
0
    *eventPP = next;
4319
0
    return XML_ERROR_INVALID_TOKEN;
4320
0
  case XML_TOK_PARTIAL_CHAR:
4321
0
    if (haveMore) {
4322
0
      *nextPtr = s;
4323
0
      return XML_ERROR_NONE;
4324
0
    }
4325
0
    return XML_ERROR_PARTIAL_CHAR;
4326
0
  case XML_TOK_PARTIAL:
4327
0
  case XML_TOK_NONE:
4328
0
    if (haveMore) {
4329
0
      *nextPtr = s;
4330
0
      return XML_ERROR_NONE;
4331
0
    }
4332
0
    return XML_ERROR_SYNTAX; /* XML_ERROR_UNCLOSED_IGNORE_SECTION */
4333
0
  default:
4334
    /* All of the tokens that XmlIgnoreSectionTok() returns have
4335
     * explicit cases to handle them, so this default case is never
4336
     * executed.  We keep it as a safety net anyway, and remove it
4337
     * from our test coverage statistics.
4338
     *
4339
     * LCOV_EXCL_START
4340
     */
4341
0
    *eventPP = next;
4342
0
    return XML_ERROR_UNEXPECTED_STATE;
4343
    /* LCOV_EXCL_STOP */
4344
0
  }
4345
  /* not reached */
4346
0
}
4347
4348
#endif /* XML_DTD */
4349
4350
static enum XML_Error
4351
89
initializeEncoding(XML_Parser parser) {
4352
89
  const char *s;
4353
#ifdef XML_UNICODE
4354
  char encodingBuf[128];
4355
  /* See comments about `protocolEncodingName` in parserInit() */
4356
  if (! parser->m_protocolEncodingName)
4357
    s = NULL;
4358
  else {
4359
    int i;
4360
    for (i = 0; parser->m_protocolEncodingName[i]; i++) {
4361
      if (i == sizeof(encodingBuf) - 1
4362
          || (parser->m_protocolEncodingName[i] & ~0x7f) != 0) {
4363
        encodingBuf[0] = '\0';
4364
        break;
4365
      }
4366
      encodingBuf[i] = (char)parser->m_protocolEncodingName[i];
4367
    }
4368
    encodingBuf[i] = '\0';
4369
    s = encodingBuf;
4370
  }
4371
#else
4372
89
  s = parser->m_protocolEncodingName;
4373
89
#endif
4374
89
  if ((parser->m_ns ? XmlInitEncodingNS : XmlInitEncoding)(
4375
89
          &parser->m_initEncoding, &parser->m_encoding, s))
4376
89
    return XML_ERROR_NONE;
4377
0
  return handleUnknownEncoding(parser, parser->m_protocolEncodingName);
4378
89
}
4379
4380
static enum XML_Error
4381
processXmlDecl(XML_Parser parser, int isGeneralTextEntity, const char *s,
4382
69
               const char *next) {
4383
69
  const char *encodingName = NULL;
4384
69
  const XML_Char *storedEncName = NULL;
4385
69
  const ENCODING *newEncoding = NULL;
4386
69
  const char *version = NULL;
4387
69
  const char *versionend = NULL;
4388
69
  const XML_Char *storedversion = NULL;
4389
69
  int standalone = -1;
4390
4391
69
#if XML_GE == 1
4392
69
  if (! accountingDiffTolerated(parser, XML_TOK_XML_DECL, s, next, __LINE__,
4393
69
                                XML_ACCOUNT_DIRECT)) {
4394
0
    accountingOnAbort(parser);
4395
0
    return XML_ERROR_AMPLIFICATION_LIMIT_BREACH;
4396
0
  }
4397
69
#endif
4398
4399
69
  if (! (parser->m_ns ? XmlParseXmlDeclNS : XmlParseXmlDecl)(
4400
69
          isGeneralTextEntity, parser->m_encoding, s, next, &parser->m_eventPtr,
4401
69
          &version, &versionend, &encodingName, &newEncoding, &standalone)) {
4402
0
    if (isGeneralTextEntity)
4403
0
      return XML_ERROR_TEXT_DECL;
4404
0
    else
4405
0
      return XML_ERROR_XML_DECL;
4406
0
  }
4407
69
  if (! isGeneralTextEntity && standalone == 1) {
4408
0
    parser->m_dtd->standalone = XML_TRUE;
4409
0
#ifdef XML_DTD
4410
0
    if (parser->m_paramEntityParsing
4411
0
        == XML_PARAM_ENTITY_PARSING_UNLESS_STANDALONE)
4412
0
      parser->m_paramEntityParsing = XML_PARAM_ENTITY_PARSING_NEVER;
4413
0
#endif /* XML_DTD */
4414
0
  }
4415
69
  if (parser->m_xmlDeclHandler) {
4416
0
    if (encodingName != NULL) {
4417
0
      storedEncName = poolStoreString(
4418
0
          &parser->m_temp2Pool, parser->m_encoding, encodingName,
4419
0
          encodingName + XmlNameLength(parser->m_encoding, encodingName));
4420
0
      if (! storedEncName)
4421
0
        return XML_ERROR_NO_MEMORY;
4422
0
      poolFinish(&parser->m_temp2Pool);
4423
0
    }
4424
0
    if (version) {
4425
0
      storedversion
4426
0
          = poolStoreString(&parser->m_temp2Pool, parser->m_encoding, version,
4427
0
                            versionend - parser->m_encoding->minBytesPerChar);
4428
0
      if (! storedversion)
4429
0
        return XML_ERROR_NO_MEMORY;
4430
0
    }
4431
0
    parser->m_xmlDeclHandler(parser->m_handlerArg, storedversion, storedEncName,
4432
0
                             standalone);
4433
69
  } else if (parser->m_defaultHandler)
4434
0
    reportDefault(parser, parser->m_encoding, s, next);
4435
69
  if (parser->m_protocolEncodingName == NULL) {
4436
69
    if (newEncoding) {
4437
      /* Check that the specified encoding does not conflict with what
4438
       * the parser has already deduced.  Do we have the same number
4439
       * of bytes in the smallest representation of a character?  If
4440
       * this is UTF-16, is it the same endianness?
4441
       */
4442
69
      if (newEncoding->minBytesPerChar != parser->m_encoding->minBytesPerChar
4443
69
          || (newEncoding->minBytesPerChar == 2
4444
0
              && newEncoding != parser->m_encoding)) {
4445
0
        parser->m_eventPtr = encodingName;
4446
0
        return XML_ERROR_INCORRECT_ENCODING;
4447
0
      }
4448
69
      parser->m_encoding = newEncoding;
4449
69
    } else if (encodingName) {
4450
0
      enum XML_Error result;
4451
0
      if (! storedEncName) {
4452
0
        storedEncName = poolStoreString(
4453
0
            &parser->m_temp2Pool, parser->m_encoding, encodingName,
4454
0
            encodingName + XmlNameLength(parser->m_encoding, encodingName));
4455
0
        if (! storedEncName)
4456
0
          return XML_ERROR_NO_MEMORY;
4457
0
      }
4458
0
      result = handleUnknownEncoding(parser, storedEncName);
4459
0
      poolClear(&parser->m_temp2Pool);
4460
0
      if (result == XML_ERROR_UNKNOWN_ENCODING)
4461
0
        parser->m_eventPtr = encodingName;
4462
0
      return result;
4463
0
    }
4464
69
  }
4465
4466
69
  if (storedEncName || storedversion)
4467
0
    poolClear(&parser->m_temp2Pool);
4468
4469
69
  return XML_ERROR_NONE;
4470
69
}
4471
4472
static enum XML_Error
4473
0
handleUnknownEncoding(XML_Parser parser, const XML_Char *encodingName) {
4474
0
  if (parser->m_unknownEncodingHandler) {
4475
0
    XML_Encoding info;
4476
0
    int i;
4477
0
    for (i = 0; i < 256; i++)
4478
0
      info.map[i] = -1;
4479
0
    info.convert = NULL;
4480
0
    info.data = NULL;
4481
0
    info.release = NULL;
4482
0
    if (parser->m_unknownEncodingHandler(parser->m_unknownEncodingHandlerData,
4483
0
                                         encodingName, &info)) {
4484
0
      ENCODING *enc;
4485
0
      parser->m_unknownEncodingMem = MALLOC(parser, XmlSizeOfUnknownEncoding());
4486
0
      if (! parser->m_unknownEncodingMem) {
4487
0
        if (info.release)
4488
0
          info.release(info.data);
4489
0
        return XML_ERROR_NO_MEMORY;
4490
0
      }
4491
0
      enc = (parser->m_ns ? XmlInitUnknownEncodingNS : XmlInitUnknownEncoding)(
4492
0
          parser->m_unknownEncodingMem, info.map, info.convert, info.data);
4493
0
      if (enc) {
4494
0
        parser->m_unknownEncodingData = info.data;
4495
0
        parser->m_unknownEncodingRelease = info.release;
4496
0
        parser->m_encoding = enc;
4497
0
        return XML_ERROR_NONE;
4498
0
      }
4499
0
    }
4500
0
    if (info.release != NULL)
4501
0
      info.release(info.data);
4502
0
  }
4503
0
  return XML_ERROR_UNKNOWN_ENCODING;
4504
0
}
4505
4506
static enum XML_Error PTRCALL
4507
prologInitProcessor(XML_Parser parser, const char *s, const char *end,
4508
89
                    const char **nextPtr) {
4509
89
  enum XML_Error result = initializeEncoding(parser);
4510
89
  if (result != XML_ERROR_NONE)
4511
0
    return result;
4512
89
  parser->m_processor = prologProcessor;
4513
89
  return prologProcessor(parser, s, end, nextPtr);
4514
89
}
4515
4516
#ifdef XML_DTD
4517
4518
static enum XML_Error PTRCALL
4519
externalParEntInitProcessor(XML_Parser parser, const char *s, const char *end,
4520
0
                            const char **nextPtr) {
4521
0
  enum XML_Error result = initializeEncoding(parser);
4522
0
  if (result != XML_ERROR_NONE)
4523
0
    return result;
4524
4525
  /* we know now that XML_Parse(Buffer) has been called,
4526
     so we consider the external parameter entity read */
4527
0
  parser->m_dtd->paramEntityRead = XML_TRUE;
4528
4529
0
  if (parser->m_prologState.inEntityValue) {
4530
0
    parser->m_processor = entityValueInitProcessor;
4531
0
    return entityValueInitProcessor(parser, s, end, nextPtr);
4532
0
  } else {
4533
0
    parser->m_processor = externalParEntProcessor;
4534
0
    return externalParEntProcessor(parser, s, end, nextPtr);
4535
0
  }
4536
0
}
4537
4538
static enum XML_Error PTRCALL
4539
entityValueInitProcessor(XML_Parser parser, const char *s, const char *end,
4540
0
                         const char **nextPtr) {
4541
0
  int tok;
4542
0
  const char *start = s;
4543
0
  const char *next = start;
4544
0
  parser->m_eventPtr = start;
4545
4546
0
  for (;;) {
4547
0
    tok = XmlPrologTok(parser->m_encoding, start, end, &next);
4548
    /* Note: Except for XML_TOK_BOM below, these bytes are accounted later in:
4549
             - storeEntityValue
4550
             - processXmlDecl
4551
    */
4552
0
    parser->m_eventEndPtr = next;
4553
0
    if (tok <= 0) {
4554
0
      if (! parser->m_parsingStatus.finalBuffer && tok != XML_TOK_INVALID) {
4555
0
        *nextPtr = s;
4556
0
        return XML_ERROR_NONE;
4557
0
      }
4558
0
      switch (tok) {
4559
0
      case XML_TOK_INVALID:
4560
0
        return XML_ERROR_INVALID_TOKEN;
4561
0
      case XML_TOK_PARTIAL:
4562
0
        return XML_ERROR_UNCLOSED_TOKEN;
4563
0
      case XML_TOK_PARTIAL_CHAR:
4564
0
        return XML_ERROR_PARTIAL_CHAR;
4565
0
      case XML_TOK_NONE: /* start == end */
4566
0
      default:
4567
0
        break;
4568
0
      }
4569
      /* found end of entity value - can store it now */
4570
0
      return storeEntityValue(parser, parser->m_encoding, s, end,
4571
0
                              XML_ACCOUNT_DIRECT);
4572
0
    } else if (tok == XML_TOK_XML_DECL) {
4573
0
      enum XML_Error result;
4574
0
      result = processXmlDecl(parser, 0, start, next);
4575
0
      if (result != XML_ERROR_NONE)
4576
0
        return result;
4577
      /* At this point, m_parsingStatus.parsing cannot be XML_SUSPENDED.  For
4578
       * that to happen, a parameter entity parsing handler must have attempted
4579
       * to suspend the parser, which fails and raises an error.  The parser can
4580
       * be aborted, but can't be suspended.
4581
       */
4582
0
      if (parser->m_parsingStatus.parsing == XML_FINISHED)
4583
0
        return XML_ERROR_ABORTED;
4584
0
      *nextPtr = next;
4585
      /* stop scanning for text declaration - we found one */
4586
0
      parser->m_processor = entityValueProcessor;
4587
0
      return entityValueProcessor(parser, next, end, nextPtr);
4588
0
    }
4589
    /* XmlPrologTok has now set the encoding based on the BOM it found, and we
4590
       must move s and nextPtr forward to consume the BOM.
4591
4592
       If we didn't, and got XML_TOK_NONE from the next XmlPrologTok call, we
4593
       would leave the BOM in the buffer and return. On the next call to this
4594
       function, our XmlPrologTok call would return XML_TOK_INVALID, since it
4595
       is not valid to have multiple BOMs.
4596
    */
4597
0
    else if (tok == XML_TOK_BOM) {
4598
0
#  if XML_GE == 1
4599
0
      if (! accountingDiffTolerated(parser, tok, s, next, __LINE__,
4600
0
                                    XML_ACCOUNT_DIRECT)) {
4601
0
        accountingOnAbort(parser);
4602
0
        return XML_ERROR_AMPLIFICATION_LIMIT_BREACH;
4603
0
      }
4604
0
#  endif
4605
4606
0
      *nextPtr = next;
4607
0
      s = next;
4608
0
    }
4609
    /* If we get this token, we have the start of what might be a
4610
       normal tag, but not a declaration (i.e. it doesn't begin with
4611
       "<!").  In a DTD context, that isn't legal.
4612
    */
4613
0
    else if (tok == XML_TOK_INSTANCE_START) {
4614
0
      *nextPtr = next;
4615
0
      return XML_ERROR_SYNTAX;
4616
0
    }
4617
0
    start = next;
4618
0
    parser->m_eventPtr = start;
4619
0
  }
4620
0
}
4621
4622
static enum XML_Error PTRCALL
4623
externalParEntProcessor(XML_Parser parser, const char *s, const char *end,
4624
0
                        const char **nextPtr) {
4625
0
  const char *next = s;
4626
0
  int tok;
4627
4628
0
  tok = XmlPrologTok(parser->m_encoding, s, end, &next);
4629
0
  if (tok <= 0) {
4630
0
    if (! parser->m_parsingStatus.finalBuffer && tok != XML_TOK_INVALID) {
4631
0
      *nextPtr = s;
4632
0
      return XML_ERROR_NONE;
4633
0
    }
4634
0
    switch (tok) {
4635
0
    case XML_TOK_INVALID:
4636
0
      return XML_ERROR_INVALID_TOKEN;
4637
0
    case XML_TOK_PARTIAL:
4638
0
      return XML_ERROR_UNCLOSED_TOKEN;
4639
0
    case XML_TOK_PARTIAL_CHAR:
4640
0
      return XML_ERROR_PARTIAL_CHAR;
4641
0
    case XML_TOK_NONE: /* start == end */
4642
0
    default:
4643
0
      break;
4644
0
    }
4645
0
  }
4646
  /* This would cause the next stage, i.e. doProlog to be passed XML_TOK_BOM.
4647
     However, when parsing an external subset, doProlog will not accept a BOM
4648
     as valid, and report a syntax error, so we have to skip the BOM, and
4649
     account for the BOM bytes.
4650
  */
4651
0
  else if (tok == XML_TOK_BOM) {
4652
0
    if (! accountingDiffTolerated(parser, tok, s, next, __LINE__,
4653
0
                                  XML_ACCOUNT_DIRECT)) {
4654
0
      accountingOnAbort(parser);
4655
0
      return XML_ERROR_AMPLIFICATION_LIMIT_BREACH;
4656
0
    }
4657
4658
0
    s = next;
4659
0
    tok = XmlPrologTok(parser->m_encoding, s, end, &next);
4660
0
  }
4661
4662
0
  parser->m_processor = prologProcessor;
4663
0
  return doProlog(parser, parser->m_encoding, s, end, tok, next, nextPtr,
4664
0
                  (XML_Bool)! parser->m_parsingStatus.finalBuffer, XML_TRUE,
4665
0
                  XML_ACCOUNT_DIRECT);
4666
0
}
4667
4668
static enum XML_Error PTRCALL
4669
entityValueProcessor(XML_Parser parser, const char *s, const char *end,
4670
0
                     const char **nextPtr) {
4671
0
  const char *start = s;
4672
0
  const char *next = s;
4673
0
  const ENCODING *enc = parser->m_encoding;
4674
0
  int tok;
4675
4676
0
  for (;;) {
4677
0
    tok = XmlPrologTok(enc, start, end, &next);
4678
    /* Note: These bytes are accounted later in:
4679
             - storeEntityValue
4680
    */
4681
0
    if (tok <= 0) {
4682
0
      if (! parser->m_parsingStatus.finalBuffer && tok != XML_TOK_INVALID) {
4683
0
        *nextPtr = s;
4684
0
        return XML_ERROR_NONE;
4685
0
      }
4686
0
      switch (tok) {
4687
0
      case XML_TOK_INVALID:
4688
0
        return XML_ERROR_INVALID_TOKEN;
4689
0
      case XML_TOK_PARTIAL:
4690
0
        return XML_ERROR_UNCLOSED_TOKEN;
4691
0
      case XML_TOK_PARTIAL_CHAR:
4692
0
        return XML_ERROR_PARTIAL_CHAR;
4693
0
      case XML_TOK_NONE: /* start == end */
4694
0
      default:
4695
0
        break;
4696
0
      }
4697
      /* found end of entity value - can store it now */
4698
0
      return storeEntityValue(parser, enc, s, end, XML_ACCOUNT_DIRECT);
4699
0
    }
4700
0
    start = next;
4701
0
  }
4702
0
}
4703
4704
#endif /* XML_DTD */
4705
4706
static enum XML_Error PTRCALL
4707
prologProcessor(XML_Parser parser, const char *s, const char *end,
4708
89
                const char **nextPtr) {
4709
89
  const char *next = s;
4710
89
  int tok = XmlPrologTok(parser->m_encoding, s, end, &next);
4711
89
  return doProlog(parser, parser->m_encoding, s, end, tok, next, nextPtr,
4712
89
                  (XML_Bool)! parser->m_parsingStatus.finalBuffer, XML_TRUE,
4713
89
                  XML_ACCOUNT_DIRECT);
4714
89
}
4715
4716
static enum XML_Error
4717
doProlog(XML_Parser parser, const ENCODING *enc, const char *s, const char *end,
4718
         int tok, const char *next, const char **nextPtr, XML_Bool haveMore,
4719
89
         XML_Bool allowClosingDoctype, enum XML_Account account) {
4720
89
#ifdef XML_DTD
4721
89
  static const XML_Char externalSubsetName[] = {ASCII_HASH, '\0'};
4722
89
#endif /* XML_DTD */
4723
89
  static const XML_Char atypeCDATA[]
4724
89
      = {ASCII_C, ASCII_D, ASCII_A, ASCII_T, ASCII_A, '\0'};
4725
89
  static const XML_Char atypeID[] = {ASCII_I, ASCII_D, '\0'};
4726
89
  static const XML_Char atypeIDREF[]
4727
89
      = {ASCII_I, ASCII_D, ASCII_R, ASCII_E, ASCII_F, '\0'};
4728
89
  static const XML_Char atypeIDREFS[]
4729
89
      = {ASCII_I, ASCII_D, ASCII_R, ASCII_E, ASCII_F, ASCII_S, '\0'};
4730
89
  static const XML_Char atypeENTITY[]
4731
89
      = {ASCII_E, ASCII_N, ASCII_T, ASCII_I, ASCII_T, ASCII_Y, '\0'};
4732
89
  static const XML_Char atypeENTITIES[]
4733
89
      = {ASCII_E, ASCII_N, ASCII_T, ASCII_I, ASCII_T,
4734
89
         ASCII_I, ASCII_E, ASCII_S, '\0'};
4735
89
  static const XML_Char atypeNMTOKEN[]
4736
89
      = {ASCII_N, ASCII_M, ASCII_T, ASCII_O, ASCII_K, ASCII_E, ASCII_N, '\0'};
4737
89
  static const XML_Char atypeNMTOKENS[]
4738
89
      = {ASCII_N, ASCII_M, ASCII_T, ASCII_O, ASCII_K,
4739
89
         ASCII_E, ASCII_N, ASCII_S, '\0'};
4740
89
  static const XML_Char notationPrefix[]
4741
89
      = {ASCII_N, ASCII_O, ASCII_T, ASCII_A,      ASCII_T,
4742
89
         ASCII_I, ASCII_O, ASCII_N, ASCII_LPAREN, '\0'};
4743
89
  static const XML_Char enumValueSep[] = {ASCII_PIPE, '\0'};
4744
89
  static const XML_Char enumValueStart[] = {ASCII_LPAREN, '\0'};
4745
4746
#ifndef XML_DTD
4747
  UNUSED_P(account);
4748
#endif
4749
4750
  /* save one level of indirection */
4751
89
  DTD *const dtd = parser->m_dtd;
4752
4753
89
  const char **eventPP;
4754
89
  const char **eventEndPP;
4755
89
  enum XML_Content_Quant quant;
4756
4757
89
  if (enc == parser->m_encoding) {
4758
89
    eventPP = &parser->m_eventPtr;
4759
89
    eventEndPP = &parser->m_eventEndPtr;
4760
89
  } else {
4761
0
    eventPP = &(parser->m_openInternalEntities->internalEventPtr);
4762
0
    eventEndPP = &(parser->m_openInternalEntities->internalEventEndPtr);
4763
0
  }
4764
4765
296
  for (;;) {
4766
296
    int role;
4767
296
    XML_Bool handleDefault = XML_TRUE;
4768
296
    *eventPP = s;
4769
296
    *eventEndPP = next;
4770
296
    if (tok <= 0) {
4771
0
      if (haveMore && tok != XML_TOK_INVALID) {
4772
0
        *nextPtr = s;
4773
0
        return XML_ERROR_NONE;
4774
0
      }
4775
0
      switch (tok) {
4776
0
      case XML_TOK_INVALID:
4777
0
        *eventPP = next;
4778
0
        return XML_ERROR_INVALID_TOKEN;
4779
0
      case XML_TOK_PARTIAL:
4780
0
        return XML_ERROR_UNCLOSED_TOKEN;
4781
0
      case XML_TOK_PARTIAL_CHAR:
4782
0
        return XML_ERROR_PARTIAL_CHAR;
4783
0
      case -XML_TOK_PROLOG_S:
4784
0
        tok = -tok;
4785
0
        break;
4786
0
      case XML_TOK_NONE:
4787
0
#ifdef XML_DTD
4788
        /* for internal PE NOT referenced between declarations */
4789
0
        if (enc != parser->m_encoding
4790
0
            && ! parser->m_openInternalEntities->betweenDecl) {
4791
0
          *nextPtr = s;
4792
0
          return XML_ERROR_NONE;
4793
0
        }
4794
        /* WFC: PE Between Declarations - must check that PE contains
4795
           complete markup, not only for external PEs, but also for
4796
           internal PEs if the reference occurs between declarations.
4797
        */
4798
0
        if (parser->m_isParamEntity || enc != parser->m_encoding) {
4799
0
          if (XmlTokenRole(&parser->m_prologState, XML_TOK_NONE, end, end, enc)
4800
0
              == XML_ROLE_ERROR)
4801
0
            return XML_ERROR_INCOMPLETE_PE;
4802
0
          *nextPtr = s;
4803
0
          return XML_ERROR_NONE;
4804
0
        }
4805
0
#endif /* XML_DTD */
4806
0
        return XML_ERROR_NO_ELEMENTS;
4807
0
      default:
4808
0
        tok = -tok;
4809
0
        next = end;
4810
0
        break;
4811
0
      }
4812
0
    }
4813
296
    role = XmlTokenRole(&parser->m_prologState, tok, s, next, enc);
4814
296
#if XML_GE == 1
4815
296
    switch (role) {
4816
89
    case XML_ROLE_INSTANCE_START: // bytes accounted in contentProcessor
4817
158
    case XML_ROLE_XML_DECL:       // bytes accounted in processXmlDecl
4818
158
#  ifdef XML_DTD
4819
158
    case XML_ROLE_TEXT_DECL: // bytes accounted in processXmlDecl
4820
158
#  endif
4821
158
      break;
4822
138
    default:
4823
138
      if (! accountingDiffTolerated(parser, tok, s, next, __LINE__, account)) {
4824
0
        accountingOnAbort(parser);
4825
0
        return XML_ERROR_AMPLIFICATION_LIMIT_BREACH;
4826
0
      }
4827
296
    }
4828
296
#endif
4829
296
    switch (role) {
4830
69
    case XML_ROLE_XML_DECL: {
4831
69
      enum XML_Error result = processXmlDecl(parser, 0, s, next);
4832
69
      if (result != XML_ERROR_NONE)
4833
0
        return result;
4834
69
      enc = parser->m_encoding;
4835
69
      handleDefault = XML_FALSE;
4836
69
    } break;
4837
0
    case XML_ROLE_DOCTYPE_NAME:
4838
0
      if (parser->m_startDoctypeDeclHandler) {
4839
0
        parser->m_doctypeName
4840
0
            = poolStoreString(&parser->m_tempPool, enc, s, next);
4841
0
        if (! parser->m_doctypeName)
4842
0
          return XML_ERROR_NO_MEMORY;
4843
0
        poolFinish(&parser->m_tempPool);
4844
0
        parser->m_doctypePubid = NULL;
4845
0
        handleDefault = XML_FALSE;
4846
0
      }
4847
0
      parser->m_doctypeSysid = NULL; /* always initialize to NULL */
4848
0
      break;
4849
0
    case XML_ROLE_DOCTYPE_INTERNAL_SUBSET:
4850
0
      if (parser->m_startDoctypeDeclHandler) {
4851
0
        parser->m_startDoctypeDeclHandler(
4852
0
            parser->m_handlerArg, parser->m_doctypeName, parser->m_doctypeSysid,
4853
0
            parser->m_doctypePubid, 1);
4854
0
        parser->m_doctypeName = NULL;
4855
0
        poolClear(&parser->m_tempPool);
4856
0
        handleDefault = XML_FALSE;
4857
0
      }
4858
0
      break;
4859
0
#ifdef XML_DTD
4860
0
    case XML_ROLE_TEXT_DECL: {
4861
0
      enum XML_Error result = processXmlDecl(parser, 1, s, next);
4862
0
      if (result != XML_ERROR_NONE)
4863
0
        return result;
4864
0
      enc = parser->m_encoding;
4865
0
      handleDefault = XML_FALSE;
4866
0
    } break;
4867
0
#endif /* XML_DTD */
4868
0
    case XML_ROLE_DOCTYPE_PUBLIC_ID:
4869
0
#ifdef XML_DTD
4870
0
      parser->m_useForeignDTD = XML_FALSE;
4871
0
      parser->m_declEntity = (ENTITY *)lookup(
4872
0
          parser, &dtd->paramEntities, externalSubsetName, sizeof(ENTITY));
4873
0
      if (! parser->m_declEntity)
4874
0
        return XML_ERROR_NO_MEMORY;
4875
0
#endif /* XML_DTD */
4876
0
      dtd->hasParamEntityRefs = XML_TRUE;
4877
0
      if (parser->m_startDoctypeDeclHandler) {
4878
0
        XML_Char *pubId;
4879
0
        if (! XmlIsPublicId(enc, s, next, eventPP))
4880
0
          return XML_ERROR_PUBLICID;
4881
0
        pubId = poolStoreString(&parser->m_tempPool, enc,
4882
0
                                s + enc->minBytesPerChar,
4883
0
                                next - enc->minBytesPerChar);
4884
0
        if (! pubId)
4885
0
          return XML_ERROR_NO_MEMORY;
4886
0
        normalizePublicId(pubId);
4887
0
        poolFinish(&parser->m_tempPool);
4888
0
        parser->m_doctypePubid = pubId;
4889
0
        handleDefault = XML_FALSE;
4890
0
        goto alreadyChecked;
4891
0
      }
4892
      /* fall through */
4893
0
    case XML_ROLE_ENTITY_PUBLIC_ID:
4894
0
      if (! XmlIsPublicId(enc, s, next, eventPP))
4895
0
        return XML_ERROR_PUBLICID;
4896
0
    alreadyChecked:
4897
0
      if (dtd->keepProcessing && parser->m_declEntity) {
4898
0
        XML_Char *tem
4899
0
            = poolStoreString(&dtd->pool, enc, s + enc->minBytesPerChar,
4900
0
                              next - enc->minBytesPerChar);
4901
0
        if (! tem)
4902
0
          return XML_ERROR_NO_MEMORY;
4903
0
        normalizePublicId(tem);
4904
0
        parser->m_declEntity->publicId = tem;
4905
0
        poolFinish(&dtd->pool);
4906
        /* Don't suppress the default handler if we fell through from
4907
         * the XML_ROLE_DOCTYPE_PUBLIC_ID case.
4908
         */
4909
0
        if (parser->m_entityDeclHandler && role == XML_ROLE_ENTITY_PUBLIC_ID)
4910
0
          handleDefault = XML_FALSE;
4911
0
      }
4912
0
      break;
4913
0
    case XML_ROLE_DOCTYPE_CLOSE:
4914
0
      if (allowClosingDoctype != XML_TRUE) {
4915
        /* Must not close doctype from within expanded parameter entities */
4916
0
        return XML_ERROR_INVALID_TOKEN;
4917
0
      }
4918
4919
0
      if (parser->m_doctypeName) {
4920
0
        parser->m_startDoctypeDeclHandler(
4921
0
            parser->m_handlerArg, parser->m_doctypeName, parser->m_doctypeSysid,
4922
0
            parser->m_doctypePubid, 0);
4923
0
        poolClear(&parser->m_tempPool);
4924
0
        handleDefault = XML_FALSE;
4925
0
      }
4926
      /* parser->m_doctypeSysid will be non-NULL in the case of a previous
4927
         XML_ROLE_DOCTYPE_SYSTEM_ID, even if parser->m_startDoctypeDeclHandler
4928
         was not set, indicating an external subset
4929
      */
4930
0
#ifdef XML_DTD
4931
0
      if (parser->m_doctypeSysid || parser->m_useForeignDTD) {
4932
0
        XML_Bool hadParamEntityRefs = dtd->hasParamEntityRefs;
4933
0
        dtd->hasParamEntityRefs = XML_TRUE;
4934
0
        if (parser->m_paramEntityParsing
4935
0
            && parser->m_externalEntityRefHandler) {
4936
0
          ENTITY *entity = (ENTITY *)lookup(parser, &dtd->paramEntities,
4937
0
                                            externalSubsetName, sizeof(ENTITY));
4938
0
          if (! entity) {
4939
            /* The external subset name "#" will have already been
4940
             * inserted into the hash table at the start of the
4941
             * external entity parsing, so no allocation will happen
4942
             * and lookup() cannot fail.
4943
             */
4944
0
            return XML_ERROR_NO_MEMORY; /* LCOV_EXCL_LINE */
4945
0
          }
4946
0
          if (parser->m_useForeignDTD)
4947
0
            entity->base = parser->m_curBase;
4948
0
          dtd->paramEntityRead = XML_FALSE;
4949
0
          if (! parser->m_externalEntityRefHandler(
4950
0
                  parser->m_externalEntityRefHandlerArg, 0, entity->base,
4951
0
                  entity->systemId, entity->publicId))
4952
0
            return XML_ERROR_EXTERNAL_ENTITY_HANDLING;
4953
0
          if (dtd->paramEntityRead) {
4954
0
            if (! dtd->standalone && parser->m_notStandaloneHandler
4955
0
                && ! parser->m_notStandaloneHandler(parser->m_handlerArg))
4956
0
              return XML_ERROR_NOT_STANDALONE;
4957
0
          }
4958
          /* if we didn't read the foreign DTD then this means that there
4959
             is no external subset and we must reset dtd->hasParamEntityRefs
4960
          */
4961
0
          else if (! parser->m_doctypeSysid)
4962
0
            dtd->hasParamEntityRefs = hadParamEntityRefs;
4963
          /* end of DTD - no need to update dtd->keepProcessing */
4964
0
        }
4965
0
        parser->m_useForeignDTD = XML_FALSE;
4966
0
      }
4967
0
#endif /* XML_DTD */
4968
0
      if (parser->m_endDoctypeDeclHandler) {
4969
0
        parser->m_endDoctypeDeclHandler(parser->m_handlerArg);
4970
0
        handleDefault = XML_FALSE;
4971
0
      }
4972
0
      break;
4973
89
    case XML_ROLE_INSTANCE_START:
4974
89
#ifdef XML_DTD
4975
      /* if there is no DOCTYPE declaration then now is the
4976
         last chance to read the foreign DTD
4977
      */
4978
89
      if (parser->m_useForeignDTD) {
4979
0
        XML_Bool hadParamEntityRefs = dtd->hasParamEntityRefs;
4980
0
        dtd->hasParamEntityRefs = XML_TRUE;
4981
0
        if (parser->m_paramEntityParsing
4982
0
            && parser->m_externalEntityRefHandler) {
4983
0
          ENTITY *entity = (ENTITY *)lookup(parser, &dtd->paramEntities,
4984
0
                                            externalSubsetName, sizeof(ENTITY));
4985
0
          if (! entity)
4986
0
            return XML_ERROR_NO_MEMORY;
4987
0
          entity->base = parser->m_curBase;
4988
0
          dtd->paramEntityRead = XML_FALSE;
4989
0
          if (! parser->m_externalEntityRefHandler(
4990
0
                  parser->m_externalEntityRefHandlerArg, 0, entity->base,
4991
0
                  entity->systemId, entity->publicId))
4992
0
            return XML_ERROR_EXTERNAL_ENTITY_HANDLING;
4993
0
          if (dtd->paramEntityRead) {
4994
0
            if (! dtd->standalone && parser->m_notStandaloneHandler
4995
0
                && ! parser->m_notStandaloneHandler(parser->m_handlerArg))
4996
0
              return XML_ERROR_NOT_STANDALONE;
4997
0
          }
4998
          /* if we didn't read the foreign DTD then this means that there
4999
             is no external subset and we must reset dtd->hasParamEntityRefs
5000
          */
5001
0
          else
5002
0
            dtd->hasParamEntityRefs = hadParamEntityRefs;
5003
          /* end of DTD - no need to update dtd->keepProcessing */
5004
0
        }
5005
0
      }
5006
89
#endif /* XML_DTD */
5007
89
      parser->m_processor = contentProcessor;
5008
89
      return contentProcessor(parser, s, end, nextPtr);
5009
0
    case XML_ROLE_ATTLIST_ELEMENT_NAME:
5010
0
      parser->m_declElementType = getElementType(parser, enc, s, next);
5011
0
      if (! parser->m_declElementType)
5012
0
        return XML_ERROR_NO_MEMORY;
5013
0
      goto checkAttListDeclHandler;
5014
0
    case XML_ROLE_ATTRIBUTE_NAME:
5015
0
      parser->m_declAttributeId = getAttributeId(parser, enc, s, next);
5016
0
      if (! parser->m_declAttributeId)
5017
0
        return XML_ERROR_NO_MEMORY;
5018
0
      parser->m_declAttributeIsCdata = XML_FALSE;
5019
0
      parser->m_declAttributeType = NULL;
5020
0
      parser->m_declAttributeIsId = XML_FALSE;
5021
0
      goto checkAttListDeclHandler;
5022
0
    case XML_ROLE_ATTRIBUTE_TYPE_CDATA:
5023
0
      parser->m_declAttributeIsCdata = XML_TRUE;
5024
0
      parser->m_declAttributeType = atypeCDATA;
5025
0
      goto checkAttListDeclHandler;
5026
0
    case XML_ROLE_ATTRIBUTE_TYPE_ID:
5027
0
      parser->m_declAttributeIsId = XML_TRUE;
5028
0
      parser->m_declAttributeType = atypeID;
5029
0
      goto checkAttListDeclHandler;
5030
0
    case XML_ROLE_ATTRIBUTE_TYPE_IDREF:
5031
0
      parser->m_declAttributeType = atypeIDREF;
5032
0
      goto checkAttListDeclHandler;
5033
0
    case XML_ROLE_ATTRIBUTE_TYPE_IDREFS:
5034
0
      parser->m_declAttributeType = atypeIDREFS;
5035
0
      goto checkAttListDeclHandler;
5036
0
    case XML_ROLE_ATTRIBUTE_TYPE_ENTITY:
5037
0
      parser->m_declAttributeType = atypeENTITY;
5038
0
      goto checkAttListDeclHandler;
5039
0
    case XML_ROLE_ATTRIBUTE_TYPE_ENTITIES:
5040
0
      parser->m_declAttributeType = atypeENTITIES;
5041
0
      goto checkAttListDeclHandler;
5042
0
    case XML_ROLE_ATTRIBUTE_TYPE_NMTOKEN:
5043
0
      parser->m_declAttributeType = atypeNMTOKEN;
5044
0
      goto checkAttListDeclHandler;
5045
0
    case XML_ROLE_ATTRIBUTE_TYPE_NMTOKENS:
5046
0
      parser->m_declAttributeType = atypeNMTOKENS;
5047
0
    checkAttListDeclHandler:
5048
0
      if (dtd->keepProcessing && parser->m_attlistDeclHandler)
5049
0
        handleDefault = XML_FALSE;
5050
0
      break;
5051
0
    case XML_ROLE_ATTRIBUTE_ENUM_VALUE:
5052
0
    case XML_ROLE_ATTRIBUTE_NOTATION_VALUE:
5053
0
      if (dtd->keepProcessing && parser->m_attlistDeclHandler) {
5054
0
        const XML_Char *prefix;
5055
0
        if (parser->m_declAttributeType) {
5056
0
          prefix = enumValueSep;
5057
0
        } else {
5058
0
          prefix = (role == XML_ROLE_ATTRIBUTE_NOTATION_VALUE ? notationPrefix
5059
0
                                                              : enumValueStart);
5060
0
        }
5061
0
        if (! poolAppendString(&parser->m_tempPool, prefix))
5062
0
          return XML_ERROR_NO_MEMORY;
5063
0
        if (! poolAppend(&parser->m_tempPool, enc, s, next))
5064
0
          return XML_ERROR_NO_MEMORY;
5065
0
        parser->m_declAttributeType = parser->m_tempPool.start;
5066
0
        handleDefault = XML_FALSE;
5067
0
      }
5068
0
      break;
5069
0
    case XML_ROLE_IMPLIED_ATTRIBUTE_VALUE:
5070
0
    case XML_ROLE_REQUIRED_ATTRIBUTE_VALUE:
5071
0
      if (dtd->keepProcessing) {
5072
0
        if (! defineAttribute(parser->m_declElementType,
5073
0
                              parser->m_declAttributeId,
5074
0
                              parser->m_declAttributeIsCdata,
5075
0
                              parser->m_declAttributeIsId, 0, parser))
5076
0
          return XML_ERROR_NO_MEMORY;
5077
0
        if (parser->m_attlistDeclHandler && parser->m_declAttributeType) {
5078
0
          if (*parser->m_declAttributeType == XML_T(ASCII_LPAREN)
5079
0
              || (*parser->m_declAttributeType == XML_T(ASCII_N)
5080
0
                  && parser->m_declAttributeType[1] == XML_T(ASCII_O))) {
5081
            /* Enumerated or Notation type */
5082
0
            if (! poolAppendChar(&parser->m_tempPool, XML_T(ASCII_RPAREN))
5083
0
                || ! poolAppendChar(&parser->m_tempPool, XML_T('\0')))
5084
0
              return XML_ERROR_NO_MEMORY;
5085
0
            parser->m_declAttributeType = parser->m_tempPool.start;
5086
0
            poolFinish(&parser->m_tempPool);
5087
0
          }
5088
0
          *eventEndPP = s;
5089
0
          parser->m_attlistDeclHandler(
5090
0
              parser->m_handlerArg, parser->m_declElementType->name,
5091
0
              parser->m_declAttributeId->name, parser->m_declAttributeType, 0,
5092
0
              role == XML_ROLE_REQUIRED_ATTRIBUTE_VALUE);
5093
0
          handleDefault = XML_FALSE;
5094
0
        }
5095
0
      }
5096
0
      poolClear(&parser->m_tempPool);
5097
0
      break;
5098
0
    case XML_ROLE_DEFAULT_ATTRIBUTE_VALUE:
5099
0
    case XML_ROLE_FIXED_ATTRIBUTE_VALUE:
5100
0
      if (dtd->keepProcessing) {
5101
0
        const XML_Char *attVal;
5102
0
        enum XML_Error result = storeAttributeValue(
5103
0
            parser, enc, parser->m_declAttributeIsCdata,
5104
0
            s + enc->minBytesPerChar, next - enc->minBytesPerChar, &dtd->pool,
5105
0
            XML_ACCOUNT_NONE);
5106
0
        if (result)
5107
0
          return result;
5108
0
        attVal = poolStart(&dtd->pool);
5109
0
        poolFinish(&dtd->pool);
5110
        /* ID attributes aren't allowed to have a default */
5111
0
        if (! defineAttribute(
5112
0
                parser->m_declElementType, parser->m_declAttributeId,
5113
0
                parser->m_declAttributeIsCdata, XML_FALSE, attVal, parser))
5114
0
          return XML_ERROR_NO_MEMORY;
5115
0
        if (parser->m_attlistDeclHandler && parser->m_declAttributeType) {
5116
0
          if (*parser->m_declAttributeType == XML_T(ASCII_LPAREN)
5117
0
              || (*parser->m_declAttributeType == XML_T(ASCII_N)
5118
0
                  && parser->m_declAttributeType[1] == XML_T(ASCII_O))) {
5119
            /* Enumerated or Notation type */
5120
0
            if (! poolAppendChar(&parser->m_tempPool, XML_T(ASCII_RPAREN))
5121
0
                || ! poolAppendChar(&parser->m_tempPool, XML_T('\0')))
5122
0
              return XML_ERROR_NO_MEMORY;
5123
0
            parser->m_declAttributeType = parser->m_tempPool.start;
5124
0
            poolFinish(&parser->m_tempPool);
5125
0
          }
5126
0
          *eventEndPP = s;
5127
0
          parser->m_attlistDeclHandler(
5128
0
              parser->m_handlerArg, parser->m_declElementType->name,
5129
0
              parser->m_declAttributeId->name, parser->m_declAttributeType,
5130
0
              attVal, role == XML_ROLE_FIXED_ATTRIBUTE_VALUE);
5131
0
          poolClear(&parser->m_tempPool);
5132
0
          handleDefault = XML_FALSE;
5133
0
        }
5134
0
      }
5135
0
      break;
5136
0
    case XML_ROLE_ENTITY_VALUE:
5137
0
      if (dtd->keepProcessing) {
5138
0
#if XML_GE == 1
5139
        // This will store the given replacement text in
5140
        // parser->m_declEntity->textPtr.
5141
0
        enum XML_Error result
5142
0
            = storeEntityValue(parser, enc, s + enc->minBytesPerChar,
5143
0
                               next - enc->minBytesPerChar, XML_ACCOUNT_NONE);
5144
0
        if (parser->m_declEntity) {
5145
0
          parser->m_declEntity->textPtr = poolStart(&dtd->entityValuePool);
5146
0
          parser->m_declEntity->textLen
5147
0
              = (int)(poolLength(&dtd->entityValuePool));
5148
0
          poolFinish(&dtd->entityValuePool);
5149
0
          if (parser->m_entityDeclHandler) {
5150
0
            *eventEndPP = s;
5151
0
            parser->m_entityDeclHandler(
5152
0
                parser->m_handlerArg, parser->m_declEntity->name,
5153
0
                parser->m_declEntity->is_param, parser->m_declEntity->textPtr,
5154
0
                parser->m_declEntity->textLen, parser->m_curBase, 0, 0, 0);
5155
0
            handleDefault = XML_FALSE;
5156
0
          }
5157
0
        } else
5158
0
          poolDiscard(&dtd->entityValuePool);
5159
0
        if (result != XML_ERROR_NONE)
5160
0
          return result;
5161
#else
5162
        // This will store "&amp;entity123;" in parser->m_declEntity->textPtr
5163
        // to end up as "&entity123;" in the handler.
5164
        if (parser->m_declEntity != NULL) {
5165
          const enum XML_Error result
5166
              = storeSelfEntityValue(parser, parser->m_declEntity);
5167
          if (result != XML_ERROR_NONE)
5168
            return result;
5169
5170
          if (parser->m_entityDeclHandler) {
5171
            *eventEndPP = s;
5172
            parser->m_entityDeclHandler(
5173
                parser->m_handlerArg, parser->m_declEntity->name,
5174
                parser->m_declEntity->is_param, parser->m_declEntity->textPtr,
5175
                parser->m_declEntity->textLen, parser->m_curBase, 0, 0, 0);
5176
            handleDefault = XML_FALSE;
5177
          }
5178
        }
5179
#endif
5180
0
      }
5181
0
      break;
5182
0
    case XML_ROLE_DOCTYPE_SYSTEM_ID:
5183
0
#ifdef XML_DTD
5184
0
      parser->m_useForeignDTD = XML_FALSE;
5185
0
#endif /* XML_DTD */
5186
0
      dtd->hasParamEntityRefs = XML_TRUE;
5187
0
      if (parser->m_startDoctypeDeclHandler) {
5188
0
        parser->m_doctypeSysid = poolStoreString(&parser->m_tempPool, enc,
5189
0
                                                 s + enc->minBytesPerChar,
5190
0
                                                 next - enc->minBytesPerChar);
5191
0
        if (parser->m_doctypeSysid == NULL)
5192
0
          return XML_ERROR_NO_MEMORY;
5193
0
        poolFinish(&parser->m_tempPool);
5194
0
        handleDefault = XML_FALSE;
5195
0
      }
5196
0
#ifdef XML_DTD
5197
0
      else
5198
        /* use externalSubsetName to make parser->m_doctypeSysid non-NULL
5199
           for the case where no parser->m_startDoctypeDeclHandler is set */
5200
0
        parser->m_doctypeSysid = externalSubsetName;
5201
0
#endif /* XML_DTD */
5202
0
      if (! dtd->standalone
5203
0
#ifdef XML_DTD
5204
0
          && ! parser->m_paramEntityParsing
5205
0
#endif /* XML_DTD */
5206
0
          && parser->m_notStandaloneHandler
5207
0
          && ! parser->m_notStandaloneHandler(parser->m_handlerArg))
5208
0
        return XML_ERROR_NOT_STANDALONE;
5209
#ifndef XML_DTD
5210
      break;
5211
#else  /* XML_DTD */
5212
0
      if (! parser->m_declEntity) {
5213
0
        parser->m_declEntity = (ENTITY *)lookup(
5214
0
            parser, &dtd->paramEntities, externalSubsetName, sizeof(ENTITY));
5215
0
        if (! parser->m_declEntity)
5216
0
          return XML_ERROR_NO_MEMORY;
5217
0
        parser->m_declEntity->publicId = NULL;
5218
0
      }
5219
0
#endif /* XML_DTD */
5220
      /* fall through */
5221
0
    case XML_ROLE_ENTITY_SYSTEM_ID:
5222
0
      if (dtd->keepProcessing && parser->m_declEntity) {
5223
0
        parser->m_declEntity->systemId
5224
0
            = poolStoreString(&dtd->pool, enc, s + enc->minBytesPerChar,
5225
0
                              next - enc->minBytesPerChar);
5226
0
        if (! parser->m_declEntity->systemId)
5227
0
          return XML_ERROR_NO_MEMORY;
5228
0
        parser->m_declEntity->base = parser->m_curBase;
5229
0
        poolFinish(&dtd->pool);
5230
        /* Don't suppress the default handler if we fell through from
5231
         * the XML_ROLE_DOCTYPE_SYSTEM_ID case.
5232
         */
5233
0
        if (parser->m_entityDeclHandler && role == XML_ROLE_ENTITY_SYSTEM_ID)
5234
0
          handleDefault = XML_FALSE;
5235
0
      }
5236
0
      break;
5237
0
    case XML_ROLE_ENTITY_COMPLETE:
5238
#if XML_GE == 0
5239
      // This will store "&amp;entity123;" in entity->textPtr
5240
      // to end up as "&entity123;" in the handler.
5241
      if (parser->m_declEntity != NULL) {
5242
        const enum XML_Error result
5243
            = storeSelfEntityValue(parser, parser->m_declEntity);
5244
        if (result != XML_ERROR_NONE)
5245
          return result;
5246
      }
5247
#endif
5248
0
      if (dtd->keepProcessing && parser->m_declEntity
5249
0
          && parser->m_entityDeclHandler) {
5250
0
        *eventEndPP = s;
5251
0
        parser->m_entityDeclHandler(
5252
0
            parser->m_handlerArg, parser->m_declEntity->name,
5253
0
            parser->m_declEntity->is_param, 0, 0, parser->m_declEntity->base,
5254
0
            parser->m_declEntity->systemId, parser->m_declEntity->publicId, 0);
5255
0
        handleDefault = XML_FALSE;
5256
0
      }
5257
0
      break;
5258
0
    case XML_ROLE_ENTITY_NOTATION_NAME:
5259
0
      if (dtd->keepProcessing && parser->m_declEntity) {
5260
0
        parser->m_declEntity->notation
5261
0
            = poolStoreString(&dtd->pool, enc, s, next);
5262
0
        if (! parser->m_declEntity->notation)
5263
0
          return XML_ERROR_NO_MEMORY;
5264
0
        poolFinish(&dtd->pool);
5265
0
        if (parser->m_unparsedEntityDeclHandler) {
5266
0
          *eventEndPP = s;
5267
0
          parser->m_unparsedEntityDeclHandler(
5268
0
              parser->m_handlerArg, parser->m_declEntity->name,
5269
0
              parser->m_declEntity->base, parser->m_declEntity->systemId,
5270
0
              parser->m_declEntity->publicId, parser->m_declEntity->notation);
5271
0
          handleDefault = XML_FALSE;
5272
0
        } else if (parser->m_entityDeclHandler) {
5273
0
          *eventEndPP = s;
5274
0
          parser->m_entityDeclHandler(
5275
0
              parser->m_handlerArg, parser->m_declEntity->name, 0, 0, 0,
5276
0
              parser->m_declEntity->base, parser->m_declEntity->systemId,
5277
0
              parser->m_declEntity->publicId, parser->m_declEntity->notation);
5278
0
          handleDefault = XML_FALSE;
5279
0
        }
5280
0
      }
5281
0
      break;
5282
0
    case XML_ROLE_GENERAL_ENTITY_NAME: {
5283
0
      if (XmlPredefinedEntityName(enc, s, next)) {
5284
0
        parser->m_declEntity = NULL;
5285
0
        break;
5286
0
      }
5287
0
      if (dtd->keepProcessing) {
5288
0
        const XML_Char *name = poolStoreString(&dtd->pool, enc, s, next);
5289
0
        if (! name)
5290
0
          return XML_ERROR_NO_MEMORY;
5291
0
        parser->m_declEntity = (ENTITY *)lookup(parser, &dtd->generalEntities,
5292
0
                                                name, sizeof(ENTITY));
5293
0
        if (! parser->m_declEntity)
5294
0
          return XML_ERROR_NO_MEMORY;
5295
0
        if (parser->m_declEntity->name != name) {
5296
0
          poolDiscard(&dtd->pool);
5297
0
          parser->m_declEntity = NULL;
5298
0
        } else {
5299
0
          poolFinish(&dtd->pool);
5300
0
          parser->m_declEntity->publicId = NULL;
5301
0
          parser->m_declEntity->is_param = XML_FALSE;
5302
          /* if we have a parent parser or are reading an internal parameter
5303
             entity, then the entity declaration is not considered "internal"
5304
          */
5305
0
          parser->m_declEntity->is_internal
5306
0
              = ! (parser->m_parentParser || parser->m_openInternalEntities);
5307
0
          if (parser->m_entityDeclHandler)
5308
0
            handleDefault = XML_FALSE;
5309
0
        }
5310
0
      } else {
5311
0
        poolDiscard(&dtd->pool);
5312
0
        parser->m_declEntity = NULL;
5313
0
      }
5314
0
    } break;
5315
0
    case XML_ROLE_PARAM_ENTITY_NAME:
5316
0
#ifdef XML_DTD
5317
0
      if (dtd->keepProcessing) {
5318
0
        const XML_Char *name = poolStoreString(&dtd->pool, enc, s, next);
5319
0
        if (! name)
5320
0
          return XML_ERROR_NO_MEMORY;
5321
0
        parser->m_declEntity = (ENTITY *)lookup(parser, &dtd->paramEntities,
5322
0
                                                name, sizeof(ENTITY));
5323
0
        if (! parser->m_declEntity)
5324
0
          return XML_ERROR_NO_MEMORY;
5325
0
        if (parser->m_declEntity->name != name) {
5326
0
          poolDiscard(&dtd->pool);
5327
0
          parser->m_declEntity = NULL;
5328
0
        } else {
5329
0
          poolFinish(&dtd->pool);
5330
0
          parser->m_declEntity->publicId = NULL;
5331
0
          parser->m_declEntity->is_param = XML_TRUE;
5332
          /* if we have a parent parser or are reading an internal parameter
5333
             entity, then the entity declaration is not considered "internal"
5334
          */
5335
0
          parser->m_declEntity->is_internal
5336
0
              = ! (parser->m_parentParser || parser->m_openInternalEntities);
5337
0
          if (parser->m_entityDeclHandler)
5338
0
            handleDefault = XML_FALSE;
5339
0
        }
5340
0
      } else {
5341
0
        poolDiscard(&dtd->pool);
5342
0
        parser->m_declEntity = NULL;
5343
0
      }
5344
#else  /* not XML_DTD */
5345
      parser->m_declEntity = NULL;
5346
#endif /* XML_DTD */
5347
0
      break;
5348
0
    case XML_ROLE_NOTATION_NAME:
5349
0
      parser->m_declNotationPublicId = NULL;
5350
0
      parser->m_declNotationName = NULL;
5351
0
      if (parser->m_notationDeclHandler) {
5352
0
        parser->m_declNotationName
5353
0
            = poolStoreString(&parser->m_tempPool, enc, s, next);
5354
0
        if (! parser->m_declNotationName)
5355
0
          return XML_ERROR_NO_MEMORY;
5356
0
        poolFinish(&parser->m_tempPool);
5357
0
        handleDefault = XML_FALSE;
5358
0
      }
5359
0
      break;
5360
0
    case XML_ROLE_NOTATION_PUBLIC_ID:
5361
0
      if (! XmlIsPublicId(enc, s, next, eventPP))
5362
0
        return XML_ERROR_PUBLICID;
5363
0
      if (parser
5364
0
              ->m_declNotationName) { /* means m_notationDeclHandler != NULL */
5365
0
        XML_Char *tem = poolStoreString(&parser->m_tempPool, enc,
5366
0
                                        s + enc->minBytesPerChar,
5367
0
                                        next - enc->minBytesPerChar);
5368
0
        if (! tem)
5369
0
          return XML_ERROR_NO_MEMORY;
5370
0
        normalizePublicId(tem);
5371
0
        parser->m_declNotationPublicId = tem;
5372
0
        poolFinish(&parser->m_tempPool);
5373
0
        handleDefault = XML_FALSE;
5374
0
      }
5375
0
      break;
5376
0
    case XML_ROLE_NOTATION_SYSTEM_ID:
5377
0
      if (parser->m_declNotationName && parser->m_notationDeclHandler) {
5378
0
        const XML_Char *systemId = poolStoreString(&parser->m_tempPool, enc,
5379
0
                                                   s + enc->minBytesPerChar,
5380
0
                                                   next - enc->minBytesPerChar);
5381
0
        if (! systemId)
5382
0
          return XML_ERROR_NO_MEMORY;
5383
0
        *eventEndPP = s;
5384
0
        parser->m_notationDeclHandler(
5385
0
            parser->m_handlerArg, parser->m_declNotationName, parser->m_curBase,
5386
0
            systemId, parser->m_declNotationPublicId);
5387
0
        handleDefault = XML_FALSE;
5388
0
      }
5389
0
      poolClear(&parser->m_tempPool);
5390
0
      break;
5391
0
    case XML_ROLE_NOTATION_NO_SYSTEM_ID:
5392
0
      if (parser->m_declNotationPublicId && parser->m_notationDeclHandler) {
5393
0
        *eventEndPP = s;
5394
0
        parser->m_notationDeclHandler(
5395
0
            parser->m_handlerArg, parser->m_declNotationName, parser->m_curBase,
5396
0
            0, parser->m_declNotationPublicId);
5397
0
        handleDefault = XML_FALSE;
5398
0
      }
5399
0
      poolClear(&parser->m_tempPool);
5400
0
      break;
5401
0
    case XML_ROLE_ERROR:
5402
0
      switch (tok) {
5403
0
      case XML_TOK_PARAM_ENTITY_REF:
5404
        /* PE references in internal subset are
5405
           not allowed within declarations. */
5406
0
        return XML_ERROR_PARAM_ENTITY_REF;
5407
0
      case XML_TOK_XML_DECL:
5408
0
        return XML_ERROR_MISPLACED_XML_PI;
5409
0
      default:
5410
0
        return XML_ERROR_SYNTAX;
5411
0
      }
5412
0
#ifdef XML_DTD
5413
0
    case XML_ROLE_IGNORE_SECT: {
5414
0
      enum XML_Error result;
5415
0
      if (parser->m_defaultHandler)
5416
0
        reportDefault(parser, enc, s, next);
5417
0
      handleDefault = XML_FALSE;
5418
0
      result = doIgnoreSection(parser, enc, &next, end, nextPtr, haveMore);
5419
0
      if (result != XML_ERROR_NONE)
5420
0
        return result;
5421
0
      else if (! next) {
5422
0
        parser->m_processor = ignoreSectionProcessor;
5423
0
        return result;
5424
0
      }
5425
0
    } break;
5426
0
#endif /* XML_DTD */
5427
0
    case XML_ROLE_GROUP_OPEN:
5428
0
      if (parser->m_prologState.level >= parser->m_groupSize) {
5429
0
        if (parser->m_groupSize) {
5430
0
          {
5431
            /* Detect and prevent integer overflow */
5432
0
            if (parser->m_groupSize > (unsigned int)(-1) / 2u) {
5433
0
              return XML_ERROR_NO_MEMORY;
5434
0
            }
5435
5436
0
            {
5437
0
               char *const new_connector = (char *)REALLOC(
5438
0
                   parser, parser->m_groupConnector, parser->m_groupSize *= 2);
5439
0
               if (new_connector == NULL) {
5440
0
                 parser->m_groupSize /= 2;
5441
0
                 return XML_ERROR_NO_MEMORY;
5442
0
               }
5443
0
               parser->m_groupConnector = new_connector;
5444
0
            }
5445
0
          }
5446
5447
0
          if (dtd->scaffIndex) {
5448
0
            int *new_scaff_index;
5449
            /* Detect and prevent integer overflow.
5450
             * The preprocessor guard addresses the "always false" warning
5451
             * from -Wtype-limits on platforms where
5452
             * sizeof(unsigned int) < sizeof(size_t), e.g. on x86_64. */
5453
#if UINT_MAX >= SIZE_MAX
5454
            if (parser->m_groupSize > (size_t)(-1) / sizeof(int)) {
5455
              return XML_ERROR_NO_MEMORY;
5456
            }
5457
#endif
5458
5459
0
            new_scaff_index = (int *)REALLOC(
5460
0
                parser, dtd->scaffIndex, parser->m_groupSize * sizeof(int));
5461
0
            if (new_scaff_index == NULL)
5462
0
              return XML_ERROR_NO_MEMORY;
5463
0
            dtd->scaffIndex = new_scaff_index;
5464
0
          }
5465
0
        } else {
5466
0
          parser->m_groupConnector
5467
0
              = (char *)MALLOC(parser, parser->m_groupSize = 32);
5468
0
          if (! parser->m_groupConnector) {
5469
0
            parser->m_groupSize = 0;
5470
0
            return XML_ERROR_NO_MEMORY;
5471
0
          }
5472
0
        }
5473
0
      }
5474
0
      parser->m_groupConnector[parser->m_prologState.level] = 0;
5475
0
      if (dtd->in_eldecl) {
5476
0
        int myindex = nextScaffoldPart(parser);
5477
0
        if (myindex < 0)
5478
0
          return XML_ERROR_NO_MEMORY;
5479
0
        assert(dtd->scaffIndex != NULL);
5480
0
        dtd->scaffIndex[dtd->scaffLevel] = myindex;
5481
0
        dtd->scaffLevel++;
5482
0
        dtd->scaffold[myindex].type = XML_CTYPE_SEQ;
5483
0
        if (parser->m_elementDeclHandler)
5484
0
          handleDefault = XML_FALSE;
5485
0
      }
5486
0
      break;
5487
0
    case XML_ROLE_GROUP_SEQUENCE:
5488
0
      if (parser->m_groupConnector[parser->m_prologState.level] == ASCII_PIPE)
5489
0
        return XML_ERROR_SYNTAX;
5490
0
      parser->m_groupConnector[parser->m_prologState.level] = ASCII_COMMA;
5491
0
      if (dtd->in_eldecl && parser->m_elementDeclHandler)
5492
0
        handleDefault = XML_FALSE;
5493
0
      break;
5494
0
    case XML_ROLE_GROUP_CHOICE:
5495
0
      if (parser->m_groupConnector[parser->m_prologState.level] == ASCII_COMMA)
5496
0
        return XML_ERROR_SYNTAX;
5497
0
      if (dtd->in_eldecl
5498
0
          && ! parser->m_groupConnector[parser->m_prologState.level]
5499
0
          && (dtd->scaffold[dtd->scaffIndex[dtd->scaffLevel - 1]].type
5500
0
              != XML_CTYPE_MIXED)) {
5501
0
        dtd->scaffold[dtd->scaffIndex[dtd->scaffLevel - 1]].type
5502
0
            = XML_CTYPE_CHOICE;
5503
0
        if (parser->m_elementDeclHandler)
5504
0
          handleDefault = XML_FALSE;
5505
0
      }
5506
0
      parser->m_groupConnector[parser->m_prologState.level] = ASCII_PIPE;
5507
0
      break;
5508
0
    case XML_ROLE_PARAM_ENTITY_REF:
5509
0
#ifdef XML_DTD
5510
0
    case XML_ROLE_INNER_PARAM_ENTITY_REF:
5511
0
      dtd->hasParamEntityRefs = XML_TRUE;
5512
0
      if (! parser->m_paramEntityParsing)
5513
0
        dtd->keepProcessing = dtd->standalone;
5514
0
      else {
5515
0
        const XML_Char *name;
5516
0
        ENTITY *entity;
5517
0
        name = poolStoreString(&dtd->pool, enc, s + enc->minBytesPerChar,
5518
0
                               next - enc->minBytesPerChar);
5519
0
        if (! name)
5520
0
          return XML_ERROR_NO_MEMORY;
5521
0
        entity = (ENTITY *)lookup(parser, &dtd->paramEntities, name, 0);
5522
0
        poolDiscard(&dtd->pool);
5523
        /* first, determine if a check for an existing declaration is needed;
5524
           if yes, check that the entity exists, and that it is internal,
5525
           otherwise call the skipped entity handler
5526
        */
5527
0
        if (parser->m_prologState.documentEntity
5528
0
            && (dtd->standalone ? ! parser->m_openInternalEntities
5529
0
                                : ! dtd->hasParamEntityRefs)) {
5530
0
          if (! entity)
5531
0
            return XML_ERROR_UNDEFINED_ENTITY;
5532
0
          else if (! entity->is_internal) {
5533
            /* It's hard to exhaustively search the code to be sure,
5534
             * but there doesn't seem to be a way of executing the
5535
             * following line.  There are two cases:
5536
             *
5537
             * If 'standalone' is false, the DTD must have no
5538
             * parameter entities or we wouldn't have passed the outer
5539
             * 'if' statement.  That means the only entity in the hash
5540
             * table is the external subset name "#" which cannot be
5541
             * given as a parameter entity name in XML syntax, so the
5542
             * lookup must have returned NULL and we don't even reach
5543
             * the test for an internal entity.
5544
             *
5545
             * If 'standalone' is true, it does not seem to be
5546
             * possible to create entities taking this code path that
5547
             * are not internal entities, so fail the test above.
5548
             *
5549
             * Because this analysis is very uncertain, the code is
5550
             * being left in place and merely removed from the
5551
             * coverage test statistics.
5552
             */
5553
0
            return XML_ERROR_ENTITY_DECLARED_IN_PE; /* LCOV_EXCL_LINE */
5554
0
          }
5555
0
        } else if (! entity) {
5556
0
          dtd->keepProcessing = dtd->standalone;
5557
          /* cannot report skipped entities in declarations */
5558
0
          if ((role == XML_ROLE_PARAM_ENTITY_REF)
5559
0
              && parser->m_skippedEntityHandler) {
5560
0
            parser->m_skippedEntityHandler(parser->m_handlerArg, name, 1);
5561
0
            handleDefault = XML_FALSE;
5562
0
          }
5563
0
          break;
5564
0
        }
5565
0
        if (entity->open)
5566
0
          return XML_ERROR_RECURSIVE_ENTITY_REF;
5567
0
        if (entity->textPtr) {
5568
0
          enum XML_Error result;
5569
0
          XML_Bool betweenDecl
5570
0
              = (role == XML_ROLE_PARAM_ENTITY_REF ? XML_TRUE : XML_FALSE);
5571
0
          result = processInternalEntity(parser, entity, betweenDecl);
5572
0
          if (result != XML_ERROR_NONE)
5573
0
            return result;
5574
0
          handleDefault = XML_FALSE;
5575
0
          break;
5576
0
        }
5577
0
        if (parser->m_externalEntityRefHandler) {
5578
0
          dtd->paramEntityRead = XML_FALSE;
5579
0
          entity->open = XML_TRUE;
5580
0
          entityTrackingOnOpen(parser, entity, __LINE__);
5581
0
          if (! parser->m_externalEntityRefHandler(
5582
0
                  parser->m_externalEntityRefHandlerArg, 0, entity->base,
5583
0
                  entity->systemId, entity->publicId)) {
5584
0
            entityTrackingOnClose(parser, entity, __LINE__);
5585
0
            entity->open = XML_FALSE;
5586
0
            return XML_ERROR_EXTERNAL_ENTITY_HANDLING;
5587
0
          }
5588
0
          entityTrackingOnClose(parser, entity, __LINE__);
5589
0
          entity->open = XML_FALSE;
5590
0
          handleDefault = XML_FALSE;
5591
0
          if (! dtd->paramEntityRead) {
5592
0
            dtd->keepProcessing = dtd->standalone;
5593
0
            break;
5594
0
          }
5595
0
        } else {
5596
0
          dtd->keepProcessing = dtd->standalone;
5597
0
          break;
5598
0
        }
5599
0
      }
5600
0
#endif /* XML_DTD */
5601
0
      if (! dtd->standalone && parser->m_notStandaloneHandler
5602
0
          && ! parser->m_notStandaloneHandler(parser->m_handlerArg))
5603
0
        return XML_ERROR_NOT_STANDALONE;
5604
0
      break;
5605
5606
      /* Element declaration stuff */
5607
5608
0
    case XML_ROLE_ELEMENT_NAME:
5609
0
      if (parser->m_elementDeclHandler) {
5610
0
        parser->m_declElementType = getElementType(parser, enc, s, next);
5611
0
        if (! parser->m_declElementType)
5612
0
          return XML_ERROR_NO_MEMORY;
5613
0
        dtd->scaffLevel = 0;
5614
0
        dtd->scaffCount = 0;
5615
0
        dtd->in_eldecl = XML_TRUE;
5616
0
        handleDefault = XML_FALSE;
5617
0
      }
5618
0
      break;
5619
5620
0
    case XML_ROLE_CONTENT_ANY:
5621
0
    case XML_ROLE_CONTENT_EMPTY:
5622
0
      if (dtd->in_eldecl) {
5623
0
        if (parser->m_elementDeclHandler) {
5624
0
          XML_Content *content
5625
0
              = (XML_Content *)MALLOC(parser, sizeof(XML_Content));
5626
0
          if (! content)
5627
0
            return XML_ERROR_NO_MEMORY;
5628
0
          content->quant = XML_CQUANT_NONE;
5629
0
          content->name = NULL;
5630
0
          content->numchildren = 0;
5631
0
          content->children = NULL;
5632
0
          content->type = ((role == XML_ROLE_CONTENT_ANY) ? XML_CTYPE_ANY
5633
0
                                                          : XML_CTYPE_EMPTY);
5634
0
          *eventEndPP = s;
5635
0
          parser->m_elementDeclHandler(
5636
0
              parser->m_handlerArg, parser->m_declElementType->name, content);
5637
0
          handleDefault = XML_FALSE;
5638
0
        }
5639
0
        dtd->in_eldecl = XML_FALSE;
5640
0
      }
5641
0
      break;
5642
5643
0
    case XML_ROLE_CONTENT_PCDATA:
5644
0
      if (dtd->in_eldecl) {
5645
0
        dtd->scaffold[dtd->scaffIndex[dtd->scaffLevel - 1]].type
5646
0
            = XML_CTYPE_MIXED;
5647
0
        if (parser->m_elementDeclHandler)
5648
0
          handleDefault = XML_FALSE;
5649
0
      }
5650
0
      break;
5651
5652
0
    case XML_ROLE_CONTENT_ELEMENT:
5653
0
      quant = XML_CQUANT_NONE;
5654
0
      goto elementContent;
5655
0
    case XML_ROLE_CONTENT_ELEMENT_OPT:
5656
0
      quant = XML_CQUANT_OPT;
5657
0
      goto elementContent;
5658
0
    case XML_ROLE_CONTENT_ELEMENT_REP:
5659
0
      quant = XML_CQUANT_REP;
5660
0
      goto elementContent;
5661
0
    case XML_ROLE_CONTENT_ELEMENT_PLUS:
5662
0
      quant = XML_CQUANT_PLUS;
5663
0
    elementContent:
5664
0
      if (dtd->in_eldecl) {
5665
0
        ELEMENT_TYPE *el;
5666
0
        const XML_Char *name;
5667
0
        size_t nameLen;
5668
0
        const char *nxt
5669
0
            = (quant == XML_CQUANT_NONE ? next : next - enc->minBytesPerChar);
5670
0
        int myindex = nextScaffoldPart(parser);
5671
0
        if (myindex < 0)
5672
0
          return XML_ERROR_NO_MEMORY;
5673
0
        dtd->scaffold[myindex].type = XML_CTYPE_NAME;
5674
0
        dtd->scaffold[myindex].quant = quant;
5675
0
        el = getElementType(parser, enc, s, nxt);
5676
0
        if (! el)
5677
0
          return XML_ERROR_NO_MEMORY;
5678
0
        name = el->name;
5679
0
        dtd->scaffold[myindex].name = name;
5680
0
        nameLen = 0;
5681
0
        for (; name[nameLen++];)
5682
0
          ;
5683
5684
        /* Detect and prevent integer overflow */
5685
0
        if (nameLen > UINT_MAX - dtd->contentStringLen) {
5686
0
          return XML_ERROR_NO_MEMORY;
5687
0
        }
5688
5689
0
        dtd->contentStringLen += (unsigned)nameLen;
5690
0
        if (parser->m_elementDeclHandler)
5691
0
          handleDefault = XML_FALSE;
5692
0
      }
5693
0
      break;
5694
5695
0
    case XML_ROLE_GROUP_CLOSE:
5696
0
      quant = XML_CQUANT_NONE;
5697
0
      goto closeGroup;
5698
0
    case XML_ROLE_GROUP_CLOSE_OPT:
5699
0
      quant = XML_CQUANT_OPT;
5700
0
      goto closeGroup;
5701
0
    case XML_ROLE_GROUP_CLOSE_REP:
5702
0
      quant = XML_CQUANT_REP;
5703
0
      goto closeGroup;
5704
0
    case XML_ROLE_GROUP_CLOSE_PLUS:
5705
0
      quant = XML_CQUANT_PLUS;
5706
0
    closeGroup:
5707
0
      if (dtd->in_eldecl) {
5708
0
        if (parser->m_elementDeclHandler)
5709
0
          handleDefault = XML_FALSE;
5710
0
        dtd->scaffLevel--;
5711
0
        dtd->scaffold[dtd->scaffIndex[dtd->scaffLevel]].quant = quant;
5712
0
        if (dtd->scaffLevel == 0) {
5713
0
          if (! handleDefault) {
5714
0
            XML_Content *model = build_model(parser);
5715
0
            if (! model)
5716
0
              return XML_ERROR_NO_MEMORY;
5717
0
            *eventEndPP = s;
5718
0
            parser->m_elementDeclHandler(
5719
0
                parser->m_handlerArg, parser->m_declElementType->name, model);
5720
0
          }
5721
0
          dtd->in_eldecl = XML_FALSE;
5722
0
          dtd->contentStringLen = 0;
5723
0
        }
5724
0
      }
5725
0
      break;
5726
      /* End element declaration stuff */
5727
5728
0
    case XML_ROLE_PI:
5729
0
      if (! reportProcessingInstruction(parser, enc, s, next))
5730
0
        return XML_ERROR_NO_MEMORY;
5731
0
      handleDefault = XML_FALSE;
5732
0
      break;
5733
0
    case XML_ROLE_COMMENT:
5734
0
      if (! reportComment(parser, enc, s, next))
5735
0
        return XML_ERROR_NO_MEMORY;
5736
0
      handleDefault = XML_FALSE;
5737
0
      break;
5738
138
    case XML_ROLE_NONE:
5739
138
      switch (tok) {
5740
69
      case XML_TOK_BOM:
5741
69
        handleDefault = XML_FALSE;
5742
69
        break;
5743
138
      }
5744
138
      break;
5745
138
    case XML_ROLE_DOCTYPE_NONE:
5746
0
      if (parser->m_startDoctypeDeclHandler)
5747
0
        handleDefault = XML_FALSE;
5748
0
      break;
5749
0
    case XML_ROLE_ENTITY_NONE:
5750
0
      if (dtd->keepProcessing && parser->m_entityDeclHandler)
5751
0
        handleDefault = XML_FALSE;
5752
0
      break;
5753
0
    case XML_ROLE_NOTATION_NONE:
5754
0
      if (parser->m_notationDeclHandler)
5755
0
        handleDefault = XML_FALSE;
5756
0
      break;
5757
0
    case XML_ROLE_ATTLIST_NONE:
5758
0
      if (dtd->keepProcessing && parser->m_attlistDeclHandler)
5759
0
        handleDefault = XML_FALSE;
5760
0
      break;
5761
0
    case XML_ROLE_ELEMENT_NONE:
5762
0
      if (parser->m_elementDeclHandler)
5763
0
        handleDefault = XML_FALSE;
5764
0
      break;
5765
296
    } /* end of big switch */
5766
5767
207
    if (handleDefault && parser->m_defaultHandler)
5768
0
      reportDefault(parser, enc, s, next);
5769
5770
207
    switch (parser->m_parsingStatus.parsing) {
5771
0
    case XML_SUSPENDED:
5772
0
      *nextPtr = next;
5773
0
      return XML_ERROR_NONE;
5774
0
    case XML_FINISHED:
5775
0
      return XML_ERROR_ABORTED;
5776
207
    default:
5777
207
      s = next;
5778
207
      tok = XmlPrologTok(enc, s, end, &next);
5779
207
    }
5780
207
  }
5781
  /* not reached */
5782
89
}
5783
5784
static enum XML_Error PTRCALL
5785
epilogProcessor(XML_Parser parser, const char *s, const char *end,
5786
74
                const char **nextPtr) {
5787
74
  parser->m_processor = epilogProcessor;
5788
74
  parser->m_eventPtr = s;
5789
148
  for (;;) {
5790
148
    const char *next = NULL;
5791
148
    int tok = XmlPrologTok(parser->m_encoding, s, end, &next);
5792
148
#if XML_GE == 1
5793
148
    if (! accountingDiffTolerated(parser, tok, s, next, __LINE__,
5794
148
                                  XML_ACCOUNT_DIRECT)) {
5795
0
      accountingOnAbort(parser);
5796
0
      return XML_ERROR_AMPLIFICATION_LIMIT_BREACH;
5797
0
    }
5798
148
#endif
5799
148
    parser->m_eventEndPtr = next;
5800
148
    switch (tok) {
5801
    /* report partial linebreak - it might be the last token */
5802
0
    case -XML_TOK_PROLOG_S:
5803
0
      if (parser->m_defaultHandler) {
5804
0
        reportDefault(parser, parser->m_encoding, s, next);
5805
0
        if (parser->m_parsingStatus.parsing == XML_FINISHED)
5806
0
          return XML_ERROR_ABORTED;
5807
0
      }
5808
0
      *nextPtr = next;
5809
0
      return XML_ERROR_NONE;
5810
72
    case XML_TOK_NONE:
5811
72
      *nextPtr = s;
5812
72
      return XML_ERROR_NONE;
5813
74
    case XML_TOK_PROLOG_S:
5814
74
      if (parser->m_defaultHandler)
5815
0
        reportDefault(parser, parser->m_encoding, s, next);
5816
74
      break;
5817
0
    case XML_TOK_PI:
5818
0
      if (! reportProcessingInstruction(parser, parser->m_encoding, s, next))
5819
0
        return XML_ERROR_NO_MEMORY;
5820
0
      break;
5821
0
    case XML_TOK_COMMENT:
5822
0
      if (! reportComment(parser, parser->m_encoding, s, next))
5823
0
        return XML_ERROR_NO_MEMORY;
5824
0
      break;
5825
2
    case XML_TOK_INVALID:
5826
2
      parser->m_eventPtr = next;
5827
2
      return XML_ERROR_INVALID_TOKEN;
5828
0
    case XML_TOK_PARTIAL:
5829
0
      if (! parser->m_parsingStatus.finalBuffer) {
5830
0
        *nextPtr = s;
5831
0
        return XML_ERROR_NONE;
5832
0
      }
5833
0
      return XML_ERROR_UNCLOSED_TOKEN;
5834
0
    case XML_TOK_PARTIAL_CHAR:
5835
0
      if (! parser->m_parsingStatus.finalBuffer) {
5836
0
        *nextPtr = s;
5837
0
        return XML_ERROR_NONE;
5838
0
      }
5839
0
      return XML_ERROR_PARTIAL_CHAR;
5840
0
    default:
5841
0
      return XML_ERROR_JUNK_AFTER_DOC_ELEMENT;
5842
148
    }
5843
74
    parser->m_eventPtr = s = next;
5844
74
    switch (parser->m_parsingStatus.parsing) {
5845
0
    case XML_SUSPENDED:
5846
0
      *nextPtr = next;
5847
0
      return XML_ERROR_NONE;
5848
0
    case XML_FINISHED:
5849
0
      return XML_ERROR_ABORTED;
5850
74
    default:;
5851
74
    }
5852
74
  }
5853
74
}
5854
5855
static enum XML_Error
5856
0
processInternalEntity(XML_Parser parser, ENTITY *entity, XML_Bool betweenDecl) {
5857
0
  const char *textStart, *textEnd;
5858
0
  const char *next;
5859
0
  enum XML_Error result;
5860
0
  OPEN_INTERNAL_ENTITY *openEntity;
5861
5862
0
  if (parser->m_freeInternalEntities) {
5863
0
    openEntity = parser->m_freeInternalEntities;
5864
0
    parser->m_freeInternalEntities = openEntity->next;
5865
0
  } else {
5866
0
    openEntity
5867
0
        = (OPEN_INTERNAL_ENTITY *)MALLOC(parser, sizeof(OPEN_INTERNAL_ENTITY));
5868
0
    if (! openEntity)
5869
0
      return XML_ERROR_NO_MEMORY;
5870
0
  }
5871
0
  entity->open = XML_TRUE;
5872
0
#if XML_GE == 1
5873
0
  entityTrackingOnOpen(parser, entity, __LINE__);
5874
0
#endif
5875
0
  entity->processed = 0;
5876
0
  openEntity->next = parser->m_openInternalEntities;
5877
0
  parser->m_openInternalEntities = openEntity;
5878
0
  openEntity->entity = entity;
5879
0
  openEntity->startTagLevel = parser->m_tagLevel;
5880
0
  openEntity->betweenDecl = betweenDecl;
5881
0
  openEntity->internalEventPtr = NULL;
5882
0
  openEntity->internalEventEndPtr = NULL;
5883
0
  textStart = (const char *)entity->textPtr;
5884
0
  textEnd = (const char *)(entity->textPtr + entity->textLen);
5885
  /* Set a safe default value in case 'next' does not get set */
5886
0
  next = textStart;
5887
5888
0
  if (entity->is_param) {
5889
0
    int tok
5890
0
        = XmlPrologTok(parser->m_internalEncoding, textStart, textEnd, &next);
5891
0
    result = doProlog(parser, parser->m_internalEncoding, textStart, textEnd,
5892
0
                      tok, next, &next, XML_FALSE, XML_FALSE,
5893
0
                      XML_ACCOUNT_ENTITY_EXPANSION);
5894
0
  } else {
5895
0
    result = doContent(parser, parser->m_tagLevel, parser->m_internalEncoding,
5896
0
                       textStart, textEnd, &next, XML_FALSE,
5897
0
                       XML_ACCOUNT_ENTITY_EXPANSION);
5898
0
  }
5899
5900
0
  if (result == XML_ERROR_NONE) {
5901
0
    if (textEnd != next && parser->m_parsingStatus.parsing == XML_SUSPENDED) {
5902
0
      entity->processed = (int)(next - textStart);
5903
0
      parser->m_processor = internalEntityProcessor;
5904
0
    } else if (parser->m_openInternalEntities->entity == entity) {
5905
0
#if XML_GE == 1
5906
0
      entityTrackingOnClose(parser, entity, __LINE__);
5907
0
#endif /* XML_GE == 1 */
5908
0
      entity->open = XML_FALSE;
5909
0
      parser->m_openInternalEntities = openEntity->next;
5910
      /* put openEntity back in list of free instances */
5911
0
      openEntity->next = parser->m_freeInternalEntities;
5912
0
      parser->m_freeInternalEntities = openEntity;
5913
0
    }
5914
0
  }
5915
0
  return result;
5916
0
}
5917
5918
static enum XML_Error PTRCALL
5919
internalEntityProcessor(XML_Parser parser, const char *s, const char *end,
5920
0
                        const char **nextPtr) {
5921
0
  ENTITY *entity;
5922
0
  const char *textStart, *textEnd;
5923
0
  const char *next;
5924
0
  enum XML_Error result;
5925
0
  OPEN_INTERNAL_ENTITY *openEntity = parser->m_openInternalEntities;
5926
0
  if (! openEntity)
5927
0
    return XML_ERROR_UNEXPECTED_STATE;
5928
5929
0
  entity = openEntity->entity;
5930
0
  textStart = ((const char *)entity->textPtr) + entity->processed;
5931
0
  textEnd = (const char *)(entity->textPtr + entity->textLen);
5932
  /* Set a safe default value in case 'next' does not get set */
5933
0
  next = textStart;
5934
5935
0
  if (entity->is_param) {
5936
0
    int tok
5937
0
        = XmlPrologTok(parser->m_internalEncoding, textStart, textEnd, &next);
5938
0
    result = doProlog(parser, parser->m_internalEncoding, textStart, textEnd,
5939
0
                      tok, next, &next, XML_FALSE, XML_TRUE,
5940
0
                      XML_ACCOUNT_ENTITY_EXPANSION);
5941
0
  } else {
5942
0
    result = doContent(parser, openEntity->startTagLevel,
5943
0
                       parser->m_internalEncoding, textStart, textEnd, &next,
5944
0
                       XML_FALSE, XML_ACCOUNT_ENTITY_EXPANSION);
5945
0
  }
5946
5947
0
  if (result != XML_ERROR_NONE)
5948
0
    return result;
5949
5950
0
  if (textEnd != next && parser->m_parsingStatus.parsing == XML_SUSPENDED) {
5951
0
    entity->processed = (int)(next - (const char *)entity->textPtr);
5952
0
    return result;
5953
0
  }
5954
5955
0
#if XML_GE == 1
5956
0
  entityTrackingOnClose(parser, entity, __LINE__);
5957
0
#endif
5958
0
  entity->open = XML_FALSE;
5959
0
  parser->m_openInternalEntities = openEntity->next;
5960
  /* put openEntity back in list of free instances */
5961
0
  openEntity->next = parser->m_freeInternalEntities;
5962
0
  parser->m_freeInternalEntities = openEntity;
5963
5964
  // If there are more open entities we want to stop right here and have the
5965
  // upcoming call to XML_ResumeParser continue with entity content, or it would
5966
  // be ignored altogether.
5967
0
  if (parser->m_openInternalEntities != NULL
5968
0
      && parser->m_parsingStatus.parsing == XML_SUSPENDED) {
5969
0
    return XML_ERROR_NONE;
5970
0
  }
5971
5972
0
  if (entity->is_param) {
5973
0
    int tok;
5974
0
    parser->m_processor = prologProcessor;
5975
0
    tok = XmlPrologTok(parser->m_encoding, s, end, &next);
5976
0
    return doProlog(parser, parser->m_encoding, s, end, tok, next, nextPtr,
5977
0
                    (XML_Bool)! parser->m_parsingStatus.finalBuffer, XML_TRUE,
5978
0
                    XML_ACCOUNT_DIRECT);
5979
0
  } else {
5980
0
    parser->m_processor = contentProcessor;
5981
    /* see externalEntityContentProcessor vs contentProcessor */
5982
0
    result = doContent(parser, parser->m_parentParser ? 1 : 0,
5983
0
                       parser->m_encoding, s, end, nextPtr,
5984
0
                       (XML_Bool)! parser->m_parsingStatus.finalBuffer,
5985
0
                       XML_ACCOUNT_DIRECT);
5986
0
    if (result == XML_ERROR_NONE) {
5987
0
      if (! storeRawNames(parser))
5988
0
        return XML_ERROR_NO_MEMORY;
5989
0
    }
5990
0
    return result;
5991
0
  }
5992
0
}
5993
5994
static enum XML_Error PTRCALL
5995
errorProcessor(XML_Parser parser, const char *s, const char *end,
5996
0
               const char **nextPtr) {
5997
0
  UNUSED_P(s);
5998
0
  UNUSED_P(end);
5999
0
  UNUSED_P(nextPtr);
6000
0
  return parser->m_errorCode;
6001
0
}
6002
6003
static enum XML_Error
6004
storeAttributeValue(XML_Parser parser, const ENCODING *enc, XML_Bool isCdata,
6005
                    const char *ptr, const char *end, STRING_POOL *pool,
6006
728
                    enum XML_Account account) {
6007
728
  enum XML_Error result
6008
728
      = appendAttributeValue(parser, enc, isCdata, ptr, end, pool, account);
6009
728
  if (result)
6010
0
    return result;
6011
728
  if (! isCdata && poolLength(pool) && poolLastChar(pool) == 0x20)
6012
0
    poolChop(pool);
6013
728
  if (! poolAppendChar(pool, XML_T('\0')))
6014
0
    return XML_ERROR_NO_MEMORY;
6015
728
  return XML_ERROR_NONE;
6016
728
}
6017
6018
static enum XML_Error
6019
appendAttributeValue(XML_Parser parser, const ENCODING *enc, XML_Bool isCdata,
6020
                     const char *ptr, const char *end, STRING_POOL *pool,
6021
728
                     enum XML_Account account) {
6022
728
  DTD *const dtd = parser->m_dtd; /* save one level of indirection */
6023
#ifndef XML_DTD
6024
  UNUSED_P(account);
6025
#endif
6026
6027
135k
  for (;;) {
6028
135k
    const char *next
6029
135k
        = ptr; /* XmlAttributeValueTok doesn't always set the last arg */
6030
135k
    int tok = XmlAttributeValueTok(enc, ptr, end, &next);
6031
135k
#if XML_GE == 1
6032
135k
    if (! accountingDiffTolerated(parser, tok, ptr, next, __LINE__, account)) {
6033
0
      accountingOnAbort(parser);
6034
0
      return XML_ERROR_AMPLIFICATION_LIMIT_BREACH;
6035
0
    }
6036
135k
#endif
6037
135k
    switch (tok) {
6038
728
    case XML_TOK_NONE:
6039
728
      return XML_ERROR_NONE;
6040
0
    case XML_TOK_INVALID:
6041
0
      if (enc == parser->m_encoding)
6042
0
        parser->m_eventPtr = next;
6043
0
      return XML_ERROR_INVALID_TOKEN;
6044
0
    case XML_TOK_PARTIAL:
6045
0
      if (enc == parser->m_encoding)
6046
0
        parser->m_eventPtr = ptr;
6047
0
      return XML_ERROR_INVALID_TOKEN;
6048
0
    case XML_TOK_CHAR_REF: {
6049
0
      XML_Char buf[XML_ENCODE_MAX];
6050
0
      int i;
6051
0
      int n = XmlCharRefNumber(enc, ptr);
6052
0
      if (n < 0) {
6053
0
        if (enc == parser->m_encoding)
6054
0
          parser->m_eventPtr = ptr;
6055
0
        return XML_ERROR_BAD_CHAR_REF;
6056
0
      }
6057
0
      if (! isCdata && n == 0x20 /* space */
6058
0
          && (poolLength(pool) == 0 || poolLastChar(pool) == 0x20))
6059
0
        break;
6060
0
      n = XmlEncode(n, (ICHAR *)buf);
6061
      /* The XmlEncode() functions can never return 0 here.  That
6062
       * error return happens if the code point passed in is either
6063
       * negative or greater than or equal to 0x110000.  The
6064
       * XmlCharRefNumber() functions will all return a number
6065
       * strictly less than 0x110000 or a negative value if an error
6066
       * occurred.  The negative value is intercepted above, so
6067
       * XmlEncode() is never passed a value it might return an
6068
       * error for.
6069
       */
6070
0
      for (i = 0; i < n; i++) {
6071
0
        if (! poolAppendChar(pool, buf[i]))
6072
0
          return XML_ERROR_NO_MEMORY;
6073
0
      }
6074
0
    } break;
6075
63.6k
    case XML_TOK_DATA_CHARS:
6076
63.6k
      if (! poolAppend(pool, enc, ptr, next))
6077
0
        return XML_ERROR_NO_MEMORY;
6078
63.6k
      break;
6079
63.6k
    case XML_TOK_TRAILING_CR:
6080
0
      next = ptr + enc->minBytesPerChar;
6081
      /* fall through */
6082
68.0k
    case XML_TOK_ATTRIBUTE_VALUE_S:
6083
71.2k
    case XML_TOK_DATA_NEWLINE:
6084
71.2k
      if (! isCdata && (poolLength(pool) == 0 || poolLastChar(pool) == 0x20))
6085
0
        break;
6086
71.2k
      if (! poolAppendChar(pool, 0x20))
6087
0
        return XML_ERROR_NO_MEMORY;
6088
71.2k
      break;
6089
71.2k
    case XML_TOK_ENTITY_REF: {
6090
0
      const XML_Char *name;
6091
0
      ENTITY *entity;
6092
0
      char checkEntityDecl;
6093
0
      XML_Char ch = (XML_Char)XmlPredefinedEntityName(
6094
0
          enc, ptr + enc->minBytesPerChar, next - enc->minBytesPerChar);
6095
0
      if (ch) {
6096
0
#if XML_GE == 1
6097
        /* NOTE: We are replacing 4-6 characters original input for 1 character
6098
         *       so there is no amplification and hence recording without
6099
         *       protection. */
6100
0
        accountingDiffTolerated(parser, tok, (char *)&ch,
6101
0
                                ((char *)&ch) + sizeof(XML_Char), __LINE__,
6102
0
                                XML_ACCOUNT_ENTITY_EXPANSION);
6103
0
#endif /* XML_GE == 1 */
6104
0
        if (! poolAppendChar(pool, ch))
6105
0
          return XML_ERROR_NO_MEMORY;
6106
0
        break;
6107
0
      }
6108
0
      name = poolStoreString(&parser->m_temp2Pool, enc,
6109
0
                             ptr + enc->minBytesPerChar,
6110
0
                             next - enc->minBytesPerChar);
6111
0
      if (! name)
6112
0
        return XML_ERROR_NO_MEMORY;
6113
0
      entity = (ENTITY *)lookup(parser, &dtd->generalEntities, name, 0);
6114
0
      poolDiscard(&parser->m_temp2Pool);
6115
      /* First, determine if a check for an existing declaration is needed;
6116
         if yes, check that the entity exists, and that it is internal.
6117
      */
6118
0
      if (pool == &dtd->pool) /* are we called from prolog? */
6119
0
        checkEntityDecl =
6120
0
#ifdef XML_DTD
6121
0
            parser->m_prologState.documentEntity &&
6122
0
#endif /* XML_DTD */
6123
0
            (dtd->standalone ? ! parser->m_openInternalEntities
6124
0
                             : ! dtd->hasParamEntityRefs);
6125
0
      else /* if (pool == &parser->m_tempPool): we are called from content */
6126
0
        checkEntityDecl = ! dtd->hasParamEntityRefs || dtd->standalone;
6127
0
      if (checkEntityDecl) {
6128
0
        if (! entity)
6129
0
          return XML_ERROR_UNDEFINED_ENTITY;
6130
0
        else if (! entity->is_internal)
6131
0
          return XML_ERROR_ENTITY_DECLARED_IN_PE;
6132
0
      } else if (! entity) {
6133
        /* Cannot report skipped entity here - see comments on
6134
           parser->m_skippedEntityHandler.
6135
        if (parser->m_skippedEntityHandler)
6136
          parser->m_skippedEntityHandler(parser->m_handlerArg, name, 0);
6137
        */
6138
        /* Cannot call the default handler because this would be
6139
           out of sync with the call to the startElementHandler.
6140
        if ((pool == &parser->m_tempPool) && parser->m_defaultHandler)
6141
          reportDefault(parser, enc, ptr, next);
6142
        */
6143
0
        break;
6144
0
      }
6145
0
      if (entity->open) {
6146
0
        if (enc == parser->m_encoding) {
6147
          /* It does not appear that this line can be executed.
6148
           *
6149
           * The "if (entity->open)" check catches recursive entity
6150
           * definitions.  In order to be called with an open
6151
           * entity, it must have gone through this code before and
6152
           * been through the recursive call to
6153
           * appendAttributeValue() some lines below.  That call
6154
           * sets the local encoding ("enc") to the parser's
6155
           * internal encoding (internal_utf8 or internal_utf16),
6156
           * which can never be the same as the principle encoding.
6157
           * It doesn't appear there is another code path that gets
6158
           * here with entity->open being TRUE.
6159
           *
6160
           * Since it is not certain that this logic is watertight,
6161
           * we keep the line and merely exclude it from coverage
6162
           * tests.
6163
           */
6164
0
          parser->m_eventPtr = ptr; /* LCOV_EXCL_LINE */
6165
0
        }
6166
0
        return XML_ERROR_RECURSIVE_ENTITY_REF;
6167
0
      }
6168
0
      if (entity->notation) {
6169
0
        if (enc == parser->m_encoding)
6170
0
          parser->m_eventPtr = ptr;
6171
0
        return XML_ERROR_BINARY_ENTITY_REF;
6172
0
      }
6173
0
      if (! entity->textPtr) {
6174
0
        if (enc == parser->m_encoding)
6175
0
          parser->m_eventPtr = ptr;
6176
0
        return XML_ERROR_ATTRIBUTE_EXTERNAL_ENTITY_REF;
6177
0
      } else {
6178
0
        enum XML_Error result;
6179
0
        const XML_Char *textEnd = entity->textPtr + entity->textLen;
6180
0
        entity->open = XML_TRUE;
6181
0
#if XML_GE == 1
6182
0
        entityTrackingOnOpen(parser, entity, __LINE__);
6183
0
#endif
6184
0
        result = appendAttributeValue(parser, parser->m_internalEncoding,
6185
0
                                      isCdata, (const char *)entity->textPtr,
6186
0
                                      (const char *)textEnd, pool,
6187
0
                                      XML_ACCOUNT_ENTITY_EXPANSION);
6188
0
#if XML_GE == 1
6189
0
        entityTrackingOnClose(parser, entity, __LINE__);
6190
0
#endif
6191
0
        entity->open = XML_FALSE;
6192
0
        if (result)
6193
0
          return result;
6194
0
      }
6195
0
    } break;
6196
0
    default:
6197
      /* The only token returned by XmlAttributeValueTok() that does
6198
       * not have an explicit case here is XML_TOK_PARTIAL_CHAR.
6199
       * Getting that would require an entity name to contain an
6200
       * incomplete XML character (e.g. \xE2\x82); however previous
6201
       * tokenisers will have already recognised and rejected such
6202
       * names before XmlAttributeValueTok() gets a look-in.  This
6203
       * default case should be retained as a safety net, but the code
6204
       * excluded from coverage tests.
6205
       *
6206
       * LCOV_EXCL_START
6207
       */
6208
0
      if (enc == parser->m_encoding)
6209
0
        parser->m_eventPtr = ptr;
6210
0
      return XML_ERROR_UNEXPECTED_STATE;
6211
      /* LCOV_EXCL_STOP */
6212
135k
    }
6213
134k
    ptr = next;
6214
134k
  }
6215
  /* not reached */
6216
728
}
6217
6218
#if XML_GE == 1
6219
static enum XML_Error
6220
storeEntityValue(XML_Parser parser, const ENCODING *enc,
6221
                 const char *entityTextPtr, const char *entityTextEnd,
6222
0
                 enum XML_Account account) {
6223
0
  DTD *const dtd = parser->m_dtd; /* save one level of indirection */
6224
0
  STRING_POOL *pool = &(dtd->entityValuePool);
6225
0
  enum XML_Error result = XML_ERROR_NONE;
6226
0
#  ifdef XML_DTD
6227
0
  int oldInEntityValue = parser->m_prologState.inEntityValue;
6228
0
  parser->m_prologState.inEntityValue = 1;
6229
#  else
6230
  UNUSED_P(account);
6231
#  endif /* XML_DTD */
6232
  /* never return Null for the value argument in EntityDeclHandler,
6233
     since this would indicate an external entity; therefore we
6234
     have to make sure that entityValuePool.start is not null */
6235
0
  if (! pool->blocks) {
6236
0
    if (! poolGrow(pool))
6237
0
      return XML_ERROR_NO_MEMORY;
6238
0
  }
6239
6240
0
  for (;;) {
6241
0
    const char *next
6242
0
        = entityTextPtr; /* XmlEntityValueTok doesn't always set the last arg */
6243
0
    int tok = XmlEntityValueTok(enc, entityTextPtr, entityTextEnd, &next);
6244
6245
0
    if (! accountingDiffTolerated(parser, tok, entityTextPtr, next, __LINE__,
6246
0
                                  account)) {
6247
0
      accountingOnAbort(parser);
6248
0
      result = XML_ERROR_AMPLIFICATION_LIMIT_BREACH;
6249
0
      goto endEntityValue;
6250
0
    }
6251
6252
0
    switch (tok) {
6253
0
    case XML_TOK_PARAM_ENTITY_REF:
6254
0
#  ifdef XML_DTD
6255
0
      if (parser->m_isParamEntity || enc != parser->m_encoding) {
6256
0
        const XML_Char *name;
6257
0
        ENTITY *entity;
6258
0
        name = poolStoreString(&parser->m_tempPool, enc,
6259
0
                               entityTextPtr + enc->minBytesPerChar,
6260
0
                               next - enc->minBytesPerChar);
6261
0
        if (! name) {
6262
0
          result = XML_ERROR_NO_MEMORY;
6263
0
          goto endEntityValue;
6264
0
        }
6265
0
        entity = (ENTITY *)lookup(parser, &dtd->paramEntities, name, 0);
6266
0
        poolDiscard(&parser->m_tempPool);
6267
0
        if (! entity) {
6268
          /* not a well-formedness error - see XML 1.0: WFC Entity Declared */
6269
          /* cannot report skipped entity here - see comments on
6270
             parser->m_skippedEntityHandler
6271
          if (parser->m_skippedEntityHandler)
6272
            parser->m_skippedEntityHandler(parser->m_handlerArg, name, 0);
6273
          */
6274
0
          dtd->keepProcessing = dtd->standalone;
6275
0
          goto endEntityValue;
6276
0
        }
6277
0
        if (entity->open || (entity == parser->m_declEntity)) {
6278
0
          if (enc == parser->m_encoding)
6279
0
            parser->m_eventPtr = entityTextPtr;
6280
0
          result = XML_ERROR_RECURSIVE_ENTITY_REF;
6281
0
          goto endEntityValue;
6282
0
        }
6283
0
        if (entity->systemId) {
6284
0
          if (parser->m_externalEntityRefHandler) {
6285
0
            dtd->paramEntityRead = XML_FALSE;
6286
0
            entity->open = XML_TRUE;
6287
0
            entityTrackingOnOpen(parser, entity, __LINE__);
6288
0
            if (! parser->m_externalEntityRefHandler(
6289
0
                    parser->m_externalEntityRefHandlerArg, 0, entity->base,
6290
0
                    entity->systemId, entity->publicId)) {
6291
0
              entityTrackingOnClose(parser, entity, __LINE__);
6292
0
              entity->open = XML_FALSE;
6293
0
              result = XML_ERROR_EXTERNAL_ENTITY_HANDLING;
6294
0
              goto endEntityValue;
6295
0
            }
6296
0
            entityTrackingOnClose(parser, entity, __LINE__);
6297
0
            entity->open = XML_FALSE;
6298
0
            if (! dtd->paramEntityRead)
6299
0
              dtd->keepProcessing = dtd->standalone;
6300
0
          } else
6301
0
            dtd->keepProcessing = dtd->standalone;
6302
0
        } else {
6303
0
          entity->open = XML_TRUE;
6304
0
          entityTrackingOnOpen(parser, entity, __LINE__);
6305
0
          result = storeEntityValue(
6306
0
              parser, parser->m_internalEncoding, (const char *)entity->textPtr,
6307
0
              (const char *)(entity->textPtr + entity->textLen),
6308
0
              XML_ACCOUNT_ENTITY_EXPANSION);
6309
0
          entityTrackingOnClose(parser, entity, __LINE__);
6310
0
          entity->open = XML_FALSE;
6311
0
          if (result)
6312
0
            goto endEntityValue;
6313
0
        }
6314
0
        break;
6315
0
      }
6316
0
#  endif /* XML_DTD */
6317
      /* In the internal subset, PE references are not legal
6318
         within markup declarations, e.g entity values in this case. */
6319
0
      parser->m_eventPtr = entityTextPtr;
6320
0
      result = XML_ERROR_PARAM_ENTITY_REF;
6321
0
      goto endEntityValue;
6322
0
    case XML_TOK_NONE:
6323
0
      result = XML_ERROR_NONE;
6324
0
      goto endEntityValue;
6325
0
    case XML_TOK_ENTITY_REF:
6326
0
    case XML_TOK_DATA_CHARS:
6327
0
      if (! poolAppend(pool, enc, entityTextPtr, next)) {
6328
0
        result = XML_ERROR_NO_MEMORY;
6329
0
        goto endEntityValue;
6330
0
      }
6331
0
      break;
6332
0
    case XML_TOK_TRAILING_CR:
6333
0
      next = entityTextPtr + enc->minBytesPerChar;
6334
      /* fall through */
6335
0
    case XML_TOK_DATA_NEWLINE:
6336
0
      if (pool->end == pool->ptr && ! poolGrow(pool)) {
6337
0
        result = XML_ERROR_NO_MEMORY;
6338
0
        goto endEntityValue;
6339
0
      }
6340
0
      *(pool->ptr)++ = 0xA;
6341
0
      break;
6342
0
    case XML_TOK_CHAR_REF: {
6343
0
      XML_Char buf[XML_ENCODE_MAX];
6344
0
      int i;
6345
0
      int n = XmlCharRefNumber(enc, entityTextPtr);
6346
0
      if (n < 0) {
6347
0
        if (enc == parser->m_encoding)
6348
0
          parser->m_eventPtr = entityTextPtr;
6349
0
        result = XML_ERROR_BAD_CHAR_REF;
6350
0
        goto endEntityValue;
6351
0
      }
6352
0
      n = XmlEncode(n, (ICHAR *)buf);
6353
      /* The XmlEncode() functions can never return 0 here.  That
6354
       * error return happens if the code point passed in is either
6355
       * negative or greater than or equal to 0x110000.  The
6356
       * XmlCharRefNumber() functions will all return a number
6357
       * strictly less than 0x110000 or a negative value if an error
6358
       * occurred.  The negative value is intercepted above, so
6359
       * XmlEncode() is never passed a value it might return an
6360
       * error for.
6361
       */
6362
0
      for (i = 0; i < n; i++) {
6363
0
        if (pool->end == pool->ptr && ! poolGrow(pool)) {
6364
0
          result = XML_ERROR_NO_MEMORY;
6365
0
          goto endEntityValue;
6366
0
        }
6367
0
        *(pool->ptr)++ = buf[i];
6368
0
      }
6369
0
    } break;
6370
0
    case XML_TOK_PARTIAL:
6371
0
      if (enc == parser->m_encoding)
6372
0
        parser->m_eventPtr = entityTextPtr;
6373
0
      result = XML_ERROR_INVALID_TOKEN;
6374
0
      goto endEntityValue;
6375
0
    case XML_TOK_INVALID:
6376
0
      if (enc == parser->m_encoding)
6377
0
        parser->m_eventPtr = next;
6378
0
      result = XML_ERROR_INVALID_TOKEN;
6379
0
      goto endEntityValue;
6380
0
    default:
6381
      /* This default case should be unnecessary -- all the tokens
6382
       * that XmlEntityValueTok() can return have their own explicit
6383
       * cases -- but should be retained for safety.  We do however
6384
       * exclude it from the coverage statistics.
6385
       *
6386
       * LCOV_EXCL_START
6387
       */
6388
0
      if (enc == parser->m_encoding)
6389
0
        parser->m_eventPtr = entityTextPtr;
6390
0
      result = XML_ERROR_UNEXPECTED_STATE;
6391
0
      goto endEntityValue;
6392
      /* LCOV_EXCL_STOP */
6393
0
    }
6394
0
    entityTextPtr = next;
6395
0
  }
6396
0
endEntityValue:
6397
0
#  ifdef XML_DTD
6398
0
  parser->m_prologState.inEntityValue = oldInEntityValue;
6399
0
#  endif /* XML_DTD */
6400
0
  return result;
6401
0
}
6402
6403
#else /* XML_GE == 0 */
6404
6405
static enum XML_Error
6406
storeSelfEntityValue(XML_Parser parser, ENTITY *entity) {
6407
  // This will store "&amp;entity123;" in entity->textPtr
6408
  // to end up as "&entity123;" in the handler.
6409
  const char *const entity_start = "&amp;";
6410
  const char *const entity_end = ";";
6411
6412
  STRING_POOL *const pool = &(parser->m_dtd->entityValuePool);
6413
  if (! poolAppendString(pool, entity_start)
6414
      || ! poolAppendString(pool, entity->name)
6415
      || ! poolAppendString(pool, entity_end)) {
6416
    poolDiscard(pool);
6417
    return XML_ERROR_NO_MEMORY;
6418
  }
6419
6420
  entity->textPtr = poolStart(pool);
6421
  entity->textLen = (int)(poolLength(pool));
6422
  poolFinish(pool);
6423
6424
  return XML_ERROR_NONE;
6425
}
6426
6427
#endif /* XML_GE == 0 */
6428
6429
static void FASTCALL
6430
0
normalizeLines(XML_Char *s) {
6431
0
  XML_Char *p;
6432
0
  for (;; s++) {
6433
0
    if (*s == XML_T('\0'))
6434
0
      return;
6435
0
    if (*s == 0xD)
6436
0
      break;
6437
0
  }
6438
0
  p = s;
6439
0
  do {
6440
0
    if (*s == 0xD) {
6441
0
      *p++ = 0xA;
6442
0
      if (*++s == 0xA)
6443
0
        s++;
6444
0
    } else
6445
0
      *p++ = *s++;
6446
0
  } while (*s);
6447
0
  *p = XML_T('\0');
6448
0
}
6449
6450
static int
6451
reportProcessingInstruction(XML_Parser parser, const ENCODING *enc,
6452
0
                            const char *start, const char *end) {
6453
0
  const XML_Char *target;
6454
0
  XML_Char *data;
6455
0
  const char *tem;
6456
0
  if (! parser->m_processingInstructionHandler) {
6457
0
    if (parser->m_defaultHandler)
6458
0
      reportDefault(parser, enc, start, end);
6459
0
    return 1;
6460
0
  }
6461
0
  start += enc->minBytesPerChar * 2;
6462
0
  tem = start + XmlNameLength(enc, start);
6463
0
  target = poolStoreString(&parser->m_tempPool, enc, start, tem);
6464
0
  if (! target)
6465
0
    return 0;
6466
0
  poolFinish(&parser->m_tempPool);
6467
0
  data = poolStoreString(&parser->m_tempPool, enc, XmlSkipS(enc, tem),
6468
0
                         end - enc->minBytesPerChar * 2);
6469
0
  if (! data)
6470
0
    return 0;
6471
0
  normalizeLines(data);
6472
0
  parser->m_processingInstructionHandler(parser->m_handlerArg, target, data);
6473
0
  poolClear(&parser->m_tempPool);
6474
0
  return 1;
6475
0
}
6476
6477
static int
6478
reportComment(XML_Parser parser, const ENCODING *enc, const char *start,
6479
0
              const char *end) {
6480
0
  XML_Char *data;
6481
0
  if (! parser->m_commentHandler) {
6482
0
    if (parser->m_defaultHandler)
6483
0
      reportDefault(parser, enc, start, end);
6484
0
    return 1;
6485
0
  }
6486
0
  data = poolStoreString(&parser->m_tempPool, enc,
6487
0
                         start + enc->minBytesPerChar * 4,
6488
0
                         end - enc->minBytesPerChar * 3);
6489
0
  if (! data)
6490
0
    return 0;
6491
0
  normalizeLines(data);
6492
0
  parser->m_commentHandler(parser->m_handlerArg, data);
6493
0
  poolClear(&parser->m_tempPool);
6494
0
  return 1;
6495
0
}
6496
6497
static void
6498
reportDefault(XML_Parser parser, const ENCODING *enc, const char *s,
6499
0
              const char *end) {
6500
0
  if (MUST_CONVERT(enc, s)) {
6501
0
    enum XML_Convert_Result convert_res;
6502
0
    const char **eventPP;
6503
0
    const char **eventEndPP;
6504
0
    if (enc == parser->m_encoding) {
6505
0
      eventPP = &parser->m_eventPtr;
6506
0
      eventEndPP = &parser->m_eventEndPtr;
6507
0
    } else {
6508
      /* To get here, two things must be true; the parser must be
6509
       * using a character encoding that is not the same as the
6510
       * encoding passed in, and the encoding passed in must need
6511
       * conversion to the internal format (UTF-8 unless XML_UNICODE
6512
       * is defined).  The only occasions on which the encoding passed
6513
       * in is not the same as the parser's encoding are when it is
6514
       * the internal encoding (e.g. a previously defined parameter
6515
       * entity, already converted to internal format).  This by
6516
       * definition doesn't need conversion, so the whole branch never
6517
       * gets executed.
6518
       *
6519
       * For safety's sake we don't delete these lines and merely
6520
       * exclude them from coverage statistics.
6521
       *
6522
       * LCOV_EXCL_START
6523
       */
6524
0
      eventPP = &(parser->m_openInternalEntities->internalEventPtr);
6525
0
      eventEndPP = &(parser->m_openInternalEntities->internalEventEndPtr);
6526
      /* LCOV_EXCL_STOP */
6527
0
    }
6528
0
    do {
6529
0
      ICHAR *dataPtr = (ICHAR *)parser->m_dataBuf;
6530
0
      convert_res
6531
0
          = XmlConvert(enc, &s, end, &dataPtr, (ICHAR *)parser->m_dataBufEnd);
6532
0
      *eventEndPP = s;
6533
0
      parser->m_defaultHandler(parser->m_handlerArg, parser->m_dataBuf,
6534
0
                               (int)(dataPtr - (ICHAR *)parser->m_dataBuf));
6535
0
      *eventPP = s;
6536
0
    } while ((convert_res != XML_CONVERT_COMPLETED)
6537
0
             && (convert_res != XML_CONVERT_INPUT_INCOMPLETE));
6538
0
  } else
6539
0
    parser->m_defaultHandler(
6540
0
        parser->m_handlerArg, (const XML_Char *)s,
6541
0
        (int)((const XML_Char *)end - (const XML_Char *)s));
6542
0
}
6543
6544
static int
6545
defineAttribute(ELEMENT_TYPE *type, ATTRIBUTE_ID *attId, XML_Bool isCdata,
6546
0
                XML_Bool isId, const XML_Char *value, XML_Parser parser) {
6547
0
  DEFAULT_ATTRIBUTE *att;
6548
0
  if (value || isId) {
6549
    /* The handling of default attributes gets messed up if we have
6550
       a default which duplicates a non-default. */
6551
0
    int i;
6552
0
    for (i = 0; i < type->nDefaultAtts; i++)
6553
0
      if (attId == type->defaultAtts[i].id)
6554
0
        return 1;
6555
0
    if (isId && ! type->idAtt && ! attId->xmlns)
6556
0
      type->idAtt = attId;
6557
0
  }
6558
0
  if (type->nDefaultAtts == type->allocDefaultAtts) {
6559
0
    int count;
6560
0
    if (type->allocDefaultAtts == 0) {
6561
0
      type->allocDefaultAtts = 8;
6562
0
      type->defaultAtts = (DEFAULT_ATTRIBUTE *)MALLOC(
6563
0
          parser, type->allocDefaultAtts * sizeof(DEFAULT_ATTRIBUTE));
6564
0
      if (! type->defaultAtts) {
6565
0
        type->allocDefaultAtts = 0;
6566
0
        return 0;
6567
0
      }
6568
0
    } else {
6569
0
      DEFAULT_ATTRIBUTE *temp;
6570
6571
      /* Detect and prevent integer overflow */
6572
0
      if (type->allocDefaultAtts > INT_MAX / 2) {
6573
0
        return 0;
6574
0
      }
6575
6576
0
      count = type->allocDefaultAtts * 2;
6577
6578
      /* Detect and prevent integer overflow.
6579
       * The preprocessor guard addresses the "always false" warning
6580
       * from -Wtype-limits on platforms where
6581
       * sizeof(unsigned int) < sizeof(size_t), e.g. on x86_64. */
6582
#if UINT_MAX >= SIZE_MAX
6583
      if ((unsigned)count > (size_t)(-1) / sizeof(DEFAULT_ATTRIBUTE)) {
6584
        return 0;
6585
      }
6586
#endif
6587
6588
0
      temp = (DEFAULT_ATTRIBUTE *)REALLOC(parser, type->defaultAtts,
6589
0
                                          (count * sizeof(DEFAULT_ATTRIBUTE)));
6590
0
      if (temp == NULL)
6591
0
        return 0;
6592
0
      type->allocDefaultAtts = count;
6593
0
      type->defaultAtts = temp;
6594
0
    }
6595
0
  }
6596
0
  att = type->defaultAtts + type->nDefaultAtts;
6597
0
  att->id = attId;
6598
0
  att->value = value;
6599
0
  att->isCdata = isCdata;
6600
0
  if (! isCdata)
6601
0
    attId->maybeTokenized = XML_TRUE;
6602
0
  type->nDefaultAtts += 1;
6603
0
  return 1;
6604
0
}
6605
6606
static int
6607
73
setElementTypePrefix(XML_Parser parser, ELEMENT_TYPE *elementType) {
6608
73
  DTD *const dtd = parser->m_dtd; /* save one level of indirection */
6609
73
  const XML_Char *name;
6610
531
  for (name = elementType->name; *name; name++) {
6611
458
    if (*name == XML_T(ASCII_COLON)) {
6612
0
      PREFIX *prefix;
6613
0
      const XML_Char *s;
6614
0
      for (s = elementType->name; s != name; s++) {
6615
0
        if (! poolAppendChar(&dtd->pool, *s))
6616
0
          return 0;
6617
0
      }
6618
0
      if (! poolAppendChar(&dtd->pool, XML_T('\0')))
6619
0
        return 0;
6620
0
      prefix = (PREFIX *)lookup(parser, &dtd->prefixes, poolStart(&dtd->pool),
6621
0
                                sizeof(PREFIX));
6622
0
      if (! prefix)
6623
0
        return 0;
6624
0
      if (prefix->name == poolStart(&dtd->pool))
6625
0
        poolFinish(&dtd->pool);
6626
0
      else
6627
0
        poolDiscard(&dtd->pool);
6628
0
      elementType->prefix = prefix;
6629
0
      break;
6630
0
    }
6631
458
  }
6632
73
  return 1;
6633
73
}
6634
6635
static ATTRIBUTE_ID *
6636
getAttributeId(XML_Parser parser, const ENCODING *enc, const char *start,
6637
23.6k
               const char *end) {
6638
23.6k
  DTD *const dtd = parser->m_dtd; /* save one level of indirection */
6639
23.6k
  ATTRIBUTE_ID *id;
6640
23.6k
  const XML_Char *name;
6641
23.6k
  if (! poolAppendChar(&dtd->pool, XML_T('\0')))
6642
0
    return NULL;
6643
23.6k
  name = poolStoreString(&dtd->pool, enc, start, end);
6644
23.6k
  if (! name)
6645
0
    return NULL;
6646
  /* skip quotation mark - its storage will be reused (like in name[-1]) */
6647
23.6k
  ++name;
6648
23.6k
  id = (ATTRIBUTE_ID *)lookup(parser, &dtd->attributeIds, name,
6649
23.6k
                              sizeof(ATTRIBUTE_ID));
6650
23.6k
  if (! id)
6651
0
    return NULL;
6652
23.6k
  if (id->name != name)
6653
23.1k
    poolDiscard(&dtd->pool);
6654
446
  else {
6655
446
    poolFinish(&dtd->pool);
6656
446
    if (! parser->m_ns)
6657
186
      ;
6658
260
    else if (name[0] == XML_T(ASCII_x) && name[1] == XML_T(ASCII_m)
6659
40
             && name[2] == XML_T(ASCII_l) && name[3] == XML_T(ASCII_n)
6660
20
             && name[4] == XML_T(ASCII_s)
6661
20
             && (name[5] == XML_T('\0') || name[5] == XML_T(ASCII_COLON))) {
6662
20
      if (name[5] == XML_T('\0'))
6663
20
        id->prefix = &dtd->defaultPrefix;
6664
0
      else
6665
0
        id->prefix = (PREFIX *)lookup(parser, &dtd->prefixes, name + 6,
6666
0
                                      sizeof(PREFIX));
6667
20
      id->xmlns = XML_TRUE;
6668
240
    } else {
6669
240
      int i;
6670
2.13k
      for (i = 0; name[i]; i++) {
6671
        /* attributes without prefix are *not* in the default namespace */
6672
1.91k
        if (name[i] == XML_T(ASCII_COLON)) {
6673
20
          int j;
6674
80
          for (j = 0; j < i; j++) {
6675
60
            if (! poolAppendChar(&dtd->pool, name[j]))
6676
0
              return NULL;
6677
60
          }
6678
20
          if (! poolAppendChar(&dtd->pool, XML_T('\0')))
6679
0
            return NULL;
6680
20
          id->prefix = (PREFIX *)lookup(parser, &dtd->prefixes,
6681
20
                                        poolStart(&dtd->pool), sizeof(PREFIX));
6682
20
          if (! id->prefix)
6683
0
            return NULL;
6684
20
          if (id->prefix->name == poolStart(&dtd->pool))
6685
0
            poolFinish(&dtd->pool);
6686
20
          else
6687
20
            poolDiscard(&dtd->pool);
6688
20
          break;
6689
20
        }
6690
1.91k
      }
6691
240
    }
6692
446
  }
6693
23.6k
  return id;
6694
23.6k
}
6695
6696
820
#define CONTEXT_SEP XML_T(ASCII_FF)
6697
6698
static const XML_Char *
6699
0
getContext(XML_Parser parser) {
6700
0
  DTD *const dtd = parser->m_dtd; /* save one level of indirection */
6701
0
  HASH_TABLE_ITER iter;
6702
0
  XML_Bool needSep = XML_FALSE;
6703
6704
0
  if (dtd->defaultPrefix.binding) {
6705
0
    int i;
6706
0
    int len;
6707
0
    if (! poolAppendChar(&parser->m_tempPool, XML_T(ASCII_EQUALS)))
6708
0
      return NULL;
6709
0
    len = dtd->defaultPrefix.binding->uriLen;
6710
0
    if (parser->m_namespaceSeparator)
6711
0
      len--;
6712
0
    for (i = 0; i < len; i++) {
6713
0
      if (! poolAppendChar(&parser->m_tempPool,
6714
0
                           dtd->defaultPrefix.binding->uri[i])) {
6715
        /* Because of memory caching, I don't believe this line can be
6716
         * executed.
6717
         *
6718
         * This is part of a loop copying the default prefix binding
6719
         * URI into the parser's temporary string pool.  Previously,
6720
         * that URI was copied into the same string pool, with a
6721
         * terminating NUL character, as part of setContext().  When
6722
         * the pool was cleared, that leaves a block definitely big
6723
         * enough to hold the URI on the free block list of the pool.
6724
         * The URI copy in getContext() therefore cannot run out of
6725
         * memory.
6726
         *
6727
         * If the pool is used between the setContext() and
6728
         * getContext() calls, the worst it can do is leave a bigger
6729
         * block on the front of the free list.  Given that this is
6730
         * all somewhat inobvious and program logic can be changed, we
6731
         * don't delete the line but we do exclude it from the test
6732
         * coverage statistics.
6733
         */
6734
0
        return NULL; /* LCOV_EXCL_LINE */
6735
0
      }
6736
0
    }
6737
0
    needSep = XML_TRUE;
6738
0
  }
6739
6740
0
  hashTableIterInit(&iter, &(dtd->prefixes));
6741
0
  for (;;) {
6742
0
    int i;
6743
0
    int len;
6744
0
    const XML_Char *s;
6745
0
    PREFIX *prefix = (PREFIX *)hashTableIterNext(&iter);
6746
0
    if (! prefix)
6747
0
      break;
6748
0
    if (! prefix->binding) {
6749
      /* This test appears to be (justifiable) paranoia.  There does
6750
       * not seem to be a way of injecting a prefix without a binding
6751
       * that doesn't get errored long before this function is called.
6752
       * The test should remain for safety's sake, so we instead
6753
       * exclude the following line from the coverage statistics.
6754
       */
6755
0
      continue; /* LCOV_EXCL_LINE */
6756
0
    }
6757
0
    if (needSep && ! poolAppendChar(&parser->m_tempPool, CONTEXT_SEP))
6758
0
      return NULL;
6759
0
    for (s = prefix->name; *s; s++)
6760
0
      if (! poolAppendChar(&parser->m_tempPool, *s))
6761
0
        return NULL;
6762
0
    if (! poolAppendChar(&parser->m_tempPool, XML_T(ASCII_EQUALS)))
6763
0
      return NULL;
6764
0
    len = prefix->binding->uriLen;
6765
0
    if (parser->m_namespaceSeparator)
6766
0
      len--;
6767
0
    for (i = 0; i < len; i++)
6768
0
      if (! poolAppendChar(&parser->m_tempPool, prefix->binding->uri[i]))
6769
0
        return NULL;
6770
0
    needSep = XML_TRUE;
6771
0
  }
6772
6773
0
  hashTableIterInit(&iter, &(dtd->generalEntities));
6774
0
  for (;;) {
6775
0
    const XML_Char *s;
6776
0
    ENTITY *e = (ENTITY *)hashTableIterNext(&iter);
6777
0
    if (! e)
6778
0
      break;
6779
0
    if (! e->open)
6780
0
      continue;
6781
0
    if (needSep && ! poolAppendChar(&parser->m_tempPool, CONTEXT_SEP))
6782
0
      return NULL;
6783
0
    for (s = e->name; *s; s++)
6784
0
      if (! poolAppendChar(&parser->m_tempPool, *s))
6785
0
        return 0;
6786
0
    needSep = XML_TRUE;
6787
0
  }
6788
6789
0
  if (! poolAppendChar(&parser->m_tempPool, XML_T('\0')))
6790
0
    return NULL;
6791
0
  return parser->m_tempPool.start;
6792
0
}
6793
6794
static XML_Bool
6795
20
setContext(XML_Parser parser, const XML_Char *context) {
6796
20
  DTD *const dtd = parser->m_dtd; /* save one level of indirection */
6797
20
  const XML_Char *s = context;
6798
20
  if (context == NULL) {
6799
0
    return XML_FALSE;
6800
0
  }
6801
6802
6803
100
  while (*context != XML_T('\0')) {
6804
80
    if (*s == CONTEXT_SEP || *s == XML_T('\0')) {
6805
0
      ENTITY *e;
6806
0
      if (! poolAppendChar(&parser->m_tempPool, XML_T('\0')))
6807
0
        return XML_FALSE;
6808
0
      e = (ENTITY *)lookup(parser, &dtd->generalEntities,
6809
0
                           poolStart(&parser->m_tempPool), 0);
6810
0
      if (e)
6811
0
        e->open = XML_TRUE;
6812
0
      if (*s != XML_T('\0'))
6813
0
        s++;
6814
0
      context = s;
6815
0
      poolDiscard(&parser->m_tempPool);
6816
80
    } else if (*s == XML_T(ASCII_EQUALS)) {
6817
20
      PREFIX *prefix;
6818
20
      if (poolLength(&parser->m_tempPool) == 0)
6819
0
        prefix = &dtd->defaultPrefix;
6820
20
      else {
6821
20
        if (! poolAppendChar(&parser->m_tempPool, XML_T('\0')))
6822
0
          return XML_FALSE;
6823
20
        prefix
6824
20
            = (PREFIX *)lookup(parser, &dtd->prefixes,
6825
20
                               poolStart(&parser->m_tempPool), sizeof(PREFIX));
6826
20
        if (! prefix)
6827
0
          return XML_FALSE;
6828
20
        if (prefix->name == poolStart(&parser->m_tempPool)) {
6829
20
          prefix->name = poolCopyString(&dtd->pool, prefix->name);
6830
20
          if (! prefix->name)
6831
0
            return XML_FALSE;
6832
20
        }
6833
20
        poolDiscard(&parser->m_tempPool);
6834
20
      }
6835
740
      for (context = s + 1; *context != CONTEXT_SEP && *context != XML_T('\0');
6836
720
           context++)
6837
720
        if (! poolAppendChar(&parser->m_tempPool, *context))
6838
0
          return XML_FALSE;
6839
20
      if (! poolAppendChar(&parser->m_tempPool, XML_T('\0')))
6840
0
        return XML_FALSE;
6841
20
      if (addBinding(parser, prefix, NULL, poolStart(&parser->m_tempPool),
6842
20
                     &parser->m_inheritedBindings)
6843
20
          != XML_ERROR_NONE)
6844
0
        return XML_FALSE;
6845
20
      poolDiscard(&parser->m_tempPool);
6846
20
      if (*context != XML_T('\0'))
6847
0
        ++context;
6848
20
      s = context;
6849
60
    } else {
6850
60
      if (! poolAppendChar(&parser->m_tempPool, *s))
6851
0
        return XML_FALSE;
6852
60
      s++;
6853
60
    }
6854
80
  }
6855
20
  return XML_TRUE;
6856
20
}
6857
6858
static void FASTCALL
6859
0
normalizePublicId(XML_Char *publicId) {
6860
0
  XML_Char *p = publicId;
6861
0
  XML_Char *s;
6862
0
  for (s = publicId; *s; s++) {
6863
0
    switch (*s) {
6864
0
    case 0x20:
6865
0
    case 0xD:
6866
0
    case 0xA:
6867
0
      if (p != publicId && p[-1] != 0x20)
6868
0
        *p++ = 0x20;
6869
0
      break;
6870
0
    default:
6871
0
      *p++ = *s;
6872
0
    }
6873
0
  }
6874
0
  if (p != publicId && p[-1] == 0x20)
6875
0
    --p;
6876
0
  *p = XML_T('\0');
6877
0
}
6878
6879
static DTD *
6880
89
dtdCreate(const XML_Memory_Handling_Suite *ms) {
6881
89
  DTD *p = ms->malloc_fcn(sizeof(DTD));
6882
89
  if (p == NULL)
6883
0
    return p;
6884
89
  poolInit(&(p->pool), ms);
6885
89
  poolInit(&(p->entityValuePool), ms);
6886
89
  hashTableInit(&(p->generalEntities), ms);
6887
89
  hashTableInit(&(p->elementTypes), ms);
6888
89
  hashTableInit(&(p->attributeIds), ms);
6889
89
  hashTableInit(&(p->prefixes), ms);
6890
89
#ifdef XML_DTD
6891
89
  p->paramEntityRead = XML_FALSE;
6892
89
  hashTableInit(&(p->paramEntities), ms);
6893
89
#endif /* XML_DTD */
6894
89
  p->defaultPrefix.name = NULL;
6895
89
  p->defaultPrefix.binding = NULL;
6896
6897
89
  p->in_eldecl = XML_FALSE;
6898
89
  p->scaffIndex = NULL;
6899
89
  p->scaffold = NULL;
6900
89
  p->scaffLevel = 0;
6901
89
  p->scaffSize = 0;
6902
89
  p->scaffCount = 0;
6903
89
  p->contentStringLen = 0;
6904
6905
89
  p->keepProcessing = XML_TRUE;
6906
89
  p->hasParamEntityRefs = XML_FALSE;
6907
89
  p->standalone = XML_FALSE;
6908
89
  return p;
6909
89
}
6910
6911
static void
6912
0
dtdReset(DTD *p, const XML_Memory_Handling_Suite *ms) {
6913
0
  HASH_TABLE_ITER iter;
6914
0
  hashTableIterInit(&iter, &(p->elementTypes));
6915
0
  for (;;) {
6916
0
    ELEMENT_TYPE *e = (ELEMENT_TYPE *)hashTableIterNext(&iter);
6917
0
    if (! e)
6918
0
      break;
6919
0
    if (e->allocDefaultAtts != 0)
6920
0
      ms->free_fcn(e->defaultAtts);
6921
0
  }
6922
0
  hashTableClear(&(p->generalEntities));
6923
0
#ifdef XML_DTD
6924
0
  p->paramEntityRead = XML_FALSE;
6925
0
  hashTableClear(&(p->paramEntities));
6926
0
#endif /* XML_DTD */
6927
0
  hashTableClear(&(p->elementTypes));
6928
0
  hashTableClear(&(p->attributeIds));
6929
0
  hashTableClear(&(p->prefixes));
6930
0
  poolClear(&(p->pool));
6931
0
  poolClear(&(p->entityValuePool));
6932
0
  p->defaultPrefix.name = NULL;
6933
0
  p->defaultPrefix.binding = NULL;
6934
6935
0
  p->in_eldecl = XML_FALSE;
6936
6937
0
  ms->free_fcn(p->scaffIndex);
6938
0
  p->scaffIndex = NULL;
6939
0
  ms->free_fcn(p->scaffold);
6940
0
  p->scaffold = NULL;
6941
6942
0
  p->scaffLevel = 0;
6943
0
  p->scaffSize = 0;
6944
0
  p->scaffCount = 0;
6945
0
  p->contentStringLen = 0;
6946
6947
0
  p->keepProcessing = XML_TRUE;
6948
0
  p->hasParamEntityRefs = XML_FALSE;
6949
0
  p->standalone = XML_FALSE;
6950
0
}
6951
6952
static void
6953
89
dtdDestroy(DTD *p, XML_Bool isDocEntity, const XML_Memory_Handling_Suite *ms) {
6954
89
  HASH_TABLE_ITER iter;
6955
89
  hashTableIterInit(&iter, &(p->elementTypes));
6956
300
  for (;;) {
6957
300
    ELEMENT_TYPE *e = (ELEMENT_TYPE *)hashTableIterNext(&iter);
6958
300
    if (! e)
6959
89
      break;
6960
211
    if (e->allocDefaultAtts != 0)
6961
0
      ms->free_fcn(e->defaultAtts);
6962
211
  }
6963
89
  hashTableDestroy(&(p->generalEntities));
6964
89
#ifdef XML_DTD
6965
89
  hashTableDestroy(&(p->paramEntities));
6966
89
#endif /* XML_DTD */
6967
89
  hashTableDestroy(&(p->elementTypes));
6968
89
  hashTableDestroy(&(p->attributeIds));
6969
89
  hashTableDestroy(&(p->prefixes));
6970
89
  poolDestroy(&(p->pool));
6971
89
  poolDestroy(&(p->entityValuePool));
6972
89
  if (isDocEntity) {
6973
89
    ms->free_fcn(p->scaffIndex);
6974
89
    ms->free_fcn(p->scaffold);
6975
89
  }
6976
89
  ms->free_fcn(p);
6977
89
}
6978
6979
/* Do a deep copy of the DTD. Return 0 for out of memory, non-zero otherwise.
6980
   The new DTD has already been initialized.
6981
*/
6982
static int
6983
dtdCopy(XML_Parser oldParser, DTD *newDtd, const DTD *oldDtd,
6984
0
        const XML_Memory_Handling_Suite *ms) {
6985
0
  HASH_TABLE_ITER iter;
6986
6987
  /* Copy the prefix table. */
6988
6989
0
  hashTableIterInit(&iter, &(oldDtd->prefixes));
6990
0
  for (;;) {
6991
0
    const XML_Char *name;
6992
0
    const PREFIX *oldP = (PREFIX *)hashTableIterNext(&iter);
6993
0
    if (! oldP)
6994
0
      break;
6995
0
    name = poolCopyString(&(newDtd->pool), oldP->name);
6996
0
    if (! name)
6997
0
      return 0;
6998
0
    if (! lookup(oldParser, &(newDtd->prefixes), name, sizeof(PREFIX)))
6999
0
      return 0;
7000
0
  }
7001
7002
0
  hashTableIterInit(&iter, &(oldDtd->attributeIds));
7003
7004
  /* Copy the attribute id table. */
7005
7006
0
  for (;;) {
7007
0
    ATTRIBUTE_ID *newA;
7008
0
    const XML_Char *name;
7009
0
    const ATTRIBUTE_ID *oldA = (ATTRIBUTE_ID *)hashTableIterNext(&iter);
7010
7011
0
    if (! oldA)
7012
0
      break;
7013
    /* Remember to allocate the scratch byte before the name. */
7014
0
    if (! poolAppendChar(&(newDtd->pool), XML_T('\0')))
7015
0
      return 0;
7016
0
    name = poolCopyString(&(newDtd->pool), oldA->name);
7017
0
    if (! name)
7018
0
      return 0;
7019
0
    ++name;
7020
0
    newA = (ATTRIBUTE_ID *)lookup(oldParser, &(newDtd->attributeIds), name,
7021
0
                                  sizeof(ATTRIBUTE_ID));
7022
0
    if (! newA)
7023
0
      return 0;
7024
0
    newA->maybeTokenized = oldA->maybeTokenized;
7025
0
    if (oldA->prefix) {
7026
0
      newA->xmlns = oldA->xmlns;
7027
0
      if (oldA->prefix == &oldDtd->defaultPrefix)
7028
0
        newA->prefix = &newDtd->defaultPrefix;
7029
0
      else
7030
0
        newA->prefix = (PREFIX *)lookup(oldParser, &(newDtd->prefixes),
7031
0
                                        oldA->prefix->name, 0);
7032
0
    }
7033
0
  }
7034
7035
  /* Copy the element type table. */
7036
7037
0
  hashTableIterInit(&iter, &(oldDtd->elementTypes));
7038
7039
0
  for (;;) {
7040
0
    int i;
7041
0
    ELEMENT_TYPE *newE;
7042
0
    const XML_Char *name;
7043
0
    const ELEMENT_TYPE *oldE = (ELEMENT_TYPE *)hashTableIterNext(&iter);
7044
0
    if (! oldE)
7045
0
      break;
7046
0
    name = poolCopyString(&(newDtd->pool), oldE->name);
7047
0
    if (! name)
7048
0
      return 0;
7049
0
    newE = (ELEMENT_TYPE *)lookup(oldParser, &(newDtd->elementTypes), name,
7050
0
                                  sizeof(ELEMENT_TYPE));
7051
0
    if (! newE)
7052
0
      return 0;
7053
0
    if (oldE->nDefaultAtts) {
7054
      /* Detect and prevent integer overflow.
7055
       * The preprocessor guard addresses the "always false" warning
7056
       * from -Wtype-limits on platforms where
7057
       * sizeof(int) < sizeof(size_t), e.g. on x86_64. */
7058
#if UINT_MAX >= SIZE_MAX
7059
      if ((size_t)oldE->nDefaultAtts
7060
          > ((size_t)(-1) / sizeof(DEFAULT_ATTRIBUTE))) {
7061
        return 0;
7062
      }
7063
#endif
7064
0
      newE->defaultAtts
7065
0
          = ms->malloc_fcn(oldE->nDefaultAtts * sizeof(DEFAULT_ATTRIBUTE));
7066
0
      if (! newE->defaultAtts) {
7067
0
        return 0;
7068
0
      }
7069
0
    }
7070
0
    if (oldE->idAtt)
7071
0
      newE->idAtt = (ATTRIBUTE_ID *)lookup(oldParser, &(newDtd->attributeIds),
7072
0
                                           oldE->idAtt->name, 0);
7073
0
    newE->allocDefaultAtts = newE->nDefaultAtts = oldE->nDefaultAtts;
7074
0
    if (oldE->prefix)
7075
0
      newE->prefix = (PREFIX *)lookup(oldParser, &(newDtd->prefixes),
7076
0
                                      oldE->prefix->name, 0);
7077
0
    for (i = 0; i < newE->nDefaultAtts; i++) {
7078
0
      newE->defaultAtts[i].id = (ATTRIBUTE_ID *)lookup(
7079
0
          oldParser, &(newDtd->attributeIds), oldE->defaultAtts[i].id->name, 0);
7080
0
      newE->defaultAtts[i].isCdata = oldE->defaultAtts[i].isCdata;
7081
0
      if (oldE->defaultAtts[i].value) {
7082
0
        newE->defaultAtts[i].value
7083
0
            = poolCopyString(&(newDtd->pool), oldE->defaultAtts[i].value);
7084
0
        if (! newE->defaultAtts[i].value)
7085
0
          return 0;
7086
0
      } else
7087
0
        newE->defaultAtts[i].value = NULL;
7088
0
    }
7089
0
  }
7090
7091
  /* Copy the entity tables. */
7092
0
  if (! copyEntityTable(oldParser, &(newDtd->generalEntities), &(newDtd->pool),
7093
0
                        &(oldDtd->generalEntities)))
7094
0
    return 0;
7095
7096
0
#ifdef XML_DTD
7097
0
  if (! copyEntityTable(oldParser, &(newDtd->paramEntities), &(newDtd->pool),
7098
0
                        &(oldDtd->paramEntities)))
7099
0
    return 0;
7100
0
  newDtd->paramEntityRead = oldDtd->paramEntityRead;
7101
0
#endif /* XML_DTD */
7102
7103
0
  newDtd->keepProcessing = oldDtd->keepProcessing;
7104
0
  newDtd->hasParamEntityRefs = oldDtd->hasParamEntityRefs;
7105
0
  newDtd->standalone = oldDtd->standalone;
7106
7107
  /* Don't want deep copying for scaffolding */
7108
0
  newDtd->in_eldecl = oldDtd->in_eldecl;
7109
0
  newDtd->scaffold = oldDtd->scaffold;
7110
0
  newDtd->contentStringLen = oldDtd->contentStringLen;
7111
0
  newDtd->scaffSize = oldDtd->scaffSize;
7112
0
  newDtd->scaffLevel = oldDtd->scaffLevel;
7113
0
  newDtd->scaffIndex = oldDtd->scaffIndex;
7114
7115
0
  return 1;
7116
0
} /* End dtdCopy */
7117
7118
static int
7119
copyEntityTable(XML_Parser oldParser, HASH_TABLE *newTable,
7120
0
                STRING_POOL *newPool, const HASH_TABLE *oldTable) {
7121
0
  HASH_TABLE_ITER iter;
7122
0
  const XML_Char *cachedOldBase = NULL;
7123
0
  const XML_Char *cachedNewBase = NULL;
7124
7125
0
  hashTableIterInit(&iter, oldTable);
7126
7127
0
  for (;;) {
7128
0
    ENTITY *newE;
7129
0
    const XML_Char *name;
7130
0
    const ENTITY *oldE = (ENTITY *)hashTableIterNext(&iter);
7131
0
    if (! oldE)
7132
0
      break;
7133
0
    name = poolCopyString(newPool, oldE->name);
7134
0
    if (! name)
7135
0
      return 0;
7136
0
    newE = (ENTITY *)lookup(oldParser, newTable, name, sizeof(ENTITY));
7137
0
    if (! newE)
7138
0
      return 0;
7139
0
    if (oldE->systemId) {
7140
0
      const XML_Char *tem = poolCopyString(newPool, oldE->systemId);
7141
0
      if (! tem)
7142
0
        return 0;
7143
0
      newE->systemId = tem;
7144
0
      if (oldE->base) {
7145
0
        if (oldE->base == cachedOldBase)
7146
0
          newE->base = cachedNewBase;
7147
0
        else {
7148
0
          cachedOldBase = oldE->base;
7149
0
          tem = poolCopyString(newPool, cachedOldBase);
7150
0
          if (! tem)
7151
0
            return 0;
7152
0
          cachedNewBase = newE->base = tem;
7153
0
        }
7154
0
      }
7155
0
      if (oldE->publicId) {
7156
0
        tem = poolCopyString(newPool, oldE->publicId);
7157
0
        if (! tem)
7158
0
          return 0;
7159
0
        newE->publicId = tem;
7160
0
      }
7161
0
    } else {
7162
0
      const XML_Char *tem
7163
0
          = poolCopyStringN(newPool, oldE->textPtr, oldE->textLen);
7164
0
      if (! tem)
7165
0
        return 0;
7166
0
      newE->textPtr = tem;
7167
0
      newE->textLen = oldE->textLen;
7168
0
    }
7169
0
    if (oldE->notation) {
7170
0
      const XML_Char *tem = poolCopyString(newPool, oldE->notation);
7171
0
      if (! tem)
7172
0
        return 0;
7173
0
      newE->notation = tem;
7174
0
    }
7175
0
    newE->is_param = oldE->is_param;
7176
0
    newE->is_internal = oldE->is_internal;
7177
0
  }
7178
0
  return 1;
7179
0
}
7180
7181
396
#define INIT_POWER 6
7182
7183
static XML_Bool FASTCALL
7184
41.5k
keyeq(KEY s1, KEY s2) {
7185
192k
  for (; *s1 == *s2; s1++, s2++)
7186
185k
    if (*s1 == 0)
7187
34.1k
      return XML_TRUE;
7188
7.34k
  return XML_FALSE;
7189
41.5k
}
7190
7191
static size_t
7192
34.9k
keylen(KEY s) {
7193
34.9k
  size_t len = 0;
7194
193k
  for (; *s; s++, len++)
7195
158k
    ;
7196
34.9k
  return len;
7197
34.9k
}
7198
7199
static void
7200
34.9k
copy_salt_to_sipkey(XML_Parser parser, struct sipkey *key) {
7201
34.9k
  key->k[0] = 0;
7202
34.9k
  key->k[1] = get_hash_secret_salt(parser);
7203
34.9k
}
7204
7205
static unsigned long FASTCALL
7206
34.9k
hash(XML_Parser parser, KEY s) {
7207
34.9k
  struct siphash state;
7208
34.9k
  struct sipkey key;
7209
34.9k
  (void)sip24_valid;
7210
34.9k
  copy_salt_to_sipkey(parser, &key);
7211
34.9k
  sip24_init(&state, &key);
7212
34.9k
  sip24_update(&state, s, keylen(s) * sizeof(XML_Char));
7213
34.9k
  return (unsigned long)sip24_final(&state);
7214
34.9k
}
7215
7216
static NAMED *
7217
35.0k
lookup(XML_Parser parser, HASH_TABLE *table, KEY name, size_t createSize) {
7218
35.0k
  size_t i;
7219
35.0k
  if (table->size == 0) {
7220
287
    size_t tsize;
7221
287
    if (! createSize)
7222
89
      return NULL;
7223
198
    table->power = INIT_POWER;
7224
    /* table->size is a power of 2 */
7225
198
    table->size = (size_t)1 << INIT_POWER;
7226
198
    tsize = table->size * sizeof(NAMED *);
7227
198
    table->v = table->mem->malloc_fcn(tsize);
7228
198
    if (! table->v) {
7229
0
      table->size = 0;
7230
0
      return NULL;
7231
0
    }
7232
198
    memset(table->v, 0, tsize);
7233
198
    i = hash(parser, name) & ((unsigned long)table->size - 1);
7234
34.7k
  } else {
7235
34.7k
    unsigned long h = hash(parser, name);
7236
34.7k
    unsigned long mask = (unsigned long)table->size - 1;
7237
34.7k
    unsigned char step = 0;
7238
34.7k
    size_t newSize;
7239
34.7k
    unsigned long newMask;
7240
7241
34.7k
    i = h & mask;
7242
42.1k
    while (table->v[i]) {
7243
41.5k
      if (keyeq(name, table->v[i]->name))
7244
34.1k
        return table->v[i];
7245
7.34k
      if (! step)
7246
6.63k
        step = PROBE_STEP(h, mask, table->power);
7247
7.34k
      i < step ? (i += table->size - step) : (i -= step);
7248
7.34k
    }
7249
601
    if (! createSize)
7250
122
      return NULL;
7251
7252
    /* check for overflow (table is half full) */
7253
479
    if (table->used >> (table->power - 1)) {
7254
0
      unsigned char newPower = table->power + 1;
7255
0
      size_t tsize;
7256
0
      NAMED **newV;
7257
7258
      /* Detect and prevent invalid shift */
7259
0
      if (newPower >= sizeof(unsigned long) * 8 /* bits per byte */) {
7260
0
        return NULL;
7261
0
      }
7262
7263
0
      newSize = (size_t)1 << newPower;
7264
0
      newMask = (unsigned long)newSize - 1;
7265
7266
      /* Detect and prevent integer overflow */
7267
0
      if (newSize > (size_t)(-1) / sizeof(NAMED *)) {
7268
0
        return NULL;
7269
0
      }
7270
7271
0
      tsize = newSize * sizeof(NAMED *);
7272
0
      newV = table->mem->malloc_fcn(tsize);
7273
0
      if (! newV)
7274
0
        return NULL;
7275
0
      memset(newV, 0, tsize);
7276
0
      for (i = 0; i < table->size; i++)
7277
0
        if (table->v[i]) {
7278
0
          unsigned long newHash = hash(parser, table->v[i]->name);
7279
0
          size_t j = newHash & newMask;
7280
0
          step = 0;
7281
0
          while (newV[j]) {
7282
0
            if (! step)
7283
0
              step = PROBE_STEP(newHash, newMask, newPower);
7284
0
            j < step ? (j += newSize - step) : (j -= step);
7285
0
          }
7286
0
          newV[j] = table->v[i];
7287
0
        }
7288
0
      table->mem->free_fcn(table->v);
7289
0
      table->v = newV;
7290
0
      table->power = newPower;
7291
0
      table->size = newSize;
7292
0
      i = h & newMask;
7293
0
      step = 0;
7294
0
      while (table->v[i]) {
7295
0
        if (! step)
7296
0
          step = PROBE_STEP(h, newMask, newPower);
7297
0
        i < step ? (i += newSize - step) : (i -= step);
7298
0
      }
7299
0
    }
7300
479
  }
7301
677
  table->v[i] = table->mem->malloc_fcn(createSize);
7302
677
  if (! table->v[i])
7303
0
    return NULL;
7304
677
  memset(table->v[i], 0, createSize);
7305
677
  table->v[i]->name = name;
7306
677
  (table->used)++;
7307
677
  return table->v[i];
7308
677
}
7309
7310
static void FASTCALL
7311
0
hashTableClear(HASH_TABLE *table) {
7312
0
  size_t i;
7313
0
  for (i = 0; i < table->size; i++) {
7314
0
    table->mem->free_fcn(table->v[i]);
7315
0
    table->v[i] = NULL;
7316
0
  }
7317
0
  table->used = 0;
7318
0
}
7319
7320
static void FASTCALL
7321
445
hashTableDestroy(HASH_TABLE *table) {
7322
445
  size_t i;
7323
13.1k
  for (i = 0; i < table->size; i++)
7324
12.6k
    table->mem->free_fcn(table->v[i]);
7325
445
  table->mem->free_fcn(table->v);
7326
445
}
7327
7328
static void FASTCALL
7329
445
hashTableInit(HASH_TABLE *p, const XML_Memory_Handling_Suite *ms) {
7330
445
  p->power = 0;
7331
445
  p->size = 0;
7332
445
  p->used = 0;
7333
445
  p->v = NULL;
7334
445
  p->mem = ms;
7335
445
}
7336
7337
static void FASTCALL
7338
89
hashTableIterInit(HASH_TABLE_ITER *iter, const HASH_TABLE *table) {
7339
89
  iter->p = table->v;
7340
89
  iter->end = iter->p ? iter->p + table->size : NULL;
7341
89
}
7342
7343
static NAMED *FASTCALL
7344
300
hashTableIterNext(HASH_TABLE_ITER *iter) {
7345
5.78k
  while (iter->p != iter->end) {
7346
5.69k
    NAMED *tem = *(iter->p)++;
7347
5.69k
    if (tem)
7348
211
      return tem;
7349
5.69k
  }
7350
89
  return NULL;
7351
300
}
7352
7353
static void FASTCALL
7354
356
poolInit(STRING_POOL *pool, const XML_Memory_Handling_Suite *ms) {
7355
356
  pool->blocks = NULL;
7356
356
  pool->freeBlocks = NULL;
7357
356
  pool->start = NULL;
7358
356
  pool->ptr = NULL;
7359
356
  pool->end = NULL;
7360
356
  pool->mem = ms;
7361
356
}
7362
7363
static void FASTCALL
7364
11.1k
poolClear(STRING_POOL *pool) {
7365
11.1k
  if (! pool->freeBlocks)
7366
9.65k
    pool->freeBlocks = pool->blocks;
7367
1.48k
  else {
7368
1.48k
    BLOCK *p = pool->blocks;
7369
2.99k
    while (p) {
7370
1.50k
      BLOCK *tem = p->next;
7371
1.50k
      p->next = pool->freeBlocks;
7372
1.50k
      pool->freeBlocks = p;
7373
1.50k
      p = tem;
7374
1.50k
    }
7375
1.48k
  }
7376
11.1k
  pool->blocks = NULL;
7377
11.1k
  pool->start = NULL;
7378
11.1k
  pool->ptr = NULL;
7379
11.1k
  pool->end = NULL;
7380
11.1k
}
7381
7382
static void FASTCALL
7383
356
poolDestroy(STRING_POOL *pool) {
7384
356
  BLOCK *p = pool->blocks;
7385
445
  while (p) {
7386
89
    BLOCK *tem = p->next;
7387
89
    pool->mem->free_fcn(p);
7388
89
    p = tem;
7389
89
  }
7390
356
  p = pool->freeBlocks;
7391
459
  while (p) {
7392
103
    BLOCK *tem = p->next;
7393
103
    pool->mem->free_fcn(p);
7394
103
    p = tem;
7395
103
  }
7396
356
}
7397
7398
static XML_Char *
7399
poolAppend(STRING_POOL *pool, const ENCODING *enc, const char *ptr,
7400
121k
           const char *end) {
7401
121k
  if (! pool->ptr && ! poolGrow(pool))
7402
0
    return NULL;
7403
121k
  for (;;) {
7404
121k
    const enum XML_Convert_Result convert_res = XmlConvert(
7405
121k
        enc, &ptr, end, (ICHAR **)&(pool->ptr), (const ICHAR *)pool->end);
7406
121k
    if ((convert_res == XML_CONVERT_COMPLETED)
7407
41
        || (convert_res == XML_CONVERT_INPUT_INCOMPLETE))
7408
121k
      break;
7409
41
    if (! poolGrow(pool))
7410
0
      return NULL;
7411
41
  }
7412
121k
  return pool->start;
7413
121k
}
7414
7415
static const XML_Char *FASTCALL
7416
231
poolCopyString(STRING_POOL *pool, const XML_Char *s) {
7417
2.75k
  do {
7418
2.75k
    if (! poolAppendChar(pool, *s))
7419
0
      return NULL;
7420
2.75k
  } while (*s++);
7421
231
  s = pool->start;
7422
231
  poolFinish(pool);
7423
231
  return s;
7424
231
}
7425
7426
static const XML_Char *
7427
0
poolCopyStringN(STRING_POOL *pool, const XML_Char *s, int n) {
7428
0
  if (! pool->ptr && ! poolGrow(pool)) {
7429
    /* The following line is unreachable given the current usage of
7430
     * poolCopyStringN().  Currently it is called from exactly one
7431
     * place to copy the text of a simple general entity.  By that
7432
     * point, the name of the entity is already stored in the pool, so
7433
     * pool->ptr cannot be NULL.
7434
     *
7435
     * If poolCopyStringN() is used elsewhere as it well might be,
7436
     * this line may well become executable again.  Regardless, this
7437
     * sort of check shouldn't be removed lightly, so we just exclude
7438
     * it from the coverage statistics.
7439
     */
7440
0
    return NULL; /* LCOV_EXCL_LINE */
7441
0
  }
7442
0
  for (; n > 0; --n, s++) {
7443
0
    if (! poolAppendChar(pool, *s))
7444
0
      return NULL;
7445
0
  }
7446
0
  s = pool->start;
7447
0
  poolFinish(pool);
7448
0
  return s;
7449
0
}
7450
7451
static const XML_Char *FASTCALL
7452
0
poolAppendString(STRING_POOL *pool, const XML_Char *s) {
7453
0
  while (*s) {
7454
0
    if (! poolAppendChar(pool, *s))
7455
0
      return NULL;
7456
0
    s++;
7457
0
  }
7458
0
  return pool->start;
7459
0
}
7460
7461
static XML_Char *
7462
poolStoreString(STRING_POOL *pool, const ENCODING *enc, const char *ptr,
7463
57.5k
                const char *end) {
7464
57.5k
  if (! poolAppend(pool, enc, ptr, end))
7465
0
    return NULL;
7466
57.5k
  if (pool->ptr == pool->end && ! poolGrow(pool))
7467
0
    return NULL;
7468
57.5k
  *(pool->ptr)++ = 0;
7469
57.5k
  return pool->start;
7470
57.5k
}
7471
7472
static size_t
7473
227
poolBytesToAllocateFor(int blockSize) {
7474
  /* Unprotected math would be:
7475
  ** return offsetof(BLOCK, s) + blockSize * sizeof(XML_Char);
7476
  **
7477
  ** Detect overflow, avoiding _signed_ overflow undefined behavior
7478
  ** For a + b * c we check b * c in isolation first, so that addition of a
7479
  ** on top has no chance of making us accept a small non-negative number
7480
  */
7481
227
  const size_t stretch = sizeof(XML_Char); /* can be 4 bytes */
7482
7483
227
  if (blockSize <= 0)
7484
0
    return 0;
7485
7486
227
  if (blockSize > (int)(INT_MAX / stretch))
7487
0
    return 0;
7488
7489
227
  {
7490
227
    const int stretchedBlockSize = blockSize * (int)stretch;
7491
227
    const int bytesToAllocate
7492
227
        = (int)(offsetof(BLOCK, s) + (unsigned)stretchedBlockSize);
7493
227
    if (bytesToAllocate < 0)
7494
0
      return 0;
7495
7496
227
    return (size_t)bytesToAllocate;
7497
227
  }
7498
227
}
7499
7500
static XML_Bool FASTCALL
7501
11.2k
poolGrow(STRING_POOL *pool) {
7502
11.2k
  if (pool->freeBlocks) {
7503
11.0k
    if (pool->start == 0) {
7504
11.0k
      pool->blocks = pool->freeBlocks;
7505
11.0k
      pool->freeBlocks = pool->freeBlocks->next;
7506
11.0k
      pool->blocks->next = NULL;
7507
11.0k
      pool->start = pool->blocks->s;
7508
11.0k
      pool->end = pool->start + pool->blocks->size;
7509
11.0k
      pool->ptr = pool->start;
7510
11.0k
      return XML_TRUE;
7511
11.0k
    }
7512
40
    if (pool->end - pool->start < pool->freeBlocks->size) {
7513
12
      BLOCK *tem = pool->freeBlocks->next;
7514
12
      pool->freeBlocks->next = pool->blocks;
7515
12
      pool->blocks = pool->freeBlocks;
7516
12
      pool->freeBlocks = tem;
7517
12
      memcpy(pool->blocks->s, pool->start,
7518
12
             (pool->end - pool->start) * sizeof(XML_Char));
7519
12
      pool->ptr = pool->blocks->s + (pool->ptr - pool->start);
7520
12
      pool->start = pool->blocks->s;
7521
12
      pool->end = pool->start + pool->blocks->size;
7522
12
      return XML_TRUE;
7523
12
    }
7524
40
  }
7525
227
  if (pool->blocks && pool->start == pool->blocks->s) {
7526
35
    BLOCK *temp;
7527
35
    int blockSize = (int)((unsigned)(pool->end - pool->start) * 2U);
7528
35
    size_t bytesToAllocate;
7529
7530
    /* NOTE: Needs to be calculated prior to calling `realloc`
7531
             to avoid dangling pointers: */
7532
35
    const ptrdiff_t offsetInsideBlock = pool->ptr - pool->start;
7533
7534
35
    if (blockSize < 0) {
7535
      /* This condition traps a situation where either more than
7536
       * INT_MAX/2 bytes have already been allocated.  This isn't
7537
       * readily testable, since it is unlikely that an average
7538
       * machine will have that much memory, so we exclude it from the
7539
       * coverage statistics.
7540
       */
7541
0
      return XML_FALSE; /* LCOV_EXCL_LINE */
7542
0
    }
7543
7544
35
    bytesToAllocate = poolBytesToAllocateFor(blockSize);
7545
35
    if (bytesToAllocate == 0)
7546
0
      return XML_FALSE;
7547
7548
35
    temp = (BLOCK *)pool->mem->realloc_fcn(pool->blocks,
7549
35
                                           (unsigned)bytesToAllocate);
7550
35
    if (temp == NULL)
7551
0
      return XML_FALSE;
7552
35
    pool->blocks = temp;
7553
35
    pool->blocks->size = blockSize;
7554
35
    pool->ptr = pool->blocks->s + offsetInsideBlock;
7555
35
    pool->start = pool->blocks->s;
7556
35
    pool->end = pool->start + blockSize;
7557
192
  } else {
7558
192
    BLOCK *tem;
7559
192
    int blockSize = (int)(pool->end - pool->start);
7560
192
    size_t bytesToAllocate;
7561
7562
192
    if (blockSize < 0) {
7563
      /* This condition traps a situation where either more than
7564
       * INT_MAX bytes have already been allocated (which is prevented
7565
       * by various pieces of program logic, not least this one, never
7566
       * mind the unlikelihood of actually having that much memory) or
7567
       * the pool control fields have been corrupted (which could
7568
       * conceivably happen in an extremely buggy user handler
7569
       * function).  Either way it isn't readily testable, so we
7570
       * exclude it from the coverage statistics.
7571
       */
7572
0
      return XML_FALSE; /* LCOV_EXCL_LINE */
7573
0
    }
7574
7575
192
    if (blockSize < INIT_BLOCK_SIZE)
7576
185
      blockSize = INIT_BLOCK_SIZE;
7577
7
    else {
7578
      /* Detect overflow, avoiding _signed_ overflow undefined behavior */
7579
7
      if ((int)((unsigned)blockSize * 2U) < 0) {
7580
0
        return XML_FALSE;
7581
0
      }
7582
7
      blockSize *= 2;
7583
7
    }
7584
7585
192
    bytesToAllocate = poolBytesToAllocateFor(blockSize);
7586
192
    if (bytesToAllocate == 0)
7587
0
      return XML_FALSE;
7588
7589
192
    tem = pool->mem->malloc_fcn(bytesToAllocate);
7590
192
    if (! tem)
7591
0
      return XML_FALSE;
7592
192
    tem->size = blockSize;
7593
192
    tem->next = pool->blocks;
7594
192
    pool->blocks = tem;
7595
192
    if (pool->ptr != pool->start)
7596
14
      memcpy(tem->s, pool->start, (pool->ptr - pool->start) * sizeof(XML_Char));
7597
192
    pool->ptr = tem->s + (pool->ptr - pool->start);
7598
192
    pool->start = tem->s;
7599
192
    pool->end = tem->s + blockSize;
7600
192
  }
7601
227
  return XML_TRUE;
7602
227
}
7603
7604
static int FASTCALL
7605
0
nextScaffoldPart(XML_Parser parser) {
7606
0
  DTD *const dtd = parser->m_dtd; /* save one level of indirection */
7607
0
  CONTENT_SCAFFOLD *me;
7608
0
  int next;
7609
7610
0
  if (! dtd->scaffIndex) {
7611
    /* Detect and prevent integer overflow.
7612
     * The preprocessor guard addresses the "always false" warning
7613
     * from -Wtype-limits on platforms where
7614
     * sizeof(unsigned int) < sizeof(size_t), e.g. on x86_64. */
7615
#if UINT_MAX >= SIZE_MAX
7616
    if (parser->m_groupSize > ((size_t)(-1) / sizeof(int))) {
7617
      return -1;
7618
    }
7619
#endif
7620
0
    dtd->scaffIndex = (int *)MALLOC(parser, parser->m_groupSize * sizeof(int));
7621
0
    if (! dtd->scaffIndex)
7622
0
      return -1;
7623
0
    dtd->scaffIndex[0] = 0;
7624
0
  }
7625
7626
0
  if (dtd->scaffCount >= dtd->scaffSize) {
7627
0
    CONTENT_SCAFFOLD *temp;
7628
0
    if (dtd->scaffold) {
7629
      /* Detect and prevent integer overflow */
7630
0
      if (dtd->scaffSize > UINT_MAX / 2u) {
7631
0
        return -1;
7632
0
      }
7633
      /* Detect and prevent integer overflow.
7634
       * The preprocessor guard addresses the "always false" warning
7635
       * from -Wtype-limits on platforms where
7636
       * sizeof(unsigned int) < sizeof(size_t), e.g. on x86_64. */
7637
#if UINT_MAX >= SIZE_MAX
7638
      if (dtd->scaffSize > (size_t)(-1) / 2u / sizeof(CONTENT_SCAFFOLD)) {
7639
        return -1;
7640
      }
7641
#endif
7642
7643
0
      temp = (CONTENT_SCAFFOLD *)REALLOC(
7644
0
          parser, dtd->scaffold, dtd->scaffSize * 2 * sizeof(CONTENT_SCAFFOLD));
7645
0
      if (temp == NULL)
7646
0
        return -1;
7647
0
      dtd->scaffSize *= 2;
7648
0
    } else {
7649
0
      temp = (CONTENT_SCAFFOLD *)MALLOC(parser, INIT_SCAFFOLD_ELEMENTS
7650
0
                                                    * sizeof(CONTENT_SCAFFOLD));
7651
0
      if (temp == NULL)
7652
0
        return -1;
7653
0
      dtd->scaffSize = INIT_SCAFFOLD_ELEMENTS;
7654
0
    }
7655
0
    dtd->scaffold = temp;
7656
0
  }
7657
0
  next = dtd->scaffCount++;
7658
0
  me = &dtd->scaffold[next];
7659
0
  if (dtd->scaffLevel) {
7660
0
    CONTENT_SCAFFOLD *parent
7661
0
        = &dtd->scaffold[dtd->scaffIndex[dtd->scaffLevel - 1]];
7662
0
    if (parent->lastchild) {
7663
0
      dtd->scaffold[parent->lastchild].nextsib = next;
7664
0
    }
7665
0
    if (! parent->childcnt)
7666
0
      parent->firstchild = next;
7667
0
    parent->lastchild = next;
7668
0
    parent->childcnt++;
7669
0
  }
7670
0
  me->firstchild = me->lastchild = me->childcnt = me->nextsib = 0;
7671
0
  return next;
7672
0
}
7673
7674
static XML_Content *
7675
0
build_model(XML_Parser parser) {
7676
  /* Function build_model transforms the existing parser->m_dtd->scaffold
7677
   * array of CONTENT_SCAFFOLD tree nodes into a new array of
7678
   * XML_Content tree nodes followed by a gapless list of zero-terminated
7679
   * strings. */
7680
0
  DTD *const dtd = parser->m_dtd; /* save one level of indirection */
7681
0
  XML_Content *ret;
7682
0
  XML_Char *str; /* the current string writing location */
7683
0
  size_t allocsize;
7684
0
  XML_Content *dest;
7685
0
  XML_Content *destLimit;
7686
0
  XML_Content *jobDest;
7687
7688
  /* Detect and prevent integer overflow.
7689
   * The preprocessor guard addresses the "always false" warning
7690
   * from -Wtype-limits on platforms where
7691
   * sizeof(unsigned int) < sizeof(size_t), e.g. on x86_64. */
7692
#if UINT_MAX >= SIZE_MAX
7693
  if (dtd->scaffCount > (size_t)(-1) / sizeof(XML_Content)) {
7694
    return NULL;
7695
  }
7696
  if (dtd->contentStringLen > (size_t)(-1) / sizeof(XML_Char)) {
7697
    return NULL;
7698
  }
7699
#endif
7700
0
  if (dtd->scaffCount * sizeof(XML_Content)
7701
0
      > (size_t)(-1) - dtd->contentStringLen * sizeof(XML_Char)) {
7702
0
    return NULL;
7703
0
  }
7704
7705
0
  allocsize = (dtd->scaffCount * sizeof(XML_Content)
7706
0
                            + (dtd->contentStringLen * sizeof(XML_Char)));
7707
7708
0
  ret = (XML_Content *)MALLOC(parser, allocsize);
7709
0
  if (! ret)
7710
0
    return NULL;
7711
7712
  /* What follows is an iterative implementation (of what was previously done
7713
   * recursively in a dedicated function called "build_node".  The old recursive
7714
   * build_node could be forced into stack exhaustion from input as small as a
7715
   * few megabyte, and so that was a security issue.  Hence, a function call
7716
   * stack is avoided now by resolving recursion.)
7717
   *
7718
   * The iterative approach works as follows:
7719
   *
7720
   * - We have two writing pointers, both walking up the result array; one does
7721
   *   the work, the other creates "jobs" for its colleague to do, and leads
7722
   *   the way:
7723
   *
7724
   *   - The faster one, pointer jobDest, always leads and writes "what job
7725
   *     to do" by the other, once they reach that place in the
7726
   *     array: leader "jobDest" stores the source node array index (relative
7727
   *     to array dtd->scaffold) in field "numchildren".
7728
   *
7729
   *   - The slower one, pointer dest, looks at the value stored in the
7730
   *     "numchildren" field (which actually holds a source node array index
7731
   *     at that time) and puts the real data from dtd->scaffold in.
7732
   *
7733
   * - Before the loop starts, jobDest writes source array index 0
7734
   *   (where the root node is located) so that dest will have something to do
7735
   *   when it starts operation.
7736
   *
7737
   * - Whenever nodes with children are encountered, jobDest appends
7738
   *   them as new jobs, in order.  As a result, tree node siblings are
7739
   *   adjacent in the resulting array, for example:
7740
   *
7741
   *     [0] root, has two children
7742
   *       [1] first child of 0, has three children
7743
   *         [3] first child of 1, does not have children
7744
   *         [4] second child of 1, does not have children
7745
   *         [5] third child of 1, does not have children
7746
   *       [2] second child of 0, does not have children
7747
   *
7748
   *   Or (the same data) presented in flat array view:
7749
   *
7750
   *     [0] root, has two children
7751
   *
7752
   *     [1] first child of 0, has three children
7753
   *     [2] second child of 0, does not have children
7754
   *
7755
   *     [3] first child of 1, does not have children
7756
   *     [4] second child of 1, does not have children
7757
   *     [5] third child of 1, does not have children
7758
   *
7759
   * - The algorithm repeats until all target array indices have been processed.
7760
   */
7761
0
  dest = ret; /* tree node writing location, moves upwards */
7762
0
  destLimit = &ret[dtd->scaffCount];
7763
0
  jobDest = ret; /* next free writing location in target array */
7764
0
  str = (XML_Char *)&ret[dtd->scaffCount];
7765
7766
  /* Add the starting job, the root node (index 0) of the source tree  */
7767
0
  (jobDest++)->numchildren = 0;
7768
7769
0
  for (; dest < destLimit; dest++) {
7770
    /* Retrieve source tree array index from job storage */
7771
0
    const int src_node = (int)dest->numchildren;
7772
7773
    /* Convert item */
7774
0
    dest->type = dtd->scaffold[src_node].type;
7775
0
    dest->quant = dtd->scaffold[src_node].quant;
7776
0
    if (dest->type == XML_CTYPE_NAME) {
7777
0
      const XML_Char *src;
7778
0
      dest->name = str;
7779
0
      src = dtd->scaffold[src_node].name;
7780
0
      for (;;) {
7781
0
        *str++ = *src;
7782
0
        if (! *src)
7783
0
          break;
7784
0
        src++;
7785
0
      }
7786
0
      dest->numchildren = 0;
7787
0
      dest->children = NULL;
7788
0
    } else {
7789
0
      unsigned int i;
7790
0
      int cn;
7791
0
      dest->name = NULL;
7792
0
      dest->numchildren = dtd->scaffold[src_node].childcnt;
7793
0
      dest->children = jobDest;
7794
7795
      /* Append scaffold indices of children to array */
7796
0
      for (i = 0, cn = dtd->scaffold[src_node].firstchild;
7797
0
           i < dest->numchildren; i++, cn = dtd->scaffold[cn].nextsib)
7798
0
        (jobDest++)->numchildren = (unsigned int)cn;
7799
0
    }
7800
0
  }
7801
7802
0
  return ret;
7803
0
}
7804
7805
static ELEMENT_TYPE *
7806
getElementType(XML_Parser parser, const ENCODING *enc, const char *ptr,
7807
0
               const char *end) {
7808
0
  DTD *const dtd = parser->m_dtd; /* save one level of indirection */
7809
0
  const XML_Char *name = poolStoreString(&dtd->pool, enc, ptr, end);
7810
0
  ELEMENT_TYPE *ret;
7811
7812
0
  if (! name)
7813
0
    return NULL;
7814
0
  ret = (ELEMENT_TYPE *)lookup(parser, &dtd->elementTypes, name,
7815
0
                               sizeof(ELEMENT_TYPE));
7816
0
  if (! ret)
7817
0
    return NULL;
7818
0
  if (ret->name != name)
7819
0
    poolDiscard(&dtd->pool);
7820
0
  else {
7821
0
    poolFinish(&dtd->pool);
7822
0
    if (! setElementTypePrefix(parser, ret))
7823
0
      return NULL;
7824
0
  }
7825
0
  return ret;
7826
0
}
7827
7828
static XML_Char *
7829
0
copyString(const XML_Char *s, const XML_Memory_Handling_Suite *memsuite) {
7830
0
  size_t charsRequired = 0;
7831
0
  XML_Char *result;
7832
7833
  /* First determine how long the string is */
7834
0
  while (s[charsRequired] != 0) {
7835
0
    charsRequired++;
7836
0
  }
7837
  /* Include the terminator */
7838
0
  charsRequired++;
7839
7840
  /* Now allocate space for the copy */
7841
0
  result = memsuite->malloc_fcn(charsRequired * sizeof(XML_Char));
7842
0
  if (result == NULL)
7843
0
    return NULL;
7844
  /* Copy the original into place */
7845
0
  memcpy(result, s, charsRequired * sizeof(XML_Char));
7846
0
  return result;
7847
0
}
7848
7849
#if XML_GE == 1
7850
7851
static float
7852
33.3k
accountingGetCurrentAmplification(XML_Parser rootParser) {
7853
  //                                          1.........1.........12 => 22
7854
33.3k
  const size_t lenOfShortestInclude = sizeof("<!ENTITY a SYSTEM 'b'>") - 1;
7855
33.3k
  const XmlBigCount countBytesOutput
7856
33.3k
      = rootParser->m_accounting.countBytesDirect
7857
33.3k
        + rootParser->m_accounting.countBytesIndirect;
7858
33.3k
  const float amplificationFactor
7859
33.3k
      = rootParser->m_accounting.countBytesDirect
7860
33.3k
            ? (countBytesOutput
7861
33.3k
               / (float)(rootParser->m_accounting.countBytesDirect))
7862
33.3k
            : ((lenOfShortestInclude
7863
0
                + rootParser->m_accounting.countBytesIndirect)
7864
0
               / (float)lenOfShortestInclude);
7865
33.3k
  assert(! rootParser->m_parentParser);
7866
33.3k
  return amplificationFactor;
7867
33.3k
}
7868
7869
static void
7870
0
accountingReportStats(XML_Parser originParser, const char *epilog) {
7871
0
  const XML_Parser rootParser = getRootParserOf(originParser, NULL);
7872
0
  float amplificationFactor;
7873
0
  assert(! rootParser->m_parentParser);
7874
7875
0
  if (rootParser->m_accounting.debugLevel == 0u) {
7876
0
    return;
7877
0
  }
7878
7879
0
  amplificationFactor
7880
0
      = accountingGetCurrentAmplification(rootParser);
7881
0
  fprintf(stderr,
7882
0
          "expat: Accounting(%p): Direct " EXPAT_FMT_ULL(
7883
0
              "10") ", indirect " EXPAT_FMT_ULL("10") ", amplification %8.2f%s",
7884
0
          (void *)rootParser, rootParser->m_accounting.countBytesDirect,
7885
0
          rootParser->m_accounting.countBytesIndirect,
7886
0
          (double)amplificationFactor, epilog);
7887
0
}
7888
7889
static void
7890
0
accountingOnAbort(XML_Parser originParser) {
7891
0
  accountingReportStats(originParser, " ABORTING\n");
7892
0
}
7893
7894
static void
7895
accountingReportDiff(XML_Parser rootParser,
7896
                     unsigned int levelsAwayFromRootParser, const char *before,
7897
                     const char *after, ptrdiff_t bytesMore, int source_line,
7898
0
                     enum XML_Account account) {
7899
0
  const char ellipis[] = "[..]";
7900
0
  const size_t ellipsisLength = sizeof(ellipis) /* because compile-time */ - 1;
7901
0
  const unsigned int contextLength = 10;
7902
0
  char *walker;
7903
0
  assert(! rootParser->m_parentParser);
7904
7905
0
  fprintf(stderr,
7906
0
          " (+" EXPAT_FMT_PTRDIFF_T("6") " bytes %s|%u, xmlparse.c:%d) %*s\"",
7907
0
          bytesMore, (account == XML_ACCOUNT_DIRECT) ? "DIR" : "EXP",
7908
0
          levelsAwayFromRootParser, source_line, 10, "");
7909
7910
7911
  /* Note: Performance is of no concern here */
7912
0
  walker = (char *)before;
7913
0
  if ((rootParser->m_accounting.debugLevel >= 3u)
7914
0
      || (after - before)
7915
0
             <= (ptrdiff_t)(contextLength + ellipsisLength + contextLength)) {
7916
0
    for (; walker < after; walker++) {
7917
0
      fprintf(stderr, "%s", unsignedCharToPrintable(walker[0]));
7918
0
    }
7919
0
  } else {
7920
0
    for (; walker < before + contextLength; walker++) {
7921
0
      fprintf(stderr, "%s", unsignedCharToPrintable(walker[0]));
7922
0
    }
7923
0
    fprintf(stderr, ellipis);
7924
0
    walker = (char *)(after - contextLength);
7925
0
    for (; walker < after; walker++) {
7926
0
      fprintf(stderr, "%s", unsignedCharToPrintable(walker[0]));
7927
0
    }
7928
0
  }
7929
0
  fprintf(stderr, "\"\n");
7930
0
}
7931
7932
static XML_Bool
7933
accountingDiffTolerated(XML_Parser originParser, int tok, const char *before,
7934
                        const char *after, int source_line,
7935
169k
                        enum XML_Account account) {
7936
169k
  unsigned int levelsAwayFromRootParser;
7937
169k
  XML_Parser rootParser;
7938
169k
  int isDirect;
7939
169k
  ptrdiff_t bytesMore;
7940
169k
  XmlBigCount *additionTarget;
7941
169k
  XmlBigCount countBytesOutput;
7942
169k
  float amplificationFactor;
7943
169k
  XML_Bool tolerated;
7944
7945
  /* Note: We need to check the token type *first* to be sure that
7946
   *       we can even access variable <after>, safely.
7947
   *       E.g. for XML_TOK_NONE <after> may hold an invalid pointer. */
7948
169k
  switch (tok) {
7949
17
  case XML_TOK_INVALID:
7950
17
  case XML_TOK_PARTIAL:
7951
17
  case XML_TOK_PARTIAL_CHAR:
7952
817
  case XML_TOK_NONE:
7953
817
    return XML_TRUE;
7954
169k
  }
7955
7956
168k
  if (account == XML_ACCOUNT_NONE)
7957
134k
    return XML_TRUE; /* because these bytes have been accounted for, already */
7958
7959
33.3k
  rootParser
7960
33.3k
      = getRootParserOf(originParser, &levelsAwayFromRootParser);
7961
33.3k
  assert(! rootParser->m_parentParser);
7962
7963
33.3k
  isDirect
7964
33.3k
      = (account == XML_ACCOUNT_DIRECT) && (originParser == rootParser);
7965
33.3k
  bytesMore = after - before;
7966
7967
33.3k
  additionTarget
7968
33.3k
      = isDirect ? &rootParser->m_accounting.countBytesDirect
7969
33.3k
                 : &rootParser->m_accounting.countBytesIndirect;
7970
7971
  /* Detect and avoid integer overflow */
7972
33.3k
  if (*additionTarget > (XmlBigCount)(-1) - (XmlBigCount)bytesMore)
7973
0
    return XML_FALSE;
7974
33.3k
  *additionTarget += bytesMore;
7975
7976
33.3k
  countBytesOutput
7977
33.3k
      = rootParser->m_accounting.countBytesDirect
7978
33.3k
        + rootParser->m_accounting.countBytesIndirect;
7979
33.3k
  amplificationFactor
7980
33.3k
      = accountingGetCurrentAmplification(rootParser);
7981
33.3k
  tolerated
7982
33.3k
      = (countBytesOutput < rootParser->m_accounting.activationThresholdBytes)
7983
0
        || (amplificationFactor
7984
0
            <= rootParser->m_accounting.maximumAmplificationFactor);
7985
7986
33.3k
  if (rootParser->m_accounting.debugLevel >= 2u) {
7987
0
    accountingReportStats(rootParser, "");
7988
0
    accountingReportDiff(rootParser, levelsAwayFromRootParser, before, after,
7989
0
                         bytesMore, source_line, account);
7990
0
  }
7991
7992
33.3k
  return tolerated;
7993
33.3k
}
7994
7995
unsigned long long
7996
0
testingAccountingGetCountBytesDirect(XML_Parser parser) {
7997
0
  if (! parser)
7998
0
    return 0;
7999
0
  return parser->m_accounting.countBytesDirect;
8000
0
}
8001
8002
unsigned long long
8003
0
testingAccountingGetCountBytesIndirect(XML_Parser parser) {
8004
0
  if (! parser)
8005
0
    return 0;
8006
0
  return parser->m_accounting.countBytesIndirect;
8007
0
}
8008
8009
static void
8010
entityTrackingReportStats(XML_Parser rootParser, ENTITY *entity,
8011
0
                          const char *action, int sourceLine) {
8012
#  if defined(XML_UNICODE)
8013
  const char *const entityName = "[..]";
8014
#  else
8015
0
  const char *const entityName = entity->name;
8016
0
#  endif
8017
0
  assert(! rootParser->m_parentParser);
8018
0
  if (rootParser->m_entity_stats.debugLevel == 0u)
8019
0
    return;
8020
8021
8022
0
  fprintf(
8023
0
      stderr,
8024
0
      "expat: Entities(%p): Count %9u, depth %2u/%2u %*s%s%s; %s length %d (xmlparse.c:%d)\n",
8025
0
      (void *)rootParser, rootParser->m_entity_stats.countEverOpened,
8026
0
      rootParser->m_entity_stats.currentDepth,
8027
0
      rootParser->m_entity_stats.maximumDepthSeen,
8028
0
      (rootParser->m_entity_stats.currentDepth - 1) * 2, "",
8029
0
      entity->is_param ? "%" : "&", entityName, action, entity->textLen,
8030
0
      sourceLine);
8031
0
}
8032
8033
static void
8034
0
entityTrackingOnOpen(XML_Parser originParser, ENTITY *entity, int sourceLine) {
8035
0
  const XML_Parser rootParser = getRootParserOf(originParser, NULL);
8036
0
  assert(! rootParser->m_parentParser);
8037
8038
0
  rootParser->m_entity_stats.countEverOpened++;
8039
0
  rootParser->m_entity_stats.currentDepth++;
8040
0
  if (rootParser->m_entity_stats.currentDepth
8041
0
      > rootParser->m_entity_stats.maximumDepthSeen) {
8042
0
    rootParser->m_entity_stats.maximumDepthSeen++;
8043
0
  }
8044
8045
0
  entityTrackingReportStats(rootParser, entity, "OPEN ", sourceLine);
8046
0
}
8047
8048
static void
8049
0
entityTrackingOnClose(XML_Parser originParser, ENTITY *entity, int sourceLine) {
8050
0
  const XML_Parser rootParser = getRootParserOf(originParser, NULL);
8051
0
  assert(! rootParser->m_parentParser);
8052
8053
0
  entityTrackingReportStats(rootParser, entity, "CLOSE", sourceLine);
8054
0
  rootParser->m_entity_stats.currentDepth--;
8055
0
}
8056
8057
static XML_Parser
8058
33.3k
getRootParserOf(XML_Parser parser, unsigned int *outLevelDiff) {
8059
33.3k
  XML_Parser rootParser = parser;
8060
33.3k
  unsigned int stepsTakenUpwards = 0;
8061
33.3k
  while (rootParser->m_parentParser) {
8062
0
    rootParser = rootParser->m_parentParser;
8063
0
    stepsTakenUpwards++;
8064
0
  }
8065
33.3k
  assert(! rootParser->m_parentParser);
8066
33.3k
  if (outLevelDiff != NULL) {
8067
33.3k
    *outLevelDiff = stepsTakenUpwards;
8068
33.3k
  }
8069
33.3k
  return rootParser;
8070
33.3k
}
8071
8072
const char *
8073
0
unsignedCharToPrintable(unsigned char c) {
8074
0
  switch (c) {
8075
0
  case 0:
8076
0
    return "\\0";
8077
0
  case 1:
8078
0
    return "\\x1";
8079
0
  case 2:
8080
0
    return "\\x2";
8081
0
  case 3:
8082
0
    return "\\x3";
8083
0
  case 4:
8084
0
    return "\\x4";
8085
0
  case 5:
8086
0
    return "\\x5";
8087
0
  case 6:
8088
0
    return "\\x6";
8089
0
  case 7:
8090
0
    return "\\x7";
8091
0
  case 8:
8092
0
    return "\\x8";
8093
0
  case 9:
8094
0
    return "\\t";
8095
0
  case 10:
8096
0
    return "\\n";
8097
0
  case 11:
8098
0
    return "\\xB";
8099
0
  case 12:
8100
0
    return "\\xC";
8101
0
  case 13:
8102
0
    return "\\r";
8103
0
  case 14:
8104
0
    return "\\xE";
8105
0
  case 15:
8106
0
    return "\\xF";
8107
0
  case 16:
8108
0
    return "\\x10";
8109
0
  case 17:
8110
0
    return "\\x11";
8111
0
  case 18:
8112
0
    return "\\x12";
8113
0
  case 19:
8114
0
    return "\\x13";
8115
0
  case 20:
8116
0
    return "\\x14";
8117
0
  case 21:
8118
0
    return "\\x15";
8119
0
  case 22:
8120
0
    return "\\x16";
8121
0
  case 23:
8122
0
    return "\\x17";
8123
0
  case 24:
8124
0
    return "\\x18";
8125
0
  case 25:
8126
0
    return "\\x19";
8127
0
  case 26:
8128
0
    return "\\x1A";
8129
0
  case 27:
8130
0
    return "\\x1B";
8131
0
  case 28:
8132
0
    return "\\x1C";
8133
0
  case 29:
8134
0
    return "\\x1D";
8135
0
  case 30:
8136
0
    return "\\x1E";
8137
0
  case 31:
8138
0
    return "\\x1F";
8139
0
  case 32:
8140
0
    return " ";
8141
0
  case 33:
8142
0
    return "!";
8143
0
  case 34:
8144
0
    return "\\\"";
8145
0
  case 35:
8146
0
    return "#";
8147
0
  case 36:
8148
0
    return "$";
8149
0
  case 37:
8150
0
    return "%";
8151
0
  case 38:
8152
0
    return "&";
8153
0
  case 39:
8154
0
    return "'";
8155
0
  case 40:
8156
0
    return "(";
8157
0
  case 41:
8158
0
    return ")";
8159
0
  case 42:
8160
0
    return "*";
8161
0
  case 43:
8162
0
    return "+";
8163
0
  case 44:
8164
0
    return ",";
8165
0
  case 45:
8166
0
    return "-";
8167
0
  case 46:
8168
0
    return ".";
8169
0
  case 47:
8170
0
    return "/";
8171
0
  case 48:
8172
0
    return "0";
8173
0
  case 49:
8174
0
    return "1";
8175
0
  case 50:
8176
0
    return "2";
8177
0
  case 51:
8178
0
    return "3";
8179
0
  case 52:
8180
0
    return "4";
8181
0
  case 53:
8182
0
    return "5";
8183
0
  case 54:
8184
0
    return "6";
8185
0
  case 55:
8186
0
    return "7";
8187
0
  case 56:
8188
0
    return "8";
8189
0
  case 57:
8190
0
    return "9";
8191
0
  case 58:
8192
0
    return ":";
8193
0
  case 59:
8194
0
    return ";";
8195
0
  case 60:
8196
0
    return "<";
8197
0
  case 61:
8198
0
    return "=";
8199
0
  case 62:
8200
0
    return ">";
8201
0
  case 63:
8202
0
    return "?";
8203
0
  case 64:
8204
0
    return "@";
8205
0
  case 65:
8206
0
    return "A";
8207
0
  case 66:
8208
0
    return "B";
8209
0
  case 67:
8210
0
    return "C";
8211
0
  case 68:
8212
0
    return "D";
8213
0
  case 69:
8214
0
    return "E";
8215
0
  case 70:
8216
0
    return "F";
8217
0
  case 71:
8218
0
    return "G";
8219
0
  case 72:
8220
0
    return "H";
8221
0
  case 73:
8222
0
    return "I";
8223
0
  case 74:
8224
0
    return "J";
8225
0
  case 75:
8226
0
    return "K";
8227
0
  case 76:
8228
0
    return "L";
8229
0
  case 77:
8230
0
    return "M";
8231
0
  case 78:
8232
0
    return "N";
8233
0
  case 79:
8234
0
    return "O";
8235
0
  case 80:
8236
0
    return "P";
8237
0
  case 81:
8238
0
    return "Q";
8239
0
  case 82:
8240
0
    return "R";
8241
0
  case 83:
8242
0
    return "S";
8243
0
  case 84:
8244
0
    return "T";
8245
0
  case 85:
8246
0
    return "U";
8247
0
  case 86:
8248
0
    return "V";
8249
0
  case 87:
8250
0
    return "W";
8251
0
  case 88:
8252
0
    return "X";
8253
0
  case 89:
8254
0
    return "Y";
8255
0
  case 90:
8256
0
    return "Z";
8257
0
  case 91:
8258
0
    return "[";
8259
0
  case 92:
8260
0
    return "\\\\";
8261
0
  case 93:
8262
0
    return "]";
8263
0
  case 94:
8264
0
    return "^";
8265
0
  case 95:
8266
0
    return "_";
8267
0
  case 96:
8268
0
    return "`";
8269
0
  case 97:
8270
0
    return "a";
8271
0
  case 98:
8272
0
    return "b";
8273
0
  case 99:
8274
0
    return "c";
8275
0
  case 100:
8276
0
    return "d";
8277
0
  case 101:
8278
0
    return "e";
8279
0
  case 102:
8280
0
    return "f";
8281
0
  case 103:
8282
0
    return "g";
8283
0
  case 104:
8284
0
    return "h";
8285
0
  case 105:
8286
0
    return "i";
8287
0
  case 106:
8288
0
    return "j";
8289
0
  case 107:
8290
0
    return "k";
8291
0
  case 108:
8292
0
    return "l";
8293
0
  case 109:
8294
0
    return "m";
8295
0
  case 110:
8296
0
    return "n";
8297
0
  case 111:
8298
0
    return "o";
8299
0
  case 112:
8300
0
    return "p";
8301
0
  case 113:
8302
0
    return "q";
8303
0
  case 114:
8304
0
    return "r";
8305
0
  case 115:
8306
0
    return "s";
8307
0
  case 116:
8308
0
    return "t";
8309
0
  case 117:
8310
0
    return "u";
8311
0
  case 118:
8312
0
    return "v";
8313
0
  case 119:
8314
0
    return "w";
8315
0
  case 120:
8316
0
    return "x";
8317
0
  case 121:
8318
0
    return "y";
8319
0
  case 122:
8320
0
    return "z";
8321
0
  case 123:
8322
0
    return "{";
8323
0
  case 124:
8324
0
    return "|";
8325
0
  case 125:
8326
0
    return "}";
8327
0
  case 126:
8328
0
    return "~";
8329
0
  case 127:
8330
0
    return "\\x7F";
8331
0
  case 128:
8332
0
    return "\\x80";
8333
0
  case 129:
8334
0
    return "\\x81";
8335
0
  case 130:
8336
0
    return "\\x82";
8337
0
  case 131:
8338
0
    return "\\x83";
8339
0
  case 132:
8340
0
    return "\\x84";
8341
0
  case 133:
8342
0
    return "\\x85";
8343
0
  case 134:
8344
0
    return "\\x86";
8345
0
  case 135:
8346
0
    return "\\x87";
8347
0
  case 136:
8348
0
    return "\\x88";
8349
0
  case 137:
8350
0
    return "\\x89";
8351
0
  case 138:
8352
0
    return "\\x8A";
8353
0
  case 139:
8354
0
    return "\\x8B";
8355
0
  case 140:
8356
0
    return "\\x8C";
8357
0
  case 141:
8358
0
    return "\\x8D";
8359
0
  case 142:
8360
0
    return "\\x8E";
8361
0
  case 143:
8362
0
    return "\\x8F";
8363
0
  case 144:
8364
0
    return "\\x90";
8365
0
  case 145:
8366
0
    return "\\x91";
8367
0
  case 146:
8368
0
    return "\\x92";
8369
0
  case 147:
8370
0
    return "\\x93";
8371
0
  case 148:
8372
0
    return "\\x94";
8373
0
  case 149:
8374
0
    return "\\x95";
8375
0
  case 150:
8376
0
    return "\\x96";
8377
0
  case 151:
8378
0
    return "\\x97";
8379
0
  case 152:
8380
0
    return "\\x98";
8381
0
  case 153:
8382
0
    return "\\x99";
8383
0
  case 154:
8384
0
    return "\\x9A";
8385
0
  case 155:
8386
0
    return "\\x9B";
8387
0
  case 156:
8388
0
    return "\\x9C";
8389
0
  case 157:
8390
0
    return "\\x9D";
8391
0
  case 158:
8392
0
    return "\\x9E";
8393
0
  case 159:
8394
0
    return "\\x9F";
8395
0
  case 160:
8396
0
    return "\\xA0";
8397
0
  case 161:
8398
0
    return "\\xA1";
8399
0
  case 162:
8400
0
    return "\\xA2";
8401
0
  case 163:
8402
0
    return "\\xA3";
8403
0
  case 164:
8404
0
    return "\\xA4";
8405
0
  case 165:
8406
0
    return "\\xA5";
8407
0
  case 166:
8408
0
    return "\\xA6";
8409
0
  case 167:
8410
0
    return "\\xA7";
8411
0
  case 168:
8412
0
    return "\\xA8";
8413
0
  case 169:
8414
0
    return "\\xA9";
8415
0
  case 170:
8416
0
    return "\\xAA";
8417
0
  case 171:
8418
0
    return "\\xAB";
8419
0
  case 172:
8420
0
    return "\\xAC";
8421
0
  case 173:
8422
0
    return "\\xAD";
8423
0
  case 174:
8424
0
    return "\\xAE";
8425
0
  case 175:
8426
0
    return "\\xAF";
8427
0
  case 176:
8428
0
    return "\\xB0";
8429
0
  case 177:
8430
0
    return "\\xB1";
8431
0
  case 178:
8432
0
    return "\\xB2";
8433
0
  case 179:
8434
0
    return "\\xB3";
8435
0
  case 180:
8436
0
    return "\\xB4";
8437
0
  case 181:
8438
0
    return "\\xB5";
8439
0
  case 182:
8440
0
    return "\\xB6";
8441
0
  case 183:
8442
0
    return "\\xB7";
8443
0
  case 184:
8444
0
    return "\\xB8";
8445
0
  case 185:
8446
0
    return "\\xB9";
8447
0
  case 186:
8448
0
    return "\\xBA";
8449
0
  case 187:
8450
0
    return "\\xBB";
8451
0
  case 188:
8452
0
    return "\\xBC";
8453
0
  case 189:
8454
0
    return "\\xBD";
8455
0
  case 190:
8456
0
    return "\\xBE";
8457
0
  case 191:
8458
0
    return "\\xBF";
8459
0
  case 192:
8460
0
    return "\\xC0";
8461
0
  case 193:
8462
0
    return "\\xC1";
8463
0
  case 194:
8464
0
    return "\\xC2";
8465
0
  case 195:
8466
0
    return "\\xC3";
8467
0
  case 196:
8468
0
    return "\\xC4";
8469
0
  case 197:
8470
0
    return "\\xC5";
8471
0
  case 198:
8472
0
    return "\\xC6";
8473
0
  case 199:
8474
0
    return "\\xC7";
8475
0
  case 200:
8476
0
    return "\\xC8";
8477
0
  case 201:
8478
0
    return "\\xC9";
8479
0
  case 202:
8480
0
    return "\\xCA";
8481
0
  case 203:
8482
0
    return "\\xCB";
8483
0
  case 204:
8484
0
    return "\\xCC";
8485
0
  case 205:
8486
0
    return "\\xCD";
8487
0
  case 206:
8488
0
    return "\\xCE";
8489
0
  case 207:
8490
0
    return "\\xCF";
8491
0
  case 208:
8492
0
    return "\\xD0";
8493
0
  case 209:
8494
0
    return "\\xD1";
8495
0
  case 210:
8496
0
    return "\\xD2";
8497
0
  case 211:
8498
0
    return "\\xD3";
8499
0
  case 212:
8500
0
    return "\\xD4";
8501
0
  case 213:
8502
0
    return "\\xD5";
8503
0
  case 214:
8504
0
    return "\\xD6";
8505
0
  case 215:
8506
0
    return "\\xD7";
8507
0
  case 216:
8508
0
    return "\\xD8";
8509
0
  case 217:
8510
0
    return "\\xD9";
8511
0
  case 218:
8512
0
    return "\\xDA";
8513
0
  case 219:
8514
0
    return "\\xDB";
8515
0
  case 220:
8516
0
    return "\\xDC";
8517
0
  case 221:
8518
0
    return "\\xDD";
8519
0
  case 222:
8520
0
    return "\\xDE";
8521
0
  case 223:
8522
0
    return "\\xDF";
8523
0
  case 224:
8524
0
    return "\\xE0";
8525
0
  case 225:
8526
0
    return "\\xE1";
8527
0
  case 226:
8528
0
    return "\\xE2";
8529
0
  case 227:
8530
0
    return "\\xE3";
8531
0
  case 228:
8532
0
    return "\\xE4";
8533
0
  case 229:
8534
0
    return "\\xE5";
8535
0
  case 230:
8536
0
    return "\\xE6";
8537
0
  case 231:
8538
0
    return "\\xE7";
8539
0
  case 232:
8540
0
    return "\\xE8";
8541
0
  case 233:
8542
0
    return "\\xE9";
8543
0
  case 234:
8544
0
    return "\\xEA";
8545
0
  case 235:
8546
0
    return "\\xEB";
8547
0
  case 236:
8548
0
    return "\\xEC";
8549
0
  case 237:
8550
0
    return "\\xED";
8551
0
  case 238:
8552
0
    return "\\xEE";
8553
0
  case 239:
8554
0
    return "\\xEF";
8555
0
  case 240:
8556
0
    return "\\xF0";
8557
0
  case 241:
8558
0
    return "\\xF1";
8559
0
  case 242:
8560
0
    return "\\xF2";
8561
0
  case 243:
8562
0
    return "\\xF3";
8563
0
  case 244:
8564
0
    return "\\xF4";
8565
0
  case 245:
8566
0
    return "\\xF5";
8567
0
  case 246:
8568
0
    return "\\xF6";
8569
0
  case 247:
8570
0
    return "\\xF7";
8571
0
  case 248:
8572
0
    return "\\xF8";
8573
0
  case 249:
8574
0
    return "\\xF9";
8575
0
  case 250:
8576
0
    return "\\xFA";
8577
0
  case 251:
8578
0
    return "\\xFB";
8579
0
  case 252:
8580
0
    return "\\xFC";
8581
0
  case 253:
8582
0
    return "\\xFD";
8583
0
  case 254:
8584
0
    return "\\xFE";
8585
0
  case 255:
8586
0
    return "\\xFF";
8587
0
  default:
8588
0
    assert(0); /* never gets here */
8589
0
    return "dead code";
8590
0
  }
8591
0
  assert(0); /* never gets here */
8592
0
}
8593
8594
#endif /* XML_GE == 1 */
8595
8596
static unsigned long
8597
267
getDebugLevel(const char *variableName, unsigned long defaultDebugLevel) {
8598
267
  const char *const valueOrNull = getenv(variableName);
8599
267
  const char *const value = valueOrNull;
8600
267
  char *afterValue = NULL;
8601
267
  unsigned long debugLevel;
8602
267
  if (valueOrNull == NULL) {
8603
267
    return defaultDebugLevel;
8604
267
  }
8605
8606
267
  errno = 0;
8607
0
  afterValue = NULL;
8608
0
  debugLevel = strtoul(value, &afterValue, 10);
8609
0
  if ((errno != 0) || (afterValue == value) || (afterValue[0] != '\0')) {
8610
0
    errno = 0;
8611
0
    return defaultDebugLevel;
8612
0
  }
8613
8614
0
  return debugLevel;
8615
0
}