Coverage Report

Created: 2024-04-26 11:09

/src/libxml2/SAX2.c
Line
Count
Source (jump to first uncovered line)
1
/*
2
 * SAX2.c : Default SAX2 handler to build a tree.
3
 *
4
 * See Copyright for the status of this software.
5
 *
6
 * Daniel Veillard <daniel@veillard.com>
7
 */
8
9
10
#define IN_LIBXML
11
#include "libxml.h"
12
#include <stdlib.h>
13
#include <string.h>
14
#include <limits.h>
15
#include <stddef.h>
16
#include <libxml/xmlmemory.h>
17
#include <libxml/tree.h>
18
#include <libxml/parser.h>
19
#include <libxml/parserInternals.h>
20
#include <libxml/valid.h>
21
#include <libxml/entities.h>
22
#include <libxml/xmlerror.h>
23
#include <libxml/debugXML.h>
24
#include <libxml/xmlIO.h>
25
#include <libxml/SAX.h>
26
#include <libxml/uri.h>
27
#include <libxml/valid.h>
28
#include <libxml/HTMLtree.h>
29
#include <libxml/globals.h>
30
31
#include "private/error.h"
32
#include "private/parser.h"
33
#include "private/tree.h"
34
35
/* #define DEBUG_SAX2 */
36
/* #define DEBUG_SAX2_TREE */
37
38
/**
 * TODO:
 *
 * macro to flag unimplemented blocks
 *
 * Expands to an xmlGenericError() call on xmlGenericErrorContext that
 * prints "Unimplemented block at <file>:<line>" using __FILE__ and
 * __LINE__ of the use site.
 *
 * NOTE(review): the expansion already ends with a semicolon, so writing
 * "TODO;" produces an additional empty statement. Use sites are not
 * visible here, so the definition is deliberately left unchanged.
 *
 * XML_CATALOG_PREFER user env to select between system/public preferred
 * option. C.f. Richard Tobin <richard@cogsci.ed.ac.uk>
 *> Just FYI, I am using an environment variable XML_CATALOG_PREFER with
 *> values "system" and "public".  I have made the default be "system" to
 *> match yours.
 *
 * NOTE(review): the XML_CATALOG_PREFER remark does not relate to anything
 * in the macro below — presumably a leftover note; confirm before removal.
 */
#define TODO                \
    xmlGenericError(xmlGenericErrorContext,       \
      "Unimplemented block at %s:%d\n",       \
            __FILE__, __LINE__);
52
53
/*
54
 * xmlSAX2ErrMemory:
55
 * @ctxt:  an XML validation parser context
56
 * @msg:   a string to accompany the error message
57
 */
58
static void LIBXML_ATTR_FORMAT(2,0)
59
4
xmlSAX2ErrMemory(xmlParserCtxtPtr ctxt, const char *msg) {
60
4
    xmlStructuredErrorFunc schannel = NULL;
61
4
    const char *str1 = "out of memory\n";
62
63
4
    if (ctxt != NULL) {
64
4
  ctxt->errNo = XML_ERR_NO_MEMORY;
65
4
  if ((ctxt->sax != NULL) && (ctxt->sax->initialized == XML_SAX2_MAGIC))
66
4
      schannel = ctxt->sax->serror;
67
4
  __xmlRaiseError(schannel,
68
4
      ctxt->vctxt.error, ctxt->vctxt.userData,
69
4
      ctxt, NULL, XML_FROM_PARSER, XML_ERR_NO_MEMORY,
70
4
      XML_ERR_ERROR, NULL, 0, (const char *) str1,
71
4
      NULL, NULL, 0, 0,
72
4
      msg, (const char *) str1, NULL);
73
4
  ctxt->errNo = XML_ERR_NO_MEMORY;
74
4
  ctxt->instate = XML_PARSER_EOF;
75
4
  ctxt->disableSAX = 1;
76
4
    } else {
77
0
  __xmlRaiseError(schannel,
78
0
      NULL, NULL,
79
0
      ctxt, NULL, XML_FROM_PARSER, XML_ERR_NO_MEMORY,
80
0
      XML_ERR_ERROR, NULL, 0, (const char *) str1,
81
0
      NULL, NULL, 0, 0,
82
0
      msg, (const char *) str1, NULL);
83
0
    }
84
4
}
85
86
/**
87
 * xmlValidError:
88
 * @ctxt:  an XML validation parser context
89
 * @error:  the error number
90
 * @msg:  the error message
91
 * @str1:  extra data
92
 * @str2:  extra data
93
 *
94
 * Handle a validation error
95
 */
96
static void LIBXML_ATTR_FORMAT(3,0)
97
xmlErrValid(xmlParserCtxtPtr ctxt, xmlParserErrors error,
98
            const char *msg, const char *str1, const char *str2)
99
2.64M
{
100
2.64M
    xmlStructuredErrorFunc schannel = NULL;
101
102
2.64M
    if ((ctxt != NULL) && (ctxt->disableSAX != 0) &&
103
2.64M
        (ctxt->instate == XML_PARSER_EOF))
104
0
  return;
105
2.64M
    if (ctxt != NULL) {
106
2.64M
  ctxt->errNo = error;
107
2.64M
  if ((ctxt->sax != NULL) && (ctxt->sax->initialized == XML_SAX2_MAGIC))
108
1.45M
      schannel = ctxt->sax->serror;
109
2.64M
  __xmlRaiseError(schannel,
110
2.64M
      ctxt->vctxt.error, ctxt->vctxt.userData,
111
2.64M
      ctxt, NULL, XML_FROM_DTD, error,
112
2.64M
      XML_ERR_ERROR, NULL, 0, (const char *) str1,
113
2.64M
      (const char *) str2, NULL, 0, 0,
114
2.64M
      msg, (const char *) str1, (const char *) str2);
115
2.64M
  ctxt->valid = 0;
116
2.64M
    } else {
117
0
  __xmlRaiseError(schannel,
118
0
      NULL, NULL,
119
0
      ctxt, NULL, XML_FROM_DTD, error,
120
0
      XML_ERR_ERROR, NULL, 0, (const char *) str1,
121
0
      (const char *) str2, NULL, 0, 0,
122
0
      msg, (const char *) str1, (const char *) str2);
123
0
    }
124
2.64M
}
125
126
/**
127
 * xmlFatalErrMsg:
128
 * @ctxt:  an XML parser context
129
 * @error:  the error number
130
 * @msg:  the error message
131
 * @str1:  an error string
132
 * @str2:  an error string
133
 *
134
 * Handle a fatal parser error, i.e. violating Well-Formedness constraints
135
 */
136
static void LIBXML_ATTR_FORMAT(3,0)
137
xmlFatalErrMsg(xmlParserCtxtPtr ctxt, xmlParserErrors error,
138
               const char *msg, const xmlChar *str1, const xmlChar *str2)
139
4.03k
{
140
4.03k
    if ((ctxt != NULL) && (ctxt->disableSAX != 0) &&
141
4.03k
        (ctxt->instate == XML_PARSER_EOF))
142
0
  return;
143
4.03k
    if (ctxt != NULL)
144
4.03k
  ctxt->errNo = error;
145
4.03k
    __xmlRaiseError(NULL, NULL, NULL, ctxt, NULL, XML_FROM_PARSER, error,
146
4.03k
                    XML_ERR_FATAL, NULL, 0,
147
4.03k
        (const char *) str1, (const char *) str2,
148
4.03k
        NULL, 0, 0, msg, str1, str2);
149
4.03k
    if (ctxt != NULL) {
150
4.03k
  ctxt->wellFormed = 0;
151
4.03k
  ctxt->valid = 0;
152
4.03k
  if (ctxt->recovery == 0)
153
783
      ctxt->disableSAX = 1;
154
4.03k
    }
155
4.03k
}
156
157
/**
158
 * xmlWarnMsg:
159
 * @ctxt:  an XML parser context
160
 * @error:  the error number
161
 * @msg:  the error message
162
 * @str1:  an error string
163
 * @str2:  an error string
164
 *
165
 * Handle a parser warning
166
 */
167
static void LIBXML_ATTR_FORMAT(3,0)
168
xmlWarnMsg(xmlParserCtxtPtr ctxt, xmlParserErrors error,
169
               const char *msg, const xmlChar *str1)
170
83.1k
{
171
83.1k
    if ((ctxt != NULL) && (ctxt->disableSAX != 0) &&
172
83.1k
        (ctxt->instate == XML_PARSER_EOF))
173
0
  return;
174
83.1k
    if (ctxt != NULL)
175
83.1k
  ctxt->errNo = error;
176
83.1k
    __xmlRaiseError(NULL, NULL, NULL, ctxt, NULL, XML_FROM_PARSER, error,
177
83.1k
                    XML_ERR_WARNING, NULL, 0,
178
83.1k
        (const char *) str1, NULL,
179
83.1k
        NULL, 0, 0, msg, str1);
180
83.1k
}
181
182
/**
183
 * xmlNsWarnMsg:
184
 * @ctxt:  an XML parser context
185
 * @error:  the error number
186
 * @msg:  the error message
187
 * @str1:  an error string
188
 *
189
 * Handle a namespace warning
190
 */
191
static void LIBXML_ATTR_FORMAT(3,0)
192
xmlNsWarnMsg(xmlParserCtxtPtr ctxt, xmlParserErrors error,
193
             const char *msg, const xmlChar *str1, const xmlChar *str2)
194
15.7M
{
195
15.7M
    if ((ctxt != NULL) && (ctxt->disableSAX != 0) &&
196
15.7M
        (ctxt->instate == XML_PARSER_EOF))
197
0
  return;
198
15.7M
    if (ctxt != NULL)
199
15.7M
  ctxt->errNo = error;
200
15.7M
    __xmlRaiseError(NULL, NULL, NULL, ctxt, NULL, XML_FROM_NAMESPACE, error,
201
15.7M
                    XML_ERR_WARNING, NULL, 0,
202
15.7M
        (const char *) str1, (const char *) str2,
203
15.7M
        NULL, 0, 0, msg, str1, str2);
204
15.7M
}
205
206
/**
207
 * xmlSAX2GetPublicId:
208
 * @ctx: the user data (XML parser context)
209
 *
210
 * Provides the public ID e.g. "-//SGMLSOURCE//DTD DEMO//EN"
211
 *
212
 * Returns a xmlChar *
213
 */
214
const xmlChar *
215
xmlSAX2GetPublicId(void *ctx ATTRIBUTE_UNUSED)
216
0
{
217
    /* xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx; */
218
0
    return(NULL);
219
0
}
220
221
/**
222
 * xmlSAX2GetSystemId:
223
 * @ctx: the user data (XML parser context)
224
 *
225
 * Provides the system ID, basically URL or filename e.g.
226
 * http://www.sgmlsource.com/dtds/memo.dtd
227
 *
228
 * Returns a xmlChar *
229
 */
230
const xmlChar *
231
xmlSAX2GetSystemId(void *ctx)
232
0
{
233
0
    xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
234
0
    if ((ctx == NULL) || (ctxt->input == NULL)) return(NULL);
235
0
    return((const xmlChar *) ctxt->input->filename);
236
0
}
237
238
/**
239
 * xmlSAX2GetLineNumber:
240
 * @ctx: the user data (XML parser context)
241
 *
242
 * Provide the line number of the current parsing point.
243
 *
244
 * Returns an int
245
 */
246
int
247
xmlSAX2GetLineNumber(void *ctx)
248
0
{
249
0
    xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
250
0
    if ((ctx == NULL) || (ctxt->input == NULL)) return(0);
251
0
    return(ctxt->input->line);
252
0
}
253
254
/**
255
 * xmlSAX2GetColumnNumber:
256
 * @ctx: the user data (XML parser context)
257
 *
258
 * Provide the column number of the current parsing point.
259
 *
260
 * Returns an int
261
 */
262
int
263
xmlSAX2GetColumnNumber(void *ctx)
264
0
{
265
0
    xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
266
0
    if ((ctx == NULL) || (ctxt->input == NULL)) return(0);
267
0
    return(ctxt->input->col);
268
0
}
269
270
/**
271
 * xmlSAX2IsStandalone:
272
 * @ctx: the user data (XML parser context)
273
 *
274
 * Is this document tagged standalone ?
275
 *
276
 * Returns 1 if true
277
 */
278
int
279
xmlSAX2IsStandalone(void *ctx)
280
0
{
281
0
    xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
282
0
    if ((ctx == NULL) || (ctxt->myDoc == NULL)) return(0);
283
0
    return(ctxt->myDoc->standalone == 1);
284
0
}
285
286
/**
287
 * xmlSAX2HasInternalSubset:
288
 * @ctx: the user data (XML parser context)
289
 *
290
 * Does this document has an internal subset
291
 *
292
 * Returns 1 if true
293
 */
294
int
295
xmlSAX2HasInternalSubset(void *ctx)
296
0
{
297
0
    xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
298
0
    if ((ctxt == NULL) || (ctxt->myDoc == NULL)) return(0);
299
0
    return(ctxt->myDoc->intSubset != NULL);
300
0
}
301
302
/**
303
 * xmlSAX2HasExternalSubset:
304
 * @ctx: the user data (XML parser context)
305
 *
306
 * Does this document has an external subset
307
 *
308
 * Returns 1 if true
309
 */
310
int
311
xmlSAX2HasExternalSubset(void *ctx)
312
0
{
313
0
    xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
314
0
    if ((ctxt == NULL) || (ctxt->myDoc == NULL)) return(0);
315
0
    return(ctxt->myDoc->extSubset != NULL);
316
0
}
317
318
/**
319
 * xmlSAX2InternalSubset:
320
 * @ctx:  the user data (XML parser context)
321
 * @name:  the root element name
322
 * @ExternalID:  the external ID
323
 * @SystemID:  the SYSTEM ID (e.g. filename or URL)
324
 *
325
 * Callback on internal subset declaration.
326
 */
327
void
328
xmlSAX2InternalSubset(void *ctx, const xmlChar *name,
329
         const xmlChar *ExternalID, const xmlChar *SystemID)
330
5.16M
{
331
5.16M
    xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
332
5.16M
    xmlDtdPtr dtd;
333
5.16M
    if (ctx == NULL) return;
334
#ifdef DEBUG_SAX
335
    xmlGenericError(xmlGenericErrorContext,
336
      "SAX.xmlSAX2InternalSubset(%s, %s, %s)\n",
337
            name, ExternalID, SystemID);
338
#endif
339
340
5.16M
    if (ctxt->myDoc == NULL)
341
0
  return;
342
5.16M
    dtd = xmlGetIntSubset(ctxt->myDoc);
343
5.16M
    if (dtd != NULL) {
344
0
  if (ctxt->html)
345
0
      return;
346
0
  xmlUnlinkNode((xmlNodePtr) dtd);
347
0
  xmlFreeDtd(dtd);
348
0
  ctxt->myDoc->intSubset = NULL;
349
0
    }
350
5.16M
    ctxt->myDoc->intSubset =
351
5.16M
  xmlCreateIntSubset(ctxt->myDoc, name, ExternalID, SystemID);
352
5.16M
    if (ctxt->myDoc->intSubset == NULL)
353
0
        xmlSAX2ErrMemory(ctxt, "xmlSAX2InternalSubset");
354
5.16M
}
355
356
/**
357
 * xmlSAX2ExternalSubset:
358
 * @ctx: the user data (XML parser context)
359
 * @name:  the root element name
360
 * @ExternalID:  the external ID
361
 * @SystemID:  the SYSTEM ID (e.g. filename or URL)
362
 *
363
 * Callback on external subset declaration.
364
 */
365
void
366
xmlSAX2ExternalSubset(void *ctx, const xmlChar *name,
367
         const xmlChar *ExternalID, const xmlChar *SystemID)
368
3.10M
{
369
3.10M
    xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
370
3.10M
    if (ctx == NULL) return;
371
#ifdef DEBUG_SAX
372
    xmlGenericError(xmlGenericErrorContext,
373
      "SAX.xmlSAX2ExternalSubset(%s, %s, %s)\n",
374
            name, ExternalID, SystemID);
375
#endif
376
3.10M
    if (((ExternalID != NULL) || (SystemID != NULL)) &&
377
3.10M
        (((ctxt->validate) || (ctxt->loadsubset != 0)) &&
378
1.52M
   (ctxt->wellFormed && ctxt->myDoc))) {
379
  /*
380
   * Try to fetch and parse the external subset.
381
   */
382
1.28M
  xmlParserInputPtr oldinput;
383
1.28M
  int oldinputNr;
384
1.28M
  int oldinputMax;
385
1.28M
  xmlParserInputPtr *oldinputTab;
386
1.28M
  xmlParserInputPtr input = NULL;
387
1.28M
  xmlCharEncoding enc;
388
1.28M
  int oldcharset;
389
1.28M
  const xmlChar *oldencoding;
390
1.28M
  int oldprogressive;
391
1.28M
        unsigned long consumed;
392
1.28M
        size_t buffered;
393
394
  /*
395
   * Ask the Entity resolver to load the damn thing
396
   */
397
1.28M
  if ((ctxt->sax != NULL) && (ctxt->sax->resolveEntity != NULL))
398
1.28M
      input = ctxt->sax->resolveEntity(ctxt->userData, ExternalID,
399
1.28M
                                          SystemID);
400
1.28M
  if (input == NULL) {
401
698k
      return;
402
698k
  }
403
404
587k
  xmlNewDtd(ctxt->myDoc, name, ExternalID, SystemID);
405
406
  /*
407
   * make sure we won't destroy the main document context
408
   */
409
587k
  oldinput = ctxt->input;
410
587k
  oldinputNr = ctxt->inputNr;
411
587k
  oldinputMax = ctxt->inputMax;
412
587k
  oldinputTab = ctxt->inputTab;
413
587k
  oldcharset = ctxt->charset;
414
587k
  oldencoding = ctxt->encoding;
415
587k
        oldprogressive = ctxt->progressive;
416
587k
  ctxt->encoding = NULL;
417
587k
        ctxt->progressive = 0;
418
419
587k
  ctxt->inputTab = (xmlParserInputPtr *)
420
587k
                   xmlMalloc(5 * sizeof(xmlParserInputPtr));
421
587k
  if (ctxt->inputTab == NULL) {
422
0
      xmlSAX2ErrMemory(ctxt, "xmlSAX2ExternalSubset");
423
0
            xmlFreeInputStream(input);
424
0
      ctxt->input = oldinput;
425
0
      ctxt->inputNr = oldinputNr;
426
0
      ctxt->inputMax = oldinputMax;
427
0
      ctxt->inputTab = oldinputTab;
428
0
      ctxt->charset = oldcharset;
429
0
      ctxt->encoding = oldencoding;
430
0
            ctxt->progressive = oldprogressive;
431
0
      return;
432
0
  }
433
587k
  ctxt->inputNr = 0;
434
587k
  ctxt->inputMax = 5;
435
587k
  ctxt->input = NULL;
436
587k
  xmlPushInput(ctxt, input);
437
438
  /*
439
   * On the fly encoding conversion if needed
440
   */
441
587k
  if (ctxt->input->length >= 4) {
442
0
      enc = xmlDetectCharEncoding(ctxt->input->cur, 4);
443
0
      xmlSwitchEncoding(ctxt, enc);
444
0
  }
445
446
587k
  if (input->filename == NULL)
447
587k
      input->filename = (char *) xmlCanonicPath(SystemID);
448
587k
  input->line = 1;
449
587k
  input->col = 1;
450
587k
  input->base = ctxt->input->cur;
451
587k
  input->cur = ctxt->input->cur;
452
587k
  input->free = NULL;
453
454
  /*
455
   * let's parse that entity knowing it's an external subset.
456
   */
457
587k
  xmlParseExternalSubset(ctxt, ExternalID, SystemID);
458
459
        /*
460
   * Free up the external entities
461
   */
462
463
587k
  while (ctxt->inputNr > 1)
464
0
      xmlPopInput(ctxt);
465
466
587k
        consumed = ctxt->input->consumed;
467
587k
        buffered = ctxt->input->cur - ctxt->input->base;
468
587k
        if (buffered > ULONG_MAX - consumed)
469
0
            consumed = ULONG_MAX;
470
587k
        else
471
587k
            consumed += buffered;
472
587k
        if (consumed > ULONG_MAX - ctxt->sizeentities)
473
0
            ctxt->sizeentities = ULONG_MAX;
474
587k
        else
475
587k
            ctxt->sizeentities += consumed;
476
477
587k
  xmlFreeInputStream(ctxt->input);
478
587k
        xmlFree(ctxt->inputTab);
479
480
  /*
481
   * Restore the parsing context of the main entity
482
   */
483
587k
  ctxt->input = oldinput;
484
587k
  ctxt->inputNr = oldinputNr;
485
587k
  ctxt->inputMax = oldinputMax;
486
587k
  ctxt->inputTab = oldinputTab;
487
587k
  ctxt->charset = oldcharset;
488
587k
  if ((ctxt->encoding != NULL) &&
489
587k
      ((ctxt->dict == NULL) ||
490
24.1k
       (!xmlDictOwns(ctxt->dict, ctxt->encoding))))
491
24.1k
      xmlFree((xmlChar *) ctxt->encoding);
492
587k
  ctxt->encoding = oldencoding;
493
587k
        ctxt->progressive = oldprogressive;
494
  /* ctxt->wellFormed = oldwellFormed; */
495
587k
    }
496
3.10M
}
497
498
/**
499
 * xmlSAX2ResolveEntity:
500
 * @ctx: the user data (XML parser context)
501
 * @publicId: The public ID of the entity
502
 * @systemId: The system ID of the entity
503
 *
504
 * The entity loader, to control the loading of external entities,
505
 * the application can either:
506
 *    - override this xmlSAX2ResolveEntity() callback in the SAX block
507
 *    - or better use the xmlSetExternalEntityLoader() function to
508
 *      set up it's own entity resolution routine
509
 *
510
 * Returns the xmlParserInputPtr if inlined or NULL for DOM behaviour.
511
 */
512
xmlParserInputPtr
513
xmlSAX2ResolveEntity(void *ctx, const xmlChar *publicId, const xmlChar *systemId)
514
1.28M
{
515
1.28M
    xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
516
1.28M
    xmlParserInputPtr ret;
517
1.28M
    xmlChar *URI;
518
1.28M
    const char *base = NULL;
519
520
1.28M
    if (ctx == NULL) return(NULL);
521
1.28M
    if (ctxt->input != NULL)
522
1.28M
  base = ctxt->input->filename;
523
1.28M
    if (base == NULL)
524
428k
  base = ctxt->directory;
525
526
1.28M
    URI = xmlBuildURI(systemId, (const xmlChar *) base);
527
528
#ifdef DEBUG_SAX
529
    xmlGenericError(xmlGenericErrorContext,
530
      "SAX.xmlSAX2ResolveEntity(%s, %s)\n", publicId, systemId);
531
#endif
532
533
1.28M
    ret = xmlLoadExternalEntity((const char *) URI,
534
1.28M
        (const char *) publicId, ctxt);
535
1.28M
    if (URI != NULL)
536
1.27M
  xmlFree(URI);
537
1.28M
    return(ret);
538
1.28M
}
539
540
/**
541
 * xmlSAX2GetEntity:
542
 * @ctx: the user data (XML parser context)
543
 * @name: The entity name
544
 *
545
 * Get an entity by name
546
 *
547
 * Returns the xmlEntityPtr if found.
548
 */
549
xmlEntityPtr
550
xmlSAX2GetEntity(void *ctx, const xmlChar *name)
551
321M
{
552
321M
    xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
553
321M
    xmlEntityPtr ret = NULL;
554
555
321M
    if (ctx == NULL) return(NULL);
556
#ifdef DEBUG_SAX
557
    xmlGenericError(xmlGenericErrorContext,
558
      "SAX.xmlSAX2GetEntity(%s)\n", name);
559
#endif
560
561
321M
    if (ctxt->inSubset == 0) {
562
316M
  ret = xmlGetPredefinedEntity(name);
563
316M
  if (ret != NULL)
564
1.26M
      return(ret);
565
316M
    }
566
320M
    if ((ctxt->myDoc != NULL) && (ctxt->myDoc->standalone == 1)) {
567
313k
  if (ctxt->inSubset == 2) {
568
0
      ctxt->myDoc->standalone = 0;
569
0
      ret = xmlGetDocEntity(ctxt->myDoc, name);
570
0
      ctxt->myDoc->standalone = 1;
571
313k
  } else {
572
313k
      ret = xmlGetDocEntity(ctxt->myDoc, name);
573
313k
      if (ret == NULL) {
574
185k
    ctxt->myDoc->standalone = 0;
575
185k
    ret = xmlGetDocEntity(ctxt->myDoc, name);
576
185k
    if (ret != NULL) {
577
0
        xmlFatalErrMsg(ctxt, XML_ERR_NOT_STANDALONE,
578
0
   "Entity(%s) document marked standalone but requires external subset\n",
579
0
           name, NULL);
580
0
    }
581
185k
    ctxt->myDoc->standalone = 1;
582
185k
      }
583
313k
  }
584
320M
    } else {
585
320M
  ret = xmlGetDocEntity(ctxt->myDoc, name);
586
320M
    }
587
320M
    return(ret);
588
321M
}
589
590
/**
591
 * xmlSAX2GetParameterEntity:
592
 * @ctx: the user data (XML parser context)
593
 * @name: The entity name
594
 *
595
 * Get a parameter entity by name
596
 *
597
 * Returns the xmlEntityPtr if found.
598
 */
599
xmlEntityPtr
600
xmlSAX2GetParameterEntity(void *ctx, const xmlChar *name)
601
276M
{
602
276M
    xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
603
276M
    xmlEntityPtr ret;
604
605
276M
    if (ctx == NULL) return(NULL);
606
#ifdef DEBUG_SAX
607
    xmlGenericError(xmlGenericErrorContext,
608
      "SAX.xmlSAX2GetParameterEntity(%s)\n", name);
609
#endif
610
611
276M
    ret = xmlGetParameterEntity(ctxt->myDoc, name);
612
276M
    return(ret);
613
276M
}
614
615
616
/**
617
 * xmlSAX2EntityDecl:
618
 * @ctx: the user data (XML parser context)
619
 * @name:  the entity name
620
 * @type:  the entity type
621
 * @publicId: The public ID of the entity
622
 * @systemId: The system ID of the entity
623
 * @content: the entity value (without processing).
624
 *
625
 * An entity definition has been parsed
626
 */
627
void
628
xmlSAX2EntityDecl(void *ctx, const xmlChar *name, int type,
629
          const xmlChar *publicId, const xmlChar *systemId, xmlChar *content)
630
7.40M
{
631
7.40M
    xmlEntityPtr ent;
632
7.40M
    xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
633
634
7.40M
    if (ctx == NULL) return;
635
#ifdef DEBUG_SAX
636
    xmlGenericError(xmlGenericErrorContext,
637
      "SAX.xmlSAX2EntityDecl(%s, %d, %s, %s, %s)\n",
638
            name, type, publicId, systemId, content);
639
#endif
640
7.40M
    if (ctxt->inSubset == 1) {
641
6.02M
  ent = xmlAddDocEntity(ctxt->myDoc, name, type, publicId,
642
6.02M
                  systemId, content);
643
6.02M
  if ((ent == NULL) && (ctxt->pedantic))
644
83.1k
      xmlWarnMsg(ctxt, XML_WAR_ENTITY_REDEFINED,
645
83.1k
       "Entity(%s) already defined in the internal subset\n",
646
83.1k
                 name);
647
6.02M
  if ((ent != NULL) && (ent->URI == NULL) && (systemId != NULL)) {
648
1.36M
      xmlChar *URI;
649
1.36M
      const char *base = NULL;
650
651
1.36M
      if (ctxt->input != NULL)
652
1.36M
    base = ctxt->input->filename;
653
1.36M
      if (base == NULL)
654
444k
    base = ctxt->directory;
655
656
1.36M
      URI = xmlBuildURI(systemId, (const xmlChar *) base);
657
1.36M
      ent->URI = URI;
658
1.36M
  }
659
6.02M
    } else if (ctxt->inSubset == 2) {
660
1.37M
  ent = xmlAddDtdEntity(ctxt->myDoc, name, type, publicId,
661
1.37M
                  systemId, content);
662
1.37M
  if ((ent == NULL) && (ctxt->pedantic) &&
663
1.37M
      (ctxt->sax != NULL) && (ctxt->sax->warning != NULL))
664
3.21k
      ctxt->sax->warning(ctxt->userData,
665
3.21k
       "Entity(%s) already defined in the external subset\n", name);
666
1.37M
  if ((ent != NULL) && (ent->URI == NULL) && (systemId != NULL)) {
667
109k
      xmlChar *URI;
668
109k
      const char *base = NULL;
669
670
109k
      if (ctxt->input != NULL)
671
109k
    base = ctxt->input->filename;
672
109k
      if (base == NULL)
673
0
    base = ctxt->directory;
674
675
109k
      URI = xmlBuildURI(systemId, (const xmlChar *) base);
676
109k
      ent->URI = URI;
677
109k
  }
678
1.37M
    } else {
679
0
  xmlFatalErrMsg(ctxt, XML_ERR_ENTITY_PROCESSING,
680
0
                 "SAX.xmlSAX2EntityDecl(%s) called while not in subset\n",
681
0
           name, NULL);
682
0
    }
683
7.40M
}
684
685
/**
686
 * xmlSAX2AttributeDecl:
687
 * @ctx: the user data (XML parser context)
688
 * @elem:  the name of the element
689
 * @fullname:  the attribute name
690
 * @type:  the attribute type
691
 * @def:  the type of default value
692
 * @defaultValue: the attribute default value
693
 * @tree:  the tree of enumerated value set
694
 *
695
 * An attribute definition has been parsed
696
 */
697
void
698
xmlSAX2AttributeDecl(void *ctx, const xmlChar *elem, const xmlChar *fullname,
699
              int type, int def, const xmlChar *defaultValue,
700
        xmlEnumerationPtr tree)
701
9.34M
{
702
9.34M
    xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
703
9.34M
    xmlAttributePtr attr;
704
9.34M
    xmlChar *name = NULL, *prefix = NULL;
705
706
    /* Avoid unused variable warning if features are disabled. */
707
9.34M
    (void) attr;
708
709
9.34M
    if ((ctxt == NULL) || (ctxt->myDoc == NULL))
710
0
        return;
711
712
#ifdef DEBUG_SAX
713
    xmlGenericError(xmlGenericErrorContext,
714
      "SAX.xmlSAX2AttributeDecl(%s, %s, %d, %d, %s, ...)\n",
715
            elem, fullname, type, def, defaultValue);
716
#endif
717
9.34M
    if ((xmlStrEqual(fullname, BAD_CAST "xml:id")) &&
718
9.34M
        (type != XML_ATTRIBUTE_ID)) {
719
  /*
720
   * Raise the error but keep the validity flag
721
   */
722
5.11k
  int tmp = ctxt->valid;
723
5.11k
  xmlErrValid(ctxt, XML_DTD_XMLID_TYPE,
724
5.11k
        "xml:id : attribute type should be ID\n", NULL, NULL);
725
5.11k
  ctxt->valid = tmp;
726
5.11k
    }
727
    /* TODO: optimize name/prefix allocation */
728
9.34M
    name = xmlSplitQName(ctxt, fullname, &prefix);
729
9.34M
    ctxt->vctxt.valid = 1;
730
9.34M
    if (ctxt->inSubset == 1)
731
6.40M
  attr = xmlAddAttributeDecl(&ctxt->vctxt, ctxt->myDoc->intSubset, elem,
732
6.40M
         name, prefix, (xmlAttributeType) type,
733
6.40M
         (xmlAttributeDefault) def, defaultValue, tree);
734
2.94M
    else if (ctxt->inSubset == 2)
735
2.94M
  attr = xmlAddAttributeDecl(&ctxt->vctxt, ctxt->myDoc->extSubset, elem,
736
2.94M
     name, prefix, (xmlAttributeType) type,
737
2.94M
     (xmlAttributeDefault) def, defaultValue, tree);
738
0
    else {
739
0
        xmlFatalErrMsg(ctxt, XML_ERR_INTERNAL_ERROR,
740
0
       "SAX.xmlSAX2AttributeDecl(%s) called while not in subset\n",
741
0
                 name, NULL);
742
0
  xmlFree(name);
743
0
  xmlFreeEnumeration(tree);
744
0
  return;
745
0
    }
746
9.34M
#ifdef LIBXML_VALID_ENABLED
747
9.34M
    if (ctxt->vctxt.valid == 0)
748
941k
  ctxt->valid = 0;
749
9.34M
    if ((attr != NULL) && (ctxt->validate) && (ctxt->wellFormed) &&
750
9.34M
        (ctxt->myDoc->intSubset != NULL))
751
1.85M
  ctxt->valid &= xmlValidateAttributeDecl(&ctxt->vctxt, ctxt->myDoc,
752
1.85M
                                          attr);
753
9.34M
#endif /* LIBXML_VALID_ENABLED */
754
9.34M
    if (prefix != NULL)
755
1.06M
  xmlFree(prefix);
756
9.34M
    if (name != NULL)
757
9.34M
  xmlFree(name);
758
9.34M
}
759
760
/**
761
 * xmlSAX2ElementDecl:
762
 * @ctx: the user data (XML parser context)
763
 * @name:  the element name
764
 * @type:  the element type
765
 * @content: the element value tree
766
 *
767
 * An element definition has been parsed
768
 */
769
void
770
xmlSAX2ElementDecl(void *ctx, const xmlChar * name, int type,
771
            xmlElementContentPtr content)
772
5.92M
{
773
5.92M
    xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
774
5.92M
    xmlElementPtr elem = NULL;
775
776
    /* Avoid unused variable warning if features are disabled. */
777
5.92M
    (void) elem;
778
779
5.92M
    if ((ctxt == NULL) || (ctxt->myDoc == NULL))
780
0
        return;
781
782
#ifdef DEBUG_SAX
783
    xmlGenericError(xmlGenericErrorContext,
784
                    "SAX.xmlSAX2ElementDecl(%s, %d, ...)\n", name, type);
785
#endif
786
787
5.92M
    if (ctxt->inSubset == 1)
788
4.34M
        elem = xmlAddElementDecl(&ctxt->vctxt, ctxt->myDoc->intSubset,
789
4.34M
                                 name, (xmlElementTypeVal) type, content);
790
1.57M
    else if (ctxt->inSubset == 2)
791
1.57M
        elem = xmlAddElementDecl(&ctxt->vctxt, ctxt->myDoc->extSubset,
792
1.57M
                                 name, (xmlElementTypeVal) type, content);
793
0
    else {
794
0
        xmlFatalErrMsg(ctxt, XML_ERR_INTERNAL_ERROR,
795
0
       "SAX.xmlSAX2ElementDecl(%s) called while not in subset\n",
796
0
                 name, NULL);
797
0
        return;
798
0
    }
799
5.92M
#ifdef LIBXML_VALID_ENABLED
800
5.92M
    if (elem == NULL)
801
168k
        ctxt->valid = 0;
802
5.92M
    if (ctxt->validate && ctxt->wellFormed &&
803
5.92M
        ctxt->myDoc && ctxt->myDoc->intSubset)
804
2.06M
        ctxt->valid &=
805
2.06M
            xmlValidateElementDecl(&ctxt->vctxt, ctxt->myDoc, elem);
806
5.92M
#endif /* LIBXML_VALID_ENABLED */
807
5.92M
}
808
809
/**
810
 * xmlSAX2NotationDecl:
811
 * @ctx: the user data (XML parser context)
812
 * @name: The name of the notation
813
 * @publicId: The public ID of the entity
814
 * @systemId: The system ID of the entity
815
 *
816
 * What to do when a notation declaration has been parsed.
817
 */
818
void
819
xmlSAX2NotationDecl(void *ctx, const xmlChar *name,
820
       const xmlChar *publicId, const xmlChar *systemId)
821
57.8k
{
822
57.8k
    xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
823
57.8k
    xmlNotationPtr nota = NULL;
824
825
    /* Avoid unused variable warning if features are disabled. */
826
57.8k
    (void) nota;
827
828
57.8k
    if ((ctxt == NULL) || (ctxt->myDoc == NULL))
829
0
        return;
830
831
#ifdef DEBUG_SAX
832
    xmlGenericError(xmlGenericErrorContext,
833
      "SAX.xmlSAX2NotationDecl(%s, %s, %s)\n", name, publicId, systemId);
834
#endif
835
836
57.8k
    if ((publicId == NULL) && (systemId == NULL)) {
837
4.03k
  xmlFatalErrMsg(ctxt, XML_ERR_NOTATION_PROCESSING,
838
4.03k
       "SAX.xmlSAX2NotationDecl(%s) externalID or PublicID missing\n",
839
4.03k
                 name, NULL);
840
4.03k
  return;
841
53.8k
    } else if (ctxt->inSubset == 1)
842
46.0k
  nota = xmlAddNotationDecl(&ctxt->vctxt, ctxt->myDoc->intSubset, name,
843
46.0k
                              publicId, systemId);
844
7.82k
    else if (ctxt->inSubset == 2)
845
7.82k
  nota = xmlAddNotationDecl(&ctxt->vctxt, ctxt->myDoc->extSubset, name,
846
7.82k
                              publicId, systemId);
847
0
    else {
848
0
  xmlFatalErrMsg(ctxt, XML_ERR_NOTATION_PROCESSING,
849
0
       "SAX.xmlSAX2NotationDecl(%s) called while not in subset\n",
850
0
                 name, NULL);
851
0
  return;
852
0
    }
853
53.8k
#ifdef LIBXML_VALID_ENABLED
854
53.8k
    if (nota == NULL) ctxt->valid = 0;
855
53.8k
    if ((ctxt->validate) && (ctxt->wellFormed) &&
856
53.8k
        (ctxt->myDoc->intSubset != NULL))
857
20.0k
  ctxt->valid &= xmlValidateNotationDecl(&ctxt->vctxt, ctxt->myDoc,
858
20.0k
                                         nota);
859
53.8k
#endif /* LIBXML_VALID_ENABLED */
860
53.8k
}
861
862
/**
863
 * xmlSAX2UnparsedEntityDecl:
864
 * @ctx: the user data (XML parser context)
865
 * @name: The name of the entity
866
 * @publicId: The public ID of the entity
867
 * @systemId: The system ID of the entity
868
 * @notationName: the name of the notation
869
 *
870
 * What to do when an unparsed entity declaration is parsed
871
 */
872
void
873
xmlSAX2UnparsedEntityDecl(void *ctx, const xmlChar *name,
874
       const xmlChar *publicId, const xmlChar *systemId,
875
       const xmlChar *notationName)
876
104k
{
877
104k
    xmlEntityPtr ent;
878
104k
    xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
879
104k
    if (ctx == NULL) return;
880
#ifdef DEBUG_SAX
881
    xmlGenericError(xmlGenericErrorContext,
882
      "SAX.xmlSAX2UnparsedEntityDecl(%s, %s, %s, %s)\n",
883
            name, publicId, systemId, notationName);
884
#endif
885
104k
    if (ctxt->inSubset == 1) {
886
100k
  ent = xmlAddDocEntity(ctxt->myDoc, name,
887
100k
      XML_EXTERNAL_GENERAL_UNPARSED_ENTITY,
888
100k
      publicId, systemId, notationName);
889
100k
  if ((ent == NULL) && (ctxt->pedantic) &&
890
100k
      (ctxt->sax != NULL) && (ctxt->sax->warning != NULL))
891
2.79k
      ctxt->sax->warning(ctxt->userData,
892
2.79k
       "Entity(%s) already defined in the internal subset\n", name);
893
100k
  if ((ent != NULL) && (ent->URI == NULL) && (systemId != NULL)) {
894
86.1k
      xmlChar *URI;
895
86.1k
      const char *base = NULL;
896
897
86.1k
      if (ctxt->input != NULL)
898
86.1k
    base = ctxt->input->filename;
899
86.1k
      if (base == NULL)
900
28.4k
    base = ctxt->directory;
901
902
86.1k
      URI = xmlBuildURI(systemId, (const xmlChar *) base);
903
86.1k
      ent->URI = URI;
904
86.1k
  }
905
100k
    } else if (ctxt->inSubset == 2) {
906
4.12k
  ent = xmlAddDtdEntity(ctxt->myDoc, name,
907
4.12k
      XML_EXTERNAL_GENERAL_UNPARSED_ENTITY,
908
4.12k
      publicId, systemId, notationName);
909
4.12k
  if ((ent == NULL) && (ctxt->pedantic) &&
910
4.12k
      (ctxt->sax != NULL) && (ctxt->sax->warning != NULL))
911
42
      ctxt->sax->warning(ctxt->userData,
912
42
       "Entity(%s) already defined in the external subset\n", name);
913
4.12k
  if ((ent != NULL) && (ent->URI == NULL) && (systemId != NULL)) {
914
3.64k
      xmlChar *URI;
915
3.64k
      const char *base = NULL;
916
917
3.64k
      if (ctxt->input != NULL)
918
3.64k
    base = ctxt->input->filename;
919
3.64k
      if (base == NULL)
920
0
    base = ctxt->directory;
921
922
3.64k
      URI = xmlBuildURI(systemId, (const xmlChar *) base);
923
3.64k
      ent->URI = URI;
924
3.64k
  }
925
4.12k
    } else {
926
0
        xmlFatalErrMsg(ctxt, XML_ERR_INTERNAL_ERROR,
927
0
       "SAX.xmlSAX2UnparsedEntityDecl(%s) called while not in subset\n",
928
0
                 name, NULL);
929
0
    }
930
104k
}
931
932
/**
933
 * xmlSAX2SetDocumentLocator:
934
 * @ctx: the user data (XML parser context)
935
 * @loc: A SAX Locator
936
 *
937
 * Receive the document locator at startup, actually xmlDefaultSAXLocator
938
 * Everything is available on the context, so this is useless in our case.
939
 */
940
void
941
xmlSAX2SetDocumentLocator(void *ctx ATTRIBUTE_UNUSED, xmlSAXLocatorPtr loc ATTRIBUTE_UNUSED)
942
10.7M
{
943
    /* xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx; */
944
#ifdef DEBUG_SAX
945
    xmlGenericError(xmlGenericErrorContext,
946
      "SAX.xmlSAX2SetDocumentLocator()\n");
947
#endif
948
10.7M
}
949
950
/**
951
 * xmlSAX2StartDocument:
952
 * @ctx: the user data (XML parser context)
953
 *
954
 * called when the document start being processed.
955
 */
956
void
957
xmlSAX2StartDocument(void *ctx)
958
10.2M
{
959
10.2M
    xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
960
10.2M
    xmlDocPtr doc;
961
962
10.2M
    if (ctx == NULL) return;
963
964
#ifdef DEBUG_SAX
965
    xmlGenericError(xmlGenericErrorContext,
966
      "SAX.xmlSAX2StartDocument()\n");
967
#endif
968
10.2M
    if (ctxt->html) {
969
0
#ifdef LIBXML_HTML_ENABLED
970
0
  if (ctxt->myDoc == NULL)
971
0
      ctxt->myDoc = htmlNewDocNoDtD(NULL, NULL);
972
0
  if (ctxt->myDoc == NULL) {
973
0
      xmlSAX2ErrMemory(ctxt, "xmlSAX2StartDocument");
974
0
      return;
975
0
  }
976
0
  ctxt->myDoc->properties = XML_DOC_HTML;
977
0
  ctxt->myDoc->parseFlags = ctxt->options;
978
#else
979
        xmlGenericError(xmlGenericErrorContext,
980
    "libxml2 built without HTML support\n");
981
  ctxt->errNo = XML_ERR_INTERNAL_ERROR;
982
  ctxt->instate = XML_PARSER_EOF;
983
  ctxt->disableSAX = 1;
984
  return;
985
#endif
986
10.2M
    } else {
987
10.2M
  doc = ctxt->myDoc = xmlNewDoc(ctxt->version);
988
10.2M
  if (doc != NULL) {
989
10.2M
      doc->properties = 0;
990
10.2M
      if (ctxt->options & XML_PARSE_OLD10)
991
3.59M
          doc->properties |= XML_DOC_OLD10;
992
10.2M
      doc->parseFlags = ctxt->options;
993
10.2M
      if (ctxt->encoding != NULL)
994
893k
    doc->encoding = xmlStrdup(ctxt->encoding);
995
9.34M
      else
996
9.34M
    doc->encoding = NULL;
997
10.2M
      doc->standalone = ctxt->standalone;
998
10.2M
  } else {
999
0
      xmlSAX2ErrMemory(ctxt, "xmlSAX2StartDocument");
1000
0
      return;
1001
0
  }
1002
10.2M
  if ((ctxt->dictNames) && (doc != NULL)) {
1003
6.57M
      doc->dict = ctxt->dict;
1004
6.57M
      xmlDictReference(doc->dict);
1005
6.57M
  }
1006
10.2M
    }
1007
10.2M
    if ((ctxt->myDoc != NULL) && (ctxt->myDoc->URL == NULL) &&
1008
10.2M
  (ctxt->input != NULL) && (ctxt->input->filename != NULL)) {
1009
6.83M
  ctxt->myDoc->URL = xmlPathToURI((const xmlChar *)ctxt->input->filename);
1010
6.83M
  if (ctxt->myDoc->URL == NULL)
1011
4
      xmlSAX2ErrMemory(ctxt, "xmlSAX2StartDocument");
1012
6.83M
    }
1013
10.2M
}
1014
1015
/**
1016
 * xmlSAX2EndDocument:
1017
 * @ctx: the user data (XML parser context)
1018
 *
1019
 * called when the document end has been detected.
1020
 */
1021
void
1022
xmlSAX2EndDocument(void *ctx)
1023
6.06M
{
1024
6.06M
    xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
1025
#ifdef DEBUG_SAX
1026
    xmlGenericError(xmlGenericErrorContext,
1027
      "SAX.xmlSAX2EndDocument()\n");
1028
#endif
1029
6.06M
    if (ctx == NULL) return;
1030
6.06M
#ifdef LIBXML_VALID_ENABLED
1031
6.06M
    if (ctxt->validate && ctxt->wellFormed &&
1032
6.06M
        ctxt->myDoc && ctxt->myDoc->intSubset)
1033
281k
  ctxt->valid &= xmlValidateDocumentFinal(&ctxt->vctxt, ctxt->myDoc);
1034
6.06M
#endif /* LIBXML_VALID_ENABLED */
1035
1036
    /*
1037
     * Grab the encoding if it was added on-the-fly
1038
     */
1039
6.06M
    if ((ctxt->encoding != NULL) && (ctxt->myDoc != NULL) &&
1040
6.06M
  (ctxt->myDoc->encoding == NULL)) {
1041
744
  ctxt->myDoc->encoding = ctxt->encoding;
1042
744
  ctxt->encoding = NULL;
1043
744
    }
1044
6.06M
    if ((ctxt->inputTab != NULL) &&
1045
6.06M
        (ctxt->inputNr > 0) && (ctxt->inputTab[0] != NULL) &&
1046
6.06M
        (ctxt->inputTab[0]->encoding != NULL) && (ctxt->myDoc != NULL) &&
1047
6.06M
  (ctxt->myDoc->encoding == NULL)) {
1048
173k
  ctxt->myDoc->encoding = xmlStrdup(ctxt->inputTab[0]->encoding);
1049
173k
    }
1050
6.06M
    if ((ctxt->charset != XML_CHAR_ENCODING_NONE) && (ctxt->myDoc != NULL) &&
1051
6.06M
  (ctxt->myDoc->charset == XML_CHAR_ENCODING_NONE)) {
1052
0
  ctxt->myDoc->charset = ctxt->charset;
1053
0
    }
1054
6.06M
}
1055
1056
#if defined(LIBXML_SAX1_ENABLED) || defined(LIBXML_HTML_ENABLED) || defined(LIBXML_WRITER_ENABLED) || defined(LIBXML_LEGACY_ENABLED)
1057
/**
1058
 * xmlNsErrMsg:
1059
 * @ctxt:  an XML parser context
1060
 * @error:  the error number
1061
 * @msg:  the error message
1062
 * @str1:  an error string
1063
 * @str2:  an error string
1064
 *
1065
 * Handle a namespace error
1066
 */
1067
static void LIBXML_ATTR_FORMAT(3,0)
1068
xmlNsErrMsg(xmlParserCtxtPtr ctxt, xmlParserErrors error,
1069
            const char *msg, const xmlChar *str1, const xmlChar *str2)
1070
1.44M
{
1071
1.44M
    if ((ctxt != NULL) && (ctxt->disableSAX != 0) &&
1072
1.44M
        (ctxt->instate == XML_PARSER_EOF))
1073
0
  return;
1074
1.44M
    if (ctxt != NULL)
1075
1.44M
  ctxt->errNo = error;
1076
1.44M
    __xmlRaiseError(NULL, NULL, NULL, ctxt, NULL, XML_FROM_NAMESPACE, error,
1077
1.44M
                    XML_ERR_ERROR, NULL, 0,
1078
1.44M
        (const char *) str1, (const char *) str2,
1079
1.44M
        NULL, 0, 0, msg, str1, str2);
1080
1.44M
}
1081
1082
/**
1083
 * xmlSAX2AttributeInternal:
1084
 * @ctx: the user data (XML parser context)
1085
 * @fullname:  The attribute name, including namespace prefix
1086
 * @value:  The attribute value
1087
 * @prefix: the prefix on the element node
1088
 *
1089
 * Handle an attribute that has been read by the parser.
1090
 * The default handling is to convert the attribute into an
1091
 * DOM subtree and past it in a new xmlAttr element added to
1092
 * the element.
1093
 */
1094
static void
1095
xmlSAX2AttributeInternal(void *ctx, const xmlChar *fullname,
1096
             const xmlChar *value, const xmlChar *prefix ATTRIBUTE_UNUSED)
1097
38.4M
{
1098
38.4M
    xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
1099
38.4M
    xmlAttrPtr ret;
1100
38.4M
    xmlChar *name;
1101
38.4M
    xmlChar *ns;
1102
38.4M
    xmlChar *nval;
1103
38.4M
    xmlNsPtr namespace;
1104
1105
38.4M
    if (ctxt->html) {
1106
0
  name = xmlStrdup(fullname);
1107
0
  ns = NULL;
1108
0
  namespace = NULL;
1109
38.4M
    } else {
1110
  /*
1111
   * Split the full name into a namespace prefix and the tag name
1112
   */
1113
38.4M
  name = xmlSplitQName(ctxt, fullname, &ns);
1114
38.4M
  if ((name != NULL) && (name[0] == 0)) {
1115
0
      if (xmlStrEqual(ns, BAD_CAST "xmlns")) {
1116
0
    xmlNsErrMsg(ctxt, XML_ERR_NS_DECL_ERROR,
1117
0
          "invalid namespace declaration '%s'\n",
1118
0
          fullname, NULL);
1119
0
      } else {
1120
0
    xmlNsWarnMsg(ctxt, XML_WAR_NS_COLUMN,
1121
0
           "Avoid attribute ending with ':' like '%s'\n",
1122
0
           fullname, NULL);
1123
0
      }
1124
0
      if (ns != NULL)
1125
0
    xmlFree(ns);
1126
0
      ns = NULL;
1127
0
      xmlFree(name);
1128
0
      name = xmlStrdup(fullname);
1129
0
  }
1130
38.4M
    }
1131
38.4M
    if (name == NULL) {
1132
0
        xmlSAX2ErrMemory(ctxt, "xmlSAX2StartElement");
1133
0
  if (ns != NULL)
1134
0
      xmlFree(ns);
1135
0
  return;
1136
0
    }
1137
1138
38.4M
#ifdef LIBXML_HTML_ENABLED
1139
38.4M
    if ((ctxt->html) &&
1140
38.4M
        (value == NULL) && (htmlIsBooleanAttr(fullname))) {
1141
0
            nval = xmlStrdup(fullname);
1142
0
            value = (const xmlChar *) nval;
1143
0
    } else
1144
38.4M
#endif
1145
38.4M
    {
1146
38.4M
#ifdef LIBXML_VALID_ENABLED
1147
        /*
1148
         * Do the last stage of the attribute normalization
1149
         * Needed for HTML too:
1150
         *   http://www.w3.org/TR/html4/types.html#h-6.2
1151
         */
1152
38.4M
        ctxt->vctxt.valid = 1;
1153
38.4M
        nval = xmlValidCtxtNormalizeAttributeValue(&ctxt->vctxt,
1154
38.4M
                                               ctxt->myDoc, ctxt->node,
1155
38.4M
                                               fullname, value);
1156
38.4M
        if (ctxt->vctxt.valid != 1) {
1157
5.61k
            ctxt->valid = 0;
1158
5.61k
        }
1159
38.4M
        if (nval != NULL)
1160
595k
            value = nval;
1161
#else
1162
        nval = NULL;
1163
#endif /* LIBXML_VALID_ENABLED */
1164
38.4M
    }
1165
1166
    /*
1167
     * Check whether it's a namespace definition
1168
     */
1169
38.4M
    if ((!ctxt->html) && (ns == NULL) &&
1170
38.4M
        (name[0] == 'x') && (name[1] == 'm') && (name[2] == 'l') &&
1171
38.4M
        (name[3] == 'n') && (name[4] == 's') && (name[5] == 0)) {
1172
2.33M
  xmlNsPtr nsret;
1173
2.33M
  xmlChar *val;
1174
1175
        /* Avoid unused variable warning if features are disabled. */
1176
2.33M
        (void) nsret;
1177
1178
2.33M
        if (!ctxt->replaceEntities) {
1179
1.16M
      ctxt->depth++;
1180
1.16M
      val = xmlStringDecodeEntities(ctxt, value, XML_SUBSTITUTE_REF,
1181
1.16M
                              0,0,0);
1182
1.16M
      ctxt->depth--;
1183
1.16M
      if (val == NULL) {
1184
0
          xmlSAX2ErrMemory(ctxt, "xmlSAX2StartElement");
1185
0
    if (name != NULL)
1186
0
        xmlFree(name);
1187
0
                if (nval != NULL)
1188
0
                    xmlFree(nval);
1189
0
    return;
1190
0
      }
1191
1.16M
  } else {
1192
1.16M
      val = (xmlChar *) value;
1193
1.16M
  }
1194
1195
2.33M
  if (val[0] != 0) {
1196
2.26M
      xmlURIPtr uri;
1197
1198
2.26M
      uri = xmlParseURI((const char *)val);
1199
2.26M
      if (uri == NULL) {
1200
1.25M
    if ((ctxt->sax != NULL) && (ctxt->sax->warning != NULL))
1201
676k
        ctxt->sax->warning(ctxt->userData,
1202
676k
       "xmlns: %s not a valid URI\n", val);
1203
1.25M
      } else {
1204
1.01M
    if (uri->scheme == NULL) {
1205
285k
        if ((ctxt->sax != NULL) && (ctxt->sax->warning != NULL))
1206
174k
      ctxt->sax->warning(ctxt->userData,
1207
174k
           "xmlns: URI %s is not absolute\n", val);
1208
285k
    }
1209
1.01M
    xmlFreeURI(uri);
1210
1.01M
      }
1211
2.26M
  }
1212
1213
  /* a default namespace definition */
1214
2.33M
  nsret = xmlNewNs(ctxt->node, val, NULL);
1215
1216
2.33M
#ifdef LIBXML_VALID_ENABLED
1217
  /*
1218
   * Validate also for namespace decls, they are attributes from
1219
   * an XML-1.0 perspective
1220
   */
1221
2.33M
        if (nsret != NULL && ctxt->validate && ctxt->wellFormed &&
1222
2.33M
      ctxt->myDoc && ctxt->myDoc->intSubset)
1223
21.5k
      ctxt->valid &= xmlValidateOneNamespace(&ctxt->vctxt, ctxt->myDoc,
1224
21.5k
             ctxt->node, prefix, nsret, val);
1225
2.33M
#endif /* LIBXML_VALID_ENABLED */
1226
2.33M
  if (name != NULL)
1227
2.33M
      xmlFree(name);
1228
2.33M
  if (nval != NULL)
1229
571
      xmlFree(nval);
1230
2.33M
  if (val != value)
1231
1.16M
      xmlFree(val);
1232
2.33M
  return;
1233
2.33M
    }
1234
36.0M
    if ((!ctxt->html) &&
1235
36.0M
  (ns != NULL) && (ns[0] == 'x') && (ns[1] == 'm') && (ns[2] == 'l') &&
1236
36.0M
        (ns[3] == 'n') && (ns[4] == 's') && (ns[5] == 0)) {
1237
1.88M
  xmlNsPtr nsret;
1238
1.88M
  xmlChar *val;
1239
1240
        /* Avoid unused variable warning if features are disabled. */
1241
1.88M
        (void) nsret;
1242
1243
1.88M
        if (!ctxt->replaceEntities) {
1244
1.00M
      ctxt->depth++;
1245
1.00M
      val = xmlStringDecodeEntities(ctxt, value, XML_SUBSTITUTE_REF,
1246
1.00M
                              0,0,0);
1247
1.00M
      ctxt->depth--;
1248
1.00M
      if (val == NULL) {
1249
0
          xmlSAX2ErrMemory(ctxt, "xmlSAX2StartElement");
1250
0
          xmlFree(ns);
1251
0
    if (name != NULL)
1252
0
        xmlFree(name);
1253
0
                if (nval != NULL)
1254
0
                    xmlFree(nval);
1255
0
    return;
1256
0
      }
1257
1.00M
  } else {
1258
887k
      val = (xmlChar *) value;
1259
887k
  }
1260
1261
1.88M
  if (val[0] == 0) {
1262
54.5k
      xmlNsErrMsg(ctxt, XML_NS_ERR_EMPTY,
1263
54.5k
            "Empty namespace name for prefix %s\n", name, NULL);
1264
54.5k
  }
1265
1.88M
  if ((ctxt->pedantic != 0) && (val[0] != 0)) {
1266
986k
      xmlURIPtr uri;
1267
1268
986k
      uri = xmlParseURI((const char *)val);
1269
986k
      if (uri == NULL) {
1270
204k
          xmlNsWarnMsg(ctxt, XML_WAR_NS_URI,
1271
204k
       "xmlns:%s: %s not a valid URI\n", name, value);
1272
781k
      } else {
1273
781k
    if (uri->scheme == NULL) {
1274
379k
        xmlNsWarnMsg(ctxt, XML_WAR_NS_URI_RELATIVE,
1275
379k
         "xmlns:%s: URI %s is not absolute\n", name, value);
1276
379k
    }
1277
781k
    xmlFreeURI(uri);
1278
781k
      }
1279
986k
  }
1280
1281
  /* a standard namespace definition */
1282
1.88M
  nsret = xmlNewNs(ctxt->node, val, name);
1283
1.88M
  xmlFree(ns);
1284
1.88M
#ifdef LIBXML_VALID_ENABLED
1285
  /*
1286
   * Validate also for namespace decls, they are attributes from
1287
   * an XML-1.0 perspective
1288
   */
1289
1.88M
        if (nsret != NULL && ctxt->validate && ctxt->wellFormed &&
1290
1.88M
      ctxt->myDoc && ctxt->myDoc->intSubset)
1291
55.4k
      ctxt->valid &= xmlValidateOneNamespace(&ctxt->vctxt, ctxt->myDoc,
1292
55.4k
             ctxt->node, prefix, nsret, value);
1293
1.88M
#endif /* LIBXML_VALID_ENABLED */
1294
1.88M
  if (name != NULL)
1295
1.88M
      xmlFree(name);
1296
1.88M
  if (nval != NULL)
1297
27.7k
      xmlFree(nval);
1298
1.88M
  if (val != value)
1299
1.00M
      xmlFree(val);
1300
1.88M
  return;
1301
1.88M
    }
1302
1303
34.1M
    if (ns != NULL) {
1304
3.32M
  namespace = xmlSearchNs(ctxt->myDoc, ctxt->node, ns);
1305
1306
3.32M
  if (namespace == NULL) {
1307
1.38M
      xmlNsErrMsg(ctxt, XML_NS_ERR_UNDEFINED_NAMESPACE,
1308
1.38M
        "Namespace prefix %s of attribute %s is not defined\n",
1309
1.38M
                 ns, name);
1310
1.93M
  } else {
1311
1.93M
            xmlAttrPtr prop;
1312
1313
1.93M
            prop = ctxt->node->properties;
1314
2.53M
            while (prop != NULL) {
1315
611k
                if (prop->ns != NULL) {
1316
209k
                    if ((xmlStrEqual(name, prop->name)) &&
1317
209k
                        ((namespace == prop->ns) ||
1318
5.69k
                         (xmlStrEqual(namespace->href, prop->ns->href)))) {
1319
3.71k
                            xmlNsErrMsg(ctxt, XML_ERR_ATTRIBUTE_REDEFINED,
1320
3.71k
                                    "Attribute %s in %s redefined\n",
1321
3.71k
                                             name, namespace->href);
1322
3.71k
                        ctxt->wellFormed = 0;
1323
3.71k
                        if (ctxt->recovery == 0) ctxt->disableSAX = 1;
1324
3.71k
                        if (name != NULL)
1325
3.71k
                            xmlFree(name);
1326
3.71k
                        goto error;
1327
3.71k
                    }
1328
209k
                }
1329
607k
                prop = prop->next;
1330
607k
            }
1331
1.93M
        }
1332
30.8M
    } else {
1333
30.8M
  namespace = NULL;
1334
30.8M
    }
1335
1336
    /* !!!!!! <a toto:arg="" xmlns:toto="http://toto.com"> */
1337
34.1M
    ret = xmlNewNsPropEatName(ctxt->node, namespace, name, NULL);
1338
34.1M
    if (ret == NULL)
1339
0
        goto error;
1340
1341
34.1M
    if ((ctxt->replaceEntities == 0) && (!ctxt->html)) {
1342
20.4M
        xmlNodePtr tmp;
1343
1344
20.4M
        ret->children = xmlStringGetNodeList(ctxt->myDoc, value);
1345
20.4M
        tmp = ret->children;
1346
41.7M
        while (tmp != NULL) {
1347
21.3M
            tmp->parent = (xmlNodePtr) ret;
1348
21.3M
            if (tmp->next == NULL)
1349
20.2M
                ret->last = tmp;
1350
21.3M
            tmp = tmp->next;
1351
21.3M
        }
1352
20.4M
    } else if (value != NULL) {
1353
13.7M
        ret->children = xmlNewDocText(ctxt->myDoc, value);
1354
13.7M
        ret->last = ret->children;
1355
13.7M
        if (ret->children != NULL)
1356
13.7M
            ret->children->parent = (xmlNodePtr) ret;
1357
13.7M
    }
1358
1359
34.1M
#ifdef LIBXML_VALID_ENABLED
1360
34.1M
    if ((!ctxt->html) && ctxt->validate && ctxt->wellFormed &&
1361
34.1M
        ctxt->myDoc && ctxt->myDoc->intSubset) {
1362
1363
  /*
1364
   * If we don't substitute entities, the validation should be
1365
   * done on a value with replaced entities anyway.
1366
   */
1367
1.52M
        if (!ctxt->replaceEntities) {
1368
936k
      xmlChar *val;
1369
1370
936k
      ctxt->depth++;
1371
936k
      val = xmlStringDecodeEntities(ctxt, value, XML_SUBSTITUTE_REF,
1372
936k
                              0,0,0);
1373
936k
      ctxt->depth--;
1374
1375
936k
      if (val == NULL)
1376
0
    ctxt->valid &= xmlValidateOneAttribute(&ctxt->vctxt,
1377
0
        ctxt->myDoc, ctxt->node, ret, value);
1378
936k
      else {
1379
936k
    xmlChar *nvalnorm;
1380
1381
    /*
1382
     * Do the last stage of the attribute normalization
1383
     * It need to be done twice ... it's an extra burden related
1384
     * to the ability to keep xmlSAX2References in attributes
1385
     */
1386
936k
    nvalnorm = xmlValidNormalizeAttributeValue(ctxt->myDoc,
1387
936k
              ctxt->node, fullname, val);
1388
936k
    if (nvalnorm != NULL) {
1389
69.1k
        xmlFree(val);
1390
69.1k
        val = nvalnorm;
1391
69.1k
    }
1392
1393
936k
    ctxt->valid &= xmlValidateOneAttribute(&ctxt->vctxt,
1394
936k
              ctxt->myDoc, ctxt->node, ret, val);
1395
936k
                xmlFree(val);
1396
936k
      }
1397
936k
  } else {
1398
589k
      ctxt->valid &= xmlValidateOneAttribute(&ctxt->vctxt, ctxt->myDoc,
1399
589k
                 ctxt->node, ret, value);
1400
589k
  }
1401
1.52M
    } else
1402
32.6M
#endif /* LIBXML_VALID_ENABLED */
1403
32.6M
           if (((ctxt->loadsubset & XML_SKIP_IDS) == 0) &&
1404
32.6M
         (((ctxt->replaceEntities == 0) && (ctxt->external != 2)) ||
1405
32.6M
          ((ctxt->replaceEntities != 0) && (ctxt->inSubset == 0))) &&
1406
               /* Don't create IDs containing entity references */
1407
32.6M
               (ret->children != NULL) &&
1408
32.6M
               (ret->children->type == XML_TEXT_NODE) &&
1409
32.6M
               (ret->children->next == NULL)) {
1410
32.3M
        xmlChar *content = ret->children->content;
1411
        /*
1412
   * when validating, the ID registration is done at the attribute
1413
   * validation level. Otherwise we have to do specific handling here.
1414
   */
1415
32.3M
  if (xmlStrEqual(fullname, BAD_CAST "xml:id")) {
1416
      /*
1417
       * Add the xml:id value
1418
       *
1419
       * Open issue: normalization of the value.
1420
       */
1421
552k
      if (xmlValidateNCName(content, 1) != 0) {
1422
290k
          xmlErrValid(ctxt, XML_DTD_XMLID_VALUE,
1423
290k
          "xml:id : attribute value %s is not an NCName\n",
1424
290k
          (const char *) content, NULL);
1425
290k
      }
1426
552k
      xmlAddID(&ctxt->vctxt, ctxt->myDoc, content, ret);
1427
31.8M
  } else if (xmlIsID(ctxt->myDoc, ctxt->node, ret))
1428
27.7k
      xmlAddID(&ctxt->vctxt, ctxt->myDoc, content, ret);
1429
31.7M
  else if (xmlIsRef(ctxt->myDoc, ctxt->node, ret))
1430
29.1k
      xmlAddRef(&ctxt->vctxt, ctxt->myDoc, content, ret);
1431
32.3M
    }
1432
1433
34.1M
error:
1434
34.1M
    if (nval != NULL)
1435
567k
  xmlFree(nval);
1436
34.1M
    if (ns != NULL)
1437
3.32M
  xmlFree(ns);
1438
34.1M
}
1439
1440
/*
1441
 * xmlCheckDefaultedAttributes:
1442
 *
1443
 * Check defaulted attributes from the DTD
1444
 */
1445
static void
1446
xmlCheckDefaultedAttributes(xmlParserCtxtPtr ctxt, const xmlChar *name,
1447
10.5M
  const xmlChar *prefix, const xmlChar **atts) {
1448
10.5M
    xmlElementPtr elemDecl;
1449
10.5M
    const xmlChar *att;
1450
10.5M
    int internal = 1;
1451
10.5M
    int i;
1452
1453
10.5M
    elemDecl = xmlGetDtdQElementDesc(ctxt->myDoc->intSubset, name, prefix);
1454
10.5M
    if (elemDecl == NULL) {
1455
9.27M
  elemDecl = xmlGetDtdQElementDesc(ctxt->myDoc->extSubset, name, prefix);
1456
9.27M
  internal = 0;
1457
9.27M
    }
1458
1459
11.7M
process_external_subset:
1460
1461
11.7M
    if (elemDecl != NULL) {
1462
1.40M
  xmlAttributePtr attr = elemDecl->attributes;
1463
  /*
1464
   * Check against defaulted attributes from the external subset
1465
   * if the document is stamped as standalone
1466
   */
1467
1.40M
  if ((ctxt->myDoc->standalone == 1) &&
1468
1.40M
      (ctxt->myDoc->extSubset != NULL) &&
1469
1.40M
      (ctxt->validate)) {
1470
0
      while (attr != NULL) {
1471
0
    if ((attr->defaultValue != NULL) &&
1472
0
        (xmlGetDtdQAttrDesc(ctxt->myDoc->extSubset,
1473
0
          attr->elem, attr->name,
1474
0
          attr->prefix) == attr) &&
1475
0
        (xmlGetDtdQAttrDesc(ctxt->myDoc->intSubset,
1476
0
          attr->elem, attr->name,
1477
0
          attr->prefix) == NULL)) {
1478
0
        xmlChar *fulln;
1479
1480
0
        if (attr->prefix != NULL) {
1481
0
      fulln = xmlStrdup(attr->prefix);
1482
0
      fulln = xmlStrcat(fulln, BAD_CAST ":");
1483
0
      fulln = xmlStrcat(fulln, attr->name);
1484
0
        } else {
1485
0
      fulln = xmlStrdup(attr->name);
1486
0
        }
1487
0
                    if (fulln == NULL) {
1488
0
                        xmlSAX2ErrMemory(ctxt, "xmlSAX2StartElement");
1489
0
                        break;
1490
0
                    }
1491
1492
        /*
1493
         * Check that the attribute is not declared in the
1494
         * serialization
1495
         */
1496
0
        att = NULL;
1497
0
        if (atts != NULL) {
1498
0
      i = 0;
1499
0
      att = atts[i];
1500
0
      while (att != NULL) {
1501
0
          if (xmlStrEqual(att, fulln))
1502
0
        break;
1503
0
          i += 2;
1504
0
          att = atts[i];
1505
0
      }
1506
0
        }
1507
0
        if (att == NULL) {
1508
0
            xmlErrValid(ctxt, XML_DTD_STANDALONE_DEFAULTED,
1509
0
      "standalone: attribute %s on %s defaulted from external subset\n",
1510
0
            (const char *)fulln,
1511
0
            (const char *)attr->elem);
1512
0
        }
1513
0
                    xmlFree(fulln);
1514
0
    }
1515
0
    attr = attr->nexth;
1516
0
      }
1517
0
  }
1518
1519
  /*
1520
   * Actually insert defaulted values when needed
1521
   */
1522
1.40M
  attr = elemDecl->attributes;
1523
2.68M
  while (attr != NULL) {
1524
      /*
1525
       * Make sure that attributes redefinition occurring in the
1526
       * internal subset are not overridden by definitions in the
1527
       * external subset.
1528
       */
1529
1.27M
      if (attr->defaultValue != NULL) {
1530
    /*
1531
     * the element should be instantiated in the tree if:
1532
     *  - this is a namespace prefix
1533
     *  - the user required for completion in the tree
1534
     *    like XSLT
1535
     *  - there isn't already an attribute definition
1536
     *    in the internal subset overriding it.
1537
     */
1538
381k
    if (((attr->prefix != NULL) &&
1539
381k
         (xmlStrEqual(attr->prefix, BAD_CAST "xmlns"))) ||
1540
381k
        ((attr->prefix == NULL) &&
1541
296k
         (xmlStrEqual(attr->name, BAD_CAST "xmlns"))) ||
1542
381k
        (ctxt->loadsubset & XML_COMPLETE_ATTRS)) {
1543
324k
        xmlAttributePtr tst;
1544
1545
324k
        tst = xmlGetDtdQAttrDesc(ctxt->myDoc->intSubset,
1546
324k
               attr->elem, attr->name,
1547
324k
               attr->prefix);
1548
324k
        if ((tst == attr) || (tst == NULL)) {
1549
324k
            xmlChar fn[50];
1550
324k
      xmlChar *fulln;
1551
1552
324k
                        fulln = xmlBuildQName(attr->name, attr->prefix, fn, 50);
1553
324k
      if (fulln == NULL) {
1554
0
          xmlSAX2ErrMemory(ctxt, "xmlSAX2StartElement");
1555
0
          return;
1556
0
      }
1557
1558
      /*
1559
       * Check that the attribute is not declared in the
1560
       * serialization
1561
       */
1562
324k
      att = NULL;
1563
324k
      if (atts != NULL) {
1564
146k
          i = 0;
1565
146k
          att = atts[i];
1566
292k
          while (att != NULL) {
1567
156k
        if (xmlStrEqual(att, fulln))
1568
9.64k
            break;
1569
146k
        i += 2;
1570
146k
        att = atts[i];
1571
146k
          }
1572
146k
      }
1573
324k
      if (att == NULL) {
1574
315k
          xmlSAX2AttributeInternal(ctxt, fulln,
1575
315k
             attr->defaultValue, prefix);
1576
315k
      }
1577
324k
      if ((fulln != fn) && (fulln != attr->name))
1578
47.0k
          xmlFree(fulln);
1579
324k
        }
1580
324k
    }
1581
381k
      }
1582
1.27M
      attr = attr->nexth;
1583
1.27M
  }
1584
1.40M
  if (internal == 1) {
1585
1.24M
      elemDecl = xmlGetDtdQElementDesc(ctxt->myDoc->extSubset,
1586
1.24M
                                 name, prefix);
1587
1.24M
      internal = 0;
1588
1.24M
      goto process_external_subset;
1589
1.24M
  }
1590
1.40M
    }
1591
11.7M
}
1592
1593
/**
1594
 * xmlSAX2StartElement:
1595
 * @ctx: the user data (XML parser context)
1596
 * @fullname:  The element name, including namespace prefix
1597
 * @atts:  An array of name/value attributes pairs, NULL terminated
1598
 *
1599
 * called when an opening tag has been processed.
1600
 */
1601
void
1602
xmlSAX2StartElement(void *ctx, const xmlChar *fullname, const xmlChar **atts)
1603
39.1M
{
1604
39.1M
    xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
1605
39.1M
    xmlNodePtr ret;
1606
39.1M
    xmlNodePtr parent;
1607
39.1M
    xmlNsPtr ns;
1608
39.1M
    xmlChar *name;
1609
39.1M
    xmlChar *prefix;
1610
39.1M
    const xmlChar *att;
1611
39.1M
    const xmlChar *value;
1612
39.1M
    int i;
1613
1614
39.1M
    if ((ctx == NULL) || (fullname == NULL) || (ctxt->myDoc == NULL)) return;
1615
39.1M
    parent = ctxt->node;
1616
#ifdef DEBUG_SAX
1617
    xmlGenericError(xmlGenericErrorContext,
1618
      "SAX.xmlSAX2StartElement(%s)\n", fullname);
1619
#endif
1620
1621
    /*
1622
     * First check on validity:
1623
     */
1624
39.1M
    if (ctxt->validate && (ctxt->myDoc->extSubset == NULL) &&
1625
39.1M
        ((ctxt->myDoc->intSubset == NULL) ||
1626
4.80M
   ((ctxt->myDoc->intSubset->notations == NULL) &&
1627
4.02M
    (ctxt->myDoc->intSubset->elements == NULL) &&
1628
4.02M
    (ctxt->myDoc->intSubset->attributes == NULL) &&
1629
4.02M
    (ctxt->myDoc->intSubset->entities == NULL)))) {
1630
895k
  xmlErrValid(ctxt, XML_ERR_NO_DTD,
1631
895k
    "Validation failed: no DTD found !", NULL, NULL);
1632
895k
  ctxt->validate = 0;
1633
895k
    }
1634
1635
1636
    /*
1637
     * Split the full name into a namespace prefix and the tag name
1638
     */
1639
39.1M
    name = xmlSplitQName(ctxt, fullname, &prefix);
1640
1641
1642
    /*
1643
     * Note : the namespace resolution is deferred until the end of the
1644
     *        attributes parsing, since local namespace can be defined as
1645
     *        an attribute at this level.
1646
     */
1647
39.1M
    ret = xmlNewDocNodeEatName(ctxt->myDoc, NULL, name, NULL);
1648
39.1M
    if (ret == NULL) {
1649
0
        if (prefix != NULL)
1650
0
      xmlFree(prefix);
1651
0
  xmlSAX2ErrMemory(ctxt, "xmlSAX2StartElement");
1652
0
        return;
1653
0
    }
1654
39.1M
    if (ctxt->myDoc->children == NULL) {
1655
#ifdef DEBUG_SAX_TREE
1656
  xmlGenericError(xmlGenericErrorContext, "Setting %s as root\n", name);
1657
#endif
1658
1.30M
        xmlAddChild((xmlNodePtr) ctxt->myDoc, (xmlNodePtr) ret);
1659
37.8M
    } else if (parent == NULL) {
1660
5.29M
        parent = ctxt->myDoc->children;
1661
5.29M
    }
1662
39.1M
    ctxt->nodemem = -1;
1663
39.1M
    if (ctxt->linenumbers) {
1664
39.0M
  if (ctxt->input != NULL) {
1665
39.0M
      if ((unsigned) ctxt->input->line < (unsigned) USHRT_MAX)
1666
38.6M
    ret->line = ctxt->input->line;
1667
438k
      else
1668
438k
          ret->line = USHRT_MAX;
1669
39.0M
  }
1670
39.0M
    }
1671
1672
    /*
1673
     * We are parsing a new node.
1674
     */
1675
#ifdef DEBUG_SAX_TREE
1676
    xmlGenericError(xmlGenericErrorContext, "pushing(%s)\n", name);
1677
#endif
1678
39.1M
    if (nodePush(ctxt, ret) < 0) {
1679
554
        xmlUnlinkNode(ret);
1680
554
        xmlFreeNode(ret);
1681
554
        if (prefix != NULL)
1682
368
            xmlFree(prefix);
1683
554
        return;
1684
554
    }
1685
1686
    /*
1687
     * Link the child element
1688
     */
1689
39.1M
    if (parent != NULL) {
1690
37.8M
        if (parent->type == XML_ELEMENT_NODE) {
1691
#ifdef DEBUG_SAX_TREE
1692
      xmlGenericError(xmlGenericErrorContext,
1693
        "adding child %s to %s\n", name, parent->name);
1694
#endif
1695
36.2M
      xmlAddChild(parent, ret);
1696
36.2M
  } else {
1697
#ifdef DEBUG_SAX_TREE
1698
      xmlGenericError(xmlGenericErrorContext,
1699
        "adding sibling %s to ", name);
1700
      xmlDebugDumpOneNode(stderr, parent, 0);
1701
#endif
1702
1.61M
      xmlAddSibling(parent, ret);
1703
1.61M
  }
1704
37.8M
    }
1705
1706
39.1M
    if (!ctxt->html) {
1707
        /*
1708
         * Insert all the defaulted attributes from the DTD especially
1709
         * namespaces
1710
         */
1711
39.1M
        if ((ctxt->myDoc->intSubset != NULL) ||
1712
39.1M
            (ctxt->myDoc->extSubset != NULL)) {
1713
10.5M
            xmlCheckDefaultedAttributes(ctxt, name, prefix, atts);
1714
10.5M
        }
1715
1716
        /*
1717
         * process all the attributes whose name start with "xmlns"
1718
         */
1719
39.1M
        if (atts != NULL) {
1720
23.1M
            i = 0;
1721
23.1M
            att = atts[i++];
1722
23.1M
            value = atts[i++];
1723
61.2M
      while ((att != NULL) && (value != NULL)) {
1724
38.0M
    if ((att[0] == 'x') && (att[1] == 'm') && (att[2] == 'l') &&
1725
38.0M
        (att[3] == 'n') && (att[4] == 's'))
1726
4.14M
        xmlSAX2AttributeInternal(ctxt, att, value, prefix);
1727
1728
38.0M
    att = atts[i++];
1729
38.0M
    value = atts[i++];
1730
38.0M
      }
1731
23.1M
        }
1732
1733
        /*
1734
         * Search the namespace, note that since the attributes have been
1735
         * processed, the local namespaces are available.
1736
         */
1737
39.1M
        ns = xmlSearchNs(ctxt->myDoc, ret, prefix);
1738
39.1M
        if ((ns == NULL) && (parent != NULL))
1739
30.9M
            ns = xmlSearchNs(ctxt->myDoc, parent, prefix);
1740
39.1M
        if ((prefix != NULL) && (ns == NULL)) {
1741
8.40M
            ns = xmlNewNs(ret, NULL, prefix);
1742
8.40M
            xmlNsWarnMsg(ctxt, XML_NS_ERR_UNDEFINED_NAMESPACE,
1743
8.40M
                         "Namespace prefix %s is not defined\n",
1744
8.40M
                         prefix, NULL);
1745
8.40M
        }
1746
1747
        /*
1748
         * set the namespace node, making sure that if the default namespace
1749
         * is unbound on a parent we simply keep it NULL
1750
         */
1751
39.1M
        if ((ns != NULL) && (ns->href != NULL) &&
1752
39.1M
            ((ns->href[0] != 0) || (ns->prefix != NULL)))
1753
6.92M
            xmlSetNs(ret, ns);
1754
39.1M
    }
1755
1756
    /*
1757
     * process all the other attributes
1758
     */
1759
39.1M
    if (atts != NULL) {
1760
23.1M
        i = 0;
1761
23.1M
  att = atts[i++];
1762
23.1M
  value = atts[i++];
1763
23.1M
  if (ctxt->html) {
1764
0
      while (att != NULL) {
1765
0
    xmlSAX2AttributeInternal(ctxt, att, value, NULL);
1766
0
    att = atts[i++];
1767
0
    value = atts[i++];
1768
0
      }
1769
23.1M
  } else {
1770
61.2M
      while ((att != NULL) && (value != NULL)) {
1771
38.0M
    if ((att[0] != 'x') || (att[1] != 'm') || (att[2] != 'l') ||
1772
38.0M
        (att[3] != 'n') || (att[4] != 's'))
1773
33.9M
        xmlSAX2AttributeInternal(ctxt, att, value, NULL);
1774
1775
    /*
1776
     * Next ones
1777
     */
1778
38.0M
    att = atts[i++];
1779
38.0M
    value = atts[i++];
1780
38.0M
      }
1781
23.1M
  }
1782
23.1M
    }
1783
1784
39.1M
#ifdef LIBXML_VALID_ENABLED
1785
    /*
1786
     * If it's the Document root, finish the DTD validation and
1787
     * check the document root element for validity
1788
     */
1789
39.1M
    if ((ctxt->validate) &&
1790
39.1M
        ((ctxt->vctxt.flags & XML_VCTXT_DTD_VALIDATED) == 0)) {
1791
474k
  int chk;
1792
1793
474k
  chk = xmlValidateDtdFinal(&ctxt->vctxt, ctxt->myDoc);
1794
474k
  if (chk <= 0)
1795
6.55k
      ctxt->valid = 0;
1796
474k
  if (chk < 0)
1797
0
      ctxt->wellFormed = 0;
1798
474k
  ctxt->valid &= xmlValidateRoot(&ctxt->vctxt, ctxt->myDoc);
1799
474k
  ctxt->vctxt.flags |= XML_VCTXT_DTD_VALIDATED;
1800
474k
    }
1801
39.1M
#endif /* LIBXML_VALID_ENABLED */
1802
1803
39.1M
    if (prefix != NULL)
1804
10.5M
  xmlFree(prefix);
1805
1806
39.1M
}
1807
1808
/**
1809
 * xmlSAX2EndElement:
1810
 * @ctx: the user data (XML parser context)
1811
 * @name:  The element name
1812
 *
1813
 * called when the end of an element has been detected.
1814
 */
1815
void
1816
xmlSAX2EndElement(void *ctx, const xmlChar *name ATTRIBUTE_UNUSED)
1817
25.2M
{
1818
25.2M
    xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
1819
25.2M
    xmlNodePtr cur;
1820
1821
25.2M
    if (ctx == NULL) return;
1822
25.2M
    cur = ctxt->node;
1823
#ifdef DEBUG_SAX
1824
    if (name == NULL)
1825
        xmlGenericError(xmlGenericErrorContext, "SAX.xmlSAX2EndElement(NULL)\n");
1826
    else
1827
  xmlGenericError(xmlGenericErrorContext, "SAX.xmlSAX2EndElement(%s)\n", name);
1828
#endif
1829
1830
    /* Capture end position and add node */
1831
25.2M
    if (cur != NULL && ctxt->record_info) {
1832
0
      ctxt->nodeInfo->end_pos = ctxt->input->cur - ctxt->input->base;
1833
0
      ctxt->nodeInfo->end_line = ctxt->input->line;
1834
0
      ctxt->nodeInfo->node = cur;
1835
0
      xmlParserAddNodeInfo(ctxt, ctxt->nodeInfo);
1836
0
    }
1837
25.2M
    ctxt->nodemem = -1;
1838
1839
25.2M
#ifdef LIBXML_VALID_ENABLED
1840
25.2M
    if (ctxt->validate && ctxt->wellFormed &&
1841
25.2M
        ctxt->myDoc && ctxt->myDoc->intSubset)
1842
1.16M
        ctxt->valid &= xmlValidateOneElement(&ctxt->vctxt, ctxt->myDoc,
1843
1.16M
               cur);
1844
25.2M
#endif /* LIBXML_VALID_ENABLED */
1845
1846
1847
    /*
1848
     * end of parsing of this node.
1849
     */
1850
#ifdef DEBUG_SAX_TREE
1851
    xmlGenericError(xmlGenericErrorContext, "popping(%s)\n", cur->name);
1852
#endif
1853
25.2M
    nodePop(ctxt);
1854
25.2M
}
1855
#endif /* LIBXML_SAX1_ENABLED || LIBXML_HTML_ENABLED || LIBXML_LEGACY_ENABLED */
1856
1857
/*
1858
 * xmlSAX2TextNode:
1859
 * @ctxt:  the parser context
1860
 * @str:  the input string
1861
 * @len: the string length
1862
 *
1863
 * Callback for a text node
1864
 *
1865
 * Returns the newly allocated string or NULL if not needed or error
1866
 */
1867
static xmlNodePtr
1868
314M
xmlSAX2TextNode(xmlParserCtxtPtr ctxt, const xmlChar *str, int len) {
1869
314M
    xmlNodePtr ret;
1870
314M
    const xmlChar *intern = NULL;
1871
1872
    /*
1873
     * Allocate
1874
     */
1875
314M
    if (ctxt->freeElems != NULL) {
1876
796k
  ret = ctxt->freeElems;
1877
796k
  ctxt->freeElems = ret->next;
1878
796k
  ctxt->freeElemsNr--;
1879
313M
    } else {
1880
313M
  ret = (xmlNodePtr) xmlMalloc(sizeof(xmlNode));
1881
313M
    }
1882
314M
    if (ret == NULL) {
1883
0
        xmlErrMemory(ctxt, "xmlSAX2Characters");
1884
0
  return(NULL);
1885
0
    }
1886
314M
    memset(ret, 0, sizeof(xmlNode));
1887
    /*
1888
     * intern the formatting blanks found between tags, or the
1889
     * very short strings
1890
     */
1891
314M
    if (ctxt->dictNames) {
1892
261M
        xmlChar cur = str[len];
1893
1894
261M
  if ((len < (int) (2 * sizeof(void *))) &&
1895
261M
      (ctxt->options & XML_PARSE_COMPACT)) {
1896
      /* store the string in the node overriding properties and nsDef */
1897
86.1M
      xmlChar *tmp = (xmlChar *) &(ret->properties);
1898
86.1M
      memcpy(tmp, str, len);
1899
86.1M
      tmp[len] = 0;
1900
86.1M
      intern = tmp;
1901
175M
  } else if ((len <= 3) && ((cur == '"') || (cur == '\'') ||
1902
37.4M
      ((cur == '<') && (str[len + 1] != '!')))) {
1903
33.9M
      intern = xmlDictLookup(ctxt->dict, str, len);
1904
141M
  } else if (IS_BLANK_CH(*str) && (len < 60) && (cur == '<') &&
1905
141M
             (str[len + 1] != '!')) {
1906
48.2M
      int i;
1907
1908
284M
      for (i = 1;i < len;i++) {
1909
238M
    if (!IS_BLANK_CH(str[i])) goto skip;
1910
238M
      }
1911
46.1M
      intern = xmlDictLookup(ctxt->dict, str, len);
1912
46.1M
  }
1913
261M
    }
1914
314M
skip:
1915
314M
    ret->type = XML_TEXT_NODE;
1916
1917
314M
    ret->name = xmlStringText;
1918
314M
    if (intern == NULL) {
1919
147M
  ret->content = xmlStrndup(str, len);
1920
147M
  if (ret->content == NULL) {
1921
0
      xmlSAX2ErrMemory(ctxt, "xmlSAX2TextNode");
1922
0
      xmlFree(ret);
1923
0
      return(NULL);
1924
0
  }
1925
147M
    } else
1926
166M
  ret->content = (xmlChar *) intern;
1927
1928
314M
    if (ctxt->linenumbers) {
1929
313M
  if (ctxt->input != NULL) {
1930
313M
      if ((unsigned) ctxt->input->line < (unsigned) USHRT_MAX)
1931
310M
    ret->line = ctxt->input->line;
1932
3.27M
      else {
1933
3.27M
          ret->line = USHRT_MAX;
1934
3.27M
    if (ctxt->options & XML_PARSE_BIG_LINES)
1935
1.05M
        ret->psvi = (void *) (ptrdiff_t) ctxt->input->line;
1936
3.27M
      }
1937
313M
  }
1938
313M
    }
1939
1940
314M
    if ((__xmlRegisterCallbacks) && (xmlRegisterNodeDefaultValue))
1941
0
  xmlRegisterNodeDefaultValue(ret);
1942
314M
    return(ret);
1943
314M
}
1944
1945
#ifdef LIBXML_VALID_ENABLED
1946
/*
1947
 * xmlSAX2DecodeAttrEntities:
1948
 * @ctxt:  the parser context
1949
 * @str:  the input string
1950
 * @len: the string length
1951
 *
1952
 * Remove the entities from an attribute value
1953
 *
1954
 * Returns the newly allocated string or NULL if not needed or error
1955
 */
1956
static xmlChar *
1957
xmlSAX2DecodeAttrEntities(xmlParserCtxtPtr ctxt, const xmlChar *str,
1958
1.42M
                          const xmlChar *end) {
1959
1.42M
    const xmlChar *in;
1960
1.42M
    xmlChar *ret;
1961
1962
1.42M
    in = str;
1963
273M
    while (in < end)
1964
271M
        if (*in++ == '&')
1965
48.3k
      goto decode;
1966
1.37M
    return(NULL);
1967
48.3k
decode:
1968
48.3k
    ctxt->depth++;
1969
48.3k
    ret = xmlStringLenDecodeEntities(ctxt, str, end - str,
1970
48.3k
             XML_SUBSTITUTE_REF, 0,0,0);
1971
48.3k
    ctxt->depth--;
1972
48.3k
    return(ret);
1973
1.42M
}
1974
#endif /* LIBXML_VALID_ENABLED */
1975
1976
/**
1977
 * xmlSAX2AttributeNs:
1978
 * @ctx: the user data (XML parser context)
1979
 * @localname:  the local name of the attribute
1980
 * @prefix:  the attribute namespace prefix if available
1981
 * @URI:  the attribute namespace name if available
1982
 * @value:  Start of the attribute value
1983
 * @valueend: end of the attribute value
1984
 *
1985
 * Handle an attribute that has been read by the parser.
1986
 * The default handling is to convert the attribute into an
1987
 * DOM subtree and past it in a new xmlAttr element added to
1988
 * the element.
1989
 */
1990
static void
1991
xmlSAX2AttributeNs(xmlParserCtxtPtr ctxt,
1992
                   const xmlChar * localname,
1993
                   const xmlChar * prefix,
1994
       const xmlChar * value,
1995
       const xmlChar * valueend)
1996
154M
{
1997
154M
    xmlAttrPtr ret;
1998
154M
    xmlNsPtr namespace = NULL;
1999
154M
    xmlChar *dup = NULL;
2000
2001
    /*
2002
     * Note: if prefix == NULL, the attribute is not in the default namespace
2003
     */
2004
154M
    if (prefix != NULL)
2005
3.43M
  namespace = xmlSearchNs(ctxt->myDoc, ctxt->node, prefix);
2006
2007
    /*
2008
     * allocate the node
2009
     */
2010
154M
    if (ctxt->freeAttrs != NULL) {
2011
1.53M
        ret = ctxt->freeAttrs;
2012
1.53M
  ctxt->freeAttrs = ret->next;
2013
1.53M
  ctxt->freeAttrsNr--;
2014
1.53M
  memset(ret, 0, sizeof(xmlAttr));
2015
1.53M
  ret->type = XML_ATTRIBUTE_NODE;
2016
2017
1.53M
  ret->parent = ctxt->node;
2018
1.53M
  ret->doc = ctxt->myDoc;
2019
1.53M
  ret->ns = namespace;
2020
2021
1.53M
  if (ctxt->dictNames)
2022
1.46M
      ret->name = localname;
2023
65.5k
  else
2024
65.5k
      ret->name = xmlStrdup(localname);
2025
2026
        /* link at the end to preserve order, TODO speed up with a last */
2027
1.53M
  if (ctxt->node->properties == NULL) {
2028
1.53M
      ctxt->node->properties = ret;
2029
1.53M
  } else {
2030
0
      xmlAttrPtr prev = ctxt->node->properties;
2031
2032
0
      while (prev->next != NULL) prev = prev->next;
2033
0
      prev->next = ret;
2034
0
      ret->prev = prev;
2035
0
  }
2036
2037
1.53M
  if ((__xmlRegisterCallbacks) && (xmlRegisterNodeDefaultValue))
2038
0
      xmlRegisterNodeDefaultValue((xmlNodePtr)ret);
2039
152M
    } else {
2040
152M
  if (ctxt->dictNames)
2041
133M
      ret = xmlNewNsPropEatName(ctxt->node, namespace,
2042
133M
                                (xmlChar *) localname, NULL);
2043
19.4M
  else
2044
19.4M
      ret = xmlNewNsProp(ctxt->node, namespace, localname, NULL);
2045
152M
  if (ret == NULL) {
2046
0
      xmlErrMemory(ctxt, "xmlSAX2AttributeNs");
2047
0
      return;
2048
0
  }
2049
152M
    }
2050
2051
154M
    if ((ctxt->replaceEntities == 0) && (!ctxt->html)) {
2052
29.0M
  xmlNodePtr tmp;
2053
2054
  /*
2055
   * We know that if there is an entity reference, then
2056
   * the string has been dup'ed and terminates with 0
2057
   * otherwise with ' or "
2058
   */
2059
29.0M
  if (*valueend != 0) {
2060
26.4M
      tmp = xmlSAX2TextNode(ctxt, value, valueend - value);
2061
26.4M
      ret->children = tmp;
2062
26.4M
      ret->last = tmp;
2063
26.4M
      if (tmp != NULL) {
2064
26.4M
    tmp->doc = ret->doc;
2065
26.4M
    tmp->parent = (xmlNodePtr) ret;
2066
26.4M
      }
2067
26.4M
  } else {
2068
2.56M
      ret->children = xmlStringLenGetNodeList(ctxt->myDoc, value,
2069
2.56M
                valueend - value);
2070
2.56M
      tmp = ret->children;
2071
6.41M
      while (tmp != NULL) {
2072
3.85M
          tmp->doc = ret->doc;
2073
3.85M
    tmp->parent = (xmlNodePtr) ret;
2074
3.85M
    if (tmp->next == NULL)
2075
2.56M
        ret->last = tmp;
2076
3.85M
    tmp = tmp->next;
2077
3.85M
      }
2078
2.56M
  }
2079
125M
    } else if (value != NULL) {
2080
125M
  xmlNodePtr tmp;
2081
2082
125M
  tmp = xmlSAX2TextNode(ctxt, value, valueend - value);
2083
125M
  ret->children = tmp;
2084
125M
  ret->last = tmp;
2085
125M
  if (tmp != NULL) {
2086
125M
      tmp->doc = ret->doc;
2087
125M
      tmp->parent = (xmlNodePtr) ret;
2088
125M
  }
2089
125M
    }
2090
2091
154M
#ifdef LIBXML_VALID_ENABLED
2092
154M
    if ((!ctxt->html) && ctxt->validate && ctxt->wellFormed &&
2093
154M
        ctxt->myDoc && ctxt->myDoc->intSubset) {
2094
  /*
2095
   * If we don't substitute entities, the validation should be
2096
   * done on a value with replaced entities anyway.
2097
   */
2098
2.17M
        if (!ctxt->replaceEntities) {
2099
1.42M
      dup = xmlSAX2DecodeAttrEntities(ctxt, value, valueend);
2100
1.42M
      if (dup == NULL) {
2101
1.37M
          if (*valueend == 0) {
2102
250k
        ctxt->valid &= xmlValidateOneAttribute(&ctxt->vctxt,
2103
250k
            ctxt->myDoc, ctxt->node, ret, value);
2104
1.12M
    } else {
2105
        /*
2106
         * That should already be normalized.
2107
         * cheaper to finally allocate here than duplicate
2108
         * entry points in the full validation code
2109
         */
2110
1.12M
        dup = xmlStrndup(value, valueend - value);
2111
2112
1.12M
        ctxt->valid &= xmlValidateOneAttribute(&ctxt->vctxt,
2113
1.12M
            ctxt->myDoc, ctxt->node, ret, dup);
2114
1.12M
    }
2115
1.37M
      } else {
2116
          /*
2117
     * dup now contains a string of the flattened attribute
2118
     * content with entities substituted. Check if we need to
2119
     * apply an extra layer of normalization.
2120
     * It need to be done twice ... it's an extra burden related
2121
     * to the ability to keep references in attributes
2122
     */
2123
48.3k
    if (ctxt->attsSpecial != NULL) {
2124
35.4k
        xmlChar *nvalnorm;
2125
35.4k
        xmlChar fn[50];
2126
35.4k
        xmlChar *fullname;
2127
2128
35.4k
        fullname = xmlBuildQName(localname, prefix, fn, 50);
2129
35.4k
        if (fullname != NULL) {
2130
35.4k
      ctxt->vctxt.valid = 1;
2131
35.4k
            nvalnorm = xmlValidCtxtNormalizeAttributeValue(
2132
35.4k
                       &ctxt->vctxt, ctxt->myDoc,
2133
35.4k
           ctxt->node, fullname, dup);
2134
35.4k
      if (ctxt->vctxt.valid != 1)
2135
0
          ctxt->valid = 0;
2136
2137
35.4k
      if ((fullname != fn) && (fullname != localname))
2138
0
          xmlFree(fullname);
2139
35.4k
      if (nvalnorm != NULL) {
2140
12.1k
          xmlFree(dup);
2141
12.1k
          dup = nvalnorm;
2142
12.1k
      }
2143
35.4k
        }
2144
35.4k
    }
2145
2146
48.3k
    ctxt->valid &= xmlValidateOneAttribute(&ctxt->vctxt,
2147
48.3k
              ctxt->myDoc, ctxt->node, ret, dup);
2148
48.3k
      }
2149
1.42M
  } else {
2150
      /*
2151
       * if entities already have been substituted, then
2152
       * the attribute as passed is already normalized
2153
       */
2154
750k
      dup = xmlStrndup(value, valueend - value);
2155
2156
750k
      ctxt->valid &= xmlValidateOneAttribute(&ctxt->vctxt,
2157
750k
                               ctxt->myDoc, ctxt->node, ret, dup);
2158
750k
  }
2159
2.17M
    } else
2160
152M
#endif /* LIBXML_VALID_ENABLED */
2161
152M
           if (((ctxt->loadsubset & XML_SKIP_IDS) == 0) &&
2162
152M
         (((ctxt->replaceEntities == 0) && (ctxt->external != 2)) ||
2163
152M
          ((ctxt->replaceEntities != 0) && (ctxt->inSubset == 0))) &&
2164
               /* Don't create IDs containing entity references */
2165
152M
               (ret->children != NULL) &&
2166
152M
               (ret->children->type == XML_TEXT_NODE) &&
2167
152M
               (ret->children->next == NULL)) {
2168
152M
        xmlChar *content = ret->children->content;
2169
        /*
2170
   * when validating, the ID registration is done at the attribute
2171
   * validation level. Otherwise we have to do specific handling here.
2172
   */
2173
152M
        if ((prefix == ctxt->str_xml) &&
2174
152M
             (localname[0] == 'i') && (localname[1] == 'd') &&
2175
152M
       (localname[2] == 0)) {
2176
      /*
2177
       * Add the xml:id value
2178
       *
2179
       * Open issue: normalization of the value.
2180
       */
2181
791k
#if defined(LIBXML_SAX1_ENABLED) || defined(LIBXML_HTML_ENABLED) || defined(LIBXML_WRITER_ENABLED) || defined(LIBXML_LEGACY_ENABLED)
2182
791k
#ifdef LIBXML_VALID_ENABLED
2183
791k
      if (xmlValidateNCName(content, 1) != 0) {
2184
440k
          xmlErrValid(ctxt, XML_DTD_XMLID_VALUE,
2185
440k
          "xml:id : attribute value %s is not an NCName\n",
2186
440k
          (const char *) content, NULL);
2187
440k
      }
2188
791k
#endif
2189
791k
#endif
2190
791k
      xmlAddID(&ctxt->vctxt, ctxt->myDoc, content, ret);
2191
151M
  } else if (xmlIsID(ctxt->myDoc, ctxt->node, ret)) {
2192
400k
      xmlAddID(&ctxt->vctxt, ctxt->myDoc, content, ret);
2193
150M
  } else if (xmlIsRef(ctxt->myDoc, ctxt->node, ret)) {
2194
717k
      xmlAddRef(&ctxt->vctxt, ctxt->myDoc, content, ret);
2195
717k
  }
2196
152M
    }
2197
154M
    if (dup != NULL)
2198
1.92M
  xmlFree(dup);
2199
154M
}
2200
2201
/**
2202
 * xmlSAX2StartElementNs:
2203
 * @ctx:  the user data (XML parser context)
2204
 * @localname:  the local name of the element
2205
 * @prefix:  the element namespace prefix if available
2206
 * @URI:  the element namespace name if available
2207
 * @nb_namespaces:  number of namespace definitions on that node
2208
 * @namespaces:  pointer to the array of prefix/URI pairs namespace definitions
2209
 * @nb_attributes:  the number of attributes on that node
2210
 * @nb_defaulted:  the number of defaulted attributes.
2211
 * @attributes:  pointer to the array of (localname/prefix/URI/value/end)
2212
 *               attribute values.
2213
 *
2214
 * SAX2 callback when an element start has been detected by the parser.
2215
 * It provides the namespace information for the element, as well as
2216
 * the new namespace declarations on the element.
2217
 */
2218
void
2219
xmlSAX2StartElementNs(void *ctx,
2220
                      const xmlChar *localname,
2221
          const xmlChar *prefix,
2222
          const xmlChar *URI,
2223
          int nb_namespaces,
2224
          const xmlChar **namespaces,
2225
          int nb_attributes,
2226
          int nb_defaulted,
2227
          const xmlChar **attributes)
2228
124M
{
2229
124M
    xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
2230
124M
    xmlNodePtr ret;
2231
124M
    xmlNodePtr parent;
2232
124M
    xmlNsPtr last = NULL, ns;
2233
124M
    const xmlChar *uri, *pref;
2234
124M
    xmlChar *lname = NULL;
2235
124M
    int i, j;
2236
2237
124M
    if (ctx == NULL) return;
2238
124M
    parent = ctxt->node;
2239
    /*
2240
     * First check on validity:
2241
     */
2242
124M
    if (ctxt->validate && (ctxt->myDoc->extSubset == NULL) &&
2243
124M
        ((ctxt->myDoc->intSubset == NULL) ||
2244
10.0M
   ((ctxt->myDoc->intSubset->notations == NULL) &&
2245
9.11M
    (ctxt->myDoc->intSubset->elements == NULL) &&
2246
9.11M
    (ctxt->myDoc->intSubset->attributes == NULL) &&
2247
9.11M
    (ctxt->myDoc->intSubset->entities == NULL)))) {
2248
1.01M
  xmlErrValid(ctxt, XML_DTD_NO_DTD,
2249
1.01M
    "Validation failed: no DTD found !", NULL, NULL);
2250
1.01M
  ctxt->validate = 0;
2251
1.01M
    }
2252
2253
    /*
2254
     * Take care of the rare case of an undefined namespace prefix
2255
     */
2256
124M
    if ((prefix != NULL) && (URI == NULL)) {
2257
15.6M
        if (ctxt->dictNames) {
2258
13.9M
      const xmlChar *fullname;
2259
2260
13.9M
      fullname = xmlDictQLookup(ctxt->dict, prefix, localname);
2261
13.9M
      if (fullname != NULL)
2262
13.9M
          localname = fullname;
2263
13.9M
  } else {
2264
1.71M
      lname = xmlBuildQName(localname, prefix, NULL, 0);
2265
1.71M
  }
2266
15.6M
    }
2267
    /*
2268
     * allocate the node
2269
     */
2270
124M
    if (ctxt->freeElems != NULL) {
2271
1.04M
        ret = ctxt->freeElems;
2272
1.04M
  ctxt->freeElems = ret->next;
2273
1.04M
  ctxt->freeElemsNr--;
2274
1.04M
  memset(ret, 0, sizeof(xmlNode));
2275
1.04M
        ret->doc = ctxt->myDoc;
2276
1.04M
  ret->type = XML_ELEMENT_NODE;
2277
2278
1.04M
  if (ctxt->dictNames)
2279
987k
      ret->name = localname;
2280
60.9k
  else {
2281
60.9k
      if (lname == NULL)
2282
58.9k
    ret->name = xmlStrdup(localname);
2283
2.01k
      else
2284
2.01k
          ret->name = lname;
2285
60.9k
      if (ret->name == NULL) {
2286
0
          xmlSAX2ErrMemory(ctxt, "xmlSAX2StartElementNs");
2287
0
    return;
2288
0
      }
2289
60.9k
  }
2290
1.04M
  if ((__xmlRegisterCallbacks) && (xmlRegisterNodeDefaultValue))
2291
0
      xmlRegisterNodeDefaultValue(ret);
2292
122M
    } else {
2293
122M
  if (ctxt->dictNames)
2294
105M
      ret = xmlNewDocNodeEatName(ctxt->myDoc, NULL,
2295
105M
                                 (xmlChar *) localname, NULL);
2296
17.7M
  else if (lname == NULL)
2297
16.0M
      ret = xmlNewDocNode(ctxt->myDoc, NULL, localname, NULL);
2298
1.71M
  else
2299
1.71M
      ret = xmlNewDocNodeEatName(ctxt->myDoc, NULL,
2300
1.71M
                                 (xmlChar *) lname, NULL);
2301
122M
  if (ret == NULL) {
2302
0
      xmlSAX2ErrMemory(ctxt, "xmlSAX2StartElementNs");
2303
0
      return;
2304
0
  }
2305
122M
    }
2306
124M
    if (ctxt->linenumbers) {
2307
123M
  if (ctxt->input != NULL) {
2308
123M
      if ((unsigned) ctxt->input->line < (unsigned) USHRT_MAX)
2309
122M
    ret->line = ctxt->input->line;
2310
1.14M
      else
2311
1.14M
          ret->line = USHRT_MAX;
2312
123M
  }
2313
123M
    }
2314
2315
124M
    if (parent == NULL) {
2316
11.0M
        xmlAddChild((xmlNodePtr) ctxt->myDoc, (xmlNodePtr) ret);
2317
11.0M
    }
2318
    /*
2319
     * Build the namespace list
2320
     */
2321
129M
    for (i = 0,j = 0;j < nb_namespaces;j++) {
2322
5.03M
        pref = namespaces[i++];
2323
5.03M
  uri = namespaces[i++];
2324
5.03M
  ns = xmlNewNs(NULL, uri, pref);
2325
5.03M
  if (ns != NULL) {
2326
5.03M
      if (last == NULL) {
2327
3.83M
          ret->nsDef = last = ns;
2328
3.83M
      } else {
2329
1.20M
          last->next = ns;
2330
1.20M
    last = ns;
2331
1.20M
      }
2332
5.03M
      if ((URI != NULL) && (prefix == pref))
2333
2.19M
    ret->ns = ns;
2334
5.03M
  } else {
2335
            /*
2336
             * any out of memory error would already have been raised
2337
             * but we can't be guaranteed it's the actual error due to the
2338
             * API, best is to skip in this case
2339
             */
2340
0
      continue;
2341
0
  }
2342
5.03M
#ifdef LIBXML_VALID_ENABLED
2343
5.03M
  if ((!ctxt->html) && ctxt->validate && ctxt->wellFormed &&
2344
5.03M
      ctxt->myDoc && ctxt->myDoc->intSubset) {
2345
123k
      ctxt->valid &= xmlValidateOneNamespace(&ctxt->vctxt, ctxt->myDoc,
2346
123k
                                             ret, prefix, ns, uri);
2347
123k
  }
2348
5.03M
#endif /* LIBXML_VALID_ENABLED */
2349
5.03M
    }
2350
124M
    ctxt->nodemem = -1;
2351
2352
    /*
2353
     * We are parsing a new node.
2354
     */
2355
124M
    if (nodePush(ctxt, ret) < 0) {
2356
687
        xmlUnlinkNode(ret);
2357
687
        xmlFreeNode(ret);
2358
687
        return;
2359
687
    }
2360
2361
    /*
2362
     * Link the child element
2363
     */
2364
124M
    if (parent != NULL) {
2365
112M
        if (parent->type == XML_ELEMENT_NODE) {
2366
112M
      xmlAddChild(parent, ret);
2367
112M
  } else {
2368
0
      xmlAddSibling(parent, ret);
2369
0
  }
2370
112M
    }
2371
2372
    /*
2373
     * Insert the defaulted attributes from the DTD only if requested:
2374
     */
2375
124M
    if ((nb_defaulted != 0) &&
2376
124M
        ((ctxt->loadsubset & XML_COMPLETE_ATTRS) == 0))
2377
268k
  nb_attributes -= nb_defaulted;
2378
2379
    /*
2380
     * Search the namespace if it wasn't already found
2381
     * Note that, if prefix is NULL, this searches for the default Ns
2382
     */
2383
124M
    if ((URI != NULL) && (ret->ns == NULL)) {
2384
12.3M
        ret->ns = xmlSearchNs(ctxt->myDoc, parent, prefix);
2385
12.3M
  if ((ret->ns == NULL) && (xmlStrEqual(prefix, BAD_CAST "xml"))) {
2386
37.7k
      ret->ns = xmlSearchNs(ctxt->myDoc, ret, prefix);
2387
37.7k
  }
2388
12.3M
  if (ret->ns == NULL) {
2389
6.77M
      ns = xmlNewNs(ret, NULL, prefix);
2390
6.77M
      if (ns == NULL) {
2391
2392
0
          xmlSAX2ErrMemory(ctxt, "xmlSAX2StartElementNs");
2393
0
    return;
2394
0
      }
2395
6.77M
            if (prefix != NULL)
2396
3.46M
                xmlNsWarnMsg(ctxt, XML_NS_ERR_UNDEFINED_NAMESPACE,
2397
3.46M
                             "Namespace prefix %s was not found\n",
2398
3.46M
                             prefix, NULL);
2399
3.31M
            else
2400
3.31M
                xmlNsWarnMsg(ctxt, XML_NS_ERR_UNDEFINED_NAMESPACE,
2401
3.31M
                             "Namespace default prefix was not found\n",
2402
3.31M
                             NULL, NULL);
2403
6.77M
  }
2404
12.3M
    }
2405
2406
    /*
2407
     * process all the other attributes
2408
     */
2409
124M
    if (nb_attributes > 0) {
2410
237M
        for (j = 0,i = 0;i < nb_attributes;i++,j+=5) {
2411
      /*
2412
       * Handle the rare case of an undefined attribute prefix
2413
       */
2414
154M
      if ((attributes[j+1] != NULL) && (attributes[j+2] == NULL)) {
2415
1.54M
    if (ctxt->dictNames) {
2416
1.12M
        const xmlChar *fullname;
2417
2418
1.12M
        fullname = xmlDictQLookup(ctxt->dict, attributes[j+1],
2419
1.12M
                                  attributes[j]);
2420
1.12M
        if (fullname != NULL) {
2421
1.12M
      xmlSAX2AttributeNs(ctxt, fullname, NULL,
2422
1.12M
                         attributes[j+3], attributes[j+4]);
2423
1.12M
            continue;
2424
1.12M
        }
2425
1.12M
    } else {
2426
413k
        lname = xmlBuildQName(attributes[j], attributes[j+1],
2427
413k
                              NULL, 0);
2428
413k
        if (lname != NULL) {
2429
413k
      xmlSAX2AttributeNs(ctxt, lname, NULL,
2430
413k
                         attributes[j+3], attributes[j+4]);
2431
413k
      xmlFree(lname);
2432
413k
            continue;
2433
413k
        }
2434
413k
    }
2435
1.54M
      }
2436
152M
      xmlSAX2AttributeNs(ctxt, attributes[j], attributes[j+1],
2437
152M
             attributes[j+3], attributes[j+4]);
2438
152M
  }
2439
83.4M
    }
2440
2441
124M
#ifdef LIBXML_VALID_ENABLED
2442
    /*
2443
     * If it's the Document root, finish the DTD validation and
2444
     * check the document root element for validity
2445
     */
2446
124M
    if ((ctxt->validate) &&
2447
124M
        ((ctxt->vctxt.flags & XML_VCTXT_DTD_VALIDATED) == 0)) {
2448
655k
  int chk;
2449
2450
655k
  chk = xmlValidateDtdFinal(&ctxt->vctxt, ctxt->myDoc);
2451
655k
  if (chk <= 0)
2452
9.08k
      ctxt->valid = 0;
2453
655k
  if (chk < 0)
2454
0
      ctxt->wellFormed = 0;
2455
655k
  ctxt->valid &= xmlValidateRoot(&ctxt->vctxt, ctxt->myDoc);
2456
655k
  ctxt->vctxt.flags |= XML_VCTXT_DTD_VALIDATED;
2457
655k
    }
2458
124M
#endif /* LIBXML_VALID_ENABLED */
2459
124M
}
2460
2461
/**
2462
 * xmlSAX2EndElementNs:
2463
 * @ctx:  the user data (XML parser context)
2464
 * @localname:  the local name of the element
2465
 * @prefix:  the element namespace prefix if available
2466
 * @URI:  the element namespace name if available
2467
 *
2468
 * SAX2 callback when an element end has been detected by the parser.
2469
 * It provides the namespace information for the element.
2470
 */
2471
void
2472
xmlSAX2EndElementNs(void *ctx,
2473
                    const xmlChar * localname ATTRIBUTE_UNUSED,
2474
                    const xmlChar * prefix ATTRIBUTE_UNUSED,
2475
        const xmlChar * URI ATTRIBUTE_UNUSED)
2476
103M
{
2477
103M
    xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
2478
103M
    xmlParserNodeInfo node_info;
2479
103M
    xmlNodePtr cur;
2480
2481
103M
    if (ctx == NULL) return;
2482
103M
    cur = ctxt->node;
2483
    /* Capture end position and add node */
2484
103M
    if ((ctxt->record_info) && (cur != NULL)) {
2485
0
        node_info.end_pos = ctxt->input->cur - ctxt->input->base;
2486
0
        node_info.end_line = ctxt->input->line;
2487
0
        node_info.node = cur;
2488
0
        xmlParserAddNodeInfo(ctxt, &node_info);
2489
0
    }
2490
103M
    ctxt->nodemem = -1;
2491
2492
103M
#ifdef LIBXML_VALID_ENABLED
2493
103M
    if (ctxt->validate && ctxt->wellFormed &&
2494
103M
        ctxt->myDoc && ctxt->myDoc->intSubset)
2495
1.73M
        ctxt->valid &= xmlValidateOneElement(&ctxt->vctxt, ctxt->myDoc, cur);
2496
103M
#endif /* LIBXML_VALID_ENABLED */
2497
2498
    /*
2499
     * end of parsing of this node.
2500
     */
2501
103M
    nodePop(ctxt);
2502
103M
}
2503
2504
/**
2505
 * xmlSAX2Reference:
2506
 * @ctx: the user data (XML parser context)
2507
 * @name:  The entity name
2508
 *
2509
 * called when an entity xmlSAX2Reference is detected.
2510
 */
2511
void
2512
xmlSAX2Reference(void *ctx, const xmlChar *name)
2513
3.05M
{
2514
3.05M
    xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
2515
3.05M
    xmlNodePtr ret;
2516
2517
3.05M
    if (ctx == NULL) return;
2518
#ifdef DEBUG_SAX
2519
    xmlGenericError(xmlGenericErrorContext,
2520
      "SAX.xmlSAX2Reference(%s)\n", name);
2521
#endif
2522
3.05M
    if (name[0] == '#')
2523
84.5k
  ret = xmlNewCharRef(ctxt->myDoc, name);
2524
2.97M
    else
2525
2.97M
  ret = xmlNewReference(ctxt->myDoc, name);
2526
#ifdef DEBUG_SAX_TREE
2527
    xmlGenericError(xmlGenericErrorContext,
2528
      "add xmlSAX2Reference %s to %s \n", name, ctxt->node->name);
2529
#endif
2530
3.05M
    if (xmlAddChild(ctxt->node, ret) == NULL) {
2531
345k
        xmlFreeNode(ret);
2532
345k
    }
2533
3.05M
}
2534
2535
/**
2536
 * xmlSAX2Text:
2537
 * @ctx: the user data (XML parser context)
2538
 * @ch:  a xmlChar string
2539
 * @len: the number of xmlChar
2540
 * @type: text or cdata
2541
 *
2542
 * Append characters.
2543
 */
2544
static void
2545
xmlSAX2Text(xmlParserCtxtPtr ctxt, const xmlChar *ch, int len,
2546
            xmlElementType type)
2547
314M
{
2548
314M
    xmlNodePtr lastChild;
2549
2550
314M
    if (ctxt == NULL) return;
2551
#ifdef DEBUG_SAX
2552
    xmlGenericError(xmlGenericErrorContext,
2553
      "SAX.xmlSAX2Characters(%.30s, %d)\n", ch, len);
2554
#endif
2555
    /*
2556
     * Handle the data if any. If there is no child
2557
     * add it as content, otherwise if the last child is text,
2558
     * concatenate it, else create a new node of type text.
2559
     */
2560
2561
314M
    if (ctxt->node == NULL) {
2562
#ifdef DEBUG_SAX_TREE
2563
  xmlGenericError(xmlGenericErrorContext,
2564
    "add chars: ctxt->node == NULL !\n");
2565
#endif
2566
48.5M
        return;
2567
48.5M
    }
2568
266M
    lastChild = ctxt->node->last;
2569
#ifdef DEBUG_SAX_TREE
2570
    xmlGenericError(xmlGenericErrorContext,
2571
      "add chars to %s \n", ctxt->node->name);
2572
#endif
2573
2574
    /*
2575
     * Here we needed an accelerator mechanism in case of very large
2576
     * elements. Use an attribute in the structure !!!
2577
     */
2578
266M
    if (lastChild == NULL) {
2579
38.0M
        if (type == XML_TEXT_NODE)
2580
37.8M
            lastChild = xmlSAX2TextNode(ctxt, ch, len);
2581
194k
        else
2582
194k
            lastChild = xmlNewCDataBlock(ctxt->myDoc, ch, len);
2583
38.0M
  if (lastChild != NULL) {
2584
38.0M
      ctxt->node->children = lastChild;
2585
38.0M
      ctxt->node->last = lastChild;
2586
38.0M
      lastChild->parent = ctxt->node;
2587
38.0M
      lastChild->doc = ctxt->node->doc;
2588
38.0M
      ctxt->nodelen = len;
2589
38.0M
      ctxt->nodemem = len + 1;
2590
38.0M
  } else {
2591
0
      xmlSAX2ErrMemory(ctxt, "xmlSAX2Characters");
2592
0
      return;
2593
0
  }
2594
228M
    } else {
2595
228M
  int coalesceText = (lastChild != NULL) &&
2596
228M
      (lastChild->type == type) &&
2597
228M
      ((type != XML_TEXT_NODE) ||
2598
103M
             (lastChild->name == xmlStringText));
2599
228M
  if ((coalesceText) && (ctxt->nodemem != 0)) {
2600
      /*
2601
       * The whole point of maintaining nodelen and nodemem,
2602
       * xmlTextConcat is too costly, i.e. compute length,
2603
       * reallocate a new buffer, move data, append ch. Here
2604
       * We try to minimize realloc() uses and avoid copying
2605
       * and recomputing length over and over.
2606
       */
2607
101M
      if (lastChild->content == (xmlChar *)&(lastChild->properties)) {
2608
4.72M
    lastChild->content = xmlStrdup(lastChild->content);
2609
4.72M
    lastChild->properties = NULL;
2610
97.0M
      } else if ((ctxt->nodemem == ctxt->nodelen + 1) &&
2611
97.0M
                 (xmlDictOwns(ctxt->dict, lastChild->content))) {
2612
48.3k
    lastChild->content = xmlStrdup(lastChild->content);
2613
48.3k
      }
2614
101M
      if (lastChild->content == NULL) {
2615
0
    xmlSAX2ErrMemory(ctxt, "xmlSAX2Characters: xmlStrdup returned NULL");
2616
0
    return;
2617
0
      }
2618
101M
      if (ctxt->nodelen > INT_MAX - len) {
2619
0
                xmlSAX2ErrMemory(ctxt, "xmlSAX2Characters overflow prevented");
2620
0
                return;
2621
0
      }
2622
101M
            if ((ctxt->nodelen + len > XML_MAX_TEXT_LENGTH) &&
2623
101M
                ((ctxt->options & XML_PARSE_HUGE) == 0)) {
2624
0
                xmlSAX2ErrMemory(ctxt, "xmlSAX2Characters: huge text node");
2625
0
                return;
2626
0
            }
2627
101M
      if (ctxt->nodelen + len >= ctxt->nodemem) {
2628
29.1M
    xmlChar *newbuf;
2629
29.1M
    int size;
2630
2631
29.1M
    size = ctxt->nodemem > INT_MAX - len ?
2632
0
                       INT_MAX :
2633
29.1M
                       ctxt->nodemem + len;
2634
29.1M
    size = size > INT_MAX / 2 ? INT_MAX : size * 2;
2635
29.1M
                newbuf = (xmlChar *) xmlRealloc(lastChild->content,size);
2636
29.1M
    if (newbuf == NULL) {
2637
0
        xmlSAX2ErrMemory(ctxt, "xmlSAX2Characters");
2638
0
        return;
2639
0
    }
2640
29.1M
    ctxt->nodemem = size;
2641
29.1M
    lastChild->content = newbuf;
2642
29.1M
      }
2643
101M
      memcpy(&lastChild->content[ctxt->nodelen], ch, len);
2644
101M
      ctxt->nodelen += len;
2645
101M
      lastChild->content[ctxt->nodelen] = 0;
2646
126M
  } else if (coalesceText) {
2647
1.77M
      if (xmlTextConcat(lastChild, ch, len)) {
2648
0
    xmlSAX2ErrMemory(ctxt, "xmlSAX2Characters");
2649
0
      }
2650
1.77M
      if (ctxt->node->children != NULL) {
2651
1.77M
    ctxt->nodelen = xmlStrlen(lastChild->content);
2652
1.77M
    ctxt->nodemem = ctxt->nodelen + 1;
2653
1.77M
      }
2654
124M
  } else {
2655
      /* Mixed content, first time */
2656
124M
            if (type == XML_TEXT_NODE) {
2657
124M
                lastChild = xmlSAX2TextNode(ctxt, ch, len);
2658
124M
                if (lastChild != NULL)
2659
124M
                    lastChild->doc = ctxt->myDoc;
2660
124M
            } else
2661
228k
                lastChild = xmlNewCDataBlock(ctxt->myDoc, ch, len);
2662
124M
      if (lastChild != NULL) {
2663
124M
    xmlAddChild(ctxt->node, lastChild);
2664
124M
    if (ctxt->node->children != NULL) {
2665
124M
        ctxt->nodelen = len;
2666
124M
        ctxt->nodemem = len + 1;
2667
124M
    }
2668
124M
      }
2669
124M
  }
2670
228M
    }
2671
266M
}
2672
2673
/**
2674
 * xmlSAX2Characters:
2675
 * @ctx: the user data (XML parser context)
2676
 * @ch:  a xmlChar string
2677
 * @len: the number of xmlChar
2678
 *
2679
 * receiving some chars from the parser.
2680
 */
2681
void
2682
xmlSAX2Characters(void *ctx, const xmlChar *ch, int len)
2683
313M
{
2684
313M
    xmlSAX2Text((xmlParserCtxtPtr) ctx, ch, len, XML_TEXT_NODE);
2685
313M
}
2686
2687
/**
2688
 * xmlSAX2IgnorableWhitespace:
2689
 * @ctx: the user data (XML parser context)
2690
 * @ch:  a xmlChar string
2691
 * @len: the number of xmlChar
2692
 *
2693
 * receiving some ignorable whitespaces from the parser.
2694
 * UNUSED: by default the DOM building will use xmlSAX2Characters
2695
 */
2696
void
2697
xmlSAX2IgnorableWhitespace(void *ctx ATTRIBUTE_UNUSED, const xmlChar *ch ATTRIBUTE_UNUSED, int len ATTRIBUTE_UNUSED)
2698
19.0M
{
2699
    /* xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx; */
2700
#ifdef DEBUG_SAX
2701
    xmlGenericError(xmlGenericErrorContext,
2702
      "SAX.xmlSAX2IgnorableWhitespace(%.30s, %d)\n", ch, len);
2703
#endif
2704
19.0M
}
2705
2706
/**
2707
 * xmlSAX2ProcessingInstruction:
2708
 * @ctx: the user data (XML parser context)
2709
 * @target:  the target name
2710
 * @data: the PI data's
2711
 *
2712
 * A processing instruction has been parsed.
2713
 */
2714
void
2715
xmlSAX2ProcessingInstruction(void *ctx, const xmlChar *target,
2716
                      const xmlChar *data)
2717
2.87M
{
2718
2.87M
    xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
2719
2.87M
    xmlNodePtr ret;
2720
2.87M
    xmlNodePtr parent;
2721
2722
2.87M
    if (ctx == NULL) return;
2723
2.87M
    parent = ctxt->node;
2724
#ifdef DEBUG_SAX
2725
    xmlGenericError(xmlGenericErrorContext,
2726
      "SAX.xmlSAX2ProcessingInstruction(%s, %s)\n", target, data);
2727
#endif
2728
2729
2.87M
    ret = xmlNewDocPI(ctxt->myDoc, target, data);
2730
2.87M
    if (ret == NULL) return;
2731
2732
2.87M
    if (ctxt->linenumbers) {
2733
2.86M
  if (ctxt->input != NULL) {
2734
2.86M
      if ((unsigned) ctxt->input->line < (unsigned) USHRT_MAX)
2735
2.84M
    ret->line = ctxt->input->line;
2736
17.6k
      else
2737
17.6k
          ret->line = USHRT_MAX;
2738
2.86M
  }
2739
2.86M
    }
2740
2.87M
    if (ctxt->inSubset == 1) {
2741
96.2k
  xmlAddChild((xmlNodePtr) ctxt->myDoc->intSubset, ret);
2742
96.2k
  return;
2743
2.78M
    } else if (ctxt->inSubset == 2) {
2744
35.1k
  xmlAddChild((xmlNodePtr) ctxt->myDoc->extSubset, ret);
2745
35.1k
  return;
2746
35.1k
    }
2747
2.74M
    if (parent == NULL) {
2748
#ifdef DEBUG_SAX_TREE
2749
      xmlGenericError(xmlGenericErrorContext,
2750
        "Setting PI %s as root\n", target);
2751
#endif
2752
1.36M
        xmlAddChild((xmlNodePtr) ctxt->myDoc, (xmlNodePtr) ret);
2753
1.36M
  return;
2754
1.36M
    }
2755
1.38M
    if (parent->type == XML_ELEMENT_NODE) {
2756
#ifdef DEBUG_SAX_TREE
2757
  xmlGenericError(xmlGenericErrorContext,
2758
    "adding PI %s child to %s\n", target, parent->name);
2759
#endif
2760
1.38M
  xmlAddChild(parent, ret);
2761
1.38M
    } else {
2762
#ifdef DEBUG_SAX_TREE
2763
  xmlGenericError(xmlGenericErrorContext,
2764
    "adding PI %s sibling to ", target);
2765
  xmlDebugDumpOneNode(stderr, parent, 0);
2766
#endif
2767
0
  xmlAddSibling(parent, ret);
2768
0
    }
2769
1.38M
}
2770
2771
/**
2772
 * xmlSAX2Comment:
2773
 * @ctx: the user data (XML parser context)
2774
 * @value:  the xmlSAX2Comment content
2775
 *
2776
 * A xmlSAX2Comment has been parsed.
2777
 */
2778
void
2779
xmlSAX2Comment(void *ctx, const xmlChar *value)
2780
275M
{
2781
275M
    xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
2782
275M
    xmlNodePtr ret;
2783
275M
    xmlNodePtr parent;
2784
2785
275M
    if (ctx == NULL) return;
2786
275M
    parent = ctxt->node;
2787
#ifdef DEBUG_SAX
2788
    xmlGenericError(xmlGenericErrorContext, "SAX.xmlSAX2Comment(%s)\n", value);
2789
#endif
2790
275M
    ret = xmlNewDocComment(ctxt->myDoc, value);
2791
275M
    if (ret == NULL) return;
2792
275M
    if (ctxt->linenumbers) {
2793
275M
  if (ctxt->input != NULL) {
2794
275M
      if ((unsigned) ctxt->input->line < (unsigned) USHRT_MAX)
2795
275M
    ret->line = ctxt->input->line;
2796
35.4k
      else
2797
35.4k
          ret->line = USHRT_MAX;
2798
275M
  }
2799
275M
    }
2800
2801
275M
    if (ctxt->inSubset == 1) {
2802
269M
  xmlAddChild((xmlNodePtr) ctxt->myDoc->intSubset, ret);
2803
269M
  return;
2804
269M
    } else if (ctxt->inSubset == 2) {
2805
1.53M
  xmlAddChild((xmlNodePtr) ctxt->myDoc->extSubset, ret);
2806
1.53M
  return;
2807
1.53M
    }
2808
3.90M
    if (parent == NULL) {
2809
#ifdef DEBUG_SAX_TREE
2810
      xmlGenericError(xmlGenericErrorContext,
2811
        "Setting xmlSAX2Comment as root\n");
2812
#endif
2813
1.32M
        xmlAddChild((xmlNodePtr) ctxt->myDoc, (xmlNodePtr) ret);
2814
1.32M
  return;
2815
1.32M
    }
2816
2.58M
    if (parent->type == XML_ELEMENT_NODE) {
2817
#ifdef DEBUG_SAX_TREE
2818
  xmlGenericError(xmlGenericErrorContext,
2819
    "adding xmlSAX2Comment child to %s\n", parent->name);
2820
#endif
2821
2.58M
  xmlAddChild(parent, ret);
2822
2.58M
    } else {
2823
#ifdef DEBUG_SAX_TREE
2824
  xmlGenericError(xmlGenericErrorContext,
2825
    "adding xmlSAX2Comment sibling to ");
2826
  xmlDebugDumpOneNode(stderr, parent, 0);
2827
#endif
2828
0
  xmlAddSibling(parent, ret);
2829
0
    }
2830
2.58M
}
2831
2832
/**
2833
 * xmlSAX2CDataBlock:
2834
 * @ctx: the user data (XML parser context)
2835
 * @value:  The pcdata content
2836
 * @len:  the block length
2837
 *
2838
 * called when a pcdata block has been parsed
2839
 */
2840
void
2841
xmlSAX2CDataBlock(void *ctx, const xmlChar *value, int len)
2842
1.10M
{
2843
1.10M
    xmlSAX2Text((xmlParserCtxtPtr) ctx, value, len, XML_CDATA_SECTION_NODE);
2844
1.10M
}
2845
2846
/*
 * SAX version used by xmlSAX2InitDefaultSAXHandler(); starts at 2 and is
 * changed through xmlSAXDefaultVersion() when SAX1 support is compiled in.
 */
static int xmlSAX2DefaultVersionValue = 2;
2847
2848
#ifdef LIBXML_SAX1_ENABLED
2849
/**
2850
 * xmlSAXDefaultVersion:
2851
 * @version:  the version, 1 or 2
2852
 *
2853
 * DEPRECATED: Use parser option XML_PARSE_SAX1.
2854
 *
2855
 * Set the default version of SAX used globally by the library.
2856
 * By default, during initialization the default is set to 2.
2857
 * Note that it is generally a better coding style to use
2858
 * xmlSAXVersion() to set up the version explicitly for a given
2859
 * parsing context.
2860
 *
2861
 * Returns the previous value in case of success and -1 in case of error.
2862
 */
2863
int
2864
xmlSAXDefaultVersion(int version)
2865
0
{
2866
0
    int ret = xmlSAX2DefaultVersionValue;
2867
2868
0
    if ((version != 1) && (version != 2))
2869
0
        return(-1);
2870
0
    xmlSAX2DefaultVersionValue = version;
2871
0
    return(ret);
2872
0
}
2873
#endif /* LIBXML_SAX1_ENABLED */
2874
2875
/**
2876
 * xmlSAXVersion:
2877
 * @hdlr:  the SAX handler
2878
 * @version:  the version, 1 or 2
2879
 *
2880
 * Initialize the default XML SAX handler according to the version
2881
 *
2882
 * Returns 0 in case of success and -1 in case of error.
2883
 */
2884
int
2885
xmlSAXVersion(xmlSAXHandler *hdlr, int version)
2886
15.0M
{
2887
15.0M
    if (hdlr == NULL) return(-1);
2888
15.0M
    if (version == 2) {
2889
15.0M
  hdlr->startElement = NULL;
2890
15.0M
  hdlr->endElement = NULL;
2891
15.0M
  hdlr->startElementNs = xmlSAX2StartElementNs;
2892
15.0M
  hdlr->endElementNs = xmlSAX2EndElementNs;
2893
15.0M
  hdlr->serror = NULL;
2894
15.0M
  hdlr->initialized = XML_SAX2_MAGIC;
2895
15.0M
#ifdef LIBXML_SAX1_ENABLED
2896
15.0M
    } else if (version == 1) {
2897
0
  hdlr->startElement = xmlSAX2StartElement;
2898
0
  hdlr->endElement = xmlSAX2EndElement;
2899
0
  hdlr->initialized = 1;
2900
0
#endif /* LIBXML_SAX1_ENABLED */
2901
0
    } else
2902
0
        return(-1);
2903
15.0M
    hdlr->internalSubset = xmlSAX2InternalSubset;
2904
15.0M
    hdlr->externalSubset = xmlSAX2ExternalSubset;
2905
15.0M
    hdlr->isStandalone = xmlSAX2IsStandalone;
2906
15.0M
    hdlr->hasInternalSubset = xmlSAX2HasInternalSubset;
2907
15.0M
    hdlr->hasExternalSubset = xmlSAX2HasExternalSubset;
2908
15.0M
    hdlr->resolveEntity = xmlSAX2ResolveEntity;
2909
15.0M
    hdlr->getEntity = xmlSAX2GetEntity;
2910
15.0M
    hdlr->getParameterEntity = xmlSAX2GetParameterEntity;
2911
15.0M
    hdlr->entityDecl = xmlSAX2EntityDecl;
2912
15.0M
    hdlr->attributeDecl = xmlSAX2AttributeDecl;
2913
15.0M
    hdlr->elementDecl = xmlSAX2ElementDecl;
2914
15.0M
    hdlr->notationDecl = xmlSAX2NotationDecl;
2915
15.0M
    hdlr->unparsedEntityDecl = xmlSAX2UnparsedEntityDecl;
2916
15.0M
    hdlr->setDocumentLocator = xmlSAX2SetDocumentLocator;
2917
15.0M
    hdlr->startDocument = xmlSAX2StartDocument;
2918
15.0M
    hdlr->endDocument = xmlSAX2EndDocument;
2919
15.0M
    hdlr->reference = xmlSAX2Reference;
2920
15.0M
    hdlr->characters = xmlSAX2Characters;
2921
15.0M
    hdlr->cdataBlock = xmlSAX2CDataBlock;
2922
15.0M
    hdlr->ignorableWhitespace = xmlSAX2Characters;
2923
15.0M
    hdlr->processingInstruction = xmlSAX2ProcessingInstruction;
2924
15.0M
    hdlr->comment = xmlSAX2Comment;
2925
15.0M
    hdlr->warning = xmlParserWarning;
2926
15.0M
    hdlr->error = xmlParserError;
2927
15.0M
    hdlr->fatalError = xmlParserError;
2928
2929
15.0M
    return(0);
2930
15.0M
}
2931
2932
/**
2933
 * xmlSAX2InitDefaultSAXHandler:
2934
 * @hdlr:  the SAX handler
2935
 * @warning:  flag if non-zero sets the handler warning procedure
2936
 *
2937
 * Initialize the default XML SAX2 handler
2938
 */
2939
void
2940
xmlSAX2InitDefaultSAXHandler(xmlSAXHandler *hdlr, int warning)
2941
0
{
2942
0
    if ((hdlr == NULL) || (hdlr->initialized != 0))
2943
0
  return;
2944
2945
0
    xmlSAXVersion(hdlr, xmlSAX2DefaultVersionValue);
2946
0
    if (warning == 0)
2947
0
  hdlr->warning = NULL;
2948
0
    else
2949
0
  hdlr->warning = xmlParserWarning;
2950
0
}
2951
2952
/**
 * xmlDefaultSAXHandlerInit:
 *
 * DEPRECATED: This function is a no-op. Call xmlInitParser to
 * initialize the library.
 *
 * Formerly initialized the default SAX2 handler.
 */
void
xmlDefaultSAXHandlerInit(void)
{
    /* Intentionally empty. */
    return;
}
2964
2965
#ifdef LIBXML_HTML_ENABLED
2966
2967
/**
2968
 * xmlSAX2InitHtmlDefaultSAXHandler:
2969
 * @hdlr:  the SAX handler
2970
 *
2971
 * Initialize the default HTML SAX2 handler
2972
 */
2973
void
2974
xmlSAX2InitHtmlDefaultSAXHandler(xmlSAXHandler *hdlr)
2975
0
{
2976
0
    if ((hdlr == NULL) || (hdlr->initialized != 0))
2977
0
  return;
2978
2979
0
    hdlr->internalSubset = xmlSAX2InternalSubset;
2980
0
    hdlr->externalSubset = NULL;
2981
0
    hdlr->isStandalone = NULL;
2982
0
    hdlr->hasInternalSubset = NULL;
2983
0
    hdlr->hasExternalSubset = NULL;
2984
0
    hdlr->resolveEntity = NULL;
2985
0
    hdlr->getEntity = xmlSAX2GetEntity;
2986
0
    hdlr->getParameterEntity = NULL;
2987
0
    hdlr->entityDecl = NULL;
2988
0
    hdlr->attributeDecl = NULL;
2989
0
    hdlr->elementDecl = NULL;
2990
0
    hdlr->notationDecl = NULL;
2991
0
    hdlr->unparsedEntityDecl = NULL;
2992
0
    hdlr->setDocumentLocator = xmlSAX2SetDocumentLocator;
2993
0
    hdlr->startDocument = xmlSAX2StartDocument;
2994
0
    hdlr->endDocument = xmlSAX2EndDocument;
2995
0
    hdlr->startElement = xmlSAX2StartElement;
2996
0
    hdlr->endElement = xmlSAX2EndElement;
2997
0
    hdlr->reference = NULL;
2998
0
    hdlr->characters = xmlSAX2Characters;
2999
0
    hdlr->cdataBlock = xmlSAX2CDataBlock;
3000
0
    hdlr->ignorableWhitespace = xmlSAX2IgnorableWhitespace;
3001
0
    hdlr->processingInstruction = xmlSAX2ProcessingInstruction;
3002
0
    hdlr->comment = xmlSAX2Comment;
3003
0
    hdlr->warning = xmlParserWarning;
3004
0
    hdlr->error = xmlParserError;
3005
0
    hdlr->fatalError = xmlParserError;
3006
3007
0
    hdlr->initialized = 1;
3008
0
}
3009
3010
/**
 * htmlDefaultSAXHandlerInit:
 *
 * DEPRECATED: This function is a no-op. Call xmlInitParser to
 * initialize the library.
 */
void
htmlDefaultSAXHandlerInit(void)
{
    /* Intentionally empty. */
    return;
}
3020
3021
#endif /* LIBXML_HTML_ENABLED */