Coverage Report

Created: 2024-08-17 06:44

/src/libxml2/SAX2.c
Line
Count
Source (jump to first uncovered line)
1
/*
2
 * SAX2.c : Default SAX2 handler to build a tree.
3
 *
4
 * See Copyright for the status of this software.
5
 *
6
 * Daniel Veillard <daniel@veillard.com>
7
 */
8
9
10
#define IN_LIBXML
11
#include "libxml.h"
12
#include <stdlib.h>
13
#include <string.h>
14
#include <limits.h>
15
#include <stddef.h>
16
#include <libxml/xmlmemory.h>
17
#include <libxml/tree.h>
18
#include <libxml/parser.h>
19
#include <libxml/parserInternals.h>
20
#include <libxml/valid.h>
21
#include <libxml/entities.h>
22
#include <libxml/xmlerror.h>
23
#include <libxml/debugXML.h>
24
#include <libxml/xmlIO.h>
25
#include <libxml/SAX.h>
26
#include <libxml/uri.h>
27
#include <libxml/valid.h>
28
#include <libxml/HTMLtree.h>
29
#include <libxml/globals.h>
30
31
#include "private/error.h"
32
#include "private/parser.h"
33
#include "private/tree.h"
34
35
/* #define DEBUG_SAX2 */
36
/* #define DEBUG_SAX2_TREE */
37
38
/**
 * TODO:
 *
 * Macro to flag unimplemented blocks: it reports the file and line of
 * the place where it is expanded through xmlGenericError(). The
 * expansion already ends with a semicolon.
 *
 * Pending item:
 * XML_CATALOG_PREFER user env to select between system/public preferred
 * option. C.f. Richard Tobin <richard@cogsci.ed.ac.uk>
 *> Just FYI, I am using an environment variable XML_CATALOG_PREFER with
 *> values "system" and "public".  I have made the default be "system" to
 *> match yours.
 */
#define TODO \
    xmlGenericError(xmlGenericErrorContext, \
                    "Unimplemented block at %s:%d\n", \
                    __FILE__, __LINE__);
52
53
/*
54
 * xmlSAX2ErrMemory:
55
 * @ctxt:  an XML validation parser context
56
 * @msg:   a string to accompany the error message
57
 */
58
static void LIBXML_ATTR_FORMAT(2,0)
59
0
xmlSAX2ErrMemory(xmlParserCtxtPtr ctxt, const char *msg) {
60
0
    xmlStructuredErrorFunc schannel = NULL;
61
0
    const char *str1 = "out of memory\n";
62
63
0
    if (ctxt != NULL) {
64
0
  ctxt->errNo = XML_ERR_NO_MEMORY;
65
0
  if ((ctxt->sax != NULL) && (ctxt->sax->initialized == XML_SAX2_MAGIC))
66
0
      schannel = ctxt->sax->serror;
67
0
  __xmlRaiseError(schannel,
68
0
      ctxt->vctxt.error, ctxt->vctxt.userData,
69
0
      ctxt, NULL, XML_FROM_PARSER, XML_ERR_NO_MEMORY,
70
0
      XML_ERR_ERROR, NULL, 0, (const char *) str1,
71
0
      NULL, NULL, 0, 0,
72
0
      msg, (const char *) str1, NULL);
73
0
  ctxt->errNo = XML_ERR_NO_MEMORY;
74
0
  ctxt->instate = XML_PARSER_EOF;
75
0
  ctxt->disableSAX = 1;
76
0
    } else {
77
0
  __xmlRaiseError(schannel,
78
0
      NULL, NULL,
79
0
      ctxt, NULL, XML_FROM_PARSER, XML_ERR_NO_MEMORY,
80
0
      XML_ERR_ERROR, NULL, 0, (const char *) str1,
81
0
      NULL, NULL, 0, 0,
82
0
      msg, (const char *) str1, NULL);
83
0
    }
84
0
}
85
86
/**
87
 * xmlValidError:
88
 * @ctxt:  an XML validation parser context
89
 * @error:  the error number
90
 * @msg:  the error message
91
 * @str1:  extra data
92
 * @str2:  extra data
93
 *
94
 * Handle a validation error
95
 */
96
static void LIBXML_ATTR_FORMAT(3,0)
97
xmlErrValid(xmlParserCtxtPtr ctxt, xmlParserErrors error,
98
            const char *msg, const char *str1, const char *str2)
99
756
{
100
756
    xmlStructuredErrorFunc schannel = NULL;
101
102
756
    if ((ctxt != NULL) && (ctxt->disableSAX != 0) &&
103
756
        (ctxt->instate == XML_PARSER_EOF))
104
0
  return;
105
756
    if (ctxt != NULL) {
106
756
  ctxt->errNo = error;
107
756
  if ((ctxt->sax != NULL) && (ctxt->sax->initialized == XML_SAX2_MAGIC))
108
195
      schannel = ctxt->sax->serror;
109
756
  __xmlRaiseError(schannel,
110
756
      ctxt->vctxt.error, ctxt->vctxt.userData,
111
756
      ctxt, NULL, XML_FROM_DTD, error,
112
756
      XML_ERR_ERROR, NULL, 0, (const char *) str1,
113
756
      (const char *) str2, NULL, 0, 0,
114
756
      msg, (const char *) str1, (const char *) str2);
115
756
  ctxt->valid = 0;
116
756
    } else {
117
0
  __xmlRaiseError(schannel,
118
0
      NULL, NULL,
119
0
      ctxt, NULL, XML_FROM_DTD, error,
120
0
      XML_ERR_ERROR, NULL, 0, (const char *) str1,
121
0
      (const char *) str2, NULL, 0, 0,
122
0
      msg, (const char *) str1, (const char *) str2);
123
0
    }
124
756
}
125
126
/**
127
 * xmlFatalErrMsg:
128
 * @ctxt:  an XML parser context
129
 * @error:  the error number
130
 * @msg:  the error message
131
 * @str1:  an error string
132
 * @str2:  an error string
133
 *
134
 * Handle a fatal parser error, i.e. violating Well-Formedness constraints
135
 */
136
static void LIBXML_ATTR_FORMAT(3,0)
137
xmlFatalErrMsg(xmlParserCtxtPtr ctxt, xmlParserErrors error,
138
               const char *msg, const xmlChar *str1, const xmlChar *str2)
139
0
{
140
0
    if ((ctxt != NULL) && (ctxt->disableSAX != 0) &&
141
0
        (ctxt->instate == XML_PARSER_EOF))
142
0
  return;
143
0
    if (ctxt != NULL)
144
0
  ctxt->errNo = error;
145
0
    __xmlRaiseError(NULL, NULL, NULL, ctxt, NULL, XML_FROM_PARSER, error,
146
0
                    XML_ERR_FATAL, NULL, 0,
147
0
        (const char *) str1, (const char *) str2,
148
0
        NULL, 0, 0, msg, str1, str2);
149
0
    if (ctxt != NULL) {
150
0
  ctxt->wellFormed = 0;
151
0
  ctxt->valid = 0;
152
0
  if (ctxt->recovery == 0)
153
0
      ctxt->disableSAX = 1;
154
0
    }
155
0
}
156
157
/**
158
 * xmlWarnMsg:
159
 * @ctxt:  an XML parser context
160
 * @error:  the error number
161
 * @msg:  the error message
162
 * @str1:  an error string
163
 * @str2:  an error string
164
 *
165
 * Handle a parser warning
166
 */
167
static void LIBXML_ATTR_FORMAT(3,0)
168
xmlWarnMsg(xmlParserCtxtPtr ctxt, xmlParserErrors error,
169
               const char *msg, const xmlChar *str1)
170
6
{
171
6
    if ((ctxt != NULL) && (ctxt->disableSAX != 0) &&
172
6
        (ctxt->instate == XML_PARSER_EOF))
173
0
  return;
174
6
    if (ctxt != NULL)
175
6
  ctxt->errNo = error;
176
6
    __xmlRaiseError(NULL, NULL, NULL, ctxt, NULL, XML_FROM_PARSER, error,
177
6
                    XML_ERR_WARNING, NULL, 0,
178
6
        (const char *) str1, NULL,
179
6
        NULL, 0, 0, msg, str1);
180
6
}
181
182
/**
183
 * xmlNsWarnMsg:
184
 * @ctxt:  an XML parser context
185
 * @error:  the error number
186
 * @msg:  the error message
187
 * @str1:  an error string
188
 *
189
 * Handle a namespace warning
190
 */
191
static void LIBXML_ATTR_FORMAT(3,0)
192
xmlNsWarnMsg(xmlParserCtxtPtr ctxt, xmlParserErrors error,
193
             const char *msg, const xmlChar *str1, const xmlChar *str2)
194
3.95k
{
195
3.95k
    if ((ctxt != NULL) && (ctxt->disableSAX != 0) &&
196
3.95k
        (ctxt->instate == XML_PARSER_EOF))
197
0
  return;
198
3.95k
    if (ctxt != NULL)
199
3.95k
  ctxt->errNo = error;
200
3.95k
    __xmlRaiseError(NULL, NULL, NULL, ctxt, NULL, XML_FROM_NAMESPACE, error,
201
3.95k
                    XML_ERR_WARNING, NULL, 0,
202
3.95k
        (const char *) str1, (const char *) str2,
203
3.95k
        NULL, 0, 0, msg, str1, str2);
204
3.95k
}
205
206
/**
207
 * xmlSAX2GetPublicId:
208
 * @ctx: the user data (XML parser context)
209
 *
210
 * Provides the public ID e.g. "-//SGMLSOURCE//DTD DEMO//EN"
211
 *
212
 * Returns a xmlChar *
213
 */
214
const xmlChar *
215
xmlSAX2GetPublicId(void *ctx ATTRIBUTE_UNUSED)
216
0
{
217
    /* xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx; */
218
0
    return(NULL);
219
0
}
220
221
/**
222
 * xmlSAX2GetSystemId:
223
 * @ctx: the user data (XML parser context)
224
 *
225
 * Provides the system ID, basically URL or filename e.g.
226
 * http://www.sgmlsource.com/dtds/memo.dtd
227
 *
228
 * Returns a xmlChar *
229
 */
230
const xmlChar *
231
xmlSAX2GetSystemId(void *ctx)
232
0
{
233
0
    xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
234
0
    if ((ctx == NULL) || (ctxt->input == NULL)) return(NULL);
235
0
    return((const xmlChar *) ctxt->input->filename);
236
0
}
237
238
/**
239
 * xmlSAX2GetLineNumber:
240
 * @ctx: the user data (XML parser context)
241
 *
242
 * Provide the line number of the current parsing point.
243
 *
244
 * Returns an int
245
 */
246
int
247
xmlSAX2GetLineNumber(void *ctx)
248
0
{
249
0
    xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
250
0
    if ((ctx == NULL) || (ctxt->input == NULL)) return(0);
251
0
    return(ctxt->input->line);
252
0
}
253
254
/**
255
 * xmlSAX2GetColumnNumber:
256
 * @ctx: the user data (XML parser context)
257
 *
258
 * Provide the column number of the current parsing point.
259
 *
260
 * Returns an int
261
 */
262
int
263
xmlSAX2GetColumnNumber(void *ctx)
264
0
{
265
0
    xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
266
0
    if ((ctx == NULL) || (ctxt->input == NULL)) return(0);
267
0
    return(ctxt->input->col);
268
0
}
269
270
/**
271
 * xmlSAX2IsStandalone:
272
 * @ctx: the user data (XML parser context)
273
 *
274
 * Is this document tagged standalone ?
275
 *
276
 * Returns 1 if true
277
 */
278
int
279
xmlSAX2IsStandalone(void *ctx)
280
0
{
281
0
    xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
282
0
    if ((ctx == NULL) || (ctxt->myDoc == NULL)) return(0);
283
0
    return(ctxt->myDoc->standalone == 1);
284
0
}
285
286
/**
287
 * xmlSAX2HasInternalSubset:
288
 * @ctx: the user data (XML parser context)
289
 *
290
 * Does this document has an internal subset
291
 *
292
 * Returns 1 if true
293
 */
294
int
295
xmlSAX2HasInternalSubset(void *ctx)
296
0
{
297
0
    xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
298
0
    if ((ctxt == NULL) || (ctxt->myDoc == NULL)) return(0);
299
0
    return(ctxt->myDoc->intSubset != NULL);
300
0
}
301
302
/**
303
 * xmlSAX2HasExternalSubset:
304
 * @ctx: the user data (XML parser context)
305
 *
306
 * Does this document has an external subset
307
 *
308
 * Returns 1 if true
309
 */
310
int
311
xmlSAX2HasExternalSubset(void *ctx)
312
0
{
313
0
    xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
314
0
    if ((ctxt == NULL) || (ctxt->myDoc == NULL)) return(0);
315
0
    return(ctxt->myDoc->extSubset != NULL);
316
0
}
317
318
/**
319
 * xmlSAX2InternalSubset:
320
 * @ctx:  the user data (XML parser context)
321
 * @name:  the root element name
322
 * @ExternalID:  the external ID
323
 * @SystemID:  the SYSTEM ID (e.g. filename or URL)
324
 *
325
 * Callback on internal subset declaration.
326
 */
327
void
328
xmlSAX2InternalSubset(void *ctx, const xmlChar *name,
329
         const xmlChar *ExternalID, const xmlChar *SystemID)
330
7.64k
{
331
7.64k
    xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
332
7.64k
    xmlDtdPtr dtd;
333
7.64k
    if (ctx == NULL) return;
334
#ifdef DEBUG_SAX
335
    xmlGenericError(xmlGenericErrorContext,
336
      "SAX.xmlSAX2InternalSubset(%s, %s, %s)\n",
337
            name, ExternalID, SystemID);
338
#endif
339
340
7.64k
    if (ctxt->myDoc == NULL)
341
0
  return;
342
7.64k
    dtd = xmlGetIntSubset(ctxt->myDoc);
343
7.64k
    if (dtd != NULL) {
344
0
  if (ctxt->html)
345
0
      return;
346
0
  xmlUnlinkNode((xmlNodePtr) dtd);
347
0
  xmlFreeDtd(dtd);
348
0
  ctxt->myDoc->intSubset = NULL;
349
0
    }
350
7.64k
    ctxt->myDoc->intSubset =
351
7.64k
  xmlCreateIntSubset(ctxt->myDoc, name, ExternalID, SystemID);
352
7.64k
    if (ctxt->myDoc->intSubset == NULL)
353
0
        xmlSAX2ErrMemory(ctxt, "xmlSAX2InternalSubset");
354
7.64k
}
355
356
/**
357
 * xmlSAX2ExternalSubset:
358
 * @ctx: the user data (XML parser context)
359
 * @name:  the root element name
360
 * @ExternalID:  the external ID
361
 * @SystemID:  the SYSTEM ID (e.g. filename or URL)
362
 *
363
 * Callback on external subset declaration.
364
 */
365
void
366
xmlSAX2ExternalSubset(void *ctx, const xmlChar *name,
367
         const xmlChar *ExternalID, const xmlChar *SystemID)
368
5.97k
{
369
5.97k
    xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
370
5.97k
    if (ctx == NULL) return;
371
#ifdef DEBUG_SAX
372
    xmlGenericError(xmlGenericErrorContext,
373
      "SAX.xmlSAX2ExternalSubset(%s, %s, %s)\n",
374
            name, ExternalID, SystemID);
375
#endif
376
5.97k
    if (((ExternalID != NULL) || (SystemID != NULL)) &&
377
5.97k
        (((ctxt->validate) || (ctxt->loadsubset != 0)) &&
378
4.34k
   (ctxt->wellFormed && ctxt->myDoc))) {
379
  /*
380
   * Try to fetch and parse the external subset.
381
   */
382
3.33k
  xmlParserInputPtr oldinput;
383
3.33k
  int oldinputNr;
384
3.33k
  int oldinputMax;
385
3.33k
  xmlParserInputPtr *oldinputTab;
386
3.33k
  xmlParserInputPtr input = NULL;
387
3.33k
  xmlCharEncoding enc;
388
3.33k
  int oldcharset;
389
3.33k
  const xmlChar *oldencoding;
390
3.33k
  int oldprogressive;
391
3.33k
        unsigned long consumed;
392
3.33k
        size_t buffered;
393
394
  /*
395
   * Ask the Entity resolver to load the damn thing
396
   */
397
3.33k
  if ((ctxt->sax != NULL) && (ctxt->sax->resolveEntity != NULL))
398
3.33k
      input = ctxt->sax->resolveEntity(ctxt->userData, ExternalID,
399
3.33k
                                          SystemID);
400
3.33k
  if (input == NULL) {
401
1.06k
      return;
402
1.06k
  }
403
404
2.26k
  xmlNewDtd(ctxt->myDoc, name, ExternalID, SystemID);
405
406
  /*
407
   * make sure we won't destroy the main document context
408
   */
409
2.26k
  oldinput = ctxt->input;
410
2.26k
  oldinputNr = ctxt->inputNr;
411
2.26k
  oldinputMax = ctxt->inputMax;
412
2.26k
  oldinputTab = ctxt->inputTab;
413
2.26k
  oldcharset = ctxt->charset;
414
2.26k
  oldencoding = ctxt->encoding;
415
2.26k
        oldprogressive = ctxt->progressive;
416
2.26k
  ctxt->encoding = NULL;
417
2.26k
        ctxt->progressive = 0;
418
419
2.26k
  ctxt->inputTab = (xmlParserInputPtr *)
420
2.26k
                   xmlMalloc(5 * sizeof(xmlParserInputPtr));
421
2.26k
  if (ctxt->inputTab == NULL) {
422
0
      xmlSAX2ErrMemory(ctxt, "xmlSAX2ExternalSubset");
423
0
            xmlFreeInputStream(input);
424
0
      ctxt->input = oldinput;
425
0
      ctxt->inputNr = oldinputNr;
426
0
      ctxt->inputMax = oldinputMax;
427
0
      ctxt->inputTab = oldinputTab;
428
0
      ctxt->charset = oldcharset;
429
0
      ctxt->encoding = oldencoding;
430
0
            ctxt->progressive = oldprogressive;
431
0
      return;
432
0
  }
433
2.26k
  ctxt->inputNr = 0;
434
2.26k
  ctxt->inputMax = 5;
435
2.26k
  ctxt->input = NULL;
436
2.26k
  xmlPushInput(ctxt, input);
437
438
  /*
439
   * On the fly encoding conversion if needed
440
   */
441
2.26k
  if (ctxt->input->length >= 4) {
442
0
      enc = xmlDetectCharEncoding(ctxt->input->cur, 4);
443
0
      xmlSwitchEncoding(ctxt, enc);
444
0
  }
445
446
2.26k
  if (input->filename == NULL)
447
2.26k
      input->filename = (char *) xmlCanonicPath(SystemID);
448
2.26k
  input->line = 1;
449
2.26k
  input->col = 1;
450
2.26k
  input->base = ctxt->input->cur;
451
2.26k
  input->cur = ctxt->input->cur;
452
2.26k
  input->free = NULL;
453
454
  /*
455
   * let's parse that entity knowing it's an external subset.
456
   */
457
2.26k
  xmlParseExternalSubset(ctxt, ExternalID, SystemID);
458
459
        /*
460
   * Free up the external entities
461
   */
462
463
2.26k
  while (ctxt->inputNr > 1)
464
0
      xmlPopInput(ctxt);
465
466
2.26k
        consumed = ctxt->input->consumed;
467
2.26k
        buffered = ctxt->input->cur - ctxt->input->base;
468
2.26k
        if (buffered > ULONG_MAX - consumed)
469
0
            consumed = ULONG_MAX;
470
2.26k
        else
471
2.26k
            consumed += buffered;
472
2.26k
        if (consumed > ULONG_MAX - ctxt->sizeentities)
473
0
            ctxt->sizeentities = ULONG_MAX;
474
2.26k
        else
475
2.26k
            ctxt->sizeentities += consumed;
476
477
2.26k
  xmlFreeInputStream(ctxt->input);
478
2.26k
        xmlFree(ctxt->inputTab);
479
480
  /*
481
   * Restore the parsing context of the main entity
482
   */
483
2.26k
  ctxt->input = oldinput;
484
2.26k
  ctxt->inputNr = oldinputNr;
485
2.26k
  ctxt->inputMax = oldinputMax;
486
2.26k
  ctxt->inputTab = oldinputTab;
487
2.26k
  ctxt->charset = oldcharset;
488
2.26k
  if ((ctxt->encoding != NULL) &&
489
2.26k
      ((ctxt->dict == NULL) ||
490
87
       (!xmlDictOwns(ctxt->dict, ctxt->encoding))))
491
87
      xmlFree((xmlChar *) ctxt->encoding);
492
2.26k
  ctxt->encoding = oldencoding;
493
2.26k
        ctxt->progressive = oldprogressive;
494
  /* ctxt->wellFormed = oldwellFormed; */
495
2.26k
    }
496
5.97k
}
497
498
/**
499
 * xmlSAX2ResolveEntity:
500
 * @ctx: the user data (XML parser context)
501
 * @publicId: The public ID of the entity
502
 * @systemId: The system ID of the entity
503
 *
504
 * The entity loader, to control the loading of external entities,
505
 * the application can either:
506
 *    - override this xmlSAX2ResolveEntity() callback in the SAX block
507
 *    - or better use the xmlSetExternalEntityLoader() function to
508
 *      set up it's own entity resolution routine
509
 *
510
 * Returns the xmlParserInputPtr if inlined or NULL for DOM behaviour.
511
 */
512
xmlParserInputPtr
513
xmlSAX2ResolveEntity(void *ctx, const xmlChar *publicId, const xmlChar *systemId)
514
3.33k
{
515
3.33k
    xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
516
3.33k
    xmlParserInputPtr ret;
517
3.33k
    xmlChar *URI;
518
3.33k
    const char *base = NULL;
519
520
3.33k
    if (ctx == NULL) return(NULL);
521
3.33k
    if (ctxt->input != NULL)
522
3.33k
  base = ctxt->input->filename;
523
3.33k
    if (base == NULL)
524
1.11k
  base = ctxt->directory;
525
526
3.33k
    URI = xmlBuildURI(systemId, (const xmlChar *) base);
527
528
#ifdef DEBUG_SAX
529
    xmlGenericError(xmlGenericErrorContext,
530
      "SAX.xmlSAX2ResolveEntity(%s, %s)\n", publicId, systemId);
531
#endif
532
533
3.33k
    ret = xmlLoadExternalEntity((const char *) URI,
534
3.33k
        (const char *) publicId, ctxt);
535
3.33k
    if (URI != NULL)
536
3.31k
  xmlFree(URI);
537
3.33k
    return(ret);
538
3.33k
}
539
540
/**
541
 * xmlSAX2GetEntity:
542
 * @ctx: the user data (XML parser context)
543
 * @name: The entity name
544
 *
545
 * Get an entity by name
546
 *
547
 * Returns the xmlEntityPtr if found.
548
 */
549
xmlEntityPtr
550
xmlSAX2GetEntity(void *ctx, const xmlChar *name)
551
3.25M
{
552
3.25M
    xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
553
3.25M
    xmlEntityPtr ret = NULL;
554
555
3.25M
    if (ctx == NULL) return(NULL);
556
#ifdef DEBUG_SAX
557
    xmlGenericError(xmlGenericErrorContext,
558
      "SAX.xmlSAX2GetEntity(%s)\n", name);
559
#endif
560
561
3.25M
    if (ctxt->inSubset == 0) {
562
3.17M
  ret = xmlGetPredefinedEntity(name);
563
3.17M
  if (ret != NULL)
564
14.3k
      return(ret);
565
3.17M
    }
566
3.24M
    if ((ctxt->myDoc != NULL) && (ctxt->myDoc->standalone == 1)) {
567
102
  if (ctxt->inSubset == 2) {
568
0
      ctxt->myDoc->standalone = 0;
569
0
      ret = xmlGetDocEntity(ctxt->myDoc, name);
570
0
      ctxt->myDoc->standalone = 1;
571
102
  } else {
572
102
      ret = xmlGetDocEntity(ctxt->myDoc, name);
573
102
      if (ret == NULL) {
574
0
    ctxt->myDoc->standalone = 0;
575
0
    ret = xmlGetDocEntity(ctxt->myDoc, name);
576
0
    if (ret != NULL) {
577
0
        xmlFatalErrMsg(ctxt, XML_ERR_NOT_STANDALONE,
578
0
   "Entity(%s) document marked standalone but requires external subset\n",
579
0
           name, NULL);
580
0
    }
581
0
    ctxt->myDoc->standalone = 1;
582
0
      }
583
102
  }
584
3.24M
    } else {
585
3.24M
  ret = xmlGetDocEntity(ctxt->myDoc, name);
586
3.24M
    }
587
3.24M
    return(ret);
588
3.25M
}
589
590
/**
591
 * xmlSAX2GetParameterEntity:
592
 * @ctx: the user data (XML parser context)
593
 * @name: The entity name
594
 *
595
 * Get a parameter entity by name
596
 *
597
 * Returns the xmlEntityPtr if found.
598
 */
599
xmlEntityPtr
600
xmlSAX2GetParameterEntity(void *ctx, const xmlChar *name)
601
2.28M
{
602
2.28M
    xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
603
2.28M
    xmlEntityPtr ret;
604
605
2.28M
    if (ctx == NULL) return(NULL);
606
#ifdef DEBUG_SAX
607
    xmlGenericError(xmlGenericErrorContext,
608
      "SAX.xmlSAX2GetParameterEntity(%s)\n", name);
609
#endif
610
611
2.28M
    ret = xmlGetParameterEntity(ctxt->myDoc, name);
612
2.28M
    return(ret);
613
2.28M
}
614
615
616
/**
617
 * xmlSAX2EntityDecl:
618
 * @ctx: the user data (XML parser context)
619
 * @name:  the entity name
620
 * @type:  the entity type
621
 * @publicId: The public ID of the entity
622
 * @systemId: The system ID of the entity
623
 * @content: the entity value (without processing).
624
 *
625
 * An entity definition has been parsed
626
 */
627
void
628
xmlSAX2EntityDecl(void *ctx, const xmlChar *name, int type,
629
          const xmlChar *publicId, const xmlChar *systemId, xmlChar *content)
630
164k
{
631
164k
    xmlEntityPtr ent;
632
164k
    xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
633
634
164k
    if (ctx == NULL) return;
635
#ifdef DEBUG_SAX
636
    xmlGenericError(xmlGenericErrorContext,
637
      "SAX.xmlSAX2EntityDecl(%s, %d, %s, %s, %s)\n",
638
            name, type, publicId, systemId, content);
639
#endif
640
164k
    if (ctxt->inSubset == 1) {
641
74.5k
  ent = xmlAddDocEntity(ctxt->myDoc, name, type, publicId,
642
74.5k
                  systemId, content);
643
74.5k
  if ((ent == NULL) && (ctxt->pedantic))
644
6
      xmlWarnMsg(ctxt, XML_WAR_ENTITY_REDEFINED,
645
6
       "Entity(%s) already defined in the internal subset\n",
646
6
                 name);
647
74.5k
  if ((ent != NULL) && (ent->URI == NULL) && (systemId != NULL)) {
648
1.63k
      xmlChar *URI;
649
1.63k
      const char *base = NULL;
650
651
1.63k
      if (ctxt->input != NULL)
652
1.63k
    base = ctxt->input->filename;
653
1.63k
      if (base == NULL)
654
541
    base = ctxt->directory;
655
656
1.63k
      URI = xmlBuildURI(systemId, (const xmlChar *) base);
657
1.63k
      ent->URI = URI;
658
1.63k
  }
659
89.9k
    } else if (ctxt->inSubset == 2) {
660
89.9k
  ent = xmlAddDtdEntity(ctxt->myDoc, name, type, publicId,
661
89.9k
                  systemId, content);
662
89.9k
  if ((ent == NULL) && (ctxt->pedantic) &&
663
89.9k
      (ctxt->sax != NULL) && (ctxt->sax->warning != NULL))
664
0
      ctxt->sax->warning(ctxt->userData,
665
0
       "Entity(%s) already defined in the external subset\n", name);
666
89.9k
  if ((ent != NULL) && (ent->URI == NULL) && (systemId != NULL)) {
667
21
      xmlChar *URI;
668
21
      const char *base = NULL;
669
670
21
      if (ctxt->input != NULL)
671
21
    base = ctxt->input->filename;
672
21
      if (base == NULL)
673
0
    base = ctxt->directory;
674
675
21
      URI = xmlBuildURI(systemId, (const xmlChar *) base);
676
21
      ent->URI = URI;
677
21
  }
678
89.9k
    } else {
679
0
  xmlFatalErrMsg(ctxt, XML_ERR_ENTITY_PROCESSING,
680
0
                 "SAX.xmlSAX2EntityDecl(%s) called while not in subset\n",
681
0
           name, NULL);
682
0
    }
683
164k
}
684
685
/**
686
 * xmlSAX2AttributeDecl:
687
 * @ctx: the user data (XML parser context)
688
 * @elem:  the name of the element
689
 * @fullname:  the attribute name
690
 * @type:  the attribute type
691
 * @def:  the type of default value
692
 * @defaultValue: the attribute default value
693
 * @tree:  the tree of enumerated value set
694
 *
695
 * An attribute definition has been parsed
696
 */
697
void
698
xmlSAX2AttributeDecl(void *ctx, const xmlChar *elem, const xmlChar *fullname,
699
              int type, int def, const xmlChar *defaultValue,
700
        xmlEnumerationPtr tree)
701
289k
{
702
289k
    xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
703
289k
    xmlAttributePtr attr;
704
289k
    xmlChar *name = NULL, *prefix = NULL;
705
706
    /* Avoid unused variable warning if features are disabled. */
707
289k
    (void) attr;
708
709
289k
    if ((ctxt == NULL) || (ctxt->myDoc == NULL))
710
0
        return;
711
712
#ifdef DEBUG_SAX
713
    xmlGenericError(xmlGenericErrorContext,
714
      "SAX.xmlSAX2AttributeDecl(%s, %s, %d, %d, %s, ...)\n",
715
            elem, fullname, type, def, defaultValue);
716
#endif
717
289k
    if ((xmlStrEqual(fullname, BAD_CAST "xml:id")) &&
718
289k
        (type != XML_ATTRIBUTE_ID)) {
719
  /*
720
   * Raise the error but keep the validity flag
721
   */
722
12
  int tmp = ctxt->valid;
723
12
  xmlErrValid(ctxt, XML_DTD_XMLID_TYPE,
724
12
        "xml:id : attribute type should be ID\n", NULL, NULL);
725
12
  ctxt->valid = tmp;
726
12
    }
727
    /* TODO: optimize name/prefix allocation */
728
289k
    name = xmlSplitQName(ctxt, fullname, &prefix);
729
289k
    ctxt->vctxt.valid = 1;
730
289k
    if (ctxt->inSubset == 1)
731
36.9k
  attr = xmlAddAttributeDecl(&ctxt->vctxt, ctxt->myDoc->intSubset, elem,
732
36.9k
         name, prefix, (xmlAttributeType) type,
733
36.9k
         (xmlAttributeDefault) def, defaultValue, tree);
734
253k
    else if (ctxt->inSubset == 2)
735
253k
  attr = xmlAddAttributeDecl(&ctxt->vctxt, ctxt->myDoc->extSubset, elem,
736
253k
     name, prefix, (xmlAttributeType) type,
737
253k
     (xmlAttributeDefault) def, defaultValue, tree);
738
0
    else {
739
0
        xmlFatalErrMsg(ctxt, XML_ERR_INTERNAL_ERROR,
740
0
       "SAX.xmlSAX2AttributeDecl(%s) called while not in subset\n",
741
0
                 name, NULL);
742
0
  xmlFree(name);
743
0
  xmlFreeEnumeration(tree);
744
0
  return;
745
0
    }
746
289k
#ifdef LIBXML_VALID_ENABLED
747
289k
    if (ctxt->vctxt.valid == 0)
748
87
  ctxt->valid = 0;
749
289k
    if ((attr != NULL) && (ctxt->validate) && (ctxt->wellFormed) &&
750
289k
        (ctxt->myDoc->intSubset != NULL))
751
9
  ctxt->valid &= xmlValidateAttributeDecl(&ctxt->vctxt, ctxt->myDoc,
752
9
                                          attr);
753
289k
#endif /* LIBXML_VALID_ENABLED */
754
289k
    if (prefix != NULL)
755
4.65k
  xmlFree(prefix);
756
289k
    if (name != NULL)
757
289k
  xmlFree(name);
758
289k
}
759
760
/**
761
 * xmlSAX2ElementDecl:
762
 * @ctx: the user data (XML parser context)
763
 * @name:  the element name
764
 * @type:  the element type
765
 * @content: the element value tree
766
 *
767
 * An element definition has been parsed
768
 */
769
void
770
xmlSAX2ElementDecl(void *ctx, const xmlChar * name, int type,
771
            xmlElementContentPtr content)
772
120k
{
773
120k
    xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
774
120k
    xmlElementPtr elem = NULL;
775
776
    /* Avoid unused variable warning if features are disabled. */
777
120k
    (void) elem;
778
779
120k
    if ((ctxt == NULL) || (ctxt->myDoc == NULL))
780
0
        return;
781
782
#ifdef DEBUG_SAX
783
    xmlGenericError(xmlGenericErrorContext,
784
                    "SAX.xmlSAX2ElementDecl(%s, %d, ...)\n", name, type);
785
#endif
786
787
120k
    if (ctxt->inSubset == 1)
788
13.5k
        elem = xmlAddElementDecl(&ctxt->vctxt, ctxt->myDoc->intSubset,
789
13.5k
                                 name, (xmlElementTypeVal) type, content);
790
107k
    else if (ctxt->inSubset == 2)
791
107k
        elem = xmlAddElementDecl(&ctxt->vctxt, ctxt->myDoc->extSubset,
792
107k
                                 name, (xmlElementTypeVal) type, content);
793
0
    else {
794
0
        xmlFatalErrMsg(ctxt, XML_ERR_INTERNAL_ERROR,
795
0
       "SAX.xmlSAX2ElementDecl(%s) called while not in subset\n",
796
0
                 name, NULL);
797
0
        return;
798
0
    }
799
120k
#ifdef LIBXML_VALID_ENABLED
800
120k
    if (elem == NULL)
801
12
        ctxt->valid = 0;
802
120k
    if (ctxt->validate && ctxt->wellFormed &&
803
120k
        ctxt->myDoc && ctxt->myDoc->intSubset)
804
84
        ctxt->valid &=
805
84
            xmlValidateElementDecl(&ctxt->vctxt, ctxt->myDoc, elem);
806
120k
#endif /* LIBXML_VALID_ENABLED */
807
120k
}
808
809
/**
810
 * xmlSAX2NotationDecl:
811
 * @ctx: the user data (XML parser context)
812
 * @name: The name of the notation
813
 * @publicId: The public ID of the entity
814
 * @systemId: The system ID of the entity
815
 *
816
 * What to do when a notation declaration has been parsed.
817
 */
818
void
819
xmlSAX2NotationDecl(void *ctx, const xmlChar *name,
820
       const xmlChar *publicId, const xmlChar *systemId)
821
0
{
822
0
    xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
823
0
    xmlNotationPtr nota = NULL;
824
825
    /* Avoid unused variable warning if features are disabled. */
826
0
    (void) nota;
827
828
0
    if ((ctxt == NULL) || (ctxt->myDoc == NULL))
829
0
        return;
830
831
#ifdef DEBUG_SAX
832
    xmlGenericError(xmlGenericErrorContext,
833
      "SAX.xmlSAX2NotationDecl(%s, %s, %s)\n", name, publicId, systemId);
834
#endif
835
836
0
    if ((publicId == NULL) && (systemId == NULL)) {
837
0
  xmlFatalErrMsg(ctxt, XML_ERR_NOTATION_PROCESSING,
838
0
       "SAX.xmlSAX2NotationDecl(%s) externalID or PublicID missing\n",
839
0
                 name, NULL);
840
0
  return;
841
0
    } else if (ctxt->inSubset == 1)
842
0
  nota = xmlAddNotationDecl(&ctxt->vctxt, ctxt->myDoc->intSubset, name,
843
0
                              publicId, systemId);
844
0
    else if (ctxt->inSubset == 2)
845
0
  nota = xmlAddNotationDecl(&ctxt->vctxt, ctxt->myDoc->extSubset, name,
846
0
                              publicId, systemId);
847
0
    else {
848
0
  xmlFatalErrMsg(ctxt, XML_ERR_NOTATION_PROCESSING,
849
0
       "SAX.xmlSAX2NotationDecl(%s) called while not in subset\n",
850
0
                 name, NULL);
851
0
  return;
852
0
    }
853
0
#ifdef LIBXML_VALID_ENABLED
854
0
    if (nota == NULL) ctxt->valid = 0;
855
0
    if ((ctxt->validate) && (ctxt->wellFormed) &&
856
0
        (ctxt->myDoc->intSubset != NULL))
857
0
  ctxt->valid &= xmlValidateNotationDecl(&ctxt->vctxt, ctxt->myDoc,
858
0
                                         nota);
859
0
#endif /* LIBXML_VALID_ENABLED */
860
0
}
861
862
/**
863
 * xmlSAX2UnparsedEntityDecl:
864
 * @ctx: the user data (XML parser context)
865
 * @name: The name of the entity
866
 * @publicId: The public ID of the entity
867
 * @systemId: The system ID of the entity
868
 * @notationName: the name of the notation
869
 *
870
 * What to do when an unparsed entity declaration is parsed
871
 */
872
void
873
xmlSAX2UnparsedEntityDecl(void *ctx, const xmlChar *name,
874
       const xmlChar *publicId, const xmlChar *systemId,
875
       const xmlChar *notationName)
876
18
{
877
18
    xmlEntityPtr ent;
878
18
    xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
879
18
    if (ctx == NULL) return;
880
#ifdef DEBUG_SAX
881
    xmlGenericError(xmlGenericErrorContext,
882
      "SAX.xmlSAX2UnparsedEntityDecl(%s, %s, %s, %s)\n",
883
            name, publicId, systemId, notationName);
884
#endif
885
18
    if (ctxt->inSubset == 1) {
886
18
  ent = xmlAddDocEntity(ctxt->myDoc, name,
887
18
      XML_EXTERNAL_GENERAL_UNPARSED_ENTITY,
888
18
      publicId, systemId, notationName);
889
18
  if ((ent == NULL) && (ctxt->pedantic) &&
890
18
      (ctxt->sax != NULL) && (ctxt->sax->warning != NULL))
891
0
      ctxt->sax->warning(ctxt->userData,
892
0
       "Entity(%s) already defined in the internal subset\n", name);
893
18
  if ((ent != NULL) && (ent->URI == NULL) && (systemId != NULL)) {
894
18
      xmlChar *URI;
895
18
      const char *base = NULL;
896
897
18
      if (ctxt->input != NULL)
898
18
    base = ctxt->input->filename;
899
18
      if (base == NULL)
900
6
    base = ctxt->directory;
901
902
18
      URI = xmlBuildURI(systemId, (const xmlChar *) base);
903
18
      ent->URI = URI;
904
18
  }
905
18
    } else if (ctxt->inSubset == 2) {
906
0
  ent = xmlAddDtdEntity(ctxt->myDoc, name,
907
0
      XML_EXTERNAL_GENERAL_UNPARSED_ENTITY,
908
0
      publicId, systemId, notationName);
909
0
  if ((ent == NULL) && (ctxt->pedantic) &&
910
0
      (ctxt->sax != NULL) && (ctxt->sax->warning != NULL))
911
0
      ctxt->sax->warning(ctxt->userData,
912
0
       "Entity(%s) already defined in the external subset\n", name);
913
0
  if ((ent != NULL) && (ent->URI == NULL) && (systemId != NULL)) {
914
0
      xmlChar *URI;
915
0
      const char *base = NULL;
916
917
0
      if (ctxt->input != NULL)
918
0
    base = ctxt->input->filename;
919
0
      if (base == NULL)
920
0
    base = ctxt->directory;
921
922
0
      URI = xmlBuildURI(systemId, (const xmlChar *) base);
923
0
      ent->URI = URI;
924
0
  }
925
0
    } else {
926
0
        xmlFatalErrMsg(ctxt, XML_ERR_INTERNAL_ERROR,
927
0
       "SAX.xmlSAX2UnparsedEntityDecl(%s) called while not in subset\n",
928
0
                 name, NULL);
929
0
    }
930
18
}
931
932
/**
933
 * xmlSAX2SetDocumentLocator:
934
 * @ctx: the user data (XML parser context)
935
 * @loc: A SAX Locator
936
 *
937
 * Receive the document locator at startup, actually xmlDefaultSAXLocator
938
 * Everything is available on the context, so this is useless in our case.
939
 */
940
void
941
xmlSAX2SetDocumentLocator(void *ctx ATTRIBUTE_UNUSED, xmlSAXLocatorPtr loc ATTRIBUTE_UNUSED)
942
13.2k
{
943
    /* xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx; */
944
#ifdef DEBUG_SAX
945
    xmlGenericError(xmlGenericErrorContext,
946
      "SAX.xmlSAX2SetDocumentLocator()\n");
947
#endif
948
13.2k
}
949
950
/**
951
 * xmlSAX2StartDocument:
952
 * @ctx: the user data (XML parser context)
953
 *
954
 * called when the document start being processed.
955
 */
956
void
957
xmlSAX2StartDocument(void *ctx)
958
12.4k
{
959
12.4k
    xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
960
12.4k
    xmlDocPtr doc;
961
962
12.4k
    if (ctx == NULL) return;
963
964
#ifdef DEBUG_SAX
965
    xmlGenericError(xmlGenericErrorContext,
966
      "SAX.xmlSAX2StartDocument()\n");
967
#endif
968
12.4k
    if (ctxt->html) {
969
0
#ifdef LIBXML_HTML_ENABLED
970
0
  if (ctxt->myDoc == NULL)
971
0
      ctxt->myDoc = htmlNewDocNoDtD(NULL, NULL);
972
0
  if (ctxt->myDoc == NULL) {
973
0
      xmlSAX2ErrMemory(ctxt, "xmlSAX2StartDocument");
974
0
      return;
975
0
  }
976
0
  ctxt->myDoc->properties = XML_DOC_HTML;
977
0
  ctxt->myDoc->parseFlags = ctxt->options;
978
#else
979
        xmlGenericError(xmlGenericErrorContext,
980
    "libxml2 built without HTML support\n");
981
  ctxt->errNo = XML_ERR_INTERNAL_ERROR;
982
  ctxt->instate = XML_PARSER_EOF;
983
  ctxt->disableSAX = 1;
984
  return;
985
#endif
986
12.4k
    } else {
987
12.4k
  doc = ctxt->myDoc = xmlNewDoc(ctxt->version);
988
12.4k
  if (doc != NULL) {
989
12.4k
      doc->properties = 0;
990
12.4k
      if (ctxt->options & XML_PARSE_OLD10)
991
2.42k
          doc->properties |= XML_DOC_OLD10;
992
12.4k
      doc->parseFlags = ctxt->options;
993
12.4k
      if (ctxt->encoding != NULL)
994
2.67k
    doc->encoding = xmlStrdup(ctxt->encoding);
995
9.76k
      else
996
9.76k
    doc->encoding = NULL;
997
12.4k
      doc->standalone = ctxt->standalone;
998
12.4k
  } else {
999
0
      xmlSAX2ErrMemory(ctxt, "xmlSAX2StartDocument");
1000
0
      return;
1001
0
  }
1002
12.4k
  if ((ctxt->dictNames) && (doc != NULL)) {
1003
10.2k
      doc->dict = ctxt->dict;
1004
10.2k
      xmlDictReference(doc->dict);
1005
10.2k
  }
1006
12.4k
    }
1007
12.4k
    if ((ctxt->myDoc != NULL) && (ctxt->myDoc->URL == NULL) &&
1008
12.4k
  (ctxt->input != NULL) && (ctxt->input->filename != NULL)) {
1009
8.30k
  ctxt->myDoc->URL = xmlPathToURI((const xmlChar *)ctxt->input->filename);
1010
8.30k
  if (ctxt->myDoc->URL == NULL)
1011
0
      xmlSAX2ErrMemory(ctxt, "xmlSAX2StartDocument");
1012
8.30k
    }
1013
12.4k
}
1014
1015
/**
1016
 * xmlSAX2EndDocument:
1017
 * @ctx: the user data (XML parser context)
1018
 *
1019
 * called when the document end has been detected.
1020
 */
1021
void
1022
xmlSAX2EndDocument(void *ctx)
1023
7.00k
{
1024
7.00k
    xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
1025
#ifdef DEBUG_SAX
1026
    xmlGenericError(xmlGenericErrorContext,
1027
      "SAX.xmlSAX2EndDocument()\n");
1028
#endif
1029
7.00k
    if (ctx == NULL) return;
1030
7.00k
#ifdef LIBXML_VALID_ENABLED
1031
7.00k
    if (ctxt->validate && ctxt->wellFormed &&
1032
7.00k
        ctxt->myDoc && ctxt->myDoc->intSubset)
1033
6
  ctxt->valid &= xmlValidateDocumentFinal(&ctxt->vctxt, ctxt->myDoc);
1034
7.00k
#endif /* LIBXML_VALID_ENABLED */
1035
1036
    /*
1037
     * Grab the encoding if it was added on-the-fly
1038
     */
1039
7.00k
    if ((ctxt->encoding != NULL) && (ctxt->myDoc != NULL) &&
1040
7.00k
  (ctxt->myDoc->encoding == NULL)) {
1041
1
  ctxt->myDoc->encoding = ctxt->encoding;
1042
1
  ctxt->encoding = NULL;
1043
1
    }
1044
7.00k
    if ((ctxt->inputTab != NULL) &&
1045
7.00k
        (ctxt->inputNr > 0) && (ctxt->inputTab[0] != NULL) &&
1046
7.00k
        (ctxt->inputTab[0]->encoding != NULL) && (ctxt->myDoc != NULL) &&
1047
7.00k
  (ctxt->myDoc->encoding == NULL)) {
1048
640
  ctxt->myDoc->encoding = xmlStrdup(ctxt->inputTab[0]->encoding);
1049
640
    }
1050
7.00k
    if ((ctxt->charset != XML_CHAR_ENCODING_NONE) && (ctxt->myDoc != NULL) &&
1051
7.00k
  (ctxt->myDoc->charset == XML_CHAR_ENCODING_NONE)) {
1052
0
  ctxt->myDoc->charset = ctxt->charset;
1053
0
    }
1054
7.00k
}
1055
1056
#if defined(LIBXML_SAX1_ENABLED) || defined(LIBXML_HTML_ENABLED) || defined(LIBXML_WRITER_ENABLED) || defined(LIBXML_LEGACY_ENABLED)
1057
/**
1058
 * xmlNsErrMsg:
1059
 * @ctxt:  an XML parser context
1060
 * @error:  the error number
1061
 * @msg:  the error message
1062
 * @str1:  an error string
1063
 * @str2:  an error string
1064
 *
1065
 * Handle a namespace error
1066
 */
1067
static void LIBXML_ATTR_FORMAT(3,0)
1068
xmlNsErrMsg(xmlParserCtxtPtr ctxt, xmlParserErrors error,
1069
            const char *msg, const xmlChar *str1, const xmlChar *str2)
1070
23
{
1071
23
    if ((ctxt != NULL) && (ctxt->disableSAX != 0) &&
1072
23
        (ctxt->instate == XML_PARSER_EOF))
1073
0
  return;
1074
23
    if (ctxt != NULL)
1075
23
  ctxt->errNo = error;
1076
23
    __xmlRaiseError(NULL, NULL, NULL, ctxt, NULL, XML_FROM_NAMESPACE, error,
1077
23
                    XML_ERR_ERROR, NULL, 0,
1078
23
        (const char *) str1, (const char *) str2,
1079
23
        NULL, 0, 0, msg, str1, str2);
1080
23
}
1081
1082
/**
1083
 * xmlSAX2AttributeInternal:
1084
 * @ctx: the user data (XML parser context)
1085
 * @fullname:  The attribute name, including namespace prefix
1086
 * @value:  The attribute value
1087
 * @prefix: the prefix on the element node
1088
 *
1089
 * Handle an attribute that has been read by the parser.
1090
 * The default handling is to convert the attribute into an
1091
 * DOM subtree and past it in a new xmlAttr element added to
1092
 * the element.
1093
 */
1094
static void
1095
xmlSAX2AttributeInternal(void *ctx, const xmlChar *fullname,
1096
             const xmlChar *value, const xmlChar *prefix ATTRIBUTE_UNUSED)
1097
355k
{
1098
355k
    xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
1099
355k
    xmlAttrPtr ret;
1100
355k
    xmlChar *name;
1101
355k
    xmlChar *ns;
1102
355k
    xmlChar *nval;
1103
355k
    xmlNsPtr namespace;
1104
1105
355k
    if (ctxt->html) {
1106
0
  name = xmlStrdup(fullname);
1107
0
  ns = NULL;
1108
0
  namespace = NULL;
1109
355k
    } else {
1110
  /*
1111
   * Split the full name into a namespace prefix and the tag name
1112
   */
1113
355k
  name = xmlSplitQName(ctxt, fullname, &ns);
1114
355k
  if ((name != NULL) && (name[0] == 0)) {
1115
0
      if (xmlStrEqual(ns, BAD_CAST "xmlns")) {
1116
0
    xmlNsErrMsg(ctxt, XML_ERR_NS_DECL_ERROR,
1117
0
          "invalid namespace declaration '%s'\n",
1118
0
          fullname, NULL);
1119
0
      } else {
1120
0
    xmlNsWarnMsg(ctxt, XML_WAR_NS_COLUMN,
1121
0
           "Avoid attribute ending with ':' like '%s'\n",
1122
0
           fullname, NULL);
1123
0
      }
1124
0
      if (ns != NULL)
1125
0
    xmlFree(ns);
1126
0
      ns = NULL;
1127
0
      xmlFree(name);
1128
0
      name = xmlStrdup(fullname);
1129
0
  }
1130
355k
    }
1131
355k
    if (name == NULL) {
1132
0
        xmlSAX2ErrMemory(ctxt, "xmlSAX2StartElement");
1133
0
  if (ns != NULL)
1134
0
      xmlFree(ns);
1135
0
  return;
1136
0
    }
1137
1138
355k
#ifdef LIBXML_HTML_ENABLED
1139
355k
    if ((ctxt->html) &&
1140
355k
        (value == NULL) && (htmlIsBooleanAttr(fullname))) {
1141
0
            nval = xmlStrdup(fullname);
1142
0
            value = (const xmlChar *) nval;
1143
0
    } else
1144
355k
#endif
1145
355k
    {
1146
355k
#ifdef LIBXML_VALID_ENABLED
1147
        /*
1148
         * Do the last stage of the attribute normalization
1149
         * Needed for HTML too:
1150
         *   http://www.w3.org/TR/html4/types.html#h-6.2
1151
         */
1152
355k
        ctxt->vctxt.valid = 1;
1153
355k
        nval = xmlValidCtxtNormalizeAttributeValue(&ctxt->vctxt,
1154
355k
                                               ctxt->myDoc, ctxt->node,
1155
355k
                                               fullname, value);
1156
355k
        if (ctxt->vctxt.valid != 1) {
1157
0
            ctxt->valid = 0;
1158
0
        }
1159
355k
        if (nval != NULL)
1160
0
            value = nval;
1161
#else
1162
        nval = NULL;
1163
#endif /* LIBXML_VALID_ENABLED */
1164
355k
    }
1165
1166
    /*
1167
     * Check whether it's a namespace definition
1168
     */
1169
355k
    if ((!ctxt->html) && (ns == NULL) &&
1170
355k
        (name[0] == 'x') && (name[1] == 'm') && (name[2] == 'l') &&
1171
355k
        (name[3] == 'n') && (name[4] == 's') && (name[5] == 0)) {
1172
41
  xmlNsPtr nsret;
1173
41
  xmlChar *val;
1174
1175
        /* Avoid unused variable warning if features are disabled. */
1176
41
        (void) nsret;
1177
1178
41
        if (!ctxt->replaceEntities) {
1179
9
      ctxt->depth++;
1180
9
      val = xmlStringDecodeEntities(ctxt, value, XML_SUBSTITUTE_REF,
1181
9
                              0,0,0);
1182
9
      ctxt->depth--;
1183
9
      if (val == NULL) {
1184
0
          xmlSAX2ErrMemory(ctxt, "xmlSAX2StartElement");
1185
0
    if (name != NULL)
1186
0
        xmlFree(name);
1187
0
                if (nval != NULL)
1188
0
                    xmlFree(nval);
1189
0
    return;
1190
0
      }
1191
32
  } else {
1192
32
      val = (xmlChar *) value;
1193
32
  }
1194
1195
41
  if (val[0] != 0) {
1196
35
      xmlURIPtr uri;
1197
1198
35
      uri = xmlParseURI((const char *)val);
1199
35
      if (uri == NULL) {
1200
6
    if ((ctxt->sax != NULL) && (ctxt->sax->warning != NULL))
1201
3
        ctxt->sax->warning(ctxt->userData,
1202
3
       "xmlns: %s not a valid URI\n", val);
1203
29
      } else {
1204
29
    if (uri->scheme == NULL) {
1205
9
        if ((ctxt->sax != NULL) && (ctxt->sax->warning != NULL))
1206
9
      ctxt->sax->warning(ctxt->userData,
1207
9
           "xmlns: URI %s is not absolute\n", val);
1208
9
    }
1209
29
    xmlFreeURI(uri);
1210
29
      }
1211
35
  }
1212
1213
  /* a default namespace definition */
1214
41
  nsret = xmlNewNs(ctxt->node, val, NULL);
1215
1216
41
#ifdef LIBXML_VALID_ENABLED
1217
  /*
1218
   * Validate also for namespace decls, they are attributes from
1219
   * an XML-1.0 perspective
1220
   */
1221
41
        if (nsret != NULL && ctxt->validate && ctxt->wellFormed &&
1222
41
      ctxt->myDoc && ctxt->myDoc->intSubset)
1223
0
      ctxt->valid &= xmlValidateOneNamespace(&ctxt->vctxt, ctxt->myDoc,
1224
0
             ctxt->node, prefix, nsret, val);
1225
41
#endif /* LIBXML_VALID_ENABLED */
1226
41
  if (name != NULL)
1227
41
      xmlFree(name);
1228
41
  if (nval != NULL)
1229
0
      xmlFree(nval);
1230
41
  if (val != value)
1231
9
      xmlFree(val);
1232
41
  return;
1233
41
    }
1234
355k
    if ((!ctxt->html) &&
1235
355k
  (ns != NULL) && (ns[0] == 'x') && (ns[1] == 'm') && (ns[2] == 'l') &&
1236
355k
        (ns[3] == 'n') && (ns[4] == 's') && (ns[5] == 0)) {
1237
57
  xmlNsPtr nsret;
1238
57
  xmlChar *val;
1239
1240
        /* Avoid unused variable warning if features are disabled. */
1241
57
        (void) nsret;
1242
1243
57
        if (!ctxt->replaceEntities) {
1244
21
      ctxt->depth++;
1245
21
      val = xmlStringDecodeEntities(ctxt, value, XML_SUBSTITUTE_REF,
1246
21
                              0,0,0);
1247
21
      ctxt->depth--;
1248
21
      if (val == NULL) {
1249
0
          xmlSAX2ErrMemory(ctxt, "xmlSAX2StartElement");
1250
0
          xmlFree(ns);
1251
0
    if (name != NULL)
1252
0
        xmlFree(name);
1253
0
                if (nval != NULL)
1254
0
                    xmlFree(nval);
1255
0
    return;
1256
0
      }
1257
36
  } else {
1258
36
      val = (xmlChar *) value;
1259
36
  }
1260
1261
57
  if (val[0] == 0) {
1262
0
      xmlNsErrMsg(ctxt, XML_NS_ERR_EMPTY,
1263
0
            "Empty namespace name for prefix %s\n", name, NULL);
1264
0
  }
1265
57
  if ((ctxt->pedantic != 0) && (val[0] != 0)) {
1266
48
      xmlURIPtr uri;
1267
1268
48
      uri = xmlParseURI((const char *)val);
1269
48
      if (uri == NULL) {
1270
5
          xmlNsWarnMsg(ctxt, XML_WAR_NS_URI,
1271
5
       "xmlns:%s: %s not a valid URI\n", name, value);
1272
43
      } else {
1273
43
    if (uri->scheme == NULL) {
1274
2
        xmlNsWarnMsg(ctxt, XML_WAR_NS_URI_RELATIVE,
1275
2
         "xmlns:%s: URI %s is not absolute\n", name, value);
1276
2
    }
1277
43
    xmlFreeURI(uri);
1278
43
      }
1279
48
  }
1280
1281
  /* a standard namespace definition */
1282
57
  nsret = xmlNewNs(ctxt->node, val, name);
1283
57
  xmlFree(ns);
1284
57
#ifdef LIBXML_VALID_ENABLED
1285
  /*
1286
   * Validate also for namespace decls, they are attributes from
1287
   * an XML-1.0 perspective
1288
   */
1289
57
        if (nsret != NULL && ctxt->validate && ctxt->wellFormed &&
1290
57
      ctxt->myDoc && ctxt->myDoc->intSubset)
1291
0
      ctxt->valid &= xmlValidateOneNamespace(&ctxt->vctxt, ctxt->myDoc,
1292
0
             ctxt->node, prefix, nsret, value);
1293
57
#endif /* LIBXML_VALID_ENABLED */
1294
57
  if (name != NULL)
1295
57
      xmlFree(name);
1296
57
  if (nval != NULL)
1297
0
      xmlFree(nval);
1298
57
  if (val != value)
1299
21
      xmlFree(val);
1300
57
  return;
1301
57
    }
1302
1303
355k
    if (ns != NULL) {
1304
188
  namespace = xmlSearchNs(ctxt->myDoc, ctxt->node, ns);
1305
1306
188
  if (namespace == NULL) {
1307
23
      xmlNsErrMsg(ctxt, XML_NS_ERR_UNDEFINED_NAMESPACE,
1308
23
        "Namespace prefix %s of attribute %s is not defined\n",
1309
23
                 ns, name);
1310
165
  } else {
1311
165
            xmlAttrPtr prop;
1312
1313
165
            prop = ctxt->node->properties;
1314
168
            while (prop != NULL) {
1315
3
                if (prop->ns != NULL) {
1316
3
                    if ((xmlStrEqual(name, prop->name)) &&
1317
3
                        ((namespace == prop->ns) ||
1318
0
                         (xmlStrEqual(namespace->href, prop->ns->href)))) {
1319
0
                            xmlNsErrMsg(ctxt, XML_ERR_ATTRIBUTE_REDEFINED,
1320
0
                                    "Attribute %s in %s redefined\n",
1321
0
                                             name, namespace->href);
1322
0
                        ctxt->wellFormed = 0;
1323
0
                        if (ctxt->recovery == 0) ctxt->disableSAX = 1;
1324
0
                        if (name != NULL)
1325
0
                            xmlFree(name);
1326
0
                        goto error;
1327
0
                    }
1328
3
                }
1329
3
                prop = prop->next;
1330
3
            }
1331
165
        }
1332
355k
    } else {
1333
355k
  namespace = NULL;
1334
355k
    }
1335
1336
    /* !!!!!! <a toto:arg="" xmlns:toto="http://toto.com"> */
1337
355k
    ret = xmlNewNsPropEatName(ctxt->node, namespace, name, NULL);
1338
355k
    if (ret == NULL)
1339
0
        goto error;
1340
1341
355k
    if ((ctxt->replaceEntities == 0) && (!ctxt->html)) {
1342
29
        xmlNodePtr tmp;
1343
1344
29
        ret->children = xmlStringGetNodeList(ctxt->myDoc, value);
1345
29
        tmp = ret->children;
1346
52
        while (tmp != NULL) {
1347
23
            tmp->parent = (xmlNodePtr) ret;
1348
23
            if (tmp->next == NULL)
1349
23
                ret->last = tmp;
1350
23
            tmp = tmp->next;
1351
23
        }
1352
355k
    } else if (value != NULL) {
1353
355k
        ret->children = xmlNewDocText(ctxt->myDoc, value);
1354
355k
        ret->last = ret->children;
1355
355k
        if (ret->children != NULL)
1356
355k
            ret->children->parent = (xmlNodePtr) ret;
1357
355k
    }
1358
1359
355k
#ifdef LIBXML_VALID_ENABLED
1360
355k
    if ((!ctxt->html) && ctxt->validate && ctxt->wellFormed &&
1361
355k
        ctxt->myDoc && ctxt->myDoc->intSubset) {
1362
1363
  /*
1364
   * If we don't substitute entities, the validation should be
1365
   * done on a value with replaced entities anyway.
1366
   */
1367
0
        if (!ctxt->replaceEntities) {
1368
0
      xmlChar *val;
1369
1370
0
      ctxt->depth++;
1371
0
      val = xmlStringDecodeEntities(ctxt, value, XML_SUBSTITUTE_REF,
1372
0
                              0,0,0);
1373
0
      ctxt->depth--;
1374
1375
0
      if (val == NULL)
1376
0
    ctxt->valid &= xmlValidateOneAttribute(&ctxt->vctxt,
1377
0
        ctxt->myDoc, ctxt->node, ret, value);
1378
0
      else {
1379
0
    xmlChar *nvalnorm;
1380
1381
    /*
1382
     * Do the last stage of the attribute normalization
1383
     * It need to be done twice ... it's an extra burden related
1384
     * to the ability to keep xmlSAX2References in attributes
1385
     */
1386
0
    nvalnorm = xmlValidNormalizeAttributeValue(ctxt->myDoc,
1387
0
              ctxt->node, fullname, val);
1388
0
    if (nvalnorm != NULL) {
1389
0
        xmlFree(val);
1390
0
        val = nvalnorm;
1391
0
    }
1392
1393
0
    ctxt->valid &= xmlValidateOneAttribute(&ctxt->vctxt,
1394
0
              ctxt->myDoc, ctxt->node, ret, val);
1395
0
                xmlFree(val);
1396
0
      }
1397
0
  } else {
1398
0
      ctxt->valid &= xmlValidateOneAttribute(&ctxt->vctxt, ctxt->myDoc,
1399
0
                 ctxt->node, ret, value);
1400
0
  }
1401
0
    } else
1402
355k
#endif /* LIBXML_VALID_ENABLED */
1403
355k
           if (((ctxt->loadsubset & XML_SKIP_IDS) == 0) &&
1404
355k
         (((ctxt->replaceEntities == 0) && (ctxt->external != 2)) ||
1405
355k
          ((ctxt->replaceEntities != 0) && (ctxt->inSubset == 0))) &&
1406
               /* Don't create IDs containing entity references */
1407
355k
               (ret->children != NULL) &&
1408
355k
               (ret->children->type == XML_TEXT_NODE) &&
1409
355k
               (ret->children->next == NULL)) {
1410
355k
        xmlChar *content = ret->children->content;
1411
        /*
1412
   * when validating, the ID registration is done at the attribute
1413
   * validation level. Otherwise we have to do specific handling here.
1414
   */
1415
355k
  if (xmlStrEqual(fullname, BAD_CAST "xml:id")) {
1416
      /*
1417
       * Add the xml:id value
1418
       *
1419
       * Open issue: normalization of the value.
1420
       */
1421
3
      if (xmlValidateNCName(content, 1) != 0) {
1422
0
          xmlErrValid(ctxt, XML_DTD_XMLID_VALUE,
1423
0
          "xml:id : attribute value %s is not an NCName\n",
1424
0
          (const char *) content, NULL);
1425
0
      }
1426
3
      xmlAddID(&ctxt->vctxt, ctxt->myDoc, content, ret);
1427
355k
  } else if (xmlIsID(ctxt->myDoc, ctxt->node, ret))
1428
0
      xmlAddID(&ctxt->vctxt, ctxt->myDoc, content, ret);
1429
355k
  else if (xmlIsRef(ctxt->myDoc, ctxt->node, ret))
1430
0
      xmlAddRef(&ctxt->vctxt, ctxt->myDoc, content, ret);
1431
355k
    }
1432
1433
355k
error:
1434
355k
    if (nval != NULL)
1435
0
  xmlFree(nval);
1436
355k
    if (ns != NULL)
1437
188
  xmlFree(ns);
1438
355k
}
1439
1440
/*
1441
 * xmlCheckDefaultedAttributes:
1442
 *
1443
 * Check defaulted attributes from the DTD
1444
 */
1445
static void
1446
xmlCheckDefaultedAttributes(xmlParserCtxtPtr ctxt, const xmlChar *name,
1447
258k
  const xmlChar *prefix, const xmlChar **atts) {
1448
258k
    xmlElementPtr elemDecl;
1449
258k
    const xmlChar *att;
1450
258k
    int internal = 1;
1451
258k
    int i;
1452
1453
258k
    elemDecl = xmlGetDtdQElementDesc(ctxt->myDoc->intSubset, name, prefix);
1454
258k
    if (elemDecl == NULL) {
1455
258k
  elemDecl = xmlGetDtdQElementDesc(ctxt->myDoc->extSubset, name, prefix);
1456
258k
  internal = 0;
1457
258k
    }
1458
1459
258k
process_external_subset:
1460
1461
258k
    if (elemDecl != NULL) {
1462
27
  xmlAttributePtr attr = elemDecl->attributes;
1463
  /*
1464
   * Check against defaulted attributes from the external subset
1465
   * if the document is stamped as standalone
1466
   */
1467
27
  if ((ctxt->myDoc->standalone == 1) &&
1468
27
      (ctxt->myDoc->extSubset != NULL) &&
1469
27
      (ctxt->validate)) {
1470
0
      while (attr != NULL) {
1471
0
    if ((attr->defaultValue != NULL) &&
1472
0
        (xmlGetDtdQAttrDesc(ctxt->myDoc->extSubset,
1473
0
          attr->elem, attr->name,
1474
0
          attr->prefix) == attr) &&
1475
0
        (xmlGetDtdQAttrDesc(ctxt->myDoc->intSubset,
1476
0
          attr->elem, attr->name,
1477
0
          attr->prefix) == NULL)) {
1478
0
        xmlChar *fulln;
1479
1480
0
        if (attr->prefix != NULL) {
1481
0
      fulln = xmlStrdup(attr->prefix);
1482
0
      fulln = xmlStrcat(fulln, BAD_CAST ":");
1483
0
      fulln = xmlStrcat(fulln, attr->name);
1484
0
        } else {
1485
0
      fulln = xmlStrdup(attr->name);
1486
0
        }
1487
0
                    if (fulln == NULL) {
1488
0
                        xmlSAX2ErrMemory(ctxt, "xmlSAX2StartElement");
1489
0
                        break;
1490
0
                    }
1491
1492
        /*
1493
         * Check that the attribute is not declared in the
1494
         * serialization
1495
         */
1496
0
        att = NULL;
1497
0
        if (atts != NULL) {
1498
0
      i = 0;
1499
0
      att = atts[i];
1500
0
      while (att != NULL) {
1501
0
          if (xmlStrEqual(att, fulln))
1502
0
        break;
1503
0
          i += 2;
1504
0
          att = atts[i];
1505
0
      }
1506
0
        }
1507
0
        if (att == NULL) {
1508
0
            xmlErrValid(ctxt, XML_DTD_STANDALONE_DEFAULTED,
1509
0
      "standalone: attribute %s on %s defaulted from external subset\n",
1510
0
            (const char *)fulln,
1511
0
            (const char *)attr->elem);
1512
0
        }
1513
0
                    xmlFree(fulln);
1514
0
    }
1515
0
    attr = attr->nexth;
1516
0
      }
1517
0
  }
1518
1519
  /*
1520
   * Actually insert defaulted values when needed
1521
   */
1522
27
  attr = elemDecl->attributes;
1523
27
  while (attr != NULL) {
1524
      /*
1525
       * Make sure that attributes redefinition occurring in the
1526
       * internal subset are not overridden by definitions in the
1527
       * external subset.
1528
       */
1529
0
      if (attr->defaultValue != NULL) {
1530
    /*
1531
     * the element should be instantiated in the tree if:
1532
     *  - this is a namespace prefix
1533
     *  - the user required for completion in the tree
1534
     *    like XSLT
1535
     *  - there isn't already an attribute definition
1536
     *    in the internal subset overriding it.
1537
     */
1538
0
    if (((attr->prefix != NULL) &&
1539
0
         (xmlStrEqual(attr->prefix, BAD_CAST "xmlns"))) ||
1540
0
        ((attr->prefix == NULL) &&
1541
0
         (xmlStrEqual(attr->name, BAD_CAST "xmlns"))) ||
1542
0
        (ctxt->loadsubset & XML_COMPLETE_ATTRS)) {
1543
0
        xmlAttributePtr tst;
1544
1545
0
        tst = xmlGetDtdQAttrDesc(ctxt->myDoc->intSubset,
1546
0
               attr->elem, attr->name,
1547
0
               attr->prefix);
1548
0
        if ((tst == attr) || (tst == NULL)) {
1549
0
            xmlChar fn[50];
1550
0
      xmlChar *fulln;
1551
1552
0
                        fulln = xmlBuildQName(attr->name, attr->prefix, fn, 50);
1553
0
      if (fulln == NULL) {
1554
0
          xmlSAX2ErrMemory(ctxt, "xmlSAX2StartElement");
1555
0
          return;
1556
0
      }
1557
1558
      /*
1559
       * Check that the attribute is not declared in the
1560
       * serialization
1561
       */
1562
0
      att = NULL;
1563
0
      if (atts != NULL) {
1564
0
          i = 0;
1565
0
          att = atts[i];
1566
0
          while (att != NULL) {
1567
0
        if (xmlStrEqual(att, fulln))
1568
0
            break;
1569
0
        i += 2;
1570
0
        att = atts[i];
1571
0
          }
1572
0
      }
1573
0
      if (att == NULL) {
1574
0
          xmlSAX2AttributeInternal(ctxt, fulln,
1575
0
             attr->defaultValue, prefix);
1576
0
      }
1577
0
      if ((fulln != fn) && (fulln != attr->name))
1578
0
          xmlFree(fulln);
1579
0
        }
1580
0
    }
1581
0
      }
1582
0
      attr = attr->nexth;
1583
0
  }
1584
27
  if (internal == 1) {
1585
27
      elemDecl = xmlGetDtdQElementDesc(ctxt->myDoc->extSubset,
1586
27
                                 name, prefix);
1587
27
      internal = 0;
1588
27
      goto process_external_subset;
1589
27
  }
1590
27
    }
1591
258k
}
1592
1593
/**
1594
 * xmlSAX2StartElement:
1595
 * @ctx: the user data (XML parser context)
1596
 * @fullname:  The element name, including namespace prefix
1597
 * @atts:  An array of name/value attributes pairs, NULL terminated
1598
 *
1599
 * called when an opening tag has been processed.
1600
 */
1601
void
1602
xmlSAX2StartElement(void *ctx, const xmlChar *fullname, const xmlChar **atts)
1603
356k
{
1604
356k
    xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
1605
356k
    xmlNodePtr ret;
1606
356k
    xmlNodePtr parent;
1607
356k
    xmlNsPtr ns;
1608
356k
    xmlChar *name;
1609
356k
    xmlChar *prefix;
1610
356k
    const xmlChar *att;
1611
356k
    const xmlChar *value;
1612
356k
    int i;
1613
1614
356k
    if ((ctx == NULL) || (fullname == NULL) || (ctxt->myDoc == NULL)) return;
1615
356k
    parent = ctxt->node;
1616
#ifdef DEBUG_SAX
1617
    xmlGenericError(xmlGenericErrorContext,
1618
      "SAX.xmlSAX2StartElement(%s)\n", fullname);
1619
#endif
1620
1621
    /*
1622
     * First check on validity:
1623
     */
1624
356k
    if (ctxt->validate && (ctxt->myDoc->extSubset == NULL) &&
1625
356k
        ((ctxt->myDoc->intSubset == NULL) ||
1626
258k
   ((ctxt->myDoc->intSubset->notations == NULL) &&
1627
258k
    (ctxt->myDoc->intSubset->elements == NULL) &&
1628
258k
    (ctxt->myDoc->intSubset->attributes == NULL) &&
1629
258k
    (ctxt->myDoc->intSubset->entities == NULL)))) {
1630
561
  xmlErrValid(ctxt, XML_ERR_NO_DTD,
1631
561
    "Validation failed: no DTD found !", NULL, NULL);
1632
561
  ctxt->validate = 0;
1633
561
    }
1634
1635
1636
    /*
1637
     * Split the full name into a namespace prefix and the tag name
1638
     */
1639
356k
    name = xmlSplitQName(ctxt, fullname, &prefix);
1640
1641
1642
    /*
1643
     * Note : the namespace resolution is deferred until the end of the
1644
     *        attributes parsing, since local namespace can be defined as
1645
     *        an attribute at this level.
1646
     */
1647
356k
    ret = xmlNewDocNodeEatName(ctxt->myDoc, NULL, name, NULL);
1648
356k
    if (ret == NULL) {
1649
0
        if (prefix != NULL)
1650
0
      xmlFree(prefix);
1651
0
  xmlSAX2ErrMemory(ctxt, "xmlSAX2StartElement");
1652
0
        return;
1653
0
    }
1654
356k
    if (ctxt->myDoc->children == NULL) {
1655
#ifdef DEBUG_SAX_TREE
1656
  xmlGenericError(xmlGenericErrorContext, "Setting %s as root\n", name);
1657
#endif
1658
642
        xmlAddChild((xmlNodePtr) ctxt->myDoc, (xmlNodePtr) ret);
1659
356k
    } else if (parent == NULL) {
1660
6.46k
        parent = ctxt->myDoc->children;
1661
6.46k
    }
1662
356k
    ctxt->nodemem = -1;
1663
356k
    if (ctxt->linenumbers) {
1664
356k
  if (ctxt->input != NULL) {
1665
356k
      if ((unsigned) ctxt->input->line < (unsigned) USHRT_MAX)
1666
356k
    ret->line = ctxt->input->line;
1667
164
      else
1668
164
          ret->line = USHRT_MAX;
1669
356k
  }
1670
356k
    }
1671
1672
    /*
1673
     * We are parsing a new node.
1674
     */
1675
#ifdef DEBUG_SAX_TREE
1676
    xmlGenericError(xmlGenericErrorContext, "pushing(%s)\n", name);
1677
#endif
1678
356k
    if (nodePush(ctxt, ret) < 0) {
1679
0
        xmlUnlinkNode(ret);
1680
0
        xmlFreeNode(ret);
1681
0
        if (prefix != NULL)
1682
0
            xmlFree(prefix);
1683
0
        return;
1684
0
    }
1685
1686
    /*
1687
     * Link the child element
1688
     */
1689
356k
    if (parent != NULL) {
1690
356k
        if (parent->type == XML_ELEMENT_NODE) {
1691
#ifdef DEBUG_SAX_TREE
1692
      xmlGenericError(xmlGenericErrorContext,
1693
        "adding child %s to %s\n", name, parent->name);
1694
#endif
1695
353k
      xmlAddChild(parent, ret);
1696
353k
  } else {
1697
#ifdef DEBUG_SAX_TREE
1698
      xmlGenericError(xmlGenericErrorContext,
1699
        "adding sibling %s to ", name);
1700
      xmlDebugDumpOneNode(stderr, parent, 0);
1701
#endif
1702
3.28k
      xmlAddSibling(parent, ret);
1703
3.28k
  }
1704
356k
    }
1705
1706
356k
    if (!ctxt->html) {
1707
        /*
1708
         * Insert all the defaulted attributes from the DTD especially
1709
         * namespaces
1710
         */
1711
356k
        if ((ctxt->myDoc->intSubset != NULL) ||
1712
356k
            (ctxt->myDoc->extSubset != NULL)) {
1713
258k
            xmlCheckDefaultedAttributes(ctxt, name, prefix, atts);
1714
258k
        }
1715
1716
        /*
1717
         * process all the attributes whose name start with "xmlns"
1718
         */
1719
356k
        if (atts != NULL) {
1720
222k
            i = 0;
1721
222k
            att = atts[i++];
1722
222k
            value = atts[i++];
1723
578k
      while ((att != NULL) && (value != NULL)) {
1724
355k
    if ((att[0] == 'x') && (att[1] == 'm') && (att[2] == 'l') &&
1725
355k
        (att[3] == 'n') && (att[4] == 's'))
1726
104
        xmlSAX2AttributeInternal(ctxt, att, value, prefix);
1727
1728
355k
    att = atts[i++];
1729
355k
    value = atts[i++];
1730
355k
      }
1731
222k
        }
1732
1733
        /*
1734
         * Search the namespace, note that since the attributes have been
1735
         * processed, the local namespaces are available.
1736
         */
1737
356k
        ns = xmlSearchNs(ctxt->myDoc, ret, prefix);
1738
356k
        if ((ns == NULL) && (parent != NULL))
1739
356k
            ns = xmlSearchNs(ctxt->myDoc, parent, prefix);
1740
356k
        if ((prefix != NULL) && (ns == NULL)) {
1741
3.95k
            ns = xmlNewNs(ret, NULL, prefix);
1742
3.95k
            xmlNsWarnMsg(ctxt, XML_NS_ERR_UNDEFINED_NAMESPACE,
1743
3.95k
                         "Namespace prefix %s is not defined\n",
1744
3.95k
                         prefix, NULL);
1745
3.95k
        }
1746
1747
        /*
1748
         * set the namespace node, making sure that if the default namespace
1749
         * is unbound on a parent we simply keep it NULL
1750
         */
1751
356k
        if ((ns != NULL) && (ns->href != NULL) &&
1752
356k
            ((ns->href[0] != 0) || (ns->prefix != NULL)))
1753
214
            xmlSetNs(ret, ns);
1754
356k
    }
1755
1756
    /*
1757
     * process all the other attributes
1758
     */
1759
356k
    if (atts != NULL) {
1760
222k
        i = 0;
1761
222k
  att = atts[i++];
1762
222k
  value = atts[i++];
1763
222k
  if (ctxt->html) {
1764
0
      while (att != NULL) {
1765
0
    xmlSAX2AttributeInternal(ctxt, att, value, NULL);
1766
0
    att = atts[i++];
1767
0
    value = atts[i++];
1768
0
      }
1769
222k
  } else {
1770
578k
      while ((att != NULL) && (value != NULL)) {
1771
355k
    if ((att[0] != 'x') || (att[1] != 'm') || (att[2] != 'l') ||
1772
355k
        (att[3] != 'n') || (att[4] != 's'))
1773
355k
        xmlSAX2AttributeInternal(ctxt, att, value, NULL);
1774
1775
    /*
1776
     * Next ones
1777
     */
1778
355k
    att = atts[i++];
1779
355k
    value = atts[i++];
1780
355k
      }
1781
222k
  }
1782
222k
    }
1783
1784
356k
#ifdef LIBXML_VALID_ENABLED
1785
    /*
1786
     * If it's the Document root, finish the DTD validation and
1787
     * check the document root element for validity
1788
     */
1789
356k
    if ((ctxt->validate) &&
1790
356k
        ((ctxt->vctxt.flags & XML_VCTXT_DTD_VALIDATED) == 0)) {
1791
946
  int chk;
1792
1793
946
  chk = xmlValidateDtdFinal(&ctxt->vctxt, ctxt->myDoc);
1794
946
  if (chk <= 0)
1795
0
      ctxt->valid = 0;
1796
946
  if (chk < 0)
1797
0
      ctxt->wellFormed = 0;
1798
946
  ctxt->valid &= xmlValidateRoot(&ctxt->vctxt, ctxt->myDoc);
1799
946
  ctxt->vctxt.flags |= XML_VCTXT_DTD_VALIDATED;
1800
946
    }
1801
356k
#endif /* LIBXML_VALID_ENABLED */
1802
1803
356k
    if (prefix != NULL)
1804
4.13k
  xmlFree(prefix);
1805
1806
356k
}
1807
1808
/**
1809
 * xmlSAX2EndElement:
1810
 * @ctx: the user data (XML parser context)
1811
 * @name:  The element name
1812
 *
1813
 * called when the end of an element has been detected.
1814
 */
1815
void
1816
xmlSAX2EndElement(void *ctx, const xmlChar *name ATTRIBUTE_UNUSED)
1817
348k
{
1818
348k
    xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
1819
348k
    xmlNodePtr cur;
1820
1821
348k
    if (ctx == NULL) return;
1822
348k
    cur = ctxt->node;
1823
#ifdef DEBUG_SAX
1824
    if (name == NULL)
1825
        xmlGenericError(xmlGenericErrorContext, "SAX.xmlSAX2EndElement(NULL)\n");
1826
    else
1827
  xmlGenericError(xmlGenericErrorContext, "SAX.xmlSAX2EndElement(%s)\n", name);
1828
#endif
1829
1830
    /* Capture end position and add node */
1831
348k
    if (cur != NULL && ctxt->record_info) {
1832
0
      ctxt->nodeInfo->end_pos = ctxt->input->cur - ctxt->input->base;
1833
0
      ctxt->nodeInfo->end_line = ctxt->input->line;
1834
0
      ctxt->nodeInfo->node = cur;
1835
0
      xmlParserAddNodeInfo(ctxt, ctxt->nodeInfo);
1836
0
    }
1837
348k
    ctxt->nodemem = -1;
1838
1839
348k
#ifdef LIBXML_VALID_ENABLED
1840
348k
    if (ctxt->validate && ctxt->wellFormed &&
1841
348k
        ctxt->myDoc && ctxt->myDoc->intSubset)
1842
0
        ctxt->valid &= xmlValidateOneElement(&ctxt->vctxt, ctxt->myDoc,
1843
0
               cur);
1844
348k
#endif /* LIBXML_VALID_ENABLED */
1845
1846
1847
    /*
1848
     * end of parsing of this node.
1849
     */
1850
#ifdef DEBUG_SAX_TREE
1851
    xmlGenericError(xmlGenericErrorContext, "popping(%s)\n", cur->name);
1852
#endif
1853
348k
    nodePop(ctxt);
1854
348k
}
1855
#endif /* LIBXML_SAX1_ENABLED || LIBXML_HTML_ENABLED || LIBXML_LEGACY_ENABLED */
1856
1857
/*
1858
 * xmlSAX2TextNode:
1859
 * @ctxt:  the parser context
1860
 * @str:  the input string
1861
 * @len: the string length
1862
 *
1863
 * Callback for a text node
1864
 *
1865
 * Returns the newly allocated string or NULL if not needed or error
1866
 */
1867
static xmlNodePtr
1868
3.98M
xmlSAX2TextNode(xmlParserCtxtPtr ctxt, const xmlChar *str, int len) {
1869
3.98M
    xmlNodePtr ret;
1870
3.98M
    const xmlChar *intern = NULL;
1871
1872
    /*
1873
     * Allocate
1874
     */
1875
3.98M
    if (ctxt->freeElems != NULL) {
1876
24.7k
  ret = ctxt->freeElems;
1877
24.7k
  ctxt->freeElems = ret->next;
1878
24.7k
  ctxt->freeElemsNr--;
1879
3.96M
    } else {
1880
3.96M
  ret = (xmlNodePtr) xmlMalloc(sizeof(xmlNode));
1881
3.96M
    }
1882
3.98M
    if (ret == NULL) {
1883
0
        xmlErrMemory(ctxt, "xmlSAX2Characters");
1884
0
  return(NULL);
1885
0
    }
1886
3.98M
    memset(ret, 0, sizeof(xmlNode));
1887
    /*
1888
     * intern the formatting blanks found between tags, or the
1889
     * very short strings
1890
     */
1891
3.98M
    if (ctxt->dictNames) {
1892
3.68M
        xmlChar cur = str[len];
1893
1894
3.68M
  if ((len < (int) (2 * sizeof(void *))) &&
1895
3.68M
      (ctxt->options & XML_PARSE_COMPACT)) {
1896
      /* store the string in the node overriding properties and nsDef */
1897
1.12M
      xmlChar *tmp = (xmlChar *) &(ret->properties);
1898
1.12M
      memcpy(tmp, str, len);
1899
1.12M
      tmp[len] = 0;
1900
1.12M
      intern = tmp;
1901
2.55M
  } else if ((len <= 3) && ((cur == '"') || (cur == '\'') ||
1902
610k
      ((cur == '<') && (str[len + 1] != '!')))) {
1903
592k
      intern = xmlDictLookup(ctxt->dict, str, len);
1904
1.96M
  } else if (IS_BLANK_CH(*str) && (len < 60) && (cur == '<') &&
1905
1.96M
             (str[len + 1] != '!')) {
1906
616k
      int i;
1907
1908
3.45M
      for (i = 1;i < len;i++) {
1909
2.88M
    if (!IS_BLANK_CH(str[i])) goto skip;
1910
2.88M
      }
1911
566k
      intern = xmlDictLookup(ctxt->dict, str, len);
1912
566k
  }
1913
3.68M
    }
1914
3.98M
skip:
1915
3.98M
    ret->type = XML_TEXT_NODE;
1916
1917
3.98M
    ret->name = xmlStringText;
1918
3.98M
    if (intern == NULL) {
1919
1.70M
  ret->content = xmlStrndup(str, len);
1920
1.70M
  if (ret->content == NULL) {
1921
0
      xmlSAX2ErrMemory(ctxt, "xmlSAX2TextNode");
1922
0
      xmlFree(ret);
1923
0
      return(NULL);
1924
0
  }
1925
1.70M
    } else
1926
2.28M
  ret->content = (xmlChar *) intern;
1927
1928
3.98M
    if (ctxt->linenumbers) {
1929
3.97M
  if (ctxt->input != NULL) {
1930
3.97M
      if ((unsigned) ctxt->input->line < (unsigned) USHRT_MAX)
1931
3.97M
    ret->line = ctxt->input->line;
1932
877
      else {
1933
877
          ret->line = USHRT_MAX;
1934
877
    if (ctxt->options & XML_PARSE_BIG_LINES)
1935
303
        ret->psvi = (void *) (ptrdiff_t) ctxt->input->line;
1936
877
      }
1937
3.97M
  }
1938
3.97M
    }
1939
1940
3.98M
    if ((__xmlRegisterCallbacks) && (xmlRegisterNodeDefaultValue))
1941
0
  xmlRegisterNodeDefaultValue(ret);
1942
3.98M
    return(ret);
1943
3.98M
}
1944
1945
#ifdef LIBXML_VALID_ENABLED
1946
/*
1947
 * xmlSAX2DecodeAttrEntities:
1948
 * @ctxt:  the parser context
1949
 * @str:  the input string
1950
 * @len: the string length
1951
 *
1952
 * Remove the entities from an attribute value
1953
 *
1954
 * Returns the newly allocated string or NULL if not needed or error
1955
 */
1956
static xmlChar *
1957
xmlSAX2DecodeAttrEntities(xmlParserCtxtPtr ctxt, const xmlChar *str,
1958
0
                          const xmlChar *end) {
1959
0
    const xmlChar *in;
1960
0
    xmlChar *ret;
1961
1962
0
    in = str;
1963
0
    while (in < end)
1964
0
        if (*in++ == '&')
1965
0
      goto decode;
1966
0
    return(NULL);
1967
0
decode:
1968
0
    ctxt->depth++;
1969
0
    ret = xmlStringLenDecodeEntities(ctxt, str, end - str,
1970
0
             XML_SUBSTITUTE_REF, 0,0,0);
1971
0
    ctxt->depth--;
1972
0
    return(ret);
1973
0
}
1974
#endif /* LIBXML_VALID_ENABLED */
1975
1976
/**
1977
 * xmlSAX2AttributeNs:
1978
 * @ctx: the user data (XML parser context)
1979
 * @localname:  the local name of the attribute
1980
 * @prefix:  the attribute namespace prefix if available
1981
 * @URI:  the attribute namespace name if available
1982
 * @value:  Start of the attribute value
1983
 * @valueend: end of the attribute value
1984
 *
1985
 * Handle an attribute that has been read by the parser.
1986
 * The default handling is to convert the attribute into an
1987
 * DOM subtree and past it in a new xmlAttr element added to
1988
 * the element.
1989
 */
1990
static void
1991
xmlSAX2AttributeNs(xmlParserCtxtPtr ctxt,
1992
                   const xmlChar * localname,
1993
                   const xmlChar * prefix,
1994
       const xmlChar * value,
1995
       const xmlChar * valueend)
1996
1.90M
{
1997
1.90M
    xmlAttrPtr ret;
1998
1.90M
    xmlNsPtr namespace = NULL;
1999
1.90M
    xmlChar *dup = NULL;
2000
2001
    /*
2002
     * Note: if prefix == NULL, the attribute is not in the default namespace
2003
     */
2004
1.90M
    if (prefix != NULL)
2005
1.51k
  namespace = xmlSearchNs(ctxt->myDoc, ctxt->node, prefix);
2006
2007
    /*
2008
     * allocate the node
2009
     */
2010
1.90M
    if (ctxt->freeAttrs != NULL) {
2011
35.3k
        ret = ctxt->freeAttrs;
2012
35.3k
  ctxt->freeAttrs = ret->next;
2013
35.3k
  ctxt->freeAttrsNr--;
2014
35.3k
  memset(ret, 0, sizeof(xmlAttr));
2015
35.3k
  ret->type = XML_ATTRIBUTE_NODE;
2016
2017
35.3k
  ret->parent = ctxt->node;
2018
35.3k
  ret->doc = ctxt->myDoc;
2019
35.3k
  ret->ns = namespace;
2020
2021
35.3k
  if (ctxt->dictNames)
2022
35.3k
      ret->name = localname;
2023
0
  else
2024
0
      ret->name = xmlStrdup(localname);
2025
2026
        /* link at the end to preserve order, TODO speed up with a last */
2027
35.3k
  if (ctxt->node->properties == NULL) {
2028
35.3k
      ctxt->node->properties = ret;
2029
35.3k
  } else {
2030
0
      xmlAttrPtr prev = ctxt->node->properties;
2031
2032
0
      while (prev->next != NULL) prev = prev->next;
2033
0
      prev->next = ret;
2034
0
      ret->prev = prev;
2035
0
  }
2036
2037
35.3k
  if ((__xmlRegisterCallbacks) && (xmlRegisterNodeDefaultValue))
2038
0
      xmlRegisterNodeDefaultValue((xmlNodePtr)ret);
2039
1.87M
    } else {
2040
1.87M
  if (ctxt->dictNames)
2041
1.87M
      ret = xmlNewNsPropEatName(ctxt->node, namespace,
2042
1.87M
                                (xmlChar *) localname, NULL);
2043
15
  else
2044
15
      ret = xmlNewNsProp(ctxt->node, namespace, localname, NULL);
2045
1.87M
  if (ret == NULL) {
2046
0
      xmlErrMemory(ctxt, "xmlSAX2AttributeNs");
2047
0
      return;
2048
0
  }
2049
1.87M
    }
2050
2051
1.90M
    if ((ctxt->replaceEntities == 0) && (!ctxt->html)) {
2052
41
  xmlNodePtr tmp;
2053
2054
  /*
2055
   * We know that if there is an entity reference, then
2056
   * the string has been dup'ed and terminates with 0
2057
   * otherwise with ' or "
2058
   */
2059
41
  if (*valueend != 0) {
2060
3
      tmp = xmlSAX2TextNode(ctxt, value, valueend - value);
2061
3
      ret->children = tmp;
2062
3
      ret->last = tmp;
2063
3
      if (tmp != NULL) {
2064
3
    tmp->doc = ret->doc;
2065
3
    tmp->parent = (xmlNodePtr) ret;
2066
3
      }
2067
38
  } else {
2068
38
      ret->children = xmlStringLenGetNodeList(ctxt->myDoc, value,
2069
38
                valueend - value);
2070
38
      tmp = ret->children;
2071
76
      while (tmp != NULL) {
2072
38
          tmp->doc = ret->doc;
2073
38
    tmp->parent = (xmlNodePtr) ret;
2074
38
    if (tmp->next == NULL)
2075
38
        ret->last = tmp;
2076
38
    tmp = tmp->next;
2077
38
      }
2078
38
  }
2079
1.90M
    } else if (value != NULL) {
2080
1.90M
  xmlNodePtr tmp;
2081
2082
1.90M
  tmp = xmlSAX2TextNode(ctxt, value, valueend - value);
2083
1.90M
  ret->children = tmp;
2084
1.90M
  ret->last = tmp;
2085
1.90M
  if (tmp != NULL) {
2086
1.90M
      tmp->doc = ret->doc;
2087
1.90M
      tmp->parent = (xmlNodePtr) ret;
2088
1.90M
  }
2089
1.90M
    }
2090
2091
1.90M
#ifdef LIBXML_VALID_ENABLED
2092
1.90M
    if ((!ctxt->html) && ctxt->validate && ctxt->wellFormed &&
2093
1.90M
        ctxt->myDoc && ctxt->myDoc->intSubset) {
2094
  /*
2095
   * If we don't substitute entities, the validation should be
2096
   * done on a value with replaced entities anyway.
2097
   */
2098
0
        if (!ctxt->replaceEntities) {
2099
0
      dup = xmlSAX2DecodeAttrEntities(ctxt, value, valueend);
2100
0
      if (dup == NULL) {
2101
0
          if (*valueend == 0) {
2102
0
        ctxt->valid &= xmlValidateOneAttribute(&ctxt->vctxt,
2103
0
            ctxt->myDoc, ctxt->node, ret, value);
2104
0
    } else {
2105
        /*
2106
         * That should already be normalized.
2107
         * cheaper to finally allocate here than duplicate
2108
         * entry points in the full validation code
2109
         */
2110
0
        dup = xmlStrndup(value, valueend - value);
2111
2112
0
        ctxt->valid &= xmlValidateOneAttribute(&ctxt->vctxt,
2113
0
            ctxt->myDoc, ctxt->node, ret, dup);
2114
0
    }
2115
0
      } else {
2116
          /*
2117
     * dup now contains a string of the flattened attribute
2118
     * content with entities substituted. Check if we need to
2119
     * apply an extra layer of normalization.
2120
     * It need to be done twice ... it's an extra burden related
2121
     * to the ability to keep references in attributes
2122
     */
2123
0
    if (ctxt->attsSpecial != NULL) {
2124
0
        xmlChar *nvalnorm;
2125
0
        xmlChar fn[50];
2126
0
        xmlChar *fullname;
2127
2128
0
        fullname = xmlBuildQName(localname, prefix, fn, 50);
2129
0
        if (fullname != NULL) {
2130
0
      ctxt->vctxt.valid = 1;
2131
0
            nvalnorm = xmlValidCtxtNormalizeAttributeValue(
2132
0
                       &ctxt->vctxt, ctxt->myDoc,
2133
0
           ctxt->node, fullname, dup);
2134
0
      if (ctxt->vctxt.valid != 1)
2135
0
          ctxt->valid = 0;
2136
2137
0
      if ((fullname != fn) && (fullname != localname))
2138
0
          xmlFree(fullname);
2139
0
      if (nvalnorm != NULL) {
2140
0
          xmlFree(dup);
2141
0
          dup = nvalnorm;
2142
0
      }
2143
0
        }
2144
0
    }
2145
2146
0
    ctxt->valid &= xmlValidateOneAttribute(&ctxt->vctxt,
2147
0
              ctxt->myDoc, ctxt->node, ret, dup);
2148
0
      }
2149
0
  } else {
2150
      /*
2151
       * if entities already have been substituted, then
2152
       * the attribute as passed is already normalized
2153
       */
2154
0
      dup = xmlStrndup(value, valueend - value);
2155
2156
0
      ctxt->valid &= xmlValidateOneAttribute(&ctxt->vctxt,
2157
0
                               ctxt->myDoc, ctxt->node, ret, dup);
2158
0
  }
2159
0
    } else
2160
1.90M
#endif /* LIBXML_VALID_ENABLED */
2161
1.90M
           if (((ctxt->loadsubset & XML_SKIP_IDS) == 0) &&
2162
1.90M
         (((ctxt->replaceEntities == 0) && (ctxt->external != 2)) ||
2163
1.90M
          ((ctxt->replaceEntities != 0) && (ctxt->inSubset == 0))) &&
2164
               /* Don't create IDs containing entity references */
2165
1.90M
               (ret->children != NULL) &&
2166
1.90M
               (ret->children->type == XML_TEXT_NODE) &&
2167
1.90M
               (ret->children->next == NULL)) {
2168
1.90M
        xmlChar *content = ret->children->content;
2169
        /*
2170
   * when validating, the ID registration is done at the attribute
2171
   * validation level. Otherwise we have to do specific handling here.
2172
   */
2173
1.90M
        if ((prefix == ctxt->str_xml) &&
2174
1.90M
             (localname[0] == 'i') && (localname[1] == 'd') &&
2175
1.90M
       (localname[2] == 0)) {
2176
      /*
2177
       * Add the xml:id value
2178
       *
2179
       * Open issue: normalization of the value.
2180
       */
2181
81
#if defined(LIBXML_SAX1_ENABLED) || defined(LIBXML_HTML_ENABLED) || defined(LIBXML_WRITER_ENABLED) || defined(LIBXML_LEGACY_ENABLED)
2182
81
#ifdef LIBXML_VALID_ENABLED
2183
81
      if (xmlValidateNCName(content, 1) != 0) {
2184
15
          xmlErrValid(ctxt, XML_DTD_XMLID_VALUE,
2185
15
          "xml:id : attribute value %s is not an NCName\n",
2186
15
          (const char *) content, NULL);
2187
15
      }
2188
81
#endif
2189
81
#endif
2190
81
      xmlAddID(&ctxt->vctxt, ctxt->myDoc, content, ret);
2191
1.90M
  } else if (xmlIsID(ctxt->myDoc, ctxt->node, ret)) {
2192
48.9k
      xmlAddID(&ctxt->vctxt, ctxt->myDoc, content, ret);
2193
1.86M
  } else if (xmlIsRef(ctxt->myDoc, ctxt->node, ret)) {
2194
110k
      xmlAddRef(&ctxt->vctxt, ctxt->myDoc, content, ret);
2195
110k
  }
2196
1.90M
    }
2197
1.90M
    if (dup != NULL)
2198
0
  xmlFree(dup);
2199
1.90M
}
2200
2201
/**
2202
 * xmlSAX2StartElementNs:
2203
 * @ctx:  the user data (XML parser context)
2204
 * @localname:  the local name of the element
2205
 * @prefix:  the element namespace prefix if available
2206
 * @URI:  the element namespace name if available
2207
 * @nb_namespaces:  number of namespace definitions on that node
2208
 * @namespaces:  pointer to the array of prefix/URI pairs namespace definitions
2209
 * @nb_attributes:  the number of attributes on that node
2210
 * @nb_defaulted:  the number of defaulted attributes.
2211
 * @attributes:  pointer to the array of (localname/prefix/URI/value/end)
2212
 *               attribute values.
2213
 *
2214
 * SAX2 callback when an element start has been detected by the parser.
2215
 * It provides the namespace information for the element, as well as
2216
 * the new namespace declarations on the element.
2217
 */
2218
void
2219
xmlSAX2StartElementNs(void *ctx,
2220
                      const xmlChar *localname,
2221
          const xmlChar *prefix,
2222
          const xmlChar *URI,
2223
          int nb_namespaces,
2224
          const xmlChar **namespaces,
2225
          int nb_attributes,
2226
          int nb_defaulted,
2227
          const xmlChar **attributes)
2228
1.37M
{
2229
1.37M
    xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
2230
1.37M
    xmlNodePtr ret;
2231
1.37M
    xmlNodePtr parent;
2232
1.37M
    xmlNsPtr last = NULL, ns;
2233
1.37M
    const xmlChar *uri, *pref;
2234
1.37M
    xmlChar *lname = NULL;
2235
1.37M
    int i, j;
2236
2237
1.37M
    if (ctx == NULL) return;
2238
1.37M
    parent = ctxt->node;
2239
    /*
2240
     * First check on validity:
2241
     */
2242
1.37M
    if (ctxt->validate && (ctxt->myDoc->extSubset == NULL) &&
2243
1.37M
        ((ctxt->myDoc->intSubset == NULL) ||
2244
191
   ((ctxt->myDoc->intSubset->notations == NULL) &&
2245
26
    (ctxt->myDoc->intSubset->elements == NULL) &&
2246
26
    (ctxt->myDoc->intSubset->attributes == NULL) &&
2247
168
    (ctxt->myDoc->intSubset->entities == NULL)))) {
2248
168
  xmlErrValid(ctxt, XML_DTD_NO_DTD,
2249
168
    "Validation failed: no DTD found !", NULL, NULL);
2250
168
  ctxt->validate = 0;
2251
168
    }
2252
2253
    /*
2254
     * Take care of the rare case of an undefined namespace prefix
2255
     */
2256
1.37M
    if ((prefix != NULL) && (URI == NULL)) {
2257
302
        if (ctxt->dictNames) {
2258
291
      const xmlChar *fullname;
2259
2260
291
      fullname = xmlDictQLookup(ctxt->dict, prefix, localname);
2261
291
      if (fullname != NULL)
2262
291
          localname = fullname;
2263
291
  } else {
2264
11
      lname = xmlBuildQName(localname, prefix, NULL, 0);
2265
11
  }
2266
302
    }
2267
    /*
2268
     * allocate the node
2269
     */
2270
1.37M
    if (ctxt->freeElems != NULL) {
2271
19.2k
        ret = ctxt->freeElems;
2272
19.2k
  ctxt->freeElems = ret->next;
2273
19.2k
  ctxt->freeElemsNr--;
2274
19.2k
  memset(ret, 0, sizeof(xmlNode));
2275
19.2k
        ret->doc = ctxt->myDoc;
2276
19.2k
  ret->type = XML_ELEMENT_NODE;
2277
2278
19.2k
  if (ctxt->dictNames)
2279
19.2k
      ret->name = localname;
2280
0
  else {
2281
0
      if (lname == NULL)
2282
0
    ret->name = xmlStrdup(localname);
2283
0
      else
2284
0
          ret->name = lname;
2285
0
      if (ret->name == NULL) {
2286
0
          xmlSAX2ErrMemory(ctxt, "xmlSAX2StartElementNs");
2287
0
    return;
2288
0
      }
2289
0
  }
2290
19.2k
  if ((__xmlRegisterCallbacks) && (xmlRegisterNodeDefaultValue))
2291
0
      xmlRegisterNodeDefaultValue(ret);
2292
1.35M
    } else {
2293
1.35M
  if (ctxt->dictNames)
2294
1.35M
      ret = xmlNewDocNodeEatName(ctxt->myDoc, NULL,
2295
1.35M
                                 (xmlChar *) localname, NULL);
2296
197
  else if (lname == NULL)
2297
186
      ret = xmlNewDocNode(ctxt->myDoc, NULL, localname, NULL);
2298
11
  else
2299
11
      ret = xmlNewDocNodeEatName(ctxt->myDoc, NULL,
2300
11
                                 (xmlChar *) lname, NULL);
2301
1.35M
  if (ret == NULL) {
2302
0
      xmlSAX2ErrMemory(ctxt, "xmlSAX2StartElementNs");
2303
0
      return;
2304
0
  }
2305
1.35M
    }
2306
1.37M
    if (ctxt->linenumbers) {
2307
1.37M
  if (ctxt->input != NULL) {
2308
1.37M
      if ((unsigned) ctxt->input->line < (unsigned) USHRT_MAX)
2309
1.37M
    ret->line = ctxt->input->line;
2310
240
      else
2311
240
          ret->line = USHRT_MAX;
2312
1.37M
  }
2313
1.37M
    }
2314
2315
1.37M
    if (parent == NULL) {
2316
6.05k
        xmlAddChild((xmlNodePtr) ctxt->myDoc, (xmlNodePtr) ret);
2317
6.05k
    }
2318
    /*
2319
     * Build the namespace list
2320
     */
2321
1.37M
    for (i = 0,j = 0;j < nb_namespaces;j++) {
2322
1.35k
        pref = namespaces[i++];
2323
1.35k
  uri = namespaces[i++];
2324
1.35k
  ns = xmlNewNs(NULL, uri, pref);
2325
1.35k
  if (ns != NULL) {
2326
1.35k
      if (last == NULL) {
2327
941
          ret->nsDef = last = ns;
2328
941
      } else {
2329
417
          last->next = ns;
2330
417
    last = ns;
2331
417
      }
2332
1.35k
      if ((URI != NULL) && (prefix == pref))
2333
860
    ret->ns = ns;
2334
1.35k
  } else {
2335
            /*
2336
             * any out of memory error would already have been raised
2337
             * but we can't be guaranteed it's the actual error due to the
2338
             * API, best is to skip in this case
2339
             */
2340
0
      continue;
2341
0
  }
2342
1.35k
#ifdef LIBXML_VALID_ENABLED
2343
1.35k
  if ((!ctxt->html) && ctxt->validate && ctxt->wellFormed &&
2344
1.35k
      ctxt->myDoc && ctxt->myDoc->intSubset) {
2345
0
      ctxt->valid &= xmlValidateOneNamespace(&ctxt->vctxt, ctxt->myDoc,
2346
0
                                             ret, prefix, ns, uri);
2347
0
  }
2348
1.35k
#endif /* LIBXML_VALID_ENABLED */
2349
1.35k
    }
2350
1.37M
    ctxt->nodemem = -1;
2351
2352
    /*
2353
     * We are parsing a new node.
2354
     */
2355
1.37M
    if (nodePush(ctxt, ret) < 0) {
2356
0
        xmlUnlinkNode(ret);
2357
0
        xmlFreeNode(ret);
2358
0
        return;
2359
0
    }
2360
2361
    /*
2362
     * Link the child element
2363
     */
2364
1.37M
    if (parent != NULL) {
2365
1.37M
        if (parent->type == XML_ELEMENT_NODE) {
2366
1.37M
      xmlAddChild(parent, ret);
2367
1.37M
  } else {
2368
0
      xmlAddSibling(parent, ret);
2369
0
  }
2370
1.37M
    }
2371
2372
    /*
2373
     * Insert the defaulted attributes from the DTD only if requested:
2374
     */
2375
1.37M
    if ((nb_defaulted != 0) &&
2376
1.37M
        ((ctxt->loadsubset & XML_COMPLETE_ATTRS) == 0))
2377
24.7k
  nb_attributes -= nb_defaulted;
2378
2379
    /*
2380
     * Search the namespace if it wasn't already found
2381
     * Note that, if prefix is NULL, this searches for the default Ns
2382
     */
2383
1.37M
    if ((URI != NULL) && (ret->ns == NULL)) {
2384
6.98k
        ret->ns = xmlSearchNs(ctxt->myDoc, parent, prefix);
2385
6.98k
  if ((ret->ns == NULL) && (xmlStrEqual(prefix, BAD_CAST "xml"))) {
2386
12
      ret->ns = xmlSearchNs(ctxt->myDoc, ret, prefix);
2387
12
  }
2388
6.98k
  if (ret->ns == NULL) {
2389
0
      ns = xmlNewNs(ret, NULL, prefix);
2390
0
      if (ns == NULL) {
2391
2392
0
          xmlSAX2ErrMemory(ctxt, "xmlSAX2StartElementNs");
2393
0
    return;
2394
0
      }
2395
0
            if (prefix != NULL)
2396
0
                xmlNsWarnMsg(ctxt, XML_NS_ERR_UNDEFINED_NAMESPACE,
2397
0
                             "Namespace prefix %s was not found\n",
2398
0
                             prefix, NULL);
2399
0
            else
2400
0
                xmlNsWarnMsg(ctxt, XML_NS_ERR_UNDEFINED_NAMESPACE,
2401
0
                             "Namespace default prefix was not found\n",
2402
0
                             NULL, NULL);
2403
0
  }
2404
6.98k
    }
2405
2406
    /*
2407
     * process all the other attributes
2408
     */
2409
1.37M
    if (nb_attributes > 0) {
2410
2.96M
        for (j = 0,i = 0;i < nb_attributes;i++,j+=5) {
2411
      /*
2412
       * Handle the rare case of an undefined attribute prefix
2413
       */
2414
1.90M
      if ((attributes[j+1] != NULL) && (attributes[j+2] == NULL)) {
2415
62
    if (ctxt->dictNames) {
2416
59
        const xmlChar *fullname;
2417
2418
59
        fullname = xmlDictQLookup(ctxt->dict, attributes[j+1],
2419
59
                                  attributes[j]);
2420
59
        if (fullname != NULL) {
2421
59
      xmlSAX2AttributeNs(ctxt, fullname, NULL,
2422
59
                         attributes[j+3], attributes[j+4]);
2423
59
            continue;
2424
59
        }
2425
59
    } else {
2426
3
        lname = xmlBuildQName(attributes[j], attributes[j+1],
2427
3
                              NULL, 0);
2428
3
        if (lname != NULL) {
2429
3
      xmlSAX2AttributeNs(ctxt, lname, NULL,
2430
3
                         attributes[j+3], attributes[j+4]);
2431
3
      xmlFree(lname);
2432
3
            continue;
2433
3
        }
2434
3
    }
2435
62
      }
2436
1.90M
      xmlSAX2AttributeNs(ctxt, attributes[j], attributes[j+1],
2437
1.90M
             attributes[j+3], attributes[j+4]);
2438
1.90M
  }
2439
1.05M
    }
2440
2441
1.37M
#ifdef LIBXML_VALID_ENABLED
2442
    /*
2443
     * If it's the Document root, finish the DTD validation and
2444
     * check the document root element for validity
2445
     */
2446
1.37M
    if ((ctxt->validate) &&
2447
1.37M
        ((ctxt->vctxt.flags & XML_VCTXT_DTD_VALIDATED) == 0)) {
2448
26
  int chk;
2449
2450
26
  chk = xmlValidateDtdFinal(&ctxt->vctxt, ctxt->myDoc);
2451
26
  if (chk <= 0)
2452
0
      ctxt->valid = 0;
2453
26
  if (chk < 0)
2454
0
      ctxt->wellFormed = 0;
2455
26
  ctxt->valid &= xmlValidateRoot(&ctxt->vctxt, ctxt->myDoc);
2456
26
  ctxt->vctxt.flags |= XML_VCTXT_DTD_VALIDATED;
2457
26
    }
2458
1.37M
#endif /* LIBXML_VALID_ENABLED */
2459
1.37M
}
2460
2461
/**
2462
 * xmlSAX2EndElementNs:
2463
 * @ctx:  the user data (XML parser context)
2464
 * @localname:  the local name of the element
2465
 * @prefix:  the element namespace prefix if available
2466
 * @URI:  the element namespace name if available
2467
 *
2468
 * SAX2 callback when an element end has been detected by the parser.
2469
 * It provides the namespace information for the element.
2470
 */
2471
void
2472
xmlSAX2EndElementNs(void *ctx,
2473
                    const xmlChar * localname ATTRIBUTE_UNUSED,
2474
                    const xmlChar * prefix ATTRIBUTE_UNUSED,
2475
        const xmlChar * URI ATTRIBUTE_UNUSED)
2476
1.36M
{
2477
1.36M
    xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
2478
1.36M
    xmlParserNodeInfo node_info;
2479
1.36M
    xmlNodePtr cur;
2480
2481
1.36M
    if (ctx == NULL) return;
2482
1.36M
    cur = ctxt->node;
2483
    /* Capture end position and add node */
2484
1.36M
    if ((ctxt->record_info) && (cur != NULL)) {
2485
0
        node_info.end_pos = ctxt->input->cur - ctxt->input->base;
2486
0
        node_info.end_line = ctxt->input->line;
2487
0
        node_info.node = cur;
2488
0
        xmlParserAddNodeInfo(ctxt, &node_info);
2489
0
    }
2490
1.36M
    ctxt->nodemem = -1;
2491
2492
1.36M
#ifdef LIBXML_VALID_ENABLED
2493
1.36M
    if (ctxt->validate && ctxt->wellFormed &&
2494
1.36M
        ctxt->myDoc && ctxt->myDoc->intSubset)
2495
6
        ctxt->valid &= xmlValidateOneElement(&ctxt->vctxt, ctxt->myDoc, cur);
2496
1.36M
#endif /* LIBXML_VALID_ENABLED */
2497
2498
    /*
2499
     * end of parsing of this node.
2500
     */
2501
1.36M
    nodePop(ctxt);
2502
1.36M
}
2503
2504
/**
2505
 * xmlSAX2Reference:
2506
 * @ctx: the user data (XML parser context)
2507
 * @name:  The entity name
2508
 *
2509
 * called when an entity xmlSAX2Reference is detected.
2510
 */
2511
void
2512
xmlSAX2Reference(void *ctx, const xmlChar *name)
2513
14.9k
{
2514
14.9k
    xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
2515
14.9k
    xmlNodePtr ret;
2516
2517
14.9k
    if (ctx == NULL) return;
2518
#ifdef DEBUG_SAX
2519
    xmlGenericError(xmlGenericErrorContext,
2520
      "SAX.xmlSAX2Reference(%s)\n", name);
2521
#endif
2522
14.9k
    if (name[0] == '#')
2523
18
  ret = xmlNewCharRef(ctxt->myDoc, name);
2524
14.9k
    else
2525
14.9k
  ret = xmlNewReference(ctxt->myDoc, name);
2526
#ifdef DEBUG_SAX_TREE
2527
    xmlGenericError(xmlGenericErrorContext,
2528
      "add xmlSAX2Reference %s to %s \n", name, ctxt->node->name);
2529
#endif
2530
14.9k
    if (xmlAddChild(ctxt->node, ret) == NULL) {
2531
929
        xmlFreeNode(ret);
2532
929
    }
2533
14.9k
}
2534
2535
/**
2536
 * xmlSAX2Text:
2537
 * @ctx: the user data (XML parser context)
2538
 * @ch:  a xmlChar string
2539
 * @len: the number of xmlChar
2540
 * @type: text or cdata
2541
 *
2542
 * Append characters.
2543
 */
2544
static void
2545
xmlSAX2Text(xmlParserCtxtPtr ctxt, const xmlChar *ch, int len,
2546
            xmlElementType type)
2547
3.11M
{
2548
3.11M
    xmlNodePtr lastChild;
2549
2550
3.11M
    if (ctxt == NULL) return;
2551
#ifdef DEBUG_SAX
2552
    xmlGenericError(xmlGenericErrorContext,
2553
      "SAX.xmlSAX2Characters(%.30s, %d)\n", ch, len);
2554
#endif
2555
    /*
2556
     * Handle the data if any. If there is no child
2557
     * add it as content, otherwise if the last child is text,
2558
     * concatenate it, else create a new node of type text.
2559
     */
2560
2561
3.11M
    if (ctxt->node == NULL) {
2562
#ifdef DEBUG_SAX_TREE
2563
  xmlGenericError(xmlGenericErrorContext,
2564
    "add chars: ctxt->node == NULL !\n");
2565
#endif
2566
162k
        return;
2567
162k
    }
2568
2.95M
    lastChild = ctxt->node->last;
2569
#ifdef DEBUG_SAX_TREE
2570
    xmlGenericError(xmlGenericErrorContext,
2571
      "add chars to %s \n", ctxt->node->name);
2572
#endif
2573
2574
    /*
2575
     * Here we needed an accelerator mechanism in case of very large
2576
     * elements. Use an attribute in the structure !!!
2577
     */
2578
2.95M
    if (lastChild == NULL) {
2579
619k
        if (type == XML_TEXT_NODE)
2580
616k
            lastChild = xmlSAX2TextNode(ctxt, ch, len);
2581
2.76k
        else
2582
2.76k
            lastChild = xmlNewCDataBlock(ctxt->myDoc, ch, len);
2583
619k
  if (lastChild != NULL) {
2584
619k
      ctxt->node->children = lastChild;
2585
619k
      ctxt->node->last = lastChild;
2586
619k
      lastChild->parent = ctxt->node;
2587
619k
      lastChild->doc = ctxt->node->doc;
2588
619k
      ctxt->nodelen = len;
2589
619k
      ctxt->nodemem = len + 1;
2590
619k
  } else {
2591
0
      xmlSAX2ErrMemory(ctxt, "xmlSAX2Characters");
2592
0
      return;
2593
0
  }
2594
2.33M
    } else {
2595
2.33M
  int coalesceText = (lastChild != NULL) &&
2596
2.33M
      (lastChild->type == type) &&
2597
2.33M
      ((type != XML_TEXT_NODE) ||
2598
874k
             (lastChild->name == xmlStringText));
2599
2.33M
  if ((coalesceText) && (ctxt->nodemem != 0)) {
2600
      /*
2601
       * The whole point of maintaining nodelen and nodemem,
2602
       * xmlTextConcat is too costly, i.e. compute length,
2603
       * reallocate a new buffer, move data, append ch. Here
2604
       * We try to minimize realloc() uses and avoid copying
2605
       * and recomputing length over and over.
2606
       */
2607
828k
      if (lastChild->content == (xmlChar *)&(lastChild->properties)) {
2608
5.76k
    lastChild->content = xmlStrdup(lastChild->content);
2609
5.76k
    lastChild->properties = NULL;
2610
822k
      } else if ((ctxt->nodemem == ctxt->nodelen + 1) &&
2611
822k
                 (xmlDictOwns(ctxt->dict, lastChild->content))) {
2612
146
    lastChild->content = xmlStrdup(lastChild->content);
2613
146
      }
2614
828k
      if (lastChild->content == NULL) {
2615
0
    xmlSAX2ErrMemory(ctxt, "xmlSAX2Characters: xmlStrdup returned NULL");
2616
0
    return;
2617
0
      }
2618
828k
      if (ctxt->nodelen > INT_MAX - len) {
2619
0
                xmlSAX2ErrMemory(ctxt, "xmlSAX2Characters overflow prevented");
2620
0
                return;
2621
0
      }
2622
828k
            if ((ctxt->nodelen + len > XML_MAX_TEXT_LENGTH) &&
2623
828k
                ((ctxt->options & XML_PARSE_HUGE) == 0)) {
2624
0
                xmlSAX2ErrMemory(ctxt, "xmlSAX2Characters: huge text node");
2625
0
                return;
2626
0
            }
2627
828k
      if (ctxt->nodelen + len >= ctxt->nodemem) {
2628
83.8k
    xmlChar *newbuf;
2629
83.8k
    int size;
2630
2631
83.8k
    size = ctxt->nodemem > INT_MAX - len ?
2632
0
                       INT_MAX :
2633
83.8k
                       ctxt->nodemem + len;
2634
83.8k
    size = size > INT_MAX / 2 ? INT_MAX : size * 2;
2635
83.8k
                newbuf = (xmlChar *) xmlRealloc(lastChild->content,size);
2636
83.8k
    if (newbuf == NULL) {
2637
0
        xmlSAX2ErrMemory(ctxt, "xmlSAX2Characters");
2638
0
        return;
2639
0
    }
2640
83.8k
    ctxt->nodemem = size;
2641
83.8k
    lastChild->content = newbuf;
2642
83.8k
      }
2643
828k
      memcpy(&lastChild->content[ctxt->nodelen], ch, len);
2644
828k
      ctxt->nodelen += len;
2645
828k
      lastChild->content[ctxt->nodelen] = 0;
2646
1.50M
  } else if (coalesceText) {
2647
45.7k
      if (xmlTextConcat(lastChild, ch, len)) {
2648
0
    xmlSAX2ErrMemory(ctxt, "xmlSAX2Characters");
2649
0
      }
2650
45.7k
      if (ctxt->node->children != NULL) {
2651
45.7k
    ctxt->nodelen = xmlStrlen(lastChild->content);
2652
45.7k
    ctxt->nodemem = ctxt->nodelen + 1;
2653
45.7k
      }
2654
1.46M
  } else {
2655
      /* Mixed content, first time */
2656
1.46M
            if (type == XML_TEXT_NODE) {
2657
1.46M
                lastChild = xmlSAX2TextNode(ctxt, ch, len);
2658
1.46M
                if (lastChild != NULL)
2659
1.46M
                    lastChild->doc = ctxt->myDoc;
2660
1.46M
            } else
2661
58
                lastChild = xmlNewCDataBlock(ctxt->myDoc, ch, len);
2662
1.46M
      if (lastChild != NULL) {
2663
1.46M
    xmlAddChild(ctxt->node, lastChild);
2664
1.46M
    if (ctxt->node->children != NULL) {
2665
1.46M
        ctxt->nodelen = len;
2666
1.46M
        ctxt->nodemem = len + 1;
2667
1.46M
    }
2668
1.46M
      }
2669
1.46M
  }
2670
2.33M
    }
2671
2.95M
}
2672
2673
/**
2674
 * xmlSAX2Characters:
2675
 * @ctx: the user data (XML parser context)
2676
 * @ch:  a xmlChar string
2677
 * @len: the number of xmlChar
2678
 *
2679
 * receiving some chars from the parser.
2680
 */
2681
void
2682
xmlSAX2Characters(void *ctx, const xmlChar *ch, int len)
2683
3.11M
{
2684
3.11M
    xmlSAX2Text((xmlParserCtxtPtr) ctx, ch, len, XML_TEXT_NODE);
2685
3.11M
}
2686
2687
/**
2688
 * xmlSAX2IgnorableWhitespace:
2689
 * @ctx: the user data (XML parser context)
2690
 * @ch:  a xmlChar string
2691
 * @len: the number of xmlChar
2692
 *
2693
 * receiving some ignorable whitespaces from the parser.
2694
 * UNUSED: by default the DOM building will use xmlSAX2Characters
2695
 */
2696
void
2697
xmlSAX2IgnorableWhitespace(void *ctx ATTRIBUTE_UNUSED, const xmlChar *ch ATTRIBUTE_UNUSED, int len ATTRIBUTE_UNUSED)
2698
223k
{
2699
    /* xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx; */
2700
#ifdef DEBUG_SAX
2701
    xmlGenericError(xmlGenericErrorContext,
2702
      "SAX.xmlSAX2IgnorableWhitespace(%.30s, %d)\n", ch, len);
2703
#endif
2704
223k
}
2705
2706
/**
2707
 * xmlSAX2ProcessingInstruction:
2708
 * @ctx: the user data (XML parser context)
2709
 * @target:  the target name
2710
 * @data: the PI data's
2711
 *
2712
 * A processing instruction has been parsed.
2713
 */
2714
void
2715
xmlSAX2ProcessingInstruction(void *ctx, const xmlChar *target,
2716
                      const xmlChar *data)
2717
2.66k
{
2718
2.66k
    xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
2719
2.66k
    xmlNodePtr ret;
2720
2.66k
    xmlNodePtr parent;
2721
2722
2.66k
    if (ctx == NULL) return;
2723
2.66k
    parent = ctxt->node;
2724
#ifdef DEBUG_SAX
2725
    xmlGenericError(xmlGenericErrorContext,
2726
      "SAX.xmlSAX2ProcessingInstruction(%s, %s)\n", target, data);
2727
#endif
2728
2729
2.66k
    ret = xmlNewDocPI(ctxt->myDoc, target, data);
2730
2.66k
    if (ret == NULL) return;
2731
2732
2.66k
    if (ctxt->linenumbers) {
2733
2.66k
  if (ctxt->input != NULL) {
2734
2.66k
      if ((unsigned) ctxt->input->line < (unsigned) USHRT_MAX)
2735
2.66k
    ret->line = ctxt->input->line;
2736
0
      else
2737
0
          ret->line = USHRT_MAX;
2738
2.66k
  }
2739
2.66k
    }
2740
2.66k
    if (ctxt->inSubset == 1) {
2741
0
  xmlAddChild((xmlNodePtr) ctxt->myDoc->intSubset, ret);
2742
0
  return;
2743
2.66k
    } else if (ctxt->inSubset == 2) {
2744
0
  xmlAddChild((xmlNodePtr) ctxt->myDoc->extSubset, ret);
2745
0
  return;
2746
0
    }
2747
2.66k
    if (parent == NULL) {
2748
#ifdef DEBUG_SAX_TREE
2749
      xmlGenericError(xmlGenericErrorContext,
2750
        "Setting PI %s as root\n", target);
2751
#endif
2752
2.43k
        xmlAddChild((xmlNodePtr) ctxt->myDoc, (xmlNodePtr) ret);
2753
2.43k
  return;
2754
2.43k
    }
2755
229
    if (parent->type == XML_ELEMENT_NODE) {
2756
#ifdef DEBUG_SAX_TREE
2757
  xmlGenericError(xmlGenericErrorContext,
2758
    "adding PI %s child to %s\n", target, parent->name);
2759
#endif
2760
229
  xmlAddChild(parent, ret);
2761
229
    } else {
2762
#ifdef DEBUG_SAX_TREE
2763
  xmlGenericError(xmlGenericErrorContext,
2764
    "adding PI %s sibling to ", target);
2765
  xmlDebugDumpOneNode(stderr, parent, 0);
2766
#endif
2767
0
  xmlAddSibling(parent, ret);
2768
0
    }
2769
229
}
2770
2771
/**
2772
 * xmlSAX2Comment:
2773
 * @ctx: the user data (XML parser context)
2774
 * @value:  the xmlSAX2Comment content
2775
 *
2776
 * A xmlSAX2Comment has been parsed.
2777
 */
2778
void
2779
xmlSAX2Comment(void *ctx, const xmlChar *value)
2780
2.08M
{
2781
2.08M
    xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
2782
2.08M
    xmlNodePtr ret;
2783
2.08M
    xmlNodePtr parent;
2784
2785
2.08M
    if (ctx == NULL) return;
2786
2.08M
    parent = ctxt->node;
2787
#ifdef DEBUG_SAX
2788
    xmlGenericError(xmlGenericErrorContext, "SAX.xmlSAX2Comment(%s)\n", value);
2789
#endif
2790
2.08M
    ret = xmlNewDocComment(ctxt->myDoc, value);
2791
2.08M
    if (ret == NULL) return;
2792
2.08M
    if (ctxt->linenumbers) {
2793
2.08M
  if (ctxt->input != NULL) {
2794
2.08M
      if ((unsigned) ctxt->input->line < (unsigned) USHRT_MAX)
2795
2.08M
    ret->line = ctxt->input->line;
2796
95
      else
2797
95
          ret->line = USHRT_MAX;
2798
2.08M
  }
2799
2.08M
    }
2800
2801
2.08M
    if (ctxt->inSubset == 1) {
2802
1.92M
  xmlAddChild((xmlNodePtr) ctxt->myDoc->intSubset, ret);
2803
1.92M
  return;
2804
1.92M
    } else if (ctxt->inSubset == 2) {
2805
131k
  xmlAddChild((xmlNodePtr) ctxt->myDoc->extSubset, ret);
2806
131k
  return;
2807
131k
    }
2808
27.1k
    if (parent == NULL) {
2809
#ifdef DEBUG_SAX_TREE
2810
      xmlGenericError(xmlGenericErrorContext,
2811
        "Setting xmlSAX2Comment as root\n");
2812
#endif
2813
4.35k
        xmlAddChild((xmlNodePtr) ctxt->myDoc, (xmlNodePtr) ret);
2814
4.35k
  return;
2815
4.35k
    }
2816
22.7k
    if (parent->type == XML_ELEMENT_NODE) {
2817
#ifdef DEBUG_SAX_TREE
2818
  xmlGenericError(xmlGenericErrorContext,
2819
    "adding xmlSAX2Comment child to %s\n", parent->name);
2820
#endif
2821
22.7k
  xmlAddChild(parent, ret);
2822
22.7k
    } else {
2823
#ifdef DEBUG_SAX_TREE
2824
  xmlGenericError(xmlGenericErrorContext,
2825
    "adding xmlSAX2Comment sibling to ");
2826
  xmlDebugDumpOneNode(stderr, parent, 0);
2827
#endif
2828
0
  xmlAddSibling(parent, ret);
2829
0
    }
2830
22.7k
}
2831
2832
/**
2833
 * xmlSAX2CDataBlock:
2834
 * @ctx: the user data (XML parser context)
2835
 * @value:  The pcdata content
2836
 * @len:  the block length
2837
 *
2838
 * called when a pcdata block has been parsed
2839
 */
2840
void
2841
xmlSAX2CDataBlock(void *ctx, const xmlChar *value, int len)
2842
3.17k
{
2843
3.17k
    xmlSAX2Text((xmlParserCtxtPtr) ctx, value, len, XML_CDATA_SECTION_NODE);
2844
3.17k
}
2845
2846
/*
 * Library-wide default SAX version (1 or 2), initially 2.
 * Read by xmlSAX2InitDefaultSAXHandler() and replaced by
 * xmlSAXDefaultVersion() when SAX1 support is compiled in.
 */
static int xmlSAX2DefaultVersionValue = 2;
2847
2848
#ifdef LIBXML_SAX1_ENABLED
2849
/**
2850
 * xmlSAXDefaultVersion:
2851
 * @version:  the version, 1 or 2
2852
 *
2853
 * DEPRECATED: Use parser option XML_PARSE_SAX1.
2854
 *
2855
 * Set the default version of SAX used globally by the library.
2856
 * By default, during initialization the default is set to 2.
2857
 * Note that it is generally a better coding style to use
2858
 * xmlSAXVersion() to set up the version explicitly for a given
2859
 * parsing context.
2860
 *
2861
 * Returns the previous value in case of success and -1 in case of error.
2862
 */
2863
int
2864
xmlSAXDefaultVersion(int version)
2865
0
{
2866
0
    int ret = xmlSAX2DefaultVersionValue;
2867
2868
0
    if ((version != 1) && (version != 2))
2869
0
        return(-1);
2870
0
    xmlSAX2DefaultVersionValue = version;
2871
0
    return(ret);
2872
0
}
2873
#endif /* LIBXML_SAX1_ENABLED */
2874
2875
/**
2876
 * xmlSAXVersion:
2877
 * @hdlr:  the SAX handler
2878
 * @version:  the version, 1 or 2
2879
 *
2880
 * Initialize the default XML SAX handler according to the version
2881
 *
2882
 * Returns 0 in case of success and -1 in case of error.
2883
 */
2884
int
2885
xmlSAXVersion(xmlSAXHandler *hdlr, int version)
2886
27.6k
{
2887
27.6k
    if (hdlr == NULL) return(-1);
2888
27.6k
    if (version == 2) {
2889
27.6k
  hdlr->startElement = NULL;
2890
27.6k
  hdlr->endElement = NULL;
2891
27.6k
  hdlr->startElementNs = xmlSAX2StartElementNs;
2892
27.6k
  hdlr->endElementNs = xmlSAX2EndElementNs;
2893
27.6k
  hdlr->serror = NULL;
2894
27.6k
  hdlr->initialized = XML_SAX2_MAGIC;
2895
27.6k
#ifdef LIBXML_SAX1_ENABLED
2896
27.6k
    } else if (version == 1) {
2897
0
  hdlr->startElement = xmlSAX2StartElement;
2898
0
  hdlr->endElement = xmlSAX2EndElement;
2899
0
  hdlr->initialized = 1;
2900
0
#endif /* LIBXML_SAX1_ENABLED */
2901
0
    } else
2902
0
        return(-1);
2903
27.6k
    hdlr->internalSubset = xmlSAX2InternalSubset;
2904
27.6k
    hdlr->externalSubset = xmlSAX2ExternalSubset;
2905
27.6k
    hdlr->isStandalone = xmlSAX2IsStandalone;
2906
27.6k
    hdlr->hasInternalSubset = xmlSAX2HasInternalSubset;
2907
27.6k
    hdlr->hasExternalSubset = xmlSAX2HasExternalSubset;
2908
27.6k
    hdlr->resolveEntity = xmlSAX2ResolveEntity;
2909
27.6k
    hdlr->getEntity = xmlSAX2GetEntity;
2910
27.6k
    hdlr->getParameterEntity = xmlSAX2GetParameterEntity;
2911
27.6k
    hdlr->entityDecl = xmlSAX2EntityDecl;
2912
27.6k
    hdlr->attributeDecl = xmlSAX2AttributeDecl;
2913
27.6k
    hdlr->elementDecl = xmlSAX2ElementDecl;
2914
27.6k
    hdlr->notationDecl = xmlSAX2NotationDecl;
2915
27.6k
    hdlr->unparsedEntityDecl = xmlSAX2UnparsedEntityDecl;
2916
27.6k
    hdlr->setDocumentLocator = xmlSAX2SetDocumentLocator;
2917
27.6k
    hdlr->startDocument = xmlSAX2StartDocument;
2918
27.6k
    hdlr->endDocument = xmlSAX2EndDocument;
2919
27.6k
    hdlr->reference = xmlSAX2Reference;
2920
27.6k
    hdlr->characters = xmlSAX2Characters;
2921
27.6k
    hdlr->cdataBlock = xmlSAX2CDataBlock;
2922
27.6k
    hdlr->ignorableWhitespace = xmlSAX2Characters;
2923
27.6k
    hdlr->processingInstruction = xmlSAX2ProcessingInstruction;
2924
27.6k
    hdlr->comment = xmlSAX2Comment;
2925
27.6k
    hdlr->warning = xmlParserWarning;
2926
27.6k
    hdlr->error = xmlParserError;
2927
27.6k
    hdlr->fatalError = xmlParserError;
2928
2929
27.6k
    return(0);
2930
27.6k
}
2931
2932
/**
2933
 * xmlSAX2InitDefaultSAXHandler:
2934
 * @hdlr:  the SAX handler
2935
 * @warning:  flag if non-zero sets the handler warning procedure
2936
 *
2937
 * Initialize the default XML SAX2 handler
2938
 */
2939
void
2940
xmlSAX2InitDefaultSAXHandler(xmlSAXHandler *hdlr, int warning)
2941
0
{
2942
0
    if ((hdlr == NULL) || (hdlr->initialized != 0))
2943
0
  return;
2944
2945
0
    xmlSAXVersion(hdlr, xmlSAX2DefaultVersionValue);
2946
0
    if (warning == 0)
2947
0
  hdlr->warning = NULL;
2948
0
    else
2949
0
  hdlr->warning = xmlParserWarning;
2950
0
}
2951
2952
/**
 * xmlDefaultSAXHandlerInit:
 *
 * DEPRECATED: This function is a no-op. Call xmlInitParser to
 * initialize the library.
 *
 * The body is empty; calling it has no effect.
 */
void
xmlDefaultSAXHandlerInit(void)
{
    /* Intentionally empty. */
}
2964
2965
#ifdef LIBXML_HTML_ENABLED
2966
2967
/**
2968
 * xmlSAX2InitHtmlDefaultSAXHandler:
2969
 * @hdlr:  the SAX handler
2970
 *
2971
 * Initialize the default HTML SAX2 handler
2972
 */
2973
void
2974
xmlSAX2InitHtmlDefaultSAXHandler(xmlSAXHandler *hdlr)
2975
0
{
2976
0
    if ((hdlr == NULL) || (hdlr->initialized != 0))
2977
0
  return;
2978
2979
0
    hdlr->internalSubset = xmlSAX2InternalSubset;
2980
0
    hdlr->externalSubset = NULL;
2981
0
    hdlr->isStandalone = NULL;
2982
0
    hdlr->hasInternalSubset = NULL;
2983
0
    hdlr->hasExternalSubset = NULL;
2984
0
    hdlr->resolveEntity = NULL;
2985
0
    hdlr->getEntity = xmlSAX2GetEntity;
2986
0
    hdlr->getParameterEntity = NULL;
2987
0
    hdlr->entityDecl = NULL;
2988
0
    hdlr->attributeDecl = NULL;
2989
0
    hdlr->elementDecl = NULL;
2990
0
    hdlr->notationDecl = NULL;
2991
0
    hdlr->unparsedEntityDecl = NULL;
2992
0
    hdlr->setDocumentLocator = xmlSAX2SetDocumentLocator;
2993
0
    hdlr->startDocument = xmlSAX2StartDocument;
2994
0
    hdlr->endDocument = xmlSAX2EndDocument;
2995
0
    hdlr->startElement = xmlSAX2StartElement;
2996
0
    hdlr->endElement = xmlSAX2EndElement;
2997
0
    hdlr->reference = NULL;
2998
0
    hdlr->characters = xmlSAX2Characters;
2999
0
    hdlr->cdataBlock = xmlSAX2CDataBlock;
3000
0
    hdlr->ignorableWhitespace = xmlSAX2IgnorableWhitespace;
3001
0
    hdlr->processingInstruction = xmlSAX2ProcessingInstruction;
3002
0
    hdlr->comment = xmlSAX2Comment;
3003
0
    hdlr->warning = xmlParserWarning;
3004
0
    hdlr->error = xmlParserError;
3005
0
    hdlr->fatalError = xmlParserError;
3006
3007
0
    hdlr->initialized = 1;
3008
0
}
3009
3010
/**
 * htmlDefaultSAXHandlerInit:
 *
 * DEPRECATED: This function is a no-op. Call xmlInitParser to
 * initialize the library.
 *
 * The body is empty; calling it has no effect.
 */
void
htmlDefaultSAXHandlerInit(void)
{
    /* Intentionally empty. */
}
3020
3021
#endif /* LIBXML_HTML_ENABLED */