Line | Count | Source |
1 | | /* |
2 | | * pattern.c: Implementation of selectors for nodes |
3 | | * |
4 | | * Reference: |
5 | | * http://www.w3.org/TR/2001/REC-xmlschema-1-20010502/ |
6 | | * to some extent |
7 | | * http://www.w3.org/TR/1999/REC-xml-19991116 |
8 | | * |
9 | | * See Copyright for the status of this software. |
10 | | * |
11 | | * Author: Daniel Veillard |
12 | | */ |
13 | | |
14 | | /* |
15 | | * TODO: |
16 | | * - compilation flags to check for specific syntaxes |
17 | | * using flags of #xmlPatterncompile |
18 | | * - make clear how patterns starting with / or . need to be handled; |
19 | | * currently push(NULL, NULL) means a reset of the streaming context |
20 | | * and indicates that we are on / (the document node); we probably need |
21 | | * something similar for . |
22 | | * - get rid of the "compile" starting with lowercase |
23 | | * - DONE (2006-05-16): get rid of the Strdup/Strndup in case of dictionary |
24 | | */ |
25 | | |
26 | | #define IN_LIBXML |
27 | | #include "libxml.h" |
28 | | |
29 | | #include <string.h> |
30 | | #include <libxml/pattern.h> |
31 | | #include <libxml/xmlmemory.h> |
32 | | #include <libxml/tree.h> |
33 | | #include <libxml/dict.h> |
34 | | #include <libxml/xmlerror.h> |
35 | | #include <libxml/parserInternals.h> |
36 | | |
37 | | #include "private/memory.h" |
38 | | #include "private/parser.h" |
39 | | |
40 | | #ifdef LIBXML_PATTERN_ENABLED |
41 | | |
/*
 * Error reporting hooks. Any previous definition of ERROR is dropped, then
 * ERROR (4 arguments) and ERROR5 (5 arguments) are defined with an empty
 * expansion, so every ERROR(...)/ERROR5(...) call in this file compiles
 * to nothing.
 */
42 | | #ifdef ERROR |
43 | | #undef ERROR |
44 | | #endif |
45 | | #define ERROR(a, b, c, d) |
46 | | #define ERROR5(a, b, c, d, e) |
47 | | |
/*
 * Per-step flags. Each value is a distinct power of two, so they can be
 * OR-ed together.
 * NOTE(review): presumably stored in _xmlStreamStep.flags - confirm against
 * the streaming code, which is not visible here.
 */
48 | 1.68M | #define XML_STREAM_STEP_DESC 1 |
49 | 247k | #define XML_STREAM_STEP_FINAL 2 |
50 | 607k | #define XML_STREAM_STEP_ROOT 4 |
51 | 17.8k | #define XML_STREAM_STEP_ATTR 8 |
52 | 1.77k | #define XML_STREAM_STEP_NODE 16 |
53 | 7.71k | #define XML_STREAM_STEP_IN_SET 32 |
54 | | |
/*
 * NOTE: These private flags (XML_STREAM_xxx) are used
 * in _xmlStreamCtxt->flags. They extend the public
 * xmlPatternFlags, so be careful not to interfere with the
 * reserved values for xmlPatternFlags.
 *
 * Each expansion is fully parenthesized so that the shift cannot be
 * re-associated by a neighbouring operator at the point of use
 * (e.g. `X + 1` or `~X`).
 */
#define XML_STREAM_FINAL_IS_ANY_NODE (1<<14)
#define XML_STREAM_FROM_ROOT (1<<15)
#define XML_STREAM_DESC (1<<16)
64 | | |
65 | | /* |
66 | | * XML_STREAM_ANY_NODE is used for comparison against |
67 | | * xmlElementType enums, to indicate a node of any type. |
68 | | */ |
69 | 240k | #define XML_STREAM_ANY_NODE 100 |
70 | | |
/*
 * Mask combining the XML_PATTERN_XPATH, XML_PATTERN_XSSEL and
 * XML_PATTERN_XSFIELD pattern flags.
 */
71 | 821k | #define XML_PATTERN_NOTPATTERN (XML_PATTERN_XPATH | \ |
72 | 821k | XML_PATTERN_XSSEL | \ |
73 | 821k | XML_PATTERN_XSFIELD) |
74 | | |
/*
 * Non-zero when (c)->flags has XML_PATTERN_XSSEL or XML_PATTERN_XSFIELD set.
 * `c` may be any pointer to a structure with a `flags` member.
 */
75 | 219k | #define XML_STREAM_XS_IDC(c) ((c)->flags & \ |
76 | 219k | (XML_PATTERN_XSSEL | XML_PATTERN_XSFIELD)) |
77 | | |
/* Non-zero when (c)->flags has XML_PATTERN_XSSEL set. */
78 | 31.3k | #define XML_STREAM_XS_IDC_SEL(c) ((c)->flags & XML_PATTERN_XSSEL) |
79 | | |
/* Non-zero when (c)->flags has XML_PATTERN_XSFIELD set. */
80 | | #define XML_STREAM_XS_IDC_FIELD(c) ((c)->flags & XML_PATTERN_XSFIELD) |
81 | | |
/*
 * XML_PAT_COPY_NSNAME(c, r, nsname): store a copy of `nsname` in `r`.
 * When (c)->comp->dict is set the string comes from xmlDictLookup() on that
 * dictionary, otherwise it is duplicated with xmlStrdup(). The result is
 * not checked here, so `r` may be NULL afterwards.
 *
 * The expansion is a bare if/else statement that already ends with ';'.
 * It is not wrapped in do { } while (0), so take care when using it as the
 * body of an unbraced if/else.
 */
82 | | #define XML_PAT_COPY_NSNAME(c, r, nsname) \ |
83 | 24.3k | if ((c)->comp->dict) \ |
84 | 24.3k | r = (xmlChar *) xmlDictLookup((c)->comp->dict, BAD_CAST nsname, -1); \ |
85 | 24.3k | else r = xmlStrdup(BAD_CAST nsname); |
86 | | |
/*
 * XML_PAT_FREE_STRING(c, r): release `r` with xmlFree(), but only when
 * (c)->comp->dict is NULL. Like XML_PAT_COPY_NSNAME, the expansion is a
 * bare `if` statement ending with ';'.
 */
87 | 41.9k | #define XML_PAT_FREE_STRING(c, r) if ((c)->comp->dict == NULL) xmlFree(r); |
88 | | |
/* One step of a compiled streaming pattern. */
89 | | typedef struct _xmlStreamStep xmlStreamStep; |
90 | | typedef xmlStreamStep *xmlStreamStepPtr; |
91 | | struct _xmlStreamStep { |
92 | | int flags; /* properties of that step (presumably XML_STREAM_STEP_* bits - confirm) */ |
93 | | const xmlChar *name; /* first string value; if NULL, accept all */ |
94 | | const xmlChar *ns; /* second string value */ |
95 | | int nodeType; /* type of node */ |
96 | | }; |
97 | | |
/* A compiled streaming pattern: a growable array of xmlStreamStep. */
98 | | typedef struct _xmlStreamComp xmlStreamComp; |
99 | | typedef xmlStreamComp *xmlStreamCompPtr; |
100 | | struct _xmlStreamComp { |
101 | | xmlDict *dict; /* the dictionary if any */ |
102 | | int nbStep; /* number of steps in the automata */ |
103 | | int maxStep; /* allocated number of steps */ |
104 | | xmlStreamStepPtr steps; /* the array of steps */ |
105 | | int flags; /* NOTE(review): meaning not visible in this part of the file */ |
106 | | }; |
107 | | |
/* Run-time state used while evaluating a compiled streaming pattern. */
108 | | struct _xmlStreamCtxt { |
109 | | struct _xmlStreamCtxt *next;/* link to next sub pattern if | is used */ |
110 | | xmlStreamCompPtr comp; /* the compiled stream */ |
111 | | int nbState; /* number of states in the automata */ |
112 | | int maxState; /* allocated number of states */ |
113 | | int level; /* how deep are we ? */ |
114 | | int *states; /* the array of step indexes */ |
115 | | int flags; /* validation options */ |
116 | | int blockLevel; /* NOTE(review): meaning not visible in this part of the file */ |
117 | | }; |
118 | | |
119 | | static void xmlFreeStreamComp(xmlStreamCompPtr comp); |
120 | | |
121 | | /* |
122 | | * Types are private: |
123 | | */ |
124 | | |
/*
 * Operation codes of the compiled (non-streaming) pattern steps.
 * The per-value notes describe how xmlPatMatch() interprets each one.
 */
125 | | typedef enum { |
126 | | XML_OP_END=0, /* end of the step list: the pattern matched */ |
127 | | XML_OP_ROOT, /* move to the parent, which must be a document node */ |
128 | | XML_OP_ELEM, /* current node must be an element; optional name/namespace test */ |
129 | | XML_OP_CHILD, /* current node must have a child element with the given name */ |
130 | | XML_OP_ATTR, /* current node must be an attribute; optional name/namespace test */ |
131 | | XML_OP_PARENT, /* move to the parent; optional name/namespace test */ |
132 | | XML_OP_ANCESTOR, /* search the ancestors for a matching element */ |
133 | | XML_OP_NS, /* current node must be an element in the given namespace */ |
134 | | XML_OP_ALL /* current node must be an element, any name */ |
135 | | } xmlPatOp; |
136 | | |
137 | | |
/* One saved backtracking point of xmlPatMatch(): a step index and a node. */
138 | | typedef struct _xmlStepState xmlStepState; |
139 | | typedef xmlStepState *xmlStepStatePtr; |
140 | | struct _xmlStepState { |
141 | | int step; /* index into the pattern's steps array to resume from */ |
142 | | xmlNodePtr node; /* node to resume matching from */ |
143 | | }; |
144 | | |
/* Growable stack of xmlStepState entries, filled by xmlPatPushState(). */
145 | | typedef struct _xmlStepStates xmlStepStates; |
146 | | typedef xmlStepStates *xmlStepStatesPtr; |
147 | | struct _xmlStepStates { |
148 | | int nbstates; /* number of entries in use */ |
149 | | int maxstates; /* number of entries allocated */ |
150 | | xmlStepStatePtr states; /* the entries, NULL until the first push */ |
151 | | }; |
152 | | |
/* One compiled step of a non-streaming pattern. */
153 | | typedef struct _xmlStepOp xmlStepOp; |
154 | | typedef xmlStepOp *xmlStepOpPtr; |
155 | | struct _xmlStepOp { |
156 | | xmlPatOp op; /* the operation to perform */ |
157 | | const xmlChar *value; /* first operand, may be NULL (a name, or the namespace for XML_OP_NS) */ |
158 | | const xmlChar *value2; /* The namespace name */ |
159 | | }; |
160 | | |
/*
 * Private pattern flag bits.
 * NOTE(review): presumably stored in _xmlPattern.flags to record whether a
 * pattern is anchored at the root or at the current node - confirm against
 * the compiler code, which is not visible here.
 */
161 | 101k | #define PAT_FROM_ROOT (1<<8) |
162 | 94.8k | #define PAT_FROM_CUR (1<<9) |
163 | | |
/* A compiled pattern; alternatives separated by | are chained through `next`. */
164 | | struct _xmlPattern { |
165 | | void *data; /* the associated template */ |
166 | | xmlDictPtr dict; /* the optional dictionary */ |
167 | | struct _xmlPattern *next; /* next pattern if | is used */ |
168 | | const xmlChar *pattern; /* the pattern */ |
169 | | int flags; /* flags */ |
170 | | int nbStep; /* number of entries used in steps */ |
171 | | int maxStep; /* number of entries allocated in steps */ |
172 | | xmlStepOpPtr steps; /* ops for computation */ |
173 | | xmlStreamCompPtr stream; /* the streaming data if any */ |
174 | | }; |
175 | | |
/* State of the pattern parser while compiling one pattern string. */
176 | | typedef struct _xmlPatParserContext xmlPatParserContext; |
177 | | typedef xmlPatParserContext *xmlPatParserContextPtr; |
178 | | struct _xmlPatParserContext { |
179 | | const xmlChar *cur; /* the current char being parsed */ |
180 | | const xmlChar *base; /* the full expression */ |
181 | | int error; /* error code: 0 if none; the parser sets 1 for syntax errors and -1 for allocation failures */ |
182 | | xmlDictPtr dict; /* the dictionary if any */ |
183 | | xmlPatternPtr comp; /* the result */ |
184 | | xmlNodePtr elem; /* the current node if any */ |
185 | | const xmlChar **namespaces; /* the namespaces definitions, as [URI, prefix] pairs */ |
186 | | int nb_namespaces; /* the number of namespaces */ |
187 | | }; |
188 | | |
189 | | /************************************************************************ |
190 | | * * |
191 | | * Type functions * |
192 | | * * |
193 | | ************************************************************************/ |
194 | | |
195 | | /** |
196 | | * Create a new XSLT Pattern |
197 | | * |
198 | | * @returns the newly allocated xmlPattern or NULL in case of error |
199 | | */ |
200 | | static xmlPatternPtr |
201 | 65.3k | xmlNewPattern(void) { |
202 | 65.3k | xmlPatternPtr cur; |
203 | | |
204 | 65.3k | cur = (xmlPatternPtr) xmlMalloc(sizeof(xmlPattern)); |
205 | 65.3k | if (cur == NULL) { |
206 | 9 | ERROR(NULL, NULL, NULL, |
207 | 9 | "xmlNewPattern : malloc failed\n"); |
208 | 9 | return(NULL); |
209 | 9 | } |
210 | 65.3k | memset(cur, 0, sizeof(xmlPattern)); |
211 | 65.3k | cur->steps = NULL; |
212 | 65.3k | cur->maxStep = 0; |
213 | 65.3k | return(cur); |
214 | 65.3k | } |
215 | | |
216 | | /** |
217 | | * Free up the memory allocated by `comp` |
218 | | * |
219 | | * @param comp an XSLT comp |
220 | | */ |
221 | | void |
222 | 30.2k | xmlFreePattern(xmlPattern *comp) { |
223 | 30.2k | xmlFreePatternList(comp); |
224 | 30.2k | } |
225 | | |
226 | | static void |
227 | 65.3k | xmlFreePatternInternal(xmlPatternPtr comp) { |
228 | 65.3k | xmlStepOpPtr op; |
229 | 65.3k | int i; |
230 | | |
231 | 65.3k | if (comp == NULL) |
232 | 0 | return; |
233 | 65.3k | if (comp->stream != NULL) |
234 | 40.7k | xmlFreeStreamComp(comp->stream); |
235 | 65.3k | if (comp->pattern != NULL) |
236 | 0 | xmlFree((xmlChar *)comp->pattern); |
237 | 65.3k | if (comp->steps != NULL) { |
238 | 56.7k | if (comp->dict == NULL) { |
239 | 24.3M | for (i = 0;i < comp->nbStep;i++) { |
240 | 24.3M | op = &comp->steps[i]; |
241 | 24.3M | if (op->value != NULL) |
242 | 7.27M | xmlFree((xmlChar *) op->value); |
243 | 24.3M | if (op->value2 != NULL) |
244 | 8.38k | xmlFree((xmlChar *) op->value2); |
245 | 24.3M | } |
246 | 56.7k | } |
247 | 56.7k | xmlFree(comp->steps); |
248 | 56.7k | } |
249 | 65.3k | if (comp->dict != NULL) |
250 | 0 | xmlDictFree(comp->dict); |
251 | | |
252 | 65.3k | memset(comp, -1, sizeof(xmlPattern)); |
253 | 65.3k | xmlFree(comp); |
254 | 65.3k | } |
255 | | |
256 | | /** |
257 | | * Free up the memory allocated by all the elements of `comp` |
258 | | * |
259 | | * @param comp an XSLT comp list |
260 | | */ |
261 | | void |
262 | 30.2k | xmlFreePatternList(xmlPattern *comp) { |
263 | 30.2k | xmlPatternPtr cur; |
264 | | |
265 | 95.5k | while (comp != NULL) { |
266 | 65.3k | cur = comp; |
267 | 65.3k | comp = comp->next; |
268 | 65.3k | cur->next = NULL; |
269 | 65.3k | xmlFreePatternInternal(cur); |
270 | 65.3k | } |
271 | 30.2k | } |
272 | | |
273 | | /** |
274 | | * Create a new XML pattern parser context |
275 | | * |
276 | | * @param pattern the pattern context |
277 | | * @param dict the inherited dictionary or NULL |
278 | | * @param namespaces the prefix definitions, array of [URI, prefix] terminated |
279 | | * with [NULL, NULL] or NULL if no namespace is used |
280 | | * @returns the newly allocated xmlPatParserContext or NULL in case of error |
281 | | */ |
282 | | static xmlPatParserContextPtr |
283 | | xmlNewPatParserContext(const xmlChar *pattern, xmlDictPtr dict, |
284 | 65.3k | const xmlChar **namespaces) { |
285 | 65.3k | xmlPatParserContextPtr cur; |
286 | | |
287 | 65.3k | if (pattern == NULL) |
288 | 0 | return(NULL); |
289 | | |
290 | 65.3k | cur = (xmlPatParserContextPtr) xmlMalloc(sizeof(xmlPatParserContext)); |
291 | 65.3k | if (cur == NULL) { |
292 | 38 | ERROR(NULL, NULL, NULL, |
293 | 38 | "xmlNewPatParserContext : malloc failed\n"); |
294 | 38 | return(NULL); |
295 | 38 | } |
296 | 65.3k | memset(cur, 0, sizeof(xmlPatParserContext)); |
297 | 65.3k | cur->dict = dict; |
298 | 65.3k | cur->cur = pattern; |
299 | 65.3k | cur->base = pattern; |
300 | 65.3k | if (namespaces != NULL) { |
301 | 60.0k | int i; |
302 | 115k | for (i = 0;namespaces[2 * i] != NULL;i++) |
303 | 55.7k | ; |
304 | 60.0k | cur->nb_namespaces = i; |
305 | 60.0k | } else { |
306 | 5.31k | cur->nb_namespaces = 0; |
307 | 5.31k | } |
308 | 65.3k | cur->namespaces = namespaces; |
309 | 65.3k | return(cur); |
310 | 65.3k | } |
311 | | |
312 | | /** |
313 | | * Free up the memory allocated by `ctxt` |
314 | | * |
315 | | * @param ctxt an XSLT parser context |
316 | | */ |
317 | | static void |
318 | 65.3k | xmlFreePatParserContext(xmlPatParserContextPtr ctxt) { |
319 | 65.3k | if (ctxt == NULL) |
320 | 0 | return; |
321 | 65.3k | memset(ctxt, -1, sizeof(xmlPatParserContext)); |
322 | 65.3k | xmlFree(ctxt); |
323 | 65.3k | } |
324 | | |
325 | | static int |
326 | 182k | xmlPatternGrow(xmlPatternPtr comp) { |
327 | 182k | xmlStepOpPtr temp; |
328 | 182k | int newSize; |
329 | | |
330 | 182k | newSize = xmlGrowCapacity(comp->maxStep, sizeof(temp[0]), |
331 | 182k | 10, XML_MAX_ITEMS); |
332 | 182k | if (newSize < 0) |
333 | 0 | return(-1); |
334 | 182k | temp = xmlRealloc(comp->steps, newSize * sizeof(temp[0])); |
335 | 182k | if (temp == NULL) |
336 | 31 | return(-1); |
337 | 182k | comp->steps = temp; |
338 | 182k | comp->maxStep = newSize; |
339 | | |
340 | 182k | return(0); |
341 | 182k | } |
342 | | |
343 | | /** |
344 | | * Add a step to an XSLT Compiled Match |
345 | | * |
346 | | * @param ctxt the pattern parser context |
347 | | * @param comp the compiled match expression |
348 | | * @param op an op |
349 | | * @param value the first value |
350 | | * @param value2 the second value |
351 | | * @returns -1 in case of failure, 0 otherwise. |
352 | | */ |
353 | | static int |
354 | | xmlPatternAdd(xmlPatParserContextPtr ctxt, xmlPatternPtr comp, |
355 | | xmlPatOp op, xmlChar * value, xmlChar * value2) |
356 | 24.2M | { |
357 | 24.2M | if (comp->nbStep >= comp->maxStep) { |
358 | 149k | if (xmlPatternGrow(comp) < 0) { |
359 | 28 | ctxt->error = -1; |
360 | 28 | return(-1); |
361 | 28 | } |
362 | 149k | } |
363 | 24.2M | comp->steps[comp->nbStep].op = op; |
364 | 24.2M | comp->steps[comp->nbStep].value = value; |
365 | 24.2M | comp->steps[comp->nbStep].value2 = value2; |
366 | 24.2M | comp->nbStep++; |
367 | 24.2M | return(0); |
368 | 24.2M | } |
369 | | |
370 | | /** |
371 | | * reverse all the stack of expressions |
372 | | * |
373 | | * @param comp the compiled match expression |
374 | | * @returns 0 in case of success and -1 in case of error. |
375 | | */ |
376 | | static int |
377 | 42.6k | xmlReversePattern(xmlPatternPtr comp) { |
378 | 42.6k | int i, j; |
379 | | |
380 | | /* |
381 | | * remove the leading // for //a or .//a |
382 | | */ |
383 | 42.6k | if ((comp->nbStep > 0) && (comp->steps[0].op == XML_OP_ANCESTOR)) { |
384 | 4.42M | for (i = 0, j = 1;j < comp->nbStep;i++,j++) { |
385 | 4.41M | comp->steps[i].value = comp->steps[j].value; |
386 | 4.41M | comp->steps[i].value2 = comp->steps[j].value2; |
387 | 4.41M | comp->steps[i].op = comp->steps[j].op; |
388 | 4.41M | } |
389 | 4.75k | comp->nbStep--; |
390 | 4.75k | } |
391 | | |
392 | | /* |
393 | | * Grow to add OP_END later |
394 | | */ |
395 | 42.6k | if (comp->nbStep >= comp->maxStep) { |
396 | 33.4k | if (xmlPatternGrow(comp) < 0) |
397 | 3 | return(-1); |
398 | 33.4k | } |
399 | | |
400 | 42.6k | i = 0; |
401 | 42.6k | j = comp->nbStep - 1; |
402 | 10.2M | while (j > i) { |
403 | 10.2M | register const xmlChar *tmp; |
404 | 10.2M | register xmlPatOp op; |
405 | 10.2M | tmp = comp->steps[i].value; |
406 | 10.2M | comp->steps[i].value = comp->steps[j].value; |
407 | 10.2M | comp->steps[j].value = tmp; |
408 | 10.2M | tmp = comp->steps[i].value2; |
409 | 10.2M | comp->steps[i].value2 = comp->steps[j].value2; |
410 | 10.2M | comp->steps[j].value2 = tmp; |
411 | 10.2M | op = comp->steps[i].op; |
412 | 10.2M | comp->steps[i].op = comp->steps[j].op; |
413 | 10.2M | comp->steps[j].op = op; |
414 | 10.2M | j--; |
415 | 10.2M | i++; |
416 | 10.2M | } |
417 | | |
418 | 42.6k | comp->steps[comp->nbStep].value = NULL; |
419 | 42.6k | comp->steps[comp->nbStep].value2 = NULL; |
420 | 42.6k | comp->steps[comp->nbStep++].op = XML_OP_END; |
421 | 42.6k | return(0); |
422 | 42.6k | } |
423 | | |
424 | | /************************************************************************ |
425 | | * * |
426 | | * The interpreter for the precompiled patterns * |
427 | | * * |
428 | | ************************************************************************/ |
429 | | |
430 | | static int |
431 | 0 | xmlPatPushState(xmlStepStates *states, int step, xmlNodePtr node) { |
432 | 0 | if (states->maxstates <= states->nbstates) { |
433 | 0 | xmlStepState *tmp; |
434 | 0 | int newSize; |
435 | |
|
436 | 0 | newSize = xmlGrowCapacity(states->maxstates, sizeof(tmp[0]), |
437 | 0 | 4, XML_MAX_ITEMS); |
438 | 0 | if (newSize < 0) |
439 | 0 | return(-1); |
440 | 0 | tmp = xmlRealloc(states->states, newSize * sizeof(tmp[0])); |
441 | 0 | if (tmp == NULL) |
442 | 0 | return(-1); |
443 | 0 | states->states = tmp; |
444 | 0 | states->maxstates = newSize; |
445 | 0 | } |
446 | 0 | states->states[states->nbstates].step = step; |
447 | 0 | states->states[states->nbstates++].node = node; |
448 | 0 | return(0); |
449 | 0 | } |
450 | | |
451 | | /** |
452 | | * Test whether the node matches the pattern |
453 | | * |
454 | | * @param comp the precompiled pattern |
455 | | * @param node a node |
456 | | * @returns 1 if it matches, 0 if it doesn't and -1 in case of failure |
457 | | */ |
458 | | static int |
459 | 5.19k | xmlPatMatch(xmlPatternPtr comp, xmlNodePtr node) { |
460 | 5.19k | int i; |
461 | 5.19k | xmlStepOpPtr step; |
462 | 5.19k | xmlStepStates states = {0, 0, NULL}; /* // may require backtrack */ |
463 | | |
464 | 5.19k | if ((comp == NULL) || (node == NULL)) return(-1); |
465 | 5.19k | i = 0; |
466 | 5.19k | restart: |
467 | 8.62k | for (;i < comp->nbStep;i++) { |
468 | 8.62k | step = &comp->steps[i]; |
469 | 8.62k | switch (step->op) { |
470 | 88 | case XML_OP_END: |
471 | 88 | goto found; |
472 | 31 | case XML_OP_ROOT: |
473 | 31 | if (node->type == XML_NAMESPACE_DECL) |
474 | 0 | goto rollback; |
475 | 31 | node = node->parent; |
476 | 31 | if ((node->type == XML_DOCUMENT_NODE) || |
477 | 0 | (node->type == XML_HTML_DOCUMENT_NODE)) |
478 | 31 | continue; |
479 | 0 | goto rollback; |
480 | 4.07k | case XML_OP_ELEM: |
481 | 4.07k | if (node->type != XML_ELEMENT_NODE) |
482 | 668 | goto rollback; |
483 | 3.40k | if (step->value == NULL) |
484 | 738 | continue; |
485 | 2.66k | if (step->value[0] != node->name[0]) |
486 | 1.71k | goto rollback; |
487 | 953 | if (!xmlStrEqual(step->value, node->name)) |
488 | 551 | goto rollback; |
489 | | |
490 | | /* Namespace test */ |
491 | 402 | if (node->ns == NULL) { |
492 | 402 | if (step->value2 != NULL) |
493 | 194 | goto rollback; |
494 | 402 | } else if (node->ns->href != NULL) { |
495 | 0 | if (step->value2 == NULL) |
496 | 0 | goto rollback; |
497 | 0 | if (!xmlStrEqual(step->value2, node->ns->href)) |
498 | 0 | goto rollback; |
499 | 0 | } |
500 | 208 | continue; |
501 | 208 | case XML_OP_CHILD: { |
502 | 0 | xmlNodePtr lst; |
503 | |
|
504 | 0 | if ((node->type != XML_ELEMENT_NODE) && |
505 | 0 | (node->type != XML_DOCUMENT_NODE) && |
506 | 0 | (node->type != XML_HTML_DOCUMENT_NODE)) |
507 | 0 | goto rollback; |
508 | | |
509 | 0 | lst = node->children; |
510 | |
|
511 | 0 | if (step->value != NULL) { |
512 | 0 | while (lst != NULL) { |
513 | 0 | if ((lst->type == XML_ELEMENT_NODE) && |
514 | 0 | (step->value[0] == lst->name[0]) && |
515 | 0 | (xmlStrEqual(step->value, lst->name))) |
516 | 0 | break; |
517 | 0 | lst = lst->next; |
518 | 0 | } |
519 | 0 | if (lst != NULL) |
520 | 0 | continue; |
521 | 0 | } |
522 | 0 | goto rollback; |
523 | 0 | } |
524 | 476 | case XML_OP_ATTR: |
525 | 476 | if (node->type != XML_ATTRIBUTE_NODE) |
526 | 476 | goto rollback; |
527 | 0 | if (step->value != NULL) { |
528 | 0 | if (step->value[0] != node->name[0]) |
529 | 0 | goto rollback; |
530 | 0 | if (!xmlStrEqual(step->value, node->name)) |
531 | 0 | goto rollback; |
532 | 0 | } |
533 | | /* Namespace test */ |
534 | 0 | if (node->ns == NULL) { |
535 | 0 | if (step->value2 != NULL) |
536 | 0 | goto rollback; |
537 | 0 | } else if (step->value2 != NULL) { |
538 | 0 | if (!xmlStrEqual(step->value2, node->ns->href)) |
539 | 0 | goto rollback; |
540 | 0 | } |
541 | 0 | continue; |
542 | 1.40k | case XML_OP_PARENT: |
543 | 1.40k | if ((node->type == XML_DOCUMENT_NODE) || |
544 | 1.40k | (node->type == XML_HTML_DOCUMENT_NODE) || |
545 | 1.40k | (node->type == XML_NAMESPACE_DECL)) |
546 | 0 | goto rollback; |
547 | 1.40k | node = node->parent; |
548 | 1.40k | if (node == NULL) |
549 | 0 | goto rollback; |
550 | 1.40k | if (step->value == NULL) |
551 | 1.40k | continue; |
552 | 0 | if (step->value[0] != node->name[0]) |
553 | 0 | goto rollback; |
554 | 0 | if (!xmlStrEqual(step->value, node->name)) |
555 | 0 | goto rollback; |
556 | | /* Namespace test */ |
557 | 0 | if (node->ns == NULL) { |
558 | 0 | if (step->value2 != NULL) |
559 | 0 | goto rollback; |
560 | 0 | } else if (node->ns->href != NULL) { |
561 | 0 | if (step->value2 == NULL) |
562 | 0 | goto rollback; |
563 | 0 | if (!xmlStrEqual(step->value2, node->ns->href)) |
564 | 0 | goto rollback; |
565 | 0 | } |
566 | 0 | continue; |
567 | 449 | case XML_OP_ANCESTOR: |
568 | | /* TODO: implement coalescing of ANCESTOR/NODE ops */ |
569 | 449 | if (step->value == NULL) { |
570 | 449 | i++; |
571 | 449 | step = &comp->steps[i]; |
572 | 449 | if (step->op == XML_OP_ROOT) |
573 | 0 | goto found; |
574 | 449 | if (step->op != XML_OP_ELEM) |
575 | 228 | goto rollback; |
576 | 221 | if (step->value == NULL) |
577 | 8 | return(-1); |
578 | 221 | } |
579 | 213 | if (node == NULL) |
580 | 0 | goto rollback; |
581 | 213 | if ((node->type == XML_DOCUMENT_NODE) || |
582 | 213 | (node->type == XML_HTML_DOCUMENT_NODE) || |
583 | 213 | (node->type == XML_NAMESPACE_DECL)) |
584 | 0 | goto rollback; |
585 | 213 | node = node->parent; |
586 | 426 | while (node != NULL) { |
587 | 213 | if ((node->type == XML_ELEMENT_NODE) && |
588 | 0 | (step->value[0] == node->name[0]) && |
589 | 0 | (xmlStrEqual(step->value, node->name))) { |
590 | | /* Namespace test */ |
591 | 0 | if (node->ns == NULL) { |
592 | 0 | if (step->value2 == NULL) |
593 | 0 | break; |
594 | 0 | } else if (node->ns->href != NULL) { |
595 | 0 | if ((step->value2 != NULL) && |
596 | 0 | (xmlStrEqual(step->value2, node->ns->href))) |
597 | 0 | break; |
598 | 0 | } |
599 | 0 | } |
600 | 213 | node = node->parent; |
601 | 213 | } |
602 | 213 | if (node == NULL) |
603 | 213 | goto rollback; |
604 | | /* |
605 | | * prepare a potential rollback from here |
606 | | * for ancestors of that node. |
607 | | */ |
608 | 0 | if (step->op == XML_OP_ANCESTOR) |
609 | 0 | xmlPatPushState(&states, i, node); |
610 | 0 | else |
611 | 0 | xmlPatPushState(&states, i - 1, node); |
612 | 0 | continue; |
613 | 520 | case XML_OP_NS: |
614 | 520 | if (node->type != XML_ELEMENT_NODE) |
615 | 205 | goto rollback; |
616 | 315 | if (node->ns == NULL) { |
617 | 315 | if (step->value != NULL) |
618 | 315 | goto rollback; |
619 | 315 | } else if (node->ns->href != NULL) { |
620 | 0 | if (step->value == NULL) |
621 | 0 | goto rollback; |
622 | 0 | if (!xmlStrEqual(step->value, node->ns->href)) |
623 | 0 | goto rollback; |
624 | 0 | } |
625 | 0 | break; |
626 | 1.58k | case XML_OP_ALL: |
627 | 1.58k | if (node->type != XML_ELEMENT_NODE) |
628 | 536 | goto rollback; |
629 | 1.04k | break; |
630 | 8.62k | } |
631 | 8.62k | } |
632 | 88 | found: |
633 | 88 | if (states.states != NULL) { |
634 | | /* Free the rollback states */ |
635 | 0 | xmlFree(states.states); |
636 | 0 | } |
637 | 88 | return(1); |
638 | 5.10k | rollback: |
639 | | /* got an error try to rollback */ |
640 | 5.10k | if (states.states == NULL) |
641 | 5.10k | return(0); |
642 | 0 | if (states.nbstates <= 0) { |
643 | 0 | xmlFree(states.states); |
644 | 0 | return(0); |
645 | 0 | } |
646 | 0 | states.nbstates--; |
647 | 0 | i = states.states[states.nbstates].step; |
648 | 0 | node = states.states[states.nbstates].node; |
649 | 0 | goto restart; |
650 | 0 | } |
651 | | |
652 | | /************************************************************************ |
653 | | * * |
654 | | * Dedicated parser for templates * |
655 | | * * |
656 | | ************************************************************************/ |
657 | | |
/*
 * Parser helper macros. All of them expect a variable named `ctxt`
 * (an xmlPatParserContextPtr) to be in scope:
 *   CUR / CURRENT  the character at the current position
 *   SKIP(val)      advance the position by `val`
 *   NXT(val)       the character `val` positions ahead
 *   PEEKPREV(val)  the character `val` positions behind
 *   CUR_PTR        the current position pointer itself (assignable)
 *   NEXT           advance by one character unless at the terminating 0
 *   SKIP_BLANKS    advance while the current character is a blank
 *   PUSH           append a step to ctxt->comp with xmlPatternAdd(); on
 *                  failure it jumps to a label named `error`, which the
 *                  enclosing function must provide. The expansion already
 *                  ends with ';'.
 */
658 | 62.1M | #define CUR (*ctxt->cur) |
659 | | #define SKIP(val) ctxt->cur += (val) |
660 | 12.0M | #define NXT(val) ctxt->cur[(val)] |
661 | | #define PEEKPREV(val) ctxt->cur[-(val)] |
662 | 16.6M | #define CUR_PTR ctxt->cur |
663 | | |
664 | | #define SKIP_BLANKS \ |
665 | 34.2M | while (IS_BLANK_CH(CUR)) NEXT |
666 | | |
667 | | #define CURRENT (*ctxt->cur) |
668 | 30.7M | #define NEXT ((*ctxt->cur) ? ctxt->cur++: ctxt->cur) |
669 | | |
670 | | |
671 | | #define PUSH(op, val, val2) \ |
672 | 24.2M | if (xmlPatternAdd(ctxt, ctxt->comp, (op), (val), (val2))) goto error; |
673 | | |
674 | | /** |
675 | | * [4] NameChar ::= Letter | Digit | '.' | '-' | '_' | |
676 | | * CombiningChar | Extender |
677 | | * |
678 | | * [5] Name ::= (Letter | '_' | ':') (NameChar)* |
679 | | * |
680 | | * [6] Names ::= Name (S Name)* |
681 | | * |
682 | | * @param ctxt the XPath Parser context |
683 | | * @returns the Name parsed or NULL |
684 | | */ |
685 | | |
686 | | static xmlChar * |
687 | 33.6k | xmlPatScanName(xmlPatParserContextPtr ctxt) { |
688 | 33.6k | const xmlChar *q, *cur; |
689 | 33.6k | xmlChar *ret = NULL; |
690 | | |
691 | 33.6k | SKIP_BLANKS; |
692 | | |
693 | 33.6k | q = CUR_PTR; |
694 | 33.6k | cur = xmlScanName(q, XML_MAX_NAME_LENGTH, 0); |
695 | 33.6k | if ((cur == NULL) || (cur == q)) |
696 | 21.6k | return(NULL); |
697 | 11.9k | if (ctxt->dict) |
698 | 0 | ret = (xmlChar *) xmlDictLookup(ctxt->dict, q, cur - q); |
699 | 11.9k | else |
700 | 11.9k | ret = xmlStrndup(q, cur - q); |
701 | 11.9k | CUR_PTR = cur; |
702 | 11.9k | return(ret); |
703 | 33.6k | } |
704 | | |
705 | | /** |
706 | | * Parses a non qualified name |
707 | | * |
708 | | * @param ctxt the XPath Parser context |
709 | | * @returns the Name parsed or NULL |
710 | | */ |
711 | | |
712 | | static xmlChar * |
713 | 9.34M | xmlPatScanNCName(xmlPatParserContextPtr ctxt) { |
714 | 9.34M | const xmlChar *q, *cur; |
715 | 9.34M | xmlChar *ret = NULL; |
716 | | |
717 | 9.34M | SKIP_BLANKS; |
718 | | |
719 | 9.34M | q = CUR_PTR; |
720 | 9.34M | cur = xmlScanName(q, XML_MAX_NAME_LENGTH, XML_SCAN_NC); |
721 | 9.34M | if ((cur == NULL) || (cur == q)) |
722 | 2.05M | return(NULL); |
723 | 7.29M | if (ctxt->dict) |
724 | 0 | ret = (xmlChar *) xmlDictLookup(ctxt->dict, q, cur - q); |
725 | 7.29M | else |
726 | 7.29M | ret = xmlStrndup(q, cur - q); |
727 | 7.29M | if (ret == NULL) |
728 | 10 | ctxt->error = -1; |
729 | 7.29M | CUR_PTR = cur; |
730 | 7.29M | return(ret); |
731 | 9.34M | } |
732 | | |
733 | | /** |
734 | | * Compile an attribute test. |
735 | | * |
736 | | * @param ctxt the compilation context |
737 | | */ |
738 | | static void |
739 | 31.6k | xmlCompileAttributeTest(xmlPatParserContextPtr ctxt) { |
740 | 31.6k | xmlChar *token = NULL; |
741 | 31.6k | xmlChar *name = NULL; |
742 | 31.6k | xmlChar *URL = NULL; |
743 | | |
744 | 31.6k | SKIP_BLANKS; |
745 | 31.6k | name = xmlPatScanNCName(ctxt); |
746 | 31.6k | if (ctxt->error < 0) |
747 | 4 | return; |
748 | 31.6k | if (name == NULL) { |
749 | 5.89k | if (CUR == '*') { |
750 | 4.68k | PUSH(XML_OP_ATTR, NULL, NULL); |
751 | 4.68k | NEXT; |
752 | 4.68k | } else { |
753 | 1.20k | ERROR(NULL, NULL, NULL, |
754 | 1.20k | "xmlCompileAttributeTest : Name expected\n"); |
755 | 1.20k | ctxt->error = 1; |
756 | 1.20k | } |
757 | 5.88k | return; |
758 | 5.89k | } |
759 | 25.7k | if (CUR == ':') { |
760 | 7.18k | int i; |
761 | 7.18k | xmlChar *prefix = name; |
762 | | |
763 | 7.18k | NEXT; |
764 | | |
765 | 7.18k | if (IS_BLANK_CH(CUR)) { |
766 | 579 | ERROR5(NULL, NULL, NULL, "Invalid QName.\n", NULL); |
767 | 579 | ctxt->error = 1; |
768 | 579 | goto error; |
769 | 579 | } |
770 | | /* |
771 | | * This is a namespace match |
772 | | */ |
773 | 6.60k | token = xmlPatScanName(ctxt); |
774 | 6.60k | if ((prefix[0] == 'x') && |
775 | 6.05k | (prefix[1] == 'm') && |
776 | 3.58k | (prefix[2] == 'l') && |
777 | 3.56k | (prefix[3] == 0)) |
778 | 3.33k | { |
779 | 3.33k | XML_PAT_COPY_NSNAME(ctxt, URL, XML_XML_NAMESPACE); |
780 | 3.33k | } else { |
781 | 5.21k | for (i = 0;i < ctxt->nb_namespaces;i++) { |
782 | 4.15k | if (xmlStrEqual(ctxt->namespaces[2 * i + 1], prefix)) { |
783 | 2.21k | XML_PAT_COPY_NSNAME(ctxt, URL, ctxt->namespaces[2 * i]) |
784 | 2.21k | break; |
785 | 2.21k | } |
786 | 4.15k | } |
787 | 3.27k | if (i >= ctxt->nb_namespaces) { |
788 | 1.06k | ERROR5(NULL, NULL, NULL, |
789 | 1.06k | "xmlCompileAttributeTest : no namespace bound to prefix %s\n", |
790 | 1.06k | prefix); |
791 | 1.06k | ctxt->error = 1; |
792 | 1.06k | goto error; |
793 | 1.06k | } |
794 | 3.27k | } |
795 | 5.54k | XML_PAT_FREE_STRING(ctxt, name); |
796 | 5.54k | name = NULL; |
797 | 5.54k | if (token == NULL) { |
798 | 3.69k | if (CUR == '*') { |
799 | 3.32k | NEXT; |
800 | 3.32k | PUSH(XML_OP_ATTR, NULL, URL); |
801 | 3.32k | } else { |
802 | 369 | ERROR(NULL, NULL, NULL, |
803 | 369 | "xmlCompileAttributeTest : Name expected\n"); |
804 | 369 | ctxt->error = 1; |
805 | 369 | goto error; |
806 | 369 | } |
807 | 3.69k | } else { |
808 | 1.85k | PUSH(XML_OP_ATTR, token, URL); |
809 | 1.85k | } |
810 | 18.5k | } else { |
811 | 18.5k | PUSH(XML_OP_ATTR, name, NULL); |
812 | 18.5k | } |
813 | 23.7k | return; |
814 | 23.7k | error: |
815 | 2.01k | if (name != NULL) |
816 | 1.64k | XML_PAT_FREE_STRING(ctxt, name); |
817 | 2.01k | if (URL != NULL) |
818 | 371 | XML_PAT_FREE_STRING(ctxt, URL) |
819 | 2.01k | if (token != NULL) |
820 | 559 | XML_PAT_FREE_STRING(ctxt, token); |
821 | 2.01k | } |
822 | | |
823 | | /** |
824 | | * Compile the Step Pattern and generates a precompiled |
825 | | * form suitable for fast matching. |
826 | | * |
827 | | * [3] Step ::= '.' | NameTest |
828 | | * [4] NameTest ::= QName | '*' | NCName ':' '*' |
829 | | * |
830 | | * @param ctxt the compilation context |
831 | | */ |
832 | | |
833 | | static void |
834 | 12.1M | xmlCompileStepPattern(xmlPatParserContextPtr ctxt) { |
835 | 12.1M | xmlChar *token = NULL; |
836 | 12.1M | xmlChar *name = NULL; |
837 | 12.1M | xmlChar *URL = NULL; |
838 | 12.1M | int hasBlanks = 0; |
839 | | |
840 | 12.1M | SKIP_BLANKS; |
841 | 12.1M | if (CUR == '.') { |
842 | | /* |
843 | | * Context node. |
844 | | */ |
845 | 2.81M | NEXT; |
846 | 2.81M | PUSH(XML_OP_ELEM, NULL, NULL); |
847 | 2.81M | return; |
848 | 2.81M | } |
849 | 9.34M | if (CUR == '@') { |
850 | | /* |
851 | | * Attribute test. |
852 | | */ |
853 | 29.8k | if (XML_STREAM_XS_IDC_SEL(ctxt->comp)) { |
854 | 609 | ERROR5(NULL, NULL, NULL, |
855 | 609 | "Unexpected attribute axis in '%s'.\n", ctxt->base); |
856 | 609 | ctxt->error = 1; |
857 | 609 | return; |
858 | 609 | } |
859 | 29.2k | NEXT; |
860 | 29.2k | xmlCompileAttributeTest(ctxt); |
861 | 29.2k | if (ctxt->error != 0) |
862 | 2.71k | goto error; |
863 | 26.5k | return; |
864 | 29.2k | } |
865 | 9.31M | name = xmlPatScanNCName(ctxt); |
866 | 9.31M | if (ctxt->error < 0) |
867 | 6 | return; |
868 | 9.31M | if (name == NULL) { |
869 | 2.04M | if (CUR == '*') { |
870 | 2.04M | NEXT; |
871 | 2.04M | PUSH(XML_OP_ALL, NULL, NULL); |
872 | 2.04M | return; |
873 | 2.04M | } else { |
874 | 2.51k | ERROR(NULL, NULL, NULL, |
875 | 2.51k | "xmlCompileStepPattern : Name expected\n"); |
876 | 2.51k | ctxt->error = 1; |
877 | 2.51k | return; |
878 | 2.51k | } |
879 | 2.04M | } |
880 | 7.26M | if (IS_BLANK_CH(CUR)) { |
881 | 394k | hasBlanks = 1; |
882 | 394k | SKIP_BLANKS; |
883 | 394k | } |
884 | 7.26M | if (CUR == ':') { |
885 | 30.2k | NEXT; |
886 | 30.2k | if (CUR != ':') { |
887 | 23.1k | xmlChar *prefix = name; |
888 | 23.1k | int i; |
889 | | |
890 | 23.1k | if (hasBlanks || IS_BLANK_CH(CUR)) { |
891 | 899 | ERROR5(NULL, NULL, NULL, "Invalid QName.\n", NULL); |
892 | 899 | ctxt->error = 1; |
893 | 899 | goto error; |
894 | 899 | } |
895 | | /* |
896 | | * This is a namespace match |
897 | | */ |
898 | 22.2k | token = xmlPatScanName(ctxt); |
899 | 22.2k | if ((prefix[0] == 'x') && |
900 | 19.0k | (prefix[1] == 'm') && |
901 | 6.13k | (prefix[2] == 'l') && |
902 | 5.77k | (prefix[3] == 0)) |
903 | 5.56k | { |
904 | 5.56k | XML_PAT_COPY_NSNAME(ctxt, URL, XML_XML_NAMESPACE) |
905 | 16.6k | } else { |
906 | 22.4k | for (i = 0;i < ctxt->nb_namespaces;i++) { |
907 | 18.9k | if (xmlStrEqual(ctxt->namespaces[2 * i + 1], prefix)) { |
908 | 13.2k | XML_PAT_COPY_NSNAME(ctxt, URL, ctxt->namespaces[2 * i]) |
909 | 13.2k | break; |
910 | 13.2k | } |
911 | 18.9k | } |
912 | 16.6k | if (i >= ctxt->nb_namespaces) { |
913 | 3.48k | ERROR5(NULL, NULL, NULL, |
914 | 3.48k | "xmlCompileStepPattern : no namespace bound to prefix %s\n", |
915 | 3.48k | prefix); |
916 | 3.48k | ctxt->error = 1; |
917 | 3.48k | goto error; |
918 | 3.48k | } |
919 | 16.6k | } |
920 | 18.7k | XML_PAT_FREE_STRING(ctxt, prefix); |
921 | 18.7k | name = NULL; |
922 | 18.7k | if (token == NULL) { |
923 | 15.5k | if (CUR == '*') { |
924 | 15.0k | NEXT; |
925 | 15.0k | PUSH(XML_OP_NS, URL, NULL); |
926 | 15.0k | } else { |
927 | 474 | ERROR(NULL, NULL, NULL, |
928 | 474 | "xmlCompileStepPattern : Name expected\n"); |
929 | 474 | ctxt->error = 1; |
930 | 474 | goto error; |
931 | 474 | } |
932 | 15.5k | } else { |
933 | 3.21k | PUSH(XML_OP_ELEM, token, URL); |
934 | 3.21k | } |
935 | 18.7k | } else { |
936 | 7.12k | NEXT; |
937 | 7.12k | if (xmlStrEqual(name, (const xmlChar *) "child")) { |
938 | 4.76k | XML_PAT_FREE_STRING(ctxt, name); |
939 | 4.76k | name = xmlPatScanName(ctxt); |
940 | 4.76k | if (name == NULL) { |
941 | 957 | if (CUR == '*') { |
942 | 310 | NEXT; |
943 | 310 | PUSH(XML_OP_ALL, NULL, NULL); |
944 | 308 | return; |
945 | 647 | } else { |
946 | 647 | ERROR(NULL, NULL, NULL, |
947 | 647 | "xmlCompileStepPattern : QName expected\n"); |
948 | 647 | ctxt->error = 1; |
949 | 647 | goto error; |
950 | 647 | } |
951 | 957 | } |
952 | 3.80k | if (CUR == ':') { |
953 | 0 | xmlChar *prefix = name; |
954 | 0 | int i; |
955 | |
|
956 | 0 | NEXT; |
957 | 0 | if (IS_BLANK_CH(CUR)) { |
958 | 0 | ERROR5(NULL, NULL, NULL, "Invalid QName.\n", NULL); |
959 | 0 | ctxt->error = 1; |
960 | 0 | goto error; |
961 | 0 | } |
962 | | /* |
963 | | * This is a namespace match |
964 | | */ |
965 | 0 | token = xmlPatScanName(ctxt); |
966 | 0 | if ((prefix[0] == 'x') && |
967 | 0 | (prefix[1] == 'm') && |
968 | 0 | (prefix[2] == 'l') && |
969 | 0 | (prefix[3] == 0)) |
970 | 0 | { |
971 | 0 | XML_PAT_COPY_NSNAME(ctxt, URL, XML_XML_NAMESPACE) |
972 | 0 | } else { |
973 | 0 | for (i = 0;i < ctxt->nb_namespaces;i++) { |
974 | 0 | if (xmlStrEqual(ctxt->namespaces[2 * i + 1], prefix)) { |
975 | 0 | XML_PAT_COPY_NSNAME(ctxt, URL, ctxt->namespaces[2 * i]) |
976 | 0 | break; |
977 | 0 | } |
978 | 0 | } |
979 | 0 | if (i >= ctxt->nb_namespaces) { |
980 | 0 | ERROR5(NULL, NULL, NULL, |
981 | 0 | "xmlCompileStepPattern : no namespace bound " |
982 | 0 | "to prefix %s\n", prefix); |
983 | 0 | ctxt->error = 1; |
984 | 0 | goto error; |
985 | 0 | } |
986 | 0 | } |
987 | 0 | XML_PAT_FREE_STRING(ctxt, prefix); |
988 | 0 | name = NULL; |
989 | 0 | if (token == NULL) { |
990 | 0 | if (CUR == '*') { |
991 | 0 | NEXT; |
992 | 0 | PUSH(XML_OP_NS, URL, NULL); |
993 | 0 | } else { |
994 | 0 | ERROR(NULL, NULL, NULL, |
995 | 0 | "xmlCompileStepPattern : Name expected\n"); |
996 | 0 | ctxt->error = 1; |
997 | 0 | goto error; |
998 | 0 | } |
999 | 0 | } else { |
1000 | 0 | PUSH(XML_OP_ELEM, token, URL); |
1001 | 0 | } |
1002 | 0 | } else |
1003 | 3.80k | PUSH(XML_OP_ELEM, name, NULL); |
1004 | 3.80k | return; |
1005 | 3.80k | } else if (xmlStrEqual(name, (const xmlChar *) "attribute")) { |
1006 | 1.45k | XML_PAT_FREE_STRING(ctxt, name) |
1007 | 1.45k | name = NULL; |
1008 | 1.45k | if (XML_STREAM_XS_IDC_SEL(ctxt->comp)) { |
1009 | 214 | ERROR5(NULL, NULL, NULL, |
1010 | 214 | "Unexpected attribute axis in '%s'.\n", ctxt->base); |
1011 | 214 | ctxt->error = 1; |
1012 | 214 | goto error; |
1013 | 214 | } |
1014 | 1.23k | xmlCompileAttributeTest(ctxt); |
1015 | 1.23k | if (ctxt->error != 0) |
1016 | 449 | goto error; |
1017 | 788 | return; |
1018 | 1.23k | } else { |
1019 | 909 | ERROR5(NULL, NULL, NULL, |
1020 | 909 | "The 'element' or 'attribute' axis is expected.\n", NULL); |
1021 | 909 | ctxt->error = 1; |
1022 | 909 | goto error; |
1023 | 909 | } |
1024 | 7.12k | } |
1025 | 7.23M | } else if (CUR == '*') { |
1026 | 514 | if (name != NULL) { |
1027 | 514 | ctxt->error = 1; |
1028 | 514 | goto error; |
1029 | 514 | } |
1030 | 0 | NEXT; |
1031 | 0 | PUSH(XML_OP_ALL, token, NULL); |
1032 | 7.23M | } else { |
1033 | 7.23M | PUSH(XML_OP_ELEM, name, NULL); |
1034 | 7.23M | } |
1035 | 7.25M | return; |
1036 | 7.25M | error: |
1037 | 10.3k | if (URL != NULL) |
1038 | 476 | XML_PAT_FREE_STRING(ctxt, URL) |
1039 | 10.3k | if (token != NULL) |
1040 | 2.56k | XML_PAT_FREE_STRING(ctxt, token) |
1041 | 10.3k | if (name != NULL) |
1042 | 5.81k | XML_PAT_FREE_STRING(ctxt, name) |
1043 | 10.3k | } |
1044 | | |
1045 | | /**
1046 | | * Compile the path pattern currently held in the parser context into
1047 | | * a precompiled form suitable for fast matching.
1048 | | *
1049 | | * [5] Path ::= ('.//')? ( Step '/' )* ( Step | '@' NameTest )
1050 | | *
| | * Processing order, as implemented below:
| | * - a leading '/' sets PAT_FROM_ROOT on ctxt->comp; otherwise a leading
| | *   '.' or the XML_PATTERN_NOTPATTERN flag sets PAT_FROM_CUR;
| | * - a leading "//" or ".//" emits XML_OP_ANCESTOR (only the ".//" form
| | *   checks for end of input right away);
| | * - '@' starts an attribute test; otherwise an optional single '/'
| | *   emits XML_OP_ROOT and is followed by steps separated by '/'
| | *   (XML_OP_PARENT) or '//' (XML_OP_ANCESTOR);
| | * - any input left after the last step is rejected.
| | *
| | * Nothing is returned. Errors detected here set ctxt->error to 1; errors
| | * raised by xmlCompileStepPattern or xmlCompileAttributeTest are noticed
| | * by testing ctxt->error after each call.
| | *
| | * NOTE(review): PUSH, CUR, NXT, NEXT and SKIP_BLANKS are macros defined
| | * outside this excerpt. PUSH appears to be able to jump to the `error`
| | * label on its own - confirm against the macro definition.
| | *
1051 | | * @param ctxt the compilation context
1052 | | */
1053 | | static void
1054 | 14.3k | xmlCompilePathPattern(xmlPatParserContextPtr ctxt) {
1055 | 14.3k | SKIP_BLANKS;
1056 | 14.3k | if (CUR == '/') {
1057 | 5.56k | ctxt->comp->flags |= PAT_FROM_ROOT;
1058 | 8.82k | } else if ((CUR == '.') || (ctxt->comp->flags & XML_PATTERN_NOTPATTERN)) {
1059 | 2.41k | ctxt->comp->flags |= PAT_FROM_CUR;
1060 | 2.41k | }
1061 | |
1062 | 14.3k | if ((CUR == '/') && (NXT(1) == '/')) { /* leading "//" */
1063 | 904 | PUSH(XML_OP_ANCESTOR, NULL, NULL);
1064 | 904 | NEXT;
1065 | 904 | NEXT;
1066 | 13.4k | } else if ((CUR == '.') && (NXT(1) == '/') && (NXT(2) == '/')) { /* leading ".//" */
1067 | 351 | PUSH(XML_OP_ANCESTOR, NULL, NULL);
1068 | 351 | NEXT;
1069 | 351 | NEXT;
1070 | 351 | NEXT;
1071 | | /* Check for incompleteness: ".//" must be followed by something. */
1072 | 351 | SKIP_BLANKS;
1073 | 351 | if (CUR == 0) {
1074 | 23 | ERROR5(NULL, NULL, NULL,
1075 | 23 | "Incomplete expression '%s'.\n", ctxt->base);
1076 | 23 | ctxt->error = 1;
1077 | 23 | goto error;
1078 | 23 | }
1079 | 351 | }
1080 | 14.3k | if (CUR == '@') { /* attribute test */
1081 | 1.18k | NEXT;
1082 | 1.18k | xmlCompileAttributeTest(ctxt);
1083 | 1.18k | if (ctxt->error != 0)
1084 | 62 | goto error;
1085 | 1.12k | SKIP_BLANKS;
1086 | | /* TODO: check for incompleteness */
1087 | 1.12k | if (CUR != 0) { /* input remains after the attribute test: hand it to the step compiler */
1088 | 428 | xmlCompileStepPattern(ctxt);
1089 | 428 | if (ctxt->error != 0)
1090 | 27 | goto error;
1091 | 428 | }
1092 | 13.1k | } else {
1093 | 13.1k | if (CUR == '/') { /* single leading '/': start at the root */
1094 | 4.88k | PUSH(XML_OP_ROOT, NULL, NULL);
1095 | 4.88k | NEXT;
1096 | | /* Check for incompleteness. */
1097 | 4.88k | SKIP_BLANKS;
1098 | 4.88k | if (CUR == 0) {
1099 | 28 | ERROR5(NULL, NULL, NULL,
1100 | 28 | "Incomplete expression '%s'.\n", ctxt->base);
1101 | 28 | ctxt->error = 1;
1102 | 28 | goto error;
1103 | 28 | }
1104 | 4.88k | }
1105 | 13.1k | xmlCompileStepPattern(ctxt); /* first step */
1106 | 13.1k | if (ctxt->error != 0)
1107 | 227 | goto error;
1108 | 12.9k | SKIP_BLANKS;
1109 | 12.0M | while (CUR == '/') { /* one iteration per further step */
1110 | 12.0M | if (NXT(1) == '/') { /* "//" separator; no end-of-input check in this branch */
1111 | 596k | PUSH(XML_OP_ANCESTOR, NULL, NULL);
1112 | 596k | NEXT;
1113 | 596k | NEXT;
1114 | 596k | SKIP_BLANKS;
1115 | 596k | xmlCompileStepPattern(ctxt);
1116 | 596k | if (ctxt->error != 0)
1117 | 33 | goto error;
1118 | 11.4M | } else { /* "/" separator */
1119 | 11.4M | PUSH(XML_OP_PARENT, NULL, NULL);
1120 | 11.4M | NEXT;
1121 | 11.4M | SKIP_BLANKS;
1122 | 11.4M | if (CUR == 0) { /* trailing '/' with nothing after it */
1123 | 35 | ERROR5(NULL, NULL, NULL,
1124 | 35 | "Incomplete expression '%s'.\n", ctxt->base);
1125 | 35 | ctxt->error = 1;
1126 | 35 | goto error;
1127 | 35 | }
1128 | 11.4M | xmlCompileStepPattern(ctxt);
1129 | 11.4M | if (ctxt->error != 0)
1130 | 38 | goto error;
1131 | 11.4M | }
1132 | 12.0M | }
1133 | 12.9k | }
1134 | 13.9k | if (CUR != 0) { /* unconsumed input after the last step */
1135 | 116 | ERROR5(NULL, NULL, NULL,
1136 | 116 | "Failed to compile pattern %s\n", ctxt->base);
1137 | 116 | ctxt->error = 1;
1138 | 116 | }
1139 | 14.3k | error: /* shared exit; success also falls through to here */
1140 | 14.3k | return;
1141 | 13.9k | }
1142 | | |
1143 | | /**
1144 | | * Compile a path for the "IDC" variant of the pattern syntax. Unlike
1145 | | * xmlCompilePathPattern, the path is always relative to the current node.
1146 | | *
1147 | | * [5] Path ::= ('.//')? ( Step '/' )* ( Step | '@' NameTest )
1148 | | *
| | * Behaviour implemented below:
| | * - a leading '/' (document root) is rejected;
| | * - PAT_FROM_CUR is always set on ctxt->comp;
| | * - "." alone selects the context node and emits XML_OP_ELEM with no
| | *   name; "./" may be followed by steps; ".//" emits XML_OP_ANCESTOR,
| | *   but "./ /" (blank between the slashes) is rejected;
| | * - steps are separated by a single '/', each emitting XML_OP_PARENT;
| | *   a '//' after the first step is rejected;
| | * - a path ending right after a '/' is reported as unfinished;
| | * - any input left after the last step is rejected.
| | *
| | * Nothing is returned; every failure path leaves ctxt->error set to 1.
| | *
| | * NOTE(review): the `error` label stores 1 unconditionally, so a value
| | * already placed in ctxt->error by a callee (xmlCompileStepPattern
| | * treats negative values specially) is overwritten - confirm that no
| | * caller needs the original value.
| | * NOTE(review): PUSH, CUR, NEXT, PEEKPREV and SKIP_BLANKS are macros
| | * defined outside this excerpt; PUSH appears to be able to jump to the
| | * `error` label on its own.
| | *
1149 | | * @param ctxt the compilation context
1150 | | */
1151 | | static void
1152 | 50.9k | xmlCompileIDCXPathPath(xmlPatParserContextPtr ctxt) {
1153 | 50.9k | SKIP_BLANKS;
1154 | 50.9k | if (CUR == '/') {
1155 | 411 | ERROR5(NULL, NULL, NULL,
1156 | 411 | "Unexpected selection of the document root in '%s'.\n",
1157 | 411 | ctxt->base);
1158 | 411 | goto error;
1159 | 411 | }
1160 | 50.5k | ctxt->comp->flags |= PAT_FROM_CUR;
1161 | |
1162 | 50.5k | if (CUR == '.') {
1163 | | /* "." - "self::node()" */
1164 | 10.0k | NEXT;
1165 | 10.0k | SKIP_BLANKS;
1166 | 10.0k | if (CUR == 0) {
1167 | | /*
1168 | | * Selection of the context node.
1169 | | */
1170 | 1.70k | PUSH(XML_OP_ELEM, NULL, NULL);
1171 | 1.70k | return;
1172 | 1.70k | }
1173 | 8.37k | if (CUR != '/') {
1174 | | /* TODO: A more meaningful error message. */
1175 | 847 | ERROR5(NULL, NULL, NULL,
1176 | 847 | "Unexpected token after '.' in '%s'.\n", ctxt->base);
1177 | 847 | goto error;
1178 | 847 | }
1179 | | /* "./" - "self::node()/" */
1180 | 7.52k | NEXT;
1181 | 7.52k | SKIP_BLANKS;
1182 | 7.52k | if (CUR == '/') {
1183 | 4.50k | if (IS_BLANK_CH(PEEKPREV(1))) { /* blanks were skipped between the two slashes */
1184 | | /*
1185 | | * Disallow "./ /"
1186 | | */
1187 | 309 | ERROR5(NULL, NULL, NULL,
1188 | 309 | "Unexpected '/' token in '%s'.\n", ctxt->base);
1189 | 309 | goto error;
1190 | 309 | }
1191 | | /* ".//" - "self:node()/descendant-or-self::node()/" */
1192 | 4.19k | PUSH(XML_OP_ANCESTOR, NULL, NULL);
1193 | 4.19k | NEXT;
1194 | 4.19k | SKIP_BLANKS;
1195 | 4.19k | }
1196 | 7.21k | if (CUR == 0) /* "./" or ".//" with nothing after it */
1197 | 570 | goto error_unfinished;
1198 | 7.21k | }
1199 | | /*
1200 | | * Process steps: one step per iteration, separated by a single '/'.
1201 | | */
1202 | 113k | do {
1203 | 113k | xmlCompileStepPattern(ctxt);
1204 | 113k | if (ctxt->error != 0)
1205 | 13.1k | goto error;
1206 | 100k | SKIP_BLANKS;
1207 | 100k | if (CUR != '/') /* no further separator: the step list is complete */
1208 | 32.5k | break;
1209 | 67.8k | PUSH(XML_OP_PARENT, NULL, NULL);
1210 | 67.8k | NEXT;
1211 | 67.8k | SKIP_BLANKS;
1212 | 67.8k | if (CUR == '/') {
1213 | | /*
1214 | | * Disallow subsequent '//'.
1215 | | */
1216 | 1.09k | ERROR5(NULL, NULL, NULL,
1217 | 1.09k | "Unexpected subsequent '//' in '%s'.\n",
1218 | 1.09k | ctxt->base);
1219 | 1.09k | goto error;
1220 | 1.09k | }
1221 | 66.7k | if (CUR == 0) /* path ends right after a '/' */
1222 | 327 | goto error_unfinished;
1223 | |
1224 | 66.7k | } while (CUR != 0); /* always true here (CUR == 0 was handled just above); the loop ends via break */
1225 | |
1226 | 32.5k | if (CUR != 0) { /* unconsumed input after the last step */
1227 | 5.37k | ERROR5(NULL, NULL, NULL,
1228 | 5.37k | "Failed to compile expression '%s'.\n", ctxt->base);
1229 | 5.37k | ctxt->error = 1;
1230 | 5.37k | }
1231 | 32.5k | return;
1232 | 15.7k | error: /* generic failure; overwrites any earlier ctxt->error value with 1 */
1233 | 15.7k | ctxt->error = 1;
1234 | 15.7k | return;
1235 | |
1236 | 897 | error_unfinished: /* input ended where a step was still expected */
1237 | 897 | ctxt->error = 1;
1238 | 897 | ERROR5(NULL, NULL, NULL,
1239 | 897 | "Unfinished expression '%s'.\n", ctxt->base);
1240 | 897 | }
1241 | | |
1242 | | /************************************************************************ |
1243 | | * * |
1244 | | * The streaming code * |
1245 | | * * |
1246 | | ************************************************************************/ |
1247 | | |
1248 | | /**
1249 | | * Build a new, empty compiled pattern for streaming.
1250 | | *
| | * The structure itself is zero-filled; the step array is allocated for
| | * `size` entries (at least 4) and is not initialised. nbStep starts at
| | * 0 and maxStep records the allocated capacity. If the step array
| | * cannot be allocated, the structure is freed again before returning.
| | *
1251 | | * @param size the number of expected steps; values below 4 are raised to 4
1252 | | * @returns the new structure or NULL in case of allocation failure.
1253 | | */
1254 | | static xmlStreamCompPtr
1255 | 41.9k | xmlNewStreamComp(int size) {
1256 | 41.9k | xmlStreamCompPtr cur;
1257 | |
1258 | 41.9k | if (size < 4) /* enforce a minimum capacity */
1259 | 36.2k | size = 4;
1260 | |
1261 | 41.9k | cur = (xmlStreamCompPtr) xmlMalloc(sizeof(xmlStreamComp));
1262 | 41.9k | if (cur == NULL) {
1263 | 7 | ERROR(NULL, NULL, NULL,
1264 | 7 | "xmlNewStreamComp: malloc failed\n");
1265 | 7 | return(NULL);
1266 | 7 | }
1267 | 41.9k | memset(cur, 0, sizeof(xmlStreamComp));
1268 | 41.9k | cur->steps = (xmlStreamStepPtr) xmlMalloc(size * sizeof(xmlStreamStep));
1269 | 41.9k | if (cur->steps == NULL) {
1270 | 4 | xmlFree(cur); /* do not leak the half-built structure */
1271 | 4 | ERROR(NULL, NULL, NULL,
1272 | 4 | "xmlNewStreamComp: malloc failed\n");
1273 | 4 | return(NULL);
1274 | 4 | }
1275 | 41.9k | cur->nbStep = 0;
1276 | 41.9k | cur->maxStep = size;
1277 | 41.9k | return(cur);
1278 | 41.9k | }
1279 | | |
1280 | | /**
1281 | | * Free the compiled pattern for streaming.
1282 | | *
| | * Releases the step array, hands the dictionary (if any) to xmlDictFree
| | * and finally frees the structure itself. The strings referenced by the
| | * individual steps are not freed here. Passing NULL is a no-op.
| | *
1283 | | * @param comp the compiled pattern for streaming, may be NULL
1284 | | */
1285 | | static void
1286 | 41.9k | xmlFreeStreamComp(xmlStreamCompPtr comp) {
1287 | 41.9k | if (comp != NULL) {
1288 | 41.9k | if (comp->steps != NULL)
1289 | 41.9k | xmlFree(comp->steps);
1290 | 41.9k | if (comp->dict != NULL) /* pairs with the xmlDictReference taken in xmlStreamCompile */
1291 | 0 | xmlDictFree(comp->dict);
1292 | 41.9k | xmlFree(comp);
1293 | 41.9k | }
1294 | 41.9k | }
1295 | | |
1296 | | /**
1297 | | * Append a new step to the compiled pattern.
1298 | | *
| | * When the step array is full it is first enlarged: the new capacity
| | * comes from xmlGrowCapacity and the array is resized with xmlRealloc.
| | * If either fails, -1 is returned and comp is left unchanged. The name
| | * and ns pointers are stored as given; the strings are not copied.
| | *
1299 | | * @param comp the compiled pattern for streaming
1300 | | * @param name the first string, the name, or NULL for *
1301 | | * @param ns the second string, the namespace name
1302 | | * @param nodeType the node type
1303 | | * @param flags the flags for that step
1304 | | * @returns -1 in case of error or the step index if successful
1305 | | */
1306 | | static int
1307 | | xmlStreamCompAddStep(xmlStreamCompPtr comp, const xmlChar *name,
1308 | 8.07M | const xmlChar *ns, int nodeType, int flags) {
1309 | 8.07M | xmlStreamStepPtr cur;
1310 | |
1311 | 8.07M | if (comp->nbStep >= comp->maxStep) { /* array full: grow before appending */
1312 | 0 | xmlStreamStepPtr tmp; /* only used for sizeof(tmp[0]) */
1313 | 0 | int newSize;
1314 |

1315 | 0 | newSize = xmlGrowCapacity(comp->maxStep, sizeof(tmp[0]),
1316 | 0 | 4, XML_MAX_ITEMS);
1317 | 0 | if (newSize < 0) {
1318 | 0 | ERROR(NULL, NULL, NULL,
1319 | 0 | "xmlNewStreamComp: growCapacity failed\n");
1320 | 0 | return(-1);
1321 | 0 | }
1322 | 0 | cur = xmlRealloc(comp->steps, newSize * sizeof(tmp[0]));
1323 | 0 | if (cur == NULL) { /* comp->steps is still valid and untouched */
1324 | 0 | ERROR(NULL, NULL, NULL,
1325 | 0 | "xmlNewStreamComp: malloc failed\n");
1326 | 0 | return(-1);
1327 | 0 | }
1328 | 0 | comp->steps = cur;
1329 | 0 | comp->maxStep = newSize;
1330 | 0 | }
1331 | 8.07M | cur = &comp->steps[comp->nbStep++]; /* claim the next free slot */
1332 | 8.07M | cur->flags = flags;
1333 | 8.07M | cur->name = name;
1334 | 8.07M | cur->ns = ns;
1335 | 8.07M | cur->nodeType = nodeType;
1336 | 8.07M | return(comp->nbStep - 1); /* index of the slot just filled */
1337 | 8.07M | }
1338 | | |
1339 | | /**
1340 | | * Tries to stream compile a pattern.
1341 | | *
| | * Walks comp->steps and builds an xmlStreamComp from them; on success
| | * the result is stored in comp->stream. A pattern consisting of a single
| | * XML_OP_ELEM step without name and namespace (".") yields a stream with
| | * no steps, flagged XML_STREAM_FINAL_IS_ANY_NODE.
| | *
| | * Loop state: `flags` collects the flags for the next step to be added
| | * and is reset once a step is added; `s` is the index of the last step
| | * added (initially 0); `prevs` is the index of the most recent
| | * element-type step, or -1; `root` records that XML_OP_ROOT was seen.
| | *
| | * NOTE(review): the `error` label frees the stream and returns 0, not
| | * -1, leaving comp->stream unset. It is reached for an XML_OP_ROOT that
| | * is not the first step, when no step was added, and also when
| | * xmlStreamCompAddStep fails. Whether the last case should be reported
| | * as -1 depends on the callers, which are outside this excerpt.
| | *
1342 | | * @param comp the precompiled pattern
1343 | | * @returns -1 if comp or its steps are NULL or the stream structure
| | * cannot be allocated, and 0 otherwise (see the note above: 0 does
| | * not guarantee that comp->stream was set).
1344 | | */
1345 | | static int
1346 | 41.9k | xmlStreamCompile(xmlPatternPtr comp) {
1347 | 41.9k | xmlStreamCompPtr stream;
1348 | 41.9k | int i, s = 0, root = 0, flags = 0, prevs = -1;
1349 | 41.9k | xmlStepOp step;
1350 | |
1351 | 41.9k | if ((comp == NULL) || (comp->steps == NULL))
1352 | 0 | return(-1);
1353 | | /*
1354 | | * special case for .
1355 | | */
1356 | 41.9k | if ((comp->nbStep == 1) &&
1357 | 21.6k | (comp->steps[0].op == XML_OP_ELEM) &&
1358 | 17.9k | (comp->steps[0].value == NULL) &&
1359 | 2.64k | (comp->steps[0].value2 == NULL)) {
1360 | 2.64k | stream = xmlNewStreamComp(0);
1361 | 2.64k | if (stream == NULL)
1362 | 2 | return(-1);
1363 | | /* Note that the stream will have no steps in this case. */
1364 | 2.64k | stream->flags |= XML_STREAM_FINAL_IS_ANY_NODE;
1365 | 2.64k | comp->stream = stream;
1366 | 2.64k | return(0);
1367 | 2.64k | }
1368 | |
1369 | 39.2k | stream = xmlNewStreamComp((comp->nbStep / 2) + 1); /* initial capacity estimate; xmlStreamCompAddStep grows it if needed */
1370 | 39.2k | if (stream == NULL)
1371 | 9 | return(-1);
1372 | 39.2k | if (comp->dict != NULL) { /* share the pattern's dictionary and take a reference on it */
1373 | 0 | stream->dict = comp->dict;
1374 | 0 | xmlDictReference(stream->dict);
1375 | 0 | }
1376 | |
1377 | 39.2k | i = 0;
1378 | 39.2k | if (comp->flags & PAT_FROM_ROOT)
1379 | 5.39k | stream->flags |= XML_STREAM_FROM_ROOT;
1380 | |
1381 | 20.5M | for (;i < comp->nbStep;i++) {
1382 | 20.5M | step = comp->steps[i];
1383 | 20.5M | switch (step.op) {
1384 | 0 | case XML_OP_END:
1385 | 0 | break;
1386 | 4.75k | case XML_OP_ROOT:
1387 | 4.75k | if (i != 0) /* a root step is only accepted as the very first step */
1388 | 210 | goto error;
1389 | 4.54k | root = 1;
1390 | 4.54k | break;
1391 | 5.42k | case XML_OP_NS:
1392 | 5.42k | s = xmlStreamCompAddStep(stream, NULL, step.value,
1393 | 5.42k | XML_ELEMENT_NODE, flags);
1394 | 5.42k | if (s < 0)
1395 | 0 | goto error;
1396 | 5.42k | prevs = s;
1397 | 5.42k | flags = 0;
1398 | 5.42k | break;
1399 | 17.8k | case XML_OP_ATTR:
1400 | 17.8k | flags |= XML_STREAM_STEP_ATTR;
1401 | 17.8k | prevs = -1;
1402 | 17.8k | s = xmlStreamCompAddStep(stream,
1403 | 17.8k | step.value, step.value2, XML_ATTRIBUTE_NODE, flags);
1404 | 17.8k | flags = 0;
1405 | 17.8k | if (s < 0)
1406 | 0 | goto error;
1407 | 17.8k | break;
1408 | 8.62M | case XML_OP_ELEM:
1409 | 8.62M | if ((step.value == NULL) && (step.value2 == NULL)) {
1410 | | /*
1411 | | * We have a "." or "self::node()" here.
1412 | | * Eliminate redundant self::node() tests like in "/./."
1413 | | * or "//./"
1414 | | * The only case we won't eliminate is "//.", i.e. if
1415 | | * self::node() is the last node test and we had
1416 | | * continuation somewhere beforehand.
1417 | | */
1418 | 2.19M | if ((comp->nbStep == i + 1) &&
1419 | 3.52k | (flags & XML_STREAM_STEP_DESC)) {
1420 | | /*
1421 | | * Mark the special case where the expression resolves
1422 | | * to any type of node.
| | * (The inner test repeats the first half of the enclosing
| | * condition and is therefore always true here.)
1423 | | */
1424 | 1.77k | if (comp->nbStep == i + 1) {
1425 | 1.77k | stream->flags |= XML_STREAM_FINAL_IS_ANY_NODE;
1426 | 1.77k | }
1427 | 1.77k | flags |= XML_STREAM_STEP_NODE;
1428 | 1.77k | s = xmlStreamCompAddStep(stream, NULL, NULL,
1429 | 1.77k | XML_STREAM_ANY_NODE, flags);
1430 | 1.77k | if (s < 0)
1431 | 0 | goto error;
1432 | 1.77k | flags = 0;
1433 | | /*
1434 | | * If there was a previous step, mark it to be added to
1435 | | * the result node-set; this is needed since only
1436 | | * the last step will be marked as "final" and only
1437 | | * "final" nodes are added to the resulting set.
1438 | | */
1439 | 1.77k | if (prevs != -1) {
1440 | 669 | stream->steps[prevs].flags |= XML_STREAM_STEP_IN_SET;
1441 | 669 | prevs = -1;
1442 | 669 | }
1443 | 1.77k | break;
1444 | |
1445 | 2.19M | } else {
1446 | | /* Just skip this one; the accumulated flags are kept. */
1447 | 2.19M | continue;
1448 | 2.19M | }
1449 | 2.19M | }
1450 | | /* An element node. */
1451 | 6.42M | s = xmlStreamCompAddStep(stream, step.value, step.value2,
1452 | 6.42M | XML_ELEMENT_NODE, flags);
1453 | 6.42M | if (s < 0)
1454 | 0 | goto error;
1455 | 6.42M | prevs = s;
1456 | 6.42M | flags = 0;
1457 | 6.42M | break;
1458 | 0 | case XML_OP_CHILD:
1459 | | /* An element node child. */
1460 | 0 | s = xmlStreamCompAddStep(stream, step.value, step.value2,
1461 | 0 | XML_ELEMENT_NODE, flags);
1462 | 0 | if (s < 0)
1463 | 0 | goto error;
1464 | 0 | prevs = s;
1465 | 0 | flags = 0;
1466 | 0 | break;
1467 | 1.62M | case XML_OP_ALL:
1468 | 1.62M | s = xmlStreamCompAddStep(stream, NULL, NULL,
1469 | 1.62M | XML_ELEMENT_NODE, flags);
1470 | 1.62M | if (s < 0)
1471 | 0 | goto error;
1472 | 1.62M | prevs = s;
1473 | 1.62M | flags = 0;
1474 | 1.62M | break;
1475 | 9.76M | case XML_OP_PARENT: /* produces no stream step of its own */
1476 | 9.76M | break;
1477 | 468k | case XML_OP_ANCESTOR:
1478 | | /* Skip redundant continuations. */
1479 | 468k | if (flags & XML_STREAM_STEP_DESC)
1480 | 613 | break;
1481 | 468k | flags |= XML_STREAM_STEP_DESC; /* applied to the next step that gets added */
1482 | | /*
1483 | | * Mark the expression as having "//".
1484 | | */
1485 | 468k | if ((stream->flags & XML_STREAM_DESC) == 0)
1486 | 6.16k | stream->flags |= XML_STREAM_DESC;
1487 | 468k | break;
1488 | 20.5M | }
1489 | 20.5M | }
1490 | 39.0k | if ((! root) && (comp->flags & XML_PATTERN_NOTPATTERN) == 0) {
1491 | | /*
1492 | | * If this should behave like a real pattern, we will mark
1493 | | * the first step as having "//", to be reentrant on every
1494 | | * tree level.
1495 | | */
1496 | 7.39k | if ((stream->flags & XML_STREAM_DESC) == 0)
1497 | 5.76k | stream->flags |= XML_STREAM_DESC;
1498 | |
1499 | 7.39k | if (stream->nbStep > 0) {
1500 | 7.10k | if ((stream->steps[0].flags & XML_STREAM_STEP_DESC) == 0)
1501 | 6.11k | stream->steps[0].flags |= XML_STREAM_STEP_DESC;
1502 | 7.10k | }
1503 | 7.39k | }
1504 | 39.0k | if (stream->nbStep <= s) /* s is still its initial 0 when no step was added, so this rejects an empty step list */
1505 | 736 | goto error;
1506 | 38.3k | stream->steps[s].flags |= XML_STREAM_STEP_FINAL; /* the last step added is the final one */
1507 | 38.3k | if (root)
1508 | 4.30k | stream->steps[0].flags |= XML_STREAM_STEP_ROOT;
1509 | 38.3k | comp->stream = stream;
1510 | 38.3k | return(0);
1511 | 946 | error: /* discard the partial stream; comp->stream is not set */
1512 | 946 | xmlFreeStreamComp(stream);
1513 | 946 | return(0); /* NOTE(review): 0, not -1 - see the header comment */
1514 | 39.0k | }
1515 | | |
1516 | | /**
1517 | | * Build a new stream context.
1518 | | *
| | * The context starts without any states, at level 0 and with
| | * blockLevel set to -1. The compiled stream is only referenced, not
| | * copied; xmlFreeStreamCtxt does not free it.
| | *
1519 | | * @param stream the compiled stream
1520 | | * @returns the new structure or NULL in case of allocation failure.
1521 | | */
1522 | | static xmlStreamCtxtPtr
1523 | 123k | xmlNewStreamCtxt(xmlStreamCompPtr stream) {
1524 | 123k | xmlStreamCtxtPtr cur;
1525 | |
1526 | 123k | cur = (xmlStreamCtxtPtr) xmlMalloc(sizeof(xmlStreamCtxt));
1527 | 123k | if (cur == NULL) {
1528 | 26 | ERROR(NULL, NULL, NULL,
1529 | 26 | "xmlNewStreamCtxt: malloc failed\n");
1530 | 26 | return(NULL);
1531 | 26 | }
1532 | 123k | memset(cur, 0, sizeof(xmlStreamCtxt)); /* zero every field first */
1533 | 123k | cur->states = NULL;
1534 | 123k | cur->nbState = 0;
1535 | 123k | cur->maxState = 0;
1536 | 123k | cur->level = 0;
1537 | 123k | cur->comp = stream;
1538 | 123k | cur->blockLevel = -1; /* -1 is what xmlStreamPushInternal tests for before skipping blocked expressions */
1539 | 123k | return(cur);
1540 | 123k | }
1541 | | |
1542 | | /**
1543 | | * Free a stream context and every context chained to it.
1544 | | *
| | * Follows the `next` links starting at `stream`, freeing each context
| | * together with its states array. The compiled stream referenced by a
| | * context is not freed. Passing NULL is a no-op.
| | *
1545 | | * @param stream the first stream context of the chain, may be NULL
1546 | | */
1547 | | void
1548 | 104k | xmlFreeStreamCtxt(xmlStreamCtxt *stream) {
1549 | 104k | xmlStreamCtxtPtr next;
1550 | |
1551 | 227k | while (stream != NULL) {
1552 | 123k | next = stream->next; /* read the link before the node is freed */
1553 | 123k | if (stream->states != NULL)
1554 | 4.30k | xmlFree(stream->states);
1555 | 123k | xmlFree(stream);
1556 | 123k | stream = next;
1557 | 123k | }
1558 | 104k | }
1559 | | |
1560 | | /**
1561 | | * Add a new state to the stream context.
1562 | | *
| | * States are kept as pairs in a flat int array: states[2 * i] holds the
| | * step index and states[2 * i + 1] the level. A slot whose step index is
| | * negative is reused if one exists; otherwise the pair is appended,
| | * growing the array first when it is full. On failure the context is
| | * left unchanged.
| | *
1563 | | * @param comp the stream context (despite the parameter name)
1564 | | * @param idx the step index for that streaming state
1565 | | * @param level the level
1566 | | * @returns -1 in case of error or the state index if successful
1567 | | */
1568 | | static int
1569 | 15.6k | xmlStreamCtxtAddState(xmlStreamCtxtPtr comp, int idx, int level) {
1570 | 15.6k | int i;
1571 | 100k | for (i = 0;i < comp->nbState;i++) { /* look for a reusable slot */
1572 | 84.8k | if (comp->states[2 * i] < 0) {
1573 | 0 | comp->states[2 * i] = idx;
1574 | 0 | comp->states[2 * i + 1] = level;
1575 | 0 | return(i);
1576 | 0 | }
1577 | 84.8k | }
1578 | 15.6k | if (comp->nbState >= comp->maxState) { /* no room left: grow the array */
1579 | 6.59k | int *tmp;
1580 | 6.59k | int newSize;
1581 | |
1582 | 6.59k | newSize = xmlGrowCapacity(comp->maxState, sizeof(tmp[0]) * 2,
1583 | 6.59k | 4, XML_MAX_ITEMS); /* element size is two ints, one pair per state */
1584 | 6.59k | if (newSize < 0) {
1585 | 0 | ERROR(NULL, NULL, NULL,
1586 | 0 | "xmlNewStreamCtxt: growCapacity failed\n");
1587 | 0 | return(-1);
1588 | 0 | }
1589 | 6.59k | tmp = xmlRealloc(comp->states, newSize * sizeof(tmp[0]) * 2);
1590 | 6.59k | if (tmp == NULL) { /* comp->states is still valid and untouched */
1591 | 5 | ERROR(NULL, NULL, NULL,
1592 | 5 | "xmlNewStreamCtxt: malloc failed\n");
1593 | 5 | return(-1);
1594 | 5 | }
1595 | 6.58k | comp->states = tmp;
1596 | 6.58k | comp->maxState = newSize;
1597 | 6.58k | }
1598 | 15.6k | comp->states[2 * comp->nbState] = idx;
1599 | 15.6k | comp->states[2 * comp->nbState++ + 1] = level; /* nbState is bumped only after both halves are stored */
1600 | 15.6k | return(comp->nbState - 1); /* index of the pair just appended */
1601 | 15.6k | }
1602 | | |
1603 | | /** |
1604 | | * Push new data onto the stream. NOTE: if the call #xmlPatterncompile |
1605 | | * indicated a dictionary, then strings for name and ns will be expected |
1606 | | * to come from the dictionary. |
1607 | | * Both `name` and `ns` being NULL means the / i.e. the root of the document. |
1608 | | * This can also act as a reset. |
1609 | | * |
1610 | | * @param stream the stream context |
1611 | | * @param name the current name |
1612 | | * @param ns the namespace name |
1613 | | * @param nodeType the type of the node |
1614 | | * @returns -1 in case of error, 1 if the current state in the stream is a |
1615 | | * match and 0 otherwise. |
1616 | | */ |
1617 | | static int |
1618 | | xmlStreamPushInternal(xmlStreamCtxtPtr stream, |
1619 | | const xmlChar *name, const xmlChar *ns, |
1620 | 941k | int nodeType) { |
1621 | 941k | int ret = 0, final = 0, tmp, i, m, match, stepNr, desc; |
1622 | 941k | xmlStreamCompPtr comp; |
1623 | 941k | xmlStreamStep step; |
1624 | | |
1625 | 941k | if ((stream == NULL) || (stream->nbState < 0)) |
1626 | 0 | return(-1); |
1627 | | |
1628 | 2.11M | while (stream != NULL) { |
1629 | 1.17M | comp = stream->comp; |
1630 | | |
1631 | 1.17M | if ((nodeType == XML_ELEMENT_NODE) && |
1632 | 924k | (name == NULL) && (ns == NULL)) { |
1633 | | /* We have a document node here (or a reset). */ |
1634 | 7.51k | stream->nbState = 0; |
1635 | 7.51k | stream->level = 0; |
1636 | 7.51k | stream->blockLevel = -1; |
1637 | 7.51k | if (comp->flags & XML_STREAM_FROM_ROOT) { |
1638 | 3.67k | if (comp->nbStep == 0) { |
1639 | | /* TODO: We have a "/." here? */ |
1640 | 0 | ret = 1; |
1641 | 3.67k | } else { |
1642 | 3.67k | if ((comp->nbStep == 1) && |
1643 | 2.32k | (comp->steps[0].nodeType == XML_STREAM_ANY_NODE) && |
1644 | 200 | (comp->steps[0].flags & XML_STREAM_STEP_DESC)) |
1645 | 200 | { |
1646 | | /* |
1647 | | * In the case of "//." the document node will match |
1648 | | * as well. |
1649 | | */ |
1650 | 200 | ret = 1; |
1651 | 3.47k | } else if (comp->steps[0].flags & XML_STREAM_STEP_ROOT) { |
1652 | 3.21k | if (xmlStreamCtxtAddState(stream, 0, 0) < 0) |
1653 | 0 | return(-1); |
1654 | 3.21k | } |
1655 | 3.67k | } |
1656 | 3.67k | } |
1657 | 7.51k | stream = stream->next; |
1658 | 7.51k | continue; /* while */ |
1659 | 7.51k | } |
1660 | | |
1661 | | /* |
1662 | | * Fast check for ".". |
1663 | | */ |
1664 | 1.16M | if (comp->nbStep == 0) { |
1665 | | /* |
1666 | | * / and . are handled at the XPath node set creation |
1667 | | * level by checking min depth |
1668 | | */ |
1669 | 235k | if (stream->flags & XML_PATTERN_XPATH) { |
1670 | 0 | stream = stream->next; |
1671 | 0 | continue; /* while */ |
1672 | 0 | } |
1673 | | /* |
1674 | | * For non-pattern like evaluation like XML Schema IDCs |
1675 | | * or traditional XPath expressions, this will match if |
1676 | | * we are at the first level only, otherwise on every level. |
1677 | | */ |
1678 | 235k | if ((nodeType != XML_ATTRIBUTE_NODE) && |
1679 | 184k | (((stream->flags & XML_PATTERN_NOTPATTERN) == 0) || |
1680 | 183k | (stream->level == 0))) { |
1681 | 42.3k | ret = 1; |
1682 | 42.3k | } |
1683 | 235k | stream->level++; |
1684 | 235k | goto stream_next; |
1685 | 235k | } |
1686 | 931k | if (stream->blockLevel != -1) { |
1687 | | /* |
1688 | | * Skip blocked expressions. |
1689 | | */ |
1690 | 331k | stream->level++; |
1691 | 331k | goto stream_next; |
1692 | 331k | } |
1693 | | |
1694 | 599k | if ((nodeType != XML_ELEMENT_NODE) && |
1695 | 143k | (nodeType != XML_ATTRIBUTE_NODE) && |
1696 | 0 | ((comp->flags & XML_STREAM_FINAL_IS_ANY_NODE) == 0)) { |
1697 | | /* |
1698 | | * No need to process nodes of other types if we don't |
1699 | | * resolve to those types. |
1700 | | * TODO: Do we need to block the context here? |
1701 | | */ |
1702 | 0 | stream->level++; |
1703 | 0 | goto stream_next; |
1704 | 0 | } |
1705 | | |
1706 | | /* |
1707 | | * Check evolution of existing states |
1708 | | */ |
1709 | 599k | i = 0; |
1710 | 599k | m = stream->nbState; |
1711 | 737k | while (i < m) { |
1712 | 137k | if ((comp->flags & XML_STREAM_DESC) == 0) { |
1713 | | /* |
1714 | | * If there is no "//", then only the last |
1715 | | * added state is of interest. |
1716 | | */ |
1717 | 5.24k | stepNr = stream->states[2 * (stream->nbState -1)]; |
1718 | | /* |
1719 | | * TODO: Security check, should not happen, remove it. |
1720 | | */ |
1721 | 5.24k | if (stream->states[(2 * (stream->nbState -1)) + 1] < |
1722 | 5.24k | stream->level) { |
1723 | 0 | return (-1); |
1724 | 0 | } |
1725 | 5.24k | desc = 0; |
1726 | | /* loop-stopper */ |
1727 | 5.24k | i = m; |
1728 | 132k | } else { |
1729 | | /* |
1730 | | * If there are "//", then we need to process every "//" |
1731 | | * occurring in the states, plus any other state for this |
1732 | | * level. |
1733 | | */ |
1734 | 132k | stepNr = stream->states[2 * i]; |
1735 | | |
1736 | | /* TODO: should not happen anymore: dead states */ |
1737 | 132k | if (stepNr < 0) |
1738 | 0 | goto next_state; |
1739 | | |
1740 | 132k | tmp = stream->states[(2 * i) + 1]; |
1741 | | |
1742 | | /* skip new states just added */ |
1743 | 132k | if (tmp > stream->level) |
1744 | 0 | goto next_state; |
1745 | | |
1746 | | /* skip states at ancestor levels, except if "//" */ |
1747 | 132k | desc = comp->steps[stepNr].flags & XML_STREAM_STEP_DESC; |
1748 | 132k | if ((tmp < stream->level) && (!desc)) |
1749 | 117k | goto next_state; |
1750 | 132k | } |
1751 | | /* |
1752 | | * Check for correct node-type. |
1753 | | */ |
1754 | 20.3k | step = comp->steps[stepNr]; |
1755 | 20.3k | if (step.nodeType != nodeType) { |
1756 | 5.43k | if (step.nodeType == XML_ATTRIBUTE_NODE) { |
1757 | | /* |
1758 | | * Block this expression for deeper evaluation. |
1759 | | */ |
1760 | 292 | if ((comp->flags & XML_STREAM_DESC) == 0) |
1761 | 225 | stream->blockLevel = stream->level +1; |
1762 | 292 | goto next_state; |
1763 | 5.14k | } else if (step.nodeType != XML_STREAM_ANY_NODE) |
1764 | 5.14k | goto next_state; |
1765 | 5.43k | } |
1766 | | /* |
1767 | | * Compare local/namespace-name. |
1768 | | */ |
1769 | 14.9k | match = 0; |
1770 | 14.9k | if (step.nodeType == XML_STREAM_ANY_NODE) { |
1771 | 0 | match = 1; |
1772 | 14.9k | } else if (step.name == NULL) { |
1773 | 6.68k | if (step.ns == NULL) { |
1774 | | /* |
1775 | | * This lets through all elements/attributes. |
1776 | | */ |
1777 | 6.34k | match = 1; |
1778 | 6.34k | } else if (ns != NULL) |
1779 | 0 | match = xmlStrEqual(step.ns, ns); |
1780 | 8.26k | } else if (((step.ns != NULL) == (ns != NULL)) && |
1781 | 8.02k | (name != NULL) && |
1782 | 8.02k | (step.name[0] == name[0]) && |
1783 | 1.07k | xmlStrEqual(step.name, name) && |
1784 | 352 | ((step.ns == ns) || xmlStrEqual(step.ns, ns))) |
1785 | 352 | { |
1786 | 352 | match = 1; |
1787 | 352 | } |
1788 | 14.9k | if (match) { |
1789 | 6.69k | final = step.flags & XML_STREAM_STEP_FINAL; |
1790 | 6.69k | if (final) { |
1791 | 5.68k | ret = 1; |
1792 | 5.68k | } else if (xmlStreamCtxtAddState(stream, stepNr + 1, |
1793 | 1.01k | stream->level + 1) < 0) { |
1794 | 1 | return(-1); |
1795 | 1 | } |
1796 | 6.69k | if ((ret != 1) && (step.flags & XML_STREAM_STEP_IN_SET)) { |
1797 | | /* |
1798 | | * Check if we have a special case like "foo/bar//.", where |
1799 | | * "foo" is selected as well. |
1800 | | */ |
1801 | 4 | ret = 1; |
1802 | 4 | } |
1803 | 6.69k | } |
1804 | 14.9k | if (((comp->flags & XML_STREAM_DESC) == 0) && |
1805 | 4.86k | ((! match) || final)) { |
1806 | | /* |
1807 | | * Mark this expression as blocked for any evaluation at |
1808 | | * deeper levels. Note that this includes "/foo" |
1809 | | * expressions if the *pattern* behaviour is used. |
1810 | | */ |
1811 | 4.29k | stream->blockLevel = stream->level +1; |
1812 | 4.29k | } |
1813 | 137k | next_state: |
1814 | 137k | i++; |
1815 | 137k | } |
1816 | | |
1817 | 599k | stream->level++; |
1818 | | |
1819 | | /* |
1820 | | * Re/enter the expression. |
1821 | | * Don't reenter if it's an absolute expression like "/foo", |
1822 | | * except "//foo". |
1823 | | */ |
1824 | 599k | step = comp->steps[0]; |
1825 | 599k | if (step.flags & XML_STREAM_STEP_ROOT) |
1826 | 3.21k | goto stream_next; |
1827 | | |
1828 | 596k | desc = step.flags & XML_STREAM_STEP_DESC; |
1829 | 596k | if (stream->flags & XML_PATTERN_NOTPATTERN) { |
1830 | | /* |
1831 | | * Re/enter the expression if it is a "descendant" one, |
1832 | | * or if we are at the 1st level of evaluation. |
1833 | | */ |
1834 | | |
1835 | 592k | if (stream->level == 1) { |
1836 | 73.1k | if (XML_STREAM_XS_IDC(stream)) { |
1837 | | /* |
1838 | | * XS-IDC: The missing "self::node()" will always |
1839 | | * match the first given node. |
1840 | | */ |
1841 | 73.1k | goto stream_next; |
1842 | 73.1k | } else |
1843 | 0 | goto compare; |
1844 | 73.1k | } |
1845 | | /* |
1846 | | * A "//" is always reentrant. |
1847 | | */ |
1848 | 519k | if (desc) |
1849 | 192k | goto compare; |
1850 | | |
1851 | | /* |
1852 | | * XS-IDC: Process the 2nd level, since the missing |
1853 | | * "self::node()" is responsible for the 2nd level being |
1854 | | * the real start level. |
1855 | | */ |
1856 | 326k | if ((stream->level == 2) && XML_STREAM_XS_IDC(stream)) |
1857 | 80.9k | goto compare; |
1858 | | |
1859 | 245k | goto stream_next; |
1860 | 326k | } |
1861 | | |
1862 | 277k | compare: |
1863 | | /* |
1864 | | * Check expected node-type. |
1865 | | */ |
1866 | 277k | if (step.nodeType != nodeType) { |
1867 | 75.4k | if (nodeType == XML_ATTRIBUTE_NODE) |
1868 | 60.9k | goto stream_next; |
1869 | 14.4k | else if (step.nodeType != XML_STREAM_ANY_NODE) |
1870 | 14.2k | goto stream_next; |
1871 | 75.4k | } |
1872 | | /* |
1873 | | * Compare local/namespace-name. |
1874 | | */ |
1875 | 202k | match = 0; |
1876 | 202k | if (step.nodeType == XML_STREAM_ANY_NODE) { |
1877 | 200 | match = 1; |
1878 | 201k | } else if (step.name == NULL) { |
1879 | 12.2k | if (step.ns == NULL) { |
1880 | | /* |
1881 | | * This lets through all elements/attributes. |
1882 | | */ |
1883 | 12.0k | match = 1; |
1884 | 12.0k | } else if (ns != NULL) |
1885 | 0 | match = xmlStrEqual(step.ns, ns); |
1886 | 189k | } else if (((step.ns != NULL) == (ns != NULL)) && |
1887 | 189k | (name != NULL) && |
1888 | 189k | (step.name[0] == name[0]) && |
1889 | 117k | xmlStrEqual(step.name, name) && |
1890 | 88.0k | ((step.ns == ns) || xmlStrEqual(step.ns, ns))) |
1891 | 88.0k | { |
1892 | 88.0k | match = 1; |
1893 | 88.0k | } |
1894 | 202k | final = step.flags & XML_STREAM_STEP_FINAL; |
1895 | 202k | if (match) { |
1896 | 100k | if (final) { |
1897 | 88.8k | ret = 1; |
1898 | 88.8k | } else if (xmlStreamCtxtAddState(stream, 1, stream->level) < 0) { |
1899 | 4 | return(-1); |
1900 | 4 | } |
1901 | 100k | if ((ret != 1) && (step.flags & XML_STREAM_STEP_IN_SET)) { |
1902 | | /* |
1903 | | * Check if we have a special case like "foo//.", where |
1904 | | * "foo" is selected as well. |
1905 | | */ |
1906 | 6 | ret = 1; |
1907 | 6 | } |
1908 | 100k | } |
1909 | 202k | if (((comp->flags & XML_STREAM_DESC) == 0) && |
1910 | 57.5k | ((! match) || final)) { |
1911 | | /* |
1912 | | * Mark this expression as blocked for any evaluation at |
1913 | | * deeper levels. |
1914 | | */ |
1915 | 57.1k | stream->blockLevel = stream->level; |
1916 | 57.1k | } |
1917 | | |
1918 | 1.16M | stream_next: |
1919 | 1.16M | stream = stream->next; |
1920 | 1.16M | } /* while stream != NULL */ |
1921 | | |
1922 | 941k | return(ret); |
1923 | 941k | } |
1924 | | |
1925 | | /** |
1926 | | * Push a new element onto the stream. NOTE: if the call to #xmlPatterncompile |
1927 | | * indicated a dictionary, then strings for name and ns will be expected |
1928 | | * to come from the dictionary. |
1929 | | * Both `name` and `ns` being NULL means the / i.e. the root of the document. |
1930 | | * This can also act as a reset. |
1931 | | * Otherwise the function will act as if it has been given an element-node: it forwards to xmlStreamPushInternal with XML_ELEMENT_NODE. |
1932 | | * |
1933 | | * @param stream the stream context |
1934 | | * @param name the current name |
1935 | | * @param ns the namespace name |
1936 | | * @returns -1 in case of error, 1 if the current state in the stream is a |
1937 | | * match and 0 otherwise (the value is the one returned by xmlStreamPushInternal). |
1938 | | */ |
1939 | | int |
1940 | | xmlStreamPush(xmlStreamCtxt *stream, |
1941 | 753k | const xmlChar *name, const xmlChar *ns) { |
1942 | 753k | return (xmlStreamPushInternal(stream, name, ns, XML_ELEMENT_NODE)); |
1943 | 753k | } |
1944 | | |
1945 | | /** |
1946 | | * Push new data onto the stream. NOTE: if the call to #xmlPatterncompile |
1947 | | * indicated a dictionary, then strings for name and ns will be expected |
1948 | | * to come from the dictionary. |
1949 | | * Both `name` and `ns` being NULL means the / i.e. the root of the document. |
1950 | | * This can also act as a reset. |
1951 | | * Unlike #xmlStreamPush, this function can be fed with nodes of type: |
1952 | | * element-, attribute-, text-, cdata-section-, comment- and |
1953 | | * processing-instruction-node. |
1954 | | * |
1955 | | * @param stream the stream context |
1956 | | * @param name the current name |
1957 | | * @param ns the namespace name |
1958 | | * @param nodeType the type of the node being pushed, passed through unchanged to xmlStreamPushInternal |
1959 | | * @returns -1 in case of error, 1 if the current state in the stream is a |
1960 | | * match and 0 otherwise. |
1961 | | */ |
1962 | | int |
1963 | | xmlStreamPushNode(xmlStreamCtxt *stream, |
1964 | | const xmlChar *name, const xmlChar *ns, |
1965 | | int nodeType) |
1966 | 0 | { |
1967 | 0 | return (xmlStreamPushInternal(stream, name, ns, |
1968 | 0 | nodeType)); |
1969 | 0 | } |
1970 | | |
1971 | | /** |
1972 | | * Push new attribute data onto the stream. |
1973 | | * |
1974 | | * NOTE: If the call to #xmlPatterncompile indicated a dictionary, |
1975 | | * then strings for `name` and `ns` will be expected to come from |
1976 | | * the dictionary. |
1977 | | * |
1978 | | * Both `name` and `ns` being NULL means the root of the document. |
1979 | | * This can also act as a reset. Otherwise the function will act as |
1980 | | * if it has been given an attribute-node: it forwards to xmlStreamPushInternal with XML_ATTRIBUTE_NODE. |
1981 | | * |
1982 | | * @param stream the stream context |
1983 | | * @param name the current name |
1984 | | * @param ns the namespace name |
1985 | | * @returns -1 in case of error, 1 if the current state in the stream |
1986 | | * is a match and 0 otherwise. |
1987 | | */ |
1988 | | int |
1989 | | xmlStreamPushAttr(xmlStreamCtxt *stream, |
1990 | 187k | const xmlChar *name, const xmlChar *ns) { |
1991 | 187k | return (xmlStreamPushInternal(stream, name, ns, XML_ATTRIBUTE_NODE)); |
1992 | 187k | } |
1993 | | |
1994 | | /** |
1995 | | * Pop one level from the stream. This is applied to every stream context reachable through the `next` links. |
1996 | | * |
1997 | | * @param stream the stream context |
1998 | | * @returns -1 in case of error (`stream` is NULL), 0 otherwise. |
1999 | | */ |
2000 | | int |
2001 | 914k | xmlStreamPop(xmlStreamCtxt *stream) { |
2002 | 914k | int i, lev; |
2003 | | |
2004 | 914k | if (stream == NULL) |
2005 | 0 | return(-1); |
2006 | 2.03M | while (stream != NULL) { |
2007 | | /* |
2008 | | * Reset block-level if the block was set at the level being left. |
2009 | | */ |
2010 | 1.12M | if (stream->blockLevel == stream->level) |
2011 | 61.0k | stream->blockLevel = -1; |
2012 | | |
2013 | | /* |
2014 | | * stream->level can be zero when XML_FINAL_IS_ANY_NODE is set |
2015 | | * (see the thread at |
2016 | | * http://mail.gnome.org/archives/xslt/2008-July/msg00027.html) |
2017 | | */ |
2018 | 1.12M | if (stream->level) |
2019 | 1.12M | stream->level--; |
2020 | | /* |
2021 | | * Check evolution of existing states, scanning from the last stored one backwards |
2022 | | */ |
2023 | 1.13M | for (i = stream->nbState -1; i >= 0; i--) { |
2024 | | /* discard obsoleted states: drop every trailing state whose stored level is above the new current level and stop at the first one that is not */ |
2025 | 40.2k | lev = stream->states[(2 * i) + 1]; |
2026 | 40.2k | if (lev > stream->level) |
2027 | 11.3k | stream->nbState--; |
2028 | 40.2k | if (lev <= stream->level) |
2029 | 28.9k | break; |
2030 | 40.2k | } |
2031 | 1.12M | stream = stream->next; |
2032 | 1.12M | } |
2033 | 914k | return(0); |
2034 | 914k | } |
2035 | | |
2036 | | /** |
2037 | | * Query if the streaming pattern additionally needs to be fed with |
2038 | | * text-, cdata-section-, comment- and processing-instruction-nodes. |
2039 | | * If the result is 0 then only element-nodes and attribute-nodes |
2040 | | * need to be pushed. |
2041 | | * |
2042 | | * @param streamCtxt the stream context (head of a list linked through `next`) |
2043 | | * @returns 1 in case of need of nodes of the above described types, i.e. as soon as one context in the list has XML_STREAM_FINAL_IS_ANY_NODE set in its compiled stream flags, |
2044 | | * 0 otherwise. -1 on API errors (`streamCtxt` is NULL). |
2045 | | */ |
2046 | | int |
2047 | | xmlStreamWantsAnyNode(xmlStreamCtxt *streamCtxt) |
2048 | 0 | { |
2049 | 0 | if (streamCtxt == NULL) |
2050 | 0 | return(-1); |
2051 | 0 | while (streamCtxt != NULL) { |
2052 | 0 | if (streamCtxt->comp->flags & XML_STREAM_FINAL_IS_ANY_NODE) |
2053 | 0 | return(1); |
2054 | 0 | streamCtxt = streamCtxt->next; |
2055 | 0 | } |
2056 | 0 | return(0); |
2057 | 0 | } |
2058 | | |
2059 | | /************************************************************************ |
2060 | | * * |
2061 | | * The public interfaces * |
2062 | | * * |
2063 | | ************************************************************************/ |
2064 | | |
2065 | | /** |
2066 | | * Compile a pattern. The pattern string is split at each | character; every alternative is compiled into its own xmlPattern and the results are chained through their `next` fields. |
2067 | | * |
2068 | | * @since 2.13.0 |
2069 | | * |
2070 | | * @param pattern the pattern to compile |
2071 | | * @param dict an optional dictionary for interned strings |
2072 | | * @param flags compilation flags, see xmlPatternFlags |
2073 | | * @param namespaces the prefix definitions, array of [URI, prefix] or NULL |
2074 | | * @param patternOut output pattern (head of the list of compiled alternatives); set to NULL on error. If this pointer itself is NULL the function returns 1 without doing anything. |
2075 | | * @returns 0 on success, 1 on error, -1 if a memory allocation failed. An empty pattern string returns 0 with `*patternOut` set to NULL. |
2076 | | */ |
2077 | | int |
2078 | | xmlPatternCompileSafe(const xmlChar *pattern, xmlDict *dict, int flags, |
2079 | 30.4k | const xmlChar **namespaces, xmlPattern **patternOut) { |
2080 | 30.4k | xmlPatternPtr ret = NULL, cur; |
2081 | 30.4k | xmlPatParserContextPtr ctxt = NULL; |
2082 | 30.4k | const xmlChar *or, *start; |
2083 | 30.4k | xmlChar *tmp = NULL; |
2084 | 30.4k | int type = 0; |
2085 | 30.4k | int streamable = 1; |
2086 | 30.4k | int error; |
2087 | | |
2088 | 30.4k | if (patternOut == NULL) |
2089 | 0 | return(1); |
2090 | | |
2091 | 30.4k | if (pattern == NULL) { |
2092 | 0 | error = 1; |
2093 | 0 | goto error; |
2094 | 0 | } |
2095 | | |
2096 | 30.4k | start = pattern; |
2097 | 30.4k | or = start; |
2098 | 73.0k | while (*or != 0) { |
2099 | 65.3k | tmp = NULL; |
2100 | 31.9M | while ((*or != 0) && (*or != '|')) or++; /* advance to the end of the current alternative */ |
2101 | 65.3k | if (*or == 0) |
2102 | 19.5k | ctxt = xmlNewPatParserContext(start, dict, namespaces); |
2103 | 45.8k | else { |
2104 | 45.8k | tmp = xmlStrndup(start, or - start); /* copy of this alternative only, freed once it has been compiled */ |
2105 | 45.8k | if (tmp != NULL) { |
2106 | 45.8k | ctxt = xmlNewPatParserContext(tmp, dict, namespaces); |
2107 | 45.8k | } |
2108 | 45.8k | or++; |
2109 | 45.8k | } |
2110 | 65.3k | if (ctxt == NULL) { |
2111 | 64 | error = -1; |
2112 | 64 | goto error; |
2113 | 64 | } |
2114 | 65.3k | cur = xmlNewPattern(); |
2115 | 65.3k | if (cur == NULL) { |
2116 | 9 | error = -1; |
2117 | 9 | goto error; |
2118 | 9 | } |
2119 | | /* |
2120 | | * Assign string dict; xmlDictReference is called on it for each pattern that stores it. |
2121 | | */ |
2122 | 65.3k | if (dict) { |
2123 | 0 | cur->dict = dict; |
2124 | 0 | xmlDictReference(dict); |
2125 | 0 | } |
2126 | 65.3k | if (ret == NULL) |
2127 | 30.2k | ret = cur; |
2128 | 35.0k | else { |
2129 | 35.0k | cur->next = ret->next; /* insert the new pattern right after the head of the list */ |
2130 | 35.0k | ret->next = cur; |
2131 | 35.0k | } |
2132 | 65.3k | cur->flags = flags; |
2133 | 65.3k | ctxt->comp = cur; |
2134 | | |
2135 | 65.3k | if (XML_STREAM_XS_IDC(cur)) |
2136 | 50.9k | xmlCompileIDCXPathPath(ctxt); |
2137 | 14.3k | else |
2138 | 14.3k | xmlCompilePathPattern(ctxt); |
2139 | 65.3k | if (ctxt->error != 0) { |
2140 | 22.6k | error = ctxt->error; |
2141 | 22.6k | goto error; |
2142 | 22.6k | } |
2143 | 42.6k | xmlFreePatParserContext(ctxt); |
2144 | 42.6k | ctxt = NULL; |
2145 | | |
2146 | | |
2147 | 42.6k | if (streamable) { /* streaming is given up once one alternative has PAT_FROM_ROOT and another PAT_FROM_CUR */ |
2148 | 41.9k | if (type == 0) { |
2149 | 20.9k | type = cur->flags & (PAT_FROM_ROOT | PAT_FROM_CUR); |
2150 | 21.0k | } else if (type == PAT_FROM_ROOT) { |
2151 | 6.51k | if (cur->flags & PAT_FROM_CUR) |
2152 | 21 | streamable = 0; |
2153 | 14.5k | } else if (type == PAT_FROM_CUR) { |
2154 | 14.5k | if (cur->flags & PAT_FROM_ROOT) |
2155 | 11 | streamable = 0; |
2156 | 14.5k | } |
2157 | 41.9k | } |
2158 | 42.6k | if (streamable) { |
2159 | 41.9k | error = xmlStreamCompile(cur); |
2160 | 41.9k | if (error != 0) |
2161 | 11 | goto error; |
2162 | 41.9k | } |
2163 | 42.6k | error = xmlReversePattern(cur); |
2164 | 42.6k | if (error != 0) |
2165 | 3 | goto error; |
2166 | 42.6k | if (tmp != NULL) { |
2167 | 35.1k | xmlFree(tmp); |
2168 | 35.1k | tmp = NULL; |
2169 | 35.1k | } |
2170 | 42.6k | start = or; |
2171 | 42.6k | } |
2172 | 7.70k | if (streamable == 0) { /* not streamable as a whole: free the streams already compiled for individual alternatives */ |
2173 | 30 | cur = ret; |
2174 | 1.01k | while (cur != NULL) { |
2175 | 988 | if (cur->stream != NULL) { |
2176 | 260 | xmlFreeStreamComp(cur->stream); |
2177 | 260 | cur->stream = NULL; |
2178 | 260 | } |
2179 | 988 | cur = cur->next; |
2180 | 988 | } |
2181 | 30 | } |
2182 | | |
2183 | 7.70k | *patternOut = ret; |
2184 | 7.70k | return(0); |
2185 | 22.7k | error: |
2186 | 22.7k | if (ctxt != NULL) xmlFreePatParserContext(ctxt); |
2187 | 22.7k | if (ret != NULL) xmlFreePattern(ret); |
2188 | 22.7k | if (tmp != NULL) xmlFree(tmp); |
2189 | 22.7k | *patternOut = NULL; |
2190 | 22.7k | return(error); |
2191 | 30.4k | } |
2192 | | |
2193 | | /** |
2194 | | * Compile a pattern. Wrapper around xmlPatternCompileSafe that discards its error code and only returns the resulting pattern. |
2195 | | * |
2196 | | * @param pattern the pattern to compile |
2197 | | * @param dict an optional dictionary for interned strings |
2198 | | * @param flags compilation flags, see xmlPatternFlags |
2199 | | * @param namespaces the prefix definitions, array of [URI, prefix] or NULL |
2200 | | * @returns the compiled form of the pattern or NULL in case of error |
2201 | | */ |
2202 | | xmlPattern * |
2203 | | xmlPatterncompile(const xmlChar *pattern, xmlDict *dict, int flags, |
2204 | 28.9k | const xmlChar **namespaces) { |
2205 | 28.9k | xmlPatternPtr ret; |
2206 | 28.9k | xmlPatternCompileSafe(pattern, dict, flags, namespaces, &ret); |
2207 | 28.9k | return(ret); |
2208 | 28.9k | } |
2209 | | |
2210 | | /** |
2211 | | * Test whether the node matches the pattern. Each pattern in the list linked through `next` is tried in turn with xmlPatMatch and the first non-zero result is returned. |
2212 | | * |
2213 | | * @param comp the precompiled pattern |
2214 | | * @param node a node |
2215 | | * @returns 1 if it matches, 0 if it doesn't and -1 in case of failure (including `comp` or `node` being NULL) |
2216 | | */ |
2217 | | int |
2218 | | xmlPatternMatch(xmlPattern *comp, xmlNode *node) |
2219 | 394 | { |
2220 | 394 | int ret = 0; |
2221 | | |
2222 | 394 | if ((comp == NULL) || (node == NULL)) |
2223 | 0 | return(-1); |
2224 | | |
2225 | 5.49k | while (comp != NULL) { |
2226 | 5.19k | ret = xmlPatMatch(comp, node); |
2227 | 5.19k | if (ret != 0) |
2228 | 96 | return(ret); |
2229 | 5.10k | comp = comp->next; |
2230 | 5.10k | } |
2231 | 298 | return(ret); |
2232 | 394 | } |
2233 | | |
2234 | | /** |
2235 | | * Get a streaming context for that pattern. One context is created per pattern in the list and the contexts are chained through their `next` fields. |
2236 | | * Use #xmlFreeStreamCtxt to free the context. |
2237 | | * |
2238 | | * @param comp the precompiled pattern |
2239 | | * @returns a pointer to the context or NULL in case of failure (`comp` is NULL, a pattern in the list has no compiled stream, or xmlNewStreamCtxt failed) |
2240 | | */ |
2241 | | xmlStreamCtxt * |
2242 | | xmlPatternGetStreamCtxt(xmlPattern *comp) |
2243 | 104k | { |
2244 | 104k | xmlStreamCtxtPtr ret = NULL, cur; |
2245 | | |
2246 | 104k | if ((comp == NULL) || (comp->stream == NULL)) |
2247 | 20 | return(NULL); |
2248 | | |
2249 | 227k | while (comp != NULL) { |
2250 | 123k | if (comp->stream == NULL) |
2251 | 13 | goto failed; |
2252 | 123k | cur = xmlNewStreamCtxt(comp->stream); |
2253 | 123k | if (cur == NULL) |
2254 | 26 | goto failed; |
2255 | 123k | if (ret == NULL) |
2256 | 104k | ret = cur; |
2257 | 18.2k | else { |
2258 | 18.2k | cur->next = ret->next; /* insert the new context right after the head of the list */ |
2259 | 18.2k | ret->next = cur; |
2260 | 18.2k | } |
2261 | 123k | cur->flags = comp->flags; |
2262 | 123k | comp = comp->next; |
2263 | 123k | } |
2264 | 104k | return(ret); |
2265 | 39 | failed: |
2266 | 39 | xmlFreeStreamCtxt(ret); |
2267 | 39 | return(NULL); |
2268 | 104k | } |
2269 | | |
2270 | | /** |
2271 | | * Check if the pattern is streamable, i.e. #xmlPatternGetStreamCtxt |
2272 | | * should work. |
2273 | | * |
2274 | | * @param comp the precompiled pattern |
2275 | | * @returns 1 if streamable (every pattern in the list has a compiled stream), 0 if not and -1 in case of error (`comp` is NULL). |
2276 | | */ |
2277 | | int |
2278 | 0 | xmlPatternStreamable(xmlPattern *comp) { |
2279 | 0 | if (comp == NULL) |
2280 | 0 | return(-1); |
2281 | 0 | while (comp != NULL) { |
2282 | 0 | if (comp->stream == NULL) |
2283 | 0 | return(0); |
2284 | 0 | comp = comp->next; |
2285 | 0 | } |
2286 | 0 | return(1); |
2287 | 0 | } |
2288 | | |
2289 | | /** |
2290 | | * Check the maximum depth reachable by a pattern, computed as the largest number of stream steps among the patterns in the list. |
2291 | | * |
2292 | | * @param comp the precompiled pattern |
2293 | | * @returns -2 if no limit (using //, i.e. some step has XML_STREAM_STEP_DESC set), otherwise the depth, |
2294 | | * and -1 in case of error (`comp` is NULL or a pattern in the list has no compiled stream) |
2295 | | */ |
2296 | | int |
2297 | 0 | xmlPatternMaxDepth(xmlPattern *comp) { |
2298 | 0 | int ret = 0, i; |
2299 | 0 | if (comp == NULL) |
2300 | 0 | return(-1); |
2301 | 0 | while (comp != NULL) { |
2302 | 0 | if (comp->stream == NULL) |
2303 | 0 | return(-1); |
2304 | 0 | for (i = 0;i < comp->stream->nbStep;i++) |
2305 | 0 | if (comp->stream->steps[i].flags & XML_STREAM_STEP_DESC) |
2306 | 0 | return(-2); |
2307 | 0 | if (comp->stream->nbStep > ret) |
2308 | 0 | ret = comp->stream->nbStep; |
2309 | 0 | comp = comp->next; |
2310 | 0 | } |
2311 | 0 | return(ret); |
2312 | 0 | } |
2313 | | |
2314 | | /** |
2315 | | * Check the minimum depth reachable by a pattern, computed as the smallest number of stream steps among the patterns in the list; 0 means the / or . are |
2316 | | * part of the set. |
2317 | | * |
2318 | | * @param comp the precompiled pattern |
2319 | | * @returns -1 in case of error (`comp` is NULL or a pattern in the list has no compiled stream), otherwise the depth. |
2320 | | */ |
2321 | | int |
2322 | 0 | xmlPatternMinDepth(xmlPattern *comp) { |
2323 | 0 | int ret = 12345678; /* large start value for the minimum search below */ |
2324 | 0 | if (comp == NULL) |
2325 | 0 | return(-1); |
2326 | 0 | while (comp != NULL) { |
2327 | 0 | if (comp->stream == NULL) |
2328 | 0 | return(-1); |
2329 | 0 | if (comp->stream->nbStep < ret) |
2330 | 0 | ret = comp->stream->nbStep; |
2331 | 0 | if (ret == 0) |
2332 | 0 | return(0); |
2333 | 0 | comp = comp->next; |
2334 | 0 | } |
2335 | 0 | return(ret); |
2336 | 0 | } |
2337 | | |
2338 | | /** |
2339 | | * Check if the pattern must be looked at from the root, i.e. whether some pattern in the list has the PAT_FROM_ROOT flag set. |
2340 | | * |
2341 | | * @param comp the precompiled pattern |
2342 | | * @returns 1 if true, 0 if false and -1 in case of error (`comp` is NULL, or a pattern without a compiled stream is reached before a match) |
2343 | | */ |
2344 | | int |
2345 | 0 | xmlPatternFromRoot(xmlPattern *comp) { |
2346 | 0 | if (comp == NULL) |
2347 | 0 | return(-1); |
2348 | 0 | while (comp != NULL) { |
2349 | 0 | if (comp->stream == NULL) |
2350 | 0 | return(-1); |
2351 | 0 | if (comp->flags & PAT_FROM_ROOT) |
2352 | 0 | return(1); |
2353 | 0 | comp = comp->next; |
2354 | 0 | } |
2355 | 0 | return(0); |
2356 | |
|
2357 | 0 | } |
2358 | | |
2359 | | #endif /* LIBXML_PATTERN_ENABLED */ |