/src/mozilla-central/parser/expat/lib/xmltok_impl.c
Line | Count | Source (jump to first uncovered line) |
1 | | /* Copyright (c) 1998, 1999 Thai Open Source Software Center Ltd |
2 | | See the file COPYING for copying permission. |
3 | | */ |
4 | | |
5 | | #ifndef IS_INVALID_CHAR |
6 | 0 | #define IS_INVALID_CHAR(enc, ptr, n) (0) |
7 | | #endif |
8 | | |
9 | | #define INVALID_LEAD_CASE(n, ptr, nextTokPtr) \ |
10 | 0 | case BT_LEAD ## n: \ |
11 | 0 | if (end - ptr < n) \ |
12 | 0 | return XML_TOK_PARTIAL_CHAR; \ |
13 | 0 | if (IS_INVALID_CHAR(enc, ptr, n)) { \ |
14 | 0 | *(nextTokPtr) = (ptr); \ |
15 | 0 | return XML_TOK_INVALID; \ |
16 | 0 | } \ |
17 | 0 | ptr += n; \ |
18 | 0 | break; |
19 | | |
20 | | #define INVALID_CASES(ptr, nextTokPtr) \ |
21 | 0 | INVALID_LEAD_CASE(2, ptr, nextTokPtr) \ |
22 | 0 | INVALID_LEAD_CASE(3, ptr, nextTokPtr) \ |
23 | 0 | INVALID_LEAD_CASE(4, ptr, nextTokPtr) \ |
24 | 0 | case BT_NONXML: \ |
25 | 0 | case BT_MALFORM: \ |
26 | 0 | case BT_TRAIL: \ |
27 | 0 | *(nextTokPtr) = (ptr); \ |
28 | 0 | return XML_TOK_INVALID; |
29 | | |
30 | | #define CHECK_NAME_CASE(n, enc, ptr, end, nextTokPtr) \ |
31 | 0 | case BT_LEAD ## n: \ |
32 | 0 | if (end - ptr < n) \ |
33 | 0 | return XML_TOK_PARTIAL_CHAR; \ |
34 | 0 | if (!IS_NAME_CHAR(enc, ptr, n)) { \ |
35 | 0 | *nextTokPtr = ptr; \ |
36 | 0 | return XML_TOK_INVALID; \ |
37 | 0 | } \ |
38 | 0 | ptr += n; \ |
39 | 0 | break; |
40 | | |
41 | | #define CHECK_NAME_CASES(enc, ptr, end, nextTokPtr) \ |
42 | 0 | case BT_NONASCII: \ |
43 | 0 | if (!IS_NAME_CHAR_MINBPC(enc, ptr)) { \ |
44 | 0 | *nextTokPtr = ptr; \ |
45 | 0 | return XML_TOK_INVALID; \ |
46 | 0 | } \ |
47 | 0 | case BT_NMSTRT: \ |
48 | 0 | case BT_HEX: \ |
49 | 0 | case BT_DIGIT: \ |
50 | 0 | case BT_NAME: \ |
51 | 0 | case BT_MINUS: \ |
52 | 0 | ptr += MINBPC(enc); \ |
53 | 0 | break; \ |
54 | 0 | CHECK_NAME_CASE(2, enc, ptr, end, nextTokPtr) \ |
55 | 0 | CHECK_NAME_CASE(3, enc, ptr, end, nextTokPtr) \ |
56 | 0 | CHECK_NAME_CASE(4, enc, ptr, end, nextTokPtr) |
57 | | |
58 | | #define CHECK_NMSTRT_CASE(n, enc, ptr, end, nextTokPtr) \ |
59 | 0 | case BT_LEAD ## n: \ |
60 | 0 | if (end - ptr < n) \ |
61 | 0 | return XML_TOK_PARTIAL_CHAR; \ |
62 | 0 | if (!IS_NMSTRT_CHAR(enc, ptr, n)) { \ |
63 | 0 | *nextTokPtr = ptr; \ |
64 | 0 | return XML_TOK_INVALID; \ |
65 | 0 | } \ |
66 | 0 | ptr += n; \ |
67 | 0 | break; |
68 | | |
69 | | #define CHECK_NMSTRT_CASES(enc, ptr, end, nextTokPtr) \ |
70 | 0 | case BT_NONASCII: \ |
71 | 0 | if (!IS_NMSTRT_CHAR_MINBPC(enc, ptr)) { \ |
72 | 0 | *nextTokPtr = ptr; \ |
73 | 0 | return XML_TOK_INVALID; \ |
74 | 0 | } \ |
75 | 0 | case BT_NMSTRT: \ |
76 | 0 | case BT_HEX: \ |
77 | 0 | ptr += MINBPC(enc); \ |
78 | 0 | break; \ |
79 | 0 | CHECK_NMSTRT_CASE(2, enc, ptr, end, nextTokPtr) \ |
80 | 0 | CHECK_NMSTRT_CASE(3, enc, ptr, end, nextTokPtr) \ |
81 | 0 | CHECK_NMSTRT_CASE(4, enc, ptr, end, nextTokPtr) |
82 | | |
83 | | #ifndef PREFIX |
84 | | #define PREFIX(ident) ident |
85 | | #endif |
86 | | |
87 | | /* ptr points to character following "<!-" */ |
88 | | |
89 | | static int PTRCALL |
90 | | PREFIX(scanComment)(const ENCODING *enc, const char *ptr, |
91 | | const char *end, const char **nextTokPtr) |
92 | 0 | { |
93 | 0 | if (ptr != end) { |
94 | 0 | if (!CHAR_MATCHES(enc, ptr, ASCII_MINUS)) { |
95 | 0 | *nextTokPtr = ptr; |
96 | 0 | return XML_TOK_INVALID; |
97 | 0 | } |
98 | 0 | ptr += MINBPC(enc); |
99 | 0 | while (ptr != end) { |
100 | 0 | switch (BYTE_TYPE(enc, ptr)) { |
101 | 0 | INVALID_CASES(ptr, nextTokPtr) |
102 | 0 | case BT_MINUS: |
103 | 0 | if ((ptr += MINBPC(enc)) == end) |
104 | 0 | return XML_TOK_PARTIAL; |
105 | 0 | if (CHAR_MATCHES(enc, ptr, ASCII_MINUS)) { |
106 | 0 | if ((ptr += MINBPC(enc)) == end) |
107 | 0 | return XML_TOK_PARTIAL; |
108 | 0 | if (!CHAR_MATCHES(enc, ptr, ASCII_GT)) { |
109 | 0 | *nextTokPtr = ptr; |
110 | 0 | return XML_TOK_INVALID; |
111 | 0 | } |
112 | 0 | *nextTokPtr = ptr + MINBPC(enc); |
113 | 0 | return XML_TOK_COMMENT; |
114 | 0 | } |
115 | 0 | break; |
116 | 0 | default: |
117 | 0 | ptr += MINBPC(enc); |
118 | 0 | break; |
119 | 0 | } |
120 | 0 | } |
121 | 0 | } |
122 | 0 | return XML_TOK_PARTIAL; |
123 | 0 | } Unexecuted instantiation: xmltok.c:normal_scanComment Unexecuted instantiation: xmltok.c:little2_scanComment Unexecuted instantiation: xmltok.c:big2_scanComment |
124 | | |
125 | | /* ptr points to character following "<!" */ |
126 | | |
127 | | static int PTRCALL |
128 | | PREFIX(scanDecl)(const ENCODING *enc, const char *ptr, |
129 | | const char *end, const char **nextTokPtr) |
130 | 0 | { |
131 | 0 | if (ptr == end) |
132 | 0 | return XML_TOK_PARTIAL; |
133 | 0 | switch (BYTE_TYPE(enc, ptr)) { |
134 | 0 | case BT_MINUS: |
135 | 0 | return PREFIX(scanComment)(enc, ptr + MINBPC(enc), end, nextTokPtr); |
136 | 0 | case BT_LSQB: |
137 | 0 | *nextTokPtr = ptr + MINBPC(enc); |
138 | 0 | return XML_TOK_COND_SECT_OPEN; |
139 | 0 | case BT_NMSTRT: |
140 | 0 | case BT_HEX: |
141 | 0 | ptr += MINBPC(enc); |
142 | 0 | break; |
143 | 0 | default: |
144 | 0 | *nextTokPtr = ptr; |
145 | 0 | return XML_TOK_INVALID; |
146 | 0 | } |
147 | 0 | while (ptr != end) { |
148 | 0 | switch (BYTE_TYPE(enc, ptr)) { |
149 | 0 | case BT_PERCNT: |
150 | 0 | if (ptr + MINBPC(enc) == end) |
151 | 0 | return XML_TOK_PARTIAL; |
152 | 0 | /* don't allow <!ENTITY% foo "whatever"> */ |
153 | 0 | switch (BYTE_TYPE(enc, ptr + MINBPC(enc))) { |
154 | 0 | case BT_S: case BT_CR: case BT_LF: case BT_PERCNT: |
155 | 0 | *nextTokPtr = ptr; |
156 | 0 | return XML_TOK_INVALID; |
157 | 0 | } |
158 | 0 | /* fall through */ |
159 | 0 | case BT_S: case BT_CR: case BT_LF: |
160 | 0 | *nextTokPtr = ptr; |
161 | 0 | return XML_TOK_DECL_OPEN; |
162 | 0 | case BT_NMSTRT: |
163 | 0 | case BT_HEX: |
164 | 0 | ptr += MINBPC(enc); |
165 | 0 | break; |
166 | 0 | default: |
167 | 0 | *nextTokPtr = ptr; |
168 | 0 | return XML_TOK_INVALID; |
169 | 0 | } |
170 | 0 | } |
171 | 0 | return XML_TOK_PARTIAL; |
172 | 0 | } Unexecuted instantiation: xmltok.c:normal_scanDecl Unexecuted instantiation: xmltok.c:little2_scanDecl Unexecuted instantiation: xmltok.c:big2_scanDecl |
173 | | |
174 | | static int PTRCALL |
175 | | PREFIX(checkPiTarget)(const ENCODING *enc, const char *ptr, |
176 | | const char *end, int *tokPtr) |
177 | 0 | { |
178 | 0 | int upper = 0; |
179 | 0 | *tokPtr = XML_TOK_PI; |
180 | 0 | if (end - ptr != MINBPC(enc)*3) |
181 | 0 | return 1; |
182 | 0 | switch (BYTE_TO_ASCII(enc, ptr)) { |
183 | 0 | case ASCII_x: |
184 | 0 | break; |
185 | 0 | case ASCII_X: |
186 | 0 | upper = 1; |
187 | 0 | break; |
188 | 0 | default: |
189 | 0 | return 1; |
190 | 0 | } |
191 | 0 | ptr += MINBPC(enc); |
192 | 0 | switch (BYTE_TO_ASCII(enc, ptr)) { |
193 | 0 | case ASCII_m: |
194 | 0 | break; |
195 | 0 | case ASCII_M: |
196 | 0 | upper = 1; |
197 | 0 | break; |
198 | 0 | default: |
199 | 0 | return 1; |
200 | 0 | } |
201 | 0 | ptr += MINBPC(enc); |
202 | 0 | switch (BYTE_TO_ASCII(enc, ptr)) { |
203 | 0 | case ASCII_l: |
204 | 0 | break; |
205 | 0 | case ASCII_L: |
206 | 0 | upper = 1; |
207 | 0 | break; |
208 | 0 | default: |
209 | 0 | return 1; |
210 | 0 | } |
211 | 0 | if (upper) |
212 | 0 | return 0; |
213 | 0 | *tokPtr = XML_TOK_XML_DECL; |
214 | 0 | return 1; |
215 | 0 | } Unexecuted instantiation: xmltok.c:normal_checkPiTarget Unexecuted instantiation: xmltok.c:little2_checkPiTarget Unexecuted instantiation: xmltok.c:big2_checkPiTarget |
216 | | |
217 | | /* ptr points to character following "<?" */ |
218 | | |
219 | | static int PTRCALL |
220 | | PREFIX(scanPi)(const ENCODING *enc, const char *ptr, |
221 | | const char *end, const char **nextTokPtr) |
222 | 0 | { |
223 | 0 | int tok; |
224 | 0 | const char *target = ptr; |
225 | 0 | if (ptr == end) |
226 | 0 | return XML_TOK_PARTIAL; |
227 | 0 | switch (BYTE_TYPE(enc, ptr)) { |
228 | 0 | CHECK_NMSTRT_CASES(enc, ptr, end, nextTokPtr) |
229 | 0 | default: |
230 | 0 | *nextTokPtr = ptr; |
231 | 0 | return XML_TOK_INVALID; |
232 | 0 | } |
233 | 0 | while (ptr != end) { |
234 | 0 | switch (BYTE_TYPE(enc, ptr)) { |
235 | 0 | CHECK_NAME_CASES(enc, ptr, end, nextTokPtr) |
236 | 0 | case BT_S: case BT_CR: case BT_LF: |
237 | 0 | if (!PREFIX(checkPiTarget)(enc, target, ptr, &tok)) { |
238 | 0 | *nextTokPtr = ptr; |
239 | 0 | return XML_TOK_INVALID; |
240 | 0 | } |
241 | 0 | ptr += MINBPC(enc); |
242 | 0 | while (ptr != end) { |
243 | 0 | switch (BYTE_TYPE(enc, ptr)) { |
244 | 0 | INVALID_CASES(ptr, nextTokPtr) |
245 | 0 | case BT_QUEST: |
246 | 0 | ptr += MINBPC(enc); |
247 | 0 | if (ptr == end) |
248 | 0 | return XML_TOK_PARTIAL; |
249 | 0 | if (CHAR_MATCHES(enc, ptr, ASCII_GT)) { |
250 | 0 | *nextTokPtr = ptr + MINBPC(enc); |
251 | 0 | return tok; |
252 | 0 | } |
253 | 0 | break; |
254 | 0 | default: |
255 | 0 | ptr += MINBPC(enc); |
256 | 0 | break; |
257 | 0 | } |
258 | 0 | } |
259 | 0 | return XML_TOK_PARTIAL; |
260 | 0 | case BT_QUEST: |
261 | 0 | if (!PREFIX(checkPiTarget)(enc, target, ptr, &tok)) { |
262 | 0 | *nextTokPtr = ptr; |
263 | 0 | return XML_TOK_INVALID; |
264 | 0 | } |
265 | 0 | ptr += MINBPC(enc); |
266 | 0 | if (ptr == end) |
267 | 0 | return XML_TOK_PARTIAL; |
268 | 0 | if (CHAR_MATCHES(enc, ptr, ASCII_GT)) { |
269 | 0 | *nextTokPtr = ptr + MINBPC(enc); |
270 | 0 | return tok; |
271 | 0 | } |
272 | 0 | /* fall through */ |
273 | 0 | default: |
274 | 0 | *nextTokPtr = ptr; |
275 | 0 | return XML_TOK_INVALID; |
276 | 0 | } |
277 | 0 | } |
278 | 0 | return XML_TOK_PARTIAL; |
279 | 0 | } Unexecuted instantiation: xmltok.c:normal_scanPi Unexecuted instantiation: xmltok.c:little2_scanPi Unexecuted instantiation: xmltok.c:big2_scanPi |
280 | | |
281 | | static int PTRCALL |
282 | | PREFIX(scanCdataSection)(const ENCODING *enc, const char *ptr, |
283 | | const char *end, const char **nextTokPtr) |
284 | 0 | { |
285 | 0 | static const char CDATA_LSQB[] = { ASCII_C, ASCII_D, ASCII_A, |
286 | 0 | ASCII_T, ASCII_A, ASCII_LSQB }; |
287 | 0 | int i; |
288 | 0 | /* CDATA[ */ |
289 | 0 | if (end - ptr < 6 * MINBPC(enc)) |
290 | 0 | return XML_TOK_PARTIAL; |
291 | 0 | for (i = 0; i < 6; i++, ptr += MINBPC(enc)) { |
292 | 0 | if (!CHAR_MATCHES(enc, ptr, CDATA_LSQB[i])) { |
293 | 0 | *nextTokPtr = ptr; |
294 | 0 | return XML_TOK_INVALID; |
295 | 0 | } |
296 | 0 | } |
297 | 0 | *nextTokPtr = ptr; |
298 | 0 | return XML_TOK_CDATA_SECT_OPEN; |
299 | 0 | } Unexecuted instantiation: xmltok.c:normal_scanCdataSection Unexecuted instantiation: xmltok.c:little2_scanCdataSection Unexecuted instantiation: xmltok.c:big2_scanCdataSection |
300 | | |
301 | | static int PTRCALL |
302 | | PREFIX(cdataSectionTok)(const ENCODING *enc, const char *ptr, |
303 | | const char *end, const char **nextTokPtr) |
304 | 0 | { |
305 | 0 | if (ptr == end) |
306 | 0 | return XML_TOK_NONE; |
307 | 0 | if (MINBPC(enc) > 1) { |
308 | 0 | size_t n = end - ptr; |
309 | 0 | if (n & (MINBPC(enc) - 1)) { |
310 | 0 | n &= ~(MINBPC(enc) - 1); |
311 | 0 | if (n == 0) |
312 | 0 | return XML_TOK_PARTIAL; |
313 | 0 | end = ptr + n; |
314 | 0 | } |
315 | 0 | } |
316 | 0 | switch (BYTE_TYPE(enc, ptr)) { |
317 | 0 | case BT_RSQB: |
318 | 0 | ptr += MINBPC(enc); |
319 | 0 | if (ptr == end) |
320 | 0 | return XML_TOK_PARTIAL; |
321 | 0 | if (!CHAR_MATCHES(enc, ptr, ASCII_RSQB)) |
322 | 0 | break; |
323 | 0 | ptr += MINBPC(enc); |
324 | 0 | if (ptr == end) |
325 | 0 | return XML_TOK_PARTIAL; |
326 | 0 | if (!CHAR_MATCHES(enc, ptr, ASCII_GT)) { |
327 | 0 | ptr -= MINBPC(enc); |
328 | 0 | break; |
329 | 0 | } |
330 | 0 | *nextTokPtr = ptr + MINBPC(enc); |
331 | 0 | return XML_TOK_CDATA_SECT_CLOSE; |
332 | 0 | case BT_CR: |
333 | 0 | ptr += MINBPC(enc); |
334 | 0 | if (ptr == end) |
335 | 0 | return XML_TOK_PARTIAL; |
336 | 0 | if (BYTE_TYPE(enc, ptr) == BT_LF) |
337 | 0 | ptr += MINBPC(enc); |
338 | 0 | *nextTokPtr = ptr; |
339 | 0 | return XML_TOK_DATA_NEWLINE; |
340 | 0 | case BT_LF: |
341 | 0 | *nextTokPtr = ptr + MINBPC(enc); |
342 | 0 | return XML_TOK_DATA_NEWLINE; |
343 | 0 | INVALID_CASES(ptr, nextTokPtr) |
344 | 0 | default: |
345 | 0 | ptr += MINBPC(enc); |
346 | 0 | break; |
347 | 0 | } |
348 | 0 | while (ptr != end) { |
349 | 0 | switch (BYTE_TYPE(enc, ptr)) { |
350 | 0 | #define LEAD_CASE(n) \ |
351 | 0 | case BT_LEAD ## n: \ |
352 | 0 | if (end - ptr < n || IS_INVALID_CHAR(enc, ptr, n)) { \ |
353 | 0 | *nextTokPtr = ptr; \ |
354 | 0 | return XML_TOK_DATA_CHARS; \ |
355 | 0 | } \ |
356 | 0 | ptr += n; \ |
357 | 0 | break; |
358 | 0 | LEAD_CASE(2) LEAD_CASE(3) LEAD_CASE(4) |
359 | 0 | #undef LEAD_CASE |
360 | 0 | case BT_NONXML: |
361 | 0 | case BT_MALFORM: |
362 | 0 | case BT_TRAIL: |
363 | 0 | case BT_CR: |
364 | 0 | case BT_LF: |
365 | 0 | case BT_RSQB: |
366 | 0 | *nextTokPtr = ptr; |
367 | 0 | return XML_TOK_DATA_CHARS; |
368 | 0 | default: |
369 | 0 | ptr += MINBPC(enc); |
370 | 0 | break; |
371 | 0 | } |
372 | 0 | } |
373 | 0 | *nextTokPtr = ptr; |
374 | 0 | return XML_TOK_DATA_CHARS; |
375 | 0 | } Unexecuted instantiation: xmltok.c:normal_cdataSectionTok Unexecuted instantiation: xmltok.c:little2_cdataSectionTok Unexecuted instantiation: xmltok.c:big2_cdataSectionTok |
376 | | |
377 | | /* ptr points to character following "</" */ |
378 | | |
379 | | static int PTRCALL |
380 | | PREFIX(scanEndTag)(const ENCODING *enc, const char *ptr, |
381 | | const char *end, const char **nextTokPtr) |
382 | 0 | { |
383 | 0 | if (ptr == end) |
384 | 0 | return XML_TOK_PARTIAL; |
385 | 0 | switch (BYTE_TYPE(enc, ptr)) { |
386 | 0 | CHECK_NMSTRT_CASES(enc, ptr, end, nextTokPtr) |
387 | 0 | default: |
388 | 0 | *nextTokPtr = ptr; |
389 | 0 | return XML_TOK_INVALID; |
390 | 0 | } |
391 | 0 | while (ptr != end) { |
392 | 0 | switch (BYTE_TYPE(enc, ptr)) { |
393 | 0 | CHECK_NAME_CASES(enc, ptr, end, nextTokPtr) |
394 | 0 | case BT_S: case BT_CR: case BT_LF: |
395 | 0 | for (ptr += MINBPC(enc); ptr != end; ptr += MINBPC(enc)) { |
396 | 0 | switch (BYTE_TYPE(enc, ptr)) { |
397 | 0 | case BT_S: case BT_CR: case BT_LF: |
398 | 0 | break; |
399 | 0 | case BT_GT: |
400 | 0 | *nextTokPtr = ptr + MINBPC(enc); |
401 | 0 | return XML_TOK_END_TAG; |
402 | 0 | default: |
403 | 0 | *nextTokPtr = ptr; |
404 | 0 | return XML_TOK_INVALID; |
405 | 0 | } |
406 | 0 | } |
407 | 0 | return XML_TOK_PARTIAL; |
408 | 0 | #ifdef XML_NS |
409 | 0 | case BT_COLON: |
410 | 0 | /* no need to check qname syntax here, |
411 | 0 | since end-tag must match exactly */ |
412 | 0 | ptr += MINBPC(enc); |
413 | 0 | break; |
414 | 0 | #endif |
415 | 0 | case BT_GT: |
416 | 0 | *nextTokPtr = ptr + MINBPC(enc); |
417 | 0 | return XML_TOK_END_TAG; |
418 | 0 | default: |
419 | 0 | *nextTokPtr = ptr; |
420 | 0 | return XML_TOK_INVALID; |
421 | 0 | } |
422 | 0 | } |
423 | 0 | return XML_TOK_PARTIAL; |
424 | 0 | } Unexecuted instantiation: xmltok.c:normal_scanEndTag Unexecuted instantiation: xmltok.c:little2_scanEndTag Unexecuted instantiation: xmltok.c:big2_scanEndTag |
425 | | |
426 | | /* ptr points to character following "&#X" */ |
427 | | |
428 | | static int PTRCALL |
429 | | PREFIX(scanHexCharRef)(const ENCODING *enc, const char *ptr, |
430 | | const char *end, const char **nextTokPtr) |
431 | 0 | { |
432 | 0 | if (ptr != end) { |
433 | 0 | switch (BYTE_TYPE(enc, ptr)) { |
434 | 0 | case BT_DIGIT: |
435 | 0 | case BT_HEX: |
436 | 0 | break; |
437 | 0 | default: |
438 | 0 | *nextTokPtr = ptr; |
439 | 0 | return XML_TOK_INVALID; |
440 | 0 | } |
441 | 0 | for (ptr += MINBPC(enc); ptr != end; ptr += MINBPC(enc)) { |
442 | 0 | switch (BYTE_TYPE(enc, ptr)) { |
443 | 0 | case BT_DIGIT: |
444 | 0 | case BT_HEX: |
445 | 0 | break; |
446 | 0 | case BT_SEMI: |
447 | 0 | *nextTokPtr = ptr + MINBPC(enc); |
448 | 0 | return XML_TOK_CHAR_REF; |
449 | 0 | default: |
450 | 0 | *nextTokPtr = ptr; |
451 | 0 | return XML_TOK_INVALID; |
452 | 0 | } |
453 | 0 | } |
454 | 0 | } |
455 | 0 | return XML_TOK_PARTIAL; |
456 | 0 | } Unexecuted instantiation: xmltok.c:normal_scanHexCharRef Unexecuted instantiation: xmltok.c:big2_scanHexCharRef Unexecuted instantiation: xmltok.c:little2_scanHexCharRef |
457 | | |
458 | | /* ptr points to character following "&#" */ |
459 | | |
460 | | static int PTRCALL |
461 | | PREFIX(scanCharRef)(const ENCODING *enc, const char *ptr, |
462 | | const char *end, const char **nextTokPtr) |
463 | 0 | { |
464 | 0 | if (ptr != end) { |
465 | 0 | if (CHAR_MATCHES(enc, ptr, ASCII_x)) |
466 | 0 | return PREFIX(scanHexCharRef)(enc, ptr + MINBPC(enc), end, nextTokPtr); |
467 | 0 | switch (BYTE_TYPE(enc, ptr)) { |
468 | 0 | case BT_DIGIT: |
469 | 0 | break; |
470 | 0 | default: |
471 | 0 | *nextTokPtr = ptr; |
472 | 0 | return XML_TOK_INVALID; |
473 | 0 | } |
474 | 0 | for (ptr += MINBPC(enc); ptr != end; ptr += MINBPC(enc)) { |
475 | 0 | switch (BYTE_TYPE(enc, ptr)) { |
476 | 0 | case BT_DIGIT: |
477 | 0 | break; |
478 | 0 | case BT_SEMI: |
479 | 0 | *nextTokPtr = ptr + MINBPC(enc); |
480 | 0 | return XML_TOK_CHAR_REF; |
481 | 0 | default: |
482 | 0 | *nextTokPtr = ptr; |
483 | 0 | return XML_TOK_INVALID; |
484 | 0 | } |
485 | 0 | } |
486 | 0 | } |
487 | 0 | return XML_TOK_PARTIAL; |
488 | 0 | } Unexecuted instantiation: xmltok.c:normal_scanCharRef Unexecuted instantiation: xmltok.c:big2_scanCharRef Unexecuted instantiation: xmltok.c:little2_scanCharRef |
489 | | |
490 | | /* ptr points to character following "&" */ |
491 | | |
492 | | static int PTRCALL |
493 | | PREFIX(scanRef)(const ENCODING *enc, const char *ptr, const char *end, |
494 | | const char **nextTokPtr) |
495 | 0 | { |
496 | 0 | if (ptr == end) |
497 | 0 | return XML_TOK_PARTIAL; |
498 | 0 | switch (BYTE_TYPE(enc, ptr)) { |
499 | 0 | CHECK_NMSTRT_CASES(enc, ptr, end, nextTokPtr) |
500 | 0 | case BT_NUM: |
501 | 0 | return PREFIX(scanCharRef)(enc, ptr + MINBPC(enc), end, nextTokPtr); |
502 | 0 | default: |
503 | 0 | *nextTokPtr = ptr; |
504 | 0 | return XML_TOK_INVALID; |
505 | 0 | } |
506 | 0 | while (ptr != end) { |
507 | 0 | switch (BYTE_TYPE(enc, ptr)) { |
508 | 0 | CHECK_NAME_CASES(enc, ptr, end, nextTokPtr) |
509 | 0 | case BT_SEMI: |
510 | 0 | *nextTokPtr = ptr + MINBPC(enc); |
511 | 0 | return XML_TOK_ENTITY_REF; |
512 | 0 | default: |
513 | 0 | *nextTokPtr = ptr; |
514 | 0 | return XML_TOK_INVALID; |
515 | 0 | } |
516 | 0 | } |
517 | 0 | return XML_TOK_PARTIAL; |
518 | 0 | } Unexecuted instantiation: xmltok.c:normal_scanRef Unexecuted instantiation: xmltok.c:big2_scanRef Unexecuted instantiation: xmltok.c:little2_scanRef |
519 | | |
520 | | /* ptr points to character following first character of attribute name */ |
521 | | |
522 | | static int PTRCALL |
523 | | PREFIX(scanAtts)(const ENCODING *enc, const char *ptr, const char *end, |
524 | | const char **nextTokPtr) |
525 | 0 | { |
526 | 0 | #ifdef XML_NS |
527 | 0 | int hadColon = 0; |
528 | 0 | #endif |
529 | 0 | while (ptr != end) { |
530 | 0 | switch (BYTE_TYPE(enc, ptr)) { |
531 | 0 | CHECK_NAME_CASES(enc, ptr, end, nextTokPtr) |
532 | 0 | #ifdef XML_NS |
533 | 0 | case BT_COLON: |
534 | 0 | if (hadColon) { |
535 | 0 | *nextTokPtr = ptr; |
536 | 0 | return XML_TOK_INVALID; |
537 | 0 | } |
538 | 0 | hadColon = 1; |
539 | 0 | ptr += MINBPC(enc); |
540 | 0 | if (ptr == end) |
541 | 0 | return XML_TOK_PARTIAL; |
542 | 0 | switch (BYTE_TYPE(enc, ptr)) { |
543 | 0 | CHECK_NMSTRT_CASES(enc, ptr, end, nextTokPtr) |
544 | 0 | default: |
545 | 0 | *nextTokPtr = ptr; |
546 | 0 | return XML_TOK_INVALID; |
547 | 0 | } |
548 | 0 | break; |
549 | 0 | #endif |
550 | 0 | case BT_S: case BT_CR: case BT_LF: |
551 | 0 | for (;;) { |
552 | 0 | int t; |
553 | 0 |
|
554 | 0 | ptr += MINBPC(enc); |
555 | 0 | if (ptr == end) |
556 | 0 | return XML_TOK_PARTIAL; |
557 | 0 | t = BYTE_TYPE(enc, ptr); |
558 | 0 | if (t == BT_EQUALS) |
559 | 0 | break; |
560 | 0 | switch (t) { |
561 | 0 | case BT_S: |
562 | 0 | case BT_LF: |
563 | 0 | case BT_CR: |
564 | 0 | break; |
565 | 0 | default: |
566 | 0 | *nextTokPtr = ptr; |
567 | 0 | return XML_TOK_INVALID; |
568 | 0 | } |
569 | 0 | } |
570 | 0 | /* fall through */ |
571 | 0 | case BT_EQUALS: |
572 | 0 | { |
573 | 0 | int open; |
574 | 0 | #ifdef XML_NS |
575 | 0 | hadColon = 0; |
576 | 0 | #endif |
577 | 0 | for (;;) { |
578 | 0 | ptr += MINBPC(enc); |
579 | 0 | if (ptr == end) |
580 | 0 | return XML_TOK_PARTIAL; |
581 | 0 | open = BYTE_TYPE(enc, ptr); |
582 | 0 | if (open == BT_QUOT || open == BT_APOS) |
583 | 0 | break; |
584 | 0 | switch (open) { |
585 | 0 | case BT_S: |
586 | 0 | case BT_LF: |
587 | 0 | case BT_CR: |
588 | 0 | break; |
589 | 0 | default: |
590 | 0 | *nextTokPtr = ptr; |
591 | 0 | return XML_TOK_INVALID; |
592 | 0 | } |
593 | 0 | } |
594 | 0 | ptr += MINBPC(enc); |
595 | 0 | /* in attribute value */ |
596 | 0 | for (;;) { |
597 | 0 | int t; |
598 | 0 | if (ptr == end) |
599 | 0 | return XML_TOK_PARTIAL; |
600 | 0 | t = BYTE_TYPE(enc, ptr); |
601 | 0 | if (t == open) |
602 | 0 | break; |
603 | 0 | switch (t) { |
604 | 0 | INVALID_CASES(ptr, nextTokPtr) |
605 | 0 | case BT_AMP: |
606 | 0 | { |
607 | 0 | int tok = PREFIX(scanRef)(enc, ptr + MINBPC(enc), end, &ptr); |
608 | 0 | if (tok <= 0) { |
609 | 0 | if (tok == XML_TOK_INVALID) |
610 | 0 | *nextTokPtr = ptr; |
611 | 0 | return tok; |
612 | 0 | } |
613 | 0 | break; |
614 | 0 | } |
615 | 0 | case BT_LT: |
616 | 0 | *nextTokPtr = ptr; |
617 | 0 | return XML_TOK_INVALID; |
618 | 0 | default: |
619 | 0 | ptr += MINBPC(enc); |
620 | 0 | break; |
621 | 0 | } |
622 | 0 | } |
623 | 0 | ptr += MINBPC(enc); |
624 | 0 | if (ptr == end) |
625 | 0 | return XML_TOK_PARTIAL; |
626 | 0 | switch (BYTE_TYPE(enc, ptr)) { |
627 | 0 | case BT_S: |
628 | 0 | case BT_CR: |
629 | 0 | case BT_LF: |
630 | 0 | break; |
631 | 0 | case BT_SOL: |
632 | 0 | goto sol; |
633 | 0 | case BT_GT: |
634 | 0 | goto gt; |
635 | 0 | default: |
636 | 0 | *nextTokPtr = ptr; |
637 | 0 | return XML_TOK_INVALID; |
638 | 0 | } |
639 | 0 | /* ptr points to closing quote */ |
640 | 0 | for (;;) { |
641 | 0 | ptr += MINBPC(enc); |
642 | 0 | if (ptr == end) |
643 | 0 | return XML_TOK_PARTIAL; |
644 | 0 | switch (BYTE_TYPE(enc, ptr)) { |
645 | 0 | CHECK_NMSTRT_CASES(enc, ptr, end, nextTokPtr) |
646 | 0 | case BT_S: case BT_CR: case BT_LF: |
647 | 0 | continue; |
648 | 0 | case BT_GT: |
649 | 0 | gt: |
650 | 0 | *nextTokPtr = ptr + MINBPC(enc); |
651 | 0 | return XML_TOK_START_TAG_WITH_ATTS; |
652 | 0 | case BT_SOL: |
653 | 0 | sol: |
654 | 0 | ptr += MINBPC(enc); |
655 | 0 | if (ptr == end) |
656 | 0 | return XML_TOK_PARTIAL; |
657 | 0 | if (!CHAR_MATCHES(enc, ptr, ASCII_GT)) { |
658 | 0 | *nextTokPtr = ptr; |
659 | 0 | return XML_TOK_INVALID; |
660 | 0 | } |
661 | 0 | *nextTokPtr = ptr + MINBPC(enc); |
662 | 0 | return XML_TOK_EMPTY_ELEMENT_WITH_ATTS; |
663 | 0 | default: |
664 | 0 | *nextTokPtr = ptr; |
665 | 0 | return XML_TOK_INVALID; |
666 | 0 | } |
667 | 0 | break; |
668 | 0 | } |
669 | 0 | break; |
670 | 0 | } |
671 | 0 | default: |
672 | 0 | *nextTokPtr = ptr; |
673 | 0 | return XML_TOK_INVALID; |
674 | 0 | } |
675 | 0 | } |
676 | 0 | return XML_TOK_PARTIAL; |
677 | 0 | } Unexecuted instantiation: xmltok.c:normal_scanAtts Unexecuted instantiation: xmltok.c:little2_scanAtts Unexecuted instantiation: xmltok.c:big2_scanAtts |
678 | | |
679 | | /* ptr points to character following "<" */ |
680 | | |
681 | | static int PTRCALL |
682 | | PREFIX(scanLt)(const ENCODING *enc, const char *ptr, const char *end, |
683 | | const char **nextTokPtr) |
684 | 0 | { |
685 | 0 | #ifdef XML_NS |
686 | 0 | int hadColon; |
687 | 0 | #endif |
688 | 0 | if (ptr == end) |
689 | 0 | return XML_TOK_PARTIAL; |
690 | 0 | switch (BYTE_TYPE(enc, ptr)) { |
691 | 0 | CHECK_NMSTRT_CASES(enc, ptr, end, nextTokPtr) |
692 | 0 | case BT_EXCL: |
693 | 0 | if ((ptr += MINBPC(enc)) == end) |
694 | 0 | return XML_TOK_PARTIAL; |
695 | 0 | switch (BYTE_TYPE(enc, ptr)) { |
696 | 0 | case BT_MINUS: |
697 | 0 | return PREFIX(scanComment)(enc, ptr + MINBPC(enc), end, nextTokPtr); |
698 | 0 | case BT_LSQB: |
699 | 0 | return PREFIX(scanCdataSection)(enc, ptr + MINBPC(enc), |
700 | 0 | end, nextTokPtr); |
701 | 0 | } |
702 | 0 | *nextTokPtr = ptr; |
703 | 0 | return XML_TOK_INVALID; |
704 | 0 | case BT_QUEST: |
705 | 0 | return PREFIX(scanPi)(enc, ptr + MINBPC(enc), end, nextTokPtr); |
706 | 0 | case BT_SOL: |
707 | 0 | return PREFIX(scanEndTag)(enc, ptr + MINBPC(enc), end, nextTokPtr); |
708 | 0 | default: |
709 | 0 | *nextTokPtr = ptr; |
710 | 0 | return XML_TOK_INVALID; |
711 | 0 | } |
712 | 0 | #ifdef XML_NS |
713 | 0 | hadColon = 0; |
714 | 0 | #endif |
715 | 0 | /* we have a start-tag */ |
716 | 0 | while (ptr != end) { |
717 | 0 | switch (BYTE_TYPE(enc, ptr)) { |
718 | 0 | CHECK_NAME_CASES(enc, ptr, end, nextTokPtr) |
719 | 0 | #ifdef XML_NS |
720 | 0 | case BT_COLON: |
721 | 0 | if (hadColon) { |
722 | 0 | *nextTokPtr = ptr; |
723 | 0 | return XML_TOK_INVALID; |
724 | 0 | } |
725 | 0 | hadColon = 1; |
726 | 0 | ptr += MINBPC(enc); |
727 | 0 | if (ptr == end) |
728 | 0 | return XML_TOK_PARTIAL; |
729 | 0 | switch (BYTE_TYPE(enc, ptr)) { |
730 | 0 | CHECK_NMSTRT_CASES(enc, ptr, end, nextTokPtr) |
731 | 0 | default: |
732 | 0 | *nextTokPtr = ptr; |
733 | 0 | return XML_TOK_INVALID; |
734 | 0 | } |
735 | 0 | break; |
736 | 0 | #endif |
737 | 0 | case BT_S: case BT_CR: case BT_LF: |
738 | 0 | { |
739 | 0 | ptr += MINBPC(enc); |
740 | 0 | while (ptr != end) { |
741 | 0 | switch (BYTE_TYPE(enc, ptr)) { |
742 | 0 | CHECK_NMSTRT_CASES(enc, ptr, end, nextTokPtr) |
743 | 0 | case BT_GT: |
744 | 0 | goto gt; |
745 | 0 | case BT_SOL: |
746 | 0 | goto sol; |
747 | 0 | case BT_S: case BT_CR: case BT_LF: |
748 | 0 | ptr += MINBPC(enc); |
749 | 0 | continue; |
750 | 0 | default: |
751 | 0 | *nextTokPtr = ptr; |
752 | 0 | return XML_TOK_INVALID; |
753 | 0 | } |
754 | 0 | return PREFIX(scanAtts)(enc, ptr, end, nextTokPtr); |
755 | 0 | } |
756 | 0 | return XML_TOK_PARTIAL; |
757 | 0 | } |
758 | 0 | case BT_GT: |
759 | 0 | gt: |
760 | 0 | *nextTokPtr = ptr + MINBPC(enc); |
761 | 0 | return XML_TOK_START_TAG_NO_ATTS; |
762 | 0 | case BT_SOL: |
763 | 0 | sol: |
764 | 0 | ptr += MINBPC(enc); |
765 | 0 | if (ptr == end) |
766 | 0 | return XML_TOK_PARTIAL; |
767 | 0 | if (!CHAR_MATCHES(enc, ptr, ASCII_GT)) { |
768 | 0 | *nextTokPtr = ptr; |
769 | 0 | return XML_TOK_INVALID; |
770 | 0 | } |
771 | 0 | *nextTokPtr = ptr + MINBPC(enc); |
772 | 0 | return XML_TOK_EMPTY_ELEMENT_NO_ATTS; |
773 | 0 | default: |
774 | 0 | *nextTokPtr = ptr; |
775 | 0 | return XML_TOK_INVALID; |
776 | 0 | } |
777 | 0 | } |
778 | 0 | return XML_TOK_PARTIAL; |
779 | 0 | } Unexecuted instantiation: xmltok.c:normal_scanLt Unexecuted instantiation: xmltok.c:little2_scanLt Unexecuted instantiation: xmltok.c:big2_scanLt |
780 | | |
781 | | static int PTRCALL |
782 | | PREFIX(contentTok)(const ENCODING *enc, const char *ptr, const char *end, |
783 | | const char **nextTokPtr) |
784 | 0 | { |
785 | 0 | if (ptr == end) |
786 | 0 | return XML_TOK_NONE; |
787 | 0 | if (MINBPC(enc) > 1) { |
788 | 0 | size_t n = end - ptr; |
789 | 0 | if (n & (MINBPC(enc) - 1)) { |
790 | 0 | n &= ~(MINBPC(enc) - 1); |
791 | 0 | if (n == 0) |
792 | 0 | return XML_TOK_PARTIAL; |
793 | 0 | end = ptr + n; |
794 | 0 | } |
795 | 0 | } |
796 | 0 | switch (BYTE_TYPE(enc, ptr)) { |
797 | 0 | case BT_LT: |
798 | 0 | return PREFIX(scanLt)(enc, ptr + MINBPC(enc), end, nextTokPtr); |
799 | 0 | case BT_AMP: |
800 | 0 | return PREFIX(scanRef)(enc, ptr + MINBPC(enc), end, nextTokPtr); |
801 | 0 | case BT_CR: |
802 | 0 | ptr += MINBPC(enc); |
803 | 0 | if (ptr == end) |
804 | 0 | return XML_TOK_TRAILING_CR; |
805 | 0 | if (BYTE_TYPE(enc, ptr) == BT_LF) |
806 | 0 | ptr += MINBPC(enc); |
807 | 0 | *nextTokPtr = ptr; |
808 | 0 | return XML_TOK_DATA_NEWLINE; |
809 | 0 | case BT_LF: |
810 | 0 | *nextTokPtr = ptr + MINBPC(enc); |
811 | 0 | return XML_TOK_DATA_NEWLINE; |
812 | 0 | case BT_RSQB: |
813 | 0 | ptr += MINBPC(enc); |
814 | 0 | if (ptr == end) |
815 | 0 | return XML_TOK_TRAILING_RSQB; |
816 | 0 | if (!CHAR_MATCHES(enc, ptr, ASCII_RSQB)) |
817 | 0 | break; |
818 | 0 | ptr += MINBPC(enc); |
819 | 0 | if (ptr == end) |
820 | 0 | return XML_TOK_TRAILING_RSQB; |
821 | 0 | if (!CHAR_MATCHES(enc, ptr, ASCII_GT)) { |
822 | 0 | ptr -= MINBPC(enc); |
823 | 0 | break; |
824 | 0 | } |
825 | 0 | *nextTokPtr = ptr; |
826 | 0 | return XML_TOK_INVALID; |
827 | 0 | INVALID_CASES(ptr, nextTokPtr) |
828 | 0 | default: |
829 | 0 | ptr += MINBPC(enc); |
830 | 0 | break; |
831 | 0 | } |
832 | 0 | while (ptr != end) { |
833 | 0 | switch (BYTE_TYPE(enc, ptr)) { |
834 | 0 | #define LEAD_CASE(n) \ |
835 | 0 | case BT_LEAD ## n: \ |
836 | 0 | if (end - ptr < n || IS_INVALID_CHAR(enc, ptr, n)) { \ |
837 | 0 | *nextTokPtr = ptr; \ |
838 | 0 | return XML_TOK_DATA_CHARS; \ |
839 | 0 | } \ |
840 | 0 | ptr += n; \ |
841 | 0 | break; |
842 | 0 | LEAD_CASE(2) LEAD_CASE(3) LEAD_CASE(4) |
843 | 0 | #undef LEAD_CASE |
844 | 0 | case BT_RSQB: |
845 | 0 | if (ptr + MINBPC(enc) != end) { |
846 | 0 | if (!CHAR_MATCHES(enc, ptr + MINBPC(enc), ASCII_RSQB)) { |
847 | 0 | ptr += MINBPC(enc); |
848 | 0 | break; |
849 | 0 | } |
850 | 0 | if (ptr + 2*MINBPC(enc) != end) { |
851 | 0 | if (!CHAR_MATCHES(enc, ptr + 2*MINBPC(enc), ASCII_GT)) { |
852 | 0 | ptr += MINBPC(enc); |
853 | 0 | break; |
854 | 0 | } |
855 | 0 | *nextTokPtr = ptr + 2*MINBPC(enc); |
856 | 0 | return XML_TOK_INVALID; |
857 | 0 | } |
858 | 0 | } |
859 | 0 | /* fall through */ |
860 | 0 | case BT_AMP: |
861 | 0 | case BT_LT: |
862 | 0 | case BT_NONXML: |
863 | 0 | case BT_MALFORM: |
864 | 0 | case BT_TRAIL: |
865 | 0 | case BT_CR: |
866 | 0 | case BT_LF: |
867 | 0 | *nextTokPtr = ptr; |
868 | 0 | return XML_TOK_DATA_CHARS; |
869 | 0 | default: |
870 | 0 | ptr += MINBPC(enc); |
871 | 0 | break; |
872 | 0 | } |
873 | 0 | } |
874 | 0 | *nextTokPtr = ptr; |
875 | 0 | return XML_TOK_DATA_CHARS; |
876 | 0 | } Unexecuted instantiation: xmltok.c:normal_contentTok Unexecuted instantiation: xmltok.c:little2_contentTok Unexecuted instantiation: xmltok.c:big2_contentTok |
877 | | |
878 | | /* ptr points to character following "%" */ |
879 | | |
880 | | static int PTRCALL |
881 | | PREFIX(scanPercent)(const ENCODING *enc, const char *ptr, const char *end, |
882 | | const char **nextTokPtr) |
883 | 0 | { |
884 | 0 | if (ptr == end) |
885 | 0 | return -XML_TOK_PERCENT; |
886 | 0 | switch (BYTE_TYPE(enc, ptr)) { |
887 | 0 | CHECK_NMSTRT_CASES(enc, ptr, end, nextTokPtr) |
888 | 0 | case BT_S: case BT_LF: case BT_CR: case BT_PERCNT: |
889 | 0 | *nextTokPtr = ptr; |
890 | 0 | return XML_TOK_PERCENT; |
891 | 0 | default: |
892 | 0 | *nextTokPtr = ptr; |
893 | 0 | return XML_TOK_INVALID; |
894 | 0 | } |
895 | 0 | while (ptr != end) { |
896 | 0 | switch (BYTE_TYPE(enc, ptr)) { |
897 | 0 | CHECK_NAME_CASES(enc, ptr, end, nextTokPtr) |
898 | 0 | case BT_SEMI: |
899 | 0 | *nextTokPtr = ptr + MINBPC(enc); |
900 | 0 | return XML_TOK_PARAM_ENTITY_REF; |
901 | 0 | default: |
902 | 0 | *nextTokPtr = ptr; |
903 | 0 | return XML_TOK_INVALID; |
904 | 0 | } |
905 | 0 | } |
906 | 0 | return XML_TOK_PARTIAL; |
907 | 0 | } Unexecuted instantiation: xmltok.c:normal_scanPercent Unexecuted instantiation: xmltok.c:little2_scanPercent Unexecuted instantiation: xmltok.c:big2_scanPercent |
908 | | |
909 | | static int PTRCALL |
910 | | PREFIX(scanPoundName)(const ENCODING *enc, const char *ptr, const char *end, |
911 | | const char **nextTokPtr) |
912 | 0 | { |
913 | 0 | if (ptr == end) |
914 | 0 | return XML_TOK_PARTIAL; |
915 | 0 | switch (BYTE_TYPE(enc, ptr)) { |
916 | 0 | CHECK_NMSTRT_CASES(enc, ptr, end, nextTokPtr) |
917 | 0 | default: |
918 | 0 | *nextTokPtr = ptr; |
919 | 0 | return XML_TOK_INVALID; |
920 | 0 | } |
921 | 0 | while (ptr != end) { |
922 | 0 | switch (BYTE_TYPE(enc, ptr)) { |
923 | 0 | CHECK_NAME_CASES(enc, ptr, end, nextTokPtr) |
924 | 0 | case BT_CR: case BT_LF: case BT_S: |
925 | 0 | case BT_RPAR: case BT_GT: case BT_PERCNT: case BT_VERBAR: |
926 | 0 | *nextTokPtr = ptr; |
927 | 0 | return XML_TOK_POUND_NAME; |
928 | 0 | default: |
929 | 0 | *nextTokPtr = ptr; |
930 | 0 | return XML_TOK_INVALID; |
931 | 0 | } |
932 | 0 | } |
933 | 0 | return -XML_TOK_POUND_NAME; |
934 | 0 | } Unexecuted instantiation: xmltok.c:normal_scanPoundName Unexecuted instantiation: xmltok.c:little2_scanPoundName Unexecuted instantiation: xmltok.c:big2_scanPoundName |
935 | | |
936 | | static int PTRCALL |
937 | | PREFIX(scanLit)(int open, const ENCODING *enc, |
938 | | const char *ptr, const char *end, |
939 | | const char **nextTokPtr) |
940 | 0 | { |
941 | 0 | while (ptr != end) { |
942 | 0 | int t = BYTE_TYPE(enc, ptr); |
943 | 0 | switch (t) { |
944 | 0 | INVALID_CASES(ptr, nextTokPtr) |
945 | 0 | case BT_QUOT: |
946 | 0 | case BT_APOS: |
947 | 0 | ptr += MINBPC(enc); |
948 | 0 | if (t != open) |
949 | 0 | break; |
950 | 0 | if (ptr == end) |
951 | 0 | return -XML_TOK_LITERAL; |
952 | 0 | *nextTokPtr = ptr; |
953 | 0 | switch (BYTE_TYPE(enc, ptr)) { |
954 | 0 | case BT_S: case BT_CR: case BT_LF: |
955 | 0 | case BT_GT: case BT_PERCNT: case BT_LSQB: |
956 | 0 | return XML_TOK_LITERAL; |
957 | 0 | default: |
958 | 0 | return XML_TOK_INVALID; |
959 | 0 | } |
960 | 0 | default: |
961 | 0 | ptr += MINBPC(enc); |
962 | 0 | break; |
963 | 0 | } |
964 | 0 | } |
965 | 0 | return XML_TOK_PARTIAL; |
966 | 0 | } Unexecuted instantiation: xmltok.c:normal_scanLit Unexecuted instantiation: xmltok.c:little2_scanLit Unexecuted instantiation: xmltok.c:big2_scanLit |
967 | | |
968 | | static int PTRCALL |
969 | | PREFIX(prologTok)(const ENCODING *enc, const char *ptr, const char *end, |
970 | | const char **nextTokPtr) |
971 | 0 | { |
972 | 0 | int tok; |
973 | 0 | if (ptr == end) |
974 | 0 | return XML_TOK_NONE; |
975 | 0 | if (MINBPC(enc) > 1) { |
976 | 0 | size_t n = end - ptr; |
977 | 0 | if (n & (MINBPC(enc) - 1)) { |
978 | 0 | n &= ~(MINBPC(enc) - 1); |
979 | 0 | if (n == 0) |
980 | 0 | return XML_TOK_PARTIAL; |
981 | 0 | end = ptr + n; |
982 | 0 | } |
983 | 0 | } |
984 | 0 | switch (BYTE_TYPE(enc, ptr)) { |
985 | 0 | case BT_QUOT: |
986 | 0 | return PREFIX(scanLit)(BT_QUOT, enc, ptr + MINBPC(enc), end, nextTokPtr); |
987 | 0 | case BT_APOS: |
988 | 0 | return PREFIX(scanLit)(BT_APOS, enc, ptr + MINBPC(enc), end, nextTokPtr); |
989 | 0 | case BT_LT: |
990 | 0 | { |
991 | 0 | ptr += MINBPC(enc); |
992 | 0 | if (ptr == end) |
993 | 0 | return XML_TOK_PARTIAL; |
994 | 0 | switch (BYTE_TYPE(enc, ptr)) { |
995 | 0 | case BT_EXCL: |
996 | 0 | return PREFIX(scanDecl)(enc, ptr + MINBPC(enc), end, nextTokPtr); |
997 | 0 | case BT_QUEST: |
998 | 0 | return PREFIX(scanPi)(enc, ptr + MINBPC(enc), end, nextTokPtr); |
999 | 0 | case BT_NMSTRT: |
1000 | 0 | case BT_HEX: |
1001 | 0 | case BT_NONASCII: |
1002 | 0 | case BT_LEAD2: |
1003 | 0 | case BT_LEAD3: |
1004 | 0 | case BT_LEAD4: |
1005 | 0 | *nextTokPtr = ptr - MINBPC(enc); |
1006 | 0 | return XML_TOK_INSTANCE_START; |
1007 | 0 | } |
1008 | 0 | *nextTokPtr = ptr; |
1009 | 0 | return XML_TOK_INVALID; |
1010 | 0 | } |
1011 | 0 | case BT_CR: |
1012 | 0 | if (ptr + MINBPC(enc) == end) { |
1013 | 0 | *nextTokPtr = end; |
1014 | 0 | /* indicate that this might be part of a CR/LF pair */ |
1015 | 0 | return -XML_TOK_PROLOG_S; |
1016 | 0 | } |
1017 | 0 | /* fall through */ |
1018 | 0 | case BT_S: case BT_LF: |
1019 | 0 | for (;;) { |
1020 | 0 | ptr += MINBPC(enc); |
1021 | 0 | if (ptr == end) |
1022 | 0 | break; |
1023 | 0 | switch (BYTE_TYPE(enc, ptr)) { |
1024 | 0 | case BT_S: case BT_LF: |
1025 | 0 | break; |
1026 | 0 | case BT_CR: |
1027 | 0 | /* don't split CR/LF pair */ |
1028 | 0 | if (ptr + MINBPC(enc) != end) |
1029 | 0 | break; |
1030 | 0 | /* fall through */ |
1031 | 0 | default: |
1032 | 0 | *nextTokPtr = ptr; |
1033 | 0 | return XML_TOK_PROLOG_S; |
1034 | 0 | } |
1035 | 0 | } |
1036 | 0 | *nextTokPtr = ptr; |
1037 | 0 | return XML_TOK_PROLOG_S; |
1038 | 0 | case BT_PERCNT: |
1039 | 0 | return PREFIX(scanPercent)(enc, ptr + MINBPC(enc), end, nextTokPtr); |
1040 | 0 | case BT_COMMA: |
1041 | 0 | *nextTokPtr = ptr + MINBPC(enc); |
1042 | 0 | return XML_TOK_COMMA; |
1043 | 0 | case BT_LSQB: |
1044 | 0 | *nextTokPtr = ptr + MINBPC(enc); |
1045 | 0 | return XML_TOK_OPEN_BRACKET; |
1046 | 0 | case BT_RSQB: |
1047 | 0 | ptr += MINBPC(enc); |
1048 | 0 | if (ptr == end) |
1049 | 0 | return -XML_TOK_CLOSE_BRACKET; |
1050 | 0 | if (CHAR_MATCHES(enc, ptr, ASCII_RSQB)) { |
1051 | 0 | if (ptr + MINBPC(enc) == end) |
1052 | 0 | return XML_TOK_PARTIAL; |
1053 | 0 | if (CHAR_MATCHES(enc, ptr + MINBPC(enc), ASCII_GT)) { |
1054 | 0 | *nextTokPtr = ptr + 2*MINBPC(enc); |
1055 | 0 | return XML_TOK_COND_SECT_CLOSE; |
1056 | 0 | } |
1057 | 0 | } |
1058 | 0 | *nextTokPtr = ptr; |
1059 | 0 | return XML_TOK_CLOSE_BRACKET; |
1060 | 0 | case BT_LPAR: |
1061 | 0 | *nextTokPtr = ptr + MINBPC(enc); |
1062 | 0 | return XML_TOK_OPEN_PAREN; |
1063 | 0 | case BT_RPAR: |
1064 | 0 | ptr += MINBPC(enc); |
1065 | 0 | if (ptr == end) |
1066 | 0 | return -XML_TOK_CLOSE_PAREN; |
1067 | 0 | switch (BYTE_TYPE(enc, ptr)) { |
1068 | 0 | case BT_AST: |
1069 | 0 | *nextTokPtr = ptr + MINBPC(enc); |
1070 | 0 | return XML_TOK_CLOSE_PAREN_ASTERISK; |
1071 | 0 | case BT_QUEST: |
1072 | 0 | *nextTokPtr = ptr + MINBPC(enc); |
1073 | 0 | return XML_TOK_CLOSE_PAREN_QUESTION; |
1074 | 0 | case BT_PLUS: |
1075 | 0 | *nextTokPtr = ptr + MINBPC(enc); |
1076 | 0 | return XML_TOK_CLOSE_PAREN_PLUS; |
1077 | 0 | case BT_CR: case BT_LF: case BT_S: |
1078 | 0 | case BT_GT: case BT_COMMA: case BT_VERBAR: |
1079 | 0 | case BT_RPAR: |
1080 | 0 | *nextTokPtr = ptr; |
1081 | 0 | return XML_TOK_CLOSE_PAREN; |
1082 | 0 | } |
1083 | 0 | *nextTokPtr = ptr; |
1084 | 0 | return XML_TOK_INVALID; |
1085 | 0 | case BT_VERBAR: |
1086 | 0 | *nextTokPtr = ptr + MINBPC(enc); |
1087 | 0 | return XML_TOK_OR; |
1088 | 0 | case BT_GT: |
1089 | 0 | *nextTokPtr = ptr + MINBPC(enc); |
1090 | 0 | return XML_TOK_DECL_CLOSE; |
1091 | 0 | case BT_NUM: |
1092 | 0 | return PREFIX(scanPoundName)(enc, ptr + MINBPC(enc), end, nextTokPtr); |
1093 | 0 | #define LEAD_CASE(n) \ |
1094 | 0 | case BT_LEAD ## n: \ |
1095 | 0 | if (end - ptr < n) \ |
1096 | 0 | return XML_TOK_PARTIAL_CHAR; \ |
1097 | 0 | if (IS_NMSTRT_CHAR(enc, ptr, n)) { \ |
1098 | 0 | ptr += n; \ |
1099 | 0 | tok = XML_TOK_NAME; \ |
1100 | 0 | break; \ |
1101 | 0 | } \ |
1102 | 0 | if (IS_NAME_CHAR(enc, ptr, n)) { \ |
1103 | 0 | ptr += n; \ |
1104 | 0 | tok = XML_TOK_NMTOKEN; \ |
1105 | 0 | break; \ |
1106 | 0 | } \ |
1107 | 0 | *nextTokPtr = ptr; \ |
1108 | 0 | return XML_TOK_INVALID; |
1109 | 0 | LEAD_CASE(2) LEAD_CASE(3) LEAD_CASE(4) |
1110 | 0 | #undef LEAD_CASE |
1111 | 0 | case BT_NMSTRT: |
1112 | 0 | case BT_HEX: |
1113 | 0 | tok = XML_TOK_NAME; |
1114 | 0 | ptr += MINBPC(enc); |
1115 | 0 | break; |
1116 | 0 | case BT_DIGIT: |
1117 | 0 | case BT_NAME: |
1118 | 0 | case BT_MINUS: |
1119 | 0 | #ifdef XML_NS |
1120 | 0 | case BT_COLON: |
1121 | 0 | #endif |
1122 | 0 | tok = XML_TOK_NMTOKEN; |
1123 | 0 | ptr += MINBPC(enc); |
1124 | 0 | break; |
1125 | 0 | case BT_NONASCII: |
1126 | 0 | if (IS_NMSTRT_CHAR_MINBPC(enc, ptr)) { |
1127 | 0 | ptr += MINBPC(enc); |
1128 | 0 | tok = XML_TOK_NAME; |
1129 | 0 | break; |
1130 | 0 | } |
1131 | 0 | if (IS_NAME_CHAR_MINBPC(enc, ptr)) { |
1132 | 0 | ptr += MINBPC(enc); |
1133 | 0 | tok = XML_TOK_NMTOKEN; |
1134 | 0 | break; |
1135 | 0 | } |
1136 | 0 | /* fall through */ |
1137 | 0 | default: |
1138 | 0 | *nextTokPtr = ptr; |
1139 | 0 | return XML_TOK_INVALID; |
1140 | 0 | } |
1141 | 0 | while (ptr != end) { |
1142 | 0 | switch (BYTE_TYPE(enc, ptr)) { |
1143 | 0 | CHECK_NAME_CASES(enc, ptr, end, nextTokPtr) |
1144 | 0 | case BT_GT: case BT_RPAR: case BT_COMMA: |
1145 | 0 | case BT_VERBAR: case BT_LSQB: case BT_PERCNT: |
1146 | 0 | case BT_S: case BT_CR: case BT_LF: |
1147 | 0 | *nextTokPtr = ptr; |
1148 | 0 | return tok; |
1149 | 0 | #ifdef XML_NS |
1150 | 0 | case BT_COLON: |
1151 | 0 | ptr += MINBPC(enc); |
1152 | 0 | switch (tok) { |
1153 | 0 | case XML_TOK_NAME: |
1154 | 0 | if (ptr == end) |
1155 | 0 | return XML_TOK_PARTIAL; |
1156 | 0 | tok = XML_TOK_PREFIXED_NAME; |
1157 | 0 | switch (BYTE_TYPE(enc, ptr)) { |
1158 | 0 | CHECK_NAME_CASES(enc, ptr, end, nextTokPtr) |
1159 | 0 | default: |
1160 | 0 | tok = XML_TOK_NMTOKEN; |
1161 | 0 | break; |
1162 | 0 | } |
1163 | 0 | break; |
1164 | 0 | case XML_TOK_PREFIXED_NAME: |
1165 | 0 | tok = XML_TOK_NMTOKEN; |
1166 | 0 | break; |
1167 | 0 | } |
1168 | 0 | break; |
1169 | 0 | #endif |
1170 | 0 | case BT_PLUS: |
1171 | 0 | if (tok == XML_TOK_NMTOKEN) { |
1172 | 0 | *nextTokPtr = ptr; |
1173 | 0 | return XML_TOK_INVALID; |
1174 | 0 | } |
1175 | 0 | *nextTokPtr = ptr + MINBPC(enc); |
1176 | 0 | return XML_TOK_NAME_PLUS; |
1177 | 0 | case BT_AST: |
1178 | 0 | if (tok == XML_TOK_NMTOKEN) { |
1179 | 0 | *nextTokPtr = ptr; |
1180 | 0 | return XML_TOK_INVALID; |
1181 | 0 | } |
1182 | 0 | *nextTokPtr = ptr + MINBPC(enc); |
1183 | 0 | return XML_TOK_NAME_ASTERISK; |
1184 | 0 | case BT_QUEST: |
1185 | 0 | if (tok == XML_TOK_NMTOKEN) { |
1186 | 0 | *nextTokPtr = ptr; |
1187 | 0 | return XML_TOK_INVALID; |
1188 | 0 | } |
1189 | 0 | *nextTokPtr = ptr + MINBPC(enc); |
1190 | 0 | return XML_TOK_NAME_QUESTION; |
1191 | 0 | default: |
1192 | 0 | *nextTokPtr = ptr; |
1193 | 0 | return XML_TOK_INVALID; |
1194 | 0 | } |
1195 | 0 | } |
1196 | 0 | return -tok; |
1197 | 0 | } Unexecuted instantiation: xmltok.c:normal_prologTok Unexecuted instantiation: xmltok.c:little2_prologTok Unexecuted instantiation: xmltok.c:big2_prologTok |
1198 | | |
1199 | | static int PTRCALL |
1200 | | PREFIX(attributeValueTok)(const ENCODING *enc, const char *ptr, |
1201 | | const char *end, const char **nextTokPtr) |
1202 | 0 | { |
1203 | 0 | const char *start; |
1204 | 0 | if (ptr == end) |
1205 | 0 | return XML_TOK_NONE; |
1206 | 0 | start = ptr; |
1207 | 0 | while (ptr != end) { |
1208 | 0 | switch (BYTE_TYPE(enc, ptr)) { |
1209 | 0 | #define LEAD_CASE(n) \ |
1210 | 0 | case BT_LEAD ## n: ptr += n; break; |
1211 | 0 | LEAD_CASE(2) LEAD_CASE(3) LEAD_CASE(4) |
1212 | 0 | #undef LEAD_CASE |
1213 | 0 | case BT_AMP: |
1214 | 0 | if (ptr == start) |
1215 | 0 | return PREFIX(scanRef)(enc, ptr + MINBPC(enc), end, nextTokPtr); |
1216 | 0 | *nextTokPtr = ptr; |
1217 | 0 | return XML_TOK_DATA_CHARS; |
1218 | 0 | case BT_LT: |
1219 | 0 | /* this is for inside entity references */ |
1220 | 0 | *nextTokPtr = ptr; |
1221 | 0 | return XML_TOK_INVALID; |
1222 | 0 | case BT_LF: |
1223 | 0 | if (ptr == start) { |
1224 | 0 | *nextTokPtr = ptr + MINBPC(enc); |
1225 | 0 | return XML_TOK_DATA_NEWLINE; |
1226 | 0 | } |
1227 | 0 | *nextTokPtr = ptr; |
1228 | 0 | return XML_TOK_DATA_CHARS; |
1229 | 0 | case BT_CR: |
1230 | 0 | if (ptr == start) { |
1231 | 0 | ptr += MINBPC(enc); |
1232 | 0 | if (ptr == end) |
1233 | 0 | return XML_TOK_TRAILING_CR; |
1234 | 0 | if (BYTE_TYPE(enc, ptr) == BT_LF) |
1235 | 0 | ptr += MINBPC(enc); |
1236 | 0 | *nextTokPtr = ptr; |
1237 | 0 | return XML_TOK_DATA_NEWLINE; |
1238 | 0 | } |
1239 | 0 | *nextTokPtr = ptr; |
1240 | 0 | return XML_TOK_DATA_CHARS; |
1241 | 0 | case BT_S: |
1242 | 0 | if (ptr == start) { |
1243 | 0 | *nextTokPtr = ptr + MINBPC(enc); |
1244 | 0 | return XML_TOK_ATTRIBUTE_VALUE_S; |
1245 | 0 | } |
1246 | 0 | *nextTokPtr = ptr; |
1247 | 0 | return XML_TOK_DATA_CHARS; |
1248 | 0 | default: |
1249 | 0 | ptr += MINBPC(enc); |
1250 | 0 | break; |
1251 | 0 | } |
1252 | 0 | } |
1253 | 0 | *nextTokPtr = ptr; |
1254 | 0 | return XML_TOK_DATA_CHARS; |
1255 | 0 | } Unexecuted instantiation: xmltok.c:normal_attributeValueTok Unexecuted instantiation: xmltok.c:little2_attributeValueTok Unexecuted instantiation: xmltok.c:big2_attributeValueTok |
1256 | | |
1257 | | static int PTRCALL |
1258 | | PREFIX(entityValueTok)(const ENCODING *enc, const char *ptr, |
1259 | | const char *end, const char **nextTokPtr) |
1260 | 0 | { |
1261 | 0 | const char *start; |
1262 | 0 | if (ptr == end) |
1263 | 0 | return XML_TOK_NONE; |
1264 | 0 | start = ptr; |
1265 | 0 | while (ptr != end) { |
1266 | 0 | switch (BYTE_TYPE(enc, ptr)) { |
1267 | 0 | #define LEAD_CASE(n) \ |
1268 | 0 | case BT_LEAD ## n: ptr += n; break; |
1269 | 0 | LEAD_CASE(2) LEAD_CASE(3) LEAD_CASE(4) |
1270 | 0 | #undef LEAD_CASE |
1271 | 0 | case BT_AMP: |
1272 | 0 | if (ptr == start) |
1273 | 0 | return PREFIX(scanRef)(enc, ptr + MINBPC(enc), end, nextTokPtr); |
1274 | 0 | *nextTokPtr = ptr; |
1275 | 0 | return XML_TOK_DATA_CHARS; |
1276 | 0 | case BT_PERCNT: |
1277 | 0 | if (ptr == start) { |
1278 | 0 | int tok = PREFIX(scanPercent)(enc, ptr + MINBPC(enc), |
1279 | 0 | end, nextTokPtr); |
1280 | 0 | return (tok == XML_TOK_PERCENT) ? XML_TOK_INVALID : tok; |
1281 | 0 | } |
1282 | 0 | *nextTokPtr = ptr; |
1283 | 0 | return XML_TOK_DATA_CHARS; |
1284 | 0 | case BT_LF: |
1285 | 0 | if (ptr == start) { |
1286 | 0 | *nextTokPtr = ptr + MINBPC(enc); |
1287 | 0 | return XML_TOK_DATA_NEWLINE; |
1288 | 0 | } |
1289 | 0 | *nextTokPtr = ptr; |
1290 | 0 | return XML_TOK_DATA_CHARS; |
1291 | 0 | case BT_CR: |
1292 | 0 | if (ptr == start) { |
1293 | 0 | ptr += MINBPC(enc); |
1294 | 0 | if (ptr == end) |
1295 | 0 | return XML_TOK_TRAILING_CR; |
1296 | 0 | if (BYTE_TYPE(enc, ptr) == BT_LF) |
1297 | 0 | ptr += MINBPC(enc); |
1298 | 0 | *nextTokPtr = ptr; |
1299 | 0 | return XML_TOK_DATA_NEWLINE; |
1300 | 0 | } |
1301 | 0 | *nextTokPtr = ptr; |
1302 | 0 | return XML_TOK_DATA_CHARS; |
1303 | 0 | default: |
1304 | 0 | ptr += MINBPC(enc); |
1305 | 0 | break; |
1306 | 0 | } |
1307 | 0 | } |
1308 | 0 | *nextTokPtr = ptr; |
1309 | 0 | return XML_TOK_DATA_CHARS; |
1310 | 0 | } Unexecuted instantiation: xmltok.c:normal_entityValueTok Unexecuted instantiation: xmltok.c:little2_entityValueTok Unexecuted instantiation: xmltok.c:big2_entityValueTok |
1311 | | |
1312 | | #ifdef XML_DTD |
1313 | | |
1314 | | static int PTRCALL |
1315 | | PREFIX(ignoreSectionTok)(const ENCODING *enc, const char *ptr, |
1316 | | const char *end, const char **nextTokPtr) |
1317 | 0 | { |
1318 | 0 | int level = 0; |
1319 | 0 | if (MINBPC(enc) > 1) { |
1320 | 0 | size_t n = end - ptr; |
1321 | 0 | if (n & (MINBPC(enc) - 1)) { |
1322 | 0 | n &= ~(MINBPC(enc) - 1); |
1323 | 0 | end = ptr + n; |
1324 | 0 | } |
1325 | 0 | } |
1326 | 0 | while (ptr != end) { |
1327 | 0 | switch (BYTE_TYPE(enc, ptr)) { |
1328 | 0 | INVALID_CASES(ptr, nextTokPtr) |
1329 | 0 | case BT_LT: |
1330 | 0 | if ((ptr += MINBPC(enc)) == end) |
1331 | 0 | return XML_TOK_PARTIAL; |
1332 | 0 | if (CHAR_MATCHES(enc, ptr, ASCII_EXCL)) { |
1333 | 0 | if ((ptr += MINBPC(enc)) == end) |
1334 | 0 | return XML_TOK_PARTIAL; |
1335 | 0 | if (CHAR_MATCHES(enc, ptr, ASCII_LSQB)) { |
1336 | 0 | ++level; |
1337 | 0 | ptr += MINBPC(enc); |
1338 | 0 | } |
1339 | 0 | } |
1340 | 0 | break; |
1341 | 0 | case BT_RSQB: |
1342 | 0 | if ((ptr += MINBPC(enc)) == end) |
1343 | 0 | return XML_TOK_PARTIAL; |
1344 | 0 | if (CHAR_MATCHES(enc, ptr, ASCII_RSQB)) { |
1345 | 0 | if ((ptr += MINBPC(enc)) == end) |
1346 | 0 | return XML_TOK_PARTIAL; |
1347 | 0 | if (CHAR_MATCHES(enc, ptr, ASCII_GT)) { |
1348 | 0 | ptr += MINBPC(enc); |
1349 | 0 | if (level == 0) { |
1350 | 0 | *nextTokPtr = ptr; |
1351 | 0 | return XML_TOK_IGNORE_SECT; |
1352 | 0 | } |
1353 | 0 | --level; |
1354 | 0 | } |
1355 | 0 | } |
1356 | 0 | break; |
1357 | 0 | default: |
1358 | 0 | ptr += MINBPC(enc); |
1359 | 0 | break; |
1360 | 0 | } |
1361 | 0 | } |
1362 | 0 | return XML_TOK_PARTIAL; |
1363 | 0 | } Unexecuted instantiation: xmltok.c:normal_ignoreSectionTok Unexecuted instantiation: xmltok.c:little2_ignoreSectionTok Unexecuted instantiation: xmltok.c:big2_ignoreSectionTok |
1364 | | |
1365 | | #endif /* XML_DTD */ |
1366 | | |
1367 | | static int PTRCALL |
1368 | | PREFIX(isPublicId)(const ENCODING *enc, const char *ptr, const char *end, |
1369 | | const char **badPtr) |
1370 | 0 | { |
1371 | 0 | ptr += MINBPC(enc); |
1372 | 0 | end -= MINBPC(enc); |
1373 | 0 | for (; ptr != end; ptr += MINBPC(enc)) { |
1374 | 0 | switch (BYTE_TYPE(enc, ptr)) { |
1375 | 0 | case BT_DIGIT: |
1376 | 0 | case BT_HEX: |
1377 | 0 | case BT_MINUS: |
1378 | 0 | case BT_APOS: |
1379 | 0 | case BT_LPAR: |
1380 | 0 | case BT_RPAR: |
1381 | 0 | case BT_PLUS: |
1382 | 0 | case BT_COMMA: |
1383 | 0 | case BT_SOL: |
1384 | 0 | case BT_EQUALS: |
1385 | 0 | case BT_QUEST: |
1386 | 0 | case BT_CR: |
1387 | 0 | case BT_LF: |
1388 | 0 | case BT_SEMI: |
1389 | 0 | case BT_EXCL: |
1390 | 0 | case BT_AST: |
1391 | 0 | case BT_PERCNT: |
1392 | 0 | case BT_NUM: |
1393 | 0 | #ifdef XML_NS |
1394 | 0 | case BT_COLON: |
1395 | 0 | #endif |
1396 | 0 | break; |
1397 | 0 | case BT_S: |
1398 | 0 | if (CHAR_MATCHES(enc, ptr, ASCII_TAB)) { |
1399 | 0 | *badPtr = ptr; |
1400 | 0 | return 0; |
1401 | 0 | } |
1402 | 0 | break; |
1403 | 0 | case BT_NAME: |
1404 | 0 | case BT_NMSTRT: |
1405 | 0 | if (!(BYTE_TO_ASCII(enc, ptr) & ~0x7f)) |
1406 | 0 | break; |
1407 | 0 | default: |
1408 | 0 | switch (BYTE_TO_ASCII(enc, ptr)) { |
1409 | 0 | case 0x24: /* $ */ |
1410 | 0 | case 0x40: /* @ */ |
1411 | 0 | break; |
1412 | 0 | default: |
1413 | 0 | *badPtr = ptr; |
1414 | 0 | return 0; |
1415 | 0 | } |
1416 | 0 | break; |
1417 | 0 | } |
1418 | 0 | } |
1419 | 0 | return 1; |
1420 | 0 | } Unexecuted instantiation: xmltok.c:normal_isPublicId Unexecuted instantiation: xmltok.c:little2_isPublicId Unexecuted instantiation: xmltok.c:big2_isPublicId |
1421 | | |
1422 | | /* This must only be called for a well-formed start-tag or empty |
1423 | | element tag. Returns the number of attributes. Pointers to the |
1424 | | first attsMax attributes are stored in atts. |
1425 | | */ |
1426 | | |
1427 | | static int PTRCALL |
1428 | | PREFIX(getAtts)(const ENCODING *enc, const char *ptr, |
1429 | | int attsMax, ATTRIBUTE *atts) |
1430 | 0 | { |
1431 | 0 | enum { other, inName, inValue } state = inName; |
1432 | 0 | int nAtts = 0; |
1433 | 0 | int open = 0; /* defined when state == inValue; |
1434 | 0 | initialization just to shut up compilers */ |
1435 | 0 |
|
1436 | 0 | for (ptr += MINBPC(enc);; ptr += MINBPC(enc)) { |
1437 | 0 | switch (BYTE_TYPE(enc, ptr)) { |
1438 | 0 | #define START_NAME \ |
1439 | 0 | if (state == other) { \ |
1440 | 0 | if (nAtts < attsMax) { \ |
1441 | 0 | atts[nAtts].name = ptr; \ |
1442 | 0 | atts[nAtts].normalized = 1; \ |
1443 | 0 | } \ |
1444 | 0 | state = inName; \ |
1445 | 0 | } |
1446 | 0 | #define LEAD_CASE(n) \ |
1447 | 0 | case BT_LEAD ## n: START_NAME ptr += (n - MINBPC(enc)); break; |
1448 | 0 | LEAD_CASE(2) LEAD_CASE(3) LEAD_CASE(4) |
1449 | 0 | #undef LEAD_CASE |
1450 | 0 | case BT_NONASCII: |
1451 | 0 | case BT_NMSTRT: |
1452 | 0 | case BT_HEX: |
1453 | 0 | START_NAME |
1454 | 0 | break; |
1455 | 0 | #undef START_NAME |
1456 | 0 | case BT_QUOT: |
1457 | 0 | if (state != inValue) { |
1458 | 0 | if (nAtts < attsMax) |
1459 | 0 | atts[nAtts].valuePtr = ptr + MINBPC(enc); |
1460 | 0 | state = inValue; |
1461 | 0 | open = BT_QUOT; |
1462 | 0 | } |
1463 | 0 | else if (open == BT_QUOT) { |
1464 | 0 | state = other; |
1465 | 0 | if (nAtts < attsMax) |
1466 | 0 | atts[nAtts].valueEnd = ptr; |
1467 | 0 | nAtts++; |
1468 | 0 | } |
1469 | 0 | break; |
1470 | 0 | case BT_APOS: |
1471 | 0 | if (state != inValue) { |
1472 | 0 | if (nAtts < attsMax) |
1473 | 0 | atts[nAtts].valuePtr = ptr + MINBPC(enc); |
1474 | 0 | state = inValue; |
1475 | 0 | open = BT_APOS; |
1476 | 0 | } |
1477 | 0 | else if (open == BT_APOS) { |
1478 | 0 | state = other; |
1479 | 0 | if (nAtts < attsMax) |
1480 | 0 | atts[nAtts].valueEnd = ptr; |
1481 | 0 | nAtts++; |
1482 | 0 | } |
1483 | 0 | break; |
1484 | 0 | case BT_AMP: |
1485 | 0 | if (nAtts < attsMax) |
1486 | 0 | atts[nAtts].normalized = 0; |
1487 | 0 | break; |
1488 | 0 | case BT_S: |
1489 | 0 | if (state == inName) |
1490 | 0 | state = other; |
1491 | 0 | else if (state == inValue |
1492 | 0 | && nAtts < attsMax |
1493 | 0 | && atts[nAtts].normalized |
1494 | 0 | && (ptr == atts[nAtts].valuePtr |
1495 | 0 | || BYTE_TO_ASCII(enc, ptr) != ASCII_SPACE |
1496 | 0 | || BYTE_TO_ASCII(enc, ptr + MINBPC(enc)) == ASCII_SPACE |
1497 | 0 | || BYTE_TYPE(enc, ptr + MINBPC(enc)) == open)) |
1498 | 0 | atts[nAtts].normalized = 0; |
1499 | 0 | break; |
1500 | 0 | case BT_CR: case BT_LF: |
1501 | 0 | /* This case ensures that the first attribute name is counted |
1502 | 0 | Apart from that we could just change state on the quote. */ |
1503 | 0 | if (state == inName) |
1504 | 0 | state = other; |
1505 | 0 | else if (state == inValue && nAtts < attsMax) |
1506 | 0 | atts[nAtts].normalized = 0; |
1507 | 0 | break; |
1508 | 0 | case BT_GT: |
1509 | 0 | case BT_SOL: |
1510 | 0 | if (state != inValue) |
1511 | 0 | return nAtts; |
1512 | 0 | break; |
1513 | 0 | default: |
1514 | 0 | break; |
1515 | 0 | } |
1516 | 0 | } |
1517 | 0 | /* not reached */ |
1518 | 0 | } Unexecuted instantiation: xmltok.c:normal_getAtts Unexecuted instantiation: xmltok.c:little2_getAtts Unexecuted instantiation: xmltok.c:big2_getAtts |
1519 | | |
1520 | | static int PTRFASTCALL |
1521 | | PREFIX(charRefNumber)(const ENCODING *enc, const char *ptr) |
1522 | 0 | { |
1523 | 0 | int result = 0; |
1524 | 0 | /* skip &# */ |
1525 | 0 | ptr += 2*MINBPC(enc); |
1526 | 0 | if (CHAR_MATCHES(enc, ptr, ASCII_x)) { |
1527 | 0 | for (ptr += MINBPC(enc); |
1528 | 0 | !CHAR_MATCHES(enc, ptr, ASCII_SEMI); |
1529 | 0 | ptr += MINBPC(enc)) { |
1530 | 0 | int c = BYTE_TO_ASCII(enc, ptr); |
1531 | 0 | switch (c) { |
1532 | 0 | case ASCII_0: case ASCII_1: case ASCII_2: case ASCII_3: case ASCII_4: |
1533 | 0 | case ASCII_5: case ASCII_6: case ASCII_7: case ASCII_8: case ASCII_9: |
1534 | 0 | result <<= 4; |
1535 | 0 | result |= (c - ASCII_0); |
1536 | 0 | break; |
1537 | 0 | case ASCII_A: case ASCII_B: case ASCII_C: |
1538 | 0 | case ASCII_D: case ASCII_E: case ASCII_F: |
1539 | 0 | result <<= 4; |
1540 | 0 | result += 10 + (c - ASCII_A); |
1541 | 0 | break; |
1542 | 0 | case ASCII_a: case ASCII_b: case ASCII_c: |
1543 | 0 | case ASCII_d: case ASCII_e: case ASCII_f: |
1544 | 0 | result <<= 4; |
1545 | 0 | result += 10 + (c - ASCII_a); |
1546 | 0 | break; |
1547 | 0 | } |
1548 | 0 | if (result >= 0x110000) |
1549 | 0 | return -1; |
1550 | 0 | } |
1551 | 0 | } |
1552 | 0 | else { |
1553 | 0 | for (; !CHAR_MATCHES(enc, ptr, ASCII_SEMI); ptr += MINBPC(enc)) { |
1554 | 0 | int c = BYTE_TO_ASCII(enc, ptr); |
1555 | 0 | result *= 10; |
1556 | 0 | result += (c - ASCII_0); |
1557 | 0 | if (result >= 0x110000) |
1558 | 0 | return -1; |
1559 | 0 | } |
1560 | 0 | } |
1561 | 0 | return checkCharRefNumber(result); |
1562 | 0 | } Unexecuted instantiation: xmltok.c:normal_charRefNumber Unexecuted instantiation: xmltok.c:little2_charRefNumber Unexecuted instantiation: xmltok.c:big2_charRefNumber |
1563 | | |
1564 | | static int PTRCALL |
1565 | | PREFIX(predefinedEntityName)(const ENCODING *enc, const char *ptr, |
1566 | | const char *end) |
1567 | 0 | { |
1568 | 0 | switch ((end - ptr)/MINBPC(enc)) { |
1569 | 0 | case 2: |
1570 | 0 | if (CHAR_MATCHES(enc, ptr + MINBPC(enc), ASCII_t)) { |
1571 | 0 | switch (BYTE_TO_ASCII(enc, ptr)) { |
1572 | 0 | case ASCII_l: |
1573 | 0 | return ASCII_LT; |
1574 | 0 | case ASCII_g: |
1575 | 0 | return ASCII_GT; |
1576 | 0 | } |
1577 | 0 | } |
1578 | 0 | break; |
1579 | 0 | case 3: |
1580 | 0 | if (CHAR_MATCHES(enc, ptr, ASCII_a)) { |
1581 | 0 | ptr += MINBPC(enc); |
1582 | 0 | if (CHAR_MATCHES(enc, ptr, ASCII_m)) { |
1583 | 0 | ptr += MINBPC(enc); |
1584 | 0 | if (CHAR_MATCHES(enc, ptr, ASCII_p)) |
1585 | 0 | return ASCII_AMP; |
1586 | 0 | } |
1587 | 0 | } |
1588 | 0 | break; |
1589 | 0 | case 4: |
1590 | 0 | switch (BYTE_TO_ASCII(enc, ptr)) { |
1591 | 0 | case ASCII_q: |
1592 | 0 | ptr += MINBPC(enc); |
1593 | 0 | if (CHAR_MATCHES(enc, ptr, ASCII_u)) { |
1594 | 0 | ptr += MINBPC(enc); |
1595 | 0 | if (CHAR_MATCHES(enc, ptr, ASCII_o)) { |
1596 | 0 | ptr += MINBPC(enc); |
1597 | 0 | if (CHAR_MATCHES(enc, ptr, ASCII_t)) |
1598 | 0 | return ASCII_QUOT; |
1599 | 0 | } |
1600 | 0 | } |
1601 | 0 | break; |
1602 | 0 | case ASCII_a: |
1603 | 0 | ptr += MINBPC(enc); |
1604 | 0 | if (CHAR_MATCHES(enc, ptr, ASCII_p)) { |
1605 | 0 | ptr += MINBPC(enc); |
1606 | 0 | if (CHAR_MATCHES(enc, ptr, ASCII_o)) { |
1607 | 0 | ptr += MINBPC(enc); |
1608 | 0 | if (CHAR_MATCHES(enc, ptr, ASCII_s)) |
1609 | 0 | return ASCII_APOS; |
1610 | 0 | } |
1611 | 0 | } |
1612 | 0 | break; |
1613 | 0 | } |
1614 | 0 | } |
1615 | 0 | return 0; |
1616 | 0 | } Unexecuted instantiation: xmltok.c:normal_predefinedEntityName Unexecuted instantiation: xmltok.c:little2_predefinedEntityName Unexecuted instantiation: xmltok.c:big2_predefinedEntityName |
1617 | | |
1618 | | static int PTRCALL |
1619 | | PREFIX(sameName)(const ENCODING *enc, const char *ptr1, const char *ptr2) |
1620 | 0 | { |
1621 | 0 | for (;;) { |
1622 | 0 | switch (BYTE_TYPE(enc, ptr1)) { |
1623 | 0 | #define LEAD_CASE(n) \ |
1624 | 0 | case BT_LEAD ## n: \ |
1625 | 0 | if (*ptr1++ != *ptr2++) \ |
1626 | 0 | return 0; |
1627 | 0 | LEAD_CASE(4) LEAD_CASE(3) LEAD_CASE(2) |
1628 | 0 | #undef LEAD_CASE |
1629 | 0 | /* fall through */ |
1630 | 0 | if (*ptr1++ != *ptr2++) |
1631 | 0 | return 0; |
1632 | 0 | break; |
1633 | 0 | case BT_NONASCII: |
1634 | 0 | case BT_NMSTRT: |
1635 | 0 | #ifdef XML_NS |
1636 | 0 | case BT_COLON: |
1637 | 0 | #endif |
1638 | 0 | case BT_HEX: |
1639 | 0 | case BT_DIGIT: |
1640 | 0 | case BT_NAME: |
1641 | 0 | case BT_MINUS: |
1642 | 0 | if (*ptr2++ != *ptr1++) |
1643 | 0 | return 0; |
1644 | 0 | if (MINBPC(enc) > 1) { |
1645 | 0 | if (*ptr2++ != *ptr1++) |
1646 | 0 | return 0; |
1647 | 0 | if (MINBPC(enc) > 2) { |
1648 | 0 | if (*ptr2++ != *ptr1++) |
1649 | 0 | return 0; |
1650 | 0 | if (MINBPC(enc) > 3) { |
1651 | 0 | if (*ptr2++ != *ptr1++) |
1652 | 0 | return 0; |
1653 | 0 | } |
1654 | 0 | } |
1655 | 0 | } |
1656 | 0 | break; |
1657 | 0 | default: |
1658 | 0 | if (MINBPC(enc) == 1 && *ptr1 == *ptr2) |
1659 | 0 | return 1; |
1660 | 0 | switch (BYTE_TYPE(enc, ptr2)) { |
1661 | 0 | case BT_LEAD2: |
1662 | 0 | case BT_LEAD3: |
1663 | 0 | case BT_LEAD4: |
1664 | 0 | case BT_NONASCII: |
1665 | 0 | case BT_NMSTRT: |
1666 | 0 | #ifdef XML_NS |
1667 | 0 | case BT_COLON: |
1668 | 0 | #endif |
1669 | 0 | case BT_HEX: |
1670 | 0 | case BT_DIGIT: |
1671 | 0 | case BT_NAME: |
1672 | 0 | case BT_MINUS: |
1673 | 0 | return 0; |
1674 | 0 | default: |
1675 | 0 | return 1; |
1676 | 0 | } |
1677 | 0 | } |
1678 | 0 | } |
1679 | 0 | /* not reached */ |
1680 | 0 | } Unexecuted instantiation: xmltok.c:normal_sameName Unexecuted instantiation: xmltok.c:little2_sameName Unexecuted instantiation: xmltok.c:big2_sameName |
1681 | | |
1682 | | static int PTRCALL |
1683 | | PREFIX(nameMatchesAscii)(const ENCODING *enc, const char *ptr1, |
1684 | | const char *end1, const char *ptr2) |
1685 | 0 | { |
1686 | 0 | for (; *ptr2; ptr1 += MINBPC(enc), ptr2++) { |
1687 | 0 | if (ptr1 == end1) |
1688 | 0 | return 0; |
1689 | 0 | if (!CHAR_MATCHES(enc, ptr1, *ptr2)) |
1690 | 0 | return 0; |
1691 | 0 | } |
1692 | 0 | return ptr1 == end1; |
1693 | 0 | } Unexecuted instantiation: xmltok.c:normal_nameMatchesAscii Unexecuted instantiation: xmltok.c:little2_nameMatchesAscii Unexecuted instantiation: xmltok.c:big2_nameMatchesAscii |
1694 | | |
1695 | | static int PTRFASTCALL |
1696 | | PREFIX(nameLength)(const ENCODING *enc, const char *ptr) |
1697 | 0 | { |
1698 | 0 | const char *start = ptr; |
1699 | 0 | for (;;) { |
1700 | 0 | switch (BYTE_TYPE(enc, ptr)) { |
1701 | 0 | #define LEAD_CASE(n) \ |
1702 | 0 | case BT_LEAD ## n: ptr += n; break; |
1703 | 0 | LEAD_CASE(2) LEAD_CASE(3) LEAD_CASE(4) |
1704 | 0 | #undef LEAD_CASE |
1705 | 0 | case BT_NONASCII: |
1706 | 0 | case BT_NMSTRT: |
1707 | 0 | #ifdef XML_NS |
1708 | 0 | case BT_COLON: |
1709 | 0 | #endif |
1710 | 0 | case BT_HEX: |
1711 | 0 | case BT_DIGIT: |
1712 | 0 | case BT_NAME: |
1713 | 0 | case BT_MINUS: |
1714 | 0 | ptr += MINBPC(enc); |
1715 | 0 | break; |
1716 | 0 | default: |
1717 | 0 | return (int)(ptr - start); |
1718 | 0 | } |
1719 | 0 | } |
1720 | 0 | } Unexecuted instantiation: xmltok.c:normal_nameLength Unexecuted instantiation: xmltok.c:little2_nameLength Unexecuted instantiation: xmltok.c:big2_nameLength |
1721 | | |
1722 | | static const char * PTRFASTCALL |
1723 | | PREFIX(skipS)(const ENCODING *enc, const char *ptr) |
1724 | 0 | { |
1725 | 0 | for (;;) { |
1726 | 0 | switch (BYTE_TYPE(enc, ptr)) { |
1727 | 0 | case BT_LF: |
1728 | 0 | case BT_CR: |
1729 | 0 | case BT_S: |
1730 | 0 | ptr += MINBPC(enc); |
1731 | 0 | break; |
1732 | 0 | default: |
1733 | 0 | return ptr; |
1734 | 0 | } |
1735 | 0 | } |
1736 | 0 | } Unexecuted instantiation: xmltok.c:normal_skipS Unexecuted instantiation: xmltok.c:little2_skipS Unexecuted instantiation: xmltok.c:big2_skipS |
1737 | | |
1738 | | static void PTRCALL |
1739 | | PREFIX(updatePosition)(const ENCODING *enc, |
1740 | | const char *ptr, |
1741 | | const char *end, |
1742 | | POSITION *pos) |
1743 | 0 | { |
1744 | 0 | while (ptr != end) { |
1745 | 0 | switch (BYTE_TYPE(enc, ptr)) { |
1746 | 0 | #define LEAD_CASE(n) \ |
1747 | 0 | case BT_LEAD ## n: \ |
1748 | 0 | ptr += n; \ |
1749 | 0 | break; |
1750 | 0 | LEAD_CASE(2) LEAD_CASE(3) LEAD_CASE(4) |
1751 | 0 | #undef LEAD_CASE |
1752 | 0 | case BT_LF: |
1753 | 0 | pos->columnNumber = (XML_Size)-1; |
1754 | 0 | pos->lineNumber++; |
1755 | 0 | ptr += MINBPC(enc); |
1756 | 0 | break; |
1757 | 0 | case BT_CR: |
1758 | 0 | pos->lineNumber++; |
1759 | 0 | ptr += MINBPC(enc); |
1760 | 0 | if (ptr != end && BYTE_TYPE(enc, ptr) == BT_LF) |
1761 | 0 | ptr += MINBPC(enc); |
1762 | 0 | pos->columnNumber = (XML_Size)-1; |
1763 | 0 | break; |
1764 | 0 | default: |
1765 | 0 | ptr += MINBPC(enc); |
1766 | 0 | break; |
1767 | 0 | } |
1768 | 0 | pos->columnNumber++; |
1769 | 0 | } |
1770 | 0 | } Unexecuted instantiation: xmltok.c:normal_updatePosition Unexecuted instantiation: xmltok.c:little2_updatePosition Unexecuted instantiation: xmltok.c:big2_updatePosition |
1771 | | |
1772 | | #undef DO_LEAD_CASE |
1773 | | #undef MULTIBYTE_CASES |
1774 | | #undef INVALID_CASES |
1775 | | #undef CHECK_NAME_CASE |
1776 | | #undef CHECK_NAME_CASES |
1777 | | #undef CHECK_NMSTRT_CASE |
1778 | | #undef CHECK_NMSTRT_CASES |
1779 | | |