Coverage Report

Created: 2026-05-16 06:54

next uncovered line (L), next uncovered region (R), next uncovered branch (B)
/src/open62541/deps/yxml.c
Line
Count
Source
1
/* This file is generated by yxml-gen.pl using yxml-states and yxml.c.in as input files.
2
 * It is preferable to edit those files instead of this one if you want to make a change.
3
 * The source files can be found through the homepage: https://dev.yorhel.nl/yxml */
4
5
/* Copyright (c) 2013-2014 Yoran Heling
6
7
  Permission is hereby granted, free of charge, to any person obtaining
8
  a copy of this software and associated documentation files (the
9
  "Software"), to deal in the Software without restriction, including
10
  without limitation the rights to use, copy, modify, merge, publish,
11
  distribute, sublicense, and/or sell copies of the Software, and to
12
  permit persons to whom the Software is furnished to do so, subject to
13
  the following conditions:
14
15
  The above copyright notice and this permission notice shall be included
16
  in all copies or substantial portions of the Software.
17
18
  THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
19
  EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
20
  MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.
21
  IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY
22
  CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
23
  TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
24
  SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
25
*/
26
27
#include "yxml.h"
28
#include <string.h>
29
30
typedef enum {
31
  YXMLS_string,
32
  YXMLS_attr0,
33
  YXMLS_attr1,
34
  YXMLS_attr2,
35
  YXMLS_attr3,
36
  YXMLS_attr4,
37
  YXMLS_cd0,
38
  YXMLS_cd1,
39
  YXMLS_cd2,
40
  YXMLS_comment0,
41
  YXMLS_comment1,
42
  YXMLS_comment2,
43
  YXMLS_comment3,
44
  YXMLS_comment4,
45
  YXMLS_dt0,
46
  YXMLS_dt1,
47
  YXMLS_dt2,
48
  YXMLS_dt3,
49
  YXMLS_dt4,
50
  YXMLS_elem0,
51
  YXMLS_elem1,
52
  YXMLS_elem2,
53
  YXMLS_elem3,
54
  YXMLS_enc0,
55
  YXMLS_enc1,
56
  YXMLS_enc2,
57
  YXMLS_enc3,
58
  YXMLS_etag0,
59
  YXMLS_etag1,
60
  YXMLS_etag2,
61
  YXMLS_init,
62
  YXMLS_le0,
63
  YXMLS_le1,
64
  YXMLS_le2,
65
  YXMLS_le3,
66
  YXMLS_lee1,
67
  YXMLS_lee2,
68
  YXMLS_leq0,
69
  YXMLS_misc0,
70
  YXMLS_misc1,
71
  YXMLS_misc2,
72
  YXMLS_misc2a,
73
  YXMLS_misc3,
74
  YXMLS_pi0,
75
  YXMLS_pi1,
76
  YXMLS_pi2,
77
  YXMLS_pi3,
78
  YXMLS_pi4,
79
  YXMLS_std0,
80
  YXMLS_std1,
81
  YXMLS_std2,
82
  YXMLS_std3,
83
  YXMLS_ver0,
84
  YXMLS_ver1,
85
  YXMLS_ver2,
86
  YXMLS_ver3,
87
  YXMLS_xmldecl0,
88
  YXMLS_xmldecl1,
89
  YXMLS_xmldecl2,
90
  YXMLS_xmldecl3,
91
  YXMLS_xmldecl4,
92
  YXMLS_xmldecl5,
93
  YXMLS_xmldecl6,
94
  YXMLS_xmldecl7,
95
  YXMLS_xmldecl8,
96
  YXMLS_xmldecl9
97
} yxml_state_t;
98
99
456M
#define yxml_isChar(c) 1
100
/* 0xd should be part of SP, too, but yxml_parse() already normalizes that into 0xa */
101
7.23M
#define yxml_isSP(c) (c == 0x20 || c == 0x09 || c == 0x0a)
102
109M
#define yxml_isAlpha(c) ((c|32)-'a' < 26)
103
55.3M
#define yxml_isNum(c) (c-'0' < 10)
104
0
#define yxml_isHex(c) (yxml_isNum(c) || (c|32)-'a' < 6)
105
0
#define yxml_isEncName(c) (yxml_isAlpha(c) || yxml_isNum(c) || c == '.' || c == '_' || c == '-')
106
104M
#define yxml_isNameStart(c) (yxml_isAlpha(c) || c == ':' || c == '_' || c >= 128)
107
49.2M
#define yxml_isName(c) (yxml_isNameStart(c) || yxml_isNum(c) || c == '-' || c == '.')
108
/* XXX: The valid characters are dependent on the quote char, hence the access to x->quote */
109
12.6M
#define yxml_isAttValue(c) (yxml_isChar(c) && c != x->quote && c != '<' && c != '&')
110
/* Anything between '&' and ';', the yxml_ref* functions will do further
111
 * validation. Strictly speaking, this is "yxml_isName(c) || c == '#'", but
112
 * this parser doesn't understand entities with '.', ':', etc, anwyay.  */
113
0
#define yxml_isRef(c) (yxml_isNum(c) || yxml_isAlpha(c) || c == '#')
114
115
0
#define INTFROM5CHARS(a, b, c, d, e) ((((uint64_t)(a))<<32) | (((uint64_t)(b))<<24) | (((uint64_t)(c))<<16) | (((uint64_t)(d))<<8) | (uint64_t)(e))
116
117
/* Set the given char value to ch (0<=ch<=255). */
118
443M
static inline void yxml_setchar(char *dest, unsigned ch) {
119
443M
  *(unsigned char *)dest = (unsigned char)ch;
120
443M
}
121
122
/* Similar to yxml_setchar(), but will convert ch (any valid unicode point) to
123
 * UTF-8 and appends a '\0'. dest must have room for at least 5 bytes. */
124
0
static void yxml_setutf8(char *dest, unsigned ch) {
125
0
  if(ch <= 0x007F)
126
0
    yxml_setchar(dest++, ch);
127
0
  else if(ch <= 0x07FF) {
128
0
    yxml_setchar(dest++, 0xC0 | (ch>>6));
129
0
    yxml_setchar(dest++, 0x80 | (ch & 0x3F));
130
0
  } else if(ch <= 0xFFFF) {
131
0
    yxml_setchar(dest++, 0xE0 | (ch>>12));
132
0
    yxml_setchar(dest++, 0x80 | ((ch>>6) & 0x3F));
133
0
    yxml_setchar(dest++, 0x80 | (ch & 0x3F));
134
0
  } else {
135
0
    yxml_setchar(dest++, 0xF0 | (ch>>18));
136
0
    yxml_setchar(dest++, 0x80 | ((ch>>12) & 0x3F));
137
0
    yxml_setchar(dest++, 0x80 | ((ch>>6) & 0x3F));
138
0
    yxml_setchar(dest++, 0x80 | (ch & 0x3F));
139
0
  }
140
0
  *dest = 0;
141
0
}
142
143
431M
static inline yxml_ret_t yxml_datacontent(yxml_t *x, unsigned ch) {
144
431M
  yxml_setchar(x->data, ch);
145
431M
  x->data[1] = 0;
146
431M
  return YXML_CONTENT;
147
431M
}
148
149
0
static inline yxml_ret_t yxml_datapi1(yxml_t *x, unsigned ch) {
150
0
  yxml_setchar(x->data, ch);
151
0
  x->data[1] = 0;
152
0
  return YXML_PICONTENT;
153
0
}
154
155
0
static inline yxml_ret_t yxml_datapi2(yxml_t *x, unsigned ch) {
156
0
  x->data[0] = '?';
157
0
  yxml_setchar(x->data+1, ch);
158
0
  x->data[2] = 0;
159
0
  return YXML_PICONTENT;
160
0
}
161
162
0
static inline yxml_ret_t yxml_datacd1(yxml_t *x, unsigned ch) {
163
0
  x->data[0] = ']';
164
0
  yxml_setchar(x->data+1, ch);
165
0
  x->data[2] = 0;
166
0
  return YXML_CONTENT;
167
0
}
168
169
0
static inline yxml_ret_t yxml_datacd2(yxml_t *x, unsigned ch) {
170
0
  x->data[0] = ']';
171
0
  x->data[1] = ']';
172
0
  yxml_setchar(x->data+2, ch);
173
0
  x->data[3] = 0;
174
0
  return YXML_CONTENT;
175
0
}
176
177
12.2M
static inline yxml_ret_t yxml_dataattr(yxml_t *x, unsigned ch) {
178
  /* Normalize attribute values according to the XML spec section 3.3.3. */
179
12.2M
  yxml_setchar(x->data, ch == 0x9 || ch == 0xa ? 0x20 : ch);
180
12.2M
  x->data[1] = 0;
181
12.2M
  return YXML_ATTRVAL;
182
12.2M
}
183
184
3.25M
static yxml_ret_t yxml_pushstack(yxml_t *x, char **res, unsigned ch) {
185
3.25M
  if(x->stacklen+2 >= x->stacksize)
186
0
    return YXML_ESTACK;
187
3.25M
  x->stacklen++;
188
3.25M
  *res = (char *)x->stack+x->stacklen;
189
3.25M
  x->stack[x->stacklen] = (unsigned char)ch;
190
3.25M
  x->stacklen++;
191
3.25M
  x->stack[x->stacklen] = 0;
192
3.25M
  return YXML_OK;
193
3.25M
}
194
195
25.2M
static yxml_ret_t yxml_pushstackc(yxml_t *x, unsigned ch) {
196
25.2M
  if(x->stacklen+1 >= x->stacksize)
197
0
    return YXML_ESTACK;
198
25.2M
  x->stack[x->stacklen] = (unsigned char)ch;
199
25.2M
  x->stacklen++;
200
25.2M
  x->stack[x->stacklen] = 0;
201
25.2M
  return YXML_OK;
202
25.2M
}
203
204
3.25M
static void yxml_popstack(yxml_t *x) {
205
3.25M
  do
206
31.8M
    x->stacklen--;
207
31.8M
  while(x->stack[x->stacklen]);
208
3.25M
}
209
210
2.84M
static inline yxml_ret_t yxml_elemstart  (yxml_t *x, unsigned ch) { return yxml_pushstack(x, &x->elem, ch); }
211
23.0M
static inline yxml_ret_t yxml_elemname   (yxml_t *x, unsigned ch) { return yxml_pushstackc(x, ch); }
212
2.84M
static inline yxml_ret_t yxml_elemnameend(yxml_t *x, unsigned ch) { return YXML_ELEMSTART; }
213
214
/* Also used in yxml_elemcloseend(), since this function just removes the last
215
 * element from the stack and returns ELEMEND. */
216
2.84M
static yxml_ret_t yxml_selfclose(yxml_t *x, unsigned ch) {
217
2.84M
  yxml_popstack(x);
218
2.84M
  if(x->stacklen) {
219
2.57M
    x->elem = (char *)x->stack+x->stacklen-1;
220
25.0M
    while(*(x->elem-1))
221
22.4M
      x->elem--;
222
2.57M
    return YXML_ELEMEND;
223
2.57M
  }
224
264k
  x->elem = (char *)x->stack;
225
264k
  x->state = YXMLS_misc3;
226
264k
  return YXML_ELEMEND;
227
2.84M
}
228
229
20.6M
static inline yxml_ret_t yxml_elemclose(yxml_t *x, unsigned ch) {
230
20.6M
  if(*((unsigned char *)x->elem) != ch)
231
0
    return YXML_ECLOSE;
232
20.6M
  x->elem++;
233
20.6M
  return YXML_OK;
234
20.6M
}
235
236
2.45M
static inline yxml_ret_t yxml_elemcloseend(yxml_t *x, unsigned ch) {
237
2.45M
  if(*x->elem)
238
0
    return YXML_ECLOSE;
239
2.45M
  return yxml_selfclose(x, ch);
240
2.45M
}
241
242
417k
static inline yxml_ret_t yxml_attrstart  (yxml_t *x, unsigned ch) { return yxml_pushstack(x, &x->attr, ch); }
243
2.25M
static inline yxml_ret_t yxml_attrname   (yxml_t *x, unsigned ch) { return yxml_pushstackc(x, ch); }
244
417k
static inline yxml_ret_t yxml_attrnameend(yxml_t *x, unsigned ch) { return YXML_ATTRSTART; }
245
417k
static inline yxml_ret_t yxml_attrvalend (yxml_t *x, unsigned ch) { yxml_popstack(x); return YXML_ATTREND; }
246
247
0
static inline yxml_ret_t yxml_pistart  (yxml_t *x, unsigned ch) { return yxml_pushstack(x, &x->pi, ch); }
248
0
static inline yxml_ret_t yxml_piname   (yxml_t *x, unsigned ch) { return yxml_pushstackc(x, ch); }
249
0
static inline yxml_ret_t yxml_piabort  (yxml_t *x, unsigned ch) { yxml_popstack(x); return YXML_OK; }
250
0
static inline yxml_ret_t yxml_pinameend(yxml_t *x, unsigned ch) {
251
0
  return (x->pi[0]|32) == 'x' && (x->pi[1]|32) == 'm' && (x->pi[2]|32) == 'l' && !x->pi[3] ? YXML_ESYN : YXML_PISTART;
252
0
}
253
0
static inline yxml_ret_t yxml_pivalend (yxml_t *x, unsigned ch) { yxml_popstack(x); x->pi = (char *)x->stack; return YXML_PIEND; }
254
255
0
static inline yxml_ret_t yxml_refstart(yxml_t *x, unsigned ch) {
256
0
  memset(x->data, 0, sizeof(x->data));
257
0
  x->reflen = 0;
258
0
  return YXML_OK;
259
0
}
260
261
0
static yxml_ret_t yxml_ref(yxml_t *x, unsigned ch) {
262
0
  if(x->reflen >= sizeof(x->data)-1)
263
0
    return YXML_EREF;
264
0
  yxml_setchar(x->data+x->reflen, ch);
265
0
  x->reflen++;
266
0
  return YXML_OK;
267
0
}
268
269
0
static yxml_ret_t yxml_refend(yxml_t *x, yxml_ret_t ret) {
270
0
  unsigned char *r = (unsigned char *)x->data;
271
0
  unsigned ch = 0;
272
0
  if(*r == '#') {
273
0
    if(r[1] == 'x')
274
0
      for(r += 2; yxml_isHex((unsigned)*r); r++)
275
0
        ch = (ch<<4) + (*r <= '9' ? *r-'0' : (*r|32)-'a' + 10);
276
0
    else
277
0
      for(r++; yxml_isNum((unsigned)*r); r++)
278
0
        ch = (ch*10) + (*r-'0');
279
0
    if(*r)
280
0
      ch = 0;
281
0
  } else {
282
0
    uint64_t i = INTFROM5CHARS(r[0], r[1], r[2], r[3], r[4]);
283
0
    ch =
284
0
      i == INTFROM5CHARS('l','t', 0,  0, 0) ? '<' :
285
0
      i == INTFROM5CHARS('g','t', 0,  0, 0) ? '>' :
286
0
      i == INTFROM5CHARS('a','m','p', 0, 0) ? '&' :
287
0
      i == INTFROM5CHARS('a','p','o','s',0) ? '\'':
288
0
      i == INTFROM5CHARS('q','u','o','t',0) ? '"' : 0;
289
0
  }
290
291
  /* Codepoints not allowed in the XML 1.1 definition of a Char */
292
0
  if(!ch || ch > 0x10FFFF || ch == 0xFFFE || ch == 0xFFFF || (ch-0xDFFF) < 0x7FF)
293
0
    return YXML_EREF;
294
0
  yxml_setutf8(x->data, ch);
295
0
  return ret;
296
0
}
297
298
0
static inline yxml_ret_t yxml_refcontent(yxml_t *x, unsigned ch) { return yxml_refend(x, YXML_CONTENT); }
299
0
static inline yxml_ret_t yxml_refattrval(yxml_t *x, unsigned ch) { return yxml_refend(x, YXML_ATTRVAL); }
300
301
264k
void yxml_init(yxml_t *x, void *stack, size_t stacksize) {
302
264k
  memset(x, 0, sizeof(*x));
303
264k
  x->line = 1;
304
264k
  x->stack = (unsigned char*)stack;
305
264k
  x->stacksize = stacksize;
306
264k
  *x->stack = 0;
307
264k
  x->elem = x->pi = x->attr = (char *)x->stack;
308
264k
  x->state = YXMLS_init;
309
264k
}
310
311
507M
yxml_ret_t yxml_parse(yxml_t *x, int _ch) {
312
  /* Ensure that characters are in the range of 0..255 rather than -126..125.
313
   * All character comparisons are done with positive integers. */
314
507M
  unsigned ch = (unsigned)(_ch+256) & 0xff;
315
507M
  if(!ch)
316
0
    return YXML_ESYN;
317
507M
  x->total++;
318
319
  /* End-of-Line normalization, "\rX", "\r\n" and "\n" are recognized and
320
   * normalized to a single '\n' as per XML 1.0 section 2.11. XML 1.1 adds
321
   * some non-ASCII character sequences to this list, but we can only handle
322
   * ASCII here without making assumptions about the input encoding. */
323
507M
  if(x->ignore == ch) {
324
0
    x->ignore = 0;
325
0
    return YXML_OK;
326
0
  }
327
507M
  x->ignore = (ch == 0xd) * 0xa;
328
507M
  if(ch == 0xa || ch == 0xd) {
329
0
    ch = 0xa;
330
0
    x->line++;
331
0
    x->byte = 0;
332
0
  }
333
507M
  x->byte++;
334
335
507M
  switch((yxml_state_t)x->state) {
336
0
  case YXMLS_string:
337
0
    if(ch == *x->string) {
338
0
      x->string++;
339
0
      if(!*x->string)
340
0
        x->state = x->nextstate;
341
0
      return YXML_OK;
342
0
    }
343
0
    break;
344
2.67M
  case YXMLS_attr0:
345
2.67M
    if(yxml_isName(ch))
346
2.25M
      return yxml_attrname(x, ch);
347
417k
    if(yxml_isSP(ch)) {
348
0
      x->state = YXMLS_attr1;
349
0
      return yxml_attrnameend(x, ch);
350
0
    }
351
417k
    if(ch == (unsigned char)'=') {
352
417k
      x->state = YXMLS_attr2;
353
417k
      return yxml_attrnameend(x, ch);
354
417k
    }
355
0
    break;
356
0
  case YXMLS_attr1:
357
0
    if(yxml_isSP(ch))
358
0
      return YXML_OK;
359
0
    if(ch == (unsigned char)'=') {
360
0
      x->state = YXMLS_attr2;
361
0
      return YXML_OK;
362
0
    }
363
0
    break;
364
417k
  case YXMLS_attr2:
365
417k
    if(yxml_isSP(ch))
366
0
      return YXML_OK;
367
417k
    if(ch == (unsigned char)'\'' || ch == (unsigned char)'"') {
368
417k
      x->state = YXMLS_attr3;
369
417k
      x->quote = ch;
370
417k
      return YXML_OK;
371
417k
    }
372
0
    break;
373
12.6M
  case YXMLS_attr3:
374
12.6M
    if(yxml_isAttValue(ch))
375
12.2M
      return yxml_dataattr(x, ch);
376
417k
    if(ch == (unsigned char)'&') {
377
0
      x->state = YXMLS_attr4;
378
0
      return yxml_refstart(x, ch);
379
0
    }
380
417k
    if(x->quote == ch) {
381
417k
      x->state = YXMLS_elem2;
382
417k
      return yxml_attrvalend(x, ch);
383
417k
    }
384
0
    break;
385
0
  case YXMLS_attr4:
386
0
    if(yxml_isRef(ch))
387
0
      return yxml_ref(x, ch);
388
0
    if(ch == (unsigned char)'\x3b') {
389
0
      x->state = YXMLS_attr3;
390
0
      return yxml_refattrval(x, ch);
391
0
    }
392
0
    break;
393
0
  case YXMLS_cd0:
394
0
    if(ch == (unsigned char)']') {
395
0
      x->state = YXMLS_cd1;
396
0
      return YXML_OK;
397
0
    }
398
0
    if(yxml_isChar(ch))
399
0
      return yxml_datacontent(x, ch);
400
0
    break;
401
0
  case YXMLS_cd1:
402
0
    if(ch == (unsigned char)']') {
403
0
      x->state = YXMLS_cd2;
404
0
      return YXML_OK;
405
0
    }
406
0
    if(yxml_isChar(ch)) {
407
0
      x->state = YXMLS_cd0;
408
0
      return yxml_datacd1(x, ch);
409
0
    }
410
0
    break;
411
0
  case YXMLS_cd2:
412
0
    if(ch == (unsigned char)']')
413
0
      return yxml_datacontent(x, ch);
414
0
    if(ch == (unsigned char)'>') {
415
0
      x->state = YXMLS_misc2;
416
0
      return YXML_OK;
417
0
    }
418
0
    if(yxml_isChar(ch)) {
419
0
      x->state = YXMLS_cd0;
420
0
      return yxml_datacd2(x, ch);
421
0
    }
422
0
    break;
423
0
  case YXMLS_comment0:
424
0
    if(ch == (unsigned char)'-') {
425
0
      x->state = YXMLS_comment1;
426
0
      return YXML_OK;
427
0
    }
428
0
    break;
429
0
  case YXMLS_comment1:
430
0
    if(ch == (unsigned char)'-') {
431
0
      x->state = YXMLS_comment2;
432
0
      return YXML_OK;
433
0
    }
434
0
    break;
435
0
  case YXMLS_comment2:
436
0
    if(ch == (unsigned char)'-') {
437
0
      x->state = YXMLS_comment3;
438
0
      return YXML_OK;
439
0
    }
440
0
    if(yxml_isChar(ch))
441
0
      return YXML_OK;
442
0
    break;
443
0
  case YXMLS_comment3:
444
0
    if(ch == (unsigned char)'-') {
445
0
      x->state = YXMLS_comment4;
446
0
      return YXML_OK;
447
0
    }
448
0
    if(yxml_isChar(ch)) {
449
0
      x->state = YXMLS_comment2;
450
0
      return YXML_OK;
451
0
    }
452
0
    break;
453
0
  case YXMLS_comment4:
454
0
    if(ch == (unsigned char)'>') {
455
0
      x->state = x->nextstate;
456
0
      return YXML_OK;
457
0
    }
458
0
    break;
459
0
  case YXMLS_dt0:
460
0
    if(ch == (unsigned char)'>') {
461
0
      x->state = YXMLS_misc1;
462
0
      return YXML_OK;
463
0
    }
464
0
    if(ch == (unsigned char)'\'' || ch == (unsigned char)'"') {
465
0
      x->state = YXMLS_dt1;
466
0
      x->quote = ch;
467
0
      x->nextstate = YXMLS_dt0;
468
0
      return YXML_OK;
469
0
    }
470
0
    if(ch == (unsigned char)'<') {
471
0
      x->state = YXMLS_dt2;
472
0
      return YXML_OK;
473
0
    }
474
0
    if(yxml_isChar(ch))
475
0
      return YXML_OK;
476
0
    break;
477
0
  case YXMLS_dt1:
478
0
    if(x->quote == ch) {
479
0
      x->state = x->nextstate;
480
0
      return YXML_OK;
481
0
    }
482
0
    if(yxml_isChar(ch))
483
0
      return YXML_OK;
484
0
    break;
485
0
  case YXMLS_dt2:
486
0
    if(ch == (unsigned char)'?') {
487
0
      x->state = YXMLS_pi0;
488
0
      x->nextstate = YXMLS_dt0;
489
0
      return YXML_OK;
490
0
    }
491
0
    if(ch == (unsigned char)'!') {
492
0
      x->state = YXMLS_dt3;
493
0
      return YXML_OK;
494
0
    }
495
0
    break;
496
0
  case YXMLS_dt3:
497
0
    if(ch == (unsigned char)'-') {
498
0
      x->state = YXMLS_comment1;
499
0
      x->nextstate = YXMLS_dt0;
500
0
      return YXML_OK;
501
0
    }
502
0
    if(yxml_isChar(ch)) {
503
0
      x->state = YXMLS_dt4;
504
0
      return YXML_OK;
505
0
    }
506
0
    break;
507
0
  case YXMLS_dt4:
508
0
    if(ch == (unsigned char)'\'' || ch == (unsigned char)'"') {
509
0
      x->state = YXMLS_dt1;
510
0
      x->quote = ch;
511
0
      x->nextstate = YXMLS_dt4;
512
0
      return YXML_OK;
513
0
    }
514
0
    if(ch == (unsigned char)'>') {
515
0
      x->state = YXMLS_dt0;
516
0
      return YXML_OK;
517
0
    }
518
0
    if(yxml_isChar(ch))
519
0
      return YXML_OK;
520
0
    break;
521
25.8M
  case YXMLS_elem0:
522
25.8M
    if(yxml_isName(ch))
523
23.0M
      return yxml_elemname(x, ch);
524
2.84M
    if(yxml_isSP(ch)) {
525
271k
      x->state = YXMLS_elem1;
526
271k
      return yxml_elemnameend(x, ch);
527
271k
    }
528
2.57M
    if(ch == (unsigned char)'/') {
529
239k
      x->state = YXMLS_elem3;
530
239k
      return yxml_elemnameend(x, ch);
531
239k
    }
532
2.33M
    if(ch == (unsigned char)'>') {
533
2.33M
      x->state = YXMLS_misc2;
534
2.33M
      return yxml_elemnameend(x, ch);
535
2.33M
    }
536
0
    break;
537
417k
  case YXMLS_elem1:
538
417k
    if(yxml_isSP(ch))
539
0
      return YXML_OK;
540
417k
    if(ch == (unsigned char)'/') {
541
0
      x->state = YXMLS_elem3;
542
0
      return YXML_OK;
543
0
    }
544
417k
    if(ch == (unsigned char)'>') {
545
0
      x->state = YXMLS_misc2;
546
0
      return YXML_OK;
547
0
    }
548
417k
    if(yxml_isNameStart(ch)) {
549
417k
      x->state = YXMLS_attr0;
550
417k
      return yxml_attrstart(x, ch);
551
417k
    }
552
0
    break;
553
417k
  case YXMLS_elem2:
554
417k
    if(yxml_isSP(ch)) {
555
146k
      x->state = YXMLS_elem1;
556
146k
      return YXML_OK;
557
146k
    }
558
271k
    if(ch == (unsigned char)'/') {
559
146k
      x->state = YXMLS_elem3;
560
146k
      return YXML_OK;
561
146k
    }
562
125k
    if(ch == (unsigned char)'>') {
563
125k
      x->state = YXMLS_misc2;
564
125k
      return YXML_OK;
565
125k
    }
566
0
    break;
567
385k
  case YXMLS_elem3:
568
385k
    if(ch == (unsigned char)'>') {
569
385k
      x->state = YXMLS_misc2;
570
385k
      return yxml_selfclose(x, ch);
571
385k
    }
572
0
    break;
573
0
  case YXMLS_enc0:
574
0
    if(yxml_isSP(ch))
575
0
      return YXML_OK;
576
0
    if(ch == (unsigned char)'=') {
577
0
      x->state = YXMLS_enc1;
578
0
      return YXML_OK;
579
0
    }
580
0
    break;
581
0
  case YXMLS_enc1:
582
0
    if(yxml_isSP(ch))
583
0
      return YXML_OK;
584
0
    if(ch == (unsigned char)'\'' || ch == (unsigned char)'"') {
585
0
      x->state = YXMLS_enc2;
586
0
      x->quote = ch;
587
0
      return YXML_OK;
588
0
    }
589
0
    break;
590
0
  case YXMLS_enc2:
591
0
    if(yxml_isAlpha(ch)) {
592
0
      x->state = YXMLS_enc3;
593
0
      return YXML_OK;
594
0
    }
595
0
    break;
596
0
  case YXMLS_enc3:
597
0
    if(yxml_isEncName(ch))
598
0
      return YXML_OK;
599
0
    if(x->quote == ch) {
600
0
      x->state = YXMLS_xmldecl6;
601
0
      return YXML_OK;
602
0
    }
603
0
    break;
604
2.45M
  case YXMLS_etag0:
605
2.45M
    if(yxml_isNameStart(ch)) {
606
2.45M
      x->state = YXMLS_etag1;
607
2.45M
      return yxml_elemclose(x, ch);
608
2.45M
    }
609
0
    break;
610
20.6M
  case YXMLS_etag1:
611
20.6M
    if(yxml_isName(ch))
612
18.2M
      return yxml_elemclose(x, ch);
613
2.45M
    if(yxml_isSP(ch)) {
614
0
      x->state = YXMLS_etag2;
615
0
      return yxml_elemcloseend(x, ch);
616
0
    }
617
2.45M
    if(ch == (unsigned char)'>') {
618
2.45M
      x->state = YXMLS_misc2;
619
2.45M
      return yxml_elemcloseend(x, ch);
620
2.45M
    }
621
0
    break;
622
0
  case YXMLS_etag2:
623
0
    if(yxml_isSP(ch))
624
0
      return YXML_OK;
625
0
    if(ch == (unsigned char)'>') {
626
0
      x->state = YXMLS_misc2;
627
0
      return YXML_OK;
628
0
    }
629
0
    break;
630
264k
  case YXMLS_init:
631
264k
    if(ch == (unsigned char)'\xef') {
632
0
      x->state = YXMLS_string;
633
0
      x->nextstate = YXMLS_misc0;
634
0
      x->string = (unsigned char *)"\xbb\xbf";
635
0
      return YXML_OK;
636
0
    }
637
264k
    if(yxml_isSP(ch)) {
638
0
      x->state = YXMLS_misc0;
639
0
      return YXML_OK;
640
0
    }
641
264k
    if(ch == (unsigned char)'<') {
642
264k
      x->state = YXMLS_le0;
643
264k
      return YXML_OK;
644
264k
    }
645
0
    break;
646
264k
  case YXMLS_le0:
647
264k
    if(ch == (unsigned char)'!') {
648
0
      x->state = YXMLS_lee1;
649
0
      return YXML_OK;
650
0
    }
651
264k
    if(ch == (unsigned char)'?') {
652
0
      x->state = YXMLS_leq0;
653
0
      return YXML_OK;
654
0
    }
655
264k
    if(yxml_isNameStart(ch)) {
656
264k
      x->state = YXMLS_elem0;
657
264k
      return yxml_elemstart(x, ch);
658
264k
    }
659
0
    break;
660
0
  case YXMLS_le1:
661
0
    if(ch == (unsigned char)'!') {
662
0
      x->state = YXMLS_lee1;
663
0
      return YXML_OK;
664
0
    }
665
0
    if(ch == (unsigned char)'?') {
666
0
      x->state = YXMLS_pi0;
667
0
      x->nextstate = YXMLS_misc1;
668
0
      return YXML_OK;
669
0
    }
670
0
    if(yxml_isNameStart(ch)) {
671
0
      x->state = YXMLS_elem0;
672
0
      return yxml_elemstart(x, ch);
673
0
    }
674
0
    break;
675
5.03M
  case YXMLS_le2:
676
5.03M
    if(ch == (unsigned char)'!') {
677
0
      x->state = YXMLS_lee2;
678
0
      return YXML_OK;
679
0
    }
680
5.03M
    if(ch == (unsigned char)'?') {
681
0
      x->state = YXMLS_pi0;
682
0
      x->nextstate = YXMLS_misc2;
683
0
      return YXML_OK;
684
0
    }
685
5.03M
    if(ch == (unsigned char)'/') {
686
2.45M
      x->state = YXMLS_etag0;
687
2.45M
      return YXML_OK;
688
2.45M
    }
689
2.57M
    if(yxml_isNameStart(ch)) {
690
2.57M
      x->state = YXMLS_elem0;
691
2.57M
      return yxml_elemstart(x, ch);
692
2.57M
    }
693
0
    break;
694
0
  case YXMLS_le3:
695
0
    if(ch == (unsigned char)'!') {
696
0
      x->state = YXMLS_comment0;
697
0
      x->nextstate = YXMLS_misc3;
698
0
      return YXML_OK;
699
0
    }
700
0
    if(ch == (unsigned char)'?') {
701
0
      x->state = YXMLS_pi0;
702
0
      x->nextstate = YXMLS_misc3;
703
0
      return YXML_OK;
704
0
    }
705
0
    break;
706
0
  case YXMLS_lee1:
707
0
    if(ch == (unsigned char)'-') {
708
0
      x->state = YXMLS_comment1;
709
0
      x->nextstate = YXMLS_misc1;
710
0
      return YXML_OK;
711
0
    }
712
0
    if(ch == (unsigned char)'D') {
713
0
      x->state = YXMLS_string;
714
0
      x->nextstate = YXMLS_dt0;
715
0
      x->string = (unsigned char *)"OCTYPE";
716
0
      return YXML_OK;
717
0
    }
718
0
    break;
719
0
  case YXMLS_lee2:
720
0
    if(ch == (unsigned char)'-') {
721
0
      x->state = YXMLS_comment1;
722
0
      x->nextstate = YXMLS_misc2;
723
0
      return YXML_OK;
724
0
    }
725
0
    if(ch == (unsigned char)'[') {
726
0
      x->state = YXMLS_string;
727
0
      x->nextstate = YXMLS_cd0;
728
0
      x->string = (unsigned char *)"CDATA[";
729
0
      return YXML_OK;
730
0
    }
731
0
    break;
732
0
  case YXMLS_leq0:
733
0
    if(ch == (unsigned char)'x') {
734
0
      x->state = YXMLS_xmldecl0;
735
0
      x->nextstate = YXMLS_misc1;
736
0
      return yxml_pistart(x, ch);
737
0
    }
738
0
    if(yxml_isNameStart(ch)) {
739
0
      x->state = YXMLS_pi1;
740
0
      x->nextstate = YXMLS_misc1;
741
0
      return yxml_pistart(x, ch);
742
0
    }
743
0
    break;
744
0
  case YXMLS_misc0:
745
0
    if(yxml_isSP(ch))
746
0
      return YXML_OK;
747
0
    if(ch == (unsigned char)'<') {
748
0
      x->state = YXMLS_le0;
749
0
      return YXML_OK;
750
0
    }
751
0
    break;
752
0
  case YXMLS_misc1:
753
0
    if(yxml_isSP(ch))
754
0
      return YXML_OK;
755
0
    if(ch == (unsigned char)'<') {
756
0
      x->state = YXMLS_le1;
757
0
      return YXML_OK;
758
0
    }
759
0
    break;
760
436M
  case YXMLS_misc2:
761
436M
    if(ch == (unsigned char)'<') {
762
5.03M
      x->state = YXMLS_le2;
763
5.03M
      return YXML_OK;
764
5.03M
    }
765
431M
    if(ch == (unsigned char)'&') {
766
0
      x->state = YXMLS_misc2a;
767
0
      return yxml_refstart(x, ch);
768
0
    }
769
431M
    if(yxml_isChar(ch))
770
431M
      return yxml_datacontent(x, ch);
771
0
    break;
772
0
  case YXMLS_misc2a:
773
0
    if(yxml_isRef(ch))
774
0
      return yxml_ref(x, ch);
775
0
    if(ch == (unsigned char)'\x3b') {
776
0
      x->state = YXMLS_misc2;
777
0
      return yxml_refcontent(x, ch);
778
0
    }
779
0
    break;
780
0
  case YXMLS_misc3:
781
0
    if(yxml_isSP(ch))
782
0
      return YXML_OK;
783
0
    if(ch == (unsigned char)'<') {
784
0
      x->state = YXMLS_le3;
785
0
      return YXML_OK;
786
0
    }
787
0
    break;
788
0
  case YXMLS_pi0:
789
0
    if(yxml_isNameStart(ch)) {
790
0
      x->state = YXMLS_pi1;
791
0
      return yxml_pistart(x, ch);
792
0
    }
793
0
    break;
794
0
  case YXMLS_pi1:
795
0
    if(yxml_isName(ch))
796
0
      return yxml_piname(x, ch);
797
0
    if(ch == (unsigned char)'?') {
798
0
      x->state = YXMLS_pi4;
799
0
      return yxml_pinameend(x, ch);
800
0
    }
801
0
    if(yxml_isSP(ch)) {
802
0
      x->state = YXMLS_pi2;
803
0
      return yxml_pinameend(x, ch);
804
0
    }
805
0
    break;
806
0
  case YXMLS_pi2:
807
0
    if(ch == (unsigned char)'?') {
808
0
      x->state = YXMLS_pi3;
809
0
      return YXML_OK;
810
0
    }
811
0
    if(yxml_isChar(ch))
812
0
      return yxml_datapi1(x, ch);
813
0
    break;
814
0
  case YXMLS_pi3:
815
0
    if(ch == (unsigned char)'>') {
816
0
      x->state = x->nextstate;
817
0
      return yxml_pivalend(x, ch);
818
0
    }
819
0
    if(yxml_isChar(ch)) {
820
0
      x->state = YXMLS_pi2;
821
0
      return yxml_datapi2(x, ch);
822
0
    }
823
0
    break;
824
0
  case YXMLS_pi4:
825
0
    if(ch == (unsigned char)'>') {
826
0
      x->state = x->nextstate;
827
0
      return yxml_pivalend(x, ch);
828
0
    }
829
0
    break;
830
0
  case YXMLS_std0:
831
0
    if(yxml_isSP(ch))
832
0
      return YXML_OK;
833
0
    if(ch == (unsigned char)'=') {
834
0
      x->state = YXMLS_std1;
835
0
      return YXML_OK;
836
0
    }
837
0
    break;
838
0
  case YXMLS_std1:
839
0
    if(yxml_isSP(ch))
840
0
      return YXML_OK;
841
0
    if(ch == (unsigned char)'\'' || ch == (unsigned char)'"') {
842
0
      x->state = YXMLS_std2;
843
0
      x->quote = ch;
844
0
      return YXML_OK;
845
0
    }
846
0
    break;
847
0
  case YXMLS_std2:
848
0
    if(ch == (unsigned char)'y') {
849
0
      x->state = YXMLS_string;
850
0
      x->nextstate = YXMLS_std3;
851
0
      x->string = (unsigned char *)"es";
852
0
      return YXML_OK;
853
0
    }
854
0
    if(ch == (unsigned char)'n') {
855
0
      x->state = YXMLS_string;
856
0
      x->nextstate = YXMLS_std3;
857
0
      x->string = (unsigned char *)"o";
858
0
      return YXML_OK;
859
0
    }
860
0
    break;
861
0
  case YXMLS_std3:
862
0
    if(x->quote == ch) {
863
0
      x->state = YXMLS_xmldecl8;
864
0
      return YXML_OK;
865
0
    }
866
0
    break;
867
0
  case YXMLS_ver0:
868
0
    if(yxml_isSP(ch))
869
0
      return YXML_OK;
870
0
    if(ch == (unsigned char)'=') {
871
0
      x->state = YXMLS_ver1;
872
0
      return YXML_OK;
873
0
    }
874
0
    break;
875
0
  case YXMLS_ver1:
876
0
    if(yxml_isSP(ch))
877
0
      return YXML_OK;
878
0
    if(ch == (unsigned char)'\'' || ch == (unsigned char)'"') {
879
0
      x->state = YXMLS_string;
880
0
      x->quote = ch;
881
0
      x->nextstate = YXMLS_ver2;
882
0
      x->string = (unsigned char *)"1.";
883
0
      return YXML_OK;
884
0
    }
885
0
    break;
886
0
  case YXMLS_ver2:
887
0
    if(yxml_isNum(ch)) {
888
0
      x->state = YXMLS_ver3;
889
0
      return YXML_OK;
890
0
    }
891
0
    break;
892
0
  case YXMLS_ver3:
893
0
    if(yxml_isNum(ch))
894
0
      return YXML_OK;
895
0
    if(x->quote == ch) {
896
0
      x->state = YXMLS_xmldecl4;
897
0
      return YXML_OK;
898
0
    }
899
0
    break;
900
0
  case YXMLS_xmldecl0:
901
0
    if(ch == (unsigned char)'m') {
902
0
      x->state = YXMLS_xmldecl1;
903
0
      return yxml_piname(x, ch);
904
0
    }
905
0
    if(yxml_isName(ch)) {
906
0
      x->state = YXMLS_pi1;
907
0
      return yxml_piname(x, ch);
908
0
    }
909
0
    if(ch == (unsigned char)'?') {
910
0
      x->state = YXMLS_pi4;
911
0
      return yxml_pinameend(x, ch);
912
0
    }
913
0
    if(yxml_isSP(ch)) {
914
0
      x->state = YXMLS_pi2;
915
0
      return yxml_pinameend(x, ch);
916
0
    }
917
0
    break;
918
0
  case YXMLS_xmldecl1:
919
0
    if(ch == (unsigned char)'l') {
920
0
      x->state = YXMLS_xmldecl2;
921
0
      return yxml_piname(x, ch);
922
0
    }
923
0
    if(yxml_isName(ch)) {
924
0
      x->state = YXMLS_pi1;
925
0
      return yxml_piname(x, ch);
926
0
    }
927
0
    if(ch == (unsigned char)'?') {
928
0
      x->state = YXMLS_pi4;
929
0
      return yxml_pinameend(x, ch);
930
0
    }
931
0
    if(yxml_isSP(ch)) {
932
0
      x->state = YXMLS_pi2;
933
0
      return yxml_pinameend(x, ch);
934
0
    }
935
0
    break;
936
0
  case YXMLS_xmldecl2:
937
0
    if(yxml_isSP(ch)) {
938
0
      x->state = YXMLS_xmldecl3;
939
0
      return yxml_piabort(x, ch);
940
0
    }
941
0
    if(yxml_isName(ch)) {
942
0
      x->state = YXMLS_pi1;
943
0
      return yxml_piname(x, ch);
944
0
    }
945
0
    break;
946
0
  case YXMLS_xmldecl3:
947
0
    if(yxml_isSP(ch))
948
0
      return YXML_OK;
949
0
    if(ch == (unsigned char)'v') {
950
0
      x->state = YXMLS_string;
951
0
      x->nextstate = YXMLS_ver0;
952
0
      x->string = (unsigned char *)"ersion";
953
0
      return YXML_OK;
954
0
    }
955
0
    break;
956
0
  case YXMLS_xmldecl4:
957
0
    if(yxml_isSP(ch)) {
958
0
      x->state = YXMLS_xmldecl5;
959
0
      return YXML_OK;
960
0
    }
961
0
    if(ch == (unsigned char)'?') {
962
0
      x->state = YXMLS_xmldecl9;
963
0
      return YXML_OK;
964
0
    }
965
0
    break;
966
0
  case YXMLS_xmldecl5:
967
0
    if(yxml_isSP(ch))
968
0
      return YXML_OK;
969
0
    if(ch == (unsigned char)'?') {
970
0
      x->state = YXMLS_xmldecl9;
971
0
      return YXML_OK;
972
0
    }
973
0
    if(ch == (unsigned char)'e') {
974
0
      x->state = YXMLS_string;
975
0
      x->nextstate = YXMLS_enc0;
976
0
      x->string = (unsigned char *)"ncoding";
977
0
      return YXML_OK;
978
0
    }
979
0
    if(ch == (unsigned char)'s') {
980
0
      x->state = YXMLS_string;
981
0
      x->nextstate = YXMLS_std0;
982
0
      x->string = (unsigned char *)"tandalone";
983
0
      return YXML_OK;
984
0
    }
985
0
    break;
986
0
  case YXMLS_xmldecl6:
987
0
    if(yxml_isSP(ch)) {
988
0
      x->state = YXMLS_xmldecl7;
989
0
      return YXML_OK;
990
0
    }
991
0
    if(ch == (unsigned char)'?') {
992
0
      x->state = YXMLS_xmldecl9;
993
0
      return YXML_OK;
994
0
    }
995
0
    break;
996
0
  case YXMLS_xmldecl7:
997
0
    if(yxml_isSP(ch))
998
0
      return YXML_OK;
999
0
    if(ch == (unsigned char)'?') {
1000
0
      x->state = YXMLS_xmldecl9;
1001
0
      return YXML_OK;
1002
0
    }
1003
0
    if(ch == (unsigned char)'s') {
1004
0
      x->state = YXMLS_string;
1005
0
      x->nextstate = YXMLS_std0;
1006
0
      x->string = (unsigned char *)"tandalone";
1007
0
      return YXML_OK;
1008
0
    }
1009
0
    break;
1010
0
  case YXMLS_xmldecl8:
1011
0
    if(yxml_isSP(ch))
1012
0
      return YXML_OK;
1013
0
    if(ch == (unsigned char)'?') {
1014
0
      x->state = YXMLS_xmldecl9;
1015
0
      return YXML_OK;
1016
0
    }
1017
0
    break;
1018
0
  case YXMLS_xmldecl9:
1019
0
    if(ch == (unsigned char)'>') {
1020
0
      x->state = YXMLS_misc1;
1021
0
      return YXML_OK;
1022
0
    }
1023
0
    break;
1024
507M
  }
1025
0
  return YXML_ESYN;
1026
507M
}
1027
1028
264k
yxml_ret_t yxml_eof(yxml_t *x) {
1029
264k
  if(x->state != YXMLS_misc3)
1030
0
    return YXML_EEOF;
1031
264k
  return YXML_OK;
1032
264k
}
1033