Coverage Report

Created: 2026-02-04 06:13

next uncovered line (L), next uncovered region (R), next uncovered branch (B)
/src/xpdf-4.06/xpdf/Zoox.cc
Line
Count
Source
1
//========================================================================
2
//
3
// Zoox.cc
4
//
5
//========================================================================
6
7
#include <aconf.h>
8
9
#include <stdlib.h>
10
#include <stdio.h>
11
#include <string.h>
12
#include "gmem.h"
13
#include "gmempp.h"
14
#include "GString.h"
15
#include "GList.h"
16
#include "GHash.h"
17
#include "Zoox.h"
18
19
//~ all of this code assumes the encoding is UTF-8 or ASCII or something
20
//~   similar (ISO-8859-*)
21
22
//------------------------------------------------------------------------
23
24
static char nameStartChar[256] = {
25
  0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, // 00
26
  0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, // 10
27
  0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, // 20
28
  0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, // 30
29
  0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, // 40
30
  1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 1, // 50
31
  0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, // 60
32
  1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, // 70
33
  1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, // 80
34
  1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, // 90
35
  1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, // a0
36
  1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, // b0
37
  1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, // c0
38
  1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, // d0
39
  1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, // e0
40
  1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1  // f0
41
};
42
43
static char nameChar[256] = {
44
  0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, // 00
45
  0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, // 10
46
  0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, // 20
47
  1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, // 30
48
  0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, // 40
49
  1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 1, // 50
50
  0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, // 60
51
  1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, // 70
52
  1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, // 80
53
  1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, // 90
54
  1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, // a0
55
  1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, // b0
56
  1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, // c0
57
  1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, // d0
58
  1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, // e0
59
  1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1  // f0
60
};
61
62
//------------------------------------------------------------------------
63
64
2.06M
ZxNode::ZxNode() {
65
2.06M
  next = NULL;
66
2.06M
  parent = NULL;
67
2.06M
  firstChild = lastChild = NULL;
68
2.06M
}
69
70
2.06M
ZxNode::~ZxNode() {
71
2.06M
  ZxNode *child;
72
73
4.12M
  while (firstChild) {
74
2.06M
    child = firstChild;
75
2.06M
    firstChild = firstChild->next;
76
2.06M
    delete child;
77
2.06M
  }
78
2.06M
}
79
80
0
ZxNode *ZxNode::deleteChild(ZxNode *child) {
81
0
  ZxNode *p1, *p2;
82
83
0
  for (p1 = NULL, p2 = firstChild;
84
0
       p2 && p2 != child;
85
0
       p1 = p2, p2 = p2->next) ;
86
0
  if (!p2) {
87
0
    return NULL;
88
0
  }
89
0
  if (p1) {
90
0
    p1->next = child->next;
91
0
  } else {
92
0
    firstChild = child->next;
93
0
  }
94
0
  child->parent = NULL;
95
0
  child->next = NULL;
96
0
  return child;
97
0
}
98
99
0
void ZxNode::appendChild(ZxNode *child) {
100
0
  ZxNode *p1;
101
102
0
  if (child->parent || child->next) {
103
0
    return;
104
0
  }
105
0
  if (firstChild) {
106
0
    for (p1 = firstChild; p1->next; p1 = p1->next) ;
107
0
    p1->next = child;
108
0
  } else {
109
0
    firstChild = child;
110
0
  }
111
0
  child->parent = this;
112
0
}
113
114
0
void ZxNode::insertChildAfter(ZxNode *child, ZxNode *prev) {
115
0
  if (child->parent || child->next || (prev && prev->parent != this)) {
116
0
    return;
117
0
  }
118
0
  if (prev) {
119
0
    child->next = prev->next;
120
0
    prev->next = child;
121
0
  } else {
122
0
    child->next = firstChild;
123
0
    firstChild = child;
124
0
  }
125
0
  child->parent = this;
126
0
}
127
128
0
ZxElement *ZxNode::findFirstElement(const char *type) {
129
0
  ZxNode *child;
130
0
  ZxElement *result;
131
132
0
  if (isElement(type)) {
133
0
    return (ZxElement *)this;
134
0
  }
135
0
  for (child = firstChild; child; child = child->next) {
136
0
    if ((result = child->findFirstElement(type))) {
137
0
      return result;
138
0
    }
139
0
  }
140
0
  return NULL;
141
0
}
142
143
130k
ZxElement *ZxNode::findFirstChildElement(const char *type) {
144
130k
  ZxNode *child;
145
146
460k
  for (child = firstChild; child; child = child->next) {
147
336k
    if (child->isElement(type)) {
148
7.29k
      return (ZxElement *)child;
149
7.29k
    }
150
336k
  }
151
123k
  return NULL;
152
130k
}
153
154
0
GList *ZxNode::findAllElements(const char *type) {
155
0
  GList *results;
156
157
0
  results = new GList();
158
0
  findAllElements(type, results);
159
0
  return results;
160
0
}
161
162
0
void ZxNode::findAllElements(const char *type, GList *results) {
163
0
  ZxNode *child;
164
165
0
  if (isElement(type)) {
166
0
    results->append(this);
167
0
  }
168
0
  for (child = firstChild; child; child = child->next) {
169
0
    child->findAllElements(type, results);
170
0
  }
171
0
}
172
173
0
GList *ZxNode::findAllChildElements(const char *type) {
174
0
  GList *results;
175
0
  ZxNode *child;
176
177
0
  results = new GList();
178
0
  for (child = firstChild; child; child = child->next) {
179
0
    if (child->isElement(type)) {
180
0
      results->append(child);
181
0
    }
182
0
  }
183
0
  return results;
184
0
}
185
186
2.06M
void ZxNode::addChild(ZxNode *child) {
187
2.06M
  if (lastChild) {
188
1.80M
    lastChild->next = child;
189
1.80M
    lastChild = child;
190
1.80M
  } else {
191
256k
    firstChild = lastChild = child;
192
256k
  }
193
2.06M
  child->parent = this;
194
2.06M
  child->next = NULL;
195
2.06M
}
196
197
//------------------------------------------------------------------------
198
199
978
ZxDoc::ZxDoc() {
200
978
  xmlDecl = NULL;
201
978
  docTypeDecl = NULL;
202
978
  root = NULL;
203
978
}
204
205
978
ZxDoc *ZxDoc::loadMem(const char *data, Guint dataLen) {
206
978
  ZxDoc *doc;
207
208
978
  doc = new ZxDoc();
209
978
  if (!doc->parse(data, dataLen)) {
210
314
    delete doc;
211
314
    return NULL;
212
314
  }
213
664
  return doc;
214
978
}
215
216
0
ZxDoc *ZxDoc::loadFile(const char *fileName) {
217
0
  ZxDoc *doc;
218
0
  FILE *f;
219
0
  char *data;
220
0
  Guint dataLen;
221
222
0
  if (!(f = fopen(fileName, "rb"))) {
223
0
    return NULL;
224
0
  }
225
0
  fseek(f, 0, SEEK_END);
226
0
  dataLen = (Guint)ftell(f);
227
0
  if (!dataLen) {
228
0
    fclose(f);
229
0
    return NULL;
230
0
  }
231
0
  fseek(f, 0, SEEK_SET);
232
0
  data = (char *)gmalloc(dataLen);
233
0
  if (fread(data, 1, dataLen, f) != dataLen) {
234
0
    fclose(f);
235
0
    gfree(data);
236
0
    return NULL;
237
0
  }
238
0
  fclose(f);
239
0
  doc = loadMem(data, dataLen);
240
0
  gfree(data);
241
0
  return doc;
242
0
}
243
244
ZxDoc::~ZxDoc() {
245
}
246
247
0
static bool writeToFileFunc(void *stream, const char *data, int length) {
248
0
  return (int)fwrite(data, 1, length, (FILE *)stream) == length;
249
0
}
250
251
0
bool ZxDoc::writeFile(const char *fileName) {
252
0
  FILE *f;
253
254
0
  if (!(f = fopen(fileName, "wb"))) {
255
0
    return false;
256
0
  }
257
0
  write(&writeToFileFunc, f);
258
0
  fclose(f);
259
0
  return true;
260
0
}
261
262
1.71k
void ZxDoc::addChild(ZxNode *node) {
263
1.71k
  if (node->isXMLDecl() && !xmlDecl) {
264
400
    xmlDecl = (ZxXMLDecl *)node;
265
1.31k
  } else if (node->isDocTypeDecl() && !docTypeDecl) {
266
70
    docTypeDecl = (ZxDocTypeDecl *)node;
267
1.24k
  } else if (node->isElement() && !root) {
268
664
    root = (ZxElement *)node;
269
664
  }
270
1.71k
  ZxNode::addChild(node);
271
1.71k
}
272
273
978
bool ZxDoc::parse(const char *data, Guint dataLen) {
274
978
  parsePtr = data;
275
978
  parseEnd = data + dataLen;
276
  
277
978
  parseSpace();
278
978
  parseBOM();
279
978
  parseSpace();
280
978
  parseXMLDecl(this);
281
978
  parseMisc(this);
282
978
  parseDocTypeDecl(this);
283
978
  parseMisc(this);
284
978
  if (match("<")) {
285
664
    parseElement(this);
286
664
  }
287
978
  parseMisc(this);
288
978
  return root != NULL;
289
978
}
290
291
978
void ZxDoc::parseXMLDecl(ZxNode *par) {
292
978
  GString *version, *encoding, *s;
293
978
  bool standalone;
294
295
978
  if (!match("<?xml")) {
296
578
    return;
297
578
  }
298
400
  parsePtr += 5;
299
400
  parseSpace();
300
301
  // version
302
400
  version = NULL;
303
400
  if (match("version")) {
304
381
    parsePtr += 7;
305
381
    parseSpace();
306
381
    if (match("=")) {
307
364
      ++parsePtr;
308
364
      parseSpace();
309
364
      version = parseQuotedString();
310
364
    }
311
381
  }
312
400
  if (!version) {
313
36
    version = new GString("1.0");
314
36
  }
315
400
  parseSpace();
316
  
317
  // encoding
318
400
  encoding = NULL;
319
400
  if (match("encoding")) {
320
275
    parsePtr += 8;
321
275
    parseSpace();
322
275
    if (match("=")) {
323
254
      ++parsePtr;
324
254
      parseSpace();
325
254
      encoding = parseQuotedString();
326
254
    }
327
275
  }
328
400
  parseSpace();
329
330
  // standalone
331
400
  standalone = false;
332
400
  if (match("standalone")) {
333
55
    parsePtr += 10;
334
55
    parseSpace();
335
55
    if (match("=")) {
336
37
      ++parsePtr;
337
37
      parseSpace();
338
37
      s = parseQuotedString();
339
37
      standalone = !s->cmp("yes");
340
37
      delete s;
341
37
    }
342
55
  }
343
400
  parseSpace();
344
345
400
  if (match("?>")) {
346
215
    parsePtr += 2;
347
215
  }
348
349
400
  par->addChild(new ZxXMLDecl(version, encoding, standalone));
350
400
}
351
352
//~ this just skips everything after the name
353
978
void ZxDoc::parseDocTypeDecl(ZxNode *par) {
354
978
  GString *name;
355
978
  int state;
356
978
  char c, quote;
357
358
978
  if (!match("<!DOCTYPE")) {
359
908
    return;
360
908
  }
361
70
  parsePtr += 9;
362
70
  parseSpace();
363
364
70
  name = parseName();
365
70
  parseSpace();
366
367
70
  state = 0;
368
70
  quote = '\0';
369
223k
  while (parsePtr < parseEnd && state < 4) {
370
223k
    c = *parsePtr++;
371
223k
    switch (state) {
372
28.1k
    case 0: // not in square brackets; not in quotes
373
28.1k
      if (c == '>') {
374
46
  state = 4;
375
28.0k
      } else if (c == '"' || c == '\'') {
376
439
  state = 1;
377
27.6k
      } else if (c == '[') {
378
287
  state = 2;
379
287
      }
380
28.1k
      break;
381
44.6k
    case 1: // not in square brackets; in quotes
382
44.6k
      if (c == quote) {
383
434
  state = 0;
384
434
      }
385
44.6k
      break;
386
67.0k
    case 2: // in square brackets; not in quotes
387
67.0k
      if (c == ']') {
388
276
  state = 0;
389
66.7k
      } else if (c == '"' || c == '\'') {
390
602
  state = 3;
391
602
      }
392
67.0k
      break;
393
83.8k
    case 3: // in square brackets; in quotes
394
83.8k
      if (c == quote) {
395
602
  state = 2;
396
602
      }
397
83.8k
      break;
398
223k
    }
399
223k
  }
400
401
70
  par->addChild(new ZxDocTypeDecl(name));
402
70
}
403
404
// assumes match("<")
405
1.46M
void ZxDoc::parseElement(ZxNode *par) {
406
1.46M
  GString *type;
407
1.46M
  ZxElement *elem;
408
1.46M
  ZxAttr *attr;
409
410
1.46M
  ++parsePtr;
411
1.46M
  type = parseName();
412
1.46M
  elem = new ZxElement(type);
413
1.46M
  parseSpace();
414
1.55M
  while ((attr = parseAttr())) {
415
92.9k
    elem->addAttr(attr);
416
92.9k
    parseSpace();
417
92.9k
  }
418
1.46M
  if (match("/>")) {
419
22.8k
    parsePtr += 2;
420
1.43M
  } else if (match(">")) {
421
255k
    ++parsePtr;
422
255k
    parseContent(elem);
423
255k
  }
424
1.46M
  par->addChild(elem);
425
1.46M
}
426
427
1.55M
ZxAttr *ZxDoc::parseAttr() {
428
1.55M
  GString *name, *value;
429
1.55M
  const char *start;
430
1.55M
  char quote, c;
431
1.55M
  unsigned int x;
432
1.55M
  int n;
433
434
1.55M
  name = parseName();
435
1.55M
  parseSpace();
436
1.55M
  if (!match("=")) {
437
1.44M
    delete name;
438
1.44M
    return NULL;
439
1.44M
  }
440
110k
  ++parsePtr;
441
110k
  parseSpace();
442
110k
  if (!(parsePtr < parseEnd && (*parsePtr == '"' || *parsePtr == '\''))) {
443
17.3k
    delete name;
444
17.3k
    return NULL;
445
17.3k
  }
446
92.9k
  quote = *parsePtr++;
447
92.9k
  value = new GString();
448
234k
  while (parsePtr < parseEnd && *parsePtr != quote) {
449
141k
    if (*parsePtr == '&') {
450
33.3k
      ++parsePtr;
451
33.3k
      if (parsePtr < parseEnd && *parsePtr == '#') {
452
15.9k
  ++parsePtr;
453
15.9k
  if (parsePtr < parseEnd && *parsePtr == 'x') {
454
6.92k
    ++parsePtr;
455
6.92k
    x = 0;
456
12.4k
    while (parsePtr < parseEnd) {
457
12.4k
      c = *parsePtr;
458
12.4k
      if (c >= '0' && c <= '9') {
459
1.41k
        x = (x << 4) + (c - '0');
460
10.9k
      } else if (c >= 'a' && c <= 'f') {
461
2.18k
        x = (x << 4) + (10 + c - 'a');
462
8.81k
      } else if (c >= 'A' && c <= 'F') {
463
1.89k
        x = (x << 4) + (10 + c - 'A');
464
6.92k
      } else {
465
6.92k
        break;
466
6.92k
      }
467
5.48k
      ++parsePtr;
468
5.48k
    }
469
6.92k
    if (parsePtr < parseEnd && *parsePtr == ';') {
470
280
      ++parsePtr;
471
280
    }
472
6.92k
    appendUTF8(value, x);
473
9.04k
  } else {
474
9.04k
    x = 0;
475
9.73k
    while (parsePtr < parseEnd) {
476
9.73k
      c = *parsePtr;
477
9.73k
      if (c >= '0' && c <= '9') {
478
687
        x = x * 10 + (c - '0');
479
9.04k
      } else {
480
9.04k
        break;
481
9.04k
      }
482
687
      ++parsePtr;
483
687
    }
484
9.04k
    if (parsePtr < parseEnd && *parsePtr == ';') {
485
251
      ++parsePtr;
486
251
    }
487
9.04k
    appendUTF8(value, x);
488
9.04k
  }
489
17.4k
      } else {
490
17.4k
  start = parsePtr;
491
17.4k
  for (++parsePtr;
492
1.41M
       parsePtr < parseEnd && *parsePtr != ';' &&
493
1.41M
         *parsePtr != quote && *parsePtr != '&';
494
1.39M
       ++parsePtr) ;
495
17.4k
  n = (int)(parsePtr - start);
496
17.4k
  if (parsePtr < parseEnd && *parsePtr == ';') {
497
260
    ++parsePtr;
498
260
  }
499
17.4k
  if (n == 2 && !strncmp(start, "lt", 2)) {
500
116
    value->append('<');
501
17.3k
  } else if (n == 2 && !strncmp(start, "gt", 2)) {
502
254
    value->append('>');
503
17.0k
  } else if (n == 3 && !strncmp(start, "amp", 3)) {
504
0
    value->append('&');
505
17.0k
  } else if (n == 4 && !strncmp(start, "apos", 4)) {
506
0
    value->append('\'');
507
17.0k
  } else if (n == 4 && !strncmp(start, "quot", 4)) {
508
0
    value->append('"');
509
17.0k
  } else {
510
17.0k
    value->append(start - 1, (int)(parsePtr - start) + 1);
511
17.0k
  }
512
17.4k
      }
513
108k
    } else {
514
108k
      start = parsePtr;
515
108k
      for (++parsePtr;
516
5.26M
     parsePtr < parseEnd && *parsePtr != quote && *parsePtr != '&';
517
5.15M
     ++parsePtr) ;
518
108k
      value->append(start, (int)(parsePtr - start));
519
108k
    }
520
141k
  }
521
92.9k
  if (parsePtr < parseEnd && *parsePtr == quote) {
522
92.8k
    ++parsePtr;
523
92.8k
  }
524
92.9k
  return new ZxAttr(name, value);
525
110k
}
526
527
// this consumes the end tag
528
255k
void ZxDoc::parseContent(ZxElement *par) {
529
255k
  GString *endType;
530
531
255k
  endType = (new GString("</"))->append(par->getType());
532
533
2.31M
  while (parsePtr < parseEnd) {
534
2.10M
    if (match(endType->getCString())) {
535
45.4k
      parsePtr += endType->getLength();
536
45.4k
      parseSpace();
537
45.4k
      if (match(">")) {
538
31.5k
  ++parsePtr;
539
31.5k
      }
540
45.4k
      break;
541
2.06M
    } else if (match("<?")) {
542
8.42k
      parsePI(par);
543
2.05M
    } else if (match("<![CDATA[")) {
544
93
      parseCDSect(par);
545
2.05M
    } else if (match("<!--")) {
546
3.00k
      parseComment(par);
547
2.05M
    } else if (match("<")) {
548
1.46M
      parseElement(par);
549
1.46M
    } else {
550
590k
      parseCharData(par);
551
590k
    }
552
2.10M
  }
553
554
255k
  delete endType;
555
255k
}
556
557
590k
void ZxDoc::parseCharData(ZxElement *par) {
558
590k
  GString *data;
559
590k
  const char *start;
560
590k
  char c;
561
590k
  unsigned int x;
562
590k
  int n;
563
564
590k
  data = new GString();
565
1.48M
  while (parsePtr < parseEnd && *parsePtr != '<') {
566
897k
    if (*parsePtr == '&') {
567
256k
      ++parsePtr;
568
256k
      if (parsePtr < parseEnd && *parsePtr == '#') {
569
76.4k
  ++parsePtr;
570
76.4k
  if (parsePtr < parseEnd && *parsePtr == 'x') {
571
11.2k
    ++parsePtr;
572
11.2k
    x = 0;
573
18.4k
    while (parsePtr < parseEnd) {
574
18.4k
      c = *parsePtr;
575
18.4k
      if (c >= '0' && c <= '9') {
576
1.18k
        x = (x << 4) + (c - '0');
577
17.3k
      } else if (c >= 'a' && c <= 'f') {
578
2.49k
        x = (x << 4) + (10 + c - 'a');
579
14.8k
      } else if (c >= 'A' && c <= 'F') {
580
3.59k
        x = (x << 4) + (10 + c - 'A');
581
11.2k
      } else {
582
11.2k
        break;
583
11.2k
      }
584
7.27k
      ++parsePtr;
585
7.27k
    }
586
11.2k
    if (parsePtr < parseEnd && *parsePtr == ';') {
587
212
      ++parsePtr;
588
212
    }
589
11.2k
    appendUTF8(data, x);
590
65.2k
  } else {
591
65.2k
    x = 0;
592
72.5k
    while (parsePtr < parseEnd) {
593
72.5k
      c = *parsePtr;
594
72.5k
      if (c >= '0' && c <= '9') {
595
7.33k
        x = x * 10 + (c - '0');
596
65.2k
      } else {
597
65.2k
        break;
598
65.2k
      }
599
7.33k
      ++parsePtr;
600
7.33k
    }
601
65.2k
    if (parsePtr < parseEnd && *parsePtr == ';') {
602
349
      ++parsePtr;
603
349
    }
604
65.2k
    appendUTF8(data, x);
605
65.2k
  }
606
180k
      } else {
607
180k
  start = parsePtr;
608
180k
  for (++parsePtr;
609
68.6M
       parsePtr < parseEnd && *parsePtr != ';' &&
610
68.6M
         *parsePtr != '<' && *parsePtr != '&';
611
68.4M
       ++parsePtr) ;
612
180k
  n = (int)(parsePtr - start);
613
180k
  if (parsePtr < parseEnd && *parsePtr == ';') {
614
655
    ++parsePtr;
615
655
  }
616
180k
  if (n == 2 && !strncmp(start, "lt", 2)) {
617
268
    data->append('<');
618
179k
  } else if (n == 2 && !strncmp(start, "gt", 2)) {
619
653
    data->append('>');
620
179k
  } else if (n == 3 && !strncmp(start, "amp", 3)) {
621
339
    data->append('&');
622
178k
  } else if (n == 4 && !strncmp(start, "apos", 4)) {
623
0
    data->append('\'');
624
178k
  } else if (n == 4 && !strncmp(start, "quot", 4)) {
625
0
    data->append('"');
626
178k
  } else {
627
178k
    data->append(start - 1, (int)(parsePtr - start) + 1);
628
178k
  }
629
180k
      }
630
640k
    } else {
631
640k
      start = parsePtr;
632
640k
      for (++parsePtr;
633
18.2M
     parsePtr < parseEnd && *parsePtr != '<' && *parsePtr != '&';
634
17.6M
     ++parsePtr) ;
635
640k
      data->append(start, (int)(parsePtr - start));
636
640k
    }
637
897k
  }
638
590k
  par->addChild(new ZxCharData(data, true));
639
590k
}
640
641
92.4k
void ZxDoc::appendUTF8(GString *s, unsigned int c) {
642
92.4k
  if (c <= 0x7f) {
643
89.1k
    s->append((char)c);
644
89.1k
  } else if (c <= 0x7ff) {
645
939
    s->append((char)(0xc0 + (c >> 6)));
646
939
    s->append((char)(0x80 + (c & 0x3f)));
647
2.41k
  } else if (c <= 0xffff) {
648
1.06k
    s->append((char)(0xe0 + (c >> 12)));
649
1.06k
    s->append((char)(0x80 + ((c >> 6) & 0x3f)));
650
1.06k
    s->append((char)(0x80 + (c & 0x3f)));
651
1.35k
  } else if (c <= 0x1fffff) {
652
672
    s->append((char)(0xf0 + (c >> 18)));
653
672
    s->append((char)(0x80 + ((c >> 12) & 0x3f)));
654
672
    s->append((char)(0x80 + ((c >> 6) & 0x3f)));
655
672
    s->append((char)(0x80 + (c & 0x3f)));
656
678
  } else if (c <= 0x3ffffff) {
657
128
    s->append((char)(0xf8 + (c >> 24)));
658
128
    s->append((char)(0x80 + ((c >> 18) & 0x3f)));
659
128
    s->append((char)(0x80 + ((c >> 12) & 0x3f)));
660
128
    s->append((char)(0x80 + ((c >> 6) & 0x3f)));
661
128
    s->append((char)(0x80 + (c & 0x3f)));
662
550
  } else if (c <= 0x7fffffff) {
663
294
    s->append((char)(0xfc + (c >> 30)));
664
294
    s->append((char)(0x80 + ((c >> 24) & 0x3f)));
665
294
    s->append((char)(0x80 + ((c >> 18) & 0x3f)));
666
294
    s->append((char)(0x80 + ((c >> 12) & 0x3f)));
667
294
    s->append((char)(0x80 + ((c >> 6) & 0x3f)));
668
294
    s->append((char)(0x80 + (c & 0x3f)));
669
294
  }
670
92.4k
}
671
672
// assumes match("<![CDATA[")
673
93
void ZxDoc::parseCDSect(ZxNode *par) {
674
93
  const char *start;
675
676
93
  parsePtr += 9;
677
93
  start = parsePtr;
678
217k
  while (parsePtr < parseEnd - 3) {
679
217k
    if (!strncmp(parsePtr, "]]>", 3)) {
680
83
      par->addChild(new ZxCharData(new GString(start, (int)(parsePtr - start)),
681
83
           false));
682
83
      parsePtr += 3;
683
83
      return;
684
83
    }
685
217k
    ++parsePtr;
686
217k
  }
687
10
  parsePtr = parseEnd;
688
10
  par->addChild(new ZxCharData(new GString(start, (int)(parsePtr - start)),
689
10
             false));
690
10
}
691
692
2.93k
void ZxDoc::parseMisc(ZxNode *par) {
693
14.4k
  while (1) {
694
14.4k
    if (match("<!--")) {
695
116
      parseComment(par);
696
14.3k
    } else if (match("<?")) {
697
477
      parsePI(par);
698
13.8k
    } else if (parsePtr < parseEnd && (*parsePtr == '\x20' ||
699
8.33k
               *parsePtr == '\x09' ||
700
6.83k
               *parsePtr == '\x0d' ||
701
10.9k
               *parsePtr == '\x0a')) {
702
10.9k
      ++parsePtr;
703
10.9k
    } else {
704
2.93k
      break;
705
2.93k
    }
706
14.4k
  }
707
2.93k
}
708
709
// assumes match("<!--")
710
3.12k
void ZxDoc::parseComment(ZxNode *par) {
711
3.12k
  const char *start;
712
713
3.12k
  parsePtr += 4;
714
3.12k
  start = parsePtr;
715
401k
  while (parsePtr <= parseEnd - 3) {
716
401k
    if (!strncmp(parsePtr, "-->", 3)) {
717
3.11k
      par->addChild(new ZxComment(new GString(start, (int)(parsePtr - start))));
718
3.11k
      parsePtr += 3;
719
3.11k
      return;
720
3.11k
    }
721
398k
    ++parsePtr;
722
398k
  }
723
14
  parsePtr = parseEnd;
724
14
}
725
726
// assumes match("<?")
727
8.89k
void ZxDoc::parsePI(ZxNode *par) {
728
8.89k
  GString *target;
729
8.89k
  const char *start;
730
731
8.89k
  parsePtr += 2;
732
8.89k
  target = parseName();
733
8.89k
  parseSpace();
734
8.89k
  start = parsePtr;
735
1.11M
  while (parsePtr <= parseEnd - 2) {
736
1.11M
    if (!strncmp(parsePtr, "?>", 2)) {
737
8.83k
      par->addChild(new ZxPI(target, new GString(start,
738
8.83k
             (int)(parsePtr - start))));
739
8.83k
      parsePtr += 2;
740
8.83k
      return;
741
8.83k
    }
742
1.10M
    ++parsePtr;
743
1.10M
  }
744
60
  parsePtr = parseEnd;
745
60
  par->addChild(new ZxPI(target, new GString(start, (int)(parsePtr - start))));
746
60
}
747
748
//~ this accepts all chars >= 0x80
749
//~ this doesn't check for properly-formed UTF-8
750
3.02M
GString *ZxDoc::parseName() {
751
3.02M
  GString *name;
752
753
3.02M
  name = new GString();
754
3.02M
  if (parsePtr < parseEnd && nameStartChar[*parsePtr & 0xff]) {
755
1.41M
    name->append(*parsePtr++);
756
4.26M
    while (parsePtr < parseEnd && nameChar[*parsePtr & 0xff]) {
757
2.84M
      name->append(*parsePtr++);
758
2.84M
    }
759
1.41M
  }
760
3.02M
  return name;
761
3.02M
}
762
763
655
GString *ZxDoc::parseQuotedString() {
764
655
  GString *s;
765
655
  const char *start;
766
655
  char quote;
767
768
655
  if (parsePtr < parseEnd && (*parsePtr == '"' || *parsePtr == '\'')) {
769
608
    quote = *parsePtr++;
770
608
    start = parsePtr;
771
29.1k
    while (parsePtr < parseEnd && *parsePtr != quote) {
772
28.5k
      ++parsePtr;
773
28.5k
    }
774
608
    s = new GString(start, (int)(parsePtr - start));
775
608
    if (parsePtr < parseEnd && *parsePtr == quote) {
776
606
      ++parsePtr;
777
606
    }
778
608
  } else {
779
47
    s = new GString();
780
47
  }
781
655
  return s;
782
655
}
783
784
978
void ZxDoc::parseBOM() {
785
978
  if (match("\xef\xbb\xbf")) {
786
16
    parsePtr += 3;
787
16
  }
788
978
}
789
790
3.27M
void ZxDoc::parseSpace() {
791
3.81M
  while (parsePtr < parseEnd && (*parsePtr == '\x20' ||
792
3.46M
         *parsePtr == '\x09' ||
793
3.45M
         *parsePtr == '\x0d' ||
794
3.41M
         *parsePtr == '\x0a')) {
795
535k
    ++parsePtr;
796
535k
  }
797
3.27M
}
798
799
14.8M
bool ZxDoc::match(const char *s) {
800
14.8M
  int n;
801
802
14.8M
  n = (int)strlen(s);
803
14.8M
  return parseEnd - parsePtr >= n && !strncmp(parsePtr, s, n);
804
14.8M
}
805
806
0
bool ZxDoc::write(ZxWriteFunc writeFunc, void *stream) {
807
0
  ZxNode *child;
808
809
0
  for (child = getFirstChild(); child; child = child->getNextChild()) {
810
0
    if (!child->write(writeFunc, stream)) {
811
0
      return false;
812
0
    }
813
0
    if (!(*writeFunc)(stream, "\n", 1)) {
814
0
      return false;
815
0
    }
816
0
  }
817
0
  return true;
818
0
}
819
820
//------------------------------------------------------------------------
821
822
400
ZxXMLDecl::ZxXMLDecl(GString *versionA, GString *encodingA, bool standaloneA) {
823
400
  version = versionA;
824
400
  encoding = encodingA;
825
400
  standalone = standaloneA;
826
400
}
827
828
400
ZxXMLDecl::~ZxXMLDecl() {
829
400
  delete version;
830
400
  if (encoding) {
831
254
    delete encoding;
832
254
  }
833
400
}
834
835
0
bool ZxXMLDecl::write(ZxWriteFunc writeFunc, void *stream) {
836
0
  GString *s;
837
0
  bool ok;
838
839
0
  s = new GString("<?xml version=\"");
840
0
  s->append(version);
841
0
  s->append("\"");
842
0
  if (encoding) {
843
0
    s->append(" encoding=\"");
844
0
    s->append(encoding);
845
0
    s->append("\"");
846
0
  }
847
0
  if (standalone) {
848
0
    s->append(" standlone=\"yes\"");
849
0
  }
850
0
  s->append("?>");
851
0
  ok = (*writeFunc)(stream, s->getCString(), s->getLength());
852
0
  delete s;
853
0
  return ok;
854
0
}
855
856
//------------------------------------------------------------------------
857
858
70
ZxDocTypeDecl::ZxDocTypeDecl(GString *nameA) {
859
70
  name = nameA;
860
70
}
861
862
70
ZxDocTypeDecl::~ZxDocTypeDecl() {
863
70
  delete name;
864
70
}
865
866
0
bool ZxDocTypeDecl::write(ZxWriteFunc writeFunc, void *stream) {
867
0
  GString *s;
868
0
  bool ok;
869
870
0
  s = new GString("<!DOCTYPE ");
871
0
  s->append(name);
872
0
  s->append(">");
873
0
  ok = (*writeFunc)(stream, s->getCString(), s->getLength());
874
0
  delete s;
875
0
  return ok;
876
0
}
877
878
//------------------------------------------------------------------------
879
880
3.11k
ZxComment::ZxComment(GString *textA) {
881
3.11k
  text = textA;
882
3.11k
}
883
884
3.11k
ZxComment::~ZxComment() {
885
3.11k
  delete text;
886
3.11k
}
887
888
0
bool ZxComment::write(ZxWriteFunc writeFunc, void *stream) {
889
0
  GString *s;
890
0
  bool ok;
891
892
0
  s = new GString("<!--");
893
0
  s->append(text);
894
0
  s->append("-->");
895
0
  ok = (*writeFunc)(stream, s->getCString(), s->getLength());
896
0
  delete s;
897
0
  return ok;
898
0
}
899
900
//------------------------------------------------------------------------
901
902
8.89k
ZxPI::ZxPI(GString *targetA, GString *textA) {
903
8.89k
  target = targetA;
904
8.89k
  text = textA;
905
8.89k
}
906
907
8.89k
ZxPI::~ZxPI() {
908
8.89k
  delete target;
909
8.89k
  delete text;
910
8.89k
}
911
912
0
bool ZxPI::write(ZxWriteFunc writeFunc, void *stream) {
913
0
  GString *s;
914
0
  bool ok;
915
916
0
  s = new GString("<?");
917
0
  s->append(target);
918
0
  s->append(" ");
919
0
  s->append(text);
920
0
  s->append("?>");
921
0
  ok = (*writeFunc)(stream, s->getCString(), s->getLength());
922
0
  delete s;
923
0
  return ok;
924
0
}
925
926
//------------------------------------------------------------------------
927
928
1.46M
ZxElement::ZxElement(GString *typeA) {
929
1.46M
  type = typeA;
930
1.46M
  attrs = new GHash();
931
1.46M
  firstAttr = lastAttr = NULL;
932
1.46M
}
933
  
934
1.46M
ZxElement::~ZxElement() {
935
1.46M
  delete type;
936
1.46M
  deleteGHash(attrs, ZxAttr);
937
1.46M
}
938
939
1.03M
bool ZxElement::isElement(const char *typeA) {
940
1.03M
  return !type->cmp(typeA);
941
1.03M
}
942
943
214k
ZxAttr *ZxElement::findAttr(const char *attrName) {
944
214k
  return (ZxAttr *)attrs->lookup(attrName);
945
214k
}
946
947
92.9k
void ZxElement::addAttr(ZxAttr *attr) {
948
92.9k
  attrs->add(attr->getName(), attr);
949
92.9k
  if (lastAttr) {
950
25.4k
    lastAttr->next = attr;
951
25.4k
    lastAttr= attr;
952
67.4k
  } else {
953
67.4k
    firstAttr = lastAttr = attr;
954
67.4k
  }
955
92.9k
  attr->parent = this;
956
92.9k
  attr->next = NULL;
957
92.9k
}
958
959
0
bool ZxElement::write(ZxWriteFunc writeFunc, void *stream) {
960
0
  GString *s;
961
0
  ZxAttr *attr;
962
0
  ZxNode *child;
963
0
  bool ok;
964
965
0
  s = new GString("<");
966
0
  s->append(type);
967
0
  for (attr = firstAttr; attr; attr = attr->getNextAttr()) {
968
0
    s->append(" ");
969
0
    s->append(attr->name);
970
0
    s->append("=\"");
971
0
    appendEscapedAttrValue(s, attr->value);
972
0
    s->append("\"");
973
0
  }
974
0
  if ((child = getFirstChild())) {
975
0
    s->append(">");
976
0
  } else {
977
0
    s->append("/>");
978
0
  }
979
0
  ok = (*writeFunc)(stream, s->getCString(), s->getLength());
980
0
  delete s;
981
0
  if (!ok) {
982
0
    return false;
983
0
  }
984
0
  if (child) {
985
0
    for (; child; child = child->getNextChild()) {
986
0
      if (!child->write(writeFunc, stream)) {
987
0
  return false;
988
0
      }
989
0
    }
990
0
    s = new GString();
991
0
    s->append("</");
992
0
    s->append(type);
993
0
    s->append(">");
994
0
    ok = (*writeFunc)(stream, s->getCString(), s->getLength());
995
0
    delete s;
996
0
    if (!ok) {
997
0
      return false;
998
0
    }
999
0
  }
1000
0
  return true;
1001
0
}
1002
1003
0
void ZxElement::appendEscapedAttrValue(GString *out, GString *s) {
1004
0
  char c;
1005
0
  int i;
1006
1007
0
  for (i = 0; i < s->getLength(); ++i) {
1008
0
    c = s->getChar(i);
1009
0
    if (c == '<') {
1010
0
      out->append("&lt;");
1011
0
    } else if (c == '>') {
1012
0
      out->append("&gt;");
1013
0
    } else if (c == '&') {
1014
0
      out->append("&amp;");
1015
0
    } else if (c == '"') {
1016
0
      out->append("&quot;");
1017
0
    } else {
1018
0
      out->append(c);
1019
0
    }
1020
0
  }
1021
0
}
1022
1023
//------------------------------------------------------------------------
1024
1025
92.9k
ZxAttr::ZxAttr(GString *nameA, GString *valueA) {
1026
92.9k
  name = nameA;
1027
92.9k
  value = valueA;
1028
92.9k
  parent = NULL;
1029
92.9k
  next = NULL;
1030
92.9k
}
1031
1032
92.9k
ZxAttr::~ZxAttr() {
1033
92.9k
  delete name;
1034
92.9k
  delete value;
1035
92.9k
}
1036
1037
//------------------------------------------------------------------------
1038
1039
590k
ZxCharData::ZxCharData(GString *dataA, bool parsedA) {
1040
590k
  data = dataA;
1041
590k
  parsed = parsedA;
1042
590k
}
1043
1044
590k
ZxCharData::~ZxCharData() {
1045
590k
  delete data;
1046
590k
}
1047
1048
0
bool ZxCharData::write(ZxWriteFunc writeFunc, void *stream) {
1049
0
  GString *s;
1050
0
  char c;
1051
0
  int i;
1052
0
  bool ok;
1053
1054
0
  s = new GString();
1055
0
  if (parsed) {
1056
0
    for (i = 0; i < data->getLength(); ++i) {
1057
0
      c = data->getChar(i);
1058
0
      if (c == '<') {
1059
0
  s->append("&lt;");
1060
0
      } else if (c == '>') {
1061
0
  s->append("&gt;");
1062
0
      } else if (c == '&') {
1063
0
  s->append("&amp;");
1064
0
      } else {
1065
0
  s->append(c);
1066
0
      }
1067
0
    }
1068
0
  } else {
1069
0
    s->append("<![CDATA[");
1070
0
    s->append(data);
1071
0
    s->append("]]>");
1072
0
  }
1073
0
  ok = (*writeFunc)(stream, s->getCString(), s->getLength());
1074
0
  delete s;
1075
0
  return ok;
1076
0
}