Coverage Report

Created: 2026-05-30 06:30

next uncovered line (L), next uncovered region (R), next uncovered branch (B)
/src/xpdf-4.06/xpdf/Zoox.cc
Line
Count
Source
1
//========================================================================
2
//
3
// Zoox.cc
4
//
5
//========================================================================
6
7
#include <aconf.h>
8
9
#include <stdlib.h>
10
#include <stdio.h>
11
#include <string.h>
12
#include "gmem.h"
13
#include "gmempp.h"
14
#include "GString.h"
15
#include "GList.h"
16
#include "GHash.h"
17
#include "Zoox.h"
18
19
//~ all of this code assumes the encoding is UTF-8 or ASCII or something
20
//~   similar (ISO-8859-*)
21
22
//------------------------------------------------------------------------
23
24
static char nameStartChar[256] = {
25
  0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, // 00
26
  0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, // 10
27
  0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, // 20
28
  0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, // 30
29
  0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, // 40
30
  1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 1, // 50
31
  0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, // 60
32
  1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, // 70
33
  1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, // 80
34
  1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, // 90
35
  1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, // a0
36
  1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, // b0
37
  1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, // c0
38
  1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, // d0
39
  1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, // e0
40
  1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1  // f0
41
};
42
43
static char nameChar[256] = {
44
  0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, // 00
45
  0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, // 10
46
  0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, // 20
47
  1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, // 30
48
  0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, // 40
49
  1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 1, // 50
50
  0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, // 60
51
  1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, // 70
52
  1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, // 80
53
  1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, // 90
54
  1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, // a0
55
  1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, // b0
56
  1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, // c0
57
  1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, // d0
58
  1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, // e0
59
  1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1  // f0
60
};
61
62
//------------------------------------------------------------------------
63
64
3.40M
ZxNode::ZxNode() {
65
3.40M
  next = NULL;
66
3.40M
  parent = NULL;
67
3.40M
  firstChild = lastChild = NULL;
68
3.40M
}
69
70
3.40M
ZxNode::~ZxNode() {
71
3.40M
  ZxNode *child;
72
73
6.79M
  while (firstChild) {
74
3.39M
    child = firstChild;
75
3.39M
    firstChild = firstChild->next;
76
3.39M
    delete child;
77
3.39M
  }
78
3.40M
}
79
80
0
ZxNode *ZxNode::deleteChild(ZxNode *child) {
81
0
  ZxNode *p1, *p2;
82
83
0
  for (p1 = NULL, p2 = firstChild;
84
0
       p2 && p2 != child;
85
0
       p1 = p2, p2 = p2->next) ;
86
0
  if (!p2) {
87
0
    return NULL;
88
0
  }
89
0
  if (p1) {
90
0
    p1->next = child->next;
91
0
  } else {
92
0
    firstChild = child->next;
93
0
  }
94
0
  child->parent = NULL;
95
0
  child->next = NULL;
96
0
  return child;
97
0
}
98
99
0
void ZxNode::appendChild(ZxNode *child) {
100
0
  ZxNode *p1;
101
102
0
  if (child->parent || child->next) {
103
0
    return;
104
0
  }
105
0
  if (firstChild) {
106
0
    for (p1 = firstChild; p1->next; p1 = p1->next) ;
107
0
    p1->next = child;
108
0
  } else {
109
0
    firstChild = child;
110
0
  }
111
0
  child->parent = this;
112
0
}
113
114
0
void ZxNode::insertChildAfter(ZxNode *child, ZxNode *prev) {
115
0
  if (child->parent || child->next || (prev && prev->parent != this)) {
116
0
    return;
117
0
  }
118
0
  if (prev) {
119
0
    child->next = prev->next;
120
0
    prev->next = child;
121
0
  } else {
122
0
    child->next = firstChild;
123
0
    firstChild = child;
124
0
  }
125
0
  child->parent = this;
126
0
}
127
128
0
ZxElement *ZxNode::findFirstElement(const char *type) {
129
0
  ZxNode *child;
130
0
  ZxElement *result;
131
132
0
  if (isElement(type)) {
133
0
    return (ZxElement *)this;
134
0
  }
135
0
  for (child = firstChild; child; child = child->next) {
136
0
    if ((result = child->findFirstElement(type))) {
137
0
      return result;
138
0
    }
139
0
  }
140
0
  return NULL;
141
0
}
142
143
237k
ZxElement *ZxNode::findFirstChildElement(const char *type) {
144
237k
  ZxNode *child;
145
146
823k
  for (child = firstChild; child; child = child->next) {
147
597k
    if (child->isElement(type)) {
148
11.5k
      return (ZxElement *)child;
149
11.5k
    }
150
597k
  }
151
225k
  return NULL;
152
237k
}
153
154
0
GList *ZxNode::findAllElements(const char *type) {
155
0
  GList *results;
156
157
0
  results = new GList();
158
0
  findAllElements(type, results);
159
0
  return results;
160
0
}
161
162
0
void ZxNode::findAllElements(const char *type, GList *results) {
163
0
  ZxNode *child;
164
165
0
  if (isElement(type)) {
166
0
    results->append(this);
167
0
  }
168
0
  for (child = firstChild; child; child = child->next) {
169
0
    child->findAllElements(type, results);
170
0
  }
171
0
}
172
173
0
GList *ZxNode::findAllChildElements(const char *type) {
174
0
  GList *results;
175
0
  ZxNode *child;
176
177
0
  results = new GList();
178
0
  for (child = firstChild; child; child = child->next) {
179
0
    if (child->isElement(type)) {
180
0
      results->append(child);
181
0
    }
182
0
  }
183
0
  return results;
184
0
}
185
186
3.39M
void ZxNode::addChild(ZxNode *child) {
187
3.39M
  if (lastChild) {
188
1.86M
    lastChild->next = child;
189
1.86M
    lastChild = child;
190
1.86M
  } else {
191
1.53M
    firstChild = lastChild = child;
192
1.53M
  }
193
3.39M
  child->parent = this;
194
3.39M
  child->next = NULL;
195
3.39M
}
196
197
//------------------------------------------------------------------------
198
199
9.26k
ZxDoc::ZxDoc() {
200
9.26k
  xmlDecl = NULL;
201
9.26k
  docTypeDecl = NULL;
202
9.26k
  root = NULL;
203
9.26k
}
204
205
5.44k
ZxDoc *ZxDoc::loadMem(const char *data, Guint dataLen) {
206
5.44k
  ZxDoc *doc;
207
208
5.44k
  doc = new ZxDoc();
209
5.44k
  if (!doc->parse(data, dataLen)) {
210
1.75k
    delete doc;
211
1.75k
    return NULL;
212
1.75k
  }
213
3.69k
  return doc;
214
5.44k
}
215
216
0
ZxDoc *ZxDoc::loadFile(const char *fileName) {
217
0
  ZxDoc *doc;
218
0
  FILE *f;
219
0
  char *data;
220
0
  Guint dataLen;
221
222
0
  if (!(f = fopen(fileName, "rb"))) {
223
0
    return NULL;
224
0
  }
225
0
  fseek(f, 0, SEEK_END);
226
0
  dataLen = (Guint)ftell(f);
227
0
  if (!dataLen) {
228
0
    fclose(f);
229
0
    return NULL;
230
0
  }
231
0
  fseek(f, 0, SEEK_SET);
232
0
  data = (char *)gmalloc(dataLen);
233
0
  if (fread(data, 1, dataLen, f) != dataLen) {
234
0
    fclose(f);
235
0
    gfree(data);
236
0
    return NULL;
237
0
  }
238
0
  fclose(f);
239
0
  doc = loadMem(data, dataLen);
240
0
  gfree(data);
241
0
  return doc;
242
0
}
243
244
ZxDoc::~ZxDoc() {
245
}
246
247
0
static bool writeToFileFunc(void *stream, const char *data, int length) {
248
0
  return (int)fwrite(data, 1, length, (FILE *)stream) == length;
249
0
}
250
251
0
bool ZxDoc::writeFile(const char *fileName) {
252
0
  FILE *f;
253
254
0
  if (!(f = fopen(fileName, "wb"))) {
255
0
    return false;
256
0
  }
257
0
  write(&writeToFileFunc, f);
258
0
  fclose(f);
259
0
  return true;
260
0
}
261
262
7.43k
void ZxDoc::addChild(ZxNode *node) {
263
7.43k
  if (node->isXMLDecl() && !xmlDecl) {
264
1.49k
    xmlDecl = (ZxXMLDecl *)node;
265
5.94k
  } else if (node->isDocTypeDecl() && !docTypeDecl) {
266
323
    docTypeDecl = (ZxDocTypeDecl *)node;
267
5.61k
  } else if (node->isElement() && !root) {
268
3.69k
    root = (ZxElement *)node;
269
3.69k
  }
270
7.43k
  ZxNode::addChild(node);
271
7.43k
}
272
273
5.44k
bool ZxDoc::parse(const char *data, Guint dataLen) {
274
5.44k
  parsePtr = data;
275
5.44k
  parseEnd = data + dataLen;
276
  
277
5.44k
  parseSpace();
278
5.44k
  parseBOM();
279
5.44k
  parseSpace();
280
5.44k
  parseXMLDecl(this);
281
5.44k
  parseMisc(this);
282
5.44k
  parseDocTypeDecl(this);
283
5.44k
  parseMisc(this);
284
5.44k
  if (match("<")) {
285
3.69k
    parseElement(this);
286
3.69k
  }
287
5.44k
  parseMisc(this);
288
5.44k
  return root != NULL;
289
5.44k
}
290
291
5.44k
void ZxDoc::parseXMLDecl(ZxNode *par) {
292
5.44k
  GString *version, *encoding, *s;
293
5.44k
  bool standalone;
294
295
5.44k
  if (!match("<?xml")) {
296
3.95k
    return;
297
3.95k
  }
298
1.49k
  parsePtr += 5;
299
1.49k
  parseSpace();
300
301
  // version
302
1.49k
  version = NULL;
303
1.49k
  if (match("version")) {
304
877
    parsePtr += 7;
305
877
    parseSpace();
306
877
    if (match("=")) {
307
794
      ++parsePtr;
308
794
      parseSpace();
309
794
      version = parseQuotedString();
310
794
    }
311
877
  }
312
1.49k
  if (!version) {
313
700
    version = new GString("1.0");
314
700
  }
315
1.49k
  parseSpace();
316
  
317
  // encoding
318
1.49k
  encoding = NULL;
319
1.49k
  if (match("encoding")) {
320
715
    parsePtr += 8;
321
715
    parseSpace();
322
715
    if (match("=")) {
323
626
      ++parsePtr;
324
626
      parseSpace();
325
626
      encoding = parseQuotedString();
326
626
    }
327
715
  }
328
1.49k
  parseSpace();
329
330
  // standalone
331
1.49k
  standalone = false;
332
1.49k
  if (match("standalone")) {
333
256
    parsePtr += 10;
334
256
    parseSpace();
335
256
    if (match("=")) {
336
176
      ++parsePtr;
337
176
      parseSpace();
338
176
      s = parseQuotedString();
339
176
      standalone = !s->cmp("yes");
340
176
      delete s;
341
176
    }
342
256
  }
343
1.49k
  parseSpace();
344
345
1.49k
  if (match("?>")) {
346
469
    parsePtr += 2;
347
469
  }
348
349
1.49k
  par->addChild(new ZxXMLDecl(version, encoding, standalone));
350
1.49k
}
351
352
//~ this just skips everything after the name
353
5.44k
void ZxDoc::parseDocTypeDecl(ZxNode *par) {
354
5.44k
  GString *name;
355
5.44k
  int state;
356
5.44k
  char c, quote;
357
358
5.44k
  if (!match("<!DOCTYPE")) {
359
5.12k
    return;
360
5.12k
  }
361
323
  parsePtr += 9;
362
323
  parseSpace();
363
364
323
  name = parseName();
365
323
  parseSpace();
366
367
323
  state = 0;
368
323
  quote = '\0';
369
860k
  while (parsePtr < parseEnd && state < 4) {
370
859k
    c = *parsePtr++;
371
859k
    switch (state) {
372
81.5k
    case 0: // not in square brackets; not in quotes
373
81.5k
      if (c == '>') {
374
38
  state = 4;
375
81.5k
      } else if (c == '"' || c == '\'') {
376
1.68k
  state = 1;
377
79.8k
      } else if (c == '[') {
378
1.24k
  state = 2;
379
1.24k
      }
380
81.5k
      break;
381
87.2k
    case 1: // not in square brackets; in quotes
382
87.2k
      if (c == quote) {
383
1.64k
  state = 0;
384
1.64k
      }
385
87.2k
      break;
386
564k
    case 2: // in square brackets; not in quotes
387
564k
      if (c == ']') {
388
1.14k
  state = 0;
389
563k
      } else if (c == '"' || c == '\'') {
390
2.43k
  state = 3;
391
2.43k
      }
392
564k
      break;
393
126k
    case 3: // in square brackets; in quotes
394
126k
      if (c == quote) {
395
2.39k
  state = 2;
396
2.39k
      }
397
126k
      break;
398
859k
    }
399
859k
  }
400
401
323
  par->addChild(new ZxDocTypeDecl(name));
402
323
}
403
404
// assumes match("<")
405
2.46M
void ZxDoc::parseElement(ZxNode *par) {
406
2.46M
  GString *type;
407
2.46M
  ZxElement *elem;
408
2.46M
  ZxAttr *attr;
409
410
2.46M
  ++parsePtr;
411
2.46M
  type = parseName();
412
2.46M
  elem = new ZxElement(type);
413
2.46M
  parseSpace();
414
3.54M
  while ((attr = parseAttr())) {
415
1.07M
    elem->addAttr(attr);
416
1.07M
    parseSpace();
417
1.07M
  }
418
2.46M
  if (match("/>")) {
419
78.8k
    parsePtr += 2;
420
2.38M
  } else if (match(">")) {
421
1.53M
    ++parsePtr;
422
1.53M
    parseContent(elem);
423
1.53M
  }
424
2.46M
  par->addChild(elem);
425
2.46M
}
426
427
3.54M
ZxAttr *ZxDoc::parseAttr() {
428
3.54M
  GString *name, *value;
429
3.54M
  const char *start;
430
3.54M
  char quote, c;
431
3.54M
  unsigned int x;
432
3.54M
  int n;
433
434
3.54M
  name = parseName();
435
3.54M
  parseSpace();
436
3.54M
  if (!match("=")) {
437
2.43M
    delete name;
438
2.43M
    return NULL;
439
2.43M
  }
440
1.10M
  ++parsePtr;
441
1.10M
  parseSpace();
442
1.10M
  if (!(parsePtr < parseEnd && (*parsePtr == '"' || *parsePtr == '\''))) {
443
31.0k
    delete name;
444
31.0k
    return NULL;
445
31.0k
  }
446
1.07M
  quote = *parsePtr++;
447
1.07M
  value = new GString();
448
1.55M
  while (parsePtr < parseEnd && *parsePtr != quote) {
449
476k
    if (*parsePtr == '&') {
450
179k
      ++parsePtr;
451
179k
      if (parsePtr < parseEnd && *parsePtr == '#') {
452
49.2k
  ++parsePtr;
453
49.2k
  if (parsePtr < parseEnd && *parsePtr == 'x') {
454
21.6k
    ++parsePtr;
455
21.6k
    x = 0;
456
74.6k
    while (parsePtr < parseEnd) {
457
74.6k
      c = *parsePtr;
458
74.6k
      if (c >= '0' && c <= '9') {
459
8.81k
        x = (x << 4) + (c - '0');
460
65.8k
      } else if (c >= 'a' && c <= 'f') {
461
24.0k
        x = (x << 4) + (10 + c - 'a');
462
41.7k
      } else if (c >= 'A' && c <= 'F') {
463
20.1k
        x = (x << 4) + (10 + c - 'A');
464
21.6k
      } else {
465
21.6k
        break;
466
21.6k
      }
467
53.0k
      ++parsePtr;
468
53.0k
    }
469
21.6k
    if (parsePtr < parseEnd && *parsePtr == ';') {
470
3.11k
      ++parsePtr;
471
3.11k
    }
472
21.6k
    appendUTF8(value, x);
473
27.5k
  } else {
474
27.5k
    x = 0;
475
79.9k
    while (parsePtr < parseEnd) {
476
79.9k
      c = *parsePtr;
477
79.9k
      if (c >= '0' && c <= '9') {
478
52.3k
        x = x * 10 + (c - '0');
479
52.3k
      } else {
480
27.5k
        break;
481
27.5k
      }
482
52.3k
      ++parsePtr;
483
52.3k
    }
484
27.5k
    if (parsePtr < parseEnd && *parsePtr == ';') {
485
1.22k
      ++parsePtr;
486
1.22k
    }
487
27.5k
    appendUTF8(value, x);
488
27.5k
  }
489
130k
      } else {
490
130k
  start = parsePtr;
491
130k
  for (++parsePtr;
492
20.6M
       parsePtr < parseEnd && *parsePtr != ';' &&
493
20.6M
         *parsePtr != quote && *parsePtr != '&';
494
20.5M
       ++parsePtr) ;
495
130k
  n = (int)(parsePtr - start);
496
130k
  if (parsePtr < parseEnd && *parsePtr == ';') {
497
3.11k
    ++parsePtr;
498
3.11k
  }
499
130k
  if (n == 2 && !strncmp(start, "lt", 2)) {
500
1.44k
    value->append('<');
501
128k
  } else if (n == 2 && !strncmp(start, "gt", 2)) {
502
18.7k
    value->append('>');
503
110k
  } else if (n == 3 && !strncmp(start, "amp", 3)) {
504
15.0k
    value->append('&');
505
95.1k
  } else if (n == 4 && !strncmp(start, "apos", 4)) {
506
993
    value->append('\'');
507
94.1k
  } else if (n == 4 && !strncmp(start, "quot", 4)) {
508
3.24k
    value->append('"');
509
90.8k
  } else {
510
90.8k
    value->append(start - 1, (int)(parsePtr - start) + 1);
511
90.8k
  }
512
130k
      }
513
297k
    } else {
514
297k
      start = parsePtr;
515
297k
      for (++parsePtr;
516
20.7M
     parsePtr < parseEnd && *parsePtr != quote && *parsePtr != '&';
517
20.4M
     ++parsePtr) ;
518
297k
      value->append(start, (int)(parsePtr - start));
519
297k
    }
520
476k
  }
521
1.07M
  if (parsePtr < parseEnd && *parsePtr == quote) {
522
1.07M
    ++parsePtr;
523
1.07M
  }
524
1.07M
  return new ZxAttr(name, value);
525
1.10M
}
526
527
// this consumes the end tag
528
1.53M
void ZxDoc::parseContent(ZxElement *par) {
529
1.53M
  GString *endType;
530
531
1.53M
  endType = (new GString("</"))->append(par->getType());
532
533
4.91M
  while (parsePtr < parseEnd) {
534
3.47M
    if (match(endType->getCString())) {
535
84.9k
      parsePtr += endType->getLength();
536
84.9k
      parseSpace();
537
84.9k
      if (match(">")) {
538
57.2k
  ++parsePtr;
539
57.2k
      }
540
84.9k
      break;
541
3.38M
    } else if (match("<?")) {
542
29.2k
      parsePI(par);
543
3.35M
    } else if (match("<![CDATA[")) {
544
3.66k
      parseCDSect(par);
545
3.35M
    } else if (match("<!--")) {
546
2.86k
      parseComment(par);
547
3.35M
    } else if (match("<")) {
548
2.46M
      parseElement(par);
549
2.46M
    } else {
550
889k
      parseCharData(par);
551
889k
    }
552
3.47M
  }
553
554
1.53M
  delete endType;
555
1.53M
}
556
557
889k
void ZxDoc::parseCharData(ZxElement *par) {
558
889k
  GString *data;
559
889k
  const char *start;
560
889k
  char c;
561
889k
  unsigned int x;
562
889k
  int n;
563
564
889k
  data = new GString();
565
2.53M
  while (parsePtr < parseEnd && *parsePtr != '<') {
566
1.64M
    if (*parsePtr == '&') {
567
660k
      ++parsePtr;
568
660k
      if (parsePtr < parseEnd && *parsePtr == '#') {
569
195k
  ++parsePtr;
570
195k
  if (parsePtr < parseEnd && *parsePtr == 'x') {
571
33.3k
    ++parsePtr;
572
33.3k
    x = 0;
573
135k
    while (parsePtr < parseEnd) {
574
134k
      c = *parsePtr;
575
134k
      if (c >= '0' && c <= '9') {
576
47.1k
        x = (x << 4) + (c - '0');
577
87.8k
      } else if (c >= 'a' && c <= 'f') {
578
25.8k
        x = (x << 4) + (10 + c - 'a');
579
61.9k
      } else if (c >= 'A' && c <= 'F') {
580
28.7k
        x = (x << 4) + (10 + c - 'A');
581
33.2k
      } else {
582
33.2k
        break;
583
33.2k
      }
584
101k
      ++parsePtr;
585
101k
    }
586
33.3k
    if (parsePtr < parseEnd && *parsePtr == ';') {
587
6.80k
      ++parsePtr;
588
6.80k
    }
589
33.3k
    appendUTF8(data, x);
590
161k
  } else {
591
161k
    x = 0;
592
402k
    while (parsePtr < parseEnd) {
593
402k
      c = *parsePtr;
594
402k
      if (c >= '0' && c <= '9') {
595
240k
        x = x * 10 + (c - '0');
596
240k
      } else {
597
161k
        break;
598
161k
      }
599
240k
      ++parsePtr;
600
240k
    }
601
161k
    if (parsePtr < parseEnd && *parsePtr == ';') {
602
6.54k
      ++parsePtr;
603
6.54k
    }
604
161k
    appendUTF8(data, x);
605
161k
  }
606
465k
      } else {
607
465k
  start = parsePtr;
608
465k
  for (++parsePtr;
609
22.0M
       parsePtr < parseEnd && *parsePtr != ';' &&
610
22.0M
         *parsePtr != '<' && *parsePtr != '&';
611
21.5M
       ++parsePtr) ;
612
465k
  n = (int)(parsePtr - start);
613
465k
  if (parsePtr < parseEnd && *parsePtr == ';') {
614
6.47k
    ++parsePtr;
615
6.47k
  }
616
465k
  if (n == 2 && !strncmp(start, "lt", 2)) {
617
3.79k
    data->append('<');
618
461k
  } else if (n == 2 && !strncmp(start, "gt", 2)) {
619
91.0k
    data->append('>');
620
370k
  } else if (n == 3 && !strncmp(start, "amp", 3)) {
621
32.2k
    data->append('&');
622
338k
  } else if (n == 4 && !strncmp(start, "apos", 4)) {
623
1.22k
    data->append('\'');
624
337k
  } else if (n == 4 && !strncmp(start, "quot", 4)) {
625
17.2k
    data->append('"');
626
319k
  } else {
627
319k
    data->append(start - 1, (int)(parsePtr - start) + 1);
628
319k
  }
629
465k
      }
630
981k
    } else {
631
981k
      start = parsePtr;
632
981k
      for (++parsePtr;
633
45.8M
     parsePtr < parseEnd && *parsePtr != '<' && *parsePtr != '&';
634
44.8M
     ++parsePtr) ;
635
981k
      data->append(start, (int)(parsePtr - start));
636
981k
    }
637
1.64M
  }
638
889k
  par->addChild(new ZxCharData(data, true));
639
889k
}
640
641
244k
void ZxDoc::appendUTF8(GString *s, unsigned int c) {
642
244k
  if (c <= 0x7f) {
643
179k
    s->append((char)c);
644
179k
  } else if (c <= 0x7ff) {
645
9.08k
    s->append((char)(0xc0 + (c >> 6)));
646
9.08k
    s->append((char)(0x80 + (c & 0x3f)));
647
55.4k
  } else if (c <= 0xffff) {
648
14.7k
    s->append((char)(0xe0 + (c >> 12)));
649
14.7k
    s->append((char)(0x80 + ((c >> 6) & 0x3f)));
650
14.7k
    s->append((char)(0x80 + (c & 0x3f)));
651
40.6k
  } else if (c <= 0x1fffff) {
652
12.1k
    s->append((char)(0xf0 + (c >> 18)));
653
12.1k
    s->append((char)(0x80 + ((c >> 12) & 0x3f)));
654
12.1k
    s->append((char)(0x80 + ((c >> 6) & 0x3f)));
655
12.1k
    s->append((char)(0x80 + (c & 0x3f)));
656
28.5k
  } else if (c <= 0x3ffffff) {
657
4.34k
    s->append((char)(0xf8 + (c >> 24)));
658
4.34k
    s->append((char)(0x80 + ((c >> 18) & 0x3f)));
659
4.34k
    s->append((char)(0x80 + ((c >> 12) & 0x3f)));
660
4.34k
    s->append((char)(0x80 + ((c >> 6) & 0x3f)));
661
4.34k
    s->append((char)(0x80 + (c & 0x3f)));
662
24.2k
  } else if (c <= 0x7fffffff) {
663
18.9k
    s->append((char)(0xfc + (c >> 30)));
664
18.9k
    s->append((char)(0x80 + ((c >> 24) & 0x3f)));
665
18.9k
    s->append((char)(0x80 + ((c >> 18) & 0x3f)));
666
18.9k
    s->append((char)(0x80 + ((c >> 12) & 0x3f)));
667
18.9k
    s->append((char)(0x80 + ((c >> 6) & 0x3f)));
668
18.9k
    s->append((char)(0x80 + (c & 0x3f)));
669
18.9k
  }
670
244k
}
671
672
// assumes match("<![CDATA[")
673
3.66k
void ZxDoc::parseCDSect(ZxNode *par) {
674
3.66k
  const char *start;
675
676
3.66k
  parsePtr += 9;
677
3.66k
  start = parsePtr;
678
371k
  while (parsePtr < parseEnd - 3) {
679
371k
    if (!strncmp(parsePtr, "]]>", 3)) {
680
3.61k
      par->addChild(new ZxCharData(new GString(start, (int)(parsePtr - start)),
681
3.61k
           false));
682
3.61k
      parsePtr += 3;
683
3.61k
      return;
684
3.61k
    }
685
368k
    ++parsePtr;
686
368k
  }
687
52
  parsePtr = parseEnd;
688
52
  par->addChild(new ZxCharData(new GString(start, (int)(parsePtr - start)),
689
52
             false));
690
52
}
691
692
16.3k
void ZxDoc::parseMisc(ZxNode *par) {
693
26.4k
  while (1) {
694
26.4k
    if (match("<!--")) {
695
644
      parseComment(par);
696
25.7k
    } else if (match("<?")) {
697
1.32k
      parsePI(par);
698
24.4k
    } else if (parsePtr < parseEnd && (*parsePtr == '\x20' ||
699
15.1k
               *parsePtr == '\x09' ||
700
13.6k
               *parsePtr == '\x0d' ||
701
11.9k
               *parsePtr == '\x0a')) {
702
8.08k
      ++parsePtr;
703
16.3k
    } else {
704
16.3k
      break;
705
16.3k
    }
706
26.4k
  }
707
16.3k
}
708
709
// assumes match("<!--")
710
3.50k
void ZxDoc::parseComment(ZxNode *par) {
711
3.50k
  const char *start;
712
713
3.50k
  parsePtr += 4;
714
3.50k
  start = parsePtr;
715
1.00M
  while (parsePtr <= parseEnd - 3) {
716
1.00M
    if (!strncmp(parsePtr, "-->", 3)) {
717
3.42k
      par->addChild(new ZxComment(new GString(start, (int)(parsePtr - start))));
718
3.42k
      parsePtr += 3;
719
3.42k
      return;
720
3.42k
    }
721
1.00M
    ++parsePtr;
722
1.00M
  }
723
79
  parsePtr = parseEnd;
724
79
}
725
726
// assumes match("<?")
727
30.5k
void ZxDoc::parsePI(ZxNode *par) {
728
30.5k
  GString *target;
729
30.5k
  const char *start;
730
731
30.5k
  parsePtr += 2;
732
30.5k
  target = parseName();
733
30.5k
  parseSpace();
734
30.5k
  start = parsePtr;
735
10.4M
  while (parsePtr <= parseEnd - 2) {
736
10.4M
    if (!strncmp(parsePtr, "?>", 2)) {
737
30.2k
      par->addChild(new ZxPI(target, new GString(start,
738
30.2k
             (int)(parsePtr - start))));
739
30.2k
      parsePtr += 2;
740
30.2k
      return;
741
30.2k
    }
742
10.4M
    ++parsePtr;
743
10.4M
  }
744
334
  parsePtr = parseEnd;
745
334
  par->addChild(new ZxPI(target, new GString(start, (int)(parsePtr - start))));
746
334
}
747
748
//~ this accepts all chars >= 0x80
749
//~ this doesn't check for properly-formed UTF-8
750
6.03M
GString *ZxDoc::parseName() {
751
6.03M
  GString *name;
752
753
6.03M
  name = new GString();
754
6.03M
  if (parsePtr < parseEnd && nameStartChar[*parsePtr & 0xff]) {
755
1.23M
    name->append(*parsePtr++);
756
17.2M
    while (parsePtr < parseEnd && nameChar[*parsePtr & 0xff]) {
757
15.9M
      name->append(*parsePtr++);
758
15.9M
    }
759
1.23M
  }
760
6.03M
  return name;
761
6.03M
}
762
763
1.59k
GString *ZxDoc::parseQuotedString() {
764
1.59k
  GString *s;
765
1.59k
  const char *start;
766
1.59k
  char quote;
767
768
1.59k
  if (parsePtr < parseEnd && (*parsePtr == '"' || *parsePtr == '\'')) {
769
1.33k
    quote = *parsePtr++;
770
1.33k
    start = parsePtr;
771
44.3k
    while (parsePtr < parseEnd && *parsePtr != quote) {
772
43.0k
      ++parsePtr;
773
43.0k
    }
774
1.33k
    s = new GString(start, (int)(parsePtr - start));
775
1.33k
    if (parsePtr < parseEnd && *parsePtr == quote) {
776
1.28k
      ++parsePtr;
777
1.28k
    }
778
1.33k
  } else {
779
262
    s = new GString();
780
262
  }
781
1.59k
  return s;
782
1.59k
}
783
784
5.44k
void ZxDoc::parseBOM() {
785
5.44k
  if (match("\xef\xbb\xbf")) {
786
50
    parsePtr += 3;
787
50
  }
788
5.44k
}
789
790
8.32M
void ZxDoc::parseSpace() {
791
9.20M
  while (parsePtr < parseEnd && (*parsePtr == '\x20' ||
792
8.77M
         *parsePtr == '\x09' ||
793
8.68M
         *parsePtr == '\x0d' ||
794
8.57M
         *parsePtr == '\x0a')) {
795
879k
    ++parsePtr;
796
879k
  }
797
8.32M
}
798
799
25.4M
bool ZxDoc::match(const char *s) {
800
25.4M
  int n;
801
802
25.4M
  n = (int)strlen(s);
803
25.4M
  return parseEnd - parsePtr >= n && !strncmp(parsePtr, s, n);
804
25.4M
}
805
806
0
bool ZxDoc::write(ZxWriteFunc writeFunc, void *stream) {
807
0
  ZxNode *child;
808
809
0
  for (child = getFirstChild(); child; child = child->getNextChild()) {
810
0
    if (!child->write(writeFunc, stream)) {
811
0
      return false;
812
0
    }
813
0
    if (!(*writeFunc)(stream, "\n", 1)) {
814
0
      return false;
815
0
    }
816
0
  }
817
0
  return true;
818
0
}
819
820
//------------------------------------------------------------------------
821
822
1.49k
ZxXMLDecl::ZxXMLDecl(GString *versionA, GString *encodingA, bool standaloneA) {
823
1.49k
  version = versionA;
824
1.49k
  encoding = encodingA;
825
1.49k
  standalone = standaloneA;
826
1.49k
}
827
828
1.49k
ZxXMLDecl::~ZxXMLDecl() {
829
1.49k
  delete version;
830
1.49k
  if (encoding) {
831
626
    delete encoding;
832
626
  }
833
1.49k
}
834
835
0
bool ZxXMLDecl::write(ZxWriteFunc writeFunc, void *stream) {
836
0
  GString *s;
837
0
  bool ok;
838
839
0
  s = new GString("<?xml version=\"");
840
0
  s->append(version);
841
0
  s->append("\"");
842
0
  if (encoding) {
843
0
    s->append(" encoding=\"");
844
0
    s->append(encoding);
845
0
    s->append("\"");
846
0
  }
847
0
  if (standalone) {
848
0
    s->append(" standlone=\"yes\"");
849
0
  }
850
0
  s->append("?>");
851
0
  ok = (*writeFunc)(stream, s->getCString(), s->getLength());
852
0
  delete s;
853
0
  return ok;
854
0
}
855
856
//------------------------------------------------------------------------
857
858
323
ZxDocTypeDecl::ZxDocTypeDecl(GString *nameA) {
859
323
  name = nameA;
860
323
}
861
862
323
ZxDocTypeDecl::~ZxDocTypeDecl() {
863
323
  delete name;
864
323
}
865
866
0
bool ZxDocTypeDecl::write(ZxWriteFunc writeFunc, void *stream) {
867
0
  GString *s;
868
0
  bool ok;
869
870
0
  s = new GString("<!DOCTYPE ");
871
0
  s->append(name);
872
0
  s->append(">");
873
0
  ok = (*writeFunc)(stream, s->getCString(), s->getLength());
874
0
  delete s;
875
0
  return ok;
876
0
}
877
878
//------------------------------------------------------------------------
879
880
3.42k
ZxComment::ZxComment(GString *textA) {
881
3.42k
  text = textA;
882
3.42k
}
883
884
3.42k
ZxComment::~ZxComment() {
885
3.42k
  delete text;
886
3.42k
}
887
888
0
bool ZxComment::write(ZxWriteFunc writeFunc, void *stream) {
889
0
  GString *s;
890
0
  bool ok;
891
892
0
  s = new GString("<!--");
893
0
  s->append(text);
894
0
  s->append("-->");
895
0
  ok = (*writeFunc)(stream, s->getCString(), s->getLength());
896
0
  delete s;
897
0
  return ok;
898
0
}
899
900
//------------------------------------------------------------------------
901
902
30.5k
ZxPI::ZxPI(GString *targetA, GString *textA) {
903
30.5k
  target = targetA;
904
30.5k
  text = textA;
905
30.5k
}
906
907
30.5k
ZxPI::~ZxPI() {
908
30.5k
  delete target;
909
30.5k
  delete text;
910
30.5k
}
911
912
0
bool ZxPI::write(ZxWriteFunc writeFunc, void *stream) {
913
0
  GString *s;
914
0
  bool ok;
915
916
0
  s = new GString("<?");
917
0
  s->append(target);
918
0
  s->append(" ");
919
0
  s->append(text);
920
0
  s->append("?>");
921
0
  ok = (*writeFunc)(stream, s->getCString(), s->getLength());
922
0
  delete s;
923
0
  return ok;
924
0
}
925
926
//------------------------------------------------------------------------
927
928
2.46M
ZxElement::ZxElement(GString *typeA) {
929
2.46M
  type = typeA;
930
2.46M
  attrs = new GHash();
931
2.46M
  firstAttr = lastAttr = NULL;
932
2.46M
}
933
  
934
2.46M
ZxElement::~ZxElement() {
935
2.46M
  delete type;
936
2.46M
  deleteGHash(attrs, ZxAttr);
937
2.46M
}
938
939
1.87M
bool ZxElement::isElement(const char *typeA) {
940
1.87M
  return !type->cmp(typeA);
941
1.87M
}
942
943
390k
ZxAttr *ZxElement::findAttr(const char *attrName) {
944
390k
  return (ZxAttr *)attrs->lookup(attrName);
945
390k
}
946
947
1.07M
void ZxElement::addAttr(ZxAttr *attr) {
948
1.07M
  attrs->add(attr->getName(), attr);
949
1.07M
  if (lastAttr) {
950
909k
    lastAttr->next = attr;
951
909k
    lastAttr= attr;
952
909k
  } else {
953
165k
    firstAttr = lastAttr = attr;
954
165k
  }
955
1.07M
  attr->parent = this;
956
1.07M
  attr->next = NULL;
957
1.07M
}
958
959
0
bool ZxElement::write(ZxWriteFunc writeFunc, void *stream) {
960
0
  GString *s;
961
0
  ZxAttr *attr;
962
0
  ZxNode *child;
963
0
  bool ok;
964
965
0
  s = new GString("<");
966
0
  s->append(type);
967
0
  for (attr = firstAttr; attr; attr = attr->getNextAttr()) {
968
0
    s->append(" ");
969
0
    s->append(attr->name);
970
0
    s->append("=\"");
971
0
    appendEscapedAttrValue(s, attr->value);
972
0
    s->append("\"");
973
0
  }
974
0
  if ((child = getFirstChild())) {
975
0
    s->append(">");
976
0
  } else {
977
0
    s->append("/>");
978
0
  }
979
0
  ok = (*writeFunc)(stream, s->getCString(), s->getLength());
980
0
  delete s;
981
0
  if (!ok) {
982
0
    return false;
983
0
  }
984
0
  if (child) {
985
0
    for (; child; child = child->getNextChild()) {
986
0
      if (!child->write(writeFunc, stream)) {
987
0
  return false;
988
0
      }
989
0
    }
990
0
    s = new GString();
991
0
    s->append("</");
992
0
    s->append(type);
993
0
    s->append(">");
994
0
    ok = (*writeFunc)(stream, s->getCString(), s->getLength());
995
0
    delete s;
996
0
    if (!ok) {
997
0
      return false;
998
0
    }
999
0
  }
1000
0
  return true;
1001
0
}
1002
1003
0
void ZxElement::appendEscapedAttrValue(GString *out, GString *s) {
1004
0
  char c;
1005
0
  int i;
1006
1007
0
  for (i = 0; i < s->getLength(); ++i) {
1008
0
    c = s->getChar(i);
1009
0
    if (c == '<') {
1010
0
      out->append("&lt;");
1011
0
    } else if (c == '>') {
1012
0
      out->append("&gt;");
1013
0
    } else if (c == '&') {
1014
0
      out->append("&amp;");
1015
0
    } else if (c == '"') {
1016
0
      out->append("&quot;");
1017
0
    } else {
1018
0
      out->append(c);
1019
0
    }
1020
0
  }
1021
0
}
1022
1023
//------------------------------------------------------------------------
1024
1025
1.07M
ZxAttr::ZxAttr(GString *nameA, GString *valueA) {
1026
1.07M
  name = nameA;
1027
1.07M
  value = valueA;
1028
1.07M
  parent = NULL;
1029
1.07M
  next = NULL;
1030
1.07M
}
1031
1032
1.07M
ZxAttr::~ZxAttr() {
1033
1.07M
  delete name;
1034
1.07M
  delete value;
1035
1.07M
}
1036
1037
//------------------------------------------------------------------------
1038
1039
892k
ZxCharData::ZxCharData(GString *dataA, bool parsedA) {
1040
892k
  data = dataA;
1041
892k
  parsed = parsedA;
1042
892k
}
1043
1044
892k
ZxCharData::~ZxCharData() {
1045
892k
  delete data;
1046
892k
}
1047
1048
0
bool ZxCharData::write(ZxWriteFunc writeFunc, void *stream) {
1049
0
  GString *s;
1050
0
  char c;
1051
0
  int i;
1052
0
  bool ok;
1053
1054
0
  s = new GString();
1055
0
  if (parsed) {
1056
0
    for (i = 0; i < data->getLength(); ++i) {
1057
0
      c = data->getChar(i);
1058
0
      if (c == '<') {
1059
0
  s->append("&lt;");
1060
0
      } else if (c == '>') {
1061
0
  s->append("&gt;");
1062
0
      } else if (c == '&') {
1063
0
  s->append("&amp;");
1064
0
      } else {
1065
0
  s->append(c);
1066
0
      }
1067
0
    }
1068
0
  } else {
1069
0
    s->append("<![CDATA[");
1070
0
    s->append(data);
1071
0
    s->append("]]>");
1072
0
  }
1073
0
  ok = (*writeFunc)(stream, s->getCString(), s->getLength());
1074
0
  delete s;
1075
0
  return ok;
1076
0
}