Coverage Report

Created: 2025-08-26 06:28

/src/xpdf-4.05/xpdf/Zoox.cc
Line
Count
Source (jump to first uncovered line)
1
//========================================================================
2
//
3
// Zoox.cc
4
//
5
//========================================================================
6
7
#include <aconf.h>
8
9
#include <stdlib.h>
10
#include <stdio.h>
11
#include <string.h>
12
#include "gmem.h"
13
#include "gmempp.h"
14
#include "GString.h"
15
#include "GList.h"
16
#include "GHash.h"
17
#include "Zoox.h"
18
19
//~ all of this code assumes the encoding is UTF-8 or ASCII or something
20
//~   similar (ISO-8859-*)
21
22
//------------------------------------------------------------------------
23
24
static char nameStartChar[256] = {
25
  0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, // 00
26
  0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, // 10
27
  0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, // 20
28
  0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, // 30
29
  0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, // 40
30
  1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 1, // 50
31
  0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, // 60
32
  1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, // 70
33
  1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, // 80
34
  1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, // 90
35
  1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, // a0
36
  1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, // b0
37
  1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, // c0
38
  1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, // d0
39
  1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, // e0
40
  1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1  // f0
41
};
42
43
static char nameChar[256] = {
44
  0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, // 00
45
  0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, // 10
46
  0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, // 20
47
  1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, // 30
48
  0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, // 40
49
  1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 1, // 50
50
  0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, // 60
51
  1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, // 70
52
  1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, // 80
53
  1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, // 90
54
  1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, // a0
55
  1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, // b0
56
  1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, // c0
57
  1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, // d0
58
  1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, // e0
59
  1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1  // f0
60
};
61
62
//------------------------------------------------------------------------
63
64
2.33M
ZxNode::ZxNode() {
65
2.33M
  next = NULL;
66
2.33M
  parent = NULL;
67
2.33M
  firstChild = lastChild = NULL;
68
2.33M
}
69
70
2.33M
ZxNode::~ZxNode() {
71
2.33M
  ZxNode *child;
72
73
4.66M
  while (firstChild) {
74
2.33M
    child = firstChild;
75
2.33M
    firstChild = firstChild->next;
76
2.33M
    delete child;
77
2.33M
  }
78
2.33M
}
79
80
0
ZxNode *ZxNode::deleteChild(ZxNode *child) {
81
0
  ZxNode *p1, *p2;
82
83
0
  for (p1 = NULL, p2 = firstChild;
84
0
       p2 && p2 != child;
85
0
       p1 = p2, p2 = p2->next) ;
86
0
  if (!p2) {
87
0
    return NULL;
88
0
  }
89
0
  if (p1) {
90
0
    p1->next = child->next;
91
0
  } else {
92
0
    firstChild = child->next;
93
0
  }
94
0
  child->parent = NULL;
95
0
  child->next = NULL;
96
0
  return child;
97
0
}
98
99
0
void ZxNode::appendChild(ZxNode *child) {
100
0
  ZxNode *p1;
101
102
0
  if (child->parent || child->next) {
103
0
    return;
104
0
  }
105
0
  if (firstChild) {
106
0
    for (p1 = firstChild; p1->next; p1 = p1->next) ;
107
0
    p1->next = child;
108
0
  } else {
109
0
    firstChild = child;
110
0
  }
111
0
  child->parent = this;
112
0
}
113
114
0
void ZxNode::insertChildAfter(ZxNode *child, ZxNode *prev) {
115
0
  if (child->parent || child->next || (prev && prev->parent != this)) {
116
0
    return;
117
0
  }
118
0
  if (prev) {
119
0
    child->next = prev->next;
120
0
    prev->next = child;
121
0
  } else {
122
0
    child->next = firstChild;
123
0
    firstChild = child;
124
0
  }
125
0
  child->parent = this;
126
0
}
127
128
0
ZxElement *ZxNode::findFirstElement(const char *type) {
129
0
  ZxNode *child;
130
0
  ZxElement *result;
131
132
0
  if (isElement(type)) {
133
0
    return (ZxElement *)this;
134
0
  }
135
0
  for (child = firstChild; child; child = child->next) {
136
0
    if ((result = child->findFirstElement(type))) {
137
0
      return result;
138
0
    }
139
0
  }
140
0
  return NULL;
141
0
}
142
143
98.7k
ZxElement *ZxNode::findFirstChildElement(const char *type) {
144
98.7k
  ZxNode *child;
145
146
319k
  for (child = firstChild; child; child = child->next) {
147
223k
    if (child->isElement(type)) {
148
2.94k
      return (ZxElement *)child;
149
2.94k
    }
150
223k
  }
151
95.7k
  return NULL;
152
98.7k
}
153
154
0
GList *ZxNode::findAllElements(const char *type) {
155
0
  GList *results;
156
157
0
  results = new GList();
158
0
  findAllElements(type, results);
159
0
  return results;
160
0
}
161
162
0
void ZxNode::findAllElements(const char *type, GList *results) {
163
0
  ZxNode *child;
164
165
0
  if (isElement(type)) {
166
0
    results->append(this);
167
0
  }
168
0
  for (child = firstChild; child; child = child->next) {
169
0
    child->findAllElements(type, results);
170
0
  }
171
0
}
172
173
0
GList *ZxNode::findAllChildElements(const char *type) {
174
0
  GList *results;
175
0
  ZxNode *child;
176
177
0
  results = new GList();
178
0
  for (child = firstChild; child; child = child->next) {
179
0
    if (child->isElement(type)) {
180
0
      results->append(child);
181
0
    }
182
0
  }
183
0
  return results;
184
0
}
185
186
2.33M
void ZxNode::addChild(ZxNode *child) {
187
2.33M
  if (lastChild) {
188
2.04M
    lastChild->next = child;
189
2.04M
    lastChild = child;
190
2.04M
  } else {
191
288k
    firstChild = lastChild = child;
192
288k
  }
193
2.33M
  child->parent = this;
194
2.33M
  child->next = NULL;
195
2.33M
}
196
197
//------------------------------------------------------------------------
198
199
553
ZxDoc::ZxDoc() {
200
553
  xmlDecl = NULL;
201
553
  docTypeDecl = NULL;
202
553
  root = NULL;
203
553
}
204
205
553
ZxDoc *ZxDoc::loadMem(const char *data, Guint dataLen) {
206
553
  ZxDoc *doc;
207
208
553
  doc = new ZxDoc();
209
553
  if (!doc->parse(data, dataLen)) {
210
59
    delete doc;
211
59
    return NULL;
212
59
  }
213
494
  return doc;
214
553
}
215
216
0
ZxDoc *ZxDoc::loadFile(const char *fileName) {
217
0
  ZxDoc *doc;
218
0
  FILE *f;
219
0
  char *data;
220
0
  Guint dataLen;
221
222
0
  if (!(f = fopen(fileName, "rb"))) {
223
0
    return NULL;
224
0
  }
225
0
  fseek(f, 0, SEEK_END);
226
0
  dataLen = (Guint)ftell(f);
227
0
  if (!dataLen) {
228
0
    fclose(f);
229
0
    return NULL;
230
0
  }
231
0
  fseek(f, 0, SEEK_SET);
232
0
  data = (char *)gmalloc(dataLen);
233
0
  if (fread(data, 1, dataLen, f) != dataLen) {
234
0
    fclose(f);
235
0
    gfree(data);
236
0
    return NULL;
237
0
  }
238
0
  fclose(f);
239
0
  doc = loadMem(data, dataLen);
240
0
  gfree(data);
241
0
  return doc;
242
0
}
243
244
ZxDoc::~ZxDoc() {
245
}
246
247
0
static bool writeToFileFunc(void *stream, const char *data, int length) {
248
0
  return (int)fwrite(data, 1, length, (FILE *)stream) == length;
249
0
}
250
251
0
bool ZxDoc::writeFile(const char *fileName) {
252
0
  FILE *f;
253
254
0
  if (!(f = fopen(fileName, "wb"))) {
255
0
    return false;
256
0
  }
257
0
  write(&writeToFileFunc, f);
258
0
  fclose(f);
259
0
  return true;
260
0
}
261
262
853
void ZxDoc::addChild(ZxNode *node) {
263
853
  if (node->isXMLDecl() && !xmlDecl) {
264
258
    xmlDecl = (ZxXMLDecl *)node;
265
595
  } else if (node->isDocTypeDecl() && !docTypeDecl) {
266
0
    docTypeDecl = (ZxDocTypeDecl *)node;
267
595
  } else if (node->isElement() && !root) {
268
494
    root = (ZxElement *)node;
269
494
  }
270
853
  ZxNode::addChild(node);
271
853
}
272
273
553
bool ZxDoc::parse(const char *data, Guint dataLen) {
274
553
  parsePtr = data;
275
553
  parseEnd = data + dataLen;
276
  
277
553
  parseSpace();
278
553
  parseBOM();
279
553
  parseSpace();
280
553
  parseXMLDecl(this);
281
553
  parseMisc(this);
282
553
  parseDocTypeDecl(this);
283
553
  parseMisc(this);
284
553
  if (match("<")) {
285
494
    parseElement(this);
286
494
  }
287
553
  parseMisc(this);
288
553
  return root != NULL;
289
553
}
290
291
553
void ZxDoc::parseXMLDecl(ZxNode *par) {
292
553
  GString *version, *encoding, *s;
293
553
  bool standalone;
294
295
553
  if (!match("<?xml")) {
296
295
    return;
297
295
  }
298
258
  parsePtr += 5;
299
258
  parseSpace();
300
301
  // version
302
258
  version = NULL;
303
258
  if (match("version")) {
304
247
    parsePtr += 7;
305
247
    parseSpace();
306
247
    if (match("=")) {
307
245
      ++parsePtr;
308
245
      parseSpace();
309
245
      version = parseQuotedString();
310
245
    }
311
247
  }
312
258
  if (!version) {
313
13
    version = new GString("1.0");
314
13
  }
315
258
  parseSpace();
316
  
317
  // encoding
318
258
  encoding = NULL;
319
258
  if (match("encoding")) {
320
242
    parsePtr += 8;
321
242
    parseSpace();
322
242
    if (match("=")) {
323
236
      ++parsePtr;
324
236
      parseSpace();
325
236
      encoding = parseQuotedString();
326
236
    }
327
242
  }
328
258
  parseSpace();
329
330
  // standalone
331
258
  standalone = false;
332
258
  if (match("standalone")) {
333
0
    parsePtr += 10;
334
0
    parseSpace();
335
0
    if (match("=")) {
336
0
      ++parsePtr;
337
0
      parseSpace();
338
0
      s = parseQuotedString();
339
0
      standalone = !s->cmp("yes");
340
0
      delete s;
341
0
    }
342
0
  }
343
258
  parseSpace();
344
345
258
  if (match("?>")) {
346
210
    parsePtr += 2;
347
210
  }
348
349
258
  par->addChild(new ZxXMLDecl(version, encoding, standalone));
350
258
}
351
352
//~ this just skips everything after the name
353
553
void ZxDoc::parseDocTypeDecl(ZxNode *par) {
354
553
  GString *name;
355
553
  int state;
356
553
  char c, quote;
357
358
553
  if (!match("<!DOCTYPE")) {
359
553
    return;
360
553
  }
361
0
  parsePtr += 9;
362
0
  parseSpace();
363
364
0
  name = parseName();
365
0
  parseSpace();
366
367
0
  state = 0;
368
0
  quote = '\0';
369
0
  while (parsePtr < parseEnd && state < 4) {
370
0
    c = *parsePtr++;
371
0
    switch (state) {
372
0
    case 0: // not in square brackets; not in quotes
373
0
      if (c == '>') {
374
0
  state = 4;
375
0
      } else if (c == '"' || c == '\'') {
376
0
  state = 1;
377
0
      } else if (c == '[') {
378
0
  state = 2;
379
0
      }
380
0
      break;
381
0
    case 1: // not in square brackets; in quotes
382
0
      if (c == quote) {
383
0
  state = 0;
384
0
      }
385
0
      break;
386
0
    case 2: // in square brackets; not in quotes
387
0
      if (c == ']') {
388
0
  state = 0;
389
0
      } else if (c == '"' || c == '\'') {
390
0
  state = 3;
391
0
      }
392
0
      break;
393
0
    case 3: // in square brackets; in quotes
394
0
      if (c == quote) {
395
0
  state = 2;
396
0
      }
397
0
      break;
398
0
    }
399
0
  }
400
401
0
  par->addChild(new ZxDocTypeDecl(name));
402
0
}
403
404
// assumes match("<")
405
1.33M
void ZxDoc::parseElement(ZxNode *par) {
406
1.33M
  GString *type;
407
1.33M
  ZxElement *elem;
408
1.33M
  ZxAttr *attr;
409
410
1.33M
  ++parsePtr;
411
1.33M
  type = parseName();
412
1.33M
  elem = new ZxElement(type);
413
1.33M
  parseSpace();
414
1.41M
  while ((attr = parseAttr())) {
415
80.4k
    elem->addAttr(attr);
416
80.4k
    parseSpace();
417
80.4k
  }
418
1.33M
  if (match("/>")) {
419
9.33k
    parsePtr += 2;
420
1.32M
  } else if (match(">")) {
421
287k
    ++parsePtr;
422
287k
    parseContent(elem);
423
287k
  }
424
1.33M
  par->addChild(elem);
425
1.33M
}
426
427
1.41M
ZxAttr *ZxDoc::parseAttr() {
428
1.41M
  GString *name, *value;
429
1.41M
  const char *start;
430
1.41M
  char quote, c;
431
1.41M
  unsigned int x;
432
1.41M
  int n;
433
434
1.41M
  name = parseName();
435
1.41M
  parseSpace();
436
1.41M
  if (!match("=")) {
437
1.32M
    delete name;
438
1.32M
    return NULL;
439
1.32M
  }
440
94.1k
  ++parsePtr;
441
94.1k
  parseSpace();
442
94.1k
  if (!(parsePtr < parseEnd && (*parsePtr == '"' || *parsePtr == '\''))) {
443
13.7k
    delete name;
444
13.7k
    return NULL;
445
13.7k
  }
446
80.4k
  quote = *parsePtr++;
447
80.4k
  value = new GString();
448
219k
  while (parsePtr < parseEnd && *parsePtr != quote) {
449
139k
    if (*parsePtr == '&') {
450
38.4k
      ++parsePtr;
451
38.4k
      if (parsePtr < parseEnd && *parsePtr == '#') {
452
21.8k
  ++parsePtr;
453
21.8k
  if (parsePtr < parseEnd && *parsePtr == 'x') {
454
9.21k
    ++parsePtr;
455
9.21k
    x = 0;
456
26.8k
    while (parsePtr < parseEnd) {
457
26.8k
      c = *parsePtr;
458
26.8k
      if (c >= '0' && c <= '9') {
459
7.68k
        x = (x << 4) + (c - '0');
460
19.1k
      } else if (c >= 'a' && c <= 'f') {
461
9.19k
        x = (x << 4) + (10 + c - 'a');
462
9.99k
      } else if (c >= 'A' && c <= 'F') {
463
783
        x = (x << 4) + (10 + c - 'A');
464
9.21k
      } else {
465
9.21k
        break;
466
9.21k
      }
467
17.6k
      ++parsePtr;
468
17.6k
    }
469
9.21k
    if (parsePtr < parseEnd && *parsePtr == ';') {
470
293
      ++parsePtr;
471
293
    }
472
9.21k
    appendUTF8(value, x);
473
12.6k
  } else {
474
12.6k
    x = 0;
475
13.3k
    while (parsePtr < parseEnd) {
476
13.3k
      c = *parsePtr;
477
13.3k
      if (c >= '0' && c <= '9') {
478
716
        x = x * 10 + (c - '0');
479
12.6k
      } else {
480
12.6k
        break;
481
12.6k
      }
482
716
      ++parsePtr;
483
716
    }
484
12.6k
    if (parsePtr < parseEnd && *parsePtr == ';') {
485
320
      ++parsePtr;
486
320
    }
487
12.6k
    appendUTF8(value, x);
488
12.6k
  }
489
21.8k
      } else {
490
16.5k
  start = parsePtr;
491
16.5k
  for (++parsePtr;
492
1.53M
       parsePtr < parseEnd && *parsePtr != ';' &&
493
1.53M
         *parsePtr != quote && *parsePtr != '&';
494
1.51M
       ++parsePtr) ;
495
16.5k
  n = (int)(parsePtr - start);
496
16.5k
  if (parsePtr < parseEnd && *parsePtr == ';') {
497
272
    ++parsePtr;
498
272
  }
499
16.5k
  if (n == 2 && !strncmp(start, "lt", 2)) {
500
78
    value->append('<');
501
16.4k
  } else if (n == 2 && !strncmp(start, "gt", 2)) {
502
40
    value->append('>');
503
16.4k
  } else if (n == 3 && !strncmp(start, "amp", 3)) {
504
0
    value->append('&');
505
16.4k
  } else if (n == 4 && !strncmp(start, "apos", 4)) {
506
0
    value->append('\'');
507
16.4k
  } else if (n == 4 && !strncmp(start, "quot", 4)) {
508
0
    value->append('"');
509
16.4k
  } else {
510
16.4k
    value->append(start - 1, (int)(parsePtr - start) + 1);
511
16.4k
  }
512
16.5k
      }
513
100k
    } else {
514
100k
      start = parsePtr;
515
100k
      for (++parsePtr;
516
4.17M
     parsePtr < parseEnd && *parsePtr != quote && *parsePtr != '&';
517
4.07M
     ++parsePtr) ;
518
100k
      value->append(start, (int)(parsePtr - start));
519
100k
    }
520
139k
  }
521
80.4k
  if (parsePtr < parseEnd && *parsePtr == quote) {
522
80.3k
    ++parsePtr;
523
80.3k
  }
524
80.4k
  return new ZxAttr(name, value);
525
94.1k
}
526
527
// this consumes the end tag
528
287k
void ZxDoc::parseContent(ZxElement *par) {
529
287k
  GString *endType;
530
531
287k
  endType = (new GString("</"))->append(par->getType());
532
533
2.61M
  while (parsePtr < parseEnd) {
534
2.35M
    if (match(endType->getCString())) {
535
22.5k
      parsePtr += endType->getLength();
536
22.5k
      parseSpace();
537
22.5k
      if (match(">")) {
538
15.2k
  ++parsePtr;
539
15.2k
      }
540
22.5k
      break;
541
2.32M
    } else if (match("<?")) {
542
3.53k
      parsePI(par);
543
2.32M
    } else if (match("<![CDATA[")) {
544
43
      parseCDSect(par);
545
2.32M
    } else if (match("<!--")) {
546
5.25k
      parseComment(par);
547
2.32M
    } else if (match("<")) {
548
1.33M
      parseElement(par);
549
1.33M
    } else {
550
986k
      parseCharData(par);
551
986k
    }
552
2.35M
  }
553
554
287k
  delete endType;
555
287k
}
556
557
986k
void ZxDoc::parseCharData(ZxElement *par) {
558
986k
  GString *data;
559
986k
  const char *start;
560
986k
  char c;
561
986k
  unsigned int x;
562
986k
  int n;
563
564
986k
  data = new GString();
565
2.78M
  while (parsePtr < parseEnd && *parsePtr != '<') {
566
1.80M
    if (*parsePtr == '&') {
567
815k
      ++parsePtr;
568
815k
      if (parsePtr < parseEnd && *parsePtr == '#') {
569
31.4k
  ++parsePtr;
570
31.4k
  if (parsePtr < parseEnd && *parsePtr == 'x') {
571
6.67k
    ++parsePtr;
572
6.67k
    x = 0;
573
11.4k
    while (parsePtr < parseEnd) {
574
11.4k
      c = *parsePtr;
575
11.4k
      if (c >= '0' && c <= '9') {
576
1.96k
        x = (x << 4) + (c - '0');
577
9.52k
      } else if (c >= 'a' && c <= 'f') {
578
1.91k
        x = (x << 4) + (10 + c - 'a');
579
7.60k
      } else if (c >= 'A' && c <= 'F') {
580
935
        x = (x << 4) + (10 + c - 'A');
581
6.67k
      } else {
582
6.67k
        break;
583
6.67k
      }
584
4.81k
      ++parsePtr;
585
4.81k
    }
586
6.67k
    if (parsePtr < parseEnd && *parsePtr == ';') {
587
423
      ++parsePtr;
588
423
    }
589
6.67k
    appendUTF8(data, x);
590
24.8k
  } else {
591
24.8k
    x = 0;
592
45.4k
    while (parsePtr < parseEnd) {
593
45.4k
      c = *parsePtr;
594
45.4k
      if (c >= '0' && c <= '9') {
595
20.6k
        x = x * 10 + (c - '0');
596
24.7k
      } else {
597
24.7k
        break;
598
24.7k
      }
599
20.6k
      ++parsePtr;
600
20.6k
    }
601
24.8k
    if (parsePtr < parseEnd && *parsePtr == ';') {
602
275
      ++parsePtr;
603
275
    }
604
24.8k
    appendUTF8(data, x);
605
24.8k
  }
606
784k
      } else {
607
784k
  start = parsePtr;
608
784k
  for (++parsePtr;
609
20.4M
       parsePtr < parseEnd && *parsePtr != ';' &&
610
20.4M
         *parsePtr != '<' && *parsePtr != '&';
611
19.6M
       ++parsePtr) ;
612
784k
  n = (int)(parsePtr - start);
613
784k
  if (parsePtr < parseEnd && *parsePtr == ';') {
614
480
    ++parsePtr;
615
480
  }
616
784k
  if (n == 2 && !strncmp(start, "lt", 2)) {
617
84
    data->append('<');
618
784k
  } else if (n == 2 && !strncmp(start, "gt", 2)) {
619
181
    data->append('>');
620
783k
  } else if (n == 3 && !strncmp(start, "amp", 3)) {
621
0
    data->append('&');
622
783k
  } else if (n == 4 && !strncmp(start, "apos", 4)) {
623
0
    data->append('\'');
624
783k
  } else if (n == 4 && !strncmp(start, "quot", 4)) {
625
0
    data->append('"');
626
783k
  } else {
627
783k
    data->append(start - 1, (int)(parsePtr - start) + 1);
628
783k
  }
629
784k
      }
630
987k
    } else {
631
987k
      start = parsePtr;
632
987k
      for (++parsePtr;
633
30.2M
     parsePtr < parseEnd && *parsePtr != '<' && *parsePtr != '&';
634
29.2M
     ++parsePtr) ;
635
987k
      data->append(start, (int)(parsePtr - start));
636
987k
    }
637
1.80M
  }
638
986k
  par->addChild(new ZxCharData(data, true));
639
986k
}
640
641
53.3k
void ZxDoc::appendUTF8(GString *s, unsigned int c) {
642
53.3k
  if (c <= 0x7f) {
643
47.7k
    s->append((char)c);
644
47.7k
  } else if (c <= 0x7ff) {
645
1.38k
    s->append((char)(0xc0 + (c >> 6)));
646
1.38k
    s->append((char)(0x80 + (c & 0x3f)));
647
4.24k
  } else if (c <= 0xffff) {
648
467
    s->append((char)(0xe0 + (c >> 12)));
649
467
    s->append((char)(0x80 + ((c >> 6) & 0x3f)));
650
467
    s->append((char)(0x80 + (c & 0x3f)));
651
3.78k
  } else if (c <= 0x1fffff) {
652
2.14k
    s->append((char)(0xf0 + (c >> 18)));
653
2.14k
    s->append((char)(0x80 + ((c >> 12) & 0x3f)));
654
2.14k
    s->append((char)(0x80 + ((c >> 6) & 0x3f)));
655
2.14k
    s->append((char)(0x80 + (c & 0x3f)));
656
2.14k
  } else if (c <= 0x3ffffff) {
657
330
    s->append((char)(0xf8 + (c >> 24)));
658
330
    s->append((char)(0x80 + ((c >> 18) & 0x3f)));
659
330
    s->append((char)(0x80 + ((c >> 12) & 0x3f)));
660
330
    s->append((char)(0x80 + ((c >> 6) & 0x3f)));
661
330
    s->append((char)(0x80 + (c & 0x3f)));
662
1.30k
  } else if (c <= 0x7fffffff) {
663
738
    s->append((char)(0xfc + (c >> 30)));
664
738
    s->append((char)(0x80 + ((c >> 24) & 0x3f)));
665
738
    s->append((char)(0x80 + ((c >> 18) & 0x3f)));
666
738
    s->append((char)(0x80 + ((c >> 12) & 0x3f)));
667
738
    s->append((char)(0x80 + ((c >> 6) & 0x3f)));
668
738
    s->append((char)(0x80 + (c & 0x3f)));
669
738
  }
670
53.3k
}
671
672
// assumes match("<![CDATA[")
673
43
void ZxDoc::parseCDSect(ZxNode *par) {
674
43
  const char *start;
675
676
43
  parsePtr += 9;
677
43
  start = parsePtr;
678
1.70M
  while (parsePtr < parseEnd - 3) {
679
1.70M
    if (!strncmp(parsePtr, "]]>", 3)) {
680
36
      par->addChild(new ZxCharData(new GString(start, (int)(parsePtr - start)),
681
36
           false));
682
36
      parsePtr += 3;
683
36
      return;
684
36
    }
685
1.70M
    ++parsePtr;
686
1.70M
  }
687
7
  parsePtr = parseEnd;
688
7
  par->addChild(new ZxCharData(new GString(start, (int)(parsePtr - start)),
689
7
             false));
690
7
}
691
692
1.65k
void ZxDoc::parseMisc(ZxNode *par) {
693
2.14k
  while (1) {
694
2.14k
    if (match("<!--")) {
695
0
      parseComment(par);
696
2.14k
    } else if (match("<?")) {
697
101
      parsePI(par);
698
2.04k
    } else if (parsePtr < parseEnd && (*parsePtr == '\x20' ||
699
1.53k
               *parsePtr == '\x09' ||
700
1.53k
               *parsePtr == '\x0d' ||
701
1.53k
               *parsePtr == '\x0a')) {
702
382
      ++parsePtr;
703
1.65k
    } else {
704
1.65k
      break;
705
1.65k
    }
706
2.14k
  }
707
1.65k
}
708
709
// assumes match("<!--")
710
5.25k
void ZxDoc::parseComment(ZxNode *par) {
711
5.25k
  const char *start;
712
713
5.25k
  parsePtr += 4;
714
5.25k
  start = parsePtr;
715
379k
  while (parsePtr <= parseEnd - 3) {
716
379k
    if (!strncmp(parsePtr, "-->", 3)) {
717
5.25k
      par->addChild(new ZxComment(new GString(start, (int)(parsePtr - start))));
718
5.25k
      parsePtr += 3;
719
5.25k
      return;
720
5.25k
    }
721
374k
    ++parsePtr;
722
374k
  }
723
5
  parsePtr = parseEnd;
724
5
}
725
726
// assumes match("<?")
727
3.63k
void ZxDoc::parsePI(ZxNode *par) {
728
3.63k
  GString *target;
729
3.63k
  const char *start;
730
731
3.63k
  parsePtr += 2;
732
3.63k
  target = parseName();
733
3.63k
  parseSpace();
734
3.63k
  start = parsePtr;
735
869k
  while (parsePtr <= parseEnd - 2) {
736
869k
    if (!strncmp(parsePtr, "?>", 2)) {
737
3.58k
      par->addChild(new ZxPI(target, new GString(start,
738
3.58k
             (int)(parsePtr - start))));
739
3.58k
      parsePtr += 2;
740
3.58k
      return;
741
3.58k
    }
742
866k
    ++parsePtr;
743
866k
  }
744
49
  parsePtr = parseEnd;
745
49
  par->addChild(new ZxPI(target, new GString(start, (int)(parsePtr - start))));
746
49
}
747
748
//~ this accepts all chars >= 0x80
749
//~ this doesn't check for properly-formed UTF-8
750
2.75M
GString *ZxDoc::parseName() {
751
2.75M
  GString *name;
752
753
2.75M
  name = new GString();
754
2.75M
  if (parsePtr < parseEnd && nameStartChar[*parsePtr & 0xff]) {
755
1.03M
    name->append(*parsePtr++);
756
4.00M
    while (parsePtr < parseEnd && nameChar[*parsePtr & 0xff]) {
757
2.97M
      name->append(*parsePtr++);
758
2.97M
    }
759
1.03M
  }
760
2.75M
  return name;
761
2.75M
}
762
763
481
GString *ZxDoc::parseQuotedString() {
764
481
  GString *s;
765
481
  const char *start;
766
481
  char quote;
767
768
481
  if (parsePtr < parseEnd && (*parsePtr == '"' || *parsePtr == '\'')) {
769
472
    quote = *parsePtr++;
770
472
    start = parsePtr;
771
11.2k
    while (parsePtr < parseEnd && *parsePtr != quote) {
772
10.7k
      ++parsePtr;
773
10.7k
    }
774
472
    s = new GString(start, (int)(parsePtr - start));
775
472
    if (parsePtr < parseEnd && *parsePtr == quote) {
776
472
      ++parsePtr;
777
472
    }
778
472
  } else {
779
9
    s = new GString();
780
9
  }
781
481
  return s;
782
481
}
783
784
553
void ZxDoc::parseBOM() {
785
553
  if (match("\xef\xbb\xbf")) {
786
0
    parsePtr += 3;
787
0
  }
788
553
}
789
790
2.95M
void ZxDoc::parseSpace() {
791
3.41M
  while (parsePtr < parseEnd && (*parsePtr == '\x20' ||
792
3.41M
         *parsePtr == '\x09' ||
793
3.41M
         *parsePtr == '\x0d' ||
794
3.41M
         *parsePtr == '\x0a')) {
795
458k
    ++parsePtr;
796
458k
  }
797
2.95M
}
798
799
15.7M
bool ZxDoc::match(const char *s) {
800
15.7M
  int n;
801
802
15.7M
  n = (int)strlen(s);
803
15.7M
  return parseEnd - parsePtr >= n && !strncmp(parsePtr, s, n);
804
15.7M
}
805
806
0
bool ZxDoc::write(ZxWriteFunc writeFunc, void *stream) {
807
0
  ZxNode *child;
808
809
0
  for (child = getFirstChild(); child; child = child->getNextChild()) {
810
0
    if (!child->write(writeFunc, stream)) {
811
0
      return false;
812
0
    }
813
0
    if (!(*writeFunc)(stream, "\n", 1)) {
814
0
      return false;
815
0
    }
816
0
  }
817
0
  return true;
818
0
}
819
820
//------------------------------------------------------------------------
821
822
258
ZxXMLDecl::ZxXMLDecl(GString *versionA, GString *encodingA, bool standaloneA) {
823
258
  version = versionA;
824
258
  encoding = encodingA;
825
258
  standalone = standaloneA;
826
258
}
827
828
258
ZxXMLDecl::~ZxXMLDecl() {
829
258
  delete version;
830
258
  if (encoding) {
831
236
    delete encoding;
832
236
  }
833
258
}
834
835
0
bool ZxXMLDecl::write(ZxWriteFunc writeFunc, void *stream) {
836
0
  GString *s;
837
0
  bool ok;
838
839
0
  s = new GString("<?xml version=\"");
840
0
  s->append(version);
841
0
  s->append("\"");
842
0
  if (encoding) {
843
0
    s->append(" encoding=\"");
844
0
    s->append(encoding);
845
0
    s->append("\"");
846
0
  }
847
0
  if (standalone) {
848
0
    s->append(" standlone=\"yes\"");
849
0
  }
850
0
  s->append("?>");
851
0
  ok = (*writeFunc)(stream, s->getCString(), s->getLength());
852
0
  delete s;
853
0
  return ok;
854
0
}
855
856
//------------------------------------------------------------------------
857
858
0
ZxDocTypeDecl::ZxDocTypeDecl(GString *nameA) {
859
0
  name = nameA;
860
0
}
861
862
0
ZxDocTypeDecl::~ZxDocTypeDecl() {
863
0
  delete name;
864
0
}
865
866
0
bool ZxDocTypeDecl::write(ZxWriteFunc writeFunc, void *stream) {
867
0
  GString *s;
868
0
  bool ok;
869
870
0
  s = new GString("<!DOCTYPE ");
871
0
  s->append(name);
872
0
  s->append(">");
873
0
  ok = (*writeFunc)(stream, s->getCString(), s->getLength());
874
0
  delete s;
875
0
  return ok;
876
0
}
877
878
//------------------------------------------------------------------------
879
880
5.25k
ZxComment::ZxComment(GString *textA) {
881
5.25k
  text = textA;
882
5.25k
}
883
884
5.25k
ZxComment::~ZxComment() {
885
5.25k
  delete text;
886
5.25k
}
887
888
0
bool ZxComment::write(ZxWriteFunc writeFunc, void *stream) {
889
0
  GString *s;
890
0
  bool ok;
891
892
0
  s = new GString("<!--");
893
0
  s->append(text);
894
0
  s->append("-->");
895
0
  ok = (*writeFunc)(stream, s->getCString(), s->getLength());
896
0
  delete s;
897
0
  return ok;
898
0
}
899
900
//------------------------------------------------------------------------
901
902
3.63k
ZxPI::ZxPI(GString *targetA, GString *textA) {
903
3.63k
  target = targetA;
904
3.63k
  text = textA;
905
3.63k
}
906
907
3.63k
ZxPI::~ZxPI() {
908
3.63k
  delete target;
909
3.63k
  delete text;
910
3.63k
}
911
912
0
bool ZxPI::write(ZxWriteFunc writeFunc, void *stream) {
913
0
  GString *s;
914
0
  bool ok;
915
916
0
  s = new GString("<?");
917
0
  s->append(target);
918
0
  s->append(" ");
919
0
  s->append(text);
920
0
  s->append("?>");
921
0
  ok = (*writeFunc)(stream, s->getCString(), s->getLength());
922
0
  delete s;
923
0
  return ok;
924
0
}
925
926
//------------------------------------------------------------------------
927
928
1.33M
ZxElement::ZxElement(GString *typeA) {
929
1.33M
  type = typeA;
930
1.33M
  attrs = new GHash();
931
1.33M
  firstAttr = lastAttr = NULL;
932
1.33M
}
933
  
934
1.33M
ZxElement::~ZxElement() {
935
1.33M
  delete type;
936
1.33M
  deleteGHash(attrs, ZxAttr);
937
1.33M
}
938
939
698k
bool ZxElement::isElement(const char *typeA) {
940
698k
  return !type->cmp(typeA);
941
698k
}
942
943
138k
ZxAttr *ZxElement::findAttr(const char *attrName) {
944
138k
  return (ZxAttr *)attrs->lookup(attrName);
945
138k
}
946
947
80.4k
void ZxElement::addAttr(ZxAttr *attr) {
948
80.4k
  attrs->add(attr->getName(), attr);
949
80.4k
  if (lastAttr) {
950
7.92k
    lastAttr->next = attr;
951
7.92k
    lastAttr= attr;
952
72.5k
  } else {
953
72.5k
    firstAttr = lastAttr = attr;
954
72.5k
  }
955
80.4k
  attr->parent = this;
956
80.4k
  attr->next = NULL;
957
80.4k
}
958
959
0
bool ZxElement::write(ZxWriteFunc writeFunc, void *stream) {
960
0
  GString *s;
961
0
  ZxAttr *attr;
962
0
  ZxNode *child;
963
0
  bool ok;
964
965
0
  s = new GString("<");
966
0
  s->append(type);
967
0
  for (attr = firstAttr; attr; attr = attr->getNextAttr()) {
968
0
    s->append(" ");
969
0
    s->append(attr->name);
970
0
    s->append("=\"");
971
0
    appendEscapedAttrValue(s, attr->value);
972
0
    s->append("\"");
973
0
  }
974
0
  if ((child = getFirstChild())) {
975
0
    s->append(">");
976
0
  } else {
977
0
    s->append("/>");
978
0
  }
979
0
  ok = (*writeFunc)(stream, s->getCString(), s->getLength());
980
0
  delete s;
981
0
  if (!ok) {
982
0
    return false;
983
0
  }
984
0
  if (child) {
985
0
    for (; child; child = child->getNextChild()) {
986
0
      if (!child->write(writeFunc, stream)) {
987
0
  return false;
988
0
      }
989
0
    }
990
0
    s = new GString();
991
0
    s->append("</");
992
0
    s->append(type);
993
0
    s->append(">");
994
0
    ok = (*writeFunc)(stream, s->getCString(), s->getLength());
995
0
    delete s;
996
0
    if (!ok) {
997
0
      return false;
998
0
    }
999
0
  }
1000
0
  return true;
1001
0
}
1002
1003
0
void ZxElement::appendEscapedAttrValue(GString *out, GString *s) {
1004
0
  char c;
1005
0
  int i;
1006
1007
0
  for (i = 0; i < s->getLength(); ++i) {
1008
0
    c = s->getChar(i);
1009
0
    if (c == '<') {
1010
0
      out->append("&lt;");
1011
0
    } else if (c == '>') {
1012
0
      out->append("&gt;");
1013
0
    } else if (c == '&') {
1014
0
      out->append("&amp;");
1015
0
    } else if (c == '"') {
1016
0
      out->append("&quot;");
1017
0
    } else {
1018
0
      out->append(c);
1019
0
    }
1020
0
  }
1021
0
}
1022
1023
//------------------------------------------------------------------------
1024
1025
80.4k
ZxAttr::ZxAttr(GString *nameA, GString *valueA) {
1026
80.4k
  name = nameA;
1027
80.4k
  value = valueA;
1028
80.4k
  parent = NULL;
1029
80.4k
  next = NULL;
1030
80.4k
}
1031
1032
80.4k
ZxAttr::~ZxAttr() {
1033
80.4k
  delete name;
1034
80.4k
  delete value;
1035
80.4k
}
1036
1037
//------------------------------------------------------------------------
1038
1039
986k
ZxCharData::ZxCharData(GString *dataA, bool parsedA) {
1040
986k
  data = dataA;
1041
986k
  parsed = parsedA;
1042
986k
}
1043
1044
986k
ZxCharData::~ZxCharData() {
1045
986k
  delete data;
1046
986k
}
1047
1048
0
bool ZxCharData::write(ZxWriteFunc writeFunc, void *stream) {
1049
0
  GString *s;
1050
0
  char c;
1051
0
  int i;
1052
0
  bool ok;
1053
1054
0
  s = new GString();
1055
0
  if (parsed) {
1056
0
    for (i = 0; i < data->getLength(); ++i) {
1057
0
      c = data->getChar(i);
1058
0
      if (c == '<') {
1059
0
  s->append("&lt;");
1060
0
      } else if (c == '>') {
1061
0
  s->append("&gt;");
1062
0
      } else if (c == '&') {
1063
0
  s->append("&amp;");
1064
0
      } else {
1065
0
  s->append(c);
1066
0
      }
1067
0
    }
1068
0
  } else {
1069
0
    s->append("<![CDATA[");
1070
0
    s->append(data);
1071
0
    s->append("]]>");
1072
0
  }
1073
0
  ok = (*writeFunc)(stream, s->getCString(), s->getLength());
1074
0
  delete s;
1075
0
  return ok;
1076
0
}