Coverage Report

Created: 2026-03-31 07:03

next uncovered line (L), next uncovered region (R), next uncovered branch (B)
/src/xpdf-4.06/xpdf/TextString.cc
Line
Count
Source
1
//========================================================================
2
//
3
// TextString.cc
4
//
5
// Copyright 2011-2013 Glyph & Cog, LLC
6
//
7
//========================================================================
8
9
#include <aconf.h>
10
11
#include <string.h>
12
#include "gmem.h"
13
#include "gmempp.h"
14
#include "GString.h"
15
#include "PDFDocEncoding.h"
16
#include "UTF8.h"
17
#include "TextString.h"
18
19
//------------------------------------------------------------------------
20
21
213k
TextString::TextString() {
22
213k
  u = NULL;
23
213k
  len = size = 0;
24
213k
}
25
26
16.5k
TextString::TextString(GString *s) {
27
16.5k
  u = NULL;
28
16.5k
  len = size = 0;
29
16.5k
  append(s);
30
16.5k
}
31
32
2.93k
TextString::TextString(TextString *s) {
33
2.93k
  len = size = s->len;
34
2.93k
  if (len) {
35
1.14k
    u = (Unicode *)gmallocn(size, sizeof(Unicode));
36
1.14k
    memcpy(u, s->u, len * sizeof(Unicode));
37
1.78k
  } else {
38
1.78k
    u = NULL;
39
1.78k
  }
40
2.93k
}
41
42
232k
TextString::~TextString() {
43
232k
  gfree(u);
44
232k
}
45
46
0
TextString *TextString::append(Unicode c) {
47
0
  expand(1);
48
0
  u[len] = c;
49
0
  ++len;
50
0
  return this;
51
0
}
52
53
16.5k
TextString *TextString::append(GString *s) {
54
16.5k
  return insert(len, s);
55
16.5k
}
56
57
21.2k
TextString *TextString::insert(int idx, Unicode c) {
58
21.2k
  if (idx >= 0 && idx <= len) {
59
21.2k
    expand(1);
60
21.2k
    if (idx < len) {
61
21.2k
      memmove(u + idx + 1, u + idx, (len - idx) * sizeof(Unicode));
62
21.2k
    }
63
21.2k
    u[idx] = c;
64
21.2k
    ++len;
65
21.2k
  }
66
21.2k
  return this;
67
21.2k
}
68
69
133k
TextString *TextString::insert(int idx, Unicode *u2, int n) {
70
133k
  if (idx >= 0 && idx <= len) {
71
133k
    expand(n);
72
133k
    if (idx < len) {
73
80.9k
      memmove(u + idx + n, u + idx, (len - idx) * sizeof(Unicode));
74
80.9k
    }
75
133k
    memcpy(u + idx, u2, n * sizeof(Unicode));
76
133k
    len += n;
77
133k
  }
78
133k
  return this;
79
133k
}
80
81
38.3k
TextString *TextString::insert(int idx, GString *s) {
82
38.3k
  Unicode uBuf[100];
83
38.3k
  int n, i;
84
85
38.3k
  if (idx >= 0 && idx <= len) {
86
    // look for a UTF-16BE BOM
87
38.3k
    if ((s->getChar(0) & 0xff) == 0xfe &&
88
14.3k
  (s->getChar(1) & 0xff) == 0xff) {
89
14.0k
      i = 2;
90
14.0k
      n = 0;
91
3.06M
      while (getUTF16BE(s, &i, uBuf + n)) {
92
3.05M
  ++n;
93
3.05M
  if (n == sizeof(uBuf) / sizeof(Unicode)) {
94
25.7k
    insert(idx, uBuf, n);
95
25.7k
    idx += n;
96
25.7k
    n = 0;
97
25.7k
  }
98
3.05M
      }
99
14.0k
      if (n > 0) {
100
13.3k
  insert(idx, uBuf, n);
101
13.3k
      }
102
103
    // look for a UTF-16LE BOM
104
    // (technically, this isn't allowed by the PDF spec, but some
105
    // PDF files use it)
106
24.3k
    } else if ((s->getChar(0) & 0xff) == 0xff &&
107
1.81k
         (s->getChar(1) & 0xff) == 0xfe) {
108
1.45k
      i = 2;
109
1.45k
      n = 0;
110
5.95M
      while (getUTF16LE(s, &i, uBuf + n)) {
111
5.94M
  ++n;
112
5.94M
  if (n == sizeof(uBuf) / sizeof(Unicode)) {
113
58.8k
    insert(idx, uBuf, n);
114
58.8k
    idx += n;
115
58.8k
    n = 0;
116
58.8k
  }
117
5.94M
      }
118
1.45k
      if (n > 0) {
119
1.25k
  insert(idx, uBuf, n);
120
1.25k
      }
121
122
    // look for a UTF-8 BOM
123
22.9k
    } else if ((s->getChar(0) & 0xff) == 0xef &&
124
1.12k
         (s->getChar(1) & 0xff) == 0xbb &&
125
1.00k
         (s->getChar(2) & 0xff) == 0xbf) {
126
962
      i = 3;
127
962
      n = 0;
128
3.41M
      while (getUTF8(s, &i, uBuf + n)) {
129
3.41M
  ++n;
130
3.41M
  if (n == sizeof(uBuf) / sizeof(Unicode)) {
131
33.5k
    insert(idx, uBuf, n);
132
33.5k
    idx += n;
133
33.5k
    n = 0;
134
33.5k
  }
135
3.41M
      }
136
962
      if (n > 0) {
137
889
  insert(idx, uBuf, n);
138
889
      }
139
140
    // otherwise, use PDFDocEncoding
141
21.9k
    } else {
142
21.9k
      n = s->getLength();
143
21.9k
      expand(n);
144
21.9k
      if (idx < len) {
145
10.5k
  memmove(u + idx + n, u + idx, (len - idx) * sizeof(Unicode));
146
10.5k
      }
147
30.0M
      for (i = 0; i < n; ++i) {
148
30.0M
  u[idx + i] = pdfDocEncoding[s->getChar(i) & 0xff];
149
30.0M
      }
150
21.9k
      len += n;
151
21.9k
    }
152
38.3k
  }
153
38.3k
  return this;
154
38.3k
}
155
156
176k
void TextString::expand(int delta) {
157
176k
  int newLen;
158
159
176k
  newLen = len + delta;
160
176k
  if (delta > INT_MAX - len) {
161
    // trigger an out-of-memory error
162
0
    size = -1;
163
176k
  } else if (newLen <= size) {
164
147k
    return;
165
147k
  } else if (size > 0 && size <= INT_MAX / 2 && size*2 >= newLen) {
166
11.6k
    size *= 2;
167
17.5k
  } else {
168
17.5k
    size = newLen;
169
17.5k
  }
170
29.1k
  u = (Unicode *)greallocn(u, size, sizeof(Unicode));
171
29.1k
}
172
173
0
GString *TextString::toPDFTextString() {
174
0
  GString *s;
175
0
  GBool useUnicode;
176
0
  int i;
177
178
0
  useUnicode = gFalse;
179
0
  for (i = 0; i < len; ++i) {
180
0
    if (u[i] >= 0x80) {
181
0
      useUnicode = gTrue;
182
0
      break;
183
0
    }
184
0
  }
185
0
  s = new GString();
186
0
  if (useUnicode) {
187
0
    s->append((char)0xfe);
188
0
    s->append((char)0xff);
189
0
    for (i = 0; i < len; ++i) {
190
0
      s->append((char)(u[i] >> 8));
191
0
      s->append((char)u[i]);
192
0
    }
193
0
  } else {
194
0
    for (i = 0; i < len; ++i) {
195
0
      s->append((char)u[i]);
196
0
    }
197
0
  }
198
0
  return s;
199
0
}
200
201
135
GString *TextString::toUTF8() {
202
135
  GString *s = new GString();
203
37.5k
  for (int i = 0; i < len; ++i) {
204
37.4k
    char buf[8];
205
37.4k
    int n = mapUTF8(u[i], buf, sizeof(buf));
206
37.4k
    s->append(buf, n);
207
37.4k
  }
208
135
  return s;
209
135
}