/src/curl/lib/curlx/strparse.c
Line | Count | Source |
1 | | /*************************************************************************** |
2 | | * _ _ ____ _ |
3 | | * Project ___| | | | _ \| | |
4 | | * / __| | | | |_) | | |
5 | | * | (__| |_| | _ <| |___ |
6 | | * \___|\___/|_| \_\_____| |
7 | | * |
8 | | * Copyright (C) Daniel Stenberg, <daniel@haxx.se>, et al. |
9 | | * |
10 | | * This software is licensed as described in the file COPYING, which |
11 | | * you should have received as part of this distribution. The terms |
12 | | * are also available at https://curl.se/docs/copyright.html. |
13 | | * |
14 | | * You may opt to use, copy, modify, merge, publish, distribute and/or sell |
15 | | * copies of the Software, and permit persons to whom the Software is |
16 | | * furnished to do so, under the terms of the COPYING file. |
17 | | * |
18 | | * This software is distributed on an "AS IS" basis, WITHOUT WARRANTY OF ANY |
19 | | * KIND, either express or implied. |
20 | | * |
21 | | * SPDX-License-Identifier: curl |
22 | | * |
23 | | ***************************************************************************/ |
24 | | #include "curlx/strparse.h" |
25 | | |
26 | | void curlx_str_init(struct Curl_str *out) |
27 | 776k | { |
28 | 776k | out->str = NULL; |
29 | 776k | out->len = 0; |
30 | 776k | } |
31 | | |
32 | | void curlx_str_assign(struct Curl_str *out, const char *str, size_t len) |
33 | 15.5k | { |
34 | 15.5k | out->str = str; |
35 | 15.5k | out->len = len; |
36 | 15.5k | } |
37 | | |
38 | | /* remove bytes from the end of the string, never remove more bytes than what |
39 | | the string holds! */ |
40 | | void curlx_str_trim(struct Curl_str *out, size_t len) |
41 | 0 | { |
42 | 0 | DEBUGASSERT(out); |
43 | 0 | DEBUGASSERT(out->len >= len); |
44 | 0 | out->len -= len; |
45 | 0 | } |
46 | | |
47 | | /* Get a word until the first DELIM or end of string. At least one byte long. |
48 | | return non-zero on error. If 'max' is zero, it will always return error. */ |
49 | | int curlx_str_until(const char **linep, struct Curl_str *out, |
50 | | const size_t max, char delim) |
51 | 441k | { |
52 | 441k | const char *s; |
53 | 441k | size_t len = 0; |
54 | 441k | DEBUGASSERT(linep); |
55 | 441k | DEBUGASSERT(*linep); |
56 | 441k | DEBUGASSERT(out); |
57 | 441k | DEBUGASSERT(delim); |
58 | 441k | s = *linep; |
59 | | |
60 | 441k | curlx_str_init(out); |
61 | 8.21M | while(*s && (*s != delim)) { |
62 | 7.76M | s++; |
63 | 7.76M | if(++len > max) { |
64 | 633 | return STRE_BIG; |
65 | 633 | } |
66 | 7.76M | } |
67 | 441k | if(!len) |
68 | 17.7k | return STRE_SHORT; |
69 | 423k | out->str = *linep; |
70 | 423k | out->len = len; |
71 | 423k | *linep = s; /* point to the first byte after the word */ |
72 | 423k | return STRE_OK; |
73 | 441k | } |
74 | | |
75 | | /* Get a word until the first space or end of string. At least one byte long. |
76 | | return non-zero on error */ |
77 | | int curlx_str_word(const char **linep, struct Curl_str *out, const size_t max) |
78 | 194k | { |
79 | 194k | return curlx_str_until(linep, out, max, ' '); |
80 | 194k | } |
81 | | |
82 | | /* Get a word until a newline byte or end of string. At least one byte long. |
83 | | return non-zero on error */ |
84 | | int curlx_str_untilnl(const char **linep, struct Curl_str *out, |
85 | | const size_t max) |
86 | 84.5k | { |
87 | 84.5k | const char *s = *linep; |
88 | 84.5k | size_t len = 0; |
89 | 84.5k | DEBUGASSERT(linep && *linep && out && max); |
90 | | |
91 | 84.5k | curlx_str_init(out); |
92 | 8.89M | while(*s && !ISNEWLINE(*s)) { |
93 | 8.80M | s++; |
94 | 8.80M | if(++len > max) |
95 | 2 | return STRE_BIG; |
96 | 8.80M | } |
97 | 84.5k | if(!len) |
98 | 6.26k | return STRE_SHORT; |
99 | 78.2k | out->str = *linep; |
100 | 78.2k | out->len = len; |
101 | 78.2k | *linep = s; /* point to the first byte after the word */ |
102 | 78.2k | return STRE_OK; |
103 | 84.5k | } |
104 | | |
105 | | /* Get a "quoted" word. Escaped quotes are supported. |
106 | | return non-zero on error */ |
107 | | int curlx_str_quotedword(const char **linep, struct Curl_str *out, |
108 | | const size_t max) |
109 | 6.60k | { |
110 | 6.60k | const char *s = *linep; |
111 | 6.60k | size_t len = 0; |
112 | 6.60k | DEBUGASSERT(linep && *linep && out && max); |
113 | | |
114 | 6.60k | curlx_str_init(out); |
115 | 6.60k | if(*s != '\"') |
116 | 28 | return STRE_BEGQUOTE; |
117 | 6.57k | s++; |
118 | 37.5k | while(*s && (*s != '\"')) { |
119 | 30.9k | if(*s == '\\' && s[1]) { |
120 | 611 | s++; |
121 | 611 | if(++len > max) |
122 | 0 | return STRE_BIG; |
123 | 611 | } |
124 | 30.9k | s++; |
125 | 30.9k | if(++len > max) |
126 | 0 | return STRE_BIG; |
127 | 30.9k | } |
128 | 6.57k | if(*s != '\"') |
129 | 1.60k | return STRE_ENDQUOTE; |
130 | 4.97k | out->str = (*linep) + 1; |
131 | 4.97k | out->len = len; |
132 | 4.97k | *linep = s + 1; |
133 | 4.97k | return STRE_OK; |
134 | 6.57k | } |
135 | | |
136 | | /* Advance over a single character. |
137 | | return non-zero on error */ |
138 | | int curlx_str_single(const char **linep, char byte) |
139 | 6.48M | { |
140 | 6.48M | DEBUGASSERT(linep && *linep); |
141 | 6.48M | if(**linep != byte) |
142 | 5.36M | return STRE_BYTE; |
143 | 1.12M | (*linep)++; /* move over it */ |
144 | 1.12M | return STRE_OK; |
145 | 6.48M | } |
146 | | |
147 | | /* Advance over a single space. |
148 | | return non-zero on error */ |
149 | | int curlx_str_singlespace(const char **linep) |
150 | 194k | { |
151 | 194k | return curlx_str_single(linep, ' '); |
152 | 194k | } |
153 | | |
154 | | /* given an ASCII character and max ascii, return TRUE if valid */ |
155 | | #define valid_digit(x, m) \ |
156 | 41.7M | (((x) >= '0') && ((x) <= (m)) && curlx_hexasciitable[(x) - '0']) |
157 | | |
158 | | /* We use 16 for the zero index (and the necessary bitwise AND in the loop) |
159 | | to be able to have a non-zero value there to make valid_digit() able to |
160 | | use the info */ |
161 | | const unsigned char curlx_hexasciitable[] = { |
162 | | 16, 1, 2, 3, 4, 5, 6, 7, 8, 9, /* 0x30: 0 - 9 */ |
163 | | 0, 0, 0, 0, 0, 0, 0, |
164 | | 10, 11, 12, 13, 14, 15, /* 0x41: A - F */ |
165 | | 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, |
166 | | 10, 11, 12, 13, 14, 15 /* 0x61: a - f */ |
167 | | }; |
168 | | |
169 | | /* no support for 0x prefix nor leading spaces */ |
170 | | static int str_num_base(const char **linep, curl_off_t *nump, curl_off_t max, |
171 | | int base) /* 8, 10 or 16, nothing else */ |
172 | 21.6M | { |
173 | 21.6M | curl_off_t num = 0; |
174 | 21.6M | const char *p; |
175 | 21.6M | int m = (base == 10) ? '9' : /* the largest digit possible */ |
176 | 21.6M | (base == 16) ? 'f' : '7'; |
177 | 21.6M | DEBUGASSERT(linep && *linep && nump); |
178 | 21.6M | DEBUGASSERT((base == 8) || (base == 10) || (base == 16)); |
179 | 21.6M | DEBUGASSERT(max >= 0); /* mostly to catch SIZE_MAX, which is too large */ |
180 | 21.6M | *nump = 0; |
181 | 21.6M | p = *linep; |
182 | 21.6M | if(!valid_digit(*p, m)) |
183 | 11.5M | return STRE_NO_NUM; |
184 | 10.0M | if(max < base) { |
185 | | /* special-case low max scenario because check needs to be different */ |
186 | 0 | do { |
187 | 0 | int n = curlx_hexval(*p++); |
188 | 0 | num = (num * base) + n; |
189 | 0 | if(num > max) |
190 | 0 | return STRE_OVERFLOW; |
191 | 0 | } while(valid_digit(*p, m)); |
192 | 0 | } |
193 | 10.0M | else { |
194 | 20.0M | do { |
195 | 20.0M | int n = curlx_hexval(*p++); |
196 | 20.0M | if(num > ((max - n) / base)) |
197 | 6.58k | return STRE_OVERFLOW; |
198 | 20.0M | num = (num * base) + n; |
199 | 20.0M | } while(valid_digit(*p, m)); |
200 | 10.0M | } |
201 | 10.0M | *nump = num; |
202 | 10.0M | *linep = p; |
203 | 10.0M | return STRE_OK; |
204 | 10.0M | } |
205 | | |
206 | | /* Get an unsigned decimal number with no leading space or minus. Leading |
207 | | zeroes are accepted. return non-zero on error */ |
208 | | int curlx_str_number(const char **linep, curl_off_t *nump, curl_off_t max) |
209 | 21.5M | { |
210 | 21.5M | return str_num_base(linep, nump, max, 10); |
211 | 21.5M | } |
212 | | |
213 | | /* Get an unsigned hexadecimal number with no leading space or minus and no |
214 | | "0x" support. Leading zeroes are accepted. return non-zero on error */ |
215 | | int curlx_str_hex(const char **linep, curl_off_t *nump, curl_off_t max) |
216 | 3.12k | { |
217 | 3.12k | return str_num_base(linep, nump, max, 16); |
218 | 3.12k | } |
219 | | |
220 | | /* Get an unsigned octal number with no leading space or minus and no "0" |
221 | | prefix support. Leading zeroes are accepted. return non-zero on error */ |
222 | | int curlx_str_octal(const char **linep, curl_off_t *nump, curl_off_t max) |
223 | 132k | { |
224 | 132k | return str_num_base(linep, nump, max, 8); |
225 | 132k | } |
226 | | |
227 | | /* |
228 | | * Parse a positive number up to 63-bit number written in ASCII. Skip leading |
229 | | * blanks. No support for prefixes. |
230 | | */ |
231 | | int curlx_str_numblanks(const char **str, curl_off_t *num) |
232 | 9.21k | { |
233 | 9.21k | curlx_str_passblanks(str); |
234 | 9.21k | return curlx_str_number(str, num, CURL_OFF_T_MAX); |
235 | 9.21k | } |
236 | | |
237 | | /* CR or LF |
238 | | return non-zero on error */ |
239 | | int curlx_str_newline(const char **linep) |
240 | 5.75k | { |
241 | 5.75k | DEBUGASSERT(linep && *linep); |
242 | 5.75k | if(ISNEWLINE(**linep)) { |
243 | 5.71k | (*linep)++; |
244 | 5.71k | return STRE_OK; /* yessir */ |
245 | 5.71k | } |
246 | 34 | return STRE_NEWLINE; |
247 | 5.75k | } |
248 | | |
249 | | #ifndef WITHOUT_LIBCURL |
250 | | /* case insensitive compare that the parsed string matches the given string. |
251 | | Returns non-zero on match. */ |
252 | | int curlx_str_casecompare(struct Curl_str *str, const char *check) |
253 | 1.83M | { |
254 | 1.83M | size_t clen = check ? strlen(check) : 0; |
255 | 1.83M | return ((str->len == clen) && curl_strnequal(str->str, check, clen)); |
256 | 1.83M | } |
257 | | #endif |
258 | | |
259 | | /* case sensitive string compare. Returns non-zero on match. */ |
260 | | int curlx_str_cmp(struct Curl_str *str, const char *check) |
261 | 53.3k | { |
262 | 53.3k | if(check) { |
263 | 53.3k | size_t clen = strlen(check); |
264 | 53.3k | return ((str->len == clen) && !strncmp(str->str, check, clen)); |
265 | 53.3k | } |
266 | 0 | return !!(str->len); |
267 | 53.3k | } |
268 | | |
269 | | /* Trim off 'num' number of bytes from the beginning (left side) of the |
270 | | string. If 'num' is larger than the string, return error. */ |
271 | | int curlx_str_nudge(struct Curl_str *str, size_t num) |
272 | 134k | { |
273 | 134k | if(num <= str->len) { |
274 | 134k | str->str += num; |
275 | 134k | str->len -= num; |
276 | 134k | return STRE_OK; |
277 | 134k | } |
278 | 0 | return STRE_OVERFLOW; |
279 | 134k | } |
280 | | |
281 | | /* Get the following character sequence that consists only of bytes not |
282 | | present in the 'reject' string. Like strcspn(). */ |
283 | | int curlx_str_cspn(const char **linep, struct Curl_str *out, |
284 | | const char *reject) |
285 | 1.02M | { |
286 | 1.02M | const char *s = *linep; |
287 | 1.02M | size_t len; |
288 | 1.02M | DEBUGASSERT(linep && *linep); |
289 | | |
290 | 1.02M | len = strcspn(s, reject); |
291 | 1.02M | if(len) { |
292 | 928k | out->str = s; |
293 | 928k | out->len = len; |
294 | 928k | *linep = &s[len]; |
295 | 928k | return STRE_OK; |
296 | 928k | } |
297 | 100k | curlx_str_init(out); |
298 | 100k | return STRE_SHORT; |
299 | 1.02M | } |
300 | | |
301 | | /* remove ISBLANK()s from both ends of the string */ |
302 | | void curlx_str_trimblanks(struct Curl_str *out) |
303 | 894k | { |
304 | 1.02M | while(out->len && ISBLANK(*out->str)) |
305 | 133k | curlx_str_nudge(out, 1); |
306 | | |
307 | | /* trim trailing spaces and tabs */ |
308 | 924k | while(out->len && ISBLANK(out->str[out->len - 1])) |
309 | 30.2k | out->len--; |
310 | 894k | } |
311 | | |
312 | | /* increase the pointer until it has moved over all blanks */ |
313 | | void curlx_str_passblanks(const char **linep) |
314 | 958k | { |
315 | 1.06M | while(ISBLANK(**linep)) |
316 | 108k | (*linep)++; /* move over it */ |
317 | 958k | } |