/src/curl/lib/curlx/strparse.c
Line | Count | Source |
1 | | /*************************************************************************** |
2 | | * _ _ ____ _ |
3 | | * Project ___| | | | _ \| | |
4 | | * / __| | | | |_) | | |
5 | | * | (__| |_| | _ <| |___ |
6 | | * \___|\___/|_| \_\_____| |
7 | | * |
8 | | * Copyright (C) Daniel Stenberg, <daniel@haxx.se>, et al. |
9 | | * |
10 | | * This software is licensed as described in the file COPYING, which |
11 | | * you should have received as part of this distribution. The terms |
12 | | * are also available at https://curl.se/docs/copyright.html. |
13 | | * |
14 | | * You may opt to use, copy, modify, merge, publish, distribute and/or sell |
15 | | * copies of the Software, and permit persons to whom the Software is |
16 | | * furnished to do so, under the terms of the COPYING file. |
17 | | * |
18 | | * This software is distributed on an "AS IS" basis, WITHOUT WARRANTY OF ANY |
19 | | * KIND, either express or implied. |
20 | | * |
21 | | * SPDX-License-Identifier: curl |
22 | | * |
23 | | ***************************************************************************/ |
24 | | #include "curlx/strparse.h" |
25 | | |
26 | | void curlx_str_init(struct Curl_str *out) |
27 | 10.3k | { |
28 | 10.3k | out->str = NULL; |
29 | 10.3k | out->len = 0; |
30 | 10.3k | } |
31 | | |
32 | | void curlx_str_assign(struct Curl_str *out, const char *str, size_t len) |
33 | 0 | { |
34 | 0 | out->str = str; |
35 | 0 | out->len = len; |
36 | 0 | } |
37 | | |
38 | | /* remove bytes from the end of the string, never remove more bytes than what |
39 | | the string holds! */ |
40 | | void curlx_str_trim(struct Curl_str *out, size_t len) |
41 | 0 | { |
42 | 0 | DEBUGASSERT(out); |
43 | 0 | DEBUGASSERT(out->len >= len); |
44 | 0 | out->len -= len; |
45 | 0 | } |
46 | | |
47 | | /* Get a word until the first DELIM or end of string. At least one byte long. |
48 | | return non-zero on error. If 'max' is zero, it will always return error. */ |
49 | | int curlx_str_until(const char **linep, struct Curl_str *out, |
50 | | const size_t max, char delim) |
51 | 4.35k | { |
52 | 4.35k | const char *s; |
53 | 4.35k | size_t len = 0; |
54 | 4.35k | DEBUGASSERT(linep); |
55 | 4.35k | DEBUGASSERT(*linep); |
56 | 4.35k | DEBUGASSERT(out); |
57 | 4.35k | DEBUGASSERT(delim); |
58 | 4.35k | s = *linep; |
59 | | |
60 | 4.35k | curlx_str_init(out); |
61 | 13.8k | while(*s && (*s != delim)) { |
62 | 9.53k | s++; |
63 | 9.53k | if(++len > max) { |
64 | 26 | return STRE_BIG; |
65 | 26 | } |
66 | 9.53k | } |
67 | 4.32k | if(!len) |
68 | 16 | return STRE_SHORT; |
69 | 4.30k | out->str = *linep; |
70 | 4.30k | out->len = len; |
71 | 4.30k | *linep = s; /* point to the first byte after the word */ |
72 | 4.30k | return STRE_OK; |
73 | 4.32k | } |
74 | | |
75 | | /* Get a word until the first space or end of string. At least one byte long. |
76 | | return non-zero on error */ |
77 | | int curlx_str_word(const char **linep, struct Curl_str *out, const size_t max) |
78 | 4.12k | { |
79 | 4.12k | return curlx_str_until(linep, out, max, ' '); |
80 | 4.12k | } |
81 | | |
82 | | /* Get a word until a newline byte or end of string. At least one byte long. |
83 | | return non-zero on error */ |
84 | | int curlx_str_untilnl(const char **linep, struct Curl_str *out, |
85 | | const size_t max) |
86 | 0 | { |
87 | 0 | const char *s = *linep; |
88 | 0 | size_t len = 0; |
89 | 0 | DEBUGASSERT(linep && *linep && out && max); |
90 | |
|
91 | 0 | curlx_str_init(out); |
92 | 0 | while(*s && !ISNEWLINE(*s)) { |
93 | 0 | s++; |
94 | 0 | if(++len > max) |
95 | 0 | return STRE_BIG; |
96 | 0 | } |
97 | 0 | if(!len) |
98 | 0 | return STRE_SHORT; |
99 | 0 | out->str = *linep; |
100 | 0 | out->len = len; |
101 | 0 | *linep = s; /* point to the first byte after the word */ |
102 | 0 | return STRE_OK; |
103 | 0 | } |
104 | | |
105 | | /* Get a "quoted" word. Escaped quotes are supported. |
106 | | return non-zero on error */ |
107 | | int curlx_str_quotedword(const char **linep, struct Curl_str *out, |
108 | | const size_t max) |
109 | 0 | { |
110 | 0 | const char *s = *linep; |
111 | 0 | size_t len = 0; |
112 | 0 | DEBUGASSERT(linep && *linep && out && max); |
113 | |
|
114 | 0 | curlx_str_init(out); |
115 | 0 | if(*s != '\"') |
116 | 0 | return STRE_BEGQUOTE; |
117 | 0 | s++; |
118 | 0 | while(*s && (*s != '\"')) { |
119 | 0 | if(*s == '\\' && s[1]) { |
120 | 0 | s++; |
121 | 0 | if(++len > max) |
122 | 0 | return STRE_BIG; |
123 | 0 | } |
124 | 0 | s++; |
125 | 0 | if(++len > max) |
126 | 0 | return STRE_BIG; |
127 | 0 | } |
128 | 0 | if(*s != '\"') |
129 | 0 | return STRE_ENDQUOTE; |
130 | 0 | out->str = (*linep) + 1; |
131 | 0 | out->len = len; |
132 | 0 | *linep = s + 1; |
133 | 0 | return STRE_OK; |
134 | 0 | } |
135 | | |
136 | | /* Advance over a single character. |
137 | | return non-zero on error */ |
138 | | int curlx_str_single(const char **linep, char byte) |
139 | 47.5k | { |
140 | 47.5k | DEBUGASSERT(linep && *linep); |
141 | 47.5k | if(**linep != byte) |
142 | 12.9k | return STRE_BYTE; |
143 | 34.5k | (*linep)++; /* move over it */ |
144 | 34.5k | return STRE_OK; |
145 | 47.5k | } |
146 | | |
147 | | /* Advance over a single space. |
148 | | return non-zero on error */ |
149 | | int curlx_str_singlespace(const char **linep) |
150 | 4.12k | { |
151 | 4.12k | return curlx_str_single(linep, ' '); |
152 | 4.12k | } |
153 | | |
154 | | /* given an ASCII character and max ascii, return TRUE if valid */ |
155 | | #define valid_digit(x, m) \ |
156 | 51.0k | (((x) >= '0') && ((x) <= (m)) && curlx_hexasciitable[(x) - '0']) |
157 | | |
158 | | /* We use 16 for the zero index (and the necessary bitwise AND in the loop) |
159 | | to be able to have a non-zero value there to make valid_digit() able to |
160 | | use the info */ |
161 | | const unsigned char curlx_hexasciitable[] = { |
162 | | 16, 1, 2, 3, 4, 5, 6, 7, 8, 9, /* 0x30: 0 - 9 */ |
163 | | 0, 0, 0, 0, 0, 0, 0, |
164 | | 10, 11, 12, 13, 14, 15, /* 0x41: A - F */ |
165 | | 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, |
166 | | 10, 11, 12, 13, 14, 15 /* 0x61: a - f */ |
167 | | }; |
168 | | |
169 | | /* no support for 0x prefix nor leading spaces */ |
170 | | static int str_num_base(const char **linep, curl_off_t *nump, curl_off_t max, |
171 | | int base) /* 8, 10 or 16, nothing else */ |
172 | 13.5k | { |
173 | 13.5k | curl_off_t num = 0; |
174 | 13.5k | const char *p; |
175 | 13.5k | int m = (base == 10) ? '9' : /* the largest digit possible */ |
176 | 13.5k | (base == 16) ? 'f' : '7'; |
177 | 13.5k | DEBUGASSERT(linep && *linep && nump); |
178 | 13.5k | DEBUGASSERT((base == 8) || (base == 10) || (base == 16)); |
179 | 13.5k | DEBUGASSERT(max >= 0); /* mostly to catch SIZE_MAX, which is too large */ |
180 | 13.5k | *nump = 0; |
181 | 13.5k | p = *linep; |
182 | 13.5k | if(!valid_digit(*p, m)) |
183 | 196 | return STRE_NO_NUM; |
184 | 13.3k | if(max < base) { |
185 | | /* special-case low max scenario because check needs to be different */ |
186 | 0 | do { |
187 | 0 | int n = curlx_hexval(*p++); |
188 | 0 | num = (num * base) + n; |
189 | 0 | if(num > max) |
190 | 0 | return STRE_OVERFLOW; |
191 | 0 | } while(valid_digit(*p, m)); |
192 | 0 | } |
193 | 13.3k | else { |
194 | 37.8k | do { |
195 | 37.8k | int n = curlx_hexval(*p++); |
196 | 37.8k | if(num > ((max - n) / base)) |
197 | 297 | return STRE_OVERFLOW; |
198 | 37.5k | num = (num * base) + n; |
199 | 37.5k | } while(valid_digit(*p, m)); |
200 | 13.3k | } |
201 | 13.0k | *nump = num; |
202 | 13.0k | *linep = p; |
203 | 13.0k | return STRE_OK; |
204 | 13.3k | } |
205 | | |
206 | | /* Get an unsigned decimal number with no leading space or minus. Leading |
207 | | zeroes are accepted. return non-zero on error */ |
208 | | int curlx_str_number(const char **linep, curl_off_t *nump, curl_off_t max) |
209 | 13.5k | { |
210 | 13.5k | return str_num_base(linep, nump, max, 10); |
211 | 13.5k | } |
212 | | |
213 | | /* Get an unsigned hexadecimal number with no leading space or minus and no |
214 | | "0x" support. Leading zeroes are accepted. return non-zero on error */ |
215 | | int curlx_str_hex(const char **linep, curl_off_t *nump, curl_off_t max) |
216 | 0 | { |
217 | 0 | return str_num_base(linep, nump, max, 16); |
218 | 0 | } |
219 | | |
220 | | /* Get an unsigned octal number with no leading space or minus and no "0" |
221 | | prefix support. Leading zeroes are accepted. return non-zero on error */ |
222 | | int curlx_str_octal(const char **linep, curl_off_t *nump, curl_off_t max) |
223 | 0 | { |
224 | 0 | return str_num_base(linep, nump, max, 8); |
225 | 0 | } |
226 | | |
227 | | /* |
228 | | * Parse a positive number up to 63-bit number written in ASCII. Skip leading |
229 | | * blanks. No support for prefixes. |
230 | | */ |
231 | | int curlx_str_numblanks(const char **str, curl_off_t *num) |
232 | 0 | { |
233 | 0 | curlx_str_passblanks(str); |
234 | 0 | return curlx_str_number(str, num, CURL_OFF_T_MAX); |
235 | 0 | } |
236 | | |
237 | | /* CR or LF |
238 | | return non-zero on error */ |
239 | | int curlx_str_newline(const char **linep) |
240 | 0 | { |
241 | 0 | DEBUGASSERT(linep && *linep); |
242 | 0 | if(ISNEWLINE(**linep)) { |
243 | 0 | (*linep)++; |
244 | 0 | return STRE_OK; /* yessir */ |
245 | 0 | } |
246 | 0 | return STRE_NEWLINE; |
247 | 0 | } |
248 | | |
249 | | #ifndef WITHOUT_LIBCURL |
250 | | /* case insensitive compare that the parsed string matches the given string. |
251 | | Returns non-zero on match. */ |
252 | | int curlx_str_casecompare(struct Curl_str *str, const char *check) |
253 | 63.8k | { |
254 | 63.8k | size_t clen = check ? strlen(check) : 0; |
255 | 63.8k | return ((str->len == clen) && curl_strnequal(str->str, check, clen)); |
256 | 63.8k | } |
257 | | #endif |
258 | | |
259 | | /* case sensitive string compare. Returns non-zero on match. */ |
260 | | int curlx_str_cmp(struct Curl_str *str, const char *check) |
261 | 0 | { |
262 | 0 | if(check) { |
263 | 0 | size_t clen = strlen(check); |
264 | 0 | return ((str->len == clen) && !strncmp(str->str, check, clen)); |
265 | 0 | } |
266 | 0 | return !!(str->len); |
267 | 0 | } |
268 | | |
269 | | /* Trim off 'num' number of bytes from the beginning (left side) of the |
270 | | string. If 'num' is larger than the string, return error. */ |
271 | | int curlx_str_nudge(struct Curl_str *str, size_t num) |
272 | 2.45k | { |
273 | 2.45k | if(num <= str->len) { |
274 | 2.45k | str->str += num; |
275 | 2.45k | str->len -= num; |
276 | 2.45k | return STRE_OK; |
277 | 2.45k | } |
278 | 0 | return STRE_OVERFLOW; |
279 | 2.45k | } |
280 | | |
281 | | /* Get the following character sequence that consists only of bytes not |
282 | | present in the 'reject' string. Like strcspn(). */ |
283 | | int curlx_str_cspn(const char **linep, struct Curl_str *out, |
284 | | const char *reject) |
285 | 35.8k | { |
286 | 35.8k | const char *s = *linep; |
287 | 35.8k | size_t len; |
288 | 35.8k | DEBUGASSERT(linep && *linep); |
289 | | |
290 | 35.8k | len = strcspn(s, reject); |
291 | 35.8k | if(len) { |
292 | 33.2k | out->str = s; |
293 | 33.2k | out->len = len; |
294 | 33.2k | *linep = &s[len]; |
295 | 33.2k | return STRE_OK; |
296 | 33.2k | } |
297 | 2.59k | curlx_str_init(out); |
298 | 2.59k | return STRE_SHORT; |
299 | 35.8k | } |
300 | | |
301 | | /* remove ISBLANK()s from both ends of the string */ |
302 | | void curlx_str_trimblanks(struct Curl_str *out) |
303 | 33.2k | { |
304 | 35.6k | while(out->len && ISBLANK(*out->str)) |
305 | 2.45k | curlx_str_nudge(out, 1); |
306 | | |
307 | | /* trim trailing spaces and tabs */ |
308 | 33.9k | while(out->len && ISBLANK(out->str[out->len - 1])) |
309 | 740 | out->len--; |
310 | 33.2k | } |
311 | | |
312 | | /* increase the pointer until it has moved over all blanks */ |
313 | | void curlx_str_passblanks(const char **linep) |
314 | 4.12k | { |
315 | 4.12k | while(ISBLANK(**linep)) |
316 | 0 | (*linep)++; /* move over it */ |
317 | 4.12k | } |