Coverage Report

Created: 2026-02-14 07:20

next uncovered line (L), next uncovered region (R), next uncovered branch (B)
/src/openssl36/crypto/asn1/a_mbstr.c
Line
Count
Source
1
/*
2
 * Copyright 1999-2025 The OpenSSL Project Authors. All Rights Reserved.
3
 *
4
 * Licensed under the Apache License 2.0 (the "License").  You may not use
5
 * this file except in compliance with the License.  You can obtain a copy
6
 * in the file LICENSE in the source distribution or at
7
 * https://www.openssl.org/source/license.html
8
 */
9
10
#include <stdio.h>
11
#include "crypto/ctype.h"
12
#include "internal/cryptlib.h"
13
#include "internal/unicode.h"
14
#include <openssl/asn1.h>
15
16
static int traverse_string(const unsigned char *p, int len, int inform,
17
    int (*rfunc)(unsigned long value, void *in),
18
    void *arg);
19
static int in_utf8(unsigned long value, void *arg);
20
static int out_utf8(unsigned long value, void *arg);
21
static int type_str(unsigned long value, void *arg);
22
static int cpy_asc(unsigned long value, void *arg);
23
static int cpy_bmp(unsigned long value, void *arg);
24
static int cpy_univ(unsigned long value, void *arg);
25
static int cpy_utf8(unsigned long value, void *arg);
26
27
/*
28
 * These functions take a string in UTF8, ASCII or multibyte form and a mask
29
 * of permissible ASN1 string types. It then works out the minimal type
30
 * (using the order Numeric < Printable < IA5 < T61 < BMP < Universal < UTF8)
31
 * and creates a string of the correct type with the supplied data. Yes this is
32
 * horrible: it has to be :-( The 'ncopy' form checks minimum and maximum
33
 * size limits too.
34
 */
35
36
int ASN1_mbstring_copy(ASN1_STRING **out, const unsigned char *in, int len,
37
    int inform, unsigned long mask)
38
9.07M
{
39
9.07M
    return ASN1_mbstring_ncopy(out, in, len, inform, mask, 0, 0);
40
9.07M
}
41
42
int ASN1_mbstring_ncopy(ASN1_STRING **out, const unsigned char *in, int len,
43
    int inform, unsigned long mask,
44
    long minsize, long maxsize)
45
3.04M
{
46
3.04M
    int str_type;
47
3.04M
    int ret;
48
3.04M
    char free_out;
49
3.04M
    int outform, outlen = 0;
50
3.04M
    ASN1_STRING *dest;
51
3.04M
    unsigned char *p;
52
3.04M
    int nchar;
53
3.04M
    int (*cpyfunc)(unsigned long, void *) = NULL;
54
3.04M
    if (len == -1) {
55
0
        size_t len_s = strlen((const char *)in);
56
57
0
        if (len_s >= INT_MAX) {
58
0
            ERR_raise(ERR_LIB_ASN1, ASN1_R_STRING_TOO_LONG);
59
0
            return -1;
60
0
        }
61
0
        len = (int)len_s;
62
0
    }
63
3.04M
    if (!mask)
64
0
        mask = DIRSTRING_TYPE;
65
3.04M
    if (len < 0) {
66
0
        ERR_raise(ERR_LIB_ASN1, ERR_R_PASSED_INVALID_ARGUMENT);
67
0
        return -1;
68
0
    }
69
70
    /* First do a string check and work out the number of characters */
71
3.04M
    switch (inform) {
72
73
257k
    case MBSTRING_BMP:
74
257k
        if (len & 1) {
75
0
            ERR_raise(ERR_LIB_ASN1, ASN1_R_INVALID_BMPSTRING_LENGTH);
76
0
            return -1;
77
0
        }
78
257k
        nchar = len >> 1;
79
257k
        break;
80
81
373k
    case MBSTRING_UNIV:
82
373k
        if (len & 3) {
83
0
            ERR_raise(ERR_LIB_ASN1, ASN1_R_INVALID_UNIVERSALSTRING_LENGTH);
84
0
            return -1;
85
0
        }
86
373k
        nchar = len >> 2;
87
373k
        break;
88
89
717k
    case MBSTRING_UTF8:
90
717k
        nchar = 0;
91
        /* This counts the characters and does utf8 syntax checking */
92
717k
        ret = traverse_string(in, len, MBSTRING_UTF8, in_utf8, &nchar);
93
717k
        if (ret < 0) {
94
5.67k
            ERR_raise(ERR_LIB_ASN1, ASN1_R_INVALID_UTF8STRING);
95
5.67k
            return -1;
96
5.67k
        }
97
711k
        break;
98
99
1.70M
    case MBSTRING_ASC:
100
1.70M
        nchar = len;
101
1.70M
        break;
102
103
0
    default:
104
0
        ERR_raise(ERR_LIB_ASN1, ASN1_R_UNKNOWN_FORMAT);
105
0
        return -1;
106
3.04M
    }
107
108
3.04M
    if ((minsize > 0) && (nchar < minsize)) {
109
0
        ERR_raise_data(ERR_LIB_ASN1, ASN1_R_STRING_TOO_SHORT,
110
0
            "minsize=%ld", minsize);
111
0
        return -1;
112
0
    }
113
114
3.04M
    if ((maxsize > 0) && (nchar > maxsize)) {
115
0
        ERR_raise_data(ERR_LIB_ASN1, ASN1_R_STRING_TOO_LONG,
116
0
            "maxsize=%ld", maxsize);
117
0
        return -1;
118
0
    }
119
120
    /* Now work out minimal type (if any) */
121
3.04M
    if (traverse_string(in, len, inform, type_str, &mask) < 0) {
122
1.49k
        ERR_raise(ERR_LIB_ASN1, ASN1_R_ILLEGAL_CHARACTERS);
123
1.49k
        return -1;
124
1.49k
    }
125
126
    /*
127
     * Now work out output format and string type.
128
     * These checks should be in sync with the checks in type_str.
129
     */
130
3.04M
    outform = MBSTRING_ASC;
131
3.04M
    if (mask & B_ASN1_NUMERICSTRING)
132
0
        str_type = V_ASN1_NUMERICSTRING;
133
3.04M
    else if (mask & B_ASN1_PRINTABLESTRING)
134
0
        str_type = V_ASN1_PRINTABLESTRING;
135
3.04M
    else if (mask & B_ASN1_IA5STRING)
136
0
        str_type = V_ASN1_IA5STRING;
137
3.04M
    else if (mask & B_ASN1_T61STRING)
138
0
        str_type = V_ASN1_T61STRING;
139
3.04M
    else if (mask & B_ASN1_BMPSTRING) {
140
0
        str_type = V_ASN1_BMPSTRING;
141
0
        outform = MBSTRING_BMP;
142
3.04M
    } else if (mask & B_ASN1_UNIVERSALSTRING) {
143
0
        str_type = V_ASN1_UNIVERSALSTRING;
144
0
        outform = MBSTRING_UNIV;
145
3.04M
    } else {
146
3.04M
        str_type = V_ASN1_UTF8STRING;
147
3.04M
        outform = MBSTRING_UTF8;
148
3.04M
    }
149
3.04M
    if (!out)
150
0
        return str_type;
151
3.04M
    if (*out) {
152
3.04M
        free_out = 0;
153
3.04M
        dest = *out;
154
3.04M
        ASN1_STRING_set0(dest, NULL, 0);
155
3.04M
        dest->type = str_type;
156
3.04M
    } else {
157
0
        free_out = 1;
158
0
        dest = ASN1_STRING_type_new(str_type);
159
0
        if (dest == NULL) {
160
0
            ERR_raise(ERR_LIB_ASN1, ERR_R_ASN1_LIB);
161
0
            return -1;
162
0
        }
163
0
        *out = dest;
164
0
    }
165
    /* If both the same type just copy across */
166
3.04M
    if (inform == outform) {
167
711k
        if (!ASN1_STRING_set(dest, in, len)) {
168
0
            if (free_out) {
169
0
                ASN1_STRING_free(dest);
170
0
                *out = NULL;
171
0
            }
172
0
            ERR_raise(ERR_LIB_ASN1, ERR_R_ASN1_LIB);
173
0
            return -1;
174
0
        }
175
711k
        return str_type;
176
711k
    }
177
178
    /* Work out how much space the destination will need */
179
2.32M
    switch (outform) {
180
0
    case MBSTRING_ASC:
181
0
        outlen = nchar;
182
0
        cpyfunc = cpy_asc;
183
0
        break;
184
185
0
    case MBSTRING_BMP:
186
0
        outlen = nchar << 1;
187
0
        cpyfunc = cpy_bmp;
188
0
        break;
189
190
0
    case MBSTRING_UNIV:
191
0
        outlen = nchar << 2;
192
0
        cpyfunc = cpy_univ;
193
0
        break;
194
195
2.32M
    case MBSTRING_UTF8:
196
2.32M
        outlen = 0;
197
2.32M
        ret = traverse_string(in, len, inform, out_utf8, &outlen);
198
2.32M
        if (ret < 0) {
199
0
            ERR_raise(ERR_LIB_ASN1, ASN1_R_INVALID_UTF8STRING);
200
0
            return -1;
201
0
        }
202
2.32M
        cpyfunc = cpy_utf8;
203
2.32M
        break;
204
2.32M
    }
205
2.32M
    if ((p = OPENSSL_malloc(outlen + 1)) == NULL) {
206
0
        if (free_out) {
207
0
            ASN1_STRING_free(dest);
208
0
            *out = NULL;
209
0
        }
210
0
        return -1;
211
0
    }
212
2.32M
    dest->length = outlen;
213
2.32M
    dest->data = p;
214
2.32M
    p[outlen] = 0;
215
2.32M
    traverse_string(in, len, inform, cpyfunc, &p);
216
2.32M
    return str_type;
217
2.32M
}
218
219
/*
220
 * This function traverses a string and passes the value of each character to
221
 * an optional function along with a void * argument.
222
 */
223
224
static int traverse_string(const unsigned char *p, int len, int inform,
225
    int (*rfunc)(unsigned long value, void *in),
226
    void *arg)
227
25.4M
{
228
25.4M
    unsigned long value;
229
25.4M
    int ret;
230
1.51G
    while (len) {
231
1.49G
        if (inform == MBSTRING_ASC) {
232
1.42G
            value = *p++;
233
1.42G
            len--;
234
1.42G
        } else if (inform == MBSTRING_BMP) {
235
46.4M
            value = *p++ << 8;
236
46.4M
            value |= *p++;
237
46.4M
            len -= 2;
238
46.4M
        } else if (inform == MBSTRING_UNIV) {
239
182k
            value = ((unsigned long)*p++) << 24;
240
182k
            value |= ((unsigned long)*p++) << 16;
241
182k
            value |= *p++ << 8;
242
182k
            value |= *p++;
243
182k
            len -= 4;
244
18.0M
        } else {
245
18.0M
            ret = UTF8_getc(p, len, &value);
246
18.0M
            if (ret < 0)
247
22.3k
                return -1;
248
17.9M
            len -= ret;
249
17.9M
            p += ret;
250
17.9M
        }
251
1.49G
        if (rfunc) {
252
1.49G
            ret = rfunc(value, arg);
253
1.49G
            if (ret <= 0)
254
3.93k
                return ret;
255
1.49G
        }
256
1.49G
    }
257
25.4M
    return 1;
258
25.4M
}
259
260
/* Various utility functions for traverse_string */
261
262
/* Just count number of characters */
263
264
static int in_utf8(unsigned long value, void *arg)
265
9.78M
{
266
9.78M
    int *nchar;
267
268
9.78M
    if (!is_unicode_valid(value))
269
0
        return -2;
270
9.78M
    nchar = arg;
271
9.78M
    (*nchar)++;
272
9.78M
    return 1;
273
9.78M
}
274
275
/* Determine size of output as a UTF8 String */
276
277
static int out_utf8(unsigned long value, void *arg)
278
490M
{
279
490M
    int *outlen, len;
280
281
490M
    len = UTF8_putc(NULL, -1, value);
282
490M
    if (len <= 0)
283
0
        return len;
284
490M
    outlen = arg;
285
490M
    *outlen += len;
286
490M
    return 1;
287
490M
}
288
289
/*
290
 * Determine the "type" of a string: check each character against a supplied
291
 * "mask".
292
 */
293
294
static int type_str(unsigned long value, void *arg)
295
499M
{
296
499M
    unsigned long usable_types = *((unsigned long *)arg);
297
499M
    unsigned long types = usable_types;
298
499M
    const int native = value > INT_MAX ? INT_MAX : ossl_fromascii(value);
299
300
    /*
301
     * Clear out all the types which are not checked later. If any of those
302
     * is present in the mask, then the UTF8 type will be added and checked
303
     * below.
304
     */
305
499M
    types &= B_ASN1_NUMERICSTRING | B_ASN1_PRINTABLESTRING
306
499M
        | B_ASN1_IA5STRING | B_ASN1_T61STRING | B_ASN1_BMPSTRING
307
499M
        | B_ASN1_UNIVERSALSTRING | B_ASN1_UTF8STRING;
308
309
    /*
310
     * If any other types were in the input mask, they're effectively treated
311
     * as UTF8
312
     */
313
499M
    if (types != usable_types)
314
0
        types |= B_ASN1_UTF8STRING;
315
316
    /*
317
     * These checks should be in sync with ASN1_mbstring_ncopy.
318
     */
319
499M
    if ((types & B_ASN1_NUMERICSTRING) && !(ossl_isdigit(native) || native == ' '))
320
0
        types &= ~B_ASN1_NUMERICSTRING;
321
499M
    if ((types & B_ASN1_PRINTABLESTRING) && !ossl_isasn1print(native))
322
0
        types &= ~B_ASN1_PRINTABLESTRING;
323
499M
    if ((types & B_ASN1_IA5STRING) && !ossl_isascii(native))
324
0
        types &= ~B_ASN1_IA5STRING;
325
499M
    if ((types & B_ASN1_T61STRING) && (value > 0xff))
326
0
        types &= ~B_ASN1_T61STRING;
327
499M
    if ((types & B_ASN1_BMPSTRING) && (value > 0xffff))
328
0
        types &= ~B_ASN1_BMPSTRING;
329
499M
    if ((types & B_ASN1_UTF8STRING) && !is_unicode_valid(value))
330
3.93k
        types &= ~B_ASN1_UTF8STRING;
331
499M
    if (!types)
332
3.93k
        return -1;
333
499M
    *((unsigned long *)arg) = types;
334
499M
    return 1;
335
499M
}
336
337
/* Copy one byte per character ASCII like strings */
338
339
static int cpy_asc(unsigned long value, void *arg)
340
0
{
341
0
    unsigned char **p, *q;
342
0
    p = arg;
343
0
    q = *p;
344
0
    *q = (unsigned char)value;
345
0
    (*p)++;
346
0
    return 1;
347
0
}
348
349
/* Copy two byte per character BMPStrings */
350
351
static int cpy_bmp(unsigned long value, void *arg)
352
0
{
353
0
    unsigned char **p, *q;
354
0
    p = arg;
355
0
    q = *p;
356
0
    *q++ = (unsigned char)((value >> 8) & 0xff);
357
0
    *q = (unsigned char)(value & 0xff);
358
0
    *p += 2;
359
0
    return 1;
360
0
}
361
362
/* Copy four byte per character UniversalStrings */
363
364
static int cpy_univ(unsigned long value, void *arg)
365
0
{
366
0
    unsigned char **p, *q;
367
0
    p = arg;
368
0
    q = *p;
369
0
    *q++ = (unsigned char)((value >> 24) & 0xff);
370
0
    *q++ = (unsigned char)((value >> 16) & 0xff);
371
0
    *q++ = (unsigned char)((value >> 8) & 0xff);
372
0
    *q = (unsigned char)(value & 0xff);
373
0
    *p += 4;
374
0
    return 1;
375
0
}
376
377
/* Copy to a UTF8String */
378
379
static int cpy_utf8(unsigned long value, void *arg)
380
490M
{
381
490M
    unsigned char **p;
382
490M
    int ret;
383
490M
    p = arg;
384
    /* We already know there is enough room so pass 0xff as the length */
385
490M
    ret = UTF8_putc(*p, 0xff, value);
386
490M
    if (ret < 0)
387
0
        return ret;
388
490M
    *p += ret;
389
490M
    return 1;
390
490M
}