Coverage Report

Created: 2025-08-26 06:31

/src/FreeRDP/winpr/libwinpr/crt/unicode_builtin.c
Line
Count
Source (jump to first uncovered line)
1
/*
2
 * Copyright 2001-2004 Unicode, Inc.
3
 *
4
 * Disclaimer
5
 *
6
 * This source code is provided as is by Unicode, Inc. No claims are
7
 * made as to fitness for any particular purpose. No warranties of any
8
 * kind are expressed or implied. The recipient agrees to determine
9
 * applicability of information provided. If this file has been
10
 * purchased on magnetic or optical media from Unicode, Inc., the
11
 * sole remedy for any claim will be exchange of defective media
12
 * within 90 days of receipt.
13
 *
14
 * Limitations on Rights to Redistribute This Code
15
 *
16
 * Unicode, Inc. hereby grants the right to freely use the information
17
 * supplied in this file in the creation of products supporting the
18
 * Unicode Standard, and to make copies of this file in any form
19
 * for internal or external distribution as long as this notice
20
 * remains attached.
21
 */
22
23
/* ---------------------------------------------------------------------
24
25
Conversions between UTF32, UTF-16, and UTF-8. Source code file.
26
Author: Mark E. Davis, 1994.
27
Rev History: Rick McGowan, fixes & updates May 2001.
28
Sept 2001: fixed const & error conditions per
29
mods suggested by S. Parent & A. Lillich.
30
June 2002: Tim Dodd added detection and handling of incomplete
31
source sequences, enhanced error detection, added casts
32
to eliminate compiler warnings.
33
July 2003: slight mods to back out aggressive FFFE detection.
34
Jan 2004: updated switches in from-UTF8 conversions.
35
Oct 2004: updated to use UNI_MAX_LEGAL_UTF32 in UTF-32 conversions.
36
37
See the header file "utf.h" for complete documentation.
38
39
------------------------------------------------------------------------ */
40
41
#include <winpr/wtypes.h>
42
#include <winpr/string.h>
43
#include <winpr/assert.h>
44
#include <winpr/cast.h>
45
46
#include "unicode.h"
47
48
#include "../log.h"
49
#define TAG WINPR_TAG("unicode")
50
51
/*
52
 * Character Types:
53
 *
54
 * UTF8:    uint8_t   8 bits
55
 * UTF16: uint16_t  16 bits
56
 * UTF32: uint32_t  32 bits
57
 */
58
59
/* Some fundamental constants */
60
0
#define UNI_REPLACEMENT_CHAR (uint32_t)0x0000FFFD
61
0
#define UNI_MAX_BMP (uint32_t)0x0000FFFF
62
0
#define UNI_MAX_UTF16 (uint32_t)0x0010FFFF
63
#define UNI_MAX_UTF32 (uint32_t)0x7FFFFFFF
64
#define UNI_MAX_LEGAL_UTF32 (uint32_t)0x0010FFFF
65
66
typedef enum
67
{
68
  conversionOK,    /* conversion successful */
69
  sourceExhausted, /* partial character in source, but hit end */
70
  targetExhausted, /* insuff. room in target for conversion */
71
  sourceIllegal    /* source sequence is illegal/malformed */
72
} ConversionResult;
73
74
typedef enum
75
{
76
  strictConversion = 0,
77
  lenientConversion
78
} ConversionFlags;
79
80
static const int halfShift = 10; /* used for shifting by 10 bits */
81
82
static const uint32_t halfBase = 0x0010000UL;
83
static const uint32_t halfMask = 0x3FFUL;
84
85
0
#define UNI_SUR_HIGH_START (uint32_t)0xD800
86
0
#define UNI_SUR_HIGH_END (uint32_t)0xDBFF
87
0
#define UNI_SUR_LOW_START (uint32_t)0xDC00
88
0
#define UNI_SUR_LOW_END (uint32_t)0xDFFF
89
90
/* --------------------------------------------------------------------- */
91
92
/*
93
 * Index into the table below with the first byte of a UTF-8 sequence to
94
 * get the number of trailing bytes that are supposed to follow it.
95
 * Note that *legal* UTF-8 values can't have 4 or 5-bytes. The table is
96
 * left as-is for anyone who may want to do such conversion, which was
97
 * allowed in earlier algorithms.
98
 */
99
static const char trailingBytesForUTF8[256] = {
100
  0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
101
  0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
102
  0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
103
  0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
104
  0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
105
  0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
106
  1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
107
  2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 3, 3, 3, 3, 3, 3, 3, 3, 4, 4, 4, 4, 5, 5, 5, 5
108
};
109
110
/*
111
 * Magic values subtracted from a buffer value during UTF8 conversion.
112
 * This table contains as many values as there might be trailing bytes
113
 * in a UTF-8 sequence.
114
 */
115
static const uint32_t offsetsFromUTF8[6] = { 0x00000000UL, 0x00003080UL, 0x000E2080UL,
116
                                           0x03C82080UL, 0xFA082080UL, 0x82082080UL };
117
118
/*
119
 * Once the bits are split out into bytes of UTF-8, this is a mask OR-ed
120
 * into the first byte, depending on how many bytes follow.  There are
121
 * as many entries in this table as there are UTF-8 sequence types.
122
 * (I.e., one byte sequence, two byte... etc.). Remember that sequence
123
 * for *legal* UTF-8 will be 4 or fewer bytes total.
124
 */
125
static const uint8_t firstByteMark[7] = { 0x00, 0x00, 0xC0, 0xE0, 0xF0, 0xF8, 0xFC };
126
127
/* We always need UTF-16LE, even on big endian systems! */
128
static WCHAR setWcharFrom(WCHAR w)
129
0
{
130
#if defined(__BIG_ENDIAN__)
131
  union
132
  {
133
    WCHAR w;
134
    char c[2];
135
  } cnv;
136
137
  cnv.w = w;
138
  const char c = cnv.c[0];
139
  cnv.c[0] = cnv.c[1];
140
  cnv.c[1] = c;
141
  return cnv.w;
142
#else
143
0
  return w;
144
0
#endif
145
0
}
146
147
/* --------------------------------------------------------------------- */
148
149
/* The interface converts a whole buffer to avoid function-call overhead.
150
 * Constants have been gathered. Loops & conditionals have been removed as
151
 * much as possible for efficiency, in favor of drop-through switches.
152
 * (See "Note A" at the bottom of the file for equivalent code.)
153
 * If your compiler supports it, the "isLegalUTF8" call can be turned
154
 * into an inline function.
155
 */
156
157
/* --------------------------------------------------------------------- */
158
159
static ConversionResult winpr_ConvertUTF16toUTF8_Internal(const uint16_t** sourceStart,
160
                                                          const uint16_t* sourceEnd,
161
                                                          uint8_t** targetStart,
162
                                                          const uint8_t* targetEnd,
163
                                                          ConversionFlags flags)
164
0
{
165
0
  bool computeLength = (!targetEnd) ? true : false;
166
0
  const uint16_t* source = *sourceStart;
167
0
  uint8_t* target = *targetStart;
168
0
  ConversionResult result = conversionOK;
169
170
0
  while (source < sourceEnd)
171
0
  {
172
0
    uint32_t ch = 0;
173
0
    unsigned short bytesToWrite = 0;
174
0
    const uint32_t byteMask = 0xBF;
175
0
    const uint32_t byteMark = 0x80;
176
0
    const uint16_t* oldSource =
177
0
        source; /* In case we have to back up because of target overflow. */
178
179
0
    ch = setWcharFrom(*source++);
180
181
    /* If we have a surrogate pair, convert to UTF32 first. */
182
0
    if (ch >= UNI_SUR_HIGH_START && ch <= UNI_SUR_HIGH_END)
183
0
    {
184
      /* If the 16 bits following the high surrogate are in the source buffer... */
185
0
      if (source < sourceEnd)
186
0
      {
187
0
        uint32_t ch2 = setWcharFrom(*source);
188
189
        /* If it's a low surrogate, convert to UTF32. */
190
0
        if (ch2 >= UNI_SUR_LOW_START && ch2 <= UNI_SUR_LOW_END)
191
0
        {
192
0
          ch = ((ch - UNI_SUR_HIGH_START) << halfShift) + (ch2 - UNI_SUR_LOW_START) +
193
0
               halfBase;
194
0
          ++source;
195
0
        }
196
0
        else if (flags == strictConversion)
197
0
        {
198
          /* it's an unpaired high surrogate */
199
0
          --source; /* return to the illegal value itself */
200
0
          result = sourceIllegal;
201
0
          break;
202
0
        }
203
0
      }
204
0
      else
205
0
      {
206
        /* We don't have the 16 bits following the high surrogate. */
207
0
        --source; /* return to the high surrogate */
208
0
        result = sourceExhausted;
209
0
        break;
210
0
      }
211
0
    }
212
0
    else if (flags == strictConversion)
213
0
    {
214
      /* UTF-16 surrogate values are illegal in UTF-32 */
215
0
      if (ch >= UNI_SUR_LOW_START && ch <= UNI_SUR_LOW_END)
216
0
      {
217
0
        --source; /* return to the illegal value itself */
218
0
        result = sourceIllegal;
219
0
        break;
220
0
      }
221
0
    }
222
223
    /* Figure out how many bytes the result will require */
224
0
    if (ch < (uint32_t)0x80)
225
0
    {
226
0
      bytesToWrite = 1;
227
0
    }
228
0
    else if (ch < (uint32_t)0x800)
229
0
    {
230
0
      bytesToWrite = 2;
231
0
    }
232
0
    else if (ch < (uint32_t)0x10000)
233
0
    {
234
0
      bytesToWrite = 3;
235
0
    }
236
0
    else if (ch < (uint32_t)0x110000)
237
0
    {
238
0
      bytesToWrite = 4;
239
0
    }
240
0
    else
241
0
    {
242
0
      bytesToWrite = 3;
243
0
      ch = UNI_REPLACEMENT_CHAR;
244
0
    }
245
246
0
    target += bytesToWrite;
247
248
0
    if ((target > targetEnd) && (!computeLength))
249
0
    {
250
0
      source = oldSource; /* Back up source pointer! */
251
0
      target -= bytesToWrite;
252
0
      result = targetExhausted;
253
0
      break;
254
0
    }
255
256
0
    if (!computeLength)
257
0
    {
258
0
      switch (bytesToWrite)
259
0
      {
260
          /* note: everything falls through. */
261
0
        case 4:
262
0
          *--target = (uint8_t)((ch | byteMark) & byteMask);
263
0
          ch >>= 6;
264
          /* fallthrough */
265
0
          WINPR_FALLTHROUGH
266
0
        case 3:
267
0
          *--target = (uint8_t)((ch | byteMark) & byteMask);
268
0
          ch >>= 6;
269
          /* fallthrough */
270
0
          WINPR_FALLTHROUGH
271
272
0
        case 2:
273
0
          *--target = (uint8_t)((ch | byteMark) & byteMask);
274
0
          ch >>= 6;
275
          /* fallthrough */
276
0
          WINPR_FALLTHROUGH
277
278
0
        case 1:
279
0
          *--target = (uint8_t)(ch | firstByteMark[bytesToWrite]);
280
0
          break;
281
0
        default:
282
0
          return sourceIllegal;
283
0
      }
284
0
    }
285
0
    else
286
0
    {
287
0
      switch (bytesToWrite)
288
0
      {
289
          /* note: everything falls through. */
290
0
        case 4:
291
0
          --target;
292
          /* fallthrough */
293
0
          WINPR_FALLTHROUGH
294
295
0
        case 3:
296
0
          --target;
297
          /* fallthrough */
298
0
          WINPR_FALLTHROUGH
299
300
0
        case 2:
301
0
          --target;
302
          /* fallthrough */
303
0
          WINPR_FALLTHROUGH
304
305
0
        case 1:
306
0
          --target;
307
0
          break;
308
0
        default:
309
0
          return sourceIllegal;
310
0
      }
311
0
    }
312
313
0
    target += bytesToWrite;
314
0
  }
315
316
0
  *sourceStart = source;
317
0
  *targetStart = target;
318
0
  return result;
319
0
}
320
321
/* --------------------------------------------------------------------- */
322
323
/*
324
 * Utility routine to tell whether a sequence of bytes is legal UTF-8.
325
 * This must be called with the length pre-determined by the first byte.
326
 * If not calling this from ConvertUTF8to*, then the length can be set by:
327
 *  length = trailingBytesForUTF8[*source]+1;
328
 * and the sequence is illegal right away if there aren't that many bytes
329
 * available.
330
 * If presented with a length > 4, this returns false.  The Unicode
331
 * definition of UTF-8 goes up to 4-byte sequences.
332
 */
333
334
static bool isLegalUTF8(const uint8_t* source, int length)
335
0
{
336
0
  uint8_t a = 0;
337
0
  const uint8_t* srcptr = source + length;
338
339
0
  switch (length)
340
0
  {
341
0
    default:
342
0
      return false;
343
344
      /* Everything else falls through when "true"... */
345
0
    case 4:
346
0
      if ((a = (*--srcptr)) < 0x80 || a > 0xBF)
347
0
        return false;
348
      /* fallthrough */
349
0
      WINPR_FALLTHROUGH
350
351
0
    case 3:
352
0
      if ((a = (*--srcptr)) < 0x80 || a > 0xBF)
353
0
        return false;
354
      /* fallthrough */
355
0
      WINPR_FALLTHROUGH
356
357
0
    case 2:
358
0
      if ((a = (*--srcptr)) > 0xBF)
359
0
        return false;
360
361
0
      switch (*source)
362
0
      {
363
          /* no fall-through in this inner switch */
364
0
        case 0xE0:
365
0
          if (a < 0xA0)
366
0
            return false;
367
368
0
          break;
369
370
0
        case 0xED:
371
0
          if (a > 0x9F)
372
0
            return false;
373
374
0
          break;
375
376
0
        case 0xF0:
377
0
          if (a < 0x90)
378
0
            return false;
379
380
0
          break;
381
382
0
        case 0xF4:
383
0
          if (a > 0x8F)
384
0
            return false;
385
386
0
          break;
387
388
0
        default:
389
0
          if (a < 0x80)
390
0
            return false;
391
0
          break;
392
0
      }
393
      /* fallthrough */
394
0
      WINPR_FALLTHROUGH
395
396
0
    case 1:
397
0
      if (*source >= 0x80 && *source < 0xC2)
398
0
        return false;
399
0
  }
400
401
0
  if (*source > 0xF4)
402
0
    return false;
403
404
0
  return true;
405
0
}
406
407
/* --------------------------------------------------------------------- */
408
409
static ConversionResult winpr_ConvertUTF8toUTF16_Internal(const uint8_t** sourceStart,
410
                                                          const uint8_t* sourceEnd,
411
                                                          uint16_t** targetStart,
412
                                                          const uint16_t* targetEnd,
413
                                                          ConversionFlags flags)
414
0
{
415
0
  bool computeLength = (!targetEnd) ? true : false;
416
0
  ConversionResult result = conversionOK;
417
0
  const uint8_t* source = *sourceStart;
418
0
  uint16_t* target = *targetStart;
419
420
0
  while (source < sourceEnd)
421
0
  {
422
0
    uint32_t ch = 0;
423
0
    unsigned short extraBytesToRead =
424
0
        WINPR_ASSERTING_INT_CAST(unsigned short, trailingBytesForUTF8[*source]);
425
426
0
    if ((source + extraBytesToRead) >= sourceEnd)
427
0
    {
428
0
      result = sourceExhausted;
429
0
      break;
430
0
    }
431
432
    /* Do this check whether lenient or strict */
433
0
    if (!isLegalUTF8(source, extraBytesToRead + 1))
434
0
    {
435
0
      result = sourceIllegal;
436
0
      break;
437
0
    }
438
439
    /*
440
     * The cases all fall through. See "Note A" below.
441
     */
442
0
    switch (extraBytesToRead)
443
0
    {
444
0
      case 5:
445
0
        ch += *source++;
446
0
        ch <<= 6; /* remember, illegal UTF-8 */
447
                  /* fallthrough */
448
0
        WINPR_FALLTHROUGH
449
450
0
      case 4:
451
0
        ch += *source++;
452
0
        ch <<= 6; /* remember, illegal UTF-8 */
453
                  /* fallthrough */
454
0
        WINPR_FALLTHROUGH
455
456
0
      case 3:
457
0
        ch += *source++;
458
0
        ch <<= 6;
459
        /* fallthrough */
460
0
        WINPR_FALLTHROUGH
461
462
0
      case 2:
463
0
        ch += *source++;
464
0
        ch <<= 6;
465
        /* fallthrough */
466
0
        WINPR_FALLTHROUGH
467
468
0
      case 1:
469
0
        ch += *source++;
470
0
        ch <<= 6;
471
        /* fallthrough */
472
0
        WINPR_FALLTHROUGH
473
474
0
      case 0:
475
0
        ch += *source++;
476
0
        break;
477
0
      default:
478
0
        return sourceIllegal;
479
0
    }
480
481
0
    ch -= offsetsFromUTF8[extraBytesToRead];
482
483
0
    if ((target >= targetEnd) && (!computeLength))
484
0
    {
485
0
      source -= (extraBytesToRead + 1); /* Back up source pointer! */
486
0
      result = targetExhausted;
487
0
      break;
488
0
    }
489
490
0
    if (ch <= UNI_MAX_BMP)
491
0
    {
492
      /* Target is a character <= 0xFFFF */
493
      /* UTF-16 surrogate values are illegal in UTF-32 */
494
0
      if (ch >= UNI_SUR_HIGH_START && ch <= UNI_SUR_LOW_END)
495
0
      {
496
0
        if (flags == strictConversion)
497
0
        {
498
0
          source -= (extraBytesToRead + 1); /* return to the illegal value itself */
499
0
          result = sourceIllegal;
500
0
          break;
501
0
        }
502
0
        else
503
0
        {
504
0
          if (!computeLength)
505
0
            *target++ = setWcharFrom(UNI_REPLACEMENT_CHAR);
506
0
          else
507
0
            target++;
508
0
        }
509
0
      }
510
0
      else
511
0
      {
512
0
        if (!computeLength)
513
0
          *target++ = setWcharFrom((WCHAR)ch); /* normal case */
514
0
        else
515
0
          target++;
516
0
      }
517
0
    }
518
0
    else if (ch > UNI_MAX_UTF16)
519
0
    {
520
0
      if (flags == strictConversion)
521
0
      {
522
0
        result = sourceIllegal;
523
0
        source -= (extraBytesToRead + 1); /* return to the start */
524
0
        break;                            /* Bail out; shouldn't continue */
525
0
      }
526
0
      else
527
0
      {
528
0
        if (!computeLength)
529
0
          *target++ = setWcharFrom(UNI_REPLACEMENT_CHAR);
530
0
        else
531
0
          target++;
532
0
      }
533
0
    }
534
0
    else
535
0
    {
536
      /* target is a character in range 0xFFFF - 0x10FFFF. */
537
0
      if ((target + 1 >= targetEnd) && (!computeLength))
538
0
      {
539
0
        source -= (extraBytesToRead + 1); /* Back up source pointer! */
540
0
        result = targetExhausted;
541
0
        break;
542
0
      }
543
544
0
      ch -= halfBase;
545
546
0
      if (!computeLength)
547
0
      {
548
0
        *target++ = setWcharFrom((WCHAR)((ch >> halfShift) + UNI_SUR_HIGH_START));
549
0
        *target++ = setWcharFrom((WCHAR)((ch & halfMask) + UNI_SUR_LOW_START));
550
0
      }
551
0
      else
552
0
      {
553
0
        target++;
554
0
        target++;
555
0
      }
556
0
    }
557
0
  }
558
559
0
  *sourceStart = source;
560
0
  *targetStart = target;
561
0
  return result;
562
0
}
563
564
/**
565
 * WinPR built-in Unicode API
566
 */
567
568
static int winpr_ConvertUTF8toUTF16(const uint8_t* src, int cchSrc, uint16_t* dst, int cchDst)
569
0
{
570
0
  size_t length = 0;
571
0
  uint16_t* dstBeg = NULL;
572
0
  uint16_t* dstEnd = NULL;
573
0
  const uint8_t* srcBeg = NULL;
574
0
  const uint8_t* srcEnd = NULL;
575
0
  ConversionResult result = sourceIllegal;
576
577
0
  if (cchSrc == -1)
578
0
    cchSrc = (int)strnlen((const char*)src, INT32_MAX - 1) + 1;
579
580
0
  srcBeg = src;
581
0
  srcEnd = &src[cchSrc];
582
583
0
  if (cchDst == 0)
584
0
  {
585
0
    result =
586
0
        winpr_ConvertUTF8toUTF16_Internal(&srcBeg, srcEnd, &dstBeg, dstEnd, strictConversion);
587
588
0
    length = dstBeg - (uint16_t*)NULL;
589
0
  }
590
0
  else
591
0
  {
592
0
    dstBeg = dst;
593
0
    dstEnd = &dst[cchDst];
594
595
0
    result =
596
0
        winpr_ConvertUTF8toUTF16_Internal(&srcBeg, srcEnd, &dstBeg, dstEnd, strictConversion);
597
598
0
    length = dstBeg - dst;
599
0
  }
600
601
0
  if (result == targetExhausted)
602
0
  {
603
0
    SetLastError(ERROR_INSUFFICIENT_BUFFER);
604
0
    return 0;
605
0
  }
606
607
0
  return (result == conversionOK) ? WINPR_ASSERTING_INT_CAST(int, length) : 0;
608
0
}
609
610
static int winpr_ConvertUTF16toUTF8(const uint16_t* src, int cchSrc, uint8_t* dst, int cchDst)
611
0
{
612
0
  size_t length = 0;
613
0
  uint8_t* dstBeg = NULL;
614
0
  uint8_t* dstEnd = NULL;
615
0
  const uint16_t* srcBeg = NULL;
616
0
  const uint16_t* srcEnd = NULL;
617
0
  ConversionResult result = sourceIllegal;
618
619
0
  if (cchSrc == -1)
620
0
    cchSrc = (int)_wcsnlen((const WCHAR*)src, INT32_MAX - 1) + 1;
621
622
0
  srcBeg = src;
623
0
  srcEnd = &src[cchSrc];
624
625
0
  if (cchDst == 0)
626
0
  {
627
0
    result =
628
0
        winpr_ConvertUTF16toUTF8_Internal(&srcBeg, srcEnd, &dstBeg, dstEnd, strictConversion);
629
630
0
    length = dstBeg - ((uint8_t*)NULL);
631
0
  }
632
0
  else
633
0
  {
634
0
    dstBeg = dst;
635
0
    dstEnd = &dst[cchDst];
636
637
0
    result =
638
0
        winpr_ConvertUTF16toUTF8_Internal(&srcBeg, srcEnd, &dstBeg, dstEnd, strictConversion);
639
640
0
    length = dstBeg - dst;
641
0
  }
642
643
0
  if (result == targetExhausted)
644
0
  {
645
0
    SetLastError(ERROR_INSUFFICIENT_BUFFER);
646
0
    return 0;
647
0
  }
648
649
0
  return (result == conversionOK) ? WINPR_ASSERTING_INT_CAST(int, length) : 0;
650
0
}
651
652
/* --------------------------------------------------------------------- */
653
654
int int_MultiByteToWideChar(UINT CodePage, DWORD dwFlags, LPCSTR lpMultiByteStr, int cbMultiByte,
655
                            LPWSTR lpWideCharStr, int cchWideChar)
656
0
{
657
0
  size_t cbCharLen = (size_t)cbMultiByte;
658
659
0
  WINPR_UNUSED(dwFlags);
660
661
  /* If cbMultiByte is 0, the function fails */
662
0
  if ((cbMultiByte == 0) || (cbMultiByte < -1))
663
0
    return 0;
664
665
0
  if (cchWideChar < 0)
666
0
    return -1;
667
668
0
  if (cbMultiByte < 0)
669
0
  {
670
0
    const size_t len = strlen(lpMultiByteStr);
671
0
    if (len >= INT32_MAX)
672
0
      return 0;
673
0
    cbCharLen = (int)len + 1;
674
0
  }
675
0
  else
676
0
    cbCharLen = cbMultiByte;
677
678
0
  WINPR_ASSERT(lpMultiByteStr);
679
0
  switch (CodePage)
680
0
  {
681
0
    case CP_ACP:
682
0
    case CP_UTF8:
683
0
      break;
684
685
0
    default:
686
0
      WLog_ERR(TAG, "Unsupported encoding %u", CodePage);
687
0
      return 0;
688
0
  }
689
690
0
  return winpr_ConvertUTF8toUTF16((const uint8_t*)lpMultiByteStr,
691
0
                                  WINPR_ASSERTING_INT_CAST(int, cbCharLen),
692
0
                                  (uint16_t*)lpWideCharStr, cchWideChar);
693
0
}
694
695
int int_WideCharToMultiByte(UINT CodePage, DWORD dwFlags, LPCWSTR lpWideCharStr, int cchWideChar,
696
                            LPSTR lpMultiByteStr, int cbMultiByte, LPCSTR lpDefaultChar,
697
                            LPBOOL lpUsedDefaultChar)
698
0
{
699
0
  size_t cbCharLen = (size_t)cchWideChar;
700
701
0
  WINPR_UNUSED(dwFlags);
702
  /* If cchWideChar is 0, the function fails */
703
0
  if ((cchWideChar == 0) || (cchWideChar < -1))
704
0
    return 0;
705
706
0
  if (cbMultiByte < 0)
707
0
    return -1;
708
709
0
  WINPR_ASSERT(lpWideCharStr);
710
  /* If cchWideChar is -1, the string is null-terminated */
711
0
  if (cchWideChar == -1)
712
0
  {
713
0
    const size_t len = _wcslen(lpWideCharStr);
714
0
    if (len >= INT32_MAX)
715
0
      return 0;
716
0
    cbCharLen = (int)len + 1;
717
0
  }
718
0
  else
719
0
    cbCharLen = cchWideChar;
720
721
  /*
722
   * if cbMultiByte is 0, the function returns the required buffer size
723
   * in bytes for lpMultiByteStr and makes no use of the output parameter itself.
724
   */
725
726
0
  return winpr_ConvertUTF16toUTF8((const uint16_t*)lpWideCharStr,
727
0
                                  WINPR_ASSERTING_INT_CAST(int, cbCharLen),
728
0
                                  (uint8_t*)lpMultiByteStr, cbMultiByte);
729
0
}