/src/FreeRDP/winpr/libwinpr/crt/unicode_builtin.c

Source
/*
 * Copyright 2001-2004 Unicode, Inc.
 *
 * Disclaimer
 *
 * This source code is provided as is by Unicode, Inc. No claims are
 * made as to fitness for any particular purpose. No warranties of any
 * kind are expressed or implied. The recipient agrees to determine
 * applicability of information provided. If this file has been
 * purchased on magnetic or optical media from Unicode, Inc., the
 * sole remedy for any claim will be exchange of defective media
 * within 90 days of receipt.
 *
 * Limitations on Rights to Redistribute This Code
 *
 * Unicode, Inc. hereby grants the right to freely use the information
 * supplied in this file in the creation of products supporting the
 * Unicode Standard, and to make copies of this file in any form
 * for internal or external distribution as long as this notice
 * remains attached.
 */

/* ---------------------------------------------------------------------

Conversions between UTF32, UTF-16, and UTF-8. Source code file.
Author: Mark E. Davis, 1994.
Rev History: Rick McGowan, fixes & updates May 2001.
Sept 2001: fixed const & error conditions per
mods suggested by S. Parent & A. Lillich.
June 2002: Tim Dodd added detection and handling of incomplete
source sequences, enhanced error detection, added casts
to eliminate compiler warnings.
July 2003: slight mods to back out aggressive FFFE detection.
Jan 2004: updated switches in from-UTF8 conversions.
Oct 2004: updated to use UNI_MAX_LEGAL_UTF32 in UTF-32 conversions.

See the header file "utf.h" for complete documentation.

------------------------------------------------------------------------ */

#include <winpr/wtypes.h>
#include <winpr/string.h>
#include <winpr/assert.h>
#include <winpr/cast.h>

#include "unicode.h"

#include "../log.h"
#define TAG WINPR_TAG("unicode")

/*
 * Character Types:
 *
 * UTF8:    uint8_t   8 bits
 * UTF16: uint16_t  16 bits
 * UTF32: uint32_t  32 bits
 */

/* Some fundamental constants */
/*
 * Each expansion is wrapped in an outer pair of parentheses so that the cast
 * stays attached to its literal wherever the macro is used (for example as
 * the operand of sizeof).
 */
#define UNI_REPLACEMENT_CHAR ((uint32_t)0x0000FFFD) /* substituted for unconvertible input */
#define UNI_MAX_BMP ((uint32_t)0x0000FFFF)          /* largest value that fits one UTF-16 unit */
#define UNI_MAX_UTF16 ((uint32_t)0x0010FFFF)        /* largest value a surrogate pair can hold */
#define UNI_MAX_UTF32 ((uint32_t)0x7FFFFFFF)
#define UNI_MAX_LEGAL_UTF32 ((uint32_t)0x0010FFFF)

/*
 * Outcome of one call to the *_Internal converters in this file.
 * The public wrappers map conversionOK to the produced length,
 * targetExhausted to ERROR_INSUFFICIENT_BUFFER, and every other
 * value to a plain 0 return.
 */
typedef enum
{
  conversionOK,    /* conversion successful: the whole source range was consumed */
  sourceExhausted, /* partial character in source, but hit end */
  targetExhausted, /* insufficient room in target for conversion */
  sourceIllegal    /* source sequence is illegal/malformed */
} ConversionResult;

/*
 * Selects how the *_Internal converters treat unpaired surrogates and
 * out-of-range values: strictConversion stops with sourceIllegal, while
 * lenientConversion keeps going (substituting UNI_REPLACEMENT_CHAR in the
 * UTF-8 to UTF-16 direction). The wrappers in this file always pass
 * strictConversion.
 */
typedef enum
{
  strictConversion = 0,
  lenientConversion
} ConversionFlags;

/* Each half of a surrogate pair carries 10 payload bits. */
static const int halfShift = 10; /* used for shifting by 10 bits */

/* Added after combining a surrogate pair, subtracted before splitting a value into one. */
static const uint32_t halfBase = 0x0010000UL;
/* Selects the low 10 bits, i.e. the payload of the low surrogate. */
static const uint32_t halfMask = 0x3FFUL;

/*
 * UTF-16 surrogate ranges: high (leading) units are 0xD800..0xDBFF, low
 * (trailing) units are 0xDC00..0xDFFF. The outer parentheses keep each cast
 * attached to its literal wherever the macro is expanded.
 */
#define UNI_SUR_HIGH_START ((uint32_t)0xD800)
#define UNI_SUR_HIGH_END ((uint32_t)0xDBFF)
#define UNI_SUR_LOW_START ((uint32_t)0xDC00)
#define UNI_SUR_LOW_END ((uint32_t)0xDFFF)

/* --------------------------------------------------------------------- */

/*
 * Index into the table below with the first byte of a UTF-8 sequence to
 * get the number of trailing bytes that are supposed to follow it:
 *
 *   0x00..0xBF -> 0    0xC0..0xDF -> 1    0xE0..0xEF -> 2
 *   0xF0..0xF7 -> 3    0xF8..0xFB -> 4    0xFC..0xFF -> 5
 *
 * Note that *legal* UTF-8 sequences can't have 4 or 5 trailing bytes. The
 * table is left as-is for anyone who may want to do such conversion, which
 * was allowed in earlier algorithms.
 */
static const char trailingBytesForUTF8[256] = {
  0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
  0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
  0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
  0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
  0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
  0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
  1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
  2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 3, 3, 3, 3, 3, 3, 3, 3, 4, 4, 4, 4, 5, 5, 5, 5
};

/*
 * Magic values subtracted from a buffer value during UTF8 conversion.
 * This table contains as many values as there might be trailing bytes
 * in a UTF-8 sequence, and is indexed by the number of trailing bytes.
 *
 * The decoder sums the raw bytes (shifting left by 6 between them), so the
 * lead-byte prefix and the 0x80 marker of every continuation byte end up in
 * the sum; each entry is exactly that surplus. For example, with one
 * trailing byte: (0xC0 << 6) + 0x80 == 0x3080.
 */
static const uint32_t offsetsFromUTF8[6] = { 0x00000000UL, 0x00003080UL, 0x000E2080UL,
                                           0x03C82080UL, 0xFA082080UL, 0x82082080UL };

/*
 * Once the bits are split out into bytes of UTF-8, this is a mask OR-ed
 * into the first byte, depending on how many bytes follow.  There are
 * as many entries in this table as there are UTF-8 sequence types.
 * (I.e., one byte sequence, two byte... etc.). Remember that sequence
 * for *legal* UTF-8 will be 4 or fewer bytes total.
 *
 * The table is indexed by the TOTAL number of bytes in the sequence
 * (index 0 is unused padding, index 1 is plain ASCII with no marker bits).
 */
static const uint8_t firstByteMark[7] = { 0x00, 0x00, 0xC0, 0xE0, 0xF0, 0xF8, 0xFC };

/*
 * Translate one UTF-16 code unit between host byte order and the
 * little-endian layout used for all WCHAR buffers, even on big endian
 * systems. The swap is its own inverse, so the same helper serves both
 * reading and writing. On little-endian builds the value is returned as-is.
 *
 * NOTE(review): like the two-byte swap it replaces, this assumes WCHAR is a
 * 16-bit unsigned type - confirm against the WCHAR typedef.
 */
static WCHAR setWcharFrom(WCHAR w)
{
#if !defined(__BIG_ENDIAN__)
  return w;
#else
  const unsigned int lowByte = (unsigned int)w & 0x00FFu;
  const unsigned int highByte = ((unsigned int)w >> 8) & 0x00FFu;

  return (WCHAR)((lowByte << 8) | highByte);
#endif
}

/* --------------------------------------------------------------------- */

/* The interface converts a whole buffer to avoid function-call overhead.
 * Constants have been gathered. Loops & conditionals have been removed as
 * much as possible for efficiency, in favor of drop-through switches.
 * ("Note A", which shows the equivalent loop-based code, belongs to the
 * original Unicode, Inc. reference implementation and is not reproduced
 * in this file.)
 * If your compiler supports it, the "isLegalUTF8" call can be turned
 * into an inline function.
 */

/* --------------------------------------------------------------------- */

/*
 * Convert a range of UTF-16 code units (little-endian in memory) to UTF-8.
 *
 * sourceStart  in: first code unit to convert
 *              out: first code unit that was NOT consumed
 * sourceEnd    one past the last readable code unit
 * targetStart  in: where to store the first output byte
 *              out: one past the last byte accounted for
 * targetEnd    one past the end of the output buffer; pass NULL to only
 *              count the bytes, in which case nothing is stored and
 *              *targetStart is merely advanced
 * flags        strictConversion stops at unpaired surrogates;
 *              lenientConversion encodes them like any other value
 *
 * Returns conversionOK when the entire source range was converted,
 * sourceExhausted when the source ends after a high surrogate,
 * sourceIllegal for an unpaired surrogate in strict mode, or
 * targetExhausted when the next character does not fit. In every failure
 * case *sourceStart is left on the code unit that could not be handled.
 */
static ConversionResult winpr_ConvertUTF16toUTF8_Internal(const uint16_t** sourceStart,
                                                          const uint16_t* sourceEnd,
                                                          uint8_t** targetStart,
                                                          const uint8_t* targetEnd,
                                                          ConversionFlags flags)
{
  const bool countOnly = (targetEnd == NULL);
  const uint32_t continuationMark = 0x80;
  const uint32_t continuationMask = 0xBF;
  const uint16_t* in = *sourceStart;
  uint8_t* out = *targetStart;
  ConversionResult status = conversionOK;

  while (in < sourceEnd)
  {
    /* Every early exit below rewinds to the start of the current character. */
    const uint16_t* const unitStart = in;
    uint32_t cp = setWcharFrom(*in++);
    unsigned short nbytes = 0;

    if ((cp >= UNI_SUR_HIGH_START) && (cp <= UNI_SUR_HIGH_END))
    {
      /* A high surrogate needs the following code unit to form a pair. */
      if (in >= sourceEnd)
      {
        in = unitStart;
        status = sourceExhausted;
        break;
      }

      const uint32_t low = setWcharFrom(*in);

      if ((low >= UNI_SUR_LOW_START) && (low <= UNI_SUR_LOW_END))
      {
        cp = ((cp - UNI_SUR_HIGH_START) << halfShift) + (low - UNI_SUR_LOW_START) + halfBase;
        in++;
      }
      else if (flags == strictConversion)
      {
        /* unpaired high surrogate */
        in = unitStart;
        status = sourceIllegal;
        break;
      }
    }
    else if ((flags == strictConversion) && (cp >= UNI_SUR_LOW_START) &&
             (cp <= UNI_SUR_LOW_END))
    {
      /* low surrogate without a preceding high surrogate */
      in = unitStart;
      status = sourceIllegal;
      break;
    }

    /* Size of the UTF-8 encoding for this value. */
    if (cp < (uint32_t)0x80)
      nbytes = 1;
    else if (cp < (uint32_t)0x800)
      nbytes = 2;
    else if (cp < (uint32_t)0x10000)
      nbytes = 3;
    else if (cp < (uint32_t)0x110000)
      nbytes = 4;
    else
    {
      nbytes = 3;
      cp = UNI_REPLACEMENT_CHAR;
    }

    if (!countOnly)
    {
      if ((out + nbytes) > targetEnd)
      {
        in = unitStart;
        status = targetExhausted;
        break;
      }

      /* Fill the sequence back to front: continuation bytes first, lead byte last. */
      uint8_t* cursor = out + nbytes;

      for (unsigned short left = nbytes; left > 1; left--)
      {
        *--cursor = (uint8_t)((cp | continuationMark) & continuationMask);
        cp >>= 6;
      }

      *--cursor = (uint8_t)(cp | firstByteMark[nbytes]);
    }

    out += nbytes;
  }

  *sourceStart = in;
  *targetStart = out;
  return status;
}

/* --------------------------------------------------------------------- */

/*
 * Utility routine to tell whether a sequence of bytes is legal UTF-8.
 * This must be called with the length pre-determined by the first byte.
 * If not calling this from ConvertUTF8to*, then the length can be set by:
 *  length = trailingBytesForUTF8[*source]+1;
 * and the sequence is illegal right away if there aren't that many bytes
 * available.
 * If presented with a length > 4 (or < 1), this returns false.  The Unicode
 * definition of UTF-8 goes up to 4-byte sequences.
 *
 * source  first byte of the sequence; bytes source[0..length-1] are read
 * length  total number of bytes in the sequence
 *
 * Returns true only when
 *  - the lead byte is ASCII or in 0xC2..0xF4,
 *  - the second byte (if any) lies in 0x80..0xBF, narrowed to
 *      0xA0..0xBF after 0xE0 (rejects overlong 3-byte forms),
 *      0x80..0x9F after 0xED (rejects encoded surrogates),
 *      0x90..0xBF after 0xF0 (rejects overlong 4-byte forms),
 *      0x80..0x8F after 0xF4 (rejects values above 0x10FFFF),
 *  - every further byte lies in 0x80..0xBF.
 */
static bool isLegalUTF8(const uint8_t* source, int length)
{
  if ((length < 1) || (length > 4))
    return false;

  const uint8_t lead = source[0];

  /* 0x80..0xBF are continuation bytes, 0xC0/0xC1 only start overlong forms. */
  if ((lead >= 0x80) && (lead < 0xC2))
    return false;

  if (lead > 0xF4)
    return false;

  if (length >= 2)
  {
    /* Both bounds are always enforced; special lead bytes only tighten one of them. */
    uint8_t secondMin = 0x80;
    uint8_t secondMax = 0xBF;

    switch (lead)
    {
      case 0xE0:
        secondMin = 0xA0;
        break;

      case 0xED:
        secondMax = 0x9F;
        break;

      case 0xF0:
        secondMin = 0x90;
        break;

      case 0xF4:
        secondMax = 0x8F;
        break;

      default:
        break;
    }

    const uint8_t second = source[1];

    if ((second < secondMin) || (second > secondMax))
      return false;
  }

  for (int idx = 2; idx < length; idx++)
  {
    const uint8_t trail = source[idx];

    if ((trail < 0x80) || (trail > 0xBF))
      return false;
  }

  return true;
}

/* --------------------------------------------------------------------- */

/*
 * Convert a range of UTF-8 bytes to UTF-16 code units (stored little-endian).
 *
 * sourceStart  in: first byte to convert
 *              out: first byte that was NOT consumed
 * sourceEnd    one past the last readable byte
 * targetStart  in: where to store the first code unit
 *              out: one past the last code unit accounted for
 * targetEnd    one past the end of the output buffer; pass NULL to only
 *              count the code units, in which case nothing is stored and
 *              *targetStart is merely advanced
 * flags        strictConversion stops at surrogate or out-of-range values;
 *              lenientConversion emits UNI_REPLACEMENT_CHAR for them
 *
 * Returns conversionOK when the entire source range was converted,
 * sourceExhausted when the last sequence is truncated, sourceIllegal for a
 * malformed sequence (checked in both modes via isLegalUTF8), or
 * targetExhausted when the next character does not fit. In every failure
 * case *sourceStart is left on the first byte of the offending sequence.
 */
static ConversionResult winpr_ConvertUTF8toUTF16_Internal(const uint8_t** sourceStart,
                                                          const uint8_t* sourceEnd,
                                                          uint16_t** targetStart,
                                                          const uint16_t* targetEnd,
                                                          ConversionFlags flags)
{
  const bool countOnly = (targetEnd == NULL);
  const uint8_t* in = *sourceStart;
  uint16_t* out = *targetStart;
  ConversionResult status = conversionOK;

  while (in < sourceEnd)
  {
    /* Every early exit after decoding rewinds to the start of this sequence. */
    const uint8_t* const seqStart = in;
    const unsigned short trailing =
        WINPR_ASSERTING_INT_CAST(unsigned short, trailingBytesForUTF8[*in]);

    if ((in + trailing) >= sourceEnd)
    {
      status = sourceExhausted;
      break;
    }

    /* Well-formedness is enforced regardless of strict/lenient mode. */
    if (!isLegalUTF8(in, trailing + 1))
    {
      status = sourceIllegal;
      break;
    }

    /*
     * Sum the raw bytes, shifting by 6 between them; the marker bits that
     * end up in the sum are removed again through offsetsFromUTF8.
     */
    uint32_t cp = 0;

    for (unsigned short i = 0; i < trailing; i++)
    {
      cp += *in++;
      cp <<= 6;
    }

    cp += *in++;
    cp -= offsetsFromUTF8[trailing];

    if (!countOnly && (out >= targetEnd))
    {
      in = seqStart;
      status = targetExhausted;
      break;
    }

    if ((cp > UNI_MAX_BMP) && (cp <= UNI_MAX_UTF16))
    {
      /* Supplementary plane: needs room for a surrogate pair. */
      if (!countOnly && ((out + 1) >= targetEnd))
      {
        in = seqStart;
        status = targetExhausted;
        break;
      }

      cp -= halfBase;

      if (!countOnly)
      {
        out[0] = setWcharFrom((WCHAR)((cp >> halfShift) + UNI_SUR_HIGH_START));
        out[1] = setWcharFrom((WCHAR)((cp & halfMask) + UNI_SUR_LOW_START));
      }

      out += 2;
      continue;
    }

    /* Everything else occupies exactly one code unit. */
    const bool isSurrogate = (cp >= UNI_SUR_HIGH_START) && (cp <= UNI_SUR_LOW_END);

    if (isSurrogate || (cp > UNI_MAX_UTF16))
    {
      if (flags == strictConversion)
      {
        in = seqStart;
        status = sourceIllegal;
        break;
      }

      if (!countOnly)
        *out = setWcharFrom(UNI_REPLACEMENT_CHAR);
    }
    else if (!countOnly)
    {
      *out = setWcharFrom((WCHAR)cp); /* normal case */
    }

    out++;
  }

  *sourceStart = in;
  *targetStart = out;
  return status;
}

/**
 * WinPR built-in Unicode API
 */

/*
 * Strictly convert UTF-8 to UTF-16.
 *
 * src     UTF-8 input
 * cchSrc  number of input bytes, or -1 to measure src with strnlen() and
 *         include its terminating NUL in the conversion
 * dst     output buffer (not touched when cchDst is 0)
 * cchDst  capacity of dst in code units; 0 requests the required length only
 *
 * Returns the number of code units written (or required when cchDst is 0).
 * Returns 0 on failure; when the output buffer is too small the last error
 * is additionally set to ERROR_INSUFFICIENT_BUFFER.
 */
static int winpr_ConvertUTF8toUTF16(const uint8_t* src, int cchSrc, uint16_t* dst, int cchDst)
{
  const bool measureOnly = (cchDst == 0);

  if (cchSrc == -1)
    cchSrc = (int)strnlen((const char*)src, INT32_MAX - 1) + 1;

  const uint8_t* in = src;
  const uint8_t* const inEnd = &src[cchSrc];

  /* A NULL end pointer switches the converter into counting mode. */
  uint16_t* const outBase = measureOnly ? NULL : dst;
  uint16_t* const outEnd = measureOnly ? NULL : &dst[cchDst];
  uint16_t* out = outBase;

  const ConversionResult status =
      winpr_ConvertUTF8toUTF16_Internal(&in, inEnd, &out, outEnd, strictConversion);

  if (status == targetExhausted)
  {
    SetLastError(ERROR_INSUFFICIENT_BUFFER);
    return 0;
  }

  if (status != conversionOK)
    return 0;

  const size_t produced = out - outBase;
  return WINPR_ASSERTING_INT_CAST(int, produced);
}

/*
 * Strictly convert UTF-16 to UTF-8.
 *
 * src     UTF-16 input
 * cchSrc  number of input code units, or -1 to measure src with _wcsnlen()
 *         and include its terminating NUL in the conversion
 * dst     output buffer (not touched when cchDst is 0)
 * cchDst  capacity of dst in bytes; 0 requests the required length only
 *
 * Returns the number of bytes written (or required when cchDst is 0).
 * Returns 0 on failure; when the output buffer is too small the last error
 * is additionally set to ERROR_INSUFFICIENT_BUFFER.
 */
static int winpr_ConvertUTF16toUTF8(const uint16_t* src, int cchSrc, uint8_t* dst, int cchDst)
{
  const bool measureOnly = (cchDst == 0);

  if (cchSrc == -1)
    cchSrc = (int)_wcsnlen((const WCHAR*)src, INT32_MAX - 1) + 1;

  const uint16_t* in = src;
  const uint16_t* const inEnd = &src[cchSrc];

  /* A NULL end pointer switches the converter into counting mode. */
  uint8_t* const outBase = measureOnly ? NULL : dst;
  uint8_t* const outEnd = measureOnly ? NULL : &dst[cchDst];
  uint8_t* out = outBase;

  const ConversionResult status =
      winpr_ConvertUTF16toUTF8_Internal(&in, inEnd, &out, outEnd, strictConversion);

  if (status == targetExhausted)
  {
    SetLastError(ERROR_INSUFFICIENT_BUFFER);
    return 0;
  }

  if (status != conversionOK)
    return 0;

  const size_t produced = out - outBase;
  return WINPR_ASSERTING_INT_CAST(int, produced);
}

/* --------------------------------------------------------------------- */

/**
 * Built-in MultiByteToWideChar: converts a UTF-8 string to UTF-16.
 *
 * @param CodePage       only CP_ACP and CP_UTF8 are accepted; both are treated as UTF-8
 * @param dwFlags        ignored
 * @param lpMultiByteStr input string, must not be NULL
 * @param cbMultiByte    input length in bytes, or -1 for a NUL-terminated string
 *                       (the terminator is then converted as well)
 * @param lpWideCharStr  output buffer
 * @param cchWideChar    output capacity in WCHARs; 0 requests the required size only
 *
 * @return number of WCHARs written (or required when cchWideChar is 0),
 *         0 on failure, -1 when cchWideChar is negative
 */
int int_MultiByteToWideChar(UINT CodePage, DWORD dwFlags, LPCSTR lpMultiByteStr, int cbMultiByte,
                            LPWSTR lpWideCharStr, int cchWideChar)
{
  size_t cbCharLen = 0;

  WINPR_UNUSED(dwFlags);

  /* If cbMultiByte is 0, the function fails */
  if ((cbMultiByte == 0) || (cbMultiByte < -1))
    return 0;

  if (cchWideChar < 0)
    return -1;

  /* Must be checked before strlen() below dereferences the pointer. */
  WINPR_ASSERT(lpMultiByteStr);

  if (cbMultiByte < 0)
  {
    /* NUL-terminated input: convert the terminator too. */
    const size_t len = strlen(lpMultiByteStr);
    if (len >= INT32_MAX)
      return 0;
    cbCharLen = len + 1;
  }
  else
    cbCharLen = (size_t)cbMultiByte;

  switch (CodePage)
  {
    case CP_ACP:
    case CP_UTF8:
      break;

    default:
      WLog_ERR(TAG, "Unsupported encoding %u", CodePage);
      return 0;
  }

  return winpr_ConvertUTF8toUTF16((const uint8_t*)lpMultiByteStr,
                                  WINPR_ASSERTING_INT_CAST(int, cbCharLen),
                                  (uint16_t*)lpWideCharStr, cchWideChar);
}

/**
 * Built-in WideCharToMultiByte: converts a UTF-16 string to UTF-8.
 *
 * @param CodePage          ignored, the output is always UTF-8
 * @param dwFlags           ignored
 * @param lpWideCharStr     input string, must not be NULL
 * @param cchWideChar       input length in WCHARs, or -1 for a NUL-terminated string
 *                          (the terminator is then converted as well)
 * @param lpMultiByteStr    output buffer
 * @param cbMultiByte       output capacity in bytes; 0 requests the required size only
 * @param lpDefaultChar     ignored
 * @param lpUsedDefaultChar ignored, never written
 *
 * @return number of bytes written (or required when cbMultiByte is 0),
 *         0 on failure, -1 when cbMultiByte is negative
 */
int int_WideCharToMultiByte(UINT CodePage, DWORD dwFlags, LPCWSTR lpWideCharStr, int cchWideChar,
                            LPSTR lpMultiByteStr, int cbMultiByte, LPCSTR lpDefaultChar,
                            LPBOOL lpUsedDefaultChar)
{
  size_t cbCharLen = 0;

  WINPR_UNUSED(CodePage);
  WINPR_UNUSED(dwFlags);
  WINPR_UNUSED(lpDefaultChar);
  WINPR_UNUSED(lpUsedDefaultChar);

  /* If cchWideChar is 0, the function fails */
  if ((cchWideChar == 0) || (cchWideChar < -1))
    return 0;

  if (cbMultiByte < 0)
    return -1;

  WINPR_ASSERT(lpWideCharStr);

  /* If cchWideChar is -1, the string is null-terminated */
  if (cchWideChar == -1)
  {
    const size_t len = _wcslen(lpWideCharStr);
    if (len >= INT32_MAX)
      return 0;
    cbCharLen = len + 1; /* convert the terminator too */
  }
  else
    cbCharLen = (size_t)cchWideChar;

  /*
   * if cbMultiByte is 0, the function returns the required buffer size
   * in bytes for lpMultiByteStr and makes no use of the output parameter itself.
   */

  return winpr_ConvertUTF16toUTF8((const uint16_t*)lpWideCharStr,
                                  WINPR_ASSERTING_INT_CAST(int, cbCharLen),
                                  (uint8_t*)lpMultiByteStr, cbMultiByte);
}

Coverage Report

Created: 2025-12-14 07:05

Line	Count	Source
1		/*
2		* Copyright 2001-2004 Unicode, Inc.
3		*
4		* Disclaimer
5		*
6		* This source code is provided as is by Unicode, Inc. No claims are
7		* made as to fitness for any particular purpose. No warranties of any
8		* kind are expressed or implied. The recipient agrees to determine
9		* applicability of information provided. If this file has been
10		* purchased on magnetic or optical media from Unicode, Inc., the
11		* sole remedy for any claim will be exchange of defective media
12		* within 90 days of receipt.
13		*
14		* Limitations on Rights to Redistribute This Code
15		*
16		* Unicode, Inc. hereby grants the right to freely use the information
17		* supplied in this file in the creation of products supporting the
18		* Unicode Standard, and to make copies of this file in any form
19		* for internal or external distribution as long as this notice
20		* remains attached.
21		*/
22
23		/* ---------------------------------------------------------------------
24
25		Conversions between UTF32, UTF-16, and UTF-8. Source code file.
26		Author: Mark E. Davis, 1994.
27		Rev History: Rick McGowan, fixes & updates May 2001.
28		Sept 2001: fixed const & error conditions per
29		mods suggested by S. Parent & A. Lillich.
30		June 2002: Tim Dodd added detection and handling of incomplete
31		source sequences, enhanced error detection, added casts
32		to eliminate compiler warnings.
33		July 2003: slight mods to back out aggressive FFFE detection.
34		Jan 2004: updated switches in from-UTF8 conversions.
35		Oct 2004: updated to use UNI_MAX_LEGAL_UTF32 in UTF-32 conversions.
36
37		See the header file "utf.h" for complete documentation.
38
39		------------------------------------------------------------------------ */
40
41		#include <winpr/wtypes.h>
42		#include <winpr/string.h>
43		#include <winpr/assert.h>
44		#include <winpr/cast.h>
45
46		#include "unicode.h"
47
48		#include "../log.h"
49		#define TAG WINPR_TAG("unicode")
50
51		/*
52		* Character Types:
53		*
54		* UTF8: uint8_t 8 bits
55		* UTF16: uint16_t 16 bits
56		* UTF32: uint32_t 32 bits
57		*/
58
59		/* Some fundamental constants */
60	0	#define UNI_REPLACEMENT_CHAR (uint32_t)0x0000FFFD
61	15.8M	#define UNI_MAX_BMP (uint32_t)0x0000FFFF
62	876	#define UNI_MAX_UTF16 (uint32_t)0x0010FFFF
63		#define UNI_MAX_UTF32 (uint32_t)0x7FFFFFFF
64		#define UNI_MAX_LEGAL_UTF32 (uint32_t)0x0010FFFF
65
66		typedef enum
67		{
68		conversionOK, /* conversion successful */
69		sourceExhausted, /* partial character in source, but hit end */
70		targetExhausted, /* insuff. room in target for conversion */
71		sourceIllegal /* source sequence is illegal/malformed */
72		} ConversionResult;
73
74		typedef enum
75		{
76		strictConversion = 0,
77		lenientConversion
78		} ConversionFlags;
79
80		static const int halfShift = 10; /* used for shifting by 10 bits */
81
82		static const uint32_t halfBase = 0x0010000UL;
83		static const uint32_t halfMask = 0x3FFUL;
84
85	47.0M	#define UNI_SUR_HIGH_START (uint32_t)0xD800
86	91.6k	#define UNI_SUR_HIGH_END (uint32_t)0xDBFF
87	15.4M	#define UNI_SUR_LOW_START (uint32_t)0xDC00
88	80.9k	#define UNI_SUR_LOW_END (uint32_t)0xDFFF
89
90		/* --------------------------------------------------------------------- */
91
92		/*
93		* Index into the table below with the first byte of a UTF-8 sequence to
94		* get the number of trailing bytes that are supposed to follow it.
95		* Note that legal UTF-8 values can't have 4 or 5-bytes. The table is
96		* left as-is for anyone who may want to do such conversion, which was
97		* allowed in earlier algorithms.
98		*/
99		static const char trailingBytesForUTF8[256] = {
100		0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
101		0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
102		0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
103		0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
104		0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
105		0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
106		1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
107		2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 3, 3, 3, 3, 3, 3, 3, 3, 4, 4, 4, 4, 5, 5, 5, 5
108		};
109
110		/*
111		* Magic values subtracted from a buffer value during UTF8 conversion.
112		* This table contains as many values as there might be trailing bytes
113		* in a UTF-8 sequence.
114		*/
115		static const uint32_t offsetsFromUTF8[6] = { 0x00000000UL, 0x00003080UL, 0x000E2080UL,
116		0x03C82080UL, 0xFA082080UL, 0x82082080UL };
117
118		/*
119		* Once the bits are split out into bytes of UTF-8, this is a mask OR-ed
120		* into the first byte, depending on how many bytes follow. There are
121		* as many entries in this table as there are UTF-8 sequence types.
122		* (I.e., one byte sequence, two byte... etc.). Remember that sequence
123		* for legal UTF-8 will be 4 or fewer bytes total.
124		*/
125		static const uint8_t firstByteMark[7] = { 0x00, 0x00, 0xC0, 0xE0, 0xF0, 0xF8, 0xFC };
126
127		/* We always need UTF-16LE, even on big endian systems! */
128		static WCHAR setWcharFrom(WCHAR w)
129	19.7M	{
130		#if defined(__BIG_ENDIAN__)
131		union
132		{
133		WCHAR w;
134		char c[2];
135		} cnv;
136
137		cnv.w = w;
138		const char c = cnv.c[0];
139		cnv.c[0] = cnv.c[1];
140		cnv.c[1] = c;
141		return cnv.w;
142		#else
143	19.7M	return w;
144	19.7M	#endif
145	19.7M	}
146
147		/* --------------------------------------------------------------------- */
148
149		/* The interface converts a whole buffer to avoid function-call overhead.
150		* Constants have been gathered. Loops & conditionals have been removed as
151		* much as possible for efficiency, in favor of drop-through switches.
152		* (See "Note A" at the bottom of the file for equivalent code.)
153		* If your compiler supports it, the "isLegalUTF8" call can be turned
154		* into an inline function.
155		*/
156
157		/* --------------------------------------------------------------------- */
158
159		static ConversionResult winpr_ConvertUTF16toUTF8_Internal(const uint16_t** sourceStart,
160		const uint16_t* sourceEnd,
161		uint8_t** targetStart,
162		const uint8_t* targetEnd,
163		ConversionFlags flags)
164	466k	{
165	466k	bool computeLength = (!targetEnd) ? true : false;
166	466k	const uint16_t* source = *sourceStart;
167	466k	uint8_t* target = *targetStart;
168	466k	ConversionResult result = conversionOK;
169
170	8.18M	while (source < sourceEnd)
171	7.73M	{
172	7.73M	uint32_t ch = 0;
173	7.73M	unsigned short bytesToWrite = 0;
174	7.73M	const uint32_t byteMask = 0xBF;
175	7.73M	const uint32_t byteMark = 0x80;
176	7.73M	const uint16_t* oldSource =
177	7.73M	source; /* In case we have to back up because of target overflow. */
178
179	7.73M	ch = setWcharFrom(*source++);
180
181		/* If we have a surrogate pair, convert to UTF32 first. */
182	7.73M	if (ch >= UNI_SUR_HIGH_START && ch <= UNI_SUR_HIGH_END)
183	12.0k	{
184		/* If the 16 bits following the high surrogate are in the source buffer... */
185	12.0k	if (source < sourceEnd)
186	12.0k	{
187	12.0k	uint32_t ch2 = setWcharFrom(*source);
188
189		/* If it's a low surrogate, convert to UTF32. */
190	12.0k	if (ch2 >= UNI_SUR_LOW_START && ch2 <= UNI_SUR_LOW_END)
191	1.07k	{
192	1.07k	ch = ((ch - UNI_SUR_HIGH_START) << halfShift) + (ch2 - UNI_SUR_LOW_START) +
193	1.07k	halfBase;
194	1.07k	++source;
195	1.07k	}
196	10.9k	else if (flags == strictConversion)
197	10.9k	{
198		/* it's an unpaired high surrogate */
199	10.9k	--source; /* return to the illegal value itself */
200	10.9k	result = sourceIllegal;
201	10.9k	break;
202	10.9k	}
203	12.0k	}
204	18	else
205	18	{
206		/* We don't have the 16 bits following the high surrogate. */
207	18	--source; /* return to the high surrogate */
208	18	result = sourceExhausted;
209	18	break;
210	18	}
211	12.0k	}
212	7.72M	else if (flags == strictConversion)
213	7.72M	{
214		/* UTF-16 surrogate values are illegal in UTF-32 */
215	7.72M	if (ch >= UNI_SUR_LOW_START && ch <= UNI_SUR_LOW_END)
216	233	{
217	233	--source; /* return to the illegal value itself */
218	233	result = sourceIllegal;
219	233	break;
220	233	}
221	7.72M	}
222
223		/* Figure out how many bytes the result will require */
224	7.72M	if (ch < (uint32_t)0x80)
225	6.86M	{
226	6.86M	bytesToWrite = 1;
227	6.86M	}
228	856k	else if (ch < (uint32_t)0x800)
229	49.6k	{
230	49.6k	bytesToWrite = 2;
231	49.6k	}
232	806k	else if (ch < (uint32_t)0x10000)
233	805k	{
234	805k	bytesToWrite = 3;
235	805k	}
236	1.07k	else if (ch < (uint32_t)0x110000)
237	1.07k	{
238	1.07k	bytesToWrite = 4;
239	1.07k	}
240	0	else
241	0	{
242	0	bytesToWrite = 3;
243	0	ch = UNI_REPLACEMENT_CHAR;
244	0	}
245
246	7.72M	target += bytesToWrite;
247
248	7.72M	if ((target > targetEnd) && (!computeLength))
249	1.76k	{
250	1.76k	source = oldSource; /* Back up source pointer! */
251	1.76k	target -= bytesToWrite;
252	1.76k	result = targetExhausted;
253	1.76k	break;
254	1.76k	}
255
256	7.71M	if (!computeLength)
257	7.20M	{
258	7.20M	switch (bytesToWrite)
259	7.20M	{
260		/* note: everything falls through. */
261	528	case 4:
262	528	*--target = (uint8_t)((ch \| byteMark) & byteMask);
263	528	ch >>= 6;
264		/* fallthrough */
265	528	WINPR_FALLTHROUGH
266	532k	case 3:
267	532k	*--target = (uint8_t)((ch \| byteMark) & byteMask);
268	532k	ch >>= 6;
269		/* fallthrough */
270	532k	WINPR_FALLTHROUGH
271
272	564k	case 2:
273	564k	*--target = (uint8_t)((ch \| byteMark) & byteMask);
274	564k	ch >>= 6;
275		/* fallthrough */
276	564k	WINPR_FALLTHROUGH
277
278	7.20M	case 1:
279	7.20M	*--target = (uint8_t)(ch \| firstByteMark[bytesToWrite]);
280	7.20M	break;
281	0	default:
282	0	return sourceIllegal;
283	7.20M	}
284	7.20M	}
285	516k	else
286	516k	{
287	516k	switch (bytesToWrite)
288	516k	{
289		/* note: everything falls through. */
290	546	case 4:
291	546	--target;
292		/* fallthrough */
293	546	WINPR_FALLTHROUGH
294
295	272k	case 3:
296	272k	--target;
297		/* fallthrough */
298	272k	WINPR_FALLTHROUGH
299
300	290k	case 2:
301	290k	--target;
302		/* fallthrough */
303	290k	WINPR_FALLTHROUGH
304
305	516k	case 1:
306	516k	--target;
307	516k	break;
308	0	default:
309	0	return sourceIllegal;
310	516k	}
311	516k	}
312
313	7.71M	target += bytesToWrite;
314	7.71M	}
315
316	466k	*sourceStart = source;
317	466k	*targetStart = target;
318	466k	return result;
319	466k	}
320
321		/* --------------------------------------------------------------------- */
322
/*
 * Utility routine to tell whether a sequence of bytes is legal UTF-8.
 * This must be called with the length pre-determined by the first byte.
 * If not calling this from ConvertUTF8to*, then the length can be set by:
 *  length = trailingBytesForUTF8[*source]+1;
 * and the sequence is illegal right away if there aren't that many bytes
 * available.
 * If presented with a length > 4, this returns false. The Unicode
 * definition of UTF-8 goes up to 4-byte sequences.
 *
 * source: lead byte of the sequence; exactly 'length' bytes are inspected.
 * length: total sequence length in bytes, anything outside 1..4 is rejected.
 *
 * Returns true when every byte passes the range checks below, false otherwise.
 */
static bool isLegalUTF8(const uint8_t* source, int length)
{
	uint8_t lead = 0;

	if ((length < 1) || (length > 4))
		return false;

	lead = source[0];

	/* Bytes three and four (when present) must be plain continuation bytes. */
	for (int idx = length - 1; idx >= 2; idx--)
	{
		const uint8_t cont = source[idx];

		if ((cont < 0x80) || (cont > 0xBF))
			return false;
	}

	if (length >= 2)
	{
		const uint8_t second = source[1];

		if (second > 0xBF)
			return false;

		/* The valid range of the second byte depends on the lead byte. */
		switch (lead)
		{
			case 0xE0: /* below 0xA0 would be an overlong 3-byte form */
				if (second < 0xA0)
					return false;
				break;

			case 0xED: /* above 0x9F would encode a UTF-16 surrogate */
				if (second > 0x9F)
					return false;
				break;

			case 0xF0: /* below 0x90 would be an overlong 4-byte form */
				if (second < 0x90)
					return false;
				break;

			case 0xF4: /* above 0x8F would exceed U+10FFFF */
				if (second > 0x8F)
					return false;
				break;

			default:
				if (second < 0x80)
					return false;
				break;
		}
	}

	/*
	 * Inspect the lead BYTE (not the pointer): 0x80..0xBF are continuation
	 * bytes and 0xC0/0xC1 can only start overlong 2-byte forms.
	 */
	if ((lead >= 0x80) && (lead < 0xC2))
		return false;

	if (lead > 0xF4)
		return false;

	return true;
}
406
407		/* --------------------------------------------------------------------- */
408
409		static ConversionResult winpr_ConvertUTF8toUTF16_Internal(const uint8_t** sourceStart,
410		const uint8_t* sourceEnd,
411		uint16_t** targetStart,
412		const uint16_t* targetEnd,
413		ConversionFlags flags)
414	436k	{
415	436k	bool computeLength = (!targetEnd) ? true : false;
416	436k	ConversionResult result = conversionOK;
417	436k	const uint8_t* source = *sourceStart;
418	436k	uint16_t* target = *targetStart;
419
420	16.2M	while (source < sourceEnd)
421	15.8M	{
422	15.8M	uint32_t ch = 0;
423	15.8M	unsigned short extraBytesToRead =
424	31.6M	WINPR_ASSERTING_INT_CAST(unsigned short, trailingBytesForUTF8[*source]);
425
426	31.6M	if ((source + extraBytesToRead) >= sourceEnd)
427	1	{
428	1	result = sourceExhausted;
429	1	break;
430	1	}
431
432		/* Do this check whether lenient or strict */
433	15.8M	if (!isLegalUTF8(source, extraBytesToRead + 1))
434	76	{
435	76	result = sourceIllegal;
436	76	break;
437	76	}
438
439		/*
440		* The cases all fall through. See "Note A" below.
441		*/
442	15.8M	switch (extraBytesToRead)
443	15.8M	{
444	0	case 5:
445	0	ch += *source++;
446	0	ch <<= 6; /* remember, illegal UTF-8 */
447		/* fallthrough */
448	0	WINPR_FALLTHROUGH
449
450	0	case 4:
451	0	ch += *source++;
452	0	ch <<= 6; /* remember, illegal UTF-8 */
453		/* fallthrough */
454	0	WINPR_FALLTHROUGH
455
456	876	case 3:
457	876	ch += *source++;
458	876	ch <<= 6;
459		/* fallthrough */
460	876	WINPR_FALLTHROUGH
461
462	1.65k	case 2:
463	1.65k	ch += *source++;
464	1.65k	ch <<= 6;
465		/* fallthrough */
466	1.65k	WINPR_FALLTHROUGH
467
468	1.94k	case 1:
469	1.94k	ch += *source++;
470	1.94k	ch <<= 6;
471		/* fallthrough */
472	1.94k	WINPR_FALLTHROUGH
473
474	15.8M	case 0:
475	15.8M	ch += *source++;
476	15.8M	break;
477	0	default:
478	0	return sourceIllegal;
479	15.8M	}
480
481	15.8M	ch -= offsetsFromUTF8[extraBytesToRead];
482
483	15.8M	if ((target >= targetEnd) && (!computeLength))
484	0	{
485	0	source -= (extraBytesToRead + 1); /* Back up source pointer! */
486	0	result = targetExhausted;
487	0	break;
488	0	}
489
490	15.8M	if (ch <= UNI_MAX_BMP)
491	15.8M	{
492		/* Target is a character <= 0xFFFF */
493		/* UTF-16 surrogate values are illegal in UTF-32 */
494	15.8M	if (ch >= UNI_SUR_HIGH_START && ch <= UNI_SUR_LOW_END)
495	0	{
496	0	if (flags == strictConversion)
497	0	{
498	0	source -= (extraBytesToRead + 1); /* return to the illegal value itself */
499	0	result = sourceIllegal;
500	0	break;
501	0	}
502	0	else
503	0	{
504	0	if (!computeLength)
505	0	*target++ = setWcharFrom(UNI_REPLACEMENT_CHAR);
506	0	else
507	0	target++;
508	0	}
509	0	}
510	15.8M	else
511	15.8M	{
512	15.8M	if (!computeLength)
513	12.0M	target++ = setWcharFrom((WCHAR)ch); / normal case */
514	3.80M	else
515	3.80M	target++;
516	15.8M	}
517	15.8M	}
518	876	else if (ch > UNI_MAX_UTF16)
519	0	{
520	0	if (flags == strictConversion)
521	0	{
522	0	result = sourceIllegal;
523	0	source -= (extraBytesToRead + 1); /* return to the start */
524	0	break; /* Bail out; shouldn't continue */
525	0	}
526	0	else
527	0	{
528	0	if (!computeLength)
529	0	*target++ = setWcharFrom(UNI_REPLACEMENT_CHAR);
530	0	else
531	0	target++;
532	0	}
533	0	}
534	876	else
535	876	{
536		/* target is a character in range 0xFFFF - 0x10FFFF. */
537	876	if ((target + 1 >= targetEnd) && (!computeLength))
538	0	{
539	0	source -= (extraBytesToRead + 1); /* Back up source pointer! */
540	0	result = targetExhausted;
541	0	break;
542	0	}
543
544	876	ch -= halfBase;
545
546	876	if (!computeLength)
547	433	{
548	433	*target++ = setWcharFrom((WCHAR)((ch >> halfShift) + UNI_SUR_HIGH_START));
549	433	*target++ = setWcharFrom((WCHAR)((ch & halfMask) + UNI_SUR_LOW_START));
550	433	}
551	443	else
552	443	{
553	443	target++;
554	443	target++;
555	443	}
556	876	}
557	15.8M	}
558
559	436k	*sourceStart = source;
560	436k	*targetStart = target;
561	436k	return result;
562	436k	}
563
564		/**
565		* WinPR built-in Unicode API
566		*/
567
568		static int winpr_ConvertUTF8toUTF16(const uint8_t* src, int cchSrc, uint16_t* dst, int cchDst)
569	436k	{
570	436k	size_t length = 0;
571	436k	uint16_t* dstBeg = NULL;
572	436k	uint16_t* dstEnd = NULL;
573	436k	const uint8_t* srcBeg = NULL;
574	436k	const uint8_t* srcEnd = NULL;
575	436k	ConversionResult result = sourceIllegal;
576
577	436k	if (cchSrc == -1)
578	0	cchSrc = (int)strnlen((const char*)src, INT32_MAX - 1) + 1;
579
580	436k	srcBeg = src;
581	436k	srcEnd = &src[cchSrc];
582
583	436k	if (cchDst == 0)
584	1.01k	{
585	1.01k	result =
586	1.01k	winpr_ConvertUTF8toUTF16_Internal(&srcBeg, srcEnd, &dstBeg, dstEnd, strictConversion);
587
588	1.01k	length = dstBeg - (uint16_t*)NULL;
589	1.01k	}
590	435k	else
591	435k	{
592	435k	dstBeg = dst;
593	435k	dstEnd = &dst[cchDst];
594
595	435k	result =
596	435k	winpr_ConvertUTF8toUTF16_Internal(&srcBeg, srcEnd, &dstBeg, dstEnd, strictConversion);
597
598	435k	length = dstBeg - dst;
599	435k	}
600
601	436k	if (result == targetExhausted)
602	0	{
603	0	SetLastError(ERROR_INSUFFICIENT_BUFFER);
604	0	return 0;
605	0	}
606
607	436k	return (result == conversionOK) ? WINPR_ASSERTING_INT_CAST(int, length) : 0;
608	436k	}
609
610		static int winpr_ConvertUTF16toUTF8(const uint16_t* src, int cchSrc, uint8_t* dst, int cchDst)
611	466k	{
612	466k	size_t length = 0;
613	466k	uint8_t* dstBeg = NULL;
614	466k	uint8_t* dstEnd = NULL;
615	466k	const uint16_t* srcBeg = NULL;
616	466k	const uint16_t* srcEnd = NULL;
617	466k	ConversionResult result = sourceIllegal;
618
619	466k	if (cchSrc == -1)
620	0	cchSrc = (int)_wcsnlen((const WCHAR*)src, INT32_MAX - 1) + 1;
621
622	466k	srcBeg = src;
623	466k	srcEnd = &src[cchSrc];
624
625	466k	if (cchDst == 0)
626	55.4k	{
627	55.4k	result =
628	55.4k	winpr_ConvertUTF16toUTF8_Internal(&srcBeg, srcEnd, &dstBeg, dstEnd, strictConversion);
629
630	55.4k	length = dstBeg - ((uint8_t*)NULL);
631	55.4k	}
632	411k	else
633	411k	{
634	411k	dstBeg = dst;
635	411k	dstEnd = &dst[cchDst];
636
637	411k	result =
638	411k	winpr_ConvertUTF16toUTF8_Internal(&srcBeg, srcEnd, &dstBeg, dstEnd, strictConversion);
639
640	411k	length = dstBeg - dst;
641	411k	}
642
643	466k	if (result == targetExhausted)
644	1.76k	{
645	1.76k	SetLastError(ERROR_INSUFFICIENT_BUFFER);
646	1.76k	return 0;
647	1.76k	}
648
649	464k	return (result == conversionOK) ? WINPR_ASSERTING_INT_CAST(int, length) : 0;
650	464k	}
651
652		/* --------------------------------------------------------------------- */
653
654		int int_MultiByteToWideChar(UINT CodePage, DWORD dwFlags, LPCSTR lpMultiByteStr, int cbMultiByte,
655		LPWSTR lpWideCharStr, int cchWideChar)
656	436k	{
657	436k	size_t cbCharLen = (size_t)cbMultiByte;
658
659	436k	WINPR_UNUSED(dwFlags);
660
661		/* If cbMultiByte is 0, the function fails */
662	436k	if ((cbMultiByte == 0) \|\| (cbMultiByte < -1))
663	0	return 0;
664
665	436k	if (cchWideChar < 0)
666	0	return -1;
667
668	436k	if (cbMultiByte < 0)
669	0	{
670	0	const size_t len = strlen(lpMultiByteStr);
671	0	if (len >= INT32_MAX)
672	0	return 0;
673	0	cbCharLen = (int)len + 1;
674	0	}
675	436k	else
676	436k	cbCharLen = cbMultiByte;
677
678	436k	WINPR_ASSERT(lpMultiByteStr);
679	436k	switch (CodePage)
680	436k	{
681	0	case CP_ACP:
682	436k	case CP_UTF8:
683	436k	break;
684
685	0	default:
686	0	WLog_ERR(TAG, "Unsupported encoding %u", CodePage);
687	0	return 0;
688	436k	}
689
690	436k	return winpr_ConvertUTF8toUTF16((const uint8_t*)lpMultiByteStr,
691	436k	WINPR_ASSERTING_INT_CAST(int, cbCharLen),
692	436k	(uint16_t*)lpWideCharStr, cchWideChar);
693	436k	}
694
695		int int_WideCharToMultiByte(UINT CodePage, DWORD dwFlags, LPCWSTR lpWideCharStr, int cchWideChar,
696		LPSTR lpMultiByteStr, int cbMultiByte, LPCSTR lpDefaultChar,
697		LPBOOL lpUsedDefaultChar)
698	466k	{
699	466k	size_t cbCharLen = (size_t)cchWideChar;
700
701	466k	WINPR_UNUSED(dwFlags);
702		/* If cchWideChar is 0, the function fails */
703	466k	if ((cchWideChar == 0) \|\| (cchWideChar < -1))
704	0	return 0;
705
706	466k	if (cbMultiByte < 0)
707	0	return -1;
708
709	466k	WINPR_ASSERT(lpWideCharStr);
710		/* If cchWideChar is -1, the string is null-terminated */
711	466k	if (cchWideChar == -1)
712	0	{
713	0	const size_t len = _wcslen(lpWideCharStr);
714	0	if (len >= INT32_MAX)
715	0	return 0;
716	0	cbCharLen = (int)len + 1;
717	0	}
718	466k	else
719	466k	cbCharLen = cchWideChar;
720
721		/*
722		* if cbMultiByte is 0, the function returns the required buffer size
723		* in bytes for lpMultiByteStr and makes no use of the output parameter itself.
724		*/
725
726	466k	return winpr_ConvertUTF16toUTF8((const uint16_t*)lpWideCharStr,
727	466k	WINPR_ASSERTING_INT_CAST(int, cbCharLen),
728	466k	(uint8_t*)lpMultiByteStr, cbMultiByte);
729	466k	}