266 lines
8.8 KiB
C
266 lines
8.8 KiB
C
|
/***
|
||
|
*mbstowcs.c - Convert multibyte char string to wide char string.
|
||
|
*
|
||
|
* Copyright (c) 1990-2001, Microsoft Corporation. All rights reserved.
|
||
|
*
|
||
|
*Purpose:
|
||
|
* Convert a multibyte char string into the equivalent wide char string.
|
||
|
*
|
||
|
*Revision History:
|
||
|
* 08-24-90 KRS Module created.
|
||
|
* 03-20-91 KRS Ported from 16-bit tree.
|
||
|
* 10-16-91 ETC Locale support under _INTL switch.
|
||
|
* 12-09-91 ETC Updated nlsapi; added multithread.
|
||
|
* 08-20-92 KRS Activated NLSAPI support.
|
||
|
* 08-31-92 SRW Allow INTL definition to be conditional for building ntcrt.lib
|
||
|
* 09-02-92 SRW Get _INTL definition via ..\crt32.def
|
||
|
* 02-09-93 CFW Always stuff WC 0 at end of output string of room (non _INTL).
|
||
|
* 04-06-93 SKS Replace _CRTAPI* with _cdecl
|
||
|
* 05-03-93 CFW Return pointer == NULL, return size, plus massive cleanup.
|
||
|
* 06-01-93 CFW Minor optimization and beautify.
|
||
|
* 06-02-93 SRW ignore _INTL if _NTSUBSET_ defined.
|
||
|
* 09-15-93 CFW Use ANSI conformant "__" names.
|
||
|
* 09-21-93 CFW Avoid cast bug.
|
||
|
* 09-27-93 GJF Merged NT SDK and Cuda.
|
||
|
* 10-22-93 CFW Test for invalid MB chars using global preset flag.
|
||
|
* 01-14-94 SRW if _NTSUBSET_ defined call Rtl functions
|
||
|
* 02-03-94 GJF Merged in Steve Wood's latest change (affects
|
||
|
* _NTSUBSET_ build only).
|
||
|
* 02-07-94 CFW POSIXify.
|
||
|
* 08-03-94 CFW Bug #15300; fix MBToWC workaround for small buffer.
|
||
|
* 09-06-94 CFW Remove _INTL switch.
|
||
|
* 10-18-94 BWT Fix build warning for call to RtlMultiByteToUnicodeN
|
||
|
* 12-21-94 CFW Remove invalid MB chars NT 3.1 hack.
|
||
|
* 01-07-95 CFW Mac merge cleanup.
|
||
|
* 02-06-95 CFW assert -> _ASSERTE.
|
||
|
* 04-19-95 CFW Rearrange & fix non-Win32 version.
|
||
|
* 09-26-95 GJF New locking macro, and scheme, for functions which
|
||
|
* reference the locale.
|
||
|
* 04-01-96 BWT POSIX work.
|
||
|
* 05-26-96 BWT Return the word count, not the byte count for
|
||
|
* _NTSUBSET_/POSIX case.
|
||
|
* 06-25-96 GJF Removed DLL_FOR_WIN32S. Replaced defined(_WIN32) with
|
||
|
* !defined(_MAC). Polished the format a bit.
|
||
|
* 07-27-98 GJF Revised multithread support based on threadlocinfo
|
||
|
* struct.
|
||
|
* 12-15-98 GJF Changes for 64-bit size_t.
|
||
|
* 05-17-99 PML Remove all Macintosh support.
|
||
|
*
|
||
|
*******************************************************************************/
|
||
|
|
||
|
#if defined(_NTSUBSET_) || defined(_POSIX_)
|
||
|
#include <nt.h>
|
||
|
#include <ntrtl.h>
|
||
|
#include <nturtl.h>
|
||
|
#endif
|
||
|
|
||
|
#include <internal.h>
|
||
|
#include <locale.h>
|
||
|
#include <setlocal.h>
|
||
|
#include <errno.h>
|
||
|
#include <cruntime.h>
|
||
|
#include <stdlib.h>
|
||
|
#include <string.h>
|
||
|
#include <mtdll.h>
|
||
|
#include <dbgint.h>
|
||
|
#include <stdio.h>
|
||
|
|
||
|
/***
|
||
|
*size_t mbstowcs() - Convert multibyte char string to wide char string.
|
||
|
*
|
||
|
*Purpose:
|
||
|
* Convert a multi-byte char string into the equivalent wide char string,
|
||
|
* according to the LC_CTYPE category of the current locale.
|
||
|
* [ANSI].
|
||
|
*
|
||
|
*Entry:
|
||
|
* wchar_t *pwcs = pointer to destination wide character string buffer
|
||
|
* const char *s = pointer to source multibyte character string
|
||
|
* size_t n = maximum number of wide characters to store
|
||
|
*
|
||
|
*Exit:
|
||
|
* If s != NULL, returns: number of words modified (<=n)
|
||
|
* (size_t)-1 (if invalid mbcs)
|
||
|
*
|
||
|
*Exceptions:
|
||
|
* Returns (size_t)-1 if s is NULL or invalid mbcs character encountered
|
||
|
*
|
||
|
*******************************************************************************/
|
||
|
|
||
|
size_t __cdecl mbstowcs
|
||
|
(
|
||
|
wchar_t *pwcs,
|
||
|
const char *s,
|
||
|
size_t n
|
||
|
)
|
||
|
{
|
||
|
#ifdef _MT
|
||
|
pthreadlocinfo ptloci = _getptd()->ptlocinfo;
|
||
|
|
||
|
if ( ptloci != __ptlocinfo )
|
||
|
ptloci = __updatetlocinfo();
|
||
|
|
||
|
return __mbstowcs_mt(ptloci, pwcs, s, n);
|
||
|
}
|
||
|
|
||
|
size_t __cdecl __mbstowcs_mt (
|
||
|
pthreadlocinfo ptloci,
|
||
|
wchar_t *pwcs,
|
||
|
const char *s,
|
||
|
size_t n
|
||
|
)
|
||
|
{
|
||
|
#endif
|
||
|
size_t count = 0;
|
||
|
|
||
|
if (pwcs && n == 0)
|
||
|
/* dest string exists, but 0 bytes converted */
|
||
|
return (size_t) 0;
|
||
|
|
||
|
_ASSERTE(s != NULL);
|
||
|
|
||
|
#ifdef _WIN64
|
||
|
/* n must fit into an int for MultiByteToWideChar */
|
||
|
if ( n > INT_MAX )
|
||
|
return (size_t)-1;
|
||
|
#endif
|
||
|
|
||
|
#if !defined(_NTSUBSET_) && !defined(_POSIX_)
|
||
|
|
||
|
/* if destination string exists, fill it in */
|
||
|
if (pwcs)
|
||
|
{
|
||
|
#ifdef _MT
|
||
|
if (ptloci->lc_handle[LC_CTYPE] == _CLOCALEHANDLE)
|
||
|
#else
|
||
|
if (__lc_handle[LC_CTYPE] == _CLOCALEHANDLE)
|
||
|
#endif
|
||
|
{
|
||
|
/* C locale: easy and fast */
|
||
|
while (count < n)
|
||
|
{
|
||
|
*pwcs = (wchar_t) ((unsigned char)s[count]);
|
||
|
if (!s[count])
|
||
|
return count;
|
||
|
count++;
|
||
|
pwcs++;
|
||
|
}
|
||
|
return count;
|
||
|
|
||
|
} else {
|
||
|
int bytecnt, charcnt;
|
||
|
unsigned char *p;
|
||
|
|
||
|
/* Assume that the buffer is large enough */
|
||
|
#ifdef _MT
|
||
|
if ( (count = MultiByteToWideChar( ptloci->lc_codepage,
|
||
|
#else
|
||
|
if ( (count = MultiByteToWideChar( __lc_codepage,
|
||
|
#endif
|
||
|
MB_PRECOMPOSED |
|
||
|
MB_ERR_INVALID_CHARS,
|
||
|
s,
|
||
|
-1,
|
||
|
pwcs,
|
||
|
(int)n )) != 0 )
|
||
|
return count - 1; /* don't count NUL */
|
||
|
|
||
|
if (GetLastError() != ERROR_INSUFFICIENT_BUFFER)
|
||
|
{
|
||
|
errno = EILSEQ;
|
||
|
return (size_t)-1;
|
||
|
}
|
||
|
|
||
|
/* User-supplied buffer not large enough. */
|
||
|
|
||
|
/* How many bytes are in n characters of the string? */
|
||
|
charcnt = (int)n;
|
||
|
for (p = (unsigned char *)s; (charcnt-- && *p); p++)
|
||
|
{
|
||
|
#ifdef _MT
|
||
|
if (__isleadbyte_mt(ptloci, *p))
|
||
|
#else
|
||
|
if (isleadbyte(*p))
|
||
|
#endif
|
||
|
p++;
|
||
|
}
|
||
|
bytecnt = ((int) ((char *)p - (char *)s));
|
||
|
|
||
|
#ifdef _MT
|
||
|
if ( (count = MultiByteToWideChar( ptloci->lc_codepage,
|
||
|
#else
|
||
|
if ( (count = MultiByteToWideChar( __lc_codepage,
|
||
|
#endif
|
||
|
MB_PRECOMPOSED,
|
||
|
s,
|
||
|
bytecnt,
|
||
|
pwcs,
|
||
|
(int)n )) == 0 )
|
||
|
{
|
||
|
errno = EILSEQ;
|
||
|
return (size_t)-1;
|
||
|
}
|
||
|
|
||
|
return count; /* no NUL in string */
|
||
|
}
|
||
|
}
|
||
|
else { /* pwcs == NULL, get size only, s must be NUL-terminated */
|
||
|
#ifdef _MT
|
||
|
if (ptloci->lc_handle[LC_CTYPE] == _CLOCALEHANDLE)
|
||
|
#else
|
||
|
if (__lc_handle[LC_CTYPE] == _CLOCALEHANDLE)
|
||
|
#endif
|
||
|
return strlen(s);
|
||
|
|
||
|
else {
|
||
|
#ifdef _MT
|
||
|
if ( (count = MultiByteToWideChar( ptloci->lc_codepage,
|
||
|
#else
|
||
|
if ( (count = MultiByteToWideChar( __lc_codepage,
|
||
|
#endif
|
||
|
MB_PRECOMPOSED |
|
||
|
MB_ERR_INVALID_CHARS,
|
||
|
s,
|
||
|
-1,
|
||
|
NULL,
|
||
|
0 )) == 0 )
|
||
|
{
|
||
|
errno = EILSEQ;
|
||
|
return (size_t)-1;
|
||
|
}
|
||
|
|
||
|
return count - 1;
|
||
|
}
|
||
|
}
|
||
|
|
||
|
#else /* _NTSUBSET_/_POSIX_ */
|
||
|
|
||
|
if (pwcs) {
|
||
|
|
||
|
NTSTATUS Status;
|
||
|
int size;
|
||
|
|
||
|
size = _mbstrlen(s);
|
||
|
Status = RtlMultiByteToUnicodeN(pwcs,
|
||
|
(ULONG) ( n * sizeof( *pwcs ) ),
|
||
|
(PULONG)&size,
|
||
|
(char *)s,
|
||
|
size+1 );
|
||
|
if (!NT_SUCCESS(Status)) {
|
||
|
errno = EILSEQ;
|
||
|
size = -1;
|
||
|
} else {
|
||
|
size = size / sizeof(*pwcs);
|
||
|
if (pwcs[size-1] == L'\0') {
|
||
|
size -= 1;
|
||
|
}
|
||
|
}
|
||
|
return size;
|
||
|
|
||
|
} else { /* pwcs == NULL, get size only, s must be NUL-terminated */
|
||
|
return strlen(s);
|
||
|
}
|
||
|
|
||
|
#endif /* _NTSUBSET_/_POSIX_ */
|
||
|
}
|