/*** *xmbtowc.c - Convert multibyte char to wide char. * * Copyright (c) 1995-2001, Microsoft Corporation. All rights reserved. * *Purpose: * Convert a multibyte character into the equivalent wide character. * *Revision History: * 12-XX-95 PJP Created from mbtowc.c December 1995 by P.J. Plauger * 04-17-96 GJF Updated for current locale locking. Also, reformatted * and made several cosmetic changes. * 09-25-96 GJF Made mbrlen, mbrtowc and mbsrtowcs multithread safe. * 09-17-97 JWM Added "return MB_CUR_MAX" to "if (*pst != 0)" branch. * *******************************************************************************/ #include #include #include #include #include #include #include /* for INT_MAX */ #include /* for EOF */ #include /* for _Cvtvec, _Mbrtowc */ #ifdef _WIN32 #include #include #include #endif /* _WIN32 */ #ifndef _MT #define _Mbrtowc_lk _Mbrtowc #endif /*** *int _Mbrtowc() - Convert multibyte char to wide character. * *Purpose: * Convert a multi-byte character into the equivalent wide character, * according to the specified LC_CTYPE category, or the current locale. * [ANSI]. * * NOTE: Currently, the C libraries support the "C" locale only. * Non-C locale support now available under _INTL switch. *Entry: * wchar_t *pwc = pointer to destination wide character * const char *s = pointer to multibyte character * size_t n = maximum length of multibyte character to consider * mbstate_t *pst = pointer to state * const _Cvtvec * = pointer to locale info * *Exit: * If s = NULL, returns 0, indicating we only use state-independent * character encodings. * If s != NULL, returns: 0 (if *s = null char) * -1 (if the next n or fewer bytes not valid mbc) * number of bytes comprising converted mbc * *Exceptions: * *******************************************************************************/ #ifdef _MT static int __cdecl _Mbrtowc_lk ( wchar_t *pwc, const char *s, size_t n, mbstate_t *pst, const _Cvtvec *ploc ); int _CRTIMP2 __cdecl _Mbrtowc( wchar_t *pwc, const char *s, size_t n, mbstate_t *pst, const _Cvtvec *ploc ) { int retval; #ifdef _MT int local_lock_flag; #endif _lock_locale( local_lock_flag ) retval = _Mbrtowc_lk(pwc, s, n, pst, ploc); _unlock_locale( local_lock_flag ) return retval; } #endif /* _MT */ #ifdef _MT static int __cdecl _Mbrtowc_lk #else /* _MT */ int _CRTIMP2 __cdecl _Mbrtowc #endif /* _MT */ ( wchar_t *pwc, const char *s, size_t n, mbstate_t *pst, const _Cvtvec *ploc ) { _ASSERTE (MB_CUR_MAX == 1 || MB_CUR_MAX == 2); if ( !s || n == 0 ) /* indicate do not have state-dependent encodings, handle zero length string */ return 0; if ( !*s ) { /* handle NULL char */ if (pwc) *pwc = 0; return 0; } #ifdef _WIN32 { /* perform locale-dependent parse */ LCID handle; UINT codepage; if (ploc == 0) { handle = __lc_handle[LC_CTYPE]; codepage = __lc_codepage; } else { handle = ploc->_Hand; codepage = ploc->_Page; } if ( handle == _CLOCALEHANDLE ) { if (pwc) *pwc = (wchar_t)(unsigned char)*s; return sizeof(char); } if (*pst != 0) { /* complete two-byte multibyte character */ ((char *)pst)[1] = *s; if (MB_CUR_MAX <= 1 || (MultiByteToWideChar(codepage, MB_PRECOMPOSED|MB_ERR_INVALID_CHARS, (char *)pst, 2, pwc, (pwc) ? 1 : 0) == 0)) { /* translation failed */ *pst = 0; errno = EILSEQ; return -1; } *pst = 0; return MB_CUR_MAX; } else if ( isleadbyte((unsigned char)*s) ) { /* multi-byte char */ if (n < MB_CUR_MAX) { /* save partial multibyte character */ ((char *)pst)[0] = *s; return (-2); } else if ( MB_CUR_MAX <= 1 || (MultiByteToWideChar( codepage, MB_PRECOMPOSED | MB_ERR_INVALID_CHARS, s, MB_CUR_MAX, pwc, (pwc) ? 1 : 0) == 0) ) { /* validate high byte of mbcs char */ if (!*(s+1)) { *pst = 0; errno = EILSEQ; return -1; } /* else translation failed with no complaint? [pjp] */ } return MB_CUR_MAX; } else { /* single byte char */ if ( MultiByteToWideChar( codepage, MB_PRECOMPOSED|MB_ERR_INVALID_CHARS, s, 1, pwc, (pwc) ? 1 : 0) == 0 ) { errno = EILSEQ; return -1; } return sizeof(char); } } #else /* _WIN32 */ /* stuck the "C" locale again */ if (pwc) *pwc = (wchar_t)(unsigned char)*s; return sizeof(char); #endif /* _WIN32 */ } /*** *wint_t btowc(c) - translate single byte to wide char * *Purpose: * *Entry: * *Exit: * *Exceptions: * *******************************************************************************/ wint_t _CRTIMP2 __cdecl btowc ( int c ) { if (c == EOF) return (WEOF); else { /* convert as one-byte string */ char ch = (char)c; mbstate_t mbst = 0; wchar_t wc; return (_Mbrtowc(&wc, &ch, 1, &mbst, 0) < 0 ? WEOF : wc); } } /*** *size_t mbrlen(s, n, pst) - determine next multibyte code, restartably * *Purpose: * *Entry: * *Exit: * *Exceptions: * *******************************************************************************/ size_t _CRTIMP2 __cdecl mbrlen ( const char *s, size_t n, mbstate_t *pst ) { #ifdef _MT int local_lock_flag; #endif size_t retval; static mbstate_t mbst = {0}; _lock_locale( local_lock_flag ) retval = _Mbrtowc_lk(0, s != 0 ? s : 0, n, pst ? pst : &mbst, 0); _unlock_locale( local_lock_flag ) return retval; } /*** *size_t mbrtowc(pwc, s, n, pst) - translate multibyte to wchar_t, restartably * *Purpose: * *Entry: * *Exit: * *Exceptions: * *******************************************************************************/ size_t _CRTIMP2 __cdecl mbrtowc ( wchar_t *pwc, const char *s, size_t n, mbstate_t *pst ) { #ifdef _MT int local_lock_flag; #endif size_t retval; static mbstate_t mbst = {0}; _lock_locale( local_lock_flag ) retval = (s != 0) ? _Mbrtowc_lk(pwc, s, n, pst ? pst : &mbst, 0) : _Mbrtowc_lk(0, "", n, pst ? pst : &mbst, 0); _unlock_locale( local_lock_flag ) return retval; } /*** *size_t mbsrtowcs(wcs, ps, n, pst) - translate multibyte string to wide, * restartably * *Purpose: * *Entry: * *Exit: * *Exceptions: * *******************************************************************************/ size_t _CRTIMP2 __cdecl mbsrtowcs ( wchar_t *wcs, const char **ps, size_t n, mbstate_t *pst ) { const char *s = *ps; int i; size_t nwc = 0; #ifdef _MT int local_lock_flag; #endif static mbstate_t mbst = {0}; if (pst == 0) pst = &mbst; _lock_locale( local_lock_flag ) if (wcs == 0) for (; ; ++nwc, s += i) { /* translate but don't store */ wchar_t wc; if ((i = _Mbrtowc_lk(&wc, s, INT_MAX, pst, 0)) < 0) { _unlock_locale( local_lock_flag ) return ((size_t)-1); } else if (i == 0) { _unlock_locale( local_lock_flag ) return (nwc); } } for (; 0 < n; ++nwc, s += i, ++wcs, --n) { /* translate and store */ if ((i = _Mbrtowc_lk(wcs, s, INT_MAX, pst, 0)) < 0) { /* encountered invalid sequence */ nwc = (size_t)-1; break; } else if (i == 0) { /* encountered terminating null */ s = 0; break; } } *ps = s; _unlock_locale( local_lock_flag ) return (nwc); }