windows-nt/Source/XPSP1/NT/inetsrv/iis/svcs/infocomm/kisfecnv/unix2pc.c
2020-09-26 16:20:57 +08:00

295 lines
12 KiB
C

// File Name: unix2pc.c
// Owner: Tetsuhide Akaishi
// Revision: 1.00 02/21/'93 Tetsuhide Akaishi
//
#include "win32.h"
#include "fechrcnv.h"
#ifdef DBCS_DIVIDE
// Carry-over state used by JPNUNIX_to_PC when a double-byte character is
// split across two successive input buffers.  Each record holds the code set
// in effect (nCodeSet) and the lead byte that was held back (cSavedByte).
// dStatus0 is consulted and updated by size-query calls (PCChar_len == 0);
// dStatus is consulted and updated by calls that actually convert
// (PCChar_len != 0).  Both are defined in another translation unit.
extern DBCS_STATUS dStatus0;
extern DBCS_STATUS dStatus;
#endif
#ifdef IEXPLORE
// Code set remembered between calls of JPNUNIX_to_PC: while it is
// CODE_UNKNOWN the code set is resolved from the arguments/input and stored
// here; otherwise the stored value overrides the CodeSet argument.
extern int nCurrentCodeSet;
#endif
int JPNUNIX_to_PC ( int CodeSet,
                    UCHAR *pUNIXChar, int UNIXChar_len,
                    UCHAR *pPCChar, int PCChar_len )
// The JPNUNIX_to_PC function converts a character string encoded in one of
// the Japanese UNIX code sets into a PC code set (Shift JIS) string.
//
// int CodeSet          Code set of the input string.
//                      Three Japanese code sets are used in the UNIX world:
//                      JIS, EUC and Shift JIS.  The following constants are
//                      accepted:
//
//                      Value           Meaning
//                      CODE_UNKNOWN    Unknown.  The code set is detected
//                                      from the input with DetectJPNCode;
//                                      input reported as CODE_ONLY_SBCS is
//                                      treated as JIS.
//                      CODE_JPN_JIS    JIS.  Converted with JIS_to_ShiftJIS.
//                      CODE_JPN_EUC    EUC.  Converted with EUC_to_ShiftJIS.
//                      CODE_JPN_SJIS   Shift JIS.  The bytes are copied.
//                      Any other value is handled like CODE_JPN_SJIS.
//
//                      When built with DBCS_DIVIDE or IEXPLORE, a code set
//                      remembered from an earlier call (dStatus0 / dStatus /
//                      nCurrentCodeSet) takes precedence over this argument.
//
// UCHAR *pUNIXChar     Points to the character string to be converted.
//
// int UNIXChar_len     Size in bytes of the string pointed to by pUNIXChar.
//                      If this value is -1, the string is assumed to be NUL
//                      terminated and the length (including the terminator)
//                      is calculated automatically.
//
// UCHAR *pPCChar       Points to the buffer that receives the converted
//                      string.
//
// int PCChar_len       Size, in PC characters, of the buffer pointed to by
//                      pPCChar.  If the value is zero, the function returns
//                      the number of PC characters required for the buffer
//                      and makes no use of pPCChar.
//
// Return Value
// If the function succeeds and PCChar_len is nonzero, the return value is the
// number of PC characters written to the buffer pointed to by pPCChar.
//
// If the function succeeds and PCChar_len is zero, the return value is the
// required size, in PC characters, of a buffer that can receive the
// converted string.
//
// If the function fails, the return value is -1.  In the Shift JIS copy path
// built without DBCS_DIVIDE this means the pPCChar buffer is too small for
// the converted string, or UNIXChar_len is negative (other than -1).
//
{
    int re;

    // NOTE: the three conditionally compiled fragments below form a single
    // if / else-if / else chain.  The dangling "else" of one fragment binds
    // to the "if" that starts the next one, so their order and exact shape
    // must not be changed independently.
#ifdef DBCS_DIVIDE
    int i = 0, nDelta = 0;

    // A code set recorded by a previous call that ended in the middle of a
    // double-byte character overrides the caller's CodeSet.
    if ( PCChar_len == 0 && dStatus0.nCodeSet != CODE_UNKNOWN )
        CodeSet = dStatus0.nCodeSet;
    else if ( PCChar_len != 0 && dStatus.nCodeSet != CODE_UNKNOWN )
        CodeSet = dStatus.nCodeSet;
    else
#endif
#ifdef IEXPLORE
    if ( nCurrentCodeSet == CODE_UNKNOWN ) {
#endif
        if ( CodeSet == CODE_UNKNOWN ) {
            if ( ( CodeSet = DetectJPNCode ( pUNIXChar, UNIXChar_len ) )
                                       == CODE_ONLY_SBCS ) {
                // Single-byte-only input is handled by the JIS converter.
                CodeSet = CODE_JPN_JIS;
            }
        }
#ifdef IEXPLORE
        // Remember the resolved code set for subsequent calls.
        nCurrentCodeSet = CodeSet;
    } else
        CodeSet = nCurrentCodeSet;
#endif

    switch ( CodeSet ) {
    case CODE_JPN_JIS:    // Japanese JIS Code
        // Convert from JIS to Shift JIS
        re = JIS_to_ShiftJIS ( pUNIXChar, UNIXChar_len,
                               pPCChar, PCChar_len );
        break;

    case CODE_JPN_EUC:    // Japanese EUC Code
        // Convert from EUC to Shift JIS
        re = EUC_to_ShiftJIS ( pUNIXChar, UNIXChar_len,
                               pPCChar, PCChar_len );
        break;

    default:
    case CODE_JPN_SJIS:   // Japanese Shift JIS Code
        // The input already is Shift JIS: copy only.
        if ( UNIXChar_len == -1 ) {
            // Count the terminating NUL as part of the string.
            UNIXChar_len = (int)strlen ( (const char *)pUNIXChar ) + 1;
        }
        if ( PCChar_len != 0 ) {
#ifdef DBCS_DIVIDE
            UCHAR *pPCCharEnd = pPCChar + PCChar_len - 1;

            // A lead byte held back by the previous call is emitted first,
            // followed by its trail byte (the first input byte).  pPCChar
            // is advanced by one so that pPCChar[i] keeps lining up with
            // pUNIXChar[i] for the rest of the copy.
            if ( dStatus.nCodeSet == CODE_JPN_SJIS && dStatus.cSavedByte ) {
                *pPCChar++ = dStatus.cSavedByte;
                *pPCChar = *pUNIXChar;
                ++UNIXChar_len;
                ++nDelta;
                ++i;
                dStatus.nCodeSet = CODE_UNKNOWN;
                dStatus.cSavedByte = '\0';
            }
            while ( i < UNIXChar_len - nDelta ) {
                if ( IsDBCSLeadByte ( *(pUNIXChar + i) ) ) {
                    if ( i == UNIXChar_len - nDelta - 1 ) {
                        // Lead byte is the last input byte: hold it back
                        // for the next call.
                        dStatus.nCodeSet = CODE_JPN_SJIS;
                        dStatus.cSavedByte = *(pUNIXChar + i);
                        --UNIXChar_len;
                        break;
                    } else if ( ( i == UNIXChar_len - nDelta - 2 ) &&
                                ( *(pUNIXChar + i + 1) == '\0' ) ) {
                        // Lead byte followed only by the terminator: hold
                        // it back as well.
                        dStatus.nCodeSet = CODE_JPN_SJIS;
                        dStatus.cSavedByte = *(pUNIXChar + i);
                        // NOTE(review): the terminator is stored at offset
                        // i + 1 while nothing is stored at offset i on this
                        // path -- confirm this is intended.
                        *(pPCChar + i + 1) = '\0';
                        --UNIXChar_len;
                        break;
                    }
                    // NOTE(review): only the first byte of the pair is
                    // compared against the end of the destination, and the
                    // single-byte branch below performs no check at all.
                    if ( pPCChar + i > pPCCharEnd )   // check destination buf
                        break;
                    // Copy lead and trail byte.  The index is advanced in a
                    // separate statement: reading and post-incrementing i
                    // inside one unsequenced expression is undefined
                    // behaviour.
                    pPCChar[i] = pUNIXChar[i];
                    i++;
                    pPCChar[i] = pUNIXChar[i];
                    i++;
                } else {
                    pPCChar[i] = pUNIXChar[i];
                    i++;
                }
            }
#else
            // Reject a negative length (it would reach memmove as a huge
            // size) and a destination buffer that is too small.
            if ( UNIXChar_len < 0 || UNIXChar_len > PCChar_len ) {
                return ( -1 );
            }
            memmove ( pPCChar, pUNIXChar, UNIXChar_len );
#endif
        }
#ifdef DBCS_DIVIDE
        else {    // Only return the required size
            // Mirror the bookkeeping of the copy path without writing
            // anything, using the size-query state dStatus0.
            if ( dStatus0.nCodeSet == CODE_JPN_SJIS ) {   // 1st byte was saved
                ++UNIXChar_len;
                ++nDelta;
                ++i;
                dStatus0.nCodeSet = CODE_UNKNOWN;
                dStatus0.cSavedByte = '\0';
            }
            while ( i < UNIXChar_len - nDelta ) {
                if ( IsDBCSLeadByte ( *(pUNIXChar + i) ) ) {
                    if ( i == UNIXChar_len - nDelta - 1 ) {
                        dStatus0.nCodeSet = CODE_JPN_SJIS;
                        dStatus0.cSavedByte = *(pUNIXChar + i);
                        --UNIXChar_len;
                        break;
                    } else if ( ( i == UNIXChar_len - nDelta - 2 ) &&
                                ( *(pUNIXChar + i + 1) == '\0' ) ) {
                        dStatus0.nCodeSet = CODE_JPN_SJIS;
                        dStatus0.cSavedByte = *(pUNIXChar + i);
                        --UNIXChar_len;
                        break;
                    }
                    i += 2;
                } else
                    i++;
            }
        }
#endif
        re = UNIXChar_len;
        break;
    }
    return ( re );
}
int WINAPI UNIX_to_PC ( int CodePage, int CodeSet,
                        UCHAR *pUNIXChar, int UNIXChar_len,
                        UCHAR *pPCChar, int PCChar_len )
// The UNIX_to_PC function converts a character string encoded in a UNIX code
// set into a PC code set string.
//
// int CodePage         Country code page.
//                      If this value is -1, the function uses the OEM code
//                      page reported by the operating system (GetOEMCP).
//
//                      Value           Meaning
//                      -1              Auto detect mode.
//                      932             Japan.
//                      ???             Taiwan.
//                      ???             Korea.
//                      ???             PRC (China)?
//
//                      Only code page 932 has a converter; for every other
//                      code page the input is copied unchanged.
//
// int CodeSet          Code set type.
//                      Three Japanese code sets are used in the UNIX world:
//                      JIS, EUC and Shift JIS.  When CodePage is Japanese,
//                      the following code set constants are defined:
//
//                      Value           Meaning
//                      CODE_UNKNOWN    Unknown.  The code set is detected
//                                      automatically.
//                      CODE_JPN_JIS    JIS code set.  pUNIXChar is converted
//                                      as a JIS string to a PC code set
//                                      string.
//                      CODE_JPN_EUC    EUC code set.  pUNIXChar is converted
//                                      as an EUC string to a PC code set
//                                      string.
//                      CODE_JPN_SJIS   Shift JIS code set.
//
// UCHAR *pUNIXChar     Points to the character string to be converted.
//
// int UNIXChar_len     Size in bytes of the string pointed to by pUNIXChar.
//                      If this value is -1, the string is assumed to be NUL
//                      terminated and the length (including the terminator)
//                      is calculated automatically.
//
// UCHAR *pPCChar       Points to the buffer that receives the converted
//                      string.
//
// int PCChar_len       Size, in PC characters, of the buffer pointed to by
//                      pPCChar.  If the value is zero, the function returns
//                      the number of PC characters required for the buffer
//                      and makes no use of pPCChar.
//
// Return Value
// If the function succeeds and PCChar_len is nonzero, the return value is the
// number of PC characters written to the buffer pointed to by pPCChar.
//
// If the function succeeds and PCChar_len is zero, the return value is the
// required size, in PC characters, of a buffer that can receive the
// converted string.
//
// If the function fails, the return value is -1.  In the plain copy path this
// means the pPCChar buffer is too small for the converted string, or
// UNIXChar_len is negative (other than -1).
//
//@
{
    int re;

    if ( CodePage == -1 ) {
        CodePage = (int)GetOEMCP();
    }

    switch ( CodePage ) {
    case 932:    // Japanese Code Page
        re = JPNUNIX_to_PC ( CodeSet, pUNIXChar, UNIXChar_len,
                             pPCChar, PCChar_len );
        break;

    // Converters for the Taiwan, Korea and PRC code pages are not
    // implemented; those code pages take the copy-only path below.
    default:
        // Start Only Copy Process
        if ( UNIXChar_len == -1 ) {
            // Count the terminating NUL as part of the string.
            UNIXChar_len = (int)strlen ( (const char *)pUNIXChar ) + 1;
        }
        if ( UNIXChar_len < 0 ) {
            // Any other negative length is invalid; without this check it
            // would pass the size comparison below and reach memmove as a
            // huge unsigned size.
            return ( -1 );
        }
        if ( PCChar_len != 0 ) {
            if ( UNIXChar_len > PCChar_len ) {    // Is the buffer small?
                return ( -1 );
            }
            memmove ( pPCChar, pUNIXChar, UNIXChar_len );
        }
        re = UNIXChar_len;
        break;
    }
    return ( re );
}