Windows2003-3790/base/win32/winnls/data/dlls/iso_2022/c_is2022.c
2020-09-30 16:53:55 +02:00

1428 lines
43 KiB
C

/*++
Copyright (c) 1991-1999, Microsoft Corporation All rights reserved.
Module Name:
c_is2022.c
Abstract:
This file contains the main functions for this module.
External Routines in this file:
DllEntry
NlsDllCodePageTranslation
Revision History:
10-30-96 JulieB Created.
--*/
////////////////////////////////////////////////////////////////////////////
//
// 50220 ISO-2022-JP Japanese JIS X 0202-1984 with no halfwidth Katakana
// 50221 ISO-2022-JP Japanese JIS X 0202-1984 with <ESC>(I for halfwidth Katakana
// 50222 ISO-2022-JP Japanese JIS X 0201-1989 with <ESC>(J+SO for halfwidth Katakana
// ;RFC 1468
//
// 50225 ISO-2022-KR Korean KSC-5601-1987 ;RFC 1557
//
// 50227 ISO 2022-CN Traditional Chinese ;RFC 1922:CNS-11643-1,CNS-11643-2
// 50229 ISO 2022-CN Simplified Chinese ;RFC 1922:GB-2312-80
//
// 52936 HZ-GB2312 Simplified Chinese
//
////////////////////////////////////////////////////////////////////////////
//
// Include Files.
//
#include <share.h>
//
// Macro Definitions.
//
#define NLS_CODEPAGE(cp) (NLS_CP[(cp) % 10])
#define SHIFT_OUT ((BYTE)0x0E)
#define SHIFT_IN ((BYTE)0x0F)
#define ESCAPE ((BYTE)0x1B)
#define LEADBYTE_HALFWIDTH ((BYTE)0x8E)
#define MODE_ASCII 11
#define MODE_HALFWIDTH_KATAKANA 0
#define MODE_JIS_0208 1
#define MODE_JIS_0212 2
#define MODE_KSC_5601 5
#define MODE_HZ 6
#define MODE_GB_2312 7
#define MODE_CNS_11643_1 9
#define MODE_CNS_11643_2 10
//
// Global Variables.
//
DWORD NLS_CP[] =
{
20932, // 50220 ISO-2022-JP, MODE_HALFWIDTH_KATAKANA
20932, // 50221 ISO-2022-JP, MODE_JIS_0208
20932, // 50222 ISO-2022-JP, MODE_JIS_0212
0,
0,
20949, // 50225 ISO-2022-KR, MODE_KSC_5601
20936, // 52936 HZ-GB2312, MODE_HZ
20936, // 50227 ISO-2022-CN, MODE_GB_2312
0,
20000, // 50229 ISO-2022-CN, MODE_CNS_11643_1
20000, // 50229 ISO-2022-CN, MODE_CNS_11643_2
0 // MODE_ASCII
};
//
// Forward Declarations.
//
DWORD
ParseMB_CP5022J(
DWORD CodePage,
LPSTR lpMultiByteStr,
int cchMultiByte,
LPSTR lpMBNoEscStr,
int cchMBCount);
DWORD
ParseMB_CP5022_579(
DWORD CodePage,
LPSTR lpMultiByteStr,
int cchMultiByte,
LPSTR lpMBNoEscStr,
int cchMBCount);
DWORD
ParseMB_CP52936(
LPSTR lpMultiByteStr,
int cchMultiByte,
LPSTR lpMBNoEscStr,
int cchMBCount);
DWORD
MBToWC_CP5022X(
LPSTR lpMultiByteStr,
int cchMultiByte,
LPWSTR lpWideCharStr,
int cchWideChar);
DWORD
MBToWC_CP52936(
LPSTR lpMultiByteStr,
int cchMultiByte,
LPWSTR lpWideCharStr,
int cchWideChar);
//-------------------------------------------------------------------------//
// DLL ENTRY POINT //
//-------------------------------------------------------------------------//
////////////////////////////////////////////////////////////////////////////
//
// DllEntry
//
// DLL Entry initialization procedure.
//
// 10-30-96 JulieB Created.
////////////////////////////////////////////////////////////////////////////
BOOL DllEntry(
HANDLE hModule,
DWORD dwReason,
LPVOID lpRes)
{
switch (dwReason)
{
case ( DLL_THREAD_ATTACH ) :
{
return (TRUE);
}
case ( DLL_THREAD_DETACH ) :
{
return (TRUE);
}
case ( DLL_PROCESS_ATTACH ) :
{
return (TRUE);
}
case ( DLL_PROCESS_DETACH ) :
{
return (TRUE);
}
}
return (FALSE);
hModule;
lpRes;
}
//-------------------------------------------------------------------------//
// EXTERNAL ROUTINES //
//-------------------------------------------------------------------------//
////////////////////////////////////////////////////////////////////////////
//
// NlsDllCodePageTranslation
//
// This routine is the main exported procedure for the functionality in
// this DLL. All calls to this DLL must go through this function.
//
// 10-30-96 JulieB Created.
////////////////////////////////////////////////////////////////////////////
DWORD NlsDllCodePageTranslation(
DWORD CodePage,
DWORD dwFlags,
LPSTR lpMultiByteStr,
int cchMultiByte,
LPWSTR lpWideCharStr,
int cchWideChar,
LPCPINFO lpCPInfo)
{
DWORD NlsCodePage = NLS_CODEPAGE(CodePage);
if (!IsValidCodePage(NlsCodePage))
{
SetLastError(ERROR_INVALID_PARAMETER);
return (0);
}
switch (dwFlags)
{
case ( NLS_CP_CPINFO ) :
{
memset(lpCPInfo, 0, sizeof(CPINFO));
lpCPInfo->MaxCharSize = 5;
lpCPInfo->DefaultChar[0] = 0x3f;
//
// The lead-byte does not apply here, leave them all NULL.
//
return (TRUE);
}
case ( NLS_CP_MBTOWC ) :
{
if (cchMultiByte == -1)
{
cchMultiByte = strlen(lpMultiByteStr) + 1;
}
switch (CodePage)
{
case (50220) :
case (50221) :
case (50222) :
case (50225) :
case (50227) :
case (50229) :
{
return (MBToWC_CP5022X( lpMultiByteStr,
cchMultiByte,
lpWideCharStr,
cchWideChar ));
}
case (52936) :
{
return (MBToWC_CP52936( lpMultiByteStr,
cchMultiByte,
lpWideCharStr,
cchWideChar ));
}
}
break;
}
case ( NLS_CP_WCTOMB ) :
{
int cchMBCount;
LPSTR lpMBNoEscStr;
if (cchWideChar == -1)
{
cchWideChar = wcslen(lpWideCharStr) + 1;
}
lpMBNoEscStr = (LPSTR)NLS_ALLOC_MEM(cchWideChar * sizeof(WCHAR));
if (lpMBNoEscStr == NULL)
{
SetLastError(ERROR_OUTOFMEMORY);
return (0);
}
cchMBCount = WideCharToMultiByte( NlsCodePage,
WC_NO_BEST_FIT_CHARS,
lpWideCharStr,
cchWideChar,
lpMBNoEscStr,
cchWideChar * sizeof(WCHAR),
NULL,
NULL );
if (cchMBCount != 0)
{
switch (CodePage)
{
case (50220) :
case (50221) :
case (50222) :
{
cchMBCount = ParseMB_CP5022J( CodePage,
lpMultiByteStr,
cchMultiByte,
lpMBNoEscStr,
cchMBCount );
break;
}
case (50225) :
case (50227) :
case (50229) :
{
cchMBCount = ParseMB_CP5022_579( CodePage,
lpMultiByteStr,
cchMultiByte,
lpMBNoEscStr,
cchMBCount );
break;
}
case (52936) :
{
cchMBCount = ParseMB_CP52936( lpMultiByteStr,
cchMultiByte,
lpMBNoEscStr,
cchMBCount );
break;
}
}
}
NLS_FREE_MEM (lpMBNoEscStr);
return (cchMBCount);
}
}
//
// This shouldn't happen since this function gets called by
// the NLS API routines.
//
SetLastError(ERROR_INVALID_PARAMETER);
return (0);
}
//-------------------------------------------------------------------------//
// INTERNAL ROUTINES //
//-------------------------------------------------------------------------//
////////////////////////////////////////////////////////////////////////////
//
// MBToWC_CP5022X
//
// This routine does the translations from ISO-2022 to Unicode.
//
////////////////////////////////////////////////////////////////////////////
DWORD MBToWC_CP5022X(
LPSTR lpMultiByteStr,
int cchMultiByte,
LPWSTR lpWideCharStr,
int cchWideChar)
{
int ctr, cchMBTemp = 0, cchWCCount = 0;
LPSTR lpMBTempStr, lpMBNoEscStr, lpMBStrStart;
WORD wMode, wModePrev, wModeSO;
LPWSTR lpWCTempStr;
int rc;
//
// Allocate a buffer of the appropriate size.
// Use sizeof(WCHAR) because size could potentially double if
// the buffer contains all halfwidth Katakanas.
//
lpMBStrStart = (LPSTR)NLS_ALLOC_MEM(cchMultiByte * sizeof(WCHAR));
if (lpMBStrStart == NULL)
{
SetLastError(ERROR_OUTOFMEMORY);
return (0);
}
lpWCTempStr = (LPWSTR)NLS_ALLOC_MEM(cchMultiByte * sizeof(WCHAR));
if (lpWCTempStr == NULL)
{
SetLastError(ERROR_OUTOFMEMORY);
return (0);
}
if (cchWideChar)
{
*lpWideCharStr = 0;
}
lpMBTempStr = lpMBNoEscStr = lpMBStrStart;
wModePrev = wMode = wModeSO = MODE_ASCII;
//
// Remove esc sequence, then convert to Unicode.
//
for (ctr = 0; ctr < cchMultiByte;)
{
if ((BYTE)lpMultiByteStr[ctr] == ESCAPE)
{
wMode = wModeSO = MODE_ASCII;
if (ctr >= (cchMultiByte - 2))
{
//
// Incomplete escape sequence.
//
}
else if ((BYTE)lpMultiByteStr[ctr + 1] == '(')
{
if ((BYTE)lpMultiByteStr[ctr + 2] == 'B') // <esc>(B
{
wMode = wModeSO = MODE_ASCII;
ctr += 3;
}
else if ((BYTE)lpMultiByteStr[ctr + 2] == 'J') // <esc>(J
{
wMode = MODE_ASCII;
wModeSO = MODE_HALFWIDTH_KATAKANA;
ctr += 3;
}
else if ((BYTE)lpMultiByteStr[ctr + 2] == 'I') // <esc>(I
{
wMode = wModeSO = MODE_HALFWIDTH_KATAKANA;
ctr += 3;
}
}
else if ((BYTE)lpMultiByteStr[ctr + 1] == '$')
{
if (((BYTE)lpMultiByteStr[ctr + 2] == '@') || // <esc>$@
((BYTE)lpMultiByteStr[ctr + 2] == 'B')) // <esc>$B
{
wMode = wModeSO = MODE_JIS_0208;
ctr += 3;
}
else
{
if (ctr >= (cchMultiByte - 3))
{
//
// Imcomplete escape sequence.
//
}
else if ((BYTE)lpMultiByteStr[ctr + 2] == '(')
{
if (((BYTE)lpMultiByteStr[ctr + 3] == '@') || // <esc>$(@
((BYTE)lpMultiByteStr[ctr + 3] == 'B')) // <esc>$(B
{
wMode = wModeSO = MODE_JIS_0208;
ctr += 4;
}
else if ((BYTE)lpMultiByteStr[ctr + 3] == 'D') // <esc>$(D
{
wMode = wModeSO = MODE_JIS_0212;
ctr += 4;
}
}
else if ((BYTE)lpMultiByteStr[ctr + 2] == ')')
{
if ((BYTE)lpMultiByteStr[ctr + 3] == 'C') // <esc>$)C
{
wMode = wModeSO = MODE_KSC_5601;
ctr += 4;
}
else if ((BYTE)lpMultiByteStr[ctr + 3] == 'A') // <esc>$)A
{
wMode = wModeSO = MODE_GB_2312;
ctr += 4;
}
else if ((BYTE)lpMultiByteStr[ctr + 3] == 'G') // <esc>$)G
{
wMode = wModeSO = MODE_CNS_11643_1;
ctr += 4;
}
}
else if (((BYTE)lpMultiByteStr[ctr + 2] == '*') && // <esc>$*H
((BYTE)lpMultiByteStr[ctr + 3] == 'H'))
{
wMode = wModeSO = MODE_CNS_11643_2;
ctr += 4;
}
}
}
else if (lpMultiByteStr[ctr + 1] == '&')
{
if (ctr >= (cchMultiByte - 5))
{
//
// Incomplete escape sequence.
//
}
else if (((BYTE)lpMultiByteStr[ctr + 2] == '@') &&
((BYTE)lpMultiByteStr[ctr + 3] == ESCAPE) &&
((BYTE)lpMultiByteStr[ctr + 4] == '$') &&
((BYTE)lpMultiByteStr[ctr + 5] == 'B'))
{
wMode = wModeSO = MODE_JIS_0208;
ctr += 6;
}
}
}
else if ((BYTE)lpMultiByteStr[ctr] == SHIFT_OUT)
{
wMode = wModeSO;
ctr++;
}
else if ((BYTE)lpMultiByteStr[ctr] == SHIFT_IN)
{
wMode = MODE_ASCII;
ctr++;
}
switch (wMode)
{
case ( MODE_JIS_0208 ) :
case ( MODE_KSC_5601 ) :
case ( MODE_GB_2312 ) :
case ( MODE_CNS_11643_1 ) :
{
//
// To handle errors, we need to check:
// 1. if trailbyte is there
// 2. if code is valid
//
while (ctr < cchMultiByte && lpMultiByteStr[ctr] == SHIFT_OUT)
{
ctr++;
}
while ((ctr < (cchMultiByte - 1)) &&
(lpMultiByteStr[ctr] != ESCAPE) &&
(lpMultiByteStr[ctr] != SHIFT_IN))
{
*lpMBTempStr++ = lpMultiByteStr[ctr++] | 0x80;
*lpMBTempStr++ = lpMultiByteStr[ctr++] | 0x80;
cchMBTemp += 2;
}
break;
}
case ( MODE_JIS_0212 ) :
case ( MODE_CNS_11643_2 ) :
{
while (ctr < cchMultiByte && lpMultiByteStr[ctr] == SHIFT_OUT)
{
ctr++;
}
while ((ctr < (cchMultiByte - 1)) &&
(lpMultiByteStr[ctr] != ESCAPE) &&
(lpMultiByteStr[ctr] != SHIFT_IN))
{
*lpMBTempStr++ = lpMultiByteStr[ctr++] | 0x80;
*lpMBTempStr++ = lpMultiByteStr[ctr++];
cchMBTemp += 2;
}
break;
}
case ( MODE_HALFWIDTH_KATAKANA ) :
{
while (ctr < cchMultiByte && lpMultiByteStr[ctr] == SHIFT_OUT)
{
ctr++;
}
while ((ctr < cchMultiByte) &&
(lpMultiByteStr[ctr] != ESCAPE) &&
(lpMultiByteStr[ctr] != SHIFT_IN))
{
*lpMBTempStr++ = (BYTE)0x8E;
*lpMBTempStr++ = lpMultiByteStr[ctr++] | 0x80;
cchMBTemp += 2;
}
break;
}
default : // MODE_ASCII
{
while (ctr < cchMultiByte && lpMultiByteStr[ctr] == SHIFT_IN)
{
ctr++;
}
while ((ctr < cchMultiByte) &&
(lpMultiByteStr[ctr] != ESCAPE) &&
(lpMultiByteStr[ctr] != SHIFT_OUT))
{
*lpMBTempStr++ = lpMultiByteStr[ctr++];
cchMBTemp++;
}
}
}
if (cchMBTemp == 0)
{
break;
}
rc = MultiByteToWideChar( NLS_CP[wMode],
0,
lpMBNoEscStr,
cchMBTemp,
lpWCTempStr,
cchMultiByte );
if (cchWideChar)
{
if ((cchWCCount + rc) > cchWideChar)
{
//
// Output buffer is too small.
//
SetLastError(ERROR_INSUFFICIENT_BUFFER);
cchWCCount = 0;
break;
}
else
{
memcpy( lpWideCharStr + cchWCCount,
lpWCTempStr,
rc * sizeof(WCHAR) );
}
}
cchWCCount += rc;
lpMBNoEscStr += cchMBTemp;
cchMBTemp = 0;
}
//
// Clean up memory allocations.
//
NLS_FREE_MEM(lpMBStrStart);
NLS_FREE_MEM(lpWCTempStr);
//
// Return the result.
//
return (cchWCCount);
}
////////////////////////////////////////////////////////////////////////////
//
// ParseMB_CP5022J
//
// --> ISO-2022-JP
//
// for 50220 : convert all halfwidth katakana to fullwidth
// 50221 : use <esc>(I for halfwidth katakana
// 50222 : use <esc>(J<SO> for halfwidth katakana
//
////////////////////////////////////////////////////////////////////////////
DWORD ParseMB_CP5022J(
DWORD CodePage,
LPSTR lpMultiByteStr,
int cchMultiByte,
LPSTR lpMBNoEscStr,
int cchMBCount)
{
int ctr, cchMBTemp = 0;
WORD wMode, wModeSO;
LPSTR lpMBTempStr;
static WORD HalfToFullWidthKanaTable[] =
{
0xa1a3, // 0x8ea1 : Halfwidth Ideographic Period
0xa1d6, // 0x8ea2 : Halfwidth Opening Corner Bracket
0xa1d7, // 0x8ea3 : Halfwidth Closing Corner Bracket
0xa1a2, // 0x8ea4 : Halfwidth Ideographic Comma
0xa1a6, // 0x8ea5 : Halfwidth Katakana Middle Dot
0xa5f2, // 0x8ea6 : Halfwidth Katakana Wo
0xa5a1, // 0x8ea7 : Halfwidth Katakana Small A
0xa5a3, // 0x8ea8 : Halfwidth Katakana Small I
0xa5a5, // 0x8ea9 : Halfwidth Katakana Small U
0xa5a7, // 0x8eaa : Halfwidth Katakana Small E
0xa5a9, // 0x8eab : Halfwidth Katakana Small O
0xa5e3, // 0x8eac : Halfwidth Katakana Small Ya
0xa5e5, // 0x8ead : Halfwidth Katakana Small Yu
0xa5e7, // 0x8eae : Halfwidth Katakana Small Yo
0xa5c3, // 0x8eaf : Halfwidth Katakana Small Tu
0xa1bc, // 0x8eb0 : Halfwidth Katakana-Hiragana Prolonged Sound Mark
0xa5a2, // 0x8eb1 : Halfwidth Katakana A
0xa5a4, // 0x8eb2 : Halfwidth Katakana I
0xa5a6, // 0x8eb3 : Halfwidth Katakana U
0xa5a8, // 0x8eb4 : Halfwidth Katakana E
0xa5aa, // 0x8eb5 : Halfwidth Katakana O
0xa5ab, // 0x8eb6 : Halfwidth Katakana Ka
0xa5ad, // 0x8eb7 : Halfwidth Katakana Ki
0xa5af, // 0x8eb8 : Halfwidth Katakana Ku
0xa5b1, // 0x8eb9 : Halfwidth Katakana Ke
0xa5b3, // 0x8eba : Halfwidth Katakana Ko
0xa5b5, // 0x8ebb : Halfwidth Katakana Sa
0xa5b7, // 0x8ebc : Halfwidth Katakana Si
0xa5b9, // 0x8ebd : Halfwidth Katakana Su
0xa5bb, // 0x8ebe : Halfwidth Katakana Se
0xa5bd, // 0x8ebf : Halfwidth Katakana So
0xa5bf, // 0x8ec0 : Halfwidth Katakana Ta
0xa5c1, // 0x8ec1 : Halfwidth Katakana Ti
0xa5c4, // 0x8ec2 : Halfwidth Katakana Tu
0xa5c6, // 0x8ec3 : Halfwidth Katakana Te
0xa5c8, // 0x8ec4 : Halfwidth Katakana To
0xa5ca, // 0x8ec5 : Halfwidth Katakana Na
0xa5cb, // 0x8ec6 : Halfwidth Katakana Ni
0xa5cc, // 0x8ec7 : Halfwidth Katakana Nu
0xa5cd, // 0x8ec8 : Halfwidth Katakana Ne
0xa5ce, // 0x8ec9 : Halfwidth Katakana No
0xa5cf, // 0x8eca : Halfwidth Katakana Ha
0xa5d2, // 0x8ecb : Halfwidth Katakana Hi
0xa5d5, // 0x8ecc : Halfwidth Katakana Hu
0xa5d8, // 0x8ecd : Halfwidth Katakana He
0xa5db, // 0x8ece : Halfwidth Katakana Ho
0xa5de, // 0x8ecf : Halfwidth Katakana Ma
0xa5df, // 0x8ed0 : Halfwidth Katakana Mi
0xa5e0, // 0x8ed1 : Halfwidth Katakana Mu
0xa5e1, // 0x8ed2 : Halfwidth Katakana Me
0xa5e2, // 0x8ed3 : Halfwidth Katakana Mo
0xa5e4, // 0x8ed4 : Halfwidth Katakana Ya
0xa5e6, // 0x8ed5 : Halfwidth Katakana Yu
0xa5e8, // 0x8ed6 : Halfwidth Katakana Yo
0xa5e9, // 0x8ed7 : Halfwidth Katakana Ra
0xa5ea, // 0x8ed8 : Halfwidth Katakana Ri
0xa5eb, // 0x8ed9 : Halfwidth Katakana Ru
0xa5ec, // 0x8eda : Halfwidth Katakana Re
0xa5ed, // 0x8edb : Halfwidth Katakana Ro
0xa5ef, // 0x8edc : Halfwidth Katakana Wa
0xa5f3, // 0x8edd : Halfwidth Katakana N
0xa1ab, // 0x8ede : Halfwidth Katakana Voiced Sound Mark
0xa1ac // 0x8edf : Halfwidth Katakana Semi-Voiced Sound Mark
};
wMode = wModeSO = MODE_ASCII;
//
// Code page 50220 does not use halfwidth Katakana.
// Convert to fullwidth.
//
if (CodePage == 50220)
{
for (ctr = 0; ctr < cchMBCount; ctr++)
{
WORD wFWKana;
if ((BYTE)lpMBNoEscStr[ctr] == LEADBYTE_HALFWIDTH)
{
wFWKana = HalfToFullWidthKanaTable[(BYTE)lpMBNoEscStr[ctr + 1] - 0xA1];
lpMBNoEscStr[ctr++] = HIBYTE(wFWKana);
lpMBNoEscStr[ctr] = LOBYTE(wFWKana);
}
}
}
lpMBTempStr = lpMultiByteStr;
for (ctr = 0; ctr < cchMBCount; ctr++)
{
if ((BYTE)lpMBNoEscStr[ctr] == LEADBYTE_HALFWIDTH)
{
//
// It's halfwidth Katakana.
//
ctr++;
if (CodePage == 50222)
{
if (wMode != MODE_HALFWIDTH_KATAKANA)
{
if (wModeSO != MODE_HALFWIDTH_KATAKANA)
{
if (cchMultiByte)
{
if (cchMBTemp < (cchMultiByte - 2))
{
*lpMBTempStr++ = ESCAPE;
*lpMBTempStr++ = '(';
*lpMBTempStr++ = 'J';
}
else
{
//
// Output buffer is too small.
//
SetLastError(ERROR_INSUFFICIENT_BUFFER);
return (0);
}
}
cchMBTemp += 3;
wModeSO = MODE_HALFWIDTH_KATAKANA;
}
if (cchMultiByte)
{
if (cchMBTemp < cchMultiByte)
{
*lpMBTempStr++ = SHIFT_OUT;
}
else
{
//
// Output buffer is too small.
//
SetLastError(ERROR_INSUFFICIENT_BUFFER);
return (0);
}
}
cchMBTemp++;
wMode = MODE_HALFWIDTH_KATAKANA;
}
}
else // CodePage = 50221
{
if (wMode != MODE_HALFWIDTH_KATAKANA)
{
if (cchMultiByte)
{
if (cchMBTemp < (cchMultiByte - 2))
{
*lpMBTempStr++ = ESCAPE;
*lpMBTempStr++ = '(';
*lpMBTempStr++ = 'I';
}
else
{
//
// Output buffer is too small.
//
SetLastError(ERROR_INSUFFICIENT_BUFFER);
return (0);
}
}
cchMBTemp += 3;
wMode = MODE_HALFWIDTH_KATAKANA;
}
}
if (cchMultiByte)
{
if (cchMBTemp < cchMultiByte)
{
*lpMBTempStr++ = lpMBNoEscStr[ctr] & 0x7F;
}
else
{
//
// Output buffer is too small.
//
SetLastError(ERROR_INSUFFICIENT_BUFFER);
return (0);
}
}
cchMBTemp++;
}
else if (IsDBCSLeadByteEx(20932, lpMBNoEscStr[ctr]))
{
//
// It's a double byte character.
//
if (lpMBNoEscStr[ctr + 1] & 0x80) // JIS X 0208
{
if (wMode != MODE_JIS_0208)
{
if (cchMultiByte)
{
if (cchMBTemp < (cchMultiByte - 2))
{
*lpMBTempStr++ = ESCAPE;
*lpMBTempStr++ = '$';
*lpMBTempStr++ = 'B';
}
else
{
//
// Output buffer is too small.
//
SetLastError(ERROR_INSUFFICIENT_BUFFER);
return (0);
}
}
cchMBTemp += 3;
wMode = MODE_JIS_0208;
}
}
else // JIS X 0212
{
if (wMode != MODE_JIS_0212)
{
if (cchMultiByte)
{
if (cchMBTemp < (cchMultiByte - 3))
{
*lpMBTempStr++ = ESCAPE;
*lpMBTempStr++ = '$';
*lpMBTempStr++ = '(';
*lpMBTempStr++ = 'D';
}
else
{
//
// Output buffer is too small.
//
SetLastError(ERROR_INSUFFICIENT_BUFFER);
return (0);
}
}
cchMBTemp += 4;
wMode = MODE_JIS_0212;
}
}
if (ctr >= (cchMBCount - 1))
{
//
// Missing trail byte.
//
break;
}
if (cchMultiByte)
{
if (cchMBTemp < (cchMultiByte - 1))
{
*lpMBTempStr++ = lpMBNoEscStr[ctr] & 0x7F;
*lpMBTempStr++ = lpMBNoEscStr[ctr + 1] & 0x7F;
}
else
{
//
// Output buffer is too small.
//
SetLastError(ERROR_INSUFFICIENT_BUFFER);
return (0);
}
}
ctr++;
cchMBTemp += 2;
}
else // Single byte Char
{
if (wMode != MODE_ASCII)
{
if (cchMultiByte)
{
if (cchMBTemp < (cchMultiByte - 2))
{
*lpMBTempStr++ = ESCAPE;
*lpMBTempStr++ = '(';
*lpMBTempStr++ = 'B';
}
else
{
//
// Output buffer is too small.
//
SetLastError(ERROR_INSUFFICIENT_BUFFER);
return (0);
}
}
cchMBTemp += 3;
wMode = MODE_ASCII;
}
if (cchMultiByte)
{
if (cchMBTemp < cchMultiByte)
{
*lpMBTempStr++ = lpMBNoEscStr[ctr];
}
else
{
//
// Output buffer is too small.
//
SetLastError(ERROR_INSUFFICIENT_BUFFER);
return (0);
}
}
cchMBTemp++;
}
}
if (cchMultiByte && (cchMBTemp > cchMultiByte))
{
//
// Output buffer is too small.
//
SetLastError(ERROR_INSUFFICIENT_BUFFER);
return (0);
}
return (cchMBTemp);
}
////////////////////////////////////////////////////////////////////////////
//
// ParseMB_CP5022_579
//
// KSC --> ISO-2022-KR (CP-50225)
// GB --> ISO-2022-CN (CP-50227)
// CNS --> ISO-2022-CN (CP-50229)
//
////////////////////////////////////////////////////////////////////////////
DWORD ParseMB_CP5022_579(
DWORD CodePage,
LPSTR lpMultiByteStr,
int cchMultiByte,
LPSTR lpMBNoEscStr,
int cchMBCount)
{
int ctr, cchMBTemp = 0;
WORD wMode, wModeSO, wModeCP;
char EscChar;
LPSTR lpMBTempStr;
lpMBTempStr = lpMultiByteStr;
wMode = wModeSO = MODE_ASCII;
wModeCP = (WORD)(CodePage % 10);
EscChar = ( wModeCP == MODE_KSC_5601 ? 'C' :
(wModeCP == MODE_GB_2312 ? 'A' : 'G'));
for (ctr = 0; ctr < cchMBCount; ctr++)
{
if (IsDBCSLeadByteEx(NLS_CODEPAGE(CodePage), lpMBNoEscStr[ctr]))
{
//
// It's a double byte character.
//
if (lpMBNoEscStr[ctr + 1] & 0x80) // KSC, GB or CNS-1
{
if (wModeSO != wModeCP)
{
if (cchMultiByte)
{
if (cchMBTemp < (cchMultiByte - 3))
{
*lpMBTempStr++ = ESCAPE;
*lpMBTempStr++ = '$';
*lpMBTempStr++ = ')';
*lpMBTempStr++ = EscChar;
}
else
{
//
// Output buffer is too small.
//
SetLastError(ERROR_INSUFFICIENT_BUFFER);
return (0);
}
}
cchMBTemp += 4;
wModeSO = wModeCP;
}
}
else
{
//
// lpMBNoEscStr[ctr + 1] & 0x80 == 0 indicates CNS-2
//
if (wModeSO != MODE_CNS_11643_2)
{
if (cchMultiByte)
{
if (cchMBTemp < (cchMultiByte - 3))
{
*lpMBTempStr++ = ESCAPE;
*lpMBTempStr++ = '$';
*lpMBTempStr++ = '*';
*lpMBTempStr++ = 'H';
}
else
{
//
// Output buffer is too small.
//
SetLastError(ERROR_INSUFFICIENT_BUFFER);
return (0);
}
}
cchMBTemp += 4;
wModeSO = MODE_CNS_11643_2;
}
}
if (wMode == MODE_ASCII)
{
if (cchMultiByte)
{
if (cchMBTemp < cchMultiByte)
{
*lpMBTempStr++ = SHIFT_OUT;
}
else
{
//
// Output buffer is too small.
//
SetLastError(ERROR_INSUFFICIENT_BUFFER);
return (0);
}
}
cchMBTemp++;
wMode = wModeSO;
}
if (ctr >= (cchMBCount - 1))
{
//
// Missing trail byte.
//
break;
}
if (cchMultiByte)
{
if (cchMBTemp < (cchMultiByte - 1))
{
*lpMBTempStr++ = lpMBNoEscStr[ctr] & 0x7F;
*lpMBTempStr++ = lpMBNoEscStr[ctr + 1] & 0x7F;
}
else
{
//
// Output buffer is too small.
//
SetLastError(ERROR_INSUFFICIENT_BUFFER);
return (0);
}
}
ctr++;
cchMBTemp += 2;
}
else
{
//
// It's a single byte character.
//
if (wMode != MODE_ASCII)
{
if (cchMultiByte)
{
if (cchMBTemp < cchMultiByte)
{
*lpMBTempStr++ = SHIFT_IN;
}
else
{
//
// Output buffer is too small.
//
SetLastError(ERROR_INSUFFICIENT_BUFFER);
return (0);
}
}
cchMBTemp++;
wMode = MODE_ASCII;
}
if (cchMultiByte)
{
if (cchMBTemp < cchMultiByte)
{
*lpMBTempStr++ = lpMBNoEscStr[ctr];
}
else
{
//
// Output buffer is too small.
//
SetLastError(ERROR_INSUFFICIENT_BUFFER);
return (0);
}
}
cchMBTemp++;
}
}
if (cchMultiByte && (cchMBTemp > cchMultiByte))
{
//
// Output buffer is too small.
//
SetLastError(ERROR_INSUFFICIENT_BUFFER);
return (0);
}
return (cchMBTemp);
}
////////////////////////////////////////////////////////////////////////////
//
// ParseMB_CP52936
//
// GB-2312 --> HZ (CP-52936)
//
////////////////////////////////////////////////////////////////////////////
DWORD ParseMB_CP52936(
LPSTR lpMultiByteStr,
int cchMultiByte,
LPSTR lpMBNoEscStr,
int cchMBCount)
{
int ctr, cchMBTemp = 0;
WORD wMode;
LPSTR lpMBTempStr;
lpMBTempStr = lpMultiByteStr;
wMode = MODE_ASCII;
for (ctr = 0; ctr < cchMBCount; ctr++)
{
if (lpMBNoEscStr[ctr] & 0x80)
{
if (wMode != MODE_HZ)
{
if (cchMultiByte)
{
if (cchMBTemp < (cchMultiByte - 1))
{
*lpMBTempStr++ = '~';
*lpMBTempStr++ = '{';
}
else
{
//
// Output buffer is too small.
//
SetLastError(ERROR_INSUFFICIENT_BUFFER);
return (0);
}
}
wMode = MODE_HZ;
cchMBTemp += 2;
}
if (ctr >= (cchMBCount - 1))
{
//
// Missing trail byte.
//
break;
}
if (cchMultiByte)
{
if (cchMBTemp < (cchMultiByte - 1))
{
*lpMBTempStr++ = lpMBNoEscStr[ctr] & 0x7F;
*lpMBTempStr++ = lpMBNoEscStr[ctr + 1] & 0x7F;
}
else
{
//
// Output buffer is too small.
//
SetLastError(ERROR_INSUFFICIENT_BUFFER);
return (0);
}
}
ctr++;
cchMBTemp += 2;
}
else
{
if (wMode != MODE_ASCII)
{
if (cchMultiByte)
{
if (cchMBTemp < (cchMultiByte - 1))
{
*lpMBTempStr++ = '~';
*lpMBTempStr++ = '}';
}
else
{
//
// Output buffer is too small.
//
SetLastError(ERROR_INSUFFICIENT_BUFFER);
return (0);
}
}
wMode = MODE_ASCII;
cchMBTemp += 2;
}
if ((BYTE)lpMBNoEscStr[ctr] == '~')
{
if (cchMultiByte)
{
if (cchMBTemp < cchMultiByte)
{
*lpMBTempStr++ = '~';
}
else
{
//
// Output buffer is too small.
//
SetLastError(ERROR_INSUFFICIENT_BUFFER);
return (0);
}
}
cchMBTemp++;
}
if (cchMultiByte)
{
if (cchMBTemp < cchMultiByte)
{
*lpMBTempStr++ = lpMBNoEscStr[ctr];
}
else
{
//
// Output buffer is too small.
//
SetLastError(ERROR_INSUFFICIENT_BUFFER);
return (0);
}
}
cchMBTemp++;
}
}
if (cchMultiByte && (cchMBTemp > cchMultiByte))
{
//
// Output buffer is too small.
//
SetLastError(ERROR_INSUFFICIENT_BUFFER);
return (0);
}
return (cchMBTemp);
}
////////////////////////////////////////////////////////////////////////////
//
// MBToWC_CP52936
//
// HZ (CP-52936) --> Unicode
//
////////////////////////////////////////////////////////////////////////////
DWORD MBToWC_CP52936(
LPSTR lpMultiByteStr,
int cchMultiByte,
LPWSTR lpWideCharStr,
int cchWideChar)
{
int ctr, cchMBTemp, cchWCCount;
WORD wMode;
LPSTR lpMBNoEscStr;
lpMBNoEscStr = (LPSTR)NLS_ALLOC_MEM(cchMultiByte * sizeof(WCHAR));
if (lpMBNoEscStr == NULL)
{
SetLastError(ERROR_OUTOFMEMORY);
return (0);
}
cchMBTemp = 0;
wMode = MODE_ASCII;
for (ctr = 0; ctr < cchMultiByte; ctr++)
{
if (((BYTE)lpMultiByteStr[ctr] == '~') && (ctr < (cchMultiByte - 1)))
{
if ((BYTE)lpMultiByteStr[ctr + 1] == '{')
{
wMode = MODE_HZ;
ctr += 2;
}
else if ((BYTE)lpMultiByteStr[ctr + 1] == '}')
{
wMode = MODE_ASCII;
ctr += 2;
}
else if ((BYTE)lpMultiByteStr[ctr + 1] == '~')
{
ctr++;
}
else if (((BYTE)lpMultiByteStr[ctr + 1] == '\\') &&
(ctr < (cchMultiByte - 2)) &&
(((BYTE)lpMultiByteStr[ctr + 2] == 'n') ||
((BYTE)lpMultiByteStr[ctr + 2] == 'N' )))
{
ctr += 2;
}
}
if (wMode == MODE_HZ)
{
if (ctr < (cchMultiByte - 1))
{
lpMBNoEscStr[cchMBTemp++] = lpMultiByteStr[ctr++] | 0x80;
lpMBNoEscStr[cchMBTemp++] = lpMultiByteStr[ctr] | 0x80;
}
}
else
{
if (ctr < cchMultiByte)
{
lpMBNoEscStr[cchMBTemp++] = lpMultiByteStr[ctr];
}
}
}
cchWCCount = MultiByteToWideChar ( 20936,
0,
lpMBNoEscStr,
cchMBTemp,
lpWideCharStr,
cchWideChar );
NLS_FREE_MEM(lpMBNoEscStr);
return (cchWCCount);
}