2000-06-10 06:42:33 +02:00
|
|
|
/*
|
|
|
|
* Code page functions
|
|
|
|
*
|
|
|
|
* Copyright 2000 Alexandre Julliard
|
|
|
|
*/
|
|
|
|
|
|
|
|
#include <assert.h>
|
|
|
|
#include <stdio.h>
|
2000-07-12 00:08:43 +02:00
|
|
|
#include <stdlib.h>
|
2000-06-10 06:42:33 +02:00
|
|
|
|
|
|
|
#include "winbase.h"
|
|
|
|
#include "winerror.h"
|
|
|
|
#include "winnls.h"
|
|
|
|
#include "wine/unicode.h"
|
|
|
|
#include "debugtools.h"
|
|
|
|
|
|
|
|
DEFAULT_DEBUG_CHANNEL(string);
|
|
|
|
|
|
|
|
/* current code pages */
|
|
|
|
static const union cptable *ansi_cptable;
|
|
|
|
static const union cptable *oem_cptable;
|
|
|
|
static const union cptable *mac_cptable;
|
|
|
|
|
2000-07-12 00:08:43 +02:00
|
|
|
/* retrieve a code page table from the locale info */
|
|
|
|
static const union cptable *get_locale_cp( LCID lcid, LCTYPE type )
|
|
|
|
{
|
|
|
|
const union cptable *table = NULL;
|
|
|
|
char buf[32];
|
|
|
|
|
|
|
|
if (GetLocaleInfoA( lcid, type, buf, sizeof(buf) )) table = cp_get_table( atoi(buf) );
|
|
|
|
return table;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* setup default codepage info before we can get at the locale stuff */
|
|
|
|
static void init_codepages(void)
|
|
|
|
{
|
|
|
|
ansi_cptable = cp_get_table( 1252 );
|
|
|
|
oem_cptable = cp_get_table( 437 );
|
|
|
|
mac_cptable = cp_get_table( 10000 );
|
|
|
|
assert( ansi_cptable );
|
|
|
|
assert( oem_cptable );
|
|
|
|
assert( mac_cptable );
|
|
|
|
}
|
2000-06-10 06:42:33 +02:00
|
|
|
|
|
|
|
/* find the table for a given codepage, handling CP_ACP etc. pseudo-codepages */
|
|
|
|
static const union cptable *get_codepage_table( unsigned int codepage )
|
|
|
|
{
|
|
|
|
const union cptable *ret = NULL;
|
|
|
|
|
2000-07-12 00:08:43 +02:00
|
|
|
if (!ansi_cptable) init_codepages();
|
2000-06-10 06:42:33 +02:00
|
|
|
|
|
|
|
switch(codepage)
|
|
|
|
{
|
|
|
|
case CP_ACP: return ansi_cptable;
|
|
|
|
case CP_OEMCP: return oem_cptable;
|
|
|
|
case CP_MACCP: return mac_cptable;
|
2000-07-12 00:08:43 +02:00
|
|
|
case CP_THREAD_ACP: return get_locale_cp( GetThreadLocale(), LOCALE_IDEFAULTANSICODEPAGE );
|
2000-06-10 06:42:33 +02:00
|
|
|
case CP_UTF7:
|
|
|
|
case CP_UTF8:
|
|
|
|
break;
|
|
|
|
default:
|
2000-07-12 00:08:43 +02:00
|
|
|
if (codepage == ansi_cptable->info.codepage) return ansi_cptable;
|
|
|
|
if (codepage == oem_cptable->info.codepage) return oem_cptable;
|
|
|
|
if (codepage == mac_cptable->info.codepage) return mac_cptable;
|
2000-06-10 06:42:33 +02:00
|
|
|
ret = cp_get_table( codepage );
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
return ret;
|
|
|
|
}
|
|
|
|
|
2000-07-12 00:08:43 +02:00
|
|
|
/* initialize default code pages from locale info */
|
|
|
|
/* FIXME: should be done in init_codepages, but it can't right now */
|
|
|
|
/* since it needs KERNEL32 to be loaded for the locale info. */
|
|
|
|
void CODEPAGE_Init(void)
|
|
|
|
{
|
|
|
|
const union cptable *table;
|
|
|
|
LCID lcid = GetUserDefaultLCID();
|
|
|
|
|
|
|
|
if (!ansi_cptable) init_codepages(); /* just in case */
|
|
|
|
|
|
|
|
if ((table = get_locale_cp( lcid, LOCALE_IDEFAULTANSICODEPAGE ))) ansi_cptable = table;
|
|
|
|
if ((table = get_locale_cp( lcid, LOCALE_IDEFAULTMACCODEPAGE ))) mac_cptable = table;
|
|
|
|
if ((table = get_locale_cp( lcid, LOCALE_IDEFAULTCODEPAGE ))) oem_cptable = table;
|
|
|
|
|
|
|
|
TRACE( "ansi=%03d oem=%03d mac=%03d\n", ansi_cptable->info.codepage,
|
|
|
|
oem_cptable->info.codepage, mac_cptable->info.codepage );
|
|
|
|
}
|
|
|
|
|
2000-06-10 06:42:33 +02:00
|
|
|
/******************************************************************************
|
|
|
|
* GetACP (KERNEL32)
|
|
|
|
*
|
|
|
|
* RETURNS
|
|
|
|
* Current ANSI code-page identifier, default if no current defined
|
|
|
|
*/
|
|
|
|
UINT WINAPI GetACP(void)
|
|
|
|
{
|
2000-07-12 00:08:43 +02:00
|
|
|
if (!ansi_cptable) init_codepages();
|
|
|
|
return ansi_cptable->info.codepage;
|
2000-06-10 06:42:33 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
/***********************************************************************
|
|
|
|
* GetOEMCP (KERNEL32)
|
|
|
|
*/
|
|
|
|
UINT WINAPI GetOEMCP(void)
|
|
|
|
{
|
2000-07-12 00:08:43 +02:00
|
|
|
if (!oem_cptable) init_codepages();
|
|
|
|
return oem_cptable->info.codepage;
|
2000-06-10 06:42:33 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
/***********************************************************************
|
|
|
|
* IsValidCodePage (KERNEL32)
|
|
|
|
*/
|
|
|
|
BOOL WINAPI IsValidCodePage( UINT codepage )
|
|
|
|
{
|
|
|
|
return cp_get_table( codepage ) != NULL;
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
/***********************************************************************
|
|
|
|
* IsDBCSLeadByteEx (KERNEL32)
|
|
|
|
*/
|
|
|
|
BOOL WINAPI IsDBCSLeadByteEx( UINT codepage, BYTE testchar )
|
|
|
|
{
|
|
|
|
const union cptable *table = get_codepage_table( codepage );
|
|
|
|
return table && is_dbcs_leadbyte( table, testchar );
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
/***********************************************************************
|
|
|
|
* IsDBCSLeadByte (KERNEL32)
|
|
|
|
*/
|
|
|
|
BOOL WINAPI IsDBCSLeadByte( BYTE testchar )
|
|
|
|
{
|
2000-07-12 00:08:43 +02:00
|
|
|
if (!ansi_cptable) init_codepages();
|
2000-06-10 06:42:33 +02:00
|
|
|
return is_dbcs_leadbyte( ansi_cptable, testchar );
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
/***********************************************************************
|
|
|
|
* GetCPInfo (KERNEL32)
|
|
|
|
*/
|
|
|
|
BOOL WINAPI GetCPInfo( UINT codepage, LPCPINFO cpinfo )
|
|
|
|
{
|
|
|
|
const union cptable *table = get_codepage_table( codepage );
|
|
|
|
|
|
|
|
if (!table)
|
|
|
|
{
|
|
|
|
SetLastError( ERROR_INVALID_PARAMETER );
|
|
|
|
return FALSE;
|
|
|
|
}
|
|
|
|
if (table->info.def_char & 0xff00)
|
|
|
|
{
|
|
|
|
cpinfo->DefaultChar[0] = table->info.def_char & 0xff00;
|
|
|
|
cpinfo->DefaultChar[1] = table->info.def_char & 0x00ff;
|
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
|
|
|
cpinfo->DefaultChar[0] = table->info.def_char & 0xff;
|
|
|
|
cpinfo->DefaultChar[1] = 0;
|
|
|
|
}
|
|
|
|
if ((cpinfo->MaxCharSize = table->info.char_size) == 2)
|
|
|
|
memcpy( cpinfo->LeadByte, table->dbcs.lead_bytes, sizeof(cpinfo->LeadByte) );
|
|
|
|
else
|
|
|
|
cpinfo->LeadByte[0] = cpinfo->LeadByte[1] = 0;
|
|
|
|
|
|
|
|
return TRUE;
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
/***********************************************************************
|
|
|
|
* EnumSystemCodePagesA (KERNEL32)
|
|
|
|
*/
|
|
|
|
BOOL WINAPI EnumSystemCodePagesA( CODEPAGE_ENUMPROCA lpfnCodePageEnum, DWORD flags )
|
|
|
|
{
|
|
|
|
const union cptable *table;
|
|
|
|
char buffer[10];
|
|
|
|
int index = 0;
|
|
|
|
|
|
|
|
for (;;)
|
|
|
|
{
|
|
|
|
if (!(table = cp_enum_table( index++ ))) break;
|
|
|
|
sprintf( buffer, "%d", table->info.codepage );
|
|
|
|
if (!lpfnCodePageEnum( buffer )) break;
|
|
|
|
}
|
|
|
|
return TRUE;
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
/***********************************************************************
|
|
|
|
* EnumSystemCodePagesW (KERNEL32)
|
|
|
|
*/
|
|
|
|
BOOL WINAPI EnumSystemCodePagesW( CODEPAGE_ENUMPROCW lpfnCodePageEnum, DWORD flags )
|
|
|
|
{
|
|
|
|
const union cptable *table;
|
|
|
|
WCHAR buffer[10], *p;
|
|
|
|
int page, index = 0;
|
|
|
|
|
|
|
|
for (;;)
|
|
|
|
{
|
|
|
|
if (!(table = cp_enum_table( index++ ))) break;
|
|
|
|
p = buffer + sizeof(buffer)/sizeof(WCHAR);
|
|
|
|
*--p = 0;
|
|
|
|
page = table->info.codepage;
|
|
|
|
do
|
|
|
|
{
|
|
|
|
*--p = '0' + (page % 10);
|
|
|
|
page /= 10;
|
|
|
|
} while( page );
|
|
|
|
if (!lpfnCodePageEnum( p )) break;
|
|
|
|
}
|
|
|
|
return TRUE;
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
/***********************************************************************
|
|
|
|
* MultiByteToWideChar (KERNEL32)
|
|
|
|
*
|
|
|
|
* PARAMS
|
|
|
|
* page [in] Codepage character set to convert from
|
|
|
|
* flags [in] Character mapping flags
|
|
|
|
* src [in] Source string buffer
|
|
|
|
* srclen [in] Length of source string buffer
|
|
|
|
* dst [in] Destination buffer
|
|
|
|
* dstlen [in] Length of destination buffer
|
|
|
|
*
|
|
|
|
* NOTES
|
|
|
|
* The returned length includes the null terminator character.
|
|
|
|
*
|
|
|
|
* RETURNS
|
|
|
|
* Success: If dstlen > 0, number of characters written to destination
|
|
|
|
* buffer. If dstlen == 0, number of characters needed to do
|
|
|
|
* conversion.
|
|
|
|
* Failure: 0. Occurs if not enough space is available.
|
|
|
|
*
|
|
|
|
* ERRORS
|
|
|
|
* ERROR_INSUFFICIENT_BUFFER
|
|
|
|
* ERROR_INVALID_PARAMETER
|
|
|
|
* ERROR_NO_UNICODE_TRANSLATION
|
|
|
|
*
|
|
|
|
*/
|
|
|
|
INT WINAPI MultiByteToWideChar( UINT page, DWORD flags, LPCSTR src, INT srclen,
|
|
|
|
LPWSTR dst, INT dstlen )
|
|
|
|
{
|
|
|
|
const union cptable *table;
|
|
|
|
int ret;
|
|
|
|
|
2000-07-29 01:58:48 +02:00
|
|
|
if (!src || (!dst && dstlen))
|
|
|
|
{
|
|
|
|
SetLastError( ERROR_INVALID_PARAMETER );
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
2000-06-10 06:42:33 +02:00
|
|
|
if (srclen == -1) srclen = strlen(src) + 1;
|
|
|
|
|
2000-08-11 02:44:33 +02:00
|
|
|
if (flags & MB_COMPOSITE) FIXME("MB_COMPOSITE not supported\n");
|
|
|
|
if (flags & MB_USEGLYPHCHARS) FIXME("MB_USEGLYPHCHARS not supported\n");
|
|
|
|
|
|
|
|
switch(page)
|
2000-06-10 06:42:33 +02:00
|
|
|
{
|
2000-08-11 02:44:33 +02:00
|
|
|
case CP_UTF7:
|
2000-06-10 06:42:33 +02:00
|
|
|
FIXME("UTF not supported\n");
|
|
|
|
SetLastError( ERROR_CALL_NOT_IMPLEMENTED );
|
|
|
|
return 0;
|
2000-08-11 02:44:33 +02:00
|
|
|
case CP_UTF8:
|
|
|
|
ret = utf8_mbstowcs( flags, src, srclen, dst, dstlen );
|
|
|
|
break;
|
|
|
|
default:
|
|
|
|
if (!(table = get_codepage_table( page )))
|
|
|
|
{
|
|
|
|
SetLastError( ERROR_INVALID_PARAMETER );
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
ret = cp_mbstowcs( table, flags, src, srclen, dst, dstlen );
|
|
|
|
break;
|
2000-06-10 06:42:33 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
if (ret < 0)
|
|
|
|
{
|
|
|
|
switch(ret)
|
|
|
|
{
|
|
|
|
case -1: SetLastError( ERROR_INSUFFICIENT_BUFFER ); break;
|
|
|
|
case -2: SetLastError( ERROR_NO_UNICODE_TRANSLATION ); break;
|
|
|
|
}
|
|
|
|
ret = 0;
|
|
|
|
}
|
|
|
|
return ret;
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
/***********************************************************************
|
|
|
|
* WideCharToMultiByte (KERNEL32)
|
|
|
|
*
|
|
|
|
* PARAMS
|
|
|
|
* page [in] Codepage character set to convert to
|
|
|
|
* flags [in] Character mapping flags
|
|
|
|
* src [in] Source string buffer
|
|
|
|
* srclen [in] Length of source string buffer
|
|
|
|
* dst [in] Destination buffer
|
|
|
|
* dstlen [in] Length of destination buffer
|
|
|
|
* defchar [in] Default character to use for conversion if no exact
|
|
|
|
* conversion can be made
|
|
|
|
* used [out] Set if default character was used in the conversion
|
|
|
|
*
|
|
|
|
* NOTES
|
|
|
|
* The returned length includes the null terminator character.
|
|
|
|
*
|
|
|
|
* RETURNS
|
|
|
|
* Success: If dstlen > 0, number of characters written to destination
|
|
|
|
* buffer. If dstlen == 0, number of characters needed to do
|
|
|
|
* conversion.
|
|
|
|
* Failure: 0. Occurs if not enough space is available.
|
|
|
|
*
|
|
|
|
* ERRORS
|
|
|
|
* ERROR_INSUFFICIENT_BUFFER
|
|
|
|
* ERROR_INVALID_PARAMETER
|
|
|
|
*/
|
|
|
|
INT WINAPI WideCharToMultiByte( UINT page, DWORD flags, LPCWSTR src, INT srclen,
|
|
|
|
LPSTR dst, INT dstlen, LPCSTR defchar, BOOL *used )
|
|
|
|
{
|
|
|
|
const union cptable *table;
|
|
|
|
int ret, used_tmp;
|
|
|
|
|
2000-07-29 01:58:48 +02:00
|
|
|
if (!src || (!dst && dstlen))
|
|
|
|
{
|
|
|
|
SetLastError( ERROR_INVALID_PARAMETER );
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
2000-06-10 06:42:33 +02:00
|
|
|
if (srclen == -1) srclen = strlenW(src) + 1;
|
|
|
|
|
2000-08-11 02:44:33 +02:00
|
|
|
/* if (flags & WC_COMPOSITECHECK) FIXME( "WC_COMPOSITECHECK (%lx) not supported\n", flags );*/
|
2000-06-10 06:42:33 +02:00
|
|
|
|
2000-08-11 02:44:33 +02:00
|
|
|
switch(page)
|
2000-06-10 06:42:33 +02:00
|
|
|
{
|
2000-08-11 02:44:33 +02:00
|
|
|
case CP_UTF7:
|
|
|
|
FIXME("UTF-7 not supported\n");
|
|
|
|
SetLastError( ERROR_CALL_NOT_IMPLEMENTED );
|
2000-06-10 06:42:33 +02:00
|
|
|
return 0;
|
2000-08-11 02:44:33 +02:00
|
|
|
case CP_UTF8:
|
|
|
|
ret = utf8_wcstombs( src, srclen, dst, dstlen );
|
|
|
|
break;
|
|
|
|
default:
|
|
|
|
if (!(table = get_codepage_table( page )))
|
|
|
|
{
|
|
|
|
SetLastError( ERROR_INVALID_PARAMETER );
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
ret = cp_wcstombs( table, flags, src, srclen, dst, dstlen,
|
|
|
|
defchar, used ? &used_tmp : NULL );
|
|
|
|
if (used) *used = used_tmp;
|
|
|
|
break;
|
2000-06-10 06:42:33 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
if (ret == -1)
|
|
|
|
{
|
|
|
|
SetLastError( ERROR_INSUFFICIENT_BUFFER );
|
|
|
|
ret = 0;
|
|
|
|
}
|
|
|
|
return ret;
|
|
|
|
}
|
2000-08-11 22:53:40 +02:00
|
|
|
|
|
|
|
|
|
|
|
/******************************************************************************
|
|
|
|
* GetStringTypeW (KERNEL32)
|
|
|
|
*
|
|
|
|
*/
|
|
|
|
BOOL WINAPI GetStringTypeW( DWORD type, LPCWSTR src, INT count, LPWORD chartype )
|
|
|
|
{
|
|
|
|
if (count == -1) count = strlenW(src) + 1;
|
|
|
|
switch(type)
|
|
|
|
{
|
|
|
|
case CT_CTYPE1:
|
|
|
|
while (count--) *chartype++ = get_char_typeW( *src++ ) & 0xfff;
|
|
|
|
break;
|
|
|
|
case CT_CTYPE2:
|
|
|
|
while (count--) *chartype++ = get_char_typeW( *src++ ) >> 12;
|
|
|
|
break;
|
|
|
|
case CT_CTYPE3:
|
|
|
|
FIXME("CT_CTYPE3 not supported.\n");
|
|
|
|
default:
|
|
|
|
SetLastError( ERROR_INVALID_PARAMETER );
|
|
|
|
return FALSE;
|
|
|
|
}
|
|
|
|
return TRUE;
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
/******************************************************************************
|
|
|
|
* GetStringTypeExW (KERNEL32)
|
|
|
|
*/
|
|
|
|
BOOL WINAPI GetStringTypeExW( LCID locale, DWORD type, LPCWSTR src, INT count, LPWORD chartype )
|
|
|
|
{
|
|
|
|
/* locale is ignored for Unicode */
|
|
|
|
return GetStringTypeW( type, src, count, chartype );
|
|
|
|
}
|