phobos/std/windows/charset.d
2007-09-10 05:11:52 +00:00

122 lines
2.6 KiB
D

/* Public Domain */
/**
* Support UTF-8 on Windows 95, 98 and ME systems.
* Macros:
* WIKI = Phobos/StdWindowsCharset
*/
module std.windows.charset;
private import std.c.windows.windows;
private import std.windows.syserror;
private import std.utf;
private import std.string;
/**
 * Selects which family of Windows API functions the application should call.
 *
 * If non-zero, the application should use the W versions of Windows API
 * functions and std.utf.toUTF16z and toUTF8, rather than toMBSz and
 * fromMBSz.
 *
 * Initialized to 1; the module constructor in this file reassigns it at
 * startup from the value returned by GetVersion().
 */
int useWfuncs = 1;
static this()
{
    // The W functions are not implemented on Win 95, 98 and ME, so they are
    // only enabled when the top bit of GetVersion() is clear.
    // TODO: detect MSLU?
    useWfuncs = ((GetVersion() & 0x80000000) == 0);
}
/******************************************
 * Converts the UTF-8 string s into a null-terminated string in a Windows
 * 8-bit character set.
 *
 * Params:
 *      s = UTF-8 string to convert.
 *      codePage = is the number of the target codepage, or
 *                   0 - ANSI,
 *                   1 - OEM,
 *                   2 - Mac
 *
 * Returns:
 *      Pointer to the null-terminated converted string. If no char of s has
 *      the high bit set, no code page conversion is performed and the result
 *      is that of std.string.toStringz(s).
 *
 * Throws:
 *      Exception, with the system error text appended, if
 *      WideCharToMultiByte fails or writes an unexpected number of bytes.
 *
 * Authors:
 *      yaneurao, Walter Bright, Stewart Gordon
 */
char* toMBSz(char[] s, uint codePage = 0)
{
    // Only need to do this if any chars have the high bit set
    foreach (char c; s)
    {
        if (c >= 0x80)
        {
            wchar* ws = std.utf.toUTF16z(s);

            // First call (null buffer, size 0) only reports how many bytes
            // are required. The source length of -1 makes the API treat ws
            // as null-terminated, so the count includes the terminator.
            int needed = WideCharToMultiByte(codePage, 0, ws, -1, null, 0,
                                             null, null);

            char[] result;
            int written = 0;
            if (needed > 0)
            {
                result.length = needed;
                written = WideCharToMultiByte(codePage, 0, ws, -1, result.ptr,
                                              needed, null, null);
            }

            if (!written || written != needed)
            {
                throw new Exception("Couldn't convert string: " ~
                                    sysErrorString(GetLastError()));
            }

            // Return the raw pointer explicitly instead of relying on an
            // implicit char[] -> char* conversion.
            return result.ptr;
        }
    }
    return std.string.toStringz(s);
}
/**********************************************
 * Converts the null-terminated string s from a Windows 8-bit character set
 * into a UTF-8 char array.
 *
 * Params:
 *      s = null-terminated string in a Windows 8-bit character set.
 *      codePage = is the number of the source codepage, or
 *                   0 - ANSI,
 *                   1 - OEM,
 *                   2 - Mac
 *
 * Returns:
 *      The text of s as UTF-8, without the terminating null. If no char of
 *      s has the high bit set, the result is a slice of s itself rather
 *      than a new array.
 *
 * Throws:
 *      Exception, with the system error text appended, if
 *      MultiByteToWideChar fails or writes an unexpected number of chars.
 *
 * Authors: Stewart Gordon, Walter Bright
 */
char[] fromMBSz(char* s, int codePage = 0)
{
    char* c;

    for (c = s; *c != 0; c++)
    {
        if (*c >= 0x80)
        {
            // First call (null buffer, size 0) only reports how many wchars
            // are required. The source length of -1 makes the API treat s
            // as null-terminated, so the count includes the terminator.
            int needed = MultiByteToWideChar(codePage, 0, s, -1, null, 0);

            wchar[] result;
            int written = 0;
            if (needed > 0)
            {
                result.length = needed;
                written = MultiByteToWideChar(codePage, 0, s, -1, result.ptr,
                                              needed);
            }

            if (!written || written != needed)
            {
                throw new Exception("Couldn't convert string: " ~
                                    sysErrorString(GetLastError()));
            }

            return std.utf.toUTF8(result[0 .. result.length-1]); // omit trailing null
        }
    }
    return s[0 .. c-s]; // string is ASCII, no conversion necessary
}