mirror of
https://github.com/dlang/phobos.git
synced 2025-04-29 14:40:30 +03:00
122 lines
2.6 KiB
D
122 lines
2.6 KiB
D
/* Public Domain */
|
|
|
|
/**
|
|
* Support UTF-8 on Windows 95, 98 and ME systems.
|
|
* Macros:
|
|
* WIKI = Phobos/StdWindowsCharset
|
|
*/
|
|
|
|
module std.windows.charset;
|
|
|
|
private import std.c.windows.windows;
|
|
private import std.windows.syserror;
|
|
private import std.utf;
|
|
private import std.string;
|
|
|
|
/**
|
|
* If non-zero, the application should use the W versions of Windows API
|
|
* functions and std.utf.toUTF16z and toUTF8, rather than toMBSz and
|
|
* fromMBSz.
|
|
*/
|
|
int useWfuncs = 1;
|
|
|
|
static this()
|
|
{
|
|
// Win 95, 98, ME do not implement the W functions
|
|
// TODO: detect MSLU?
|
|
useWfuncs = (GetVersion() < 0x80000000);
|
|
}
|
|
|
|
|
|
/******************************************
|
|
* Converts the UTF-8 string s into a null-terminated string in a Windows
|
|
* 8-bit character set.
|
|
*
|
|
* Params:
|
|
* s = UTF-8 string to convert.
|
|
* codePage = is the number of the target codepage, or
|
|
* 0 - ANSI,
|
|
* 1 - OEM,
|
|
* 2 - Mac
|
|
*
|
|
* Authors:
|
|
* yaneurao, Walter Bright, Stewart Gordon
|
|
*/
|
|
|
|
char* toMBSz(char[] s, uint codePage = 0)
|
|
{
|
|
// Only need to do this if any chars have the high bit set
|
|
foreach (char c; s)
|
|
{
|
|
if (c >= 0x80)
|
|
{
|
|
char[] result;
|
|
int readLen;
|
|
wchar* ws = std.utf.toUTF16z(s);
|
|
result.length = WideCharToMultiByte(codePage, 0, ws, -1, null, 0,
|
|
null, null);
|
|
|
|
if (result.length)
|
|
{
|
|
readLen = WideCharToMultiByte(codePage, 0, ws, -1, result.ptr,
|
|
result.length, null, null);
|
|
}
|
|
|
|
if (!readLen || readLen != result.length)
|
|
{
|
|
throw new Exception("Couldn't convert string: " ~
|
|
sysErrorString(GetLastError()));
|
|
}
|
|
|
|
return result;
|
|
}
|
|
}
|
|
return std.string.toStringz(s);
|
|
}
|
|
|
|
|
|
/**********************************************
|
|
* Converts the null-terminated string s from a Windows 8-bit character set
|
|
* into a UTF-8 char array.
|
|
*
|
|
* Params:
|
|
* s = UTF-8 string to convert.
|
|
* codePage = is the number of the source codepage, or
|
|
* 0 - ANSI,
|
|
* 1 - OEM,
|
|
* 2 - Mac
|
|
* Authors: Stewart Gordon, Walter Bright
|
|
*/
|
|
|
|
char[] fromMBSz(char* s, int codePage = 0)
|
|
{
|
|
char* c;
|
|
|
|
for (c = s; *c != 0; c++)
|
|
{
|
|
if (*c >= 0x80)
|
|
{
|
|
wchar[] result;
|
|
int readLen;
|
|
|
|
result.length = MultiByteToWideChar(codePage, 0, s, -1, null, 0);
|
|
|
|
if (result.length)
|
|
{
|
|
readLen = MultiByteToWideChar(codePage, 0, s, -1, result.ptr,
|
|
result.length);
|
|
}
|
|
|
|
if (!readLen || readLen != result.length)
|
|
{
|
|
throw new Exception("Couldn't convert string: " ~
|
|
sysErrorString(GetLastError()));
|
|
}
|
|
|
|
return std.utf.toUTF8(result[0 .. result.length-1]); // omit trailing null
|
|
}
|
|
}
|
|
return s[0 .. c-s]; // string is ASCII, no conversion necessary
|
|
}
|
|
|
|
|