mirror of
https://github.com/reactos/reactos.git
synced 2025-01-03 21:09:19 +00:00
17e9dcc922
- Fix the garbled characters (a.k.a. mojibake) in some Japanese text files. - weight will remain 3 unless IS_TEXT_UNICODE_DBCS_LEADBYTE flag is set. - Strengthen advapi32_apitest IsTextUnicode testcase. CORE-19016
201 lines
9.3 KiB
C
201 lines
9.3 KiB
C
/*
|
|
* PROJECT: ReactOS api tests
|
|
* LICENSE: GPLv2+ - See COPYING in the top level directory
|
|
* PURPOSE: Tests for (Rtl)IsTextUnicode.
|
|
* PROGRAMMERS: Hermes Belusca-Maito
|
|
* Dmitry Chapyshev
|
|
* Katayama Hirofumi MZ
|
|
*/
|
|
|
|
#include "precomp.h"
|
|
|
|
#include <stdio.h>
|
|
|
|
PVOID LoadCodePageData(ULONG Code)
|
|
{
|
|
char filename[MAX_PATH], sysdir[MAX_PATH];
|
|
HANDLE hFile;
|
|
PVOID Data = NULL;
|
|
GetSystemDirectoryA(sysdir, MAX_PATH);
|
|
|
|
if (Code != -1)
|
|
StringCbPrintfA(filename, sizeof(filename), "%s\\c_%lu.nls", sysdir, Code);
|
|
else
|
|
StringCbPrintfA(filename, sizeof(filename), "%s\\l_intl.nls", sysdir);
|
|
|
|
hFile = CreateFile(filename, GENERIC_READ, FILE_SHARE_READ, NULL, OPEN_EXISTING, 0, NULL);
|
|
if (hFile != INVALID_HANDLE_VALUE)
|
|
{
|
|
DWORD dwRead;
|
|
DWORD dwFileSize = GetFileSize(hFile, NULL);
|
|
Data = malloc(dwFileSize);
|
|
ReadFile(hFile, Data, dwFileSize, &dwRead, NULL);
|
|
CloseHandle(hFile);
|
|
}
|
|
return Data;
|
|
}
|
|
|
|
/* https://www.microsoft.com/resources/msdn/goglobal/default.mspx */
|
|
void SetupLocale(ULONG AnsiCode, ULONG OemCode, ULONG Unicode)
|
|
{
|
|
NLSTABLEINFO NlsTable;
|
|
PVOID AnsiCodePageData;
|
|
PVOID OemCodePageData;
|
|
PVOID UnicodeCaseTableData;
|
|
|
|
AnsiCodePageData = LoadCodePageData(AnsiCode);
|
|
OemCodePageData = LoadCodePageData(OemCode);
|
|
UnicodeCaseTableData = LoadCodePageData(Unicode);
|
|
|
|
RtlInitNlsTables(AnsiCodePageData, OemCodePageData, UnicodeCaseTableData, &NlsTable);
|
|
RtlResetRtlTranslations(&NlsTable);
|
|
/* Do NOT free the buffers here, they are directly used!
|
|
Yes, we leak the old buffers, but this is a test anyway... */
|
|
|
|
}
|
|
|
|
START_TEST(IsTextUnicode)
|
|
{
|
|
#define INVALID_FLAG 0xFFFFFFFF
|
|
|
|
#define NEW_TEST(Buffer, Flags, ResultFlags, Success) \
|
|
{ __LINE__, (PVOID)(Buffer), sizeof((Buffer)), (Flags), (ResultFlags), (Success) }
|
|
|
|
static struct
|
|
{
|
|
INT lineno;
|
|
|
|
/* Input */
|
|
PVOID Buffer;
|
|
INT Size;
|
|
INT Flags;
|
|
|
|
/* Output */
|
|
INT ResultFlags;
|
|
BOOL Success;
|
|
} Tests[] =
|
|
{
|
|
/* ANSI string */
|
|
NEW_TEST("ANSI string", IS_TEXT_UNICODE_ASCII16, 0, FALSE),
|
|
NEW_TEST("ANSI string", IS_TEXT_UNICODE_STATISTICS, 0, FALSE),
|
|
NEW_TEST("ANSI string", INVALID_FLAG, 0, FALSE),
|
|
|
|
/* UNICODE strings */
|
|
NEW_TEST(L"a", IS_TEXT_UNICODE_ASCII16, IS_TEXT_UNICODE_ASCII16, TRUE),
|
|
NEW_TEST(L"a", IS_TEXT_UNICODE_UNICODE_MASK, IS_TEXT_UNICODE_STATISTICS | IS_TEXT_UNICODE_ASCII16, TRUE),
|
|
NEW_TEST(L"a", IS_TEXT_UNICODE_STATISTICS, IS_TEXT_UNICODE_STATISTICS, TRUE),
|
|
NEW_TEST(L"a", INVALID_FLAG, 0, TRUE),
|
|
|
|
NEW_TEST(L"UNICODE String 0", IS_TEXT_UNICODE_ASCII16, 0, FALSE),
|
|
NEW_TEST(L"UNICODE String 0", IS_TEXT_UNICODE_UNICODE_MASK, IS_TEXT_UNICODE_CONTROLS | IS_TEXT_UNICODE_STATISTICS, TRUE),
|
|
NEW_TEST(L"UNICODE String 0", IS_TEXT_UNICODE_STATISTICS, IS_TEXT_UNICODE_STATISTICS, TRUE),
|
|
NEW_TEST(L"UNICODE String 0", INVALID_FLAG, 0, TRUE),
|
|
|
|
NEW_TEST(L"\xFEFF" L"UNICODE String 1", IS_TEXT_UNICODE_ASCII16, 0, FALSE),
|
|
NEW_TEST(L"\xFEFF" L"UNICODE String 1", IS_TEXT_UNICODE_UNICODE_MASK, IS_TEXT_UNICODE_SIGNATURE | IS_TEXT_UNICODE_CONTROLS, TRUE),
|
|
NEW_TEST(L"\xFEFF" L"UNICODE String 1", IS_TEXT_UNICODE_STATISTICS, 0, FALSE),
|
|
NEW_TEST(L"\xFEFF" L"UNICODE String 1", INVALID_FLAG, 0, TRUE),
|
|
|
|
NEW_TEST(L"\xFFFE" L"UNICODE String 2", IS_TEXT_UNICODE_ASCII16, 0, FALSE),
|
|
NEW_TEST(L"\xFFFE" L"UNICODE String 2", IS_TEXT_UNICODE_UNICODE_MASK, IS_TEXT_UNICODE_CONTROLS, TRUE),
|
|
NEW_TEST(L"\xFFFE" L"UNICODE String 2", IS_TEXT_UNICODE_STATISTICS, 0, FALSE),
|
|
NEW_TEST(L"\xFFFE" L"UNICODE String 2", INVALID_FLAG, 0, FALSE),
|
|
|
|
NEW_TEST(L"UNICODE String 3 Привет!", IS_TEXT_UNICODE_ASCII16, 0, FALSE),
|
|
NEW_TEST(L"UNICODE String 3 Привет!", IS_TEXT_UNICODE_UNICODE_MASK, IS_TEXT_UNICODE_CONTROLS | IS_TEXT_UNICODE_STATISTICS, TRUE),
|
|
NEW_TEST(L"UNICODE String 3 Привет!", IS_TEXT_UNICODE_STATISTICS, IS_TEXT_UNICODE_STATISTICS, TRUE),
|
|
NEW_TEST(L"UNICODE String 3 Привет!", INVALID_FLAG, 0, TRUE),
|
|
|
|
NEW_TEST(L"\xFEFF" L"UNICODE String 4 Привет!", IS_TEXT_UNICODE_ASCII16, 0, FALSE),
|
|
NEW_TEST(L"\xFEFF" L"UNICODE String 4 Привет!", IS_TEXT_UNICODE_UNICODE_MASK, IS_TEXT_UNICODE_SIGNATURE | IS_TEXT_UNICODE_CONTROLS, TRUE),
|
|
NEW_TEST(L"\xFEFF" L"UNICODE String 4 Привет!", IS_TEXT_UNICODE_STATISTICS, 0, FALSE),
|
|
NEW_TEST(L"\xFEFF" L"UNICODE String 4 Привет!", INVALID_FLAG, 0, TRUE),
|
|
|
|
NEW_TEST(L"\xFFFE" L"UNICODE String 5 Привет!", IS_TEXT_UNICODE_ASCII16, 0, FALSE),
|
|
NEW_TEST(L"\xFFFE" L"UNICODE String 5 Привет!", IS_TEXT_UNICODE_UNICODE_MASK, IS_TEXT_UNICODE_CONTROLS, TRUE),
|
|
NEW_TEST(L"\xFFFE" L"UNICODE String 5 Привет!", IS_TEXT_UNICODE_STATISTICS, 0, FALSE),
|
|
NEW_TEST(L"\xFFFE" L"UNICODE String 5 Привет!", INVALID_FLAG, 0, FALSE),
|
|
|
|
/* Reverse BOM */
|
|
NEW_TEST(L"UNICODE S" L"\xFFFE" L"tring 5 Привет!", IS_TEXT_UNICODE_ILLEGAL_CHARS, IS_TEXT_UNICODE_ILLEGAL_CHARS, FALSE),
|
|
/* UNICODE_NUL */
|
|
NEW_TEST(L"UNICODE S" L"\x0000" L"tring 5 Привет!", IS_TEXT_UNICODE_ILLEGAL_CHARS, IS_TEXT_UNICODE_ILLEGAL_CHARS, FALSE),
|
|
/* ASCII CRLF (packed into one word) */
|
|
NEW_TEST(L"UNICODE S" L"\x0A0D" L"tring 5 Привет!", IS_TEXT_UNICODE_ILLEGAL_CHARS, IS_TEXT_UNICODE_ILLEGAL_CHARS, FALSE),
|
|
/* Unicode 0xFFFF */
|
|
NEW_TEST(L"UNICODE S" L"\xFFFF" L"tring 5 Привет!", IS_TEXT_UNICODE_ILLEGAL_CHARS, IS_TEXT_UNICODE_ILLEGAL_CHARS, FALSE),
|
|
|
|
NEW_TEST(L"UNICODE String 0", IS_TEXT_UNICODE_DBCS_LEADBYTE, 0, FALSE)
|
|
};
|
|
|
|
const char japanese_with_lead[] = "ABC" "\x83\x40" "D";
|
|
const char japanese_sjis[] = "\x93\xFA\x96\x7B\x8C\xEA\x31\x32\x33\x93\xFA\x96\x7B\x8C\xEA";
|
|
const char japanese_utf8[] = "\xE6\x97\xA5\xE6\x9C\xAC\xE8\xAA\x9E\x31\x32\x33\xE6\x97\xA5"
|
|
"\xE6\x9C\xAC\xE8\xAA\x9E";
|
|
const char simplfied_chinese_with_lead[] = "ABC" "\xC5\xC5" "D";
|
|
const char korean_with_lead[] = "ABC" "\xBF\xAD" "D";
|
|
const char traditional_chinese_with_lead[] = "ABC" "\xB1\xC1" "D";
|
|
|
|
UINT i;
|
|
BOOL Success;
|
|
INT Result;
|
|
|
|
for (i = 0; i < ARRAYSIZE(Tests); ++i)
|
|
{
|
|
Result = Tests[i].Flags;
|
|
Success = IsTextUnicode(Tests[i].Buffer, Tests[i].Size, ((Result != INVALID_FLAG) ? &Result : NULL));
|
|
ok(Success == Tests[i].Success, "Line %u: IsTextUnicode() returned 0x%x, expected %s\n", Tests[i].lineno, Success, (Tests[i].Success ? "TRUE" : "FALSE"));
|
|
if (Result != INVALID_FLAG)
|
|
ok(Result == Tests[i].ResultFlags, "Line %u: IsTextUnicode() Result returned 0x%x, expected 0x%x\n", Tests[i].lineno, Result, Tests[i].ResultFlags);
|
|
}
|
|
|
|
/* Japanese */
|
|
SetupLocale(932, 932, -1);
|
|
|
|
Result = IS_TEXT_UNICODE_DBCS_LEADBYTE;
|
|
ok_int(IsTextUnicode(japanese_with_lead, sizeof(japanese_with_lead), &Result), FALSE);
|
|
ok_int(Result, IS_TEXT_UNICODE_DBCS_LEADBYTE);
|
|
|
|
ok_int(IsTextUnicode(japanese_sjis, sizeof(japanese_sjis) - 1, NULL), FALSE);
|
|
|
|
Result = IS_TEXT_UNICODE_STATISTICS | IS_TEXT_UNICODE_REVERSE_STATISTICS;
|
|
ok_int(IsTextUnicode(japanese_sjis, sizeof(japanese_sjis) - 1, &Result), FALSE);
|
|
ok_int(Result, 0);
|
|
|
|
Result = IS_TEXT_UNICODE_STATISTICS | IS_TEXT_UNICODE_REVERSE_STATISTICS |
|
|
IS_TEXT_UNICODE_DBCS_LEADBYTE;
|
|
ok_int(IsTextUnicode(japanese_sjis, sizeof(japanese_sjis) - 1, &Result), FALSE);
|
|
ok_int(Result, (IS_TEXT_UNICODE_DBCS_LEADBYTE | IS_TEXT_UNICODE_REVERSE_STATISTICS));
|
|
|
|
ok_int(IsTextUnicode(japanese_utf8, sizeof(japanese_utf8) - 1, NULL), FALSE);
|
|
|
|
Result = IS_TEXT_UNICODE_STATISTICS | IS_TEXT_UNICODE_REVERSE_STATISTICS;
|
|
ok_int(IsTextUnicode(japanese_utf8, sizeof(japanese_utf8) - 1, &Result), FALSE);
|
|
ok_int(Result, 0);
|
|
|
|
Result = IS_TEXT_UNICODE_STATISTICS | IS_TEXT_UNICODE_REVERSE_STATISTICS |
|
|
IS_TEXT_UNICODE_DBCS_LEADBYTE;
|
|
ok_int(IsTextUnicode(japanese_utf8, sizeof(japanese_utf8) - 1, &Result), FALSE);
|
|
ok_int(Result, (IS_TEXT_UNICODE_DBCS_LEADBYTE | IS_TEXT_UNICODE_STATISTICS));
|
|
|
|
/* Simplified Chinese */
|
|
SetupLocale(936, 936, -1);
|
|
|
|
Result = IS_TEXT_UNICODE_DBCS_LEADBYTE;
|
|
ok(!IsTextUnicode(simplfied_chinese_with_lead, sizeof(simplfied_chinese_with_lead), &Result), "IsTextUnicode() returned TRUE, expected FALSE\n");
|
|
ok(Result == IS_TEXT_UNICODE_DBCS_LEADBYTE, "Result returned 0x%x, expected 0x%x\n", Result, IS_TEXT_UNICODE_DBCS_LEADBYTE);
|
|
|
|
/* Korean */
|
|
SetupLocale(949, 949, -1);
|
|
|
|
Result = IS_TEXT_UNICODE_DBCS_LEADBYTE;
|
|
ok(!IsTextUnicode(korean_with_lead, sizeof(korean_with_lead), &Result), "IsTextUnicode() returned TRUE, expected FALSE\n");
|
|
ok(Result == IS_TEXT_UNICODE_DBCS_LEADBYTE, "Result returned 0x%x, expected 0x%x\n", Result, IS_TEXT_UNICODE_DBCS_LEADBYTE);
|
|
|
|
/* Traditional Chinese */
|
|
SetupLocale(950, 950, -1);
|
|
|
|
Result = IS_TEXT_UNICODE_DBCS_LEADBYTE;
|
|
ok(!IsTextUnicode(traditional_chinese_with_lead, sizeof(traditional_chinese_with_lead), &Result), "IsTextUnicode() returned TRUE, expected FALSE\n");
|
|
ok(Result == IS_TEXT_UNICODE_DBCS_LEADBYTE, "Result returned 0x%x, expected 0x%x\n", Result, IS_TEXT_UNICODE_DBCS_LEADBYTE);
|
|
}
|