mirror of
https://github.com/OpenMW/openmw.git
synced 2025-01-16 15:29:55 +00:00
test utf8
This commit is contained in:
parent
22d685eca3
commit
d21f3809bd
2 changed files with 41 additions and 4 deletions
|
@ -6,8 +6,8 @@
|
||||||
namespace
|
namespace
|
||||||
{
|
{
|
||||||
constexpr std::string_view UTF8PATT = "[%z\x01-\x7F\xC2-\xF4][\x80-\xBF]*"; // %z is deprecated in Lua5.2
|
constexpr std::string_view UTF8PATT = "[%z\x01-\x7F\xC2-\xF4][\x80-\xBF]*"; // %z is deprecated in Lua5.2
|
||||||
constexpr uint32_t MAXUTF = 0x7FFFFFFFu;
|
// constexpr uint32_t MAXUTF = 0x7FFFFFFFu;
|
||||||
// constexpr uint32_t MAXUNICODE = 0x10FFFFu;
|
constexpr uint32_t MAXUNICODE = 0x10FFFFu;
|
||||||
|
|
||||||
inline bool isNilOrNone(const sol::stack_proxy arg)
|
inline bool isNilOrNone(const sol::stack_proxy arg)
|
||||||
{
|
{
|
||||||
|
@ -100,7 +100,7 @@ namespace LuaUtf8
|
||||||
for (size_t i = 0; i < args.size(); ++i)
|
for (size_t i = 0; i < args.size(); ++i)
|
||||||
{
|
{
|
||||||
int64_t codepoint = getInteger(args[i], (i + 1), "char");
|
int64_t codepoint = getInteger(args[i], (i + 1), "char");
|
||||||
if (codepoint < 0 || codepoint > MAXUTF)
|
if (codepoint < 0 || codepoint > MAXUNICODE)
|
||||||
throw std::runtime_error(
|
throw std::runtime_error(
|
||||||
"bad argument #" + std::to_string(i + 1) + " to 'char' (value out of range)");
|
"bad argument #" + std::to_string(i + 1) + " to 'char' (value out of range)");
|
||||||
|
|
||||||
|
|
|
@ -1,4 +1,4 @@
|
||||||
local testing = require('testing_util')
|
local testing = require('testing_util')
|
||||||
local core = require('openmw.core')
|
local core = require('openmw.core')
|
||||||
local async = require('openmw.async')
|
local async = require('openmw.async')
|
||||||
local util = require('openmw.util')
|
local util = require('openmw.util')
|
||||||
|
@ -150,6 +150,42 @@ local function testRecordCreation()
|
||||||
testing.expectEqual(record[key],value)
|
testing.expectEqual(record[key],value)
|
||||||
end
|
end
|
||||||
end
|
end
|
||||||
|
local function testUTF8()
|
||||||
|
local utf8char = "😀"
|
||||||
|
local utf8str = "Hello, 你好, 🌎!"
|
||||||
|
local chars = {}
|
||||||
|
|
||||||
|
for codepoint = 0, 0x10FFFF do
|
||||||
|
local char = utf8.char(codepoint)
|
||||||
|
local charSize = string.len(char)
|
||||||
|
|
||||||
|
testing.expect(not chars[char], nil, "Duplicate UTF-8 character: " .. char)
|
||||||
|
chars[char] = true
|
||||||
|
|
||||||
|
if codepoint <= 0x7F then
|
||||||
|
testing.expectEqual(charSize, 1)
|
||||||
|
elseif codepoint <= 0x7FF then
|
||||||
|
testing.expectEqual(charSize, 2)
|
||||||
|
elseif codepoint <= 0xFFFF then
|
||||||
|
testing.expectEqual(charSize, 3)
|
||||||
|
elseif codepoint <= 0x10FFFF then
|
||||||
|
testing.expectEqual(charSize, 4)
|
||||||
|
end
|
||||||
|
|
||||||
|
testing.expectEqual(utf8.codepoint(char), codepoint)
|
||||||
|
testing.expectEqual(utf8.len(char), 1)
|
||||||
|
end
|
||||||
|
|
||||||
|
local str = ""
|
||||||
|
for utf_char in utf8str:gmatch(utf8.charpattern) do
|
||||||
|
str = str .. utf_char
|
||||||
|
end
|
||||||
|
testing.expectEqual(str, utf8str)
|
||||||
|
|
||||||
|
testing.expectEqual(utf8.codepoint(utf8char), 128512)
|
||||||
|
testing.expectEqual(utf8.len(utf8str), 13)
|
||||||
|
testing.expectEqual(utf8.offset(utf8str, 9), 11)
|
||||||
|
end
|
||||||
local function initPlayer()
|
local function initPlayer()
|
||||||
player:teleport('', util.vector3(4096, 4096, 867.237), util.transform.identity)
|
player:teleport('', util.vector3(4096, 4096, 867.237), util.transform.identity)
|
||||||
coroutine.yield()
|
coroutine.yield()
|
||||||
|
@ -189,6 +225,7 @@ tests = {
|
||||||
{'getGMST', testGetGMST},
|
{'getGMST', testGetGMST},
|
||||||
{'recordStores', testRecordStores},
|
{'recordStores', testRecordStores},
|
||||||
{'recordCreation', testRecordCreation},
|
{'recordCreation', testRecordCreation},
|
||||||
|
{'utf8', testUTF8},
|
||||||
{'mwscript', testMWScript},
|
{'mwscript', testMWScript},
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
Loading…
Reference in a new issue