aboutsummaryrefslogtreecommitdiffstats
path: root/tests/test_utf8.lua
diff options
context:
space:
mode:
authorMatthew Wild <mwild1@gmail.com>2015-03-23 17:16:54 +0000
committerMatthew Wild <mwild1@gmail.com>2015-03-23 17:16:54 +0000
commitf70ce48360c597c96aadce377625db25e1627ea8 (patch)
tree76bb4e5cd4f5d11ff9d69d45e66ec9d9aac9a957 /tests/test_utf8.lua
parentdd0acd25ece857dd71d84e0b673b29082e47567d (diff)
downloadprosody-f70ce48360c597c96aadce377625db25e1627ea8.tar.gz
prosody-f70ce48360c597c96aadce377625db25e1627ea8.zip
tests: Add UTF-8 validity tests
Diffstat (limited to 'tests/test_utf8.lua')
-rw-r--r--tests/test_utf8.lua19
1 files changed, 19 insertions, 0 deletions
diff --git a/tests/test_utf8.lua b/tests/test_utf8.lua
new file mode 100644
index 00000000..481eff5d
--- /dev/null
+++ b/tests/test_utf8.lua
@@ -0,0 +1,19 @@
+package.cpath = "../?.so"
+package.path = "../?.lua";
+
+function valid()
+ local encodings = require "util.encodings";
+ local utf8 = assert(encodings.utf8, "no encodings.utf8 module");
+
+ for line in io.lines("utf8_sequences.txt") do
+ local data = line:match(":%s*([^#]+)"):gsub("%s+", ""):gsub("..", function (c) return string.char(tonumber(c, 16)); end)
+ local expect = line:match("(%S+):");
+ if expect ~= "pass" and expect ~= "fail" then
+ error("unknown expectation: "..line:match("^[^:]+"));
+ end
+ local prefix, style = " ", valid_style;
+ local valid = utf8.valid(data);
+ assert_equal(valid, utf8.valid(data.." "));
+ assert_equal(valid, expect == "pass", line);
+ end
+end