aboutsummaryrefslogtreecommitdiff
path: root/tests
diff options
context:
space:
mode:
authorFeoramund <161657516+Feoramund@users.noreply.github.com>2024-06-19 22:35:36 -0400
committerFeoramund <161657516+Feoramund@users.noreply.github.com>2024-06-19 22:35:36 -0400
commite620645a035fd5ce2b3b67bee83f04d003556306 (patch)
tree1d76b24f67475e4fb19fe0ba340e82710a332622 /tests
parent43809342836a2230a96d86b403722f424ce19a87 (diff)
Measure `East_Asian_Width` during grapheme decoding
Diffstat (limited to 'tests')
-rw-r--r--tests/core/unicode/test_core_unicode.odin66
1 files changed, 64 insertions, 2 deletions
diff --git a/tests/core/unicode/test_core_unicode.odin b/tests/core/unicode/test_core_unicode.odin
index c097d518a..a1f6ac934 100644
--- a/tests/core/unicode/test_core_unicode.odin
+++ b/tests/core/unicode/test_core_unicode.odin
@@ -13,7 +13,7 @@ run_test_cases :: proc(t: ^testing.T, test_cases: []Test_Case, loc := #caller_lo
failed := 0
for c, i in test_cases {
log.debugf("(#% 4i) %q ...", i, c.str)
- result, _ := utf8.grapheme_count(c.str)
+ result, _, _ := utf8.grapheme_count(c.str)
if !testing.expectf(t, result == c.expected_clusters,
"(#% 4i) graphemes: %i != %i, %q %s", i, result, c.expected_clusters, c.str, c.str,
loc = loc)
@@ -43,7 +43,7 @@ test_grapheme_byte_index_segmentation :: proc(t: ^testing.T) {
str := SAMPLE_1 + SAMPLE_2 + SAMPLE_3 + SAMPLE_2 + SAMPLE_1
- graphemes, _, _ := utf8.decode_grapheme_clusters(str)
+ graphemes, _, _, _ := utf8.decode_grapheme_clusters(str)
defer delete(graphemes)
defer if testing.failed(t) {
@@ -71,3 +71,65 @@ test_grapheme_byte_index_segmentation :: proc(t: ^testing.T) {
testing.expectf(t, grapheme_4 == SAMPLE_2, "expected %q, got %q", SAMPLE_2, grapheme_2)
testing.expectf(t, grapheme_5 == SAMPLE_1, "expected %q, got %q", SAMPLE_1, grapheme_1)
}
+
+@test
+test_width :: proc(t: ^testing.T) {
+ {
+ str := "He\u200dllo"
+ graphemes, _, width := utf8.grapheme_count(str)
+ testing.expect_value(t, graphemes, 5)
+ testing.expect_value(t, width, 5)
+ }
+
+ {
+ // Note that a zero-width space is still considered a grapheme as far
+ // as the specification is concerned.
+ str := "He\u200bllo"
+ graphemes, _, width := utf8.grapheme_count(str)
+ testing.expect_value(t, graphemes, 6)
+ testing.expect_value(t, width, 5)
+ }
+
+ {
+ str := "\U0001F926\U0001F3FC\u200D\u2642"
+ graphemes, _, width := utf8.grapheme_count(str)
+ testing.expect_value(t, graphemes, 1)
+ testing.expect_value(t, width, 2)
+ }
+
+ {
+ str := "H̷e̶l̵l̸o̴p̵e̷ ̸w̶o̸r̵l̶d̵!̴"
+ graphemes, _, width := utf8.grapheme_count(str)
+ testing.expect_value(t, graphemes, 14)
+ testing.expect_value(t, width, 14)
+ }
+
+ {
+ str := "aカ.ヒフ"
+ graphemes, grapheme_count, _, width := utf8.decode_grapheme_clusters(str)
+ defer delete(graphemes)
+ testing.expect_value(t, grapheme_count, 5)
+ testing.expect_value(t, width, 8)
+ if grapheme_count == 5 {
+ testing.expect_value(t, graphemes[0].width, 1)
+ testing.expect_value(t, graphemes[1].width, 2)
+ testing.expect_value(t, graphemes[2].width, 1)
+ testing.expect_value(t, graphemes[3].width, 2)
+ testing.expect_value(t, graphemes[4].width, 2)
+ }
+ }
+
+ {
+ str := "いろはにほへ"
+ graphemes, _, width := utf8.grapheme_count(str)
+ testing.expect_value(t, graphemes, 6)
+ testing.expect_value(t, width, 12)
+ }
+
+ {
+ str := "舍利弗,是諸法空相,不生不滅,不垢不淨,不增不減。"
+ graphemes, _, width := utf8.grapheme_count(str)
+ testing.expect_value(t, graphemes, 25)
+ testing.expect_value(t, width, 50)
+ }
+}