From d81308faba0cfb3fccf8c3b12446863c7b76ae32 Mon Sep 17 00:00:00 2001 From: "Steven G. Johnson" Date: Wed, 2 May 2018 14:18:26 -0400 Subject: uppercase mapping ß (U+00df) to ẞ (U+1E9E) (#134) MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit * uppercase(0x00df) = 0x1e9e * tests for titlecase and u+00df uppercase * NEWS, another test --- test/case.c | 23 ++++++++++++++++++++++- 1 file changed, 22 insertions(+), 1 deletion(-) (limited to 'test/case.c') diff --git a/test/case.c b/test/case.c index 39958e3..a267609 100644 --- a/test/case.c +++ b/test/case.c @@ -13,13 +13,20 @@ int main(int argc, char **argv) for (c = 0; c <= 0x110000; ++c) { utf8proc_int32_t l = utf8proc_tolower(c); utf8proc_int32_t u = utf8proc_toupper(c); + utf8proc_int32_t t = utf8proc_totitle(c); check(l == c || utf8proc_codepoint_valid(l), "invalid tolower"); check(u == c || utf8proc_codepoint_valid(u), "invalid toupper"); + check(t == c || utf8proc_codepoint_valid(t), "invalid totitle"); + + if (utf8proc_codepoint_valid(c) && (l == u) != (l == t)) { + fprintf(stderr, "unexpected titlecase %x for lowercase %x / uppercase %x\n", t, l, c); + ++error; + } if (sizeof(wint_t) > 2 || c < (1<<16)) { wint_t l0 = towlower(c), u0 = towupper(c); - + /* OS unicode tables may be out of date. But if they do have a lower/uppercase mapping, hopefully it is correct? */ @@ -44,6 +51,20 @@ int main(int argc, char **argv) } } check(!error, "utf8proc case conversion FAILED %d tests.", error); + + /* issue #130 */ + check(utf8proc_toupper(0x00df) == 0x1e9e && + utf8proc_totitle(0x00df) == 0x1e9e && + utf8proc_tolower(0x00df) == 0x00df && + utf8proc_tolower(0x1e9e) == 0x00df && + utf8proc_toupper(0x1e9e) == 0x1e9e, + "incorrect 0x00df/0x1e9e case conversions"); + utf8proc_uint8_t str_00df[] = {0xc3, 0x9f, 0x00}; + utf8proc_uint8_t str_1e9e[] = {0xe1, 0xba, 0x9e, 0x00}; + check(!strcmp((char*)utf8proc_NFKC_Casefold(str_00df), "ss") && + !strcmp((char*)utf8proc_NFKC_Casefold(str_1e9e), "ss"), + "incorrect 0x00df/0x1e9e casefold normalization"); + printf("More up-to-date than OS unicode tables for %d tests.\n", better); printf("utf8proc case conversion tests SUCCEEDED.\n"); return 0; -- cgit v1.2.3