minori: dep/utf8proc/test/case.c comparison

comparison dep/utf8proc/test/case.c @ 343:1faa72660932

*: transfer back to cmake from autotools. autotools just made lots of things more complicated than they should have been, and many things broke (i.e. translations)

author	Paper <paper@paper.us.eu.org>
date	Thu, 20 Jun 2024 05:56:06 -0400
parents
children

comparison

equal deleted inserted replaced

-:adb79bdde329
+:1faa72660932
+#include "tests.h"
+#include <wctype.h>
+/*
+ * Test driver for the utf8proc case-mapping functions.
+ *
+ * Walks every value from 0 through 0x110000 (one past the last Unicode code
+ * point) and verifies that:
+ *   - utf8proc_tolower/toupper/totitle return either the input unchanged or
+ *     a valid code point;
+ *   - the titlecase mapping is consistent with the lower/uppercase mappings
+ *     (with a documented exemption for Georgian Mkhedruli);
+ *   - whenever the C library's towlower/towupper actually change a character,
+ *     they agree with utf8proc.
+ * It then checks the U+00DF / U+1E9E (sharp s) special cases from issue #130.
+ *
+ * argc and argv are unused.  Returns 0 when control reaches the end of main;
+ * failures are reported through check() from tests.h.
+ */
+int main(int argc, char **argv)
+{
+    int error = 0, better = 0;
+    utf8proc_int32_t c;
+
+    (void) argc; /* unused */
+    (void) argv; /* unused */
+
+    /* some simple sanity tests of the case mappings */
+    for (c = 0; c <= 0x110000; ++c) {
+        utf8proc_int32_t l = utf8proc_tolower(c);
+        utf8proc_int32_t u = utf8proc_toupper(c);
+        utf8proc_int32_t t = utf8proc_totitle(c);
+        /* Unicode 11: Georgian Mkhedruli chars have uppercase but no titlecase.
+           Both sub-ranges must be fully parenthesized: writing
+           `c >= (0x10fd && c <= 0x10ff)` compares c against 0 or 1 and
+           silently exempts almost every code point. */
+        int georgian_mkhedruli = (c >= 0x10d0 && c <= 0x10fa) ||
+                                 (c >= 0x10fd && c <= 0x10ff);
+
+        check(l == c || utf8proc_codepoint_valid(l), "invalid tolower");
+        check(u == c || utf8proc_codepoint_valid(u), "invalid toupper");
+        check(t == c || utf8proc_codepoint_valid(t), "invalid totitle");
+
+        /* The titlecase mapping should equal the lowercase mapping exactly
+           when the uppercase mapping does. */
+        if (utf8proc_codepoint_valid(c) && (l == u) != (l == t) &&
+            !(georgian_mkhedruli && l != u)) {
+            fprintf(stderr,
+                    "unexpected titlecase %x for lowercase %x / uppercase %x of codepoint %x\n",
+                    (unsigned)t, (unsigned)l, (unsigned)u, (unsigned)c);
+            ++error;
+        }
+
+        /* Only compare against the C library when wint_t is wider than two
+           bytes or all three values fit in 16 bits. */
+        if (sizeof(wint_t) > 2 || (c < (1<<16) && u < (1<<16) && l < (1<<16))) {
+            wint_t l0 = towlower((wint_t)c), u0 = towupper((wint_t)c);
+
+            /* OS unicode tables may be out of date.  But if they
+               do have a lower/uppercase mapping, hopefully it
+               is correct? */
+            if (l0 != (wint_t)c && l0 != (wint_t)l) {
+                fprintf(stderr, "MISMATCH %x != towlower(%x) == %x\n",
+                        (unsigned)l, (unsigned)c, (unsigned)l0);
+                ++error;
+            }
+            else if (l0 != (wint_t)l) { /* often true for out-of-date OS unicode */
+                /* OS left c unchanged but utf8proc has a mapping. */
+                ++better;
+            }
+
+            if (u0 != (wint_t)c && u0 != (wint_t)u) {
+                fprintf(stderr, "MISMATCH %x != towupper(%x) == %x\n",
+                        (unsigned)u, (unsigned)c, (unsigned)u0);
+                ++error;
+            }
+            else if (u0 != (wint_t)u) { /* often true for out-of-date OS unicode */
+                /* OS left c unchanged but utf8proc has a mapping. */
+                ++better;
+            }
+        }
+    }
+    check(!error, "utf8proc case conversion FAILED %d tests.", error);
+
+    /* issue #130 */
+    check(utf8proc_toupper(0x00df) == 0x1e9e &&
+          utf8proc_totitle(0x00df) == 0x1e9e &&
+          utf8proc_tolower(0x00df) == 0x00df &&
+          utf8proc_tolower(0x1e9e) == 0x00df &&
+          utf8proc_toupper(0x1e9e) == 0x1e9e,
+          "incorrect 0x00df/0x1e9e case conversions");
+
+    /* NUL-terminated UTF-8 encodings of U+00DF and U+1E9E. */
+    utf8proc_uint8_t str_00df[] = {0xc3, 0x9f, 0x00};
+    utf8proc_uint8_t str_1e9e[] = {0xe1, 0xba, 0x9e, 0x00};
+    utf8proc_uint8_t *s1 = utf8proc_NFKC_Casefold(str_00df);
+    utf8proc_uint8_t *s2 = utf8proc_NFKC_Casefold(str_1e9e);
+
+    /* Guard against NULL results before strcmp; the short-circuit keeps
+       this safe regardless of how check() reacts to a failure. */
+    check(s1 != NULL && s2 != NULL &&
+          !strcmp((char*)s1, "ss") &&
+          !strcmp((char*)s2, "ss"),
+          "incorrect 0x00df/0x1e9e casefold normalization");
+    free(s1);
+    free(s2);
+
+    printf("More up-to-date than OS unicode tables for %d tests.\n", better);
+    printf("utf8proc case conversion tests SUCCEEDED.\n");
+    return 0;
+}

Mercurial > minori

comparison dep/utf8proc/test/case.c @ 343:1faa72660932