Fix #34: handle the 66 Unicode non-characters; also improve performance and surrogate handling

author: Scott Paul Jones <scottjones@alum.mit.edu> 2015-05-09 11:45:03 -0400
committer: ScottPJones <scottjones@alum.mit.edu> 2015-05-29 19:50:03 +0200
commit: 6249e6b8b1d5e360b5b5adad651911f3b4359604 (patch)
tree: c70afc21d3ef8d820d5b9de4d17c0d6e9fde1045 /test/tests.h
parent: 7c14ef5f8371e463a01e0f1de971caa600384390 (diff)
download: libutf8proc-6249e6b8b1d5e360b5b5adad651911f3b4359604.tar.gz
libutf8proc-6249e6b8b1d5e360b5b5adad651911f3b4359604.tar.bz2
1 file changed, 5 insertions, 4 deletions
diff --git a/test/tests.h b/test/tests.h
index c27185d..6eb5457 100644
--- a/test/tests.h
+++ b/test/tests.h
@@ -33,10 +33,11 @@ size_t skipspaces(const char *buf, size_t i)
    separated by whitespace, and terminated by any character not in
    [0-9a-fA-F] or whitespace, then stores the corresponding utf8 string
    in dest, returning the number of bytes read from buf */
+utf8proc_ssize_t unsafe_encode_char(utf8proc_int32_t uc, utf8proc_uint8_t *dst);
 size_t encode(char *dest, const char *buf)
 {
      size_t i = 0, j, d = 0;
-     do {
+     for (;;) {
           int c;
           i = skipspaces(buf, i);
           for (j=i; buf[j] && strchr("0123456789abcdef", tolower(buf[j])); ++j)
@@ -45,9 +46,9 @@ size_t encode(char *dest, const char *buf)
                dest[d] = 0; /* NUL-terminate destination string */
                return i + 1;
           }
-          check(sscanf(buf + i, "%x", &c) == 1, "invalid hex input %s", buf+i);
+          check(sscanf(buf + i, "%x", (unsigned int *)&c) == 1, "invalid hex input %s", buf+i);
           i = j; /* skip to char after hex input */
-          d += utf8proc_encode_char(c, (utf8proc_uint8_t *) (dest + d));
-     } while (1);
+          d += unsafe_encode_char(c, (utf8proc_uint8_t *) (dest + d));
+     }
 }
author	Scott Paul Jones <scottjones@alum.mit.edu>	2015-05-09 11:45:03 -0400
committer	ScottPJones <scottjones@alum.mit.edu>	2015-05-29 19:50:03 +0200
commit	6249e6b8b1d5e360b5b5adad651911f3b4359604 (patch)
tree	c70afc21d3ef8d820d5b9de4d17c0d6e9fde1045 /test/tests.h
parent	7c14ef5f8371e463a01e0f1de971caa600384390 (diff)
download	libutf8proc-6249e6b8b1d5e360b5b5adad651911f3b4359604.tar.gz libutf8proc-6249e6b8b1d5e360b5b5adad651911f3b4359604.tar.bz2