diff options
Diffstat (limited to 'tests/unit/unicode.cxx')
-rw-r--r-- | tests/unit/unicode.cxx | 165 |
1 files changed, 165 insertions, 0 deletions
diff --git a/tests/unit/unicode.cxx b/tests/unit/unicode.cxx new file mode 100644 index 00000000..748f4347 --- /dev/null +++ b/tests/unit/unicode.cxx @@ -0,0 +1,165 @@ +/* Copyright 2020 Pierre Ossman <ossman@cendio.se> for Cendio AB + * + * This is free software; you can redistribute it and/or modify + * it under the terms of the GNU General Public License as published by + * the Free Software Foundation; either version 2 of the License, or + * (at your option) any later version. + * + * This software is distributed in the hope that it will be useful, + * but WITHOUT ANY WARRANTY; without even the implied warranty of + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the + * GNU General Public License for more details. + * + * You should have received a copy of the GNU General Public License + * along with this software; if not, write to the Free Software + * Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, + * USA. + */ + +#include <stdio.h> +#include <wchar.h> + +#include <rfb/util.h> + +struct _ucs4utf8 { + unsigned ucs4; + const char *utf8; +}; + +struct _ucs4utf16 { + unsigned ucs4; + const wchar_t *utf16; +}; + +struct _utf8utf16 { + const char *utf8; + const wchar_t *utf16; +}; + +struct _ucs4utf8 ucs4utf8[] = { + { 0x0061, "a" }, + { 0x00f6, "\xc3\xb6" }, + { 0x263a, "\xe2\x98\xba" }, + { 0x1f638, "\xf0\x9f\x98\xb8" }, + { 0x2d006, "\xf0\xad\x80\x86" }, + { 0xfffd, "\xe5\xe4" }, + { 0x110200, "\xef\xbf\xbd" }, +}; + +struct _ucs4utf16 ucs4utf16[] = { + { 0x0061, L"a" }, + { 0x00f6, L"\xf6" }, + { 0x263a, L"\x263a" }, + { 0xfffd, L"\xdc40\xdc12" }, + { 0x110200, L"\xfffd" }, +}; + +struct _utf8utf16 utf8utf16[] = { + { "abc", L"abc" }, + { "\xc3\xa5\xc3\xa4\xc3\xb6", L"\xe5\xe4\xf6" }, + { "\xe2\x98\xb9\xe2\x98\xba\xe2\x98\xbb", L"\x2639\x263a\x263b" }, + { "\xef\xbf\xbd\xc3\xa5", L"\xd840\xe5" }, +}; + +#define ARRAY_SIZE(a) (sizeof(a)/sizeof(*a)) + +int main(int argc, char** argv) +{ + int failures; + size_t i; + + unsigned ucs4; + char utf8[5]; + wchar_t utf16[3]; + char *out; + wchar_t *wout; + size_t len; + + failures = 0; + + for (i = 0;i < ARRAY_SIZE(ucs4utf8);i++) { + /* Expected failure? */ + if (ucs4utf8[i].ucs4 == 0xfffd) + continue; + + len = rfb::ucs4ToUTF8(ucs4utf8[i].ucs4, utf8); + if ((len != strlen(utf8)) || + (strcmp(utf8, ucs4utf8[i].utf8) != 0)) { + printf("FAILED: ucs4ToUTF8() #%d\n", (int)i+1); + failures++; + } + } + + for (i = 0;i < ARRAY_SIZE(ucs4utf8);i++) { + /* Expected failure? */ + if (strcmp(ucs4utf8[i].utf8, "\xef\xbf\xbd") == 0) + continue; + + len = rfb::utf8ToUCS4(ucs4utf8[i].utf8, strlen(ucs4utf8[i].utf8), &ucs4); + if ((len != strlen(ucs4utf8[i].utf8)) || + (ucs4 != ucs4utf8[i].ucs4)) { + printf("FAILED: utf8ToUCS4() #%d\n", (int)i+1); + failures++; + } + } + + for (i = 0;i < ARRAY_SIZE(ucs4utf16);i++) { + /* Expected failure? */ + if (ucs4utf16[i].ucs4 == 0xfffd) + continue; + + len = rfb::ucs4ToUTF16(ucs4utf16[i].ucs4, utf16); + if ((len != wcslen(utf16)) || + (wcscmp(utf16, ucs4utf16[i].utf16) != 0)) { + printf("FAILED: ucs4ToUTF16() #%d\n", (int)i+1); + failures++; + } + } + + for (i = 0;i < ARRAY_SIZE(ucs4utf16);i++) { + /* Expected failure? */ + if (wcscmp(ucs4utf16[i].utf16, L"\xfffd") == 0) + continue; + + len = rfb::utf16ToUCS4(ucs4utf16[i].utf16, wcslen(ucs4utf16[i].utf16), &ucs4); + if ((len != wcslen(ucs4utf16[i].utf16)) || + (ucs4 != ucs4utf16[i].ucs4)) { + printf("FAILED: utf16ToUCS4() #%d\n", (int)i+1); + failures++; + } + } + + for (i = 0;i < ARRAY_SIZE(utf8utf16);i++) { + /* Expected failure? */ + if (wcscmp(utf8utf16[i].utf16, L"\xfffd") == 0) + continue; + + out = rfb::utf16ToUTF8(utf8utf16[i].utf16); + if (strcmp(out, utf8utf16[i].utf8) != 0) { + printf("FAILED: utf16ToUTF8() #%d\n", (int)i+1); + failures++; + } + rfb::strFree(out); + } + + for (i = 0;i < ARRAY_SIZE(utf8utf16);i++) { + /* Expected failure? */ + if (strstr(utf8utf16[i].utf8, "\xef\xbf\xbd") != NULL) + continue; + + wout = rfb::utf8ToUTF16(utf8utf16[i].utf8); + if (wcscmp(wout, utf8utf16[i].utf16) != 0) { + printf("FAILED: utf8ToUTF16() #%d\n", (int)i+1); + failures++; + } + rfb::strFree(wout); + } + + if (failures == 0) { + printf("OK\n"); + } else { + printf("FAIL: %d failures\n", failures); + } + + return 0; +} |