/* server/src/util/unicode.test.c */

#ifdef _MSC_VER
#include <platform.h>
#endif

#include "unicode.h"

#include <CuTest.h>

#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include <errno.h>

/*
 * Exercises unicode_utf8_trim() on plain ASCII input, on whitespace and
 * control characters at either end and in the middle, on a trailing
 * three-byte sequence, and finally on a string that ends in a dangling
 * UTF-8 lead byte.
 */
static void test_unicode_trim(CuTest * tc)
{
    /* One row per case: raw input, expected return value, expected text. */
    static const struct {
        const char *input;
        int removed;
        const char *result;
    } cases[] = {
        { "Hello World", 0, "Hello World" },
        { "  Hello World", 2, "Hello World" },
        { "Hello World  ", 2, "Hello World" },
        { " Hello World ", 2, "Hello World" },
        { "Hello\t\r\nWorld", 3, "HelloWorld" },
        /* "LTR" followed by the bytes e2 80 8e */
        { "LTR\xe2\x80\x8e", 3, "LTR" },
        { "  Hello Word  ", 4, "Hello Word" },
        { "Hello Word\n", 1, "Hello Word" },
        { "  Hello Word\t\n", 4, "Hello Word" },
        { " \t Hello Word", 3, "Hello Word" }
    };
    char text[32];
    size_t i;

    for (i = 0; i != sizeof(cases) / sizeof(cases[0]); ++i) {
        strcpy(text, cases[i].input);
        CuAssertIntEquals(tc, cases[i].removed, unicode_utf8_trim(text));
        CuAssertStrEquals(tc, cases[i].result, text);
    }

    /*
     * text still holds "Hello Word" from the last row. Overwriting its
     * final byte with 0xc3 (-61 as a signed char) leaves a lead byte with
     * no continuation byte before the terminator; the expectation is that
     * trim reports 1 and leaves a '?' in its place.
     */
    text[9] = -61;
    CuAssertIntEquals(tc, 1, unicode_utf8_trim(text));
    CuAssertStrEquals(tc, "Hello Wor?", text);
}

/*
 * unicode_utf8_tolower() must lower-case into a buffer that is large enough,
 * and must report ENOMEM without writing past the given size when it is not.
 */
static void test_unicode_tolower(CuTest * tc)
{
    static const char mixed_case[] = "HeLlO W0Rld";
    char out[32];

    /* Enough room: the whole string is converted and terminated. */
    CuAssertIntEquals(tc, 0, unicode_utf8_tolower(out, sizeof(out), mixed_case));
    CuAssertStrEquals(tc, "hello w0rld", out);

    /*
     * Only five bytes of room: zero the buffer and plant a sentinel at
     * index 5. Reading back "helloX" shows that indices 0-4 were filled
     * and the sentinel right behind them was left untouched.
     */
    memset(out, 0, sizeof(out));
    out[5] = 'X';
    CuAssertIntEquals(tc, ENOMEM, unicode_utf8_tolower(out, 5, mixed_case));
    CuAssertStrEquals(tc, "helloX", out);
}

/*
 * Converts each character of a short UTF-8 string to cp437, cp1252 and
 * ASCII, checking the status code, the number of input bytes consumed and
 * the resulting single-byte character for every conversion.
 */
static void test_unicode_utf8_to_other(CuTest *tc)
{
    /* UTF-8 for U+00D8, U+0178 and U+009D, followed by an ASCII 'l' */
    static const unsigned char encoded[] = { 0xc3, 0x98, 0xc5, 0xb8, 0xc2, 0x9d, 'l', 0 };
    /* Per character: byte offset, encoded length, expected output per target. */
    static const struct {
        int offset;
        int length;
        int cp437;
        int cp1252;
        int ascii;
    } expect[] = {
        { 0, 2, '?', 216, '?' },
        { 2, 2, '?', 120, '?' },
        { 4, 2, '?', 0x9d, '?' },
        { 6, 1, 'l', 'l', 'l' }
    };
    const size_t count = sizeof(expect) / sizeof(expect[0]);
    char *text = (char *)encoded;
    unsigned char out;
    size_t len;
    size_t i;

    /* The three passes run one after another, one target encoding each. */
    for (i = 0; i != count; ++i) {
        CuAssertIntEquals(tc, 0, unicode_utf8_to_cp437(&out, text + expect[i].offset, &len));
        CuAssertIntEquals(tc, expect[i].length, (int)len);
        CuAssertIntEquals(tc, expect[i].cp437, out);
    }

    for (i = 0; i != count; ++i) {
        CuAssertIntEquals(tc, 0, unicode_utf8_to_cp1252(&out, text + expect[i].offset, &len));
        CuAssertIntEquals(tc, expect[i].length, (int)len);
        CuAssertIntEquals(tc, expect[i].cp1252, out);
    }

    for (i = 0; i != count; ++i) {
        CuAssertIntEquals(tc, 0, unicode_utf8_to_ascii(&out, text + expect[i].offset, &len));
        CuAssertIntEquals(tc, expect[i].length, (int)len);
        CuAssertIntEquals(tc, expect[i].ascii, out);
    }
}

/*
 * Decoding a single ASCII character must succeed, yield that character's
 * code and report a sequence length of one.
 */
static void test_unicode_utf8_to_ucs(CuTest *tc) {
    wint_t wc;
    size_t sz;

    CuAssertIntEquals(tc, 0, unicode_utf8_decode(&wc, "a", &sz));
    /*
     * Cast explicitly, as the other tests in this file do for size_t
     * values, so no implicit narrowing happens at the assertion call.
     */
    CuAssertIntEquals(tc, 'a', (int)wc);
    CuAssertIntEquals(tc, 1, (int)sz);
}

/*
 * Regression test for bug 2262: a name whose first byte is a latin1
 * character rather than valid UTF-8 must be rejected with EILSEQ by both
 * the decoder and the trim function, while the pure ASCII name is accepted.
 */
static void test_unicode_bug2262(CuTest *tc) {
    char name[7]; /* "utende" plus the terminator */
    wint_t wc;
    size_t sz;

    strcpy(name, "utende");
    CuAssertIntEquals(tc, 0, unicode_utf8_decode(&wc, name, &sz));
    /*
     * Cast explicitly, as the other tests in this file do for size_t
     * values, so no implicit narrowing happens at the assertion call.
     */
    CuAssertIntEquals(tc, 1, (int)sz);
    CuAssertIntEquals(tc, 'u', (int)wc);
    CuAssertIntEquals(tc, 0, unicode_utf8_trim(name));

    name[0] = -4; /* byte 0xfc, latin1 u-umlaut: should fail to decode */
    CuAssertIntEquals(tc, EILSEQ, unicode_utf8_decode(&wc, name, &sz));
    CuAssertIntEquals(tc, EILSEQ, unicode_utf8_trim(name));
}

/*
 * unicode_utf8_strcasecmp() must treat strings that differ only in letter
 * case as equal and return 1 for the one differing pair checked here.
 */
static void test_unicode_compare(CuTest *tc)
{
    static const struct {
        const char *lhs;
        const char *rhs;
        int expected;
    } cases[] = {
        { "ABCDEFG", "abcdefg", 0 },
        { "abcdefg123", "ABCDEFG123", 0 },
        { "bacdefg123", "ABCDEFG123", 1 }
    };
    size_t i;

    for (i = 0; i != sizeof(cases) / sizeof(cases[0]); ++i) {
        CuAssertIntEquals(tc, cases[i].expected,
            unicode_utf8_strcasecmp(cases[i].lhs, cases[i].rhs));
    }
}

/*
 * U+200C (zero width non-joiner) must be stripped from both ends of a name
 * together with the trailing spaces, but kept between the two letters.
 */
static void test_unicode_trim_zwnj(CuTest *tc) {
    /*
     * UTF-8 encoding of U+200C. Written as a string literal because the
     * byte values do not fit a signed char when given as integer
     * initialisers; the array still has four elements including the
     * terminator.
     */
    const char zwnj[] = "\xe2\x80\x8c";
    char name[64];
    char expect[64];
    snprintf(name, sizeof(name), "%sA%sB%s  ", zwnj, zwnj, zwnj);
    snprintf(expect, sizeof(expect), "A%sB", zwnj);
    /* two 3-byte sequences plus two spaces are expected to be removed */
    CuAssertIntEquals(tc, 8, unicode_utf8_trim(name));
    CuAssertStrEquals(tc, expect, name);
}

/*
 * U+200E (left-to-right mark) must be stripped from both ends of a name
 * together with the trailing spaces, but kept inside the word.
 */
static void test_unicode_trim_ltrm(CuTest *tc) {
    /*
     * UTF-8 encoding of U+200E. Written as a string literal because the
     * byte values do not fit a signed char when given as integer
     * initialisers; the array still has four elements including the
     * terminator.
     */
    const char ltrm[] = "\xe2\x80\x8e";
    char name[64];
    char expect[64];
    snprintf(name, sizeof(name), "%sBrot%szeit%s  ", ltrm, ltrm, ltrm);
    snprintf(expect, sizeof(expect), "Brot%szeit", ltrm);
    /* two 3-byte sequences plus two spaces are expected to be removed */
    CuAssertIntEquals(tc, 8, unicode_utf8_trim(name));
    CuAssertStrEquals(tc, expect, name);
}

/*
 * An emoji (U+23F0, alarm clock) at the start, in the middle and at the end
 * of a name must survive trimming: nothing is removed and the text is
 * unchanged.
 */
static void test_unicode_trim_emoji(CuTest *tc) {
    /*
     * UTF-8 encoding of U+23F0. Written as a string literal because the
     * byte values do not fit a signed char when given as integer
     * initialisers; the array still has four elements including the
     * terminator.
     */
    const char clock[] = "\xE2\x8F\xB0";
    char name[64];
    char expect[64];
    snprintf(name, sizeof(name), "%s Alarm%sClock %s", clock, clock, clock);
    /* keep a copy of the untouched input to compare against afterwards */
    strcpy(expect, name);
    CuAssertIntEquals(tc, 0, unicode_utf8_trim(name));
    CuAssertStrEquals(tc, expect, name);
}

/*
 * Builds the test suite for the unicode helpers.
 *
 * Creates a new suite with CuSuiteNew(), registers every test function of
 * this file on it and returns it to the caller.
 * NOTE(review): nothing here releases the suite; presumably the caller that
 * runs it owns it - confirm against the test runner.
 */
CuSuite *get_unicode_suite(void)
{
    CuSuite *suite = CuSuiteNew();
    /* trimming of names */
    SUITE_ADD_TEST(suite, test_unicode_trim);
    SUITE_ADD_TEST(suite, test_unicode_trim_zwnj);
    SUITE_ADD_TEST(suite, test_unicode_trim_ltrm);
    SUITE_ADD_TEST(suite, test_unicode_trim_emoji);
    /* conversion and decoding */
    SUITE_ADD_TEST(suite, test_unicode_utf8_to_other);
    SUITE_ADD_TEST(suite, test_unicode_utf8_to_ucs);
    /* comparison, regression test and case folding */
    SUITE_ADD_TEST(suite, test_unicode_compare);
    SUITE_ADD_TEST(suite, test_unicode_bug2262);
    SUITE_ADD_TEST(suite, test_unicode_tolower);
    return suite;
}
use wint_t, not long. 2019-08-01 18:40:42 +02:00			`#ifdef _MSC_VER`
try to allow visual studio to build with all warnings (/WAll) enabled. 2015-01-12 22:53:21 +01:00			`#include <platform.h>`
use wint_t, not long. 2019-08-01 18:40:42 +02:00			`#endif`

basic test for tolower function. 2014-10-19 06:42:40 +02:00			`#include "unicode.h"`
use wint_t, not long. 2019-08-01 18:40:42 +02:00
			`#include <CuTest.h>`

			`#include <stdio.h>`
basic test for tolower function. 2014-10-19 06:42:40 +02:00			`#include <stdlib.h>`
			`#include <string.h>`
			`#include <errno.h>`

fix bad names. trim leading whitespace and non-printable characters from existing unit, region and faction names/descriptions. 2016-11-11 00:30:49 +01:00			`static void test_unicode_trim(CuTest * tc)`
			`{`
			`char buffer[32];`

use wint_t, not long. 2019-08-01 18:40:42 +02:00			`strcpy(buffer, "Hello World");`
fix bad names. trim leading whitespace and non-printable characters from existing unit, region and faction names/descriptions. 2016-11-11 00:30:49 +01:00			`CuAssertIntEquals(tc, 0, unicode_utf8_trim(buffer));`
use wint_t, not long. 2019-08-01 18:40:42 +02:00			`CuAssertStrEquals(tc, "Hello World", buffer);`

			`strcpy(buffer, "  Hello World");`
			`CuAssertIntEquals(tc, 2, unicode_utf8_trim(buffer));`
			`CuAssertStrEquals(tc, "Hello World", buffer);`

			`strcpy(buffer, "Hello World  ");`
			`CuAssertIntEquals(tc, 2, unicode_utf8_trim(buffer));`
			`CuAssertStrEquals(tc, "Hello World", buffer);`

			`strcpy(buffer, " Hello World ");`
			`CuAssertIntEquals(tc, 2, unicode_utf8_trim(buffer));`
			`CuAssertStrEquals(tc, "Hello World", buffer);`

			`strcpy(buffer, "Hello\t\r\nWorld");`
			`CuAssertIntEquals(tc, 3, unicode_utf8_trim(buffer));`
			`CuAssertStrEquals(tc, "HelloWorld", buffer);`

			`strcpy(buffer, "LTR");`
			`buffer[3] = -30;`
			`buffer[4] = -128;`
			`buffer[5] = -114;`
			`buffer[6] = 0;`
			`CuAssertIntEquals(tc, 3, unicode_utf8_trim(buffer));`
			`CuAssertStrEquals(tc, "LTR", buffer);`
fix bad names. trim leading whitespace and non-printable characters from existing unit, region and faction names/descriptions. 2016-11-11 00:30:49 +01:00
also remove trailing spaces. 2016-11-11 01:34:59 +01:00			`strcpy(buffer, "  Hello Word  ");`
			`CuAssertIntEquals(tc, 4, unicode_utf8_trim(buffer));`
			`CuAssertStrEquals(tc, "Hello Word", buffer);`

fix bad names. trim leading whitespace and non-printable characters from existing unit, region and faction names/descriptions. 2016-11-11 00:30:49 +01:00			`strcpy(buffer, "Hello Word\n");`
			`CuAssertIntEquals(tc, 1, unicode_utf8_trim(buffer));`
			`CuAssertStrEquals(tc, "Hello Word", buffer);`

			`strcpy(buffer, "  Hello Word\t\n");`
			`CuAssertIntEquals(tc, 4, unicode_utf8_trim(buffer));`
			`CuAssertStrEquals(tc, "Hello Word", buffer);`

			`strcpy(buffer, " \t Hello Word");`
			`CuAssertIntEquals(tc, 3, unicode_utf8_trim(buffer));`
			`CuAssertStrEquals(tc, "Hello Word", buffer);`
fix truncated names that split a utf8 sequence. 2016-11-20 14:50:38 +01:00
fix curse-vigour calculation math. also fix a ton of small other niggles from pvs-studio. 2016-11-20 19:08:39 +01:00			`buffer[9] = -61;`
fix truncated names that split a utf8 sequence. 2016-11-20 14:50:38 +01:00			`CuAssertIntEquals(tc, 1, unicode_utf8_trim(buffer));`
			`CuAssertStrEquals(tc, "Hello Wor?", buffer);`
fix bad names. trim leading whitespace and non-printable characters from existing unit, region and faction names/descriptions. 2016-11-11 00:30:49 +01:00			`}`

basic test for tolower function. 2014-10-19 06:42:40 +02:00			`static void test_unicode_tolower(CuTest * tc)`
			`{`
			`char buffer[32];`
			`CuAssertIntEquals(tc, 0, unicode_utf8_tolower(buffer, sizeof(buffer), "HeLlO W0Rld"));`
			`CuAssertStrEquals(tc, "hello w0rld", buffer);`
			`memset(buffer, 0, sizeof(buffer));`
try to allow visual studio to build with all warnings (/WAll) enabled. 2015-01-12 22:53:21 +01:00			`buffer[5] = 'X';`
basic test for tolower function. 2014-10-19 06:42:40 +02:00			`CuAssertIntEquals(tc, ENOMEM, unicode_utf8_tolower(buffer, 5, "HeLlO W0Rld"));`
			`CuAssertStrEquals(tc, "helloX", buffer);`
			`}`

fix endless loop in cp1252 search (wrong sort) fix indentation additional testing 2016-10-02 13:12:47 +02:00			`static void test_unicode_utf8_to_other(CuTest *tc)`
fix an endless loop in unicode_utf8_to_cp437 for characters not in the table. 2016-10-02 12:46:07 +02:00			`{`
Be very strict about C standards. Compile with -std=c89 in gcc. remove all // comments (they are nice, but unnecessary). variables only declared at start of block. various pedantery. backwards compatible va_copy for pre-C99 gcc. 2017-02-18 21:15:14 +01:00			`const unsigned char uchar_str[] = { 0xc3, 0x98, 0xc5, 0xb8, 0xc2, 0x9d, 'l', 0 }; /* Ø&Yuml;l */`
use wint_t, not long. 2019-08-01 18:40:42 +02:00			`char *utf8_str = (char *)uchar_str;`
fix endless loop in cp1252 search (wrong sort) fix indentation additional testing 2016-10-02 13:12:47 +02:00			`unsigned char ch;`
fix an endless loop in unicode_utf8_to_cp437 for characters not in the table. 2016-10-02 12:46:07 +02:00			`size_t sz;`
			`CuAssertIntEquals(tc, 0, unicode_utf8_to_cp437(&ch, utf8_str, &sz));`
fix gcc conversion warnings 2016-10-09 10:06:51 +02:00			`CuAssertIntEquals(tc, 2, (int)sz);`
fix an endless loop in unicode_utf8_to_cp437 for characters not in the table. 2016-10-02 12:46:07 +02:00			`CuAssertIntEquals(tc, '?', ch);`
fix endless loop in cp1252 search (wrong sort) fix indentation additional testing 2016-10-02 13:12:47 +02:00			`CuAssertIntEquals(tc, 0, unicode_utf8_to_cp437(&ch, utf8_str+2, &sz));`
fix gcc conversion warnings 2016-10-09 10:06:51 +02:00			`CuAssertIntEquals(tc, 2, (int)sz);`
fix endless loop in cp1252 search (wrong sort) fix indentation additional testing 2016-10-02 13:12:47 +02:00			`CuAssertIntEquals(tc, '?', ch);`
			`CuAssertIntEquals(tc, 0, unicode_utf8_to_cp437(&ch, utf8_str+4, &sz));`
fix gcc conversion warnings 2016-10-09 10:06:51 +02:00			`CuAssertIntEquals(tc, 2, (int)sz);`
fix endless loop in cp1252 search (wrong sort) fix indentation additional testing 2016-10-02 13:12:47 +02:00			`CuAssertIntEquals(tc, '?', ch);`
			`CuAssertIntEquals(tc, 0, unicode_utf8_to_cp437(&ch, utf8_str + 6, &sz));`
fix gcc conversion warnings 2016-10-09 10:06:51 +02:00			`CuAssertIntEquals(tc, 1, (int)sz);`
fix endless loop in cp1252 search (wrong sort) fix indentation additional testing 2016-10-02 13:12:47 +02:00			`CuAssertIntEquals(tc, 'l', ch);`

			`CuAssertIntEquals(tc, 0, unicode_utf8_to_cp1252(&ch, utf8_str, &sz));`
fix gcc conversion warnings 2016-10-09 10:06:51 +02:00			`CuAssertIntEquals(tc, 2, (int)sz);`
fix endless loop in cp1252 search (wrong sort) fix indentation additional testing 2016-10-02 13:12:47 +02:00			`CuAssertIntEquals(tc, 216, ch);`
			`CuAssertIntEquals(tc, 0, unicode_utf8_to_cp1252(&ch, utf8_str+2, &sz));`
fix gcc conversion warnings 2016-10-09 10:06:51 +02:00			`CuAssertIntEquals(tc, 2, (int)sz);`
fix endless loop in cp1252 search (wrong sort) fix indentation additional testing 2016-10-02 13:12:47 +02:00			`CuAssertIntEquals(tc, 120, ch);`
			`CuAssertIntEquals(tc, 0, unicode_utf8_to_cp1252(&ch, utf8_str + 4, &sz));`
fix gcc conversion warnings 2016-10-09 10:06:51 +02:00			`CuAssertIntEquals(tc, 2, (int)sz);`
fix endless loop in cp1252 search (wrong sort) fix indentation additional testing 2016-10-02 13:12:47 +02:00			`CuAssertIntEquals(tc, 0x9d, ch);`
			`CuAssertIntEquals(tc, 0, unicode_utf8_to_cp1252(&ch, utf8_str + 6, &sz));`
fix gcc conversion warnings 2016-10-09 10:06:51 +02:00			`CuAssertIntEquals(tc, 1, (int)sz);`
fix endless loop in cp1252 search (wrong sort) fix indentation additional testing 2016-10-02 13:12:47 +02:00			`CuAssertIntEquals(tc, 'l', ch);`

			`CuAssertIntEquals(tc, 0, unicode_utf8_to_ascii(&ch, utf8_str, &sz));`
fix gcc conversion warnings 2016-10-09 10:06:51 +02:00			`CuAssertIntEquals(tc, 2, (int)sz);`
fix endless loop in cp1252 search (wrong sort) fix indentation additional testing 2016-10-02 13:12:47 +02:00			`CuAssertIntEquals(tc, '?', ch);`
			`CuAssertIntEquals(tc, 0, unicode_utf8_to_ascii(&ch, utf8_str + 2, &sz));`
fix gcc conversion warnings 2016-10-09 10:06:51 +02:00			`CuAssertIntEquals(tc, 2, (int)sz);`
fix endless loop in cp1252 search (wrong sort) fix indentation additional testing 2016-10-02 13:12:47 +02:00			`CuAssertIntEquals(tc, '?', ch);`
			`CuAssertIntEquals(tc, 0, unicode_utf8_to_ascii(&ch, utf8_str + 4, &sz));`
fix gcc conversion warnings 2016-10-09 10:06:51 +02:00			`CuAssertIntEquals(tc, 2, (int)sz);`
fix endless loop in cp1252 search (wrong sort) fix indentation additional testing 2016-10-02 13:12:47 +02:00			`CuAssertIntEquals(tc, '?', ch);`
			`CuAssertIntEquals(tc, 0, unicode_utf8_to_ascii(&ch, utf8_str + 6, &sz));`
fix gcc conversion warnings 2016-10-09 10:06:51 +02:00			`CuAssertIntEquals(tc, 1, (int)sz);`
fix endless loop in cp1252 search (wrong sort) fix indentation additional testing 2016-10-02 13:12:47 +02:00			`CuAssertIntEquals(tc, 'l', ch);`
fix an endless loop in unicode_utf8_to_cp437 for characters not in the table. 2016-10-02 12:46:07 +02:00			`}`

fix truncated names that split a utf8 sequence. 2016-11-20 14:50:38 +01:00			`static void test_unicode_utf8_to_ucs(CuTest *tc) {`
use wint_t, not long. 2019-08-01 18:40:42 +02:00			`wint_t wc;`
fix truncated names that split a utf8 sequence. 2016-11-20 14:50:38 +01:00			`size_t sz;`

use wint_t, not long. 2019-08-01 18:40:42 +02:00			`CuAssertIntEquals(tc, 0, unicode_utf8_decode(&wc, "a", &sz));`
			`CuAssertIntEquals(tc, 'a', wc);`
fix truncated names that split a utf8 sequence. 2016-11-20 14:50:38 +01:00			`CuAssertIntEquals(tc, 1, sz);`
			`}`

change error message categories. also removing some unused messages and code that supports them. https://bugs.eressea.de/view.php?id=2270 2017-01-20 22:39:38 +01:00			`static void test_unicode_bug2262(CuTest *tc) {`
			`char name[7];`
use wint_t, not long. 2019-08-01 18:40:42 +02:00			`wint_t wc;`
change error message categories. also removing some unused messages and code that supports them. https://bugs.eressea.de/view.php?id=2270 2017-01-20 22:39:38 +01:00			`size_t sz;`

			`strcpy(name, "utende");`
use wint_t, not long. 2019-08-01 18:40:42 +02:00			`CuAssertIntEquals(tc, 0, unicode_utf8_decode(&wc, name, &sz));`
change error message categories. also removing some unused messages and code that supports them. https://bugs.eressea.de/view.php?id=2270 2017-01-20 22:39:38 +01:00			`CuAssertIntEquals(tc, 1, sz);`
use wint_t, not long. 2019-08-01 18:40:42 +02:00			`CuAssertIntEquals(tc, 'u', wc);`
change error message categories. also removing some unused messages and code that supports them. https://bugs.eressea.de/view.php?id=2270 2017-01-20 22:39:38 +01:00			`CuAssertIntEquals(tc, 0, unicode_utf8_trim(name));`

Be very strict about C standards. Compile with -std=c89 in gcc. remove all // comments (they are nice, but unnecessary). variables only declared at start of block. various pedantery. backwards compatible va_copy for pre-C99 gcc. 2017-02-18 21:15:14 +01:00			`name[0] = -4; /* latin1: ü should fail to decode */`
use wint_t, not long. 2019-08-01 18:40:42 +02:00			`CuAssertIntEquals(tc, EILSEQ, unicode_utf8_decode(&wc, name, &sz));`
change error message categories. also removing some unused messages and code that supports them. https://bugs.eressea.de/view.php?id=2270 2017-01-20 22:39:38 +01:00			`CuAssertIntEquals(tc, EILSEQ, unicode_utf8_trim(name));`
			`}`

add a very simple tst for unicode comparisons 2016-08-07 10:28:09 +02:00			`static void test_unicode_compare(CuTest *tc)`
			`{`
			`CuAssertIntEquals(tc, 0, unicode_utf8_strcasecmp("ABCDEFG", "abcdefg"));`
			`CuAssertIntEquals(tc, 0, unicode_utf8_strcasecmp("abcdefg123", "ABCDEFG123"));`
			`CuAssertIntEquals(tc, 1, unicode_utf8_strcasecmp("bacdefg123", "ABCDEFG123"));`
			`}`

use wint_t, not long. 2019-08-01 18:40:42 +02:00			`static void test_unicode_trim_zwnj(CuTest *tc) {`
			`const char zwnj[] = { 0xe2, 0x80, 0x8c, 0x00 };`
fix farsi names containing nzwj symbol. 2017-04-10 17:32:32 +02:00			`char name[64];`
use wint_t, not long. 2019-08-01 18:40:42 +02:00			`char expect[64];`
			`snprintf(name, sizeof(name), "%sA%sB%s  ", zwnj, zwnj, zwnj);`
			`snprintf(expect, sizeof(expect), "A%sB", zwnj);`
			`CuAssertIntEquals(tc, 8, unicode_utf8_trim(name));`
			`CuAssertStrEquals(tc, expect, name);`
			`}`

			`static void test_unicode_trim_ltrm(CuTest *tc) {`
			`const char ltrm[] = { 0xe2, 0x80, 0x8e, 0x00 };`
			`char name[64];`
			`char expect[64];`
			`snprintf(name, sizeof(name), "%sBrot%szeit%s  ", ltrm, ltrm, ltrm);`
			`snprintf(expect, sizeof(expect), "Brot%szeit", ltrm);`
			`CuAssertIntEquals(tc, 8, unicode_utf8_trim(name));`
			`CuAssertStrEquals(tc, expect, name);`
fix farsi names containing nzwj symbol. 2017-04-10 17:32:32 +02:00			`}`

ignore some code more points, but leave emoji intact. 2019-08-08 18:23:31 +02:00			`static void test_unicode_trim_emoji(CuTest *tc) {`
			`const char clock[] = { 0xE2, 0x8F, 0xB0, 0x00 };`
			`char name[64];`
			`char expect[64];`
			`snprintf(name, sizeof(name), "%s Alarm%sClock %s", clock, clock, clock);`
			`strcpy(expect, name);`
			`CuAssertIntEquals(tc, 0, unicode_utf8_trim(name));`
			`CuAssertStrEquals(tc, expect, name);`
			`}`

basic test for tolower function. 2014-10-19 06:42:40 +02:00			`CuSuite *get_unicode_suite(void)`
			`{`
try to allow visual studio to build with all warnings (/WAll) enabled. 2015-01-12 22:53:21 +01:00			`CuSuite *suite = CuSuiteNew();`
fix bad names. trim leading whitespace and non-printable characters from existing unit, region and faction names/descriptions. 2016-11-11 00:30:49 +01:00			`SUITE_ADD_TEST(suite, test_unicode_trim);`
use wint_t, not long. 2019-08-01 18:40:42 +02:00			`SUITE_ADD_TEST(suite, test_unicode_trim_zwnj);`
			`SUITE_ADD_TEST(suite, test_unicode_trim_ltrm);`
ignore some code more points, but leave emoji intact. 2019-08-08 18:23:31 +02:00			`SUITE_ADD_TEST(suite, test_unicode_trim_emoji);`
fix endless loop in cp1252 search (wrong sort) fix indentation additional testing 2016-10-02 13:12:47 +02:00			`SUITE_ADD_TEST(suite, test_unicode_utf8_to_other);`
fix truncated names that split a utf8 sequence. 2016-11-20 14:50:38 +01:00			`SUITE_ADD_TEST(suite, test_unicode_utf8_to_ucs);`
add a very simple tst for unicode comparisons 2016-08-07 10:28:09 +02:00			`SUITE_ADD_TEST(suite, test_unicode_compare);`
use wint_t, not long. 2019-08-01 18:40:42 +02:00			`SUITE_ADD_TEST(suite, test_unicode_bug2262);`
			`SUITE_ADD_TEST(suite, test_unicode_tolower);`
try to allow visual studio to build with all warnings (/WAll) enabled. 2015-01-12 22:53:21 +01:00			`return suite;`
basic test for tolower function. 2014-10-19 06:42:40 +02:00			`}`