diff -r e4d67989cc36 -r 47c74d1534e1 glib/tests/unicode-normalize.c --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/glib/tests/unicode-normalize.c Fri Apr 16 16:46:38 2010 +0300 @@ -0,0 +1,255 @@ +/* +* Copyright (c) 2008 Nokia Corporation and/or its subsidiary(-ies). +* All rights reserved. +* This component and the accompanying materials are made available +* under the terms of "Eclipse Public License v1.0" +* which accompanies this distribution, and is available +* at the URL "http://www.eclipse.org/legal/epl-v10.html". +* +* Initial Contributors: +* Nokia Corporation - initial contribution. +* +* Contributors: +* +* Description: +* +*/ + +#undef G_DISABLE_ASSERT +#undef G_LOG_DOMAIN + +#include +#include +#include +#include + +#ifdef __SYMBIAN32__ +#include +#include "mrt2_glib2_test.h" +#endif /*__SYMBIAN32__*/ + +gboolean success = TRUE; + +static char * +decode (const gchar *input) +{ + unsigned ch; + int offset = 0; + GString *result = g_string_new (NULL); + + do + { + if (sscanf (input + offset, "%x", &ch) != 1) + { + fprintf (stderr, "Error parsing character string %s\n", input); + g_assert(FALSE && "unicode-normalize failed"); + #ifdef __SYMBIAN32__ + testResultXml("unicode-normalize"); + #endif /* EMULATOR */ + exit (1); + } + + g_string_append_unichar (result, ch); + + while (input[offset] && input[offset] != ' ') + offset++; + while (input[offset] && input[offset] == ' ') + offset++; + } + while (input[offset]); + + return g_string_free (result, FALSE); +} + +const char *names[4] = { + "NFD", + "NFC", + "NFKD", + "NFKC" +}; + +static char * +encode (const gchar *input) +{ + GString *result = g_string_new(NULL); + + const gchar *p = input; + while (*p) + { + gunichar c = g_utf8_get_char (p); + g_string_append_printf (result, "%04X ", c); + p = g_utf8_next_char(p); + } + + return g_string_free (result, FALSE); +} + +static void +test_form (int line, + GNormalizeMode mode, + gboolean do_compat, + int expected, + char **c, + char **raw) +{ + int i; + + gboolean mode_is_compat = (mode == G_NORMALIZE_NFKC || + mode == G_NORMALIZE_NFKD); + + if (mode_is_compat || !do_compat) + { + for (i = 0; i < 3; i++) + { + char *result = g_utf8_normalize (c[i], -1, mode); + if (strcmp (result, c[expected]) != 0) + { + char *result_raw = encode(result); + fprintf (stderr, "\nFailure: %d/%d: %s\n", line, i + 1, raw[5]); + fprintf (stderr, " g_utf8_normalize (%s, %s) != %s but %s\n", + raw[i], names[mode], raw[expected], result_raw); + g_free (result_raw); + success = FALSE; + } + + g_free (result); + } + } + if (mode_is_compat || do_compat) + { + for (i = 3; i < 5; i++) + { + char *result = g_utf8_normalize (c[i], -1, mode); + if (strcmp (result, c[expected]) != 0) + { + char *result_raw = encode(result); + fprintf (stderr, "\nFailure: %d/%d: %s\n", line, i, raw[5]); + fprintf (stderr, " g_utf8_normalize (%s, %s) != %s but %s\n", + raw[i], names[mode], raw[expected], result_raw); + g_free (result_raw); + success = FALSE; + } + + g_free (result); + } + } +} + +static gboolean +process_one (int line, gchar **columns) +{ + char *c[5]; + int i; + gboolean skip = FALSE; + + for (i=0; i < 5; i++) + { + c[i] = decode(columns[i]); + if (!c[i]) + skip = TRUE; + } + + if (!skip) + { + test_form (line, G_NORMALIZE_NFD, FALSE, 2, c, columns); + test_form (line, G_NORMALIZE_NFD, TRUE, 4, c, columns); + test_form (line, G_NORMALIZE_NFC, FALSE, 1, c, columns); + test_form (line, G_NORMALIZE_NFC, TRUE, 3, c, columns); + test_form (line, G_NORMALIZE_NFKD, TRUE, 4, c, columns); + test_form (line, G_NORMALIZE_NFKC, TRUE, 3, c, columns); + } + + for (i=0; i < 5; i++) + g_free (c[i]); + + return TRUE; +} + +int main (int argc, char **argv) +{ + GIOChannel *in; + GError *error = NULL; + GString *buffer = g_string_new (NULL); + int line_to_do = 0; + int line = 1; + + #ifdef __SYMBIAN32__ + g_log_set_handler (NULL, G_LOG_FLAG_FATAL| G_LOG_FLAG_RECURSION | G_LOG_LEVEL_CRITICAL | G_LOG_LEVEL_WARNING | G_LOG_LEVEL_MESSAGE | G_LOG_LEVEL_INFO | G_LOG_LEVEL_DEBUG, &mrtLogHandler, NULL); + g_set_print_handler(mrtPrintHandler); + #endif /*__SYMBIAN32__*/ + if (argc != 2 && argc != 3) + { + fprintf (stderr, "Usage: unicode-normalize NormalizationTest.txt LINE\n"); + return 1; + } + + if (argc == 3) + line_to_do = atoi(argv[2]); + + in = g_io_channel_new_file (argv[1], "r", &error); + if (!in) + { + fprintf (stderr, "Cannot open %s: %s\n", argv[1], error->message); + g_assert(FALSE && "unicode-normalize failed"); + + #ifdef __SYMBIAN32__ + testResultXml("unicode-normalize"); + #endif /* EMULATOR */ + + return 1; + } + + while (TRUE) + { + gsize term_pos; + gchar **columns; + + if (g_io_channel_read_line_string (in, buffer, &term_pos, &error) != G_IO_STATUS_NORMAL) + break; + + if (line_to_do && line != line_to_do) + goto next; + + buffer->str[term_pos] = '\0'; + + if (buffer->str[0] == '#') /* Comment */ + goto next; + if (buffer->str[0] == '@') /* Part */ + { + fprintf (stderr, "\nProcessing %s\n", buffer->str + 1); + goto next; + } + + columns = g_strsplit (buffer->str, ";", -1); + if (!columns[0]) + goto next; + + if (!process_one (line, columns)) + return 1; + g_strfreev (columns); + + next: + g_string_truncate (buffer, 0); + line++; + } + + if (error) + { + fprintf (stderr, "Error reading test file, %s\n", error->message); + g_assert(FALSE && "unicode-normalize failed"); + #ifdef __SYMBIAN32__ + testResultXml("unicode-normalize"); + #endif /* EMULATOR */ + return 1; + } + + g_io_channel_unref (in); + g_string_free (buffer, TRUE); + + #ifdef __SYMBIAN32__ + assert_failed = !success; + testResultXml("unicode-normalize"); + #endif /* EMULATOR */ + + return !success; +}