os/ossrv/glib/tests/unicode-normalize.c
author sl
Tue, 10 Jun 2014 14:32:02 +0200
changeset 1 260cb5ec6c19
permissions -rw-r--r--
Update contrib.
     1 /* Portion Copyright © 2008-09 Nokia Corporation and/or its subsidiary(-ies). All rights reserved.*/
     2 #undef G_DISABLE_ASSERT
     3 #undef G_LOG_DOMAIN
     4 
     5 #include <glib.h>
     6 #include <stdio.h>
     7 #include <stdlib.h>
     8 #include <string.h>
     9 
    10 #ifdef __SYMBIAN32__
    11 #include <glib_global.h>
    12 #include "mrt2_glib2_test.h"
    13 #endif /*__SYMBIAN32__*/
    14 
    15 gboolean success = TRUE;
    16 
    17 static char *
    18 decode (const gchar *input)
    19 {
    20   unsigned ch;
    21   int offset = 0;
    22   GString *result = g_string_new (NULL);
    23   
    24   do 
    25     {
    26       if (sscanf (input + offset, "%x", &ch) != 1)
    27 	{
    28 	  fprintf (stderr, "Error parsing character string %s\n", input);
    29 	  g_assert(FALSE && "unicode-normalize failed");
    30 	  #ifdef __SYMBIAN32__
    31   	  testResultXml("unicode-normalize");
    32   	  #endif /* EMULATOR */
    33 	  exit (1);
    34 	}
    35 
    36       g_string_append_unichar (result, ch);
    37       
    38       while (input[offset] && input[offset] != ' ')
    39 	offset++;
    40       while (input[offset] && input[offset] == ' ')
    41 	offset++;
    42     }
    43   while (input[offset]);
    44 
    45   return g_string_free (result, FALSE);
    46 }
    47 
    48 const char *names[4] = {
    49   "NFD",
    50   "NFC",
    51   "NFKD",
    52   "NFKC"
    53 };
    54 
    55 static char *
    56 encode (const gchar *input)
    57 {
    58   GString *result = g_string_new(NULL);
    59 
    60   const gchar *p = input;
    61   while (*p)
    62     {
    63       gunichar c = g_utf8_get_char (p);
    64       g_string_append_printf (result, "%04X ", c);
    65       p = g_utf8_next_char(p);
    66     }
    67 
    68   return g_string_free (result, FALSE);
    69 }
    70 
    71 static void
    72 test_form (int            line,
    73 	   GNormalizeMode mode,
    74 	   gboolean       do_compat,
    75 	   int            expected,
    76 	   char         **c,
    77 	   char         **raw)
    78 {
    79   int i;
    80   
    81   gboolean mode_is_compat = (mode == G_NORMALIZE_NFKC ||
    82 			     mode == G_NORMALIZE_NFKD);
    83 
    84   if (mode_is_compat || !do_compat)
    85     {
    86       for (i = 0; i < 3; i++)
    87 	{
    88 	  char *result = g_utf8_normalize (c[i], -1, mode);
    89 	  if (strcmp (result, c[expected]) != 0)
    90 	    {
    91 	      char *result_raw = encode(result);
    92 	      fprintf (stderr, "\nFailure: %d/%d: %s\n", line, i + 1, raw[5]);
    93 	      fprintf (stderr, "  g_utf8_normalize (%s, %s) != %s but %s\n",
    94 		   raw[i], names[mode], raw[expected], result_raw);
    95 	      g_free (result_raw);
    96 	      success = FALSE;
    97 	    }
    98 	  
    99 	  g_free (result);
   100 	}
   101     }
   102   if (mode_is_compat || do_compat)
   103     {
   104       for (i = 3; i < 5; i++)
   105 	{
   106 	  char *result = g_utf8_normalize (c[i], -1, mode);
   107 	  if (strcmp (result, c[expected]) != 0)
   108 	    {
   109 	      char *result_raw = encode(result);
   110 	      fprintf (stderr, "\nFailure: %d/%d: %s\n", line, i, raw[5]);
   111 	      fprintf (stderr, "  g_utf8_normalize (%s, %s) != %s but %s\n",
   112 		   raw[i], names[mode], raw[expected], result_raw);
   113 	      g_free (result_raw);
   114 	      success = FALSE;
   115 	    }
   116 	  
   117 	  g_free (result);
   118 	}
   119     }
   120 }
   121 
   122 static gboolean
   123 process_one (int line, gchar **columns)
   124 {
   125   char *c[5];
   126   int i;
   127   gboolean skip = FALSE;
   128 
   129   for (i=0; i < 5; i++)
   130     {
   131       c[i] = decode(columns[i]);
   132       if (!c[i])
   133 	skip = TRUE;
   134     }
   135 
   136   if (!skip)
   137     {
   138       test_form (line, G_NORMALIZE_NFD, FALSE, 2, c, columns);
   139       test_form (line, G_NORMALIZE_NFD, TRUE, 4, c, columns);
   140       test_form (line, G_NORMALIZE_NFC, FALSE, 1, c, columns);
   141       test_form (line, G_NORMALIZE_NFC, TRUE, 3, c, columns);
   142       test_form (line, G_NORMALIZE_NFKD, TRUE, 4, c, columns);
   143       test_form (line, G_NORMALIZE_NFKC, TRUE, 3, c, columns);
   144     }
   145 
   146   for (i=0; i < 5; i++)
   147     g_free (c[i]);
   148   
   149   return TRUE;
   150 }
   151 
   152 int main (int argc, char **argv)
   153 {
   154   GIOChannel *in;
   155   GError *error = NULL;
   156   GString *buffer = g_string_new (NULL);
   157   int line_to_do = 0;
   158   int line = 1;
   159 
   160   #ifdef __SYMBIAN32__
   161   g_log_set_handler (NULL,  G_LOG_FLAG_FATAL| G_LOG_FLAG_RECURSION | G_LOG_LEVEL_CRITICAL | G_LOG_LEVEL_WARNING | G_LOG_LEVEL_MESSAGE | G_LOG_LEVEL_INFO | G_LOG_LEVEL_DEBUG, &mrtLogHandler, NULL);
   162   g_set_print_handler(mrtPrintHandler);
   163   #endif /*__SYMBIAN32__*/
   164   if (argc != 2 && argc != 3)
   165     {
   166       fprintf (stderr, "Usage: unicode-normalize NormalizationTest.txt LINE\n");
   167       return 1;
   168     }
   169 
   170   if (argc == 3)
   171     line_to_do = atoi(argv[2]);
   172 
   173   in = g_io_channel_new_file (argv[1], "r", &error);
   174   if (!in)
   175     {
   176       fprintf (stderr, "Cannot open %s: %s\n", argv[1], error->message);
   177       g_assert(FALSE && "unicode-normalize failed");
   178       
   179       #ifdef __SYMBIAN32__
   180       testResultXml("unicode-normalize");
   181       #endif /* EMULATOR */
   182       
   183       return 1;
   184     }
   185 
   186   while (TRUE)
   187     {
   188       gsize term_pos;
   189       gchar **columns;
   190 
   191       if (g_io_channel_read_line_string (in, buffer, &term_pos, &error) != G_IO_STATUS_NORMAL)
   192 	break;
   193 	
   194       if (line_to_do && line != line_to_do)
   195 	goto next;
   196       
   197       buffer->str[term_pos] = '\0';
   198       
   199       if (buffer->str[0] == '#') /* Comment */
   200 	goto next;
   201       if (buffer->str[0] == '@') /* Part */
   202 	{
   203 	  fprintf (stderr, "\nProcessing %s\n", buffer->str + 1);
   204 	  goto next;
   205 	}
   206       
   207       columns = g_strsplit (buffer->str, ";", -1);
   208       if (!columns[0])
   209 	goto next;
   210       
   211       if (!process_one (line, columns))
   212 	return 1;
   213       g_strfreev (columns);
   214 
   215     next:
   216       g_string_truncate (buffer, 0);
   217       line++;
   218     }
   219 
   220   if (error)
   221     {
   222       fprintf (stderr, "Error reading test file, %s\n", error->message);
   223       g_assert(FALSE && "unicode-normalize failed");
   224 	  #ifdef __SYMBIAN32__
   225   	  testResultXml("unicode-normalize");
   226   	  #endif /* EMULATOR */
   227       return 1;
   228     }
   229 
   230   g_io_channel_unref (in);
   231   g_string_free (buffer, TRUE);
   232     
   233   #ifdef __SYMBIAN32__
   234   assert_failed = !success;
   235   testResultXml("unicode-normalize");
   236   #endif /* EMULATOR */
   237 
   238   return !success;
   239 }