os/ossrv/glib/tests/unicode-normalize.c
author sl
Tue, 10 Jun 2014 14:32:02 +0200
changeset 1 260cb5ec6c19
permissions -rw-r--r--
Update contrib.
sl@0
     1
/* Portion Copyright © 2008-09 Nokia Corporation and/or its subsidiary(-ies). All rights reserved.*/
sl@0
     2
#undef G_DISABLE_ASSERT
sl@0
     3
#undef G_LOG_DOMAIN
sl@0
     4
sl@0
     5
#include <glib.h>
sl@0
     6
#include <stdio.h>
sl@0
     7
#include <stdlib.h>
sl@0
     8
#include <string.h>
sl@0
     9
sl@0
    10
#ifdef __SYMBIAN32__
sl@0
    11
#include <glib_global.h>
sl@0
    12
#include "mrt2_glib2_test.h"
sl@0
    13
#endif /*__SYMBIAN32__*/
sl@0
    14
sl@0
    15
gboolean success = TRUE;
sl@0
    16
sl@0
    17
static char *
sl@0
    18
decode (const gchar *input)
sl@0
    19
{
sl@0
    20
  unsigned ch;
sl@0
    21
  int offset = 0;
sl@0
    22
  GString *result = g_string_new (NULL);
sl@0
    23
  
sl@0
    24
  do 
sl@0
    25
    {
sl@0
    26
      if (sscanf (input + offset, "%x", &ch) != 1)
sl@0
    27
	{
sl@0
    28
	  fprintf (stderr, "Error parsing character string %s\n", input);
sl@0
    29
	  g_assert(FALSE && "unicode-normalize failed");
sl@0
    30
	  #ifdef __SYMBIAN32__
sl@0
    31
  	  testResultXml("unicode-normalize");
sl@0
    32
  	  #endif /* EMULATOR */
sl@0
    33
	  exit (1);
sl@0
    34
	}
sl@0
    35
sl@0
    36
      g_string_append_unichar (result, ch);
sl@0
    37
      
sl@0
    38
      while (input[offset] && input[offset] != ' ')
sl@0
    39
	offset++;
sl@0
    40
      while (input[offset] && input[offset] == ' ')
sl@0
    41
	offset++;
sl@0
    42
    }
sl@0
    43
  while (input[offset]);
sl@0
    44
sl@0
    45
  return g_string_free (result, FALSE);
sl@0
    46
}
sl@0
    47
sl@0
    48
const char *names[4] = {
sl@0
    49
  "NFD",
sl@0
    50
  "NFC",
sl@0
    51
  "NFKD",
sl@0
    52
  "NFKC"
sl@0
    53
};
sl@0
    54
sl@0
    55
static char *
sl@0
    56
encode (const gchar *input)
sl@0
    57
{
sl@0
    58
  GString *result = g_string_new(NULL);
sl@0
    59
sl@0
    60
  const gchar *p = input;
sl@0
    61
  while (*p)
sl@0
    62
    {
sl@0
    63
      gunichar c = g_utf8_get_char (p);
sl@0
    64
      g_string_append_printf (result, "%04X ", c);
sl@0
    65
      p = g_utf8_next_char(p);
sl@0
    66
    }
sl@0
    67
sl@0
    68
  return g_string_free (result, FALSE);
sl@0
    69
}
sl@0
    70
sl@0
    71
static void
sl@0
    72
test_form (int            line,
sl@0
    73
	   GNormalizeMode mode,
sl@0
    74
	   gboolean       do_compat,
sl@0
    75
	   int            expected,
sl@0
    76
	   char         **c,
sl@0
    77
	   char         **raw)
sl@0
    78
{
sl@0
    79
  int i;
sl@0
    80
  
sl@0
    81
  gboolean mode_is_compat = (mode == G_NORMALIZE_NFKC ||
sl@0
    82
			     mode == G_NORMALIZE_NFKD);
sl@0
    83
sl@0
    84
  if (mode_is_compat || !do_compat)
sl@0
    85
    {
sl@0
    86
      for (i = 0; i < 3; i++)
sl@0
    87
	{
sl@0
    88
	  char *result = g_utf8_normalize (c[i], -1, mode);
sl@0
    89
	  if (strcmp (result, c[expected]) != 0)
sl@0
    90
	    {
sl@0
    91
	      char *result_raw = encode(result);
sl@0
    92
	      fprintf (stderr, "\nFailure: %d/%d: %s\n", line, i + 1, raw[5]);
sl@0
    93
	      fprintf (stderr, "  g_utf8_normalize (%s, %s) != %s but %s\n",
sl@0
    94
		   raw[i], names[mode], raw[expected], result_raw);
sl@0
    95
	      g_free (result_raw);
sl@0
    96
	      success = FALSE;
sl@0
    97
	    }
sl@0
    98
	  
sl@0
    99
	  g_free (result);
sl@0
   100
	}
sl@0
   101
    }
sl@0
   102
  if (mode_is_compat || do_compat)
sl@0
   103
    {
sl@0
   104
      for (i = 3; i < 5; i++)
sl@0
   105
	{
sl@0
   106
	  char *result = g_utf8_normalize (c[i], -1, mode);
sl@0
   107
	  if (strcmp (result, c[expected]) != 0)
sl@0
   108
	    {
sl@0
   109
	      char *result_raw = encode(result);
sl@0
   110
	      fprintf (stderr, "\nFailure: %d/%d: %s\n", line, i, raw[5]);
sl@0
   111
	      fprintf (stderr, "  g_utf8_normalize (%s, %s) != %s but %s\n",
sl@0
   112
		   raw[i], names[mode], raw[expected], result_raw);
sl@0
   113
	      g_free (result_raw);
sl@0
   114
	      success = FALSE;
sl@0
   115
	    }
sl@0
   116
	  
sl@0
   117
	  g_free (result);
sl@0
   118
	}
sl@0
   119
    }
sl@0
   120
}
sl@0
   121
sl@0
   122
static gboolean
sl@0
   123
process_one (int line, gchar **columns)
sl@0
   124
{
sl@0
   125
  char *c[5];
sl@0
   126
  int i;
sl@0
   127
  gboolean skip = FALSE;
sl@0
   128
sl@0
   129
  for (i=0; i < 5; i++)
sl@0
   130
    {
sl@0
   131
      c[i] = decode(columns[i]);
sl@0
   132
      if (!c[i])
sl@0
   133
	skip = TRUE;
sl@0
   134
    }
sl@0
   135
sl@0
   136
  if (!skip)
sl@0
   137
    {
sl@0
   138
      test_form (line, G_NORMALIZE_NFD, FALSE, 2, c, columns);
sl@0
   139
      test_form (line, G_NORMALIZE_NFD, TRUE, 4, c, columns);
sl@0
   140
      test_form (line, G_NORMALIZE_NFC, FALSE, 1, c, columns);
sl@0
   141
      test_form (line, G_NORMALIZE_NFC, TRUE, 3, c, columns);
sl@0
   142
      test_form (line, G_NORMALIZE_NFKD, TRUE, 4, c, columns);
sl@0
   143
      test_form (line, G_NORMALIZE_NFKC, TRUE, 3, c, columns);
sl@0
   144
    }
sl@0
   145
sl@0
   146
  for (i=0; i < 5; i++)
sl@0
   147
    g_free (c[i]);
sl@0
   148
  
sl@0
   149
  return TRUE;
sl@0
   150
}
sl@0
   151
sl@0
   152
int main (int argc, char **argv)
sl@0
   153
{
sl@0
   154
  GIOChannel *in;
sl@0
   155
  GError *error = NULL;
sl@0
   156
  GString *buffer = g_string_new (NULL);
sl@0
   157
  int line_to_do = 0;
sl@0
   158
  int line = 1;
sl@0
   159
sl@0
   160
  #ifdef __SYMBIAN32__
sl@0
   161
  g_log_set_handler (NULL,  G_LOG_FLAG_FATAL| G_LOG_FLAG_RECURSION | G_LOG_LEVEL_CRITICAL | G_LOG_LEVEL_WARNING | G_LOG_LEVEL_MESSAGE | G_LOG_LEVEL_INFO | G_LOG_LEVEL_DEBUG, &mrtLogHandler, NULL);
sl@0
   162
  g_set_print_handler(mrtPrintHandler);
sl@0
   163
  #endif /*__SYMBIAN32__*/
sl@0
   164
  if (argc != 2 && argc != 3)
sl@0
   165
    {
sl@0
   166
      fprintf (stderr, "Usage: unicode-normalize NormalizationTest.txt LINE\n");
sl@0
   167
      return 1;
sl@0
   168
    }
sl@0
   169
sl@0
   170
  if (argc == 3)
sl@0
   171
    line_to_do = atoi(argv[2]);
sl@0
   172
sl@0
   173
  in = g_io_channel_new_file (argv[1], "r", &error);
sl@0
   174
  if (!in)
sl@0
   175
    {
sl@0
   176
      fprintf (stderr, "Cannot open %s: %s\n", argv[1], error->message);
sl@0
   177
      g_assert(FALSE && "unicode-normalize failed");
sl@0
   178
      
sl@0
   179
      #ifdef __SYMBIAN32__
sl@0
   180
      testResultXml("unicode-normalize");
sl@0
   181
      #endif /* EMULATOR */
sl@0
   182
      
sl@0
   183
      return 1;
sl@0
   184
    }
sl@0
   185
sl@0
   186
  while (TRUE)
sl@0
   187
    {
sl@0
   188
      gsize term_pos;
sl@0
   189
      gchar **columns;
sl@0
   190
sl@0
   191
      if (g_io_channel_read_line_string (in, buffer, &term_pos, &error) != G_IO_STATUS_NORMAL)
sl@0
   192
	break;
sl@0
   193
	
sl@0
   194
      if (line_to_do && line != line_to_do)
sl@0
   195
	goto next;
sl@0
   196
      
sl@0
   197
      buffer->str[term_pos] = '\0';
sl@0
   198
      
sl@0
   199
      if (buffer->str[0] == '#') /* Comment */
sl@0
   200
	goto next;
sl@0
   201
      if (buffer->str[0] == '@') /* Part */
sl@0
   202
	{
sl@0
   203
	  fprintf (stderr, "\nProcessing %s\n", buffer->str + 1);
sl@0
   204
	  goto next;
sl@0
   205
	}
sl@0
   206
      
sl@0
   207
      columns = g_strsplit (buffer->str, ";", -1);
sl@0
   208
      if (!columns[0])
sl@0
   209
	goto next;
sl@0
   210
      
sl@0
   211
      if (!process_one (line, columns))
sl@0
   212
	return 1;
sl@0
   213
      g_strfreev (columns);
sl@0
   214
sl@0
   215
    next:
sl@0
   216
      g_string_truncate (buffer, 0);
sl@0
   217
      line++;
sl@0
   218
    }
sl@0
   219
sl@0
   220
  if (error)
sl@0
   221
    {
sl@0
   222
      fprintf (stderr, "Error reading test file, %s\n", error->message);
sl@0
   223
      g_assert(FALSE && "unicode-normalize failed");
sl@0
   224
	  #ifdef __SYMBIAN32__
sl@0
   225
  	  testResultXml("unicode-normalize");
sl@0
   226
  	  #endif /* EMULATOR */
sl@0
   227
      return 1;
sl@0
   228
    }
sl@0
   229
sl@0
   230
  g_io_channel_unref (in);
sl@0
   231
  g_string_free (buffer, TRUE);
sl@0
   232
    
sl@0
   233
  #ifdef __SYMBIAN32__
sl@0
   234
  assert_failed = !success;
sl@0
   235
  testResultXml("unicode-normalize");
sl@0
   236
  #endif /* EMULATOR */
sl@0
   237
sl@0
   238
  return !success;
sl@0
   239
}