changeset 30598:85d772346e39

Tests for module 'mbrtowc'.
author Bruno Haible <bruno@clisp.org>
date Fri, 19 Dec 2008 03:33:05 +0100
parents 2ef0c8d4d55a
children 9e2b8239b111
files ChangeLog modules/mbrtowc-tests tests/test-mbrtowc.c tests/test-mbrtowc1.sh tests/test-mbrtowc2.sh tests/test-mbrtowc3.sh tests/test-mbrtowc4.sh
diffstat 7 files changed, 426 insertions(+), 0 deletions(-) [+]
line wrap: on
line diff
--- a/ChangeLog	Fri Dec 19 03:30:28 2008 +0100
+++ b/ChangeLog	Fri Dec 19 03:33:05 2008 +0100
@@ -1,5 +1,12 @@
 2008-12-18  Bruno Haible  <bruno@clisp.org>
 
+	* modules/mbrtowc-tests: New file.
+	* tests/test-mbrtowc1.sh: New file.
+	* tests/test-mbrtowc2.sh: New file.
+	* tests/test-mbrtowc3.sh: New file.
+	* tests/test-mbrtowc4.sh: New file.
+	* tests/test-mbrtowc.c: New file.
+
 	New module 'mbrtowc'.
 	* lib/wchar.in.h (mbstate_t): Override when the system does not have
 	mbsinit and mbrtowc.
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/modules/mbrtowc-tests	Fri Dec 19 03:33:05 2008 +0100
@@ -0,0 +1,31 @@
+Files:
+tests/test-mbrtowc1.sh
+tests/test-mbrtowc2.sh
+tests/test-mbrtowc3.sh
+tests/test-mbrtowc4.sh
+tests/test-mbrtowc.c
+m4/locale-fr.m4
+m4/locale-ja.m4
+m4/locale-zh.m4
+m4/codeset.m4
+
+Depends-on:
+mbsinit
+wctob
+
+configure.ac:
+gt_LOCALE_FR
+gt_LOCALE_FR_UTF8
+gt_LOCALE_JA
+gt_LOCALE_ZH_CN
+
+Makefile.am:
+TESTS += test-mbrtowc1.sh test-mbrtowc2.sh test-mbrtowc3.sh test-mbrtowc4.sh
+TESTS_ENVIRONMENT += \
+  EXEEXT='@EXEEXT@' \
+  LOCALE_FR='@LOCALE_FR@' \
+  LOCALE_FR_UTF8='@LOCALE_FR_UTF8@' \
+  LOCALE_JA='@LOCALE_JA@' \
+  LOCALE_ZH_CN='@LOCALE_ZH_CN@'
+check_PROGRAMS += test-mbrtowc
+
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/tests/test-mbrtowc.c	Fri Dec 19 03:33:05 2008 +0100
@@ -0,0 +1,328 @@
+/* Test of conversion of multibyte character to wide character.
+   Copyright (C) 2008 Free Software Foundation, Inc.
+
+   This program is free software: you can redistribute it and/or modify
+   it under the terms of the GNU General Public License as published by
+   the Free Software Foundation; either version 3 of the License, or
+   (at your option) any later version.
+
+   This program is distributed in the hope that it will be useful,
+   but WITHOUT ANY WARRANTY; without even the implied warranty of
+   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+   GNU General Public License for more details.
+
+   You should have received a copy of the GNU General Public License
+   along with this program.  If not, see <http://www.gnu.org/licenses/>.  */
+
+/* Written by Bruno Haible <bruno@clisp.org>, 2008.  */
+
+#include <config.h>
+
+#include <wchar.h>
+
+#include <locale.h>
+#include <stdio.h>
+#include <stdlib.h>
+#include <string.h>
+
+/* If EXPR is false, report FILE:LINE on stderr and abort.  */
+#define ASSERT(expr) \
+  do \
+    { \
+      if (expr) \
+        break; \
+      fprintf (stderr, "%s:%d: assertion failed\n", __FILE__, __LINE__); \
+      fflush (stderr); \
+      abort (); \
+    } \
+  while (0)
+
+/* Exercise mbrtowc.  The encoding-independent checks always run; then
+   argv[1][0] ('1'..'4') selects the checks for the encoding of the locale
+   taken from the environment.  Returns 0 when such a case completes and 1
+   otherwise (no or unknown argument, setlocale failure); ASSERT aborts.  */
+int
+main (int argc, char *argv[])
+{
+  mbstate_t state;
+  wchar_t wc;
+  size_t ret;
+
+  /* configure should already have checked that the locale is supported.  */
+  if (setlocale (LC_ALL, "") == NULL)
+    return 1;
+
+  /* Test zero-length input.  Here and below wc is preset to a sentinel; the
+     (wchar_t) cast keeps the sentinel comparisons valid on platforms where
+     wchar_t is narrower than int.  */
+  {
+    memset (&state, '\0', sizeof (mbstate_t));
+    wc = (wchar_t) 0xBADFACE;
+    ret = mbrtowc (&wc, "x", 0, &state);
+    ASSERT (ret == (size_t)(-2) || ret == 0);
+    ASSERT (mbsinit (&state));
+  }
+
+  /* Test NUL byte input.  */
+  {
+    memset (&state, '\0', sizeof (mbstate_t));
+    wc = (wchar_t) 0xBADFACE;
+    ret = mbrtowc (&wc, "", 1, &state);
+    ASSERT (ret == 0);
+    ASSERT (wc == 0);
+    ASSERT (mbsinit (&state));
+    ret = mbrtowc (NULL, "", 1, &state);
+    ASSERT (ret == 0);
+    ASSERT (mbsinit (&state));
+  }
+
+  /* Test single-byte input.  */
+  {
+    int c;
+    char buf[1];
+
+    memset (&state, '\0', sizeof (mbstate_t));
+    for (c = 0; c < 0x100; c++)
+      switch (c)
+	{
+	case '\t': case '\v': case '\f':
+	case ' ': case '!': case '"': case '#': case '%':
+	case '&': case '\'': case '(': case ')': case '*':
+	case '+': case ',': case '-': case '.': case '/':
+	case '0': case '1': case '2': case '3': case '4':
+	case '5': case '6': case '7': case '8': case '9':
+	case ':': case ';': case '<': case '=': case '>':
+	case '?':
+	case 'A': case 'B': case 'C': case 'D': case 'E':
+	case 'F': case 'G': case 'H': case 'I': case 'J':
+	case 'K': case 'L': case 'M': case 'N': case 'O':
+	case 'P': case 'Q': case 'R': case 'S': case 'T':
+	case 'U': case 'V': case 'W': case 'X': case 'Y':
+	case 'Z':
+	case '[': case '\\': case ']': case '^': case '_':
+	case 'a': case 'b': case 'c': case 'd': case 'e':
+	case 'f': case 'g': case 'h': case 'i': case 'j':
+	case 'k': case 'l': case 'm': case 'n': case 'o':
+	case 'p': case 'q': case 'r': case 's': case 't':
+	case 'u': case 'v': case 'w': case 'x': case 'y':
+	case 'z': case '{': case '|': case '}': case '~':
+	  /* c is in the ISO C "basic character set".  */
+	  buf[0] = c;
+	  wc = (wchar_t) 0xBADFACE;
+	  ret = mbrtowc (&wc, buf, 1, &state);
+	  ASSERT (ret == 1);
+	  ASSERT (wc == c);
+	  ASSERT (mbsinit (&state));
+	  ret = mbrtowc (NULL, buf, 1, &state);
+	  ASSERT (ret == 1);
+	  ASSERT (mbsinit (&state));
+	  break;
+	}
+  }
+
+  /* Test special calling convention, passing a NULL pointer.  */
+  {
+    memset (&state, '\0', sizeof (mbstate_t));
+    wc = (wchar_t) 0xBADFACE;
+    ret = mbrtowc (&wc, NULL, 5, &state);
+    ASSERT (ret == 0);
+    ASSERT (wc == (wchar_t) 0xBADFACE);
+    ASSERT (mbsinit (&state));
+  }
+
+  if (argc > 1)
+    switch (argv[1][0])
+      {
+      case '1':
+	/* Locale encoding is ISO-8859-1 or ISO-8859-15.  */
+	{
+	  char input[] = "B\374\337er"; /* "Büßer" */
+	  memset (&state, '\0', sizeof (mbstate_t));
+	  /* Bytes are zeroed once consumed so later calls cannot reuse them.  */
+
+	  wc = (wchar_t) 0xBADFACE;
+	  ret = mbrtowc (&wc, input, 1, &state);
+	  ASSERT (ret == 1);
+	  ASSERT (wc == 'B');
+	  ASSERT (mbsinit (&state));
+	  input[0] = '\0';
+
+	  wc = (wchar_t) 0xBADFACE;
+	  ret = mbrtowc (&wc, input + 1, 1, &state);
+	  ASSERT (ret == 1);
+	  ASSERT (wctob (wc) == (unsigned char) '\374');
+	  ASSERT (mbsinit (&state));
+	  input[1] = '\0';
+
+	  wc = (wchar_t) 0xBADFACE;
+	  ret = mbrtowc (&wc, input + 2, 3, &state);
+	  ASSERT (ret == 1);
+	  ASSERT (wctob (wc) == (unsigned char) '\337');
+	  ASSERT (mbsinit (&state));
+	  input[2] = '\0';
+
+	  wc = (wchar_t) 0xBADFACE;
+	  ret = mbrtowc (&wc, input + 3, 2, &state);
+	  ASSERT (ret == 1);
+	  ASSERT (wc == 'e');
+	  ASSERT (mbsinit (&state));
+	  input[3] = '\0';
+
+	  wc = (wchar_t) 0xBADFACE;
+	  ret = mbrtowc (&wc, input + 4, 1, &state);
+	  ASSERT (ret == 1);
+	  ASSERT (wc == 'r');
+	  ASSERT (mbsinit (&state));
+	}
+	return 0;
+
+      case '2':
+	/* Locale encoding is UTF-8.  */
+	{
+	  char input[] = "B\303\274\303\237er"; /* "Büßer" */
+	  memset (&state, '\0', sizeof (mbstate_t));
+
+	  wc = (wchar_t) 0xBADFACE;
+	  ret = mbrtowc (&wc, input, 1, &state);
+	  ASSERT (ret == 1);
+	  ASSERT (wc == 'B');
+	  ASSERT (mbsinit (&state));
+	  input[0] = '\0';
+
+	  wc = (wchar_t) 0xBADFACE;
+	  ret = mbrtowc (&wc, input + 1, 1, &state);
+	  ASSERT (ret == (size_t)(-2));
+	  ASSERT (wc == (wchar_t) 0xBADFACE);
+	  ASSERT (!mbsinit (&state));
+	  input[1] = '\0';
+
+	  wc = (wchar_t) 0xBADFACE;
+	  ret = mbrtowc (&wc, input + 2, 5, &state);
+	  ASSERT (ret == 1);
+	  ASSERT (wctob (wc) == EOF);
+	  ASSERT (mbsinit (&state));
+	  input[2] = '\0';
+
+	  wc = (wchar_t) 0xBADFACE;
+	  ret = mbrtowc (&wc, input + 3, 4, &state);
+	  ASSERT (ret == 2);
+	  ASSERT (wctob (wc) == EOF);
+	  ASSERT (mbsinit (&state));
+	  memset (input + 3, '\0', 2);
+
+	  wc = (wchar_t) 0xBADFACE;
+	  ret = mbrtowc (&wc, input + 5, 2, &state);
+	  ASSERT (ret == 1);
+	  ASSERT (wc == 'e');
+	  ASSERT (mbsinit (&state));
+	  input[5] = '\0';
+
+	  wc = (wchar_t) 0xBADFACE;
+	  ret = mbrtowc (&wc, input + 6, 1, &state);
+	  ASSERT (ret == 1);
+	  ASSERT (wc == 'r');
+	  ASSERT (mbsinit (&state));
+	}
+	return 0;
+
+      case '3':
+	/* Locale encoding is EUC-JP.  */
+	{
+	  char input[] = "B\217\253\344\217\251\316er"; /* "Büßer" */
+	  memset (&state, '\0', sizeof (mbstate_t));
+
+	  wc = (wchar_t) 0xBADFACE;
+	  ret = mbrtowc (&wc, input, 1, &state);
+	  ASSERT (ret == 1);
+	  ASSERT (wc == 'B');
+	  ASSERT (mbsinit (&state));
+	  input[0] = '\0';
+
+	  wc = (wchar_t) 0xBADFACE;
+	  ret = mbrtowc (&wc, input + 1, 1, &state);
+	  ASSERT (ret == (size_t)(-2));
+	  ASSERT (wc == (wchar_t) 0xBADFACE);
+	  ASSERT (!mbsinit (&state));
+	  input[1] = '\0';
+
+	  wc = (wchar_t) 0xBADFACE;
+	  ret = mbrtowc (&wc, input + 2, 7, &state);
+	  ASSERT (ret == 2);
+	  ASSERT (wctob (wc) == EOF);
+	  ASSERT (mbsinit (&state));
+	  memset (input + 2, '\0', 2);
+
+	  wc = (wchar_t) 0xBADFACE;
+	  ret = mbrtowc (&wc, input + 4, 5, &state);
+	  ASSERT (ret == 3);
+	  ASSERT (wctob (wc) == EOF);
+	  ASSERT (mbsinit (&state));
+	  memset (input + 4, '\0', 3);
+
+	  wc = (wchar_t) 0xBADFACE;
+	  ret = mbrtowc (&wc, input + 7, 2, &state);
+	  ASSERT (ret == 1);
+	  ASSERT (wc == 'e');
+	  ASSERT (mbsinit (&state));
+	  input[7] = '\0'; /* the 'e' just consumed */
+
+	  wc = (wchar_t) 0xBADFACE;
+	  ret = mbrtowc (&wc, input + 8, 1, &state);
+	  ASSERT (ret == 1);
+	  ASSERT (wc == 'r');
+	  ASSERT (mbsinit (&state));
+	}
+	return 0;
+
+      case '4':
+	/* Locale encoding is GB18030.  */
+	{
+	  char input[] = "B\250\271\201\060\211\070er"; /* "Büßer" */
+	  memset (&state, '\0', sizeof (mbstate_t));
+
+	  wc = (wchar_t) 0xBADFACE;
+	  ret = mbrtowc (&wc, input, 1, &state);
+	  ASSERT (ret == 1);
+	  ASSERT (wc == 'B');
+	  ASSERT (mbsinit (&state));
+	  input[0] = '\0';
+
+	  wc = (wchar_t) 0xBADFACE;
+	  ret = mbrtowc (&wc, input + 1, 1, &state);
+	  ASSERT (ret == (size_t)(-2));
+	  ASSERT (wc == (wchar_t) 0xBADFACE);
+	  ASSERT (!mbsinit (&state));
+	  input[1] = '\0';
+
+	  wc = (wchar_t) 0xBADFACE;
+	  ret = mbrtowc (&wc, input + 2, 7, &state);
+	  ASSERT (ret == 1);
+	  ASSERT (wctob (wc) == EOF);
+	  ASSERT (mbsinit (&state));
+	  input[2] = '\0';
+
+	  wc = (wchar_t) 0xBADFACE;
+	  ret = mbrtowc (&wc, input + 3, 6, &state);
+	  ASSERT (ret == 4);
+	  ASSERT (wctob (wc) == EOF);
+	  ASSERT (mbsinit (&state));
+	  memset (input + 3, '\0', 4);
+
+	  wc = (wchar_t) 0xBADFACE;
+	  ret = mbrtowc (&wc, input + 7, 2, &state);
+	  ASSERT (ret == 1);
+	  ASSERT (wc == 'e');
+	  ASSERT (mbsinit (&state));
+	  input[7] = '\0'; /* the 'e' just consumed */
+
+	  wc = (wchar_t) 0xBADFACE;
+	  ret = mbrtowc (&wc, input + 8, 1, &state);
+	  ASSERT (ret == 1);
+	  ASSERT (wc == 'r');
+	  ASSERT (mbsinit (&state));
+	}
+	return 0;
+      }
+
+  return 1;
+}
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/tests/test-mbrtowc1.sh	Fri Dec 19 03:33:05 2008 +0100
@@ -0,0 +1,15 @@
+#!/bin/sh
+
+# Run case 1 of test-mbrtowc in an ISO-8859-1 or ISO-8859-15 locale.
+: ${LOCALE_FR=fr_FR}
+if test "$LOCALE_FR" = none; then  # quoted in case the value is empty
+  if test -f /usr/bin/localedef; then
+    echo "Skipping test: no traditional french locale is installed"
+  else
+    echo "Skipping test: no traditional french locale is supported"
+  fi
+  exit 77  # Automake's exit status for a skipped test
+fi
+
+LC_ALL=$LOCALE_FR \
+./test-mbrtowc${EXEEXT} 1
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/tests/test-mbrtowc2.sh	Fri Dec 19 03:33:05 2008 +0100
@@ -0,0 +1,15 @@
+#!/bin/sh
+
+# Run case 2 of test-mbrtowc in a French UTF-8 locale, if one is installed.
+: ${LOCALE_FR_UTF8=fr_FR.UTF-8}
+if test "$LOCALE_FR_UTF8" = none; then  # quoted in case the value is empty
+  if test -f /usr/bin/localedef; then
+    echo "Skipping test: no french Unicode locale is installed"
+  else
+    echo "Skipping test: no french Unicode locale is supported"
+  fi
+  exit 77  # Automake's exit status for a skipped test
+fi
+
+LC_ALL=$LOCALE_FR_UTF8 \
+./test-mbrtowc${EXEEXT} 2
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/tests/test-mbrtowc3.sh	Fri Dec 19 03:33:05 2008 +0100
@@ -0,0 +1,15 @@
+#!/bin/sh
+
+# Run case 3 of test-mbrtowc in an EUC-JP locale, if one is installed.
+: ${LOCALE_JA=ja_JP}
+if test "$LOCALE_JA" = none; then  # quoted in case the value is empty
+  if test -f /usr/bin/localedef; then
+    echo "Skipping test: no traditional japanese locale is installed"
+  else
+    echo "Skipping test: no traditional japanese locale is supported"
+  fi
+  exit 77  # Automake's exit status for a skipped test
+fi
+
+LC_ALL=$LOCALE_JA \
+./test-mbrtowc${EXEEXT} 3
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/tests/test-mbrtowc4.sh	Fri Dec 19 03:33:05 2008 +0100
@@ -0,0 +1,15 @@
+#!/bin/sh
+
+# Run case 4 of test-mbrtowc in a GB18030 locale, if one is installed.
+: ${LOCALE_ZH_CN=zh_CN}
+if test "$LOCALE_ZH_CN" = none; then  # quoted in case the value is empty
+  if test -f /usr/bin/localedef; then
+    echo "Skipping test: no transitional chinese locale is installed"
+  else
+    echo "Skipping test: no transitional chinese locale is supported"
+  fi
+  exit 77  # Automake's exit status for a skipped test
+fi
+
+LC_ALL=$LOCALE_ZH_CN \
+./test-mbrtowc${EXEEXT} 4