changeset 11135:8ffa77feaa58

New module 'uniwbrk/table'.
author Bruno Haible <bruno@clisp.org>
date Sun, 08 Feb 2009 20:54:44 +0100
parents f08e03828662
children 096d0a714fac
files ChangeLog lib/uniwbrk/wbrktable.c lib/uniwbrk/wbrktable.h modules/uniwbrk/table
diffstat 4 files changed, 97 insertions(+), 0 deletions(-) [+]
line wrap: on
line diff
--- a/ChangeLog	Sun Feb 08 20:52:49 2009 +0100
+++ b/ChangeLog	Sun Feb 08 20:54:44 2009 +0100
@@ -1,5 +1,10 @@
 2009-02-08  Bruno Haible  <bruno@clisp.org>
 
+	New module 'uniwbrk/table'.
+	* modules/uniwbrk/table: New file.
+	* lib/uniwbrk/wbrktable.h: New file.
+	* lib/uniwbrk/wbrktable.c: New file.
+
 	New module 'uniwbrk/wordbreak-property'.
 	* modules/uniwbrk/wordbreak-property: New file.
 	* lib/uniwbrk/wordbreak-property.c: New file.
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/lib/uniwbrk/wbrktable.c	Sun Feb 08 20:54:44 2009 +0100
@@ -0,0 +1,52 @@
+/* Word break auxiliary table.
+   Copyright (C) 2009 Free Software Foundation, Inc.
+   Written by Bruno Haible <bruno@clisp.org>, 2009.
+
+   This program is free software: you can redistribute it and/or modify it
+   under the terms of the GNU Lesser General Public License as published
+   by the Free Software Foundation; either version 3 of the License, or
+   (at your option) any later version.
+
+   This program is distributed in the hope that it will be useful,
+   but WITHOUT ANY WARRANTY; without even the implied warranty of
+   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
+   Lesser General Public License for more details.
+
+   You should have received a copy of the GNU Lesser General Public License
+   along with this program.  If not, see <http://www.gnu.org/licenses/>.  */
+
+#include <config.h>
+
+/* Specification.  */
+#include "wbrktable.h"
+
+/* uniwbrk_table[last][current] encodes the following rules (see UAX #29).
+   An entry is 0 where a listed rule applies (×, no break), and 1 otherwise.
+		       last         current
+
+			 ALetter × ALetter                         (WB5)
+			 ALetter × Numeric                         (WB9)
+			 Numeric × ALetter                         (WB10)
+			 Numeric × Numeric                         (WB8)
+			Katakana × Katakana                        (WB13)
+  (ALetter | Numeric | Katakana) × ExtendNumLet                    (WB13a)
+		    ExtendNumLet × ExtendNumLet                    (WB13a)
+		    ExtendNumLet × (ALetter | Numeric | Katakana)  (WB13b)
+ */
+
+const unsigned char uniwbrk_table[10][8] =
+{        /* current:      OTHER            MIDNUMLET         NUMERIC         */
+	 /*                   KATAKANA           MIDLETTER      EXTENDNUMLET */
+	 /*                          ALETTER            MIDNUM               */
+  /* last (row index); the 8 columns are the 'current' values named above */
+  /* WBP_OTHER */        {  1,    1,    1,    1,    1,    1,    1,    1 },
+  /* WBP_KATAKANA */     {  1,    0,    1,    1,    1,    1,    1,    0 },
+  /* WBP_ALETTER */      {  1,    1,    0,    1,    1,    1,    0,    0 },
+  /* WBP_MIDNUMLET */    {  1,    1,    1,    1,    1,    1,    1,    1 },
+  /* WBP_MIDLETTER */    {  1,    1,    1,    1,    1,    1,    1,    1 },
+  /* WBP_MIDNUM */       {  1,    1,    1,    1,    1,    1,    1,    1 },
+  /* WBP_NUMERIC */      {  1,    1,    0,    1,    1,    1,    0,    0 },
+  /* WBP_EXTENDNUMLET */ {  1,    0,    0,    1,    1,    1,    0,    0 },
+  /* WBP_EXTEND */       {  1,    1,    1,    1,    1,    1,    1,    1 },
+  /* WBP_FORMAT */       {  1,    1,    1,    1,    1,    1,    1,    1 }
+};
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/lib/uniwbrk/wbrktable.h	Sun Feb 08 20:54:44 2009 +0100
@@ -0,0 +1,18 @@
+/* Word break auxiliary table.
+   Copyright (C) 2009 Free Software Foundation, Inc.
+   Written by Bruno Haible <bruno@clisp.org>, 2009.
+
+   This program is free software: you can redistribute it and/or modify it
+   under the terms of the GNU Lesser General Public License as published
+   by the Free Software Foundation; either version 3 of the License, or
+   (at your option) any later version.
+
+   This program is distributed in the hope that it will be useful,
+   but WITHOUT ANY WARRANTY; without even the implied warranty of
+   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
+   Lesser General Public License for more details.
+
+   You should have received a copy of the GNU Lesser General Public License
+   along with this program.  If not, see <http://www.gnu.org/licenses/>.  */
+
+extern const unsigned char uniwbrk_table[10][8]; /* indexed [last][current] */
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/modules/uniwbrk/table	Sun Feb 08 20:54:44 2009 +0100
@@ -0,0 +1,22 @@
+Description:
+
+Files:
+lib/uniwbrk/wbrktable.h
+lib/uniwbrk/wbrktable.c
+
+Depends-on:
+
+configure.ac:
+
+Makefile.am:
+lib_SOURCES += uniwbrk/wbrktable.c
+
+Include:
+"uniwbrk/wbrktable.h"
+
+License:
+LGPL
+
+Maintainer:
+Bruno Haible
+