view lib/unictype/blocks.h @ 29162:c7c2e5573f14

Unicode character classification functions.
author Bruno Haible <bruno@clisp.org>
date Tue, 13 Nov 2007 00:15:53 +0100
parents
children 5bfb3f92b613
line wrap: on
line source

/* DO NOT EDIT! GENERATED AUTOMATICALLY! */
/* Unicode blocks.  */
/* Generated automatically by gen-ctype.c for Unicode 5.0.0.  */
static const uc_block_t blocks[] =
{
  { 0x0000, 0x007F, "Basic Latin" },
  { 0x0080, 0x00FF, "Latin-1 Supplement" },
  { 0x0100, 0x017F, "Latin Extended-A" },
  { 0x0180, 0x024F, "Latin Extended-B" },
  { 0x0250, 0x02AF, "IPA Extensions" },
  { 0x02B0, 0x02FF, "Spacing Modifier Letters" },
  { 0x0300, 0x036F, "Combining Diacritical Marks" },
  { 0x0370, 0x03FF, "Greek and Coptic" },
  { 0x0400, 0x04FF, "Cyrillic" },
  { 0x0500, 0x052F, "Cyrillic Supplement" },
  { 0x0530, 0x058F, "Armenian" },
  { 0x0590, 0x05FF, "Hebrew" },
  { 0x0600, 0x06FF, "Arabic" },
  { 0x0700, 0x074F, "Syriac" },
  { 0x0750, 0x077F, "Arabic Supplement" },
  { 0x0780, 0x07BF, "Thaana" },
  { 0x07C0, 0x07FF, "NKo" },
  { 0x0900, 0x097F, "Devanagari" },
  { 0x0980, 0x09FF, "Bengali" },
  { 0x0A00, 0x0A7F, "Gurmukhi" },
  { 0x0A80, 0x0AFF, "Gujarati" },
  { 0x0B00, 0x0B7F, "Oriya" },
  { 0x0B80, 0x0BFF, "Tamil" },
  { 0x0C00, 0x0C7F, "Telugu" },
  { 0x0C80, 0x0CFF, "Kannada" },
  { 0x0D00, 0x0D7F, "Malayalam" },
  { 0x0D80, 0x0DFF, "Sinhala" },
  { 0x0E00, 0x0E7F, "Thai" },
  { 0x0E80, 0x0EFF, "Lao" },
  { 0x0F00, 0x0FFF, "Tibetan" },
  { 0x1000, 0x109F, "Myanmar" },
  { 0x10A0, 0x10FF, "Georgian" },
  { 0x1100, 0x11FF, "Hangul Jamo" },
  { 0x1200, 0x137F, "Ethiopic" },
  { 0x1380, 0x139F, "Ethiopic Supplement" },
  { 0x13A0, 0x13FF, "Cherokee" },
  { 0x1400, 0x167F, "Unified Canadian Aboriginal Syllabics" },
  { 0x1680, 0x169F, "Ogham" },
  { 0x16A0, 0x16FF, "Runic" },
  { 0x1700, 0x171F, "Tagalog" },
  { 0x1720, 0x173F, "Hanunoo" },
  { 0x1740, 0x175F, "Buhid" },
  { 0x1760, 0x177F, "Tagbanwa" },
  { 0x1780, 0x17FF, "Khmer" },
  { 0x1800, 0x18AF, "Mongolian" },
  { 0x1900, 0x194F, "Limbu" },
  { 0x1950, 0x197F, "Tai Le" },
  { 0x1980, 0x19DF, "New Tai Lue" },
  { 0x19E0, 0x19FF, "Khmer Symbols" },
  { 0x1A00, 0x1A1F, "Buginese" },
  { 0x1B00, 0x1B7F, "Balinese" },
  { 0x1D00, 0x1D7F, "Phonetic Extensions" },
  { 0x1D80, 0x1DBF, "Phonetic Extensions Supplement" },
  { 0x1DC0, 0x1DFF, "Combining Diacritical Marks Supplement" },
  { 0x1E00, 0x1EFF, "Latin Extended Additional" },
  { 0x1F00, 0x1FFF, "Greek Extended" },
  { 0x2000, 0x206F, "General Punctuation" },
  { 0x2070, 0x209F, "Superscripts and Subscripts" },
  { 0x20A0, 0x20CF, "Currency Symbols" },
  { 0x20D0, 0x20FF, "Combining Diacritical Marks for Symbols" },
  { 0x2100, 0x214F, "Letterlike Symbols" },
  { 0x2150, 0x218F, "Number Forms" },
  { 0x2190, 0x21FF, "Arrows" },
  { 0x2200, 0x22FF, "Mathematical Operators" },
  { 0x2300, 0x23FF, "Miscellaneous Technical" },
  { 0x2400, 0x243F, "Control Pictures" },
  { 0x2440, 0x245F, "Optical Character Recognition" },
  { 0x2460, 0x24FF, "Enclosed Alphanumerics" },
  { 0x2500, 0x257F, "Box Drawing" },
  { 0x2580, 0x259F, "Block Elements" },
  { 0x25A0, 0x25FF, "Geometric Shapes" },
  { 0x2600, 0x26FF, "Miscellaneous Symbols" },
  { 0x2700, 0x27BF, "Dingbats" },
  { 0x27C0, 0x27EF, "Miscellaneous Mathematical Symbols-A" },
  { 0x27F0, 0x27FF, "Supplemental Arrows-A" },
  { 0x2800, 0x28FF, "Braille Patterns" },
  { 0x2900, 0x297F, "Supplemental Arrows-B" },
  { 0x2980, 0x29FF, "Miscellaneous Mathematical Symbols-B" },
  { 0x2A00, 0x2AFF, "Supplemental Mathematical Operators" },
  { 0x2B00, 0x2BFF, "Miscellaneous Symbols and Arrows" },
  { 0x2C00, 0x2C5F, "Glagolitic" },
  { 0x2C60, 0x2C7F, "Latin Extended-C" },
  { 0x2C80, 0x2CFF, "Coptic" },
  { 0x2D00, 0x2D2F, "Georgian Supplement" },
  { 0x2D30, 0x2D7F, "Tifinagh" },
  { 0x2D80, 0x2DDF, "Ethiopic Extended" },
  { 0x2E00, 0x2E7F, "Supplemental Punctuation" },
  { 0x2E80, 0x2EFF, "CJK Radicals Supplement" },
  { 0x2F00, 0x2FDF, "Kangxi Radicals" },
  { 0x2FF0, 0x2FFF, "Ideographic Description Characters" },
  { 0x3000, 0x303F, "CJK Symbols and Punctuation" },
  { 0x3040, 0x309F, "Hiragana" },
  { 0x30A0, 0x30FF, "Katakana" },
  { 0x3100, 0x312F, "Bopomofo" },
  { 0x3130, 0x318F, "Hangul Compatibility Jamo" },
  { 0x3190, 0x319F, "Kanbun" },
  { 0x31A0, 0x31BF, "Bopomofo Extended" },
  { 0x31C0, 0x31EF, "CJK Strokes" },
  { 0x31F0, 0x31FF, "Katakana Phonetic Extensions" },
  { 0x3200, 0x32FF, "Enclosed CJK Letters and Months" },
  { 0x3300, 0x33FF, "CJK Compatibility" },
  { 0x3400, 0x4DBF, "CJK Unified Ideographs Extension A" },
  { 0x4DC0, 0x4DFF, "Yijing Hexagram Symbols" },
  { 0x4E00, 0x9FFF, "CJK Unified Ideographs" },
  { 0xA000, 0xA48F, "Yi Syllables" },
  { 0xA490, 0xA4CF, "Yi Radicals" },
  { 0xA700, 0xA71F, "Modifier Tone Letters" },
  { 0xA720, 0xA7FF, "Latin Extended-D" },
  { 0xA800, 0xA82F, "Syloti Nagri" },
  { 0xA840, 0xA87F, "Phags-pa" },
  { 0xAC00, 0xD7AF, "Hangul Syllables" },
  { 0xD800, 0xDB7F, "High Surrogates" },
  { 0xDB80, 0xDBFF, "High Private Use Surrogates" },
  { 0xDC00, 0xDFFF, "Low Surrogates" },
  { 0xE000, 0xF8FF, "Private Use Area" },
  { 0xF900, 0xFAFF, "CJK Compatibility Ideographs" },
  { 0xFB00, 0xFB4F, "Alphabetic Presentation Forms" },
  { 0xFB50, 0xFDFF, "Arabic Presentation Forms-A" },
  { 0xFE00, 0xFE0F, "Variation Selectors" },
  { 0xFE10, 0xFE1F, "Vertical Forms" },
  { 0xFE20, 0xFE2F, "Combining Half Marks" },
  { 0xFE30, 0xFE4F, "CJK Compatibility Forms" },
  { 0xFE50, 0xFE6F, "Small Form Variants" },
  { 0xFE70, 0xFEFF, "Arabic Presentation Forms-B" },
  { 0xFF00, 0xFFEF, "Halfwidth and Fullwidth Forms" },
  { 0xFFF0, 0xFFFF, "Specials" },
  { 0x10000, 0x1007F, "Linear B Syllabary" },
  { 0x10080, 0x100FF, "Linear B Ideograms" },
  { 0x10100, 0x1013F, "Aegean Numbers" },
  { 0x10140, 0x1018F, "Ancient Greek Numbers" },
  { 0x10300, 0x1032F, "Old Italic" },
  { 0x10330, 0x1034F, "Gothic" },
  { 0x10380, 0x1039F, "Ugaritic" },
  { 0x103A0, 0x103DF, "Old Persian" },
  { 0x10400, 0x1044F, "Deseret" },
  { 0x10450, 0x1047F, "Shavian" },
  { 0x10480, 0x104AF, "Osmanya" },
  { 0x10800, 0x1083F, "Cypriot Syllabary" },
  { 0x10900, 0x1091F, "Phoenician" },
  { 0x10A00, 0x10A5F, "Kharoshthi" },
  { 0x12000, 0x123FF, "Cuneiform" },
  { 0x12400, 0x1247F, "Cuneiform Numbers and Punctuation" },
  { 0x1D000, 0x1D0FF, "Byzantine Musical Symbols" },
  { 0x1D100, 0x1D1FF, "Musical Symbols" },
  { 0x1D200, 0x1D24F, "Ancient Greek Musical Notation" },
  { 0x1D300, 0x1D35F, "Tai Xuan Jing Symbols" },
  { 0x1D360, 0x1D37F, "Counting Rod Numerals" },
  { 0x1D400, 0x1D7FF, "Mathematical Alphanumeric Symbols" },
  { 0x20000, 0x2A6DF, "CJK Unified Ideographs Extension B" },
  { 0x2F800, 0x2FA1F, "CJK Compatibility Ideographs Supplement" },
  { 0xE0000, 0xE007F, "Tags" },
  { 0xE0100, 0xE01EF, "Variation Selectors Supplement" },
  { 0xF0000, 0xFFFFF, "Supplementary Private Use Area-A" },
  { 0x100000, 0x10FFFF, "Supplementary Private Use Area-B" }
};
#define blocks_level1_shift 8
#define blocks_level1_threshold 0x30000
static const uint8_t blocks_level1[768 * 2] =
{
    0,   2,
    2,   4,
    3,   6,
    6,   8,
    8,   9,
    9,  12,
   12,  13,
   13,  17,
   17,  17,
   17,  19,
   19,  21,
   21,  23,
   23,  25,
   25,  27,
   27,  29,
   29,  30,
   30,  32,
   32,  33,
   33,  34,
   33,  36,
   36,  37,
   36,  37,
   36,  39,
   39,  44,
   44,  45,
   45,  49,
   49,  50,
   50,  51,
   51,  51,
   51,  54,
   54,  55,
   55,  56,
   56,  60,
   60,  63,
   63,  64,
   64,  65,
   65,  68,
   68,  71,
   71,  72,
   72,  75,
   75,  76,
   76,  78,
   78,  79,
   79,  80,
   80,  83,
   83,  86,
   86,  88,
   88,  90,
   90,  93,
   93,  99,
   99, 100,
  100, 101,
  101, 102,
  101, 102,
  101, 102,
  101, 102,
  101, 102,
  101, 102,
  101, 102,
  101, 102,
  101, 102,
  101, 102,
  101, 102,
  101, 102,
  101, 102,
  101, 102,
  101, 102,
  101, 102,
  101, 102,
  101, 102,
  101, 102,
  101, 102,
  101, 102,
  101, 102,
  101, 102,
  101, 102,
  101, 102,
  101, 103,
  103, 104,
  103, 104,
  103, 104,
  103, 104,
  103, 104,
  103, 104,
  103, 104,
  103, 104,
  103, 104,
  103, 104,
  103, 104,
  103, 104,
  103, 104,
  103, 104,
  103, 104,
  103, 104,
  103, 104,
  103, 104,
  103, 104,
  103, 104,
  103, 104,
  103, 104,
  103, 104,
  103, 104,
  103, 104,
  103, 104,
  103, 104,
  103, 104,
  103, 104,
  103, 104,
  103, 104,
  103, 104,
  103, 104,
  103, 104,
  103, 104,
  103, 104,
  103, 104,
  103, 104,
  103, 104,
  103, 104,
  103, 104,
  103, 104,
  103, 104,
  103, 104,
  103, 104,
  103, 104,
  103, 104,
  103, 104,
  103, 104,
  103, 104,
  103, 104,
  103, 104,
  103, 104,
  103, 104,
  103, 104,
  103, 104,
  103, 104,
  103, 104,
  103, 104,
  103, 104,
  103, 104,
  103, 104,
  103, 104,
  103, 104,
  103, 104,
  103, 104,
  103, 104,
  103, 104,
  103, 104,
  103, 104,
  103, 104,
  103, 104,
  103, 104,
  103, 104,
  103, 104,
  103, 104,
  103, 104,
  103, 104,
  103, 104,
  103, 104,
  103, 104,
  103, 104,
  104, 105,
  104, 105,
  104, 105,
  104, 105,
  104, 106,
  106, 106,
  106, 106,
  106, 108,
  108, 110,
  110, 110,
  110, 110,
  110, 110,
  110, 111,
  110, 111,
  110, 111,
  110, 111,
  110, 111,
  110, 111,
  110, 111,
  110, 111,
  110, 111,
  110, 111,
  110, 111,
  110, 111,
  110, 111,
  110, 111,
  110, 111,
  110, 111,
  110, 111,
  110, 111,
  110, 111,
  110, 111,
  110, 111,
  110, 111,
  110, 111,
  110, 111,
  110, 111,
  110, 111,
  110, 111,
  110, 111,
  110, 111,
  110, 111,
  110, 111,
  110, 111,
  110, 111,
  110, 111,
  110, 111,
  110, 111,
  110, 111,
  110, 111,
  110, 111,
  110, 111,
  110, 111,
  110, 111,
  110, 111,
  110, 111,
  111, 112,
  111, 112,
  111, 112,
  111, 113,
  113, 114,
  113, 114,
  113, 114,
  113, 114,
  114, 115,
  114, 115,
  114, 115,
  114, 115,
  114, 115,
  114, 115,
  114, 115,
  114, 115,
  114, 115,
  114, 115,
  114, 115,
  114, 115,
  114, 115,
  114, 115,
  114, 115,
  114, 115,
  114, 115,
  114, 115,
  114, 115,
  114, 115,
  114, 115,
  114, 115,
  114, 115,
  114, 115,
  114, 115,
  115, 116,
  115, 116,
  116, 118,
  117, 118,
  117, 118,
  118, 124,
  124, 126,
  126, 128,
  128, 130,
  130, 130,
  130, 134,
  134, 137,
  137, 137,
  137, 137,
  137, 137,
  137, 138,
  138, 139,
  139, 140,
  140, 140,
  140, 140,
  140, 140,
  140, 140,
  140, 140,
  140, 140,
  140, 140,
  140, 140,
  140, 140,
  140, 140,
  140, 140,
  140, 140,
  140, 140,
  140, 140,
  140, 140,
  140, 140,
  140, 140,
  140, 140,
  140, 140,
  140, 140,
  140, 140,
  140, 141,
  140, 141,
  140, 141,
  140, 141,
  141, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 142,
  142, 143,
  143, 144,
  144, 145,
  145, 147,
  147, 148,
  147, 148,
  147, 148,
  147, 148,
  148, 148,
  148, 148,
  148, 148,
  148, 148,
  148, 148,
  148, 148,
  148, 148,
  148, 148,
  148, 148,
  148, 148,
  148, 148,
  148, 148,
  148, 148,
  148, 148,
  148, 148,
  148, 148,
  148, 148,
  148, 148,
  148, 148,
  148, 148,
  148, 148,
  148, 148,
  148, 148,
  148, 148,
  148, 148,
  148, 148,
  148, 148,
  148, 148,
  148, 148,
  148, 148,
  148, 148,
  148, 148,
  148, 148,
  148, 148,
  148, 148,
  148, 148,
  148, 148,
  148, 148,
  148, 148,
  148, 148,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  148, 149,
  149, 149,
  149, 149,
  149, 149,
  149, 149,
  149, 149,
  149, 149,
  149, 149,
  149, 149,
  149, 149,
  149, 149,
  149, 149,
  149, 149,
  149, 149,
  149, 149,
  149, 149,
  149, 149,
  149, 149,
  149, 149,
  149, 149,
  149, 149,
  149, 149,
  149, 149,
  149, 149,
  149, 149,
  149, 149,
  149, 149,
  149, 149,
  149, 149,
  149, 149,
  149, 149,
  149, 149,
  149, 149,
  149, 149,
  149, 149,
  149, 149,
  149, 149,
  149, 149,
  149, 149,
  149, 149,
  149, 149,
  149, 149,
  149, 149,
  149, 149,
  149, 149,
  149, 149,
  149, 149,
  149, 149,
  149, 149,
  149, 149,
  149, 149,
  149, 149,
  149, 149,
  149, 149,
  149, 149,
  149, 149,
  149, 149,
  149, 149,
  149, 149,
  149, 149,
  149, 149,
  149, 149,
  149, 149,
  149, 149,
  149, 149,
  149, 149,
  149, 149,
  149, 149,
  149, 149,
  149, 149,
  149, 149,
  149, 149,
  149, 149,
  149, 149,
  149, 149,
  149, 149,
  149, 149,
  149, 149,
  149, 149,
  149, 149,
  149, 149,
  149, 149,
  149, 150,
  149, 150,
  149, 150,
  150, 150,
  150, 150,
  150, 150,
  150, 150,
  150, 150
};
#define blocks_upper_first_index 150
#define blocks_upper_last_index 154