1 
2 #ifdef DEBUG
3 #include <stdio.h>
4 #endif
5 
6 #include "uniblock.h"
7 
8 struct ublock {
9   long min, max, cjk;
10 };
11 
12 /*
13  References:
14  [1] http://www.unicode.org/Public/UNIDATA/Blocks.txt
15         Blocks-7.0.0.txt
16         Date: 2014-04-03, 23:23:00 GMT [RP, KW]
17  [2] CMap files
18      http://sourceforge.net/adobe/cmap/wiki/Home/
19      cmapresources_cns1-6.tar.z     Adobe-CNS1-6 materials
20         cid2code.txt (Version 10/25/2010)
21      cmapresources_gb1-5.tar.z      Adobe-GB1-5 materials
22         cid2code.txt (Version 10/29/2010)
23      cmapresources_japan1-6.tar.z   Adobe-Japan1-6 materials
24         cid2code.txt (Version 08/13/2012)
25      cmapresources_korean1-2.tar.z  Adobe-Korea1-2 materials
26         cid2code.txt (Version 01/31/2012)
27 */
28 
29 static struct ublock ublock_data[] = {
30   {0x0000, 0x007F, ENTRY_GCJK}, /* Basic Latin */
31   {0x0080, 0x00FF, ENTRY_GCJK}, /* Latin-1 Supplement */
32   {0x0100, 0x017F, ENTRY_GCJK}, /* Latin Extended-A */
33   {0x0180, 0x024F, ENTRY_GCJ }, /* Latin Extended-B */
34   {0x0250, 0x02AF, ENTRY_GCJ }, /* IPA Extensions */
35   {0x02B0, 0x02FF, ENTRY_GCJK}, /* Spacing Modifier Letters */
36   {0x0300, 0x036F, ENTRY_CJ  }, /* Combining Diacritical Marks */
37   {0x0370, 0x03FF, ENTRY_GCJK}, /* Greek and Coptic */
38   {0x0400, 0x04FF, ENTRY_GCJK}, /* Cyrillic */
39   {0x0500, 0x052F, ENTRY_NO  }, /* Cyrillic Supplement */
40   {0x0530, 0x058F, ENTRY_NO  }, /* Armenian */
41   {0x0590, 0x05FF, ENTRY_NO  }, /* Hebrew */
42   {0x0600, 0x06FF, ENTRY_NO  }, /* Arabic */
43   {0x0700, 0x074F, ENTRY_NO  }, /* Syriac */
44   {0x0750, 0x077F, ENTRY_NO  }, /* Arabic Supplement */
45   {0x0780, 0x07BF, ENTRY_NO  }, /* Thaana */
46   {0x07C0, 0x07FF, ENTRY_NO  }, /* NKo */
47   {0x0800, 0x083F, ENTRY_NO  }, /* Samaritan */
48   {0x0840, 0x085F, ENTRY_NO  }, /* Mandaic */
49   {0x08A0, 0x08FF, ENTRY_NO  }, /* Arabic Extended-A */
50   {0x0900, 0x097F, ENTRY_NO  }, /* Devanagari */
51   {0x0980, 0x09FF, ENTRY_NO  }, /* Bengali */
52   {0x0A00, 0x0A7F, ENTRY_NO  }, /* Gurmukhi */
53   {0x0A80, 0x0AFF, ENTRY_NO  }, /* Gujarati */
54   {0x0B00, 0x0B7F, ENTRY_NO  }, /* Oriya */
55   {0x0B80, 0x0BFF, ENTRY_NO  }, /* Tamil */
56   {0x0C00, 0x0C7F, ENTRY_NO  }, /* Telugu */
57   {0x0C80, 0x0CFF, ENTRY_NO  }, /* Kannada */
58   {0x0D00, 0x0D7F, ENTRY_NO  }, /* Malayalam */
59   {0x0D80, 0x0DFF, ENTRY_NO  }, /* Sinhala */
60   {0x0E00, 0x0E7F, ENTRY_NO  }, /* Thai */
61   {0x0E80, 0x0EFF, ENTRY_NO  }, /* Lao */
62   {0x0F00, 0x0FFF, ENTRY_NO  }, /* Tibetan */
63   {0x1000, 0x109F, ENTRY_NO  }, /* Myanmar */
64   {0x10A0, 0x10FF, ENTRY_NO  }, /* Georgian */
65   {0x1100, 0x11FF, ENTRY_K   }, /* Hangul Jamo */
66   {0x1200, 0x137F, ENTRY_NO  }, /* Ethiopic */
67   {0x1380, 0x139F, ENTRY_NO  }, /* Ethiopic Supplement */
68   {0x13A0, 0x13FF, ENTRY_NO  }, /* Cherokee */
69   {0x1400, 0x167F, ENTRY_NO  }, /* Unified Canadian Aboriginal Syllabics */
70   {0x1680, 0x169F, ENTRY_NO  }, /* Ogham */
71   {0x16A0, 0x16FF, ENTRY_NO  }, /* Runic */
72   {0x1700, 0x171F, ENTRY_NO  }, /* Tagalog */
73   {0x1720, 0x173F, ENTRY_NO  }, /* Hanunoo */
74   {0x1740, 0x175F, ENTRY_NO  }, /* Buhid */
75   {0x1760, 0x177F, ENTRY_NO  }, /* Tagbanwa */
76   {0x1780, 0x17FF, ENTRY_NO  }, /* Khmer */
77   {0x1800, 0x18AF, ENTRY_NO  }, /* Mongolian */
78   {0x18B0, 0x18FF, ENTRY_NO  }, /* Unified Canadian Aboriginal Syllabics Extended */
79   {0x1900, 0x194F, ENTRY_NO  }, /* Limbu */
80   {0x1950, 0x197F, ENTRY_NO  }, /* Tai Le */
81   {0x1980, 0x19DF, ENTRY_NO  }, /* New Tai Lue */
82   {0x19E0, 0x19FF, ENTRY_NO  }, /* Khmer Symbols */
83   {0x1A00, 0x1A1F, ENTRY_NO  }, /* Buginese */
84   {0x1A20, 0x1AAF, ENTRY_NO  }, /* Tai Tham */
85   {0x1AB0, 0x1AFF, ENTRY_NO  }, /* Combining Diacritical Marks Extended */
86   {0x1B00, 0x1B7F, ENTRY_NO  }, /* Balinese */
87   {0x1B80, 0x1BBF, ENTRY_NO  }, /* Sundanese */
88   {0x1BC0, 0x1BFF, ENTRY_NO  }, /* Batak */
89   {0x1C00, 0x1C4F, ENTRY_NO  }, /* Lepcha */
90   {0x1C50, 0x1C7F, ENTRY_NO  }, /* Ol Chiki */
91   {0x1CC0, 0x1CCF, ENTRY_NO  }, /* Sundanese Supplement */
92   {0x1CD0, 0x1CFF, ENTRY_NO  }, /* Vedic Extensions */
93   {0x1D00, 0x1D7F, ENTRY_NO  }, /* Phonetic Extensions */
94   {0x1D80, 0x1DBF, ENTRY_NO  }, /* Phonetic Extensions Supplement */
95   {0x1DC0, 0x1DFF, ENTRY_NO  }, /* Combining Diacritical Marks Supplement */
96   {0x1E00, 0x1EFF, ENTRY_GCJ }, /* Latin Extended Additional */
97   {0x1F00, 0x1FFF, ENTRY_J   }, /* Greek Extended */
98   {0x2000, 0x206F, ENTRY_GCJK}, /* General Punctuation */
99   {0x2070, 0x209F, ENTRY_JK  }, /* Superscripts and Subscripts */
100   {0x20A0, 0x20CF, ENTRY_GCJK}, /* Currency Symbols */
101   {0x20D0, 0x20FF, ENTRY_J   }, /* Combining Diacritical Marks for Symbols */
102   {0x2100, 0x214F, ENTRY_GCJK}, /* Letterlike Symbols */
103   {0x2150, 0x218F, ENTRY_GCJK}, /* Number Forms */
104   {0x2190, 0x21FF, ENTRY_GCJK}, /* Arrows */
105   {0x2200, 0x22FF, ENTRY_GCJK}, /* Mathematical Operators */
106   {0x2300, 0x23FF, ENTRY_GCJK}, /* Miscellaneous Technical */
107   {0x2400, 0x243F, ENTRY_CJ  }, /* Control Pictures */
108   {0x2440, 0x245F, ENTRY_NO  }, /* Optical Character Recognition */
109   {0x2460, 0x24FF, ENTRY_GCJK}, /* Enclosed Alphanumerics */
110   {0x2500, 0x257F, ENTRY_GCJK}, /* Box Drawing */
111   {0x2580, 0x259F, ENTRY_GCJK}, /* Block Elements */
112   {0x25A0, 0x25FF, ENTRY_GCJK}, /* Geometric Shapes */
113   {0x2600, 0x26FF, ENTRY_GCJK}, /* Miscellaneous Symbols */
114   {0x2700, 0x27BF, ENTRY_CJK }, /* Dingbats */
115   {0x27C0, 0x27EF, ENTRY_NO  }, /* Miscellaneous Mathematical Symbols-A */
116   {0x27F0, 0x27FF, ENTRY_NO  }, /* Supplemental Arrows-A */
117   {0x2800, 0x28FF, ENTRY_NO  }, /* Braille Patterns */
118   {0x2900, 0x297F, ENTRY_J   }, /* Supplemental Arrows-B */
119   {0x2980, 0x29FF, ENTRY_J   }, /* Miscellaneous Mathematical Symbols-B */
120   {0x2A00, 0x2AFF, ENTRY_NO  }, /* Supplemental Mathematical Operators */
121   {0x2B00, 0x2BFF, ENTRY_J   }, /* Miscellaneous Symbols and Arrows */
122   {0x2C00, 0x2C5F, ENTRY_NO  }, /* Glagolitic */
123   {0x2C60, 0x2C7F, ENTRY_NO  }, /* Latin Extended-C */
124   {0x2C80, 0x2CFF, ENTRY_NO  }, /* Coptic */
125   {0x2D00, 0x2D2F, ENTRY_NO  }, /* Georgian Supplement */
126   {0x2D30, 0x2D7F, ENTRY_NO  }, /* Tifinagh */
127   {0x2D80, 0x2DDF, ENTRY_NO  }, /* Ethiopic Extended */
128   {0x2DE0, 0x2DFF, ENTRY_NO  }, /* Cyrillic Extended-A */
129   {0x2E00, 0x2E7F, ENTRY_NO  }, /* Supplemental Punctuation */
130   {0x2E80, 0x2EFF, ENTRY_GCJ }, /* CJK Radicals Supplement */
131   {0x2F00, 0x2FDF, ENTRY_GCJK}, /* Kangxi Radicals */
132   {0x2FF0, 0x2FFF, ENTRY_G   }, /* Ideographic Description Characters */
133   {0x3000, 0x303F, ENTRY_GCJK}, /* CJK Symbols and Punctuation */
134   {0x3040, 0x309F, ENTRY_GCJK}, /* Hiragana */
135   {0x30A0, 0x30FF, ENTRY_GCJK}, /* Katakana */
136   {0x3100, 0x312F, ENTRY_GC  }, /* Bopomofo */
137   {0x3130, 0x318F, ENTRY_K   }, /* Hangul Compatibility Jamo */
138   {0x3190, 0x319F, ENTRY_J   }, /* Kanbun */
139   {0x31A0, 0x31BF, ENTRY_G   }, /* Bopomofo Extended */
140   {0x31C0, 0x31EF, ENTRY_C   }, /* CJK Strokes */
141   {0x31F0, 0x31FF, ENTRY_J   }, /* Katakana Phonetic Extensions */
142   {0x3200, 0x32FF, ENTRY_GCJK}, /* Enclosed CJK Letters and Months */
143   {0x3300, 0x33FF, ENTRY_GCJK}, /* CJK Compatibility */
144   {0x3400, 0x4DBF, ENTRY_GCJ }, /* CJK Unified Ideographs Extension A */
145   {0x4DC0, 0x4DFF, ENTRY_NO  }, /* Yijing Hexagram Symbols */
146   {0x4E00, 0x9FFF, ENTRY_GCJK}, /* CJK Unified Ideographs */
147   {0xA000, 0xA48F, ENTRY_G   }, /* Yi Syllables */
148   {0xA490, 0xA4CF, ENTRY_G   }, /* Yi Radicals */
149   {0xA4D0, 0xA4FF, ENTRY_NO  }, /* Lisu */
150   {0xA500, 0xA63F, ENTRY_NO  }, /* Vai */
151   {0xA640, 0xA69F, ENTRY_NO  }, /* Cyrillic Extended-B */
152   {0xA6A0, 0xA6FF, ENTRY_NO  }, /* Bamum */
153   {0xA700, 0xA71F, ENTRY_NO  }, /* Modifier Tone Letters */
154   {0xA720, 0xA7FF, ENTRY_NO  }, /* Latin Extended-D */
155   {0xA800, 0xA82F, ENTRY_NO  }, /* Syloti Nagri */
156   {0xA830, 0xA83F, ENTRY_NO  }, /* Common Indic Number Forms */
157   {0xA840, 0xA87F, ENTRY_NO  }, /* Phags-pa */
158   {0xA880, 0xA8DF, ENTRY_NO  }, /* Saurashtra */
159   {0xA8E0, 0xA8FF, ENTRY_NO  }, /* Devanagari Extended */
160   {0xA900, 0xA92F, ENTRY_NO  }, /* Kayah Li */
161   {0xA930, 0xA95F, ENTRY_NO  }, /* Rejang */
162   {0xA960, 0xA97F, ENTRY_NO  }, /* Hangul Jamo Extended-A */
163   {0xA980, 0xA9DF, ENTRY_NO  }, /* Javanese */
164   {0xA9E0, 0xA9FF, ENTRY_NO  }, /* Myanmar Extended-B */
165   {0xAA00, 0xAA5F, ENTRY_NO  }, /* Cham */
166   {0xAA60, 0xAA7F, ENTRY_NO  }, /* Myanmar Extended-A */
167   {0xAA80, 0xAADF, ENTRY_NO  }, /* Tai Viet */
168   {0xAAE0, 0xAAFF, ENTRY_NO  }, /* Meetei Mayek Extensions */
169   {0xAB00, 0xAB2F, ENTRY_NO  }, /* Ethiopic Extended-A */
170   {0xAB30, 0xAB6F, ENTRY_NO  }, /* Latin Extended-E */
171   {0xABC0, 0xABFF, ENTRY_NO  }, /* Meetei Mayek */
172   {0xAC00, 0xD7AF, ENTRY_K   }, /* Hangul Syllables */
173   {0xD7B0, 0xD7FF, ENTRY_NO  }, /* Hangul Jamo Extended-B */
174   {0xD800, 0xDB7F, ENTRY_NO  }, /* High Surrogates */
175   {0xDB80, 0xDBFF, ENTRY_NO  }, /* High Private Use Surrogates */
176   {0xDC00, 0xDFFF, ENTRY_NO  }, /* Low Surrogates */
177   {0xE000, 0xF8FF, ENTRY_GCJK}, /* Private Use Area */
178   {0xF900, 0xFAFF, ENTRY_GCJK}, /* CJK Compatibility Ideographs */
179   {0xFB00, 0xFB4F, ENTRY_J   }, /* Alphabetic Presentation Forms */
180   {0xFB50, 0xFDFF, ENTRY_NO  }, /* Arabic Presentation Forms-A */
181   {0xFE00, 0xFE0F, ENTRY_NO  }, /* Variation Selectors */
182   {0xFE10, 0xFE1F, ENTRY_GCJ }, /* Vertical Forms */
183   {0xFE20, 0xFE2F, ENTRY_NO  }, /* Combining Half Marks */
184   {0xFE30, 0xFE4F, ENTRY_GCJ }, /* CJK Compatibility Forms */
185   {0xFE50, 0xFE6F, ENTRY_GC  }, /* Small Form Variants */
186   {0xFE70, 0xFEFF, ENTRY_NO  }, /* Arabic Presentation Forms-B */
187   {0xFF00, 0xFFEF, ENTRY_GCJK}, /* Halfwidth and Fullwidth Forms */
188   {0xFFF0, 0xFFFF, ENTRY_NO  }, /* Specials */
189   {0x10000, 0x1007F, ENTRY_NO  }, /* Linear B Syllabary */
190   {0x10080, 0x100FF, ENTRY_NO  }, /* Linear B Ideograms */
191   {0x10100, 0x1013F, ENTRY_NO  }, /* Aegean Numbers */
192   {0x10140, 0x1018F, ENTRY_NO  }, /* Ancient Greek Numbers */
193   {0x10190, 0x101CF, ENTRY_NO  }, /* Ancient Symbols */
194   {0x101D0, 0x101FF, ENTRY_NO  }, /* Phaistos Disc */
195   {0x10280, 0x1029F, ENTRY_NO  }, /* Lycian */
196   {0x102A0, 0x102DF, ENTRY_NO  }, /* Carian */
197   {0x102E0, 0x102FF, ENTRY_NO  }, /* Coptic Epact Numbers */
198   {0x10300, 0x1032F, ENTRY_NO  }, /* Old Italic */
199   {0x10330, 0x1034F, ENTRY_NO  }, /* Gothic */
200   {0x10350, 0x1037F, ENTRY_NO  }, /* Old Permic */
201   {0x10380, 0x1039F, ENTRY_NO  }, /* Ugaritic */
202   {0x103A0, 0x103DF, ENTRY_NO  }, /* Old Persian */
203   {0x10400, 0x1044F, ENTRY_NO  }, /* Deseret */
204   {0x10450, 0x1047F, ENTRY_NO  }, /* Shavian */
205   {0x10480, 0x104AF, ENTRY_NO  }, /* Osmanya */
206   {0x10500, 0x1052F, ENTRY_NO  }, /* Elbasan */
207   {0x10530, 0x1056F, ENTRY_NO  }, /* Caucasian Albanian */
208   {0x10600, 0x1077F, ENTRY_NO  }, /* Linear A */
209   {0x10800, 0x1083F, ENTRY_NO  }, /* Cypriot Syllabary */
210   {0x10840, 0x1085F, ENTRY_NO  }, /* Imperial Aramaic */
211   {0x10860, 0x1087F, ENTRY_NO  }, /* Palmyrene */
212   {0x10880, 0x108AF, ENTRY_NO  }, /* Nabataean */
213   {0x10900, 0x1091F, ENTRY_NO  }, /* Phoenician */
214   {0x10920, 0x1093F, ENTRY_NO  }, /* Lydian */
215   {0x10980, 0x1099F, ENTRY_NO  }, /* Meroitic Hieroglyphs */
216   {0x109A0, 0x109FF, ENTRY_NO  }, /* Meroitic Cursive */
217   {0x10A00, 0x10A5F, ENTRY_NO  }, /* Kharoshthi */
218   {0x10A60, 0x10A7F, ENTRY_NO  }, /* Old South Arabian */
219   {0x10A80, 0x10A9F, ENTRY_NO  }, /* Old North Arabian */
220   {0x10AC0, 0x10AFF, ENTRY_NO  }, /* Manichaean */
221   {0x10B00, 0x10B3F, ENTRY_NO  }, /* Avestan */
222   {0x10B40, 0x10B5F, ENTRY_NO  }, /* Inscriptional Parthian */
223   {0x10B60, 0x10B7F, ENTRY_NO  }, /* Inscriptional Pahlavi */
224   {0x10B80, 0x10BAF, ENTRY_NO  }, /* Psalter Pahlavi */
225   {0x10C00, 0x10C4F, ENTRY_NO  }, /* Old Turkic */
226   {0x10E60, 0x10E7F, ENTRY_NO  }, /* Rumi Numeral Symbols */
227   {0x11000, 0x1107F, ENTRY_NO  }, /* Brahmi */
228   {0x11080, 0x110CF, ENTRY_NO  }, /* Kaithi */
229   {0x110D0, 0x110FF, ENTRY_NO  }, /* Sora Sompeng */
230   {0x11100, 0x1114F, ENTRY_NO  }, /* Chakma */
231   {0x11150, 0x1117F, ENTRY_NO  }, /* Mahajani */
232   {0x11180, 0x111DF, ENTRY_NO  }, /* Sharada */
233   {0x111E0, 0x111FF, ENTRY_NO  }, /* Sinhala Archaic Numbers*/
234   {0x11200, 0x1124F, ENTRY_NO  }, /* Khojki */
235   {0x112B0, 0x112FF, ENTRY_NO  }, /* Khudawadi */
236   {0x11300, 0x1137F, ENTRY_NO  }, /* Grantha */
237   {0x11480, 0x114DF, ENTRY_NO  }, /* Tirhuta */
238   {0x11580, 0x115FF, ENTRY_NO  }, /* Siddham */
239   {0x11600, 0x1165F, ENTRY_NO  }, /* Modi */
240   {0x11680, 0x116CF, ENTRY_NO  }, /* Takri */
241   {0x118A0, 0x118FF, ENTRY_NO  }, /* Warang Citi */
242   {0x11AC0, 0x11AFF, ENTRY_NO  }, /* Pau Cin Hau */
243   {0x12000, 0x123FF, ENTRY_NO  }, /* Cuneiform */
244   {0x12400, 0x1247F, ENTRY_NO  }, /* Cuneiform Numbers and Punctuation */
245   {0x13000, 0x1342F, ENTRY_NO  }, /* Egyptian Hieroglyphs */
246   {0x16800, 0x16A3F, ENTRY_NO  }, /* Bamum Supplement */
247   {0x16A40, 0x16A6F, ENTRY_NO  }, /* Mro */
248   {0x16AD0, 0x16AFF, ENTRY_NO  }, /* Bassa Vah */
249   {0x16B00, 0x16B8F, ENTRY_NO  }, /* Pahawh Hmong */
250   {0x16F00, 0x16F9F, ENTRY_NO  }, /* Miao */
251   {0x1B000, 0x1B0FF, ENTRY_NO  }, /* Kana Supplement */
252   {0x1BC00, 0x1BC9F, ENTRY_NO  }, /* Duployan */
253   {0x1BCA0, 0x1BCAF, ENTRY_NO  }, /* Shorthand Format Controls */
254   {0x1D000, 0x1D0FF, ENTRY_NO  }, /* Byzantine Musical Symbols */
255   {0x1D100, 0x1D1FF, ENTRY_NO  }, /* Musical Symbols */
256   {0x1D200, 0x1D24F, ENTRY_NO  }, /* Ancient Greek Musical Notation */
257   {0x1D300, 0x1D35F, ENTRY_NO  }, /* Tai Xuan Jing Symbols */
258   {0x1D360, 0x1D37F, ENTRY_NO  }, /* Counting Rod Numerals */
259   {0x1D400, 0x1D7FF, ENTRY_NO  }, /* Mathematical Alphanumeric Symbols */
260   {0x1E800, 0x1E8DF, ENTRY_NO  }, /* Mende Kikakui */
261   {0x1EE00, 0x1EEFF, ENTRY_NO  }, /* Arabic Mathematical Alphabetic Symbols */
262   {0x1F000, 0x1F02F, ENTRY_NO  }, /* Mahjong Tiles */
263   {0x1F030, 0x1F09F, ENTRY_NO  }, /* Domino Tiles */
264   {0x1F0A0, 0x1F0FF, ENTRY_NO  }, /* Playing Cards */
265   {0x1F100, 0x1F1FF, ENTRY_J   }, /* Enclosed Alphanumeric Supplement */
266   {0x1F200, 0x1F2FF, ENTRY_J   }, /* Enclosed Ideographic Supplement */
267   {0x1F300, 0x1F5FF, ENTRY_NO  }, /* Miscellaneous Symbols and Pictographs */
268   {0x1F600, 0x1F64F, ENTRY_NO  }, /* Emoticons */
269   {0x1F650, 0x1F67F, ENTRY_NO  }, /* Ornamental Dingbats */
270   {0x1F680, 0x1F6FF, ENTRY_NO  }, /* Transport and Map Symbols */
271   {0x1F700, 0x1F77F, ENTRY_NO  }, /* Alchemical Symbols */
272   {0x1F780, 0x1F7FF, ENTRY_NO  }, /* Geometric Shapes Extended */
273   {0x1F800, 0x1F8FF, ENTRY_NO  }, /* Supplemental Arrows-C */
274   {0x20000, 0x2A6DF, ENTRY_GCJ }, /* CJK Unified Ideographs Extension B */
275   {0x2A700, 0x2B73F, ENTRY_CJ  }, /* CJK Unified Ideographs Extension C */
276   {0x2B740, 0x2B81F, ENTRY_J   }, /* CJK Unified Ideographs Extension D */
277   {0x2F800, 0x2FA1F, ENTRY_CJ  }, /* CJK Compatibility Ideographs Supplement */
278   {0xE0000, 0xE007F, ENTRY_NO  }, /* Tags */
279   {0xE0100, 0xE01EF, ENTRY_NO  }, /* Variation Selectors Supplement */
280   {0xF0000, 0xFFFFF, ENTRY_NO  }, /* Supplementary Private Use Area-A */
281   {0x100000, 0x10FFFF, ENTRY_NO  }, /* Supplementary Private Use Area-B */
282   {0x200000, 0xFFFFFF, ENTRY_NO  }, /* illegal */
283 };
284 
285 
search_cjk_entry(int * ib,long ch,long cjk)286 int search_cjk_entry(int *ib, long ch, long cjk) {
287   if (cjk==ENTRY_NO) return 1;
288   if (cjk==ENTRY_JQ) return
289 	(ch==U_OPEN_SQUOTE || ch==U_CLOSE_SQUOTE
290 	 || ch==U_OPEN_DQUOTE || ch==U_CLOSE_DQUOTE);
291   while(ublock_data[*ib].max<ch) (*ib)++;
292   if (ublock_data[*ib].min<=ch && ch<=ublock_data[*ib].max) {
293     return ublock_data[*ib].cjk & cjk;
294   } else {
295     return 0;
296   }
297 }
298 
299 
300 #ifdef DEBUG
main()301 int main() {
302   long ch;
303   int ib;
304 
305   ib=0;
306   for (ch=0x0;ch<0x10000;ch++) {
307     printf(" %05x %2d %2d %2d %2d %2d\n", ch, ib,
308 	   search_cjk_entry(&ib,ch,ENTRY_G),
309 	   search_cjk_entry(&ib,ch,ENTRY_C),
310 	   search_cjk_entry(&ib,ch,ENTRY_J),
311 	   search_cjk_entry(&ib,ch,ENTRY_K));
312   }
313 
314 }
315 #endif
316