1 /*
2  * Copyright (C) 2012 Grigori Goronzy <greg@kinoho.net>
3  *
4  * Permission to use, copy, modify, and/or distribute this software for any
5  * purpose with or without fee is hereby granted, provided that the above
6  * copyright notice and this permission notice appear in all copies.
7  *
8  * THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES
9  * WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF
10  * MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR
11  * ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
12  * WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN
13  * ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF
14  * OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.
15  */
16 
17 #include "hb-private.hh"
18 
19 #include "hb-unicode-private.hh"
20 
21 #include "ucdn.h"
22 
23 static const hb_script_t ucdn_script_translate[] =
24 {
25     HB_SCRIPT_COMMON,
26     HB_SCRIPT_LATIN,
27     HB_SCRIPT_GREEK,
28     HB_SCRIPT_CYRILLIC,
29     HB_SCRIPT_ARMENIAN,
30     HB_SCRIPT_HEBREW,
31     HB_SCRIPT_ARABIC,
32     HB_SCRIPT_SYRIAC,
33     HB_SCRIPT_THAANA,
34     HB_SCRIPT_DEVANAGARI,
35     HB_SCRIPT_BENGALI,
36     HB_SCRIPT_GURMUKHI,
37     HB_SCRIPT_GUJARATI,
38     HB_SCRIPT_ORIYA,
39     HB_SCRIPT_TAMIL,
40     HB_SCRIPT_TELUGU,
41     HB_SCRIPT_KANNADA,
42     HB_SCRIPT_MALAYALAM,
43     HB_SCRIPT_SINHALA,
44     HB_SCRIPT_THAI,
45     HB_SCRIPT_LAO,
46     HB_SCRIPT_TIBETAN,
47     HB_SCRIPT_MYANMAR,
48     HB_SCRIPT_GEORGIAN,
49     HB_SCRIPT_HANGUL,
50     HB_SCRIPT_ETHIOPIC,
51     HB_SCRIPT_CHEROKEE,
52     HB_SCRIPT_CANADIAN_SYLLABICS,
53     HB_SCRIPT_OGHAM,
54     HB_SCRIPT_RUNIC,
55     HB_SCRIPT_KHMER,
56     HB_SCRIPT_MONGOLIAN,
57     HB_SCRIPT_HIRAGANA,
58     HB_SCRIPT_KATAKANA,
59     HB_SCRIPT_BOPOMOFO,
60     HB_SCRIPT_HAN,
61     HB_SCRIPT_YI,
62     HB_SCRIPT_OLD_ITALIC,
63     HB_SCRIPT_GOTHIC,
64     HB_SCRIPT_DESERET,
65     HB_SCRIPT_INHERITED,
66     HB_SCRIPT_TAGALOG,
67     HB_SCRIPT_HANUNOO,
68     HB_SCRIPT_BUHID,
69     HB_SCRIPT_TAGBANWA,
70     HB_SCRIPT_LIMBU,
71     HB_SCRIPT_TAI_LE,
72     HB_SCRIPT_LINEAR_B,
73     HB_SCRIPT_UGARITIC,
74     HB_SCRIPT_SHAVIAN,
75     HB_SCRIPT_OSMANYA,
76     HB_SCRIPT_CYPRIOT,
77     HB_SCRIPT_BRAILLE,
78     HB_SCRIPT_BUGINESE,
79     HB_SCRIPT_COPTIC,
80     HB_SCRIPT_NEW_TAI_LUE,
81     HB_SCRIPT_GLAGOLITIC,
82     HB_SCRIPT_TIFINAGH,
83     HB_SCRIPT_SYLOTI_NAGRI,
84     HB_SCRIPT_OLD_PERSIAN,
85     HB_SCRIPT_KHAROSHTHI,
86     HB_SCRIPT_BALINESE,
87     HB_SCRIPT_CUNEIFORM,
88     HB_SCRIPT_PHOENICIAN,
89     HB_SCRIPT_PHAGS_PA,
90     HB_SCRIPT_NKO,
91     HB_SCRIPT_SUNDANESE,
92     HB_SCRIPT_LEPCHA,
93     HB_SCRIPT_OL_CHIKI,
94     HB_SCRIPT_VAI,
95     HB_SCRIPT_SAURASHTRA,
96     HB_SCRIPT_KAYAH_LI,
97     HB_SCRIPT_REJANG,
98     HB_SCRIPT_LYCIAN,
99     HB_SCRIPT_CARIAN,
100     HB_SCRIPT_LYDIAN,
101     HB_SCRIPT_CHAM,
102     HB_SCRIPT_TAI_THAM,
103     HB_SCRIPT_TAI_VIET,
104     HB_SCRIPT_AVESTAN,
105     HB_SCRIPT_EGYPTIAN_HIEROGLYPHS,
106     HB_SCRIPT_SAMARITAN,
107     HB_SCRIPT_LISU,
108     HB_SCRIPT_BAMUM,
109     HB_SCRIPT_JAVANESE,
110     HB_SCRIPT_MEETEI_MAYEK,
111     HB_SCRIPT_IMPERIAL_ARAMAIC,
112     HB_SCRIPT_OLD_SOUTH_ARABIAN,
113     HB_SCRIPT_INSCRIPTIONAL_PARTHIAN,
114     HB_SCRIPT_INSCRIPTIONAL_PAHLAVI,
115     HB_SCRIPT_OLD_TURKIC,
116     HB_SCRIPT_KAITHI,
117     HB_SCRIPT_BATAK,
118     HB_SCRIPT_BRAHMI,
119     HB_SCRIPT_MANDAIC,
120     HB_SCRIPT_CHAKMA,
121     HB_SCRIPT_MEROITIC_CURSIVE,
122     HB_SCRIPT_MEROITIC_HIEROGLYPHS,
123     HB_SCRIPT_MIAO,
124     HB_SCRIPT_SHARADA,
125     HB_SCRIPT_SORA_SOMPENG,
126     HB_SCRIPT_TAKRI,
127     HB_SCRIPT_UNKNOWN,
128     HB_SCRIPT_BASSA_VAH,
129     HB_SCRIPT_CAUCASIAN_ALBANIAN,
130     HB_SCRIPT_DUPLOYAN,
131     HB_SCRIPT_ELBASAN,
132     HB_SCRIPT_GRANTHA,
133     HB_SCRIPT_KHOJKI,
134     HB_SCRIPT_KHUDAWADI,
135     HB_SCRIPT_LINEAR_A,
136     HB_SCRIPT_MAHAJANI,
137     HB_SCRIPT_MANICHAEAN,
138     HB_SCRIPT_MENDE_KIKAKUI,
139     HB_SCRIPT_MODI,
140     HB_SCRIPT_MRO,
141     HB_SCRIPT_NABATAEAN,
142     HB_SCRIPT_OLD_NORTH_ARABIAN,
143     HB_SCRIPT_OLD_PERMIC,
144     HB_SCRIPT_PAHAWH_HMONG,
145     HB_SCRIPT_PALMYRENE,
146     HB_SCRIPT_PAU_CIN_HAU,
147     HB_SCRIPT_PSALTER_PAHLAVI,
148     HB_SCRIPT_SIDDHAM,
149     HB_SCRIPT_TIRHUTA,
150     HB_SCRIPT_WARANG_CITI,
151     HB_SCRIPT_AHOM,
152     HB_SCRIPT_ANATOLIAN_HIEROGLYPHS,
153     HB_SCRIPT_HATRAN,
154     HB_SCRIPT_MULTANI,
155     HB_SCRIPT_OLD_HUNGARIAN,
156     HB_SCRIPT_SIGNWRITING,
157     HB_SCRIPT_ADLAM,
158     HB_SCRIPT_BHAIKSUKI,
159     HB_SCRIPT_MARCHEN,
160     HB_SCRIPT_NEWA,
161     HB_SCRIPT_OSAGE,
162     HB_SCRIPT_TANGUT,
163     HB_SCRIPT_MASARAM_GONDI,
164     HB_SCRIPT_NUSHU,
165     HB_SCRIPT_SOYOMBO,
166     HB_SCRIPT_ZANABAZAR_SQUARE,
167 };
168 
169 static hb_unicode_combining_class_t
hb_ucdn_combining_class(hb_unicode_funcs_t * ufuncs HB_UNUSED,hb_codepoint_t unicode,void * user_data HB_UNUSED)170 hb_ucdn_combining_class(hb_unicode_funcs_t *ufuncs HB_UNUSED,
171 			hb_codepoint_t unicode,
172 			void *user_data HB_UNUSED)
173 {
174     return (hb_unicode_combining_class_t) ucdn_get_combining_class(unicode);
175 }
176 
177 static unsigned int
hb_ucdn_eastasian_width(hb_unicode_funcs_t * ufuncs HB_UNUSED,hb_codepoint_t unicode,void * user_data HB_UNUSED)178 hb_ucdn_eastasian_width(hb_unicode_funcs_t *ufuncs HB_UNUSED,
179 			hb_codepoint_t unicode,
180 			void *user_data HB_UNUSED)
181 {
182     int w = ucdn_get_east_asian_width(unicode);
183     return (w == UCDN_EAST_ASIAN_F || w == UCDN_EAST_ASIAN_W) ? 2 : 1;
184 }
185 
186 static hb_unicode_general_category_t
hb_ucdn_general_category(hb_unicode_funcs_t * ufuncs HB_UNUSED,hb_codepoint_t unicode,void * user_data HB_UNUSED)187 hb_ucdn_general_category(hb_unicode_funcs_t *ufuncs HB_UNUSED,
188 			 hb_codepoint_t unicode,
189 			 void *user_data HB_UNUSED)
190 {
191     return (hb_unicode_general_category_t)ucdn_get_general_category(unicode);
192 }
193 
194 static hb_codepoint_t
hb_ucdn_mirroring(hb_unicode_funcs_t * ufuncs HB_UNUSED,hb_codepoint_t unicode,void * user_data HB_UNUSED)195 hb_ucdn_mirroring(hb_unicode_funcs_t *ufuncs HB_UNUSED,
196 		  hb_codepoint_t unicode,
197 		  void *user_data HB_UNUSED)
198 {
199     return ucdn_mirror(unicode);
200 }
201 
202 static hb_script_t
hb_ucdn_script(hb_unicode_funcs_t * ufuncs HB_UNUSED,hb_codepoint_t unicode,void * user_data HB_UNUSED)203 hb_ucdn_script(hb_unicode_funcs_t *ufuncs HB_UNUSED,
204 	       hb_codepoint_t unicode,
205 	       void *user_data HB_UNUSED)
206 {
207     return ucdn_script_translate[ucdn_get_script(unicode)];
208 }
209 
210 static hb_bool_t
hb_ucdn_compose(hb_unicode_funcs_t * ufuncs HB_UNUSED,hb_codepoint_t a,hb_codepoint_t b,hb_codepoint_t * ab,void * user_data HB_UNUSED)211 hb_ucdn_compose(hb_unicode_funcs_t *ufuncs HB_UNUSED,
212 		hb_codepoint_t a, hb_codepoint_t b, hb_codepoint_t *ab,
213 		void *user_data HB_UNUSED)
214 {
215     return ucdn_compose(ab, a, b);
216 }
217 
218 static hb_bool_t
hb_ucdn_decompose(hb_unicode_funcs_t * ufuncs HB_UNUSED,hb_codepoint_t ab,hb_codepoint_t * a,hb_codepoint_t * b,void * user_data HB_UNUSED)219 hb_ucdn_decompose(hb_unicode_funcs_t *ufuncs HB_UNUSED,
220 		  hb_codepoint_t ab, hb_codepoint_t *a, hb_codepoint_t *b,
221 		  void *user_data HB_UNUSED)
222 {
223     return ucdn_decompose(ab, a, b);
224 }
225 
226 static unsigned int
hb_ucdn_decompose_compatibility(hb_unicode_funcs_t * ufuncs HB_UNUSED,hb_codepoint_t u,hb_codepoint_t * decomposed,void * user_data HB_UNUSED)227 hb_ucdn_decompose_compatibility(hb_unicode_funcs_t *ufuncs HB_UNUSED,
228 				hb_codepoint_t u, hb_codepoint_t *decomposed,
229 				void *user_data HB_UNUSED)
230 {
231     return ucdn_compat_decompose(u, decomposed);
232 }
233 
234 static hb_unicode_funcs_t *static_ucdn_funcs = nullptr;
235 
236 #ifdef HB_USE_ATEXIT
237 static
free_static_ucdn_funcs(void)238 void free_static_ucdn_funcs (void)
239 {
240   hb_unicode_funcs_destroy (static_ucdn_funcs);
241 }
242 #endif
243 
244 extern "C" HB_INTERNAL
245 hb_unicode_funcs_t *
hb_ucdn_get_unicode_funcs(void)246 hb_ucdn_get_unicode_funcs (void)
247 {
248 retry:
249   hb_unicode_funcs_t *funcs = (hb_unicode_funcs_t *) hb_atomic_ptr_get (&static_ucdn_funcs);
250 
251   if (unlikely (!funcs))
252   {
253     funcs = hb_unicode_funcs_create (nullptr);
254 
255 #define HB_UNICODE_FUNC_IMPLEMENT(name) \
256     hb_unicode_funcs_set_##name##_func (funcs, hb_ucdn_##name, nullptr, nullptr);
257       HB_UNICODE_FUNCS_IMPLEMENT_CALLBACKS
258 #undef HB_UNICODE_FUNC_IMPLEMENT
259 
260     hb_unicode_funcs_make_immutable (funcs);
261 
262     if (!hb_atomic_ptr_cmpexch (&static_ucdn_funcs, nullptr, funcs)) {
263       hb_unicode_funcs_destroy (funcs);
264       goto retry;
265     }
266 
267 #ifdef HB_USE_ATEXIT
268     atexit (free_static_ucdn_funcs); /* First person registers atexit() callback. */
269 #endif
270   };
271 
272   return hb_unicode_funcs_reference (funcs);
273 }
274