blob: 02ea36670e3913d88e381608f06aae963224ca93 [file] [log] [blame]
Behdad Esfahbod3f33f0d2012-10-02 16:03:18 -04001/*
2 * Copyright (C) 2012 Grigori Goronzy <greg@kinoho.net>
3 *
4 * Permission to use, copy, modify, and/or distribute this software for any
5 * purpose with or without fee is hereby granted, provided that the above
6 * copyright notice and this permission notice appear in all copies.
7 *
8 * THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES
9 * WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF
10 * MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR
11 * ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
12 * WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN
13 * ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF
14 * OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.
15 */
16
17#include "hb-private.hh"
18
19#include "hb-unicode-private.hh"
20
Behdad Esfahbod3f33f0d2012-10-02 16:03:18 -040021#include "ucdn.h"
Behdad Esfahbod3f33f0d2012-10-02 16:03:18 -040022
/*
 * Translation table from UCDN script indices to HarfBuzz script tags.
 *
 * hb_ucdn_script() indexes this array directly with the value returned by
 * ucdn_get_script(), so the position of every entry is significant.
 *
 * NOTE(review): the order presumably has to mirror the UCDN_SCRIPT_*
 * numbering in ucdn.h -- confirm against that header whenever UCDN is
 * updated, and only ever append new entries at the end.
 */
static const hb_script_t ucdn_script_translate[] =
{
    HB_SCRIPT_COMMON,
    HB_SCRIPT_LATIN,
    HB_SCRIPT_GREEK,
    HB_SCRIPT_CYRILLIC,
    HB_SCRIPT_ARMENIAN,
    HB_SCRIPT_HEBREW,
    HB_SCRIPT_ARABIC,
    HB_SCRIPT_SYRIAC,
    HB_SCRIPT_THAANA,
    HB_SCRIPT_DEVANAGARI,
    HB_SCRIPT_BENGALI,
    HB_SCRIPT_GURMUKHI,
    HB_SCRIPT_GUJARATI,
    HB_SCRIPT_ORIYA,
    HB_SCRIPT_TAMIL,
    HB_SCRIPT_TELUGU,
    HB_SCRIPT_KANNADA,
    HB_SCRIPT_MALAYALAM,
    HB_SCRIPT_SINHALA,
    HB_SCRIPT_THAI,
    HB_SCRIPT_LAO,
    HB_SCRIPT_TIBETAN,
    HB_SCRIPT_MYANMAR,
    HB_SCRIPT_GEORGIAN,
    HB_SCRIPT_HANGUL,
    HB_SCRIPT_ETHIOPIC,
    HB_SCRIPT_CHEROKEE,
    HB_SCRIPT_CANADIAN_SYLLABICS,
    HB_SCRIPT_OGHAM,
    HB_SCRIPT_RUNIC,
    HB_SCRIPT_KHMER,
    HB_SCRIPT_MONGOLIAN,
    HB_SCRIPT_HIRAGANA,
    HB_SCRIPT_KATAKANA,
    HB_SCRIPT_BOPOMOFO,
    HB_SCRIPT_HAN,
    HB_SCRIPT_YI,
    HB_SCRIPT_OLD_ITALIC,
    HB_SCRIPT_GOTHIC,
    HB_SCRIPT_DESERET,
    HB_SCRIPT_INHERITED,
    HB_SCRIPT_TAGALOG,
    HB_SCRIPT_HANUNOO,
    HB_SCRIPT_BUHID,
    HB_SCRIPT_TAGBANWA,
    HB_SCRIPT_LIMBU,
    HB_SCRIPT_TAI_LE,
    HB_SCRIPT_LINEAR_B,
    HB_SCRIPT_UGARITIC,
    HB_SCRIPT_SHAVIAN,
    HB_SCRIPT_OSMANYA,
    HB_SCRIPT_CYPRIOT,
    HB_SCRIPT_BRAILLE,
    HB_SCRIPT_BUGINESE,
    HB_SCRIPT_COPTIC,
    HB_SCRIPT_NEW_TAI_LUE,
    HB_SCRIPT_GLAGOLITIC,
    HB_SCRIPT_TIFINAGH,
    HB_SCRIPT_SYLOTI_NAGRI,
    HB_SCRIPT_OLD_PERSIAN,
    HB_SCRIPT_KHAROSHTHI,
    HB_SCRIPT_BALINESE,
    HB_SCRIPT_CUNEIFORM,
    HB_SCRIPT_PHOENICIAN,
    HB_SCRIPT_PHAGS_PA,
    HB_SCRIPT_NKO,
    HB_SCRIPT_SUNDANESE,
    HB_SCRIPT_LEPCHA,
    HB_SCRIPT_OL_CHIKI,
    HB_SCRIPT_VAI,
    HB_SCRIPT_SAURASHTRA,
    HB_SCRIPT_KAYAH_LI,
    HB_SCRIPT_REJANG,
    HB_SCRIPT_LYCIAN,
    HB_SCRIPT_CARIAN,
    HB_SCRIPT_LYDIAN,
    HB_SCRIPT_CHAM,
    HB_SCRIPT_TAI_THAM,
    HB_SCRIPT_TAI_VIET,
    HB_SCRIPT_AVESTAN,
    HB_SCRIPT_EGYPTIAN_HIEROGLYPHS,
    HB_SCRIPT_SAMARITAN,
    HB_SCRIPT_LISU,
    HB_SCRIPT_BAMUM,
    HB_SCRIPT_JAVANESE,
    HB_SCRIPT_MEETEI_MAYEK,
    HB_SCRIPT_IMPERIAL_ARAMAIC,
    HB_SCRIPT_OLD_SOUTH_ARABIAN,
    HB_SCRIPT_INSCRIPTIONAL_PARTHIAN,
    HB_SCRIPT_INSCRIPTIONAL_PAHLAVI,
    HB_SCRIPT_OLD_TURKIC,
    HB_SCRIPT_KAITHI,
    HB_SCRIPT_BATAK,
    HB_SCRIPT_BRAHMI,
    HB_SCRIPT_MANDAIC,
    HB_SCRIPT_CHAKMA,
    HB_SCRIPT_MEROITIC_CURSIVE,
    HB_SCRIPT_MEROITIC_HIEROGLYPHS,
    HB_SCRIPT_MIAO,
    HB_SCRIPT_SHARADA,
    HB_SCRIPT_SORA_SOMPENG,
    HB_SCRIPT_TAKRI,
    HB_SCRIPT_UNKNOWN,
    HB_SCRIPT_BASSA_VAH,
    HB_SCRIPT_CAUCASIAN_ALBANIAN,
    HB_SCRIPT_DUPLOYAN,
    HB_SCRIPT_ELBASAN,
    HB_SCRIPT_GRANTHA,
    HB_SCRIPT_KHOJKI,
    HB_SCRIPT_KHUDAWADI,
    HB_SCRIPT_LINEAR_A,
    HB_SCRIPT_MAHAJANI,
    HB_SCRIPT_MANICHAEAN,
    HB_SCRIPT_MENDE_KIKAKUI,
    HB_SCRIPT_MODI,
    HB_SCRIPT_MRO,
    HB_SCRIPT_NABATAEAN,
    HB_SCRIPT_OLD_NORTH_ARABIAN,
    HB_SCRIPT_OLD_PERMIC,
    HB_SCRIPT_PAHAWH_HMONG,
    HB_SCRIPT_PALMYRENE,
    HB_SCRIPT_PAU_CIN_HAU,
    HB_SCRIPT_PSALTER_PAHLAVI,
    HB_SCRIPT_SIDDHAM,
    HB_SCRIPT_TIRHUTA,
    HB_SCRIPT_WARANG_CITI,
    HB_SCRIPT_AHOM,
    HB_SCRIPT_ANATOLIAN_HIEROGLYPHS,
    HB_SCRIPT_HATRAN,
    HB_SCRIPT_MULTANI,
    HB_SCRIPT_OLD_HUNGARIAN,
    HB_SCRIPT_SIGNWRITING,
    HB_SCRIPT_ADLAM,
    HB_SCRIPT_BHAIKSUKI,
    HB_SCRIPT_MARCHEN,
    HB_SCRIPT_NEWA,
    HB_SCRIPT_OSAGE,
    HB_SCRIPT_TANGUT,
    HB_SCRIPT_MASARAM_GONDI,
    HB_SCRIPT_NUSHU,
    HB_SCRIPT_SOYOMBO,
    HB_SCRIPT_ZANABAZAR_SQUARE,
};
168
169static hb_unicode_combining_class_t
Behdad Esfahbod74f1b882017-10-13 11:01:55 +0200170hb_ucdn_combining_class(hb_unicode_funcs_t *ufuncs HB_UNUSED,
171 hb_codepoint_t unicode,
Behdad Esfahbod0beb66e2012-12-05 18:46:04 -0500172 void *user_data HB_UNUSED)
Behdad Esfahbod3f33f0d2012-10-02 16:03:18 -0400173{
174 return (hb_unicode_combining_class_t) ucdn_get_combining_class(unicode);
175}
176
177static unsigned int
Behdad Esfahbod74f1b882017-10-13 11:01:55 +0200178hb_ucdn_eastasian_width(hb_unicode_funcs_t *ufuncs HB_UNUSED,
179 hb_codepoint_t unicode,
Behdad Esfahbod0beb66e2012-12-05 18:46:04 -0500180 void *user_data HB_UNUSED)
Behdad Esfahbod3f33f0d2012-10-02 16:03:18 -0400181{
182 int w = ucdn_get_east_asian_width(unicode);
183 return (w == UCDN_EAST_ASIAN_F || w == UCDN_EAST_ASIAN_W) ? 2 : 1;
184}
185
186static hb_unicode_general_category_t
Behdad Esfahbod74f1b882017-10-13 11:01:55 +0200187hb_ucdn_general_category(hb_unicode_funcs_t *ufuncs HB_UNUSED,
188 hb_codepoint_t unicode,
Behdad Esfahbod0beb66e2012-12-05 18:46:04 -0500189 void *user_data HB_UNUSED)
Behdad Esfahbod3f33f0d2012-10-02 16:03:18 -0400190{
191 return (hb_unicode_general_category_t)ucdn_get_general_category(unicode);
192}
193
194static hb_codepoint_t
Behdad Esfahbod74f1b882017-10-13 11:01:55 +0200195hb_ucdn_mirroring(hb_unicode_funcs_t *ufuncs HB_UNUSED,
196 hb_codepoint_t unicode,
Behdad Esfahbod0beb66e2012-12-05 18:46:04 -0500197 void *user_data HB_UNUSED)
Behdad Esfahbod3f33f0d2012-10-02 16:03:18 -0400198{
199 return ucdn_mirror(unicode);
200}
201
202static hb_script_t
Behdad Esfahbod74f1b882017-10-13 11:01:55 +0200203hb_ucdn_script(hb_unicode_funcs_t *ufuncs HB_UNUSED,
204 hb_codepoint_t unicode,
Behdad Esfahbod0beb66e2012-12-05 18:46:04 -0500205 void *user_data HB_UNUSED)
Behdad Esfahbod3f33f0d2012-10-02 16:03:18 -0400206{
207 return ucdn_script_translate[ucdn_get_script(unicode)];
208}
209
210static hb_bool_t
Behdad Esfahbod74f1b882017-10-13 11:01:55 +0200211hb_ucdn_compose(hb_unicode_funcs_t *ufuncs HB_UNUSED,
Behdad Esfahbod0beb66e2012-12-05 18:46:04 -0500212 hb_codepoint_t a, hb_codepoint_t b, hb_codepoint_t *ab,
213 void *user_data HB_UNUSED)
Behdad Esfahbod3f33f0d2012-10-02 16:03:18 -0400214{
215 return ucdn_compose(ab, a, b);
216}
217
218static hb_bool_t
Behdad Esfahbod74f1b882017-10-13 11:01:55 +0200219hb_ucdn_decompose(hb_unicode_funcs_t *ufuncs HB_UNUSED,
Behdad Esfahbod0beb66e2012-12-05 18:46:04 -0500220 hb_codepoint_t ab, hb_codepoint_t *a, hb_codepoint_t *b,
221 void *user_data HB_UNUSED)
Behdad Esfahbod3f33f0d2012-10-02 16:03:18 -0400222{
223 return ucdn_decompose(ab, a, b);
224}
225
226static unsigned int
Behdad Esfahbod74f1b882017-10-13 11:01:55 +0200227hb_ucdn_decompose_compatibility(hb_unicode_funcs_t *ufuncs HB_UNUSED,
Behdad Esfahbod0beb66e2012-12-05 18:46:04 -0500228 hb_codepoint_t u, hb_codepoint_t *decomposed,
229 void *user_data HB_UNUSED)
Behdad Esfahbod3f33f0d2012-10-02 16:03:18 -0400230{
231 return ucdn_compat_decompose(u, decomposed);
232}
233
/* Shared UCDN-backed funcs object; starts out null, is filled in by
 * hb_ucdn_get_unicode_funcs() on first use, and is only accessed through
 * the hb_atomic_ptr_* helpers in this file. */
static hb_unicode_funcs_t *static_ucdn_funcs = nullptr;
235
#ifdef HB_USE_ATEXIT
/*
 * Process-exit hook, registered through atexit() by
 * hb_ucdn_get_unicode_funcs().
 *
 * Atomically swaps static_ucdn_funcs for nullptr -- re-reading the pointer
 * until the compare-and-exchange succeeds -- and then destroys the object
 * that was detached.
 */
static
void free_static_ucdn_funcs (void)
{
  hb_unicode_funcs_t *ucdn_funcs;

  do
    ucdn_funcs = (hb_unicode_funcs_t *) hb_atomic_ptr_get (&static_ucdn_funcs);
  while (!hb_atomic_ptr_cmpexch (&static_ucdn_funcs, ucdn_funcs, nullptr));

  hb_unicode_funcs_destroy (ucdn_funcs);
}
#endif
248
Behdad Esfahbod3f33f0d2012-10-02 16:03:18 -0400249extern "C" HB_INTERNAL
250hb_unicode_funcs_t *
251hb_ucdn_get_unicode_funcs (void)
252{
Behdad Esfahbod88648642017-10-27 15:26:45 -0600253retry:
254 hb_unicode_funcs_t *funcs = (hb_unicode_funcs_t *) hb_atomic_ptr_get (&static_ucdn_funcs);
Behdad Esfahbod3f33f0d2012-10-02 16:03:18 -0400255
Behdad Esfahbod88648642017-10-27 15:26:45 -0600256 if (unlikely (!funcs))
257 {
258 funcs = hb_unicode_funcs_create (nullptr);
259
260#define HB_UNICODE_FUNC_IMPLEMENT(name) \
261 hb_unicode_funcs_set_##name##_func (funcs, hb_ucdn_##name, nullptr, nullptr);
Behdad Esfahbod3f33f0d2012-10-02 16:03:18 -0400262 HB_UNICODE_FUNCS_IMPLEMENT_CALLBACKS
263#undef HB_UNICODE_FUNC_IMPLEMENT
Behdad Esfahbod88648642017-10-27 15:26:45 -0600264
265 hb_unicode_funcs_make_immutable (funcs);
266
267 if (!hb_atomic_ptr_cmpexch (&static_ucdn_funcs, nullptr, funcs)) {
268 hb_unicode_funcs_destroy (funcs);
269 goto retry;
Behdad Esfahbod3f33f0d2012-10-02 16:03:18 -0400270 }
Behdad Esfahbod88648642017-10-27 15:26:45 -0600271
272#ifdef HB_USE_ATEXIT
273 atexit (free_static_ucdn_funcs); /* First person registers atexit() callback. */
274#endif
Behdad Esfahbod3f33f0d2012-10-02 16:03:18 -0400275 };
276
Behdad Esfahbodbfa7f372017-10-27 16:03:51 -0600277 return hb_unicode_funcs_reference (funcs);
Behdad Esfahbod3f33f0d2012-10-02 16:03:18 -0400278}