/*
 * Copyright © 2011,2012  Google, Inc.
 *
 *  This is part of HarfBuzz, a text shaping library.
 *
 * Permission is hereby granted, without written agreement and without
 * license or royalty fees, to use, copy, modify, and distribute this
 * software and its documentation for any purpose, provided that the
 * above copyright notice and the following two paragraphs appear in
 * all copies of this software.
 *
 * IN NO EVENT SHALL THE COPYRIGHT HOLDER BE LIABLE TO ANY PARTY FOR
 * DIRECT, INDIRECT, SPECIAL, INCIDENTAL, OR CONSEQUENTIAL DAMAGES
 * ARISING OUT OF THE USE OF THIS SOFTWARE AND ITS DOCUMENTATION, EVEN
 * IF THE COPYRIGHT HOLDER HAS BEEN ADVISED OF THE POSSIBILITY OF SUCH
 * DAMAGE.
 *
 * THE COPYRIGHT HOLDER SPECIFICALLY DISCLAIMS ANY WARRANTIES, INCLUDING,
 * BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND
 * FITNESS FOR A PARTICULAR PURPOSE.  THE SOFTWARE PROVIDED HEREUNDER IS
 * ON AN "AS IS" BASIS, AND THE COPYRIGHT HOLDER HAS NO OBLIGATION TO
 * PROVIDE MAINTENANCE, SUPPORT, UPDATES, ENHANCEMENTS, OR MODIFICATIONS.
 *
 * Google Author(s): Behdad Esfahbod
 */
26
Behdad Esfahbod3ed46342012-04-19 22:34:06 -040027#include "hb-ot-shape-complex-indic-private.hh"
Behdad Esfahbod49c5ec52012-07-23 20:14:13 -040028#include "hb-ot-layout-private.hh"
Behdad Esfahbod352372a2011-07-30 19:04:02 -040029
/* buffer var allocations */
/* Per-glyph scratch slots used by this shaper: slot 0 holds the glyph's
 * indic_category_t, slot 1 its indic_position_t. */
#define indic_category() complex_var_u8_0() /* indic_category_t */
#define indic_position() complex_var_u8_1() /* indic_position_t */
33
34
/*
 * Indic shaper.
 */
38
39
/* True when codepoint `u` lies in the 128-codepoint block that starts at
 * `Base`: the low seven bits of `u` are masked off and the remainder is
 * compared against `Base`. */
#define IN_HALF_BLOCK(u, Base) (((u) & ~0x7Fu) == (Base))

/* Script-block membership tests, one per 128-codepoint block. */
#define IS_DEVA(u) (IN_HALF_BLOCK (u, 0x0900u))
#define IS_BENG(u) (IN_HALF_BLOCK (u, 0x0980u))
#define IS_GURU(u) (IN_HALF_BLOCK (u, 0x0A00u))
#define IS_GUJR(u) (IN_HALF_BLOCK (u, 0x0A80u))
#define IS_ORYA(u) (IN_HALF_BLOCK (u, 0x0B00u))
#define IS_TAML(u) (IN_HALF_BLOCK (u, 0x0B80u))
#define IS_TELU(u) (IN_HALF_BLOCK (u, 0x0C00u))
#define IS_KNDA(u) (IN_HALF_BLOCK (u, 0x0C80u))
#define IS_MLYM(u) (IN_HALF_BLOCK (u, 0x0D00u))
#define IS_SINH(u) (IN_HALF_BLOCK (u, 0x0D80u))
#define IS_KHMR(u) (IN_HALF_BLOCK (u, 0x1780u))
Behdad Esfahbod3a83d332013-02-12 12:14:10 -050053
54
/*
 * Per-script placement of matras, keyed by the side of the base the matra
 * sits on.  Each macro tests the script block of codepoint `u` with the
 * IS_* macros and yields a POS_* value; codepoints in none of the listed
 * blocks get the trailing default.
 */
#define MATRA_POS_LEFT(u)   POS_PRE_M
#define MATRA_POS_RIGHT(u)  ( \
                              IS_DEVA(u) ? POS_AFTER_SUB  : \
                              IS_BENG(u) ? POS_AFTER_POST : \
                              IS_GURU(u) ? POS_AFTER_POST : \
                              IS_GUJR(u) ? POS_AFTER_POST : \
                              IS_ORYA(u) ? POS_AFTER_POST : \
                              IS_TAML(u) ? POS_AFTER_POST : \
                              IS_TELU(u) ? ((u) <= 0x0C42u ? POS_BEFORE_SUB : POS_AFTER_SUB) : \
                              IS_KNDA(u) ? ((u) < 0x0CC3u || (u) > 0x0CD6u ? POS_BEFORE_SUB : POS_AFTER_SUB) : \
                              IS_MLYM(u) ? POS_AFTER_POST : \
                              IS_SINH(u) ? POS_AFTER_SUB  : \
                              IS_KHMR(u) ? POS_AFTER_POST : \
                              /*default*/  POS_AFTER_SUB    \
                            )
#define MATRA_POS_TOP(u)    ( /* BENG and MLYM don't have top matras. */ \
                              IS_DEVA(u) ? POS_AFTER_SUB  : \
                              IS_GURU(u) ? POS_AFTER_POST : /* Deviate from spec */ \
                              IS_GUJR(u) ? POS_AFTER_SUB  : \
                              IS_ORYA(u) ? POS_AFTER_MAIN : \
                              IS_TAML(u) ? POS_AFTER_SUB  : \
                              IS_TELU(u) ? POS_BEFORE_SUB : \
                              IS_KNDA(u) ? POS_BEFORE_SUB : \
                              IS_SINH(u) ? POS_AFTER_SUB  : \
                              IS_KHMR(u) ? POS_AFTER_POST : \
                              /*default*/  POS_AFTER_SUB    \
                            )
#define MATRA_POS_BOTTOM(u) ( \
                              IS_DEVA(u) ? POS_AFTER_SUB  : \
                              IS_BENG(u) ? POS_AFTER_SUB  : \
                              IS_GURU(u) ? POS_AFTER_POST : \
                              IS_GUJR(u) ? POS_AFTER_POST : \
                              IS_ORYA(u) ? POS_AFTER_SUB  : \
                              IS_TAML(u) ? POS_AFTER_POST : \
                              IS_TELU(u) ? POS_BEFORE_SUB : \
                              IS_KNDA(u) ? POS_BEFORE_SUB : \
                              IS_MLYM(u) ? POS_AFTER_POST : \
                              IS_SINH(u) ? POS_AFTER_SUB  : \
                              IS_KHMR(u) ? POS_AFTER_POST : \
                              /*default*/  POS_AFTER_SUB    \
                            )
96
97static inline indic_position_t
98matra_position (hb_codepoint_t u, indic_position_t side)
99{
100 switch ((int) side)
101 {
102 case POS_PRE_C: return MATRA_POS_LEFT (u);
103 case POS_POST_C: return MATRA_POS_RIGHT (u);
104 case POS_ABOVE_C: return MATRA_POS_TOP (u);
105 case POS_BELOW_C: return MATRA_POS_BOTTOM (u);
106 };
107 return side;
108}
109
110/* XXX
111 * This is a hack for now. We should move this data into the main Indic table.
112 * Or completely remove it and just check in the tables.
113 */
114static const hb_codepoint_t ra_chars[] = {
Behdad Esfahbod76271002014-07-11 14:54:42 -0400115 0x0930u, /* Devanagari */
116 0x09B0u, /* Bengali */
117 0x09F0u, /* Bengali */
118 0x0A30u, /* Gurmukhi */ /* No Reph */
119 0x0AB0u, /* Gujarati */
120 0x0B30u, /* Oriya */
121 0x0BB0u, /* Tamil */ /* No Reph */
122 0x0C30u, /* Telugu */ /* Reph formed only with ZWJ */
123 0x0CB0u, /* Kannada */
124 0x0D30u, /* Malayalam */ /* No Reph, Logical Repha */
Behdad Esfahbod3a83d332013-02-12 12:14:10 -0500125
Behdad Esfahbod76271002014-07-11 14:54:42 -0400126 0x0DBBu, /* Sinhala */ /* Reph formed only with ZWJ */
Behdad Esfahbod3a83d332013-02-12 12:14:10 -0500127
Behdad Esfahbod76271002014-07-11 14:54:42 -0400128 0x179Au, /* Khmer */ /* No Reph, Visual Repha */
Behdad Esfahbod3a83d332013-02-12 12:14:10 -0500129};
130
Behdad Esfahbod3a83d332013-02-12 12:14:10 -0500131static inline bool
132is_ra (hb_codepoint_t u)
133{
134 for (unsigned int i = 0; i < ARRAY_LENGTH (ra_chars); i++)
135 if (u == ra_chars[i])
136 return true;
137 return false;
138}
139
140static inline bool
141is_one_of (const hb_glyph_info_t &info, unsigned int flags)
142{
143 /* If it ligated, all bets are off. */
Behdad Esfahboda1f7b282013-10-18 01:09:08 +0200144 if (_hb_glyph_info_ligated (&info)) return false;
Behdad Esfahbodf8160a42015-07-21 15:50:02 +0100145 return !!(FLAG_SAFE (info.indic_category()) & flags);
Behdad Esfahbod3a83d332013-02-12 12:14:10 -0500146}
147
Behdad Esfahbod3a83d332013-02-12 12:14:10 -0500148static inline bool
149is_joiner (const hb_glyph_info_t &info)
150{
151 return is_one_of (info, JOINER_FLAGS);
152}
153
Behdad Esfahbod3a83d332013-02-12 12:14:10 -0500154static inline bool
155is_consonant (const hb_glyph_info_t &info)
156{
157 return is_one_of (info, CONSONANT_FLAGS);
158}
159
Behdad Esfahbod3a83d332013-02-12 12:14:10 -0500160static inline bool
161is_halant_or_coeng (const hb_glyph_info_t &info)
162{
163 return is_one_of (info, HALANT_OR_COENG_FLAGS);
164}
165
166static inline void
167set_indic_properties (hb_glyph_info_t &info)
168{
169 hb_codepoint_t u = info.codepoint;
170 unsigned int type = hb_indic_get_categories (u);
Behdad Esfahbod76271002014-07-11 14:54:42 -0400171 indic_category_t cat = (indic_category_t) (type & 0x7Fu);
Behdad Esfahbod3a83d332013-02-12 12:14:10 -0500172 indic_position_t pos = (indic_position_t) (type >> 8);
173
174
175 /*
176 * Re-assign category
177 */
178
Behdad Esfahbodc11fc682014-05-22 18:41:49 -0400179 /* The following act more like the Bindus. */
Ebrahim Byagowi3b0e47c2017-06-19 14:47:09 +0430180 if (unlikely (hb_in_range<hb_codepoint_t> (u, 0x0953u, 0x0954u)))
Behdad Esfahbodc11fc682014-05-22 18:41:49 -0400181 cat = OT_SM;
Behdad Esfahbod131e17f2014-05-22 19:32:51 -0400182 /* The following act like consonants. */
Ebrahim Byagowi3b0e47c2017-06-19 14:47:09 +0430183 else if (unlikely (hb_in_ranges<hb_codepoint_t> (u, 0x0A72u, 0x0A73u,
Behdad Esfahbod76271002014-07-11 14:54:42 -0400184 0x1CF5u, 0x1CF6u)))
Behdad Esfahbod131e17f2014-05-22 19:32:51 -0400185 cat = OT_C;
Behdad Esfahbodecb98ba2014-05-22 19:36:21 -0400186 /* TODO: The following should only be allowed after a Visarga.
187 * For now, just treat them like regular tone marks. */
Ebrahim Byagowi3b0e47c2017-06-19 14:47:09 +0430188 else if (unlikely (hb_in_range<hb_codepoint_t> (u, 0x1CE2u, 0x1CE8u)))
Behdad Esfahbodecb98ba2014-05-22 19:36:21 -0400189 cat = OT_A;
Behdad Esfahbode9b2a4c2014-05-23 15:49:10 -0400190 /* TODO: The following should only be allowed after some of
191 * the nasalization marks, maybe only for U+1CE9..U+1CF1.
192 * For now, just treat them like tone marks. */
Behdad Esfahbod76271002014-07-11 14:54:42 -0400193 else if (unlikely (u == 0x1CEDu))
Behdad Esfahbode9b2a4c2014-05-23 15:49:10 -0400194 cat = OT_A;
Behdad Esfahbodd19f8e82014-05-23 15:45:50 -0400195 /* The following take marks in standalone clusters, similar to Avagraha. */
Ebrahim Byagowi3b0e47c2017-06-19 14:47:09 +0430196 else if (unlikely (hb_in_ranges<hb_codepoint_t> (u, 0xA8F2u, 0xA8F7u,
Behdad Esfahbod76271002014-07-11 14:54:42 -0400197 0x1CE9u, 0x1CECu,
198 0x1CEEu, 0x1CF1u)))
Behdad Esfahbodd19f8e82014-05-23 15:45:50 -0400199 {
200 cat = OT_Symbol;
201 ASSERT_STATIC ((int) INDIC_SYLLABIC_CATEGORY_AVAGRAHA == OT_Symbol);
202 }
Ebrahim Byagowi65f64d12017-07-19 02:42:53 +0430203 else if (unlikely (hb_in_range<hb_codepoint_t> (u, 0x17CDu, 0x17D1u) ||
Behdad Esfahbod3cc84f42017-07-14 15:50:22 +0100204 u == 0x17CBu || u == 0x17D3u || u == 0x17DDu)) /* Khmer Various signs */
205 {
Behdad Esfahbodf1cd7ca2017-07-14 15:59:40 +0100206 /* These can occur mid-syllable (eg. before matras), even though Unicode marks them as Syllable_Modifier.
207 * https://github.com/roozbehp/unicode-data/issues/5 */
Behdad Esfahbod3cc84f42017-07-14 15:50:22 +0100208 cat = OT_M;
209 pos = POS_ABOVE_C;
210 }
211
Behdad Esfahbod819cc362017-10-02 09:03:16 -0400212 /* According to ScriptExtensions.txt, these Grantha marks may also be used in Tamil,
213 * so the Indic shaper needs to know their categories. */
214 else if (unlikely (u == 0x11303u)) cat = OT_SM;
215 else if (unlikely (u == 0x1133cu)) cat = OT_N;
216
Behdad Esfahbod1a0a3562017-10-02 08:49:23 -0400217 else if (unlikely (u == 0x0980u)) cat = OT_PLACEHOLDER; /* https://github.com/behdad/harfbuzz/issues/538 */
Behdad Esfahbod76271002014-07-11 14:54:42 -0400218 else if (unlikely (u == 0x17C6u)) cat = OT_N; /* Khmer Bindu doesn't like to be repositioned. */
Ebrahim Byagowi3b0e47c2017-06-19 14:47:09 +0430219 else if (unlikely (hb_in_range<hb_codepoint_t> (u, 0x2010u, 0x2011u)))
Behdad Esfahbod76271002014-07-11 14:54:42 -0400220 cat = OT_PLACEHOLDER;
221 else if (unlikely (u == 0x25CCu)) cat = OT_DOTTEDCIRCLE;
Behdad Esfahbod3a83d332013-02-12 12:14:10 -0500222
223
224 /*
225 * Re-assign position.
226 */
227
Behdad Esfahbodf8160a42015-07-21 15:50:02 +0100228 if ((FLAG_SAFE (cat) & CONSONANT_FLAGS))
Behdad Esfahbod3a83d332013-02-12 12:14:10 -0500229 {
Behdad Esfahbodc4e71ff2013-10-17 17:04:47 +0200230 pos = POS_BASE_C;
Behdad Esfahbod3a83d332013-02-12 12:14:10 -0500231 if (is_ra (u))
232 cat = OT_Ra;
233 }
234 else if (cat == OT_M)
235 {
236 pos = matra_position (u, pos);
237 }
Behdad Esfahbodf8160a42015-07-21 15:50:02 +0100238 else if ((FLAG_SAFE (cat) & (FLAG (OT_SM) | FLAG (OT_VD) | FLAG (OT_A) | FLAG (OT_Symbol))))
Behdad Esfahbod3a83d332013-02-12 12:14:10 -0500239 {
240 pos = POS_SMVD;
241 }
242
Behdad Esfahbod76271002014-07-11 14:54:42 -0400243 if (unlikely (u == 0x0B01u)) pos = POS_BEFORE_SUB; /* Oriya Bindu is BeforeSub in the spec. */
Behdad Esfahbod3a83d332013-02-12 12:14:10 -0500244
245
246
247 info.indic_category() = cat;
248 info.indic_position() = pos;
249}
250
/*
 * Things above this line should ideally be moved to the Indic table itself.
 */


/*
 * Indic configurations.  Note that we do not want to keep every single script-specific
 * behavior in these tables necessarily.  This should mainly be used for per-script
 * properties that are cheaper keeping here, than in the code.  Ie. if, say, one and
 * only one script has an exception, that one script can be if'ed directly in the code,
 * instead of adding a new flag in these structs.
 */
263
/* Per-script base-position setting stored in indic_config_t::base_pos. */
enum base_position_t {
  BASE_POS_FIRST,
  BASE_POS_LAST_SINHALA,
  BASE_POS_LAST
};
269enum reph_position_t {
Behdad Esfahbod11b0e202012-08-02 14:21:40 -0400270 REPH_POS_AFTER_MAIN = POS_AFTER_MAIN,
271 REPH_POS_BEFORE_SUB = POS_BEFORE_SUB,
272 REPH_POS_AFTER_SUB = POS_AFTER_SUB,
273 REPH_POS_BEFORE_POST = POS_BEFORE_POST,
Behdad Esfahbod74f4bbf2013-10-17 19:07:53 +0200274 REPH_POS_AFTER_POST = POS_AFTER_POST,
275 REPH_POS_DONT_CARE = POS_RA_TO_BECOME_REPH
Behdad Esfahbod11b0e202012-08-02 14:21:40 -0400276};
/* How a script forms reph; stored in indic_config_t::reph_mode. */
enum reph_mode_t {
  REPH_MODE_IMPLICIT,  /* Reph formed out of initial Ra,H sequence. */
  REPH_MODE_EXPLICIT,  /* Reph formed out of initial Ra,H,ZWJ sequence. */
  REPH_MODE_VIS_REPHA, /* Encoded Repha character, no reordering needed. */
  REPH_MODE_LOG_REPHA  /* Encoded Repha character, needs reordering. */
};
/* Where a script applies the below-forms feature; stored in
 * indic_config_t::blwf_mode. */
enum blwf_mode_t {
  BLWF_MODE_PRE_AND_POST, /* Below-forms feature applied to pre-base and post-base. */
  BLWF_MODE_POST_ONLY     /* Below-forms feature applied to post-base only. */
};
Behdad Esfahbod11b0e202012-08-02 14:21:40 -0400287struct indic_config_t
288{
289 hb_script_t script;
290 bool has_old_spec;
291 hb_codepoint_t virama;
292 base_position_t base_pos;
293 reph_position_t reph_pos;
294 reph_mode_t reph_mode;
Behdad Esfahbod8acbb6b2013-10-15 12:15:49 +0200295 blwf_mode_t blwf_mode;
Behdad Esfahbod11b0e202012-08-02 14:21:40 -0400296};
297
298static const indic_config_t indic_configs[] =
299{
300 /* Default. Should be first. */
Behdad Esfahbod3c1666c2016-05-06 16:05:07 +0100301 {HB_SCRIPT_INVALID, false, 0,BASE_POS_LAST, REPH_POS_BEFORE_POST,REPH_MODE_IMPLICIT, BLWF_MODE_PRE_AND_POST},
302 {HB_SCRIPT_DEVANAGARI,true, 0x094Du,BASE_POS_LAST, REPH_POS_BEFORE_POST,REPH_MODE_IMPLICIT, BLWF_MODE_PRE_AND_POST},
303 {HB_SCRIPT_BENGALI, true, 0x09CDu,BASE_POS_LAST, REPH_POS_AFTER_SUB, REPH_MODE_IMPLICIT, BLWF_MODE_PRE_AND_POST},
304 {HB_SCRIPT_GURMUKHI, true, 0x0A4Du,BASE_POS_LAST, REPH_POS_BEFORE_SUB, REPH_MODE_IMPLICIT, BLWF_MODE_PRE_AND_POST},
305 {HB_SCRIPT_GUJARATI, true, 0x0ACDu,BASE_POS_LAST, REPH_POS_BEFORE_POST,REPH_MODE_IMPLICIT, BLWF_MODE_PRE_AND_POST},
306 {HB_SCRIPT_ORIYA, true, 0x0B4Du,BASE_POS_LAST, REPH_POS_AFTER_MAIN, REPH_MODE_IMPLICIT, BLWF_MODE_PRE_AND_POST},
307 {HB_SCRIPT_TAMIL, true, 0x0BCDu,BASE_POS_LAST, REPH_POS_AFTER_POST, REPH_MODE_IMPLICIT, BLWF_MODE_PRE_AND_POST},
308 {HB_SCRIPT_TELUGU, true, 0x0C4Du,BASE_POS_LAST, REPH_POS_AFTER_POST, REPH_MODE_EXPLICIT, BLWF_MODE_POST_ONLY},
309 {HB_SCRIPT_KANNADA, true, 0x0CCDu,BASE_POS_LAST, REPH_POS_AFTER_POST, REPH_MODE_IMPLICIT, BLWF_MODE_POST_ONLY},
310 {HB_SCRIPT_MALAYALAM, true, 0x0D4Du,BASE_POS_LAST, REPH_POS_AFTER_MAIN, REPH_MODE_LOG_REPHA,BLWF_MODE_PRE_AND_POST},
Behdad Esfahbod76271002014-07-11 14:54:42 -0400311 {HB_SCRIPT_SINHALA, false,0x0DCAu,BASE_POS_LAST_SINHALA,
Behdad Esfahbod3c1666c2016-05-06 16:05:07 +0100312 REPH_POS_AFTER_MAIN, REPH_MODE_EXPLICIT, BLWF_MODE_PRE_AND_POST},
313 {HB_SCRIPT_KHMER, false,0x17D2u,BASE_POS_FIRST,REPH_POS_DONT_CARE, REPH_MODE_VIS_REPHA,BLWF_MODE_PRE_AND_POST},
Behdad Esfahbod11b0e202012-08-02 14:21:40 -0400314};
315
316
317
/*
 * Indic shaper.
 */
Behdad Esfahbod9ccc6382012-07-19 12:32:16 -0400321
Behdad Esfahbodeed903b2012-05-11 20:50:53 +0200322struct feature_list_t {
Behdad Esfahbodc7fe56a2011-06-24 19:05:34 -0400323 hb_tag_t tag;
Behdad Esfahbodec544862013-02-14 11:25:10 -0500324 hb_ot_map_feature_flags_t flags;
Behdad Esfahbodeed903b2012-05-11 20:50:53 +0200325};
326
327static const feature_list_t
Behdad Esfahbod85fc6c42012-08-02 12:21:44 -0400328indic_features[] =
Behdad Esfahbodb9ddbd52011-06-02 17:43:12 -0400329{
Behdad Esfahbod85fc6c42012-08-02 12:21:44 -0400330 /*
331 * Basic features.
332 * These features are applied in order, one at a time, after initial_reordering.
333 */
Behdad Esfahboda8cf7b42013-03-19 05:53:26 -0400334 {HB_TAG('n','u','k','t'), F_GLOBAL},
335 {HB_TAG('a','k','h','n'), F_GLOBAL},
336 {HB_TAG('r','p','h','f'), F_NONE},
337 {HB_TAG('r','k','r','f'), F_GLOBAL},
338 {HB_TAG('p','r','e','f'), F_NONE},
339 {HB_TAG('b','l','w','f'), F_NONE},
Behdad Esfahboda8cf7b42013-03-19 05:53:26 -0400340 {HB_TAG('a','b','v','f'), F_NONE},
Behdad Esfahboda01cbf62013-10-15 16:37:53 +0200341 {HB_TAG('h','a','l','f'), F_NONE},
Behdad Esfahboda8cf7b42013-03-19 05:53:26 -0400342 {HB_TAG('p','s','t','f'), F_NONE},
Behdad Esfahboda8cf7b42013-03-19 05:53:26 -0400343 {HB_TAG('v','a','t','u'), F_GLOBAL},
344 {HB_TAG('c','j','c','t'), F_GLOBAL},
Behdad Esfahboda01cbf62013-10-15 16:37:53 +0200345 {HB_TAG('c','f','a','r'), F_NONE},
Behdad Esfahbod85fc6c42012-08-02 12:21:44 -0400346 /*
347 * Other features.
348 * These features are applied all at once, after final_reordering.
Behdad Esfahboda01cbf62013-10-15 16:37:53 +0200349 * Default Bengali font in Windows for example has intermixed
350 * lookups for init,pres,abvs,blws features.
Behdad Esfahbod85fc6c42012-08-02 12:21:44 -0400351 */
Behdad Esfahbodec544862013-02-14 11:25:10 -0500352 {HB_TAG('i','n','i','t'), F_NONE},
353 {HB_TAG('p','r','e','s'), F_GLOBAL},
354 {HB_TAG('a','b','v','s'), F_GLOBAL},
355 {HB_TAG('b','l','w','s'), F_GLOBAL},
356 {HB_TAG('p','s','t','s'), F_GLOBAL},
357 {HB_TAG('h','a','l','n'), F_GLOBAL},
Behdad Esfahbod85fc6c42012-08-02 12:21:44 -0400358 /* Positioning features, though we don't care about the types. */
Behdad Esfahbodec544862013-02-14 11:25:10 -0500359 {HB_TAG('d','i','s','t'), F_GLOBAL},
360 {HB_TAG('a','b','v','m'), F_GLOBAL},
361 {HB_TAG('b','l','w','m'), F_GLOBAL},
Behdad Esfahbodc7fe56a2011-06-24 19:05:34 -0400362};
363
/*
 * Must be in the same order as the indic_features array.
 *
 * Each enumerator is the index of the corresponding indic_features[] row.
 * INDIC_BASIC_FEATURES is the index of the first non-basic feature, i.e.
 * the number of basic features.
 */
enum {
  _NUKT,
  _AKHN,
  RPHF,
  _RKRF,
  PREF,
  BLWF,
  ABVF,
  HALF,
  PSTF,
  _VATU,
  _CJCT,
  CFAR,

  INIT,
  _PRES,
  _ABVS,
  _BLWS,
  _PSTS,
  _HALN,
  _DIST,
  _ABVM,
  _BLWM,

  INDIC_NUM_FEATURES,
  INDIC_BASIC_FEATURES = INIT /* Don't forget to update this! */
};
394
Behdad Esfahbod743807a2011-07-29 16:37:02 -0400395static void
Behdad Esfahbod166b5cf2012-09-07 14:55:07 -0400396setup_syllables (const hb_ot_shape_plan_t *plan,
397 hb_font_t *font,
398 hb_buffer_t *buffer);
399static void
Behdad Esfahbod8bb5deb2012-08-02 10:07:58 -0400400initial_reordering (const hb_ot_shape_plan_t *plan,
Behdad Esfahbodafbcc242012-08-02 08:36:40 -0400401 hb_font_t *font,
Behdad Esfahbod3e38c0f2012-08-02 09:44:18 -0400402 hb_buffer_t *buffer);
Behdad Esfahbodf6fd3782011-07-08 00:22:40 -0400403static void
Behdad Esfahbod8bb5deb2012-08-02 10:07:58 -0400404final_reordering (const hb_ot_shape_plan_t *plan,
Behdad Esfahbodafbcc242012-08-02 08:36:40 -0400405 hb_font_t *font,
Behdad Esfahbod3e38c0f2012-08-02 09:44:18 -0400406 hb_buffer_t *buffer);
Behdad Esfahbod30145272013-10-15 13:47:27 +0200407static void
408clear_syllables (const hb_ot_shape_plan_t *plan,
409 hb_font_t *font,
410 hb_buffer_t *buffer);
Behdad Esfahbodb9ddbd52011-06-02 17:43:12 -0400411
Behdad Esfahbod693918e2012-07-30 21:08:51 -0400412static void
Behdad Esfahbod16c6a272012-08-02 09:38:28 -0400413collect_features_indic (hb_ot_shape_planner_t *plan)
Behdad Esfahbodb9ddbd52011-06-02 17:43:12 -0400414{
Behdad Esfahbod16c6a272012-08-02 09:38:28 -0400415 hb_ot_map_builder_t *map = &plan->map;
416
Behdad Esfahbod166b5cf2012-09-07 14:55:07 -0400417 /* Do this before any lookups have been applied. */
418 map->add_gsub_pause (setup_syllables);
419
Behdad Esfahbode7ffcfa2013-02-14 11:05:56 -0500420 map->add_global_bool_feature (HB_TAG('l','o','c','l'));
Behdad Esfahboda54a5502011-07-20 16:42:10 -0400421 /* The Indic specs do not require ccmp, but we apply it here since if
422 * there is a use of it, it's typically at the beginning. */
Behdad Esfahbode7ffcfa2013-02-14 11:05:56 -0500423 map->add_global_bool_feature (HB_TAG('c','c','m','p'));
Behdad Esfahbodf6fd3782011-07-08 00:22:40 -0400424
Behdad Esfahbodf6fd3782011-07-08 00:22:40 -0400425
Behdad Esfahbod85fc6c42012-08-02 12:21:44 -0400426 unsigned int i = 0;
427 map->add_gsub_pause (initial_reordering);
428 for (; i < INDIC_BASIC_FEATURES; i++) {
Behdad Esfahbode359a4b2017-07-14 14:14:35 +0100429 map->add_feature (indic_features[i].tag, 1, indic_features[i].flags | F_MANUAL_ZWJ | F_MANUAL_ZWNJ);
Behdad Esfahbod3e38c0f2012-08-02 09:44:18 -0400430 map->add_gsub_pause (NULL);
Behdad Esfahbod412b9182012-05-09 11:07:18 +0200431 }
Behdad Esfahbod3e38c0f2012-08-02 09:44:18 -0400432 map->add_gsub_pause (final_reordering);
Behdad Esfahbod85fc6c42012-08-02 12:21:44 -0400433 for (; i < INDIC_NUM_FEATURES; i++) {
Behdad Esfahbode359a4b2017-07-14 14:14:35 +0100434 map->add_feature (indic_features[i].tag, 1, indic_features[i].flags | F_MANUAL_ZWJ | F_MANUAL_ZWNJ);
Behdad Esfahbod85fc6c42012-08-02 12:21:44 -0400435 }
Behdad Esfahbod42d0f552013-10-17 13:05:05 +0200436
437 map->add_global_bool_feature (HB_TAG('c','a','l','t'));
438 map->add_global_bool_feature (HB_TAG('c','l','i','g'));
439
Behdad Esfahbod30145272013-10-15 13:47:27 +0200440 map->add_gsub_pause (clear_syllables);
Behdad Esfahbodb9ddbd52011-06-02 17:43:12 -0400441}
442
Behdad Esfahbod693918e2012-07-30 21:08:51 -0400443static void
Behdad Esfahbod16c6a272012-08-02 09:38:28 -0400444override_features_indic (hb_ot_shape_planner_t *plan)
Behdad Esfahbodd96838e2012-07-16 20:26:57 -0400445{
Behdad Esfahbodeb102332013-10-15 15:26:44 +0200446 /* Uniscribe does not apply 'kern' in Khmer. */
Behdad Esfahbodbab02d32013-02-12 15:26:45 -0500447 if (hb_options ().uniscribe_bug_compatible)
Behdad Esfahbodeb102332013-10-15 15:26:44 +0200448 {
449 switch ((hb_tag_t) plan->props.script)
450 {
451 case HB_SCRIPT_KHMER:
Behdad Esfahbod9ac6b012013-10-17 16:27:38 +0200452 plan->map.add_feature (HB_TAG('k','e','r','n'), 0, F_GLOBAL);
Behdad Esfahbodeb102332013-10-15 15:26:44 +0200453 break;
454 }
455 }
Behdad Esfahbod6b389dd2012-11-12 11:02:56 -0800456
Behdad Esfahbodec544862013-02-14 11:25:10 -0500457 plan->map.add_feature (HB_TAG('l','i','g','a'), 0, F_GLOBAL);
Behdad Esfahbodd96838e2012-07-16 20:26:57 -0400458}
459
Behdad Esfahbod867361c2011-06-17 18:35:46 -0400460
Behdad Esfahbod85fc6c42012-08-02 12:21:44 -0400461struct would_substitute_feature_t
Behdad Esfahboda8c6da92012-08-02 10:46:34 -0400462{
Behdad Esfahbodb5a0f692013-10-17 18:04:23 +0200463 inline void init (const hb_ot_map_t *map, hb_tag_t feature_tag, bool zero_context_)
Behdad Esfahboda8c6da92012-08-02 10:46:34 -0400464 {
Behdad Esfahbodb5a0f692013-10-17 18:04:23 +0200465 zero_context = zero_context_;
Behdad Esfahboda8c6da92012-08-02 10:46:34 -0400466 map->get_stage_lookups (0/*GSUB*/,
467 map->get_feature_stage (0/*GSUB*/, feature_tag),
468 &lookups, &count);
469 }
470
Behdad Esfahbod81449362013-03-05 20:08:59 -0500471 inline bool would_substitute (const hb_codepoint_t *glyphs,
472 unsigned int glyphs_count,
Behdad Esfahbod81449362013-03-05 20:08:59 -0500473 hb_face_t *face) const
Behdad Esfahboda8c6da92012-08-02 10:46:34 -0400474 {
475 for (unsigned int i = 0; i < count; i++)
Behdad Esfahbod362a9902012-11-15 14:57:31 -0800476 if (hb_ot_layout_lookup_would_substitute_fast (face, lookups[i].index, glyphs, glyphs_count, zero_context))
Behdad Esfahboda8c6da92012-08-02 10:46:34 -0400477 return true;
478 return false;
479 }
480
481 private:
482 const hb_ot_map_t::lookup_map_t *lookups;
483 unsigned int count;
Behdad Esfahbodb5a0f692013-10-17 18:04:23 +0200484 bool zero_context;
Behdad Esfahboda8c6da92012-08-02 10:46:34 -0400485};
486
487struct indic_shape_plan_t
488{
Behdad Esfahbod85fc6c42012-08-02 12:21:44 -0400489 ASSERT_POD ();
Behdad Esfahbod914ffaa2012-08-02 11:03:39 -0400490
491 inline bool get_virama_glyph (hb_font_t *font, hb_codepoint_t *pglyph) const
492 {
493 hb_codepoint_t glyph = virama_glyph;
494 if (unlikely (virama_glyph == (hb_codepoint_t) -1))
495 {
Behdad Esfahbod8b5bc142016-02-24 19:05:23 +0900496 if (!config->virama || !font->get_nominal_glyph (config->virama, &glyph))
Behdad Esfahbod914ffaa2012-08-02 11:03:39 -0400497 glyph = 0;
498 /* Technically speaking, the spec says we should apply 'locl' to virama too.
499 * Maybe one day... */
500
Behdad Esfahbod8b5bc142016-02-24 19:05:23 +0900501 /* Our get_nominal_glyph() function needs a font, so we can't get the virama glyph
Behdad Esfahbod914ffaa2012-08-02 11:03:39 -0400502 * during shape planning... Instead, overwrite it here. It's safe. Don't worry! */
503 (const_cast<indic_shape_plan_t *> (this))->virama_glyph = glyph;
504 }
505
506 *pglyph = glyph;
507 return glyph != 0;
508 }
Behdad Esfahbod85fc6c42012-08-02 12:21:44 -0400509
Behdad Esfahbod11b0e202012-08-02 14:21:40 -0400510 const indic_config_t *config;
Behdad Esfahbod85fc6c42012-08-02 12:21:44 -0400511
512 bool is_old_spec;
Behdad Esfahbod85fc6c42012-08-02 12:21:44 -0400513 hb_codepoint_t virama_glyph;
514
Behdad Esfahbodf2c0f592012-11-12 14:02:02 -0800515 would_substitute_feature_t rphf;
Behdad Esfahbod85fc6c42012-08-02 12:21:44 -0400516 would_substitute_feature_t pref;
517 would_substitute_feature_t blwf;
518 would_substitute_feature_t pstf;
519
520 hb_mask_t mask_array[INDIC_NUM_FEATURES];
Behdad Esfahboda8c6da92012-08-02 10:46:34 -0400521};
522
523static void *
524data_create_indic (const hb_ot_shape_plan_t *plan)
525{
Behdad Esfahbod85fc6c42012-08-02 12:21:44 -0400526 indic_shape_plan_t *indic_plan = (indic_shape_plan_t *) calloc (1, sizeof (indic_shape_plan_t));
527 if (unlikely (!indic_plan))
Behdad Esfahboda8c6da92012-08-02 10:46:34 -0400528 return NULL;
529
Behdad Esfahbod11b0e202012-08-02 14:21:40 -0400530 indic_plan->config = &indic_configs[0];
531 for (unsigned int i = 1; i < ARRAY_LENGTH (indic_configs); i++)
532 if (plan->props.script == indic_configs[i].script) {
533 indic_plan->config = &indic_configs[i];
534 break;
Behdad Esfahbod85fc6c42012-08-02 12:21:44 -0400535 }
Behdad Esfahbod11b0e202012-08-02 14:21:40 -0400536
Behdad Esfahbod76271002014-07-11 14:54:42 -0400537 indic_plan->is_old_spec = indic_plan->config->has_old_spec && ((plan->map.chosen_script[0] & 0x000000FFu) != '2');
Behdad Esfahbod11b0e202012-08-02 14:21:40 -0400538 indic_plan->virama_glyph = (hb_codepoint_t) -1;
Behdad Esfahboda8c6da92012-08-02 10:46:34 -0400539
Behdad Esfahbodb5a0f692013-10-17 18:04:23 +0200540 /* Use zero-context would_substitute() matching for new-spec of the main
Behdad Esfahbod508cc3d2015-12-17 17:31:17 +0000541 * Indic scripts, and scripts with one spec only, but not for old-specs.
542 * The new-spec for all dual-spec scripts says zero-context matching happens.
543 *
544 * However, testing with Malayalam shows that old and new spec both allow
545 * context. Testing with Bengali new-spec however shows that it doesn't.
546 * So, the heuristic here is the way it is. It should *only* be changed,
547 * as we discover more cases of what Windows does. DON'T TOUCH OTHERWISE.
548 */
549 bool zero_context = !indic_plan->is_old_spec && plan->props.script != HB_SCRIPT_MALAYALAM;
Behdad Esfahbodb5a0f692013-10-17 18:04:23 +0200550 indic_plan->rphf.init (&plan->map, HB_TAG('r','p','h','f'), zero_context);
551 indic_plan->pref.init (&plan->map, HB_TAG('p','r','e','f'), zero_context);
552 indic_plan->blwf.init (&plan->map, HB_TAG('b','l','w','f'), zero_context);
553 indic_plan->pstf.init (&plan->map, HB_TAG('p','s','t','f'), zero_context);
Behdad Esfahbod85fc6c42012-08-02 12:21:44 -0400554
555 for (unsigned int i = 0; i < ARRAY_LENGTH (indic_plan->mask_array); i++)
Behdad Esfahbodec544862013-02-14 11:25:10 -0500556 indic_plan->mask_array[i] = (indic_features[i].flags & F_GLOBAL) ?
557 0 : plan->map.get_1_mask (indic_features[i].tag);
Behdad Esfahbod85fc6c42012-08-02 12:21:44 -0400558
559 return indic_plan;
Behdad Esfahboda8c6da92012-08-02 10:46:34 -0400560}
561
/* Releases a plan returned by data_create_indic(). */
static void
data_destroy_indic (void *data)
{
  free (data);
}
567
568static indic_position_t
569consonant_position_from_face (const indic_shape_plan_t *indic_plan,
Behdad Esfahbod684fe592013-10-17 18:30:06 +0200570 const hb_codepoint_t consonant,
571 const hb_codepoint_t virama,
Behdad Esfahbod81449362013-03-05 20:08:59 -0500572 hb_face_t *face)
Behdad Esfahboda8c6da92012-08-02 10:46:34 -0400573{
Behdad Esfahbod81449362013-03-05 20:08:59 -0500574 /* For old-spec, the order of glyphs is Consonant,Virama,
575 * whereas for new-spec, it's Virama,Consonant. However,
576 * some broken fonts (like Free Sans) simply copied lookups
577 * from old-spec to new-spec without modification.
578 * And oddly enough, Uniscribe seems to respect those lookups.
579 * Eg. in the sequence U+0924,U+094D,U+0930, Uniscribe finds
580 * base at 0. The font however, only has lookups matching
581 * 930,94D in 'blwf', not the expected 94D,930 (with new-spec
582 * table). As such, we simply match both sequences. Seems
583 * to work. */
Behdad Esfahbod684fe592013-10-17 18:30:06 +0200584 hb_codepoint_t glyphs[3] = {virama, consonant, virama};
Behdad Esfahbodb5a0f692013-10-17 18:04:23 +0200585 if (indic_plan->blwf.would_substitute (glyphs , 2, face) ||
Behdad Esfahbod684fe592013-10-17 18:30:06 +0200586 indic_plan->blwf.would_substitute (glyphs+1, 2, face))
Behdad Esfahbod81449362013-03-05 20:08:59 -0500587 return POS_BELOW_C;
Behdad Esfahbodb5a0f692013-10-17 18:04:23 +0200588 if (indic_plan->pstf.would_substitute (glyphs , 2, face) ||
Behdad Esfahbod684fe592013-10-17 18:30:06 +0200589 indic_plan->pstf.would_substitute (glyphs+1, 2, face))
Behdad Esfahbod81449362013-03-05 20:08:59 -0500590 return POS_POST_C;
Behdad Esfahbod3c1666c2016-05-06 16:05:07 +0100591 if (indic_plan->pref.would_substitute (glyphs , 2, face) ||
592 indic_plan->pref.would_substitute (glyphs+1, 2, face))
Behdad Esfahbodae9a5832013-10-17 12:24:55 +0200593 return POS_POST_C;
Behdad Esfahboda8c6da92012-08-02 10:46:34 -0400594 return POS_BASE_C;
595}
596
597
/* Kinds of syllable/cluster distinguished by this shaper (presumably
 * assigned by the syllable machine included right after this enum;
 * confirm there). */
enum syllable_type_t {
  consonant_syllable,
  vowel_syllable,
  standalone_cluster,
  symbol_cluster,
  broken_cluster,
  non_indic_cluster
};
606
607#include "hb-ot-shape-complex-indic-machine.hh"
608
609
Behdad Esfahbod693918e2012-07-30 21:08:51 -0400610static void
Behdad Esfahbod16c6a272012-08-02 09:38:28 -0400611setup_masks_indic (const hb_ot_shape_plan_t *plan HB_UNUSED,
612 hb_buffer_t *buffer,
613 hb_font_t *font HB_UNUSED)
Behdad Esfahbod24eacf12012-08-02 08:42:11 -0400614{
615 HB_BUFFER_ALLOCATE_VAR (buffer, indic_category);
616 HB_BUFFER_ALLOCATE_VAR (buffer, indic_position);
617
618 /* We cannot setup masks here. We save information about characters
619 * and setup masks later on in a pause-callback. */
620
621 unsigned int count = buffer->len;
Behdad Esfahbod7cd33f22014-07-17 14:22:11 -0400622 hb_glyph_info_t *info = buffer->info;
Behdad Esfahbod24eacf12012-08-02 08:42:11 -0400623 for (unsigned int i = 0; i < count; i++)
Behdad Esfahbod7cd33f22014-07-17 14:22:11 -0400624 set_indic_properties (info[i]);
Behdad Esfahbod24eacf12012-08-02 08:42:11 -0400625}
626
Behdad Esfahbod166b5cf2012-09-07 14:55:07 -0400627static void
628setup_syllables (const hb_ot_shape_plan_t *plan HB_UNUSED,
629 hb_font_t *font HB_UNUSED,
630 hb_buffer_t *buffer)
631{
632 find_syllables (buffer);
Behdad Esfahbod9e005c52017-08-10 18:45:33 -0700633 foreach_syllable (buffer, start, end)
634 buffer->unsafe_to_break (start, end);
Behdad Esfahbod166b5cf2012-09-07 14:55:07 -0400635}
636
Behdad Esfahbod24eacf12012-08-02 08:42:11 -0400637static int
638compare_indic_order (const hb_glyph_info_t *pa, const hb_glyph_info_t *pb)
639{
640 int a = pa->indic_position();
641 int b = pb->indic_position();
642
643 return a < b ? -1 : a == b ? 0 : +1;
644}
645
646
647
648static void
Behdad Esfahbod8bb5deb2012-08-02 10:07:58 -0400649update_consonant_positions (const hb_ot_shape_plan_t *plan,
Behdad Esfahbod85fc6c42012-08-02 12:21:44 -0400650 hb_font_t *font,
651 hb_buffer_t *buffer)
Behdad Esfahbod8ef3d532012-08-02 07:53:18 -0400652{
Behdad Esfahboda8c6da92012-08-02 10:46:34 -0400653 const indic_shape_plan_t *indic_plan = (const indic_shape_plan_t *) plan->data;
Behdad Esfahbod8ef3d532012-08-02 07:53:18 -0400654
Behdad Esfahbodc4e71ff2013-10-17 17:04:47 +0200655 if (indic_plan->config->base_pos != BASE_POS_LAST)
656 return;
657
Behdad Esfahbod684fe592013-10-17 18:30:06 +0200658 hb_codepoint_t virama;
659 if (indic_plan->get_virama_glyph (font, &virama))
Behdad Esfahbod8ef3d532012-08-02 07:53:18 -0400660 {
661 hb_face_t *face = font->face;
662 unsigned int count = buffer->len;
Behdad Esfahbod7cd33f22014-07-17 14:22:11 -0400663 hb_glyph_info_t *info = buffer->info;
Behdad Esfahbod8ef3d532012-08-02 07:53:18 -0400664 for (unsigned int i = 0; i < count; i++)
Behdad Esfahbod7cd33f22014-07-17 14:22:11 -0400665 if (info[i].indic_position() == POS_BASE_C)
666 {
667 hb_codepoint_t consonant = info[i].codepoint;
668 info[i].indic_position() = consonant_position_from_face (indic_plan, consonant, virama, face);
Behdad Esfahbod8ef3d532012-08-02 07:53:18 -0400669 }
670 }
671}
672
Behdad Esfahbod867361c2011-06-17 18:35:46 -0400673
Behdad Esfahbod7ea58db2012-05-11 18:58:57 +0200674/* Rules from:
675 * https://www.microsoft.com/typography/otfntdev/devanot/shaping.aspx */
676
Behdad Esfahbod743807a2011-07-29 16:37:02 -0400677static void
Behdad Esfahbodf2c0f592012-11-12 14:02:02 -0800678initial_reordering_consonant_syllable (const hb_ot_shape_plan_t *plan,
679 hb_face_t *face,
680 hb_buffer_t *buffer,
Behdad Esfahbodef24cc82012-05-09 17:56:03 +0200681 unsigned int start, unsigned int end)
Behdad Esfahbod743807a2011-07-29 16:37:02 -0400682{
Behdad Esfahbod914ffaa2012-08-02 11:03:39 -0400683 const indic_shape_plan_t *indic_plan = (const indic_shape_plan_t *) plan->data;
Behdad Esfahbodee58f3b2011-07-30 19:15:53 -0400684 hb_glyph_info_t *info = buffer->info;
Behdad Esfahbod743807a2011-07-29 16:37:02 -0400685
Behdad Esfahbod617f4ac2012-05-13 16:48:03 +0200686
Behdad Esfahbod743807a2011-07-29 16:37:02 -0400687 /* 1. Find base consonant:
688 *
689 * The shaping engine finds the base consonant of the syllable, using the
690 * following algorithm: starting from the end of the syllable, move backwards
691 * until a consonant is found that does not have a below-base or post-base
692 * form (post-base forms have to follow below-base forms), or that is not a
693 * pre-base reordering Ra, or arrive at the first consonant. The consonant
694 * stopped at will be the base.
695 *
696 * o If the syllable starts with Ra + Halant (in a script that has Reph)
697 * and has more than one consonant, Ra is excluded from candidates for
698 * base consonants.
699 */
700
Behdad Esfahbod5e720712011-07-31 17:51:50 -0400701 unsigned int base = end;
Behdad Esfahbod76b34092012-05-09 11:43:43 +0200702 bool has_reph = false;
703
Behdad Esfahbod76b34092012-05-09 11:43:43 +0200704 {
Behdad Esfahbod617f4ac2012-05-13 16:48:03 +0200705 /* -> If the syllable starts with Ra + Halant (in a script that has Reph)
706 * and has more than one consonant, Ra is excluded from candidates for
707 * base consonants. */
708 unsigned int limit = start;
Behdad Esfahbodf175aa32013-10-18 02:07:44 +0200709 if (indic_plan->config->reph_pos != REPH_POS_DONT_CARE &&
Behdad Esfahbodefed40b2013-10-17 18:50:11 +0200710 indic_plan->mask_array[RPHF] &&
Behdad Esfahbod617f4ac2012-05-13 16:48:03 +0200711 start + 3 <= end &&
Behdad Esfahbod8b217f52012-12-21 15:48:32 -0500712 (
Behdad Esfahbod11b0e202012-08-02 14:21:40 -0400713 (indic_plan->config->reph_mode == REPH_MODE_IMPLICIT && !is_joiner (info[start + 2])) ||
714 (indic_plan->config->reph_mode == REPH_MODE_EXPLICIT && info[start + 2].indic_category() == OT_ZWJ)
Behdad Esfahbod3285e102012-07-18 17:22:14 -0400715 ))
Behdad Esfahbod617f4ac2012-05-13 16:48:03 +0200716 {
Behdad Esfahbodf2c0f592012-11-12 14:02:02 -0800717 /* See if it matches the 'rphf' feature. */
Behdad Esfahbod29531122014-05-15 14:04:02 -0600718 hb_codepoint_t glyphs[3] = {info[start].codepoint,
719 info[start + 1].codepoint,
720 indic_plan->config->reph_mode == REPH_MODE_EXPLICIT ?
721 info[start + 2].codepoint : 0};
722 if (indic_plan->rphf.would_substitute (glyphs, 2, face) ||
723 (indic_plan->config->reph_mode == REPH_MODE_EXPLICIT &&
724 indic_plan->rphf.would_substitute (glyphs, 3, face)))
Behdad Esfahbodf2c0f592012-11-12 14:02:02 -0800725 {
726 limit += 2;
727 while (limit < end && is_joiner (info[limit]))
728 limit++;
729 base = start;
730 has_reph = true;
731 }
Behdad Esfahbod8b217f52012-12-21 15:48:32 -0500732 } else if (indic_plan->config->reph_mode == REPH_MODE_LOG_REPHA && info[start].indic_category() == OT_Repha)
733 {
734 limit += 1;
735 while (limit < end && is_joiner (info[limit]))
736 limit++;
737 base = start;
738 has_reph = true;
739 }
Behdad Esfahbod743807a2011-07-29 16:37:02 -0400740
Behdad Esfahbod23b0e9d2012-08-26 14:30:18 -0400741 switch (indic_plan->config->base_pos)
Behdad Esfahbod14dbdd92012-07-18 13:13:03 -0400742 {
Behdad Esfahbod11b0e202012-08-02 14:21:40 -0400743 case BASE_POS_LAST:
744 {
745 /* -> starting from the end of the syllable, move backwards */
746 unsigned int i = end;
747 bool seen_below = false;
748 do {
749 i--;
750 /* -> until a consonant is found */
751 if (is_consonant (info[i]))
752 {
753 /* -> that does not have a below-base or post-base form
754 * (post-base forms have to follow below-base forms), */
755 if (info[i].indic_position() != POS_BELOW_C &&
756 (info[i].indic_position() != POS_POST_C || seen_below))
757 {
758 base = i;
759 break;
760 }
761 if (info[i].indic_position() == POS_BELOW_C)
762 seen_below = true;
763
764 /* -> or that is not a pre-base reordering Ra,
765 *
766 * IMPLEMENTATION NOTES:
767 *
Behdad Esfahbodfb7c1822013-03-06 00:53:24 -0500768 * Our pre-base reordering Ra's are marked POS_POST_C, so will be skipped
Behdad Esfahbod11b0e202012-08-02 14:21:40 -0400769 * by the logic above already.
770 */
771
772 /* -> or arrive at the first consonant. The consonant stopped at will
773 * be the base. */
774 base = i;
775 }
776 else
777 {
778 /* A ZWJ after a Halant stops the base search, and requests an explicit
779 * half form.
780 * A ZWJ before a Halant, requests a subjoined form instead, and hence
781 * search continues. This is particularly important for Bengali
Behdad Esfahbodc4be9912012-11-12 14:27:33 -0800782 * sequence Ra,H,Ya that should form Ya-Phalaa by subjoining Ya. */
Behdad Esfahbod11b0e202012-08-02 14:21:40 -0400783 if (start < i &&
784 info[i].indic_category() == OT_ZWJ &&
785 info[i - 1].indic_category() == OT_H)
786 break;
787 }
788 } while (i > limit);
789 }
790 break;
791
Behdad Esfahbode10453e2013-10-17 16:49:06 +0200792 case BASE_POS_LAST_SINHALA:
Behdad Esfahbod11b0e202012-08-02 14:21:40 -0400793 {
Behdad Esfahbodc4e71ff2013-10-17 17:04:47 +0200794 /* Sinhala base positioning is slightly different from main Indic, in that:
Behdad Esfahbodb082ef32014-04-25 11:48:10 -0700795 * 1. Its ZWJ behavior is different,
Behdad Esfahbodc4e71ff2013-10-17 17:04:47 +0200796 * 2. We don't need to look into the font for consonant positions.
797 */
Behdad Esfahbod11b0e202012-08-02 14:21:40 -0400798
799 if (!has_reph)
800 base = limit;
801
802 /* Find the last base consonant that is not blocked by ZWJ. If there is
803 * a ZWJ right before a base consonant, that would request a subjoined form. */
804 for (unsigned int i = limit; i < end; i++)
Behdad Esfahbodc4e71ff2013-10-17 17:04:47 +0200805 if (is_consonant (info[i]))
Behdad Esfahbod11b0e202012-08-02 14:21:40 -0400806 {
807 if (limit < i && info[i - 1].indic_category() == OT_ZWJ)
808 break;
809 else
810 base = i;
811 }
812
813 /* Mark all subsequent consonants as below. */
814 for (unsigned int i = base + 1; i < end; i++)
Behdad Esfahbodc4e71ff2013-10-17 17:04:47 +0200815 if (is_consonant (info[i]))
Behdad Esfahbod11b0e202012-08-02 14:21:40 -0400816 info[i].indic_position() = POS_BELOW_C;
817 }
818 break;
Behdad Esfahbode10453e2013-10-17 16:49:06 +0200819
820 case BASE_POS_FIRST:
821 {
822 /* The first consonant is always the base. */
823
824 assert (indic_plan->config->reph_mode == REPH_MODE_VIS_REPHA);
Behdad Esfahbodefed40b2013-10-17 18:50:11 +0200825 assert (!has_reph);
Behdad Esfahbode10453e2013-10-17 16:49:06 +0200826
827 base = start;
828
829 /* Mark all subsequent consonants as below. */
830 for (unsigned int i = base + 1; i < end; i++)
Behdad Esfahbodc4e71ff2013-10-17 17:04:47 +0200831 if (is_consonant (info[i]))
Behdad Esfahbode10453e2013-10-17 16:49:06 +0200832 info[i].indic_position() = POS_BELOW_C;
833 }
834 break;
Behdad Esfahbod5d326902012-07-17 14:23:28 -0400835 }
Behdad Esfahbod3c2ea942012-05-11 16:23:38 +0200836
Behdad Esfahbod617f4ac2012-05-13 16:48:03 +0200837 /* -> If the syllable starts with Ra + Halant (in a script that has Reph)
838 * and has more than one consonant, Ra is excluded from candidates for
Behdad Esfahbod2278eef2012-07-24 00:26:43 -0400839 * base consonants.
840 *
841 * Only do this for unforced Reph. (ie. not for Ra,H,ZWJ. */
Behdad Esfahbod9621e0b2013-02-11 06:58:27 -0500842 if (has_reph && base == start && limit - base <= 2) {
Behdad Esfahbod617f4ac2012-05-13 16:48:03 +0200843 /* Have no other consonant, so Reph is not formed and Ra becomes base. */
844 has_reph = false;
845 }
Behdad Esfahbod5e4e21f2012-05-13 16:46:08 +0200846 }
Behdad Esfahbod2278eef2012-07-24 00:26:43 -0400847
Behdad Esfahbod3d250792012-05-10 11:37:42 +0200848
Behdad Esfahbod743807a2011-07-29 16:37:02 -0400849 /* 2. Decompose and reorder Matras:
850 *
851 * Each matra and any syllable modifier sign in the cluster are moved to the
852 * appropriate position relative to the consonant(s) in the cluster. The
853 * shaping engine decomposes two- or three-part matras into their constituent
854 * parts before any repositioning. Matra characters are classified by which
855 * consonant in a conjunct they have affinity for and are reordered to the
856 * following positions:
857 *
858 * o Before first half form in the syllable
859 * o After subjoined consonants
860 * o After post-form consonant
861 * o After main consonant (for above marks)
862 *
863 * IMPLEMENTATION NOTES:
864 *
865 * The normalize() routine has already decomposed matras for us, so we don't
866 * need to worry about that.
867 */
868
869
870 /* 3. Reorder marks to canonical order:
871 *
872 * Adjacent nukta and halant or nukta and vedic sign are always repositioned
873 * if necessary, so that the nukta is first.
874 *
875 * IMPLEMENTATION NOTES:
876 *
877 * We don't need to do this: the normalize() routine already did this for us.
878 */
879
880
Behdad Esfahbod45d6f292011-07-30 14:44:30 -0400881 /* Reorder characters */
882
Behdad Esfahbod3c2ea942012-05-11 16:23:38 +0200883 for (unsigned int i = start; i < base; i++)
Behdad Esfahbod900cf3d2012-07-20 10:18:23 -0400884 info[i].indic_position() = MIN (POS_PRE_C, (indic_position_t) info[i].indic_position());
Behdad Esfahbod55f70eb2012-07-17 12:50:13 -0400885
Behdad Esfahbod075d6712012-07-18 15:41:53 -0400886 if (base < end)
887 info[base].indic_position() = POS_BASE_C;
Behdad Esfahbod45d6f292011-07-30 14:44:30 -0400888
Behdad Esfahbod55f70eb2012-07-17 12:50:13 -0400889 /* Mark final consonants. A final consonant is one appearing after a matra,
890 * like in Khmer. */
891 for (unsigned int i = base + 1; i < end; i++)
892 if (info[i].indic_category() == OT_M) {
893 for (unsigned int j = i + 1; j < end; j++)
894 if (is_consonant (info[j])) {
895 info[j].indic_position() = POS_FINAL_C;
896 break;
897 }
898 break;
899 }
900
Behdad Esfahbodfd06bf52011-07-30 20:14:44 -0400901 /* Handle beginning Ra */
Behdad Esfahbod5e4e21f2012-05-13 16:46:08 +0200902 if (has_reph)
Behdad Esfahboddbb10582012-05-10 13:45:52 +0200903 info[start].indic_position() = POS_RA_TO_BECOME_REPH;
Behdad Esfahbodfd06bf52011-07-30 20:14:44 -0400904
Behdad Esfahbodf5bc2722011-07-30 21:08:10 -0400905 /* For old-style Indic script tags, move the first post-base Halant after
Behdad Esfahbodfc0daaf2014-07-23 16:48:51 -0400906 * last consonant.
907 *
908 * Reports suggest that in some scripts Uniscribe does this only if there
909 * is *not* a Halant after last consonant already (eg. Kannada), while it
910 * does it unconditionally in other scripts (eg. Malayalam). We don't
911 * currently know about other scripts, so we single out Malayalam for now.
912 *
913 * Kannada test case:
914 * U+0C9A,U+0CCD,U+0C9A,U+0CCD
915 * With some versions of Lohit Kannada.
916 * https://bugs.freedesktop.org/show_bug.cgi?id=59118
917 *
918 * Malayalam test case:
919 * U+0D38,U+0D4D,U+0D31,U+0D4D,U+0D31,U+0D4D
920 * With lohit-ttf-20121122/Lohit-Malayalam.ttf
921 */
922 if (indic_plan->is_old_spec)
923 {
924 bool disallow_double_halants = buffer->props.script != HB_SCRIPT_MALAYALAM;
Behdad Esfahbod3c2ea942012-05-11 16:23:38 +0200925 for (unsigned int i = base + 1; i < end; i++)
Behdad Esfahbodfc0daaf2014-07-23 16:48:51 -0400926 if (info[i].indic_category() == OT_H)
927 {
Behdad Esfahbodf5bc2722011-07-30 21:08:10 -0400928 unsigned int j;
929 for (j = end - 1; j > i; j--)
Behdad Esfahbodfc0daaf2014-07-23 16:48:51 -0400930 if (is_consonant (info[j]) ||
931 (disallow_double_halants && info[j].indic_category() == OT_H))
Behdad Esfahbodf5bc2722011-07-30 21:08:10 -0400932 break;
Behdad Esfahbodecd454b2013-01-08 18:09:46 -0600933 if (info[j].indic_category() != OT_H && j > i) {
Behdad Esfahbodf5bc2722011-07-30 21:08:10 -0400934 /* Move Halant to after last consonant. */
935 hb_glyph_info_t t = info[i];
936 memmove (&info[i], &info[i + 1], (j - i) * sizeof (info[0]));
937 info[j] = t;
938 }
939 break;
940 }
941 }
942
Behdad Esfahbod81202bd2012-07-20 15:10:02 -0400943 /* Attach misc marks to previous char to move with them. */
Behdad Esfahbodebe29732012-05-11 16:43:12 +0200944 {
Behdad Esfahbod81202bd2012-07-20 15:10:02 -0400945 indic_position_t last_pos = POS_START;
946 for (unsigned int i = start; i < end; i++)
947 {
Behdad Esfahbodf8160a42015-07-21 15:50:02 +0100948 if ((FLAG_SAFE (info[i].indic_category()) & (JOINER_FLAGS | FLAG (OT_N) | FLAG (OT_RS) | MEDIAL_FLAGS | HALANT_OR_COENG_FLAGS)))
Behdad Esfahbod81202bd2012-07-20 15:10:02 -0400949 {
950 info[i].indic_position() = last_pos;
Behdad Esfahboddde55062012-11-14 11:37:04 -0800951 if (unlikely (info[i].indic_category() == OT_H &&
Behdad Esfahbod81202bd2012-07-20 15:10:02 -0400952 info[i].indic_position() == POS_PRE_M))
953 {
954 /*
955 * Uniscribe doesn't move the Halant with Left Matra.
956 * TEST: U+092B,U+093F,U+094DE
Behdad Esfahboddde55062012-11-14 11:37:04 -0800957 * We follow. This is important for the Sinhala
958 * U+0DDA split matra since it decomposes to U+0DD9,U+0DCA
959 * where U+0DD9 is a left matra and U+0DCA is the virama.
960 * We don't want to move the virama with the left matra.
961 * TEST: U+0D9A,U+0DDA
Behdad Esfahbod81202bd2012-07-20 15:10:02 -0400962 */
Behdad Esfahbodebe29732012-05-11 16:43:12 +0200963 for (unsigned int j = i; j > start; j--)
Behdad Esfahbod6a091df2012-05-11 21:42:27 +0200964 if (info[j - 1].indic_position() != POS_PRE_M) {
Behdad Esfahbodebe29732012-05-11 16:43:12 +0200965 info[i].indic_position() = info[j - 1].indic_position();
966 break;
967 }
Behdad Esfahbod81202bd2012-07-20 15:10:02 -0400968 }
969 } else if (info[i].indic_position() != POS_SMVD) {
970 last_pos = (indic_position_t) info[i].indic_position();
Behdad Esfahbodebe29732012-05-11 16:43:12 +0200971 }
Behdad Esfahbod81202bd2012-07-20 15:10:02 -0400972 }
Behdad Esfahbodebe29732012-05-11 16:43:12 +0200973 }
Behdad Esfahbodddce2d82013-10-18 18:07:11 +0200974 /* For post-base consonants let them own anything before them
975 * since the last consonant or matra. */
Behdad Esfahbod74ccc6a2012-07-17 11:16:19 -0400976 {
Behdad Esfahbodddce2d82013-10-18 18:07:11 +0200977 unsigned int last = base;
Behdad Esfahbod74ccc6a2012-07-17 11:16:19 -0400978 for (unsigned int i = base + 1; i < end; i++)
Behdad Esfahbodddce2d82013-10-18 18:07:11 +0200979 if (is_consonant (info[i]))
980 {
981 for (unsigned int j = last + 1; j < i; j++)
982 if (info[j].indic_position() < POS_SMVD)
Behdad Esfahbod81202bd2012-07-20 15:10:02 -0400983 info[j].indic_position() = info[i].indic_position();
Behdad Esfahbodddce2d82013-10-18 18:07:11 +0200984 last = i;
985 } else if (info[i].indic_category() == OT_M)
986 last = i;
Behdad Esfahbod74ccc6a2012-07-17 11:16:19 -0400987 }
Behdad Esfahbod45d6f292011-07-30 14:44:30 -0400988
Behdad Esfahbod28d5dae2013-10-16 12:32:12 +0200989
Behdad Esfahboda391ff52012-05-10 11:31:20 +0200990 {
Behdad Esfahbod28d5dae2013-10-16 12:32:12 +0200991 /* Use syllable() for sort accounting temporarily. */
992 unsigned int syllable = info[start].syllable();
993 for (unsigned int i = start; i < end; i++)
994 info[i].syllable() = i - start;
995
Behdad Esfahboda391ff52012-05-10 11:31:20 +0200996 /* Sit tight, rock 'n roll! */
Behdad Esfahbod85846b32015-09-01 15:07:52 +0100997 hb_stable_sort (info + start, end - start, compare_indic_order);
Behdad Esfahboda391ff52012-05-10 11:31:20 +0200998 /* Find base again */
999 base = end;
Behdad Esfahbod3c2ea942012-05-11 16:23:38 +02001000 for (unsigned int i = start; i < end; i++)
Behdad Esfahbod28d5dae2013-10-16 12:32:12 +02001001 if (info[i].indic_position() == POS_BASE_C)
1002 {
1003 base = i;
Behdad Esfahboda391ff52012-05-10 11:31:20 +02001004 break;
1005 }
Behdad Esfahbod28d5dae2013-10-16 12:32:12 +02001006 /* Things are out-of-control for post base positions, they may shuffle
1007 * around like crazy. In old-spec mode, we move halants around, so in
1008 * that case merge all clusters after base. Otherwise, check the sort
1009 * order and merge as needed.
Behdad Esfahbod5828c452015-09-01 16:26:35 +01001010 * For pre-base stuff, we handle cluster issues in final reordering.
1011 *
1012 * We could use buffer->sort() for this, if there was no special
1013 * reordering of pre-base stuff happening later...
1014 */
Behdad Esfahbod28d5dae2013-10-16 12:32:12 +02001015 if (indic_plan->is_old_spec || end - base > 127)
1016 buffer->merge_clusters (base, end);
1017 else
1018 {
1019 /* Note! syllable() is a one-byte field. */
1020 for (unsigned int i = base; i < end; i++)
1021 if (info[i].syllable() != 255)
1022 {
1023 unsigned int max = i;
1024 unsigned int j = start + info[i].syllable();
1025 while (j != i)
1026 {
1027 max = MAX (max, j);
1028 unsigned int next = start + info[j].syllable();
1029 info[j].syllable() = 255; /* So we don't process j later again. */
1030 j = next;
1031 }
1032 if (i != max)
1033 buffer->merge_clusters (i, max + 1);
1034 }
1035 }
1036
1037 /* Put syllable back in. */
1038 for (unsigned int i = start; i < end; i++)
1039 info[i].syllable() = syllable;
Behdad Esfahboda391ff52012-05-10 11:31:20 +02001040 }
Behdad Esfahbod45d6f292011-07-30 14:44:30 -04001041
Behdad Esfahbod743807a2011-07-29 16:37:02 -04001042 /* Setup masks now */
1043
Behdad Esfahbod28168392011-07-31 16:00:35 -04001044 {
1045 hb_mask_t mask;
1046
Behdad Esfahboddbb10582012-05-10 13:45:52 +02001047 /* Reph */
Behdad Esfahbod668c6042012-05-11 15:34:13 +02001048 for (unsigned int i = start; i < end && info[i].indic_position() == POS_RA_TO_BECOME_REPH; i++)
Behdad Esfahbod85fc6c42012-08-02 12:21:44 -04001049 info[i].mask |= indic_plan->mask_array[RPHF];
Behdad Esfahboddbb10582012-05-10 13:45:52 +02001050
Behdad Esfahbod28168392011-07-31 16:00:35 -04001051 /* Pre-base */
Behdad Esfahbod85fc6c42012-08-02 12:21:44 -04001052 mask = indic_plan->mask_array[HALF];
Behdad Esfahbodc7dacac2013-10-17 12:20:24 +02001053 if (!indic_plan->is_old_spec &&
1054 indic_plan->config->blwf_mode == BLWF_MODE_PRE_AND_POST)
Behdad Esfahbod8acbb6b2013-10-15 12:15:49 +02001055 mask |= indic_plan->mask_array[BLWF];
Behdad Esfahbod3c2ea942012-05-11 16:23:38 +02001056 for (unsigned int i = start; i < base; i++)
Behdad Esfahbod28168392011-07-31 16:00:35 -04001057 info[i].mask |= mask;
1058 /* Base */
Behdad Esfahbod20b68e62012-07-20 10:47:46 -04001059 mask = 0;
Behdad Esfahbod075d6712012-07-18 15:41:53 -04001060 if (base < end)
1061 info[base].mask |= mask;
Behdad Esfahbod28168392011-07-31 16:00:35 -04001062 /* Post-base */
Behdad Esfahbod85fc6c42012-08-02 12:21:44 -04001063 mask = indic_plan->mask_array[BLWF] | indic_plan->mask_array[ABVF] | indic_plan->mask_array[PSTF];
Behdad Esfahbod3c2ea942012-05-11 16:23:38 +02001064 for (unsigned int i = base + 1; i < end; i++)
Behdad Esfahbod28168392011-07-31 16:00:35 -04001065 info[i].mask |= mask;
1066 }
Behdad Esfahbod9da04872011-07-31 13:46:44 -04001067
Behdad Esfahbod85c51ec2013-02-12 18:17:39 -05001068 if (indic_plan->is_old_spec &&
1069 buffer->props.script == HB_SCRIPT_DEVANAGARI)
1070 {
1071 /* Old-spec eye-lash Ra needs special handling. From the
1072 * spec:
1073 *
1074 * "The feature 'below-base form' is applied to consonants
1075 * having below-base forms and following the base consonant.
1076 * The exception is vattu, which may appear below half forms
1077 * as well as below the base glyph. The feature 'below-base
1078 * form' will be applied to all such occurrences of Ra as well."
1079 *
1080 * Test case: U+0924,U+094D,U+0930,U+094d,U+0915
1081 * with Sanskrit 2003 font.
1082 *
1083 * However, note that Ra,Halant,ZWJ is the correct way to
1084 * request eyelash form of Ra, so we wouldbn't inhibit it
1085 * in that sequence.
1086 *
1087 * Test case: U+0924,U+094D,U+0930,U+094d,U+200D,U+0915
1088 */
1089 for (unsigned int i = start; i + 1 < base; i++)
1090 if (info[i ].indic_category() == OT_Ra &&
1091 info[i+1].indic_category() == OT_H &&
1092 (i + 2 == base ||
1093 info[i+2].indic_category() != OT_ZWJ))
1094 {
1095 info[i ].mask |= indic_plan->mask_array[BLWF];
1096 info[i+1].mask |= indic_plan->mask_array[BLWF];
1097 }
1098 }
1099
Behdad Esfahbod3c1666c2016-05-06 16:05:07 +01001100 unsigned int pref_len = 2;
Behdad Esfahbod74f4bbf2013-10-17 19:07:53 +02001101 if (indic_plan->mask_array[PREF] && base + pref_len < end)
Behdad Esfahbod17d7de92012-07-16 15:20:15 -04001102 {
Behdad Esfahbod771a8f52012-07-23 20:07:50 -04001103 /* Find a Halant,Ra sequence and mark it for pre-base reordering processing. */
Behdad Esfahbod74f4bbf2013-10-17 19:07:53 +02001104 for (unsigned int i = base + 1; i + pref_len - 1 < end; i++) {
1105 hb_codepoint_t glyphs[2];
1106 for (unsigned int j = 0; j < pref_len; j++)
1107 glyphs[j] = info[i + j].codepoint;
1108 if (indic_plan->pref.would_substitute (glyphs, pref_len, face))
Behdad Esfahbod8e7b5882012-07-16 17:04:46 -04001109 {
Behdad Esfahbod74f4bbf2013-10-17 19:07:53 +02001110 for (unsigned int j = 0; j < pref_len; j++)
1111 info[i++].mask |= indic_plan->mask_array[PREF];
Behdad Esfahbod0201e0a2012-07-17 13:55:10 -04001112
1113 /* Mark the subsequent stuff with 'cfar'. Used in Khmer.
1114 * Read the feature spec.
1115 * This allows distinguishing the following cases with MS Khmer fonts:
1116 * U+1784,U+17D2,U+179A,U+17D2,U+1782
1117 * U+1784,U+17D2,U+1782,U+17D2,U+179A
1118 */
Behdad Esfahbod74f4bbf2013-10-17 19:07:53 +02001119 if (indic_plan->mask_array[CFAR])
1120 for (; i < end; i++)
1121 info[i].mask |= indic_plan->mask_array[CFAR];
Behdad Esfahbod0201e0a2012-07-17 13:55:10 -04001122
Behdad Esfahbod8e7b5882012-07-16 17:04:46 -04001123 break;
1124 }
Behdad Esfahbod56be6772012-11-12 14:09:40 -08001125 }
Behdad Esfahbod17d7de92012-07-16 15:20:15 -04001126 }
1127
Behdad Esfahbod9da04872011-07-31 13:46:44 -04001128 /* Apply ZWJ/ZWNJ effects */
Behdad Esfahbod3c2ea942012-05-11 16:23:38 +02001129 for (unsigned int i = start + 1; i < end; i++)
Behdad Esfahbod9da04872011-07-31 13:46:44 -04001130 if (is_joiner (info[i])) {
1131 bool non_joiner = info[i].indic_category() == OT_ZWNJ;
Behdad Esfahbod6b37bc82011-07-31 15:57:00 -04001132 unsigned int j = i;
Behdad Esfahbod9da04872011-07-31 13:46:44 -04001133
1134 do {
Behdad Esfahbod9da04872011-07-31 13:46:44 -04001135 j--;
Behdad Esfahbod6b37bc82011-07-31 15:57:00 -04001136
Behdad Esfahbodcfc507c2013-02-14 10:40:12 -05001137 /* ZWJ/ZWNJ should disable CJCT. They do that by simply
1138 * being there, since we don't skip them for the CJCT
Behdad Esfahboda8cf7b42013-03-19 05:53:26 -04001139 * feature (ie. F_MANUAL_ZWJ) */
Behdad Esfahbod20b68e62012-07-20 10:47:46 -04001140
1141 /* A ZWNJ disables HALF. */
Behdad Esfahbod6b37bc82011-07-31 15:57:00 -04001142 if (non_joiner)
Behdad Esfahbod85fc6c42012-08-02 12:21:44 -04001143 info[j].mask &= ~indic_plan->mask_array[HALF];
Behdad Esfahbod6b37bc82011-07-31 15:57:00 -04001144
Behdad Esfahbod9da04872011-07-31 13:46:44 -04001145 } while (j > start && !is_consonant (info[j]));
1146 }
Behdad Esfahbod743807a2011-07-29 16:37:02 -04001147}
1148
Behdad Esfahbod743807a2011-07-29 16:37:02 -04001149static void
Behdad Esfahbod8bb5deb2012-08-02 10:07:58 -04001150initial_reordering_standalone_cluster (const hb_ot_shape_plan_t *plan,
Behdad Esfahbodf2c0f592012-11-12 14:02:02 -08001151 hb_face_t *face,
Behdad Esfahbod9f377ed2012-05-13 16:13:44 +02001152 hb_buffer_t *buffer,
Behdad Esfahbodef24cc82012-05-09 17:56:03 +02001153 unsigned int start, unsigned int end)
Behdad Esfahbod743807a2011-07-29 16:37:02 -04001154{
Behdad Esfahbodcf78dd42014-05-27 17:53:37 -04001155 /* We treat placeholder/dotted-circle as if they are consonants, so we
1156 * should just chain. Only if not in compatibility mode that is... */
Behdad Esfahbod18c06e12012-05-11 20:02:14 +02001157
Behdad Esfahbodbab02d32013-02-12 15:26:45 -05001158 if (hb_options ().uniscribe_bug_compatible)
Behdad Esfahbod18c06e12012-05-11 20:02:14 +02001159 {
1160 /* For dotted-circle, this is what Uniscribe does:
1161 * If dotted-circle is the last glyph, it just does nothing.
1162 * Ie. It doesn't form Reph. */
1163 if (buffer->info[end - 1].indic_category() == OT_DOTTEDCIRCLE)
1164 return;
1165 }
1166
Behdad Esfahbodf2c0f592012-11-12 14:02:02 -08001167 initial_reordering_consonant_syllable (plan, face, buffer, start, end);
Behdad Esfahbod743807a2011-07-29 16:37:02 -04001168}
1169
1170static void
Behdad Esfahbod327d14e2012-08-31 16:49:34 -04001171initial_reordering_syllable (const hb_ot_shape_plan_t *plan,
Behdad Esfahbodf2c0f592012-11-12 14:02:02 -08001172 hb_face_t *face,
Behdad Esfahbod327d14e2012-08-31 16:49:34 -04001173 hb_buffer_t *buffer,
1174 unsigned int start, unsigned int end)
1175{
1176 syllable_type_t syllable_type = (syllable_type_t) (buffer->info[start].syllable() & 0x0F);
Behdad Esfahbodecb0b242015-07-22 12:02:09 +01001177 switch (syllable_type)
1178 {
1179 case vowel_syllable: /* We made the vowels look like consonants. So let's call the consonant logic! */
1180 case consonant_syllable:
1181 initial_reordering_consonant_syllable (plan, face, buffer, start, end);
1182 break;
1183
1184 case broken_cluster: /* We already inserted dotted-circles, so just call the standalone_cluster. */
1185 case standalone_cluster:
1186 initial_reordering_standalone_cluster (plan, face, buffer, start, end);
1187 break;
1188
1189 case symbol_cluster:
1190 case non_indic_cluster:
1191 break;
Behdad Esfahbod327d14e2012-08-31 16:49:34 -04001192 }
1193}
1194
Behdad Esfahbod166b5cf2012-09-07 14:55:07 -04001195static inline void
Behdad Esfahbod0beb66e2012-12-05 18:46:04 -05001196insert_dotted_circles (const hb_ot_shape_plan_t *plan HB_UNUSED,
Behdad Esfahbodb85800f2012-08-31 18:12:01 -04001197 hb_font_t *font,
1198 hb_buffer_t *buffer)
1199{
Behdad Esfahbod166b5cf2012-09-07 14:55:07 -04001200 /* Note: This loop is extra overhead, but should not be measurable. */
1201 bool has_broken_syllables = false;
1202 unsigned int count = buffer->len;
Behdad Esfahbod7cd33f22014-07-17 14:22:11 -04001203 hb_glyph_info_t *info = buffer->info;
Behdad Esfahbod166b5cf2012-09-07 14:55:07 -04001204 for (unsigned int i = 0; i < count; i++)
Behdad Esfahbod7cd33f22014-07-17 14:22:11 -04001205 if ((info[i].syllable() & 0x0F) == broken_cluster)
1206 {
Behdad Esfahbod166b5cf2012-09-07 14:55:07 -04001207 has_broken_syllables = true;
1208 break;
1209 }
1210 if (likely (!has_broken_syllables))
1211 return;
1212
1213
Behdad Esfahbodb85800f2012-08-31 18:12:01 -04001214 hb_codepoint_t dottedcircle_glyph;
Behdad Esfahbod8b5bc142016-02-24 19:05:23 +09001215 if (!font->get_nominal_glyph (0x25CCu, &dottedcircle_glyph))
Behdad Esfahbodb85800f2012-08-31 18:12:01 -04001216 return;
1217
Behdad Esfahbodf41dc2d2012-11-15 10:36:43 -08001218 hb_glyph_info_t dottedcircle = {0};
Behdad Esfahbod76271002014-07-11 14:54:42 -04001219 dottedcircle.codepoint = 0x25CCu;
Behdad Esfahbodb85800f2012-08-31 18:12:01 -04001220 set_indic_properties (dottedcircle);
1221 dottedcircle.codepoint = dottedcircle_glyph;
1222
1223 buffer->clear_output ();
1224
1225 buffer->idx = 0;
1226 unsigned int last_syllable = 0;
Behdad Esfahbodabadc172015-11-18 17:52:08 -08001227 while (buffer->idx < buffer->len && !buffer->in_error)
Behdad Esfahbodb85800f2012-08-31 18:12:01 -04001228 {
1229 unsigned int syllable = buffer->cur().syllable();
1230 syllable_type_t syllable_type = (syllable_type_t) (syllable & 0x0F);
1231 if (unlikely (last_syllable != syllable && syllable_type == broken_cluster))
1232 {
Behdad Esfahbod596740d2012-12-21 19:41:04 -05001233 last_syllable = syllable;
1234
Behdad Esfahbod6f932bc2015-10-21 11:16:49 -02001235 hb_glyph_info_t ginfo = dottedcircle;
1236 ginfo.cluster = buffer->cur().cluster;
1237 ginfo.mask = buffer->cur().mask;
1238 ginfo.syllable() = buffer->cur().syllable();
Behdad Esfahbod595d2b92014-07-26 18:44:15 -04001239 /* TODO Set glyph_props? */
Behdad Esfahbod596740d2012-12-21 19:41:04 -05001240
1241 /* Insert dottedcircle after possible Repha. */
Behdad Esfahbodb894a852016-02-02 16:39:19 +08001242 while (buffer->idx < buffer->len && !buffer->in_error &&
Behdad Esfahbod596740d2012-12-21 19:41:04 -05001243 last_syllable == buffer->cur().syllable() &&
1244 buffer->cur().indic_category() == OT_Repha)
1245 buffer->next_glyph ();
1246
Behdad Esfahbod6f932bc2015-10-21 11:16:49 -02001247 buffer->output_info (ginfo);
Behdad Esfahbodb85800f2012-08-31 18:12:01 -04001248 }
Behdad Esfahbod596740d2012-12-21 19:41:04 -05001249 else
1250 buffer->next_glyph ();
Behdad Esfahbodb85800f2012-08-31 18:12:01 -04001251 }
1252
1253 buffer->swap_buffers ();
1254}
1255
1256static void
Behdad Esfahbod8bb5deb2012-08-02 10:07:58 -04001257initial_reordering (const hb_ot_shape_plan_t *plan,
Behdad Esfahbod24eacf12012-08-02 08:42:11 -04001258 hb_font_t *font,
Behdad Esfahbod3e38c0f2012-08-02 09:44:18 -04001259 hb_buffer_t *buffer)
Behdad Esfahbod743807a2011-07-29 16:37:02 -04001260{
Behdad Esfahbod85fc6c42012-08-02 12:21:44 -04001261 update_consonant_positions (plan, font, buffer);
Behdad Esfahbod166b5cf2012-09-07 14:55:07 -04001262 insert_dotted_circles (plan, font, buffer);
Behdad Esfahbod327d14e2012-08-31 16:49:34 -04001263
Behdad Esfahbodecb0b242015-07-22 12:02:09 +01001264 foreach_syllable (buffer, start, end)
1265 initial_reordering_syllable (plan, font->face, buffer, start, end);
Behdad Esfahbodb9ddbd52011-06-02 17:43:12 -04001266}
1267
Behdad Esfahbod743807a2011-07-29 16:37:02 -04001268static void
Behdad Esfahbod85fc6c42012-08-02 12:21:44 -04001269final_reordering_syllable (const hb_ot_shape_plan_t *plan,
1270 hb_buffer_t *buffer,
Behdad Esfahbodef24cc82012-05-09 17:56:03 +02001271 unsigned int start, unsigned int end)
Behdad Esfahbod743807a2011-07-29 16:37:02 -04001272{
Behdad Esfahbod85fc6c42012-08-02 12:21:44 -04001273 const indic_shape_plan_t *indic_plan = (const indic_shape_plan_t *) plan->data;
Behdad Esfahbod4ac9e982012-05-10 12:53:53 +02001274 hb_glyph_info_t *info = buffer->info;
1275
Behdad Esfahbod04dc52f2014-06-06 17:28:38 -04001276
1277 /* This function relies heavily on halant glyphs. Lots of ligation
1278 * and possibly multiplication substitutions happened prior to this
1279 * phase, and that might have messed up our properties. Recover
1280 * from a particular case of that where we're fairly sure that a
1281 * class of OT_H is desired but has been lost. */
1282 if (indic_plan->virama_glyph)
1283 {
1284 unsigned int virama_glyph = indic_plan->virama_glyph;
1285 for (unsigned int i = start; i < end; i++)
1286 if (info[i].codepoint == virama_glyph &&
1287 _hb_glyph_info_ligated (&info[i]) &&
1288 _hb_glyph_info_multiplied (&info[i]))
1289 {
1290 /* This will make sure that this glyph passes is_halant_or_coeng() test. */
1291 info[i].indic_category() = OT_H;
1292 _hb_glyph_info_clear_ligated_and_multiplied (&info[i]);
1293 }
1294 }
1295
1296
Behdad Esfahbode7be0572011-07-31 15:18:57 -04001297 /* 4. Final reordering:
1298 *
1299 * After the localized forms and basic shaping forms GSUB features have been
1300 * applied (see below), the shaping engine performs some final glyph
1301 * reordering before applying all the remaining font features to the entire
1302 * cluster.
Behdad Esfahbod4ac9e982012-05-10 12:53:53 +02001303 */
1304
Behdad Esfahbod1d634cb2014-06-06 17:55:02 -04001305 bool try_pref = !!indic_plan->mask_array[PREF];
1306
Behdad Esfahbod4ac9e982012-05-10 12:53:53 +02001307 /* Find base again */
Behdad Esfahbod5f0eaaa2012-07-20 15:47:24 -04001308 unsigned int base;
1309 for (base = start; base < end; base++)
Behdad Esfahbod1d634cb2014-06-06 17:55:02 -04001310 if (info[base].indic_position() >= POS_BASE_C)
1311 {
Behdad Esfahbod3c1666c2016-05-06 16:05:07 +01001312 if (try_pref && base + 1 < end)
Behdad Esfahbod1d634cb2014-06-06 17:55:02 -04001313 {
1314 for (unsigned int i = base + 1; i < end; i++)
1315 if ((info[i].mask & indic_plan->mask_array[PREF]) != 0)
1316 {
1317 if (!(_hb_glyph_info_substituted (&info[i]) &&
1318 _hb_glyph_info_ligated_and_didnt_multiply (&info[i])))
1319 {
1320 /* Ok, this was a 'pref' candidate but didn't form any.
1321 * Base is around here... */
1322 base = i;
1323 while (base < end && is_halant_or_coeng (info[base]))
1324 base++;
1325 info[base].indic_position() = POS_BASE_C;
1326
1327 try_pref = false;
1328 }
1329 break;
1330 }
1331 }
Behdad Esfahbod45b7ec32015-12-18 13:47:16 +00001332 /* For Malayalam, skip over unformed below- (but NOT post-) forms. */
1333 if (buffer->props.script == HB_SCRIPT_MALAYALAM)
1334 {
1335 for (unsigned int i = base + 1; i < end; i++)
1336 {
1337 while (i < end && is_joiner (info[i]))
1338 i++;
1339 if (i == end || !is_halant_or_coeng (info[i]))
1340 break;
1341 i++; /* Skip halant. */
1342 while (i < end && is_joiner (info[i]))
1343 i++;
1344 if (i < end && is_consonant (info[i]) && info[i].indic_position() == POS_BELOW_C)
1345 {
1346 base = i;
1347 info[base].indic_position() = POS_BASE_C;
1348 }
1349 }
1350 }
Behdad Esfahbod1d634cb2014-06-06 17:55:02 -04001351
Behdad Esfahbod5f0eaaa2012-07-20 15:47:24 -04001352 if (start < base && info[base].indic_position() > POS_BASE_C)
1353 base--;
1354 break;
1355 }
Behdad Esfahboda0cb9f32013-02-13 09:26:55 -05001356 if (base == end && start < base &&
Behdad Esfahbod39c82012014-06-06 17:19:35 -04001357 is_one_of (info[base - 1], FLAG (OT_ZWJ)))
Behdad Esfahboda0cb9f32013-02-13 09:26:55 -05001358 base--;
Behdad Esfahbode7ce50d2014-07-16 12:30:39 -04001359 if (base < end)
1360 while (start < base &&
1361 is_one_of (info[base], (FLAG (OT_N) | HALANT_OR_COENG_FLAGS)))
1362 base--;
Behdad Esfahbod4ac9e982012-05-10 12:53:53 +02001363
Behdad Esfahbod4705a702012-05-10 13:09:08 +02001364
Behdad Esfahbod4ac9e982012-05-10 12:53:53 +02001365 /* o Reorder matras:
Behdad Esfahbode7be0572011-07-31 15:18:57 -04001366 *
1367 * If a pre-base matra character had been reordered before applying basic
1368 * features, the glyph can be moved closer to the main consonant based on
1369 * whether half-forms had been formed. Actual position for the matra is
1370 * defined as “after last standalone halant glyph, after initial matra
1371 * position and before the main consonant”. If ZWJ or ZWNJ follow this
1372 * halant, position is moved after it.
Behdad Esfahbod4ac9e982012-05-10 12:53:53 +02001373 */
1374
Behdad Esfahbod65c43ac2012-07-24 03:36:47 -04001375 if (start + 1 < end && start < base) /* Otherwise there can't be any pre-base matra characters. */
Behdad Esfahbod9d0d3192012-05-11 21:36:32 +02001376 {
Behdad Esfahbod65c43ac2012-07-24 03:36:47 -04001377 /* If we lost track of base, alas, position before last thingy. */
1378 unsigned int new_pos = base == end ? base - 2 : base - 1;
Behdad Esfahbod4ac9e982012-05-10 12:53:53 +02001379
Behdad Esfahbod27bd55b2012-09-05 15:11:14 -04001380 /* Malayalam / Tamil do not have "half" forms or explicit virama forms.
1381 * The glyphs formed by 'half' are Chillus or ligated explicit viramas.
1382 * We want to position matra after them.
Behdad Esfahbod65c43ac2012-07-24 03:36:47 -04001383 */
Behdad Esfahbod27bd55b2012-09-05 15:11:14 -04001384 if (buffer->props.script != HB_SCRIPT_MALAYALAM && buffer->props.script != HB_SCRIPT_TAMIL)
Behdad Esfahbod65c43ac2012-07-24 03:36:47 -04001385 {
1386 while (new_pos > start &&
Behdad Esfahbodc04d5f02014-06-06 17:02:39 -04001387 !(is_one_of (info[new_pos], (FLAG (OT_M) | HALANT_OR_COENG_FLAGS))))
Behdad Esfahbod65c43ac2012-07-24 03:36:47 -04001388 new_pos--;
1389
1390 /* If we found no Halant we are done.
1391 * Otherwise only proceed if the Halant does
1392 * not belong to the Matra itself! */
1393 if (is_halant_or_coeng (info[new_pos]) &&
1394 info[new_pos].indic_position() != POS_PRE_M)
1395 {
1396 /* -> If ZWJ or ZWNJ follow this halant, position is moved after it. */
1397 if (new_pos + 1 < end && is_joiner (info[new_pos + 1]))
1398 new_pos++;
1399 }
1400 else
1401 new_pos = start; /* No move. */
1402 }
1403
Behdad Esfahbod27bd55b2012-09-05 15:11:14 -04001404 if (start < new_pos && info[new_pos].indic_position () != POS_PRE_M)
Behdad Esfahbod65c43ac2012-07-24 03:36:47 -04001405 {
Behdad Esfahbod9d0d3192012-05-11 21:36:32 +02001406 /* Now go see if there's actually any matras... */
Behdad Esfahbod921ce5b2012-07-16 15:26:56 -04001407 for (unsigned int i = new_pos; i > start; i--)
Behdad Esfahbod6a091df2012-05-11 21:42:27 +02001408 if (info[i - 1].indic_position () == POS_PRE_M)
Behdad Esfahbod9d0d3192012-05-11 21:36:32 +02001409 {
Behdad Esfahbod1a1dbe92012-07-16 15:40:33 -04001410 unsigned int old_pos = i - 1;
Behdad Esfahbod5828c452015-09-01 16:26:35 +01001411 if (old_pos < base && base <= new_pos) /* Shouldn't actually happen. */
1412 base--;
1413
Behdad Esfahbod1a1dbe92012-07-16 15:40:33 -04001414 hb_glyph_info_t tmp = info[old_pos];
1415 memmove (&info[old_pos], &info[old_pos + 1], (new_pos - old_pos) * sizeof (info[0]));
1416 info[new_pos] = tmp;
Behdad Esfahbod5828c452015-09-01 16:26:35 +01001417
1418 /* Note: this merge_clusters() is intentionally *after* the reordering.
1419 * Indic matra reordering is special and tricky... */
Behdad Esfahbod9cb59d42013-10-16 11:34:07 +02001420 buffer->merge_clusters (new_pos, MIN (end, base + 1));
Behdad Esfahbod5828c452015-09-01 16:26:35 +01001421
Behdad Esfahbod921ce5b2012-07-16 15:26:56 -04001422 new_pos--;
Behdad Esfahbod9d0d3192012-05-11 21:36:32 +02001423 }
Behdad Esfahbodabb32392012-07-22 23:55:19 -04001424 } else {
Behdad Esfahbode6b01a82012-07-23 00:11:26 -04001425 for (unsigned int i = start; i < base; i++)
Behdad Esfahbodabb32392012-07-22 23:55:19 -04001426 if (info[i].indic_position () == POS_PRE_M) {
Behdad Esfahbod2cc933a2012-07-23 08:22:55 -04001427 buffer->merge_clusters (i, MIN (end, base + 1));
Behdad Esfahbodabb32392012-07-22 23:55:19 -04001428 break;
1429 }
Behdad Esfahbod9d0d3192012-05-11 21:36:32 +02001430 }
Behdad Esfahbod4ac9e982012-05-10 12:53:53 +02001431 }
1432
1433
1434 /* o Reorder reph:
Behdad Esfahbode7be0572011-07-31 15:18:57 -04001435 *
1436 * Reph’s original position is always at the beginning of the syllable,
1437 * (i.e. it is not reordered at the character reordering stage). However,
1438 * it will be reordered according to the basic-forms shaping results.
1439 * Possible positions for reph, depending on the script, are; after main,
1440 * before post-base consonant forms, and after post-base consonant forms.
Behdad Esfahboddbb10582012-05-10 13:45:52 +02001441 */
1442
Behdad Esfahbod65a929b2013-10-15 18:08:05 +02001443 /* Two cases:
1444 *
1445 * - If repha is encoded as a sequence of characters (Ra,H or Ra,H,ZWJ), then
1446 * we should only move it if the sequence ligated to the repha form.
1447 *
1448 * - If repha is encoded separately and in the logical position, we should only
1449 * move it if it did NOT ligate. If it ligated, it's probably the font trying
1450 * to make it work without the reordering.
1451 */
Behdad Esfahbodf5299ef2013-10-15 18:13:07 +02001452 if (start + 1 < end &&
1453 info[start].indic_position() == POS_RA_TO_BECOME_REPH &&
Behdad Esfahbod3ddf8922013-10-18 00:02:43 +02001454 ((info[start].indic_category() == OT_Repha) ^
Behdad Esfahbod832a6f92014-06-04 16:57:42 -04001455 _hb_glyph_info_ligated_and_didnt_multiply (&info[start])))
Behdad Esfahboddbb10582012-05-10 13:45:52 +02001456 {
Behdad Esfahbod11b0e202012-08-02 14:21:40 -04001457 unsigned int new_reph_pos;
1458 reph_position_t reph_pos = indic_plan->config->reph_pos;
Behdad Esfahbod02b29222012-05-10 21:44:50 +02001459
Behdad Esfahbodf175aa32013-10-18 02:07:44 +02001460 assert (reph_pos != REPH_POS_DONT_CARE);
Behdad Esfahbod02b29222012-05-10 21:44:50 +02001461
Behdad Esfahboddbb10582012-05-10 13:45:52 +02001462 /* 1. If reph should be positioned after post-base consonant forms,
1463 * proceed to step 5.
Behdad Esfahbod02b29222012-05-10 21:44:50 +02001464 */
Behdad Esfahbod11b0e202012-08-02 14:21:40 -04001465 if (reph_pos == REPH_POS_AFTER_POST)
Behdad Esfahbod02b29222012-05-10 21:44:50 +02001466 {
Behdad Esfahbod9d0d3192012-05-11 21:36:32 +02001467 goto reph_step_5;
Behdad Esfahbod02b29222012-05-10 21:44:50 +02001468 }
1469
1470 /* 2. If the reph repositioning class is not after post-base: target
Behdad Esfahboddbb10582012-05-10 13:45:52 +02001471 * position is after the first explicit halant glyph between the
1472 * first post-reph consonant and last main consonant. If ZWJ or ZWNJ
1473 * are following this halant, position is moved after it. If such
1474 * position is found, this is the target position. Otherwise,
1475 * proceed to the next step.
1476 *
1477 * Note: in old-implementation fonts, where classifications were
1478 * fixed in shaping engine, there was no case where reph position
1479 * will be found on this step.
Behdad Esfahbod02b29222012-05-10 21:44:50 +02001480 */
Behdad Esfahbod02b29222012-05-10 21:44:50 +02001481 {
1482 new_reph_pos = start + 1;
Behdad Esfahboddeb521d2012-07-17 11:37:32 -04001483 while (new_reph_pos < base && !is_halant_or_coeng (info[new_reph_pos]))
Behdad Esfahbod02b29222012-05-10 21:44:50 +02001484 new_reph_pos++;
1485
Behdad Esfahbod1f91c392013-02-13 09:38:40 -05001486 if (new_reph_pos < base && is_halant_or_coeng (info[new_reph_pos]))
1487 {
Behdad Esfahbod02b29222012-05-10 21:44:50 +02001488 /* ->If ZWJ or ZWNJ are following this halant, position is moved after it. */
1489 if (new_reph_pos + 1 < base && is_joiner (info[new_reph_pos + 1]))
1490 new_reph_pos++;
1491 goto reph_move;
1492 }
1493 }
1494
1495 /* 3. If reph should be repositioned after the main consonant: find the
Behdad Esfahboddbb10582012-05-10 13:45:52 +02001496 * first consonant not ligated with main, or find the first
1497 * consonant that is not a potential pre-base reordering Ra.
Behdad Esfahbod02b29222012-05-10 21:44:50 +02001498 */
Behdad Esfahbod11b0e202012-08-02 14:21:40 -04001499 if (reph_pos == REPH_POS_AFTER_MAIN)
Behdad Esfahbod02b29222012-05-10 21:44:50 +02001500 {
Behdad Esfahbodb504e062012-07-16 15:21:12 -04001501 new_reph_pos = base;
Behdad Esfahbod34ae3362012-07-20 16:17:28 -04001502 while (new_reph_pos + 1 < end && info[new_reph_pos + 1].indic_position() <= POS_AFTER_MAIN)
Behdad Esfahbodb504e062012-07-16 15:21:12 -04001503 new_reph_pos++;
1504 if (new_reph_pos < end)
1505 goto reph_move;
Behdad Esfahbod02b29222012-05-10 21:44:50 +02001506 }
1507
1508 /* 4. If reph should be positioned before post-base consonant, find
Behdad Esfahboddbb10582012-05-10 13:45:52 +02001509 * first post-base classified consonant not ligated with main. If no
1510 * consonant is found, the target position should be before the
1511 * first matra, syllable modifier sign or vedic sign.
Behdad Esfahbod02b29222012-05-10 21:44:50 +02001512 */
Behdad Esfahbod9d0d3192012-05-11 21:36:32 +02001513 /* This is our take on what step 4 is trying to say (and failing, BADLY). */
Behdad Esfahbod11b0e202012-08-02 14:21:40 -04001514 if (reph_pos == REPH_POS_AFTER_SUB)
Behdad Esfahbod02b29222012-05-10 21:44:50 +02001515 {
Behdad Esfahbod9d0d3192012-05-11 21:36:32 +02001516 new_reph_pos = base;
Behdad Esfahbod85630992017-02-25 13:30:38 -08001517 while (new_reph_pos + 1 < end &&
Behdad Esfahbodf8160a42015-07-21 15:50:02 +01001518 !( FLAG_SAFE (info[new_reph_pos + 1].indic_position()) & (FLAG (POS_POST_C) | FLAG (POS_AFTER_POST) | FLAG (POS_SMVD))))
Behdad Esfahbod9d0d3192012-05-11 21:36:32 +02001519 new_reph_pos++;
1520 if (new_reph_pos < end)
1521 goto reph_move;
Behdad Esfahbod02b29222012-05-10 21:44:50 +02001522 }
1523
1524 /* 5. If no consonant is found in steps 3 or 4, move reph to a position
Behdad Esfahboddbb10582012-05-10 13:45:52 +02001525 * immediately before the first post-base matra, syllable modifier
1526 * sign or vedic sign that has a reordering class after the intended
1527 * reph position. For example, if the reordering position for reph
1528 * is post-main, it will skip above-base matras that also have a
1529 * post-main position.
Behdad Esfahboddbb10582012-05-10 13:45:52 +02001530 */
Behdad Esfahbod02b29222012-05-10 21:44:50 +02001531 reph_step_5:
1532 {
Behdad Esfahbodd0e68db2012-07-20 11:25:41 -04001533 /* Copied from step 2. */
1534 new_reph_pos = start + 1;
1535 while (new_reph_pos < base && !is_halant_or_coeng (info[new_reph_pos]))
1536 new_reph_pos++;
1537
Behdad Esfahbod1f91c392013-02-13 09:38:40 -05001538 if (new_reph_pos < base && is_halant_or_coeng (info[new_reph_pos]))
1539 {
Behdad Esfahbodd0e68db2012-07-20 11:25:41 -04001540 /* ->If ZWJ or ZWNJ are following this halant, position is moved after it. */
1541 if (new_reph_pos + 1 < base && is_joiner (info[new_reph_pos + 1]))
1542 new_reph_pos++;
1543 goto reph_move;
1544 }
Behdad Esfahbod8df56362012-05-10 15:41:04 +02001545 }
1546
Behdad Esfahbod02b29222012-05-10 21:44:50 +02001547 /* 6. Otherwise, reorder reph to the end of the syllable.
1548 */
Behdad Esfahbod02b29222012-05-10 21:44:50 +02001549 {
1550 new_reph_pos = end - 1;
1551 while (new_reph_pos > start && info[new_reph_pos].indic_position() == POS_SMVD)
1552 new_reph_pos--;
1553
Behdad Esfahbod892eb782012-05-11 16:54:40 +02001554 /*
1555 * If the Reph is to be ending up after a Matra,Halant sequence,
1556 * position it before that Halant so it can interact with the Matra.
1557 * However, if it's a plain Consonant,Halant we shouldn't do that.
1558 * Uniscribe doesn't do this.
1559 * TEST: U+0930,U+094D,U+0915,U+094B,U+094D
1560 */
Behdad Esfahbodbab02d32013-02-12 15:26:45 -05001561 if (!hb_options ().uniscribe_bug_compatible &&
Behdad Esfahboddeb521d2012-07-17 11:37:32 -04001562 unlikely (is_halant_or_coeng (info[new_reph_pos]))) {
Behdad Esfahbod02b29222012-05-10 21:44:50 +02001563 for (unsigned int i = base + 1; i < new_reph_pos; i++)
1564 if (info[i].indic_category() == OT_M) {
1565 /* Ok, got it. */
1566 new_reph_pos--;
1567 }
1568 }
1569 goto reph_move;
1570 }
1571
1572 reph_move:
1573 {
1574 /* Move */
Behdad Esfahbod5828c452015-09-01 16:26:35 +01001575 buffer->merge_clusters (start, new_reph_pos + 1);
Behdad Esfahbod02b29222012-05-10 21:44:50 +02001576 hb_glyph_info_t reph = info[start];
1577 memmove (&info[start], &info[start + 1], (new_reph_pos - start) * sizeof (info[0]));
1578 info[new_reph_pos] = reph;
Behdad Esfahbod5828c452015-09-01 16:26:35 +01001579
Behdad Esfahbodf22b7e72013-02-13 07:32:46 -05001580 if (start < base && base <= new_reph_pos)
1581 base--;
Behdad Esfahbod02b29222012-05-10 21:44:50 +02001582 }
Behdad Esfahboddbb10582012-05-10 13:45:52 +02001583 }
1584
1585
1586 /* o Reorder pre-base reordering consonants:
Behdad Esfahbode7be0572011-07-31 15:18:57 -04001587 *
1588 * If a pre-base reordering consonant is found, reorder it according to
1589 * the following rules:
Behdad Esfahbode7be0572011-07-31 15:18:57 -04001590 */
1591
Behdad Esfahbod1d634cb2014-06-06 17:55:02 -04001592 if (try_pref && base + 1 < end) /* Otherwise there can't be any pre-base reordering Ra. */
Behdad Esfahbod46e645e2012-07-16 15:30:05 -04001593 {
Behdad Esfahbod8e7b5882012-07-16 17:04:46 -04001594 for (unsigned int i = base + 1; i < end; i++)
Behdad Esfahbod85fc6c42012-08-02 12:21:44 -04001595 if ((info[i].mask & indic_plan->mask_array[PREF]) != 0)
Behdad Esfahbod78818122012-07-16 15:49:08 -04001596 {
Behdad Esfahbod8e7b5882012-07-16 17:04:46 -04001597 /* 1. Only reorder a glyph produced by substitution during application
1598 * of the <pref> feature. (Note that a font may shape a Ra consonant with
1599 * the feature generally but block it in certain contexts.)
1600 */
Behdad Esfahbod9a493512013-10-18 02:14:53 +02001601 /* Note: We just check that something got substituted. We don't check that
Behdad Esfahbod46a863d2013-10-27 23:24:50 +01001602 * the <pref> feature actually did it...
1603 *
Behdad Esfahbod3c1666c2016-05-06 16:05:07 +01001604 * Reorder pref only if it ligated. */
1605 if (_hb_glyph_info_ligated_and_didnt_multiply (&info[i]))
Behdad Esfahbod8e7b5882012-07-16 17:04:46 -04001606 {
1607 /*
1608 * 2. Try to find a target position the same way as for pre-base matra.
1609 * If it is found, reorder pre-base consonant glyph.
1610 *
1611 * 3. If position is not found, reorder immediately before main
1612 * consonant.
1613 */
1614
1615 unsigned int new_pos = base;
Behdad Esfahbod88d3c982012-10-29 16:27:02 -07001616 /* Malayalam / Tamil do not have "half" forms or explicit virama forms.
1617 * The glyphs formed by 'half' are Chillus or ligated explicit viramas.
1618 * We want to position matra after them.
1619 */
1620 if (buffer->props.script != HB_SCRIPT_MALAYALAM && buffer->props.script != HB_SCRIPT_TAMIL)
Behdad Esfahbodd90b8e82012-07-24 02:10:20 -04001621 {
Behdad Esfahbod88d3c982012-10-29 16:27:02 -07001622 while (new_pos > start &&
1623 !(is_one_of (info[new_pos - 1], FLAG(OT_M) | HALANT_OR_COENG_FLAGS)))
1624 new_pos--;
1625
Behdad Esfahbod9a493512013-10-18 02:14:53 +02001626 /* In Khmer coeng model, a H,Ra can go *after* matras. If it goes after a
Behdad Esfahbod88d3c982012-10-29 16:27:02 -07001627 * split matra, it should be reordered to *before* the left part of such matra. */
1628 if (new_pos > start && info[new_pos - 1].indic_category() == OT_M)
1629 {
1630 unsigned int old_pos = i;
Behdad Esfahbodb90cb362015-10-21 11:13:21 -02001631 for (unsigned int j = base + 1; j < old_pos; j++)
1632 if (info[j].indic_category() == OT_M)
Behdad Esfahbod88d3c982012-10-29 16:27:02 -07001633 {
1634 new_pos--;
1635 break;
1636 }
1637 }
Behdad Esfahbodd90b8e82012-07-24 02:10:20 -04001638 }
1639
Behdad Esfahboddeb521d2012-07-17 11:37:32 -04001640 if (new_pos > start && is_halant_or_coeng (info[new_pos - 1]))
Behdad Esfahbod1f91c392013-02-13 09:38:40 -05001641 {
Behdad Esfahbod8e7b5882012-07-16 17:04:46 -04001642 /* -> If ZWJ or ZWNJ follow this halant, position is moved after it. */
1643 if (new_pos < end && is_joiner (info[new_pos]))
1644 new_pos++;
Behdad Esfahbod1f91c392013-02-13 09:38:40 -05001645 }
Behdad Esfahbod8e7b5882012-07-16 17:04:46 -04001646
1647 {
1648 unsigned int old_pos = i;
Behdad Esfahbod5828c452015-09-01 16:26:35 +01001649
Behdad Esfahbode6b01a82012-07-23 00:11:26 -04001650 buffer->merge_clusters (new_pos, old_pos + 1);
Behdad Esfahbod8e7b5882012-07-16 17:04:46 -04001651 hb_glyph_info_t tmp = info[old_pos];
1652 memmove (&info[new_pos + 1], &info[new_pos], (old_pos - new_pos) * sizeof (info[0]));
1653 info[new_pos] = tmp;
Behdad Esfahbod5828c452015-09-01 16:26:35 +01001654
Behdad Esfahbodf22b7e72013-02-13 07:32:46 -05001655 if (new_pos <= base && base < old_pos)
1656 base++;
Behdad Esfahbod8e7b5882012-07-16 17:04:46 -04001657 }
1658 }
1659
1660 break;
Behdad Esfahbod78818122012-07-16 15:49:08 -04001661 }
Behdad Esfahbod46e645e2012-07-16 15:30:05 -04001662 }
Behdad Esfahbodeed903b2012-05-11 20:50:53 +02001663
1664
Behdad Esfahboda913b022012-05-11 20:59:26 +02001665 /* Apply 'init' to the Left Matra if it's a word start. */
Behdad Esfahbod6a091df2012-05-11 21:42:27 +02001666 if (info[start].indic_position () == POS_PRE_M &&
Behdad Esfahboda913b022012-05-11 20:59:26 +02001667 (!start ||
Behdad Esfahbodf8160a42015-07-21 15:50:02 +01001668 !(FLAG_SAFE (_hb_glyph_info_get_general_category (&info[start - 1])) &
Behdad Esfahbod2c372b82012-07-20 13:37:48 -04001669 FLAG_RANGE (HB_UNICODE_GENERAL_CATEGORY_FORMAT, HB_UNICODE_GENERAL_CATEGORY_NON_SPACING_MARK))))
Behdad Esfahbod85fc6c42012-08-02 12:21:44 -04001670 info[start].mask |= indic_plan->mask_array[INIT];
Behdad Esfahboda913b022012-05-11 20:59:26 +02001671
Behdad Esfahbodeed903b2012-05-11 20:50:53 +02001672
Behdad Esfahbod8ed248d2012-07-20 11:42:24 -04001673 /*
1674 * Finish off the clusters and go home!
1675 */
Behdad Esfahbod9ac6b012013-10-17 16:27:38 +02001676 if (hb_options ().uniscribe_bug_compatible)
Behdad Esfahbodebe29732012-05-11 16:43:12 +02001677 {
Behdad Esfahbod9ac6b012013-10-17 16:27:38 +02001678 switch ((hb_tag_t) plan->props.script)
1679 {
1680 case HB_SCRIPT_TAMIL:
1681 case HB_SCRIPT_SINHALA:
1682 break;
1683
1684 default:
1685 /* Uniscribe merges the entire cluster... Except for Tamil & Sinhala.
1686 * This means, half forms are submerged into the main consonants cluster.
1687 * This is unnecessary, and makes cursor positioning harder, but that's what
1688 * Uniscribe does. */
1689 buffer->merge_clusters (start, end);
1690 break;
1691 }
Behdad Esfahbod21d28032012-05-10 18:34:34 +02001692 }
Behdad Esfahbodef24cc82012-05-09 17:56:03 +02001693}
Behdad Esfahbode7be0572011-07-31 15:18:57 -04001694
1695
Behdad Esfahbodef24cc82012-05-09 17:56:03 +02001696static void
Behdad Esfahbod8bb5deb2012-08-02 10:07:58 -04001697final_reordering (const hb_ot_shape_plan_t *plan,
Behdad Esfahbod0beb66e2012-12-05 18:46:04 -05001698 hb_font_t *font HB_UNUSED,
Behdad Esfahbod3e38c0f2012-08-02 09:44:18 -04001699 hb_buffer_t *buffer)
Behdad Esfahbodef24cc82012-05-09 17:56:03 +02001700{
1701 unsigned int count = buffer->len;
Behdad Esfahbod327d14e2012-08-31 16:49:34 -04001702 if (unlikely (!count)) return;
Behdad Esfahbode7be0572011-07-31 15:18:57 -04001703
Behdad Esfahbodecb0b242015-07-22 12:02:09 +01001704 foreach_syllable (buffer, start, end)
1705 final_reordering_syllable (plan, buffer, start, end);
Behdad Esfahbodef24cc82012-05-09 17:56:03 +02001706
Behdad Esfahbod743807a2011-07-29 16:37:02 -04001707 HB_BUFFER_DEALLOCATE_VAR (buffer, indic_category);
1708 HB_BUFFER_DEALLOCATE_VAR (buffer, indic_position);
1709}
1710
1711
Behdad Esfahbod30145272013-10-15 13:47:27 +02001712static void
1713clear_syllables (const hb_ot_shape_plan_t *plan HB_UNUSED,
1714 hb_font_t *font HB_UNUSED,
1715 hb_buffer_t *buffer)
1716{
1717 hb_glyph_info_t *info = buffer->info;
1718 unsigned int count = buffer->len;
1719 for (unsigned int i = 0; i < count; i++)
1720 info[i].syllable() = 0;
1721}
1722
1723
Behdad Esfahbodeba312c2012-11-16 12:39:23 -08001724static bool
1725decompose_indic (const hb_ot_shape_normalize_context_t *c,
Behdad Esfahbod07369152012-11-13 12:35:35 -08001726 hb_codepoint_t ab,
1727 hb_codepoint_t *a,
1728 hb_codepoint_t *b)
1729{
1730 switch (ab)
1731 {
1732 /* Don't decompose these. */
Behdad Esfahbod3cc48a42016-12-26 13:10:31 -05001733 case 0x0931u : return false; /* DEVANAGARI LETTER RRA */
1734 case 0x0B94u : return false; /* TAMIL LETTER AU */
Behdad Esfahbod07369152012-11-13 12:35:35 -08001735
1736
1737 /*
1738 * Decompose split matras that don't have Unicode decompositions.
1739 */
1740
Behdad Esfahbod3cc48a42016-12-26 13:10:31 -05001741 /* Khmer */
Behdad Esfahbod76271002014-07-11 14:54:42 -04001742 case 0x17BEu : *a = 0x17C1u; *b= 0x17BEu; return true;
1743 case 0x17BFu : *a = 0x17C1u; *b= 0x17BFu; return true;
1744 case 0x17C0u : *a = 0x17C1u; *b= 0x17C0u; return true;
1745 case 0x17C4u : *a = 0x17C1u; *b= 0x17C4u; return true;
1746 case 0x17C5u : *a = 0x17C1u; *b= 0x17C5u; return true;
Behdad Esfahbod3cc48a42016-12-26 13:10:31 -05001747
Behdad Esfahbod07369152012-11-13 12:35:35 -08001748#if 0
Behdad Esfahbod3cc48a42016-12-26 13:10:31 -05001749 /* Gujarati */
Behdad Esfahbod07369152012-11-13 12:35:35 -08001750 /* This one has no decomposition in Unicode, but needs no decomposition either. */
Behdad Esfahbod76271002014-07-11 14:54:42 -04001751 /* case 0x0AC9u : return false; */
Behdad Esfahbod3cc48a42016-12-26 13:10:31 -05001752
1753 /* Oriya */
Behdad Esfahbod76271002014-07-11 14:54:42 -04001754 case 0x0B57u : *a = no decomp, -> RIGHT; return true;
Behdad Esfahbod07369152012-11-13 12:35:35 -08001755#endif
1756 }
1757
Ebrahim Byagowi3b0e47c2017-06-19 14:47:09 +04301758 if ((ab == 0x0DDAu || hb_in_range<hb_codepoint_t> (ab, 0x0DDCu, 0x0DDEu)))
Behdad Esfahbod07369152012-11-13 12:35:35 -08001759 {
Behdad Esfahbod43b65312012-11-16 13:12:35 -08001760 /*
1761 * Sinhala split matras... Let the fun begin.
1762 *
1763 * These four characters have Unicode decompositions. However, Uniscribe
1764 * decomposes them "Khmer-style", that is, it uses the character itself to
1765 * get the second half. The first half of all four decompositions is always
1766 * U+0DD9.
1767 *
1768 * Now, there are buggy fonts, namely, the widely used lklug.ttf, that are
1769 * broken with Uniscribe. But we need to support them. As such, we only
1770 * do the Uniscribe-style decomposition if the character is transformed into
1771 * its "sec.half" form by the 'pstf' feature. Otherwise, we fall back to
1772 * Unicode decomposition.
1773 *
1774 * Note that we can't unconditionally use Unicode decomposition. That would
1775 * break some other fonts, that are designed to work with Uniscribe, and
1776 * don't have positioning features for the Unicode-style decomposition.
1777 *
1778 * Argh...
Behdad Esfahbodb71b0bd2012-12-05 19:20:31 -05001779 *
1780 * The Uniscribe behavior is now documented in the newly published Sinhala
1781 * spec in 2012:
1782 *
1783 * http://www.microsoft.com/typography/OpenTypeDev/sinhala/intro.htm#shaping
Behdad Esfahbod43b65312012-11-16 13:12:35 -08001784 */
1785
1786 const indic_shape_plan_t *indic_plan = (const indic_shape_plan_t *) c->plan->data;
1787
1788 hb_codepoint_t glyph;
1789
Behdad Esfahbodbab02d32013-02-12 15:26:45 -05001790 if (hb_options ().uniscribe_bug_compatible ||
Behdad Esfahbod8b5bc142016-02-24 19:05:23 +09001791 (c->font->get_nominal_glyph (ab, &glyph) &&
Behdad Esfahbodb5a0f692013-10-17 18:04:23 +02001792 indic_plan->pstf.would_substitute (&glyph, 1, c->font->face)))
Behdad Esfahbod43b65312012-11-16 13:12:35 -08001793 {
1794 /* Ok, safe to use Uniscribe-style decomposition. */
Behdad Esfahbod76271002014-07-11 14:54:42 -04001795 *a = 0x0DD9u;
Behdad Esfahbod43b65312012-11-16 13:12:35 -08001796 *b = ab;
1797 return true;
1798 }
Behdad Esfahbod07369152012-11-13 12:35:35 -08001799 }
1800
Behdad Esfahbodea512f72015-11-26 19:22:22 -05001801 return (bool) c->unicode->decompose (ab, a, b);
Behdad Esfahbod07369152012-11-13 12:35:35 -08001802}
1803
Behdad Esfahbodeba312c2012-11-16 12:39:23 -08001804static bool
1805compose_indic (const hb_ot_shape_normalize_context_t *c,
Behdad Esfahbod07369152012-11-13 12:35:35 -08001806 hb_codepoint_t a,
1807 hb_codepoint_t b,
1808 hb_codepoint_t *ab)
1809{
1810 /* Avoid recomposing split matras. */
Behdad Esfahbodeba312c2012-11-16 12:39:23 -08001811 if (HB_UNICODE_GENERAL_CATEGORY_IS_MARK (c->unicode->general_category (a)))
Behdad Esfahbod07369152012-11-13 12:35:35 -08001812 return false;
1813
1814 /* Composition-exclusion exceptions that we want to recompose. */
Behdad Esfahbod76271002014-07-11 14:54:42 -04001815 if (a == 0x09AFu && b == 0x09BCu) { *ab = 0x09DFu; return true; }
Behdad Esfahbod07369152012-11-13 12:35:35 -08001816
Behdad Esfahbodea512f72015-11-26 19:22:22 -05001817 return (bool) c->unicode->compose (a, b, ab);
Behdad Esfahbod07369152012-11-13 12:35:35 -08001818}
1819
1820
Behdad Esfahbod693918e2012-07-30 21:08:51 -04001821const hb_ot_complex_shaper_t _hb_ot_complex_shaper_indic =
1822{
1823 "indic",
1824 collect_features_indic,
1825 override_features_indic,
Behdad Esfahboda8c6da92012-08-02 10:46:34 -04001826 data_create_indic,
1827 data_destroy_indic,
Behdad Esfahbod9f9f04c2012-08-11 18:34:13 -04001828 NULL, /* preprocess_text */
Behdad Esfahbod13686332015-11-05 13:24:15 -08001829 NULL, /* postprocess_glyphs */
Behdad Esfahbod3d6ca0d2013-12-31 16:04:35 +08001830 HB_OT_SHAPE_NORMALIZATION_MODE_COMPOSED_DIACRITICS_NO_SHORT_CIRCUIT,
Behdad Esfahbod07369152012-11-13 12:35:35 -08001831 decompose_indic,
1832 compose_indic,
Behdad Esfahbod693918e2012-07-30 21:08:51 -04001833 setup_masks_indic,
Behdad Esfahbode2b87802016-12-22 14:40:19 -06001834 NULL, /* disable_otl */
Behdad Esfahbod71b4c992013-10-28 00:20:59 +01001835 HB_OT_SHAPE_ZERO_WIDTH_MARKS_NONE,
Behdad Esfahbod865745b2012-11-14 13:48:26 -08001836 false, /* fallback_position */
Behdad Esfahbod693918e2012-07-30 21:08:51 -04001837};