blob: 44481dbb4c8b7ac4939efb23f68eefc7e89551b0 [file] [log] [blame]
/*
 * Copyright © 2011,2012  Google, Inc.
 *
 *  This is part of HarfBuzz, a text shaping library.
 *
 * Permission is hereby granted, without written agreement and without
 * license or royalty fees, to use, copy, modify, and distribute this
 * software and its documentation for any purpose, provided that the
 * above copyright notice and the following two paragraphs appear in
 * all copies of this software.
 *
 * IN NO EVENT SHALL THE COPYRIGHT HOLDER BE LIABLE TO ANY PARTY FOR
 * DIRECT, INDIRECT, SPECIAL, INCIDENTAL, OR CONSEQUENTIAL DAMAGES
 * ARISING OUT OF THE USE OF THIS SOFTWARE AND ITS DOCUMENTATION, EVEN
 * IF THE COPYRIGHT HOLDER HAS BEEN ADVISED OF THE POSSIBILITY OF SUCH
 * DAMAGE.
 *
 * THE COPYRIGHT HOLDER SPECIFICALLY DISCLAIMS ANY WARRANTIES, INCLUDING,
 * BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND
 * FITNESS FOR A PARTICULAR PURPOSE.  THE SOFTWARE PROVIDED HEREUNDER IS
 * ON AN "AS IS" BASIS, AND THE COPYRIGHT HOLDER HAS NO OBLIGATION TO
 * PROVIDE MAINTENANCE, SUPPORT, UPDATES, ENHANCEMENTS, OR MODIFICATIONS.
 *
 * Google Author(s): Behdad Esfahbod
 */
26
Behdad Esfahbod3ed46342012-04-19 22:34:06 -040027#include "hb-ot-shape-complex-indic-private.hh"
Behdad Esfahbod49c5ec52012-07-23 20:14:13 -040028#include "hb-ot-layout-private.hh"
Behdad Esfahbod352372a2011-07-30 19:04:02 -040029
/* Buffer variable allocations: accessors for the two per-glyph bytes
 * the Indic shaper uses. */
#define indic_category() complex_var_u8_0() /* holds an indic_category_t */
#define indic_position() complex_var_u8_1() /* holds an indic_position_t */
33
34
35/*
36 * Indic shaper.
37 */
38
39
/* True when code point `u` falls in the 128-code-point half-block starting
 * at `Base`.  The low seven bits of `u` are masked off before comparing, so
 * the test can only succeed when `Base` has its low seven bits clear. */
#define IN_HALF_BLOCK(u, Base) (((u) & ~0x7Fu) == (Base))

/* Per-script half-block membership tests. */
#define IS_DEVA(u) (IN_HALF_BLOCK (u, 0x0900u))
#define IS_BENG(u) (IN_HALF_BLOCK (u, 0x0980u))
#define IS_GURU(u) (IN_HALF_BLOCK (u, 0x0A00u))
#define IS_GUJR(u) (IN_HALF_BLOCK (u, 0x0A80u))
#define IS_ORYA(u) (IN_HALF_BLOCK (u, 0x0B00u))
#define IS_TAML(u) (IN_HALF_BLOCK (u, 0x0B80u))
#define IS_TELU(u) (IN_HALF_BLOCK (u, 0x0C00u))
#define IS_KNDA(u) (IN_HALF_BLOCK (u, 0x0C80u))
#define IS_MLYM(u) (IN_HALF_BLOCK (u, 0x0D00u))
#define IS_SINH(u) (IN_HALF_BLOCK (u, 0x0D80u))
#define IS_KHMR(u) (IN_HALF_BLOCK (u, 0x1780u))


/*
 * Matra position tables.
 *
 * Each macro maps the code point of a matra to a POS_* value, selected by
 * the half-block the code point belongs to; code points outside every
 * listed half-block get POS_AFTER_SUB.  The argument is parenthesized at
 * every use, so passing an expression (e.g. `base | offset`) is safe.
 * Note the argument is expanded several times: do not pass expressions
 * with side effects.
 */
#define MATRA_POS_LEFT(u) POS_PRE_M
#define MATRA_POS_RIGHT(u) ( \
			  IS_DEVA(u) ? POS_AFTER_SUB  : \
			  IS_BENG(u) ? POS_AFTER_POST : \
			  IS_GURU(u) ? POS_AFTER_POST : \
			  IS_GUJR(u) ? POS_AFTER_POST : \
			  IS_ORYA(u) ? POS_AFTER_POST : \
			  IS_TAML(u) ? POS_AFTER_POST : \
			  IS_TELU(u) ? ((u) <= 0x0C42u ? POS_BEFORE_SUB : POS_AFTER_SUB) : \
			  IS_KNDA(u) ? ((u) < 0x0CC3u || (u) > 0x0CD6u ? POS_BEFORE_SUB : POS_AFTER_SUB) : \
			  IS_MLYM(u) ? POS_AFTER_POST : \
			  IS_SINH(u) ? POS_AFTER_SUB  : \
			  IS_KHMR(u) ? POS_AFTER_POST : \
			  /*default*/  POS_AFTER_SUB    \
			  )
#define MATRA_POS_TOP(u) ( /* BENG and MLYM don't have top matras. */ \
			  IS_DEVA(u) ? POS_AFTER_SUB  : \
			  IS_GURU(u) ? POS_AFTER_POST : /* Deviate from spec */ \
			  IS_GUJR(u) ? POS_AFTER_SUB  : \
			  IS_ORYA(u) ? POS_AFTER_MAIN : \
			  IS_TAML(u) ? POS_AFTER_SUB  : \
			  IS_TELU(u) ? POS_BEFORE_SUB : \
			  IS_KNDA(u) ? POS_BEFORE_SUB : \
			  IS_SINH(u) ? POS_AFTER_SUB  : \
			  IS_KHMR(u) ? POS_AFTER_POST : \
			  /*default*/  POS_AFTER_SUB    \
			  )
#define MATRA_POS_BOTTOM(u) ( \
			  IS_DEVA(u) ? POS_AFTER_SUB  : \
			  IS_BENG(u) ? POS_AFTER_SUB  : \
			  IS_GURU(u) ? POS_AFTER_POST : \
			  IS_GUJR(u) ? POS_AFTER_POST : \
			  IS_ORYA(u) ? POS_AFTER_SUB  : \
			  IS_TAML(u) ? POS_AFTER_POST : \
			  IS_TELU(u) ? POS_BEFORE_SUB : \
			  IS_KNDA(u) ? POS_BEFORE_SUB : \
			  IS_MLYM(u) ? POS_AFTER_POST : \
			  IS_SINH(u) ? POS_AFTER_SUB  : \
			  IS_KHMR(u) ? POS_AFTER_POST : \
			  /*default*/  POS_AFTER_SUB    \
			  )
96
97static inline indic_position_t
98matra_position (hb_codepoint_t u, indic_position_t side)
99{
100 switch ((int) side)
101 {
102 case POS_PRE_C: return MATRA_POS_LEFT (u);
103 case POS_POST_C: return MATRA_POS_RIGHT (u);
104 case POS_ABOVE_C: return MATRA_POS_TOP (u);
105 case POS_BELOW_C: return MATRA_POS_BOTTOM (u);
106 };
107 return side;
108}
109
110/* XXX
111 * This is a hack for now. We should move this data into the main Indic table.
112 * Or completely remove it and just check in the tables.
113 */
114static const hb_codepoint_t ra_chars[] = {
Behdad Esfahbod76271002014-07-11 14:54:42 -0400115 0x0930u, /* Devanagari */
116 0x09B0u, /* Bengali */
117 0x09F0u, /* Bengali */
118 0x0A30u, /* Gurmukhi */ /* No Reph */
119 0x0AB0u, /* Gujarati */
120 0x0B30u, /* Oriya */
121 0x0BB0u, /* Tamil */ /* No Reph */
122 0x0C30u, /* Telugu */ /* Reph formed only with ZWJ */
123 0x0CB0u, /* Kannada */
124 0x0D30u, /* Malayalam */ /* No Reph, Logical Repha */
Behdad Esfahbod3a83d332013-02-12 12:14:10 -0500125
Behdad Esfahbod76271002014-07-11 14:54:42 -0400126 0x0DBBu, /* Sinhala */ /* Reph formed only with ZWJ */
Behdad Esfahbod3a83d332013-02-12 12:14:10 -0500127
Behdad Esfahbod76271002014-07-11 14:54:42 -0400128 0x179Au, /* Khmer */ /* No Reph, Visual Repha */
Behdad Esfahbod3a83d332013-02-12 12:14:10 -0500129};
130
Behdad Esfahbod3a83d332013-02-12 12:14:10 -0500131static inline bool
132is_ra (hb_codepoint_t u)
133{
134 for (unsigned int i = 0; i < ARRAY_LENGTH (ra_chars); i++)
135 if (u == ra_chars[i])
136 return true;
137 return false;
138}
139
140static inline bool
141is_one_of (const hb_glyph_info_t &info, unsigned int flags)
142{
143 /* If it ligated, all bets are off. */
Behdad Esfahboda1f7b282013-10-18 01:09:08 +0200144 if (_hb_glyph_info_ligated (&info)) return false;
Behdad Esfahbodf8160a42015-07-21 15:50:02 +0100145 return !!(FLAG_SAFE (info.indic_category()) & flags);
Behdad Esfahbod3a83d332013-02-12 12:14:10 -0500146}
147
Behdad Esfahbod3a83d332013-02-12 12:14:10 -0500148static inline bool
149is_joiner (const hb_glyph_info_t &info)
150{
151 return is_one_of (info, JOINER_FLAGS);
152}
153
Behdad Esfahbod3a83d332013-02-12 12:14:10 -0500154static inline bool
155is_consonant (const hb_glyph_info_t &info)
156{
157 return is_one_of (info, CONSONANT_FLAGS);
158}
159
Behdad Esfahbod3a83d332013-02-12 12:14:10 -0500160static inline bool
161is_halant_or_coeng (const hb_glyph_info_t &info)
162{
163 return is_one_of (info, HALANT_OR_COENG_FLAGS);
164}
165
166static inline void
167set_indic_properties (hb_glyph_info_t &info)
168{
169 hb_codepoint_t u = info.codepoint;
170 unsigned int type = hb_indic_get_categories (u);
Behdad Esfahbod76271002014-07-11 14:54:42 -0400171 indic_category_t cat = (indic_category_t) (type & 0x7Fu);
Behdad Esfahbod3a83d332013-02-12 12:14:10 -0500172 indic_position_t pos = (indic_position_t) (type >> 8);
173
174
175 /*
176 * Re-assign category
177 */
178
179
180 /* The spec says U+0952 is OT_A. However, testing shows that Uniscribe
Behdad Esfahbodc11fc682014-05-22 18:41:49 -0400181 * treats a whole bunch of characters similarly.
182 * TESTS: For example, for U+0951:
Behdad Esfahbod3a83d332013-02-12 12:14:10 -0500183 * U+092E,U+0947,U+0952
184 * U+092E,U+0952,U+0947
185 * U+092E,U+0947,U+0951
186 * U+092E,U+0951,U+0947
Behdad Esfahbodc11fc682014-05-22 18:41:49 -0400187 * U+092E,U+0951,U+0952
188 * U+092E,U+0952,U+0951
Behdad Esfahbod3756efa2013-10-16 19:06:29 +0200189 */
Behdad Esfahbod76271002014-07-11 14:54:42 -0400190 if (unlikely (hb_in_ranges (u, 0x0951u, 0x0952u,
191 0x1CD0u, 0x1CD2u,
192 0x1CD4u, 0x1CE1u) ||
193 u == 0x1CF4u))
Behdad Esfahbod3756efa2013-10-16 19:06:29 +0200194 cat = OT_A;
Behdad Esfahbodc11fc682014-05-22 18:41:49 -0400195 /* The following act more like the Bindus. */
Behdad Esfahbod76271002014-07-11 14:54:42 -0400196 else if (unlikely (hb_in_range (u, 0x0953u, 0x0954u)))
Behdad Esfahbodc11fc682014-05-22 18:41:49 -0400197 cat = OT_SM;
Behdad Esfahbod131e17f2014-05-22 19:32:51 -0400198 /* The following act like consonants. */
Behdad Esfahbod76271002014-07-11 14:54:42 -0400199 else if (unlikely (hb_in_ranges (u, 0x0A72u, 0x0A73u,
200 0x1CF5u, 0x1CF6u)))
Behdad Esfahbod131e17f2014-05-22 19:32:51 -0400201 cat = OT_C;
Behdad Esfahbodecb98ba2014-05-22 19:36:21 -0400202 /* TODO: The following should only be allowed after a Visarga.
203 * For now, just treat them like regular tone marks. */
Behdad Esfahbod76271002014-07-11 14:54:42 -0400204 else if (unlikely (hb_in_range (u, 0x1CE2u, 0x1CE8u)))
Behdad Esfahbodecb98ba2014-05-22 19:36:21 -0400205 cat = OT_A;
Behdad Esfahbode9b2a4c2014-05-23 15:49:10 -0400206 /* TODO: The following should only be allowed after some of
207 * the nasalization marks, maybe only for U+1CE9..U+1CF1.
208 * For now, just treat them like tone marks. */
Behdad Esfahbod76271002014-07-11 14:54:42 -0400209 else if (unlikely (u == 0x1CEDu))
Behdad Esfahbode9b2a4c2014-05-23 15:49:10 -0400210 cat = OT_A;
Behdad Esfahbodd19f8e82014-05-23 15:45:50 -0400211 /* The following take marks in standalone clusters, similar to Avagraha. */
Behdad Esfahbod76271002014-07-11 14:54:42 -0400212 else if (unlikely (hb_in_ranges (u, 0xA8F2u, 0xA8F7u,
213 0x1CE9u, 0x1CECu,
214 0x1CEEu, 0x1CF1u)))
Behdad Esfahbodd19f8e82014-05-23 15:45:50 -0400215 {
216 cat = OT_Symbol;
217 ASSERT_STATIC ((int) INDIC_SYLLABIC_CATEGORY_AVAGRAHA == OT_Symbol);
218 }
Behdad Esfahbod76271002014-07-11 14:54:42 -0400219 else if (unlikely (hb_in_range (u, 0x17CDu, 0x17D1u) ||
220 u == 0x17CBu || u == 0x17D3u || u == 0x17DDu)) /* Khmer Various signs */
Behdad Esfahbod3a83d332013-02-12 12:14:10 -0500221 {
222 /* These are like Top Matras. */
223 cat = OT_M;
224 pos = POS_ABOVE_C;
225 }
Behdad Esfahbod76271002014-07-11 14:54:42 -0400226 else if (unlikely (u == 0x17C6u)) cat = OT_N; /* Khmer Bindu doesn't like to be repositioned. */
227 else if (unlikely (u == 0x17D2u)) cat = OT_Coeng; /* Khmer coeng */
228 else if (unlikely (hb_in_range (u, 0x2010u, 0x2011u)))
229 cat = OT_PLACEHOLDER;
230 else if (unlikely (u == 0x25CCu)) cat = OT_DOTTEDCIRCLE;
231 else if (unlikely (u == 0xA982u)) cat = OT_SM; /* Javanese repha. */
232 else if (unlikely (u == 0xA9BEu)) cat = OT_CM2; /* Javanese medial ya. */
233 else if (unlikely (u == 0xA9BDu)) { cat = OT_M; pos = POS_POST_C; } /* Javanese vocalic r. */
Behdad Esfahbod3a83d332013-02-12 12:14:10 -0500234
235
236 /*
237 * Re-assign position.
238 */
239
Behdad Esfahbodf8160a42015-07-21 15:50:02 +0100240 if ((FLAG_SAFE (cat) & CONSONANT_FLAGS))
Behdad Esfahbod3a83d332013-02-12 12:14:10 -0500241 {
Behdad Esfahbodc4e71ff2013-10-17 17:04:47 +0200242 pos = POS_BASE_C;
Behdad Esfahbod3a83d332013-02-12 12:14:10 -0500243 if (is_ra (u))
244 cat = OT_Ra;
245 }
246 else if (cat == OT_M)
247 {
248 pos = matra_position (u, pos);
249 }
Behdad Esfahbodf8160a42015-07-21 15:50:02 +0100250 else if ((FLAG_SAFE (cat) & (FLAG (OT_SM) | FLAG (OT_VD) | FLAG (OT_A) | FLAG (OT_Symbol))))
Behdad Esfahbod3a83d332013-02-12 12:14:10 -0500251 {
252 pos = POS_SMVD;
253 }
254
Behdad Esfahbod76271002014-07-11 14:54:42 -0400255 if (unlikely (u == 0x0B01u)) pos = POS_BEFORE_SUB; /* Oriya Bindu is BeforeSub in the spec. */
Behdad Esfahbod3a83d332013-02-12 12:14:10 -0500256
257
258
259 info.indic_category() = cat;
260 info.indic_position() = pos;
261}
262
263/*
264 * Things above this line should ideally be moved to the Indic table itself.
265 */
266
Behdad Esfahbod1d002042012-08-02 05:01:11 -0400267
/*
 * Indic configurations.  Note that we do not necessarily want to keep every single
 * script-specific behavior in these tables.  They should mainly be used for per-script
 * properties that are cheaper to keep here than in the code.  I.e. if, say, one and
 * only one script has an exception, that one script can be if'ed directly in the code,
 * instead of adding a new flag in these structs.
 */
275
/* Per-script base-consonant policy; stored in indic_config_t::base_pos. */
enum base_position_t
{
  BASE_POS_FIRST,
  BASE_POS_LAST_SINHALA,
  BASE_POS_LAST
};
281enum reph_position_t {
Behdad Esfahbod11b0e202012-08-02 14:21:40 -0400282 REPH_POS_AFTER_MAIN = POS_AFTER_MAIN,
283 REPH_POS_BEFORE_SUB = POS_BEFORE_SUB,
284 REPH_POS_AFTER_SUB = POS_AFTER_SUB,
285 REPH_POS_BEFORE_POST = POS_BEFORE_POST,
Behdad Esfahbod74f4bbf2013-10-17 19:07:53 +0200286 REPH_POS_AFTER_POST = POS_AFTER_POST,
287 REPH_POS_DONT_CARE = POS_RA_TO_BECOME_REPH
Behdad Esfahbod11b0e202012-08-02 14:21:40 -0400288};
/* How a script forms its reph. */
enum reph_mode_t
{
  /* Reph formed out of initial Ra,H sequence. */
  REPH_MODE_IMPLICIT,
  /* Reph formed out of initial Ra,H,ZWJ sequence. */
  REPH_MODE_EXPLICIT,
  /* Encoded Repha character, no reordering needed. */
  REPH_MODE_VIS_REPHA,
  /* Encoded Repha character, needs reordering. */
  REPH_MODE_LOG_REPHA
};
/* Which consonants the below-forms feature is applied to. */
enum blwf_mode_t
{
  /* Below-forms feature applied to pre-base and post-base. */
  BLWF_MODE_PRE_AND_POST,
  /* Below-forms feature applied to post-base only. */
  BLWF_MODE_POST_ONLY
};
/* Number of glyphs matched against the 'pref' feature lookups
 * (see consonant_position_from_face). */
enum pref_len_t
{
  PREF_LEN_1         = 1,
  PREF_LEN_2         = 2,
  PREF_LEN_DONT_CARE = PREF_LEN_2
};
Behdad Esfahbod11b0e202012-08-02 14:21:40 -0400304struct indic_config_t
305{
306 hb_script_t script;
307 bool has_old_spec;
308 hb_codepoint_t virama;
309 base_position_t base_pos;
310 reph_position_t reph_pos;
311 reph_mode_t reph_mode;
Behdad Esfahbod8acbb6b2013-10-15 12:15:49 +0200312 blwf_mode_t blwf_mode;
Behdad Esfahbod74f4bbf2013-10-17 19:07:53 +0200313 pref_len_t pref_len;
Behdad Esfahbod11b0e202012-08-02 14:21:40 -0400314};
315
316static const indic_config_t indic_configs[] =
317{
318 /* Default. Should be first. */
Behdad Esfahbod76271002014-07-11 14:54:42 -0400319 {HB_SCRIPT_INVALID, false, 0,BASE_POS_LAST, REPH_POS_BEFORE_POST,REPH_MODE_IMPLICIT, BLWF_MODE_PRE_AND_POST, PREF_LEN_1},
320 {HB_SCRIPT_DEVANAGARI,true, 0x094Du,BASE_POS_LAST, REPH_POS_BEFORE_POST,REPH_MODE_IMPLICIT, BLWF_MODE_PRE_AND_POST, PREF_LEN_DONT_CARE},
321 {HB_SCRIPT_BENGALI, true, 0x09CDu,BASE_POS_LAST, REPH_POS_AFTER_SUB, REPH_MODE_IMPLICIT, BLWF_MODE_PRE_AND_POST, PREF_LEN_DONT_CARE},
322 {HB_SCRIPT_GURMUKHI, true, 0x0A4Du,BASE_POS_LAST, REPH_POS_BEFORE_SUB, REPH_MODE_IMPLICIT, BLWF_MODE_PRE_AND_POST, PREF_LEN_DONT_CARE},
323 {HB_SCRIPT_GUJARATI, true, 0x0ACDu,BASE_POS_LAST, REPH_POS_BEFORE_POST,REPH_MODE_IMPLICIT, BLWF_MODE_PRE_AND_POST, PREF_LEN_DONT_CARE},
324 {HB_SCRIPT_ORIYA, true, 0x0B4Du,BASE_POS_LAST, REPH_POS_AFTER_MAIN, REPH_MODE_IMPLICIT, BLWF_MODE_PRE_AND_POST, PREF_LEN_DONT_CARE},
325 {HB_SCRIPT_TAMIL, true, 0x0BCDu,BASE_POS_LAST, REPH_POS_AFTER_POST, REPH_MODE_IMPLICIT, BLWF_MODE_PRE_AND_POST, PREF_LEN_2},
326 {HB_SCRIPT_TELUGU, true, 0x0C4Du,BASE_POS_LAST, REPH_POS_AFTER_POST, REPH_MODE_EXPLICIT, BLWF_MODE_POST_ONLY, PREF_LEN_2},
327 {HB_SCRIPT_KANNADA, true, 0x0CCDu,BASE_POS_LAST, REPH_POS_AFTER_POST, REPH_MODE_IMPLICIT, BLWF_MODE_POST_ONLY, PREF_LEN_2},
328 {HB_SCRIPT_MALAYALAM, true, 0x0D4Du,BASE_POS_LAST, REPH_POS_AFTER_MAIN, REPH_MODE_LOG_REPHA,BLWF_MODE_PRE_AND_POST, PREF_LEN_2},
329 {HB_SCRIPT_SINHALA, false,0x0DCAu,BASE_POS_LAST_SINHALA,
330 REPH_POS_AFTER_MAIN, REPH_MODE_EXPLICIT, BLWF_MODE_PRE_AND_POST, PREF_LEN_DONT_CARE},
331 {HB_SCRIPT_KHMER, false,0x17D2u,BASE_POS_FIRST,REPH_POS_DONT_CARE, REPH_MODE_VIS_REPHA,BLWF_MODE_PRE_AND_POST, PREF_LEN_2},
332 {HB_SCRIPT_JAVANESE, false,0xA9C0u,BASE_POS_FIRST,REPH_POS_DONT_CARE, REPH_MODE_VIS_REPHA,BLWF_MODE_PRE_AND_POST, PREF_LEN_1},
Behdad Esfahbod11b0e202012-08-02 14:21:40 -0400333};
334
335
336
337/*
338 * Indic shaper.
339 */
Behdad Esfahbod9ccc6382012-07-19 12:32:16 -0400340
Behdad Esfahbodeed903b2012-05-11 20:50:53 +0200341struct feature_list_t {
Behdad Esfahbodc7fe56a2011-06-24 19:05:34 -0400342 hb_tag_t tag;
Behdad Esfahbodec544862013-02-14 11:25:10 -0500343 hb_ot_map_feature_flags_t flags;
Behdad Esfahbodeed903b2012-05-11 20:50:53 +0200344};
345
346static const feature_list_t
Behdad Esfahbod85fc6c42012-08-02 12:21:44 -0400347indic_features[] =
Behdad Esfahbodb9ddbd52011-06-02 17:43:12 -0400348{
Behdad Esfahbod85fc6c42012-08-02 12:21:44 -0400349 /*
350 * Basic features.
351 * These features are applied in order, one at a time, after initial_reordering.
352 */
Behdad Esfahboda8cf7b42013-03-19 05:53:26 -0400353 {HB_TAG('n','u','k','t'), F_GLOBAL},
354 {HB_TAG('a','k','h','n'), F_GLOBAL},
355 {HB_TAG('r','p','h','f'), F_NONE},
356 {HB_TAG('r','k','r','f'), F_GLOBAL},
357 {HB_TAG('p','r','e','f'), F_NONE},
358 {HB_TAG('b','l','w','f'), F_NONE},
Behdad Esfahboda8cf7b42013-03-19 05:53:26 -0400359 {HB_TAG('a','b','v','f'), F_NONE},
Behdad Esfahboda01cbf62013-10-15 16:37:53 +0200360 {HB_TAG('h','a','l','f'), F_NONE},
Behdad Esfahboda8cf7b42013-03-19 05:53:26 -0400361 {HB_TAG('p','s','t','f'), F_NONE},
Behdad Esfahboda8cf7b42013-03-19 05:53:26 -0400362 {HB_TAG('v','a','t','u'), F_GLOBAL},
363 {HB_TAG('c','j','c','t'), F_GLOBAL},
Behdad Esfahboda01cbf62013-10-15 16:37:53 +0200364 {HB_TAG('c','f','a','r'), F_NONE},
Behdad Esfahbod85fc6c42012-08-02 12:21:44 -0400365 /*
366 * Other features.
367 * These features are applied all at once, after final_reordering.
Behdad Esfahboda01cbf62013-10-15 16:37:53 +0200368 * Default Bengali font in Windows for example has intermixed
369 * lookups for init,pres,abvs,blws features.
Behdad Esfahbod85fc6c42012-08-02 12:21:44 -0400370 */
Behdad Esfahbodec544862013-02-14 11:25:10 -0500371 {HB_TAG('i','n','i','t'), F_NONE},
372 {HB_TAG('p','r','e','s'), F_GLOBAL},
373 {HB_TAG('a','b','v','s'), F_GLOBAL},
374 {HB_TAG('b','l','w','s'), F_GLOBAL},
375 {HB_TAG('p','s','t','s'), F_GLOBAL},
376 {HB_TAG('h','a','l','n'), F_GLOBAL},
Behdad Esfahbod85fc6c42012-08-02 12:21:44 -0400377 /* Positioning features, though we don't care about the types. */
Behdad Esfahbodec544862013-02-14 11:25:10 -0500378 {HB_TAG('d','i','s','t'), F_GLOBAL},
379 {HB_TAG('a','b','v','m'), F_GLOBAL},
380 {HB_TAG('b','l','w','m'), F_GLOBAL},
Behdad Esfahbodc7fe56a2011-06-24 19:05:34 -0400381};
382
/*
 * Indices into indic_features[] (and into indic_shape_plan_t::mask_array).
 * Must be in the same order as the indic_features array.
 */
enum
{
  /* Basic features. */
  _NUKT,
  _AKHN,
  RPHF,
  _RKRF,
  PREF,
  BLWF,
  ABVF,
  HALF,
  PSTF,
  _VATU,
  _CJCT,
  CFAR,

  /* Other features. */
  INIT,
  _PRES,
  _ABVS,
  _BLWS,
  _PSTS,
  _HALN,
  _DIST,
  _ABVM,
  _BLWM,

  /* Total number of entries. */
  INDIC_NUM_FEATURES,
  /* Number of basic features == index of the first "other" feature.
   * Don't forget to update this! */
  INDIC_BASIC_FEATURES = INIT
};
413
Behdad Esfahbod743807a2011-07-29 16:37:02 -0400414static void
Behdad Esfahbod166b5cf2012-09-07 14:55:07 -0400415setup_syllables (const hb_ot_shape_plan_t *plan,
416 hb_font_t *font,
417 hb_buffer_t *buffer);
418static void
Behdad Esfahbod8bb5deb2012-08-02 10:07:58 -0400419initial_reordering (const hb_ot_shape_plan_t *plan,
Behdad Esfahbodafbcc242012-08-02 08:36:40 -0400420 hb_font_t *font,
Behdad Esfahbod3e38c0f2012-08-02 09:44:18 -0400421 hb_buffer_t *buffer);
Behdad Esfahbodf6fd3782011-07-08 00:22:40 -0400422static void
Behdad Esfahbod8bb5deb2012-08-02 10:07:58 -0400423final_reordering (const hb_ot_shape_plan_t *plan,
Behdad Esfahbodafbcc242012-08-02 08:36:40 -0400424 hb_font_t *font,
Behdad Esfahbod3e38c0f2012-08-02 09:44:18 -0400425 hb_buffer_t *buffer);
Behdad Esfahbod30145272013-10-15 13:47:27 +0200426static void
427clear_syllables (const hb_ot_shape_plan_t *plan,
428 hb_font_t *font,
429 hb_buffer_t *buffer);
Behdad Esfahbodb9ddbd52011-06-02 17:43:12 -0400430
Behdad Esfahbod693918e2012-07-30 21:08:51 -0400431static void
Behdad Esfahbod16c6a272012-08-02 09:38:28 -0400432collect_features_indic (hb_ot_shape_planner_t *plan)
Behdad Esfahbodb9ddbd52011-06-02 17:43:12 -0400433{
Behdad Esfahbod16c6a272012-08-02 09:38:28 -0400434 hb_ot_map_builder_t *map = &plan->map;
435
Behdad Esfahbod166b5cf2012-09-07 14:55:07 -0400436 /* Do this before any lookups have been applied. */
437 map->add_gsub_pause (setup_syllables);
438
Behdad Esfahbode7ffcfa2013-02-14 11:05:56 -0500439 map->add_global_bool_feature (HB_TAG('l','o','c','l'));
Behdad Esfahboda54a5502011-07-20 16:42:10 -0400440 /* The Indic specs do not require ccmp, but we apply it here since if
441 * there is a use of it, it's typically at the beginning. */
Behdad Esfahbode7ffcfa2013-02-14 11:05:56 -0500442 map->add_global_bool_feature (HB_TAG('c','c','m','p'));
Behdad Esfahbodf6fd3782011-07-08 00:22:40 -0400443
Behdad Esfahbodf6fd3782011-07-08 00:22:40 -0400444
Behdad Esfahbod85fc6c42012-08-02 12:21:44 -0400445 unsigned int i = 0;
446 map->add_gsub_pause (initial_reordering);
447 for (; i < INDIC_BASIC_FEATURES; i++) {
Behdad Esfahboda8cf7b42013-03-19 05:53:26 -0400448 map->add_feature (indic_features[i].tag, 1, indic_features[i].flags | F_MANUAL_ZWJ);
Behdad Esfahbod3e38c0f2012-08-02 09:44:18 -0400449 map->add_gsub_pause (NULL);
Behdad Esfahbod412b9182012-05-09 11:07:18 +0200450 }
Behdad Esfahbod3e38c0f2012-08-02 09:44:18 -0400451 map->add_gsub_pause (final_reordering);
Behdad Esfahbod85fc6c42012-08-02 12:21:44 -0400452 for (; i < INDIC_NUM_FEATURES; i++) {
Behdad Esfahboda8cf7b42013-03-19 05:53:26 -0400453 map->add_feature (indic_features[i].tag, 1, indic_features[i].flags | F_MANUAL_ZWJ);
Behdad Esfahbod85fc6c42012-08-02 12:21:44 -0400454 }
Behdad Esfahbod42d0f552013-10-17 13:05:05 +0200455
456 map->add_global_bool_feature (HB_TAG('c','a','l','t'));
457 map->add_global_bool_feature (HB_TAG('c','l','i','g'));
458
Behdad Esfahbod30145272013-10-15 13:47:27 +0200459 map->add_gsub_pause (clear_syllables);
Behdad Esfahbodb9ddbd52011-06-02 17:43:12 -0400460}
461
Behdad Esfahbod693918e2012-07-30 21:08:51 -0400462static void
Behdad Esfahbod16c6a272012-08-02 09:38:28 -0400463override_features_indic (hb_ot_shape_planner_t *plan)
Behdad Esfahbodd96838e2012-07-16 20:26:57 -0400464{
Behdad Esfahbodeb102332013-10-15 15:26:44 +0200465 /* Uniscribe does not apply 'kern' in Khmer. */
Behdad Esfahbodbab02d32013-02-12 15:26:45 -0500466 if (hb_options ().uniscribe_bug_compatible)
Behdad Esfahbodeb102332013-10-15 15:26:44 +0200467 {
468 switch ((hb_tag_t) plan->props.script)
469 {
470 case HB_SCRIPT_KHMER:
Behdad Esfahbod9ac6b012013-10-17 16:27:38 +0200471 plan->map.add_feature (HB_TAG('k','e','r','n'), 0, F_GLOBAL);
Behdad Esfahbodeb102332013-10-15 15:26:44 +0200472 break;
473 }
474 }
Behdad Esfahbod6b389dd2012-11-12 11:02:56 -0800475
Behdad Esfahbodec544862013-02-14 11:25:10 -0500476 plan->map.add_feature (HB_TAG('l','i','g','a'), 0, F_GLOBAL);
Behdad Esfahbodd96838e2012-07-16 20:26:57 -0400477}
478
Behdad Esfahbod867361c2011-06-17 18:35:46 -0400479
Behdad Esfahbod85fc6c42012-08-02 12:21:44 -0400480struct would_substitute_feature_t
Behdad Esfahboda8c6da92012-08-02 10:46:34 -0400481{
Behdad Esfahbodb5a0f692013-10-17 18:04:23 +0200482 inline void init (const hb_ot_map_t *map, hb_tag_t feature_tag, bool zero_context_)
Behdad Esfahboda8c6da92012-08-02 10:46:34 -0400483 {
Behdad Esfahbodb5a0f692013-10-17 18:04:23 +0200484 zero_context = zero_context_;
Behdad Esfahboda8c6da92012-08-02 10:46:34 -0400485 map->get_stage_lookups (0/*GSUB*/,
486 map->get_feature_stage (0/*GSUB*/, feature_tag),
487 &lookups, &count);
488 }
489
Behdad Esfahbod81449362013-03-05 20:08:59 -0500490 inline bool would_substitute (const hb_codepoint_t *glyphs,
491 unsigned int glyphs_count,
Behdad Esfahbod81449362013-03-05 20:08:59 -0500492 hb_face_t *face) const
Behdad Esfahboda8c6da92012-08-02 10:46:34 -0400493 {
494 for (unsigned int i = 0; i < count; i++)
Behdad Esfahbod362a9902012-11-15 14:57:31 -0800495 if (hb_ot_layout_lookup_would_substitute_fast (face, lookups[i].index, glyphs, glyphs_count, zero_context))
Behdad Esfahboda8c6da92012-08-02 10:46:34 -0400496 return true;
497 return false;
498 }
499
500 private:
501 const hb_ot_map_t::lookup_map_t *lookups;
502 unsigned int count;
Behdad Esfahbodb5a0f692013-10-17 18:04:23 +0200503 bool zero_context;
Behdad Esfahboda8c6da92012-08-02 10:46:34 -0400504};
505
506struct indic_shape_plan_t
507{
Behdad Esfahbod85fc6c42012-08-02 12:21:44 -0400508 ASSERT_POD ();
Behdad Esfahbod914ffaa2012-08-02 11:03:39 -0400509
510 inline bool get_virama_glyph (hb_font_t *font, hb_codepoint_t *pglyph) const
511 {
512 hb_codepoint_t glyph = virama_glyph;
513 if (unlikely (virama_glyph == (hb_codepoint_t) -1))
514 {
Behdad Esfahbod11b0e202012-08-02 14:21:40 -0400515 if (!config->virama || !font->get_glyph (config->virama, 0, &glyph))
Behdad Esfahbod914ffaa2012-08-02 11:03:39 -0400516 glyph = 0;
517 /* Technically speaking, the spec says we should apply 'locl' to virama too.
518 * Maybe one day... */
519
520 /* Our get_glyph() function needs a font, so we can't get the virama glyph
521 * during shape planning... Instead, overwrite it here. It's safe. Don't worry! */
522 (const_cast<indic_shape_plan_t *> (this))->virama_glyph = glyph;
523 }
524
525 *pglyph = glyph;
526 return glyph != 0;
527 }
Behdad Esfahbod85fc6c42012-08-02 12:21:44 -0400528
Behdad Esfahbod11b0e202012-08-02 14:21:40 -0400529 const indic_config_t *config;
Behdad Esfahbod85fc6c42012-08-02 12:21:44 -0400530
531 bool is_old_spec;
Behdad Esfahbod85fc6c42012-08-02 12:21:44 -0400532 hb_codepoint_t virama_glyph;
533
Behdad Esfahbodf2c0f592012-11-12 14:02:02 -0800534 would_substitute_feature_t rphf;
Behdad Esfahbod85fc6c42012-08-02 12:21:44 -0400535 would_substitute_feature_t pref;
536 would_substitute_feature_t blwf;
537 would_substitute_feature_t pstf;
538
539 hb_mask_t mask_array[INDIC_NUM_FEATURES];
Behdad Esfahboda8c6da92012-08-02 10:46:34 -0400540};
541
542static void *
543data_create_indic (const hb_ot_shape_plan_t *plan)
544{
Behdad Esfahbod85fc6c42012-08-02 12:21:44 -0400545 indic_shape_plan_t *indic_plan = (indic_shape_plan_t *) calloc (1, sizeof (indic_shape_plan_t));
546 if (unlikely (!indic_plan))
Behdad Esfahboda8c6da92012-08-02 10:46:34 -0400547 return NULL;
548
Behdad Esfahbod11b0e202012-08-02 14:21:40 -0400549 indic_plan->config = &indic_configs[0];
550 for (unsigned int i = 1; i < ARRAY_LENGTH (indic_configs); i++)
551 if (plan->props.script == indic_configs[i].script) {
552 indic_plan->config = &indic_configs[i];
553 break;
Behdad Esfahbod85fc6c42012-08-02 12:21:44 -0400554 }
Behdad Esfahbod11b0e202012-08-02 14:21:40 -0400555
Behdad Esfahbod76271002014-07-11 14:54:42 -0400556 indic_plan->is_old_spec = indic_plan->config->has_old_spec && ((plan->map.chosen_script[0] & 0x000000FFu) != '2');
Behdad Esfahbod11b0e202012-08-02 14:21:40 -0400557 indic_plan->virama_glyph = (hb_codepoint_t) -1;
Behdad Esfahboda8c6da92012-08-02 10:46:34 -0400558
Behdad Esfahbodb5a0f692013-10-17 18:04:23 +0200559 /* Use zero-context would_substitute() matching for new-spec of the main
Behdad Esfahbod828e1092014-04-18 16:53:34 -0700560 * Indic scripts, and scripts with one spec only, but not for old-specs. */
561 bool zero_context = !indic_plan->is_old_spec;
Behdad Esfahbodb5a0f692013-10-17 18:04:23 +0200562 indic_plan->rphf.init (&plan->map, HB_TAG('r','p','h','f'), zero_context);
563 indic_plan->pref.init (&plan->map, HB_TAG('p','r','e','f'), zero_context);
564 indic_plan->blwf.init (&plan->map, HB_TAG('b','l','w','f'), zero_context);
565 indic_plan->pstf.init (&plan->map, HB_TAG('p','s','t','f'), zero_context);
Behdad Esfahbod85fc6c42012-08-02 12:21:44 -0400566
567 for (unsigned int i = 0; i < ARRAY_LENGTH (indic_plan->mask_array); i++)
Behdad Esfahbodec544862013-02-14 11:25:10 -0500568 indic_plan->mask_array[i] = (indic_features[i].flags & F_GLOBAL) ?
569 0 : plan->map.get_1_mask (indic_features[i].tag);
Behdad Esfahbod85fc6c42012-08-02 12:21:44 -0400570
571 return indic_plan;
Behdad Esfahboda8c6da92012-08-02 10:46:34 -0400572}
573
/* Releases shaper data previously returned by data_create_indic().
 * `data` is handed straight to free(). */
static void
data_destroy_indic (void *data)
{
  void *indic_plan = data;
  free (indic_plan);
}
579
580static indic_position_t
581consonant_position_from_face (const indic_shape_plan_t *indic_plan,
Behdad Esfahbod684fe592013-10-17 18:30:06 +0200582 const hb_codepoint_t consonant,
583 const hb_codepoint_t virama,
Behdad Esfahbod81449362013-03-05 20:08:59 -0500584 hb_face_t *face)
Behdad Esfahboda8c6da92012-08-02 10:46:34 -0400585{
Behdad Esfahbod81449362013-03-05 20:08:59 -0500586 /* For old-spec, the order of glyphs is Consonant,Virama,
587 * whereas for new-spec, it's Virama,Consonant. However,
588 * some broken fonts (like Free Sans) simply copied lookups
589 * from old-spec to new-spec without modification.
590 * And oddly enough, Uniscribe seems to respect those lookups.
591 * Eg. in the sequence U+0924,U+094D,U+0930, Uniscribe finds
592 * base at 0. The font however, only has lookups matching
593 * 930,94D in 'blwf', not the expected 94D,930 (with new-spec
594 * table). As such, we simply match both sequences. Seems
595 * to work. */
Behdad Esfahbod684fe592013-10-17 18:30:06 +0200596 hb_codepoint_t glyphs[3] = {virama, consonant, virama};
Behdad Esfahbodb5a0f692013-10-17 18:04:23 +0200597 if (indic_plan->blwf.would_substitute (glyphs , 2, face) ||
Behdad Esfahbod684fe592013-10-17 18:30:06 +0200598 indic_plan->blwf.would_substitute (glyphs+1, 2, face))
Behdad Esfahbod81449362013-03-05 20:08:59 -0500599 return POS_BELOW_C;
Behdad Esfahbodb5a0f692013-10-17 18:04:23 +0200600 if (indic_plan->pstf.would_substitute (glyphs , 2, face) ||
Behdad Esfahbod684fe592013-10-17 18:30:06 +0200601 indic_plan->pstf.would_substitute (glyphs+1, 2, face))
Behdad Esfahbod81449362013-03-05 20:08:59 -0500602 return POS_POST_C;
Behdad Esfahbod74f4bbf2013-10-17 19:07:53 +0200603 unsigned int pref_len = indic_plan->config->pref_len;
604 if ((pref_len == PREF_LEN_2 &&
605 (indic_plan->pref.would_substitute (glyphs , 2, face) ||
606 indic_plan->pref.would_substitute (glyphs+1, 2, face)))
607 || (pref_len == PREF_LEN_1 &&
608 indic_plan->pref.would_substitute (glyphs+1, 1, face)))
Behdad Esfahbodae9a5832013-10-17 12:24:55 +0200609 return POS_POST_C;
Behdad Esfahboda8c6da92012-08-02 10:46:34 -0400610 return POS_BASE_C;
611}
612
613
/* Kinds of syllable; declared ahead of the inclusion of the generated
 * syllable machine header. */
enum syllable_type_t
{
  consonant_syllable,
  vowel_syllable,
  standalone_cluster,
  symbol_cluster,
  broken_cluster,
  non_indic_cluster
};
622
623#include "hb-ot-shape-complex-indic-machine.hh"
624
625
Behdad Esfahbod693918e2012-07-30 21:08:51 -0400626static void
Behdad Esfahbod16c6a272012-08-02 09:38:28 -0400627setup_masks_indic (const hb_ot_shape_plan_t *plan HB_UNUSED,
628 hb_buffer_t *buffer,
629 hb_font_t *font HB_UNUSED)
Behdad Esfahbod24eacf12012-08-02 08:42:11 -0400630{
631 HB_BUFFER_ALLOCATE_VAR (buffer, indic_category);
632 HB_BUFFER_ALLOCATE_VAR (buffer, indic_position);
633
634 /* We cannot setup masks here. We save information about characters
635 * and setup masks later on in a pause-callback. */
636
637 unsigned int count = buffer->len;
Behdad Esfahbod7cd33f22014-07-17 14:22:11 -0400638 hb_glyph_info_t *info = buffer->info;
Behdad Esfahbod24eacf12012-08-02 08:42:11 -0400639 for (unsigned int i = 0; i < count; i++)
Behdad Esfahbod7cd33f22014-07-17 14:22:11 -0400640 set_indic_properties (info[i]);
Behdad Esfahbod24eacf12012-08-02 08:42:11 -0400641}
642
Behdad Esfahbod166b5cf2012-09-07 14:55:07 -0400643static void
644setup_syllables (const hb_ot_shape_plan_t *plan HB_UNUSED,
645 hb_font_t *font HB_UNUSED,
646 hb_buffer_t *buffer)
647{
648 find_syllables (buffer);
649}
650
Behdad Esfahbod24eacf12012-08-02 08:42:11 -0400651static int
652compare_indic_order (const hb_glyph_info_t *pa, const hb_glyph_info_t *pb)
653{
654 int a = pa->indic_position();
655 int b = pb->indic_position();
656
657 return a < b ? -1 : a == b ? 0 : +1;
658}
659
660
661
662static void
Behdad Esfahbod8bb5deb2012-08-02 10:07:58 -0400663update_consonant_positions (const hb_ot_shape_plan_t *plan,
Behdad Esfahbod85fc6c42012-08-02 12:21:44 -0400664 hb_font_t *font,
665 hb_buffer_t *buffer)
Behdad Esfahbod8ef3d532012-08-02 07:53:18 -0400666{
Behdad Esfahboda8c6da92012-08-02 10:46:34 -0400667 const indic_shape_plan_t *indic_plan = (const indic_shape_plan_t *) plan->data;
Behdad Esfahbod8ef3d532012-08-02 07:53:18 -0400668
Behdad Esfahbodc4e71ff2013-10-17 17:04:47 +0200669 if (indic_plan->config->base_pos != BASE_POS_LAST)
670 return;
671
Behdad Esfahbod684fe592013-10-17 18:30:06 +0200672 hb_codepoint_t virama;
673 if (indic_plan->get_virama_glyph (font, &virama))
Behdad Esfahbod8ef3d532012-08-02 07:53:18 -0400674 {
675 hb_face_t *face = font->face;
676 unsigned int count = buffer->len;
Behdad Esfahbod7cd33f22014-07-17 14:22:11 -0400677 hb_glyph_info_t *info = buffer->info;
Behdad Esfahbod8ef3d532012-08-02 07:53:18 -0400678 for (unsigned int i = 0; i < count; i++)
Behdad Esfahbod7cd33f22014-07-17 14:22:11 -0400679 if (info[i].indic_position() == POS_BASE_C)
680 {
681 hb_codepoint_t consonant = info[i].codepoint;
682 info[i].indic_position() = consonant_position_from_face (indic_plan, consonant, virama, face);
Behdad Esfahbod8ef3d532012-08-02 07:53:18 -0400683 }
684 }
685}
686
Behdad Esfahbod867361c2011-06-17 18:35:46 -0400687
/* Rules from:
 * https://www.microsoft.com/typography/otfntdev/devanot/shaping.aspx */
690
Behdad Esfahbod743807a2011-07-29 16:37:02 -0400691static void
Behdad Esfahbodf2c0f592012-11-12 14:02:02 -0800692initial_reordering_consonant_syllable (const hb_ot_shape_plan_t *plan,
693 hb_face_t *face,
694 hb_buffer_t *buffer,
Behdad Esfahbodef24cc82012-05-09 17:56:03 +0200695 unsigned int start, unsigned int end)
Behdad Esfahbod743807a2011-07-29 16:37:02 -0400696{
Behdad Esfahbod914ffaa2012-08-02 11:03:39 -0400697 const indic_shape_plan_t *indic_plan = (const indic_shape_plan_t *) plan->data;
Behdad Esfahbodee58f3b2011-07-30 19:15:53 -0400698 hb_glyph_info_t *info = buffer->info;
Behdad Esfahbod743807a2011-07-29 16:37:02 -0400699
Behdad Esfahbod617f4ac2012-05-13 16:48:03 +0200700
Behdad Esfahbod743807a2011-07-29 16:37:02 -0400701 /* 1. Find base consonant:
702 *
703 * The shaping engine finds the base consonant of the syllable, using the
704 * following algorithm: starting from the end of the syllable, move backwards
705 * until a consonant is found that does not have a below-base or post-base
706 * form (post-base forms have to follow below-base forms), or that is not a
707 * pre-base reordering Ra, or arrive at the first consonant. The consonant
708 * stopped at will be the base.
709 *
710 * o If the syllable starts with Ra + Halant (in a script that has Reph)
711 * and has more than one consonant, Ra is excluded from candidates for
712 * base consonants.
713 */
714
Behdad Esfahbod5e720712011-07-31 17:51:50 -0400715 unsigned int base = end;
Behdad Esfahbod76b34092012-05-09 11:43:43 +0200716 bool has_reph = false;
717
Behdad Esfahbod76b34092012-05-09 11:43:43 +0200718 {
Behdad Esfahbod617f4ac2012-05-13 16:48:03 +0200719 /* -> If the syllable starts with Ra + Halant (in a script that has Reph)
720 * and has more than one consonant, Ra is excluded from candidates for
721 * base consonants. */
722 unsigned int limit = start;
Behdad Esfahbodf175aa32013-10-18 02:07:44 +0200723 if (indic_plan->config->reph_pos != REPH_POS_DONT_CARE &&
Behdad Esfahbodefed40b2013-10-17 18:50:11 +0200724 indic_plan->mask_array[RPHF] &&
Behdad Esfahbod617f4ac2012-05-13 16:48:03 +0200725 start + 3 <= end &&
Behdad Esfahbod8b217f52012-12-21 15:48:32 -0500726 (
Behdad Esfahbod11b0e202012-08-02 14:21:40 -0400727 (indic_plan->config->reph_mode == REPH_MODE_IMPLICIT && !is_joiner (info[start + 2])) ||
728 (indic_plan->config->reph_mode == REPH_MODE_EXPLICIT && info[start + 2].indic_category() == OT_ZWJ)
Behdad Esfahbod3285e102012-07-18 17:22:14 -0400729 ))
Behdad Esfahbod617f4ac2012-05-13 16:48:03 +0200730 {
Behdad Esfahbodf2c0f592012-11-12 14:02:02 -0800731 /* See if it matches the 'rphf' feature. */
Behdad Esfahbod29531122014-05-15 14:04:02 -0600732 hb_codepoint_t glyphs[3] = {info[start].codepoint,
733 info[start + 1].codepoint,
734 indic_plan->config->reph_mode == REPH_MODE_EXPLICIT ?
735 info[start + 2].codepoint : 0};
736 if (indic_plan->rphf.would_substitute (glyphs, 2, face) ||
737 (indic_plan->config->reph_mode == REPH_MODE_EXPLICIT &&
738 indic_plan->rphf.would_substitute (glyphs, 3, face)))
Behdad Esfahbodf2c0f592012-11-12 14:02:02 -0800739 {
740 limit += 2;
741 while (limit < end && is_joiner (info[limit]))
742 limit++;
743 base = start;
744 has_reph = true;
745 }
Behdad Esfahbod8b217f52012-12-21 15:48:32 -0500746 } else if (indic_plan->config->reph_mode == REPH_MODE_LOG_REPHA && info[start].indic_category() == OT_Repha)
747 {
748 limit += 1;
749 while (limit < end && is_joiner (info[limit]))
750 limit++;
751 base = start;
752 has_reph = true;
753 }
Behdad Esfahbod743807a2011-07-29 16:37:02 -0400754
Behdad Esfahbod23b0e9d2012-08-26 14:30:18 -0400755 switch (indic_plan->config->base_pos)
Behdad Esfahbod14dbdd92012-07-18 13:13:03 -0400756 {
Behdad Esfahbodd469fad2012-11-14 15:07:36 -0800757 default:
758 assert (false);
Behdad Esfahbod305d2fb2015-10-21 11:04:28 -0200759 HB_FALLTHROUGH;
Behdad Esfahbodd469fad2012-11-14 15:07:36 -0800760
Behdad Esfahbod11b0e202012-08-02 14:21:40 -0400761 case BASE_POS_LAST:
762 {
763 /* -> starting from the end of the syllable, move backwards */
764 unsigned int i = end;
765 bool seen_below = false;
766 do {
767 i--;
768 /* -> until a consonant is found */
769 if (is_consonant (info[i]))
770 {
771 /* -> that does not have a below-base or post-base form
772 * (post-base forms have to follow below-base forms), */
773 if (info[i].indic_position() != POS_BELOW_C &&
774 (info[i].indic_position() != POS_POST_C || seen_below))
775 {
776 base = i;
777 break;
778 }
779 if (info[i].indic_position() == POS_BELOW_C)
780 seen_below = true;
781
782 /* -> or that is not a pre-base reordering Ra,
783 *
784 * IMPLEMENTATION NOTES:
785 *
Behdad Esfahbodfb7c1822013-03-06 00:53:24 -0500786 * Our pre-base reordering Ra's are marked POS_POST_C, so will be skipped
Behdad Esfahbod11b0e202012-08-02 14:21:40 -0400787 * by the logic above already.
788 */
789
790 /* -> or arrive at the first consonant. The consonant stopped at will
791 * be the base. */
792 base = i;
793 }
794 else
795 {
796 /* A ZWJ after a Halant stops the base search, and requests an explicit
797 * half form.
798 * A ZWJ before a Halant, requests a subjoined form instead, and hence
799 * search continues. This is particularly important for Bengali
Behdad Esfahbodc4be9912012-11-12 14:27:33 -0800800 * sequence Ra,H,Ya that should form Ya-Phalaa by subjoining Ya. */
Behdad Esfahbod11b0e202012-08-02 14:21:40 -0400801 if (start < i &&
802 info[i].indic_category() == OT_ZWJ &&
803 info[i - 1].indic_category() == OT_H)
804 break;
805 }
806 } while (i > limit);
807 }
808 break;
809
Behdad Esfahbode10453e2013-10-17 16:49:06 +0200810 case BASE_POS_LAST_SINHALA:
Behdad Esfahbod11b0e202012-08-02 14:21:40 -0400811 {
Behdad Esfahbodc4e71ff2013-10-17 17:04:47 +0200812 /* Sinhala base positioning is slightly different from main Indic, in that:
Behdad Esfahbodb082ef32014-04-25 11:48:10 -0700813 * 1. Its ZWJ behavior is different,
Behdad Esfahbodc4e71ff2013-10-17 17:04:47 +0200814 * 2. We don't need to look into the font for consonant positions.
815 */
Behdad Esfahbod11b0e202012-08-02 14:21:40 -0400816
817 if (!has_reph)
818 base = limit;
819
820 /* Find the last base consonant that is not blocked by ZWJ. If there is
821 * a ZWJ right before a base consonant, that would request a subjoined form. */
822 for (unsigned int i = limit; i < end; i++)
Behdad Esfahbodc4e71ff2013-10-17 17:04:47 +0200823 if (is_consonant (info[i]))
Behdad Esfahbod11b0e202012-08-02 14:21:40 -0400824 {
825 if (limit < i && info[i - 1].indic_category() == OT_ZWJ)
826 break;
827 else
828 base = i;
829 }
830
831 /* Mark all subsequent consonants as below. */
832 for (unsigned int i = base + 1; i < end; i++)
Behdad Esfahbodc4e71ff2013-10-17 17:04:47 +0200833 if (is_consonant (info[i]))
Behdad Esfahbod11b0e202012-08-02 14:21:40 -0400834 info[i].indic_position() = POS_BELOW_C;
835 }
836 break;
Behdad Esfahbode10453e2013-10-17 16:49:06 +0200837
838 case BASE_POS_FIRST:
839 {
840 /* The first consonant is always the base. */
841
842 assert (indic_plan->config->reph_mode == REPH_MODE_VIS_REPHA);
Behdad Esfahbodefed40b2013-10-17 18:50:11 +0200843 assert (!has_reph);
Behdad Esfahbode10453e2013-10-17 16:49:06 +0200844
845 base = start;
846
847 /* Mark all subsequent consonants as below. */
848 for (unsigned int i = base + 1; i < end; i++)
Behdad Esfahbodc4e71ff2013-10-17 17:04:47 +0200849 if (is_consonant (info[i]))
Behdad Esfahbode10453e2013-10-17 16:49:06 +0200850 info[i].indic_position() = POS_BELOW_C;
851 }
852 break;
Behdad Esfahbod5d326902012-07-17 14:23:28 -0400853 }
Behdad Esfahbod3c2ea942012-05-11 16:23:38 +0200854
Behdad Esfahbod617f4ac2012-05-13 16:48:03 +0200855 /* -> If the syllable starts with Ra + Halant (in a script that has Reph)
856 * and has more than one consonant, Ra is excluded from candidates for
Behdad Esfahbod2278eef2012-07-24 00:26:43 -0400857 * base consonants.
858 *
859 * Only do this for unforced Reph. (ie. not for Ra,H,ZWJ. */
Behdad Esfahbod9621e0b2013-02-11 06:58:27 -0500860 if (has_reph && base == start && limit - base <= 2) {
Behdad Esfahbod617f4ac2012-05-13 16:48:03 +0200861 /* Have no other consonant, so Reph is not formed and Ra becomes base. */
862 has_reph = false;
863 }
Behdad Esfahbod5e4e21f2012-05-13 16:46:08 +0200864 }
Behdad Esfahbod2278eef2012-07-24 00:26:43 -0400865
Behdad Esfahbod3d250792012-05-10 11:37:42 +0200866
Behdad Esfahbod743807a2011-07-29 16:37:02 -0400867 /* 2. Decompose and reorder Matras:
868 *
869 * Each matra and any syllable modifier sign in the cluster are moved to the
870 * appropriate position relative to the consonant(s) in the cluster. The
871 * shaping engine decomposes two- or three-part matras into their constituent
872 * parts before any repositioning. Matra characters are classified by which
873 * consonant in a conjunct they have affinity for and are reordered to the
874 * following positions:
875 *
876 * o Before first half form in the syllable
877 * o After subjoined consonants
878 * o After post-form consonant
879 * o After main consonant (for above marks)
880 *
881 * IMPLEMENTATION NOTES:
882 *
883 * The normalize() routine has already decomposed matras for us, so we don't
884 * need to worry about that.
885 */
886
887
888 /* 3. Reorder marks to canonical order:
889 *
890 * Adjacent nukta and halant or nukta and vedic sign are always repositioned
891 * if necessary, so that the nukta is first.
892 *
893 * IMPLEMENTATION NOTES:
894 *
895 * We don't need to do this: the normalize() routine already did this for us.
896 */
897
898
Behdad Esfahbod45d6f292011-07-30 14:44:30 -0400899 /* Reorder characters */
900
Behdad Esfahbod3c2ea942012-05-11 16:23:38 +0200901 for (unsigned int i = start; i < base; i++)
Behdad Esfahbod900cf3d2012-07-20 10:18:23 -0400902 info[i].indic_position() = MIN (POS_PRE_C, (indic_position_t) info[i].indic_position());
Behdad Esfahbod55f70eb2012-07-17 12:50:13 -0400903
Behdad Esfahbod075d6712012-07-18 15:41:53 -0400904 if (base < end)
905 info[base].indic_position() = POS_BASE_C;
Behdad Esfahbod45d6f292011-07-30 14:44:30 -0400906
Behdad Esfahbod55f70eb2012-07-17 12:50:13 -0400907 /* Mark final consonants. A final consonant is one appearing after a matra,
908 * like in Khmer. */
909 for (unsigned int i = base + 1; i < end; i++)
910 if (info[i].indic_category() == OT_M) {
911 for (unsigned int j = i + 1; j < end; j++)
912 if (is_consonant (info[j])) {
913 info[j].indic_position() = POS_FINAL_C;
914 break;
915 }
916 break;
917 }
918
Behdad Esfahbodfd06bf52011-07-30 20:14:44 -0400919 /* Handle beginning Ra */
Behdad Esfahbod5e4e21f2012-05-13 16:46:08 +0200920 if (has_reph)
Behdad Esfahboddbb10582012-05-10 13:45:52 +0200921 info[start].indic_position() = POS_RA_TO_BECOME_REPH;
Behdad Esfahbodfd06bf52011-07-30 20:14:44 -0400922
Behdad Esfahbodf5bc2722011-07-30 21:08:10 -0400923 /* For old-style Indic script tags, move the first post-base Halant after
Behdad Esfahbodfc0daaf2014-07-23 16:48:51 -0400924 * last consonant.
925 *
926 * Reports suggest that in some scripts Uniscribe does this only if there
927 * is *not* a Halant after last consonant already (eg. Kannada), while it
928 * does it unconditionally in other scripts (eg. Malayalam). We don't
929 * currently know about other scripts, so we single out Malayalam for now.
930 *
931 * Kannada test case:
932 * U+0C9A,U+0CCD,U+0C9A,U+0CCD
933 * With some versions of Lohit Kannada.
934 * https://bugs.freedesktop.org/show_bug.cgi?id=59118
935 *
936 * Malayalam test case:
937 * U+0D38,U+0D4D,U+0D31,U+0D4D,U+0D31,U+0D4D
938 * With lohit-ttf-20121122/Lohit-Malayalam.ttf
939 */
940 if (indic_plan->is_old_spec)
941 {
942 bool disallow_double_halants = buffer->props.script != HB_SCRIPT_MALAYALAM;
Behdad Esfahbod3c2ea942012-05-11 16:23:38 +0200943 for (unsigned int i = base + 1; i < end; i++)
Behdad Esfahbodfc0daaf2014-07-23 16:48:51 -0400944 if (info[i].indic_category() == OT_H)
945 {
Behdad Esfahbodf5bc2722011-07-30 21:08:10 -0400946 unsigned int j;
947 for (j = end - 1; j > i; j--)
Behdad Esfahbodfc0daaf2014-07-23 16:48:51 -0400948 if (is_consonant (info[j]) ||
949 (disallow_double_halants && info[j].indic_category() == OT_H))
Behdad Esfahbodf5bc2722011-07-30 21:08:10 -0400950 break;
Behdad Esfahbodecd454b2013-01-08 18:09:46 -0600951 if (info[j].indic_category() != OT_H && j > i) {
Behdad Esfahbodf5bc2722011-07-30 21:08:10 -0400952 /* Move Halant to after last consonant. */
953 hb_glyph_info_t t = info[i];
954 memmove (&info[i], &info[i + 1], (j - i) * sizeof (info[0]));
955 info[j] = t;
956 }
957 break;
958 }
959 }
960
Behdad Esfahbod81202bd2012-07-20 15:10:02 -0400961 /* Attach misc marks to previous char to move with them. */
Behdad Esfahbodebe29732012-05-11 16:43:12 +0200962 {
Behdad Esfahbod81202bd2012-07-20 15:10:02 -0400963 indic_position_t last_pos = POS_START;
964 for (unsigned int i = start; i < end; i++)
965 {
Behdad Esfahbodf8160a42015-07-21 15:50:02 +0100966 if ((FLAG_SAFE (info[i].indic_category()) & (JOINER_FLAGS | FLAG (OT_N) | FLAG (OT_RS) | MEDIAL_FLAGS | HALANT_OR_COENG_FLAGS)))
Behdad Esfahbod81202bd2012-07-20 15:10:02 -0400967 {
968 info[i].indic_position() = last_pos;
Behdad Esfahboddde55062012-11-14 11:37:04 -0800969 if (unlikely (info[i].indic_category() == OT_H &&
Behdad Esfahbod81202bd2012-07-20 15:10:02 -0400970 info[i].indic_position() == POS_PRE_M))
971 {
972 /*
973 * Uniscribe doesn't move the Halant with Left Matra.
974 * TEST: U+092B,U+093F,U+094DE
Behdad Esfahboddde55062012-11-14 11:37:04 -0800975 * We follow. This is important for the Sinhala
976 * U+0DDA split matra since it decomposes to U+0DD9,U+0DCA
977 * where U+0DD9 is a left matra and U+0DCA is the virama.
978 * We don't want to move the virama with the left matra.
979 * TEST: U+0D9A,U+0DDA
Behdad Esfahbod81202bd2012-07-20 15:10:02 -0400980 */
Behdad Esfahbodebe29732012-05-11 16:43:12 +0200981 for (unsigned int j = i; j > start; j--)
Behdad Esfahbod6a091df2012-05-11 21:42:27 +0200982 if (info[j - 1].indic_position() != POS_PRE_M) {
Behdad Esfahbodebe29732012-05-11 16:43:12 +0200983 info[i].indic_position() = info[j - 1].indic_position();
984 break;
985 }
Behdad Esfahbod81202bd2012-07-20 15:10:02 -0400986 }
987 } else if (info[i].indic_position() != POS_SMVD) {
988 last_pos = (indic_position_t) info[i].indic_position();
Behdad Esfahbodebe29732012-05-11 16:43:12 +0200989 }
Behdad Esfahbod81202bd2012-07-20 15:10:02 -0400990 }
Behdad Esfahbodebe29732012-05-11 16:43:12 +0200991 }
Behdad Esfahbodddce2d82013-10-18 18:07:11 +0200992 /* For post-base consonants let them own anything before them
993 * since the last consonant or matra. */
Behdad Esfahbod74ccc6a2012-07-17 11:16:19 -0400994 {
Behdad Esfahbodddce2d82013-10-18 18:07:11 +0200995 unsigned int last = base;
Behdad Esfahbod74ccc6a2012-07-17 11:16:19 -0400996 for (unsigned int i = base + 1; i < end; i++)
Behdad Esfahbodddce2d82013-10-18 18:07:11 +0200997 if (is_consonant (info[i]))
998 {
999 for (unsigned int j = last + 1; j < i; j++)
1000 if (info[j].indic_position() < POS_SMVD)
Behdad Esfahbod81202bd2012-07-20 15:10:02 -04001001 info[j].indic_position() = info[i].indic_position();
Behdad Esfahbodddce2d82013-10-18 18:07:11 +02001002 last = i;
1003 } else if (info[i].indic_category() == OT_M)
1004 last = i;
Behdad Esfahbod74ccc6a2012-07-17 11:16:19 -04001005 }
Behdad Esfahbod45d6f292011-07-30 14:44:30 -04001006
Behdad Esfahbod28d5dae2013-10-16 12:32:12 +02001007
Behdad Esfahboda391ff52012-05-10 11:31:20 +02001008 {
Behdad Esfahbod28d5dae2013-10-16 12:32:12 +02001009 /* Use syllable() for sort accounting temporarily. */
1010 unsigned int syllable = info[start].syllable();
1011 for (unsigned int i = start; i < end; i++)
1012 info[i].syllable() = i - start;
1013
Behdad Esfahboda391ff52012-05-10 11:31:20 +02001014 /* Sit tight, rock 'n roll! */
Behdad Esfahbod85846b32015-09-01 15:07:52 +01001015 hb_stable_sort (info + start, end - start, compare_indic_order);
Behdad Esfahboda391ff52012-05-10 11:31:20 +02001016 /* Find base again */
1017 base = end;
Behdad Esfahbod3c2ea942012-05-11 16:23:38 +02001018 for (unsigned int i = start; i < end; i++)
Behdad Esfahbod28d5dae2013-10-16 12:32:12 +02001019 if (info[i].indic_position() == POS_BASE_C)
1020 {
1021 base = i;
Behdad Esfahboda391ff52012-05-10 11:31:20 +02001022 break;
1023 }
Behdad Esfahbod28d5dae2013-10-16 12:32:12 +02001024 /* Things are out-of-control for post base positions, they may shuffle
1025 * around like crazy. In old-spec mode, we move halants around, so in
1026 * that case merge all clusters after base. Otherwise, check the sort
1027 * order and merge as needed.
Behdad Esfahbod5828c452015-09-01 16:26:35 +01001028 * For pre-base stuff, we handle cluster issues in final reordering.
1029 *
1030 * We could use buffer->sort() for this, if there was no special
1031 * reordering of pre-base stuff happening later...
1032 */
Behdad Esfahbod28d5dae2013-10-16 12:32:12 +02001033 if (indic_plan->is_old_spec || end - base > 127)
1034 buffer->merge_clusters (base, end);
1035 else
1036 {
1037 /* Note! syllable() is a one-byte field. */
1038 for (unsigned int i = base; i < end; i++)
1039 if (info[i].syllable() != 255)
1040 {
1041 unsigned int max = i;
1042 unsigned int j = start + info[i].syllable();
1043 while (j != i)
1044 {
1045 max = MAX (max, j);
1046 unsigned int next = start + info[j].syllable();
1047 info[j].syllable() = 255; /* So we don't process j later again. */
1048 j = next;
1049 }
1050 if (i != max)
1051 buffer->merge_clusters (i, max + 1);
1052 }
1053 }
1054
1055 /* Put syllable back in. */
1056 for (unsigned int i = start; i < end; i++)
1057 info[i].syllable() = syllable;
Behdad Esfahboda391ff52012-05-10 11:31:20 +02001058 }
Behdad Esfahbod45d6f292011-07-30 14:44:30 -04001059
Behdad Esfahbod743807a2011-07-29 16:37:02 -04001060 /* Setup masks now */
1061
Behdad Esfahbod28168392011-07-31 16:00:35 -04001062 {
1063 hb_mask_t mask;
1064
Behdad Esfahboddbb10582012-05-10 13:45:52 +02001065 /* Reph */
Behdad Esfahbod668c6042012-05-11 15:34:13 +02001066 for (unsigned int i = start; i < end && info[i].indic_position() == POS_RA_TO_BECOME_REPH; i++)
Behdad Esfahbod85fc6c42012-08-02 12:21:44 -04001067 info[i].mask |= indic_plan->mask_array[RPHF];
Behdad Esfahboddbb10582012-05-10 13:45:52 +02001068
Behdad Esfahbod28168392011-07-31 16:00:35 -04001069 /* Pre-base */
Behdad Esfahbod85fc6c42012-08-02 12:21:44 -04001070 mask = indic_plan->mask_array[HALF];
Behdad Esfahbodc7dacac2013-10-17 12:20:24 +02001071 if (!indic_plan->is_old_spec &&
1072 indic_plan->config->blwf_mode == BLWF_MODE_PRE_AND_POST)
Behdad Esfahbod8acbb6b2013-10-15 12:15:49 +02001073 mask |= indic_plan->mask_array[BLWF];
Behdad Esfahbod3c2ea942012-05-11 16:23:38 +02001074 for (unsigned int i = start; i < base; i++)
Behdad Esfahbod28168392011-07-31 16:00:35 -04001075 info[i].mask |= mask;
1076 /* Base */
Behdad Esfahbod20b68e62012-07-20 10:47:46 -04001077 mask = 0;
Behdad Esfahbod075d6712012-07-18 15:41:53 -04001078 if (base < end)
1079 info[base].mask |= mask;
Behdad Esfahbod28168392011-07-31 16:00:35 -04001080 /* Post-base */
Behdad Esfahbod85fc6c42012-08-02 12:21:44 -04001081 mask = indic_plan->mask_array[BLWF] | indic_plan->mask_array[ABVF] | indic_plan->mask_array[PSTF];
Behdad Esfahbod3c2ea942012-05-11 16:23:38 +02001082 for (unsigned int i = base + 1; i < end; i++)
Behdad Esfahbod28168392011-07-31 16:00:35 -04001083 info[i].mask |= mask;
1084 }
Behdad Esfahbod9da04872011-07-31 13:46:44 -04001085
Behdad Esfahbod85c51ec2013-02-12 18:17:39 -05001086 if (indic_plan->is_old_spec &&
1087 buffer->props.script == HB_SCRIPT_DEVANAGARI)
1088 {
1089 /* Old-spec eye-lash Ra needs special handling. From the
1090 * spec:
1091 *
1092 * "The feature 'below-base form' is applied to consonants
1093 * having below-base forms and following the base consonant.
1094 * The exception is vattu, which may appear below half forms
1095 * as well as below the base glyph. The feature 'below-base
1096 * form' will be applied to all such occurrences of Ra as well."
1097 *
1098 * Test case: U+0924,U+094D,U+0930,U+094d,U+0915
1099 * with Sanskrit 2003 font.
1100 *
1101 * However, note that Ra,Halant,ZWJ is the correct way to
1102 * request eyelash form of Ra, so we wouldbn't inhibit it
1103 * in that sequence.
1104 *
1105 * Test case: U+0924,U+094D,U+0930,U+094d,U+200D,U+0915
1106 */
1107 for (unsigned int i = start; i + 1 < base; i++)
1108 if (info[i ].indic_category() == OT_Ra &&
1109 info[i+1].indic_category() == OT_H &&
1110 (i + 2 == base ||
1111 info[i+2].indic_category() != OT_ZWJ))
1112 {
1113 info[i ].mask |= indic_plan->mask_array[BLWF];
1114 info[i+1].mask |= indic_plan->mask_array[BLWF];
1115 }
1116 }
1117
Behdad Esfahbod74f4bbf2013-10-17 19:07:53 +02001118 unsigned int pref_len = indic_plan->config->pref_len;
1119 if (indic_plan->mask_array[PREF] && base + pref_len < end)
Behdad Esfahbod17d7de92012-07-16 15:20:15 -04001120 {
Behdad Esfahbod74f4bbf2013-10-17 19:07:53 +02001121 assert (1 <= pref_len && pref_len <= 2);
Behdad Esfahbod771a8f52012-07-23 20:07:50 -04001122 /* Find a Halant,Ra sequence and mark it for pre-base reordering processing. */
Behdad Esfahbod74f4bbf2013-10-17 19:07:53 +02001123 for (unsigned int i = base + 1; i + pref_len - 1 < end; i++) {
1124 hb_codepoint_t glyphs[2];
1125 for (unsigned int j = 0; j < pref_len; j++)
1126 glyphs[j] = info[i + j].codepoint;
1127 if (indic_plan->pref.would_substitute (glyphs, pref_len, face))
Behdad Esfahbod8e7b5882012-07-16 17:04:46 -04001128 {
Behdad Esfahbod74f4bbf2013-10-17 19:07:53 +02001129 for (unsigned int j = 0; j < pref_len; j++)
1130 info[i++].mask |= indic_plan->mask_array[PREF];
Behdad Esfahbod0201e0a2012-07-17 13:55:10 -04001131
1132 /* Mark the subsequent stuff with 'cfar'. Used in Khmer.
1133 * Read the feature spec.
1134 * This allows distinguishing the following cases with MS Khmer fonts:
1135 * U+1784,U+17D2,U+179A,U+17D2,U+1782
1136 * U+1784,U+17D2,U+1782,U+17D2,U+179A
1137 */
Behdad Esfahbod74f4bbf2013-10-17 19:07:53 +02001138 if (indic_plan->mask_array[CFAR])
1139 for (; i < end; i++)
1140 info[i].mask |= indic_plan->mask_array[CFAR];
Behdad Esfahbod0201e0a2012-07-17 13:55:10 -04001141
Behdad Esfahbod8e7b5882012-07-16 17:04:46 -04001142 break;
1143 }
Behdad Esfahbod56be6772012-11-12 14:09:40 -08001144 }
Behdad Esfahbod17d7de92012-07-16 15:20:15 -04001145 }
1146
Behdad Esfahbod9da04872011-07-31 13:46:44 -04001147 /* Apply ZWJ/ZWNJ effects */
Behdad Esfahbod3c2ea942012-05-11 16:23:38 +02001148 for (unsigned int i = start + 1; i < end; i++)
Behdad Esfahbod9da04872011-07-31 13:46:44 -04001149 if (is_joiner (info[i])) {
1150 bool non_joiner = info[i].indic_category() == OT_ZWNJ;
Behdad Esfahbod6b37bc82011-07-31 15:57:00 -04001151 unsigned int j = i;
Behdad Esfahbod9da04872011-07-31 13:46:44 -04001152
1153 do {
Behdad Esfahbod9da04872011-07-31 13:46:44 -04001154 j--;
Behdad Esfahbod6b37bc82011-07-31 15:57:00 -04001155
Behdad Esfahbodcfc507c2013-02-14 10:40:12 -05001156 /* ZWJ/ZWNJ should disable CJCT. They do that by simply
1157 * being there, since we don't skip them for the CJCT
Behdad Esfahboda8cf7b42013-03-19 05:53:26 -04001158 * feature (ie. F_MANUAL_ZWJ) */
Behdad Esfahbod20b68e62012-07-20 10:47:46 -04001159
1160 /* A ZWNJ disables HALF. */
Behdad Esfahbod6b37bc82011-07-31 15:57:00 -04001161 if (non_joiner)
Behdad Esfahbod85fc6c42012-08-02 12:21:44 -04001162 info[j].mask &= ~indic_plan->mask_array[HALF];
Behdad Esfahbod6b37bc82011-07-31 15:57:00 -04001163
Behdad Esfahbod9da04872011-07-31 13:46:44 -04001164 } while (j > start && !is_consonant (info[j]));
1165 }
Behdad Esfahbod743807a2011-07-29 16:37:02 -04001166}
1167
Behdad Esfahbod743807a2011-07-29 16:37:02 -04001168static void
Behdad Esfahbod8bb5deb2012-08-02 10:07:58 -04001169initial_reordering_standalone_cluster (const hb_ot_shape_plan_t *plan,
Behdad Esfahbodf2c0f592012-11-12 14:02:02 -08001170 hb_face_t *face,
Behdad Esfahbod9f377ed2012-05-13 16:13:44 +02001171 hb_buffer_t *buffer,
Behdad Esfahbodef24cc82012-05-09 17:56:03 +02001172 unsigned int start, unsigned int end)
Behdad Esfahbod743807a2011-07-29 16:37:02 -04001173{
Behdad Esfahbodcf78dd42014-05-27 17:53:37 -04001174 /* We treat placeholder/dotted-circle as if they are consonants, so we
1175 * should just chain. Only if not in compatibility mode that is... */
Behdad Esfahbod18c06e12012-05-11 20:02:14 +02001176
Behdad Esfahbodbab02d32013-02-12 15:26:45 -05001177 if (hb_options ().uniscribe_bug_compatible)
Behdad Esfahbod18c06e12012-05-11 20:02:14 +02001178 {
1179 /* For dotted-circle, this is what Uniscribe does:
1180 * If dotted-circle is the last glyph, it just does nothing.
1181 * Ie. It doesn't form Reph. */
1182 if (buffer->info[end - 1].indic_category() == OT_DOTTEDCIRCLE)
1183 return;
1184 }
1185
Behdad Esfahbodf2c0f592012-11-12 14:02:02 -08001186 initial_reordering_consonant_syllable (plan, face, buffer, start, end);
Behdad Esfahbod743807a2011-07-29 16:37:02 -04001187}
1188
1189static void
Behdad Esfahbod327d14e2012-08-31 16:49:34 -04001190initial_reordering_syllable (const hb_ot_shape_plan_t *plan,
Behdad Esfahbodf2c0f592012-11-12 14:02:02 -08001191 hb_face_t *face,
Behdad Esfahbod327d14e2012-08-31 16:49:34 -04001192 hb_buffer_t *buffer,
1193 unsigned int start, unsigned int end)
1194{
1195 syllable_type_t syllable_type = (syllable_type_t) (buffer->info[start].syllable() & 0x0F);
Behdad Esfahbodecb0b242015-07-22 12:02:09 +01001196 switch (syllable_type)
1197 {
1198 case vowel_syllable: /* We made the vowels look like consonants. So let's call the consonant logic! */
1199 case consonant_syllable:
1200 initial_reordering_consonant_syllable (plan, face, buffer, start, end);
1201 break;
1202
1203 case broken_cluster: /* We already inserted dotted-circles, so just call the standalone_cluster. */
1204 case standalone_cluster:
1205 initial_reordering_standalone_cluster (plan, face, buffer, start, end);
1206 break;
1207
1208 case symbol_cluster:
1209 case non_indic_cluster:
1210 break;
Behdad Esfahbod327d14e2012-08-31 16:49:34 -04001211 }
1212}
1213
Behdad Esfahbod166b5cf2012-09-07 14:55:07 -04001214static inline void
Behdad Esfahbod0beb66e2012-12-05 18:46:04 -05001215insert_dotted_circles (const hb_ot_shape_plan_t *plan HB_UNUSED,
Behdad Esfahbodb85800f2012-08-31 18:12:01 -04001216 hb_font_t *font,
1217 hb_buffer_t *buffer)
1218{
Behdad Esfahbod166b5cf2012-09-07 14:55:07 -04001219 /* Note: This loop is extra overhead, but should not be measurable. */
1220 bool has_broken_syllables = false;
1221 unsigned int count = buffer->len;
Behdad Esfahbod7cd33f22014-07-17 14:22:11 -04001222 hb_glyph_info_t *info = buffer->info;
Behdad Esfahbod166b5cf2012-09-07 14:55:07 -04001223 for (unsigned int i = 0; i < count; i++)
Behdad Esfahbod7cd33f22014-07-17 14:22:11 -04001224 if ((info[i].syllable() & 0x0F) == broken_cluster)
1225 {
Behdad Esfahbod166b5cf2012-09-07 14:55:07 -04001226 has_broken_syllables = true;
1227 break;
1228 }
1229 if (likely (!has_broken_syllables))
1230 return;
1231
1232
Behdad Esfahbodb85800f2012-08-31 18:12:01 -04001233 hb_codepoint_t dottedcircle_glyph;
Behdad Esfahbod76271002014-07-11 14:54:42 -04001234 if (!font->get_glyph (0x25CCu, 0, &dottedcircle_glyph))
Behdad Esfahbodb85800f2012-08-31 18:12:01 -04001235 return;
1236
Behdad Esfahbodf41dc2d2012-11-15 10:36:43 -08001237 hb_glyph_info_t dottedcircle = {0};
Behdad Esfahbod76271002014-07-11 14:54:42 -04001238 dottedcircle.codepoint = 0x25CCu;
Behdad Esfahbodb85800f2012-08-31 18:12:01 -04001239 set_indic_properties (dottedcircle);
1240 dottedcircle.codepoint = dottedcircle_glyph;
1241
1242 buffer->clear_output ();
1243
1244 buffer->idx = 0;
1245 unsigned int last_syllable = 0;
1246 while (buffer->idx < buffer->len)
1247 {
1248 unsigned int syllable = buffer->cur().syllable();
1249 syllable_type_t syllable_type = (syllable_type_t) (syllable & 0x0F);
1250 if (unlikely (last_syllable != syllable && syllable_type == broken_cluster))
1251 {
Behdad Esfahbod596740d2012-12-21 19:41:04 -05001252 last_syllable = syllable;
1253
Behdad Esfahbod6f932bc2015-10-21 11:16:49 -02001254 hb_glyph_info_t ginfo = dottedcircle;
1255 ginfo.cluster = buffer->cur().cluster;
1256 ginfo.mask = buffer->cur().mask;
1257 ginfo.syllable() = buffer->cur().syllable();
Behdad Esfahbod595d2b92014-07-26 18:44:15 -04001258 /* TODO Set glyph_props? */
Behdad Esfahbod596740d2012-12-21 19:41:04 -05001259
1260 /* Insert dottedcircle after possible Repha. */
1261 while (buffer->idx < buffer->len &&
1262 last_syllable == buffer->cur().syllable() &&
1263 buffer->cur().indic_category() == OT_Repha)
1264 buffer->next_glyph ();
1265
Behdad Esfahbod6f932bc2015-10-21 11:16:49 -02001266 buffer->output_info (ginfo);
Behdad Esfahbodb85800f2012-08-31 18:12:01 -04001267 }
Behdad Esfahbod596740d2012-12-21 19:41:04 -05001268 else
1269 buffer->next_glyph ();
Behdad Esfahbodb85800f2012-08-31 18:12:01 -04001270 }
1271
1272 buffer->swap_buffers ();
1273}
1274
1275static void
Behdad Esfahbod8bb5deb2012-08-02 10:07:58 -04001276initial_reordering (const hb_ot_shape_plan_t *plan,
Behdad Esfahbod24eacf12012-08-02 08:42:11 -04001277 hb_font_t *font,
Behdad Esfahbod3e38c0f2012-08-02 09:44:18 -04001278 hb_buffer_t *buffer)
Behdad Esfahbod743807a2011-07-29 16:37:02 -04001279{
Behdad Esfahbod85fc6c42012-08-02 12:21:44 -04001280 update_consonant_positions (plan, font, buffer);
Behdad Esfahbod166b5cf2012-09-07 14:55:07 -04001281 insert_dotted_circles (plan, font, buffer);
Behdad Esfahbod327d14e2012-08-31 16:49:34 -04001282
Behdad Esfahbodecb0b242015-07-22 12:02:09 +01001283 foreach_syllable (buffer, start, end)
1284 initial_reordering_syllable (plan, font->face, buffer, start, end);
Behdad Esfahbodb9ddbd52011-06-02 17:43:12 -04001285}
1286
Behdad Esfahbod743807a2011-07-29 16:37:02 -04001287static void
Behdad Esfahbod85fc6c42012-08-02 12:21:44 -04001288final_reordering_syllable (const hb_ot_shape_plan_t *plan,
1289 hb_buffer_t *buffer,
Behdad Esfahbodef24cc82012-05-09 17:56:03 +02001290 unsigned int start, unsigned int end)
Behdad Esfahbod743807a2011-07-29 16:37:02 -04001291{
Behdad Esfahbod85fc6c42012-08-02 12:21:44 -04001292 const indic_shape_plan_t *indic_plan = (const indic_shape_plan_t *) plan->data;
Behdad Esfahbod4ac9e982012-05-10 12:53:53 +02001293 hb_glyph_info_t *info = buffer->info;
1294
Behdad Esfahbod04dc52f2014-06-06 17:28:38 -04001295
1296 /* This function relies heavily on halant glyphs. Lots of ligation
1297 * and possibly multiplication substitutions happened prior to this
1298 * phase, and that might have messed up our properties. Recover
1299 * from a particular case of that where we're fairly sure that a
1300 * class of OT_H is desired but has been lost. */
1301 if (indic_plan->virama_glyph)
1302 {
1303 unsigned int virama_glyph = indic_plan->virama_glyph;
1304 for (unsigned int i = start; i < end; i++)
1305 if (info[i].codepoint == virama_glyph &&
1306 _hb_glyph_info_ligated (&info[i]) &&
1307 _hb_glyph_info_multiplied (&info[i]))
1308 {
1309 /* This will make sure that this glyph passes is_halant_or_coeng() test. */
1310 info[i].indic_category() = OT_H;
1311 _hb_glyph_info_clear_ligated_and_multiplied (&info[i]);
1312 }
1313 }
1314
1315
Behdad Esfahbode7be0572011-07-31 15:18:57 -04001316 /* 4. Final reordering:
1317 *
1318 * After the localized forms and basic shaping forms GSUB features have been
1319 * applied (see below), the shaping engine performs some final glyph
1320 * reordering before applying all the remaining font features to the entire
1321 * cluster.
Behdad Esfahbod4ac9e982012-05-10 12:53:53 +02001322 */
1323
Behdad Esfahbod1d634cb2014-06-06 17:55:02 -04001324 bool try_pref = !!indic_plan->mask_array[PREF];
1325
Behdad Esfahbod4ac9e982012-05-10 12:53:53 +02001326 /* Find base again */
Behdad Esfahbod5f0eaaa2012-07-20 15:47:24 -04001327 unsigned int base;
1328 for (base = start; base < end; base++)
Behdad Esfahbod1d634cb2014-06-06 17:55:02 -04001329 if (info[base].indic_position() >= POS_BASE_C)
1330 {
1331 if (try_pref && base + 1 < end && indic_plan->config->pref_len == 2)
1332 {
1333 for (unsigned int i = base + 1; i < end; i++)
1334 if ((info[i].mask & indic_plan->mask_array[PREF]) != 0)
1335 {
1336 if (!(_hb_glyph_info_substituted (&info[i]) &&
1337 _hb_glyph_info_ligated_and_didnt_multiply (&info[i])))
1338 {
1339 /* Ok, this was a 'pref' candidate but didn't form any.
1340 * Base is around here... */
1341 base = i;
1342 while (base < end && is_halant_or_coeng (info[base]))
1343 base++;
1344 info[base].indic_position() = POS_BASE_C;
1345
1346 try_pref = false;
1347 }
1348 break;
1349 }
1350 }
1351
Behdad Esfahbod5f0eaaa2012-07-20 15:47:24 -04001352 if (start < base && info[base].indic_position() > POS_BASE_C)
1353 base--;
1354 break;
1355 }
Behdad Esfahboda0cb9f32013-02-13 09:26:55 -05001356 if (base == end && start < base &&
Behdad Esfahbod39c82012014-06-06 17:19:35 -04001357 is_one_of (info[base - 1], FLAG (OT_ZWJ)))
Behdad Esfahboda0cb9f32013-02-13 09:26:55 -05001358 base--;
Behdad Esfahbode7ce50d2014-07-16 12:30:39 -04001359 if (base < end)
1360 while (start < base &&
1361 is_one_of (info[base], (FLAG (OT_N) | HALANT_OR_COENG_FLAGS)))
1362 base--;
Behdad Esfahbod4ac9e982012-05-10 12:53:53 +02001363
Behdad Esfahbod4705a702012-05-10 13:09:08 +02001364
Behdad Esfahbod4ac9e982012-05-10 12:53:53 +02001365 /* o Reorder matras:
Behdad Esfahbode7be0572011-07-31 15:18:57 -04001366 *
1367 * If a pre-base matra character had been reordered before applying basic
1368 * features, the glyph can be moved closer to the main consonant based on
1369 * whether half-forms had been formed. Actual position for the matra is
1370 * defined as “after last standalone halant glyph, after initial matra
1371 * position and before the main consonant”. If ZWJ or ZWNJ follow this
1372 * halant, position is moved after it.
Behdad Esfahbod4ac9e982012-05-10 12:53:53 +02001373 */
1374
Behdad Esfahbod65c43ac2012-07-24 03:36:47 -04001375 if (start + 1 < end && start < base) /* Otherwise there can't be any pre-base matra characters. */
Behdad Esfahbod9d0d3192012-05-11 21:36:32 +02001376 {
Behdad Esfahbod65c43ac2012-07-24 03:36:47 -04001377 /* If we lost track of base, alas, position before last thingy. */
1378 unsigned int new_pos = base == end ? base - 2 : base - 1;
Behdad Esfahbod4ac9e982012-05-10 12:53:53 +02001379
Behdad Esfahbod27bd55b2012-09-05 15:11:14 -04001380 /* Malayalam / Tamil do not have "half" forms or explicit virama forms.
1381 * The glyphs formed by 'half' are Chillus or ligated explicit viramas.
1382 * We want to position matra after them.
Behdad Esfahbod65c43ac2012-07-24 03:36:47 -04001383 */
Behdad Esfahbod27bd55b2012-09-05 15:11:14 -04001384 if (buffer->props.script != HB_SCRIPT_MALAYALAM && buffer->props.script != HB_SCRIPT_TAMIL)
Behdad Esfahbod65c43ac2012-07-24 03:36:47 -04001385 {
1386 while (new_pos > start &&
Behdad Esfahbodc04d5f02014-06-06 17:02:39 -04001387 !(is_one_of (info[new_pos], (FLAG (OT_M) | HALANT_OR_COENG_FLAGS))))
Behdad Esfahbod65c43ac2012-07-24 03:36:47 -04001388 new_pos--;
1389
1390 /* If we found no Halant we are done.
1391 * Otherwise only proceed if the Halant does
1392 * not belong to the Matra itself! */
1393 if (is_halant_or_coeng (info[new_pos]) &&
1394 info[new_pos].indic_position() != POS_PRE_M)
1395 {
1396 /* -> If ZWJ or ZWNJ follow this halant, position is moved after it. */
1397 if (new_pos + 1 < end && is_joiner (info[new_pos + 1]))
1398 new_pos++;
1399 }
1400 else
1401 new_pos = start; /* No move. */
1402 }
1403
Behdad Esfahbod27bd55b2012-09-05 15:11:14 -04001404 if (start < new_pos && info[new_pos].indic_position () != POS_PRE_M)
Behdad Esfahbod65c43ac2012-07-24 03:36:47 -04001405 {
Behdad Esfahbod9d0d3192012-05-11 21:36:32 +02001406 /* Now go see if there's actually any matras... */
Behdad Esfahbod921ce5b2012-07-16 15:26:56 -04001407 for (unsigned int i = new_pos; i > start; i--)
Behdad Esfahbod6a091df2012-05-11 21:42:27 +02001408 if (info[i - 1].indic_position () == POS_PRE_M)
Behdad Esfahbod9d0d3192012-05-11 21:36:32 +02001409 {
Behdad Esfahbod1a1dbe92012-07-16 15:40:33 -04001410 unsigned int old_pos = i - 1;
Behdad Esfahbod5828c452015-09-01 16:26:35 +01001411 if (old_pos < base && base <= new_pos) /* Shouldn't actually happen. */
1412 base--;
1413
Behdad Esfahbod1a1dbe92012-07-16 15:40:33 -04001414 hb_glyph_info_t tmp = info[old_pos];
1415 memmove (&info[old_pos], &info[old_pos + 1], (new_pos - old_pos) * sizeof (info[0]));
1416 info[new_pos] = tmp;
Behdad Esfahbod5828c452015-09-01 16:26:35 +01001417
1418 /* Note: this merge_clusters() is intentionally *after* the reordering.
1419 * Indic matra reordering is special and tricky... */
Behdad Esfahbod9cb59d42013-10-16 11:34:07 +02001420 buffer->merge_clusters (new_pos, MIN (end, base + 1));
Behdad Esfahbod5828c452015-09-01 16:26:35 +01001421
Behdad Esfahbod921ce5b2012-07-16 15:26:56 -04001422 new_pos--;
Behdad Esfahbod9d0d3192012-05-11 21:36:32 +02001423 }
Behdad Esfahbodabb32392012-07-22 23:55:19 -04001424 } else {
Behdad Esfahbode6b01a82012-07-23 00:11:26 -04001425 for (unsigned int i = start; i < base; i++)
Behdad Esfahbodabb32392012-07-22 23:55:19 -04001426 if (info[i].indic_position () == POS_PRE_M) {
Behdad Esfahbod2cc933a2012-07-23 08:22:55 -04001427 buffer->merge_clusters (i, MIN (end, base + 1));
Behdad Esfahbodabb32392012-07-22 23:55:19 -04001428 break;
1429 }
Behdad Esfahbod9d0d3192012-05-11 21:36:32 +02001430 }
Behdad Esfahbod4ac9e982012-05-10 12:53:53 +02001431 }
1432
1433
1434 /* o Reorder reph:
Behdad Esfahbode7be0572011-07-31 15:18:57 -04001435 *
1436 * Reph’s original position is always at the beginning of the syllable,
1437 * (i.e. it is not reordered at the character reordering stage). However,
1438 * it will be reordered according to the basic-forms shaping results.
1439 * Possible positions for reph, depending on the script, are; after main,
1440 * before post-base consonant forms, and after post-base consonant forms.
Behdad Esfahboddbb10582012-05-10 13:45:52 +02001441 */
1442
Behdad Esfahbod65a929b2013-10-15 18:08:05 +02001443 /* Two cases:
1444 *
1445 * - If repha is encoded as a sequence of characters (Ra,H or Ra,H,ZWJ), then
1446 * we should only move it if the sequence ligated to the repha form.
1447 *
1448 * - If repha is encoded separately and in the logical position, we should only
1449 * move it if it did NOT ligate. If it ligated, it's probably the font trying
1450 * to make it work without the reordering.
1451 */
Behdad Esfahbodf5299ef2013-10-15 18:13:07 +02001452 if (start + 1 < end &&
1453 info[start].indic_position() == POS_RA_TO_BECOME_REPH &&
Behdad Esfahbod3ddf8922013-10-18 00:02:43 +02001454 ((info[start].indic_category() == OT_Repha) ^
Behdad Esfahbod832a6f92014-06-04 16:57:42 -04001455 _hb_glyph_info_ligated_and_didnt_multiply (&info[start])))
Behdad Esfahboddbb10582012-05-10 13:45:52 +02001456 {
Behdad Esfahbod11b0e202012-08-02 14:21:40 -04001457 unsigned int new_reph_pos;
1458 reph_position_t reph_pos = indic_plan->config->reph_pos;
Behdad Esfahbod02b29222012-05-10 21:44:50 +02001459
Behdad Esfahbodf175aa32013-10-18 02:07:44 +02001460 assert (reph_pos != REPH_POS_DONT_CARE);
Behdad Esfahbod02b29222012-05-10 21:44:50 +02001461
Behdad Esfahboddbb10582012-05-10 13:45:52 +02001462 /* 1. If reph should be positioned after post-base consonant forms,
1463 * proceed to step 5.
Behdad Esfahbod02b29222012-05-10 21:44:50 +02001464 */
Behdad Esfahbod11b0e202012-08-02 14:21:40 -04001465 if (reph_pos == REPH_POS_AFTER_POST)
Behdad Esfahbod02b29222012-05-10 21:44:50 +02001466 {
Behdad Esfahbod9d0d3192012-05-11 21:36:32 +02001467 goto reph_step_5;
Behdad Esfahbod02b29222012-05-10 21:44:50 +02001468 }
1469
1470 /* 2. If the reph repositioning class is not after post-base: target
Behdad Esfahboddbb10582012-05-10 13:45:52 +02001471 * position is after the first explicit halant glyph between the
1472 * first post-reph consonant and last main consonant. If ZWJ or ZWNJ
1473 * are following this halant, position is moved after it. If such
1474 * position is found, this is the target position. Otherwise,
1475 * proceed to the next step.
1476 *
1477 * Note: in old-implementation fonts, where classifications were
1478 * fixed in shaping engine, there was no case where reph position
1479 * will be found on this step.
Behdad Esfahbod02b29222012-05-10 21:44:50 +02001480 */
Behdad Esfahbod02b29222012-05-10 21:44:50 +02001481 {
1482 new_reph_pos = start + 1;
Behdad Esfahboddeb521d2012-07-17 11:37:32 -04001483 while (new_reph_pos < base && !is_halant_or_coeng (info[new_reph_pos]))
Behdad Esfahbod02b29222012-05-10 21:44:50 +02001484 new_reph_pos++;
1485
Behdad Esfahbod1f91c392013-02-13 09:38:40 -05001486 if (new_reph_pos < base && is_halant_or_coeng (info[new_reph_pos]))
1487 {
Behdad Esfahbod02b29222012-05-10 21:44:50 +02001488 /* ->If ZWJ or ZWNJ are following this halant, position is moved after it. */
1489 if (new_reph_pos + 1 < base && is_joiner (info[new_reph_pos + 1]))
1490 new_reph_pos++;
1491 goto reph_move;
1492 }
1493 }
1494
1495 /* 3. If reph should be repositioned after the main consonant: find the
Behdad Esfahboddbb10582012-05-10 13:45:52 +02001496 * first consonant not ligated with main, or find the first
1497 * consonant that is not a potential pre-base reordering Ra.
Behdad Esfahbod02b29222012-05-10 21:44:50 +02001498 */
Behdad Esfahbod11b0e202012-08-02 14:21:40 -04001499 if (reph_pos == REPH_POS_AFTER_MAIN)
Behdad Esfahbod02b29222012-05-10 21:44:50 +02001500 {
Behdad Esfahbodb504e062012-07-16 15:21:12 -04001501 new_reph_pos = base;
Behdad Esfahbod34ae3362012-07-20 16:17:28 -04001502 while (new_reph_pos + 1 < end && info[new_reph_pos + 1].indic_position() <= POS_AFTER_MAIN)
Behdad Esfahbodb504e062012-07-16 15:21:12 -04001503 new_reph_pos++;
1504 if (new_reph_pos < end)
1505 goto reph_move;
Behdad Esfahbod02b29222012-05-10 21:44:50 +02001506 }
1507
1508 /* 4. If reph should be positioned before post-base consonant, find
Behdad Esfahboddbb10582012-05-10 13:45:52 +02001509 * first post-base classified consonant not ligated with main. If no
1510 * consonant is found, the target position should be before the
1511 * first matra, syllable modifier sign or vedic sign.
Behdad Esfahbod02b29222012-05-10 21:44:50 +02001512 */
Behdad Esfahbod9d0d3192012-05-11 21:36:32 +02001513 /* This is our take on what step 4 is trying to say (and failing, BADLY). */
Behdad Esfahbod11b0e202012-08-02 14:21:40 -04001514 if (reph_pos == REPH_POS_AFTER_SUB)
Behdad Esfahbod02b29222012-05-10 21:44:50 +02001515 {
Behdad Esfahbod9d0d3192012-05-11 21:36:32 +02001516 new_reph_pos = base;
1517 while (new_reph_pos < end &&
Behdad Esfahbodf8160a42015-07-21 15:50:02 +01001518 !( FLAG_SAFE (info[new_reph_pos + 1].indic_position()) & (FLAG (POS_POST_C) | FLAG (POS_AFTER_POST) | FLAG (POS_SMVD))))
Behdad Esfahbod9d0d3192012-05-11 21:36:32 +02001519 new_reph_pos++;
1520 if (new_reph_pos < end)
1521 goto reph_move;
Behdad Esfahbod02b29222012-05-10 21:44:50 +02001522 }
1523
1524 /* 5. If no consonant is found in steps 3 or 4, move reph to a position
Behdad Esfahboddbb10582012-05-10 13:45:52 +02001525 * immediately before the first post-base matra, syllable modifier
1526 * sign or vedic sign that has a reordering class after the intended
1527 * reph position. For example, if the reordering position for reph
1528 * is post-main, it will skip above-base matras that also have a
1529 * post-main position.
Behdad Esfahboddbb10582012-05-10 13:45:52 +02001530 */
Behdad Esfahbod02b29222012-05-10 21:44:50 +02001531 reph_step_5:
1532 {
Behdad Esfahbodd0e68db2012-07-20 11:25:41 -04001533 /* Copied from step 2. */
1534 new_reph_pos = start + 1;
1535 while (new_reph_pos < base && !is_halant_or_coeng (info[new_reph_pos]))
1536 new_reph_pos++;
1537
Behdad Esfahbod1f91c392013-02-13 09:38:40 -05001538 if (new_reph_pos < base && is_halant_or_coeng (info[new_reph_pos]))
1539 {
Behdad Esfahbodd0e68db2012-07-20 11:25:41 -04001540 /* ->If ZWJ or ZWNJ are following this halant, position is moved after it. */
1541 if (new_reph_pos + 1 < base && is_joiner (info[new_reph_pos + 1]))
1542 new_reph_pos++;
1543 goto reph_move;
1544 }
Behdad Esfahbod8df56362012-05-10 15:41:04 +02001545 }
1546
Behdad Esfahbod02b29222012-05-10 21:44:50 +02001547 /* 6. Otherwise, reorder reph to the end of the syllable.
1548 */
Behdad Esfahbod02b29222012-05-10 21:44:50 +02001549 {
1550 new_reph_pos = end - 1;
1551 while (new_reph_pos > start && info[new_reph_pos].indic_position() == POS_SMVD)
1552 new_reph_pos--;
1553
Behdad Esfahbod892eb782012-05-11 16:54:40 +02001554 /*
1555 * If the Reph is to be ending up after a Matra,Halant sequence,
1556 * position it before that Halant so it can interact with the Matra.
1557 * However, if it's a plain Consonant,Halant we shouldn't do that.
1558 * Uniscribe doesn't do this.
1559 * TEST: U+0930,U+094D,U+0915,U+094B,U+094D
1560 */
Behdad Esfahbodbab02d32013-02-12 15:26:45 -05001561 if (!hb_options ().uniscribe_bug_compatible &&
Behdad Esfahboddeb521d2012-07-17 11:37:32 -04001562 unlikely (is_halant_or_coeng (info[new_reph_pos]))) {
Behdad Esfahbod02b29222012-05-10 21:44:50 +02001563 for (unsigned int i = base + 1; i < new_reph_pos; i++)
1564 if (info[i].indic_category() == OT_M) {
1565 /* Ok, got it. */
1566 new_reph_pos--;
1567 }
1568 }
1569 goto reph_move;
1570 }
1571
1572 reph_move:
1573 {
1574 /* Move */
Behdad Esfahbod5828c452015-09-01 16:26:35 +01001575 buffer->merge_clusters (start, new_reph_pos + 1);
Behdad Esfahbod02b29222012-05-10 21:44:50 +02001576 hb_glyph_info_t reph = info[start];
1577 memmove (&info[start], &info[start + 1], (new_reph_pos - start) * sizeof (info[0]));
1578 info[new_reph_pos] = reph;
Behdad Esfahbod5828c452015-09-01 16:26:35 +01001579
Behdad Esfahbodf22b7e72013-02-13 07:32:46 -05001580 if (start < base && base <= new_reph_pos)
1581 base--;
Behdad Esfahbod02b29222012-05-10 21:44:50 +02001582 }
Behdad Esfahboddbb10582012-05-10 13:45:52 +02001583 }
1584
1585
1586 /* o Reorder pre-base reordering consonants:
Behdad Esfahbode7be0572011-07-31 15:18:57 -04001587 *
1588 * If a pre-base reordering consonant is found, reorder it according to
1589 * the following rules:
Behdad Esfahbode7be0572011-07-31 15:18:57 -04001590 */
1591
Behdad Esfahbod1d634cb2014-06-06 17:55:02 -04001592 if (try_pref && base + 1 < end) /* Otherwise there can't be any pre-base reordering Ra. */
Behdad Esfahbod46e645e2012-07-16 15:30:05 -04001593 {
Behdad Esfahbod46a863d2013-10-27 23:24:50 +01001594 unsigned int pref_len = indic_plan->config->pref_len;
Behdad Esfahbod8e7b5882012-07-16 17:04:46 -04001595 for (unsigned int i = base + 1; i < end; i++)
Behdad Esfahbod85fc6c42012-08-02 12:21:44 -04001596 if ((info[i].mask & indic_plan->mask_array[PREF]) != 0)
Behdad Esfahbod78818122012-07-16 15:49:08 -04001597 {
Behdad Esfahbod8e7b5882012-07-16 17:04:46 -04001598 /* 1. Only reorder a glyph produced by substitution during application
1599 * of the <pref> feature. (Note that a font may shape a Ra consonant with
1600 * the feature generally but block it in certain contexts.)
1601 */
Behdad Esfahbod9a493512013-10-18 02:14:53 +02001602 /* Note: We just check that something got substituted. We don't check that
Behdad Esfahbod46a863d2013-10-27 23:24:50 +01001603 * the <pref> feature actually did it...
1604 *
1605 * If pref len is longer than one, then only reorder if it ligated. If
1606 * pref len is one, only reorder if it didn't ligate with other things. */
1607 if (_hb_glyph_info_substituted (&info[i]) &&
Behdad Esfahbod832a6f92014-06-04 16:57:42 -04001608 ((pref_len == 1) ^ _hb_glyph_info_ligated_and_didnt_multiply (&info[i])))
Behdad Esfahbod8e7b5882012-07-16 17:04:46 -04001609 {
1610 /*
1611 * 2. Try to find a target position the same way as for pre-base matra.
1612 * If it is found, reorder pre-base consonant glyph.
1613 *
1614 * 3. If position is not found, reorder immediately before main
1615 * consonant.
1616 */
1617
1618 unsigned int new_pos = base;
Behdad Esfahbod88d3c982012-10-29 16:27:02 -07001619 /* Malayalam / Tamil do not have "half" forms or explicit virama forms.
1620 * The glyphs formed by 'half' are Chillus or ligated explicit viramas.
1621 * We want to position matra after them.
1622 */
1623 if (buffer->props.script != HB_SCRIPT_MALAYALAM && buffer->props.script != HB_SCRIPT_TAMIL)
Behdad Esfahbodd90b8e82012-07-24 02:10:20 -04001624 {
Behdad Esfahbod88d3c982012-10-29 16:27:02 -07001625 while (new_pos > start &&
1626 !(is_one_of (info[new_pos - 1], FLAG(OT_M) | HALANT_OR_COENG_FLAGS)))
1627 new_pos--;
1628
Behdad Esfahbod9a493512013-10-18 02:14:53 +02001629 /* In Khmer coeng model, a H,Ra can go *after* matras. If it goes after a
Behdad Esfahbod88d3c982012-10-29 16:27:02 -07001630 * split matra, it should be reordered to *before* the left part of such matra. */
1631 if (new_pos > start && info[new_pos - 1].indic_category() == OT_M)
1632 {
1633 unsigned int old_pos = i;
Behdad Esfahbodb90cb362015-10-21 11:13:21 -02001634 for (unsigned int j = base + 1; j < old_pos; j++)
1635 if (info[j].indic_category() == OT_M)
Behdad Esfahbod88d3c982012-10-29 16:27:02 -07001636 {
1637 new_pos--;
1638 break;
1639 }
1640 }
Behdad Esfahbodd90b8e82012-07-24 02:10:20 -04001641 }
1642
Behdad Esfahboddeb521d2012-07-17 11:37:32 -04001643 if (new_pos > start && is_halant_or_coeng (info[new_pos - 1]))
Behdad Esfahbod1f91c392013-02-13 09:38:40 -05001644 {
Behdad Esfahbod8e7b5882012-07-16 17:04:46 -04001645 /* -> If ZWJ or ZWNJ follow this halant, position is moved after it. */
1646 if (new_pos < end && is_joiner (info[new_pos]))
1647 new_pos++;
Behdad Esfahbod1f91c392013-02-13 09:38:40 -05001648 }
Behdad Esfahbod8e7b5882012-07-16 17:04:46 -04001649
1650 {
1651 unsigned int old_pos = i;
Behdad Esfahbod5828c452015-09-01 16:26:35 +01001652
Behdad Esfahbode6b01a82012-07-23 00:11:26 -04001653 buffer->merge_clusters (new_pos, old_pos + 1);
Behdad Esfahbod8e7b5882012-07-16 17:04:46 -04001654 hb_glyph_info_t tmp = info[old_pos];
1655 memmove (&info[new_pos + 1], &info[new_pos], (old_pos - new_pos) * sizeof (info[0]));
1656 info[new_pos] = tmp;
Behdad Esfahbod5828c452015-09-01 16:26:35 +01001657
Behdad Esfahbodf22b7e72013-02-13 07:32:46 -05001658 if (new_pos <= base && base < old_pos)
1659 base++;
Behdad Esfahbod8e7b5882012-07-16 17:04:46 -04001660 }
1661 }
1662
1663 break;
Behdad Esfahbod78818122012-07-16 15:49:08 -04001664 }
Behdad Esfahbod46e645e2012-07-16 15:30:05 -04001665 }
Behdad Esfahbodeed903b2012-05-11 20:50:53 +02001666
1667
Behdad Esfahboda913b022012-05-11 20:59:26 +02001668 /* Apply 'init' to the Left Matra if it's a word start. */
Behdad Esfahbod6a091df2012-05-11 21:42:27 +02001669 if (info[start].indic_position () == POS_PRE_M &&
Behdad Esfahboda913b022012-05-11 20:59:26 +02001670 (!start ||
Behdad Esfahbodf8160a42015-07-21 15:50:02 +01001671 !(FLAG_SAFE (_hb_glyph_info_get_general_category (&info[start - 1])) &
Behdad Esfahbod2c372b82012-07-20 13:37:48 -04001672 FLAG_RANGE (HB_UNICODE_GENERAL_CATEGORY_FORMAT, HB_UNICODE_GENERAL_CATEGORY_NON_SPACING_MARK))))
Behdad Esfahbod85fc6c42012-08-02 12:21:44 -04001673 info[start].mask |= indic_plan->mask_array[INIT];
Behdad Esfahboda913b022012-05-11 20:59:26 +02001674
Behdad Esfahbodeed903b2012-05-11 20:50:53 +02001675
Behdad Esfahbod8ed248d2012-07-20 11:42:24 -04001676 /*
1677 * Finish off the clusters and go home!
1678 */
Behdad Esfahbod9ac6b012013-10-17 16:27:38 +02001679 if (hb_options ().uniscribe_bug_compatible)
Behdad Esfahbodebe29732012-05-11 16:43:12 +02001680 {
Behdad Esfahbod9ac6b012013-10-17 16:27:38 +02001681 switch ((hb_tag_t) plan->props.script)
1682 {
1683 case HB_SCRIPT_TAMIL:
1684 case HB_SCRIPT_SINHALA:
1685 break;
1686
1687 default:
1688 /* Uniscribe merges the entire cluster... Except for Tamil & Sinhala.
1689 * This means, half forms are submerged into the main consonants cluster.
1690 * This is unnecessary, and makes cursor positioning harder, but that's what
1691 * Uniscribe does. */
1692 buffer->merge_clusters (start, end);
1693 break;
1694 }
Behdad Esfahbod21d28032012-05-10 18:34:34 +02001695 }
Behdad Esfahbodef24cc82012-05-09 17:56:03 +02001696}
Behdad Esfahbode7be0572011-07-31 15:18:57 -04001697
1698
Behdad Esfahbodef24cc82012-05-09 17:56:03 +02001699static void
Behdad Esfahbod8bb5deb2012-08-02 10:07:58 -04001700final_reordering (const hb_ot_shape_plan_t *plan,
Behdad Esfahbod0beb66e2012-12-05 18:46:04 -05001701 hb_font_t *font HB_UNUSED,
Behdad Esfahbod3e38c0f2012-08-02 09:44:18 -04001702 hb_buffer_t *buffer)
Behdad Esfahbodef24cc82012-05-09 17:56:03 +02001703{
1704 unsigned int count = buffer->len;
Behdad Esfahbod327d14e2012-08-31 16:49:34 -04001705 if (unlikely (!count)) return;
Behdad Esfahbode7be0572011-07-31 15:18:57 -04001706
Behdad Esfahbodecb0b242015-07-22 12:02:09 +01001707 foreach_syllable (buffer, start, end)
1708 final_reordering_syllable (plan, buffer, start, end);
Behdad Esfahbodef24cc82012-05-09 17:56:03 +02001709
Behdad Esfahbod743807a2011-07-29 16:37:02 -04001710 HB_BUFFER_DEALLOCATE_VAR (buffer, indic_category);
1711 HB_BUFFER_DEALLOCATE_VAR (buffer, indic_position);
1712}
1713
1714
Behdad Esfahbod30145272013-10-15 13:47:27 +02001715static void
1716clear_syllables (const hb_ot_shape_plan_t *plan HB_UNUSED,
1717 hb_font_t *font HB_UNUSED,
1718 hb_buffer_t *buffer)
1719{
1720 hb_glyph_info_t *info = buffer->info;
1721 unsigned int count = buffer->len;
1722 for (unsigned int i = 0; i < count; i++)
1723 info[i].syllable() = 0;
1724}
1725
1726
Behdad Esfahbodeba312c2012-11-16 12:39:23 -08001727static bool
1728decompose_indic (const hb_ot_shape_normalize_context_t *c,
Behdad Esfahbod07369152012-11-13 12:35:35 -08001729 hb_codepoint_t ab,
1730 hb_codepoint_t *a,
1731 hb_codepoint_t *b)
1732{
1733 switch (ab)
1734 {
1735 /* Don't decompose these. */
Behdad Esfahbod76271002014-07-11 14:54:42 -04001736 case 0x0931u : return false;
1737 case 0x0B94u : return false;
Behdad Esfahbod07369152012-11-13 12:35:35 -08001738
1739
1740 /*
1741 * Decompose split matras that don't have Unicode decompositions.
1742 */
1743
Behdad Esfahbod76271002014-07-11 14:54:42 -04001744 case 0x0F77u : *a = 0x0FB2u; *b= 0x0F81u; return true;
1745 case 0x0F79u : *a = 0x0FB3u; *b= 0x0F81u; return true;
1746 case 0x17BEu : *a = 0x17C1u; *b= 0x17BEu; return true;
1747 case 0x17BFu : *a = 0x17C1u; *b= 0x17BFu; return true;
1748 case 0x17C0u : *a = 0x17C1u; *b= 0x17C0u; return true;
1749 case 0x17C4u : *a = 0x17C1u; *b= 0x17C4u; return true;
1750 case 0x17C5u : *a = 0x17C1u; *b= 0x17C5u; return true;
1751 case 0x1925u : *a = 0x1920u; *b= 0x1923u; return true;
1752 case 0x1926u : *a = 0x1920u; *b= 0x1924u; return true;
1753 case 0x1B3Cu : *a = 0x1B42u; *b= 0x1B3Cu; return true;
1754 case 0x1112Eu : *a = 0x11127u; *b= 0x11131u; return true;
1755 case 0x1112Fu : *a = 0x11127u; *b= 0x11132u; return true;
Behdad Esfahbod07369152012-11-13 12:35:35 -08001756#if 0
1757 /* This one has no decomposition in Unicode, but needs no decomposition either. */
Behdad Esfahbod76271002014-07-11 14:54:42 -04001758 /* case 0x0AC9u : return false; */
1759 case 0x0B57u : *a = no decomp, -> RIGHT; return true;
1760 case 0x1C29u : *a = no decomp, -> LEFT; return true;
1761 case 0xA9C0u : *a = no decomp, -> RIGHT; return true;
1762 case 0x111BuF : *a = no decomp, -> ABOVE; return true;
Behdad Esfahbod07369152012-11-13 12:35:35 -08001763#endif
1764 }
1765
Behdad Esfahbod76271002014-07-11 14:54:42 -04001766 if ((ab == 0x0DDAu || hb_in_range (ab, 0x0DDCu, 0x0DDEu)))
Behdad Esfahbod07369152012-11-13 12:35:35 -08001767 {
Behdad Esfahbod43b65312012-11-16 13:12:35 -08001768 /*
1769 * Sinhala split matras... Let the fun begin.
1770 *
1771 * These four characters have Unicode decompositions. However, Uniscribe
1772 * decomposes them "Khmer-style", that is, it uses the character itself to
1773 * get the second half. The first half of all four decompositions is always
1774 * U+0DD9.
1775 *
1776 * Now, there are buggy fonts, namely, the widely used lklug.ttf, that are
1777 * broken with Uniscribe. But we need to support them. As such, we only
1778 * do the Uniscribe-style decomposition if the character is transformed into
1779 * its "sec.half" form by the 'pstf' feature. Otherwise, we fall back to
1780 * Unicode decomposition.
1781 *
1782 * Note that we can't unconditionally use Unicode decomposition. That would
1783 * break some other fonts, that are designed to work with Uniscribe, and
1784 * don't have positioning features for the Unicode-style decomposition.
1785 *
1786 * Argh...
Behdad Esfahbodb71b0bd2012-12-05 19:20:31 -05001787 *
1788 * The Uniscribe behavior is now documented in the newly published Sinhala
1789 * spec in 2012:
1790 *
1791 * http://www.microsoft.com/typography/OpenTypeDev/sinhala/intro.htm#shaping
Behdad Esfahbod43b65312012-11-16 13:12:35 -08001792 */
1793
1794 const indic_shape_plan_t *indic_plan = (const indic_shape_plan_t *) c->plan->data;
1795
1796 hb_codepoint_t glyph;
1797
Behdad Esfahbodbab02d32013-02-12 15:26:45 -05001798 if (hb_options ().uniscribe_bug_compatible ||
Behdad Esfahbod43b65312012-11-16 13:12:35 -08001799 (c->font->get_glyph (ab, 0, &glyph) &&
Behdad Esfahbodb5a0f692013-10-17 18:04:23 +02001800 indic_plan->pstf.would_substitute (&glyph, 1, c->font->face)))
Behdad Esfahbod43b65312012-11-16 13:12:35 -08001801 {
1802 /* Ok, safe to use Uniscribe-style decomposition. */
Behdad Esfahbod76271002014-07-11 14:54:42 -04001803 *a = 0x0DD9u;
Behdad Esfahbod43b65312012-11-16 13:12:35 -08001804 *b = ab;
1805 return true;
1806 }
Behdad Esfahbod07369152012-11-13 12:35:35 -08001807 }
1808
Behdad Esfahbodeba312c2012-11-16 12:39:23 -08001809 return c->unicode->decompose (ab, a, b);
Behdad Esfahbod07369152012-11-13 12:35:35 -08001810}
1811
Behdad Esfahbodeba312c2012-11-16 12:39:23 -08001812static bool
1813compose_indic (const hb_ot_shape_normalize_context_t *c,
Behdad Esfahbod07369152012-11-13 12:35:35 -08001814 hb_codepoint_t a,
1815 hb_codepoint_t b,
1816 hb_codepoint_t *ab)
1817{
1818 /* Avoid recomposing split matras. */
Behdad Esfahbodeba312c2012-11-16 12:39:23 -08001819 if (HB_UNICODE_GENERAL_CATEGORY_IS_MARK (c->unicode->general_category (a)))
Behdad Esfahbod07369152012-11-13 12:35:35 -08001820 return false;
1821
1822 /* Composition-exclusion exceptions that we want to recompose. */
Behdad Esfahbod76271002014-07-11 14:54:42 -04001823 if (a == 0x09AFu && b == 0x09BCu) { *ab = 0x09DFu; return true; }
Behdad Esfahbod07369152012-11-13 12:35:35 -08001824
Behdad Esfahbodeba312c2012-11-16 12:39:23 -08001825 return c->unicode->compose (a, b, ab);
Behdad Esfahbod07369152012-11-13 12:35:35 -08001826}
1827
1828
Behdad Esfahbod693918e2012-07-30 21:08:51 -04001829const hb_ot_complex_shaper_t _hb_ot_complex_shaper_indic =
1830{
1831 "indic",
1832 collect_features_indic,
1833 override_features_indic,
Behdad Esfahboda8c6da92012-08-02 10:46:34 -04001834 data_create_indic,
1835 data_destroy_indic,
Behdad Esfahbod9f9f04c2012-08-11 18:34:13 -04001836 NULL, /* preprocess_text */
Behdad Esfahbod3d6ca0d2013-12-31 16:04:35 +08001837 HB_OT_SHAPE_NORMALIZATION_MODE_COMPOSED_DIACRITICS_NO_SHORT_CIRCUIT,
Behdad Esfahbod07369152012-11-13 12:35:35 -08001838 decompose_indic,
1839 compose_indic,
Behdad Esfahbod693918e2012-07-30 21:08:51 -04001840 setup_masks_indic,
Behdad Esfahbod71b4c992013-10-28 00:20:59 +01001841 HB_OT_SHAPE_ZERO_WIDTH_MARKS_NONE,
Behdad Esfahbod865745b2012-11-14 13:48:26 -08001842 false, /* fallback_position */
Behdad Esfahbod693918e2012-07-30 21:08:51 -04001843};