/*
 * Copyright © 2011,2012  Google, Inc.
 *
 *  This is part of HarfBuzz, a text shaping library.
 *
 * Permission is hereby granted, without written agreement and without
 * license or royalty fees, to use, copy, modify, and distribute this
 * software and its documentation for any purpose, provided that the
 * above copyright notice and the following two paragraphs appear in
 * all copies of this software.
 *
 * IN NO EVENT SHALL THE COPYRIGHT HOLDER BE LIABLE TO ANY PARTY FOR
 * DIRECT, INDIRECT, SPECIAL, INCIDENTAL, OR CONSEQUENTIAL DAMAGES
 * ARISING OUT OF THE USE OF THIS SOFTWARE AND ITS DOCUMENTATION, EVEN
 * IF THE COPYRIGHT HOLDER HAS BEEN ADVISED OF THE POSSIBILITY OF SUCH
 * DAMAGE.
 *
 * THE COPYRIGHT HOLDER SPECIFICALLY DISCLAIMS ANY WARRANTIES, INCLUDING,
 * BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND
 * FITNESS FOR A PARTICULAR PURPOSE.  THE SOFTWARE PROVIDED HEREUNDER IS
 * ON AN "AS IS" BASIS, AND THE COPYRIGHT HOLDER HAS NO OBLIGATION TO
 * PROVIDE MAINTENANCE, SUPPORT, UPDATES, ENHANCEMENTS, OR MODIFICATIONS.
 *
 * Google Author(s): Behdad Esfahbod
 */
| 26 | |
| 27 | #ifndef HB_OT_SHAPE_COMPLEX_KHMER_MACHINE_HH |
| 28 | #define HB_OT_SHAPE_COMPLEX_KHMER_MACHINE_HH |
| 29 | |
| 30 | #include "hb-private.hh" |
| 31 | |
/*
 * Ragel machine declaration for the Khmer syllable scanner.
 *
 * - `machine` names the state machine; later %%{ }%% sections in this file
 *   that do not name a machine continue this one.
 * - `alphtype unsigned char` declares the type of the input symbols the
 *   machine consumes.
 * - `write data` makes Ragel emit the machine's static data at this point
 *   of the generated file.
 */
%%{
  machine khmer_syllable_machine;
  alphtype unsigned char;
  write data;
}%%
| 37 | |
/*
 * Grammar of the Khmer syllable scanner: category codes, helper
 * sub-expressions, the three token patterns, and the scanner that
 * dispatches each matched token to found_syllable().
 */
%%{

# Category codes: the alphabet of the machine.  The scanner reads
# info[p].khmer_category() through the getkey statement in find_syllables,
# so each name below stands for one value of that key.
# Same order as enum khmer_category_t.  Not sure how to avoid duplication.
# The numbering used here is not contiguous: 4, 9, 10 and 15 do not appear.
C    = 1;
V    = 2;
N    = 3;
ZWNJ = 5;
ZWJ  = 6;
M    = 7;
SM   = 8;
PLACEHOLDER = 11;
DOTTEDCIRCLE = 12;
RS    = 13;
Coeng = 14;
Ra    = 16;

# Single-symbol classes and the consonant modifier sequence.
# n is an optional RS (itself optionally preceded by ZWNJ) followed by up
# to two N; every part is optional, so n can also be empty.
c = (C | Ra | V);		# is_consonant
n = ((ZWNJ?.RS)? (N.N?)?);	# is_consonant_modifier
z = ZWJ|ZWNJ;			# is_joiner

# cn:            a consonant with its optional modifier sequence.
# matra_group:   optional joiner, then M, then an optional N.
# syllable_tail: zero, one or two SM.
cn = c.n?;
matra_group = z?.M.N?;
syllable_tail = (SM.SM?)?;


# broken_cluster:     the part of a syllable that follows the base: optional
#                     modifiers, any number of Coeng+cn pairs, any number of
#                     matra groups, one optional trailing Coeng+cn, then the
#                     tail.  Used on its own it is a cluster without a base.
#                     NOTE(review): every term here is optional, so this
#                     pattern can match zero symbols; confirm how the
#                     scanner treats that case.
# consonant_syllable: a base (c, PLACEHOLDER or DOTTEDCIRCLE) followed by the
#                     same continuation.
# other:              exactly one symbol of any category.
broken_cluster =	n? (Coeng.cn)* matra_group* (Coeng.cn)? syllable_tail;
consonant_syllable =	(c|PLACEHOLDER|DOTTEDCIRCLE) broken_cluster;
other =			any;

# Scanner.  The longest match wins; per Ragel scanner semantics, patterns
# listed earlier take priority when matches tie, so the order of the three
# alternatives below matters.  Each action tags the matched range through
# the found_syllable macro, which is defined further down in this file; the
# action text is only emitted where the write exec statement appears.
main := |*
	consonant_syllable	=> { found_syllable (consonant_syllable); };
	broken_cluster		=> { found_syllable (broken_cluster); };
	other			=> { found_syllable (non_khmer_cluster); };
*|;


}%%
| 75 | |
/*
 * found_syllable(syllable_type)
 *
 * Expanded inside the scanner actions once a token has been matched.
 * Writes to info[i].syllable(), for every glyph i in [last, p], a value
 * holding the current serial in the bits above the low four
 * (syllable_serial << 4) OR-ed with syllable_type, then moves `last` just
 * past the token and advances the serial.
 *
 * The serial wraps from 15 back to 1, so it always fits in four bits and
 * is never 0.
 *
 * Relies on the following names being in scope at the expansion site (all
 * are locals of find_syllables()): info, p, last, syllable_serial.
 *
 * The fprintf is a compiled-but-disabled debug trace; it uses %u because
 * both `last` and `p+1` are unsigned int.  The argument is parenthesized
 * in the OR expression so that a non-trivial expression passed as
 * syllable_type cannot change the grouping.
 */
#define found_syllable(syllable_type) \
  HB_STMT_START { \
    if (0) fprintf (stderr, "syllable %u..%u %s\n", last, p+1, #syllable_type); \
    for (unsigned int i = last; i < p+1; i++) \
      info[i].syllable() = (syllable_serial << 4) | (syllable_type); \
    last = p+1; \
    syllable_serial++; \
    if (unlikely (syllable_serial == 16)) syllable_serial = 1; \
  } HB_STMT_END
| 85 | |
| 86 | static void |
| 87 | find_syllables (hb_buffer_t *buffer) |
| 88 | { |
| 89 | unsigned int p, pe, eof, ts HB_UNUSED, te HB_UNUSED, act HB_UNUSED; |
| 90 | int cs; |
| 91 | hb_glyph_info_t *info = buffer->info; |
| 92 | %%{ |
| 93 | write init; |
| 94 | getkey info[p].khmer_category(); |
| 95 | }%% |
| 96 | |
| 97 | p = 0; |
| 98 | pe = eof = buffer->len; |
| 99 | |
| 100 | unsigned int last = 0; |
| 101 | unsigned int syllable_serial = 1; |
| 102 | %%{ |
| 103 | write exec; |
| 104 | }%% |
| 105 | } |
| 106 | |
| 107 | #endif /* HB_OT_SHAPE_COMPLEX_KHMER_MACHINE_HH */ |