hb-ot-shape-complex-indic.cc revision 0201e0a4649ad5b607e50bcb9605e7a5b7143812
1b9ddbd55930228422e82b34a141ad1b6093f5376Behdad Esfahbod/* 227aba594c90b4444c35273a38f5fedc8e09d9a88Behdad Esfahbod * Copyright © 2011,2012 Google, Inc. 3b9ddbd55930228422e82b34a141ad1b6093f5376Behdad Esfahbod * 4b9ddbd55930228422e82b34a141ad1b6093f5376Behdad Esfahbod * This is part of HarfBuzz, a text shaping library. 5b9ddbd55930228422e82b34a141ad1b6093f5376Behdad Esfahbod * 6b9ddbd55930228422e82b34a141ad1b6093f5376Behdad Esfahbod * Permission is hereby granted, without written agreement and without 7b9ddbd55930228422e82b34a141ad1b6093f5376Behdad Esfahbod * license or royalty fees, to use, copy, modify, and distribute this 8b9ddbd55930228422e82b34a141ad1b6093f5376Behdad Esfahbod * software and its documentation for any purpose, provided that the 9b9ddbd55930228422e82b34a141ad1b6093f5376Behdad Esfahbod * above copyright notice and the following two paragraphs appear in 10b9ddbd55930228422e82b34a141ad1b6093f5376Behdad Esfahbod * all copies of this software. 11b9ddbd55930228422e82b34a141ad1b6093f5376Behdad Esfahbod * 12b9ddbd55930228422e82b34a141ad1b6093f5376Behdad Esfahbod * IN NO EVENT SHALL THE COPYRIGHT HOLDER BE LIABLE TO ANY PARTY FOR 13b9ddbd55930228422e82b34a141ad1b6093f5376Behdad Esfahbod * DIRECT, INDIRECT, SPECIAL, INCIDENTAL, OR CONSEQUENTIAL DAMAGES 14b9ddbd55930228422e82b34a141ad1b6093f5376Behdad Esfahbod * ARISING OUT OF THE USE OF THIS SOFTWARE AND ITS DOCUMENTATION, EVEN 15b9ddbd55930228422e82b34a141ad1b6093f5376Behdad Esfahbod * IF THE COPYRIGHT HOLDER HAS BEEN ADVISED OF THE POSSIBILITY OF SUCH 16b9ddbd55930228422e82b34a141ad1b6093f5376Behdad Esfahbod * DAMAGE. 17b9ddbd55930228422e82b34a141ad1b6093f5376Behdad Esfahbod * 18b9ddbd55930228422e82b34a141ad1b6093f5376Behdad Esfahbod * THE COPYRIGHT HOLDER SPECIFICALLY DISCLAIMS ANY WARRANTIES, INCLUDING, 19b9ddbd55930228422e82b34a141ad1b6093f5376Behdad Esfahbod * BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND 20b9ddbd55930228422e82b34a141ad1b6093f5376Behdad Esfahbod * FITNESS FOR A PARTICULAR PURPOSE. THE SOFTWARE PROVIDED HEREUNDER IS 21b9ddbd55930228422e82b34a141ad1b6093f5376Behdad Esfahbod * ON AN "AS IS" BASIS, AND THE COPYRIGHT HOLDER HAS NO OBLIGATION TO 22b9ddbd55930228422e82b34a141ad1b6093f5376Behdad Esfahbod * PROVIDE MAINTENANCE, SUPPORT, UPDATES, ENHANCEMENTS, OR MODIFICATIONS. 23b9ddbd55930228422e82b34a141ad1b6093f5376Behdad Esfahbod * 24b9ddbd55930228422e82b34a141ad1b6093f5376Behdad Esfahbod * Google Author(s): Behdad Esfahbod 25b9ddbd55930228422e82b34a141ad1b6093f5376Behdad Esfahbod */ 26b9ddbd55930228422e82b34a141ad1b6093f5376Behdad Esfahbod 273ed4634ec349fa9e943ad23718c04be4dd4bba62Behdad Esfahbod#include "hb-ot-shape-complex-indic-private.hh" 28a913b024d84973556094fd64ce5f0b7106fcc3b5Behdad Esfahbod#include "hb-ot-shape-private.hh" 29352372ae5ea0998e40cf9fe43c22b6b610a5764eBehdad Esfahbod 30a3e04bee2c2fa648759a87e460db6b4f1b685586Behdad Esfahbod#define OLD_INDIC_TAG(script) (((hb_tag_t) script) | 0x20000000) 31a3e04bee2c2fa648759a87e460db6b4f1b685586Behdad Esfahbod#define IS_OLD_INDIC_TAG(tag) ( \ 32a3e04bee2c2fa648759a87e460db6b4f1b685586Behdad Esfahbod (tag) == OLD_INDIC_TAG (HB_SCRIPT_BENGALI) || \ 33a3e04bee2c2fa648759a87e460db6b4f1b685586Behdad Esfahbod (tag) == OLD_INDIC_TAG (HB_SCRIPT_DEVANAGARI) || \ 34a3e04bee2c2fa648759a87e460db6b4f1b685586Behdad Esfahbod (tag) == OLD_INDIC_TAG (HB_SCRIPT_GUJARATI) || \ 35a3e04bee2c2fa648759a87e460db6b4f1b685586Behdad Esfahbod (tag) == OLD_INDIC_TAG (HB_SCRIPT_GURMUKHI) || \ 36a3e04bee2c2fa648759a87e460db6b4f1b685586Behdad Esfahbod (tag) == OLD_INDIC_TAG (HB_SCRIPT_KANNADA) || \ 37a3e04bee2c2fa648759a87e460db6b4f1b685586Behdad Esfahbod (tag) == OLD_INDIC_TAG (HB_SCRIPT_MALAYALAM) || \ 38a3e04bee2c2fa648759a87e460db6b4f1b685586Behdad Esfahbod (tag) == OLD_INDIC_TAG (HB_SCRIPT_ORIYA) || \ 39a3e04bee2c2fa648759a87e460db6b4f1b685586Behdad Esfahbod (tag) == OLD_INDIC_TAG (HB_SCRIPT_TAMIL) || \ 40a3e04bee2c2fa648759a87e460db6b4f1b685586Behdad Esfahbod (tag) == OLD_INDIC_TAG (HB_SCRIPT_TELUGU) \ 41a3e04bee2c2fa648759a87e460db6b4f1b685586Behdad Esfahbod ) 42a2b471df821b32625d127f83b2f90e6d6a967e7eBehdad Esfahbodstruct indic_options_t 43ebe29733d44fe0fa9fb30f946ab0dd7a40336a24Behdad Esfahbod{ 44a2b471df821b32625d127f83b2f90e6d6a967e7eBehdad Esfahbod int initialized : 1; 45a2b471df821b32625d127f83b2f90e6d6a967e7eBehdad Esfahbod int uniscribe_bug_compatible : 1; 46a2b471df821b32625d127f83b2f90e6d6a967e7eBehdad Esfahbod}; 47a2b471df821b32625d127f83b2f90e6d6a967e7eBehdad Esfahbod 48a2b471df821b32625d127f83b2f90e6d6a967e7eBehdad Esfahbodunion indic_options_union_t { 49a2b471df821b32625d127f83b2f90e6d6a967e7eBehdad Esfahbod int i; 50a2b471df821b32625d127f83b2f90e6d6a967e7eBehdad Esfahbod indic_options_t opts; 51a2b471df821b32625d127f83b2f90e6d6a967e7eBehdad Esfahbod}; 52a2b471df821b32625d127f83b2f90e6d6a967e7eBehdad EsfahbodASSERT_STATIC (sizeof (int) == sizeof (indic_options_union_t)); 53a2b471df821b32625d127f83b2f90e6d6a967e7eBehdad Esfahbod 54a2b471df821b32625d127f83b2f90e6d6a967e7eBehdad Esfahbodstatic indic_options_union_t 55a2b471df821b32625d127f83b2f90e6d6a967e7eBehdad Esfahbodindic_options_init (void) 56a2b471df821b32625d127f83b2f90e6d6a967e7eBehdad Esfahbod{ 57a2b471df821b32625d127f83b2f90e6d6a967e7eBehdad Esfahbod indic_options_union_t u; 58a2b471df821b32625d127f83b2f90e6d6a967e7eBehdad Esfahbod u.i = 0; 59a2b471df821b32625d127f83b2f90e6d6a967e7eBehdad Esfahbod u.opts.initialized = 1; 60a2b471df821b32625d127f83b2f90e6d6a967e7eBehdad Esfahbod 61a2b471df821b32625d127f83b2f90e6d6a967e7eBehdad Esfahbod char *c = getenv ("HB_OT_INDIC_OPTIONS"); 62a2b471df821b32625d127f83b2f90e6d6a967e7eBehdad Esfahbod u.opts.uniscribe_bug_compatible = c && strstr (c, "uniscribe-bug-compatible"); 63a2b471df821b32625d127f83b2f90e6d6a967e7eBehdad Esfahbod 64a2b471df821b32625d127f83b2f90e6d6a967e7eBehdad Esfahbod return u; 65a2b471df821b32625d127f83b2f90e6d6a967e7eBehdad Esfahbod} 66a2b471df821b32625d127f83b2f90e6d6a967e7eBehdad Esfahbod 67a2b471df821b32625d127f83b2f90e6d6a967e7eBehdad Esfahbodinline indic_options_t 68a2b471df821b32625d127f83b2f90e6d6a967e7eBehdad Esfahbodindic_options (void) 69a2b471df821b32625d127f83b2f90e6d6a967e7eBehdad Esfahbod{ 70a2b471df821b32625d127f83b2f90e6d6a967e7eBehdad Esfahbod static indic_options_union_t options; 71a2b471df821b32625d127f83b2f90e6d6a967e7eBehdad Esfahbod 72a2b471df821b32625d127f83b2f90e6d6a967e7eBehdad Esfahbod if (unlikely (!options.i)) { 73a2b471df821b32625d127f83b2f90e6d6a967e7eBehdad Esfahbod /* This is idempotent and threadsafe. */ 74a2b471df821b32625d127f83b2f90e6d6a967e7eBehdad Esfahbod options = indic_options_init (); 75ebe29733d44fe0fa9fb30f946ab0dd7a40336a24Behdad Esfahbod } 76ebe29733d44fe0fa9fb30f946ab0dd7a40336a24Behdad Esfahbod 77a2b471df821b32625d127f83b2f90e6d6a967e7eBehdad Esfahbod return options.opts; 78a2b471df821b32625d127f83b2f90e6d6a967e7eBehdad Esfahbod} 79a2b471df821b32625d127f83b2f90e6d6a967e7eBehdad Esfahbod 80ebe29733d44fe0fa9fb30f946ab0dd7a40336a24Behdad Esfahbod 81743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbodstatic int 82743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbodcompare_codepoint (const void *pa, const void *pb) 83743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod{ 84743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod hb_codepoint_t a = * (hb_codepoint_t *) pa; 85743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod hb_codepoint_t b = * (hb_codepoint_t *) pb; 86743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod 87743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod return a < b ? -1 : a == b ? 0 : +1; 88743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod} 89743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod 90743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbodstatic indic_position_t 91743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbodconsonant_position (hb_codepoint_t u) 92743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod{ 93743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod consonant_position_t *record; 94743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod 950de771b72da6b342b015e3556190821547a4011dBehdad Esfahbod /* Khmer does not have pre-base half forms. */ 960de771b72da6b342b015e3556190821547a4011dBehdad Esfahbod if (0x1780 <= u && u <= 0x17FF) 970de771b72da6b342b015e3556190821547a4011dBehdad Esfahbod return POS_BELOW_C; 980de771b72da6b342b015e3556190821547a4011dBehdad Esfahbod 99743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod record = (consonant_position_t *) bsearch (&u, consonant_positions, 100743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod ARRAY_LENGTH (consonant_positions), 101743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod sizeof (consonant_positions[0]), 102743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod compare_codepoint); 103743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod 104dbccf87eef0d26838fa4bb3ae26410f6c4818836Behdad Esfahbod return record ? record->position : POS_BASE_C; 105743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod} 106743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod 107352372ae5ea0998e40cf9fe43c22b6b610a5764eBehdad Esfahbodstatic bool 108352372ae5ea0998e40cf9fe43c22b6b610a5764eBehdad Esfahbodis_ra (hb_codepoint_t u) 109352372ae5ea0998e40cf9fe43c22b6b610a5764eBehdad Esfahbod{ 110352372ae5ea0998e40cf9fe43c22b6b610a5764eBehdad Esfahbod return !!bsearch (&u, ra_chars, 111352372ae5ea0998e40cf9fe43c22b6b610a5764eBehdad Esfahbod ARRAY_LENGTH (ra_chars), 112352372ae5ea0998e40cf9fe43c22b6b610a5764eBehdad Esfahbod sizeof (ra_chars[0]), 113352372ae5ea0998e40cf9fe43c22b6b610a5764eBehdad Esfahbod compare_codepoint); 114352372ae5ea0998e40cf9fe43c22b6b610a5764eBehdad Esfahbod} 115352372ae5ea0998e40cf9fe43c22b6b610a5764eBehdad Esfahbod 1169ee27a928a989c71923cef82a9e9828f8e9ca051Behdad Esfahbodstatic bool 1179da0487cd452d780673e24329ce03e174a4ef83bBehdad Esfahbodis_joiner (const hb_glyph_info_t &info) 1189ee27a928a989c71923cef82a9e9828f8e9ca051Behdad Esfahbod{ 1199da0487cd452d780673e24329ce03e174a4ef83bBehdad Esfahbod return !!(FLAG (info.indic_category()) & (FLAG (OT_ZWJ) | FLAG (OT_ZWNJ))); 1209da0487cd452d780673e24329ce03e174a4ef83bBehdad Esfahbod} 1219da0487cd452d780673e24329ce03e174a4ef83bBehdad Esfahbod 1229da0487cd452d780673e24329ce03e174a4ef83bBehdad Esfahbodstatic bool 1239da0487cd452d780673e24329ce03e174a4ef83bBehdad Esfahbodis_consonant (const hb_glyph_info_t &info) 1249da0487cd452d780673e24329ce03e174a4ef83bBehdad Esfahbod{ 1251a1fa8c655a082fc1439608457ba717306cc83caBehdad Esfahbod /* Note: 1261a1fa8c655a082fc1439608457ba717306cc83caBehdad Esfahbod * 12718c06e189bd078affbb84c3bb5bb80687a227c5eBehdad Esfahbod * We treat Vowels and placeholders as if they were consonants. This is safe because Vowels 128c5306b6861cfaa50af40e8ceb058791fa06d7981Behdad Esfahbod * cannot happen in a consonant syllable. The plus side however is, we can call the 129c5306b6861cfaa50af40e8ceb058791fa06d7981Behdad Esfahbod * consonant syllable logic from the vowel syllable function and get it all right! */ 13018c06e189bd078affbb84c3bb5bb80687a227c5eBehdad Esfahbod return !!(FLAG (info.indic_category()) & (FLAG (OT_C) | FLAG (OT_Ra) | FLAG (OT_V) | FLAG (OT_NBSP) | FLAG (OT_DOTTEDCIRCLE))); 1319ee27a928a989c71923cef82a9e9828f8e9ca051Behdad Esfahbod} 132c7fe56a1d5d3e969b6ec51cd9ecd471706a19568Behdad Esfahbod 133deb521dee4fdca8c2124cfb39a205e6269d4a70dBehdad Esfahbodstatic bool 134deb521dee4fdca8c2124cfb39a205e6269d4a70dBehdad Esfahbodis_halant_or_coeng (const hb_glyph_info_t &info) 135deb521dee4fdca8c2124cfb39a205e6269d4a70dBehdad Esfahbod{ 136deb521dee4fdca8c2124cfb39a205e6269d4a70dBehdad Esfahbod return !!(FLAG (info.indic_category()) & (FLAG (OT_H) | FLAG (OT_Coeng))); 137deb521dee4fdca8c2124cfb39a205e6269d4a70dBehdad Esfahbod} 138deb521dee4fdca8c2124cfb39a205e6269d4a70dBehdad Esfahbod 139eed903b1644e087178438959664a6a57bebc398bBehdad Esfahbodstruct feature_list_t { 140c7fe56a1d5d3e969b6ec51cd9ecd471706a19568Behdad Esfahbod hb_tag_t tag; 141c7fe56a1d5d3e969b6ec51cd9ecd471706a19568Behdad Esfahbod hb_bool_t is_global; 142eed903b1644e087178438959664a6a57bebc398bBehdad Esfahbod}; 143eed903b1644e087178438959664a6a57bebc398bBehdad Esfahbod 144d5c4edcdd6df32f2f23aca44f14838b4baab4d7aBehdad Esfahbod/* These features are applied one at a time, given the order in this table. */ 145eed903b1644e087178438959664a6a57bebc398bBehdad Esfahbodstatic const feature_list_t 146eed903b1644e087178438959664a6a57bebc398bBehdad Esfahbodindic_basic_features[] = 147b9ddbd55930228422e82b34a141ad1b6093f5376Behdad Esfahbod{ 148c7fe56a1d5d3e969b6ec51cd9ecd471706a19568Behdad Esfahbod {HB_TAG('n','u','k','t'), true}, 149c7fe56a1d5d3e969b6ec51cd9ecd471706a19568Behdad Esfahbod {HB_TAG('a','k','h','n'), false}, 150c7fe56a1d5d3e969b6ec51cd9ecd471706a19568Behdad Esfahbod {HB_TAG('r','p','h','f'), false}, 1511ac075b227090a9ad930dcc1670236c176b27067Behdad Esfahbod {HB_TAG('r','k','r','f'), true}, 152c7fe56a1d5d3e969b6ec51cd9ecd471706a19568Behdad Esfahbod {HB_TAG('p','r','e','f'), false}, 153c7fe56a1d5d3e969b6ec51cd9ecd471706a19568Behdad Esfahbod {HB_TAG('b','l','w','f'), false}, 154c7fe56a1d5d3e969b6ec51cd9ecd471706a19568Behdad Esfahbod {HB_TAG('h','a','l','f'), false}, 15529f106d7fba25e1464debd3a4831a7380d75c4c9Behdad Esfahbod {HB_TAG('a','b','v','f'), false}, 156c7fe56a1d5d3e969b6ec51cd9ecd471706a19568Behdad Esfahbod {HB_TAG('p','s','t','f'), false}, 1570201e0a4649ad5b607e50bcb9605e7a5b7143812Behdad Esfahbod {HB_TAG('c','f','a','r'), false}, 1589da0487cd452d780673e24329ce03e174a4ef83bBehdad Esfahbod {HB_TAG('c','j','c','t'), false}, 1591d6846db9ebf84561bb30a4e48c6c43184914099Behdad Esfahbod {HB_TAG('v','a','t','u'), true}, 160c7fe56a1d5d3e969b6ec51cd9ecd471706a19568Behdad Esfahbod}; 161c7fe56a1d5d3e969b6ec51cd9ecd471706a19568Behdad Esfahbod 162c7fe56a1d5d3e969b6ec51cd9ecd471706a19568Behdad Esfahbod/* Same order as the indic_basic_features array */ 163c7fe56a1d5d3e969b6ec51cd9ecd471706a19568Behdad Esfahbodenum { 164c7fe56a1d5d3e969b6ec51cd9ecd471706a19568Behdad Esfahbod _NUKT, 165c7fe56a1d5d3e969b6ec51cd9ecd471706a19568Behdad Esfahbod AKHN, 166c7fe56a1d5d3e969b6ec51cd9ecd471706a19568Behdad Esfahbod RPHF, 167df6d45c693c417bf311e6fa49f18a8558542e525Behdad Esfahbod _RKRF, 168c7fe56a1d5d3e969b6ec51cd9ecd471706a19568Behdad Esfahbod PREF, 169c7fe56a1d5d3e969b6ec51cd9ecd471706a19568Behdad Esfahbod BLWF, 170c7fe56a1d5d3e969b6ec51cd9ecd471706a19568Behdad Esfahbod HALF, 17129f106d7fba25e1464debd3a4831a7380d75c4c9Behdad Esfahbod ABVF, 172c7fe56a1d5d3e969b6ec51cd9ecd471706a19568Behdad Esfahbod PSTF, 1730201e0a4649ad5b607e50bcb9605e7a5b7143812Behdad Esfahbod CFAR, 1741d6846db9ebf84561bb30a4e48c6c43184914099Behdad Esfahbod CJCT, 1751d6846db9ebf84561bb30a4e48c6c43184914099Behdad Esfahbod VATU 176b9ddbd55930228422e82b34a141ad1b6093f5376Behdad Esfahbod}; 177b9ddbd55930228422e82b34a141ad1b6093f5376Behdad Esfahbod 178d5c4edcdd6df32f2f23aca44f14838b4baab4d7aBehdad Esfahbod/* These features are applied all at once. */ 179eed903b1644e087178438959664a6a57bebc398bBehdad Esfahbodstatic const feature_list_t 180eed903b1644e087178438959664a6a57bebc398bBehdad Esfahbodindic_other_features[] = 181b9ddbd55930228422e82b34a141ad1b6093f5376Behdad Esfahbod{ 182eed903b1644e087178438959664a6a57bebc398bBehdad Esfahbod {HB_TAG('i','n','i','t'), false}, 183eed903b1644e087178438959664a6a57bebc398bBehdad Esfahbod {HB_TAG('p','r','e','s'), true}, 184eed903b1644e087178438959664a6a57bebc398bBehdad Esfahbod {HB_TAG('a','b','v','s'), true}, 185eed903b1644e087178438959664a6a57bebc398bBehdad Esfahbod {HB_TAG('b','l','w','s'), true}, 186eed903b1644e087178438959664a6a57bebc398bBehdad Esfahbod {HB_TAG('p','s','t','s'), true}, 187eed903b1644e087178438959664a6a57bebc398bBehdad Esfahbod {HB_TAG('h','a','l','n'), true}, 188eed903b1644e087178438959664a6a57bebc398bBehdad Esfahbod 189eed903b1644e087178438959664a6a57bebc398bBehdad Esfahbod {HB_TAG('d','i','s','t'), true}, 190eed903b1644e087178438959664a6a57bebc398bBehdad Esfahbod {HB_TAG('a','b','v','m'), true}, 191eed903b1644e087178438959664a6a57bebc398bBehdad Esfahbod {HB_TAG('b','l','w','m'), true}, 192eed903b1644e087178438959664a6a57bebc398bBehdad Esfahbod}; 193eed903b1644e087178438959664a6a57bebc398bBehdad Esfahbod 194743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod 195743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbodstatic void 196743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbodinitial_reordering (const hb_ot_map_t *map, 197743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod hb_face_t *face, 198743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod hb_buffer_t *buffer, 199743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod void *user_data HB_UNUSED); 200f6fd3780e12b23ff7ed3743497c8996e71dcb064Behdad Esfahbodstatic void 201f6fd3780e12b23ff7ed3743497c8996e71dcb064Behdad Esfahbodfinal_reordering (const hb_ot_map_t *map, 202f6fd3780e12b23ff7ed3743497c8996e71dcb064Behdad Esfahbod hb_face_t *face, 203f6fd3780e12b23ff7ed3743497c8996e71dcb064Behdad Esfahbod hb_buffer_t *buffer, 204743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod void *user_data HB_UNUSED); 205b9ddbd55930228422e82b34a141ad1b6093f5376Behdad Esfahbod 206b9ddbd55930228422e82b34a141ad1b6093f5376Behdad Esfahbodvoid 2079f377ed3210fe7d9f15e0c4f82020556f9a8f6f0Behdad Esfahbod_hb_ot_shape_complex_collect_features_indic (hb_ot_map_builder_t *map, 2089f377ed3210fe7d9f15e0c4f82020556f9a8f6f0Behdad Esfahbod const hb_segment_properties_t *props HB_UNUSED) 209b9ddbd55930228422e82b34a141ad1b6093f5376Behdad Esfahbod{ 210f6fd3780e12b23ff7ed3743497c8996e71dcb064Behdad Esfahbod map->add_bool_feature (HB_TAG('l','o','c','l')); 211a54a5505a35eef5315a8e2e7a79502901e3eff5fBehdad Esfahbod /* The Indic specs do not require ccmp, but we apply it here since if 212a54a5505a35eef5315a8e2e7a79502901e3eff5fBehdad Esfahbod * there is a use of it, it's typically at the beginning. */ 213f6fd3780e12b23ff7ed3743497c8996e71dcb064Behdad Esfahbod map->add_bool_feature (HB_TAG('c','c','m','p')); 214f6fd3780e12b23ff7ed3743497c8996e71dcb064Behdad Esfahbod 215743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod map->add_gsub_pause (initial_reordering, NULL); 216f6fd3780e12b23ff7ed3743497c8996e71dcb064Behdad Esfahbod 217412b91889d9a1ae477e8b6907d0b9a76e78a6c91Behdad Esfahbod for (unsigned int i = 0; i < ARRAY_LENGTH (indic_basic_features); i++) { 21876f76812ac7cca8ac6935952a2360d5e151480faBehdad Esfahbod map->add_bool_feature (indic_basic_features[i].tag, indic_basic_features[i].is_global); 219412b91889d9a1ae477e8b6907d0b9a76e78a6c91Behdad Esfahbod map->add_gsub_pause (NULL, NULL); 220412b91889d9a1ae477e8b6907d0b9a76e78a6c91Behdad Esfahbod } 221b9ddbd55930228422e82b34a141ad1b6093f5376Behdad Esfahbod 222f6fd3780e12b23ff7ed3743497c8996e71dcb064Behdad Esfahbod map->add_gsub_pause (final_reordering, NULL); 223f6fd3780e12b23ff7ed3743497c8996e71dcb064Behdad Esfahbod 224d5c4edcdd6df32f2f23aca44f14838b4baab4d7aBehdad Esfahbod for (unsigned int i = 0; i < ARRAY_LENGTH (indic_other_features); i++) 225eed903b1644e087178438959664a6a57bebc398bBehdad Esfahbod map->add_bool_feature (indic_other_features[i].tag, indic_other_features[i].is_global); 226b9ddbd55930228422e82b34a141ad1b6093f5376Behdad Esfahbod} 227b9ddbd55930228422e82b34a141ad1b6093f5376Behdad Esfahbod 228d96838ef951ce6170eb2dc576ebcba2262cf7008Behdad Esfahbodvoid 229d96838ef951ce6170eb2dc576ebcba2262cf7008Behdad Esfahbod_hb_ot_shape_complex_override_features_indic (hb_ot_map_builder_t *map, 230d96838ef951ce6170eb2dc576ebcba2262cf7008Behdad Esfahbod const hb_segment_properties_t *props HB_UNUSED) 231d96838ef951ce6170eb2dc576ebcba2262cf7008Behdad Esfahbod{ 232af92b4cc90e4184d5bdd8037c551ed482700114fBehdad Esfahbod /* Uniscribe does not apply 'kern'. */ 233af92b4cc90e4184d5bdd8037c551ed482700114fBehdad Esfahbod if (indic_options ().uniscribe_bug_compatible) 234af92b4cc90e4184d5bdd8037c551ed482700114fBehdad Esfahbod map->add_feature (HB_TAG('k','e','r','n'), 0, true); 235d96838ef951ce6170eb2dc576ebcba2262cf7008Behdad Esfahbod} 236d96838ef951ce6170eb2dc576ebcba2262cf7008Behdad Esfahbod 237867361c3ad39629a8d5b7dc48d558a1c19e37d43Behdad Esfahbod 23811138ccff71f442da1fcf64faa0e1d22e083e775Behdad Esfahbodhb_ot_shape_normalization_mode_t 23911138ccff71f442da1fcf64faa0e1d22e083e775Behdad Esfahbod_hb_ot_shape_complex_normalization_preference_indic (void) 24002cdf743c2ec345a44d4fcf865594b6ac13fccd0Behdad Esfahbod{ 24102cdf743c2ec345a44d4fcf865594b6ac13fccd0Behdad Esfahbod /* We want split matras decomposed by the common shaping logic. */ 24211138ccff71f442da1fcf64faa0e1d22e083e775Behdad Esfahbod return HB_OT_SHAPE_NORMALIZATION_MODE_DECOMPOSED; 24302cdf743c2ec345a44d4fcf865594b6ac13fccd0Behdad Esfahbod} 24402cdf743c2ec345a44d4fcf865594b6ac13fccd0Behdad Esfahbod 245867361c3ad39629a8d5b7dc48d558a1c19e37d43Behdad Esfahbod 246b9ddbd55930228422e82b34a141ad1b6093f5376Behdad Esfahbodvoid 2479f377ed3210fe7d9f15e0c4f82020556f9a8f6f0Behdad Esfahbod_hb_ot_shape_complex_setup_masks_indic (hb_ot_map_t *map HB_UNUSED, 2489f377ed3210fe7d9f15e0c4f82020556f9a8f6f0Behdad Esfahbod hb_buffer_t *buffer, 2493f18236a03880c0960f5990dc90685f6146951a6Behdad Esfahbod hb_font_t *font HB_UNUSED) 250b9ddbd55930228422e82b34a141ad1b6093f5376Behdad Esfahbod{ 2519f9bcceca6321d5a5812f878de1de39901349a78Behdad Esfahbod HB_BUFFER_ALLOCATE_VAR (buffer, indic_category); 2529f9bcceca6321d5a5812f878de1de39901349a78Behdad Esfahbod HB_BUFFER_ALLOCATE_VAR (buffer, indic_position); 2539f9bcceca6321d5a5812f878de1de39901349a78Behdad Esfahbod 254743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod /* We cannot setup masks here. We save information about characters 255743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod * and setup masks later on in a pause-callback. */ 256743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod 257743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod unsigned int count = buffer->len; 258b9ddbd55930228422e82b34a141ad1b6093f5376Behdad Esfahbod for (unsigned int i = 0; i < count; i++) 259b9ddbd55930228422e82b34a141ad1b6093f5376Behdad Esfahbod { 26092332e5116271a5d96e532005fe750e7552a6cbbBehdad Esfahbod hb_glyph_info_t &info = buffer->info[i]; 26192332e5116271a5d96e532005fe750e7552a6cbbBehdad Esfahbod unsigned int type = get_indic_categories (info.codepoint); 26292332e5116271a5d96e532005fe750e7552a6cbbBehdad Esfahbod 26392332e5116271a5d96e532005fe750e7552a6cbbBehdad Esfahbod info.indic_category() = type & 0x0F; 26492332e5116271a5d96e532005fe750e7552a6cbbBehdad Esfahbod info.indic_position() = type >> 4; 26592332e5116271a5d96e532005fe750e7552a6cbbBehdad Esfahbod 2663399a06e7033651ee926448737bdb18e553c1796Behdad Esfahbod /* The spec says U+0952 is OT_A. However, testing shows that Uniscribe 2673399a06e7033651ee926448737bdb18e553c1796Behdad Esfahbod * treats U+0951..U+0952 all as OT_VD. 2683399a06e7033651ee926448737bdb18e553c1796Behdad Esfahbod * TESTS: 2693399a06e7033651ee926448737bdb18e553c1796Behdad Esfahbod * U+092E,U+0947,U+0952 2703399a06e7033651ee926448737bdb18e553c1796Behdad Esfahbod * U+092E,U+0952,U+0947 2713399a06e7033651ee926448737bdb18e553c1796Behdad Esfahbod * U+092E,U+0947,U+0951 2723399a06e7033651ee926448737bdb18e553c1796Behdad Esfahbod * U+092E,U+0951,U+0947 2733399a06e7033651ee926448737bdb18e553c1796Behdad Esfahbod * */ 2743399a06e7033651ee926448737bdb18e553c1796Behdad Esfahbod if (unlikely (hb_in_range<hb_codepoint_t> (info.codepoint, 0x0951, 0x0954))) 2753399a06e7033651ee926448737bdb18e553c1796Behdad Esfahbod info.indic_category() = OT_VD; 2763399a06e7033651ee926448737bdb18e553c1796Behdad Esfahbod 277df50b8474094f0563ccfdae12c4425a51b72add6Behdad Esfahbod if (info.indic_category() == OT_X && 278df50b8474094f0563ccfdae12c4425a51b72add6Behdad Esfahbod unlikely (hb_in_range<hb_codepoint_t> (info.codepoint, 0x17CB, 0x17D0))) 279df50b8474094f0563ccfdae12c4425a51b72add6Behdad Esfahbod info.indic_category() = OT_RS; 280df50b8474094f0563ccfdae12c4425a51b72add6Behdad Esfahbod 281c50ed71e9a3df1844f564de66d54b46a696c1356Behdad Esfahbod /* Khmer Virama is different since it can be used to form a final consonant. */ 282c50ed71e9a3df1844f564de66d54b46a696c1356Behdad Esfahbod if (unlikely (info.codepoint == 0x17D2)) 283c50ed71e9a3df1844f564de66d54b46a696c1356Behdad Esfahbod info.indic_category() = OT_Coeng; 284c50ed71e9a3df1844f564de66d54b46a696c1356Behdad Esfahbod 285c50ed71e9a3df1844f564de66d54b46a696c1356Behdad Esfahbod if (is_consonant (info)) { 28692332e5116271a5d96e532005fe750e7552a6cbbBehdad Esfahbod info.indic_position() = consonant_position (info.codepoint); 28792332e5116271a5d96e532005fe750e7552a6cbbBehdad Esfahbod if (is_ra (info.codepoint)) 28892332e5116271a5d96e532005fe750e7552a6cbbBehdad Esfahbod info.indic_category() = OT_Ra; 2897d09c98a1fff97127e48eae48d380dc9fcff288eBehdad Esfahbod } else if (info.indic_category() == OT_RS) { 2907d09c98a1fff97127e48eae48d380dc9fcff288eBehdad Esfahbod info.indic_position() = POS_ABOVE_M; 29192332e5116271a5d96e532005fe750e7552a6cbbBehdad Esfahbod } else if (info.indic_category() == OT_SM || 29292332e5116271a5d96e532005fe750e7552a6cbbBehdad Esfahbod info.indic_category() == OT_VD) { 29392332e5116271a5d96e532005fe750e7552a6cbbBehdad Esfahbod info.indic_position() = POS_SMVD; 29492332e5116271a5d96e532005fe750e7552a6cbbBehdad Esfahbod } else if (unlikely (info.codepoint == 0x200C)) 29592332e5116271a5d96e532005fe750e7552a6cbbBehdad Esfahbod info.indic_category() = OT_ZWNJ; 29692332e5116271a5d96e532005fe750e7552a6cbbBehdad Esfahbod else if (unlikely (info.codepoint == 0x200D)) 29792332e5116271a5d96e532005fe750e7552a6cbbBehdad Esfahbod info.indic_category() = OT_ZWJ; 29818c06e189bd078affbb84c3bb5bb80687a227c5eBehdad Esfahbod else if (unlikely (info.codepoint == 0x25CC)) 29918c06e189bd078affbb84c3bb5bb80687a227c5eBehdad Esfahbod info.indic_category() = OT_DOTTEDCIRCLE; 300b9ddbd55930228422e82b34a141ad1b6093f5376Behdad Esfahbod } 301743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod} 302b9ddbd55930228422e82b34a141ad1b6093f5376Behdad Esfahbod 30345d6f29f15f1d2323bcaa2498aed23ff0c8a1567Behdad Esfahbodstatic int 30445d6f29f15f1d2323bcaa2498aed23ff0c8a1567Behdad Esfahbodcompare_indic_order (const hb_glyph_info_t *pa, const hb_glyph_info_t *pb) 30545d6f29f15f1d2323bcaa2498aed23ff0c8a1567Behdad Esfahbod{ 30645d6f29f15f1d2323bcaa2498aed23ff0c8a1567Behdad Esfahbod int a = pa->indic_position(); 30745d6f29f15f1d2323bcaa2498aed23ff0c8a1567Behdad Esfahbod int b = pb->indic_position(); 30845d6f29f15f1d2323bcaa2498aed23ff0c8a1567Behdad Esfahbod 30945d6f29f15f1d2323bcaa2498aed23ff0c8a1567Behdad Esfahbod return a < b ? -1 : a == b ? 0 : +1; 31045d6f29f15f1d2323bcaa2498aed23ff0c8a1567Behdad Esfahbod} 311867361c3ad39629a8d5b7dc48d558a1c19e37d43Behdad Esfahbod 3127ea58db311bfb0d8f804d1e9f4a1f004bd45075aBehdad Esfahbod/* Rules from: 3137ea58db311bfb0d8f804d1e9f4a1f004bd45075aBehdad Esfahbod * https://www.microsoft.com/typography/otfntdev/devanot/shaping.aspx */ 3147ea58db311bfb0d8f804d1e9f4a1f004bd45075aBehdad Esfahbod 315743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbodstatic void 31670fe77bb9a25922bd34f206826d8731d901fb451Behdad Esfahbodinitial_reordering_consonant_syllable (const hb_ot_map_t *map, hb_buffer_t *buffer, hb_mask_t *basic_mask_array, 317ef24cc8c8e2478a6352c340f4611a617646de4ccBehdad Esfahbod unsigned int start, unsigned int end) 318743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod{ 319ee58f3bc75d2d071a71b94063bf12205a5871acbBehdad Esfahbod hb_glyph_info_t *info = buffer->info; 320743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod 321617f4ac46f1084859d2034c08760e31e52d3bec3Behdad Esfahbod 322743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod /* 1. Find base consonant: 323743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod * 324743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod * The shaping engine finds the base consonant of the syllable, using the 325743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod * following algorithm: starting from the end of the syllable, move backwards 326743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod * until a consonant is found that does not have a below-base or post-base 327743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod * form (post-base forms have to follow below-base forms), or that is not a 328743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod * pre-base reordering Ra, or arrive at the first consonant. The consonant 329743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod * stopped at will be the base. 330743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod * 331743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod * o If the syllable starts with Ra + Halant (in a script that has Reph) 332743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod * and has more than one consonant, Ra is excluded from candidates for 333743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod * base consonants. 334743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod */ 335743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod 3365e72071062c015237b79fbd0521341a63166a204Behdad Esfahbod unsigned int base = end; 33776b3409de6887c1cdd5c679939497b1b56f4554bBehdad Esfahbod bool has_reph = false; 338743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod 33976b3409de6887c1cdd5c679939497b1b56f4554bBehdad Esfahbod { 340617f4ac46f1084859d2034c08760e31e52d3bec3Behdad Esfahbod /* -> If the syllable starts with Ra + Halant (in a script that has Reph) 341617f4ac46f1084859d2034c08760e31e52d3bec3Behdad Esfahbod * and has more than one consonant, Ra is excluded from candidates for 342617f4ac46f1084859d2034c08760e31e52d3bec3Behdad Esfahbod * base consonants. */ 343617f4ac46f1084859d2034c08760e31e52d3bec3Behdad Esfahbod unsigned int limit = start; 34470fe77bb9a25922bd34f206826d8731d901fb451Behdad Esfahbod if (basic_mask_array[RPHF] && 345617f4ac46f1084859d2034c08760e31e52d3bec3Behdad Esfahbod start + 3 <= end && 346617f4ac46f1084859d2034c08760e31e52d3bec3Behdad Esfahbod info[start].indic_category() == OT_Ra && 347617f4ac46f1084859d2034c08760e31e52d3bec3Behdad Esfahbod info[start + 1].indic_category() == OT_H && 348617f4ac46f1084859d2034c08760e31e52d3bec3Behdad Esfahbod !is_joiner (info[start + 2])) 349617f4ac46f1084859d2034c08760e31e52d3bec3Behdad Esfahbod { 350617f4ac46f1084859d2034c08760e31e52d3bec3Behdad Esfahbod limit += 2; 351617f4ac46f1084859d2034c08760e31e52d3bec3Behdad Esfahbod base = start; 352617f4ac46f1084859d2034c08760e31e52d3bec3Behdad Esfahbod has_reph = true; 353617f4ac46f1084859d2034c08760e31e52d3bec3Behdad Esfahbod }; 35476b3409de6887c1cdd5c679939497b1b56f4554bBehdad Esfahbod 3553c2ea9481b1028e927e615a5434ebf8edcb5f891Behdad Esfahbod /* -> starting from the end of the syllable, move backwards */ 3563c2ea9481b1028e927e615a5434ebf8edcb5f891Behdad Esfahbod unsigned int i = end; 3573c2ea9481b1028e927e615a5434ebf8edcb5f891Behdad Esfahbod do { 3583c2ea9481b1028e927e615a5434ebf8edcb5f891Behdad Esfahbod i--; 3593c2ea9481b1028e927e615a5434ebf8edcb5f891Behdad Esfahbod /* -> until a consonant is found */ 3603c2ea9481b1028e927e615a5434ebf8edcb5f891Behdad Esfahbod if (is_consonant (info[i])) 361743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod { 3623c2ea9481b1028e927e615a5434ebf8edcb5f891Behdad Esfahbod /* -> that does not have a below-base or post-base form 3633c2ea9481b1028e927e615a5434ebf8edcb5f891Behdad Esfahbod * (post-base forms have to follow below-base forms), */ 3643c2ea9481b1028e927e615a5434ebf8edcb5f891Behdad Esfahbod if (info[i].indic_position() != POS_BELOW_C && 3653c2ea9481b1028e927e615a5434ebf8edcb5f891Behdad Esfahbod info[i].indic_position() != POS_POST_C) 3663c2ea9481b1028e927e615a5434ebf8edcb5f891Behdad Esfahbod { 3673c2ea9481b1028e927e615a5434ebf8edcb5f891Behdad Esfahbod base = i; 3683c2ea9481b1028e927e615a5434ebf8edcb5f891Behdad Esfahbod break; 3693c2ea9481b1028e927e615a5434ebf8edcb5f891Behdad Esfahbod } 370743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod 3713c2ea9481b1028e927e615a5434ebf8edcb5f891Behdad Esfahbod /* -> or that is not a pre-base reordering Ra, 3723c2ea9481b1028e927e615a5434ebf8edcb5f891Behdad Esfahbod * 3733c2ea9481b1028e927e615a5434ebf8edcb5f891Behdad Esfahbod * TODO 3743c2ea9481b1028e927e615a5434ebf8edcb5f891Behdad Esfahbod */ 375e7be05702447ae270d797398132c1930cd3a9b86Behdad Esfahbod 3763c2ea9481b1028e927e615a5434ebf8edcb5f891Behdad Esfahbod /* -> or arrive at the first consonant. The consonant stopped at will 3773c2ea9481b1028e927e615a5434ebf8edcb5f891Behdad Esfahbod * be the base. */ 3783c2ea9481b1028e927e615a5434ebf8edcb5f891Behdad Esfahbod base = i; 3793c2ea9481b1028e927e615a5434ebf8edcb5f891Behdad Esfahbod } 3803c2ea9481b1028e927e615a5434ebf8edcb5f891Behdad Esfahbod else 3813c2ea9481b1028e927e615a5434ebf8edcb5f891Behdad Esfahbod if (is_joiner (info[i])) 3823c2ea9481b1028e927e615a5434ebf8edcb5f891Behdad Esfahbod break; 3833c2ea9481b1028e927e615a5434ebf8edcb5f891Behdad Esfahbod } while (i > limit); 3843c2ea9481b1028e927e615a5434ebf8edcb5f891Behdad Esfahbod if (base < start) 3853c2ea9481b1028e927e615a5434ebf8edcb5f891Behdad Esfahbod base = start; /* Just in case... */ 386743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod 387617f4ac46f1084859d2034c08760e31e52d3bec3Behdad Esfahbod 388617f4ac46f1084859d2034c08760e31e52d3bec3Behdad Esfahbod /* -> If the syllable starts with Ra + Halant (in a script that has Reph) 389617f4ac46f1084859d2034c08760e31e52d3bec3Behdad Esfahbod * and has more than one consonant, Ra is excluded from candidates for 390617f4ac46f1084859d2034c08760e31e52d3bec3Behdad Esfahbod * base consonants. */ 391617f4ac46f1084859d2034c08760e31e52d3bec3Behdad Esfahbod if (has_reph && base == start) { 392617f4ac46f1084859d2034c08760e31e52d3bec3Behdad Esfahbod /* Have no other consonant, so Reph is not formed and Ra becomes base. */ 393617f4ac46f1084859d2034c08760e31e52d3bec3Behdad Esfahbod has_reph = false; 394617f4ac46f1084859d2034c08760e31e52d3bec3Behdad Esfahbod } 3955e4e21fce4b548b0b8a5951bc8f35a9f27428192Behdad Esfahbod } 3963d25079f8d6be81b9b4b91d3a97016b8a572f571Behdad Esfahbod 3973d25079f8d6be81b9b4b91d3a97016b8a572f571Behdad Esfahbod 398743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod /* 2. Decompose and reorder Matras: 399743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod * 400743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod * Each matra and any syllable modifier sign in the cluster are moved to the 401743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod * appropriate position relative to the consonant(s) in the cluster. The 402743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod * shaping engine decomposes two- or three-part matras into their constituent 403743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod * parts before any repositioning. Matra characters are classified by which 404743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod * consonant in a conjunct they have affinity for and are reordered to the 405743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod * following positions: 406743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod * 407743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod * o Before first half form in the syllable 408743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod * o After subjoined consonants 409743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod * o After post-form consonant 410743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod * o After main consonant (for above marks) 411743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod * 412743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod * IMPLEMENTATION NOTES: 413743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod * 414743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod * The normalize() routine has already decomposed matras for us, so we don't 415743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod * need to worry about that. 416743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod */ 417743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod 418743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod 419743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod /* 3. Reorder marks to canonical order: 420743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod * 421743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod * Adjacent nukta and halant or nukta and vedic sign are always repositioned 422743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod * if necessary, so that the nukta is first. 423743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod * 424743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod * IMPLEMENTATION NOTES: 425743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod * 426743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod * We don't need to do this: the normalize() routine already did this for us. 427743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod */ 428743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod 429743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod 43045d6f29f15f1d2323bcaa2498aed23ff0c8a1567Behdad Esfahbod /* Reorder characters */ 43145d6f29f15f1d2323bcaa2498aed23ff0c8a1567Behdad Esfahbod 4323c2ea9481b1028e927e615a5434ebf8edcb5f891Behdad Esfahbod for (unsigned int i = start; i < base; i++) 433dbccf87eef0d26838fa4bb3ae26410f6c4818836Behdad Esfahbod info[i].indic_position() = POS_PRE_C; 43455f70ebfb95083f515d9b0044a2a65ab11484bb5Behdad Esfahbod 435dbccf87eef0d26838fa4bb3ae26410f6c4818836Behdad Esfahbod info[base].indic_position() = POS_BASE_C; 43645d6f29f15f1d2323bcaa2498aed23ff0c8a1567Behdad Esfahbod 43755f70ebfb95083f515d9b0044a2a65ab11484bb5Behdad Esfahbod /* Mark final consonants. A final consonant is one appearing after a matra, 43855f70ebfb95083f515d9b0044a2a65ab11484bb5Behdad Esfahbod * like in Khmer. */ 43955f70ebfb95083f515d9b0044a2a65ab11484bb5Behdad Esfahbod for (unsigned int i = base + 1; i < end; i++) 44055f70ebfb95083f515d9b0044a2a65ab11484bb5Behdad Esfahbod if (info[i].indic_category() == OT_M) { 44155f70ebfb95083f515d9b0044a2a65ab11484bb5Behdad Esfahbod for (unsigned int j = i + 1; j < end; j++) 44255f70ebfb95083f515d9b0044a2a65ab11484bb5Behdad Esfahbod if (is_consonant (info[j])) { 44355f70ebfb95083f515d9b0044a2a65ab11484bb5Behdad Esfahbod info[j].indic_position() = POS_FINAL_C; 44455f70ebfb95083f515d9b0044a2a65ab11484bb5Behdad Esfahbod break; 44555f70ebfb95083f515d9b0044a2a65ab11484bb5Behdad Esfahbod } 44655f70ebfb95083f515d9b0044a2a65ab11484bb5Behdad Esfahbod break; 44755f70ebfb95083f515d9b0044a2a65ab11484bb5Behdad Esfahbod } 44855f70ebfb95083f515d9b0044a2a65ab11484bb5Behdad Esfahbod 449fd06bf56110e73826b3d5c73ac964e2609450d46Behdad Esfahbod /* Handle beginning Ra */ 4505e4e21fce4b548b0b8a5951bc8f35a9f27428192Behdad Esfahbod if (has_reph) 451dbb105883c6e9b83e78dc8b10766cd56b98cd7e1Behdad Esfahbod info[start].indic_position() = POS_RA_TO_BECOME_REPH; 452fd06bf56110e73826b3d5c73ac964e2609450d46Behdad Esfahbod 453f5bc2725cb892264ba223e0a49f7fd2c622a0730Behdad Esfahbod /* For old-style Indic script tags, move the first post-base Halant after 454f5bc2725cb892264ba223e0a49f7fd2c622a0730Behdad Esfahbod * last consonant. */ 455a3e04bee2c2fa648759a87e460db6b4f1b685586Behdad Esfahbod if (IS_OLD_INDIC_TAG (map->get_chosen_script (0))) { 4563c2ea9481b1028e927e615a5434ebf8edcb5f891Behdad Esfahbod for (unsigned int i = base + 1; i < end; i++) 457f5bc2725cb892264ba223e0a49f7fd2c622a0730Behdad Esfahbod if (info[i].indic_category() == OT_H) { 458f5bc2725cb892264ba223e0a49f7fd2c622a0730Behdad Esfahbod unsigned int j; 459f5bc2725cb892264ba223e0a49f7fd2c622a0730Behdad Esfahbod for (j = end - 1; j > i; j--) 460190eb31a16178269aecaf5d2ecc9012f956749f4Behdad Esfahbod if (is_consonant (info[j])) 461f5bc2725cb892264ba223e0a49f7fd2c622a0730Behdad Esfahbod break; 462f5bc2725cb892264ba223e0a49f7fd2c622a0730Behdad Esfahbod if (j > i) { 463f5bc2725cb892264ba223e0a49f7fd2c622a0730Behdad Esfahbod /* Move Halant to after last consonant. */ 464f5bc2725cb892264ba223e0a49f7fd2c622a0730Behdad Esfahbod hb_glyph_info_t t = info[i]; 465f5bc2725cb892264ba223e0a49f7fd2c622a0730Behdad Esfahbod memmove (&info[i], &info[i + 1], (j - i) * sizeof (info[0])); 466f5bc2725cb892264ba223e0a49f7fd2c622a0730Behdad Esfahbod info[j] = t; 467f5bc2725cb892264ba223e0a49f7fd2c622a0730Behdad Esfahbod } 468f5bc2725cb892264ba223e0a49f7fd2c622a0730Behdad Esfahbod break; 469f5bc2725cb892264ba223e0a49f7fd2c622a0730Behdad Esfahbod } 470f5bc2725cb892264ba223e0a49f7fd2c622a0730Behdad Esfahbod } 471f5bc2725cb892264ba223e0a49f7fd2c622a0730Behdad Esfahbod 47245d6f29f15f1d2323bcaa2498aed23ff0c8a1567Behdad Esfahbod /* Attach ZWJ, ZWNJ, nukta, and halant to previous char to move with them. */ 473a2b471df821b32625d127f83b2f90e6d6a967e7eBehdad Esfahbod if (!indic_options ().uniscribe_bug_compatible) 474ebe29733d44fe0fa9fb30f946ab0dd7a40336a24Behdad Esfahbod { 475ebe29733d44fe0fa9fb30f946ab0dd7a40336a24Behdad Esfahbod /* Please update the Uniscribe branch when touching this! */ 476ebe29733d44fe0fa9fb30f946ab0dd7a40336a24Behdad Esfahbod for (unsigned int i = start + 1; i < end; i++) 477ebe29733d44fe0fa9fb30f946ab0dd7a40336a24Behdad Esfahbod if ((FLAG (info[i].indic_category()) & (FLAG (OT_ZWNJ) | FLAG (OT_ZWJ) | FLAG (OT_N) | FLAG (OT_H)))) 478ebe29733d44fe0fa9fb30f946ab0dd7a40336a24Behdad Esfahbod info[i].indic_position() = info[i - 1].indic_position(); 479ebe29733d44fe0fa9fb30f946ab0dd7a40336a24Behdad Esfahbod } else { 48067ea29af49bb08ee679914076808327992cf6676Behdad Esfahbod /* 48167ea29af49bb08ee679914076808327992cf6676Behdad Esfahbod * Uniscribe doesn't move the Halant with Left Matra. 48267ea29af49bb08ee679914076808327992cf6676Behdad Esfahbod * TEST: U+092B,U+093F,U+094DE 48367ea29af49bb08ee679914076808327992cf6676Behdad Esfahbod */ 484ebe29733d44fe0fa9fb30f946ab0dd7a40336a24Behdad Esfahbod /* Please update the non-Uniscribe branch when touching this! */ 485ebe29733d44fe0fa9fb30f946ab0dd7a40336a24Behdad Esfahbod for (unsigned int i = start + 1; i < end; i++) 486ebe29733d44fe0fa9fb30f946ab0dd7a40336a24Behdad Esfahbod if ((FLAG (info[i].indic_category()) & (FLAG (OT_ZWNJ) | FLAG (OT_ZWJ) | FLAG (OT_N) | FLAG (OT_H)))) { 487ebe29733d44fe0fa9fb30f946ab0dd7a40336a24Behdad Esfahbod info[i].indic_position() = info[i - 1].indic_position(); 4886a091df9b403b147ef78f3974610dedf4ce1e08aBehdad Esfahbod if (info[i].indic_category() == OT_H && info[i].indic_position() == POS_PRE_M) 489ebe29733d44fe0fa9fb30f946ab0dd7a40336a24Behdad Esfahbod for (unsigned int j = i; j > start; j--) 4906a091df9b403b147ef78f3974610dedf4ce1e08aBehdad Esfahbod if (info[j - 1].indic_position() != POS_PRE_M) { 491ebe29733d44fe0fa9fb30f946ab0dd7a40336a24Behdad Esfahbod info[i].indic_position() = info[j - 1].indic_position(); 492ebe29733d44fe0fa9fb30f946ab0dd7a40336a24Behdad Esfahbod break; 493ebe29733d44fe0fa9fb30f946ab0dd7a40336a24Behdad Esfahbod } 494ebe29733d44fe0fa9fb30f946ab0dd7a40336a24Behdad Esfahbod } 495ebe29733d44fe0fa9fb30f946ab0dd7a40336a24Behdad Esfahbod } 49674ccc6a1322f8c48c5f2a05f04821783c4b87a14Behdad Esfahbod /* Re-attach ZWJ, ZWNJ, and halant to next char, for after-base consonants. */ 49774ccc6a1322f8c48c5f2a05f04821783c4b87a14Behdad Esfahbod { 49874ccc6a1322f8c48c5f2a05f04821783c4b87a14Behdad Esfahbod unsigned int last_halant = end; 49974ccc6a1322f8c48c5f2a05f04821783c4b87a14Behdad Esfahbod for (unsigned int i = base + 1; i < end; i++) 500deb521dee4fdca8c2124cfb39a205e6269d4a70dBehdad Esfahbod if (is_halant_or_coeng (info[i])) 50174ccc6a1322f8c48c5f2a05f04821783c4b87a14Behdad Esfahbod last_halant = i; 50274ccc6a1322f8c48c5f2a05f04821783c4b87a14Behdad Esfahbod else if (is_consonant (info[i])) { 50374ccc6a1322f8c48c5f2a05f04821783c4b87a14Behdad Esfahbod for (unsigned int j = last_halant; j < i; j++) 50474ccc6a1322f8c48c5f2a05f04821783c4b87a14Behdad Esfahbod info[j].indic_position() = info[i].indic_position(); 50574ccc6a1322f8c48c5f2a05f04821783c4b87a14Behdad Esfahbod } 50674ccc6a1322f8c48c5f2a05f04821783c4b87a14Behdad Esfahbod } 50745d6f29f15f1d2323bcaa2498aed23ff0c8a1567Behdad Esfahbod 50845d6f29f15f1d2323bcaa2498aed23ff0c8a1567Behdad Esfahbod /* We do bubble-sort, skip malicious clusters attempts */ 509b99d63ae114fb58f129562b293a8a66543d499adBehdad Esfahbod if (end - start < 64) 510a391ff50b9a7b6ac3e58d199ea726b20ee6839bbBehdad Esfahbod { 511a391ff50b9a7b6ac3e58d199ea726b20ee6839bbBehdad Esfahbod /* Sit tight, rock 'n roll! */ 512d3637edb248162970e202e9d0671540274192844Behdad Esfahbod hb_bubble_sort (info + start, end - start, compare_indic_order); 513a391ff50b9a7b6ac3e58d199ea726b20ee6839bbBehdad Esfahbod /* Find base again */ 514a391ff50b9a7b6ac3e58d199ea726b20ee6839bbBehdad Esfahbod base = end; 5153c2ea9481b1028e927e615a5434ebf8edcb5f891Behdad Esfahbod for (unsigned int i = start; i < end; i++) 516a391ff50b9a7b6ac3e58d199ea726b20ee6839bbBehdad Esfahbod if (info[i].indic_position() == POS_BASE_C) { 517a391ff50b9a7b6ac3e58d199ea726b20ee6839bbBehdad Esfahbod base = i; 518a391ff50b9a7b6ac3e58d199ea726b20ee6839bbBehdad Esfahbod break; 519a391ff50b9a7b6ac3e58d199ea726b20ee6839bbBehdad Esfahbod } 520a391ff50b9a7b6ac3e58d199ea726b20ee6839bbBehdad Esfahbod } 52145d6f29f15f1d2323bcaa2498aed23ff0c8a1567Behdad Esfahbod 522743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod /* Setup masks now */ 523743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod 524281683995a46ed37aeeb84061249758c59822457Behdad Esfahbod { 525281683995a46ed37aeeb84061249758c59822457Behdad Esfahbod hb_mask_t mask; 526281683995a46ed37aeeb84061249758c59822457Behdad Esfahbod 527dbb105883c6e9b83e78dc8b10766cd56b98cd7e1Behdad Esfahbod /* Reph */ 528668c6046c1b3af3bd316bda0cc8636f2a5e8df42Behdad Esfahbod for (unsigned int i = start; i < end && info[i].indic_position() == POS_RA_TO_BECOME_REPH; i++) 52970fe77bb9a25922bd34f206826d8731d901fb451Behdad Esfahbod info[i].mask |= basic_mask_array[RPHF]; 530dbb105883c6e9b83e78dc8b10766cd56b98cd7e1Behdad Esfahbod 531281683995a46ed37aeeb84061249758c59822457Behdad Esfahbod /* Pre-base */ 53270fe77bb9a25922bd34f206826d8731d901fb451Behdad Esfahbod mask = basic_mask_array[HALF] | basic_mask_array[AKHN] | basic_mask_array[CJCT]; 5333c2ea9481b1028e927e615a5434ebf8edcb5f891Behdad Esfahbod for (unsigned int i = start; i < base; i++) 534281683995a46ed37aeeb84061249758c59822457Behdad Esfahbod info[i].mask |= mask; 535281683995a46ed37aeeb84061249758c59822457Behdad Esfahbod /* Base */ 53670fe77bb9a25922bd34f206826d8731d901fb451Behdad Esfahbod mask = basic_mask_array[AKHN] | basic_mask_array[CJCT]; 537281683995a46ed37aeeb84061249758c59822457Behdad Esfahbod info[base].mask |= mask; 538281683995a46ed37aeeb84061249758c59822457Behdad Esfahbod /* Post-base */ 53970fe77bb9a25922bd34f206826d8731d901fb451Behdad Esfahbod mask = basic_mask_array[BLWF] | basic_mask_array[ABVF] | basic_mask_array[PSTF] | basic_mask_array[CJCT]; 5403c2ea9481b1028e927e615a5434ebf8edcb5f891Behdad Esfahbod for (unsigned int i = base + 1; i < end; i++) 541281683995a46ed37aeeb84061249758c59822457Behdad Esfahbod info[i].mask |= mask; 542281683995a46ed37aeeb84061249758c59822457Behdad Esfahbod } 5439da0487cd452d780673e24329ce03e174a4ef83bBehdad Esfahbod 54417d7de91d76406d3e92db37d9eef2fc615f06e68Behdad Esfahbod /* XXX This will not match for old-Indic spec since the Halant-Ra order is reversed already. */ 5458e7b5882fb4c1921c9d030d354a9b998115cdb8cBehdad Esfahbod if (basic_mask_array[PREF] && base + 3 <= end) 54617d7de91d76406d3e92db37d9eef2fc615f06e68Behdad Esfahbod { 5478e7b5882fb4c1921c9d030d354a9b998115cdb8cBehdad Esfahbod /* Find a Halant,Ra sequence and mark it fore pre-base reordering processing. */ 5488e7b5882fb4c1921c9d030d354a9b998115cdb8cBehdad Esfahbod for (unsigned int i = base + 1; i + 1 < end; i++) 549deb521dee4fdca8c2124cfb39a205e6269d4a70dBehdad Esfahbod if (is_halant_or_coeng (info[i]) && 5508e7b5882fb4c1921c9d030d354a9b998115cdb8cBehdad Esfahbod info[i + 1].indic_category() == OT_Ra) 5518e7b5882fb4c1921c9d030d354a9b998115cdb8cBehdad Esfahbod { 5520201e0a4649ad5b607e50bcb9605e7a5b7143812Behdad Esfahbod info[i++].mask |= basic_mask_array[PREF]; 5530201e0a4649ad5b607e50bcb9605e7a5b7143812Behdad Esfahbod info[i++].mask |= basic_mask_array[PREF]; 5540201e0a4649ad5b607e50bcb9605e7a5b7143812Behdad Esfahbod 5550201e0a4649ad5b607e50bcb9605e7a5b7143812Behdad Esfahbod /* Mark the subsequent stuff with 'cfar'. Used in Khmer. 5560201e0a4649ad5b607e50bcb9605e7a5b7143812Behdad Esfahbod * Read the feature spec. 5570201e0a4649ad5b607e50bcb9605e7a5b7143812Behdad Esfahbod * This allows distinguishing the following cases with MS Khmer fonts: 5580201e0a4649ad5b607e50bcb9605e7a5b7143812Behdad Esfahbod * U+1784,U+17D2,U+179A,U+17D2,U+1782 5590201e0a4649ad5b607e50bcb9605e7a5b7143812Behdad Esfahbod * U+1784,U+17D2,U+1782,U+17D2,U+179A 5600201e0a4649ad5b607e50bcb9605e7a5b7143812Behdad Esfahbod */ 5610201e0a4649ad5b607e50bcb9605e7a5b7143812Behdad Esfahbod for (; i < end; i++) 5620201e0a4649ad5b607e50bcb9605e7a5b7143812Behdad Esfahbod info[i].mask |= basic_mask_array[CFAR]; 5630201e0a4649ad5b607e50bcb9605e7a5b7143812Behdad Esfahbod 5648e7b5882fb4c1921c9d030d354a9b998115cdb8cBehdad Esfahbod break; 5658e7b5882fb4c1921c9d030d354a9b998115cdb8cBehdad Esfahbod } 56617d7de91d76406d3e92db37d9eef2fc615f06e68Behdad Esfahbod } 56717d7de91d76406d3e92db37d9eef2fc615f06e68Behdad Esfahbod 5689da0487cd452d780673e24329ce03e174a4ef83bBehdad Esfahbod /* Apply ZWJ/ZWNJ effects */ 5693c2ea9481b1028e927e615a5434ebf8edcb5f891Behdad Esfahbod for (unsigned int i = start + 1; i < end; i++) 5709da0487cd452d780673e24329ce03e174a4ef83bBehdad Esfahbod if (is_joiner (info[i])) { 5719da0487cd452d780673e24329ce03e174a4ef83bBehdad Esfahbod bool non_joiner = info[i].indic_category() == OT_ZWNJ; 5726b37bc80843e38ca7b62500f95fd70c08af68d62Behdad Esfahbod unsigned int j = i; 5739da0487cd452d780673e24329ce03e174a4ef83bBehdad Esfahbod 5749da0487cd452d780673e24329ce03e174a4ef83bBehdad Esfahbod do { 5759da0487cd452d780673e24329ce03e174a4ef83bBehdad Esfahbod j--; 5766b37bc80843e38ca7b62500f95fd70c08af68d62Behdad Esfahbod 57770fe77bb9a25922bd34f206826d8731d901fb451Behdad Esfahbod info[j].mask &= ~basic_mask_array[CJCT]; 5786b37bc80843e38ca7b62500f95fd70c08af68d62Behdad Esfahbod if (non_joiner) 57970fe77bb9a25922bd34f206826d8731d901fb451Behdad Esfahbod info[j].mask &= ~basic_mask_array[HALF]; 5806b37bc80843e38ca7b62500f95fd70c08af68d62Behdad Esfahbod 5819da0487cd452d780673e24329ce03e174a4ef83bBehdad Esfahbod } while (j > start && !is_consonant (info[j])); 5829da0487cd452d780673e24329ce03e174a4ef83bBehdad Esfahbod } 583743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod} 584743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod 585743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod 586743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbodstatic void 5879f377ed3210fe7d9f15e0c4f82020556f9a8f6f0Behdad Esfahbodinitial_reordering_vowel_syllable (const hb_ot_map_t *map, 5889f377ed3210fe7d9f15e0c4f82020556f9a8f6f0Behdad Esfahbod hb_buffer_t *buffer, 58970fe77bb9a25922bd34f206826d8731d901fb451Behdad Esfahbod hb_mask_t *basic_mask_array, 590ef24cc8c8e2478a6352c340f4611a617646de4ccBehdad Esfahbod unsigned int start, unsigned int end) 591743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod{ 592c5306b6861cfaa50af40e8ceb058791fa06d7981Behdad Esfahbod /* We made the vowels look like consonants. So let's call the consonant logic! */ 59370fe77bb9a25922bd34f206826d8731d901fb451Behdad Esfahbod initial_reordering_consonant_syllable (map, buffer, basic_mask_array, start, end); 594743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod} 595743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod 596743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbodstatic void 5979f377ed3210fe7d9f15e0c4f82020556f9a8f6f0Behdad Esfahbodinitial_reordering_standalone_cluster (const hb_ot_map_t *map, 5989f377ed3210fe7d9f15e0c4f82020556f9a8f6f0Behdad Esfahbod hb_buffer_t *buffer, 59970fe77bb9a25922bd34f206826d8731d901fb451Behdad Esfahbod hb_mask_t *basic_mask_array, 600ef24cc8c8e2478a6352c340f4611a617646de4ccBehdad Esfahbod unsigned int start, unsigned int end) 601743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod{ 60218c06e189bd078affbb84c3bb5bb80687a227c5eBehdad Esfahbod /* We treat NBSP/dotted-circle as if they are consonants, so we should just chain. 60318c06e189bd078affbb84c3bb5bb80687a227c5eBehdad Esfahbod * Only if not in compatibility mode that is... */ 60418c06e189bd078affbb84c3bb5bb80687a227c5eBehdad Esfahbod 605a2b471df821b32625d127f83b2f90e6d6a967e7eBehdad Esfahbod if (indic_options ().uniscribe_bug_compatible) 60618c06e189bd078affbb84c3bb5bb80687a227c5eBehdad Esfahbod { 60718c06e189bd078affbb84c3bb5bb80687a227c5eBehdad Esfahbod /* For dotted-circle, this is what Uniscribe does: 60818c06e189bd078affbb84c3bb5bb80687a227c5eBehdad Esfahbod * If dotted-circle is the last glyph, it just does nothing. 60918c06e189bd078affbb84c3bb5bb80687a227c5eBehdad Esfahbod * Ie. It doesn't form Reph. */ 61018c06e189bd078affbb84c3bb5bb80687a227c5eBehdad Esfahbod if (buffer->info[end - 1].indic_category() == OT_DOTTEDCIRCLE) 61118c06e189bd078affbb84c3bb5bb80687a227c5eBehdad Esfahbod return; 61218c06e189bd078affbb84c3bb5bb80687a227c5eBehdad Esfahbod } 61318c06e189bd078affbb84c3bb5bb80687a227c5eBehdad Esfahbod 61470fe77bb9a25922bd34f206826d8731d901fb451Behdad Esfahbod initial_reordering_consonant_syllable (map, buffer, basic_mask_array, start, end); 615743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod} 616743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod 617743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbodstatic void 6189f377ed3210fe7d9f15e0c4f82020556f9a8f6f0Behdad Esfahbodinitial_reordering_non_indic (const hb_ot_map_t *map HB_UNUSED, 6199f377ed3210fe7d9f15e0c4f82020556f9a8f6f0Behdad Esfahbod hb_buffer_t *buffer HB_UNUSED, 62070fe77bb9a25922bd34f206826d8731d901fb451Behdad Esfahbod hb_mask_t *basic_mask_array HB_UNUSED, 6213f18236a03880c0960f5990dc90685f6146951a6Behdad Esfahbod unsigned int start HB_UNUSED, unsigned int end HB_UNUSED) 622743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod{ 623743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod /* Nothing to do right now. If we ever switch to using the output 624743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod * buffer in the reordering process, we'd need to next_glyph() here. */ 625743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod} 626743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod 627743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod#include "hb-ot-shape-complex-indic-machine.hh" 628743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod 629743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbodstatic void 630743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbodinitial_reordering (const hb_ot_map_t *map, 6313f18236a03880c0960f5990dc90685f6146951a6Behdad Esfahbod hb_face_t *face HB_UNUSED, 632743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod hb_buffer_t *buffer, 633743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod void *user_data HB_UNUSED) 634743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod{ 63570fe77bb9a25922bd34f206826d8731d901fb451Behdad Esfahbod hb_mask_t basic_mask_array[ARRAY_LENGTH (indic_basic_features)] = {0}; 636b9ddbd55930228422e82b34a141ad1b6093f5376Behdad Esfahbod unsigned int num_masks = ARRAY_LENGTH (indic_basic_features); 637b9ddbd55930228422e82b34a141ad1b6093f5376Behdad Esfahbod for (unsigned int i = 0; i < num_masks; i++) 63870fe77bb9a25922bd34f206826d8731d901fb451Behdad Esfahbod basic_mask_array[i] = map->get_1_mask (indic_basic_features[i].tag); 639743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod 64070fe77bb9a25922bd34f206826d8731d901fb451Behdad Esfahbod find_syllables (map, buffer, basic_mask_array); 641b9ddbd55930228422e82b34a141ad1b6093f5376Behdad Esfahbod} 642b9ddbd55930228422e82b34a141ad1b6093f5376Behdad Esfahbod 643743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbodstatic void 64446e645ec4b59f0a278347be11f40c7df700d5bb6Behdad Esfahbodfinal_reordering_syllable (hb_buffer_t *buffer, 64546e645ec4b59f0a278347be11f40c7df700d5bb6Behdad Esfahbod hb_mask_t init_mask, hb_mask_t pref_mask, 646ef24cc8c8e2478a6352c340f4611a617646de4ccBehdad Esfahbod unsigned int start, unsigned int end) 647743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod{ 6484ac9e98d9d2ea973dd612dc4063cf78496c643a0Behdad Esfahbod hb_glyph_info_t *info = buffer->info; 6494ac9e98d9d2ea973dd612dc4063cf78496c643a0Behdad Esfahbod 650e7be05702447ae270d797398132c1930cd3a9b86Behdad Esfahbod /* 4. Final reordering: 651e7be05702447ae270d797398132c1930cd3a9b86Behdad Esfahbod * 652e7be05702447ae270d797398132c1930cd3a9b86Behdad Esfahbod * After the localized forms and basic shaping forms GSUB features have been 653e7be05702447ae270d797398132c1930cd3a9b86Behdad Esfahbod * applied (see below), the shaping engine performs some final glyph 654e7be05702447ae270d797398132c1930cd3a9b86Behdad Esfahbod * reordering before applying all the remaining font features to the entire 655e7be05702447ae270d797398132c1930cd3a9b86Behdad Esfahbod * cluster. 6564ac9e98d9d2ea973dd612dc4063cf78496c643a0Behdad Esfahbod */ 6574ac9e98d9d2ea973dd612dc4063cf78496c643a0Behdad Esfahbod 6584ac9e98d9d2ea973dd612dc4063cf78496c643a0Behdad Esfahbod /* Find base again */ 6594ac9e98d9d2ea973dd612dc4063cf78496c643a0Behdad Esfahbod unsigned int base = end; 6604ac9e98d9d2ea973dd612dc4063cf78496c643a0Behdad Esfahbod for (unsigned int i = start; i < end; i++) 6614ac9e98d9d2ea973dd612dc4063cf78496c643a0Behdad Esfahbod if (info[i].indic_position() == POS_BASE_C) { 6624ac9e98d9d2ea973dd612dc4063cf78496c643a0Behdad Esfahbod base = i; 6634ac9e98d9d2ea973dd612dc4063cf78496c643a0Behdad Esfahbod break; 6644ac9e98d9d2ea973dd612dc4063cf78496c643a0Behdad Esfahbod } 6654ac9e98d9d2ea973dd612dc4063cf78496c643a0Behdad Esfahbod 6664705a7026900e51f6430f03a73c87f2df035df92Behdad Esfahbod unsigned int start_of_last_cluster = base; 6674705a7026900e51f6430f03a73c87f2df035df92Behdad Esfahbod 6684ac9e98d9d2ea973dd612dc4063cf78496c643a0Behdad Esfahbod /* o Reorder matras: 669e7be05702447ae270d797398132c1930cd3a9b86Behdad Esfahbod * 670e7be05702447ae270d797398132c1930cd3a9b86Behdad Esfahbod * If a pre-base matra character had been reordered before applying basic 671e7be05702447ae270d797398132c1930cd3a9b86Behdad Esfahbod * features, the glyph can be moved closer to the main consonant based on 672e7be05702447ae270d797398132c1930cd3a9b86Behdad Esfahbod * whether half-forms had been formed. Actual position for the matra is 673e7be05702447ae270d797398132c1930cd3a9b86Behdad Esfahbod * defined as “after last standalone halant glyph, after initial matra 674e7be05702447ae270d797398132c1930cd3a9b86Behdad Esfahbod * position and before the main consonant”. If ZWJ or ZWNJ follow this 675e7be05702447ae270d797398132c1930cd3a9b86Behdad Esfahbod * halant, position is moved after it. 6764ac9e98d9d2ea973dd612dc4063cf78496c643a0Behdad Esfahbod */ 6774ac9e98d9d2ea973dd612dc4063cf78496c643a0Behdad Esfahbod 678362d3db8d3527d0fef260a17d2466e92a4a25425Behdad Esfahbod if (start < base) /* Otherwise there can't be any pre-base matra characters. */ 6799d0d319a4a7e85d922e58fade0f40caae1c9f109Behdad Esfahbod { 680921ce5b17daf06af8e17989a3e335b9f5df20483Behdad Esfahbod unsigned int new_pos = base - 1; 681921ce5b17daf06af8e17989a3e335b9f5df20483Behdad Esfahbod while (new_pos > start && 682deb521dee4fdca8c2124cfb39a205e6269d4a70dBehdad Esfahbod !(FLAG (info[new_pos].indic_category()) & (FLAG (OT_M) | FLAG (OT_H) | FLAG (OT_Coeng)))) 683921ce5b17daf06af8e17989a3e335b9f5df20483Behdad Esfahbod new_pos--; 6849d0d319a4a7e85d922e58fade0f40caae1c9f109Behdad Esfahbod /* If we found no Halant we are done. Otherwise only proceed if the Halant does 6859d0d319a4a7e85d922e58fade0f40caae1c9f109Behdad Esfahbod * not belong to the Matra itself! */ 686deb521dee4fdca8c2124cfb39a205e6269d4a70dBehdad Esfahbod if (is_halant_or_coeng (info[new_pos]) && 687921ce5b17daf06af8e17989a3e335b9f5df20483Behdad Esfahbod info[new_pos].indic_position() != POS_PRE_M) { 6889d0d319a4a7e85d922e58fade0f40caae1c9f109Behdad Esfahbod /* -> If ZWJ or ZWNJ follow this halant, position is moved after it. */ 689921ce5b17daf06af8e17989a3e335b9f5df20483Behdad Esfahbod if (new_pos + 1 < end && is_joiner (info[new_pos + 1])) 690921ce5b17daf06af8e17989a3e335b9f5df20483Behdad Esfahbod new_pos++; 6919d0d319a4a7e85d922e58fade0f40caae1c9f109Behdad Esfahbod 6929d0d319a4a7e85d922e58fade0f40caae1c9f109Behdad Esfahbod /* Now go see if there's actually any matras... */ 693921ce5b17daf06af8e17989a3e335b9f5df20483Behdad Esfahbod for (unsigned int i = new_pos; i > start; i--) 6946a091df9b403b147ef78f3974610dedf4ce1e08aBehdad Esfahbod if (info[i - 1].indic_position () == POS_PRE_M) 6959d0d319a4a7e85d922e58fade0f40caae1c9f109Behdad Esfahbod { 6961a1dbe9a2787f226f3e43063da8eb6633438b0a0Behdad Esfahbod unsigned int old_pos = i - 1; 6971a1dbe9a2787f226f3e43063da8eb6633438b0a0Behdad Esfahbod hb_glyph_info_t tmp = info[old_pos]; 6981a1dbe9a2787f226f3e43063da8eb6633438b0a0Behdad Esfahbod memmove (&info[old_pos], &info[old_pos + 1], (new_pos - old_pos) * sizeof (info[0])); 6991a1dbe9a2787f226f3e43063da8eb6633438b0a0Behdad Esfahbod info[new_pos] = tmp; 700921ce5b17daf06af8e17989a3e335b9f5df20483Behdad Esfahbod start_of_last_cluster = MIN (new_pos, start_of_last_cluster); 701921ce5b17daf06af8e17989a3e335b9f5df20483Behdad Esfahbod new_pos--; 7029d0d319a4a7e85d922e58fade0f40caae1c9f109Behdad Esfahbod } 7039d0d319a4a7e85d922e58fade0f40caae1c9f109Behdad Esfahbod } 7044ac9e98d9d2ea973dd612dc4063cf78496c643a0Behdad Esfahbod } 7054ac9e98d9d2ea973dd612dc4063cf78496c643a0Behdad Esfahbod 7064ac9e98d9d2ea973dd612dc4063cf78496c643a0Behdad Esfahbod 7074ac9e98d9d2ea973dd612dc4063cf78496c643a0Behdad Esfahbod /* o Reorder reph: 708e7be05702447ae270d797398132c1930cd3a9b86Behdad Esfahbod * 709e7be05702447ae270d797398132c1930cd3a9b86Behdad Esfahbod * Reph’s original position is always at the beginning of the syllable, 710e7be05702447ae270d797398132c1930cd3a9b86Behdad Esfahbod * (i.e. it is not reordered at the character reordering stage). However, 711e7be05702447ae270d797398132c1930cd3a9b86Behdad Esfahbod * it will be reordered according to the basic-forms shaping results. 712e7be05702447ae270d797398132c1930cd3a9b86Behdad Esfahbod * Possible positions for reph, depending on the script, are; after main, 713e7be05702447ae270d797398132c1930cd3a9b86Behdad Esfahbod * before post-base consonant forms, and after post-base consonant forms. 714dbb105883c6e9b83e78dc8b10766cd56b98cd7e1Behdad Esfahbod */ 715dbb105883c6e9b83e78dc8b10766cd56b98cd7e1Behdad Esfahbod 716dbb105883c6e9b83e78dc8b10766cd56b98cd7e1Behdad Esfahbod /* If there's anything after the Ra that has the REPH pos, it ought to be halant. 717dbb105883c6e9b83e78dc8b10766cd56b98cd7e1Behdad Esfahbod * Which means that the font has failed to ligate the Reph. In which case, we 718dbb105883c6e9b83e78dc8b10766cd56b98cd7e1Behdad Esfahbod * shouldn't move. */ 719dbb105883c6e9b83e78dc8b10766cd56b98cd7e1Behdad Esfahbod if (start + 1 < end && 720dbb105883c6e9b83e78dc8b10766cd56b98cd7e1Behdad Esfahbod info[start].indic_position() == POS_RA_TO_BECOME_REPH && 721dbb105883c6e9b83e78dc8b10766cd56b98cd7e1Behdad Esfahbod info[start + 1].indic_position() != POS_RA_TO_BECOME_REPH) 722dbb105883c6e9b83e78dc8b10766cd56b98cd7e1Behdad Esfahbod { 72302b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod unsigned int new_reph_pos; 72402b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod 72502b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod enum reph_position_t { 726f89367251109af235f4f0446c13c261a5a4a6f72Behdad Esfahbod REPH_AFTER_MAIN, 727f89367251109af235f4f0446c13c261a5a4a6f72Behdad Esfahbod REPH_BEFORE_SUBSCRIPT, 728f89367251109af235f4f0446c13c261a5a4a6f72Behdad Esfahbod REPH_AFTER_SUBSCRIPT, 729f89367251109af235f4f0446c13c261a5a4a6f72Behdad Esfahbod REPH_BEFORE_POSTSCRIPT, 7309fc7a11469113d31d8095757c4fc038c3427d44aBehdad Esfahbod REPH_AFTER_POSTSCRIPT 731f89367251109af235f4f0446c13c261a5a4a6f72Behdad Esfahbod } reph_pos; 732f89367251109af235f4f0446c13c261a5a4a6f72Behdad Esfahbod 733f89367251109af235f4f0446c13c261a5a4a6f72Behdad Esfahbod /* XXX Figure out old behavior too */ 7347f852b644b8143492a02edfc853114aaa23446bdBehdad Esfahbod switch ((hb_tag_t) buffer->props.script) 735f89367251109af235f4f0446c13c261a5a4a6f72Behdad Esfahbod { 736f89367251109af235f4f0446c13c261a5a4a6f72Behdad Esfahbod case HB_SCRIPT_MALAYALAM: 737f89367251109af235f4f0446c13c261a5a4a6f72Behdad Esfahbod case HB_SCRIPT_ORIYA: 738f89367251109af235f4f0446c13c261a5a4a6f72Behdad Esfahbod reph_pos = REPH_AFTER_MAIN; 739f89367251109af235f4f0446c13c261a5a4a6f72Behdad Esfahbod break; 740f89367251109af235f4f0446c13c261a5a4a6f72Behdad Esfahbod 741f89367251109af235f4f0446c13c261a5a4a6f72Behdad Esfahbod case HB_SCRIPT_GURMUKHI: 742f89367251109af235f4f0446c13c261a5a4a6f72Behdad Esfahbod reph_pos = REPH_BEFORE_SUBSCRIPT; 743f89367251109af235f4f0446c13c261a5a4a6f72Behdad Esfahbod break; 744f89367251109af235f4f0446c13c261a5a4a6f72Behdad Esfahbod 745f89367251109af235f4f0446c13c261a5a4a6f72Behdad Esfahbod case HB_SCRIPT_BENGALI: 746f89367251109af235f4f0446c13c261a5a4a6f72Behdad Esfahbod reph_pos = REPH_AFTER_SUBSCRIPT; 747f89367251109af235f4f0446c13c261a5a4a6f72Behdad Esfahbod break; 748f89367251109af235f4f0446c13c261a5a4a6f72Behdad Esfahbod 749f89367251109af235f4f0446c13c261a5a4a6f72Behdad Esfahbod default: 750f89367251109af235f4f0446c13c261a5a4a6f72Behdad Esfahbod case HB_SCRIPT_DEVANAGARI: 751f89367251109af235f4f0446c13c261a5a4a6f72Behdad Esfahbod case HB_SCRIPT_GUJARATI: 752f89367251109af235f4f0446c13c261a5a4a6f72Behdad Esfahbod reph_pos = REPH_BEFORE_POSTSCRIPT; 753f89367251109af235f4f0446c13c261a5a4a6f72Behdad Esfahbod break; 754f89367251109af235f4f0446c13c261a5a4a6f72Behdad Esfahbod 755f89367251109af235f4f0446c13c261a5a4a6f72Behdad Esfahbod case HB_SCRIPT_KANNADA: 756f89367251109af235f4f0446c13c261a5a4a6f72Behdad Esfahbod case HB_SCRIPT_TAMIL: 757f89367251109af235f4f0446c13c261a5a4a6f72Behdad Esfahbod case HB_SCRIPT_TELUGU: 758f89367251109af235f4f0446c13c261a5a4a6f72Behdad Esfahbod reph_pos = REPH_AFTER_POSTSCRIPT; 759f89367251109af235f4f0446c13c261a5a4a6f72Behdad Esfahbod break; 760f89367251109af235f4f0446c13c261a5a4a6f72Behdad Esfahbod } 76102b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod 762dbb105883c6e9b83e78dc8b10766cd56b98cd7e1Behdad Esfahbod /* 1. If reph should be positioned after post-base consonant forms, 763dbb105883c6e9b83e78dc8b10766cd56b98cd7e1Behdad Esfahbod * proceed to step 5. 76402b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod */ 7659d0d319a4a7e85d922e58fade0f40caae1c9f109Behdad Esfahbod if (reph_pos == REPH_AFTER_POSTSCRIPT) 76602b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod { 7679d0d319a4a7e85d922e58fade0f40caae1c9f109Behdad Esfahbod goto reph_step_5; 76802b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod } 76902b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod 77002b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod /* 2. If the reph repositioning class is not after post-base: target 771dbb105883c6e9b83e78dc8b10766cd56b98cd7e1Behdad Esfahbod * position is after the first explicit halant glyph between the 772dbb105883c6e9b83e78dc8b10766cd56b98cd7e1Behdad Esfahbod * first post-reph consonant and last main consonant. If ZWJ or ZWNJ 773dbb105883c6e9b83e78dc8b10766cd56b98cd7e1Behdad Esfahbod * are following this halant, position is moved after it. If such 774dbb105883c6e9b83e78dc8b10766cd56b98cd7e1Behdad Esfahbod * position is found, this is the target position. Otherwise, 775dbb105883c6e9b83e78dc8b10766cd56b98cd7e1Behdad Esfahbod * proceed to the next step. 776dbb105883c6e9b83e78dc8b10766cd56b98cd7e1Behdad Esfahbod * 777dbb105883c6e9b83e78dc8b10766cd56b98cd7e1Behdad Esfahbod * Note: in old-implementation fonts, where classifications were 778dbb105883c6e9b83e78dc8b10766cd56b98cd7e1Behdad Esfahbod * fixed in shaping engine, there was no case where reph position 779dbb105883c6e9b83e78dc8b10766cd56b98cd7e1Behdad Esfahbod * will be found on this step. 78002b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod */ 78102b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod { 78202b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod new_reph_pos = start + 1; 783deb521dee4fdca8c2124cfb39a205e6269d4a70dBehdad Esfahbod while (new_reph_pos < base && !is_halant_or_coeng (info[new_reph_pos])) 78402b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod new_reph_pos++; 78502b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod 786deb521dee4fdca8c2124cfb39a205e6269d4a70dBehdad Esfahbod if (new_reph_pos < base && is_halant_or_coeng (info[new_reph_pos])) { 78702b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod /* ->If ZWJ or ZWNJ are following this halant, position is moved after it. */ 78802b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod if (new_reph_pos + 1 < base && is_joiner (info[new_reph_pos + 1])) 78902b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod new_reph_pos++; 79002b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod goto reph_move; 79102b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod } 79202b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod } 79302b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod 79402b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod /* 3. If reph should be repositioned after the main consonant: find the 795dbb105883c6e9b83e78dc8b10766cd56b98cd7e1Behdad Esfahbod * first consonant not ligated with main, or find the first 796dbb105883c6e9b83e78dc8b10766cd56b98cd7e1Behdad Esfahbod * consonant that is not a potential pre-base reordering Ra. 79702b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod */ 7989d0d319a4a7e85d922e58fade0f40caae1c9f109Behdad Esfahbod if (reph_pos == REPH_AFTER_MAIN) 79902b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod { 800b504e060f008e95b1ba36c06600c9fea4f5d4808Behdad Esfahbod new_reph_pos = base; 801b504e060f008e95b1ba36c06600c9fea4f5d4808Behdad Esfahbod /* XXX Skip potential pre-base reordering Ra. */ 802b504e060f008e95b1ba36c06600c9fea4f5d4808Behdad Esfahbod while (new_reph_pos < end && 803b504e060f008e95b1ba36c06600c9fea4f5d4808Behdad Esfahbod !( FLAG (info[new_reph_pos + 1].indic_position()) & (FLAG (POS_BELOW_C) | FLAG (POS_POST_C) | FLAG (POS_POST_M) | FLAG (POS_SMVD)))) 804b504e060f008e95b1ba36c06600c9fea4f5d4808Behdad Esfahbod new_reph_pos++; 805b504e060f008e95b1ba36c06600c9fea4f5d4808Behdad Esfahbod if (new_reph_pos < end) 806b504e060f008e95b1ba36c06600c9fea4f5d4808Behdad Esfahbod goto reph_move; 80702b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod } 80802b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod 80902b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod /* 4. If reph should be positioned before post-base consonant, find 810dbb105883c6e9b83e78dc8b10766cd56b98cd7e1Behdad Esfahbod * first post-base classified consonant not ligated with main. If no 811dbb105883c6e9b83e78dc8b10766cd56b98cd7e1Behdad Esfahbod * consonant is found, the target position should be before the 812dbb105883c6e9b83e78dc8b10766cd56b98cd7e1Behdad Esfahbod * first matra, syllable modifier sign or vedic sign. 81302b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod */ 8149d0d319a4a7e85d922e58fade0f40caae1c9f109Behdad Esfahbod /* This is our take on what step 4 is trying to say (and failing, BADLY). */ 8159d0d319a4a7e85d922e58fade0f40caae1c9f109Behdad Esfahbod if (reph_pos == REPH_AFTER_SUBSCRIPT) 81602b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod { 8179d0d319a4a7e85d922e58fade0f40caae1c9f109Behdad Esfahbod new_reph_pos = base; 8189d0d319a4a7e85d922e58fade0f40caae1c9f109Behdad Esfahbod while (new_reph_pos < end && 8196a091df9b403b147ef78f3974610dedf4ce1e08aBehdad Esfahbod !( FLAG (info[new_reph_pos + 1].indic_position()) & (FLAG (POS_POST_C) | FLAG (POS_POST_M) | FLAG (POS_SMVD)))) 8209d0d319a4a7e85d922e58fade0f40caae1c9f109Behdad Esfahbod new_reph_pos++; 8219d0d319a4a7e85d922e58fade0f40caae1c9f109Behdad Esfahbod if (new_reph_pos < end) 8229d0d319a4a7e85d922e58fade0f40caae1c9f109Behdad Esfahbod goto reph_move; 82302b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod } 82402b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod 82502b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod /* 5. If no consonant is found in steps 3 or 4, move reph to a position 826dbb105883c6e9b83e78dc8b10766cd56b98cd7e1Behdad Esfahbod * immediately before the first post-base matra, syllable modifier 827dbb105883c6e9b83e78dc8b10766cd56b98cd7e1Behdad Esfahbod * sign or vedic sign that has a reordering class after the intended 828dbb105883c6e9b83e78dc8b10766cd56b98cd7e1Behdad Esfahbod * reph position. For example, if the reordering position for reph 829dbb105883c6e9b83e78dc8b10766cd56b98cd7e1Behdad Esfahbod * is post-main, it will skip above-base matras that also have a 830dbb105883c6e9b83e78dc8b10766cd56b98cd7e1Behdad Esfahbod * post-main position. 831dbb105883c6e9b83e78dc8b10766cd56b98cd7e1Behdad Esfahbod */ 83202b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod reph_step_5: 83302b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod { 83402b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod /* XXX */ 83502b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod } 836dbb105883c6e9b83e78dc8b10766cd56b98cd7e1Behdad Esfahbod 83702b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod /* 6. Otherwise, reorder reph to the end of the syllable. 83802b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod */ 83902b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod { 84002b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod new_reph_pos = end - 1; 84102b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod while (new_reph_pos > start && info[new_reph_pos].indic_position() == POS_SMVD) 84202b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod new_reph_pos--; 84302b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod 844892eb7878238d810a2a70f9dadbf958207bfeaa1Behdad Esfahbod /* 845892eb7878238d810a2a70f9dadbf958207bfeaa1Behdad Esfahbod * If the Reph is to be ending up after a Matra,Halant sequence, 846892eb7878238d810a2a70f9dadbf958207bfeaa1Behdad Esfahbod * position it before that Halant so it can interact with the Matra. 847892eb7878238d810a2a70f9dadbf958207bfeaa1Behdad Esfahbod * However, if it's a plain Consonant,Halant we shouldn't do that. 848892eb7878238d810a2a70f9dadbf958207bfeaa1Behdad Esfahbod * Uniscribe doesn't do this. 849892eb7878238d810a2a70f9dadbf958207bfeaa1Behdad Esfahbod * TEST: U+0930,U+094D,U+0915,U+094B,U+094D 850892eb7878238d810a2a70f9dadbf958207bfeaa1Behdad Esfahbod */ 851a2b471df821b32625d127f83b2f90e6d6a967e7eBehdad Esfahbod if (!indic_options ().uniscribe_bug_compatible && 852deb521dee4fdca8c2124cfb39a205e6269d4a70dBehdad Esfahbod unlikely (is_halant_or_coeng (info[new_reph_pos]))) { 85302b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod for (unsigned int i = base + 1; i < new_reph_pos; i++) 85402b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod if (info[i].indic_category() == OT_M) { 85502b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod /* Ok, got it. */ 85602b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod new_reph_pos--; 85702b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod } 85802b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod } 85902b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod goto reph_move; 8608df5636968389ac7bf8620ccd091fd4872b0bbeeBehdad Esfahbod } 8618df5636968389ac7bf8620ccd091fd4872b0bbeeBehdad Esfahbod 86202b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod reph_move: 86302b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod { 86402b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod /* Move */ 86502b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod hb_glyph_info_t reph = info[start]; 86602b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod memmove (&info[start], &info[start + 1], (new_reph_pos - start) * sizeof (info[0])); 86702b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod info[new_reph_pos] = reph; 86802b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod start_of_last_cluster = start; /* Yay, one big cluster! */ 86902b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod } 870dbb105883c6e9b83e78dc8b10766cd56b98cd7e1Behdad Esfahbod } 871dbb105883c6e9b83e78dc8b10766cd56b98cd7e1Behdad Esfahbod 872dbb105883c6e9b83e78dc8b10766cd56b98cd7e1Behdad Esfahbod 873dbb105883c6e9b83e78dc8b10766cd56b98cd7e1Behdad Esfahbod /* o Reorder pre-base reordering consonants: 874e7be05702447ae270d797398132c1930cd3a9b86Behdad Esfahbod * 875e7be05702447ae270d797398132c1930cd3a9b86Behdad Esfahbod * If a pre-base reordering consonant is found, reorder it according to 876e7be05702447ae270d797398132c1930cd3a9b86Behdad Esfahbod * the following rules: 877e7be05702447ae270d797398132c1930cd3a9b86Behdad Esfahbod */ 878e7be05702447ae270d797398132c1930cd3a9b86Behdad Esfahbod 87946e645ec4b59f0a278347be11f40c7df700d5bb6Behdad Esfahbod if (pref_mask && base + 1 < end) /* Otherwise there can't be any pre-base reordering Ra. */ 88046e645ec4b59f0a278347be11f40c7df700d5bb6Behdad Esfahbod { 8818e7b5882fb4c1921c9d030d354a9b998115cdb8cBehdad Esfahbod for (unsigned int i = base + 1; i < end; i++) 8828e7b5882fb4c1921c9d030d354a9b998115cdb8cBehdad Esfahbod if ((info[i].mask & pref_mask) != 0) 88378818124b17691ec2c647142fdb9ae743aa03deeBehdad Esfahbod { 8848e7b5882fb4c1921c9d030d354a9b998115cdb8cBehdad Esfahbod /* 1. Only reorder a glyph produced by substitution during application 8858e7b5882fb4c1921c9d030d354a9b998115cdb8cBehdad Esfahbod * of the <pref> feature. (Note that a font may shape a Ra consonant with 8868e7b5882fb4c1921c9d030d354a9b998115cdb8cBehdad Esfahbod * the feature generally but block it in certain contexts.) 8878e7b5882fb4c1921c9d030d354a9b998115cdb8cBehdad Esfahbod */ 8888e7b5882fb4c1921c9d030d354a9b998115cdb8cBehdad Esfahbod if (i + 1 == end || (info[i + 1].mask & pref_mask) == 0) 8898e7b5882fb4c1921c9d030d354a9b998115cdb8cBehdad Esfahbod { 8908e7b5882fb4c1921c9d030d354a9b998115cdb8cBehdad Esfahbod /* 8918e7b5882fb4c1921c9d030d354a9b998115cdb8cBehdad Esfahbod * 2. Try to find a target position the same way as for pre-base matra. 8928e7b5882fb4c1921c9d030d354a9b998115cdb8cBehdad Esfahbod * If it is found, reorder pre-base consonant glyph. 8938e7b5882fb4c1921c9d030d354a9b998115cdb8cBehdad Esfahbod * 8948e7b5882fb4c1921c9d030d354a9b998115cdb8cBehdad Esfahbod * 3. If position is not found, reorder immediately before main 8958e7b5882fb4c1921c9d030d354a9b998115cdb8cBehdad Esfahbod * consonant. 8968e7b5882fb4c1921c9d030d354a9b998115cdb8cBehdad Esfahbod */ 8978e7b5882fb4c1921c9d030d354a9b998115cdb8cBehdad Esfahbod 8988e7b5882fb4c1921c9d030d354a9b998115cdb8cBehdad Esfahbod unsigned int new_pos = base; 8998e7b5882fb4c1921c9d030d354a9b998115cdb8cBehdad Esfahbod while (new_pos > start + 1 && 900deb521dee4fdca8c2124cfb39a205e6269d4a70dBehdad Esfahbod !(FLAG (info[new_pos - 1].indic_category()) & (FLAG (OT_M) | FLAG (OT_H) | FLAG (OT_Coeng)))) 9018e7b5882fb4c1921c9d030d354a9b998115cdb8cBehdad Esfahbod new_pos--; 9028e7b5882fb4c1921c9d030d354a9b998115cdb8cBehdad Esfahbod 903deb521dee4fdca8c2124cfb39a205e6269d4a70dBehdad Esfahbod if (new_pos > start && is_halant_or_coeng (info[new_pos - 1])) 9048e7b5882fb4c1921c9d030d354a9b998115cdb8cBehdad Esfahbod /* -> If ZWJ or ZWNJ follow this halant, position is moved after it. */ 9058e7b5882fb4c1921c9d030d354a9b998115cdb8cBehdad Esfahbod if (new_pos < end && is_joiner (info[new_pos])) 9068e7b5882fb4c1921c9d030d354a9b998115cdb8cBehdad Esfahbod new_pos++; 9078e7b5882fb4c1921c9d030d354a9b998115cdb8cBehdad Esfahbod 9088e7b5882fb4c1921c9d030d354a9b998115cdb8cBehdad Esfahbod { 9098e7b5882fb4c1921c9d030d354a9b998115cdb8cBehdad Esfahbod unsigned int old_pos = i; 9108e7b5882fb4c1921c9d030d354a9b998115cdb8cBehdad Esfahbod hb_glyph_info_t tmp = info[old_pos]; 9118e7b5882fb4c1921c9d030d354a9b998115cdb8cBehdad Esfahbod memmove (&info[new_pos + 1], &info[new_pos], (old_pos - new_pos) * sizeof (info[0])); 9128e7b5882fb4c1921c9d030d354a9b998115cdb8cBehdad Esfahbod info[new_pos] = tmp; 9138e7b5882fb4c1921c9d030d354a9b998115cdb8cBehdad Esfahbod start_of_last_cluster = MIN (new_pos, start_of_last_cluster); 9148e7b5882fb4c1921c9d030d354a9b998115cdb8cBehdad Esfahbod } 9158e7b5882fb4c1921c9d030d354a9b998115cdb8cBehdad Esfahbod } 9168e7b5882fb4c1921c9d030d354a9b998115cdb8cBehdad Esfahbod 9178e7b5882fb4c1921c9d030d354a9b998115cdb8cBehdad Esfahbod break; 91878818124b17691ec2c647142fdb9ae743aa03deeBehdad Esfahbod } 91946e645ec4b59f0a278347be11f40c7df700d5bb6Behdad Esfahbod } 920eed903b1644e087178438959664a6a57bebc398bBehdad Esfahbod 921eed903b1644e087178438959664a6a57bebc398bBehdad Esfahbod 922a913b024d84973556094fd64ce5f0b7106fcc3b5Behdad Esfahbod /* Apply 'init' to the Left Matra if it's a word start. */ 9236a091df9b403b147ef78f3974610dedf4ce1e08aBehdad Esfahbod if (info[start].indic_position () == POS_PRE_M && 924a913b024d84973556094fd64ce5f0b7106fcc3b5Behdad Esfahbod (!start || 925eace47b173807d94b29a6490d0bc3c9f8f6168d1Behdad Esfahbod !(FLAG (_hb_glyph_info_get_general_category (&info[start - 1])) & 926a913b024d84973556094fd64ce5f0b7106fcc3b5Behdad Esfahbod (FLAG (HB_UNICODE_GENERAL_CATEGORY_LOWERCASE_LETTER) | 927a913b024d84973556094fd64ce5f0b7106fcc3b5Behdad Esfahbod FLAG (HB_UNICODE_GENERAL_CATEGORY_MODIFIER_LETTER) | 928a913b024d84973556094fd64ce5f0b7106fcc3b5Behdad Esfahbod FLAG (HB_UNICODE_GENERAL_CATEGORY_OTHER_LETTER) | 929a913b024d84973556094fd64ce5f0b7106fcc3b5Behdad Esfahbod FLAG (HB_UNICODE_GENERAL_CATEGORY_TITLECASE_LETTER) | 930a913b024d84973556094fd64ce5f0b7106fcc3b5Behdad Esfahbod FLAG (HB_UNICODE_GENERAL_CATEGORY_UPPERCASE_LETTER) | 931a913b024d84973556094fd64ce5f0b7106fcc3b5Behdad Esfahbod FLAG (HB_UNICODE_GENERAL_CATEGORY_SPACING_MARK) | 932a913b024d84973556094fd64ce5f0b7106fcc3b5Behdad Esfahbod FLAG (HB_UNICODE_GENERAL_CATEGORY_ENCLOSING_MARK) | 933a913b024d84973556094fd64ce5f0b7106fcc3b5Behdad Esfahbod FLAG (HB_UNICODE_GENERAL_CATEGORY_NON_SPACING_MARK))))) 93446e645ec4b59f0a278347be11f40c7df700d5bb6Behdad Esfahbod info[start].mask |= init_mask; 935a913b024d84973556094fd64ce5f0b7106fcc3b5Behdad Esfahbod 936eed903b1644e087178438959664a6a57bebc398bBehdad Esfahbod 93721d2803133c2c424ed37a9f3d17c7fc4963e5a60Behdad Esfahbod 93821d2803133c2c424ed37a9f3d17c7fc4963e5a60Behdad Esfahbod /* Finish off the clusters and go home! */ 93921d2803133c2c424ed37a9f3d17c7fc4963e5a60Behdad Esfahbod 940a2b471df821b32625d127f83b2f90e6d6a967e7eBehdad Esfahbod if (!indic_options ().uniscribe_bug_compatible) 941ebe29733d44fe0fa9fb30f946ab0dd7a40336a24Behdad Esfahbod { 94221d2803133c2c424ed37a9f3d17c7fc4963e5a60Behdad Esfahbod /* This is what Uniscribe does. Ie. add cluster boundaries after Halant,ZWNJ. 94321d2803133c2c424ed37a9f3d17c7fc4963e5a60Behdad Esfahbod * This means, half forms are submerged into the main consonants cluster. 94421d2803133c2c424ed37a9f3d17c7fc4963e5a60Behdad Esfahbod * This is unnecessary, and makes cursor positioning harder, but that's what 94521d2803133c2c424ed37a9f3d17c7fc4963e5a60Behdad Esfahbod * Uniscribe does. */ 94621d2803133c2c424ed37a9f3d17c7fc4963e5a60Behdad Esfahbod unsigned int cluster_start = start; 94721d2803133c2c424ed37a9f3d17c7fc4963e5a60Behdad Esfahbod for (unsigned int i = start + 1; i < start_of_last_cluster; i++) 948deb521dee4fdca8c2124cfb39a205e6269d4a70dBehdad Esfahbod if (is_halant_or_coeng (info[i - 1]) && info[i].indic_category() == OT_ZWNJ) { 94921d2803133c2c424ed37a9f3d17c7fc4963e5a60Behdad Esfahbod i++; 95021d2803133c2c424ed37a9f3d17c7fc4963e5a60Behdad Esfahbod buffer->merge_clusters (cluster_start, i); 95121d2803133c2c424ed37a9f3d17c7fc4963e5a60Behdad Esfahbod cluster_start = i; 95221d2803133c2c424ed37a9f3d17c7fc4963e5a60Behdad Esfahbod } 95321d2803133c2c424ed37a9f3d17c7fc4963e5a60Behdad Esfahbod start_of_last_cluster = cluster_start; 95421d2803133c2c424ed37a9f3d17c7fc4963e5a60Behdad Esfahbod } 95521d2803133c2c424ed37a9f3d17c7fc4963e5a60Behdad Esfahbod 95621d2803133c2c424ed37a9f3d17c7fc4963e5a60Behdad Esfahbod buffer->merge_clusters (start_of_last_cluster, end); 957ef24cc8c8e2478a6352c340f4611a617646de4ccBehdad Esfahbod} 958e7be05702447ae270d797398132c1930cd3a9b86Behdad Esfahbod 959e7be05702447ae270d797398132c1930cd3a9b86Behdad Esfahbod 960ef24cc8c8e2478a6352c340f4611a617646de4ccBehdad Esfahbodstatic void 961ef24cc8c8e2478a6352c340f4611a617646de4ccBehdad Esfahbodfinal_reordering (const hb_ot_map_t *map, 9623f18236a03880c0960f5990dc90685f6146951a6Behdad Esfahbod hb_face_t *face HB_UNUSED, 963ef24cc8c8e2478a6352c340f4611a617646de4ccBehdad Esfahbod hb_buffer_t *buffer, 964ef24cc8c8e2478a6352c340f4611a617646de4ccBehdad Esfahbod void *user_data HB_UNUSED) 965ef24cc8c8e2478a6352c340f4611a617646de4ccBehdad Esfahbod{ 966ef24cc8c8e2478a6352c340f4611a617646de4ccBehdad Esfahbod unsigned int count = buffer->len; 967ef24cc8c8e2478a6352c340f4611a617646de4ccBehdad Esfahbod if (!count) return; 968ef24cc8c8e2478a6352c340f4611a617646de4ccBehdad Esfahbod 96946e645ec4b59f0a278347be11f40c7df700d5bb6Behdad Esfahbod hb_mask_t init_mask = map->get_1_mask (HB_TAG('i','n','i','t')); 97046e645ec4b59f0a278347be11f40c7df700d5bb6Behdad Esfahbod hb_mask_t pref_mask = map->get_1_mask (HB_TAG('p','r','e','f')); 971eed903b1644e087178438959664a6a57bebc398bBehdad Esfahbod 972ef24cc8c8e2478a6352c340f4611a617646de4ccBehdad Esfahbod hb_glyph_info_t *info = buffer->info; 973ef24cc8c8e2478a6352c340f4611a617646de4ccBehdad Esfahbod unsigned int last = 0; 974cee7187447b76b22e1bb6136d137b35ac49c3a5dBehdad Esfahbod unsigned int last_syllable = info[0].syllable(); 975ef24cc8c8e2478a6352c340f4611a617646de4ccBehdad Esfahbod for (unsigned int i = 1; i < count; i++) 976cee7187447b76b22e1bb6136d137b35ac49c3a5dBehdad Esfahbod if (last_syllable != info[i].syllable()) { 97746e645ec4b59f0a278347be11f40c7df700d5bb6Behdad Esfahbod final_reordering_syllable (buffer, init_mask, pref_mask, last, i); 978ef24cc8c8e2478a6352c340f4611a617646de4ccBehdad Esfahbod last = i; 979cee7187447b76b22e1bb6136d137b35ac49c3a5dBehdad Esfahbod last_syllable = info[last].syllable(); 980ef24cc8c8e2478a6352c340f4611a617646de4ccBehdad Esfahbod } 98146e645ec4b59f0a278347be11f40c7df700d5bb6Behdad Esfahbod final_reordering_syllable (buffer, init_mask, pref_mask, last, count); 982e7be05702447ae270d797398132c1930cd3a9b86Behdad Esfahbod 983743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod HB_BUFFER_DEALLOCATE_VAR (buffer, indic_category); 984743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod HB_BUFFER_DEALLOCATE_VAR (buffer, indic_position); 985743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod} 986743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod 987743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod 988b9ddbd55930228422e82b34a141ad1b6093f5376Behdad Esfahbod 989