hb-ot-shape-complex-indic.cc revision af92b4cc90e4184d5bdd8037c551ed482700114f
/*
 * Copyright © 2011,2012  Google, Inc.
 *
 *  This is part of HarfBuzz, a text shaping library.
 *
 * Permission is hereby granted, without written agreement and without
 * license or royalty fees, to use, copy, modify, and distribute this
 * software and its documentation for any purpose, provided that the
 * above copyright notice and the following two paragraphs appear in
 * all copies of this software.
 *
 * IN NO EVENT SHALL THE COPYRIGHT HOLDER BE LIABLE TO ANY PARTY FOR
 * DIRECT, INDIRECT, SPECIAL, INCIDENTAL, OR CONSEQUENTIAL DAMAGES
 * ARISING OUT OF THE USE OF THIS SOFTWARE AND ITS DOCUMENTATION, EVEN
 * IF THE COPYRIGHT HOLDER HAS BEEN ADVISED OF THE POSSIBILITY OF SUCH
 * DAMAGE.
 *
 * THE COPYRIGHT HOLDER SPECIFICALLY DISCLAIMS ANY WARRANTIES, INCLUDING,
 * BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND
 * FITNESS FOR A PARTICULAR PURPOSE.  THE SOFTWARE PROVIDED HEREUNDER IS
 * ON AN "AS IS" BASIS, AND THE COPYRIGHT HOLDER HAS NO OBLIGATION TO
 * PROVIDE MAINTENANCE, SUPPORT, UPDATES, ENHANCEMENTS, OR MODIFICATIONS.
 *
 * Google Author(s): Behdad Esfahbod
 */
26b9ddbd55930228422e82b34a141ad1b6093f5376Behdad Esfahbod
273ed4634ec349fa9e943ad23718c04be4dd4bba62Behdad Esfahbod#include "hb-ot-shape-complex-indic-private.hh"
28a913b024d84973556094fd64ce5f0b7106fcc3b5Behdad Esfahbod#include "hb-ot-shape-private.hh"
29352372ae5ea0998e40cf9fe43c22b6b610a5764eBehdad Esfahbod
/* OLD_INDIC_TAG (script): the script value converted to hb_tag_t with bit
 * 0x20000000 set.  The argument is parenthesized so that an expression
 * argument is converted as a whole rather than only its first operand. */
#define OLD_INDIC_TAG(script) (((hb_tag_t) (script)) | 0x20000000)

/* IS_OLD_INDIC_TAG (tag): true when tag equals OLD_INDIC_TAG() of one of the
 * nine scripts listed below.
 * Note: tag is evaluated once per comparison, so it must not have side
 * effects. */
#define IS_OLD_INDIC_TAG(tag) ( \
                                (tag) == OLD_INDIC_TAG (HB_SCRIPT_BENGALI) || \
                                (tag) == OLD_INDIC_TAG (HB_SCRIPT_DEVANAGARI) || \
                                (tag) == OLD_INDIC_TAG (HB_SCRIPT_GUJARATI) || \
                                (tag) == OLD_INDIC_TAG (HB_SCRIPT_GURMUKHI) || \
                                (tag) == OLD_INDIC_TAG (HB_SCRIPT_KANNADA) || \
                                (tag) == OLD_INDIC_TAG (HB_SCRIPT_MALAYALAM) || \
                                (tag) == OLD_INDIC_TAG (HB_SCRIPT_ORIYA) || \
                                (tag) == OLD_INDIC_TAG (HB_SCRIPT_TAMIL) || \
                                (tag) == OLD_INDIC_TAG (HB_SCRIPT_TELUGU) \
                              )
/* Process-wide Indic shaper options, packed into single-bit flags.
 *
 * The fields are unsigned on purpose: a one-bit *signed* bit-field can only
 * represent 0 and -1, so storing 1 into it does not read back as 1. */
struct indic_options_t
{
  /* Set to 1 by indic_options_init () so that the integer view of the
   * enclosing union becomes non-zero once the options have been computed. */
  unsigned int initialized : 1;
  /* Set when the HB_OT_INDIC_OPTIONS environment variable contains
   * "uniscribe-bug-compatible" (see indic_options_init ()). */
  unsigned int uniscribe_bug_compatible : 1;
};
47a2b471df821b32625d127f83b2f90e6d6a967e7eBehdad Esfahbod
48a2b471df821b32625d127f83b2f90e6d6a967e7eBehdad Esfahbodunion indic_options_union_t {
49a2b471df821b32625d127f83b2f90e6d6a967e7eBehdad Esfahbod  int i;
50a2b471df821b32625d127f83b2f90e6d6a967e7eBehdad Esfahbod  indic_options_t opts;
51a2b471df821b32625d127f83b2f90e6d6a967e7eBehdad Esfahbod};
52a2b471df821b32625d127f83b2f90e6d6a967e7eBehdad EsfahbodASSERT_STATIC (sizeof (int) == sizeof (indic_options_union_t));
53a2b471df821b32625d127f83b2f90e6d6a967e7eBehdad Esfahbod
54a2b471df821b32625d127f83b2f90e6d6a967e7eBehdad Esfahbodstatic indic_options_union_t
55a2b471df821b32625d127f83b2f90e6d6a967e7eBehdad Esfahbodindic_options_init (void)
56a2b471df821b32625d127f83b2f90e6d6a967e7eBehdad Esfahbod{
57a2b471df821b32625d127f83b2f90e6d6a967e7eBehdad Esfahbod  indic_options_union_t u;
58a2b471df821b32625d127f83b2f90e6d6a967e7eBehdad Esfahbod  u.i = 0;
59a2b471df821b32625d127f83b2f90e6d6a967e7eBehdad Esfahbod  u.opts.initialized = 1;
60a2b471df821b32625d127f83b2f90e6d6a967e7eBehdad Esfahbod
61a2b471df821b32625d127f83b2f90e6d6a967e7eBehdad Esfahbod  char *c = getenv ("HB_OT_INDIC_OPTIONS");
62a2b471df821b32625d127f83b2f90e6d6a967e7eBehdad Esfahbod  u.opts.uniscribe_bug_compatible = c && strstr (c, "uniscribe-bug-compatible");
63a2b471df821b32625d127f83b2f90e6d6a967e7eBehdad Esfahbod
64a2b471df821b32625d127f83b2f90e6d6a967e7eBehdad Esfahbod  return u;
65a2b471df821b32625d127f83b2f90e6d6a967e7eBehdad Esfahbod}
66a2b471df821b32625d127f83b2f90e6d6a967e7eBehdad Esfahbod
67a2b471df821b32625d127f83b2f90e6d6a967e7eBehdad Esfahbodinline indic_options_t
68a2b471df821b32625d127f83b2f90e6d6a967e7eBehdad Esfahbodindic_options (void)
69a2b471df821b32625d127f83b2f90e6d6a967e7eBehdad Esfahbod{
70a2b471df821b32625d127f83b2f90e6d6a967e7eBehdad Esfahbod  static indic_options_union_t options;
71a2b471df821b32625d127f83b2f90e6d6a967e7eBehdad Esfahbod
72a2b471df821b32625d127f83b2f90e6d6a967e7eBehdad Esfahbod  if (unlikely (!options.i)) {
73a2b471df821b32625d127f83b2f90e6d6a967e7eBehdad Esfahbod    /* This is idempotent and threadsafe. */
74a2b471df821b32625d127f83b2f90e6d6a967e7eBehdad Esfahbod    options = indic_options_init ();
75ebe29733d44fe0fa9fb30f946ab0dd7a40336a24Behdad Esfahbod  }
76ebe29733d44fe0fa9fb30f946ab0dd7a40336a24Behdad Esfahbod
77a2b471df821b32625d127f83b2f90e6d6a967e7eBehdad Esfahbod  return options.opts;
78a2b471df821b32625d127f83b2f90e6d6a967e7eBehdad Esfahbod}
79a2b471df821b32625d127f83b2f90e6d6a967e7eBehdad Esfahbod
80ebe29733d44fe0fa9fb30f946ab0dd7a40336a24Behdad Esfahbod
81743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbodstatic int
82743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbodcompare_codepoint (const void *pa, const void *pb)
83743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod{
84743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod  hb_codepoint_t a = * (hb_codepoint_t *) pa;
85743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod  hb_codepoint_t b = * (hb_codepoint_t *) pb;
86743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod
87743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod  return a < b ? -1 : a == b ? 0 : +1;
88743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod}
89743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod
90743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbodstatic indic_position_t
91743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbodconsonant_position (hb_codepoint_t u)
92743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod{
93743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod  consonant_position_t *record;
94743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod
950de771b72da6b342b015e3556190821547a4011dBehdad Esfahbod  /* Khmer does not have pre-base half forms. */
960de771b72da6b342b015e3556190821547a4011dBehdad Esfahbod  if (0x1780 <= u && u <= 0x17FF)
970de771b72da6b342b015e3556190821547a4011dBehdad Esfahbod    return POS_BELOW_C;
980de771b72da6b342b015e3556190821547a4011dBehdad Esfahbod
99743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod  record = (consonant_position_t *) bsearch (&u, consonant_positions,
100743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod					     ARRAY_LENGTH (consonant_positions),
101743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod					     sizeof (consonant_positions[0]),
102743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod					     compare_codepoint);
103743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod
104dbccf87eef0d26838fa4bb3ae26410f6c4818836Behdad Esfahbod  return record ? record->position : POS_BASE_C;
105743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod}
106743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod
107352372ae5ea0998e40cf9fe43c22b6b610a5764eBehdad Esfahbodstatic bool
108352372ae5ea0998e40cf9fe43c22b6b610a5764eBehdad Esfahbodis_ra (hb_codepoint_t u)
109352372ae5ea0998e40cf9fe43c22b6b610a5764eBehdad Esfahbod{
110352372ae5ea0998e40cf9fe43c22b6b610a5764eBehdad Esfahbod  return !!bsearch (&u, ra_chars,
111352372ae5ea0998e40cf9fe43c22b6b610a5764eBehdad Esfahbod		    ARRAY_LENGTH (ra_chars),
112352372ae5ea0998e40cf9fe43c22b6b610a5764eBehdad Esfahbod		    sizeof (ra_chars[0]),
113352372ae5ea0998e40cf9fe43c22b6b610a5764eBehdad Esfahbod		    compare_codepoint);
114352372ae5ea0998e40cf9fe43c22b6b610a5764eBehdad Esfahbod}
115352372ae5ea0998e40cf9fe43c22b6b610a5764eBehdad Esfahbod
1169ee27a928a989c71923cef82a9e9828f8e9ca051Behdad Esfahbodstatic bool
1179da0487cd452d780673e24329ce03e174a4ef83bBehdad Esfahbodis_joiner (const hb_glyph_info_t &info)
1189ee27a928a989c71923cef82a9e9828f8e9ca051Behdad Esfahbod{
1199da0487cd452d780673e24329ce03e174a4ef83bBehdad Esfahbod  return !!(FLAG (info.indic_category()) & (FLAG (OT_ZWJ) | FLAG (OT_ZWNJ)));
1209da0487cd452d780673e24329ce03e174a4ef83bBehdad Esfahbod}
1219da0487cd452d780673e24329ce03e174a4ef83bBehdad Esfahbod
1229da0487cd452d780673e24329ce03e174a4ef83bBehdad Esfahbodstatic bool
1239da0487cd452d780673e24329ce03e174a4ef83bBehdad Esfahbodis_consonant (const hb_glyph_info_t &info)
1249da0487cd452d780673e24329ce03e174a4ef83bBehdad Esfahbod{
1251a1fa8c655a082fc1439608457ba717306cc83caBehdad Esfahbod  /* Note:
1261a1fa8c655a082fc1439608457ba717306cc83caBehdad Esfahbod   *
12718c06e189bd078affbb84c3bb5bb80687a227c5eBehdad Esfahbod   * We treat Vowels and placeholders as if they were consonants.  This is safe because Vowels
128c5306b6861cfaa50af40e8ceb058791fa06d7981Behdad Esfahbod   * cannot happen in a consonant syllable.  The plus side however is, we can call the
129c5306b6861cfaa50af40e8ceb058791fa06d7981Behdad Esfahbod   * consonant syllable logic from the vowel syllable function and get it all right! */
13018c06e189bd078affbb84c3bb5bb80687a227c5eBehdad Esfahbod  return !!(FLAG (info.indic_category()) & (FLAG (OT_C) | FLAG (OT_Ra) | FLAG (OT_V) | FLAG (OT_NBSP) | FLAG (OT_DOTTEDCIRCLE)));
1319ee27a928a989c71923cef82a9e9828f8e9ca051Behdad Esfahbod}
132c7fe56a1d5d3e969b6ec51cd9ecd471706a19568Behdad Esfahbod
133eed903b1644e087178438959664a6a57bebc398bBehdad Esfahbodstruct feature_list_t {
134c7fe56a1d5d3e969b6ec51cd9ecd471706a19568Behdad Esfahbod  hb_tag_t tag;
135c7fe56a1d5d3e969b6ec51cd9ecd471706a19568Behdad Esfahbod  hb_bool_t is_global;
136eed903b1644e087178438959664a6a57bebc398bBehdad Esfahbod};
137eed903b1644e087178438959664a6a57bebc398bBehdad Esfahbod
138eed903b1644e087178438959664a6a57bebc398bBehdad Esfahbodstatic const feature_list_t
139eed903b1644e087178438959664a6a57bebc398bBehdad Esfahbodindic_basic_features[] =
140b9ddbd55930228422e82b34a141ad1b6093f5376Behdad Esfahbod{
141c7fe56a1d5d3e969b6ec51cd9ecd471706a19568Behdad Esfahbod  {HB_TAG('n','u','k','t'), true},
142c7fe56a1d5d3e969b6ec51cd9ecd471706a19568Behdad Esfahbod  {HB_TAG('a','k','h','n'), false},
143c7fe56a1d5d3e969b6ec51cd9ecd471706a19568Behdad Esfahbod  {HB_TAG('r','p','h','f'), false},
1441ac075b227090a9ad930dcc1670236c176b27067Behdad Esfahbod  {HB_TAG('r','k','r','f'), true},
145c7fe56a1d5d3e969b6ec51cd9ecd471706a19568Behdad Esfahbod  {HB_TAG('p','r','e','f'), false},
146c7fe56a1d5d3e969b6ec51cd9ecd471706a19568Behdad Esfahbod  {HB_TAG('b','l','w','f'), false},
147c7fe56a1d5d3e969b6ec51cd9ecd471706a19568Behdad Esfahbod  {HB_TAG('h','a','l','f'), false},
14829f106d7fba25e1464debd3a4831a7380d75c4c9Behdad Esfahbod  {HB_TAG('a','b','v','f'), false},
149c7fe56a1d5d3e969b6ec51cd9ecd471706a19568Behdad Esfahbod  {HB_TAG('p','s','t','f'), false},
1509da0487cd452d780673e24329ce03e174a4ef83bBehdad Esfahbod  {HB_TAG('c','j','c','t'), false},
1511d6846db9ebf84561bb30a4e48c6c43184914099Behdad Esfahbod  {HB_TAG('v','a','t','u'), true},
152c7fe56a1d5d3e969b6ec51cd9ecd471706a19568Behdad Esfahbod};
153c7fe56a1d5d3e969b6ec51cd9ecd471706a19568Behdad Esfahbod
/* Indices into indic_basic_features.  The enumerators are listed in the same
 * order as that array's entries, so each value is the index of the entry
 * carrying the matching tag. */
enum {
  _NUKT = 0,
  AKHN  = 1,
  RPHF  = 2,
  _RKRF = 3,
  PREF  = 4,
  BLWF  = 5,
  HALF  = 6,
  ABVF  = 7,
  PSTF  = 8,
  CJCT  = 9,
  VATU  = 10
};
168b9ddbd55930228422e82b34a141ad1b6093f5376Behdad Esfahbod
169eed903b1644e087178438959664a6a57bebc398bBehdad Esfahbodstatic const feature_list_t
170eed903b1644e087178438959664a6a57bebc398bBehdad Esfahbodindic_other_features[] =
171b9ddbd55930228422e82b34a141ad1b6093f5376Behdad Esfahbod{
172eed903b1644e087178438959664a6a57bebc398bBehdad Esfahbod  {HB_TAG('i','n','i','t'), false},
173eed903b1644e087178438959664a6a57bebc398bBehdad Esfahbod  {HB_TAG('p','r','e','s'), true},
174eed903b1644e087178438959664a6a57bebc398bBehdad Esfahbod  {HB_TAG('a','b','v','s'), true},
175eed903b1644e087178438959664a6a57bebc398bBehdad Esfahbod  {HB_TAG('b','l','w','s'), true},
176eed903b1644e087178438959664a6a57bebc398bBehdad Esfahbod  {HB_TAG('p','s','t','s'), true},
177eed903b1644e087178438959664a6a57bebc398bBehdad Esfahbod  {HB_TAG('h','a','l','n'), true},
178eed903b1644e087178438959664a6a57bebc398bBehdad Esfahbod
179eed903b1644e087178438959664a6a57bebc398bBehdad Esfahbod  {HB_TAG('d','i','s','t'), true},
180eed903b1644e087178438959664a6a57bebc398bBehdad Esfahbod  {HB_TAG('a','b','v','m'), true},
181eed903b1644e087178438959664a6a57bebc398bBehdad Esfahbod  {HB_TAG('b','l','w','m'), true},
182eed903b1644e087178438959664a6a57bebc398bBehdad Esfahbod};
183eed903b1644e087178438959664a6a57bebc398bBehdad Esfahbod
184743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod
185743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbodstatic void
186743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbodinitial_reordering (const hb_ot_map_t *map,
187743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod		    hb_face_t *face,
188743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod		    hb_buffer_t *buffer,
189743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod		    void *user_data HB_UNUSED);
190f6fd3780e12b23ff7ed3743497c8996e71dcb064Behdad Esfahbodstatic void
191f6fd3780e12b23ff7ed3743497c8996e71dcb064Behdad Esfahbodfinal_reordering (const hb_ot_map_t *map,
192f6fd3780e12b23ff7ed3743497c8996e71dcb064Behdad Esfahbod		  hb_face_t *face,
193f6fd3780e12b23ff7ed3743497c8996e71dcb064Behdad Esfahbod		  hb_buffer_t *buffer,
194743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod		  void *user_data HB_UNUSED);
195b9ddbd55930228422e82b34a141ad1b6093f5376Behdad Esfahbod
196b9ddbd55930228422e82b34a141ad1b6093f5376Behdad Esfahbodvoid
1979f377ed3210fe7d9f15e0c4f82020556f9a8f6f0Behdad Esfahbod_hb_ot_shape_complex_collect_features_indic (hb_ot_map_builder_t *map,
1989f377ed3210fe7d9f15e0c4f82020556f9a8f6f0Behdad Esfahbod					     const hb_segment_properties_t *props HB_UNUSED)
199b9ddbd55930228422e82b34a141ad1b6093f5376Behdad Esfahbod{
200f6fd3780e12b23ff7ed3743497c8996e71dcb064Behdad Esfahbod  map->add_bool_feature (HB_TAG('l','o','c','l'));
201a54a5505a35eef5315a8e2e7a79502901e3eff5fBehdad Esfahbod  /* The Indic specs do not require ccmp, but we apply it here since if
202a54a5505a35eef5315a8e2e7a79502901e3eff5fBehdad Esfahbod   * there is a use of it, it's typically at the beginning. */
203f6fd3780e12b23ff7ed3743497c8996e71dcb064Behdad Esfahbod  map->add_bool_feature (HB_TAG('c','c','m','p'));
204f6fd3780e12b23ff7ed3743497c8996e71dcb064Behdad Esfahbod
205743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod  map->add_gsub_pause (initial_reordering, NULL);
206f6fd3780e12b23ff7ed3743497c8996e71dcb064Behdad Esfahbod
207412b91889d9a1ae477e8b6907d0b9a76e78a6c91Behdad Esfahbod  for (unsigned int i = 0; i < ARRAY_LENGTH (indic_basic_features); i++) {
20876f76812ac7cca8ac6935952a2360d5e151480faBehdad Esfahbod    map->add_bool_feature (indic_basic_features[i].tag, indic_basic_features[i].is_global);
209412b91889d9a1ae477e8b6907d0b9a76e78a6c91Behdad Esfahbod    map->add_gsub_pause (NULL, NULL);
210412b91889d9a1ae477e8b6907d0b9a76e78a6c91Behdad Esfahbod  }
211b9ddbd55930228422e82b34a141ad1b6093f5376Behdad Esfahbod
212f6fd3780e12b23ff7ed3743497c8996e71dcb064Behdad Esfahbod  map->add_gsub_pause (final_reordering, NULL);
213f6fd3780e12b23ff7ed3743497c8996e71dcb064Behdad Esfahbod
214412b91889d9a1ae477e8b6907d0b9a76e78a6c91Behdad Esfahbod  for (unsigned int i = 0; i < ARRAY_LENGTH (indic_other_features); i++) {
215eed903b1644e087178438959664a6a57bebc398bBehdad Esfahbod    map->add_bool_feature (indic_other_features[i].tag, indic_other_features[i].is_global);
216412b91889d9a1ae477e8b6907d0b9a76e78a6c91Behdad Esfahbod    map->add_gsub_pause (NULL, NULL);
217412b91889d9a1ae477e8b6907d0b9a76e78a6c91Behdad Esfahbod  }
218b9ddbd55930228422e82b34a141ad1b6093f5376Behdad Esfahbod}
219b9ddbd55930228422e82b34a141ad1b6093f5376Behdad Esfahbod
220d96838ef951ce6170eb2dc576ebcba2262cf7008Behdad Esfahbodvoid
221d96838ef951ce6170eb2dc576ebcba2262cf7008Behdad Esfahbod_hb_ot_shape_complex_override_features_indic (hb_ot_map_builder_t *map,
222d96838ef951ce6170eb2dc576ebcba2262cf7008Behdad Esfahbod					      const hb_segment_properties_t *props HB_UNUSED)
223d96838ef951ce6170eb2dc576ebcba2262cf7008Behdad Esfahbod{
224af92b4cc90e4184d5bdd8037c551ed482700114fBehdad Esfahbod  /* Uniscribe does not apply 'kern'. */
225af92b4cc90e4184d5bdd8037c551ed482700114fBehdad Esfahbod  if (indic_options ().uniscribe_bug_compatible)
226af92b4cc90e4184d5bdd8037c551ed482700114fBehdad Esfahbod    map->add_feature (HB_TAG('k','e','r','n'), 0, true);
227d96838ef951ce6170eb2dc576ebcba2262cf7008Behdad Esfahbod}
228d96838ef951ce6170eb2dc576ebcba2262cf7008Behdad Esfahbod
229867361c3ad39629a8d5b7dc48d558a1c19e37d43Behdad Esfahbod
23011138ccff71f442da1fcf64faa0e1d22e083e775Behdad Esfahbodhb_ot_shape_normalization_mode_t
23111138ccff71f442da1fcf64faa0e1d22e083e775Behdad Esfahbod_hb_ot_shape_complex_normalization_preference_indic (void)
23202cdf743c2ec345a44d4fcf865594b6ac13fccd0Behdad Esfahbod{
23302cdf743c2ec345a44d4fcf865594b6ac13fccd0Behdad Esfahbod  /* We want split matras decomposed by the common shaping logic. */
23411138ccff71f442da1fcf64faa0e1d22e083e775Behdad Esfahbod  return HB_OT_SHAPE_NORMALIZATION_MODE_DECOMPOSED;
23502cdf743c2ec345a44d4fcf865594b6ac13fccd0Behdad Esfahbod}
23602cdf743c2ec345a44d4fcf865594b6ac13fccd0Behdad Esfahbod
237867361c3ad39629a8d5b7dc48d558a1c19e37d43Behdad Esfahbod
238b9ddbd55930228422e82b34a141ad1b6093f5376Behdad Esfahbodvoid
2399f377ed3210fe7d9f15e0c4f82020556f9a8f6f0Behdad Esfahbod_hb_ot_shape_complex_setup_masks_indic (hb_ot_map_t *map HB_UNUSED,
2409f377ed3210fe7d9f15e0c4f82020556f9a8f6f0Behdad Esfahbod					hb_buffer_t *buffer,
2413f18236a03880c0960f5990dc90685f6146951a6Behdad Esfahbod					hb_font_t *font HB_UNUSED)
242b9ddbd55930228422e82b34a141ad1b6093f5376Behdad Esfahbod{
2439f9bcceca6321d5a5812f878de1de39901349a78Behdad Esfahbod  HB_BUFFER_ALLOCATE_VAR (buffer, indic_category);
2449f9bcceca6321d5a5812f878de1de39901349a78Behdad Esfahbod  HB_BUFFER_ALLOCATE_VAR (buffer, indic_position);
2459f9bcceca6321d5a5812f878de1de39901349a78Behdad Esfahbod
246743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod  /* We cannot setup masks here.  We save information about characters
247743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod   * and setup masks later on in a pause-callback. */
248743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod
249743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod  unsigned int count = buffer->len;
250b9ddbd55930228422e82b34a141ad1b6093f5376Behdad Esfahbod  for (unsigned int i = 0; i < count; i++)
251b9ddbd55930228422e82b34a141ad1b6093f5376Behdad Esfahbod  {
25292332e5116271a5d96e532005fe750e7552a6cbbBehdad Esfahbod    hb_glyph_info_t &info = buffer->info[i];
25392332e5116271a5d96e532005fe750e7552a6cbbBehdad Esfahbod    unsigned int type = get_indic_categories (info.codepoint);
25492332e5116271a5d96e532005fe750e7552a6cbbBehdad Esfahbod
25592332e5116271a5d96e532005fe750e7552a6cbbBehdad Esfahbod    info.indic_category() = type & 0x0F;
25692332e5116271a5d96e532005fe750e7552a6cbbBehdad Esfahbod    info.indic_position() = type >> 4;
25792332e5116271a5d96e532005fe750e7552a6cbbBehdad Esfahbod
2583399a06e7033651ee926448737bdb18e553c1796Behdad Esfahbod    /* The spec says U+0952 is OT_A.  However, testing shows that Uniscribe
2593399a06e7033651ee926448737bdb18e553c1796Behdad Esfahbod     * treats U+0951..U+0952 all as OT_VD.
2603399a06e7033651ee926448737bdb18e553c1796Behdad Esfahbod     * TESTS:
2613399a06e7033651ee926448737bdb18e553c1796Behdad Esfahbod     * U+092E,U+0947,U+0952
2623399a06e7033651ee926448737bdb18e553c1796Behdad Esfahbod     * U+092E,U+0952,U+0947
2633399a06e7033651ee926448737bdb18e553c1796Behdad Esfahbod     * U+092E,U+0947,U+0951
2643399a06e7033651ee926448737bdb18e553c1796Behdad Esfahbod     * U+092E,U+0951,U+0947
2653399a06e7033651ee926448737bdb18e553c1796Behdad Esfahbod     * */
2663399a06e7033651ee926448737bdb18e553c1796Behdad Esfahbod    if (unlikely (hb_in_range<hb_codepoint_t> (info.codepoint, 0x0951, 0x0954)))
2673399a06e7033651ee926448737bdb18e553c1796Behdad Esfahbod      info.indic_category() = OT_VD;
2683399a06e7033651ee926448737bdb18e553c1796Behdad Esfahbod
269df50b8474094f0563ccfdae12c4425a51b72add6Behdad Esfahbod    if (info.indic_category() == OT_X &&
270df50b8474094f0563ccfdae12c4425a51b72add6Behdad Esfahbod	unlikely (hb_in_range<hb_codepoint_t> (info.codepoint, 0x17CB, 0x17D0)))
271df50b8474094f0563ccfdae12c4425a51b72add6Behdad Esfahbod      info.indic_category() = OT_RS;
272df50b8474094f0563ccfdae12c4425a51b72add6Behdad Esfahbod
27392332e5116271a5d96e532005fe750e7552a6cbbBehdad Esfahbod    if (info.indic_category() == OT_C) {
27492332e5116271a5d96e532005fe750e7552a6cbbBehdad Esfahbod      info.indic_position() = consonant_position (info.codepoint);
27592332e5116271a5d96e532005fe750e7552a6cbbBehdad Esfahbod      if (is_ra (info.codepoint))
27692332e5116271a5d96e532005fe750e7552a6cbbBehdad Esfahbod	info.indic_category() = OT_Ra;
2777d09c98a1fff97127e48eae48d380dc9fcff288eBehdad Esfahbod    } else if (info.indic_category() == OT_RS) {
2787d09c98a1fff97127e48eae48d380dc9fcff288eBehdad Esfahbod      info.indic_position() = POS_ABOVE_M;
27992332e5116271a5d96e532005fe750e7552a6cbbBehdad Esfahbod    } else if (info.indic_category() == OT_SM ||
28092332e5116271a5d96e532005fe750e7552a6cbbBehdad Esfahbod	       info.indic_category() == OT_VD) {
28192332e5116271a5d96e532005fe750e7552a6cbbBehdad Esfahbod      info.indic_position() = POS_SMVD;
28292332e5116271a5d96e532005fe750e7552a6cbbBehdad Esfahbod    } else if (unlikely (info.codepoint == 0x200C))
28392332e5116271a5d96e532005fe750e7552a6cbbBehdad Esfahbod      info.indic_category() = OT_ZWNJ;
28492332e5116271a5d96e532005fe750e7552a6cbbBehdad Esfahbod    else if (unlikely (info.codepoint == 0x200D))
28592332e5116271a5d96e532005fe750e7552a6cbbBehdad Esfahbod      info.indic_category() = OT_ZWJ;
28618c06e189bd078affbb84c3bb5bb80687a227c5eBehdad Esfahbod    else if (unlikely (info.codepoint == 0x25CC))
28718c06e189bd078affbb84c3bb5bb80687a227c5eBehdad Esfahbod      info.indic_category() = OT_DOTTEDCIRCLE;
288b9ddbd55930228422e82b34a141ad1b6093f5376Behdad Esfahbod  }
289743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod}
290b9ddbd55930228422e82b34a141ad1b6093f5376Behdad Esfahbod
29145d6f29f15f1d2323bcaa2498aed23ff0c8a1567Behdad Esfahbodstatic int
29245d6f29f15f1d2323bcaa2498aed23ff0c8a1567Behdad Esfahbodcompare_indic_order (const hb_glyph_info_t *pa, const hb_glyph_info_t *pb)
29345d6f29f15f1d2323bcaa2498aed23ff0c8a1567Behdad Esfahbod{
29445d6f29f15f1d2323bcaa2498aed23ff0c8a1567Behdad Esfahbod  int a = pa->indic_position();
29545d6f29f15f1d2323bcaa2498aed23ff0c8a1567Behdad Esfahbod  int b = pb->indic_position();
29645d6f29f15f1d2323bcaa2498aed23ff0c8a1567Behdad Esfahbod
29745d6f29f15f1d2323bcaa2498aed23ff0c8a1567Behdad Esfahbod  return a < b ? -1 : a == b ? 0 : +1;
29845d6f29f15f1d2323bcaa2498aed23ff0c8a1567Behdad Esfahbod}
299867361c3ad39629a8d5b7dc48d558a1c19e37d43Behdad Esfahbod
3007ea58db311bfb0d8f804d1e9f4a1f004bd45075aBehdad Esfahbod/* Rules from:
3017ea58db311bfb0d8f804d1e9f4a1f004bd45075aBehdad Esfahbod * https://www.microsoft.com/typography/otfntdev/devanot/shaping.aspx */
3027ea58db311bfb0d8f804d1e9f4a1f004bd45075aBehdad Esfahbod
303743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbodstatic void
30470fe77bb9a25922bd34f206826d8731d901fb451Behdad Esfahbodinitial_reordering_consonant_syllable (const hb_ot_map_t *map, hb_buffer_t *buffer, hb_mask_t *basic_mask_array,
305ef24cc8c8e2478a6352c340f4611a617646de4ccBehdad Esfahbod				       unsigned int start, unsigned int end)
306743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod{
307ee58f3bc75d2d071a71b94063bf12205a5871acbBehdad Esfahbod  hb_glyph_info_t *info = buffer->info;
308743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod
309617f4ac46f1084859d2034c08760e31e52d3bec3Behdad Esfahbod
310743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod  /* 1. Find base consonant:
311743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod   *
312743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod   * The shaping engine finds the base consonant of the syllable, using the
313743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod   * following algorithm: starting from the end of the syllable, move backwards
314743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod   * until a consonant is found that does not have a below-base or post-base
315743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod   * form (post-base forms have to follow below-base forms), or that is not a
316743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod   * pre-base reordering Ra, or arrive at the first consonant. The consonant
317743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod   * stopped at will be the base.
318743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod   *
319743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod   *   o If the syllable starts with Ra + Halant (in a script that has Reph)
320743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod   *     and has more than one consonant, Ra is excluded from candidates for
321743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod   *     base consonants.
322743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod   */
323743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod
3245e72071062c015237b79fbd0521341a63166a204Behdad Esfahbod  unsigned int base = end;
32576b3409de6887c1cdd5c679939497b1b56f4554bBehdad Esfahbod  bool has_reph = false;
326743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod
32776b3409de6887c1cdd5c679939497b1b56f4554bBehdad Esfahbod  {
328617f4ac46f1084859d2034c08760e31e52d3bec3Behdad Esfahbod    /* -> If the syllable starts with Ra + Halant (in a script that has Reph)
329617f4ac46f1084859d2034c08760e31e52d3bec3Behdad Esfahbod     *    and has more than one consonant, Ra is excluded from candidates for
330617f4ac46f1084859d2034c08760e31e52d3bec3Behdad Esfahbod     *    base consonants. */
331617f4ac46f1084859d2034c08760e31e52d3bec3Behdad Esfahbod    unsigned int limit = start;
33270fe77bb9a25922bd34f206826d8731d901fb451Behdad Esfahbod    if (basic_mask_array[RPHF] &&
333617f4ac46f1084859d2034c08760e31e52d3bec3Behdad Esfahbod	start + 3 <= end &&
334617f4ac46f1084859d2034c08760e31e52d3bec3Behdad Esfahbod	info[start].indic_category() == OT_Ra &&
335617f4ac46f1084859d2034c08760e31e52d3bec3Behdad Esfahbod	info[start + 1].indic_category() == OT_H &&
336617f4ac46f1084859d2034c08760e31e52d3bec3Behdad Esfahbod	!is_joiner (info[start + 2]))
337617f4ac46f1084859d2034c08760e31e52d3bec3Behdad Esfahbod    {
338617f4ac46f1084859d2034c08760e31e52d3bec3Behdad Esfahbod      limit += 2;
339617f4ac46f1084859d2034c08760e31e52d3bec3Behdad Esfahbod      base = start;
340617f4ac46f1084859d2034c08760e31e52d3bec3Behdad Esfahbod      has_reph = true;
341617f4ac46f1084859d2034c08760e31e52d3bec3Behdad Esfahbod    };
34276b3409de6887c1cdd5c679939497b1b56f4554bBehdad Esfahbod
3433c2ea9481b1028e927e615a5434ebf8edcb5f891Behdad Esfahbod    /* -> starting from the end of the syllable, move backwards */
3443c2ea9481b1028e927e615a5434ebf8edcb5f891Behdad Esfahbod    unsigned int i = end;
3453c2ea9481b1028e927e615a5434ebf8edcb5f891Behdad Esfahbod    do {
3463c2ea9481b1028e927e615a5434ebf8edcb5f891Behdad Esfahbod      i--;
3473c2ea9481b1028e927e615a5434ebf8edcb5f891Behdad Esfahbod      /* -> until a consonant is found */
3483c2ea9481b1028e927e615a5434ebf8edcb5f891Behdad Esfahbod      if (is_consonant (info[i]))
349743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod      {
3503c2ea9481b1028e927e615a5434ebf8edcb5f891Behdad Esfahbod	/* -> that does not have a below-base or post-base form
3513c2ea9481b1028e927e615a5434ebf8edcb5f891Behdad Esfahbod	 * (post-base forms have to follow below-base forms), */
3523c2ea9481b1028e927e615a5434ebf8edcb5f891Behdad Esfahbod	if (info[i].indic_position() != POS_BELOW_C &&
3533c2ea9481b1028e927e615a5434ebf8edcb5f891Behdad Esfahbod	    info[i].indic_position() != POS_POST_C)
3543c2ea9481b1028e927e615a5434ebf8edcb5f891Behdad Esfahbod	{
3553c2ea9481b1028e927e615a5434ebf8edcb5f891Behdad Esfahbod	  base = i;
3563c2ea9481b1028e927e615a5434ebf8edcb5f891Behdad Esfahbod	  break;
3573c2ea9481b1028e927e615a5434ebf8edcb5f891Behdad Esfahbod	}
358743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod
3593c2ea9481b1028e927e615a5434ebf8edcb5f891Behdad Esfahbod	/* -> or that is not a pre-base reordering Ra,
3603c2ea9481b1028e927e615a5434ebf8edcb5f891Behdad Esfahbod	 *
3613c2ea9481b1028e927e615a5434ebf8edcb5f891Behdad Esfahbod	 * TODO
3623c2ea9481b1028e927e615a5434ebf8edcb5f891Behdad Esfahbod	 */
363e7be05702447ae270d797398132c1930cd3a9b86Behdad Esfahbod
3643c2ea9481b1028e927e615a5434ebf8edcb5f891Behdad Esfahbod	/* -> or arrive at the first consonant. The consonant stopped at will
3653c2ea9481b1028e927e615a5434ebf8edcb5f891Behdad Esfahbod	 * be the base. */
3663c2ea9481b1028e927e615a5434ebf8edcb5f891Behdad Esfahbod	base = i;
3673c2ea9481b1028e927e615a5434ebf8edcb5f891Behdad Esfahbod      }
3683c2ea9481b1028e927e615a5434ebf8edcb5f891Behdad Esfahbod      else
3693c2ea9481b1028e927e615a5434ebf8edcb5f891Behdad Esfahbod	if (is_joiner (info[i]))
3703c2ea9481b1028e927e615a5434ebf8edcb5f891Behdad Esfahbod	  break;
3713c2ea9481b1028e927e615a5434ebf8edcb5f891Behdad Esfahbod    } while (i > limit);
3723c2ea9481b1028e927e615a5434ebf8edcb5f891Behdad Esfahbod    if (base < start)
3733c2ea9481b1028e927e615a5434ebf8edcb5f891Behdad Esfahbod      base = start; /* Just in case... */
374743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod
375617f4ac46f1084859d2034c08760e31e52d3bec3Behdad Esfahbod
376617f4ac46f1084859d2034c08760e31e52d3bec3Behdad Esfahbod    /* -> If the syllable starts with Ra + Halant (in a script that has Reph)
377617f4ac46f1084859d2034c08760e31e52d3bec3Behdad Esfahbod     *    and has more than one consonant, Ra is excluded from candidates for
378617f4ac46f1084859d2034c08760e31e52d3bec3Behdad Esfahbod     *    base consonants. */
379617f4ac46f1084859d2034c08760e31e52d3bec3Behdad Esfahbod    if (has_reph && base == start) {
380617f4ac46f1084859d2034c08760e31e52d3bec3Behdad Esfahbod      /* Have no other consonant, so Reph is not formed and Ra becomes base. */
381617f4ac46f1084859d2034c08760e31e52d3bec3Behdad Esfahbod      has_reph = false;
382617f4ac46f1084859d2034c08760e31e52d3bec3Behdad Esfahbod    }
3835e4e21fce4b548b0b8a5951bc8f35a9f27428192Behdad Esfahbod  }
3843d25079f8d6be81b9b4b91d3a97016b8a572f571Behdad Esfahbod
3853d25079f8d6be81b9b4b91d3a97016b8a572f571Behdad Esfahbod
386743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod  /* 2. Decompose and reorder Matras:
387743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod   *
388743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod   * Each matra and any syllable modifier sign in the cluster are moved to the
389743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod   * appropriate position relative to the consonant(s) in the cluster. The
390743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod   * shaping engine decomposes two- or three-part matras into their constituent
391743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod   * parts before any repositioning. Matra characters are classified by which
392743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod   * consonant in a conjunct they have affinity for and are reordered to the
393743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod   * following positions:
394743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod   *
395743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod   *   o Before first half form in the syllable
396743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod   *   o After subjoined consonants
397743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod   *   o After post-form consonant
398743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod   *   o After main consonant (for above marks)
399743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod   *
400743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod   * IMPLEMENTATION NOTES:
401743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod   *
402743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod   * The normalize() routine has already decomposed matras for us, so we don't
403743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod   * need to worry about that.
404743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod   */
405743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod
406743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod
407743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod  /* 3.  Reorder marks to canonical order:
408743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod   *
409743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod   * Adjacent nukta and halant or nukta and vedic sign are always repositioned
410743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod   * if necessary, so that the nukta is first.
411743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod   *
412743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod   * IMPLEMENTATION NOTES:
413743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod   *
414743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod   * We don't need to do this: the normalize() routine already did this for us.
415743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod   */
416743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod
417743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod
41845d6f29f15f1d2323bcaa2498aed23ff0c8a1567Behdad Esfahbod  /* Reorder characters */
41945d6f29f15f1d2323bcaa2498aed23ff0c8a1567Behdad Esfahbod
4203c2ea9481b1028e927e615a5434ebf8edcb5f891Behdad Esfahbod  for (unsigned int i = start; i < base; i++)
421dbccf87eef0d26838fa4bb3ae26410f6c4818836Behdad Esfahbod    info[i].indic_position() = POS_PRE_C;
422dbccf87eef0d26838fa4bb3ae26410f6c4818836Behdad Esfahbod  info[base].indic_position() = POS_BASE_C;
42345d6f29f15f1d2323bcaa2498aed23ff0c8a1567Behdad Esfahbod
424fd06bf56110e73826b3d5c73ac964e2609450d46Behdad Esfahbod  /* Handle beginning Ra */
4255e4e21fce4b548b0b8a5951bc8f35a9f27428192Behdad Esfahbod  if (has_reph)
426dbb105883c6e9b83e78dc8b10766cd56b98cd7e1Behdad Esfahbod    info[start].indic_position() = POS_RA_TO_BECOME_REPH;
427fd06bf56110e73826b3d5c73ac964e2609450d46Behdad Esfahbod
428f5bc2725cb892264ba223e0a49f7fd2c622a0730Behdad Esfahbod  /* For old-style Indic script tags, move the first post-base Halant after
429f5bc2725cb892264ba223e0a49f7fd2c622a0730Behdad Esfahbod   * last consonant. */
430a3e04bee2c2fa648759a87e460db6b4f1b685586Behdad Esfahbod  if (IS_OLD_INDIC_TAG (map->get_chosen_script (0))) {
4313c2ea9481b1028e927e615a5434ebf8edcb5f891Behdad Esfahbod    for (unsigned int i = base + 1; i < end; i++)
432f5bc2725cb892264ba223e0a49f7fd2c622a0730Behdad Esfahbod      if (info[i].indic_category() == OT_H) {
433f5bc2725cb892264ba223e0a49f7fd2c622a0730Behdad Esfahbod        unsigned int j;
434f5bc2725cb892264ba223e0a49f7fd2c622a0730Behdad Esfahbod        for (j = end - 1; j > i; j--)
435190eb31a16178269aecaf5d2ecc9012f956749f4Behdad Esfahbod	  if (is_consonant (info[j]))
436f5bc2725cb892264ba223e0a49f7fd2c622a0730Behdad Esfahbod	    break;
437f5bc2725cb892264ba223e0a49f7fd2c622a0730Behdad Esfahbod	if (j > i) {
438f5bc2725cb892264ba223e0a49f7fd2c622a0730Behdad Esfahbod	  /* Move Halant to after last consonant. */
439f5bc2725cb892264ba223e0a49f7fd2c622a0730Behdad Esfahbod	  hb_glyph_info_t t = info[i];
440f5bc2725cb892264ba223e0a49f7fd2c622a0730Behdad Esfahbod	  memmove (&info[i], &info[i + 1], (j - i) * sizeof (info[0]));
441f5bc2725cb892264ba223e0a49f7fd2c622a0730Behdad Esfahbod	  info[j] = t;
442f5bc2725cb892264ba223e0a49f7fd2c622a0730Behdad Esfahbod	}
443f5bc2725cb892264ba223e0a49f7fd2c622a0730Behdad Esfahbod        break;
444f5bc2725cb892264ba223e0a49f7fd2c622a0730Behdad Esfahbod      }
445f5bc2725cb892264ba223e0a49f7fd2c622a0730Behdad Esfahbod  }
446f5bc2725cb892264ba223e0a49f7fd2c622a0730Behdad Esfahbod
44745d6f29f15f1d2323bcaa2498aed23ff0c8a1567Behdad Esfahbod  /* Attach ZWJ, ZWNJ, nukta, and halant to previous char to move with them. */
448a2b471df821b32625d127f83b2f90e6d6a967e7eBehdad Esfahbod  if (!indic_options ().uniscribe_bug_compatible)
449ebe29733d44fe0fa9fb30f946ab0dd7a40336a24Behdad Esfahbod  {
450ebe29733d44fe0fa9fb30f946ab0dd7a40336a24Behdad Esfahbod    /* Please update the Uniscribe branch when touching this! */
451ebe29733d44fe0fa9fb30f946ab0dd7a40336a24Behdad Esfahbod    for (unsigned int i = start + 1; i < end; i++)
452ebe29733d44fe0fa9fb30f946ab0dd7a40336a24Behdad Esfahbod      if ((FLAG (info[i].indic_category()) & (FLAG (OT_ZWNJ) | FLAG (OT_ZWJ) | FLAG (OT_N) | FLAG (OT_H))))
453ebe29733d44fe0fa9fb30f946ab0dd7a40336a24Behdad Esfahbod	info[i].indic_position() = info[i - 1].indic_position();
454ebe29733d44fe0fa9fb30f946ab0dd7a40336a24Behdad Esfahbod  } else {
45567ea29af49bb08ee679914076808327992cf6676Behdad Esfahbod    /*
45667ea29af49bb08ee679914076808327992cf6676Behdad Esfahbod     * Uniscribe doesn't move the Halant with Left Matra.
45767ea29af49bb08ee679914076808327992cf6676Behdad Esfahbod     * TEST: U+092B,U+093F,U+094D
45867ea29af49bb08ee679914076808327992cf6676Behdad Esfahbod     */
459ebe29733d44fe0fa9fb30f946ab0dd7a40336a24Behdad Esfahbod    /* Please update the non-Uniscribe branch when touching this! */
460ebe29733d44fe0fa9fb30f946ab0dd7a40336a24Behdad Esfahbod    for (unsigned int i = start + 1; i < end; i++)
461ebe29733d44fe0fa9fb30f946ab0dd7a40336a24Behdad Esfahbod      if ((FLAG (info[i].indic_category()) & (FLAG (OT_ZWNJ) | FLAG (OT_ZWJ) | FLAG (OT_N) | FLAG (OT_H)))) {
462ebe29733d44fe0fa9fb30f946ab0dd7a40336a24Behdad Esfahbod	info[i].indic_position() = info[i - 1].indic_position();
4636a091df9b403b147ef78f3974610dedf4ce1e08aBehdad Esfahbod	if (info[i].indic_category() == OT_H && info[i].indic_position() == POS_PRE_M)
464ebe29733d44fe0fa9fb30f946ab0dd7a40336a24Behdad Esfahbod	  for (unsigned int j = i; j > start; j--)
4656a091df9b403b147ef78f3974610dedf4ce1e08aBehdad Esfahbod	    if (info[j - 1].indic_position() != POS_PRE_M) {
466ebe29733d44fe0fa9fb30f946ab0dd7a40336a24Behdad Esfahbod	      info[i].indic_position() = info[j - 1].indic_position();
467ebe29733d44fe0fa9fb30f946ab0dd7a40336a24Behdad Esfahbod	      break;
468ebe29733d44fe0fa9fb30f946ab0dd7a40336a24Behdad Esfahbod	    }
469ebe29733d44fe0fa9fb30f946ab0dd7a40336a24Behdad Esfahbod      }
470ebe29733d44fe0fa9fb30f946ab0dd7a40336a24Behdad Esfahbod  }
47145d6f29f15f1d2323bcaa2498aed23ff0c8a1567Behdad Esfahbod
47245d6f29f15f1d2323bcaa2498aed23ff0c8a1567Behdad Esfahbod  /* We do bubble-sort, skip malicious clusters attempts */
473b99d63ae114fb58f129562b293a8a66543d499adBehdad Esfahbod  if (end - start < 64)
474a391ff50b9a7b6ac3e58d199ea726b20ee6839bbBehdad Esfahbod  {
475a391ff50b9a7b6ac3e58d199ea726b20ee6839bbBehdad Esfahbod    /* Sit tight, rock 'n roll! */
476d3637edb248162970e202e9d0671540274192844Behdad Esfahbod    hb_bubble_sort (info + start, end - start, compare_indic_order);
477a391ff50b9a7b6ac3e58d199ea726b20ee6839bbBehdad Esfahbod    /* Find base again */
478a391ff50b9a7b6ac3e58d199ea726b20ee6839bbBehdad Esfahbod    base = end;
4793c2ea9481b1028e927e615a5434ebf8edcb5f891Behdad Esfahbod    for (unsigned int i = start; i < end; i++)
480a391ff50b9a7b6ac3e58d199ea726b20ee6839bbBehdad Esfahbod      if (info[i].indic_position() == POS_BASE_C) {
481a391ff50b9a7b6ac3e58d199ea726b20ee6839bbBehdad Esfahbod        base = i;
482a391ff50b9a7b6ac3e58d199ea726b20ee6839bbBehdad Esfahbod	break;
483a391ff50b9a7b6ac3e58d199ea726b20ee6839bbBehdad Esfahbod      }
484a391ff50b9a7b6ac3e58d199ea726b20ee6839bbBehdad Esfahbod  }
48545d6f29f15f1d2323bcaa2498aed23ff0c8a1567Behdad Esfahbod
486743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod  /* Setup masks now */
487743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod
488281683995a46ed37aeeb84061249758c59822457Behdad Esfahbod  {
489281683995a46ed37aeeb84061249758c59822457Behdad Esfahbod    hb_mask_t mask;
490281683995a46ed37aeeb84061249758c59822457Behdad Esfahbod
491dbb105883c6e9b83e78dc8b10766cd56b98cd7e1Behdad Esfahbod    /* Reph */
492668c6046c1b3af3bd316bda0cc8636f2a5e8df42Behdad Esfahbod    for (unsigned int i = start; i < end && info[i].indic_position() == POS_RA_TO_BECOME_REPH; i++)
49370fe77bb9a25922bd34f206826d8731d901fb451Behdad Esfahbod      info[i].mask |= basic_mask_array[RPHF];
494dbb105883c6e9b83e78dc8b10766cd56b98cd7e1Behdad Esfahbod
495281683995a46ed37aeeb84061249758c59822457Behdad Esfahbod    /* Pre-base */
49670fe77bb9a25922bd34f206826d8731d901fb451Behdad Esfahbod    mask = basic_mask_array[HALF] | basic_mask_array[AKHN] | basic_mask_array[CJCT];
4973c2ea9481b1028e927e615a5434ebf8edcb5f891Behdad Esfahbod    for (unsigned int i = start; i < base; i++)
498281683995a46ed37aeeb84061249758c59822457Behdad Esfahbod      info[i].mask  |= mask;
499281683995a46ed37aeeb84061249758c59822457Behdad Esfahbod    /* Base */
50070fe77bb9a25922bd34f206826d8731d901fb451Behdad Esfahbod    mask = basic_mask_array[AKHN] | basic_mask_array[CJCT];
501281683995a46ed37aeeb84061249758c59822457Behdad Esfahbod    info[base].mask |= mask;
502281683995a46ed37aeeb84061249758c59822457Behdad Esfahbod    /* Post-base */
50370fe77bb9a25922bd34f206826d8731d901fb451Behdad Esfahbod    mask = basic_mask_array[BLWF] | basic_mask_array[ABVF] | basic_mask_array[PSTF] | basic_mask_array[CJCT];
5043c2ea9481b1028e927e615a5434ebf8edcb5f891Behdad Esfahbod    for (unsigned int i = base + 1; i < end; i++)
505281683995a46ed37aeeb84061249758c59822457Behdad Esfahbod      info[i].mask  |= mask;
506281683995a46ed37aeeb84061249758c59822457Behdad Esfahbod  }
5079da0487cd452d780673e24329ce03e174a4ef83bBehdad Esfahbod
50817d7de91d76406d3e92db37d9eef2fc615f06e68Behdad Esfahbod  /* XXX This will not match for old-Indic spec since the Halant-Ra order is reversed already. */
5098e7b5882fb4c1921c9d030d354a9b998115cdb8cBehdad Esfahbod  if (basic_mask_array[PREF] && base + 3 <= end)
51017d7de91d76406d3e92db37d9eef2fc615f06e68Behdad Esfahbod  {
5118e7b5882fb4c1921c9d030d354a9b998115cdb8cBehdad Esfahbod    /* Find a Halant,Ra sequence and mark it for pre-base reordering processing. */
5128e7b5882fb4c1921c9d030d354a9b998115cdb8cBehdad Esfahbod    for (unsigned int i = base + 1; i + 1 < end; i++)
5138e7b5882fb4c1921c9d030d354a9b998115cdb8cBehdad Esfahbod      if (info[i].indic_category() == OT_H &&
5148e7b5882fb4c1921c9d030d354a9b998115cdb8cBehdad Esfahbod	  info[i + 1].indic_category() == OT_Ra)
5158e7b5882fb4c1921c9d030d354a9b998115cdb8cBehdad Esfahbod      {
5168e7b5882fb4c1921c9d030d354a9b998115cdb8cBehdad Esfahbod	info[i].mask |= basic_mask_array[PREF];
5178e7b5882fb4c1921c9d030d354a9b998115cdb8cBehdad Esfahbod	info[i + 1].mask |= basic_mask_array[PREF];
5188e7b5882fb4c1921c9d030d354a9b998115cdb8cBehdad Esfahbod	break;
5198e7b5882fb4c1921c9d030d354a9b998115cdb8cBehdad Esfahbod      }
52017d7de91d76406d3e92db37d9eef2fc615f06e68Behdad Esfahbod  }
52117d7de91d76406d3e92db37d9eef2fc615f06e68Behdad Esfahbod
5229da0487cd452d780673e24329ce03e174a4ef83bBehdad Esfahbod  /* Apply ZWJ/ZWNJ effects */
5233c2ea9481b1028e927e615a5434ebf8edcb5f891Behdad Esfahbod  for (unsigned int i = start + 1; i < end; i++)
5249da0487cd452d780673e24329ce03e174a4ef83bBehdad Esfahbod    if (is_joiner (info[i])) {
5259da0487cd452d780673e24329ce03e174a4ef83bBehdad Esfahbod      bool non_joiner = info[i].indic_category() == OT_ZWNJ;
5266b37bc80843e38ca7b62500f95fd70c08af68d62Behdad Esfahbod      unsigned int j = i;
5279da0487cd452d780673e24329ce03e174a4ef83bBehdad Esfahbod
5289da0487cd452d780673e24329ce03e174a4ef83bBehdad Esfahbod      do {
5299da0487cd452d780673e24329ce03e174a4ef83bBehdad Esfahbod	j--;
5306b37bc80843e38ca7b62500f95fd70c08af68d62Behdad Esfahbod
53170fe77bb9a25922bd34f206826d8731d901fb451Behdad Esfahbod	info[j].mask &= ~basic_mask_array[CJCT];
5326b37bc80843e38ca7b62500f95fd70c08af68d62Behdad Esfahbod	if (non_joiner)
53370fe77bb9a25922bd34f206826d8731d901fb451Behdad Esfahbod	  info[j].mask &= ~basic_mask_array[HALF];
5346b37bc80843e38ca7b62500f95fd70c08af68d62Behdad Esfahbod
5359da0487cd452d780673e24329ce03e174a4ef83bBehdad Esfahbod      } while (j > start && !is_consonant (info[j]));
5369da0487cd452d780673e24329ce03e174a4ef83bBehdad Esfahbod    }
537743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod}
538743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod
539743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod
540743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbodstatic void
5419f377ed3210fe7d9f15e0c4f82020556f9a8f6f0Behdad Esfahbodinitial_reordering_vowel_syllable (const hb_ot_map_t *map,
5429f377ed3210fe7d9f15e0c4f82020556f9a8f6f0Behdad Esfahbod				   hb_buffer_t *buffer,
54370fe77bb9a25922bd34f206826d8731d901fb451Behdad Esfahbod				   hb_mask_t *basic_mask_array,
544ef24cc8c8e2478a6352c340f4611a617646de4ccBehdad Esfahbod				   unsigned int start, unsigned int end)
545743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod{
546c5306b6861cfaa50af40e8ceb058791fa06d7981Behdad Esfahbod  /* We made the vowels look like consonants.  So let's call the consonant logic! */
54770fe77bb9a25922bd34f206826d8731d901fb451Behdad Esfahbod  initial_reordering_consonant_syllable (map, buffer, basic_mask_array, start, end);
548743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod}
549743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod
550743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbodstatic void
5519f377ed3210fe7d9f15e0c4f82020556f9a8f6f0Behdad Esfahbodinitial_reordering_standalone_cluster (const hb_ot_map_t *map,
5529f377ed3210fe7d9f15e0c4f82020556f9a8f6f0Behdad Esfahbod				       hb_buffer_t *buffer,
55370fe77bb9a25922bd34f206826d8731d901fb451Behdad Esfahbod				       hb_mask_t *basic_mask_array,
554ef24cc8c8e2478a6352c340f4611a617646de4ccBehdad Esfahbod				       unsigned int start, unsigned int end)
555743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod{
55618c06e189bd078affbb84c3bb5bb80687a227c5eBehdad Esfahbod  /* We treat NBSP/dotted-circle as if they are consonants, so we should just chain.
55718c06e189bd078affbb84c3bb5bb80687a227c5eBehdad Esfahbod   * Only if not in compatibility mode that is... */
55818c06e189bd078affbb84c3bb5bb80687a227c5eBehdad Esfahbod
559a2b471df821b32625d127f83b2f90e6d6a967e7eBehdad Esfahbod  if (indic_options ().uniscribe_bug_compatible)
56018c06e189bd078affbb84c3bb5bb80687a227c5eBehdad Esfahbod  {
56118c06e189bd078affbb84c3bb5bb80687a227c5eBehdad Esfahbod    /* For dotted-circle, this is what Uniscribe does:
56218c06e189bd078affbb84c3bb5bb80687a227c5eBehdad Esfahbod     * If dotted-circle is the last glyph, it just does nothing.
56318c06e189bd078affbb84c3bb5bb80687a227c5eBehdad Esfahbod     * Ie. It doesn't form Reph. */
56418c06e189bd078affbb84c3bb5bb80687a227c5eBehdad Esfahbod    if (buffer->info[end - 1].indic_category() == OT_DOTTEDCIRCLE)
56518c06e189bd078affbb84c3bb5bb80687a227c5eBehdad Esfahbod      return;
56618c06e189bd078affbb84c3bb5bb80687a227c5eBehdad Esfahbod  }
56718c06e189bd078affbb84c3bb5bb80687a227c5eBehdad Esfahbod
56870fe77bb9a25922bd34f206826d8731d901fb451Behdad Esfahbod  initial_reordering_consonant_syllable (map, buffer, basic_mask_array, start, end);
569743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod}
570743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod
571743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbodstatic void
5729f377ed3210fe7d9f15e0c4f82020556f9a8f6f0Behdad Esfahbodinitial_reordering_non_indic (const hb_ot_map_t *map HB_UNUSED,
5739f377ed3210fe7d9f15e0c4f82020556f9a8f6f0Behdad Esfahbod			      hb_buffer_t *buffer HB_UNUSED,
57470fe77bb9a25922bd34f206826d8731d901fb451Behdad Esfahbod			      hb_mask_t *basic_mask_array HB_UNUSED,
5753f18236a03880c0960f5990dc90685f6146951a6Behdad Esfahbod			      unsigned int start HB_UNUSED, unsigned int end HB_UNUSED)
576743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod{
577743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod  /* Nothing to do right now.  If we ever switch to using the output
578743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod   * buffer in the reordering process, we'd need to next_glyph() here. */
579743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod}
580743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod
581743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod#include "hb-ot-shape-complex-indic-machine.hh"
582743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod
583743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbodstatic void
584743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbodinitial_reordering (const hb_ot_map_t *map,
5853f18236a03880c0960f5990dc90685f6146951a6Behdad Esfahbod		    hb_face_t *face HB_UNUSED,
586743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod		    hb_buffer_t *buffer,
587743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod		    void *user_data HB_UNUSED)
588743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod{
58970fe77bb9a25922bd34f206826d8731d901fb451Behdad Esfahbod  hb_mask_t basic_mask_array[ARRAY_LENGTH (indic_basic_features)] = {0};
590b9ddbd55930228422e82b34a141ad1b6093f5376Behdad Esfahbod  unsigned int num_masks = ARRAY_LENGTH (indic_basic_features);
591b9ddbd55930228422e82b34a141ad1b6093f5376Behdad Esfahbod  for (unsigned int i = 0; i < num_masks; i++)
59270fe77bb9a25922bd34f206826d8731d901fb451Behdad Esfahbod    basic_mask_array[i] = map->get_1_mask (indic_basic_features[i].tag);
593743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod
59470fe77bb9a25922bd34f206826d8731d901fb451Behdad Esfahbod  find_syllables (map, buffer, basic_mask_array);
595b9ddbd55930228422e82b34a141ad1b6093f5376Behdad Esfahbod}
596b9ddbd55930228422e82b34a141ad1b6093f5376Behdad Esfahbod
597743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbodstatic void
59846e645ec4b59f0a278347be11f40c7df700d5bb6Behdad Esfahbodfinal_reordering_syllable (hb_buffer_t *buffer,
59946e645ec4b59f0a278347be11f40c7df700d5bb6Behdad Esfahbod			   hb_mask_t init_mask, hb_mask_t pref_mask,
600ef24cc8c8e2478a6352c340f4611a617646de4ccBehdad Esfahbod			   unsigned int start, unsigned int end)
601743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod{
6024ac9e98d9d2ea973dd612dc4063cf78496c643a0Behdad Esfahbod  hb_glyph_info_t *info = buffer->info;
6034ac9e98d9d2ea973dd612dc4063cf78496c643a0Behdad Esfahbod
604e7be05702447ae270d797398132c1930cd3a9b86Behdad Esfahbod  /* 4. Final reordering:
605e7be05702447ae270d797398132c1930cd3a9b86Behdad Esfahbod   *
606e7be05702447ae270d797398132c1930cd3a9b86Behdad Esfahbod   * After the localized forms and basic shaping forms GSUB features have been
607e7be05702447ae270d797398132c1930cd3a9b86Behdad Esfahbod   * applied (see below), the shaping engine performs some final glyph
608e7be05702447ae270d797398132c1930cd3a9b86Behdad Esfahbod   * reordering before applying all the remaining font features to the entire
609e7be05702447ae270d797398132c1930cd3a9b86Behdad Esfahbod   * cluster.
6104ac9e98d9d2ea973dd612dc4063cf78496c643a0Behdad Esfahbod   */
6114ac9e98d9d2ea973dd612dc4063cf78496c643a0Behdad Esfahbod
6124ac9e98d9d2ea973dd612dc4063cf78496c643a0Behdad Esfahbod  /* Find base again */
6134ac9e98d9d2ea973dd612dc4063cf78496c643a0Behdad Esfahbod  unsigned int base = end;
6144ac9e98d9d2ea973dd612dc4063cf78496c643a0Behdad Esfahbod  for (unsigned int i = start; i < end; i++)
6154ac9e98d9d2ea973dd612dc4063cf78496c643a0Behdad Esfahbod    if (info[i].indic_position() == POS_BASE_C) {
6164ac9e98d9d2ea973dd612dc4063cf78496c643a0Behdad Esfahbod      base = i;
6174ac9e98d9d2ea973dd612dc4063cf78496c643a0Behdad Esfahbod      break;
6184ac9e98d9d2ea973dd612dc4063cf78496c643a0Behdad Esfahbod    }
6194ac9e98d9d2ea973dd612dc4063cf78496c643a0Behdad Esfahbod
6204705a7026900e51f6430f03a73c87f2df035df92Behdad Esfahbod  unsigned int start_of_last_cluster = base;
6214705a7026900e51f6430f03a73c87f2df035df92Behdad Esfahbod
6224ac9e98d9d2ea973dd612dc4063cf78496c643a0Behdad Esfahbod  /*   o Reorder matras:
623e7be05702447ae270d797398132c1930cd3a9b86Behdad Esfahbod   *
624e7be05702447ae270d797398132c1930cd3a9b86Behdad Esfahbod   *     If a pre-base matra character had been reordered before applying basic
625e7be05702447ae270d797398132c1930cd3a9b86Behdad Esfahbod   *     features, the glyph can be moved closer to the main consonant based on
626e7be05702447ae270d797398132c1930cd3a9b86Behdad Esfahbod   *     whether half-forms had been formed. Actual position for the matra is
627e7be05702447ae270d797398132c1930cd3a9b86Behdad Esfahbod   *     defined as “after last standalone halant glyph, after initial matra
628e7be05702447ae270d797398132c1930cd3a9b86Behdad Esfahbod   *     position and before the main consonant”. If ZWJ or ZWNJ follow this
629e7be05702447ae270d797398132c1930cd3a9b86Behdad Esfahbod   *     halant, position is moved after it.
6304ac9e98d9d2ea973dd612dc4063cf78496c643a0Behdad Esfahbod   */
6314ac9e98d9d2ea973dd612dc4063cf78496c643a0Behdad Esfahbod
632362d3db8d3527d0fef260a17d2466e92a4a25425Behdad Esfahbod  if (start < base) /* Otherwise there can't be any pre-base matra characters. */
6339d0d319a4a7e85d922e58fade0f40caae1c9f109Behdad Esfahbod  {
634921ce5b17daf06af8e17989a3e335b9f5df20483Behdad Esfahbod    unsigned int new_pos = base - 1;
635921ce5b17daf06af8e17989a3e335b9f5df20483Behdad Esfahbod    while (new_pos > start &&
636921ce5b17daf06af8e17989a3e335b9f5df20483Behdad Esfahbod	   !(FLAG (info[new_pos].indic_category()) & (FLAG (OT_M) | FLAG (OT_H))))
637921ce5b17daf06af8e17989a3e335b9f5df20483Behdad Esfahbod      new_pos--;
6389d0d319a4a7e85d922e58fade0f40caae1c9f109Behdad Esfahbod    /* If we found no Halant we are done.  Otherwise only proceed if the Halant does
6399d0d319a4a7e85d922e58fade0f40caae1c9f109Behdad Esfahbod     * not belong to the Matra itself! */
640921ce5b17daf06af8e17989a3e335b9f5df20483Behdad Esfahbod    if (info[new_pos].indic_category() == OT_H &&
641921ce5b17daf06af8e17989a3e335b9f5df20483Behdad Esfahbod	info[new_pos].indic_position() != POS_PRE_M) {
6429d0d319a4a7e85d922e58fade0f40caae1c9f109Behdad Esfahbod      /* -> If ZWJ or ZWNJ follow this halant, position is moved after it. */
643921ce5b17daf06af8e17989a3e335b9f5df20483Behdad Esfahbod      if (new_pos + 1 < end && is_joiner (info[new_pos + 1]))
644921ce5b17daf06af8e17989a3e335b9f5df20483Behdad Esfahbod	new_pos++;
6459d0d319a4a7e85d922e58fade0f40caae1c9f109Behdad Esfahbod
6469d0d319a4a7e85d922e58fade0f40caae1c9f109Behdad Esfahbod      /* Now go see if there's actually any matras... */
647921ce5b17daf06af8e17989a3e335b9f5df20483Behdad Esfahbod      for (unsigned int i = new_pos; i > start; i--)
6486a091df9b403b147ef78f3974610dedf4ce1e08aBehdad Esfahbod	if (info[i - 1].indic_position () == POS_PRE_M)
6499d0d319a4a7e85d922e58fade0f40caae1c9f109Behdad Esfahbod	{
6501a1dbe9a2787f226f3e43063da8eb6633438b0a0Behdad Esfahbod	  unsigned int old_pos = i - 1;
6511a1dbe9a2787f226f3e43063da8eb6633438b0a0Behdad Esfahbod	  hb_glyph_info_t tmp = info[old_pos];
6521a1dbe9a2787f226f3e43063da8eb6633438b0a0Behdad Esfahbod	  memmove (&info[old_pos], &info[old_pos + 1], (new_pos - old_pos) * sizeof (info[0]));
6531a1dbe9a2787f226f3e43063da8eb6633438b0a0Behdad Esfahbod	  info[new_pos] = tmp;
654921ce5b17daf06af8e17989a3e335b9f5df20483Behdad Esfahbod	  start_of_last_cluster = MIN (new_pos, start_of_last_cluster);
655921ce5b17daf06af8e17989a3e335b9f5df20483Behdad Esfahbod	  new_pos--;
6569d0d319a4a7e85d922e58fade0f40caae1c9f109Behdad Esfahbod	}
6579d0d319a4a7e85d922e58fade0f40caae1c9f109Behdad Esfahbod    }
6584ac9e98d9d2ea973dd612dc4063cf78496c643a0Behdad Esfahbod  }
6594ac9e98d9d2ea973dd612dc4063cf78496c643a0Behdad Esfahbod
6604ac9e98d9d2ea973dd612dc4063cf78496c643a0Behdad Esfahbod
6614ac9e98d9d2ea973dd612dc4063cf78496c643a0Behdad Esfahbod  /*   o Reorder reph:
662e7be05702447ae270d797398132c1930cd3a9b86Behdad Esfahbod   *
663e7be05702447ae270d797398132c1930cd3a9b86Behdad Esfahbod   *     Reph’s original position is always at the beginning of the syllable,
664e7be05702447ae270d797398132c1930cd3a9b86Behdad Esfahbod   *     (i.e. it is not reordered at the character reordering stage). However,
665e7be05702447ae270d797398132c1930cd3a9b86Behdad Esfahbod   *     it will be reordered according to the basic-forms shaping results.
666e7be05702447ae270d797398132c1930cd3a9b86Behdad Esfahbod   *     Possible positions for reph, depending on the script, are; after main,
667e7be05702447ae270d797398132c1930cd3a9b86Behdad Esfahbod   *     before post-base consonant forms, and after post-base consonant forms.
668dbb105883c6e9b83e78dc8b10766cd56b98cd7e1Behdad Esfahbod   */
669dbb105883c6e9b83e78dc8b10766cd56b98cd7e1Behdad Esfahbod
670dbb105883c6e9b83e78dc8b10766cd56b98cd7e1Behdad Esfahbod  /* If there's anything after the Ra that has the REPH pos, it ought to be halant.
671dbb105883c6e9b83e78dc8b10766cd56b98cd7e1Behdad Esfahbod   * Which means that the font has failed to ligate the Reph.  In which case, we
672dbb105883c6e9b83e78dc8b10766cd56b98cd7e1Behdad Esfahbod   * shouldn't move. */
673dbb105883c6e9b83e78dc8b10766cd56b98cd7e1Behdad Esfahbod  if (start + 1 < end &&
674dbb105883c6e9b83e78dc8b10766cd56b98cd7e1Behdad Esfahbod      info[start].indic_position() == POS_RA_TO_BECOME_REPH &&
675dbb105883c6e9b83e78dc8b10766cd56b98cd7e1Behdad Esfahbod      info[start + 1].indic_position() != POS_RA_TO_BECOME_REPH)
676dbb105883c6e9b83e78dc8b10766cd56b98cd7e1Behdad Esfahbod  {
67702b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod      unsigned int new_reph_pos;
67802b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod
67902b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod     enum reph_position_t {
680f89367251109af235f4f0446c13c261a5a4a6f72Behdad Esfahbod       REPH_AFTER_MAIN,
681f89367251109af235f4f0446c13c261a5a4a6f72Behdad Esfahbod       REPH_BEFORE_SUBSCRIPT,
682f89367251109af235f4f0446c13c261a5a4a6f72Behdad Esfahbod       REPH_AFTER_SUBSCRIPT,
683f89367251109af235f4f0446c13c261a5a4a6f72Behdad Esfahbod       REPH_BEFORE_POSTSCRIPT,
6849fc7a11469113d31d8095757c4fc038c3427d44aBehdad Esfahbod       REPH_AFTER_POSTSCRIPT
685f89367251109af235f4f0446c13c261a5a4a6f72Behdad Esfahbod     } reph_pos;
686f89367251109af235f4f0446c13c261a5a4a6f72Behdad Esfahbod
687f89367251109af235f4f0446c13c261a5a4a6f72Behdad Esfahbod     /* XXX Figure out old behavior too */
6887f852b644b8143492a02edfc853114aaa23446bdBehdad Esfahbod     switch ((hb_tag_t) buffer->props.script)
689f89367251109af235f4f0446c13c261a5a4a6f72Behdad Esfahbod     {
690f89367251109af235f4f0446c13c261a5a4a6f72Behdad Esfahbod       case HB_SCRIPT_MALAYALAM:
691f89367251109af235f4f0446c13c261a5a4a6f72Behdad Esfahbod       case HB_SCRIPT_ORIYA:
692f89367251109af235f4f0446c13c261a5a4a6f72Behdad Esfahbod	 reph_pos = REPH_AFTER_MAIN;
693f89367251109af235f4f0446c13c261a5a4a6f72Behdad Esfahbod	 break;
694f89367251109af235f4f0446c13c261a5a4a6f72Behdad Esfahbod
695f89367251109af235f4f0446c13c261a5a4a6f72Behdad Esfahbod       case HB_SCRIPT_GURMUKHI:
696f89367251109af235f4f0446c13c261a5a4a6f72Behdad Esfahbod	 reph_pos = REPH_BEFORE_SUBSCRIPT;
697f89367251109af235f4f0446c13c261a5a4a6f72Behdad Esfahbod	 break;
698f89367251109af235f4f0446c13c261a5a4a6f72Behdad Esfahbod
699f89367251109af235f4f0446c13c261a5a4a6f72Behdad Esfahbod       case HB_SCRIPT_BENGALI:
700f89367251109af235f4f0446c13c261a5a4a6f72Behdad Esfahbod	 reph_pos = REPH_AFTER_SUBSCRIPT;
701f89367251109af235f4f0446c13c261a5a4a6f72Behdad Esfahbod	 break;
702f89367251109af235f4f0446c13c261a5a4a6f72Behdad Esfahbod
703f89367251109af235f4f0446c13c261a5a4a6f72Behdad Esfahbod       default:
704f89367251109af235f4f0446c13c261a5a4a6f72Behdad Esfahbod       case HB_SCRIPT_DEVANAGARI:
705f89367251109af235f4f0446c13c261a5a4a6f72Behdad Esfahbod       case HB_SCRIPT_GUJARATI:
706f89367251109af235f4f0446c13c261a5a4a6f72Behdad Esfahbod	 reph_pos = REPH_BEFORE_POSTSCRIPT;
707f89367251109af235f4f0446c13c261a5a4a6f72Behdad Esfahbod	 break;
708f89367251109af235f4f0446c13c261a5a4a6f72Behdad Esfahbod
709f89367251109af235f4f0446c13c261a5a4a6f72Behdad Esfahbod       case HB_SCRIPT_KANNADA:
710f89367251109af235f4f0446c13c261a5a4a6f72Behdad Esfahbod       case HB_SCRIPT_TAMIL:
711f89367251109af235f4f0446c13c261a5a4a6f72Behdad Esfahbod       case HB_SCRIPT_TELUGU:
712f89367251109af235f4f0446c13c261a5a4a6f72Behdad Esfahbod	 reph_pos = REPH_AFTER_POSTSCRIPT;
713f89367251109af235f4f0446c13c261a5a4a6f72Behdad Esfahbod	 break;
714f89367251109af235f4f0446c13c261a5a4a6f72Behdad Esfahbod     }
71502b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod
716dbb105883c6e9b83e78dc8b10766cd56b98cd7e1Behdad Esfahbod    /*       1. If reph should be positioned after post-base consonant forms,
717dbb105883c6e9b83e78dc8b10766cd56b98cd7e1Behdad Esfahbod     *          proceed to step 5.
71802b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod     */
7199d0d319a4a7e85d922e58fade0f40caae1c9f109Behdad Esfahbod    if (reph_pos == REPH_AFTER_POSTSCRIPT)
72002b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod    {
7219d0d319a4a7e85d922e58fade0f40caae1c9f109Behdad Esfahbod      goto reph_step_5;
72202b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod    }
72302b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod
72402b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod    /*       2. If the reph repositioning class is not after post-base: target
725dbb105883c6e9b83e78dc8b10766cd56b98cd7e1Behdad Esfahbod     *          position is after the first explicit halant glyph between the
726dbb105883c6e9b83e78dc8b10766cd56b98cd7e1Behdad Esfahbod     *          first post-reph consonant and last main consonant. If ZWJ or ZWNJ
727dbb105883c6e9b83e78dc8b10766cd56b98cd7e1Behdad Esfahbod     *          are following this halant, position is moved after it. If such
728dbb105883c6e9b83e78dc8b10766cd56b98cd7e1Behdad Esfahbod     *          position is found, this is the target position. Otherwise,
729dbb105883c6e9b83e78dc8b10766cd56b98cd7e1Behdad Esfahbod     *          proceed to the next step.
730dbb105883c6e9b83e78dc8b10766cd56b98cd7e1Behdad Esfahbod     *
731dbb105883c6e9b83e78dc8b10766cd56b98cd7e1Behdad Esfahbod     *          Note: in old-implementation fonts, where classifications were
732dbb105883c6e9b83e78dc8b10766cd56b98cd7e1Behdad Esfahbod     *          fixed in shaping engine, there was no case where reph position
733dbb105883c6e9b83e78dc8b10766cd56b98cd7e1Behdad Esfahbod     *          will be found on this step.
73402b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod     */
73502b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod    {
73602b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod      new_reph_pos = start + 1;
73702b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod      while (new_reph_pos < base && info[new_reph_pos].indic_category() != OT_H)
73802b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod	new_reph_pos++;
73902b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod
74002b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod      if (new_reph_pos < base && info[new_reph_pos].indic_category() == OT_H) {
74102b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod	/* ->If ZWJ or ZWNJ are following this halant, position is moved after it. */
74202b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod	if (new_reph_pos + 1 < base && is_joiner (info[new_reph_pos + 1]))
74302b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod	  new_reph_pos++;
74402b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod	goto reph_move;
74502b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod      }
74602b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod    }
74702b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod
74802b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod    /*       3. If reph should be repositioned after the main consonant: find the
749dbb105883c6e9b83e78dc8b10766cd56b98cd7e1Behdad Esfahbod     *          first consonant not ligated with main, or find the first
750dbb105883c6e9b83e78dc8b10766cd56b98cd7e1Behdad Esfahbod     *          consonant that is not a potential pre-base reordering Ra.
75102b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod     */
7529d0d319a4a7e85d922e58fade0f40caae1c9f109Behdad Esfahbod    if (reph_pos == REPH_AFTER_MAIN)
75302b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod    {
754b504e060f008e95b1ba36c06600c9fea4f5d4808Behdad Esfahbod      new_reph_pos = base;
755b504e060f008e95b1ba36c06600c9fea4f5d4808Behdad Esfahbod      /* XXX Skip potential pre-base reordering Ra. */
756b504e060f008e95b1ba36c06600c9fea4f5d4808Behdad Esfahbod      while (new_reph_pos < end &&
757b504e060f008e95b1ba36c06600c9fea4f5d4808Behdad Esfahbod	     !( FLAG (info[new_reph_pos + 1].indic_position()) & (FLAG (POS_BELOW_C) | FLAG (POS_POST_C) | FLAG (POS_POST_M) | FLAG (POS_SMVD))))
758b504e060f008e95b1ba36c06600c9fea4f5d4808Behdad Esfahbod	new_reph_pos++;
759b504e060f008e95b1ba36c06600c9fea4f5d4808Behdad Esfahbod      if (new_reph_pos < end)
760b504e060f008e95b1ba36c06600c9fea4f5d4808Behdad Esfahbod        goto reph_move;
76102b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod    }
76202b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod
76302b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod    /*       4. If reph should be positioned before post-base consonant, find
764dbb105883c6e9b83e78dc8b10766cd56b98cd7e1Behdad Esfahbod     *          first post-base classified consonant not ligated with main. If no
765dbb105883c6e9b83e78dc8b10766cd56b98cd7e1Behdad Esfahbod     *          consonant is found, the target position should be before the
766dbb105883c6e9b83e78dc8b10766cd56b98cd7e1Behdad Esfahbod     *          first matra, syllable modifier sign or vedic sign.
76702b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod     */
7689d0d319a4a7e85d922e58fade0f40caae1c9f109Behdad Esfahbod    /* This is our take on what step 4 is trying to say (and failing, BADLY). */
7699d0d319a4a7e85d922e58fade0f40caae1c9f109Behdad Esfahbod    if (reph_pos == REPH_AFTER_SUBSCRIPT)
77002b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod    {
7719d0d319a4a7e85d922e58fade0f40caae1c9f109Behdad Esfahbod      new_reph_pos = base;
7729d0d319a4a7e85d922e58fade0f40caae1c9f109Behdad Esfahbod      while (new_reph_pos < end &&
7736a091df9b403b147ef78f3974610dedf4ce1e08aBehdad Esfahbod	     !( FLAG (info[new_reph_pos + 1].indic_position()) & (FLAG (POS_POST_C) | FLAG (POS_POST_M) | FLAG (POS_SMVD))))
7749d0d319a4a7e85d922e58fade0f40caae1c9f109Behdad Esfahbod	new_reph_pos++;
7759d0d319a4a7e85d922e58fade0f40caae1c9f109Behdad Esfahbod      if (new_reph_pos < end)
7769d0d319a4a7e85d922e58fade0f40caae1c9f109Behdad Esfahbod        goto reph_move;
77702b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod    }
77802b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod
77902b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod    /*       5. If no consonant is found in steps 3 or 4, move reph to a position
780dbb105883c6e9b83e78dc8b10766cd56b98cd7e1Behdad Esfahbod     *          immediately before the first post-base matra, syllable modifier
781dbb105883c6e9b83e78dc8b10766cd56b98cd7e1Behdad Esfahbod     *          sign or vedic sign that has a reordering class after the intended
782dbb105883c6e9b83e78dc8b10766cd56b98cd7e1Behdad Esfahbod     *          reph position. For example, if the reordering position for reph
783dbb105883c6e9b83e78dc8b10766cd56b98cd7e1Behdad Esfahbod     *          is post-main, it will skip above-base matras that also have a
784dbb105883c6e9b83e78dc8b10766cd56b98cd7e1Behdad Esfahbod     *          post-main position.
785dbb105883c6e9b83e78dc8b10766cd56b98cd7e1Behdad Esfahbod     */
78602b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod    reph_step_5:
78702b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod    {
78802b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod      /* XXX */
78902b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod    }
790dbb105883c6e9b83e78dc8b10766cd56b98cd7e1Behdad Esfahbod
79102b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod    /*       6. Otherwise, reorder reph to the end of the syllable.
79202b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod     */
79302b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod    {
79402b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod      new_reph_pos = end - 1;
79502b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod      while (new_reph_pos > start && info[new_reph_pos].indic_position() == POS_SMVD)
79602b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod	new_reph_pos--;
79702b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod
798892eb7878238d810a2a70f9dadbf958207bfeaa1Behdad Esfahbod      /*
799892eb7878238d810a2a70f9dadbf958207bfeaa1Behdad Esfahbod       * If the Reph is to be ending up after a Matra,Halant sequence,
800892eb7878238d810a2a70f9dadbf958207bfeaa1Behdad Esfahbod       * position it before that Halant so it can interact with the Matra.
801892eb7878238d810a2a70f9dadbf958207bfeaa1Behdad Esfahbod       * However, if it's a plain Consonant,Halant we shouldn't do that.
802892eb7878238d810a2a70f9dadbf958207bfeaa1Behdad Esfahbod       * Uniscribe doesn't do this.
803892eb7878238d810a2a70f9dadbf958207bfeaa1Behdad Esfahbod       * TEST: U+0930,U+094D,U+0915,U+094B,U+094D
804892eb7878238d810a2a70f9dadbf958207bfeaa1Behdad Esfahbod       */
805a2b471df821b32625d127f83b2f90e6d6a967e7eBehdad Esfahbod      if (!indic_options ().uniscribe_bug_compatible &&
806892eb7878238d810a2a70f9dadbf958207bfeaa1Behdad Esfahbod	  unlikely (info[new_reph_pos].indic_category() == OT_H)) {
80702b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod	for (unsigned int i = base + 1; i < new_reph_pos; i++)
80802b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod	  if (info[i].indic_category() == OT_M) {
80902b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod	    /* Ok, got it. */
81002b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod	    new_reph_pos--;
81102b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod	  }
81202b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod      }
81302b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod      goto reph_move;
8148df5636968389ac7bf8620ccd091fd4872b0bbeeBehdad Esfahbod    }
8158df5636968389ac7bf8620ccd091fd4872b0bbeeBehdad Esfahbod
81602b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod    reph_move:
81702b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod    {
81802b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod      /* Move */
81902b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod      hb_glyph_info_t reph = info[start];
82002b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod      memmove (&info[start], &info[start + 1], (new_reph_pos - start) * sizeof (info[0]));
82102b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod      info[new_reph_pos] = reph;
82202b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod      start_of_last_cluster = start; /* Yay, one big cluster! */
82302b2922fbf098c8282eb23dc2c54d5829cf67024Behdad Esfahbod    }
824dbb105883c6e9b83e78dc8b10766cd56b98cd7e1Behdad Esfahbod  }
825dbb105883c6e9b83e78dc8b10766cd56b98cd7e1Behdad Esfahbod
826dbb105883c6e9b83e78dc8b10766cd56b98cd7e1Behdad Esfahbod
827dbb105883c6e9b83e78dc8b10766cd56b98cd7e1Behdad Esfahbod  /*   o Reorder pre-base reordering consonants:
828e7be05702447ae270d797398132c1930cd3a9b86Behdad Esfahbod   *
829e7be05702447ae270d797398132c1930cd3a9b86Behdad Esfahbod   *     If a pre-base reordering consonant is found, reorder it according to
830e7be05702447ae270d797398132c1930cd3a9b86Behdad Esfahbod   *     the following rules:
831e7be05702447ae270d797398132c1930cd3a9b86Behdad Esfahbod   */
832e7be05702447ae270d797398132c1930cd3a9b86Behdad Esfahbod
83346e645ec4b59f0a278347be11f40c7df700d5bb6Behdad Esfahbod  if (pref_mask && base + 1 < end) /* Otherwise there can't be any pre-base reordering Ra. */
83446e645ec4b59f0a278347be11f40c7df700d5bb6Behdad Esfahbod  {
8358e7b5882fb4c1921c9d030d354a9b998115cdb8cBehdad Esfahbod    for (unsigned int i = base + 1; i < end; i++)
8368e7b5882fb4c1921c9d030d354a9b998115cdb8cBehdad Esfahbod      if ((info[i].mask & pref_mask) != 0)
83778818124b17691ec2c647142fdb9ae743aa03deeBehdad Esfahbod      {
8388e7b5882fb4c1921c9d030d354a9b998115cdb8cBehdad Esfahbod	/*       1. Only reorder a glyph produced by substitution during application
8398e7b5882fb4c1921c9d030d354a9b998115cdb8cBehdad Esfahbod	 *          of the <pref> feature. (Note that a font may shape a Ra consonant with
8408e7b5882fb4c1921c9d030d354a9b998115cdb8cBehdad Esfahbod	 *          the feature generally but block it in certain contexts.)
8418e7b5882fb4c1921c9d030d354a9b998115cdb8cBehdad Esfahbod	 */
8428e7b5882fb4c1921c9d030d354a9b998115cdb8cBehdad Esfahbod	if (i + 1 == end || (info[i + 1].mask & pref_mask) == 0)
8438e7b5882fb4c1921c9d030d354a9b998115cdb8cBehdad Esfahbod	{
8448e7b5882fb4c1921c9d030d354a9b998115cdb8cBehdad Esfahbod	  /*
8458e7b5882fb4c1921c9d030d354a9b998115cdb8cBehdad Esfahbod	   *       2. Try to find a target position the same way as for pre-base matra.
8468e7b5882fb4c1921c9d030d354a9b998115cdb8cBehdad Esfahbod	   *          If it is found, reorder pre-base consonant glyph.
8478e7b5882fb4c1921c9d030d354a9b998115cdb8cBehdad Esfahbod	   *
8488e7b5882fb4c1921c9d030d354a9b998115cdb8cBehdad Esfahbod	   *       3. If position is not found, reorder immediately before main
8498e7b5882fb4c1921c9d030d354a9b998115cdb8cBehdad Esfahbod	   *          consonant.
8508e7b5882fb4c1921c9d030d354a9b998115cdb8cBehdad Esfahbod	   */
8518e7b5882fb4c1921c9d030d354a9b998115cdb8cBehdad Esfahbod
8528e7b5882fb4c1921c9d030d354a9b998115cdb8cBehdad Esfahbod	  unsigned int new_pos = base;
8538e7b5882fb4c1921c9d030d354a9b998115cdb8cBehdad Esfahbod	  while (new_pos > start + 1 &&
8548e7b5882fb4c1921c9d030d354a9b998115cdb8cBehdad Esfahbod		 !(FLAG (info[new_pos - 1].indic_category()) & (FLAG (OT_M) | FLAG (OT_H))))
8558e7b5882fb4c1921c9d030d354a9b998115cdb8cBehdad Esfahbod	    new_pos--;
8568e7b5882fb4c1921c9d030d354a9b998115cdb8cBehdad Esfahbod
8578e7b5882fb4c1921c9d030d354a9b998115cdb8cBehdad Esfahbod	  if (new_pos > start && info[new_pos - 1].indic_category() == OT_H)
8588e7b5882fb4c1921c9d030d354a9b998115cdb8cBehdad Esfahbod	    /* -> If ZWJ or ZWNJ follow this halant, position is moved after it. */
8598e7b5882fb4c1921c9d030d354a9b998115cdb8cBehdad Esfahbod	    if (new_pos < end && is_joiner (info[new_pos]))
8608e7b5882fb4c1921c9d030d354a9b998115cdb8cBehdad Esfahbod	      new_pos++;
8618e7b5882fb4c1921c9d030d354a9b998115cdb8cBehdad Esfahbod
8628e7b5882fb4c1921c9d030d354a9b998115cdb8cBehdad Esfahbod	  {
8638e7b5882fb4c1921c9d030d354a9b998115cdb8cBehdad Esfahbod	    unsigned int old_pos = i;
8648e7b5882fb4c1921c9d030d354a9b998115cdb8cBehdad Esfahbod	    hb_glyph_info_t tmp = info[old_pos];
8658e7b5882fb4c1921c9d030d354a9b998115cdb8cBehdad Esfahbod	    memmove (&info[new_pos + 1], &info[new_pos], (old_pos - new_pos) * sizeof (info[0]));
8668e7b5882fb4c1921c9d030d354a9b998115cdb8cBehdad Esfahbod	    info[new_pos] = tmp;
8678e7b5882fb4c1921c9d030d354a9b998115cdb8cBehdad Esfahbod	    start_of_last_cluster = MIN (new_pos, start_of_last_cluster);
8688e7b5882fb4c1921c9d030d354a9b998115cdb8cBehdad Esfahbod	  }
8698e7b5882fb4c1921c9d030d354a9b998115cdb8cBehdad Esfahbod	}
8708e7b5882fb4c1921c9d030d354a9b998115cdb8cBehdad Esfahbod
8718e7b5882fb4c1921c9d030d354a9b998115cdb8cBehdad Esfahbod        break;
87278818124b17691ec2c647142fdb9ae743aa03deeBehdad Esfahbod      }
87346e645ec4b59f0a278347be11f40c7df700d5bb6Behdad Esfahbod  }
874eed903b1644e087178438959664a6a57bebc398bBehdad Esfahbod
875eed903b1644e087178438959664a6a57bebc398bBehdad Esfahbod
876a913b024d84973556094fd64ce5f0b7106fcc3b5Behdad Esfahbod  /* Apply 'init' to the Left Matra if it's a word start. */
8776a091df9b403b147ef78f3974610dedf4ce1e08aBehdad Esfahbod  if (info[start].indic_position () == POS_PRE_M &&
878a913b024d84973556094fd64ce5f0b7106fcc3b5Behdad Esfahbod      (!start ||
879eace47b173807d94b29a6490d0bc3c9f8f6168d1Behdad Esfahbod       !(FLAG (_hb_glyph_info_get_general_category (&info[start - 1])) &
880a913b024d84973556094fd64ce5f0b7106fcc3b5Behdad Esfahbod	 (FLAG (HB_UNICODE_GENERAL_CATEGORY_LOWERCASE_LETTER) |
881a913b024d84973556094fd64ce5f0b7106fcc3b5Behdad Esfahbod	  FLAG (HB_UNICODE_GENERAL_CATEGORY_MODIFIER_LETTER) |
882a913b024d84973556094fd64ce5f0b7106fcc3b5Behdad Esfahbod	  FLAG (HB_UNICODE_GENERAL_CATEGORY_OTHER_LETTER) |
883a913b024d84973556094fd64ce5f0b7106fcc3b5Behdad Esfahbod	  FLAG (HB_UNICODE_GENERAL_CATEGORY_TITLECASE_LETTER) |
884a913b024d84973556094fd64ce5f0b7106fcc3b5Behdad Esfahbod	  FLAG (HB_UNICODE_GENERAL_CATEGORY_UPPERCASE_LETTER) |
885a913b024d84973556094fd64ce5f0b7106fcc3b5Behdad Esfahbod	  FLAG (HB_UNICODE_GENERAL_CATEGORY_SPACING_MARK) |
886a913b024d84973556094fd64ce5f0b7106fcc3b5Behdad Esfahbod	  FLAG (HB_UNICODE_GENERAL_CATEGORY_ENCLOSING_MARK) |
887a913b024d84973556094fd64ce5f0b7106fcc3b5Behdad Esfahbod	  FLAG (HB_UNICODE_GENERAL_CATEGORY_NON_SPACING_MARK)))))
88846e645ec4b59f0a278347be11f40c7df700d5bb6Behdad Esfahbod    info[start].mask |= init_mask;
889a913b024d84973556094fd64ce5f0b7106fcc3b5Behdad Esfahbod
890eed903b1644e087178438959664a6a57bebc398bBehdad Esfahbod
89121d2803133c2c424ed37a9f3d17c7fc4963e5a60Behdad Esfahbod
89221d2803133c2c424ed37a9f3d17c7fc4963e5a60Behdad Esfahbod  /* Finish off the clusters and go home! */
89321d2803133c2c424ed37a9f3d17c7fc4963e5a60Behdad Esfahbod
894a2b471df821b32625d127f83b2f90e6d6a967e7eBehdad Esfahbod  if (!indic_options ().uniscribe_bug_compatible)
895ebe29733d44fe0fa9fb30f946ab0dd7a40336a24Behdad Esfahbod  {
89621d2803133c2c424ed37a9f3d17c7fc4963e5a60Behdad Esfahbod    /* This is what Uniscribe does.  Ie. add cluster boundaries after Halant,ZWNJ.
89721d2803133c2c424ed37a9f3d17c7fc4963e5a60Behdad Esfahbod     * This means, half forms are submerged into the main consonants cluster.
89821d2803133c2c424ed37a9f3d17c7fc4963e5a60Behdad Esfahbod     * This is unnecessary, and makes cursor positioning harder, but that's what
89921d2803133c2c424ed37a9f3d17c7fc4963e5a60Behdad Esfahbod     * Uniscribe does. */
90021d2803133c2c424ed37a9f3d17c7fc4963e5a60Behdad Esfahbod    unsigned int cluster_start = start;
90121d2803133c2c424ed37a9f3d17c7fc4963e5a60Behdad Esfahbod    for (unsigned int i = start + 1; i < start_of_last_cluster; i++)
90221d2803133c2c424ed37a9f3d17c7fc4963e5a60Behdad Esfahbod      if (info[i - 1].indic_category() == OT_H && info[i].indic_category() == OT_ZWNJ) {
90321d2803133c2c424ed37a9f3d17c7fc4963e5a60Behdad Esfahbod        i++;
90421d2803133c2c424ed37a9f3d17c7fc4963e5a60Behdad Esfahbod	buffer->merge_clusters (cluster_start, i);
90521d2803133c2c424ed37a9f3d17c7fc4963e5a60Behdad Esfahbod	cluster_start = i;
90621d2803133c2c424ed37a9f3d17c7fc4963e5a60Behdad Esfahbod      }
90721d2803133c2c424ed37a9f3d17c7fc4963e5a60Behdad Esfahbod    start_of_last_cluster = cluster_start;
90821d2803133c2c424ed37a9f3d17c7fc4963e5a60Behdad Esfahbod  }
90921d2803133c2c424ed37a9f3d17c7fc4963e5a60Behdad Esfahbod
91021d2803133c2c424ed37a9f3d17c7fc4963e5a60Behdad Esfahbod  buffer->merge_clusters (start_of_last_cluster, end);
911ef24cc8c8e2478a6352c340f4611a617646de4ccBehdad Esfahbod}
912e7be05702447ae270d797398132c1930cd3a9b86Behdad Esfahbod
913e7be05702447ae270d797398132c1930cd3a9b86Behdad Esfahbod
914ef24cc8c8e2478a6352c340f4611a617646de4ccBehdad Esfahbodstatic void
915ef24cc8c8e2478a6352c340f4611a617646de4ccBehdad Esfahbodfinal_reordering (const hb_ot_map_t *map,
9163f18236a03880c0960f5990dc90685f6146951a6Behdad Esfahbod		  hb_face_t *face HB_UNUSED,
917ef24cc8c8e2478a6352c340f4611a617646de4ccBehdad Esfahbod		  hb_buffer_t *buffer,
918ef24cc8c8e2478a6352c340f4611a617646de4ccBehdad Esfahbod		  void *user_data HB_UNUSED)
919ef24cc8c8e2478a6352c340f4611a617646de4ccBehdad Esfahbod{
920ef24cc8c8e2478a6352c340f4611a617646de4ccBehdad Esfahbod  unsigned int count = buffer->len;
921ef24cc8c8e2478a6352c340f4611a617646de4ccBehdad Esfahbod  if (!count) return;
922ef24cc8c8e2478a6352c340f4611a617646de4ccBehdad Esfahbod
92346e645ec4b59f0a278347be11f40c7df700d5bb6Behdad Esfahbod  hb_mask_t init_mask = map->get_1_mask (HB_TAG('i','n','i','t'));
92446e645ec4b59f0a278347be11f40c7df700d5bb6Behdad Esfahbod  hb_mask_t pref_mask = map->get_1_mask (HB_TAG('p','r','e','f'));
925eed903b1644e087178438959664a6a57bebc398bBehdad Esfahbod
926ef24cc8c8e2478a6352c340f4611a617646de4ccBehdad Esfahbod  hb_glyph_info_t *info = buffer->info;
927ef24cc8c8e2478a6352c340f4611a617646de4ccBehdad Esfahbod  unsigned int last = 0;
928cee7187447b76b22e1bb6136d137b35ac49c3a5dBehdad Esfahbod  unsigned int last_syllable = info[0].syllable();
929ef24cc8c8e2478a6352c340f4611a617646de4ccBehdad Esfahbod  for (unsigned int i = 1; i < count; i++)
930cee7187447b76b22e1bb6136d137b35ac49c3a5dBehdad Esfahbod    if (last_syllable != info[i].syllable()) {
93146e645ec4b59f0a278347be11f40c7df700d5bb6Behdad Esfahbod      final_reordering_syllable (buffer, init_mask, pref_mask, last, i);
932ef24cc8c8e2478a6352c340f4611a617646de4ccBehdad Esfahbod      last = i;
933cee7187447b76b22e1bb6136d137b35ac49c3a5dBehdad Esfahbod      last_syllable = info[last].syllable();
934ef24cc8c8e2478a6352c340f4611a617646de4ccBehdad Esfahbod    }
93546e645ec4b59f0a278347be11f40c7df700d5bb6Behdad Esfahbod  final_reordering_syllable (buffer, init_mask, pref_mask, last, count);
936e7be05702447ae270d797398132c1930cd3a9b86Behdad Esfahbod
937743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod  HB_BUFFER_DEALLOCATE_VAR (buffer, indic_category);
938743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod  HB_BUFFER_DEALLOCATE_VAR (buffer, indic_position);
939743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod}
940743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod
941743807a3ce1b2229e5307a8aea074a7544623d8dBehdad Esfahbod
942b9ddbd55930228422e82b34a141ad1b6093f5376Behdad Esfahbod
943