2 * Copyright © 2011,2012,2013 Google, Inc.
4 * This is part of HarfBuzz, a text shaping library.
6 * Permission is hereby granted, without written agreement and without
7 * license or royalty fees, to use, copy, modify, and distribute this
8 * software and its documentation for any purpose, provided that the
9 * above copyright notice and the following two paragraphs appear in
10 * all copies of this software.
12 * IN NO EVENT SHALL THE COPYRIGHT HOLDER BE LIABLE TO ANY PARTY FOR
13 * DIRECT, INDIRECT, SPECIAL, INCIDENTAL, OR CONSEQUENTIAL DAMAGES
14 * ARISING OUT OF THE USE OF THIS SOFTWARE AND ITS DOCUMENTATION, EVEN
15 * IF THE COPYRIGHT HOLDER HAS BEEN ADVISED OF THE POSSIBILITY OF SUCH
18 * THE COPYRIGHT HOLDER SPECIFICALLY DISCLAIMS ANY WARRANTIES, INCLUDING,
19 * BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND
20 * FITNESS FOR A PARTICULAR PURPOSE. THE SOFTWARE PROVIDED HEREUNDER IS
21 * ON AN "AS IS" BASIS, AND THE COPYRIGHT HOLDER HAS NO OBLIGATION TO
22 * PROVIDE MAINTENANCE, SUPPORT, UPDATES, ENHANCEMENTS, OR MODIFICATIONS.
24 * Google Author(s): Behdad Esfahbod
27 #include "hb-ot-shape-complex-indic-private.hh"
/* Per-glyph scratch slots used by this shaper.  myanmar_category() and
 * myanmar_position() are aliases for the complex_var_u8_0() and
 * complex_var_u8_1() accessors.  The slots are allocated in
 * setup_masks_myanmar() and released in final_reordering(). */
29 /* buffer var allocations */
30 #define myanmar_category() complex_var_u8_0() /* myanmar_category_t */
31 #define myanmar_position() complex_var_u8_1() /* myanmar_position_t */
/* Feature tags applied one at a time.  NOTE(review): presumably these are
 * the initializer entries of basic_features[], which
 * collect_features_myanmar() iterates right after the initial_reordering
 * pause; the array declaration itself is not visible in this view. */
43 * These features are applied in order, one at a time, after initial_reordering.
45 HB_TAG('r','p','h','f'),
46 HB_TAG('p','r','e','f'),
47 HB_TAG('b','l','w','f'),
48 HB_TAG('p','s','t','f'),
/* Feature tags applied together.  NOTE(review): presumably these are the
 * initializer entries of other_features[], which collect_features_myanmar()
 * iterates after the final_reordering pause; the array declaration itself
 * is not visible in this view. */
55 * These features are applied all at once, after final_reordering.
57 HB_TAG('p','r','e','s'),
58 HB_TAG('a','b','v','s'),
59 HB_TAG('b','l','w','s'),
60 HB_TAG('p','s','t','s'),
61 /* Positioning features, though we don't care about the types. */
62 HB_TAG('d','i','s','t'),
/* Forward declarations of the three pause callbacks that
 * collect_features_myanmar() registers with add_gsub_pause(); their
 * definitions appear later in this file.
 * NOTE(review): the return types and the remaining parameters are not
 * visible in this view. */
66 setup_syllables (const hb_ot_shape_plan_t
*plan
,
70 initial_reordering (const hb_ot_shape_plan_t
*plan
,
74 final_reordering (const hb_ot_shape_plan_t
*plan
,
/* Registers the GSUB features and pause callbacks of the Myanmar shaper on
 * the planner's map builder (plan->map).  The registration order is:
 *   1. a pause running setup_syllables;
 *   2. the global boolean features 'locl' and 'ccmp';
 *   3. a pause running initial_reordering;
 *   4. every basic_features[] entry (value 1, F_GLOBAL | F_MANUAL_ZWJ),
 *      together with a callback-less pause (NULL);
 *   5. a pause running final_reordering;
 *   6. every other_features[] entry (value 1, F_GLOBAL | F_MANUAL_ZWJ).
 * NOTE(review): the braces of the first loop are not visible here; the
 * NULL pause is presumably inside the loop body, i.e. one pause per basic
 * feature -- confirm against the full source. */
79 collect_features_myanmar (hb_ot_shape_planner_t
*plan
)
81 hb_ot_map_builder_t
*map
= &plan
->map
;
83 /* Do this before any lookups have been applied. */
84 map
->add_gsub_pause (setup_syllables
);
86 map
->add_global_bool_feature (HB_TAG('l','o','c','l'));
87 /* The Indic specs do not require ccmp, but we apply it here since if
88 * there is a use of it, it's typically at the beginning. */
89 map
->add_global_bool_feature (HB_TAG('c','c','m','p'));
/* Reordering callback runs before any of the basic features. */
92 map
->add_gsub_pause (initial_reordering
);
93 for (unsigned int i
= 0; i
< ARRAY_LENGTH (basic_features
); i
++)
95 map
->add_feature (basic_features
[i
], 1, F_GLOBAL
| F_MANUAL_ZWJ
);
/* A pause with no callback. */
96 map
->add_gsub_pause (NULL
);
98 map
->add_gsub_pause (final_reordering
);
/* The remaining features are added back to back, with no pause between. */
99 for (unsigned int i
= 0; i
< ARRAY_LENGTH (other_features
); i
++)
100 map
->add_feature (other_features
[i
], 1, F_GLOBAL
| F_MANUAL_ZWJ
);
/* Adjusts feature settings on the planner's map for Myanmar:
 *   - registers 'liga' with value 0 and F_GLOBAL;
 *   - when hb_options ().uniscribe_bug_compatible is set, also registers
 *     'mark' with value 0 and F_GLOBAL.
 * NOTE(review): a value of 0 presumably switches the feature off -- confirm
 * against the add_feature() contract. */
104 override_features_myanmar (hb_ot_shape_planner_t
*plan
)
106 plan
->map
.add_feature (HB_TAG('l','i','g','a'), 0, F_GLOBAL
);
111 * Spec says 'mark' is used, and the mmrtext.ttf font from
112 * Windows 8 has lookups for it. But testing suggests that
113 * Windows 8 Uniscribe is NOT applying it. It *is* applying
/* Only mirror the Uniscribe behaviour when explicitly requested. */
116 if (hb_options ().uniscribe_bug_compatible
)
117 plan
->map
.add_feature (HB_TAG('m','a','r','k'), 0, F_GLOBAL
);
/* Kinds of syllable.  The kind is read from the low 4 bits of a glyph's
 * syllable() value (see the `& 0x0F` masks in initial_reordering_syllable()
 * and insert_dotted_circles()).
 * NOTE(review): the enumerators are not visible in this view; later code
 * refers to consonant_syllable, broken_cluster and non_myanmar_cluster. */
121 enum syllable_type_t
{
127 #include "hb-ot-shape-complex-myanmar-machine.hh"
130 /* Note: This enum is duplicated in the -machine.rl source file.
131 * Not sure how to avoid duplication. */
/* Myanmar-specific glyph categories, stored per glyph in
 * myanmar_category().  is_one_of() turns a category into a bit with FLAG()
 * to test it against a mask.
 * OT_DB and OT_GB are aliases for OT_N and OT_DOTTEDCIRCLE, which are
 * declared outside this file section (presumably in the included Indic
 * private header -- TODO confirm).
 * NOTE(review): the enumerators between OT_PT (25) and OT_VS (30) and the
 * closing brace are not visible in this view. */
132 enum myanmar_category_t
{
133 OT_As
= 18, /* Asat */
134 OT_D
= 19, /* Digits except zero */
135 OT_D0
= 20, /* Digit zero */
136 OT_DB
= OT_N
, /* Dot below */
137 OT_GB
= OT_DOTTEDCIRCLE
,
138 OT_MH
= 21, /* Various consonant medial types */
139 OT_MR
= 22, /* Various consonant medial types */
140 OT_MW
= 23, /* Various consonant medial types */
141 OT_MY
= 24, /* Various consonant medial types */
142 OT_PT
= 25, /* Pwo and other tones */
147 OT_VS
= 30 /* Variation selectors */
152 is_one_of (const hb_glyph_info_t
&info
, unsigned int flags
)
154 /* If it ligated, all bets are off. */
155 if (is_a_ligature (info
)) return false;
156 return !!(FLAG (info
.myanmar_category()) & flags
);
/* Bitmask of the categories that is_consonant() accepts: OT_C, OT_CM,
 * OT_Ra, OT_V, OT_NBSP and OT_GB. */
161 * We treat Vowels and placeholders as if they were consonants. This is safe because Vowels
162 * cannot happen in a consonant syllable. The plus side however is, we can call the
163 * consonant syllable logic from the vowel syllable function and get it all right! */
164 #define CONSONANT_FLAGS (FLAG (OT_C) | FLAG (OT_CM) | FLAG (OT_Ra) | FLAG (OT_V) | FLAG (OT_NBSP) | FLAG (OT_GB))
166 is_consonant (const hb_glyph_info_t
&info
)
168 return is_one_of (info
, CONSONANT_FLAGS
);
/* Computes the Myanmar category and position of a glyph from its codepoint
 * and stores them in info.myanmar_category() / info.myanmar_position().
 *
 * The starting point is hb_indic_get_categories (u): the low 7 bits give the
 * category and the bits from bit 8 upwards give the position.  The category
 * is then overridden for variation selectors (U+FE00..U+FE0F), ZWNJ
 * (U+200C), ZWJ (U+200D) and for the individual codepoints listed in the
 * case labels below.  Finally a position-to-vowel-category mapping
 * (POS_PRE_C / POS_ABOVE_C / POS_BELOW_C / POS_POST_C) is applied.
 *
 * NOTE(review): the `switch` statements, several case labels, the `break`s
 * and the condition guarding the final position mapping are not visible in
 * this view; confirm them against the full source before relying on this
 * summary. */
173 set_myanmar_properties (hb_glyph_info_t
&info
)
175 hb_codepoint_t u
= info
.codepoint
;
176 unsigned int type
= hb_indic_get_categories (u
);
/* Low 7 bits: category. */
177 indic_category_t cat
= (indic_category_t
) (type
& 0x7F);
/* Bits 8 and up: position. */
178 indic_position_t pos
= (indic_position_t
) (type
>> 8);
181 * http://www.microsoft.com/typography/OpenTypeDev/myanmar/intro.htm#analyze
/* Variation selectors. */
183 if (unlikely (hb_in_range
<hb_codepoint_t
> (u
, 0xFE00, 0xFE0F)))
184 cat
= (indic_category_t
) OT_VS
;
185 else if (unlikely (u
== 0x200C)) cat
= (indic_category_t
) OT_ZWNJ
;
186 else if (unlikely (u
== 0x200D)) cat
= (indic_category_t
) OT_ZWJ
;
/* Codepoints categorized as OT_GB. */
190 case 0x002D: case 0x00A0: case 0x00D7: case 0x2012:
191 case 0x2013: case 0x2014: case 0x2015: case 0x2022:
192 case 0x25CC: case 0x25FB: case 0x25FC: case 0x25FD:
194 cat
= (indic_category_t
) OT_GB
;
197 case 0x1004: case 0x101B: case 0x105A:
198 cat
= (indic_category_t
) OT_Ra
;
201 case 0x1032: case 0x1036:
202 cat
= (indic_category_t
) OT_A
;
/* NOTE(review): the case label for this assignment is not visible here. */
206 cat
= (indic_category_t
) OT_As
;
/* Digits. */
209 case 0x1041: case 0x1042: case 0x1043: case 0x1044:
210 case 0x1045: case 0x1046: case 0x1047: case 0x1048:
211 case 0x1049: case 0x1090: case 0x1091: case 0x1092:
212 case 0x1093: case 0x1094: case 0x1095: case 0x1096:
213 case 0x1097: case 0x1098: case 0x1099:
214 cat
= (indic_category_t
) OT_D
;
/* NOTE(review): the case label for this assignment is not visible here. */
218 cat
= (indic_category_t
) OT_D
; /* XXX The spec says D0, but Uniscribe doesn't seem to do. */
/* Medials. */
221 case 0x103E: case 0x1060:
222 cat
= (indic_category_t
) OT_MH
;
/* NOTE(review): the case label for this assignment is not visible here. */
226 cat
= (indic_category_t
) OT_MR
;
229 case 0x103D: case 0x1082:
230 cat
= (indic_category_t
) OT_MW
;
233 case 0x103B: case 0x105E: case 0x105F:
234 cat
= (indic_category_t
) OT_MY
;
237 case 0x1063: case 0x1064: case 0x1069: case 0x106A:
238 case 0x106B: case 0x106C: case 0x106D: case 0xAA7B:
239 cat
= (indic_category_t
) OT_PT
;
242 case 0x1038: case 0x1087: case 0x1088: case 0x1089:
243 case 0x108A: case 0x108B: case 0x108C: case 0x108D:
244 case 0x108F: case 0x109A: case 0x109B: case 0x109C:
245 cat
= (indic_category_t
) OT_SM
;
/* Map the position to a vowel category; a pre-base position is also
 * rewritten to POS_PRE_M. */
253 case POS_PRE_C
: cat
= (indic_category_t
) OT_VPre
;
254 pos
= POS_PRE_M
; break;
255 case POS_ABOVE_C
: cat
= (indic_category_t
) OT_VAbv
; break;
256 case POS_BELOW_C
: cat
= (indic_category_t
) OT_VBlw
; break;
257 case POS_POST_C
: cat
= (indic_category_t
) OT_VPst
; break;
/* Publish the results into the glyph's scratch slots. */
261 info
.myanmar_category() = (myanmar_category_t
) cat
;
262 info
.myanmar_position() = pos
;
/* Allocates the myanmar_category and myanmar_position buffer vars and fills
 * them for every glyph in the buffer by calling set_myanmar_properties().
 * `plan` and `font` are unused.
 * NOTE(review): the `buffer` parameter declaration is not visible in this
 * view. */
268 setup_masks_myanmar (const hb_ot_shape_plan_t
*plan HB_UNUSED
,
270 hb_font_t
*font HB_UNUSED
)
272 HB_BUFFER_ALLOCATE_VAR (buffer
, myanmar_category
);
273 HB_BUFFER_ALLOCATE_VAR (buffer
, myanmar_position
);
275 /* We cannot setup masks here. We save information about characters
276 * and setup masks later on in a pause-callback. */
278 unsigned int count
= buffer
->len
;
279 for (unsigned int i
= 0; i
< count
; i
++)
280 set_myanmar_properties (buffer
->info
[i
]);
/* Pause callback registered first by collect_features_myanmar().  It runs
 * find_syllables() over the buffer; `plan` and `font` are unused.
 * NOTE(review): find_syllables() is not defined in this view -- presumably
 * it comes from the included -machine.hh; the `buffer` parameter
 * declaration is also not visible here. */
284 setup_syllables (const hb_ot_shape_plan_t
*plan HB_UNUSED
,
285 hb_font_t
*font HB_UNUSED
,
288 find_syllables (buffer
);
292 compare_myanmar_order (const hb_glyph_info_t
*pa
, const hb_glyph_info_t
*pb
)
294 int a
= pa
->myanmar_position();
295 int b
= pb
->myanmar_position();
297 return a
< b
? -1 : a
== b
? 0 : +1;
302 * http://www.microsoft.com/typography/OpenTypeDev/myanmar/intro.htm */
/* Reorders the glyphs of one syllable, buffer->info[start..end), by
 * assigning every glyph a myanmar_position() and then sorting the range by
 * that position.
 *
 * Visible steps:
 *   1. Look for a leading OT_Ra, OT_As, OT_H sequence (needs at least three
 *      glyphs); this drives `limit` and `has_reph`.
 *   2. Scan from `limit` for a glyph that is_consonant() accepts, to find
 *      the base (`base` defaults to `end`).
 *   3. Position the first three glyphs as POS_AFTER_MAIN when has_reph is
 *      set, the glyphs before the base as POS_PRE_C, and the base as
 *      POS_BASE_C.
 *   4. Assign positions to the remaining glyphs while tracking a running
 *      `pos`, starting at POS_AFTER_MAIN.
 *   5. Merge the clusters of the range and bubble-sort it with
 *      compare_myanmar_order().
 *
 * NOTE(review): many lines of this function (braces, loop headers,
 * `continue`s, updates of `limit`, `has_reph`, `base` and `pos`, and the
 * `face` / `buffer` parameter declarations) are not visible in this view.
 * The summary covers only what can be seen; confirm against the full
 * source. */
305 initial_reordering_consonant_syllable (const hb_ot_shape_plan_t
*plan
,
308 unsigned int start
, unsigned int end
)
310 hb_glyph_info_t
*info
= buffer
->info
;
/* `end` means no base has been found. */
312 unsigned int base
= end
;
313 bool has_reph
= false;
316 unsigned int limit
= start
;
/* Leading Ra + Asat + Halant sequence. */
317 if (start
+ 3 <= end
&&
318 info
[start
].myanmar_category() == OT_Ra
&&
319 info
[start
+1].myanmar_category() == OT_As
&&
320 info
[start
+2].myanmar_category() == OT_H
)
/* Search for the base consonant starting at `limit`. */
331 for (unsigned int i
= limit
; i
< end
; i
++)
332 if (is_consonant (info
[i
]))
342 unsigned int i
= start
;
/* The three-glyph prefix, when present, goes after the main part. */
343 for (; i
< start
+ (has_reph
? 3 : 0); i
++)
344 info
[i
].myanmar_position() = POS_AFTER_MAIN
;
/* Everything else before the base is pre-base. */
345 for (; i
< base
; i
++)
346 info
[i
].myanmar_position() = POS_PRE_C
;
349 info
[i
].myanmar_position() = POS_BASE_C
;
352 indic_position_t pos
= POS_AFTER_MAIN
;
353 /* The following loop may be ugly, but it implements all of
354 * Myanmar reordering! */
357 if (info
[i
].myanmar_category() == OT_MR
) /* Pre-base reordering */
359 info
[i
].myanmar_position() = POS_PRE_C
;
362 if (info
[i
].myanmar_position() < POS_BASE_C
) /* Left matra */
367 if (pos
== POS_AFTER_MAIN
&& info
[i
].myanmar_category() == OT_VBlw
)
370 info
[i
].myanmar_position() = pos
;
374 if (pos
== POS_BELOW_C
&& info
[i
].myanmar_category() == OT_A
)
376 info
[i
].myanmar_position() = POS_BEFORE_SUB
;
379 if (pos
== POS_BELOW_C
&& info
[i
].myanmar_category() == OT_VBlw
)
381 info
[i
].myanmar_position() = pos
;
384 if (pos
== POS_BELOW_C
&& info
[i
].myanmar_category() != OT_A
)
387 info
[i
].myanmar_position() = pos
;
390 info
[i
].myanmar_position() = pos
;
/* Merge clusters over the whole range before the glyphs are moved. */
394 buffer
->merge_clusters (start
, end
);
395 /* Sit tight, rock 'n roll! */
396 hb_bubble_sort (info
+ start
, end
- start
, compare_myanmar_order
);
/* Reorders a broken cluster by forwarding all arguments unchanged to
 * initial_reordering_consonant_syllable().
 * NOTE(review): the `face` and `buffer` parameter declarations are not
 * visible in this view. */
400 initial_reordering_broken_cluster (const hb_ot_shape_plan_t
*plan
,
403 unsigned int start
, unsigned int end
)
405 /* We already inserted dotted-circles, so just call the consonant_syllable. */
406 initial_reordering_consonant_syllable (plan
, face
, buffer
, start
, end
);
/* Handler for syllables of type non_myanmar_cluster.  It deliberately does
 * nothing, and every parameter is marked HB_UNUSED; it is called from the
 * dispatch in initial_reordering_syllable(). */
410 initial_reordering_non_myanmar_cluster (const hb_ot_shape_plan_t
*plan HB_UNUSED
,
411 hb_face_t
*face HB_UNUSED
,
412 hb_buffer_t
*buffer HB_UNUSED
,
413 unsigned int start HB_UNUSED
, unsigned int end HB_UNUSED
)
415 /* Nothing to do right now. If we ever switch to using the output
416 * buffer in the reordering process, we'd need to next_glyph() here. */
/* Dispatches one syllable, buffer->info[start..end), to the reordering
 * routine that matches its type.  The type is read from the low 4 bits of
 * the syllable() value of the first glyph in the range.
 * NOTE(review): the `face` and `buffer` parameter declarations and the end
 * of the switch are not visible in this view. */
421 initial_reordering_syllable (const hb_ot_shape_plan_t
*plan
,
424 unsigned int start
, unsigned int end
)
/* Low nibble of syllable() holds the syllable type. */
426 syllable_type_t syllable_type
= (syllable_type_t
) (buffer
->info
[start
].syllable() & 0x0F);
427 switch (syllable_type
) {
428 case consonant_syllable
: initial_reordering_consonant_syllable (plan
, face
, buffer
, start
, end
); return;
429 case broken_cluster
: initial_reordering_broken_cluster (plan
, face
, buffer
, start
, end
); return;
430 case non_myanmar_cluster
: initial_reordering_non_myanmar_cluster (plan
, face
, buffer
, start
, end
); return;
/* Emits a dotted-circle glyph (U+25CC) for broken_cluster syllables.
 *
 * Visible steps:
 *   1. Scan the buffer for any glyph whose syllable type (low 4 bits of
 *      syllable()) is broken_cluster.
 *   2. Ask the font for the glyph of U+25CC through font->get_glyph().
 *   3. Build a template glyph: its Myanmar properties are computed while
 *      the codepoint is still 0x25CC, and only then is the codepoint
 *      replaced by the glyph id returned by the font.
 *   4. Walk the buffer through the output-buffer API.  The first time a new
 *      broken syllable value is met, a copy of the template is output with
 *      cluster, mask and syllable taken from the current glyph.
 *   5. Swap the output buffer in.
 *
 * NOTE(review): the early exits after steps 1 and 2, the reset of
 * buffer->idx, the `else` around next_glyph() and the `font` / `buffer`
 * parameter declarations are not visible in this view -- confirm against
 * the full source. */
435 insert_dotted_circles (const hb_ot_shape_plan_t
*plan HB_UNUSED
,
439 /* Note: This loop is extra overhead, but should not be measurable. */
440 bool has_broken_syllables
= false;
441 unsigned int count
= buffer
->len
;
442 for (unsigned int i
= 0; i
< count
; i
++)
443 if ((buffer
->info
[i
].syllable() & 0x0F) == broken_cluster
) {
444 has_broken_syllables
= true;
447 if (likely (!has_broken_syllables
))
451 hb_codepoint_t dottedcircle_glyph
;
452 if (!font
->get_glyph (0x25CC, 0, &dottedcircle_glyph
))
455 hb_glyph_info_t dottedcircle
= {0};
/* Categorize using the Unicode codepoint first... */
456 dottedcircle
.codepoint
= 0x25CC;
457 set_myanmar_properties (dottedcircle
);
/* ...then store the glyph id the font returned. */
458 dottedcircle
.codepoint
= dottedcircle_glyph
;
460 buffer
->clear_output ();
463 unsigned int last_syllable
= 0;
464 while (buffer
->idx
< buffer
->len
)
466 unsigned int syllable
= buffer
->cur().syllable();
467 syllable_type_t syllable_type
= (syllable_type_t
) (syllable
& 0x0F);
/* Only act on the first glyph of each broken syllable. */
468 if (unlikely (last_syllable
!= syllable
&& syllable_type
== broken_cluster
))
470 last_syllable
= syllable
;
/* The inserted glyph inherits cluster, mask and syllable. */
472 hb_glyph_info_t info
= dottedcircle
;
473 info
.cluster
= buffer
->cur().cluster
;
474 info
.mask
= buffer
->cur().mask
;
475 info
.syllable() = buffer
->cur().syllable();
477 buffer
->output_info (info
);
480 buffer
->next_glyph ();
483 buffer
->swap_buffers ();
/* Pause callback: inserts dotted circles, then splits the buffer into runs
 * of glyphs sharing the same syllable() value and calls
 * initial_reordering_syllable() on each run [last, i), and on the final
 * run [last, count).  Returns early when the buffer is empty.
 * NOTE(review): the update of `last` between runs and the `font` / `buffer`
 * parameter declarations are not visible in this view. */
487 initial_reordering (const hb_ot_shape_plan_t
*plan
,
/* May grow the buffer, so info/len are read only afterwards. */
491 insert_dotted_circles (plan
, font
, buffer
);
493 hb_glyph_info_t
*info
= buffer
->info
;
494 unsigned int count
= buffer
->len
;
495 if (unlikely (!count
)) return;
496 unsigned int last
= 0;
497 unsigned int last_syllable
= info
[0].syllable();
498 for (unsigned int i
= 1; i
< count
; i
++)
/* A change in syllable() marks a run boundary. */
499 if (last_syllable
!= info
[i
].syllable()) {
500 initial_reordering_syllable (plan
, font
->face
, buffer
, last
, i
);
502 last_syllable
= info
[last
].syllable();
/* Trailing run. */
504 initial_reordering_syllable (plan
, font
->face
, buffer
, last
, count
);
/* Pause callback run after the basic features: resets syllable() to 0 on
 * every glyph and releases the myanmar_category and myanmar_position
 * buffer vars.  `font` is unused.
 * NOTE(review): the `buffer` parameter declaration is not visible in this
 * view. */
508 final_reordering (const hb_ot_shape_plan_t
*plan
,
509 hb_font_t
*font HB_UNUSED
,
512 hb_glyph_info_t
*info
= buffer
->info
;
513 unsigned int count
= buffer
->len
;
515 /* Zero syllables now... */
516 for (unsigned int i
= 0; i
< count
; i
++)
517 info
[i
].syllable() = 0;
/* Release the scratch slots. */
519 HB_BUFFER_DEALLOCATE_VAR (buffer
, myanmar_category
);
520 HB_BUFFER_DEALLOCATE_VAR (buffer
, myanmar_position
);
524 static hb_ot_shape_normalization_mode_t
525 normalization_preference_myanmar (const hb_segment_properties_t
*props HB_UNUSED
)
527 return HB_OT_SHAPE_NORMALIZATION_MODE_COMPOSED_DIACRITICS_NO_SHORT_CIRCUIT
;
531 const hb_ot_complex_shaper_t _hb_ot_complex_shaper_myanmar
=
534 collect_features_myanmar
,
535 override_features_myanmar
,
536 NULL
, /* data_create */
537 NULL
, /* data_destroy */
538 NULL
, /* preprocess_text */
539 normalization_preference_myanmar
,
540 NULL
, /* decompose */
543 HB_OT_SHAPE_ZERO_WIDTH_MARKS_BY_GDEF_EARLY
,
544 false, /* fallback_position */