Update mojo sdk to rev 1dc8a9a5db73d3718d99917fadf31f5fb2ebad4f
[chromium-blink-merge.git] / third_party / harfbuzz-ng / src / hb-unicode.h
blob1c4e097b92d5ba628455fefe25b6f4697cc16f11
1 /*
2 * Copyright © 2009 Red Hat, Inc.
3 * Copyright © 2011 Codethink Limited
4 * Copyright © 2011,2012 Google, Inc.
6 * This is part of HarfBuzz, a text shaping library.
8 * Permission is hereby granted, without written agreement and without
9 * license or royalty fees, to use, copy, modify, and distribute this
10 * software and its documentation for any purpose, provided that the
11 * above copyright notice and the following two paragraphs appear in
12 * all copies of this software.
14 * IN NO EVENT SHALL THE COPYRIGHT HOLDER BE LIABLE TO ANY PARTY FOR
15 * DIRECT, INDIRECT, SPECIAL, INCIDENTAL, OR CONSEQUENTIAL DAMAGES
16 * ARISING OUT OF THE USE OF THIS SOFTWARE AND ITS DOCUMENTATION, EVEN
17 * IF THE COPYRIGHT HOLDER HAS BEEN ADVISED OF THE POSSIBILITY OF SUCH
18 * DAMAGE.
20 * THE COPYRIGHT HOLDER SPECIFICALLY DISCLAIMS ANY WARRANTIES, INCLUDING,
21 * BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND
22 * FITNESS FOR A PARTICULAR PURPOSE. THE SOFTWARE PROVIDED HEREUNDER IS
23 * ON AN "AS IS" BASIS, AND THE COPYRIGHT HOLDER HAS NO OBLIGATION TO
24 * PROVIDE MAINTENANCE, SUPPORT, UPDATES, ENHANCEMENTS, OR MODIFICATIONS.
26 * Red Hat Author(s): Behdad Esfahbod
27 * Codethink Author(s): Ryan Lortie
28 * Google Author(s): Behdad Esfahbod
31 #ifndef HB_H_IN
32 #error "Include <hb.h> instead."
33 #endif
35 #ifndef HB_UNICODE_H
36 #define HB_UNICODE_H
38 #include "hb-common.h"
40 HB_BEGIN_DECLS
43 /* hb_unicode_general_category_t */
45 /* Unicode Character Database property: General_Category (gc) */
46 typedef enum
48 HB_UNICODE_GENERAL_CATEGORY_CONTROL, /* Cc */
49 HB_UNICODE_GENERAL_CATEGORY_FORMAT, /* Cf */
50 HB_UNICODE_GENERAL_CATEGORY_UNASSIGNED, /* Cn */
51 HB_UNICODE_GENERAL_CATEGORY_PRIVATE_USE, /* Co */
52 HB_UNICODE_GENERAL_CATEGORY_SURROGATE, /* Cs */
53 HB_UNICODE_GENERAL_CATEGORY_LOWERCASE_LETTER, /* Ll */
54 HB_UNICODE_GENERAL_CATEGORY_MODIFIER_LETTER, /* Lm */
55 HB_UNICODE_GENERAL_CATEGORY_OTHER_LETTER, /* Lo */
56 HB_UNICODE_GENERAL_CATEGORY_TITLECASE_LETTER, /* Lt */
57 HB_UNICODE_GENERAL_CATEGORY_UPPERCASE_LETTER, /* Lu */
58 HB_UNICODE_GENERAL_CATEGORY_SPACING_MARK, /* Mc */
59 HB_UNICODE_GENERAL_CATEGORY_ENCLOSING_MARK, /* Me */
60 HB_UNICODE_GENERAL_CATEGORY_NON_SPACING_MARK, /* Mn */
61 HB_UNICODE_GENERAL_CATEGORY_DECIMAL_NUMBER, /* Nd */
62 HB_UNICODE_GENERAL_CATEGORY_LETTER_NUMBER, /* Nl */
63 HB_UNICODE_GENERAL_CATEGORY_OTHER_NUMBER, /* No */
64 HB_UNICODE_GENERAL_CATEGORY_CONNECT_PUNCTUATION, /* Pc */
65 HB_UNICODE_GENERAL_CATEGORY_DASH_PUNCTUATION, /* Pd */
66 HB_UNICODE_GENERAL_CATEGORY_CLOSE_PUNCTUATION, /* Pe */
67 HB_UNICODE_GENERAL_CATEGORY_FINAL_PUNCTUATION, /* Pf */
68 HB_UNICODE_GENERAL_CATEGORY_INITIAL_PUNCTUATION, /* Pi */
69 HB_UNICODE_GENERAL_CATEGORY_OTHER_PUNCTUATION, /* Po */
70 HB_UNICODE_GENERAL_CATEGORY_OPEN_PUNCTUATION, /* Ps */
71 HB_UNICODE_GENERAL_CATEGORY_CURRENCY_SYMBOL, /* Sc */
72 HB_UNICODE_GENERAL_CATEGORY_MODIFIER_SYMBOL, /* Sk */
73 HB_UNICODE_GENERAL_CATEGORY_MATH_SYMBOL, /* Sm */
74 HB_UNICODE_GENERAL_CATEGORY_OTHER_SYMBOL, /* So */
75 HB_UNICODE_GENERAL_CATEGORY_LINE_SEPARATOR, /* Zl */
76 HB_UNICODE_GENERAL_CATEGORY_PARAGRAPH_SEPARATOR, /* Zp */
77 HB_UNICODE_GENERAL_CATEGORY_SPACE_SEPARATOR /* Zs */
78 } hb_unicode_general_category_t;
80 /* hb_unicode_combining_class_t */
82 /* Note: newer versions of Unicode may add new values. Clients should be ready to handle
83 * any value in the 0..254 range being returned from hb_unicode_combining_class().
86 /* Unicode Character Database property: Canonical_Combining_Class (ccc) */
87 typedef enum
89 HB_UNICODE_COMBINING_CLASS_NOT_REORDERED = 0,
90 HB_UNICODE_COMBINING_CLASS_OVERLAY = 1,
91 HB_UNICODE_COMBINING_CLASS_NUKTA = 7,
92 HB_UNICODE_COMBINING_CLASS_KANA_VOICING = 8,
93 HB_UNICODE_COMBINING_CLASS_VIRAMA = 9,
95 /* Hebrew */
96 HB_UNICODE_COMBINING_CLASS_CCC10 = 10,
97 HB_UNICODE_COMBINING_CLASS_CCC11 = 11,
98 HB_UNICODE_COMBINING_CLASS_CCC12 = 12,
99 HB_UNICODE_COMBINING_CLASS_CCC13 = 13,
100 HB_UNICODE_COMBINING_CLASS_CCC14 = 14,
101 HB_UNICODE_COMBINING_CLASS_CCC15 = 15,
102 HB_UNICODE_COMBINING_CLASS_CCC16 = 16,
103 HB_UNICODE_COMBINING_CLASS_CCC17 = 17,
104 HB_UNICODE_COMBINING_CLASS_CCC18 = 18,
105 HB_UNICODE_COMBINING_CLASS_CCC19 = 19,
106 HB_UNICODE_COMBINING_CLASS_CCC20 = 20,
107 HB_UNICODE_COMBINING_CLASS_CCC21 = 21,
108 HB_UNICODE_COMBINING_CLASS_CCC22 = 22,
109 HB_UNICODE_COMBINING_CLASS_CCC23 = 23,
110 HB_UNICODE_COMBINING_CLASS_CCC24 = 24,
111 HB_UNICODE_COMBINING_CLASS_CCC25 = 25,
112 HB_UNICODE_COMBINING_CLASS_CCC26 = 26,
114 /* Arabic */
115 HB_UNICODE_COMBINING_CLASS_CCC27 = 27,
116 HB_UNICODE_COMBINING_CLASS_CCC28 = 28,
117 HB_UNICODE_COMBINING_CLASS_CCC29 = 29,
118 HB_UNICODE_COMBINING_CLASS_CCC30 = 30,
119 HB_UNICODE_COMBINING_CLASS_CCC31 = 31,
120 HB_UNICODE_COMBINING_CLASS_CCC32 = 32,
121 HB_UNICODE_COMBINING_CLASS_CCC33 = 33,
122 HB_UNICODE_COMBINING_CLASS_CCC34 = 34,
123 HB_UNICODE_COMBINING_CLASS_CCC35 = 35,
125 /* Syriac */
126 HB_UNICODE_COMBINING_CLASS_CCC36 = 36,
128 /* Telugu */
129 HB_UNICODE_COMBINING_CLASS_CCC84 = 84,
130 HB_UNICODE_COMBINING_CLASS_CCC91 = 91,
132 /* Thai */
133 HB_UNICODE_COMBINING_CLASS_CCC103 = 103,
134 HB_UNICODE_COMBINING_CLASS_CCC107 = 107,
136 /* Lao */
137 HB_UNICODE_COMBINING_CLASS_CCC118 = 118,
138 HB_UNICODE_COMBINING_CLASS_CCC122 = 122,
140 /* Tibetan */
141 HB_UNICODE_COMBINING_CLASS_CCC129 = 129,
142 HB_UNICODE_COMBINING_CLASS_CCC130 = 130,
143 HB_UNICODE_COMBINING_CLASS_CCC133 = 132,
146 HB_UNICODE_COMBINING_CLASS_ATTACHED_BELOW_LEFT = 200,
147 HB_UNICODE_COMBINING_CLASS_ATTACHED_BELOW = 202,
148 HB_UNICODE_COMBINING_CLASS_ATTACHED_ABOVE = 214,
149 HB_UNICODE_COMBINING_CLASS_ATTACHED_ABOVE_RIGHT = 216,
150 HB_UNICODE_COMBINING_CLASS_BELOW_LEFT = 218,
151 HB_UNICODE_COMBINING_CLASS_BELOW = 220,
152 HB_UNICODE_COMBINING_CLASS_BELOW_RIGHT = 222,
153 HB_UNICODE_COMBINING_CLASS_LEFT = 224,
154 HB_UNICODE_COMBINING_CLASS_RIGHT = 226,
155 HB_UNICODE_COMBINING_CLASS_ABOVE_LEFT = 228,
156 HB_UNICODE_COMBINING_CLASS_ABOVE = 230,
157 HB_UNICODE_COMBINING_CLASS_ABOVE_RIGHT = 232,
158 HB_UNICODE_COMBINING_CLASS_DOUBLE_BELOW = 233,
159 HB_UNICODE_COMBINING_CLASS_DOUBLE_ABOVE = 234,
161 HB_UNICODE_COMBINING_CLASS_IOTA_SUBSCRIPT = 240,
163 HB_UNICODE_COMBINING_CLASS_INVALID = 255
164 } hb_unicode_combining_class_t;
168 * hb_unicode_funcs_t
171 typedef struct hb_unicode_funcs_t hb_unicode_funcs_t;
175 * just give me the best implementation you've got there.
177 hb_unicode_funcs_t *
178 hb_unicode_funcs_get_default (void);
181 hb_unicode_funcs_t *
182 hb_unicode_funcs_create (hb_unicode_funcs_t *parent);
184 hb_unicode_funcs_t *
185 hb_unicode_funcs_get_empty (void);
187 hb_unicode_funcs_t *
188 hb_unicode_funcs_reference (hb_unicode_funcs_t *ufuncs);
190 void
191 hb_unicode_funcs_destroy (hb_unicode_funcs_t *ufuncs);
193 hb_bool_t
194 hb_unicode_funcs_set_user_data (hb_unicode_funcs_t *ufuncs,
195 hb_user_data_key_t *key,
196 void * data,
197 hb_destroy_func_t destroy,
198 hb_bool_t replace);
201 void *
202 hb_unicode_funcs_get_user_data (hb_unicode_funcs_t *ufuncs,
203 hb_user_data_key_t *key);
206 void
207 hb_unicode_funcs_make_immutable (hb_unicode_funcs_t *ufuncs);
209 hb_bool_t
210 hb_unicode_funcs_is_immutable (hb_unicode_funcs_t *ufuncs);
212 hb_unicode_funcs_t *
213 hb_unicode_funcs_get_parent (hb_unicode_funcs_t *ufuncs);
217 * funcs
220 /* typedefs */
222 typedef hb_unicode_combining_class_t (*hb_unicode_combining_class_func_t) (hb_unicode_funcs_t *ufuncs,
223 hb_codepoint_t unicode,
224 void *user_data);
225 typedef unsigned int (*hb_unicode_eastasian_width_func_t) (hb_unicode_funcs_t *ufuncs,
226 hb_codepoint_t unicode,
227 void *user_data);
228 typedef hb_unicode_general_category_t (*hb_unicode_general_category_func_t) (hb_unicode_funcs_t *ufuncs,
229 hb_codepoint_t unicode,
230 void *user_data);
231 typedef hb_codepoint_t (*hb_unicode_mirroring_func_t) (hb_unicode_funcs_t *ufuncs,
232 hb_codepoint_t unicode,
233 void *user_data);
234 typedef hb_script_t (*hb_unicode_script_func_t) (hb_unicode_funcs_t *ufuncs,
235 hb_codepoint_t unicode,
236 void *user_data);
238 typedef hb_bool_t (*hb_unicode_compose_func_t) (hb_unicode_funcs_t *ufuncs,
239 hb_codepoint_t a,
240 hb_codepoint_t b,
241 hb_codepoint_t *ab,
242 void *user_data);
243 typedef hb_bool_t (*hb_unicode_decompose_func_t) (hb_unicode_funcs_t *ufuncs,
244 hb_codepoint_t ab,
245 hb_codepoint_t *a,
246 hb_codepoint_t *b,
247 void *user_data);
250 * hb_unicode_decompose_compatibility_func_t:
251 * @ufuncs: a Unicode function structure
252 * @u: codepoint to decompose
253 * @decomposed: address of codepoint array (of length %HB_UNICODE_MAX_DECOMPOSITION_LEN) to write decomposition into
254 * @user_data: user data pointer as passed to hb_unicode_funcs_set_decompose_compatibility_func()
256 * Fully decompose @u to its Unicode compatibility decomposition. The codepoints of the decomposition will be written to @decomposed.
257 * The complete length of the decomposition will be returned.
259 * If @u has no compatibility decomposition, zero should be returned.
261 * The Unicode standard guarantees that a buffer of length %HB_UNICODE_MAX_DECOMPOSITION_LEN codepoints will always be sufficient for any
262 * compatibility decomposition plus an terminating value of 0. Consequently, @decompose must be allocated by the caller to be at least this length. Implementations
263 * of this function type must ensure that they do not write past the provided array.
265 * Return value: number of codepoints in the full compatibility decomposition of @u, or 0 if no decomposition available.
267 typedef unsigned int (*hb_unicode_decompose_compatibility_func_t) (hb_unicode_funcs_t *ufuncs,
268 hb_codepoint_t u,
269 hb_codepoint_t *decomposed,
270 void *user_data);
272 /* See Unicode 6.1 for details on the maximum decomposition length. */
273 #define HB_UNICODE_MAX_DECOMPOSITION_LEN (18+1) /* codepoints */
275 /* setters */
278 * hb_unicode_funcs_set_combining_class_func:
279 * @ufuncs: a Unicode function structure
280 * @func: (closure user_data) (destroy destroy) (scope notified):
281 * @user_data:
282 * @destroy:
286 * Since: 1.0
288 void
289 hb_unicode_funcs_set_combining_class_func (hb_unicode_funcs_t *ufuncs,
290 hb_unicode_combining_class_func_t func,
291 void *user_data, hb_destroy_func_t destroy);
294 * hb_unicode_funcs_set_eastasian_width_func:
295 * @ufuncs: a Unicode function structure
296 * @func: (closure user_data) (destroy destroy) (scope notified):
297 * @user_data:
298 * @destroy:
302 * Since: 1.0
304 void
305 hb_unicode_funcs_set_eastasian_width_func (hb_unicode_funcs_t *ufuncs,
306 hb_unicode_eastasian_width_func_t func,
307 void *user_data, hb_destroy_func_t destroy);
310 * hb_unicode_funcs_set_general_category_func:
311 * @ufuncs: a Unicode function structure
312 * @func: (closure user_data) (destroy destroy) (scope notified):
313 * @user_data:
314 * @destroy:
318 * Since: 1.0
320 void
321 hb_unicode_funcs_set_general_category_func (hb_unicode_funcs_t *ufuncs,
322 hb_unicode_general_category_func_t func,
323 void *user_data, hb_destroy_func_t destroy);
326 * hb_unicode_funcs_set_mirroring_func:
327 * @ufuncs: a Unicode function structure
328 * @func: (closure user_data) (destroy destroy) (scope notified):
329 * @user_data:
330 * @destroy:
334 * Since: 1.0
336 void
337 hb_unicode_funcs_set_mirroring_func (hb_unicode_funcs_t *ufuncs,
338 hb_unicode_mirroring_func_t func,
339 void *user_data, hb_destroy_func_t destroy);
342 * hb_unicode_funcs_set_script_func:
343 * @ufuncs: a Unicode function structure
344 * @func: (closure user_data) (destroy destroy) (scope notified):
345 * @user_data:
346 * @destroy:
350 * Since: 1.0
352 void
353 hb_unicode_funcs_set_script_func (hb_unicode_funcs_t *ufuncs,
354 hb_unicode_script_func_t func,
355 void *user_data, hb_destroy_func_t destroy);
358 * hb_unicode_funcs_set_compose_func:
359 * @ufuncs: a Unicode function structure
360 * @func: (closure user_data) (destroy destroy) (scope notified):
361 * @user_data:
362 * @destroy:
366 * Since: 1.0
368 void
369 hb_unicode_funcs_set_compose_func (hb_unicode_funcs_t *ufuncs,
370 hb_unicode_compose_func_t func,
371 void *user_data, hb_destroy_func_t destroy);
374 * hb_unicode_funcs_set_decompose_func:
375 * @ufuncs: a Unicode function structure
376 * @func: (closure user_data) (destroy destroy) (scope notified):
377 * @user_data:
378 * @destroy:
382 * Since: 1.0
384 void
385 hb_unicode_funcs_set_decompose_func (hb_unicode_funcs_t *ufuncs,
386 hb_unicode_decompose_func_t func,
387 void *user_data, hb_destroy_func_t destroy);
390 * hb_unicode_funcs_set_decompose_compatibility_func:
391 * @ufuncs: a Unicode function structure
392 * @func: (closure user_data) (destroy destroy) (scope notified):
393 * @user_data:
394 * @destroy:
398 * Since: 1.0
400 void
401 hb_unicode_funcs_set_decompose_compatibility_func (hb_unicode_funcs_t *ufuncs,
402 hb_unicode_decompose_compatibility_func_t func,
403 void *user_data, hb_destroy_func_t destroy);
405 /* accessors */
407 hb_unicode_combining_class_t
408 hb_unicode_combining_class (hb_unicode_funcs_t *ufuncs,
409 hb_codepoint_t unicode);
411 unsigned int
412 hb_unicode_eastasian_width (hb_unicode_funcs_t *ufuncs,
413 hb_codepoint_t unicode);
415 hb_unicode_general_category_t
416 hb_unicode_general_category (hb_unicode_funcs_t *ufuncs,
417 hb_codepoint_t unicode);
419 hb_codepoint_t
420 hb_unicode_mirroring (hb_unicode_funcs_t *ufuncs,
421 hb_codepoint_t unicode);
423 hb_script_t
424 hb_unicode_script (hb_unicode_funcs_t *ufuncs,
425 hb_codepoint_t unicode);
427 hb_bool_t
428 hb_unicode_compose (hb_unicode_funcs_t *ufuncs,
429 hb_codepoint_t a,
430 hb_codepoint_t b,
431 hb_codepoint_t *ab);
432 hb_bool_t
433 hb_unicode_decompose (hb_unicode_funcs_t *ufuncs,
434 hb_codepoint_t ab,
435 hb_codepoint_t *a,
436 hb_codepoint_t *b);
438 unsigned int
439 hb_unicode_decompose_compatibility (hb_unicode_funcs_t *ufuncs,
440 hb_codepoint_t u,
441 hb_codepoint_t *decomposed);
443 HB_END_DECLS
445 #endif /* HB_UNICODE_H */