2 * Copyright © 2014 Google, Inc.
4 * This is part of HarfBuzz, a text shaping library.
6 * Permission is hereby granted, without written agreement and without
7 * license or royalty fees, to use, copy, modify, and distribute this
8 * software and its documentation for any purpose, provided that the
9 * above copyright notice and the following two paragraphs appear in
10 * all copies of this software.
12 * IN NO EVENT SHALL THE COPYRIGHT HOLDER BE LIABLE TO ANY PARTY FOR
13 * DIRECT, INDIRECT, SPECIAL, INCIDENTAL, OR CONSEQUENTIAL DAMAGES
14 * ARISING OUT OF THE USE OF THIS SOFTWARE AND ITS DOCUMENTATION, EVEN
15 * IF THE COPYRIGHT HOLDER HAS BEEN ADVISED OF THE POSSIBILITY OF SUCH
18 * THE COPYRIGHT HOLDER SPECIFICALLY DISCLAIMS ANY WARRANTIES, INCLUDING,
19 * BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND
20 * FITNESS FOR A PARTICULAR PURPOSE. THE SOFTWARE PROVIDED HEREUNDER IS
21 * ON AN "AS IS" BASIS, AND THE COPYRIGHT HOLDER HAS NO OBLIGATION TO
22 * PROVIDE MAINTENANCE, SUPPORT, UPDATES, ENHANCEMENTS, OR MODIFICATIONS.
24 * Google Author(s): Behdad Esfahbod
27 #ifndef HB_OT_CMAP_TABLE_HH
28 #define HB_OT_CMAP_TABLE_HH
30 #include "hb-open-type-private.hh"
37 * cmap -- Character To Glyph Index Mapping Table
40 #define HB_OT_TAG_cmap HB_TAG('c','m','a','p')
/* cmap subtable format 0: a 256-entry byte table indexed directly by
 * character code. */
43 struct CmapSubtableFormat0
/* Reads the glyph index for codepoint from glyphIdArray; any codepoint of
 * 256 or more gets a gid of 0 instead of indexing past the array.
 * NOTE(review): the statements that store into *glyph and compute the
 * return value are not visible in this excerpt. */
45 inline bool get_glyph (hb_codepoint_t codepoint
, hb_codepoint_t
*glyph
) const
47 hb_codepoint_t gid
= codepoint
< 256 ? glyphIdArray
[codepoint
] : 0;
/* Sanitization is delegated entirely to c->check_struct (this); the struct
 * is declared with a static size, so there is no variable-length tail to
 * check. */
54 inline bool sanitize (hb_sanitize_context_t
*c
) const
56 TRACE_SANITIZE (this);
57 return TRACE_RETURN (c
->check_struct (this));
61 USHORT format
; /* Format number is set to 0. */
62 USHORT lengthZ
; /* Byte length of this subtable. */
63 USHORT languageZ
; /* Ignore. */
64 BYTE glyphIdArray
[256];/* An array that maps character
65 * code to glyph index values. */
/* Three USHORT header fields followed by the 256 BYTE entries.
 * (6 bytes of header assumes a 2-byte USHORT -- TODO confirm.) */
67 DEFINE_SIZE_STATIC (6 + 256);
/* cmap subtable format 4: segment mapping to delta values.  The fixed
 * header is followed by per-segment arrays that get_glyph locates by
 * pointer arithmetic starting from values. */
70 struct CmapSubtableFormat4
/* Maps codepoint to a glyph index by binary-searching the segment list
 * (startCount / endCount) and then applying either the segment delta or a
 * glyphIdArray lookup.  The result is stored through glyph.
 * NOTE(review): the search loop header, the not-found paths and the
 * return statements are not visible in this excerpt. */
72 inline bool get_glyph (hb_codepoint_t codepoint
, hb_codepoint_t
*glyph
) const
74 unsigned int segCount
;
75 const USHORT
*endCount
;
76 const USHORT
*startCount
;
77 const USHORT
*idDelta
;
78 const USHORT
*idRangeOffset
;
79 const USHORT
*glyphIdArray
;
80 unsigned int glyphIdArrayLength
;
/* Carve the per-segment arrays out of the trailing data, in file order. */
82 segCount
= this->segCountX2
/ 2;
83 endCount
= this->values
;
/* The + 1 skips the reservedPad word that sits between endCount and
 * startCount in the layout listed at the end of this struct. */
84 startCount
= endCount
+ segCount
+ 1;
85 idDelta
= startCount
+ segCount
;
86 idRangeOffset
= idDelta
+ segCount
;
87 glyphIdArray
= idRangeOffset
+ segCount
;
/* 16 covers the seven USHORT header fields plus reservedPad, and
 * 8 * segCount covers the four per-segment USHORT arrays; what remains,
 * counted in USHORT units, is glyphIdArray.  (Assumes a 2-byte USHORT.)
 * sanitize () requires length >= 16 + 8 * segCount. */
88 glyphIdArrayLength
= (this->length
- 16 - 8 * segCount
) / 2;
90 /* Custom two-array bsearch. */
91 int min
= 0, max
= (int) segCount
- 1;
95 int mid
= (min
+ max
) / 2;
96 if (codepoint
< startCount
[mid
])
98 else if (codepoint
> endCount
[mid
])
/* A zero range offset means the glyph id is the codepoint plus the
 * segment delta; otherwise it is read from glyphIdArray. */
110 unsigned int rangeOffset
= idRangeOffset
[i
];
111 if (rangeOffset
== 0)
112 gid
= codepoint
+ idDelta
[i
];
115 /* Somebody has been smoking... */
/* rangeOffset is halved to turn it into USHORT units and is counted from
 * slot i of idRangeOffset.  Adding i - segCount rebases it onto
 * glyphIdArray, which starts segCount entries after idRangeOffset. */
116 unsigned int index
= rangeOffset
/ 2 + (codepoint
- startCount
[i
]) + i
- segCount
;
/* Guard against an index beyond the glyphIdArray length derived from the
 * subtable length above. */
117 if (unlikely (index
>= glyphIdArrayLength
))
119 gid
= glyphIdArray
[index
];
/* Only the low 16 bits of the computed glyph id are kept. */
125 *glyph
= gid
& 0xFFFFu
;
/* Checks the fixed header, then the range covered by the length field.  If
 * that range check fails, length is rewritten (through c->try_set) to a
 * value clamped to at most 65535.  Finally length must be large enough for
 * the header and the four per-segment arrays. */
129 inline bool sanitize (hb_sanitize_context_t
*c
) const
131 TRACE_SANITIZE (this);
132 if (unlikely (!c
->check_struct (this)))
133 return TRACE_RETURN (false);
135 if (unlikely (!c
->check_range (this, length
)))
137 /* Some broken fonts have too long of a "length" value.
138 * If that is the case, just change the value to truncate
139 * the subtable at the end of the blob. */
140 uint16_t new_length
= (uint16_t) MIN ((uintptr_t) 65535,
141 (uintptr_t) (c
->end
-
143 if (!c
->try_set (&length
, new_length
))
144 return TRACE_RETURN (false);
/* 4 * segCountX2 equals 8 * segCount, so this is the same
 * 16 + 8 * segCount that get_glyph subtracts from length; passing this
 * check keeps that subtraction from wrapping below zero. */
147 return TRACE_RETURN (16 + 4 * (unsigned int) segCountX2
<= length
);
151 USHORT format
; /* Format number is set to 4. */
152 USHORT length
; /* This is the length in bytes of the
154 USHORT languageZ
; /* Ignore. */
155 USHORT segCountX2
; /* 2 x segCount. */
156 USHORT searchRangeZ
; /* 2 * (2**floor(log2(segCount))) */
157 USHORT entrySelectorZ
; /* log2(searchRange/2) */
158 USHORT rangeShiftZ
; /* 2 x segCount - searchRange */
/* NOTE(review): the declarations below use segCount and VAR as array
 * bounds, so they read as a description of the on-disk layout rather than
 * as live members; get_glyph reaches the same data through values.  The
 * lines that would establish this are not visible in this excerpt. */
162 USHORT endCount
[segCount
]; /* End characterCode for each segment,
164 USHORT reservedPad
; /* Set to 0. */
165 USHORT startCount
[segCount
]; /* Start character code for each segment. */
166 SHORT idDelta
[segCount
]; /* Delta for all character codes in segment. */
167 USHORT idRangeOffset
[segCount
];/* Offsets into glyphIdArray or 0 */
168 USHORT glyphIdArray
[VAR
]; /* Glyph index array (arbitrary length) */
/* 14 bytes of fixed header (seven USHORT fields, assuming a 2-byte USHORT)
 * ahead of the variable-length values array.
 * NOTE(review): the declaration of values is not visible in this excerpt. */
172 DEFINE_SIZE_ARRAY (14, values
);
/* One group record: a character code range plus a glyph id.  Formats 12
 * and 13 are declared friends, presumably so that their group_get_glyph
 * helpers can read the fields directly. */
175 struct CmapSubtableLongGroup
177 friend struct CmapSubtableFormat12
;
178 friend struct CmapSubtableFormat13
;
/* Three-way comparison of codepoint against the inclusive range
 * startCharCode..endCharCode: -1 when below the range, +1 when above.
 * NOTE(review): the in-range return is not visible in this excerpt. */
180 int cmp (hb_codepoint_t codepoint
) const
182 if (codepoint
< startCharCode
) return -1;
183 if (codepoint
> endCharCode
) return +1;
/* Fixed-size record, so sanitization is just c->check_struct (this). */
187 inline bool sanitize (hb_sanitize_context_t
*c
) const
189 TRACE_SANITIZE (this);
190 return TRACE_RETURN (c
->check_struct (this));
194 ULONG startCharCode
; /* First character code in this group. */
195 ULONG endCharCode
; /* Last character code in this group. */
196 ULONG glyphID
; /* Glyph index; interpretation depends on
197 * subtable format. */
/* Three ULONG fields (12 bytes assumes a 4-byte ULONG -- TODO confirm). */
199 DEFINE_SIZE_STATIC (12);
/* Trimmed mapping shared by formats 6 and 10: one contiguous run of glyph
 * ids starting at startCharCode.  UINT selects the integer type used for
 * every header field and for the array length. */
202 template <typename UINT
>
203 struct CmapSubtableTrimmed
/* Indexes glyphIdArray with codepoint - startCharCode.  No explicit range
 * test is made here; see the comment on the lookup below.
 * NOTE(review): the statements that store into *glyph and compute the
 * return value are not visible in this excerpt. */
205 inline bool get_glyph (hb_codepoint_t codepoint
, hb_codepoint_t
*glyph
) const
207 /* Rely on our implicit array bound-checking. */
208 hb_codepoint_t gid
= glyphIdArray
[codepoint
- startCharCode
];
/* Checks the fixed header, then lets glyphIdArray sanitize itself. */
215 inline bool sanitize (hb_sanitize_context_t
*c
) const
217 TRACE_SANITIZE (this);
218 return TRACE_RETURN (c
->check_struct (this) && glyphIdArray
.sanitize (c
));
222 UINT formatReserved
; /* Subtable format and (maybe) padding. */
223 UINT lengthZ
; /* Byte length of this subtable. */
224 UINT languageZ
; /* Ignore. */
225 UINT startCharCode
; /* First character code covered. */
226 ArrayOf
<GlyphID
, UINT
>
227 glyphIdArray
; /* Array of glyph index values for character
228 * codes in the range. */
/* Minimum size is five UINT-sized units: the four fields above plus,
 * presumably, the element count stored by ArrayOf -- TODO confirm. */
230 DEFINE_SIZE_ARRAY (5 * sizeof (UINT
), glyphIdArray
);
/* Format 6: the trimmed mapping instantiated with USHORT-sized fields.
 * Adds nothing to CmapSubtableTrimmed. */
233 struct CmapSubtableFormat6
: CmapSubtableTrimmed
<USHORT
> {};
/* Format 10: the trimmed mapping instantiated with ULONG-sized fields.
 * Adds nothing to CmapSubtableTrimmed. */
234 struct CmapSubtableFormat10
: CmapSubtableTrimmed
<ULONG
> {};
/* Shared implementation for the group-based formats 12 and 13.  The
 * derived type T is passed back in as the template argument and must
 * provide a static group_get_glyph (group, codepoint). */
236 template <typename T
>
237 struct CmapSubtableLongSegmented
/* Binary-searches groups for codepoint and lets T::group_get_glyph turn
 * the matching group into a glyph id, stored through glyph.
 * NOTE(review): the handling of a failed search and the return statements
 * are not visible in this excerpt. */
239 inline bool get_glyph (hb_codepoint_t codepoint
, hb_codepoint_t
*glyph
) const
241 int i
= groups
.bsearch (codepoint
);
244 *glyph
= T::group_get_glyph (groups
[i
], codepoint
);
/* Checks the fixed header, then lets the groups array sanitize itself. */
248 inline bool sanitize (hb_sanitize_context_t
*c
) const
250 TRACE_SANITIZE (this);
251 return TRACE_RETURN (c
->check_struct (this) && groups
.sanitize (c
));
255 USHORT format
; /* Subtable format; set to 12 or 13. */
256 USHORT reservedZ
; /* Reserved; set to 0. */
257 ULONG lengthZ
; /* Byte length of this subtable. */
258 ULONG languageZ
; /* Ignore. */
259 SortedArrayOf
<CmapSubtableLongGroup
, ULONG
>
260 groups
; /* Groupings. */
/* 16 = 2 + 2 + 4 + 4 bytes of header plus, presumably, the 4-byte element
 * count of groups -- TODO confirm the integer widths. */
262 DEFINE_SIZE_ARRAY (16, groups
);
/* Format 12: each group maps a run of codepoints onto a run of
 * consecutive glyph ids. */
265 struct CmapSubtableFormat12
: CmapSubtableLongSegmented
<CmapSubtableFormat12
>
/* Glyph id for u is the group glyphID advanced by the distance of u from
 * the group startCharCode.
 * NOTE(review): the line declaring the second parameter (u) is not visible
 * in this excerpt. */
267 static inline hb_codepoint_t
group_get_glyph (const CmapSubtableLongGroup
&group
,
269 { return group
.glyphID
+ (u
- group
.startCharCode
); }
/* Format 13: every codepoint in a group maps to the same glyph id. */
272 struct CmapSubtableFormat13
: CmapSubtableLongSegmented
<CmapSubtableFormat13
>
/* Returns the group glyphID unchanged; the codepoint u is deliberately
 * unused (marked HB_UNUSED). */
274 static inline hb_codepoint_t
group_get_glyph (const CmapSubtableLongGroup
&group
,
275 hb_codepoint_t u HB_UNUSED
)
276 { return group
.glyphID
; }
/* Result codes of the variation-selector lookups (the enum header line is
 * not visible in this excerpt; the type is used below as glyph_variant_t).
 * As used by VariationSelectorRecord::get_glyph:
 *   NOT_FOUND    returned when neither UVS table produced a result,
 *   FOUND        returned after a glyph id was stored from the
 *                non-default UVS table,
 *   USE_DEFAULT  returned on the default UVS table path. */
281 GLYPH_VARIANT_NOT_FOUND
= 0,
282 GLYPH_VARIANT_FOUND
= 1,
283 GLYPH_VARIANT_USE_DEFAULT
= 2
/* A run of consecutive Unicode values: startUnicodeValue followed by
 * additionalCount more values. */
286 struct UnicodeValueRange
/* Three-way comparison of codepoint against the inclusive range
 * startUnicodeValue .. startUnicodeValue + additionalCount: -1 when below,
 * +1 when above.
 * NOTE(review): the in-range return is not visible in this excerpt. */
288 inline int cmp (const hb_codepoint_t
&codepoint
) const
290 if (codepoint
< startUnicodeValue
) return -1;
291 if (codepoint
> startUnicodeValue
+ additionalCount
) return +1;
/* Fixed-size record, so sanitization is just c->check_struct (this). */
295 inline bool sanitize (hb_sanitize_context_t
*c
) const
297 TRACE_SANITIZE (this);
298 return TRACE_RETURN (c
->check_struct (this));
/* Static size of 4 (declared below) = UINT24 + BYTE, assuming 3 and 1
 * bytes respectively -- TODO confirm. */
301 UINT24 startUnicodeValue
; /* First value in this range. */
302 BYTE additionalCount
; /* Number of additional values in this
305 DEFINE_SIZE_STATIC (4);
// Default UVS table: a sorted array of UnicodeValueRange entries, with
// ULONG passed as the second SortedArrayOf template argument.
308 typedef SortedArrayOf
<UnicodeValueRange
, ULONG
> DefaultUVS
;
// Record pairing a base Unicode value with a glyph id.  The struct header
// line is not visible in this excerpt; the name UVSMapping is taken from
// the NonDefaultUVS typedef that follows.
//
// cmp: orders this record against codepoint by delegating to
// unicodeValue.cmp.
312 inline int cmp (const hb_codepoint_t
&codepoint
) const
314 return unicodeValue
.cmp (codepoint
);
// sanitize: fixed-size record, so only c->check_struct (this) is needed.
317 inline bool sanitize (hb_sanitize_context_t
*c
) const
319 TRACE_SANITIZE (this);
320 return TRACE_RETURN (c
->check_struct (this));
323 UINT24 unicodeValue
; /* Base Unicode value of the UVS */
324 GlyphID glyphID
; /* Glyph ID of the UVS */
// 5 = UINT24 + GlyphID, assuming 3 and 2 bytes respectively -- TODO confirm.
326 DEFINE_SIZE_STATIC (5);
/* Non-default UVS table: a sorted array of UVSMapping entries, with ULONG
 * passed as the second SortedArrayOf template argument. */
329 typedef SortedArrayOf
<UVSMapping
, ULONG
> NonDefaultUVS
;
/* One record per variation selector, holding offsets to its default and
 * non-default UVS tables.  Both offsets are resolved relative to a base
 * pointer supplied by the caller. */
331 struct VariationSelectorRecord
/* Looks codepoint up for this variation selector.  The default UVS table
 * is searched first (leading to GLYPH_VARIANT_USE_DEFAULT), then the
 * non-default table (storing its glyphID through glyph and returning
 * GLYPH_VARIANT_FOUND); otherwise GLYPH_VARIANT_NOT_FOUND is returned.
 * NOTE(review): the conditions testing each bsearch result and the
 * declaration of i are not visible in this excerpt. */
333 inline glyph_variant_t
get_glyph (hb_codepoint_t codepoint
,
334 hb_codepoint_t
*glyph
,
335 const void *base
) const
338 const DefaultUVS
&defaults
= base
+defaultUVS
;
339 i
= defaults
.bsearch (codepoint
);
341 return GLYPH_VARIANT_USE_DEFAULT
;
342 const NonDefaultUVS
&nonDefaults
= base
+nonDefaultUVS
;
343 i
= nonDefaults
.bsearch (codepoint
);
346 *glyph
= nonDefaults
[i
].glyphID
;
347 return GLYPH_VARIANT_FOUND
;
349 return GLYPH_VARIANT_NOT_FOUND
;
/* Orders this record against variation_selector by delegating to
 * varSelector.cmp. */
352 inline int cmp (const hb_codepoint_t
&variation_selector
) const
354 return varSelector
.cmp (variation_selector
);
/* Checks the fixed record, then both offset targets, each resolved against
 * the same base pointer. */
357 inline bool sanitize (hb_sanitize_context_t
*c
, const void *base
) const
359 TRACE_SANITIZE (this);
360 return TRACE_RETURN (c
->check_struct (this) &&
361 defaultUVS
.sanitize (c
, base
) &&
362 nonDefaultUVS
.sanitize (c
, base
));
365 UINT24 varSelector
; /* Variation selector. */
366 OffsetTo
<DefaultUVS
, ULONG
>
367 defaultUVS
; /* Offset to Default UVS Table. May be 0. */
368 OffsetTo
<NonDefaultUVS
, ULONG
>
369 nonDefaultUVS
; /* Offset to Non-Default UVS Table. May be 0. */
/* 11 = UINT24 + two ULONG-sized offsets, assuming 3 + 4 + 4 bytes --
 * TODO confirm. */
371 DEFINE_SIZE_STATIC (11);
/* cmap subtable format 14: Unicode variation sequences, stored as a sorted
 * array of per-selector records. */
374 struct CmapSubtableFormat14
/* Finds the record for variation_selector and asks it for the glyph of
 * codepoint, passing this as the base for the record offsets.
 * NOTE(review): the bsearch result is used as an index with no visible
 * not-found check.  That appears to depend on the array type coping with an
 * out-of-range index, as the bound-checking remark in
 * CmapSubtableTrimmed::get_glyph suggests -- confirm. */
376 inline glyph_variant_t
get_glyph_variant (hb_codepoint_t codepoint
,
377 hb_codepoint_t variation_selector
,
378 hb_codepoint_t
*glyph
) const
380 return record
[record
.bsearch(variation_selector
)].get_glyph (codepoint
, glyph
, this);
/* Checks the fixed header, then sanitizes every record with this subtable
 * as the base for its offsets. */
383 inline bool sanitize (hb_sanitize_context_t
*c
) const
385 TRACE_SANITIZE (this);
386 return TRACE_RETURN (c
->check_struct (this) &&
387 record
.sanitize (c
, this));
391 USHORT format
; /* Format number is set to 14. */
392 ULONG lengthZ
; /* Byte length of this subtable. */
393 SortedArrayOf
<VariationSelectorRecord
, ULONG
>
394 record
; /* Variation selector records; sorted
395 * in increasing order of `varSelector'. */
/* 10 = 2 + 4 bytes of header plus, presumably, the 4-byte element count of
 * record -- TODO confirm the integer widths. */
397 DEFINE_SIZE_ARRAY (10, record
);
/* Format-dispatching wrapper over all supported subtable formats.  The
 * struct header, the switch statements and the union header are not visible
 * in this excerpt; the name CmapSubtable is taken from
 * EncodingRecord::subtable. */
402 /* Note: We intentionally do NOT implement subtable formats 2 and 8. */
/* Plain codepoint lookup, forwarded to formats 0, 4, 6, 10, 12 and 13.
 * Any format without a forwarding case here yields false. */
404 inline bool get_glyph (hb_codepoint_t codepoint
,
405 hb_codepoint_t
*glyph
) const
408 case 0: return u
.format0
.get_glyph(codepoint
, glyph
);
409 case 4: return u
.format4
.get_glyph(codepoint
, glyph
);
410 case 6: return u
.format6
.get_glyph(codepoint
, glyph
);
411 case 10: return u
.format10
.get_glyph(codepoint
, glyph
);
412 case 12: return u
.format12
.get_glyph(codepoint
, glyph
);
413 case 13: return u
.format13
.get_glyph(codepoint
, glyph
);
415 default: return false;
/* Variation-sequence lookup; only format 14 implements it, every other
 * format reports GLYPH_VARIANT_NOT_FOUND. */
419 inline glyph_variant_t
get_glyph_variant (hb_codepoint_t codepoint
,
420 hb_codepoint_t variation_selector
,
421 hb_codepoint_t
*glyph
) const
424 case 14: return u
.format14
.get_glyph_variant(codepoint
, variation_selector
, glyph
);
425 default: return GLYPH_VARIANT_NOT_FOUND
;
/* Sanitizes the format field first, then the matching subtable.  Formats
 * without a case here are accepted as-is (default returns true); get_glyph
 * and get_glyph_variant never read their contents. */
429 inline bool sanitize (hb_sanitize_context_t
*c
) const
431 TRACE_SANITIZE (this);
432 if (!u
.format
.sanitize (c
)) return TRACE_RETURN (false);
434 case 0: return TRACE_RETURN (u
.format0
.sanitize (c
));
435 case 4: return TRACE_RETURN (u
.format4
.sanitize (c
));
436 case 6: return TRACE_RETURN (u
.format6
.sanitize (c
));
437 case 10: return TRACE_RETURN (u
.format10
.sanitize (c
));
438 case 12: return TRACE_RETURN (u
.format12
.sanitize (c
));
439 case 13: return TRACE_RETURN (u
.format13
.sanitize (c
));
440 case 14: return TRACE_RETURN (u
.format14
.sanitize (c
));
441 default:return TRACE_RETURN (true);
/* Members of u, one per supported format, alongside the shared leading
 * format field. */
447 USHORT format
; /* Format identifier */
448 CmapSubtableFormat0 format0
;
449 CmapSubtableFormat4 format4
;
450 CmapSubtableFormat6 format6
;
451 CmapSubtableFormat10 format10
;
452 CmapSubtableFormat12 format12
;
453 CmapSubtableFormat13 format13
;
454 CmapSubtableFormat14 format14
;
/* Minimum size 2: just the format field. */
457 DEFINE_SIZE_UNION (2, format
);
/* Directory entry of the cmap table: a (platformID, encodingID) pair and
 * the offset of the subtable that serves it. */
461 struct EncodingRecord
/* Compares against other by platformID and then by encodingID.
 * NOTE(review): the declaration of ret, the early exit between the two
 * comparisons and the return statement are not visible in this excerpt. */
463 inline int cmp (const EncodingRecord
&other
) const
466 ret
= platformID
.cmp (other
.platformID
);
468 ret
= encodingID
.cmp (other
.encodingID
);
/* Checks the fixed record, then the subtable the offset points at, with
 * the offset resolved against base. */
473 inline bool sanitize (hb_sanitize_context_t
*c
, const void *base
) const
475 TRACE_SANITIZE (this);
476 return TRACE_RETURN (c
->check_struct (this) &&
477 subtable
.sanitize (c
, base
));
480 USHORT platformID
; /* Platform ID. */
481 USHORT encodingID
; /* Platform-specific encoding ID. */
482 OffsetTo
<CmapSubtable
, ULONG
>
483 subtable
; /* Byte offset from beginning of table to the subtable for this encoding. */
/* 8 = two USHORT ids plus a ULONG-sized offset, assuming 2 + 2 + 4 bytes --
 * TODO confirm. */
485 DEFINE_SIZE_STATIC (8);
/* Top-level cmap table: a version number and the list of encoding records.
 * The struct header line is not visible in this excerpt. */
490 static const hb_tag_t tableTag
= HB_OT_TAG_cmap
;
/* Returns a pointer to the subtable registered for the given
 * (platform_id, encoding_id) pair.  The record list is searched linearly,
 * so fonts whose list is not sorted are still handled.
 * NOTE(review): the declaration of key and the statement executed when no
 * record matches, or when the matching record has a zero subtable offset,
 * are not visible in this excerpt. */
492 inline const CmapSubtable
*find_subtable (unsigned int platform_id
,
493 unsigned int encoding_id
) const
496 key
.platformID
.set (platform_id
);
497 key
.encodingID
.set (encoding_id
);
499 /* Note: We can use bsearch, but since it has no performance
500 * implications, we use lsearch and as such accept fonts with
501 * unsorted subtable list. */
502 int result
= encodingRecord
./*bsearch*/lsearch (key
);
503 if (result
== -1 || !encodingRecord
[result
].subtable
)
/* Subtable offsets are relative to the start of the cmap table (this). */
506 return &(this+encodingRecord
[result
].subtable
);
/* Accepts only version 0 tables, and sanitizes every encoding record with
 * this table as the base for its subtable offset. */
509 inline bool sanitize (hb_sanitize_context_t
*c
) const
511 TRACE_SANITIZE (this);
512 return TRACE_RETURN (c
->check_struct (this) &&
513 likely (version
== 0) &&
514 encodingRecord
.sanitize (c
, this));
517 USHORT version
; /* Table version number (0). */
518 SortedArrayOf
<EncodingRecord
>
519 encodingRecord
; /* Encoding tables. */
/* 4 = USHORT version plus, presumably, a 2-byte element count for
 * encodingRecord -- TODO confirm. */
521 DEFINE_SIZE_ARRAY (4, encodingRecord
);
528 #endif /* HB_OT_CMAP_TABLE_HH */