1/*
2 * Copyright © 2011,2012 Google, Inc.
3 *
4 * This is part of HarfBuzz, a text shaping library.
5 *
6 * Permission is hereby granted, without written agreement and without
7 * license or royalty fees, to use, copy, modify, and distribute this
8 * software and its documentation for any purpose, provided that the
9 * above copyright notice and the following two paragraphs appear in
10 * all copies of this software.
11 *
12 * IN NO EVENT SHALL THE COPYRIGHT HOLDER BE LIABLE TO ANY PARTY FOR
13 * DIRECT, INDIRECT, SPECIAL, INCIDENTAL, OR CONSEQUENTIAL DAMAGES
14 * ARISING OUT OF THE USE OF THIS SOFTWARE AND ITS DOCUMENTATION, EVEN
15 * IF THE COPYRIGHT HOLDER HAS BEEN ADVISED OF THE POSSIBILITY OF SUCH
16 * DAMAGE.
17 *
18 * THE COPYRIGHT HOLDER SPECIFICALLY DISCLAIMS ANY WARRANTIES, INCLUDING,
19 * BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND
20 * FITNESS FOR A PARTICULAR PURPOSE. THE SOFTWARE PROVIDED HEREUNDER IS
21 * ON AN "AS IS" BASIS, AND THE COPYRIGHT HOLDER HAS NO OBLIGATION TO
22 * PROVIDE MAINTENANCE, SUPPORT, UPDATES, ENHANCEMENTS, OR MODIFICATIONS.
23 *
24 * Google Author(s): Behdad Esfahbod
25 */
26
27#include "hb-ot-shape-fallback-private.hh"
28#include "hb-ot-layout-gsubgpos-private.hh"
29
30static unsigned int
31recategorize_combining_class (hb_codepoint_t u,
32 unsigned int klass)
33{
34 if (klass >= 200)
35 return klass;
36
37 /* Thai / Lao need some per-character work. */
38 if ((u & ~0xFF) == 0x0E00u)
39 {
40 if (unlikely (klass == 0))
41 {
42 switch (u)
43 {
44 case 0x0E31u:
45 case 0x0E34u:
46 case 0x0E35u:
47 case 0x0E36u:
48 case 0x0E37u:
49 case 0x0E47u:
50 case 0x0E4Cu:
51 case 0x0E4Du:
52 case 0x0E4Eu:
53 klass = HB_UNICODE_COMBINING_CLASS_ABOVE_RIGHT;
54 break;
55
56 case 0x0EB1u:
57 case 0x0EB4u:
58 case 0x0EB5u:
59 case 0x0EB6u:
60 case 0x0EB7u:
61 case 0x0EBBu:
62 case 0x0ECCu:
63 case 0x0ECDu:
64 klass = HB_UNICODE_COMBINING_CLASS_ABOVE;
65 break;
66
67 case 0x0EBCu:
68 klass = HB_UNICODE_COMBINING_CLASS_BELOW;
69 break;
70 }
71 } else {
72 /* Thai virama is below-right */
73 if (u == 0x0E3Au)
74 klass = HB_UNICODE_COMBINING_CLASS_BELOW_RIGHT;
75 }
76 }
77
78 switch (klass)
79 {
80
81 /* Hebrew */
82
83 case HB_MODIFIED_COMBINING_CLASS_CCC10: /* sheva */
84 case HB_MODIFIED_COMBINING_CLASS_CCC11: /* hataf segol */
85 case HB_MODIFIED_COMBINING_CLASS_CCC12: /* hataf patah */
86 case HB_MODIFIED_COMBINING_CLASS_CCC13: /* hataf qamats */
87 case HB_MODIFIED_COMBINING_CLASS_CCC14: /* hiriq */
88 case HB_MODIFIED_COMBINING_CLASS_CCC15: /* tsere */
89 case HB_MODIFIED_COMBINING_CLASS_CCC16: /* segol */
90 case HB_MODIFIED_COMBINING_CLASS_CCC17: /* patah */
91 case HB_MODIFIED_COMBINING_CLASS_CCC18: /* qamats */
92 case HB_MODIFIED_COMBINING_CLASS_CCC20: /* qubuts */
93 case HB_MODIFIED_COMBINING_CLASS_CCC22: /* meteg */
94 return HB_UNICODE_COMBINING_CLASS_BELOW;
95
96 case HB_MODIFIED_COMBINING_CLASS_CCC23: /* rafe */
97 return HB_UNICODE_COMBINING_CLASS_ATTACHED_ABOVE;
98
99 case HB_MODIFIED_COMBINING_CLASS_CCC24: /* shin dot */
100 return HB_UNICODE_COMBINING_CLASS_ABOVE_RIGHT;
101
102 case HB_MODIFIED_COMBINING_CLASS_CCC25: /* sin dot */
103 case HB_MODIFIED_COMBINING_CLASS_CCC19: /* holam */
104 return HB_UNICODE_COMBINING_CLASS_ABOVE_LEFT;
105
106 case HB_MODIFIED_COMBINING_CLASS_CCC26: /* point varika */
107 return HB_UNICODE_COMBINING_CLASS_ABOVE;
108
109 case HB_MODIFIED_COMBINING_CLASS_CCC21: /* dagesh */
110 break;
111
112
113 /* Arabic and Syriac */
114
115 case HB_MODIFIED_COMBINING_CLASS_CCC27: /* fathatan */
116 case HB_MODIFIED_COMBINING_CLASS_CCC28: /* dammatan */
117 case HB_MODIFIED_COMBINING_CLASS_CCC30: /* fatha */
118 case HB_MODIFIED_COMBINING_CLASS_CCC31: /* damma */
119 case HB_MODIFIED_COMBINING_CLASS_CCC33: /* shadda */
120 case HB_MODIFIED_COMBINING_CLASS_CCC34: /* sukun */
121 case HB_MODIFIED_COMBINING_CLASS_CCC35: /* superscript alef */
122 case HB_MODIFIED_COMBINING_CLASS_CCC36: /* superscript alaph */
123 return HB_UNICODE_COMBINING_CLASS_ABOVE;
124
125 case HB_MODIFIED_COMBINING_CLASS_CCC29: /* kasratan */
126 case HB_MODIFIED_COMBINING_CLASS_CCC32: /* kasra */
127 return HB_UNICODE_COMBINING_CLASS_BELOW;
128
129
130 /* Thai */
131
132 case HB_MODIFIED_COMBINING_CLASS_CCC103: /* sara u / sara uu */
133 return HB_UNICODE_COMBINING_CLASS_BELOW_RIGHT;
134
135 case HB_MODIFIED_COMBINING_CLASS_CCC107: /* mai */
136 return HB_UNICODE_COMBINING_CLASS_ABOVE_RIGHT;
137
138
139 /* Lao */
140
141 case HB_MODIFIED_COMBINING_CLASS_CCC118: /* sign u / sign uu */
142 return HB_UNICODE_COMBINING_CLASS_BELOW;
143
144 case HB_MODIFIED_COMBINING_CLASS_CCC122: /* mai */
145 return HB_UNICODE_COMBINING_CLASS_ABOVE;
146
147
148 /* Tibetan */
149
150 case HB_MODIFIED_COMBINING_CLASS_CCC129: /* sign aa */
151 return HB_UNICODE_COMBINING_CLASS_BELOW;
152
153 case HB_MODIFIED_COMBINING_CLASS_CCC130: /* sign i*/
154 return HB_UNICODE_COMBINING_CLASS_ABOVE;
155
156 case HB_MODIFIED_COMBINING_CLASS_CCC132: /* sign u */
157 return HB_UNICODE_COMBINING_CLASS_BELOW;
158
159 }
160
161 return klass;
162}
163
164void
165_hb_ot_shape_fallback_position_recategorize_marks (const hb_ot_shape_plan_t *plan HB_UNUSED,
166 hb_font_t *font HB_UNUSED,
167 hb_buffer_t *buffer)
168{
169 unsigned int count = buffer->len;
170 hb_glyph_info_t *info = buffer->info;
171 for (unsigned int i = 0; i < count; i++)
172 if (_hb_glyph_info_get_general_category (info: &info[i]) == HB_UNICODE_GENERAL_CATEGORY_NON_SPACING_MARK) {
173 unsigned int combining_class = _hb_glyph_info_get_modified_combining_class (info: &info[i]);
174 combining_class = recategorize_combining_class (u: info[i].codepoint, klass: combining_class);
175 _hb_glyph_info_set_modified_combining_class (info: &info[i], modified_class: combining_class);
176 }
177}
178
179
180static void
181zero_mark_advances (hb_buffer_t *buffer,
182 unsigned int start,
183 unsigned int end)
184{
185 hb_glyph_info_t *info = buffer->info;
186 for (unsigned int i = start; i < end; i++)
187 if (_hb_glyph_info_get_general_category (info: &info[i]) == HB_UNICODE_GENERAL_CATEGORY_NON_SPACING_MARK)
188 {
189 buffer->pos[i].x_advance = 0;
190 buffer->pos[i].y_advance = 0;
191 }
192}
193
194static inline void
195position_mark (const hb_ot_shape_plan_t *plan,
196 hb_font_t *font,
197 hb_buffer_t *buffer,
198 hb_glyph_extents_t &base_extents,
199 unsigned int i,
200 unsigned int combining_class)
201{
202 hb_glyph_extents_t mark_extents;
203 if (!font->get_glyph_extents (glyph: buffer->info[i].codepoint,
204 extents: &mark_extents))
205 return;
206
207 hb_position_t y_gap = font->y_scale / 16;
208
209 hb_glyph_position_t &pos = buffer->pos[i];
210 pos.x_offset = pos.y_offset = 0;
211
212
213 /* We don't position LEFT and RIGHT marks. */
214
215 /* X positioning */
216 switch (combining_class)
217 {
218 case HB_UNICODE_COMBINING_CLASS_DOUBLE_BELOW:
219 case HB_UNICODE_COMBINING_CLASS_DOUBLE_ABOVE:
220 if (buffer->props.direction == HB_DIRECTION_LTR) {
221 pos.x_offset += base_extents.x_bearing + base_extents.width - mark_extents.width / 2 - mark_extents.x_bearing;
222 break;
223 } else if (buffer->props.direction == HB_DIRECTION_RTL) {
224 pos.x_offset += base_extents.x_bearing - mark_extents.width / 2 - mark_extents.x_bearing;
225 break;
226 }
227 HB_FALLTHROUGH;
228
229 default:
230 case HB_UNICODE_COMBINING_CLASS_ATTACHED_BELOW:
231 case HB_UNICODE_COMBINING_CLASS_ATTACHED_ABOVE:
232 case HB_UNICODE_COMBINING_CLASS_BELOW:
233 case HB_UNICODE_COMBINING_CLASS_ABOVE:
234 /* Center align. */
235 pos.x_offset += base_extents.x_bearing + (base_extents.width - mark_extents.width) / 2 - mark_extents.x_bearing;
236 break;
237
238 case HB_UNICODE_COMBINING_CLASS_ATTACHED_BELOW_LEFT:
239 case HB_UNICODE_COMBINING_CLASS_BELOW_LEFT:
240 case HB_UNICODE_COMBINING_CLASS_ABOVE_LEFT:
241 /* Left align. */
242 pos.x_offset += base_extents.x_bearing - mark_extents.x_bearing;
243 break;
244
245 case HB_UNICODE_COMBINING_CLASS_ATTACHED_ABOVE_RIGHT:
246 case HB_UNICODE_COMBINING_CLASS_BELOW_RIGHT:
247 case HB_UNICODE_COMBINING_CLASS_ABOVE_RIGHT:
248 /* Right align. */
249 pos.x_offset += base_extents.x_bearing + base_extents.width - mark_extents.width - mark_extents.x_bearing;
250 break;
251 }
252
253 /* Y positioning */
254 switch (combining_class)
255 {
256 case HB_UNICODE_COMBINING_CLASS_DOUBLE_BELOW:
257 case HB_UNICODE_COMBINING_CLASS_BELOW_LEFT:
258 case HB_UNICODE_COMBINING_CLASS_BELOW:
259 case HB_UNICODE_COMBINING_CLASS_BELOW_RIGHT:
260 /* Add gap, fall-through. */
261 base_extents.height -= y_gap;
262 HB_FALLTHROUGH;
263
264 case HB_UNICODE_COMBINING_CLASS_ATTACHED_BELOW_LEFT:
265 case HB_UNICODE_COMBINING_CLASS_ATTACHED_BELOW:
266 pos.y_offset = base_extents.y_bearing + base_extents.height - mark_extents.y_bearing;
267 /* Never shift up "below" marks. */
268 if ((y_gap > 0) == (pos.y_offset > 0))
269 {
270 base_extents.height -= pos.y_offset;
271 pos.y_offset = 0;
272 }
273 base_extents.height += mark_extents.height;
274 break;
275
276 case HB_UNICODE_COMBINING_CLASS_DOUBLE_ABOVE:
277 case HB_UNICODE_COMBINING_CLASS_ABOVE_LEFT:
278 case HB_UNICODE_COMBINING_CLASS_ABOVE:
279 case HB_UNICODE_COMBINING_CLASS_ABOVE_RIGHT:
280 /* Add gap, fall-through. */
281 base_extents.y_bearing += y_gap;
282 base_extents.height -= y_gap;
283 HB_FALLTHROUGH;
284
285 case HB_UNICODE_COMBINING_CLASS_ATTACHED_ABOVE:
286 case HB_UNICODE_COMBINING_CLASS_ATTACHED_ABOVE_RIGHT:
287 pos.y_offset = base_extents.y_bearing - (mark_extents.y_bearing + mark_extents.height);
288 /* Don't shift down "above" marks too much. */
289 if ((y_gap > 0) != (pos.y_offset > 0))
290 {
291 unsigned int correction = -pos.y_offset / 2;
292 base_extents.y_bearing += correction;
293 base_extents.height -= correction;
294 pos.y_offset += correction;
295 }
296 base_extents.y_bearing -= mark_extents.height;
297 base_extents.height += mark_extents.height;
298 break;
299 }
300}
301
302static inline void
303position_around_base (const hb_ot_shape_plan_t *plan,
304 hb_font_t *font,
305 hb_buffer_t *buffer,
306 unsigned int base,
307 unsigned int end)
308{
309 hb_direction_t horiz_dir = HB_DIRECTION_INVALID;
310
311 buffer->unsafe_to_break (start: base, end);
312
313 hb_glyph_extents_t base_extents;
314 if (!font->get_glyph_extents (glyph: buffer->info[base].codepoint,
315 extents: &base_extents))
316 {
317 /* If extents don't work, zero marks and go home. */
318 zero_mark_advances (buffer, start: base + 1, end);
319 return;
320 }
321 base_extents.x_bearing += buffer->pos[base].x_offset;
322 base_extents.y_bearing += buffer->pos[base].y_offset;
323
324 unsigned int lig_id = _hb_glyph_info_get_lig_id (info: &buffer->info[base]);
325 unsigned int num_lig_components = _hb_glyph_info_get_lig_num_comps (info: &buffer->info[base]);
326
327 hb_position_t x_offset = 0, y_offset = 0;
328 if (HB_DIRECTION_IS_FORWARD (buffer->props.direction)) {
329 x_offset -= buffer->pos[base].x_advance;
330 y_offset -= buffer->pos[base].y_advance;
331 }
332
333 hb_glyph_extents_t component_extents = base_extents;
334 unsigned int last_lig_component = (unsigned int) -1;
335 unsigned int last_combining_class = 255;
336 hb_glyph_extents_t cluster_extents = base_extents; /* Initialization is just to shut gcc up. */
337 hb_glyph_info_t *info = buffer->info;
338 for (unsigned int i = base + 1; i < end; i++)
339 if (_hb_glyph_info_get_modified_combining_class (info: &info[i]))
340 {
341 if (num_lig_components > 1) {
342 unsigned int this_lig_id = _hb_glyph_info_get_lig_id (info: &info[i]);
343 unsigned int this_lig_component = _hb_glyph_info_get_lig_comp (info: &info[i]) - 1;
344 /* Conditions for attaching to the last component. */
345 if (!lig_id || lig_id != this_lig_id || this_lig_component >= num_lig_components)
346 this_lig_component = num_lig_components - 1;
347 if (last_lig_component != this_lig_component)
348 {
349 last_lig_component = this_lig_component;
350 last_combining_class = 255;
351 component_extents = base_extents;
352 if (unlikely (horiz_dir == HB_DIRECTION_INVALID)) {
353 if (HB_DIRECTION_IS_HORIZONTAL (plan->props.direction))
354 horiz_dir = plan->props.direction;
355 else
356 horiz_dir = hb_script_get_horizontal_direction (script: plan->props.script);
357 }
358 if (horiz_dir == HB_DIRECTION_LTR)
359 component_extents.x_bearing += (this_lig_component * component_extents.width) / num_lig_components;
360 else
361 component_extents.x_bearing += ((num_lig_components - 1 - this_lig_component) * component_extents.width) / num_lig_components;
362 component_extents.width /= num_lig_components;
363 }
364 }
365
366 unsigned int this_combining_class = _hb_glyph_info_get_modified_combining_class (info: &info[i]);
367 if (last_combining_class != this_combining_class)
368 {
369 last_combining_class = this_combining_class;
370 cluster_extents = component_extents;
371 }
372
373 position_mark (plan, font, buffer, base_extents&: cluster_extents, i, combining_class: this_combining_class);
374
375 buffer->pos[i].x_advance = 0;
376 buffer->pos[i].y_advance = 0;
377 buffer->pos[i].x_offset += x_offset;
378 buffer->pos[i].y_offset += y_offset;
379
380 } else {
381 if (HB_DIRECTION_IS_FORWARD (buffer->props.direction)) {
382 x_offset -= buffer->pos[i].x_advance;
383 y_offset -= buffer->pos[i].y_advance;
384 } else {
385 x_offset += buffer->pos[i].x_advance;
386 y_offset += buffer->pos[i].y_advance;
387 }
388 }
389}
390
391static inline void
392position_cluster (const hb_ot_shape_plan_t *plan,
393 hb_font_t *font,
394 hb_buffer_t *buffer,
395 unsigned int start,
396 unsigned int end)
397{
398 if (end - start < 2)
399 return;
400
401 /* Find the base glyph */
402 hb_glyph_info_t *info = buffer->info;
403 for (unsigned int i = start; i < end; i++)
404 if (!HB_UNICODE_GENERAL_CATEGORY_IS_MARK (_hb_glyph_info_get_general_category (&info[i])))
405 {
406 /* Find mark glyphs */
407 unsigned int j;
408 for (j = i + 1; j < end; j++)
409 if (!HB_UNICODE_GENERAL_CATEGORY_IS_MARK (_hb_glyph_info_get_general_category (&info[j])))
410 break;
411
412 position_around_base (plan, font, buffer, base: i, end: j);
413
414 i = j - 1;
415 }
416}
417
418void
419_hb_ot_shape_fallback_position (const hb_ot_shape_plan_t *plan,
420 hb_font_t *font,
421 hb_buffer_t *buffer)
422{
423 _hb_buffer_assert_gsubgpos_vars (buffer);
424
425 unsigned int start = 0;
426 unsigned int count = buffer->len;
427 hb_glyph_info_t *info = buffer->info;
428 for (unsigned int i = 1; i < count; i++)
429 if (likely (!HB_UNICODE_GENERAL_CATEGORY_IS_MARK (_hb_glyph_info_get_general_category (&info[i])))) {
430 position_cluster (plan, font, buffer, start, end: i);
431 start = i;
432 }
433 position_cluster (plan, font, buffer, start, end: count);
434}
435
436
437/* Performs old-style TrueType kerning. */
438void
439_hb_ot_shape_fallback_kern (const hb_ot_shape_plan_t *plan,
440 hb_font_t *font,
441 hb_buffer_t *buffer)
442{
443 if (!plan->has_kern) return;
444
445 OT::hb_apply_context_t c (1, font, buffer);
446 c.set_lookup_mask (plan->kern_mask);
447 c.set_lookup_props (OT::LookupFlag::IgnoreMarks);
448 OT::hb_apply_context_t::skipping_iterator_t &skippy_iter = c.iter_input;
449 skippy_iter.init (c_: &c);
450
451 unsigned int count = buffer->len;
452 hb_glyph_info_t *info = buffer->info;
453 hb_glyph_position_t *pos = buffer->pos;
454 for (unsigned int idx = 0; idx < count;)
455 {
456 skippy_iter.reset (start_index_: idx, num_items_: 1);
457 if (!skippy_iter.next ())
458 {
459 idx++;
460 continue;
461 }
462
463 hb_position_t x_kern, y_kern;
464 font->get_glyph_kerning_for_direction (first_glyph: info[idx].codepoint,
465 second_glyph: info[skippy_iter.idx].codepoint,
466 direction: buffer->props.direction,
467 x: &x_kern, y: &y_kern);
468
469 if (x_kern)
470 {
471 hb_position_t kern1 = x_kern >> 1;
472 hb_position_t kern2 = x_kern - kern1;
473 pos[idx].x_advance += kern1;
474 pos[skippy_iter.idx].x_advance += kern2;
475 pos[skippy_iter.idx].x_offset += kern2;
476 }
477
478 if (y_kern)
479 {
480 hb_position_t kern1 = y_kern >> 1;
481 hb_position_t kern2 = y_kern - kern1;
482 pos[idx].y_advance += kern1;
483 pos[skippy_iter.idx].y_advance += kern2;
484 pos[skippy_iter.idx].y_offset += kern2;
485 }
486
487 idx = skippy_iter.idx;
488 }
489}
490
491
492/* Adjusts width of various spaces. */
493void
494_hb_ot_shape_fallback_spaces (const hb_ot_shape_plan_t *plan,
495 hb_font_t *font,
496 hb_buffer_t *buffer)
497{
498 if (!HB_DIRECTION_IS_HORIZONTAL (buffer->props.direction))
499 return;
500
501 hb_glyph_info_t *info = buffer->info;
502 hb_glyph_position_t *pos = buffer->pos;
503 unsigned int count = buffer->len;
504 for (unsigned int i = 0; i < count; i++)
505 if (_hb_glyph_info_is_unicode_space (info: &info[i]) && !_hb_glyph_info_ligated (info: &info[i]))
506 {
507 hb_unicode_funcs_t::space_t space_type = _hb_glyph_info_get_unicode_space_fallback_type (info: &info[i]);
508 hb_codepoint_t glyph;
509 typedef hb_unicode_funcs_t t;
510 switch (space_type)
511 {
512 case t::NOT_SPACE: /* Shouldn't happen. */
513 case t::SPACE:
514 break;
515
516 case t::SPACE_EM:
517 case t::SPACE_EM_2:
518 case t::SPACE_EM_3:
519 case t::SPACE_EM_4:
520 case t::SPACE_EM_5:
521 case t::SPACE_EM_6:
522 case t::SPACE_EM_16:
523 pos[i].x_advance = (font->x_scale + ((int) space_type)/2) / (int) space_type;
524 break;
525
526 case t::SPACE_4_EM_18:
527 pos[i].x_advance = font->x_scale * 4 / 18;
528 break;
529
530 case t::SPACE_FIGURE:
531 for (char u = '0'; u <= '9'; u++)
532 if (font->get_nominal_glyph (unicode: u, glyph: &glyph))
533 {
534 pos[i].x_advance = font->get_glyph_h_advance (glyph);
535 break;
536 }
537 break;
538
539 case t::SPACE_PUNCTUATION:
540 if (font->get_nominal_glyph (unicode: '.', glyph: &glyph))
541 pos[i].x_advance = font->get_glyph_h_advance (glyph);
542 else if (font->get_nominal_glyph (unicode: ',', glyph: &glyph))
543 pos[i].x_advance = font->get_glyph_h_advance (glyph);
544 break;
545
546 case t::SPACE_NARROW:
547 /* Half-space?
548 * Unicode doc http://www.unicode.org/charts/PDF/U2000.pdf says ~1/4 or 1/5 of EM.
549 * However, in my testing, many fonts have their regular space being about that
550 * size. To me, a percentage of the space width makes more sense. Half is as
551 * good as any. */
552 pos[i].x_advance /= 2;
553 break;
554 }
555 }
556}
557

source code of qtbase/src/3rdparty/harfbuzz-ng/src/hb-ot-shape-fallback.cc