fonts/shapers/
harfbuzz.rs

1/* This Source Code Form is subject to the terms of the Mozilla Public
2 * License, v. 2.0. If a copy of the MPL was not distributed with this
3 * file, You can obtain one at https://mozilla.org/MPL/2.0/. */
4
5#![expect(unsafe_code)]
6
7use std::os::raw::{c_char, c_int, c_uint, c_void};
8use std::sync::LazyLock;
9use std::{char, ptr};
10
11use app_units::Au;
12use euclid::default::Point2D;
13// Eventually we would like the shaper to be pluggable, as many operating systems have their own
14// shapers. For now, however, HarfBuzz is a hard dependency.
15use harfbuzz_sys::{
16    HB_BUFFER_CLUSTER_LEVEL_MONOTONE_CHARACTERS, HB_DIRECTION_LTR, HB_DIRECTION_RTL,
17    HB_MEMORY_MODE_READONLY, HB_OT_LAYOUT_BASELINE_TAG_HANGING,
18    HB_OT_LAYOUT_BASELINE_TAG_IDEO_EMBOX_BOTTOM_OR_LEFT, HB_OT_LAYOUT_BASELINE_TAG_ROMAN,
19    hb_blob_create, hb_blob_t, hb_bool_t, hb_buffer_add_utf8, hb_buffer_create, hb_buffer_destroy,
20    hb_buffer_get_glyph_infos, hb_buffer_get_glyph_positions, hb_buffer_get_length,
21    hb_buffer_set_cluster_level, hb_buffer_set_direction, hb_buffer_set_language,
22    hb_buffer_set_script, hb_buffer_t, hb_codepoint_t, hb_face_create_for_tables, hb_face_destroy,
23    hb_face_t, hb_feature_t, hb_font_create, hb_font_destroy, hb_font_funcs_create,
24    hb_font_funcs_set_glyph_h_advance_func, hb_font_funcs_set_nominal_glyph_func, hb_font_funcs_t,
25    hb_font_set_funcs, hb_font_set_ppem, hb_font_set_scale, hb_font_set_variations, hb_font_t,
26    hb_glyph_info_t, hb_glyph_position_t, hb_language_from_string, hb_ot_layout_get_baseline,
27    hb_position_t, hb_script_from_iso15924_tag, hb_shape, hb_tag_t, hb_variation_t,
28};
29use num_traits::Zero;
30use read_fonts::types::Tag;
31
32use super::{GlyphShapingResult, ShapedGlyph, unicode_script_to_iso15924_tag};
33use crate::platform::font::FontTable;
34use crate::{
35    BASE, Font, FontBaseline, FontTableMethods, GlyphId, GlyphStore, KERN, LIGA, ShapingFlags,
36    ShapingOptions, fixed_to_float, float_to_fixed,
37};
38
39const HB_OT_TAG_DEFAULT_SCRIPT: hb_tag_t = u32::from_be_bytes(Tag::new(b"DFLT").to_be_bytes());
40const HB_OT_TAG_DEFAULT_LANGUAGE: hb_tag_t = u32::from_be_bytes(Tag::new(b"dflt").to_be_bytes());
41
42pub(crate) struct HarfbuzzGlyphShapingResult {
43    count: usize,
44    buffer: *mut hb_buffer_t,
45    glyph_infos: *mut hb_glyph_info_t,
46    pos_infos: *mut hb_glyph_position_t,
47}
48
49impl HarfbuzzGlyphShapingResult {
50    /// Create a new [`ShapedGlyphData`] from the given HarfBuzz buffer.
51    ///
52    /// # Safety
53    ///
54    /// - Passing an invalid buffer pointer to this function results in undefined behavior.
55    /// - This function takes ownership of the buffer and the ShapedGlyphData destroys the buffer when dropped
56    ///   so the pointer must an owned pointer and must not be used after being passed to this function
57    unsafe fn new(buffer: *mut hb_buffer_t) -> HarfbuzzGlyphShapingResult {
58        let mut glyph_count = 0;
59        let glyph_infos = unsafe { hb_buffer_get_glyph_infos(buffer, &mut glyph_count) };
60        assert!(!glyph_infos.is_null());
61        let mut pos_count = 0;
62        let pos_infos = unsafe { hb_buffer_get_glyph_positions(buffer, &mut pos_count) };
63        assert!(!pos_infos.is_null());
64        assert_eq!(glyph_count, pos_count);
65
66        HarfbuzzGlyphShapingResult {
67            count: glyph_count as usize,
68            buffer,
69            glyph_infos,
70            pos_infos,
71        }
72    }
73}
74
75impl Drop for HarfbuzzGlyphShapingResult {
76    fn drop(&mut self) {
77        unsafe { hb_buffer_destroy(self.buffer) }
78    }
79}
80
81struct ShapedGlyphIterator<'a> {
82    shaped_glyph_data: &'a HarfbuzzGlyphShapingResult,
83    current_glyph_offset: usize,
84    y_position: Au,
85}
86
87impl<'a> Iterator for ShapedGlyphIterator<'a> {
88    type Item = ShapedGlyph;
89
90    fn next(&mut self) -> Option<Self::Item> {
91        if self.current_glyph_offset >= self.shaped_glyph_data.count {
92            return None;
93        }
94
95        unsafe {
96            let glyph_info_i = self
97                .shaped_glyph_data
98                .glyph_infos
99                .add(self.current_glyph_offset);
100            let pos_info_i = self
101                .shaped_glyph_data
102                .pos_infos
103                .add(self.current_glyph_offset);
104            let x_offset = Shaper::fixed_to_float((*pos_info_i).x_offset);
105            let y_offset = Shaper::fixed_to_float((*pos_info_i).y_offset);
106            let x_advance = Shaper::fixed_to_float((*pos_info_i).x_advance);
107            let y_advance = Shaper::fixed_to_float((*pos_info_i).y_advance);
108
109            let x_offset = Au::from_f64_px(x_offset);
110            let y_offset = Au::from_f64_px(y_offset);
111            let x_advance = Au::from_f64_px(x_advance);
112            let y_advance = Au::from_f64_px(y_advance);
113
114            let offset = if x_offset.is_zero() && y_offset.is_zero() && y_advance.is_zero() {
115                None
116            } else {
117                // adjust the pen..
118                if y_advance > Au::zero() {
119                    self.y_position -= y_advance;
120                }
121
122                Some(Point2D::new(x_offset, self.y_position - y_offset))
123            };
124
125            self.current_glyph_offset += 1;
126            Some(ShapedGlyph {
127                glyph_id: (*glyph_info_i).codepoint as GlyphId,
128                string_byte_offset: (*glyph_info_i).cluster as usize,
129                advance: x_advance,
130                offset,
131            })
132        }
133    }
134}
135
136impl GlyphShapingResult for HarfbuzzGlyphShapingResult {
137    #[inline]
138    fn len(&self) -> usize {
139        self.count
140    }
141
142    fn iter(&self) -> impl Iterator<Item = ShapedGlyph> {
143        ShapedGlyphIterator {
144            shaped_glyph_data: self,
145            current_glyph_offset: 0,
146            y_position: Au::zero(),
147        }
148    }
149
150    fn is_rtl(&self) -> bool {
151        unsafe {
152            let first_glyph_info = self.glyph_infos.add(0);
153            let last_glyph_info = self.glyph_infos.add(self.count - 1);
154            (*last_glyph_info).cluster < (*first_glyph_info).cluster
155        }
156    }
157}
158
159#[derive(Debug)]
160pub(crate) struct Shaper {
161    hb_face: *mut hb_face_t,
162    hb_font: *mut hb_font_t,
163    font: *const Font,
164}
165
166// The HarfBuzz API is thread safe as well as our `Font`, so we can make the data
167// structures here as thread-safe as well. This doesn't seem to be documented,
168// but was expressed as one of the original goals of the HarfBuzz API.
169unsafe impl Sync for Shaper {}
170unsafe impl Send for Shaper {}
171
172impl Drop for Shaper {
173    fn drop(&mut self) {
174        unsafe {
175            assert!(!self.hb_face.is_null());
176            hb_face_destroy(self.hb_face);
177
178            assert!(!self.hb_font.is_null());
179            hb_font_destroy(self.hb_font);
180        }
181    }
182}
183
184impl Shaper {
185    pub(crate) fn new(font: &Font) -> Shaper {
186        unsafe {
187            let hb_face: *mut hb_face_t = hb_face_create_for_tables(
188                Some(font_table_func),
189                font as *const Font as *mut c_void,
190                None,
191            );
192            let hb_font: *mut hb_font_t = hb_font_create(hb_face);
193
194            // Set points-per-em. if zero, performs no hinting in that direction.
195            let pt_size = font.descriptor.pt_size.to_f64_px();
196            hb_font_set_ppem(hb_font, pt_size as c_uint, pt_size as c_uint);
197
198            // Set scaling. Note that this takes 16.16 fixed point.
199            hb_font_set_scale(
200                hb_font,
201                Shaper::float_to_fixed(pt_size) as c_int,
202                Shaper::float_to_fixed(pt_size) as c_int,
203            );
204
205            // configure static function callbacks.
206            hb_font_set_funcs(
207                hb_font,
208                HB_FONT_FUNCS.0,
209                font as *const Font as *mut c_void,
210                None,
211            );
212
213            if servo_config::pref!(layout_variable_fonts_enabled) {
214                let variations = &font.variations();
215                if !variations.is_empty() {
216                    let variations: Vec<_> = variations
217                        .iter()
218                        .map(|variation| hb_variation_t {
219                            tag: variation.tag,
220
221                            value: variation.value,
222                        })
223                        .collect();
224
225                    hb_font_set_variations(hb_font, variations.as_ptr(), variations.len() as u32);
226                }
227            }
228
229            Shaper {
230                hb_face,
231                hb_font,
232                font,
233            }
234        }
235    }
236
237    /// Calculate the layout metrics associated with the given text with the [`Shaper`]s font.
238    fn shaped_glyph_data(
239        &self,
240        text: &str,
241        options: &ShapingOptions,
242    ) -> HarfbuzzGlyphShapingResult {
243        unsafe {
244            let hb_buffer: *mut hb_buffer_t = hb_buffer_create();
245            hb_buffer_set_cluster_level(hb_buffer, HB_BUFFER_CLUSTER_LEVEL_MONOTONE_CHARACTERS);
246            hb_buffer_set_direction(
247                hb_buffer,
248                if options.flags.contains(ShapingFlags::RTL_FLAG) {
249                    HB_DIRECTION_RTL
250                } else {
251                    HB_DIRECTION_LTR
252                },
253            );
254
255            let script =
256                hb_script_from_iso15924_tag(unicode_script_to_iso15924_tag(options.script));
257            hb_buffer_set_script(hb_buffer, script);
258
259            hb_buffer_add_utf8(
260                hb_buffer,
261                text.as_ptr() as *const c_char,
262                text.len() as c_int,
263                0,
264                text.len() as c_int,
265            );
266
267            let language = options.language;
268            let hb_language = hb_language_from_string(
269                language.as_str().as_ptr() as *const c_char,
270                language.as_str().len() as c_int,
271            );
272            hb_buffer_set_language(hb_buffer, hb_language);
273
274            let mut features = Vec::new();
275            if options
276                .flags
277                .contains(ShapingFlags::IGNORE_LIGATURES_SHAPING_FLAG)
278            {
279                features.push(hb_feature_t {
280                    tag: u32::from_be_bytes(LIGA.to_be_bytes()),
281                    value: 0,
282                    start: 0,
283                    end: hb_buffer_get_length(hb_buffer),
284                })
285            }
286            if options
287                .flags
288                .contains(ShapingFlags::DISABLE_KERNING_SHAPING_FLAG)
289            {
290                features.push(hb_feature_t {
291                    tag: u32::from_be_bytes(KERN.to_be_bytes()),
292                    value: 0,
293                    start: 0,
294                    end: hb_buffer_get_length(hb_buffer),
295                })
296            }
297
298            hb_shape(
299                self.hb_font,
300                hb_buffer,
301                features.as_mut_ptr(),
302                features.len() as u32,
303            );
304
305            HarfbuzzGlyphShapingResult::new(hb_buffer)
306        }
307    }
308
309    pub(crate) fn shape_text(
310        &self,
311        font: &Font,
312        text: &str,
313        options: &ShapingOptions,
314    ) -> GlyphStore {
315        GlyphStore::with_shaped_glyph_data(
316            font,
317            text,
318            options,
319            &self.shaped_glyph_data(text, options),
320        )
321    }
322
323    pub(crate) fn baseline(&self) -> Option<FontBaseline> {
324        unsafe { (*self.font).table_for_tag(BASE)? };
325
326        let mut hanging_baseline = 0;
327        let mut alphabetic_baseline = 0;
328        let mut ideographic_baseline = 0;
329
330        unsafe {
331            hb_ot_layout_get_baseline(
332                self.hb_font,
333                HB_OT_LAYOUT_BASELINE_TAG_ROMAN,
334                HB_DIRECTION_LTR,
335                HB_OT_TAG_DEFAULT_SCRIPT,
336                HB_OT_TAG_DEFAULT_LANGUAGE,
337                &mut alphabetic_baseline as *mut _,
338            );
339
340            hb_ot_layout_get_baseline(
341                self.hb_font,
342                HB_OT_LAYOUT_BASELINE_TAG_HANGING,
343                HB_DIRECTION_LTR,
344                HB_OT_TAG_DEFAULT_SCRIPT,
345                HB_OT_TAG_DEFAULT_LANGUAGE,
346                &mut hanging_baseline as *mut _,
347            );
348
349            hb_ot_layout_get_baseline(
350                self.hb_font,
351                HB_OT_LAYOUT_BASELINE_TAG_IDEO_EMBOX_BOTTOM_OR_LEFT,
352                HB_DIRECTION_LTR,
353                HB_OT_TAG_DEFAULT_SCRIPT,
354                HB_OT_TAG_DEFAULT_LANGUAGE,
355                &mut ideographic_baseline as *mut _,
356            );
357        }
358
359        Some(FontBaseline {
360            ideographic_baseline: Shaper::fixed_to_float(ideographic_baseline) as f32,
361            alphabetic_baseline: Shaper::fixed_to_float(alphabetic_baseline) as f32,
362            hanging_baseline: Shaper::fixed_to_float(hanging_baseline) as f32,
363        })
364    }
365
366    fn float_to_fixed(f: f64) -> i32 {
367        float_to_fixed(16, f)
368    }
369
370    fn fixed_to_float(i: hb_position_t) -> f64 {
371        fixed_to_float(16, i)
372    }
373}
374
375/// Callbacks from Harfbuzz when font map and glyph advance lookup needed.
376struct FontFuncs(*mut hb_font_funcs_t);
377
378unsafe impl Sync for FontFuncs {}
379unsafe impl Send for FontFuncs {}
380
381static HB_FONT_FUNCS: LazyLock<FontFuncs> = LazyLock::new(|| unsafe {
382    let hb_funcs = hb_font_funcs_create();
383    hb_font_funcs_set_nominal_glyph_func(hb_funcs, Some(glyph_func), ptr::null_mut(), None);
384    hb_font_funcs_set_glyph_h_advance_func(
385        hb_funcs,
386        Some(glyph_h_advance_func),
387        ptr::null_mut(),
388        None,
389    );
390
391    FontFuncs(hb_funcs)
392});
393
394extern "C" fn glyph_func(
395    _: *mut hb_font_t,
396    font_data: *mut c_void,
397    unicode: hb_codepoint_t,
398    glyph: *mut hb_codepoint_t,
399    _: *mut c_void,
400) -> hb_bool_t {
401    let font: *const Font = font_data as *const Font;
402    assert!(!font.is_null());
403
404    match unsafe { (*font).glyph_index(char::from_u32(unicode).unwrap()) } {
405        Some(g) => {
406            unsafe { *glyph = g as hb_codepoint_t };
407            true as hb_bool_t
408        },
409        None => false as hb_bool_t,
410    }
411}
412
413extern "C" fn glyph_h_advance_func(
414    _: *mut hb_font_t,
415    font_data: *mut c_void,
416    glyph: hb_codepoint_t,
417    _: *mut c_void,
418) -> hb_position_t {
419    let font: *mut Font = font_data as *mut Font;
420    assert!(!font.is_null());
421
422    let advance = unsafe { (*font).glyph_h_advance(glyph as GlyphId) };
423    Shaper::float_to_fixed(advance)
424}
425
426/// Callback to get a font table out of a font.
427extern "C" fn font_table_func(
428    _: *mut hb_face_t,
429    tag: hb_tag_t,
430    user_data: *mut c_void,
431) -> *mut hb_blob_t {
432    // NB: These asserts have security implications.
433    let font = user_data as *const Font;
434    assert!(!font.is_null());
435
436    // TODO(Issue #197): reuse font table data, which will change the unsound trickery here.
437    let Some(font_table) = (unsafe { (*font).table_for_tag(Tag::from_u32(tag)) }) else {
438        return ptr::null_mut();
439    };
440
441    // `Box::into_raw` intentionally leaks the FontTable so we don't destroy the buffer
442    // while HarfBuzz is using it.  When HarfBuzz is done with the buffer, it will pass
443    // this raw pointer back to `destroy_blob_func` which will deallocate the Box.
444    let font_table_ptr = Box::into_raw(Box::new(font_table));
445
446    let buf = unsafe { (*font_table_ptr).buffer() };
447    // HarfBuzz calls `destroy_blob_func` when the buffer is no longer needed.
448    let blob = unsafe {
449        hb_blob_create(
450            buf.as_ptr() as *const c_char,
451            buf.len() as c_uint,
452            HB_MEMORY_MODE_READONLY,
453            font_table_ptr as *mut c_void,
454            Some(destroy_blob_func),
455        )
456    };
457
458    assert!(!blob.is_null());
459    blob
460}
461
462extern "C" fn destroy_blob_func(font_table_ptr: *mut c_void) {
463    unsafe {
464        drop(Box::from_raw(font_table_ptr as *mut FontTable));
465    }
466}