read_fonts/
array.rs

1//! Custom array types
2
3#![deny(clippy::arithmetic_side_effects)]
4
5use bytemuck::AnyBitPattern;
6use font_types::FixedSize;
7
8use crate::read::{ComputeSize, FontReadWithArgs, ReadArgs, VarSize};
9use crate::{FontData, FontRead, ReadError};
10
11/// An array whose items size is not known at compile time.
12///
13/// This requires the inner type to implement [`FontReadWithArgs`] as well as
14/// [`ComputeSize`].
15///
16/// At runtime, `Args` are provided which will be used to compute the size
17/// of each item; this size is then used to compute the positions of the items
18/// within the underlying data, from which they will be read lazily.
19#[derive(Clone)]
20pub struct ComputedArray<'a, T: ReadArgs> {
21    // the length of each item
22    item_len: usize,
23    len: usize,
24    data: FontData<'a>,
25    args: T::Args,
26}
27
28impl<'a, T: ComputeSize> ComputedArray<'a, T> {
29    pub fn new(data: FontData<'a>, args: T::Args) -> Result<Self, ReadError> {
30        let item_len = T::compute_size(&args)?;
31        let len = data.len().checked_div(item_len).unwrap_or(0);
32        Ok(ComputedArray {
33            item_len,
34            len,
35            data,
36            args,
37        })
38    }
39
40    /// The number of items in the array
41    pub fn len(&self) -> usize {
42        self.len
43    }
44
45    pub fn is_empty(&self) -> bool {
46        self.len == 0
47    }
48}
49
50impl<T: ReadArgs> ReadArgs for ComputedArray<'_, T> {
51    type Args = T::Args;
52}
53
54impl<'a, T> FontReadWithArgs<'a> for ComputedArray<'a, T>
55where
56    T: ComputeSize + FontReadWithArgs<'a>,
57    T::Args: Copy,
58{
59    fn read_with_args(data: FontData<'a>, args: &Self::Args) -> Result<Self, ReadError> {
60        Self::new(data, *args)
61    }
62}
63
64impl<'a, T> ComputedArray<'a, T>
65where
66    T: FontReadWithArgs<'a>,
67    T::Args: Copy + 'static,
68{
69    pub fn iter(&self) -> impl Iterator<Item = Result<T, ReadError>> + 'a {
70        let mut i = 0;
71        let data = self.data;
72        let args = self.args;
73        let item_len = self.item_len;
74        let len = self.len;
75
76        std::iter::from_fn(move || {
77            if i == len {
78                return None;
79            }
80            let item_start = item_len.checked_mul(i)?;
81            i = i.checked_add(1)?;
82            let data = data.split_off(item_start)?;
83            Some(T::read_with_args(data, &args))
84        })
85    }
86
87    #[inline]
88    pub fn get(&self, idx: usize) -> Result<T, ReadError> {
89        let item_start = idx
90            .checked_mul(self.item_len)
91            .ok_or(ReadError::OutOfBounds)?;
92        self.data
93            .split_off(item_start)
94            .ok_or(ReadError::OutOfBounds)
95            .and_then(|data| T::read_with_args(data, &self.args))
96    }
97}
98
99impl<T: ReadArgs> std::fmt::Debug for ComputedArray<'_, T> {
100    fn fmt(&self, f: &mut std::fmt::Formatter) -> std::fmt::Result {
101        f.debug_struct("DynSizedArray")
102            .field("bytes", &self.data)
103            .finish()
104    }
105}
106
107/// An array of items of non-uniform length.
108///
109/// Random access into this array cannot be especially efficient, since it requires
110/// a linear scan.
111pub struct VarLenArray<'a, T> {
112    data: FontData<'a>,
113    phantom: std::marker::PhantomData<*const T>,
114}
115
116impl<'a, T: FontRead<'a> + VarSize> VarLenArray<'a, T> {
117    /// Return the item at the provided index.
118    ///
119    /// # Performance
120    ///
121    /// Determining the position of an item in this collection requires looking
122    /// at all the preceding items; that is, it is `O(n)` instead of `O(1)` as
123    /// it would be for a `Vec`.
124    ///
125    /// As a consequence, calling this method in a loop could potentially be
126    /// very slow. If this is something you need to do, it will probably be
127    /// much faster to first collect all the items into a `Vec` beforehand,
128    /// and then fetch them from there.
129    pub fn get(&self, idx: usize) -> Option<Result<T, ReadError>> {
130        let mut pos = 0usize;
131        for _ in 0..idx {
132            pos = pos.checked_add(T::read_len_at(self.data, pos)?)?;
133        }
134        self.data.split_off(pos).map(T::read)
135    }
136
137    /// Return an iterator over this array's items.
138    pub fn iter(&self) -> impl Iterator<Item = Result<T, ReadError>> + 'a {
139        let mut data = self.data;
140        std::iter::from_fn(move || {
141            if data.is_empty() {
142                return None;
143            }
144
145            let item_len = T::read_len_at(data, 0)?;
146            // If the length is 0 then then it's not useful to continue
147            // iteration. The subsequent read will probably fail but if
148            // the user is skipping malformed elements (which is common)
149            // this this iterator will continue forever.
150            if item_len == 0 {
151                return None;
152            }
153            let item_data = data.slice(..item_len)?;
154            let next = T::read(item_data);
155            data = data.split_off(item_len)?;
156            Some(next)
157        })
158    }
159}
160
161impl<'a, T> FontRead<'a> for VarLenArray<'a, T> {
162    fn read(data: FontData<'a>) -> Result<Self, ReadError> {
163        Ok(VarLenArray {
164            data,
165            phantom: core::marker::PhantomData,
166        })
167    }
168}
169
170impl<T: AnyBitPattern> ReadArgs for &[T] {
171    type Args = u16;
172}
173
174impl<'a, T: AnyBitPattern + FixedSize> FontReadWithArgs<'a> for &'a [T] {
175    fn read_with_args(data: FontData<'a>, args: &u16) -> Result<Self, ReadError> {
176        let len = (*args as usize)
177            .checked_mul(T::RAW_BYTE_LEN)
178            .ok_or(ReadError::OutOfBounds)?;
179        data.read_array(0..len)
180    }
181}
182
#[cfg(test)]
mod tests {
    use super::*;
    use crate::codegen_test::records::VarLenItem;
    use font_test_data::bebuffer::BeBuffer;

    impl VarSize for VarLenItem<'_> {
        type Size = u32;

        // The `u32` stored at `pos` is used as the item length as-is.
        fn read_len_at(data: FontData, pos: usize) -> Option<usize> {
            let len = data.read_at::<u32>(pos).ok()?;
            Some(len as usize)
        }
    }

    /// HB/HarfRuzz test "shlana_9_006" has a morx table containing a chain
    /// with a length of 0. This caused the VarLenArray iterator to loop
    /// indefinitely.
    #[test]
    fn var_len_iter_with_zero_length_item() {
        // Three elements, the last of which has a length of zero.
        let buf = BeBuffer::new()
            .push(8u32)
            .extend([0u8; 4])
            .push(18u32)
            .extend([0u8; 14])
            .push(0u32);
        let arr: VarLenArray<VarLenItem> = VarLenArray::read(FontData::new(buf.data())).unwrap();
        // Only the first two elements should be yielded. The `take()` makes
        // a future regression fail the test instead of hanging it.
        let item_count = arr.iter().take(10).count();
        assert_eq!(item_count, 2);
    }
}