1 | /*! |
2 | A [Character to Glyph Index Mapping Table]( |
3 | https://docs.microsoft.com/en-us/typography/opentype/spec/cmap) implementation. |
4 | |
5 | This module provides a low-level alternative to |
6 | [`Face::glyph_index`](../struct.Face.html#method.glyph_index) and |
7 | [`Face::glyph_variation_index`](../struct.Face.html#method.glyph_variation_index) |
8 | methods. |
9 | */ |
10 | |
11 | use crate::parser::{FromData, LazyArray16, Offset, Offset32, Stream}; |
12 | use crate::{name::PlatformId, GlyphId}; |
13 | |
14 | mod format0; |
15 | mod format10; |
16 | mod format12; |
17 | mod format13; |
18 | mod format14; |
19 | mod format2; |
20 | mod format4; |
21 | mod format6; |
22 | |
23 | pub use format0::Subtable0; |
24 | pub use format10::Subtable10; |
25 | pub use format12::Subtable12; |
26 | pub use format13::Subtable13; |
27 | pub use format14::{GlyphVariationResult, Subtable14}; |
28 | pub use format2::Subtable2; |
29 | pub use format4::Subtable4; |
30 | pub use format6::Subtable6; |
31 | |
32 | /// A character encoding subtable variant. |
33 | #[allow (missing_docs)] |
34 | #[derive (Clone, Copy, Debug)] |
35 | pub enum Format<'a> { |
36 | ByteEncodingTable(Subtable0<'a>), |
37 | HighByteMappingThroughTable(Subtable2<'a>), |
38 | SegmentMappingToDeltaValues(Subtable4<'a>), |
39 | TrimmedTableMapping(Subtable6<'a>), |
40 | MixedCoverage, // unsupported |
41 | TrimmedArray(Subtable10<'a>), |
42 | SegmentedCoverage(Subtable12<'a>), |
43 | ManyToOneRangeMappings(Subtable13<'a>), |
44 | UnicodeVariationSequences(Subtable14<'a>), |
45 | } |
46 | |
47 | /// A character encoding subtable. |
48 | #[derive (Clone, Copy, Debug)] |
49 | pub struct Subtable<'a> { |
50 | /// Subtable platform. |
51 | pub platform_id: PlatformId, |
52 | /// Subtable encoding. |
53 | pub encoding_id: u16, |
54 | /// A subtable format. |
55 | pub format: Format<'a>, |
56 | } |
57 | |
58 | impl<'a> Subtable<'a> { |
59 | /// Checks that the current encoding is Unicode compatible. |
60 | #[inline ] |
61 | pub fn is_unicode(&self) -> bool { |
62 | // https://docs.microsoft.com/en-us/typography/opentype/spec/name#windows-encoding-ids |
63 | const WINDOWS_UNICODE_BMP_ENCODING_ID: u16 = 1; |
64 | const WINDOWS_UNICODE_FULL_REPERTOIRE_ENCODING_ID: u16 = 10; |
65 | |
66 | match self.platform_id { |
67 | PlatformId::Unicode => true, |
68 | PlatformId::Windows if self.encoding_id == WINDOWS_UNICODE_BMP_ENCODING_ID => true, |
69 | PlatformId::Windows => { |
70 | // "Note: Subtable format 13 has the same structure as format 12; it differs only |
71 | // in the interpretation of the startGlyphID/glyphID fields". |
72 | let is_format_12_compatible = matches!( |
73 | self.format, |
74 | Format::SegmentedCoverage(..) | Format::ManyToOneRangeMappings(..) |
75 | ); |
76 | |
77 | // "Fonts that support Unicode supplementary-plane characters (U+10000 to U+10FFFF) |
78 | // on the Windows platform must have a format 12 subtable for platform ID 3, |
79 | // encoding ID 10." |
80 | self.encoding_id == WINDOWS_UNICODE_FULL_REPERTOIRE_ENCODING_ID |
81 | && is_format_12_compatible |
82 | } |
83 | _ => false, |
84 | } |
85 | } |
86 | |
87 | /// Maps a character to a glyph ID. |
88 | /// |
89 | /// This is a low-level method and unlike `Face::glyph_index` it doesn't |
90 | /// check that the current encoding is Unicode. |
91 | /// It simply maps a `u32` codepoint number to a glyph ID. |
92 | /// |
93 | /// Returns `None`: |
94 | /// - when glyph ID is `0`. |
95 | /// - when format is `MixedCoverage`, since it's not supported. |
96 | /// - when format is `UnicodeVariationSequences`. Use `glyph_variation_index` instead. |
97 | #[inline ] |
98 | pub fn glyph_index(&self, code_point: u32) -> Option<GlyphId> { |
99 | match self.format { |
100 | Format::ByteEncodingTable(ref subtable) => subtable.glyph_index(code_point), |
101 | Format::HighByteMappingThroughTable(ref subtable) => subtable.glyph_index(code_point), |
102 | Format::SegmentMappingToDeltaValues(ref subtable) => subtable.glyph_index(code_point), |
103 | Format::TrimmedTableMapping(ref subtable) => subtable.glyph_index(code_point), |
104 | Format::MixedCoverage => None, |
105 | Format::TrimmedArray(ref subtable) => subtable.glyph_index(code_point), |
106 | Format::SegmentedCoverage(ref subtable) => subtable.glyph_index(code_point), |
107 | Format::ManyToOneRangeMappings(ref subtable) => subtable.glyph_index(code_point), |
108 | // This subtable should be accessed via glyph_variation_index(). |
109 | Format::UnicodeVariationSequences(_) => None, |
110 | } |
111 | } |
112 | |
113 | /// Resolves a variation of a glyph ID from two code points. |
114 | /// |
115 | /// Returns `None`: |
116 | /// - when glyph ID is `0`. |
117 | /// - when format is not `UnicodeVariationSequences`. |
118 | #[inline ] |
119 | pub fn glyph_variation_index( |
120 | &self, |
121 | code_point: u32, |
122 | variation: u32, |
123 | ) -> Option<GlyphVariationResult> { |
124 | match self.format { |
125 | Format::UnicodeVariationSequences(ref subtable) => { |
126 | subtable.glyph_index(code_point, variation) |
127 | } |
128 | _ => None, |
129 | } |
130 | } |
131 | |
132 | /// Calls `f` for all codepoints contained in this subtable. |
133 | /// |
134 | /// This is a low-level method and it doesn't check that the current |
135 | /// encoding is Unicode. It simply calls the function `f` for all `u32` |
136 | /// codepoints that are present in this subtable. |
137 | /// |
138 | /// Note that this may list codepoints for which `glyph_index` still returns |
139 | /// `None` because this method finds all codepoints which were _defined_ in |
140 | /// this subtable. The subtable may still map them to glyph ID `0`. |
141 | /// |
142 | /// Returns without doing anything: |
143 | /// - when format is `MixedCoverage`, since it's not supported. |
144 | /// - when format is `UnicodeVariationSequences`, since it's not supported. |
145 | pub fn codepoints<F: FnMut(u32)>(&self, f: F) { |
146 | match self.format { |
147 | Format::ByteEncodingTable(ref subtable) => subtable.codepoints(f), |
148 | Format::HighByteMappingThroughTable(ref subtable) => subtable.codepoints(f), |
149 | Format::SegmentMappingToDeltaValues(ref subtable) => subtable.codepoints(f), |
150 | Format::TrimmedTableMapping(ref subtable) => subtable.codepoints(f), |
151 | Format::MixedCoverage => {} // unsupported |
152 | Format::TrimmedArray(ref subtable) => subtable.codepoints(f), |
153 | Format::SegmentedCoverage(ref subtable) => subtable.codepoints(f), |
154 | Format::ManyToOneRangeMappings(ref subtable) => subtable.codepoints(f), |
155 | Format::UnicodeVariationSequences(_) => {} // unsupported |
156 | }; |
157 | } |
158 | } |
159 | |
160 | #[derive (Clone, Copy)] |
161 | struct EncodingRecord { |
162 | platform_id: PlatformId, |
163 | encoding_id: u16, |
164 | offset: Offset32, |
165 | } |
166 | |
167 | impl FromData for EncodingRecord { |
168 | const SIZE: usize = 8; |
169 | |
170 | #[inline ] |
171 | fn parse(data: &[u8]) -> Option<Self> { |
172 | let mut s: Stream<'_> = Stream::new(data); |
173 | Some(EncodingRecord { |
174 | platform_id: s.read::<PlatformId>()?, |
175 | encoding_id: s.read::<u16>()?, |
176 | offset: s.read::<Offset32>()?, |
177 | }) |
178 | } |
179 | } |
180 | |
181 | /// A list of subtables. |
182 | #[derive (Clone, Copy, Default)] |
183 | pub struct Subtables<'a> { |
184 | data: &'a [u8], |
185 | records: LazyArray16<'a, EncodingRecord>, |
186 | } |
187 | |
188 | impl core::fmt::Debug for Subtables<'_> { |
189 | fn fmt(&self, f: &mut core::fmt::Formatter) -> core::fmt::Result { |
190 | write!(f, "Subtables {{ ... }}" ) |
191 | } |
192 | } |
193 | |
194 | impl<'a> Subtables<'a> { |
195 | /// Returns a subtable at an index. |
196 | pub fn get(&self, index: u16) -> Option<Subtable<'a>> { |
197 | let record = self.records.get(index)?; |
198 | let data = self.data.get(record.offset.to_usize()..)?; |
199 | let format = match Stream::read_at::<u16>(data, 0)? { |
200 | 0 => Format::ByteEncodingTable(Subtable0::parse(data)?), |
201 | 2 => Format::HighByteMappingThroughTable(Subtable2::parse(data)?), |
202 | 4 => Format::SegmentMappingToDeltaValues(Subtable4::parse(data)?), |
203 | 6 => Format::TrimmedTableMapping(Subtable6::parse(data)?), |
204 | 8 => Format::MixedCoverage, // unsupported |
205 | 10 => Format::TrimmedArray(Subtable10::parse(data)?), |
206 | 12 => Format::SegmentedCoverage(Subtable12::parse(data)?), |
207 | 13 => Format::ManyToOneRangeMappings(Subtable13::parse(data)?), |
208 | 14 => Format::UnicodeVariationSequences(Subtable14::parse(data)?), |
209 | _ => return None, |
210 | }; |
211 | |
212 | Some(Subtable { |
213 | platform_id: record.platform_id, |
214 | encoding_id: record.encoding_id, |
215 | format, |
216 | }) |
217 | } |
218 | |
219 | /// Returns the number of subtables. |
220 | #[inline ] |
221 | pub fn len(&self) -> u16 { |
222 | self.records.len() |
223 | } |
224 | |
225 | /// Checks if there are any subtables. |
226 | pub fn is_empty(&self) -> bool { |
227 | self.records.is_empty() |
228 | } |
229 | } |
230 | |
231 | impl<'a> IntoIterator for Subtables<'a> { |
232 | type Item = Subtable<'a>; |
233 | type IntoIter = SubtablesIter<'a>; |
234 | |
235 | #[inline ] |
236 | fn into_iter(self) -> Self::IntoIter { |
237 | SubtablesIter { |
238 | subtables: self, |
239 | index: 0, |
240 | } |
241 | } |
242 | } |
243 | |
244 | /// An iterator over [`Subtables`]. |
245 | #[allow (missing_debug_implementations)] |
246 | pub struct SubtablesIter<'a> { |
247 | subtables: Subtables<'a>, |
248 | index: u16, |
249 | } |
250 | |
251 | impl<'a> Iterator for SubtablesIter<'a> { |
252 | type Item = Subtable<'a>; |
253 | |
254 | #[inline ] |
255 | fn next(&mut self) -> Option<Self::Item> { |
256 | if self.index < self.subtables.len() { |
257 | self.index += 1; |
258 | self.subtables.get(self.index - 1) |
259 | } else { |
260 | None |
261 | } |
262 | } |
263 | } |
264 | |
265 | /// A [Character to Glyph Index Mapping Table]( |
266 | /// https://docs.microsoft.com/en-us/typography/opentype/spec/cmap). |
267 | #[derive (Clone, Copy, Debug)] |
268 | pub struct Table<'a> { |
269 | /// A list of subtables. |
270 | pub subtables: Subtables<'a>, |
271 | } |
272 | |
273 | impl<'a> Table<'a> { |
274 | /// Parses a table from raw data. |
275 | pub fn parse(data: &'a [u8]) -> Option<Self> { |
276 | let mut s: Stream<'_> = Stream::new(data); |
277 | s.skip::<u16>(); // version |
278 | let count: u16 = s.read::<u16>()?; |
279 | let records: LazyArray16<'_, EncodingRecord> = s.read_array16::<EncodingRecord>(count)?; |
280 | Some(Table { |
281 | subtables: Subtables { data, records }, |
282 | }) |
283 | } |
284 | } |
285 | |