1//! Parsing of GCC-style Language-Specific Data Area (LSDA)
2//! For details see:
3//! * <https://refspecs.linuxfoundation.org/LSB_3.0.0/LSB-PDA/LSB-PDA/ehframechpt.html>
4//! * <https://refspecs.linuxfoundation.org/LSB_5.0.0/LSB-Core-generic/LSB-Core-generic/dwarfext.html>
5//! * <https://itanium-cxx-abi.github.io/cxx-abi/exceptions.pdf>
6//! * <https://www.airs.com/blog/archives/460>
7//! * <https://www.airs.com/blog/archives/464>
8//!
9//! A reference implementation may be found in the GCC source tree
10//! (`<root>/libgcc/unwind-c.c` as of this writing).
11
12#![allow(non_upper_case_globals)]
13#![allow(unused)]
14
15use super::DwarfReader;
16use core::mem;
17use core::ptr;
18
19pub const DW_EH_PE_omit: u8 = 0xFF;
20pub const DW_EH_PE_absptr: u8 = 0x00;
21
22pub const DW_EH_PE_uleb128: u8 = 0x01;
23pub const DW_EH_PE_udata2: u8 = 0x02;
24pub const DW_EH_PE_udata4: u8 = 0x03;
25pub const DW_EH_PE_udata8: u8 = 0x04;
26pub const DW_EH_PE_sleb128: u8 = 0x09;
27pub const DW_EH_PE_sdata2: u8 = 0x0A;
28pub const DW_EH_PE_sdata4: u8 = 0x0B;
29pub const DW_EH_PE_sdata8: u8 = 0x0C;
30
31pub const DW_EH_PE_pcrel: u8 = 0x10;
32pub const DW_EH_PE_textrel: u8 = 0x20;
33pub const DW_EH_PE_datarel: u8 = 0x30;
34pub const DW_EH_PE_funcrel: u8 = 0x40;
35pub const DW_EH_PE_aligned: u8 = 0x50;
36
37pub const DW_EH_PE_indirect: u8 = 0x80;
38
39#[derive(Copy, Clone)]
40pub struct EHContext<'a> {
41 pub ip: *const u8, // Current instruction pointer
42 pub func_start: *const u8, // Pointer to the current function
43 pub get_text_start: &'a dyn Fn() -> *const u8, // Get pointer to the code section
44 pub get_data_start: &'a dyn Fn() -> *const u8, // Get pointer to the data section
45}
46
47/// Landing pad.
48type LPad = *const u8;
49pub enum EHAction {
50 None,
51 Cleanup(LPad),
52 Catch(LPad),
53 Filter(LPad),
54 Terminate,
55}
56
57pub const USING_SJLJ_EXCEPTIONS: bool = cfg!(all(target_os = "ios", target_arch = "arm"));
58
59pub unsafe fn find_eh_action(lsda: *const u8, context: &EHContext<'_>) -> Result<EHAction, ()> {
60 if lsda.is_null() {
61 return Ok(EHAction::None);
62 }
63
64 let func_start = context.func_start;
65 let mut reader = DwarfReader::new(lsda);
66
67 let start_encoding = reader.read::<u8>();
68 // base address for landing pad offsets
69 let lpad_base = if start_encoding != DW_EH_PE_omit {
70 read_encoded_pointer(&mut reader, context, start_encoding)?
71 } else {
72 func_start
73 };
74
75 let ttype_encoding = reader.read::<u8>();
76 if ttype_encoding != DW_EH_PE_omit {
77 // Rust doesn't analyze exception types, so we don't care about the type table
78 reader.read_uleb128();
79 }
80
81 let call_site_encoding = reader.read::<u8>();
82 let call_site_table_length = reader.read_uleb128();
83 let action_table = reader.ptr.add(call_site_table_length as usize);
84 let ip = context.ip;
85
86 if !USING_SJLJ_EXCEPTIONS {
87 // read the callsite table
88 while reader.ptr < action_table {
89 // these are offsets rather than pointers;
90 let cs_start = read_encoded_offset(&mut reader, call_site_encoding)?;
91 let cs_len = read_encoded_offset(&mut reader, call_site_encoding)?;
92 let cs_lpad = read_encoded_offset(&mut reader, call_site_encoding)?;
93 let cs_action_entry = reader.read_uleb128();
94 // Callsite table is sorted by cs_start, so if we've passed the ip, we
95 // may stop searching.
96 if ip < func_start.wrapping_add(cs_start) {
97 break;
98 }
99 if ip < func_start.wrapping_add(cs_start + cs_len) {
100 if cs_lpad == 0 {
101 return Ok(EHAction::None);
102 } else {
103 let lpad = lpad_base.wrapping_add(cs_lpad);
104 return Ok(interpret_cs_action(action_table, cs_action_entry, lpad));
105 }
106 }
107 }
108 // Ip is not present in the table. This indicates a nounwind call.
109 Ok(EHAction::Terminate)
110 } else {
111 // SjLj version:
112 // The "IP" is an index into the call-site table, with two exceptions:
113 // -1 means 'no-action', and 0 means 'terminate'.
114 match ip.addr() as isize {
115 -1 => return Ok(EHAction::None),
116 0 => return Ok(EHAction::Terminate),
117 _ => (),
118 }
119 let mut idx = ip.addr();
120 loop {
121 let cs_lpad = reader.read_uleb128();
122 let cs_action_entry = reader.read_uleb128();
123 idx -= 1;
124 if idx == 0 {
125 // Can never have null landing pad for sjlj -- that would have
126 // been indicated by a -1 call site index.
127 // FIXME(strict provenance)
128 let lpad = ptr::from_exposed_addr((cs_lpad + 1) as usize);
129 return Ok(interpret_cs_action(action_table, cs_action_entry, lpad));
130 }
131 }
132 }
133}
134
135unsafe fn interpret_cs_action(
136 action_table: *const u8,
137 cs_action_entry: u64,
138 lpad: LPad,
139) -> EHAction {
140 if cs_action_entry == 0 {
141 // If cs_action_entry is 0 then this is a cleanup (Drop::drop). We run these
142 // for both Rust panics and foreign exceptions.
143 EHAction::Cleanup(lpad)
144 } else {
145 // If lpad != 0 and cs_action_entry != 0, we have to check ttype_index.
146 // If ttype_index == 0 under the condition, we take cleanup action.
147 let action_record: *const u8 = action_table.offset(count:cs_action_entry as isize - 1);
148 let mut action_reader: DwarfReader = DwarfReader::new(ptr:action_record);
149 let ttype_index: i64 = action_reader.read_sleb128();
150 if ttype_index == 0 {
151 EHAction::Cleanup(lpad)
152 } else if ttype_index > 0 {
153 // Stop unwinding Rust panics at catch_unwind.
154 EHAction::Catch(lpad)
155 } else {
156 EHAction::Filter(lpad)
157 }
158 }
159}
160
161#[inline]
162fn round_up(unrounded: usize, align: usize) -> Result<usize, ()> {
163 if align.is_power_of_two() { Ok((unrounded + align - 1) & !(align - 1)) } else { Err(()) }
164}
165
166/// Read a offset (`usize`) from `reader` whose encoding is described by `encoding`.
167///
168/// `encoding` must be a [DWARF Exception Header Encoding as described by the LSB spec][LSB-dwarf-ext].
169/// In addition the upper ("application") part must be zero.
170///
171/// # Errors
172/// Returns `Err` if `encoding`
173/// * is not a valid DWARF Exception Header Encoding,
174/// * is `DW_EH_PE_omit`, or
175/// * has a non-zero application part.
176///
177/// [LSB-dwarf-ext]: https://refspecs.linuxfoundation.org/LSB_5.0.0/LSB-Core-generic/LSB-Core-generic/dwarfext.html
178unsafe fn read_encoded_offset(reader: &mut DwarfReader, encoding: u8) -> Result<usize, ()> {
179 if encoding == DW_EH_PE_omit || encoding & 0xF0 != 0 {
180 return Err(());
181 }
182 let result: usize = match encoding & 0x0F {
183 // despite the name, LLVM also uses absptr for offsets instead of pointers
184 DW_EH_PE_absptr => reader.read::<usize>(),
185 DW_EH_PE_uleb128 => reader.read_uleb128() as usize,
186 DW_EH_PE_udata2 => reader.read::<u16>() as usize,
187 DW_EH_PE_udata4 => reader.read::<u32>() as usize,
188 DW_EH_PE_udata8 => reader.read::<u64>() as usize,
189 DW_EH_PE_sleb128 => reader.read_sleb128() as usize,
190 DW_EH_PE_sdata2 => reader.read::<i16>() as usize,
191 DW_EH_PE_sdata4 => reader.read::<i32>() as usize,
192 DW_EH_PE_sdata8 => reader.read::<i64>() as usize,
193 _ => return Err(()),
194 };
195 Ok(result)
196}
197
198/// Read a pointer from `reader` whose encoding is described by `encoding`.
199///
200/// `encoding` must be a [DWARF Exception Header Encoding as described by the LSB spec][LSB-dwarf-ext].
201///
202/// # Errors
203/// Returns `Err` if `encoding`
204/// * is not a valid DWARF Exception Header Encoding,
205/// * is `DW_EH_PE_omit`, or
206/// * combines `DW_EH_PE_absptr` or `DW_EH_PE_aligned` application part with an integer encoding
207/// (not `DW_EH_PE_absptr`) in the value format part.
208///
209/// [LSB-dwarf-ext]: https://refspecs.linuxfoundation.org/LSB_5.0.0/LSB-Core-generic/LSB-Core-generic/dwarfext.html
210unsafe fn read_encoded_pointer(
211 reader: &mut DwarfReader,
212 context: &EHContext<'_>,
213 encoding: u8,
214) -> Result<*const u8, ()> {
215 if encoding == DW_EH_PE_omit {
216 return Err(());
217 }
218
219 let base_ptr = match encoding & 0x70 {
220 DW_EH_PE_absptr => core::ptr::null(),
221 // relative to address of the encoded value, despite the name
222 DW_EH_PE_pcrel => reader.ptr,
223 DW_EH_PE_funcrel => {
224 if context.func_start.is_null() {
225 return Err(());
226 }
227 context.func_start
228 }
229 DW_EH_PE_textrel => (*context.get_text_start)(),
230 DW_EH_PE_datarel => (*context.get_data_start)(),
231 // aligned means the value is aligned to the size of a pointer
232 DW_EH_PE_aligned => {
233 reader.ptr =
234 reader.ptr.with_addr(round_up(reader.ptr.addr(), mem::size_of::<*const u8>())?);
235 core::ptr::null()
236 }
237 _ => return Err(()),
238 };
239
240 let mut ptr = if base_ptr.is_null() {
241 // any value encoding other than absptr would be nonsensical here;
242 // there would be no source of pointer provenance
243 if encoding & 0x0F != DW_EH_PE_absptr {
244 return Err(());
245 }
246 reader.read::<*const u8>()
247 } else {
248 let offset = read_encoded_offset(reader, encoding & 0x0F)?;
249 base_ptr.wrapping_add(offset)
250 };
251
252 if encoding & DW_EH_PE_indirect != 0 {
253 ptr = *(ptr.cast::<*const u8>());
254 }
255
256 Ok(ptr)
257}
258