1 | //! Support for symbolication using the `gimli` crate on crates.io |
2 | //! |
3 | //! This is the default symbolication implementation for Rust. |
4 | |
5 | use self::gimli::read::EndianSlice; |
6 | use self::gimli::NativeEndian as Endian; |
7 | use self::mmap::Mmap; |
8 | use self::stash::Stash; |
9 | use super::BytesOrWideString; |
10 | use super::ResolveWhat; |
11 | use super::SymbolName; |
12 | use addr2line::gimli; |
13 | use core::convert::TryInto; |
14 | use core::mem; |
15 | use core::u32; |
16 | use libc::c_void; |
17 | use mystd::ffi::OsString; |
18 | use mystd::fs::File; |
19 | use mystd::path::Path; |
20 | use mystd::prelude::v1::*; |
21 | |
// `mystd` is the name through which the imports above reach the standard
// library. With the `backtrace_in_libstd` cfg set it is a local module that
// re-exports everything from the enclosing crate (presumably because this
// code is then compiled as part of the standard library itself -- confirm
// against the build configuration); otherwise it is an alias for `std`.
#[cfg(backtrace_in_libstd)]
mod mystd {
    pub use crate::*;
}
#[cfg(not(backtrace_in_libstd))]
extern crate std as mystd;
28 | |
// Select the platform-specific `mmap` module that supplies the `Mmap` type
// imported above: a Windows implementation, a Unix implementation for the
// operating systems listed below, and a fallback ("fake") implementation for
// every other target.
cfg_if::cfg_if! {
    if #[cfg(windows)] {
        #[path = "gimli/mmap_windows.rs"]
        mod mmap;
    } else if #[cfg(any(
        target_os = "android",
        target_os = "freebsd",
        target_os = "fuchsia",
        target_os = "haiku",
        target_os = "hurd",
        target_os = "ios",
        target_os = "linux",
        target_os = "macos",
        target_os = "openbsd",
        target_os = "solaris",
        target_os = "illumos",
        target_os = "aix",
    ))] {
        #[path = "gimli/mmap_unix.rs"]
        mod mmap;
    } else {
        #[path = "gimli/mmap_fake.rs"]
        mod mmap;
    }
}
54 | |
55 | mod stash; |
56 | |
/// Maximum number of parsed `Mapping`s kept in `Cache::mappings`. When the
/// cache already holds this many entries, the entry at the back (the least
/// recently used one) is dropped before a new one is inserted at the front.
const MAPPINGS_CACHE_SIZE: usize = 4;
58 | |
/// Parsed debug information for one mapped file, bundled together with the
/// storage that the parsed `Context` borrows from.
struct Mapping {
    // 'static lifetime is a lie to hack around lack of support for self-referential structs.
    cx: Context<'static>,
    // The mapped file data that `cx` borrows from. Never read directly; it is
    // held only so that it lives as long as `cx` does.
    _map: Mmap,
    // Extra storage handed to the `Context` constructor alongside the mapped
    // data; `cx` may borrow from it as well.
    stash: Stash,
}
65 | |
/// A value that is one of two alternatives. `Mapping::mk_or_other` uses it so
/// that its closure can return either an already finished `Mapping` (`A`) or a
/// `Context` that still has to be wrapped (`B`).
enum Either<A, B> {
    // Nothing in this file constructs `A`, hence the lint suppression
    // (presumably it is only built by some platform-specific modules).
    #[allow(dead_code)]
    A(A),
    B(B),
}
71 | |
72 | impl Mapping { |
73 | /// Creates a `Mapping` by ensuring that the `data` specified is used to |
74 | /// create a `Context` and it can only borrow from that or the `Stash` of |
75 | /// decompressed sections or auxiliary data. |
76 | fn mk<F>(data: Mmap, mk: F) -> Option<Mapping> |
77 | where |
78 | F: for<'a> FnOnce(&'a [u8], &'a Stash) -> Option<Context<'a>>, |
79 | { |
80 | Mapping::mk_or_other(data, move |data, stash| { |
81 | let cx = mk(data, stash)?; |
82 | Some(Either::B(cx)) |
83 | }) |
84 | } |
85 | |
86 | /// Creates a `Mapping` from `data`, or if the closure decides to, returns a |
87 | /// different mapping. |
88 | fn mk_or_other<F>(data: Mmap, mk: F) -> Option<Mapping> |
89 | where |
90 | F: for<'a> FnOnce(&'a [u8], &'a Stash) -> Option<Either<Mapping, Context<'a>>>, |
91 | { |
92 | let stash = Stash::new(); |
93 | let cx = match mk(&data, &stash)? { |
94 | Either::A(mapping) => return Some(mapping), |
95 | Either::B(cx) => cx, |
96 | }; |
97 | Some(Mapping { |
98 | // Convert to 'static lifetimes since the symbols should |
99 | // only borrow `map` and `stash` and we're preserving them below. |
100 | cx: unsafe { core::mem::transmute::<Context<'_>, Context<'static>>(cx) }, |
101 | _map: data, |
102 | stash: stash, |
103 | }) |
104 | } |
105 | } |
106 | |
/// Everything needed to symbolize addresses inside a single object file. All
/// fields borrow data that lives for `'a`.
struct Context<'a> {
    // `addr2line` lookup context built from the object's DWARF sections.
    dwarf: addr2line::Context<EndianSlice<'a, Endian>>,
    // The platform-specific parsed object; queried for section data and for
    // symbol-table lookups.
    object: Object<'a>,
    // DWARF package loaded from the optional `dwp` object given to
    // `Context::new`; `None` when no such object was supplied.
    package: Option<gimli::DwarfPackage<EndianSlice<'a, Endian>>>,
}
112 | |
113 | impl<'data> Context<'data> { |
114 | fn new( |
115 | stash: &'data Stash, |
116 | object: Object<'data>, |
117 | sup: Option<Object<'data>>, |
118 | dwp: Option<Object<'data>>, |
119 | ) -> Option<Context<'data>> { |
120 | let mut sections = gimli::Dwarf::load(|id| -> Result<_, ()> { |
121 | if cfg!(not(target_os = "aix" )) { |
122 | let data = object.section(stash, id.name()).unwrap_or(&[]); |
123 | Ok(EndianSlice::new(data, Endian)) |
124 | } else { |
125 | if let Some(name) = id.xcoff_name() { |
126 | let data = object.section(stash, name).unwrap_or(&[]); |
127 | Ok(EndianSlice::new(data, Endian)) |
128 | } else { |
129 | Ok(EndianSlice::new(&[], Endian)) |
130 | } |
131 | } |
132 | }) |
133 | .ok()?; |
134 | |
135 | if let Some(sup) = sup { |
136 | sections |
137 | .load_sup(|id| -> Result<_, ()> { |
138 | let data = sup.section(stash, id.name()).unwrap_or(&[]); |
139 | Ok(EndianSlice::new(data, Endian)) |
140 | }) |
141 | .ok()?; |
142 | } |
143 | let dwarf = addr2line::Context::from_dwarf(sections).ok()?; |
144 | |
145 | let mut package = None; |
146 | if let Some(dwp) = dwp { |
147 | package = Some( |
148 | gimli::DwarfPackage::load( |
149 | |id| -> Result<_, gimli::Error> { |
150 | let data = id |
151 | .dwo_name() |
152 | .and_then(|name| dwp.section(stash, name)) |
153 | .unwrap_or(&[]); |
154 | Ok(EndianSlice::new(data, Endian)) |
155 | }, |
156 | EndianSlice::new(&[], Endian), |
157 | ) |
158 | .ok()?, |
159 | ); |
160 | } |
161 | |
162 | Some(Context { |
163 | dwarf, |
164 | object, |
165 | package, |
166 | }) |
167 | } |
168 | |
169 | fn find_frames( |
170 | &'_ self, |
171 | stash: &'data Stash, |
172 | probe: u64, |
173 | ) -> gimli::Result<addr2line::FrameIter<'_, EndianSlice<'data, Endian>>> { |
174 | use addr2line::{LookupContinuation, LookupResult}; |
175 | |
176 | let mut l = self.dwarf.find_frames(probe); |
177 | loop { |
178 | let (load, continuation) = match l { |
179 | LookupResult::Output(output) => break output, |
180 | LookupResult::Load { load, continuation } => (load, continuation), |
181 | }; |
182 | |
183 | l = continuation.resume(handle_split_dwarf(self.package.as_ref(), stash, load)); |
184 | } |
185 | } |
186 | } |
187 | |
188 | fn mmap(path: &Path) -> Option<Mmap> { |
189 | let file: File = File::open(path).ok()?; |
190 | let len: usize = file.metadata().ok()?.len().try_into().ok()?; |
191 | unsafe { Mmap::map(&file, len) } |
192 | } |
193 | |
// Select the object-format module for the target: `coff` on Windows, `macho`
// on Apple operating systems, `xcoff` on AIX, and `elf` everywhere else. Each
// of them supplies the `Object` type and the `handle_split_dwarf` function
// that `Context` relies on.
cfg_if::cfg_if! {
    if #[cfg(windows)] {
        mod coff;
        use self::coff::{handle_split_dwarf, Object};
    } else if #[cfg(any(
        target_os = "macos",
        target_os = "ios",
        target_os = "tvos",
        target_os = "watchos",
    ))] {
        mod macho;
        use self::macho::{handle_split_dwarf, Object};
    } else if #[cfg(target_os = "aix")] {
        mod xcoff;
        use self::xcoff::{handle_split_dwarf, Object};
    } else {
        mod elf;
        use self::elf::{handle_split_dwarf, Object};
    }
}
214 | |
// Select the platform-specific `native_libraries` function, which `Cache::new`
// calls to fill in `Cache::libraries`. Targets without an implementation get a
// stub that reports no libraries at all.
cfg_if::cfg_if! {
    if #[cfg(windows)] {
        mod libs_windows;
        use libs_windows::native_libraries;
    } else if #[cfg(any(
        target_os = "macos",
        target_os = "ios",
        target_os = "tvos",
        target_os = "watchos",
    ))] {
        mod libs_macos;
        use libs_macos::native_libraries;
    } else if #[cfg(target_os = "illumos")] {
        mod libs_illumos;
        use libs_illumos::native_libraries;
    } else if #[cfg(all(
        any(
            target_os = "linux",
            target_os = "fuchsia",
            target_os = "freebsd",
            target_os = "hurd",
            target_os = "openbsd",
            target_os = "netbsd",
            all(target_os = "android", feature = "dl_iterate_phdr"),
        ),
        not(target_env = "uclibc"),
    ))] {
        mod libs_dl_iterate_phdr;
        use libs_dl_iterate_phdr::native_libraries;
        #[path = "gimli/parse_running_mmaps_unix.rs"]
        mod parse_running_mmaps;
    } else if #[cfg(target_env = "libnx")] {
        mod libs_libnx;
        use libs_libnx::native_libraries;
    } else if #[cfg(target_os = "haiku")] {
        mod libs_haiku;
        use libs_haiku::native_libraries;
    } else if #[cfg(target_os = "aix")] {
        mod libs_aix;
        use libs_aix::native_libraries;
    } else {
        // Everything else doesn't know how to load native libraries.
        fn native_libraries() -> Vec<Library> {
            Vec::new()
        }
    }
}
262 | |
/// Symbolication state shared by all lookups: the list of loaded libraries
/// plus a small cache of parsed debug information for them. A single instance
/// lives in a `static` inside `Cache::with_global`.
#[derive(Default)]
struct Cache {
    /// All known shared libraries that have been loaded.
    libraries: Vec<Library>,

    /// Mappings cache where we retain parsed dwarf information.
    ///
    /// This list has a fixed capacity for its entire lifetime which never
    /// increases. The `usize` element of each pair is an index into `libraries`
    /// above where `usize::max_value()` represents the current executable. The
    /// `Mapping` is corresponding parsed dwarf information.
    ///
    /// Note that this is basically an LRU cache and we'll be shifting things
    /// around in here as we symbolize addresses.
    mappings: Vec<(usize, Mapping)>,
}
279 | |
/// One loaded library (or executable) as reported by `native_libraries`.
struct Library {
    /// Name of the library; `create_mapping` passes it to `Mapping::new` to
    /// load the library's debug information.
    name: OsString,
    #[cfg(target_os = "aix")]
    /// On AIX, the library mmapped can be a member of a big-archive file.
    /// For example, with a big-archive named libfoo.a containing libbar.so,
    /// one can use `dlopen("libfoo.a(libbar.so)", RTLD_MEMBER | RTLD_LAZY)`
    /// to use the `libbar.so` library. In this case, only `libbar.so` is
    /// mmapped, not the whole `libfoo.a`.
    member_name: OsString,
    /// Segments of this library loaded into memory, and where they're loaded.
    segments: Vec<LibrarySegment>,
    /// The "bias" of this library, typically where it's loaded into memory.
    /// This value is added to each segment's stated address to get the actual
    /// virtual memory address that the segment is loaded into. Additionally
    /// this bias is subtracted from real virtual memory addresses to index into
    /// debuginfo and the symbol table.
    bias: usize,
}
298 | |
/// A contiguous range of a `Library`, described by the address recorded in the
/// object file and its length. `Cache::avma_to_svma` uses these ranges to find
/// which library contains a given address.
struct LibrarySegment {
    /// The stated address of this segment in the object file. This is not
    /// actually where the segment is loaded, but rather this address plus the
    /// containing library's `bias` is where to find it.
    stated_virtual_memory_address: usize,
    /// The size of this segment in memory.
    len: usize,
}
307 | |
/// Loads the debug information for `lib` (AIX variant).
///
/// Both the library name and the archive member name are forwarded to
/// `Mapping::new`. Returns `None` when no mapping could be created.
#[cfg(target_os = "aix")]
fn create_mapping(lib: &Library) -> Option<Mapping> {
    Mapping::new(lib.name.as_ref(), &lib.member_name)
}
314 | |
315 | #[cfg (not(target_os = "aix" ))] |
316 | fn create_mapping(lib: &Library) -> Option<Mapping> { |
317 | let name: &OsString = &lib.name; |
318 | Mapping::new(path:name.as_ref()) |
319 | } |
320 | |
321 | // unsafe because this is required to be externally synchronized |
322 | pub unsafe fn clear_symbol_cache() { |
323 | Cache::with_global(|cache: &mut Cache| cache.mappings.clear()); |
324 | } |
325 | |
326 | impl Cache { |
327 | fn new() -> Cache { |
328 | Cache { |
329 | mappings: Vec::with_capacity(MAPPINGS_CACHE_SIZE), |
330 | libraries: native_libraries(), |
331 | } |
332 | } |
333 | |
334 | // unsafe because this is required to be externally synchronized |
335 | unsafe fn with_global(f: impl FnOnce(&mut Self)) { |
336 | // A very small, very simple LRU cache for debug info mappings. |
337 | // |
338 | // The hit rate should be very high, since the typical stack doesn't cross |
339 | // between many shared libraries. |
340 | // |
341 | // The `addr2line::Context` structures are pretty expensive to create. Its |
342 | // cost is expected to be amortized by subsequent `locate` queries, which |
343 | // leverage the structures built when constructing `addr2line::Context`s to |
344 | // get nice speedups. If we didn't have this cache, that amortization would |
345 | // never happen, and symbolicating backtraces would be ssssllllooooowwww. |
346 | static mut MAPPINGS_CACHE: Option<Cache> = None; |
347 | |
348 | f(MAPPINGS_CACHE.get_or_insert_with(|| Cache::new())) |
349 | } |
350 | |
351 | fn avma_to_svma(&self, addr: *const u8) -> Option<(usize, *const u8)> { |
352 | self.libraries |
353 | .iter() |
354 | .enumerate() |
355 | .filter_map(|(i, lib)| { |
356 | // First up, test if this `lib` has any segment containing the |
357 | // `addr` (handling relocation). If this check passes then we |
358 | // can continue below and actually translate the address. |
359 | // |
360 | // Note that we're using `wrapping_add` here to avoid overflow |
361 | // checks. It's been seen in the wild that the SVMA + bias |
362 | // computation overflows. It seems a bit odd that would happen |
363 | // but there's not a huge amount we can do about it other than |
364 | // probably just ignore those segments since they're likely |
365 | // pointing off into space. This originally came up in |
366 | // rust-lang/backtrace-rs#329. |
367 | if !lib.segments.iter().any(|s| { |
368 | let svma = s.stated_virtual_memory_address; |
369 | let start = svma.wrapping_add(lib.bias); |
370 | let end = start.wrapping_add(s.len); |
371 | let address = addr as usize; |
372 | start <= address && address < end |
373 | }) { |
374 | return None; |
375 | } |
376 | |
377 | // Now that we know `lib` contains `addr`, we can offset with |
378 | // the bias to find the stated virtual memory address. |
379 | let svma = (addr as usize).wrapping_sub(lib.bias); |
380 | Some((i, svma as *const u8)) |
381 | }) |
382 | .next() |
383 | } |
384 | |
385 | fn mapping_for_lib<'a>(&'a mut self, lib: usize) -> Option<(&'a mut Context<'a>, &'a Stash)> { |
386 | let idx = self.mappings.iter().position(|(idx, _)| *idx == lib); |
387 | |
388 | // Invariant: after this conditional completes without early returning |
389 | // from an error, the cache entry for this path is at index 0. |
390 | |
391 | if let Some(idx) = idx { |
392 | // When the mapping is already in the cache, move it to the front. |
393 | if idx != 0 { |
394 | let entry = self.mappings.remove(idx); |
395 | self.mappings.insert(0, entry); |
396 | } |
397 | } else { |
398 | // When the mapping is not in the cache, create a new mapping, |
399 | // insert it into the front of the cache, and evict the oldest cache |
400 | // entry if necessary. |
401 | let mapping = create_mapping(&self.libraries[lib])?; |
402 | |
403 | if self.mappings.len() == MAPPINGS_CACHE_SIZE { |
404 | self.mappings.pop(); |
405 | } |
406 | |
407 | self.mappings.insert(0, (lib, mapping)); |
408 | } |
409 | |
410 | let mapping = &mut self.mappings[0].1; |
411 | let cx: &'a mut Context<'static> = &mut mapping.cx; |
412 | let stash: &'a Stash = &mapping.stash; |
413 | // don't leak the `'static` lifetime, make sure it's scoped to just |
414 | // ourselves |
415 | Some(( |
416 | unsafe { mem::transmute::<&'a mut Context<'static>, &'a mut Context<'a>>(cx) }, |
417 | stash, |
418 | )) |
419 | } |
420 | } |
421 | |
422 | pub unsafe fn resolve(what: ResolveWhat<'_>, cb: &mut dyn FnMut(&super::Symbol)) { |
423 | let addr = what.address_or_ip(); |
424 | let mut call = |sym: Symbol<'_>| { |
425 | // Extend the lifetime of `sym` to `'static` since we are unfortunately |
426 | // required to here, but it's only ever going out as a reference so no |
427 | // reference to it should be persisted beyond this frame anyway. |
428 | let sym = mem::transmute::<Symbol<'_>, Symbol<'static>>(sym); |
429 | (cb)(&super::Symbol { inner: sym }); |
430 | }; |
431 | |
432 | Cache::with_global(|cache| { |
433 | let (lib, addr) = match cache.avma_to_svma(addr.cast_const().cast::<u8>()) { |
434 | Some(pair) => pair, |
435 | None => return, |
436 | }; |
437 | |
438 | // Finally, get a cached mapping or create a new mapping for this file, and |
439 | // evaluate the DWARF info to find the file/line/name for this address. |
440 | let (cx, stash) = match cache.mapping_for_lib(lib) { |
441 | Some((cx, stash)) => (cx, stash), |
442 | None => return, |
443 | }; |
444 | let mut any_frames = false; |
445 | if let Ok(mut frames) = cx.find_frames(stash, addr as u64) { |
446 | while let Ok(Some(frame)) = frames.next() { |
447 | any_frames = true; |
448 | let name = match frame.function { |
449 | Some(f) => Some(f.name.slice()), |
450 | None => cx.object.search_symtab(addr as u64), |
451 | }; |
452 | call(Symbol::Frame { |
453 | addr: addr as *mut c_void, |
454 | location: frame.location, |
455 | name, |
456 | }); |
457 | } |
458 | } |
459 | if !any_frames { |
460 | if let Some((object_cx, object_addr)) = cx.object.search_object_map(addr as u64) { |
461 | if let Ok(mut frames) = object_cx.find_frames(stash, object_addr) { |
462 | while let Ok(Some(frame)) = frames.next() { |
463 | any_frames = true; |
464 | call(Symbol::Frame { |
465 | addr: addr as *mut c_void, |
466 | location: frame.location, |
467 | name: frame.function.map(|f| f.name.slice()), |
468 | }); |
469 | } |
470 | } |
471 | } |
472 | } |
473 | if !any_frames { |
474 | if let Some(name) = cx.object.search_symtab(addr as u64) { |
475 | call(Symbol::Symtab { |
476 | addr: addr as *mut c_void, |
477 | name, |
478 | }); |
479 | } |
480 | } |
481 | }); |
482 | } |
483 | |
/// A symbol produced by `resolve`, borrowing its name and location data for
/// `'a`.
pub enum Symbol<'a> {
    /// We were able to locate frame information for this symbol, and
    /// `addr2line`'s frame internally has all the nitty gritty details.
    Frame {
        addr: *mut c_void,
        location: Option<addr2line::Location<'a>>,
        name: Option<&'a [u8]>,
    },
    /// Couldn't find debug information, but we found it in the symbol table of
    /// the elf executable.
    Symtab { addr: *mut c_void, name: &'a [u8] },
}
496 | |
497 | impl Symbol<'_> { |
498 | pub fn name(&self) -> Option<SymbolName<'_>> { |
499 | match self { |
500 | Symbol::Frame { name, .. } => { |
501 | let name = name.as_ref()?; |
502 | Some(SymbolName::new(name)) |
503 | } |
504 | Symbol::Symtab { name, .. } => Some(SymbolName::new(name)), |
505 | } |
506 | } |
507 | |
508 | pub fn addr(&self) -> Option<*mut c_void> { |
509 | match self { |
510 | Symbol::Frame { addr, .. } => Some(*addr), |
511 | Symbol::Symtab { .. } => None, |
512 | } |
513 | } |
514 | |
515 | pub fn filename_raw(&self) -> Option<BytesOrWideString<'_>> { |
516 | match self { |
517 | Symbol::Frame { location, .. } => { |
518 | let file = location.as_ref()?.file?; |
519 | Some(BytesOrWideString::Bytes(file.as_bytes())) |
520 | } |
521 | Symbol::Symtab { .. } => None, |
522 | } |
523 | } |
524 | |
525 | pub fn filename(&self) -> Option<&Path> { |
526 | match self { |
527 | Symbol::Frame { location, .. } => { |
528 | let file = location.as_ref()?.file?; |
529 | Some(Path::new(file)) |
530 | } |
531 | Symbol::Symtab { .. } => None, |
532 | } |
533 | } |
534 | |
535 | pub fn lineno(&self) -> Option<u32> { |
536 | match self { |
537 | Symbol::Frame { location, .. } => location.as_ref()?.line, |
538 | Symbol::Symtab { .. } => None, |
539 | } |
540 | } |
541 | |
542 | pub fn colno(&self) -> Option<u32> { |
543 | match self { |
544 | Symbol::Frame { location, .. } => location.as_ref()?.column, |
545 | Symbol::Symtab { .. } => None, |
546 | } |
547 | } |
548 | } |
549 | |