1 | // SPDX-License-Identifier: Apache-2.0 OR MIT |
2 | |
3 | /* |
4 | Run-time CPU feature detection on x86_64 by using CPUID. |
5 | |
6 | Adapted from https://github.com/rust-lang/stdarch. |
7 | */ |
8 | |
9 | #![cfg_attr (portable_atomic_sanitize_thread, allow(dead_code))] |
10 | |
11 | // Miri doesn't support inline assembly used in __cpuid: https://github.com/rust-lang/miri/issues/932 |
12 | // SGX doesn't support CPUID: https://github.com/rust-lang/stdarch/blob/a0c30f3e3c75adcd6ee7efc94014ebcead61c507/crates/core_arch/src/x86/cpuid.rs#L102-L105 |
13 | #[cfg (any(target_env = "sgx" , miri))] |
14 | compile_error!("internal error: this module is not supported on this environment" ); |
15 | |
16 | include!("common.rs" ); |
17 | |
18 | #[cfg (not(portable_atomic_no_asm))] |
19 | use core::arch::asm; |
20 | use core::arch::x86_64::CpuidResult; |
21 | |
22 | // Workaround for https://github.com/rust-lang/rust/issues/101346 |
23 | // It is not clear if our use cases are affected, but we implement this just in case. |
24 | // |
25 | // Refs: |
26 | // - https://www.felixcloutier.com/x86/cpuid |
27 | // - https://en.wikipedia.org/wiki/CPUID |
28 | // - https://github.com/rust-lang/stdarch/blob/a0c30f3e3c75adcd6ee7efc94014ebcead61c507/crates/core_arch/src/x86/cpuid.rs |
29 | #[cfg (not(target_env = "sgx" ))] |
30 | fn __cpuid(leaf: u32) -> CpuidResult { |
31 | let eax: u32; |
32 | let mut ebx: u32; |
33 | let ecx: u32; |
34 | let edx: u32; |
35 | // SAFETY: Calling `__cpuid`` is safe on all x86_64 CPUs except for SGX, |
36 | // which doesn't support `cpuid`. |
37 | // https://github.com/rust-lang/stdarch/blob/a0c30f3e3c75adcd6ee7efc94014ebcead61c507/crates/core_arch/src/x86/cpuid.rs#L102-L109 |
38 | unsafe { |
39 | asm!( |
40 | "mov { ebx_tmp:r}, rbx" , // save rbx which is reserved by LLVM |
41 | "cpuid" , |
42 | "xchg { ebx_tmp:r}, rbx" , // restore rbx |
43 | ebx_tmp = out(reg) ebx, |
44 | inout("eax" ) leaf => eax, |
45 | inout("ecx" ) 0 => ecx, |
46 | out("edx" ) edx, |
47 | options(nostack, preserves_flags), |
48 | ); |
49 | } |
50 | CpuidResult { eax, ebx, ecx, edx } |
51 | } |
52 | |
53 | // https://en.wikipedia.org/wiki/CPUID |
54 | const _VENDOR_ID_INTEL: [u32; 3] = _vender(b"GenuineIntel" ); // Intel |
55 | const _VENDOR_ID_INTEL2: [u32; 3] = _vender(b"GenuineIotel" ); // Intel https://github.com/InstLatx64/InstLatx64/commit/8fdd319884c67d2c6ec1ca0c595b42c1c4b8d803 |
56 | const _VENDOR_ID_AMD: [u32; 3] = _vender(b"AuthenticAMD" ); // AMD |
57 | const _VENDOR_ID_CENTAUR: [u32; 3] = _vender(b"CentaurHauls" ); // Centaur/VIA/Zhaoxin |
58 | const _VENDOR_ID_ZHAOXIN: [u32; 3] = _vender(b" Shanghai " ); // Zhaoxin |
59 | const fn _vender(b: &[u8; 12]) -> [u32; 3] { |
60 | [ |
61 | u32::from_ne_bytes([b[0], b[1], b[2], b[3]]), |
62 | u32::from_ne_bytes([b[4], b[5], b[6], b[7]]), |
63 | u32::from_ne_bytes([b[8], b[9], b[10], b[11]]), |
64 | ] |
65 | } |
66 | fn _vendor_id() -> [u32; 3] { |
67 | let CpuidResult { ebx: u32, ecx: u32, edx: u32, .. } = __cpuid(leaf:0); |
68 | [ebx, edx, ecx] |
69 | } |
70 | fn _vendor_has_vmovdqa_atomic(vendor_id: [u32; 3], family: u32) -> bool { |
71 | // VMOVDQA is atomic on Intel, AMD, and Zhaoxin CPUs with AVX. |
72 | // See https://gcc.gnu.org/bugzilla/show_bug.cgi?id=104688 for details. |
73 | vendor_id == _VENDOR_ID_INTEL |
74 | || vendor_id == _VENDOR_ID_INTEL2 |
75 | || vendor_id == _VENDOR_ID_AMD |
76 | || vendor_id == _VENDOR_ID_ZHAOXIN |
77 | || vendor_id == _VENDOR_ID_CENTAUR && family > 6 |
78 | } |
79 | |
80 | #[cold ] |
81 | fn _detect(info: &mut CpuInfo) { |
82 | let CpuidResult { |
83 | #[cfg (target_feature = "sse" )] |
84 | eax: proc_info_eax, |
85 | ecx: proc_info_ecx, |
86 | .. |
87 | } = __cpuid(1); |
88 | |
89 | // https://github.com/rust-lang/stdarch/blob/a0c30f3e3c75adcd6ee7efc94014ebcead61c507/crates/std_detect/src/detect/os/x86.rs#L111 |
90 | if test(proc_info_ecx, 13) { |
91 | info.set(CpuInfo::HAS_CMPXCHG16B); |
92 | } |
93 | |
94 | // We only use VMOVDQA when SSE is enabled. See atomic_load_vmovdqa() in atomic128/x86_64.rs for more. |
95 | #[cfg (target_feature = "sse" )] |
96 | { |
97 | use core::arch::x86_64::_xgetbv; |
98 | |
99 | // https://github.com/rust-lang/stdarch/blob/a0c30f3e3c75adcd6ee7efc94014ebcead61c507/crates/std_detect/src/detect/os/x86.rs#L131-L224 |
100 | let cpu_xsave = test(proc_info_ecx, 26); |
101 | if cpu_xsave { |
102 | let cpu_osxsave = test(proc_info_ecx, 27); |
103 | if cpu_osxsave { |
104 | // SAFETY: Calling `_xgetbv`` is safe because the CPU has `xsave` support |
105 | // and OS has set `osxsave`. |
106 | let xcr0 = unsafe { _xgetbv(0) }; |
107 | let os_avx_support = xcr0 & 6 == 6; |
108 | if os_avx_support && test(proc_info_ecx, 28) { |
109 | let vendor_id = _vendor_id(); |
110 | let family = (proc_info_eax >> 8) & 0x0F; |
111 | if _vendor_has_vmovdqa_atomic(vendor_id, family) { |
112 | info.set(CpuInfo::HAS_VMOVDQA_ATOMIC); |
113 | } |
114 | } |
115 | } |
116 | } |
117 | } |
118 | } |
119 | |
120 | #[allow ( |
121 | clippy::alloc_instead_of_core, |
122 | clippy::std_instead_of_alloc, |
123 | clippy::std_instead_of_core, |
124 | clippy::undocumented_unsafe_blocks, |
125 | clippy::wildcard_imports |
126 | )] |
127 | #[cfg (test)] |
128 | mod tests { |
129 | use std::{ |
130 | io::{self, Write}, |
131 | mem, str, |
132 | }; |
133 | |
134 | use super::*; |
135 | |
136 | #[test ] |
137 | #[cfg_attr (portable_atomic_test_outline_atomics_detect_false, ignore)] |
138 | fn test_cpuid() { |
139 | assert_eq!(std::is_x86_feature_detected!("cmpxchg16b" ), detect().has_cmpxchg16b()); |
140 | let vendor_id = _vendor_id(); |
141 | { |
142 | let stdout = io::stderr(); |
143 | let mut stdout = stdout.lock(); |
144 | let _ = writeln!( |
145 | stdout, |
146 | " \n vendor_id: {} (ebx: {:x}, edx: {:x}, ecx: {:x})" , |
147 | str::from_utf8(&unsafe { mem::transmute::<[u32; 3], [u8; 12]>(vendor_id) }) |
148 | .unwrap(), |
149 | vendor_id[0], |
150 | vendor_id[1], |
151 | vendor_id[2], |
152 | ); |
153 | } |
154 | let CpuidResult { eax: proc_info_eax, .. } = __cpuid(1); |
155 | let family = (proc_info_eax >> 8) & 0x0F; |
156 | if _vendor_has_vmovdqa_atomic(vendor_id, family) { |
157 | assert_eq!(std::is_x86_feature_detected!("avx" ), detect().has_vmovdqa_atomic()); |
158 | } else { |
159 | assert!(!detect().has_vmovdqa_atomic()); |
160 | } |
161 | assert_eq!( |
162 | unsafe { mem::transmute::<[u32; 3], [u8; 12]>(_VENDOR_ID_INTEL) }, |
163 | *b"GenuineIntel" |
164 | ); |
165 | } |
166 | } |
167 | |