1 | //! The underlying OsString/OsStr implementation on Unix and many other |
2 | //! systems: just a `Vec<u8>`/`[u8]`. |
3 | |
4 | use core::clone::CloneToUninit; |
5 | |
6 | use crate::borrow::Cow; |
7 | use crate::collections::TryReserveError; |
8 | use crate::fmt::Write; |
9 | use crate::rc::Rc; |
10 | use crate::sync::Arc; |
11 | use crate::sys_common::{AsInner, FromInner, IntoInner}; |
12 | use crate::{fmt, mem, str}; |
13 | |
14 | #[cfg (test)] |
15 | mod tests; |
16 | |
/// Owned, growable byte buffer that backs the platform `OsString`.
///
/// The encoded bytes are kept verbatim in a `Vec<u8>`. The type is
/// `#[repr(transparent)]`, so it has the same layout as that vector.
#[derive(Hash)]
#[repr(transparent)]
pub struct Buf {
    /// The raw encoded bytes.
    pub inner: Vec<u8>,
}
22 | |
/// Borrowed, unsized view over encoded bytes; the counterpart of [`Buf`].
///
/// `#[repr(transparent)]` gives it the same layout as `[u8]`, which is what
/// the reference and pointer conversions between the two types rely on.
#[repr(transparent)]
pub struct Slice {
    /// The raw encoded bytes.
    pub inner: [u8],
}
27 | |
28 | impl IntoInner<Vec<u8>> for Buf { |
29 | fn into_inner(self) -> Vec<u8> { |
30 | self.inner |
31 | } |
32 | } |
33 | |
34 | impl FromInner<Vec<u8>> for Buf { |
35 | fn from_inner(inner: Vec<u8>) -> Self { |
36 | Buf { inner } |
37 | } |
38 | } |
39 | |
40 | impl AsInner<[u8]> for Buf { |
41 | #[inline ] |
42 | fn as_inner(&self) -> &[u8] { |
43 | &self.inner |
44 | } |
45 | } |
46 | |
47 | impl fmt::Debug for Buf { |
48 | fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result { |
49 | fmt::Debug::fmt(self.as_slice(), f) |
50 | } |
51 | } |
52 | |
53 | impl fmt::Display for Buf { |
54 | fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result { |
55 | fmt::Display::fmt(self.as_slice(), f) |
56 | } |
57 | } |
58 | |
59 | impl fmt::Debug for Slice { |
60 | fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result { |
61 | fmt::Debug::fmt(&self.inner.utf8_chunks().debug(), f) |
62 | } |
63 | } |
64 | |
65 | impl fmt::Display for Slice { |
66 | fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result { |
67 | // If we're the empty string then our iterator won't actually yield |
68 | // anything, so perform the formatting manually |
69 | if self.inner.is_empty() { |
70 | return "" .fmt(f); |
71 | } |
72 | |
73 | for chunk: Utf8Chunk<'_> in self.inner.utf8_chunks() { |
74 | let valid: &str = chunk.valid(); |
75 | // If we successfully decoded the whole chunk as a valid string then |
76 | // we can return a direct formatting of the string which will also |
77 | // respect various formatting flags if possible. |
78 | if chunk.invalid().is_empty() { |
79 | return valid.fmt(f); |
80 | } |
81 | |
82 | f.write_str(data:valid)?; |
83 | f.write_char(char::REPLACEMENT_CHARACTER)?; |
84 | } |
85 | Ok(()) |
86 | } |
87 | } |
88 | |
89 | impl Clone for Buf { |
90 | #[inline ] |
91 | fn clone(&self) -> Self { |
92 | Buf { inner: self.inner.clone() } |
93 | } |
94 | |
95 | #[inline ] |
96 | fn clone_from(&mut self, source: &Self) { |
97 | self.inner.clone_from(&source.inner) |
98 | } |
99 | } |
100 | |
101 | impl Buf { |
102 | #[inline ] |
103 | pub fn into_encoded_bytes(self) -> Vec<u8> { |
104 | self.inner |
105 | } |
106 | |
107 | #[inline ] |
108 | pub unsafe fn from_encoded_bytes_unchecked(s: Vec<u8>) -> Self { |
109 | Self { inner: s } |
110 | } |
111 | |
112 | #[inline ] |
113 | pub fn into_string(self) -> Result<String, Buf> { |
114 | String::from_utf8(self.inner).map_err(|p| Buf { inner: p.into_bytes() }) |
115 | } |
116 | |
117 | #[inline ] |
118 | pub fn from_string(s: String) -> Buf { |
119 | Buf { inner: s.into_bytes() } |
120 | } |
121 | |
122 | #[inline ] |
123 | pub fn with_capacity(capacity: usize) -> Buf { |
124 | Buf { inner: Vec::with_capacity(capacity) } |
125 | } |
126 | |
127 | #[inline ] |
128 | pub fn clear(&mut self) { |
129 | self.inner.clear() |
130 | } |
131 | |
132 | #[inline ] |
133 | pub fn capacity(&self) -> usize { |
134 | self.inner.capacity() |
135 | } |
136 | |
137 | #[inline ] |
138 | pub fn push_slice(&mut self, s: &Slice) { |
139 | self.inner.extend_from_slice(&s.inner) |
140 | } |
141 | |
142 | #[inline ] |
143 | pub fn push_str(&mut self, s: &str) { |
144 | self.inner.extend_from_slice(s.as_bytes()); |
145 | } |
146 | |
147 | #[inline ] |
148 | pub fn reserve(&mut self, additional: usize) { |
149 | self.inner.reserve(additional) |
150 | } |
151 | |
152 | #[inline ] |
153 | pub fn try_reserve(&mut self, additional: usize) -> Result<(), TryReserveError> { |
154 | self.inner.try_reserve(additional) |
155 | } |
156 | |
157 | #[inline ] |
158 | pub fn reserve_exact(&mut self, additional: usize) { |
159 | self.inner.reserve_exact(additional) |
160 | } |
161 | |
162 | #[inline ] |
163 | pub fn try_reserve_exact(&mut self, additional: usize) -> Result<(), TryReserveError> { |
164 | self.inner.try_reserve_exact(additional) |
165 | } |
166 | |
167 | #[inline ] |
168 | pub fn shrink_to_fit(&mut self) { |
169 | self.inner.shrink_to_fit() |
170 | } |
171 | |
172 | #[inline ] |
173 | pub fn shrink_to(&mut self, min_capacity: usize) { |
174 | self.inner.shrink_to(min_capacity) |
175 | } |
176 | |
177 | #[inline ] |
178 | pub fn as_slice(&self) -> &Slice { |
179 | // SAFETY: Slice just wraps [u8], |
180 | // and &*self.inner is &[u8], therefore |
181 | // transmuting &[u8] to &Slice is safe. |
182 | unsafe { mem::transmute(self.inner.as_slice()) } |
183 | } |
184 | |
185 | #[inline ] |
186 | pub fn as_mut_slice(&mut self) -> &mut Slice { |
187 | // SAFETY: Slice just wraps [u8], |
188 | // and &mut *self.inner is &mut [u8], therefore |
189 | // transmuting &mut [u8] to &mut Slice is safe. |
190 | unsafe { mem::transmute(self.inner.as_mut_slice()) } |
191 | } |
192 | |
193 | #[inline ] |
194 | pub fn leak<'a>(self) -> &'a mut Slice { |
195 | unsafe { mem::transmute(self.inner.leak()) } |
196 | } |
197 | |
198 | #[inline ] |
199 | pub fn into_box(self) -> Box<Slice> { |
200 | unsafe { mem::transmute(self.inner.into_boxed_slice()) } |
201 | } |
202 | |
203 | #[inline ] |
204 | pub fn from_box(boxed: Box<Slice>) -> Buf { |
205 | let inner: Box<[u8]> = unsafe { mem::transmute(boxed) }; |
206 | Buf { inner: inner.into_vec() } |
207 | } |
208 | |
209 | #[inline ] |
210 | pub fn into_arc(&self) -> Arc<Slice> { |
211 | self.as_slice().into_arc() |
212 | } |
213 | |
214 | #[inline ] |
215 | pub fn into_rc(&self) -> Rc<Slice> { |
216 | self.as_slice().into_rc() |
217 | } |
218 | |
219 | /// Provides plumbing to core `Vec::truncate`. |
220 | /// More well behaving alternative to allowing outer types |
221 | /// full mutable access to the core `Vec`. |
222 | #[inline ] |
223 | pub(crate) fn truncate(&mut self, len: usize) { |
224 | self.inner.truncate(len); |
225 | } |
226 | |
227 | /// Provides plumbing to core `Vec::extend_from_slice`. |
228 | /// More well behaving alternative to allowing outer types |
229 | /// full mutable access to the core `Vec`. |
230 | #[inline ] |
231 | pub(crate) fn extend_from_slice(&mut self, other: &[u8]) { |
232 | self.inner.extend_from_slice(other); |
233 | } |
234 | } |
235 | |
236 | impl Slice { |
237 | #[inline ] |
238 | pub fn as_encoded_bytes(&self) -> &[u8] { |
239 | &self.inner |
240 | } |
241 | |
242 | #[inline ] |
243 | pub unsafe fn from_encoded_bytes_unchecked(s: &[u8]) -> &Slice { |
244 | unsafe { mem::transmute(s) } |
245 | } |
246 | |
247 | #[track_caller ] |
248 | #[inline ] |
249 | pub fn check_public_boundary(&self, index: usize) { |
250 | if index == 0 || index == self.inner.len() { |
251 | return; |
252 | } |
253 | if index < self.inner.len() |
254 | && (self.inner[index - 1].is_ascii() || self.inner[index].is_ascii()) |
255 | { |
256 | return; |
257 | } |
258 | |
259 | slow_path(&self.inner, index); |
260 | |
261 | /// We're betting that typical splits will involve an ASCII character. |
262 | /// |
263 | /// Putting the expensive checks in a separate function generates notably |
264 | /// better assembly. |
265 | #[track_caller ] |
266 | #[inline (never)] |
267 | fn slow_path(bytes: &[u8], index: usize) { |
268 | let (before, after) = bytes.split_at(index); |
269 | |
270 | // UTF-8 takes at most 4 bytes per codepoint, so we don't |
271 | // need to check more than that. |
272 | let after = after.get(..4).unwrap_or(after); |
273 | match str::from_utf8(after) { |
274 | Ok(_) => return, |
275 | Err(err) if err.valid_up_to() != 0 => return, |
276 | Err(_) => (), |
277 | } |
278 | |
279 | for len in 2..=4.min(index) { |
280 | let before = &before[index - len..]; |
281 | if str::from_utf8(before).is_ok() { |
282 | return; |
283 | } |
284 | } |
285 | |
286 | panic!("byte index {index} is not an OsStr boundary" ); |
287 | } |
288 | } |
289 | |
290 | #[inline ] |
291 | pub fn from_str(s: &str) -> &Slice { |
292 | unsafe { Slice::from_encoded_bytes_unchecked(s.as_bytes()) } |
293 | } |
294 | |
295 | #[inline ] |
296 | pub fn to_str(&self) -> Result<&str, crate::str::Utf8Error> { |
297 | str::from_utf8(&self.inner) |
298 | } |
299 | |
300 | #[inline ] |
301 | pub fn to_string_lossy(&self) -> Cow<'_, str> { |
302 | String::from_utf8_lossy(&self.inner) |
303 | } |
304 | |
305 | #[inline ] |
306 | pub fn to_owned(&self) -> Buf { |
307 | Buf { inner: self.inner.to_vec() } |
308 | } |
309 | |
310 | #[inline ] |
311 | pub fn clone_into(&self, buf: &mut Buf) { |
312 | self.inner.clone_into(&mut buf.inner) |
313 | } |
314 | |
315 | #[inline ] |
316 | pub fn into_box(&self) -> Box<Slice> { |
317 | let boxed: Box<[u8]> = self.inner.into(); |
318 | unsafe { mem::transmute(boxed) } |
319 | } |
320 | |
321 | #[inline ] |
322 | pub fn empty_box() -> Box<Slice> { |
323 | let boxed: Box<[u8]> = Default::default(); |
324 | unsafe { mem::transmute(boxed) } |
325 | } |
326 | |
327 | #[inline ] |
328 | pub fn into_arc(&self) -> Arc<Slice> { |
329 | let arc: Arc<[u8]> = Arc::from(&self.inner); |
330 | unsafe { Arc::from_raw(Arc::into_raw(arc) as *const Slice) } |
331 | } |
332 | |
333 | #[inline ] |
334 | pub fn into_rc(&self) -> Rc<Slice> { |
335 | let rc: Rc<[u8]> = Rc::from(&self.inner); |
336 | unsafe { Rc::from_raw(Rc::into_raw(rc) as *const Slice) } |
337 | } |
338 | |
339 | #[inline ] |
340 | pub fn make_ascii_lowercase(&mut self) { |
341 | self.inner.make_ascii_lowercase() |
342 | } |
343 | |
344 | #[inline ] |
345 | pub fn make_ascii_uppercase(&mut self) { |
346 | self.inner.make_ascii_uppercase() |
347 | } |
348 | |
349 | #[inline ] |
350 | pub fn to_ascii_lowercase(&self) -> Buf { |
351 | Buf { inner: self.inner.to_ascii_lowercase() } |
352 | } |
353 | |
354 | #[inline ] |
355 | pub fn to_ascii_uppercase(&self) -> Buf { |
356 | Buf { inner: self.inner.to_ascii_uppercase() } |
357 | } |
358 | |
359 | #[inline ] |
360 | pub fn is_ascii(&self) -> bool { |
361 | self.inner.is_ascii() |
362 | } |
363 | |
364 | #[inline ] |
365 | pub fn eq_ignore_ascii_case(&self, other: &Self) -> bool { |
366 | self.inner.eq_ignore_ascii_case(&other.inner) |
367 | } |
368 | } |
369 | |
370 | #[unstable (feature = "clone_to_uninit" , issue = "126799" )] |
371 | unsafe impl CloneToUninit for Slice { |
372 | #[inline ] |
373 | #[cfg_attr (debug_assertions, track_caller)] |
374 | unsafe fn clone_to_uninit(&self, dst: *mut u8) { |
375 | // SAFETY: we're just a transparent wrapper around [u8] |
376 | unsafe { self.inner.clone_to_uninit(dest:dst) } |
377 | } |
378 | } |
379 | |