1 | //! Helper code for character escaping. |
2 | |
3 | use crate::ascii; |
4 | use crate::num::NonZeroUsize; |
5 | use crate::ops::Range; |
6 | |
7 | const HEX_DIGITS: [ascii::Char; 16] = *b"0123456789abcdef" .as_ascii().unwrap(); |
8 | |
9 | /// Escapes a byte into provided buffer; returns length of escaped |
10 | /// representation. |
11 | pub(crate) fn escape_ascii_into(output: &mut [ascii::Char; 4], byte: u8) -> Range<u8> { |
12 | #[inline ] |
13 | fn backslash(a: ascii::Char) -> ([ascii::Char; 4], u8) { |
14 | ([ascii::Char::ReverseSolidus, a, ascii::Char::Null, ascii::Char::Null], 2) |
15 | } |
16 | |
17 | let (data, len) = match byte { |
18 | b' \t' => backslash(ascii::Char::SmallT), |
19 | b' \r' => backslash(ascii::Char::SmallR), |
20 | b' \n' => backslash(ascii::Char::SmallN), |
21 | b' \\' => backslash(ascii::Char::ReverseSolidus), |
22 | b' \'' => backslash(ascii::Char::Apostrophe), |
23 | b' \"' => backslash(ascii::Char::QuotationMark), |
24 | _ => { |
25 | if let Some(a) = byte.as_ascii() |
26 | && !byte.is_ascii_control() |
27 | { |
28 | ([a, ascii::Char::Null, ascii::Char::Null, ascii::Char::Null], 1) |
29 | } else { |
30 | let hi = HEX_DIGITS[usize::from(byte >> 4)]; |
31 | let lo = HEX_DIGITS[usize::from(byte & 0xf)]; |
32 | ([ascii::Char::ReverseSolidus, ascii::Char::SmallX, hi, lo], 4) |
33 | } |
34 | } |
35 | }; |
36 | *output = data; |
37 | 0..len |
38 | } |
39 | |
40 | /// Escapes a character into provided buffer using `\u{NNNN}` representation. |
41 | pub(crate) fn escape_unicode_into(output: &mut [ascii::Char; 10], ch: char) -> Range<u8> { |
42 | output[9] = ascii::Char::RightCurlyBracket; |
43 | |
44 | let ch: u32 = ch as u32; |
45 | output[3] = HEX_DIGITS[((ch >> 20) & 15) as usize]; |
46 | output[4] = HEX_DIGITS[((ch >> 16) & 15) as usize]; |
47 | output[5] = HEX_DIGITS[((ch >> 12) & 15) as usize]; |
48 | output[6] = HEX_DIGITS[((ch >> 8) & 15) as usize]; |
49 | output[7] = HEX_DIGITS[((ch >> 4) & 15) as usize]; |
50 | output[8] = HEX_DIGITS[((ch >> 0) & 15) as usize]; |
51 | |
52 | // or-ing 1 ensures that for ch==0 the code computes that one digit should |
53 | // be printed. |
54 | let start: usize = (ch | 1).leading_zeros() as usize / 4 - 2; |
55 | const UNICODE_ESCAPE_PREFIX: &[ascii::Char; 3] = b" \\u{" .as_ascii().unwrap(); |
56 | output[start..][..3].copy_from_slice(UNICODE_ESCAPE_PREFIX); |
57 | |
58 | (start as u8)..10 |
59 | } |
60 | |
/// An iterator over a fixed-size array.
///
/// This is essentially equivalent to array’s IntoIter except that indexes are
/// limited to u8 to reduce size of the structure.
#[derive(Clone, Debug)]
pub(crate) struct EscapeIterInner<const N: usize> {
    // The element type ensures this is always ASCII, and thus also valid UTF-8.
    pub(crate) data: [ascii::Char; N],

    // Indices into `data` of the elements that have not been yielded yet.
    // Invariant: alive.start <= alive.end <= N.
    pub(crate) alive: Range<u8>,
}
73 | |
74 | impl<const N: usize> EscapeIterInner<N> { |
75 | pub fn new(data: [ascii::Char; N], alive: Range<u8>) -> Self { |
76 | const { assert!(N < 256) }; |
77 | debug_assert!(alive.start <= alive.end && usize::from(alive.end) <= N, " {alive:?}" ); |
78 | Self { data, alive } |
79 | } |
80 | |
81 | pub fn from_array<const M: usize>(array: [ascii::Char; M]) -> Self { |
82 | const { assert!(M <= N) }; |
83 | |
84 | let mut data = [ascii::Char::Null; N]; |
85 | data[..M].copy_from_slice(&array); |
86 | Self::new(data, 0..M as u8) |
87 | } |
88 | |
89 | pub fn as_ascii(&self) -> &[ascii::Char] { |
90 | &self.data[usize::from(self.alive.start)..usize::from(self.alive.end)] |
91 | } |
92 | |
93 | pub fn as_str(&self) -> &str { |
94 | self.as_ascii().as_str() |
95 | } |
96 | |
97 | pub fn len(&self) -> usize { |
98 | usize::from(self.alive.end - self.alive.start) |
99 | } |
100 | |
101 | pub fn next(&mut self) -> Option<u8> { |
102 | self.alive.next().map(|i| self.data[usize::from(i)].to_u8()) |
103 | } |
104 | |
105 | pub fn next_back(&mut self) -> Option<u8> { |
106 | self.alive.next_back().map(|i| self.data[usize::from(i)].to_u8()) |
107 | } |
108 | |
109 | pub fn advance_by(&mut self, n: usize) -> Result<(), NonZeroUsize> { |
110 | self.alive.advance_by(n) |
111 | } |
112 | |
113 | pub fn advance_back_by(&mut self, n: usize) -> Result<(), NonZeroUsize> { |
114 | self.alive.advance_back_by(n) |
115 | } |
116 | } |
117 | |