use core::convert::TryInto;

pub use super::bit_reader::GetBitsError;
use crate::io::Read;

/// Zstandard encodes some types of data in a way that requires it to be read
/// back to front to decode it properly. `BitReaderReversed` provides a
/// convenient interface to do that.
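///
/// A rough usage sketch (illustrative only; the exact import path depends on
/// how this module is re-exported by the crate):
///
/// ```ignore
/// let data = [0xAB, 0xCD];
/// let mut br = BitReaderReversed::new(&data);
/// // The last byte of the source is consumed first.
/// assert_eq!(br.get_bits(8), 0xCD);
/// assert_eq!(br.get_bits(8), 0xAB);
/// assert_eq!(br.bits_remaining(), 0);
/// ```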
pub struct BitReaderReversed<'s> {
    /// Counts the bits in the source that have not yet been loaded into the
    /// container; goes negative once reads past the end of the stream are emulated.
    idx: isize,
    source: &'s [u8],
    /// The reader doesn't read directly from the source,
    /// it reads bits from here, and the container is
    /// "refilled" as it's emptied.
    bit_container: u64,
    bits_in_container: u8,
}

impl<'s> BitReaderReversed<'s> {
    /// How many bits are left to read by the reader.
    pub fn bits_remaining(&self) -> isize {
        self.idx + self.bits_in_container as isize
    }

    pub fn new(source: &'s [u8]) -> BitReaderReversed<'s> {
        BitReaderReversed {
            idx: source.len() as isize * 8,
            source,
            bit_container: 0,
            bits_in_container: 0,
        }
    }

    /// We refill the container in full bytes, shifting the still unread portion
    /// to the left and filling the lower bits with new data.
    #[inline(always)]
    fn refill_container(&mut self) {
        let byte_idx = self.byte_idx() as usize;

        let retain_bytes = (self.bits_in_container + 7) / 8;
        let want_to_read_bits = 64 - (retain_bytes * 8);

        // If there are >= 8 bytes left to read we take the fast path.
        // The slice looks something like this: |U..UCCCCCCCCR..R|, where U are still unread bytes,
        // C are the bytes currently in the container, and R are already read bytes.
        // We shift the container a few bytes to the left by simply reading a u64 from the correct
        // position, rereading the portion of the container we have not yet returned.
        // Technically this would still work for positions lower than 8, but requiring >= 8
        // guarantees that enough bytes are in the source and leaves fewer edge cases.
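        // A worked example (illustrative numbers, not taken from a real stream): with a 32-byte
        // source, 10 bits already buffered, and idx == 184, we get byte_idx == 22,
        // retain_bytes == 2, and want_to_read_bits == 48; the fast path then reloads the u64 at
        // bytes 17..=24, re-reading the 2 partially consumed container bytes and pulling in
        // 6 fresh bytes below them.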
        if byte_idx >= 8 {
            self.refill_fast(byte_idx, retain_bytes, want_to_read_bits)
        } else {
            // In the slow path we just read however many bytes we can
            self.refill_slow(byte_idx, want_to_read_bits)
        }
    }

    #[inline(always)]
    fn refill_fast(&mut self, byte_idx: usize, retain_bytes: u8, want_to_read_bits: u8) {
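        // Pick the 8-byte window whose top `retain_bytes` bytes are the partially consumed
        // bytes already in the container and whose remaining bytes are fresh data just below
        // them; reading it as a little-endian u64 rebuilds the container in one load.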
        let load_from_byte_idx = byte_idx - 7 + retain_bytes as usize;
        let tmp_bytes: [u8; 8] = (&self.source[load_from_byte_idx..][..8])
            .try_into()
            .unwrap();
        let refill = u64::from_le_bytes(tmp_bytes);
        self.bit_container = refill;
        self.bits_in_container += want_to_read_bits;
        self.idx -= want_to_read_bits as isize;
    }

    #[cold]
    fn refill_slow(&mut self, byte_idx: usize, want_to_read_bits: u8) {
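        // Near the front of the source there may be fewer than 8 bytes left, so read only as
        // many whole bytes as remain and splice them in below the bits already in the container.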
        let can_read_bits = isize::min(want_to_read_bits as isize, self.idx);
        let can_read_bytes = can_read_bits / 8;
        let mut tmp_bytes = [0u8; 8];
        let offset @ 1..=8 = can_read_bytes as usize else {
            unreachable!()
        };
        let bits_read = offset * 8;

        let _ = (&self.source[byte_idx - (offset - 1)..]).read_exact(&mut tmp_bytes[0..offset]);
        self.bits_in_container += bits_read as u8;
        self.idx -= bits_read as isize;
        if offset < 8 {
            self.bit_container <<= bits_read;
            self.bit_container |= u64::from_le_bytes(tmp_bytes);
        } else {
            self.bit_container = u64::from_le_bytes(tmp_bytes);
        }
    }

    /// Next byte that should be read into the container.
    /// Negative values mean that the source buffer has been read into the container completely.
    fn byte_idx(&self) -> isize {
        (self.idx - 1) / 8
    }

    /// Read `n` bits from the source. Will read at most 56 bits.
    /// If there are no more bits to be read from the source, zero bits will be returned instead.
    #[inline(always)]
    pub fn get_bits(&mut self, n: u8) -> u64 {
        if n == 0 {
            return 0;
        }
        if self.bits_in_container >= n {
            return self.get_bits_unchecked(n);
        }

        self.get_bits_cold(n)
    }

    #[cold]
    fn get_bits_cold(&mut self, n: u8) -> u64 {
        let n = u8::min(n, 56);
        let signed_n = n as isize;

        if self.bits_remaining() <= 0 {
            self.idx -= signed_n;
            return 0;
        }

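        // Fewer bits remain than were requested: return what is left, shifted into the high
        // positions as if the missing low bits had been read as zeroes, and let `idx` go
        // negative so `bits_remaining` reflects the overshoot.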
        if self.bits_remaining() < signed_n {
            let emulated_read_shift = signed_n - self.bits_remaining();
            let v = self.get_bits(self.bits_remaining() as u8);
            debug_assert!(self.idx == 0);
            let value = v.wrapping_shl(emulated_read_shift as u32);
            self.idx -= emulated_read_shift;
            return value;
        }

        while (self.bits_in_container < n) && self.idx > 0 {
            self.refill_container();
        }

        debug_assert!(self.bits_in_container >= n);

        // If we reach this point there are enough bits in the container.

        self.get_bits_unchecked(n)
    }

    /// Same as calling `get_bits` three times, but slightly more performant.
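    /// The values are returned in argument order, as if produced by
    /// `(self.get_bits(n1), self.get_bits(n2), self.get_bits(n3))`.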
    #[inline(always)]
    pub fn get_bits_triple(&mut self, n1: u8, n2: u8, n3: u8) -> (u64, u64, u64) {
        let sum = n1 as usize + n2 as usize + n3 as usize;
        if sum == 0 {
            return (0, 0, 0);
        }
        if sum > 56 {
            // the sum is too large for the bit container, so get the values separately
            return (self.get_bits(n1), self.get_bits(n2), self.get_bits(n3));
        }
        let sum = sum as u8;

        if self.bits_in_container >= sum {
            let v1 = if n1 == 0 {
                0
            } else {
                self.get_bits_unchecked(n1)
            };
            let v2 = if n2 == 0 {
                0
            } else {
                self.get_bits_unchecked(n2)
            };
            let v3 = if n3 == 0 {
                0
            } else {
                self.get_bits_unchecked(n3)
            };

            return (v1, v2, v3);
        }

        self.get_bits_triple_cold(n1, n2, n3, sum)
    }

    #[cold]
    fn get_bits_triple_cold(&mut self, n1: u8, n2: u8, n3: u8, sum: u8) -> (u64, u64, u64) {
        let sum_signed = sum as isize;

        if self.bits_remaining() <= 0 {
            self.idx -= sum_signed;
            return (0, 0, 0);
        }

        if self.bits_remaining() < sum_signed {
            return (self.get_bits(n1), self.get_bits(n2), self.get_bits(n3));
        }

        while (self.bits_in_container < sum) && self.idx > 0 {
            self.refill_container();
        }

        debug_assert!(self.bits_in_container >= sum);

        // If we reach this point there are enough bits in the container.

        let v1 = if n1 == 0 {
            0
        } else {
            self.get_bits_unchecked(n1)
        };
        let v2 = if n2 == 0 {
            0
        } else {
            self.get_bits_unchecked(n2)
        };
        let v3 = if n3 == 0 {
            0
        } else {
            self.get_bits_unchecked(n3)
        };

        (v1, v2, v3)
    }

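    /// Take the top `n` valid bits out of the container. The caller must make sure that at
    /// least `n` bits are currently buffered (e.g. with `bit_container == 0xCDAB` and
    /// `bits_in_container == 16`, `get_bits_unchecked(8)` yields `0xCD` and leaves 8 bits).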
    #[inline(always)]
    fn get_bits_unchecked(&mut self, n: u8) -> u64 {
        let shift_by = self.bits_in_container - n;
        let mask = (1u64 << n) - 1u64;

        let value = self.bit_container >> shift_by;
        self.bits_in_container -= n;
        let value_masked = value & mask;
        debug_assert!(value_masked < (1 << n));

        value_masked
    }

    pub fn reset(&mut self, new_source: &'s [u8]) {
        self.idx = new_source.len() as isize * 8;
        self.source = new_source;
        self.bit_container = 0;
        self.bits_in_container = 0;
    }
}

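// A minimal sanity-check sketch of the reversed reading order. The expected values follow from
// the container/shift logic above; the test names and cases are illustrative additions, not part
// of the original module.
#[cfg(test)]
mod tests {
    use super::BitReaderReversed;

    #[test]
    fn reads_back_to_front() {
        let data = [0xAB, 0xCD];
        let mut br = BitReaderReversed::new(&data);
        // The last byte of the source is consumed first.
        assert_eq!(br.get_bits(8), 0xCD);
        assert_eq!(br.get_bits(8), 0xAB);
        assert_eq!(br.bits_remaining(), 0);
    }

    #[test]
    fn over_reads_return_zero_bits() {
        let data = [0x80];
        let mut br = BitReaderReversed::new(&data);
        // The single set bit is the most significant bit of the last (and only) byte.
        assert_eq!(br.get_bits(1), 1);
        assert_eq!(br.get_bits(7), 0);
        // Past the end of the stream, zero bits are returned and `bits_remaining` goes negative.
        assert_eq!(br.get_bits(4), 0);
        assert!(br.bits_remaining() < 0);
    }
}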