mod.rs source code [crates/miniz_oxide/src/inflate/mod.rs]

1	//! This module contains functionality for decompression.
2
3	#[cfg(feature = "with-alloc")]
4	use crate::alloc::{boxed::Box, vec, vec::Vec};
5	#[cfg(all(feature = "std", feature = "with-alloc"))]
6	use std::error::Error;
7
8	pub mod core;
9	mod output_buffer;
10	#[cfg(not(feature = "rustc-dep-of-std"))]
11	pub mod stream;
12	#[cfg(not(feature = "rustc-dep-of-std"))]
13	use self::core::*;
14
15	const TINFL_STATUS_FAILED_CANNOT_MAKE_PROGRESS: i32 = `-4`;
16	const TINFL_STATUS_BAD_PARAM: i32 = `-3`;
17	const TINFL_STATUS_ADLER32_MISMATCH: i32 = `-2`;
18	const TINFL_STATUS_FAILED: i32 = `-1`;
19	const TINFL_STATUS_DONE: i32 = `0`;
20	const TINFL_STATUS_NEEDS_MORE_INPUT: i32 = `1`;
21	const TINFL_STATUS_HAS_MORE_OUTPUT: i32 = `2`;
22	#[cfg(feature = "block-boundary")]
23	const TINFL_STATUS_BLOCK_BOUNDARY: i32 = `3`;
24
25	/// Return status codes.
26	#[repr(i8)]
27	#[cfg_attr(not(feature = "rustc-dep-of-std"), derive(Hash, Debug))]
28	#[derive(Copy, Clone, PartialEq, Eq)]
29	pub enum TINFLStatus {
30	/// More input data was expected, but the caller indicated that there was no more data, so the
31	/// input stream is likely truncated.
32	///
33	/// This can't happen if you have provided the
34	/// [`TINFL_FLAG_HAS_MORE_INPUT`][core::inflate_flags::TINFL_FLAG_HAS_MORE_INPUT] flag to the
35	/// decompression. By setting that flag, you indicate more input exists but is not provided,
36	/// and so reaching the end of the input data without finding the end of the compressed stream
37	/// would instead return a [`NeedsMoreInput`][Self::NeedsMoreInput] status.
38	FailedCannotMakeProgress = TINFL_STATUS_FAILED_CANNOT_MAKE_PROGRESS as i8,
39
40	/// The output buffer is an invalid size; consider the `flags` parameter.
41	BadParam = TINFL_STATUS_BAD_PARAM as i8,
42
43	/// The decompression went fine, but the adler32 checksum did not match the one
44	/// provided in the header.
45	Adler32Mismatch = TINFL_STATUS_ADLER32_MISMATCH as i8,
46
47	/// Failed to decompress due to invalid data.
48	Failed = TINFL_STATUS_FAILED as i8,
49
50	/// Finished decompression without issues.
51	///
52	/// This indicates the end of the compressed stream has been reached.
53	Done = TINFL_STATUS_DONE as i8,
54
55	/// The decompressor needs more input data to continue decompressing.
56	///
57	/// This occurs when there's no more consumable input, but the end of the stream hasn't been
58	/// reached, and you have supplied the
59	/// [`TINFL_FLAG_HAS_MORE_INPUT`][core::inflate_flags::TINFL_FLAG_HAS_MORE_INPUT] flag to the
60	/// decompressor. Had you not supplied that flag (which would mean you were asserting that you
61	/// believed all the data was available) you would have gotten a
62	/// [`FailedCannotMakeProcess`][Self::FailedCannotMakeProgress] instead.
63	NeedsMoreInput = TINFL_STATUS_NEEDS_MORE_INPUT as i8,
64
65	/// There is still pending data that didn't fit in the output buffer.
66	HasMoreOutput = TINFL_STATUS_HAS_MORE_OUTPUT as i8,
67
68	/// Reached the end of a deflate block, and the start of the next block.
69	///
70	/// At this point, you can suspend decompression and later resume with a new `DecompressorOxide`.
71	/// The only state that must be preserved is [`DecompressorOxide::block_boundary_state()`],
72	/// plus the last 32KiB of the output buffer (or less if you know the stream was compressed with
73	/// a smaller window size).
74	///
75	/// This is only returned if you use the
76	/// [`TINFL_FLAG_STOP_ON_BLOCK_BOUNDARY`][core::inflate_flags::TINFL_FLAG_STOP_ON_BLOCK_BOUNDARY] flag.
77	#[cfg(feature = "block-boundary")]
78	BlockBoundary = TINFL_STATUS_BLOCK_BOUNDARY as i8,
79	}
80
81	impl TINFLStatus {
82	pub fn from_i32(value: i32) -> Option<TINFLStatus> {
83	use self::TINFLStatus::*;
84	match value {
85	TINFL_STATUS_FAILED_CANNOT_MAKE_PROGRESS => Some(FailedCannotMakeProgress),
86	TINFL_STATUS_BAD_PARAM => Some(BadParam),
87	TINFL_STATUS_ADLER32_MISMATCH => Some(Adler32Mismatch),
88	TINFL_STATUS_FAILED => Some(Failed),
89	TINFL_STATUS_DONE => Some(Done),
90	TINFL_STATUS_NEEDS_MORE_INPUT => Some(NeedsMoreInput),
91	TINFL_STATUS_HAS_MORE_OUTPUT => Some(HasMoreOutput),
92	#[cfg(feature = "block-boundary")]
93	TINFL_STATUS_BLOCK_BOUNDARY => Some(BlockBoundary),
94	_ => None,
95	}
96	}
97	}
98
99	/// Struct return when decompress_to_vec functions fail.
100	#[cfg(feature = "with-alloc")]
101	#[derive(Debug)]
102	pub struct DecompressError {
103	/// Decompressor status on failure. See [TINFLStatus] for details.
104	pub status: TINFLStatus,
105	/// The currently decompressed data if any.
106	pub output: Vec<u8>,
107	}
108
109	#[cfg(feature = "with-alloc")]
110	impl alloc::fmt::Display for DecompressError {
111	#[cold]
112	fn fmt(&self, f: &mut ::core::fmt::Formatter<'_>) -> ::core::fmt::Result {
113	f.write_str(data:match self.status {
114	TINFLStatus::FailedCannotMakeProgress => "Truncated input stream",
115	TINFLStatus::BadParam => "Invalid output buffer size",
116	TINFLStatus::Adler32Mismatch => "Adler32 checksum mismatch",
117	TINFLStatus::Failed => "Invalid input data",
118	TINFLStatus::Done => "", // Unreachable
119	TINFLStatus::NeedsMoreInput => "Truncated input stream",
120	TINFLStatus::HasMoreOutput => "Output size exceeded the specified limit",
121	#[cfg(feature = "block-boundary")]
122	TINFLStatus::BlockBoundary => "Reached end of a deflate block",
123	})
124	}
125	}
126
127	/// Implement Error trait only if std feature is requested as it requires std.
128	#[cfg(all(feature = "std", feature = "with-alloc"))]
129	impl Error for DecompressError {}
130
131	#[cfg(feature = "with-alloc")]
132	fn decompress_error(status: TINFLStatus, output: Vec<u8>) -> Result<Vec<u8>, DecompressError> {
133	Err(DecompressError { status, output })
134	}
135
136	/// Decompress the deflate-encoded data in `input` to a vector.
137	///
138	/// NOTE: This function will not bound the output, so if the output is large enough it can result in an out of memory error.
139	/// It is therefore suggested to not use this for anything other than test programs, use the functions with a specified limit, or
140	/// ideally streaming decompression via the [flate2](https://github.com/alexcrichton/flate2-rs) library instead.
141	///
142	/// Returns a [`Result`] containing the [`Vec`] of decompressed data on success, and a [struct][DecompressError] containing the status and so far decompressed data if any on failure.
143	#[inline]
144	#[cfg(feature = "with-alloc")]
145	pub fn decompress_to_vec(input: &[u8]) -> Result<Vec<u8>, DecompressError> {
146	decompress_to_vec_inner(input, flags:`0`, max_output_size:usize::MAX)
147	}
148
149	/// Decompress the deflate-encoded data (with a zlib wrapper) in `input` to a vector.
150	///
151	/// NOTE: This function will not bound the output, so if the output is large enough it can result in an out of memory error.
152	/// It is therefore suggested to not use this for anything other than test programs, use the functions with a specified limit, or
153	/// ideally streaming decompression via the [flate2](https://github.com/alexcrichton/flate2-rs) library instead.
154	///
155	/// Returns a [`Result`] containing the [`Vec`] of decompressed data on success, and a [struct][DecompressError] containing the status and so far decompressed data if any on failure.
156	#[inline]
157	#[cfg(feature = "with-alloc")]
158	pub fn decompress_to_vec_zlib(input: &[u8]) -> Result<Vec<u8>, DecompressError> {
159	decompress_to_vec_inner(
160	input,
161	flags:inflate_flags::TINFL_FLAG_PARSE_ZLIB_HEADER,
162	max_output_size:usize::MAX,
163	)
164	}
165
166	/// Decompress the deflate-encoded data in `input` to a vector.
167	///
168	/// The vector is grown to at most `max_size` bytes; if the data does not fit in that size,
169	/// the error [struct][DecompressError] will contain the status [`TINFLStatus::HasMoreOutput`] and the data that was decompressed on failure.
170	///
171	/// As this function tries to decompress everything in one go, it's not ideal for general use outside of tests or where the output size is expected to be small.
172	/// It is suggested to use streaming decompression via the [flate2](https://github.com/alexcrichton/flate2-rs) library instead.
173	///
174	/// Returns a [`Result`] containing the [`Vec`] of decompressed data on success, and a [struct][DecompressError] on failure.
175	#[inline]
176	#[cfg(feature = "with-alloc")]
177	pub fn decompress_to_vec_with_limit(
178	input: &[u8],
179	max_size: usize,
180	) -> Result<Vec<u8>, DecompressError> {
181	decompress_to_vec_inner(input, flags:`0`, max_output_size:max_size)
182	}
183
184	/// Decompress the deflate-encoded data (with a zlib wrapper) in `input` to a vector.
185	/// The vector is grown to at most `max_size` bytes; if the data does not fit in that size,
186	/// the error [struct][DecompressError] will contain the status [`TINFLStatus::HasMoreOutput`] and the data that was decompressed on failure.
187	///
188	/// As this function tries to decompress everything in one go, it's not ideal for general use outside of tests or where the output size is expected to be small.
189	/// It is suggested to use streaming decompression via the [flate2](https://github.com/alexcrichton/flate2-rs) library instead.
190	///
191	/// Returns a [`Result`] containing the [`Vec`] of decompressed data on success, and a [struct][DecompressError] on failure.
192	#[inline]
193	#[cfg(feature = "with-alloc")]
194	pub fn decompress_to_vec_zlib_with_limit(
195	input: &[u8],
196	max_size: usize,
197	) -> Result<Vec<u8>, DecompressError> {
198	decompress_to_vec_inner(input, flags:inflate_flags::TINFL_FLAG_PARSE_ZLIB_HEADER, max_output_size:max_size)
199	}
200
201	/// Backend of various to-[`Vec`] decompressions.
202	///
203	/// Returns [`Vec`] of decompressed data on success and the [error struct][DecompressError] with details on failure.
204	#[cfg(feature = "with-alloc")]
205	fn decompress_to_vec_inner(
206	mut input: &[u8],
207	flags: u32,
208	max_output_size: usize,
209	) -> Result<Vec<u8>, DecompressError> {
210	let flags = flags \| inflate_flags::TINFL_FLAG_USING_NON_WRAPPING_OUTPUT_BUF;
211	let mut ret: Vec<u8> = vec![`0`; input.len().saturating_mul(`2`).min(max_output_size)];
212
213	let mut decomp = Box::<DecompressorOxide>::default();
214
215	let mut out_pos = `0`;
216	loop {
217	// Wrap the whole output slice so we know we have enough of the
218	// decompressed data for matches.
219	let (status, in_consumed, out_consumed) =
220	decompress(&mut decomp, input, &mut ret, out_pos, flags);
221	out_pos += out_consumed;
222
223	match status {
224	TINFLStatus::Done => {
225	ret.truncate(out_pos);
226	return Ok(ret);
227	}
228
229	TINFLStatus::HasMoreOutput => {
230	// in_consumed is not expected to be out of bounds,
231	// but the check eliminates a panicking code path
232	if in_consumed > input.len() {
233	return decompress_error(TINFLStatus::HasMoreOutput, ret);
234	}
235	input = &input[in_consumed..];
236
237	// if the buffer has already reached the size limit, return an error
238	if ret.len() >= max_output_size {
239	return decompress_error(TINFLStatus::HasMoreOutput, ret);
240	}
241	// calculate the new length, capped at `max_output_size`
242	let new_len = ret.len().saturating_mul(`2`).min(max_output_size);
243	ret.resize(new_len, `0`);
244	}
245
246	_ => return decompress_error(status, ret),
247	}
248	}
249	}
250
251	/// Decompress one or more source slices from an iterator into the output slice.
252	///
253	/// On success, returns the number of bytes that were written.*
254	/// On failure, returns the failure status code.*
255	///
256	/// This will fail if the output buffer is not large enough, but in that case
257	/// the output buffer will still contain the partial decompression.
258	///
259	/// `out` the output buffer.*
260	/// `it` the iterator of input slices.*
261	/// `zlib_header` if the first slice out of the iterator is expected to have a*
262	/// Zlib header. Otherwise the slices are assumed to be the deflate data only.
263	/// `ignore_adler32` if the adler32 checksum should be calculated or not.*
264	#[cfg(not(feature = "rustc-dep-of-std"))]
265	pub fn decompress_slice_iter_to_slice<'out, 'inp>(
266	out: &'out mut [u8],
267	it: impl Iterator<Item = &'inp [u8]>,
268	zlib_header: bool,
269	ignore_adler32: bool,
270	) -> Result<usize, TINFLStatus> {
271	use self::core::inflate_flags::*;
272
273	let mut it = it.peekable();
274	let r = &mut DecompressorOxide::new();
275	let mut out_pos = `0`;
276	while let Some(in_buf) = it.next() {
277	let has_more = it.peek().is_some();
278	let flags = {
279	let mut f = TINFL_FLAG_USING_NON_WRAPPING_OUTPUT_BUF;
280	if zlib_header {
281	f \|= TINFL_FLAG_PARSE_ZLIB_HEADER;
282	}
283	if ignore_adler32 {
284	f \|= TINFL_FLAG_IGNORE_ADLER32;
285	}
286	if has_more {
287	f \|= TINFL_FLAG_HAS_MORE_INPUT;
288	}
289	f
290	};
291	let (status, _input_read, bytes_written) = decompress(r, in_buf, out, out_pos, flags);
292	out_pos += bytes_written;
293	match status {
294	TINFLStatus::NeedsMoreInput => continue,
295	TINFLStatus::Done => return Ok(out_pos),
296	e => return Err(e),
297	}
298	}
299	// If we ran out of source slices without getting a `Done` from the
300	// decompression we can call it a failure.
301	Err(TINFLStatus::FailedCannotMakeProgress)
302	}
303
304	#[cfg(all(test, feature = "with-alloc"))]
305	mod test {
306	use super::{
307	decompress_slice_iter_to_slice, decompress_to_vec_zlib, decompress_to_vec_zlib_with_limit,
308	DecompressError, TINFLStatus,
309	};
310	const ENCODED: [u8; `20`] = [
311	`120`, `156`, `243`, `72`, `205`, `201`, `201`, `215`, `81`, `168`, `202`, `201`, `76`, `82`, `4`, `0`, `27`, `101`, `4`, `19`,
312	];
313
314	#[test]
315	fn decompress_vec() {
316	let res = decompress_to_vec_zlib(&ENCODED[..]).unwrap();
317	assert_eq!(res.as_slice(), &b"Hello, zlib!"[..]);
318	}
319
320	#[test]
321	fn decompress_vec_with_high_limit() {
322	let res = decompress_to_vec_zlib_with_limit(&ENCODED[..], `100_000`).unwrap();
323	assert_eq!(res.as_slice(), &b"Hello, zlib!"[..]);
324	}
325
326	#[test]
327	fn fail_to_decompress_with_limit() {
328	let res = decompress_to_vec_zlib_with_limit(&ENCODED[..], `8`);
329	match res {
330	Err(DecompressError {
331	status: TINFLStatus::HasMoreOutput,
332	..
333	}) => (), // expected result
334	_ => panic!("Decompression output size limit was not enforced"),
335	}
336	}
337
338	#[test]
339	fn test_decompress_slice_iter_to_slice() {
340	// one slice
341	let mut out = [`0_u8`; `12_usize`];
342	let r =
343	decompress_slice_iter_to_slice(&mut out, Some(&ENCODED[..]).into_iter(), `true`, `false`);
344	assert_eq!(r, Ok(`12`));
345	assert_eq!(&out[..`12`], &b"Hello, zlib!"[..]);
346
347	// some chunks at a time
348	for chunk_size in `1`..`13` {
349	// Note: because of https://github.com/Frommi/miniz_oxide/issues/110 our
350	// out buffer needs to have +1 byte available when the chunk size cuts
351	// the adler32 data off from the last actual data.
352	let mut out = [`0_u8`; `12_usize` + `1`];
353	let r =
354	decompress_slice_iter_to_slice(&mut out, ENCODED.chunks(chunk_size), `true`, `false`);
355	assert_eq!(r, Ok(`12`));
356	assert_eq!(&out[..`12`], &b"Hello, zlib!"[..]);
357	}
358
359	// output buffer too small
360	let mut out = [`0_u8`; `3_usize`];
361	let r = decompress_slice_iter_to_slice(&mut out, ENCODED.chunks(`7`), `true`, `false`);
362	assert!(r.is_err());
363	}
364	}
365