1 | use std::cmp; |
2 | use std::io; |
3 | use std::io::prelude::*; |
4 | |
5 | use super::{corrupt, GzBuilder, GzHeader, GzHeaderParser}; |
6 | use crate::crc::{Crc, CrcWriter}; |
7 | use crate::zio; |
8 | use crate::{Compress, Compression, Decompress, Status}; |
9 | |
10 | /// A gzip streaming encoder |
11 | /// |
12 | /// This structure exposes a [`Write`] interface that will emit compressed data |
13 | /// to the underlying writer `W`. |
14 | /// |
15 | /// [`Write`]: https://doc.rust-lang.org/std/io/trait.Write.html |
16 | /// |
17 | /// # Examples |
18 | /// |
19 | /// ``` |
20 | /// use std::io::prelude::*; |
21 | /// use flate2::Compression; |
22 | /// use flate2::write::GzEncoder; |
23 | /// |
24 | /// // Vec<u8> implements Write to print the compressed bytes of sample string |
25 | /// # fn main() { |
26 | /// |
27 | /// let mut e = GzEncoder::new(Vec::new(), Compression::default()); |
28 | /// e.write_all(b"Hello World" ).unwrap(); |
29 | /// println!("{:?}" , e.finish().unwrap()); |
30 | /// # } |
31 | /// ``` |
32 | #[derive (Debug)] |
33 | pub struct GzEncoder<W: Write> { |
34 | inner: zio::Writer<W, Compress>, |
35 | crc: Crc, |
36 | crc_bytes_written: usize, |
37 | header: Vec<u8>, |
38 | } |
39 | |
40 | pub fn gz_encoder<W: Write>(header: Vec<u8>, w: W, lvl: Compression) -> GzEncoder<W> { |
41 | GzEncoder { |
42 | inner: zio::Writer::new(w, d:Compress::new(level:lvl, zlib_header:false)), |
43 | crc: Crc::new(), |
44 | header, |
45 | crc_bytes_written: 0, |
46 | } |
47 | } |
48 | |
49 | impl<W: Write> GzEncoder<W> { |
50 | /// Creates a new encoder which will use the given compression level. |
51 | /// |
52 | /// The encoder is not configured specially for the emitted header. For |
53 | /// header configuration, see the `GzBuilder` type. |
54 | /// |
55 | /// The data written to the returned encoder will be compressed and then |
56 | /// written to the stream `w`. |
57 | pub fn new(w: W, level: Compression) -> GzEncoder<W> { |
58 | GzBuilder::new().write(w, level) |
59 | } |
60 | |
61 | /// Acquires a reference to the underlying writer. |
62 | pub fn get_ref(&self) -> &W { |
63 | self.inner.get_ref() |
64 | } |
65 | |
66 | /// Acquires a mutable reference to the underlying writer. |
67 | /// |
68 | /// Note that mutation of the writer may result in surprising results if |
69 | /// this encoder is continued to be used. |
70 | pub fn get_mut(&mut self) -> &mut W { |
71 | self.inner.get_mut() |
72 | } |
73 | |
74 | /// Attempt to finish this output stream, writing out final chunks of data. |
75 | /// |
76 | /// Note that this function can only be used once data has finished being |
77 | /// written to the output stream. After this function is called then further |
78 | /// calls to `write` may result in a panic. |
79 | /// |
80 | /// # Panics |
81 | /// |
82 | /// Attempts to write data to this stream may result in a panic after this |
83 | /// function is called. |
84 | /// |
85 | /// # Errors |
86 | /// |
87 | /// This function will perform I/O to complete this stream, and any I/O |
88 | /// errors which occur will be returned from this function. |
89 | pub fn try_finish(&mut self) -> io::Result<()> { |
90 | self.write_header()?; |
91 | self.inner.finish()?; |
92 | |
93 | while self.crc_bytes_written < 8 { |
94 | let (sum, amt) = (self.crc.sum(), self.crc.amount()); |
95 | let buf = [ |
96 | (sum >> 0) as u8, |
97 | (sum >> 8) as u8, |
98 | (sum >> 16) as u8, |
99 | (sum >> 24) as u8, |
100 | (amt >> 0) as u8, |
101 | (amt >> 8) as u8, |
102 | (amt >> 16) as u8, |
103 | (amt >> 24) as u8, |
104 | ]; |
105 | let inner = self.inner.get_mut(); |
106 | let n = inner.write(&buf[self.crc_bytes_written..])?; |
107 | self.crc_bytes_written += n; |
108 | } |
109 | Ok(()) |
110 | } |
111 | |
112 | /// Finish encoding this stream, returning the underlying writer once the |
113 | /// encoding is done. |
114 | /// |
115 | /// Note that this function may not be suitable to call in a situation where |
116 | /// the underlying stream is an asynchronous I/O stream. To finish a stream |
117 | /// the `try_finish` (or `shutdown`) method should be used instead. To |
118 | /// re-acquire ownership of a stream it is safe to call this method after |
119 | /// `try_finish` or `shutdown` has returned `Ok`. |
120 | /// |
121 | /// # Errors |
122 | /// |
123 | /// This function will perform I/O to complete this stream, and any I/O |
124 | /// errors which occur will be returned from this function. |
125 | pub fn finish(mut self) -> io::Result<W> { |
126 | self.try_finish()?; |
127 | Ok(self.inner.take_inner()) |
128 | } |
129 | |
130 | fn write_header(&mut self) -> io::Result<()> { |
131 | while !self.header.is_empty() { |
132 | let n = self.inner.get_mut().write(&self.header)?; |
133 | self.header.drain(..n); |
134 | } |
135 | Ok(()) |
136 | } |
137 | } |
138 | |
139 | impl<W: Write> Write for GzEncoder<W> { |
140 | fn write(&mut self, buf: &[u8]) -> io::Result<usize> { |
141 | assert_eq!(self.crc_bytes_written, 0); |
142 | self.write_header()?; |
143 | let n: usize = self.inner.write(buf)?; |
144 | self.crc.update(&buf[..n]); |
145 | Ok(n) |
146 | } |
147 | |
148 | fn flush(&mut self) -> io::Result<()> { |
149 | assert_eq!(self.crc_bytes_written, 0); |
150 | self.write_header()?; |
151 | self.inner.flush() |
152 | } |
153 | } |
154 | |
155 | impl<R: Read + Write> Read for GzEncoder<R> { |
156 | fn read(&mut self, buf: &mut [u8]) -> io::Result<usize> { |
157 | self.get_mut().read(buf) |
158 | } |
159 | } |
160 | |
161 | impl<W: Write> Drop for GzEncoder<W> { |
162 | fn drop(&mut self) { |
163 | if self.inner.is_present() { |
164 | let _ = self.try_finish(); |
165 | } |
166 | } |
167 | } |
168 | |
169 | /// A decoder for a single member of a [gzip file]. |
170 | /// |
171 | /// This structure exposes a [`Write`] interface, receiving compressed data and |
172 | /// writing uncompressed data to the underlying writer. |
173 | /// |
174 | /// After decoding a single member of the gzip data this writer will return the number of bytes up to |
175 | /// to the end of the gzip member and subsequent writes will return Ok(0) allowing the caller to |
176 | /// handle any data following the gzip member. |
177 | /// |
178 | /// To handle gzip files that may have multiple members, see [`MultiGzDecoder`] |
179 | /// or read more |
180 | /// [in the introduction](../index.html#about-multi-member-gzip-files). |
181 | /// |
182 | /// [gzip file]: https://www.rfc-editor.org/rfc/rfc1952#page-5 |
183 | /// [`Write`]: https://doc.rust-lang.org/std/io/trait.Write.html |
184 | /// |
185 | /// # Examples |
186 | /// |
187 | /// ``` |
188 | /// use std::io::prelude::*; |
189 | /// use std::io; |
190 | /// use flate2::Compression; |
191 | /// use flate2::write::{GzEncoder, GzDecoder}; |
192 | /// |
193 | /// # fn main() { |
194 | /// # let mut e = GzEncoder::new(Vec::new(), Compression::default()); |
195 | /// # e.write(b"Hello World" ).unwrap(); |
196 | /// # let bytes = e.finish().unwrap(); |
197 | /// # assert_eq!("Hello World" , decode_writer(bytes).unwrap()); |
198 | /// # } |
199 | /// // Uncompresses a gzip encoded vector of bytes and returns a string or error |
200 | /// // Here Vec<u8> implements Write |
201 | /// fn decode_writer(bytes: Vec<u8>) -> io::Result<String> { |
202 | /// let mut writer = Vec::new(); |
203 | /// let mut decoder = GzDecoder::new(writer); |
204 | /// decoder.write_all(&bytes[..])?; |
205 | /// writer = decoder.finish()?; |
206 | /// let return_string = String::from_utf8(writer).expect("String parsing error" ); |
207 | /// Ok(return_string) |
208 | /// } |
209 | /// ``` |
210 | #[derive (Debug)] |
211 | pub struct GzDecoder<W: Write> { |
212 | inner: zio::Writer<CrcWriter<W>, Decompress>, |
213 | crc_bytes: Vec<u8>, |
214 | header_parser: GzHeaderParser, |
215 | } |
216 | |
// Size in bytes of the trailer collected after the compressed stream: two
// little-endian 32-bit words, which `finish_and_check_crc` compares against
// the checksum and the amount of the decoded data.
const CRC_BYTES_LEN: usize = 8;
218 | |
219 | impl<W: Write> GzDecoder<W> { |
220 | /// Creates a new decoder which will write uncompressed data to the stream. |
221 | /// |
222 | /// When this encoder is dropped or unwrapped the final pieces of data will |
223 | /// be flushed. |
224 | pub fn new(w: W) -> GzDecoder<W> { |
225 | GzDecoder { |
226 | inner: zio::Writer::new(CrcWriter::new(w), Decompress::new(false)), |
227 | crc_bytes: Vec::with_capacity(CRC_BYTES_LEN), |
228 | header_parser: GzHeaderParser::new(), |
229 | } |
230 | } |
231 | |
232 | /// Returns the header associated with this stream. |
233 | pub fn header(&self) -> Option<&GzHeader> { |
234 | self.header_parser.header() |
235 | } |
236 | |
237 | /// Acquires a reference to the underlying writer. |
238 | pub fn get_ref(&self) -> &W { |
239 | self.inner.get_ref().get_ref() |
240 | } |
241 | |
242 | /// Acquires a mutable reference to the underlying writer. |
243 | /// |
244 | /// Note that mutating the output/input state of the stream may corrupt this |
245 | /// object, so care must be taken when using this method. |
246 | pub fn get_mut(&mut self) -> &mut W { |
247 | self.inner.get_mut().get_mut() |
248 | } |
249 | |
250 | /// Attempt to finish this output stream, writing out final chunks of data. |
251 | /// |
252 | /// Note that this function can only be used once data has finished being |
253 | /// written to the output stream. After this function is called then further |
254 | /// calls to `write` may result in a panic. |
255 | /// |
256 | /// # Panics |
257 | /// |
258 | /// Attempts to write data to this stream may result in a panic after this |
259 | /// function is called. |
260 | /// |
261 | /// # Errors |
262 | /// |
263 | /// This function will perform I/O to finish the stream, returning any |
264 | /// errors which happen. |
265 | pub fn try_finish(&mut self) -> io::Result<()> { |
266 | self.finish_and_check_crc()?; |
267 | Ok(()) |
268 | } |
269 | |
270 | /// Consumes this decoder, flushing the output stream. |
271 | /// |
272 | /// This will flush the underlying data stream and then return the contained |
273 | /// writer if the flush succeeded. |
274 | /// |
275 | /// Note that this function may not be suitable to call in a situation where |
276 | /// the underlying stream is an asynchronous I/O stream. To finish a stream |
277 | /// the `try_finish` (or `shutdown`) method should be used instead. To |
278 | /// re-acquire ownership of a stream it is safe to call this method after |
279 | /// `try_finish` or `shutdown` has returned `Ok`. |
280 | /// |
281 | /// # Errors |
282 | /// |
283 | /// This function will perform I/O to complete this stream, and any I/O |
284 | /// errors which occur will be returned from this function. |
285 | pub fn finish(mut self) -> io::Result<W> { |
286 | self.finish_and_check_crc()?; |
287 | Ok(self.inner.take_inner().into_inner()) |
288 | } |
289 | |
290 | fn finish_and_check_crc(&mut self) -> io::Result<()> { |
291 | self.inner.finish()?; |
292 | |
293 | if self.crc_bytes.len() != 8 { |
294 | return Err(corrupt()); |
295 | } |
296 | |
297 | let crc = ((self.crc_bytes[0] as u32) << 0) |
298 | | ((self.crc_bytes[1] as u32) << 8) |
299 | | ((self.crc_bytes[2] as u32) << 16) |
300 | | ((self.crc_bytes[3] as u32) << 24); |
301 | let amt = ((self.crc_bytes[4] as u32) << 0) |
302 | | ((self.crc_bytes[5] as u32) << 8) |
303 | | ((self.crc_bytes[6] as u32) << 16) |
304 | | ((self.crc_bytes[7] as u32) << 24); |
305 | if crc != self.inner.get_ref().crc().sum() { |
306 | return Err(corrupt()); |
307 | } |
308 | if amt != self.inner.get_ref().crc().amount() { |
309 | return Err(corrupt()); |
310 | } |
311 | Ok(()) |
312 | } |
313 | } |
314 | |
315 | impl<W: Write> Write for GzDecoder<W> { |
316 | fn write(&mut self, mut buf: &[u8]) -> io::Result<usize> { |
317 | let buflen = buf.len(); |
318 | if self.header().is_none() { |
319 | match self.header_parser.parse(&mut buf) { |
320 | Err(err) => { |
321 | if err.kind() == io::ErrorKind::UnexpectedEof { |
322 | // all data read but header still not complete |
323 | Ok(buflen) |
324 | } else { |
325 | Err(err) |
326 | } |
327 | } |
328 | Ok(_) => { |
329 | debug_assert!(self.header().is_some()); |
330 | // buf now contains the unread part of the original buf |
331 | let n = buflen - buf.len(); |
332 | Ok(n) |
333 | } |
334 | } |
335 | } else { |
336 | let (n, status) = self.inner.write_with_status(buf)?; |
337 | |
338 | if status == Status::StreamEnd && n < buf.len() && self.crc_bytes.len() < 8 { |
339 | let remaining = buf.len() - n; |
340 | let crc_bytes = cmp::min(remaining, CRC_BYTES_LEN - self.crc_bytes.len()); |
341 | self.crc_bytes.extend(&buf[n..n + crc_bytes]); |
342 | return Ok(n + crc_bytes); |
343 | } |
344 | Ok(n) |
345 | } |
346 | } |
347 | |
348 | fn flush(&mut self) -> io::Result<()> { |
349 | self.inner.flush() |
350 | } |
351 | } |
352 | |
353 | impl<W: Read + Write> Read for GzDecoder<W> { |
354 | fn read(&mut self, buf: &mut [u8]) -> io::Result<usize> { |
355 | self.inner.get_mut().get_mut().read(buf) |
356 | } |
357 | } |
358 | |
359 | /// A gzip streaming decoder that decodes a [gzip file] with multiple members. |
360 | /// |
361 | /// This structure exposes a [`Write`] interface that will consume compressed data and |
362 | /// write uncompressed data to the underlying writer. |
363 | /// |
364 | /// A gzip file consists of a series of *members* concatenated one after another. |
365 | /// `MultiGzDecoder` decodes all members of a file and writes them to the |
366 | /// underlying writer one after another. |
367 | /// |
368 | /// To handle members separately, see [GzDecoder] or read more |
369 | /// [in the introduction](../index.html#about-multi-member-gzip-files). |
370 | /// |
371 | /// [gzip file]: https://www.rfc-editor.org/rfc/rfc1952#page-5 |
372 | #[derive (Debug)] |
373 | pub struct MultiGzDecoder<W: Write> { |
374 | inner: GzDecoder<W>, |
375 | } |
376 | |
377 | impl<W: Write> MultiGzDecoder<W> { |
378 | /// Creates a new decoder which will write uncompressed data to the stream. |
379 | /// If the gzip stream contains multiple members all will be decoded. |
380 | pub fn new(w: W) -> MultiGzDecoder<W> { |
381 | MultiGzDecoder { |
382 | inner: GzDecoder::new(w), |
383 | } |
384 | } |
385 | |
386 | /// Returns the header associated with the current member. |
387 | pub fn header(&self) -> Option<&GzHeader> { |
388 | self.inner.header() |
389 | } |
390 | |
391 | /// Acquires a reference to the underlying writer. |
392 | pub fn get_ref(&self) -> &W { |
393 | self.inner.get_ref() |
394 | } |
395 | |
396 | /// Acquires a mutable reference to the underlying writer. |
397 | /// |
398 | /// Note that mutating the output/input state of the stream may corrupt this |
399 | /// object, so care must be taken when using this method. |
400 | pub fn get_mut(&mut self) -> &mut W { |
401 | self.inner.get_mut() |
402 | } |
403 | |
404 | /// Attempt to finish this output stream, writing out final chunks of data. |
405 | /// |
406 | /// Note that this function can only be used once data has finished being |
407 | /// written to the output stream. After this function is called then further |
408 | /// calls to `write` may result in a panic. |
409 | /// |
410 | /// # Panics |
411 | /// |
412 | /// Attempts to write data to this stream may result in a panic after this |
413 | /// function is called. |
414 | /// |
415 | /// # Errors |
416 | /// |
417 | /// This function will perform I/O to finish the stream, returning any |
418 | /// errors which happen. |
419 | pub fn try_finish(&mut self) -> io::Result<()> { |
420 | self.inner.try_finish() |
421 | } |
422 | |
423 | /// Consumes this decoder, flushing the output stream. |
424 | /// |
425 | /// This will flush the underlying data stream and then return the contained |
426 | /// writer if the flush succeeded. |
427 | /// |
428 | /// Note that this function may not be suitable to call in a situation where |
429 | /// the underlying stream is an asynchronous I/O stream. To finish a stream |
430 | /// the `try_finish` (or `shutdown`) method should be used instead. To |
431 | /// re-acquire ownership of a stream it is safe to call this method after |
432 | /// `try_finish` or `shutdown` has returned `Ok`. |
433 | /// |
434 | /// # Errors |
435 | /// |
436 | /// This function will perform I/O to complete this stream, and any I/O |
437 | /// errors which occur will be returned from this function. |
438 | pub fn finish(self) -> io::Result<W> { |
439 | self.inner.finish() |
440 | } |
441 | } |
442 | |
443 | impl<W: Write> Write for MultiGzDecoder<W> { |
444 | fn write(&mut self, buf: &[u8]) -> io::Result<usize> { |
445 | if buf.is_empty() { |
446 | Ok(0) |
447 | } else { |
448 | match self.inner.write(buf) { |
449 | Ok(0) => { |
450 | // When the GzDecoder indicates that it has finished |
451 | // create a new GzDecoder to handle additional data. |
452 | self.inner.try_finish()?; |
453 | let w: W = self.inner.inner.take_inner().into_inner(); |
454 | self.inner = GzDecoder::new(w); |
455 | self.inner.write(buf) |
456 | } |
457 | res: Result => res, |
458 | } |
459 | } |
460 | } |
461 | |
462 | fn flush(&mut self) -> io::Result<()> { |
463 | self.inner.flush() |
464 | } |
465 | } |
466 | |
#[cfg(test)]
mod tests {
    use super::*;

    const STR: &str = "Hello World Hello World Hello World Hello World Hello World \
        Hello World Hello World Hello World Hello World Hello World \
        Hello World Hello World Hello World Hello World Hello World \
        Hello World Hello World Hello World Hello World Hello World \
        Hello World Hello World Hello World Hello World Hello World";

    /// Compresses `STR` into a single gzip member with the write-side encoder.
    ///
    /// `write_all` is used so that a short write cannot silently truncate the
    /// fixture.
    fn gzip_sample() -> Vec<u8> {
        let mut e = GzEncoder::new(Vec::new(), Compression::default());
        e.write_all(STR.as_bytes()).unwrap();
        e.finish().unwrap()
    }

    /// Finishes `decoder` and returns everything it decoded as a string.
    fn finish_to_string(decoder: GzDecoder<Vec<u8>>) -> String {
        let writer = decoder.finish().unwrap();
        String::from_utf8(writer).expect("String parsing error")
    }

    #[test]
    fn decode_writer_one_chunk() {
        let bytes = gzip_sample();

        let mut decoder = GzDecoder::new(Vec::new());
        let n = decoder.write(&bytes[..]).unwrap();
        decoder.write(&bytes[n..]).unwrap();
        decoder.try_finish().unwrap();
        assert_eq!(finish_to_string(decoder), STR);
    }

    #[test]
    fn decode_writer_partial_header() {
        let bytes = gzip_sample();

        let mut decoder = GzDecoder::new(Vec::new());
        assert_eq!(decoder.write(&bytes[..5]).unwrap(), 5);
        let n = decoder.write(&bytes[5..]).unwrap();
        if n < bytes.len() - 5 {
            decoder.write(&bytes[n + 5..]).unwrap();
        }
        assert_eq!(finish_to_string(decoder), STR);
    }

    #[test]
    fn decode_writer_partial_header_filename() {
        let filename = "test.txt";
        let mut e = GzBuilder::new()
            .filename(filename)
            .read(STR.as_bytes(), Compression::default());
        let mut bytes = Vec::new();
        e.read_to_end(&mut bytes).unwrap();

        let mut decoder = GzDecoder::new(Vec::new());
        assert_eq!(decoder.write(&bytes[..12]).unwrap(), 12);
        let n = decoder.write(&bytes[12..]).unwrap();
        if n < bytes.len() - 12 {
            decoder.write(&bytes[n + 12..]).unwrap();
        }
        assert_eq!(
            decoder.header().unwrap().filename().unwrap(),
            filename.as_bytes()
        );
        assert_eq!(finish_to_string(decoder), STR);
    }

    #[test]
    fn decode_writer_partial_header_comment() {
        let comment = "test comment";
        let mut e = GzBuilder::new()
            .comment(comment)
            .read(STR.as_bytes(), Compression::default());
        let mut bytes = Vec::new();
        e.read_to_end(&mut bytes).unwrap();

        let mut decoder = GzDecoder::new(Vec::new());
        assert_eq!(decoder.write(&bytes[..12]).unwrap(), 12);
        let n = decoder.write(&bytes[12..]).unwrap();
        if n < bytes.len() - 12 {
            decoder.write(&bytes[n + 12..]).unwrap();
        }
        assert_eq!(
            decoder.header().unwrap().comment().unwrap(),
            comment.as_bytes()
        );
        assert_eq!(finish_to_string(decoder), STR);
    }

    #[test]
    fn decode_writer_exact_header() {
        let bytes = gzip_sample();

        let mut decoder = GzDecoder::new(Vec::new());
        assert_eq!(decoder.write(&bytes[..10]).unwrap(), 10);
        decoder.write(&bytes[10..]).unwrap();
        assert_eq!(finish_to_string(decoder), STR);
    }

    #[test]
    fn decode_writer_partial_crc() {
        let bytes = gzip_sample();

        let mut decoder = GzDecoder::new(Vec::new());
        let l = bytes.len() - 5;
        let n = decoder.write(&bytes[..l]).unwrap();
        decoder.write(&bytes[n..]).unwrap();
        assert_eq!(finish_to_string(decoder), STR);
    }

    // Two or more gzip files concatenated form a multi-member gzip file. MultiGzDecoder will
    // concatenate the decoded contents of all members.
    #[test]
    fn decode_multi_writer() {
        let bytes = gzip_sample().repeat(2);

        let mut decoder = MultiGzDecoder::new(Vec::new());
        let mut count = 0;
        while count < bytes.len() {
            let n = decoder.write(&bytes[count..]).unwrap();
            assert!(n != 0);
            count += n;
        }
        let writer = decoder.finish().unwrap();
        let return_string = String::from_utf8(writer).expect("String parsing error");
        let expected = STR.repeat(2);
        assert_eq!(return_string, expected);
    }

    // GzDecoder consumes one gzip member and then returns 0 for subsequent writes, allowing any
    // additional data to be consumed by the caller.
    #[test]
    fn decode_extra_data() {
        let compressed = {
            let mut b = gzip_sample();
            b.push(b'x');
            b
        };

        let mut decoder = GzDecoder::new(Vec::new());
        let mut consumed_bytes = 0;
        loop {
            let n = decoder.write(&compressed[consumed_bytes..]).unwrap();
            if n == 0 {
                break;
            }
            consumed_bytes += n;
        }
        let actual = finish_to_string(decoder);
        assert_eq!(actual, STR);
        assert_eq!(&compressed[consumed_bytes..], b"x");
    }
}
642 | |