//! Composable structures to handle writing an image.


use std::fmt::Debug;
use std::io::Seek;
use std::iter::Peekable;
use std::ops::Not;
use std::sync::mpsc;
use rayon_core::{ThreadPool, ThreadPoolBuildError};

use smallvec::alloc::collections::BTreeMap;

use crate::block::UncompressedBlock;
use crate::block::chunk::Chunk;
use crate::compression::Compression;
use crate::error::{Error, Result, UnitResult, usize_to_u64};
use crate::io::{Data, Tracking, Write};
use crate::meta::{Headers, MetaData, OffsetTables};
use crate::meta::attribute::LineOrder;

/// Write an exr file by writing one chunk after another in a closure.
/// In the closure, you are provided a chunk writer, which should be used to write all the chunks.
/// Assumes that your write destination is buffered.
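///
/// A minimal sketch of the closure-based workflow. Here, `headers` is assumed
/// to be a valid `Headers` value built elsewhere, `blocks` an iterator of
/// `(usize, UncompressedBlock)` in increasing line order, and `"image.exr"` a
/// hypothetical output path:
/// ```ignore
/// let file = std::io::BufWriter::new(std::fs::File::create("image.exr")?);
///
/// write_chunks_with(file, headers, true, |meta, chunk_writer| {
///     // compress each block on this thread and write it as a chunk
///     let mut compressor = chunk_writer.sequential_blocks_compressor(&meta);
///     for (index_in_header, block) in blocks {
///         compressor.compress_block(index_in_header, block)?;
///     }
///     Ok(())
/// })?;
/// ```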
pub fn write_chunks_with<W: Write + Seek>(
    buffered_write: W, headers: Headers, pedantic: bool,
    write_chunks: impl FnOnce(MetaData, &mut ChunkWriter<W>) -> UnitResult
) -> UnitResult {
    // this closure approach ensures that after writing all chunks, the file is always completed and checked and flushed
    let (meta, mut writer) = ChunkWriter::new_for_buffered(buffered_write, headers, pedantic)?;
    write_chunks(meta, &mut writer)?;
    writer.complete_meta_data()
}

/// Can consume compressed pixel chunks, writing them to a file.
/// Use `sequential_blocks_compressor` or `parallel_blocks_compressor` to compress your data,
/// or use `compress_all_blocks_sequential` or `compress_all_blocks_parallel`.
/// Use `on_progress` to obtain a new writer
/// that triggers a callback for each block.
#[derive(Debug)]
#[must_use]
pub struct ChunkWriter<W> {
    header_count: usize,
    byte_writer: Tracking<W>,
    chunk_indices_byte_location: std::ops::Range<usize>,
    chunk_indices_increasing_y: OffsetTables,
    chunk_count: usize, // TODO compose?
}

/// A new writer that triggers a callback
/// for each block written to the inner writer.
#[derive(Debug)]
#[must_use]
pub struct OnProgressChunkWriter<'w, W, F> {
    chunk_writer: &'w mut W,
    written_chunks: usize,
    on_progress: F,
}

/// Write chunks to a byte destination.
/// Then write each chunk with `writer.write_chunk(chunk)`.
pub trait ChunksWriter: Sized {

    /// The total number of chunks that the complete file will contain.
    fn total_chunks_count(&self) -> usize;

    /// Write a single chunk to the file.
    /// Errors when the chunk at this index was already written; such calls have no effect.
    /// If writing results in an error, the file and the writer
    /// may remain in an invalid state and should not be used further.
    fn write_chunk(&mut self, index_in_header_increasing_y: usize, chunk: Chunk) -> UnitResult;

    /// Obtain a new writer that calls the specified closure for each block that is written to this writer.
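    ///
    /// For example, a sketch that prints the progress percentage; `chunk_writer`
    /// stands for any value implementing `ChunksWriter`:
    /// ```ignore
    /// let mut progress_writer = chunk_writer.on_progress(|progress| {
    ///     // `progress` is a fraction between 0.0 and 1.0
    ///     println!("{:.0}% of chunks written", progress * 100.0);
    /// });
    /// ```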
    fn on_progress<F>(&mut self, on_progress: F) -> OnProgressChunkWriter<'_, Self, F> where F: FnMut(f64) {
        OnProgressChunkWriter { chunk_writer: self, written_chunks: 0, on_progress }
    }

    /// Obtain a new writer that can compress blocks to chunks, which are then passed to this writer.
    fn sequential_blocks_compressor<'w>(&'w mut self, meta: &'w MetaData) -> SequentialBlocksCompressor<'w, Self> {
        SequentialBlocksCompressor::new(meta, self)
    }

    /// Obtain a new writer that can compress blocks to chunks on multiple threads, which are then passed to this writer.
    /// Returns `None` if the sequential compressor should be used instead
    /// (thread pool creation failure or too large performance overhead).
    fn parallel_blocks_compressor<'w>(&'w mut self, meta: &'w MetaData) -> Option<ParallelBlocksCompressor<'w, Self>> {
        ParallelBlocksCompressor::new(meta, self)
    }

    /// Compresses all blocks to the file.
    /// The index of each block must be in increasing line order within the header.
    /// Obtain the iterator with `MetaData::collect_ordered_blocks(...)` or similar methods.
    fn compress_all_blocks_sequential(mut self, meta: &MetaData, blocks: impl Iterator<Item=(usize, UncompressedBlock)>) -> UnitResult {
        let mut writer = self.sequential_blocks_compressor(meta);

        // TODO check block order if line order is not unspecified!
        for (index_in_header_increasing_y, block) in blocks {
            writer.compress_block(index_in_header_increasing_y, block)?;
        }

        // TODO debug_assert_eq!(self.is_complete());
        Ok(())
    }

    /// Compresses all blocks to the file.
    /// The index of each block must be in increasing line order within the header.
    /// Obtain the iterator with `MetaData::collect_ordered_blocks(...)` or similar methods.
    /// Will fall back to sequential processing where threads are not available, or where it would not speed up the process.
    fn compress_all_blocks_parallel(mut self, meta: &MetaData, blocks: impl Iterator<Item=(usize, UncompressedBlock)>) -> UnitResult {
        let mut parallel_writer = match self.parallel_blocks_compressor(meta) {
            None => return self.compress_all_blocks_sequential(meta, blocks),
            Some(writer) => writer,
        };

        // TODO check block order if line order is not unspecified!
        for (index_in_header_increasing_y, block) in blocks {
            parallel_writer.add_block_to_compression_queue(index_in_header_increasing_y, block)?;
        }

        // TODO debug_assert_eq!(self.is_complete());
        Ok(())
    }
}


impl<W> ChunksWriter for ChunkWriter<W> where W: Write + Seek {

    /// The total number of chunks that the complete file will contain.
    fn total_chunks_count(&self) -> usize { self.chunk_count }

    /// Write a single chunk to the file.
    /// Errors when the chunk at this index was already written; such calls have no effect.
    /// If writing results in an error, the file and the writer
    /// may remain in an invalid state and should not be used further.
    fn write_chunk(&mut self, index_in_header_increasing_y: usize, chunk: Chunk) -> UnitResult {
        let header_chunk_indices = &mut self.chunk_indices_increasing_y[chunk.layer_index];

        if index_in_header_increasing_y >= header_chunk_indices.len() {
            return Err(Error::invalid("too large chunk index"));
        }

        // a zero entry in the offset table marks a chunk that has not been written yet
        let chunk_index_slot = &mut header_chunk_indices[index_in_header_increasing_y];
        if *chunk_index_slot != 0 {
            return Err(Error::invalid(format!("chunk at index {} is already written", index_in_header_increasing_y)));
        }

        *chunk_index_slot = usize_to_u64(self.byte_writer.byte_position());
        chunk.write(&mut self.byte_writer, self.header_count)?;
        Ok(())
    }
}

impl<W> ChunkWriter<W> where W: Write + Seek {
    // -- the following functions are private, because they must be called in a strict order --

    /// Writes the meta data and zeroed offset tables as a placeholder.
    fn new_for_buffered(buffered_byte_writer: W, headers: Headers, pedantic: bool) -> Result<(MetaData, Self)> {
        let mut write = Tracking::new(buffered_byte_writer);
        let requirements = MetaData::write_validating_to_buffered(&mut write, headers.as_slice(), pedantic)?;

        // TODO: use increasing line order where possible, but this requires us to know whether we want to be parallel right now
        /*// if non-parallel compression, we always use increasing order anyways
        if !parallel || !has_compression {
            for header in &mut headers {
                if header.line_order == LineOrder::Unspecified {
                    header.line_order = LineOrder::Increasing;
                }
            }
        }*/

        let offset_table_size: usize = headers.iter().map(|header| header.chunk_count).sum();

        let offset_table_start_byte = write.byte_position();
        let offset_table_end_byte = write.byte_position() + offset_table_size * u64::BYTE_SIZE;

        // skip the offset tables for now, filling with 0; they will be updated after the last chunk has been written
        write.seek_write_to(offset_table_end_byte)?;

        let header_count = headers.len();
        let chunk_indices_increasing_y = headers.iter()
            .map(|header| vec![0_u64; header.chunk_count]).collect();

        let meta_data = MetaData { requirements, headers };

        Ok((meta_data, ChunkWriter {
            header_count,
            byte_writer: write,
            chunk_count: offset_table_size,
            chunk_indices_byte_location: offset_table_start_byte .. offset_table_end_byte,
            chunk_indices_increasing_y,
        }))
    }

    /// Seek back to the meta data, write offset tables, and flush the byte writer.
    /// Leaves the writer seeked to the middle of the file.
    fn complete_meta_data(mut self) -> UnitResult {
        if self.chunk_indices_increasing_y.iter().flatten().any(|&index| index == 0) {
            return Err(Error::invalid("some chunks are not written yet"))
        }

        // write all offset tables
        debug_assert_ne!(self.byte_writer.byte_position(), self.chunk_indices_byte_location.end, "offset table has already been updated");
        self.byte_writer.seek_write_to(self.chunk_indices_byte_location.start)?;

        for table in self.chunk_indices_increasing_y {
            u64::write_slice(&mut self.byte_writer, table.as_slice())?;
        }

        self.byte_writer.flush()?; // make sure we catch all (possibly delayed) io errors before returning
        Ok(())
    }

}


impl<'w, W, F> ChunksWriter for OnProgressChunkWriter<'w, W, F> where W: 'w + ChunksWriter, F: FnMut(f64) {
    fn total_chunks_count(&self) -> usize {
        self.chunk_writer.total_chunks_count()
    }

    fn write_chunk(&mut self, index_in_header_increasing_y: usize, chunk: Chunk) -> UnitResult {
        let total_chunks = self.total_chunks_count();
        let on_progress = &mut self.on_progress;

        // guarantee on_progress being called with 0 once
        if self.written_chunks == 0 { on_progress(0.0); }

        self.chunk_writer.write_chunk(index_in_header_increasing_y, chunk)?;

        self.written_chunks += 1;

        on_progress({
            // guarantee finishing with progress 1.0 for the last block at least once,
            // as float division might yield a value slightly different from 1.0
            if self.written_chunks == total_chunks { 1.0 }
            else { self.written_chunks as f64 / total_chunks as f64 }
        });

        Ok(())
    }
}


/// Write blocks that appear in any order and reorder them before writing.
#[derive(Debug)]
#[must_use]
pub struct SortedBlocksWriter<'w, W> {
    chunk_writer: &'w mut W,
    pending_chunks: BTreeMap<usize, (usize, Chunk)>,
    unwritten_chunk_indices: Peekable<std::ops::Range<usize>>,
    requires_sorting: bool, // using this instead of Option, because of borrowing
}


impl<'w, W> SortedBlocksWriter<'w, W> where W: ChunksWriter {

    /// New sorting writer. If no header requires a specific line order,
    /// chunks are passed straight through to the inner writer without sorting.
    pub fn new(meta_data: &MetaData, chunk_writer: &'w mut W) -> SortedBlocksWriter<'w, W> {
        let requires_sorting = meta_data.headers.iter()
            .any(|header| header.line_order != LineOrder::Unspecified);

        let total_chunk_count = chunk_writer.total_chunks_count();

        SortedBlocksWriter {
            pending_chunks: BTreeMap::new(),
            unwritten_chunk_indices: (0 .. total_chunk_count).peekable(),
            requires_sorting,
            chunk_writer
        }
    }

    /// Write the chunk now if it is the next one in line order,
    /// or stash it until all of its predecessors have been written.
    /// Also writes any stashed chunks that become writable as a result.
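    ///
    /// For example, a sketch of three chunks arriving out of order; `sorted` is
    /// assumed to be a `SortedBlocksWriter` over three chunks with sorting required:
    /// ```ignore
    /// sorted.write_or_stash_chunk(2, 2, chunk_c)?; // not next in line: stashed
    /// sorted.write_or_stash_chunk(0, 0, chunk_a)?; // next in line: written immediately
    /// sorted.write_or_stash_chunk(1, 1, chunk_b)?; // written, then the stashed chunk 2 is flushed
    /// ```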
    pub fn write_or_stash_chunk(&mut self, chunk_index_in_file: usize, chunk_y_index: usize, chunk: Chunk) -> UnitResult {
        if self.requires_sorting.not() {
            return self.chunk_writer.write_chunk(chunk_y_index, chunk);
        }

        // write this chunk now if possible
        if self.unwritten_chunk_indices.peek() == Some(&chunk_index_in_file) {
            self.chunk_writer.write_chunk(chunk_y_index, chunk)?;
            self.unwritten_chunk_indices.next().expect("peeked chunk index is missing");

            // write all pending blocks that are immediate successors of this block
            while let Some((next_chunk_y_index, next_chunk)) = self
                .unwritten_chunk_indices.peek().cloned()
                .and_then(|id| self.pending_chunks.remove(&id))
            {
                self.chunk_writer.write_chunk(next_chunk_y_index, next_chunk)?;
                self.unwritten_chunk_indices.next().expect("peeked chunk index is missing");
            }
        }

        else {
            // the argument block is not to be written now,
            // and all the pending blocks are not next up either,
            // so just stash this block
            self.pending_chunks.insert(chunk_index_in_file, (chunk_y_index, chunk));
        }

        Ok(())
    }

    /// Where the chunks will be written to.
    pub fn inner_chunks_writer(&self) -> &W {
        &self.chunk_writer
    }
}



/// Compress blocks to a chunk writer in this thread.
#[derive(Debug)]
#[must_use]
pub struct SequentialBlocksCompressor<'w, W> {
    meta: &'w MetaData,
    chunks_writer: &'w mut W,
}

impl<'w, W> SequentialBlocksCompressor<'w, W> where W: 'w + ChunksWriter {

    /// New blocks writer.
    pub fn new(meta: &'w MetaData, chunks_writer: &'w mut W) -> Self { Self { meta, chunks_writer } }

    /// This is where the compressed blocks are written to.
    pub fn inner_chunks_writer(&'w self) -> &'w W { self.chunks_writer }

    /// Compress a single block immediately. The index of the block must be in increasing line order.
    pub fn compress_block(&mut self, index_in_header_increasing_y: usize, block: UncompressedBlock) -> UnitResult {
        self.chunks_writer.write_chunk(
            index_in_header_increasing_y,
            block.compress_to_chunk(&self.meta.headers)?
        )
    }
}

/// Compress blocks to a chunk writer with multiple threads.
#[derive(Debug)]
#[must_use]
pub struct ParallelBlocksCompressor<'w, W> {
    meta: &'w MetaData,
    sorted_writer: SortedBlocksWriter<'w, W>,

    sender: mpsc::Sender<Result<(usize, usize, Chunk)>>,
    receiver: mpsc::Receiver<Result<(usize, usize, Chunk)>>,
    pool: rayon_core::ThreadPool,

    currently_compressing_count: usize,
    written_chunk_count: usize, // used to check for last chunk
    max_threads: usize,
    next_incoming_chunk_index: usize, // used to remember original chunk order
}

impl<'w, W> ParallelBlocksCompressor<'w, W> where W: 'w + ChunksWriter {

    /// New blocks writer. Returns `None` if sequential compression should be used.
    /// Use `new_with_thread_pool` to customize the thread pool.
    pub fn new(meta: &'w MetaData, chunks_writer: &'w mut W) -> Option<Self> {
        Self::new_with_thread_pool(meta, chunks_writer, || {
            rayon_core::ThreadPoolBuilder::new()
                .thread_name(|index| format!("OpenEXR Block Compressor Thread #{}", index))
                .build()
        })
    }

    /// New blocks writer. Returns `None` if sequential compression should be used.
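    ///
    /// For example, a sketch using a pool limited to four threads; `meta` and
    /// `chunk_writer` are assumed from the surrounding context:
    /// ```ignore
    /// let compressor = ParallelBlocksCompressor::new_with_thread_pool(&meta, &mut chunk_writer, || {
    ///     rayon_core::ThreadPoolBuilder::new()
    ///         .num_threads(4)
    ///         .build()
    /// });
    /// ```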
    pub fn new_with_thread_pool<CreatePool>(
        meta: &'w MetaData, chunks_writer: &'w mut W, try_create_thread_pool: CreatePool)
        -> Option<Self>
        where CreatePool: FnOnce() -> std::result::Result<ThreadPool, ThreadPoolBuildError>
    {
        if meta.headers.iter().all(|head| head.compression == Compression::Uncompressed) {
            return None;
        }

        // in case thread pool creation fails (for example on WASM currently),
        // we revert to sequential compression
        let pool = match try_create_thread_pool() {
            Ok(pool) => pool,

            // TODO print warning?
            Err(_) => return None,
        };

        // keep roughly one block in flight per thread at all times, plus a little headroom
        let max_threads = pool.current_num_threads().max(1).min(chunks_writer.total_chunks_count()) + 2;
        let (send, recv) = mpsc::channel(); // TODO bounded channel simplifies logic?

        Some(Self {
            sorted_writer: SortedBlocksWriter::new(meta, chunks_writer),
            next_incoming_chunk_index: 0,
            currently_compressing_count: 0,
            written_chunk_count: 0,
            sender: send,
            receiver: recv,
            max_threads,
            pool,
            meta,
        })
    }

    /// This is where the compressed blocks are written to.
    pub fn inner_chunks_writer(&'w self) -> &'w W { self.sorted_writer.inner_chunks_writer() }

    // private, as it may underflow the counter in release mode
    fn write_next_queued_chunk(&mut self) -> UnitResult {
        debug_assert!(self.currently_compressing_count > 0, "cannot wait for chunks as there are none left");

        let some_compressed_chunk = self.receiver.recv()
            .expect("cannot receive compressed block");

        self.currently_compressing_count -= 1;
        let (chunk_file_index, chunk_y_index, chunk) = some_compressed_chunk?;
        self.sorted_writer.write_or_stash_chunk(chunk_file_index, chunk_y_index, chunk)?;

        self.written_chunk_count += 1;
        Ok(())
    }

    /// Wait until all currently compressing chunks in the compressor have been written.
    pub fn write_all_queued_chunks(&mut self) -> UnitResult {
        while self.currently_compressing_count > 0 {
            self.write_next_queued_chunk()?;
        }

        debug_assert_eq!(self.currently_compressing_count, 0, "counter does not match block count");
        Ok(())
    }

    /// Add a single block to the compressor queue. The index of the block must be in increasing line order.
    /// When calling this function for the last block, this method waits until all the blocks have been written.
    /// This only works when you write as many blocks as the image expects;
    /// otherwise, call `write_all_queued_chunks` manually after the last block.
    /// Waits for a block from the queue to be written, if the queue already has enough items.
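    ///
    /// For example, a sketch that queues blocks from an iterator, mirroring
    /// `compress_all_blocks_parallel`; `compressor` and `blocks` are assumed from context:
    /// ```ignore
    /// for (index_in_header, block) in blocks {
    ///     compressor.add_block_to_compression_queue(index_in_header, block)?;
    /// }
    /// // only needed if fewer blocks were queued than the image expects:
    /// compressor.write_all_queued_chunks()?;
    /// ```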
    pub fn add_block_to_compression_queue(&mut self, index_in_header_increasing_y: usize, block: UncompressedBlock) -> UnitResult {

        // if the pipe is full, block to wait for a slot to free up
        if self.currently_compressing_count >= self.max_threads {
            self.write_next_queued_chunk()?;
        }

        // add the argument chunk to the compression queue
        let index_in_file = self.next_incoming_chunk_index;
        let sender = self.sender.clone();
        let meta = self.meta.clone();

        self.pool.spawn(move || {
            let compressed_or_err = block.compress_to_chunk(&meta.headers);

            // by now, compressing could have failed in another thread,
            // and the receiver might already be dropped while that error is handled,
            // so we simply ignore a failed send and do nothing
            let _ = sender.send(compressed_or_err.map(move |compressed| (index_in_file, index_in_header_increasing_y, compressed)));
        });

        self.currently_compressing_count += 1;
        self.next_incoming_chunk_index += 1;

        // if this is the last chunk, wait for all chunks to complete before returning
        if self.written_chunk_count + self.currently_compressing_count == self.inner_chunks_writer().total_chunks_count() {
            self.write_all_queued_chunks()?;
            debug_assert_eq!(
                self.written_chunk_count, self.inner_chunks_writer().total_chunks_count(),
                "written chunk count mismatch"
            );
        }

        Ok(())
    }
}