1 | //! Parallel iterator types for [ranges][std::range], |
2 | //! the type for values created by `a..b` expressions |
3 | //! |
4 | //! You will rarely need to interact with this module directly unless you have |
5 | //! need to name one of the iterator types. |
6 | //! |
7 | //! ``` |
8 | //! use rayon::prelude::*; |
9 | //! |
10 | //! let r = (0..100u64).into_par_iter() |
11 | //! .sum(); |
12 | //! |
13 | //! // compare result with sequential calculation |
14 | //! assert_eq!((0..100).sum::<u64>(), r); |
15 | //! ``` |
16 | //! |
17 | //! [std::range]: https://doc.rust-lang.org/core/ops/struct.Range.html |
18 | |
19 | use crate::iter::plumbing::*; |
20 | use crate::iter::*; |
21 | use std::ops::Range; |
22 | |
23 | /// Parallel iterator over a range, implemented for all integer types and `char`. |
24 | /// |
25 | /// **Note:** The `zip` operation requires `IndexedParallelIterator` |
26 | /// which is not implemented for `u64`, `i64`, `u128`, or `i128`. |
27 | /// |
28 | /// ``` |
29 | /// use rayon::prelude::*; |
30 | /// |
31 | /// let p = (0..25usize).into_par_iter() |
32 | /// .zip(0..25usize) |
33 | /// .filter(|&(x, y)| x % 5 == 0 || y % 5 == 0) |
34 | /// .map(|(x, y)| x * y) |
35 | /// .sum::<usize>(); |
36 | /// |
37 | /// let s = (0..25usize).zip(0..25) |
38 | /// .filter(|&(x, y)| x % 5 == 0 || y % 5 == 0) |
39 | /// .map(|(x, y)| x * y) |
40 | /// .sum(); |
41 | /// |
42 | /// assert_eq!(p, s); |
43 | /// ``` |
44 | #[derive (Debug, Clone)] |
45 | pub struct Iter<T> { |
46 | range: Range<T>, |
47 | } |
48 | |
49 | /// Implemented for ranges of all primitive integer types and `char`. |
50 | impl<T> IntoParallelIterator for Range<T> |
51 | where |
52 | Iter<T>: ParallelIterator, |
53 | { |
54 | type Item = <Iter<T> as ParallelIterator>::Item; |
55 | type Iter = Iter<T>; |
56 | |
57 | fn into_par_iter(self) -> Self::Iter { |
58 | Iter { range: self } |
59 | } |
60 | } |
61 | |
62 | struct IterProducer<T> { |
63 | range: Range<T>, |
64 | } |
65 | |
66 | impl<T> IntoIterator for IterProducer<T> |
67 | where |
68 | Range<T>: Iterator, |
69 | { |
70 | type Item = <Range<T> as Iterator>::Item; |
71 | type IntoIter = Range<T>; |
72 | |
73 | fn into_iter(self) -> Self::IntoIter { |
74 | self.range |
75 | } |
76 | } |
77 | |
78 | /// These traits help drive integer type inference. Without them, an unknown `{integer}` type only |
79 | /// has constraints on `Iter<{integer}>`, which will probably give up and use `i32`. By adding |
80 | /// these traits on the item type, the compiler can see a more direct constraint to infer like |
81 | /// `{integer}: RangeInteger`, which works better. See `test_issue_833` for an example. |
82 | /// |
83 | /// They have to be `pub` since they're seen in the public `impl ParallelIterator` constraints, but |
84 | /// we put them in a private modules so they're not actually reachable in our public API. |
85 | mod private { |
86 | use super::*; |
87 | |
88 | /// Implementation details of `ParallelIterator for Iter<Self>` |
89 | pub trait RangeInteger: Sized + Send { |
90 | private_decl! {} |
91 | |
92 | fn drive_unindexed<C>(iter: Iter<Self>, consumer: C) -> C::Result |
93 | where |
94 | C: UnindexedConsumer<Self>; |
95 | |
96 | fn opt_len(iter: &Iter<Self>) -> Option<usize>; |
97 | } |
98 | |
99 | /// Implementation details of `IndexedParallelIterator for Iter<Self>` |
100 | pub trait IndexedRangeInteger: RangeInteger { |
101 | private_decl! {} |
102 | |
103 | fn drive<C>(iter: Iter<Self>, consumer: C) -> C::Result |
104 | where |
105 | C: Consumer<Self>; |
106 | |
107 | fn len(iter: &Iter<Self>) -> usize; |
108 | |
109 | fn with_producer<CB>(iter: Iter<Self>, callback: CB) -> CB::Output |
110 | where |
111 | CB: ProducerCallback<Self>; |
112 | } |
113 | } |
114 | use private::{IndexedRangeInteger, RangeInteger}; |
115 | |
116 | impl<T: RangeInteger> ParallelIterator for Iter<T> { |
117 | type Item = T; |
118 | |
119 | fn drive_unindexed<C>(self, consumer: C) -> C::Result |
120 | where |
121 | C: UnindexedConsumer<T>, |
122 | { |
123 | T::drive_unindexed(self, consumer) |
124 | } |
125 | |
126 | #[inline ] |
127 | fn opt_len(&self) -> Option<usize> { |
128 | T::opt_len(self) |
129 | } |
130 | } |
131 | |
132 | impl<T: IndexedRangeInteger> IndexedParallelIterator for Iter<T> { |
133 | fn drive<C>(self, consumer: C) -> C::Result |
134 | where |
135 | C: Consumer<T>, |
136 | { |
137 | T::drive(self, consumer) |
138 | } |
139 | |
140 | #[inline ] |
141 | fn len(&self) -> usize { |
142 | T::len(self) |
143 | } |
144 | |
145 | fn with_producer<CB>(self, callback: CB) -> CB::Output |
146 | where |
147 | CB: ProducerCallback<T>, |
148 | { |
149 | T::with_producer(self, callback) |
150 | } |
151 | } |
152 | |
153 | macro_rules! indexed_range_impl { |
154 | ( $t:ty ) => { |
155 | impl RangeInteger for $t { |
156 | private_impl! {} |
157 | |
158 | fn drive_unindexed<C>(iter: Iter<$t>, consumer: C) -> C::Result |
159 | where |
160 | C: UnindexedConsumer<$t>, |
161 | { |
162 | bridge(iter, consumer) |
163 | } |
164 | |
165 | fn opt_len(iter: &Iter<$t>) -> Option<usize> { |
166 | Some(iter.range.len()) |
167 | } |
168 | } |
169 | |
170 | impl IndexedRangeInteger for $t { |
171 | private_impl! {} |
172 | |
173 | fn drive<C>(iter: Iter<$t>, consumer: C) -> C::Result |
174 | where |
175 | C: Consumer<$t>, |
176 | { |
177 | bridge(iter, consumer) |
178 | } |
179 | |
180 | fn len(iter: &Iter<$t>) -> usize { |
181 | iter.range.len() |
182 | } |
183 | |
184 | fn with_producer<CB>(iter: Iter<$t>, callback: CB) -> CB::Output |
185 | where |
186 | CB: ProducerCallback<$t>, |
187 | { |
188 | callback.callback(IterProducer { range: iter.range }) |
189 | } |
190 | } |
191 | |
192 | impl Producer for IterProducer<$t> { |
193 | type Item = <Range<$t> as Iterator>::Item; |
194 | type IntoIter = Range<$t>; |
195 | fn into_iter(self) -> Self::IntoIter { |
196 | self.range |
197 | } |
198 | |
199 | fn split_at(self, index: usize) -> (Self, Self) { |
200 | assert!(index <= self.range.len()); |
201 | // For signed $t, the length and requested index could be greater than $t::MAX, and |
202 | // then `index as $t` could wrap to negative, so wrapping_add is necessary. |
203 | let mid = self.range.start.wrapping_add(index as $t); |
204 | let left = self.range.start..mid; |
205 | let right = mid..self.range.end; |
206 | (IterProducer { range: left }, IterProducer { range: right }) |
207 | } |
208 | } |
209 | }; |
210 | } |
211 | |
212 | trait UnindexedRangeLen<L> { |
213 | fn len(&self) -> L; |
214 | } |
215 | |
216 | macro_rules! unindexed_range_impl { |
217 | ( $t:ty, $len_t:ty ) => { |
218 | impl UnindexedRangeLen<$len_t> for Range<$t> { |
219 | fn len(&self) -> $len_t { |
220 | let &Range { start, end } = self; |
221 | if end > start { |
222 | end.wrapping_sub(start) as $len_t |
223 | } else { |
224 | 0 |
225 | } |
226 | } |
227 | } |
228 | |
229 | impl RangeInteger for $t { |
230 | private_impl! {} |
231 | |
232 | fn drive_unindexed<C>(iter: Iter<$t>, consumer: C) -> C::Result |
233 | where |
234 | C: UnindexedConsumer<$t>, |
235 | { |
236 | #[inline] |
237 | fn offset(start: $t) -> impl Fn(usize) -> $t { |
238 | move |i| start.wrapping_add(i as $t) |
239 | } |
240 | |
241 | if let Some(len) = iter.opt_len() { |
242 | // Drive this in indexed mode for better `collect`. |
243 | (0..len) |
244 | .into_par_iter() |
245 | .map(offset(iter.range.start)) |
246 | .drive(consumer) |
247 | } else { |
248 | bridge_unindexed(IterProducer { range: iter.range }, consumer) |
249 | } |
250 | } |
251 | |
252 | fn opt_len(iter: &Iter<$t>) -> Option<usize> { |
253 | usize::try_from(iter.range.len()).ok() |
254 | } |
255 | } |
256 | |
257 | impl UnindexedProducer for IterProducer<$t> { |
258 | type Item = $t; |
259 | |
260 | fn split(mut self) -> (Self, Option<Self>) { |
261 | let index = self.range.len() / 2; |
262 | if index > 0 { |
263 | let mid = self.range.start.wrapping_add(index as $t); |
264 | let right = mid..self.range.end; |
265 | self.range.end = mid; |
266 | (self, Some(IterProducer { range: right })) |
267 | } else { |
268 | (self, None) |
269 | } |
270 | } |
271 | |
272 | fn fold_with<F>(self, folder: F) -> F |
273 | where |
274 | F: Folder<Self::Item>, |
275 | { |
276 | folder.consume_iter(self) |
277 | } |
278 | } |
279 | }; |
280 | } |
281 | |
282 | // all Range<T> with ExactSizeIterator |
283 | indexed_range_impl! {u8} |
284 | indexed_range_impl! {u16} |
285 | indexed_range_impl! {u32} |
286 | indexed_range_impl! {usize} |
287 | indexed_range_impl! {i8} |
288 | indexed_range_impl! {i16} |
289 | indexed_range_impl! {i32} |
290 | indexed_range_impl! {isize} |
291 | |
292 | // other Range<T> with just Iterator |
293 | unindexed_range_impl! {u64, u64} |
294 | unindexed_range_impl! {i64, u64} |
295 | unindexed_range_impl! {u128, u128} |
296 | unindexed_range_impl! {i128, u128} |
297 | |
298 | // char is special because of the surrogate range hole |
299 | macro_rules! convert_char { |
300 | ( $self:ident . $method:ident ( $( $arg:expr ),* ) ) => {{ |
301 | let start = $self.range.start as u32; |
302 | let end = $self.range.end as u32; |
303 | if start < 0xD800 && 0xE000 < end { |
304 | // chain the before and after surrogate range fragments |
305 | (start..0xD800) |
306 | .into_par_iter() |
307 | .chain(0xE000..end) |
308 | .map(|codepoint| unsafe { char::from_u32_unchecked(codepoint) }) |
309 | .$method($( $arg ),*) |
310 | } else { |
311 | // no surrogate range to worry about |
312 | (start..end) |
313 | .into_par_iter() |
314 | .map(|codepoint| unsafe { char::from_u32_unchecked(codepoint) }) |
315 | .$method($( $arg ),*) |
316 | } |
317 | }}; |
318 | } |
319 | |
320 | impl ParallelIterator for Iter<char> { |
321 | type Item = char; |
322 | |
323 | fn drive_unindexed<C>(self, consumer: C) -> C::Result |
324 | where |
325 | C: UnindexedConsumer<Self::Item>, |
326 | { |
327 | convert_char!(self.drive(consumer)) |
328 | } |
329 | |
330 | fn opt_len(&self) -> Option<usize> { |
331 | Some(self.len()) |
332 | } |
333 | } |
334 | |
335 | impl IndexedParallelIterator for Iter<char> { |
336 | // Split at the surrogate range first if we're allowed to |
337 | fn drive<C>(self, consumer: C) -> C::Result |
338 | where |
339 | C: Consumer<Self::Item>, |
340 | { |
341 | convert_char!(self.drive(consumer)) |
342 | } |
343 | |
344 | fn len(&self) -> usize { |
345 | // Taken from <char as Step>::steps_between |
346 | let start = self.range.start as u32; |
347 | let end = self.range.end as u32; |
348 | if start < end { |
349 | let mut count = end - start; |
350 | if start < 0xD800 && 0xE000 <= end { |
351 | count -= 0x800 |
352 | } |
353 | count as usize |
354 | } else { |
355 | 0 |
356 | } |
357 | } |
358 | |
359 | fn with_producer<CB>(self, callback: CB) -> CB::Output |
360 | where |
361 | CB: ProducerCallback<Self::Item>, |
362 | { |
363 | convert_char!(self.with_producer(callback)) |
364 | } |
365 | } |
366 | |
367 | #[test ] |
368 | fn check_range_split_at_overflow() { |
369 | // Note, this split index overflows i8! |
370 | let producer = IterProducer { range: -100i8..100 }; |
371 | let (left, right) = producer.split_at(150); |
372 | let r1: i32 = left.range.map(i32::from).sum(); |
373 | let r2: i32 = right.range.map(i32::from).sum(); |
374 | assert_eq!(r1 + r2, -100); |
375 | } |
376 | |
377 | #[test ] |
378 | fn test_i128_len_doesnt_overflow() { |
379 | // Using parse because some versions of rust don't allow long literals |
380 | let octillion: i128 = "1000000000000000000000000000" .parse().unwrap(); |
381 | let producer = IterProducer { |
382 | range: 0..octillion, |
383 | }; |
384 | |
385 | assert_eq!(octillion as u128, producer.range.len()); |
386 | assert_eq!(octillion as u128, (0..octillion).len()); |
387 | assert_eq!(2 * octillion as u128, (-octillion..octillion).len()); |
388 | |
389 | assert_eq!(u128::MAX, (i128::MIN..i128::MAX).len()); |
390 | } |
391 | |
392 | #[test ] |
393 | fn test_u64_opt_len() { |
394 | assert_eq!(Some(100), (0..100u64).into_par_iter().opt_len()); |
395 | assert_eq!( |
396 | Some(usize::MAX), |
397 | (0..usize::MAX as u64).into_par_iter().opt_len() |
398 | ); |
399 | if (usize::MAX as u64) < u64::MAX { |
400 | assert_eq!( |
401 | None, |
402 | (0..(usize::MAX as u64).wrapping_add(1)) |
403 | .into_par_iter() |
404 | .opt_len() |
405 | ); |
406 | assert_eq!(None, (0..u64::MAX).into_par_iter().opt_len()); |
407 | } |
408 | } |
409 | |
410 | #[test ] |
411 | fn test_u128_opt_len() { |
412 | assert_eq!(Some(100), (0..100u128).into_par_iter().opt_len()); |
413 | assert_eq!( |
414 | Some(usize::MAX), |
415 | (0..usize::MAX as u128).into_par_iter().opt_len() |
416 | ); |
417 | assert_eq!(None, (0..1 + usize::MAX as u128).into_par_iter().opt_len()); |
418 | assert_eq!(None, (0..u128::MAX).into_par_iter().opt_len()); |
419 | } |
420 | |
421 | // `usize as i64` can overflow, so make sure to wrap it appropriately |
422 | // when using the `opt_len` "indexed" mode. |
423 | #[test ] |
424 | #[cfg (target_pointer_width = "64" )] |
425 | fn test_usize_i64_overflow() { |
426 | use crate::ThreadPoolBuilder; |
427 | |
428 | let iter = (-2..i64::MAX).into_par_iter(); |
429 | assert_eq!(iter.opt_len(), Some(i64::MAX as usize + 2)); |
430 | |
431 | // always run with multiple threads to split into, or this will take forever... |
432 | let pool = ThreadPoolBuilder::new().num_threads(8).build().unwrap(); |
433 | pool.install(|| assert_eq!(iter.find_last(|_| true), Some(i64::MAX - 1))); |
434 | } |
435 | |
436 | #[test ] |
437 | fn test_issue_833() { |
438 | fn is_even(n: i64) -> bool { |
439 | n % 2 == 0 |
440 | } |
441 | |
442 | // The integer type should be inferred from `is_even` |
443 | let v: Vec<_> = (1..100).into_par_iter().filter(|&x| is_even(x)).collect(); |
444 | assert!(v.into_iter().eq((2..100).step_by(2))); |
445 | |
446 | // Try examples with indexed iterators too |
447 | let pos = (0..100).into_par_iter().position_any(|x| x == 50i16); |
448 | assert_eq!(pos, Some(50usize)); |
449 | |
450 | assert!((0..100) |
451 | .into_par_iter() |
452 | .zip(0..100) |
453 | .all(|(a, b)| i16::eq(&a, &b))); |
454 | } |
455 | |