| 1 | use crate::size_hint; | 
| 2 | use crate::Itertools; | 
|---|
| 3 |  | 
|---|
| 4 | use alloc::vec::Vec; | 
|---|
| 5 | use std::fmt; | 
|---|
| 6 | use std::iter::FusedIterator; | 
|---|
| 7 | use std::mem::replace; | 
|---|
| 8 |  | 
|---|
| 9 | /// Head element and Tail iterator pair | 
|---|
| 10 | /// | 
|---|
| 11 | /// `PartialEq`, `Eq`, `PartialOrd` and `Ord` are implemented by comparing sequences based on | 
|---|
| 12 | /// first items (which are guaranteed to exist). | 
|---|
| 13 | /// | 
|---|
| 14 | /// The meanings of `PartialOrd` and `Ord` are reversed so as to turn the heap used in | 
|---|
| 15 | /// `KMerge` into a min-heap. | 
|---|
| 16 | #[ derive(Debug)] | 
|---|
| 17 | struct HeadTail<I> | 
|---|
| 18 | where | 
|---|
| 19 | I: Iterator, | 
|---|
| 20 | { | 
|---|
| 21 | head: I::Item, | 
|---|
| 22 | tail: I, | 
|---|
| 23 | } | 
|---|
| 24 |  | 
|---|
| 25 | impl<I> HeadTail<I> | 
|---|
| 26 | where | 
|---|
| 27 | I: Iterator, | 
|---|
| 28 | { | 
|---|
| 29 | /// Constructs a `HeadTail` from an `Iterator`. Returns `None` if the `Iterator` is empty. | 
|---|
| 30 | fn new(mut it: I) -> Option<Self> { | 
|---|
| 31 | let head: Option<::Item> = it.next(); | 
|---|
| 32 | head.map(|h: ::Item| Self { head: h, tail: it }) | 
|---|
| 33 | } | 
|---|
| 34 |  | 
|---|
| 35 | /// Get the next element and update `head`, returning the old head in `Some`. | 
|---|
| 36 | /// | 
|---|
| 37 | /// Returns `None` when the tail is exhausted (only `head` then remains). | 
|---|
| 38 | fn next(&mut self) -> Option<I::Item> { | 
|---|
| 39 | if let Some(next: ::Item) = self.tail.next() { | 
|---|
| 40 | Some(replace(&mut self.head, src:next)) | 
|---|
| 41 | } else { | 
|---|
| 42 | None | 
|---|
| 43 | } | 
|---|
| 44 | } | 
|---|
| 45 |  | 
|---|
| 46 | /// Hints at the size of the sequence, same as the `Iterator` method. | 
|---|
| 47 | fn size_hint(&self) -> (usize, Option<usize>) { | 
|---|
| 48 | size_hint::add_scalar(self.tail.size_hint(), x:1) | 
|---|
| 49 | } | 
|---|
| 50 | } | 
|---|
| 51 |  | 
|---|
| 52 | impl<I> Clone for HeadTail<I> | 
|---|
| 53 | where | 
|---|
| 54 | I: Iterator + Clone, | 
|---|
| 55 | I::Item: Clone, | 
|---|
| 56 | { | 
|---|
| 57 | clone_fields!(head, tail); | 
|---|
| 58 | } | 
|---|
| 59 |  | 
|---|
| 60 | /// Make `data` a heap (min-heap w.r.t the sorting). | 
|---|
| 61 | fn heapify<T, S>(data: &mut [T], mut less_than: S) | 
|---|
| 62 | where | 
|---|
| 63 | S: FnMut(&T, &T) -> bool, | 
|---|
| 64 | { | 
|---|
| 65 | for i: usize in (0..data.len() / 2).rev() { | 
|---|
| 66 | sift_down(heap:data, index:i, &mut less_than); | 
|---|
| 67 | } | 
|---|
| 68 | } | 
|---|
| 69 |  | 
|---|
| 70 | /// Sift down element at `index` (`heap` is a min-heap wrt the ordering) | 
|---|
| 71 | fn sift_down<T, S>(heap: &mut [T], index: usize, mut less_than: S) | 
|---|
| 72 | where | 
|---|
| 73 | S: FnMut(&T, &T) -> bool, | 
|---|
| 74 | { | 
|---|
| 75 | debug_assert!(index <= heap.len()); | 
|---|
| 76 | let mut pos = index; | 
|---|
| 77 | let mut child = 2 * pos + 1; | 
|---|
| 78 | // Require the right child to be present | 
|---|
| 79 | // This allows to find the index of the smallest child without a branch | 
|---|
| 80 | // that wouldn't be predicted if present | 
|---|
| 81 | while child + 1 < heap.len() { | 
|---|
| 82 | // pick the smaller of the two children | 
|---|
| 83 | // use arithmetic to avoid an unpredictable branch | 
|---|
| 84 | child += less_than(&heap[child + 1], &heap[child]) as usize; | 
|---|
| 85 |  | 
|---|
| 86 | // sift down is done if we are already in order | 
|---|
| 87 | if !less_than(&heap[child], &heap[pos]) { | 
|---|
| 88 | return; | 
|---|
| 89 | } | 
|---|
| 90 | heap.swap(pos, child); | 
|---|
| 91 | pos = child; | 
|---|
| 92 | child = 2 * pos + 1; | 
|---|
| 93 | } | 
|---|
| 94 | // Check if the last (left) child was an only child | 
|---|
| 95 | // if it is then it has to be compared with the parent | 
|---|
| 96 | if child + 1 == heap.len() && less_than(&heap[child], &heap[pos]) { | 
|---|
| 97 | heap.swap(pos, child); | 
|---|
| 98 | } | 
|---|
| 99 | } | 
|---|
| 100 |  | 
|---|
| 101 | /// An iterator adaptor that merges an abitrary number of base iterators in ascending order. | 
|---|
| 102 | /// If all base iterators are sorted (ascending), the result is sorted. | 
|---|
| 103 | /// | 
|---|
| 104 | /// Iterator element type is `I::Item`. | 
|---|
| 105 | /// | 
|---|
| 106 | /// See [`.kmerge()`](crate::Itertools::kmerge) for more information. | 
|---|
| 107 | pub type KMerge<I> = KMergeBy<I, KMergeByLt>; | 
|---|
| 108 |  | 
|---|
| 109 | pub trait KMergePredicate<T> { | 
|---|
| 110 | fn kmerge_pred(&mut self, a: &T, b: &T) -> bool; | 
|---|
| 111 | } | 
|---|
| 112 |  | 
|---|
| 113 | #[ derive(Clone, Debug)] | 
|---|
| 114 | pub struct KMergeByLt; | 
|---|
| 115 |  | 
|---|
| 116 | impl<T: PartialOrd> KMergePredicate<T> for KMergeByLt { | 
|---|
| 117 | fn kmerge_pred(&mut self, a: &T, b: &T) -> bool { | 
|---|
| 118 | a < b | 
|---|
| 119 | } | 
|---|
| 120 | } | 
|---|
| 121 |  | 
|---|
| 122 | impl<T, F: FnMut(&T, &T) -> bool> KMergePredicate<T> for F { | 
|---|
| 123 | fn kmerge_pred(&mut self, a: &T, b: &T) -> bool { | 
|---|
| 124 | self(a, b) | 
|---|
| 125 | } | 
|---|
| 126 | } | 
|---|
| 127 |  | 
|---|
| 128 | /// Create an iterator that merges elements of the contained iterators using | 
|---|
| 129 | /// the ordering function. | 
|---|
| 130 | /// | 
|---|
| 131 | /// [`IntoIterator`] enabled version of [`Itertools::kmerge`]. | 
|---|
| 132 | /// | 
|---|
| 133 | /// ``` | 
|---|
| 134 | /// use itertools::kmerge; | 
|---|
| 135 | /// | 
|---|
| 136 | /// for elt in kmerge(vec![vec![0, 2, 4], vec![1, 3, 5], vec![6, 7]]) { | 
|---|
| 137 | ///     /* loop body */ | 
|---|
| 138 | /// } | 
|---|
| 139 | /// ``` | 
|---|
| 140 | pub fn kmerge<I>(iterable: I) -> KMerge<<I::Item as IntoIterator>::IntoIter> | 
|---|
| 141 | where | 
|---|
| 142 | I: IntoIterator, | 
|---|
| 143 | I::Item: IntoIterator, | 
|---|
| 144 | <<I as IntoIterator>::Item as IntoIterator>::Item: PartialOrd, | 
|---|
| 145 | { | 
|---|
| 146 | kmerge_by(iterable, less_than:KMergeByLt) | 
|---|
| 147 | } | 
|---|
| 148 |  | 
|---|
| 149 | /// An iterator adaptor that merges an abitrary number of base iterators | 
|---|
| 150 | /// according to an ordering function. | 
|---|
| 151 | /// | 
|---|
| 152 | /// Iterator element type is `I::Item`. | 
|---|
| 153 | /// | 
|---|
| 154 | /// See [`.kmerge_by()`](crate::Itertools::kmerge_by) for more | 
|---|
| 155 | /// information. | 
|---|
| 156 | #[ must_use= "iterator adaptors are lazy and do nothing unless consumed"] | 
|---|
| 157 | pub struct KMergeBy<I, F> | 
|---|
| 158 | where | 
|---|
| 159 | I: Iterator, | 
|---|
| 160 | { | 
|---|
| 161 | heap: Vec<HeadTail<I>>, | 
|---|
| 162 | less_than: F, | 
|---|
| 163 | } | 
|---|
| 164 |  | 
|---|
| 165 | impl<I, F> fmt::Debug for KMergeBy<I, F> | 
|---|
| 166 | where | 
|---|
| 167 | I: Iterator + fmt::Debug, | 
|---|
| 168 | I::Item: fmt::Debug, | 
|---|
| 169 | { | 
|---|
| 170 | debug_fmt_fields!(KMergeBy, heap); | 
|---|
| 171 | } | 
|---|
| 172 |  | 
|---|
| 173 | /// Create an iterator that merges elements of the contained iterators. | 
|---|
| 174 | /// | 
|---|
| 175 | /// [`IntoIterator`] enabled version of [`Itertools::kmerge_by`]. | 
|---|
| 176 | pub fn kmerge_by<I, F>( | 
|---|
| 177 | iterable: I, | 
|---|
| 178 | mut less_than: F, | 
|---|
| 179 | ) -> KMergeBy<<I::Item as IntoIterator>::IntoIter, F> | 
|---|
| 180 | where | 
|---|
| 181 | I: IntoIterator, | 
|---|
| 182 | I::Item: IntoIterator, | 
|---|
| 183 | F: KMergePredicate<<<I as IntoIterator>::Item as IntoIterator>::Item>, | 
|---|
| 184 | { | 
|---|
| 185 | let iter: impl IntoIterator = iterable.into_iter(); | 
|---|
| 186 | let (lower: usize, _) = iter.size_hint(); | 
|---|
| 187 | let mut heap: Vec<_> = Vec::with_capacity(lower); | 
|---|
| 188 | heap.extend(iter.filter_map(|it| HeadTail::new(it.into_iter()))); | 
|---|
| 189 | heapify(&mut heap, |a: &HeadTail<{unknown}>, b: &HeadTail<{unknown}>| less_than.kmerge_pred(&a.head, &b.head)); | 
|---|
| 190 | KMergeBy { heap, less_than } | 
|---|
| 191 | } | 
|---|
| 192 |  | 
|---|
| 193 | impl<I, F> Clone for KMergeBy<I, F> | 
|---|
| 194 | where | 
|---|
| 195 | I: Iterator + Clone, | 
|---|
| 196 | I::Item: Clone, | 
|---|
| 197 | F: Clone, | 
|---|
| 198 | { | 
|---|
| 199 | clone_fields!(heap, less_than); | 
|---|
| 200 | } | 
|---|
| 201 |  | 
|---|
| 202 | impl<I, F> Iterator for KMergeBy<I, F> | 
|---|
| 203 | where | 
|---|
| 204 | I: Iterator, | 
|---|
| 205 | F: KMergePredicate<I::Item>, | 
|---|
| 206 | { | 
|---|
| 207 | type Item = I::Item; | 
|---|
| 208 |  | 
|---|
| 209 | fn next(&mut self) -> Option<Self::Item> { | 
|---|
| 210 | if self.heap.is_empty() { | 
|---|
| 211 | return None; | 
|---|
| 212 | } | 
|---|
| 213 | let result = if let Some(next) = self.heap[0].next() { | 
|---|
| 214 | next | 
|---|
| 215 | } else { | 
|---|
| 216 | self.heap.swap_remove(0).head | 
|---|
| 217 | }; | 
|---|
| 218 | let less_than = &mut self.less_than; | 
|---|
| 219 | sift_down(&mut self.heap, 0, |a, b| { | 
|---|
| 220 | less_than.kmerge_pred(&a.head, &b.head) | 
|---|
| 221 | }); | 
|---|
| 222 | Some(result) | 
|---|
| 223 | } | 
|---|
| 224 |  | 
|---|
| 225 | fn size_hint(&self) -> (usize, Option<usize>) { | 
|---|
| 226 | #[ allow(deprecated)] //TODO: once msrv hits 1.51. replace `fold1` with `reduce` | 
|---|
| 227 | self.heap | 
|---|
| 228 | .iter() | 
|---|
| 229 | .map(|i| i.size_hint()) | 
|---|
| 230 | .fold1(size_hint::add) | 
|---|
| 231 | .unwrap_or((0, Some(0))) | 
|---|
| 232 | } | 
|---|
| 233 | } | 
|---|
| 234 |  | 
|---|
| 235 | impl<I, F> FusedIterator for KMergeBy<I, F> | 
|---|
| 236 | where | 
|---|
| 237 | I: Iterator, | 
|---|
| 238 | F: KMergePredicate<I::Item>, | 
|---|
| 239 | { | 
|---|
| 240 | } | 
|---|
| 241 |  | 
|---|