| 1 | use std::cmp::Ordering; |
| 2 | use std::fmt; |
| 3 | use std::iter::{Fuse, FusedIterator}; |
| 4 | use std::marker::PhantomData; |
| 5 | |
| 6 | use either::Either; |
| 7 | |
| 8 | use super::adaptors::{put_back, PutBack}; |
| 9 | use crate::either_or_both::EitherOrBoth; |
| 10 | use crate::size_hint::{self, SizeHint}; |
| 11 | #[cfg (doc)] |
| 12 | use crate::Itertools; |
| 13 | |
| 14 | #[derive (Clone, Debug)] |
| 15 | pub struct MergeLte; |
| 16 | |
| 17 | /// An iterator adaptor that merges the two base iterators in ascending order. |
| 18 | /// If both base iterators are sorted (ascending), the result is sorted. |
| 19 | /// |
| 20 | /// Iterator element type is `I::Item`. |
| 21 | /// |
| 22 | /// See [`.merge()`](crate::Itertools::merge_by) for more information. |
| 23 | pub type Merge<I, J> = MergeBy<I, J, MergeLte>; |
| 24 | |
| 25 | /// Create an iterator that merges elements in `i` and `j`. |
| 26 | /// |
| 27 | /// [`IntoIterator`] enabled version of [`Itertools::merge`](crate::Itertools::merge). |
| 28 | /// |
| 29 | /// ``` |
| 30 | /// use itertools::merge; |
| 31 | /// |
| 32 | /// for elt in merge(&[1, 2, 3], &[2, 3, 4]) { |
| 33 | /// /* loop body */ |
| 34 | /// } |
| 35 | /// ``` |
| 36 | pub fn merge<I, J>( |
| 37 | i: I, |
| 38 | j: J, |
| 39 | ) -> Merge<<I as IntoIterator>::IntoIter, <J as IntoIterator>::IntoIter> |
| 40 | where |
| 41 | I: IntoIterator, |
| 42 | J: IntoIterator<Item = I::Item>, |
| 43 | I::Item: PartialOrd, |
| 44 | { |
| 45 | merge_by_new(a:i, b:j, cmp:MergeLte) |
| 46 | } |
| 47 | |
| 48 | /// An iterator adaptor that merges the two base iterators in ascending order. |
| 49 | /// If both base iterators are sorted (ascending), the result is sorted. |
| 50 | /// |
| 51 | /// Iterator element type is `I::Item`. |
| 52 | /// |
| 53 | /// See [`.merge_by()`](crate::Itertools::merge_by) for more information. |
| 54 | #[must_use = "iterator adaptors are lazy and do nothing unless consumed" ] |
| 55 | pub struct MergeBy<I: Iterator, J: Iterator, F> { |
| 56 | left: PutBack<Fuse<I>>, |
| 57 | right: PutBack<Fuse<J>>, |
| 58 | cmp_fn: F, |
| 59 | } |
| 60 | |
| 61 | /// Create a `MergeBy` iterator. |
| 62 | pub fn merge_by_new<I, J, F>(a: I, b: J, cmp: F) -> MergeBy<I::IntoIter, J::IntoIter, F> |
| 63 | where |
| 64 | I: IntoIterator, |
| 65 | J: IntoIterator<Item = I::Item>, |
| 66 | { |
| 67 | MergeBy { |
| 68 | left: put_back(iterable:a.into_iter().fuse()), |
| 69 | right: put_back(iterable:b.into_iter().fuse()), |
| 70 | cmp_fn: cmp, |
| 71 | } |
| 72 | } |
| 73 | |
| 74 | /// Return an iterator adaptor that merge-joins items from the two base iterators in ascending order. |
| 75 | /// |
| 76 | /// [`IntoIterator`] enabled version of [`Itertools::merge_join_by`]. |
| 77 | pub fn merge_join_by<I, J, F, T>( |
| 78 | left: I, |
| 79 | right: J, |
| 80 | cmp_fn: F, |
| 81 | ) -> MergeJoinBy<I::IntoIter, J::IntoIter, F> |
| 82 | where |
| 83 | I: IntoIterator, |
| 84 | J: IntoIterator, |
| 85 | F: FnMut(&I::Item, &J::Item) -> T, |
| 86 | { |
| 87 | MergeBy { |
| 88 | left: put_back(iterable:left.into_iter().fuse()), |
| 89 | right: put_back(iterable:right.into_iter().fuse()), |
| 90 | cmp_fn: MergeFuncLR(cmp_fn, PhantomData), |
| 91 | } |
| 92 | } |
| 93 | |
| 94 | /// An iterator adaptor that merge-joins items from the two base iterators in ascending order. |
| 95 | /// |
| 96 | /// See [`.merge_join_by()`](crate::Itertools::merge_join_by) for more information. |
| 97 | pub type MergeJoinBy<I, J, F> = |
| 98 | MergeBy<I, J, MergeFuncLR<F, <F as FuncLR<<I as Iterator>::Item, <J as Iterator>::Item>>::T>>; |
| 99 | |
| 100 | #[derive (Clone, Debug)] |
| 101 | pub struct MergeFuncLR<F, T>(F, PhantomData<T>); |
| 102 | |
| 103 | pub trait FuncLR<L, R> { |
| 104 | type T; |
| 105 | } |
| 106 | |
| 107 | impl<L, R, T, F: FnMut(&L, &R) -> T> FuncLR<L, R> for F { |
| 108 | type T = T; |
| 109 | } |
| 110 | |
| 111 | pub trait OrderingOrBool<L, R> { |
| 112 | type MergeResult; |
| 113 | fn left(left: L) -> Self::MergeResult; |
| 114 | fn right(right: R) -> Self::MergeResult; |
| 115 | // "merge" never returns (Some(...), Some(...), ...) so Option<Either<I::Item, J::Item>> |
| 116 | // is appealing but it is always followed by two put_backs, so we think the compiler is |
| 117 | // smart enough to optimize it. Or we could move put_backs into "merge". |
| 118 | fn merge(&mut self, left: L, right: R) -> (Option<L>, Option<R>, Self::MergeResult); |
| 119 | fn size_hint(left: SizeHint, right: SizeHint) -> SizeHint; |
| 120 | } |
| 121 | |
| 122 | impl<L, R, F: FnMut(&L, &R) -> Ordering> OrderingOrBool<L, R> for MergeFuncLR<F, Ordering> { |
| 123 | type MergeResult = EitherOrBoth<L, R>; |
| 124 | fn left(left: L) -> Self::MergeResult { |
| 125 | EitherOrBoth::Left(left) |
| 126 | } |
| 127 | fn right(right: R) -> Self::MergeResult { |
| 128 | EitherOrBoth::Right(right) |
| 129 | } |
| 130 | fn merge(&mut self, left: L, right: R) -> (Option<L>, Option<R>, Self::MergeResult) { |
| 131 | match self.0(&left, &right) { |
| 132 | Ordering::Equal => (None, None, EitherOrBoth::Both(left, right)), |
| 133 | Ordering::Less => (None, Some(right), EitherOrBoth::Left(left)), |
| 134 | Ordering::Greater => (Some(left), None, EitherOrBoth::Right(right)), |
| 135 | } |
| 136 | } |
| 137 | fn size_hint(left: SizeHint, right: SizeHint) -> SizeHint { |
| 138 | let (a_lower, a_upper) = left; |
| 139 | let (b_lower, b_upper) = right; |
| 140 | let lower = ::std::cmp::max(a_lower, b_lower); |
| 141 | let upper = match (a_upper, b_upper) { |
| 142 | (Some(x), Some(y)) => x.checked_add(y), |
| 143 | _ => None, |
| 144 | }; |
| 145 | (lower, upper) |
| 146 | } |
| 147 | } |
| 148 | |
| 149 | impl<L, R, F: FnMut(&L, &R) -> bool> OrderingOrBool<L, R> for MergeFuncLR<F, bool> { |
| 150 | type MergeResult = Either<L, R>; |
| 151 | fn left(left: L) -> Self::MergeResult { |
| 152 | Either::Left(left) |
| 153 | } |
| 154 | fn right(right: R) -> Self::MergeResult { |
| 155 | Either::Right(right) |
| 156 | } |
| 157 | fn merge(&mut self, left: L, right: R) -> (Option<L>, Option<R>, Self::MergeResult) { |
| 158 | if self.0(&left, &right) { |
| 159 | (None, Some(right), Either::Left(left)) |
| 160 | } else { |
| 161 | (Some(left), None, Either::Right(right)) |
| 162 | } |
| 163 | } |
| 164 | fn size_hint(left: SizeHint, right: SizeHint) -> SizeHint { |
| 165 | // Not ExactSizeIterator because size may be larger than usize |
| 166 | size_hint::add(a:left, b:right) |
| 167 | } |
| 168 | } |
| 169 | |
| 170 | impl<T, F: FnMut(&T, &T) -> bool> OrderingOrBool<T, T> for F { |
| 171 | type MergeResult = T; |
| 172 | fn left(left: T) -> Self::MergeResult { |
| 173 | left |
| 174 | } |
| 175 | fn right(right: T) -> Self::MergeResult { |
| 176 | right |
| 177 | } |
| 178 | fn merge(&mut self, left: T, right: T) -> (Option<T>, Option<T>, Self::MergeResult) { |
| 179 | if self(&left, &right) { |
| 180 | (None, Some(right), left) |
| 181 | } else { |
| 182 | (Some(left), None, right) |
| 183 | } |
| 184 | } |
| 185 | fn size_hint(left: SizeHint, right: SizeHint) -> SizeHint { |
| 186 | // Not ExactSizeIterator because size may be larger than usize |
| 187 | size_hint::add(a:left, b:right) |
| 188 | } |
| 189 | } |
| 190 | |
| 191 | impl<T: PartialOrd> OrderingOrBool<T, T> for MergeLte { |
| 192 | type MergeResult = T; |
| 193 | fn left(left: T) -> Self::MergeResult { |
| 194 | left |
| 195 | } |
| 196 | fn right(right: T) -> Self::MergeResult { |
| 197 | right |
| 198 | } |
| 199 | fn merge(&mut self, left: T, right: T) -> (Option<T>, Option<T>, Self::MergeResult) { |
| 200 | if left <= right { |
| 201 | (None, Some(right), left) |
| 202 | } else { |
| 203 | (Some(left), None, right) |
| 204 | } |
| 205 | } |
| 206 | fn size_hint(left: SizeHint, right: SizeHint) -> SizeHint { |
| 207 | // Not ExactSizeIterator because size may be larger than usize |
| 208 | size_hint::add(a:left, b:right) |
| 209 | } |
| 210 | } |
| 211 | |
| 212 | impl<I, J, F> Clone for MergeBy<I, J, F> |
| 213 | where |
| 214 | I: Iterator, |
| 215 | J: Iterator, |
| 216 | PutBack<Fuse<I>>: Clone, |
| 217 | PutBack<Fuse<J>>: Clone, |
| 218 | F: Clone, |
| 219 | { |
| 220 | clone_fields!(left, right, cmp_fn); |
| 221 | } |
| 222 | |
| 223 | impl<I, J, F> fmt::Debug for MergeBy<I, J, F> |
| 224 | where |
| 225 | I: Iterator + fmt::Debug, |
| 226 | I::Item: fmt::Debug, |
| 227 | J: Iterator + fmt::Debug, |
| 228 | J::Item: fmt::Debug, |
| 229 | { |
| 230 | debug_fmt_fields!(MergeBy, left, right); |
| 231 | } |
| 232 | |
| 233 | impl<I, J, F> Iterator for MergeBy<I, J, F> |
| 234 | where |
| 235 | I: Iterator, |
| 236 | J: Iterator, |
| 237 | F: OrderingOrBool<I::Item, J::Item>, |
| 238 | { |
| 239 | type Item = F::MergeResult; |
| 240 | |
| 241 | fn next(&mut self) -> Option<Self::Item> { |
| 242 | match (self.left.next(), self.right.next()) { |
| 243 | (None, None) => None, |
| 244 | (Some(left), None) => Some(F::left(left)), |
| 245 | (None, Some(right)) => Some(F::right(right)), |
| 246 | (Some(left), Some(right)) => { |
| 247 | let (left, right, next) = self.cmp_fn.merge(left, right); |
| 248 | if let Some(left) = left { |
| 249 | self.left.put_back(left); |
| 250 | } |
| 251 | if let Some(right) = right { |
| 252 | self.right.put_back(right); |
| 253 | } |
| 254 | Some(next) |
| 255 | } |
| 256 | } |
| 257 | } |
| 258 | |
| 259 | fn size_hint(&self) -> SizeHint { |
| 260 | F::size_hint(self.left.size_hint(), self.right.size_hint()) |
| 261 | } |
| 262 | |
| 263 | fn count(mut self) -> usize { |
| 264 | let mut count = 0; |
| 265 | loop { |
| 266 | match (self.left.next(), self.right.next()) { |
| 267 | (None, None) => break count, |
| 268 | (Some(_left), None) => break count + 1 + self.left.into_parts().1.count(), |
| 269 | (None, Some(_right)) => break count + 1 + self.right.into_parts().1.count(), |
| 270 | (Some(left), Some(right)) => { |
| 271 | count += 1; |
| 272 | let (left, right, _) = self.cmp_fn.merge(left, right); |
| 273 | if let Some(left) = left { |
| 274 | self.left.put_back(left); |
| 275 | } |
| 276 | if let Some(right) = right { |
| 277 | self.right.put_back(right); |
| 278 | } |
| 279 | } |
| 280 | } |
| 281 | } |
| 282 | } |
| 283 | |
| 284 | fn last(mut self) -> Option<Self::Item> { |
| 285 | let mut previous_element = None; |
| 286 | loop { |
| 287 | match (self.left.next(), self.right.next()) { |
| 288 | (None, None) => break previous_element, |
| 289 | (Some(left), None) => { |
| 290 | break Some(F::left(self.left.into_parts().1.last().unwrap_or(left))) |
| 291 | } |
| 292 | (None, Some(right)) => { |
| 293 | break Some(F::right(self.right.into_parts().1.last().unwrap_or(right))) |
| 294 | } |
| 295 | (Some(left), Some(right)) => { |
| 296 | let (left, right, elem) = self.cmp_fn.merge(left, right); |
| 297 | if let Some(left) = left { |
| 298 | self.left.put_back(left); |
| 299 | } |
| 300 | if let Some(right) = right { |
| 301 | self.right.put_back(right); |
| 302 | } |
| 303 | previous_element = Some(elem); |
| 304 | } |
| 305 | } |
| 306 | } |
| 307 | } |
| 308 | |
| 309 | fn nth(&mut self, mut n: usize) -> Option<Self::Item> { |
| 310 | loop { |
| 311 | if n == 0 { |
| 312 | break self.next(); |
| 313 | } |
| 314 | n -= 1; |
| 315 | match (self.left.next(), self.right.next()) { |
| 316 | (None, None) => break None, |
| 317 | (Some(_left), None) => break self.left.nth(n).map(F::left), |
| 318 | (None, Some(_right)) => break self.right.nth(n).map(F::right), |
| 319 | (Some(left), Some(right)) => { |
| 320 | let (left, right, _) = self.cmp_fn.merge(left, right); |
| 321 | if let Some(left) = left { |
| 322 | self.left.put_back(left); |
| 323 | } |
| 324 | if let Some(right) = right { |
| 325 | self.right.put_back(right); |
| 326 | } |
| 327 | } |
| 328 | } |
| 329 | } |
| 330 | } |
| 331 | } |
| 332 | |
| 333 | impl<I, J, F> FusedIterator for MergeBy<I, J, F> |
| 334 | where |
| 335 | I: Iterator, |
| 336 | J: Iterator, |
| 337 | F: OrderingOrBool<I::Item, J::Item>, |
| 338 | { |
| 339 | } |
| 340 | |