1 | //! This module contains logic for performing a merge of two sorted sub-slices. |
2 | |
3 | use crate::mem::MaybeUninit; |
4 | use crate::{cmp, ptr}; |
5 | |
6 | /// Merges non-decreasing runs `v[..mid]` and `v[mid..]` using `scratch` as |
7 | /// temporary storage, and stores the result into `v[..]`. |
8 | pub fn merge<T, F: FnMut(&T, &T) -> bool>( |
9 | v: &mut [T], |
10 | scratch: &mut [MaybeUninit<T>], |
11 | mid: usize, |
12 | is_less: &mut F, |
13 | ) { |
14 | let len = v.len(); |
15 | |
16 | if mid == 0 || mid >= len || scratch.len() < cmp::min(mid, len - mid) { |
17 | return; |
18 | } |
19 | |
20 | // SAFETY: We checked that the two slices are non-empty and `mid` is in-bounds. |
21 | // We checked that the buffer `scratch` has enough capacity to hold a copy of |
22 | // the shorter slice. `merge_up` and `merge_down` are written in such a way that |
23 | // they uphold the contract described in `MergeState::drop`. |
24 | unsafe { |
25 | // The merge process first copies the shorter run into `buf`. Then it traces |
26 | // the newly copied run and the longer run forwards (or backwards), comparing |
27 | // their next unconsumed elements and copying the lesser (or greater) one into `v`. |
28 | // |
29 | // As soon as the shorter run is fully consumed, the process is done. If the |
30 | // longer run gets consumed first, then we must copy whatever is left of the |
31 | // shorter run into the remaining gap in `v`. |
32 | // |
33 | // Intermediate state of the process is always tracked by `gap`, which serves |
34 | // two purposes: |
35 | // 1. Protects integrity of `v` from panics in `is_less`. |
36 | // 2. Fills the remaining gap in `v` if the longer run gets consumed first. |
37 | |
38 | let buf = MaybeUninit::slice_as_mut_ptr(scratch); |
39 | |
40 | let v_base = v.as_mut_ptr(); |
41 | let v_mid = v_base.add(mid); |
42 | let v_end = v_base.add(len); |
43 | |
44 | let left_len = mid; |
45 | let right_len = len - mid; |
46 | |
47 | let left_is_shorter = left_len <= right_len; |
48 | let save_base = if left_is_shorter { v_base } else { v_mid }; |
49 | let save_len = if left_is_shorter { left_len } else { right_len }; |
50 | |
51 | ptr::copy_nonoverlapping(save_base, buf, save_len); |
52 | |
53 | let mut merge_state = MergeState { start: buf, end: buf.add(save_len), dst: save_base }; |
54 | |
55 | if left_is_shorter { |
56 | merge_state.merge_up(v_mid, v_end, is_less); |
57 | } else { |
58 | merge_state.merge_down(v_base, buf, v_end, is_less); |
59 | } |
60 | // Finally, `merge_state` gets dropped. If the shorter run was not fully |
61 | // consumed, whatever remains of it will now be copied into the hole in `v`. |
62 | } |
63 | } |
64 | |
65 | // When dropped, copies the range `start..end` into `dst..`. |
66 | struct MergeState<T> { |
67 | start: *mut T, |
68 | end: *mut T, |
69 | dst: *mut T, |
70 | } |
71 | |
72 | impl<T> MergeState<T> { |
73 | /// # Safety |
74 | /// The caller MUST guarantee that `self` is initialized in a way where `start -> end` is |
75 | /// the longer sub-slice and so that `dst` can be written to at least the shorter sub-slice |
76 | /// length times. In addition `start -> end` and `right -> right_end` MUST be valid to be |
77 | /// read. This function MUST only be called once. |
78 | unsafe fn merge_up<F: FnMut(&T, &T) -> bool>( |
79 | &mut self, |
80 | mut right: *const T, |
81 | right_end: *const T, |
82 | is_less: &mut F, |
83 | ) { |
84 | // SAFETY: See function safety comment. |
85 | unsafe { |
86 | let left = &mut self.start; |
87 | let out = &mut self.dst; |
88 | |
89 | while *left != self.end && right as *const T != right_end { |
90 | let consume_left = !is_less(&*right, &**left); |
91 | |
92 | let src = if consume_left { *left } else { right }; |
93 | ptr::copy_nonoverlapping(src, *out, 1); |
94 | |
95 | *left = left.add(consume_left as usize); |
96 | right = right.add(!consume_left as usize); |
97 | |
98 | *out = out.add(1); |
99 | } |
100 | } |
101 | } |
102 | |
103 | /// # Safety |
104 | /// The caller MUST guarantee that `self` is initialized in a way where `left_end <- dst` is |
105 | /// the shorter sub-slice and so that `out` can be written to at least the shorter sub-slice |
106 | /// length times. In addition `left_end <- dst` and `right_end <- end` MUST be valid to be |
107 | /// read. This function MUST only be called once. |
108 | unsafe fn merge_down<F: FnMut(&T, &T) -> bool>( |
109 | &mut self, |
110 | left_end: *const T, |
111 | right_end: *const T, |
112 | mut out: *mut T, |
113 | is_less: &mut F, |
114 | ) { |
115 | // SAFETY: See function safety comment. |
116 | unsafe { |
117 | loop { |
118 | let left = self.dst.sub(1); |
119 | let right = self.end.sub(1); |
120 | out = out.sub(1); |
121 | |
122 | let consume_left = is_less(&*right, &*left); |
123 | |
124 | let src = if consume_left { left } else { right }; |
125 | ptr::copy_nonoverlapping(src, out, 1); |
126 | |
127 | self.dst = left.add(!consume_left as usize); |
128 | self.end = right.add(consume_left as usize); |
129 | |
130 | if self.dst as *const T == left_end || self.end as *const T == right_end { |
131 | break; |
132 | } |
133 | } |
134 | } |
135 | } |
136 | } |
137 | |
138 | impl<T> Drop for MergeState<T> { |
139 | fn drop(&mut self) { |
140 | // SAFETY: The user of MergeState MUST ensure, that at any point this drop |
141 | // impl MAY run, for example when the user provided `is_less` panics, that |
142 | // copying the contiguous region between `start` and `end` to `dst` will |
143 | // leave the input slice `v` with each original element and all possible |
144 | // modifications observed. |
145 | unsafe { |
146 | let len: usize = self.end.offset_from_unsigned(self.start); |
147 | ptr::copy_nonoverlapping(self.start, self.dst, count:len); |
148 | } |
149 | } |
150 | } |
151 | |