Skip to content

Commit cd3d6e8

Browse files
committed
Shrink heapsort further by combining sift_down loops
1 parent bea61da commit cd3d6e8

File tree

3 files changed

+22
-26
lines changed

3 files changed

+22
-26
lines changed

core/src/slice/sort/unstable/heapsort.rs

+18-18
Original file line numberDiff line numberDiff line change
@@ -1,46 +1,46 @@
11
//! This module contains a branchless heapsort as fallback for unstable quicksort.
22
3-
use crate::{intrinsics, ptr};
3+
use crate::{cmp, intrinsics, ptr};
44

55
/// Sorts `v` using heapsort, which guarantees *O*(*n* \* log(*n*)) worst-case.
66
///
77
/// Never inline this, it sits the main hot-loop in `recurse` and is meant as unlikely algorithmic
88
/// fallback.
9-
///
10-
/// SAFETY: The caller has to guarantee that `v.len()` >= 2.
119
#[inline(never)]
12-
pub(crate) unsafe fn heapsort<T, F>(v: &mut [T], is_less: &mut F)
10+
pub(crate) fn heapsort<T, F>(v: &mut [T], is_less: &mut F)
1311
where
1412
F: FnMut(&T, &T) -> bool,
1513
{
16-
// SAFETY: See function safety.
17-
unsafe {
18-
intrinsics::assume(v.len() >= 2);
19-
20-
// Build the heap in linear time.
21-
for i in (0..v.len() / 2).rev() {
22-
sift_down(v, i, is_less);
23-
}
14+
let len = v.len();
2415

25-
// Pop maximal elements from the heap.
26-
for i in (1..v.len()).rev() {
16+
for i in (0..len + len / 2).rev() {
17+
let sift_idx = if i >= len {
18+
i - len
19+
} else {
2720
v.swap(0, i);
28-
sift_down(&mut v[..i], 0, is_less);
21+
0
22+
};
23+
24+
// SAFETY: The above calculation ensures that `sift_idx` is either 0 or
25+
// `(len..(len + (len / 2))) - len`, which simplifies to `0..(len / 2)`.
26+
// This guarantees the required `sift_idx <= len`.
27+
unsafe {
28+
sift_down(&mut v[..cmp::min(i, len)], sift_idx, is_less);
2929
}
3030
}
3131
}
3232

3333
// This binary heap respects the invariant `parent >= child`.
3434
//
35-
// SAFETY: The caller has to guarantee that node < `v.len()`.
36-
#[inline(never)]
35+
// SAFETY: The caller has to guarantee that `node <= v.len()`.
36+
#[inline(always)]
3737
unsafe fn sift_down<T, F>(v: &mut [T], mut node: usize, is_less: &mut F)
3838
where
3939
F: FnMut(&T, &T) -> bool,
4040
{
4141
// SAFETY: See function safety.
4242
unsafe {
43-
intrinsics::assume(node < v.len());
43+
intrinsics::assume(node <= v.len());
4444
}
4545

4646
let len = v.len();

core/src/slice/sort/unstable/mod.rs

+1-4
Original file line numberDiff line numberDiff line change
@@ -32,10 +32,7 @@ pub fn sort<T, F: FnMut(&T, &T) -> bool>(v: &mut [T], is_less: &mut F) {
3232

3333
cfg_if! {
3434
if #[cfg(feature = "optimize_for_size")] {
35-
// SAFETY: We checked that `len >= 2`.
36-
unsafe {
37-
heapsort::heapsort(v, is_less);
38-
}
35+
heapsort::heapsort(v, is_less);
3936
} else {
4037
// More advanced sorting methods than insertion sort are faster if called in
4138
// a hot loop for small inputs, but for general-purpose code the small

core/src/slice/sort/unstable/quicksort.rs

+3-4
Original file line numberDiff line numberDiff line change
@@ -5,6 +5,8 @@ use crate::mem::{self, ManuallyDrop};
55
use crate::slice::sort::shared::pivot::choose_pivot;
66
#[cfg(not(feature = "optimize_for_size"))]
77
use crate::slice::sort::shared::smallsort::UnstableSmallSortTypeImpl;
8+
#[cfg(not(feature = "optimize_for_size"))]
9+
use crate::slice::sort::unstable::heapsort;
810
use crate::{intrinsics, ptr};
911

1012
/// Sorts `v` recursively.
@@ -31,10 +33,7 @@ pub(crate) fn quicksort<'a, T, F>(
3133
// If too many bad pivot choices were made, simply fall back to heapsort in order to
3234
// guarantee `O(N x log(N))` worst-case.
3335
if limit == 0 {
34-
// SAFETY: We assume the `small_sort` threshold is at least 1.
35-
unsafe {
36-
crate::slice::sort::unstable::heapsort::heapsort(v, is_less);
37-
}
36+
heapsort::heapsort(v, is_less);
3837
return;
3938
}
4039

0 commit comments

Comments
 (0)