Skip to content

Commit af9b508

Browse files
committedOct 15, 2021
Auto merge of #88717 - tabokie:vecdeque-fast-append, r=m-ou-se
Optimize VecDeque::append Optimize `VecDeque::append` to do unsafe copy rather than iterating through each element. On my `Intel(R) Xeon(R) CPU E5-2630 v4 @ 2.20GHz`, the benchmark shows 37% improvements: ``` Master: custom-bench vec_deque_append 583164 ns/iter custom-bench vec_deque_append 550040 ns/iter Patched: custom-bench vec_deque_append 349204 ns/iter custom-bench vec_deque_append 368164 ns/iter ``` Additional notes on the context: this is the third attempt to implement a non-trivial version of `VecDeque::append`, the last two are reverted due to unsoundness or regression, see: - #52553, reverted in #53571 - #53564, reverted in #54851 Both cases are covered by existing tests. Signed-off-by: tabokie <[email protected]>
2 parents 1dafe6d + cd773c3 commit af9b508

File tree

1 file changed

+30
-2
lines changed
  • library/alloc/src/collections/vec_deque

1 file changed

+30
-2
lines changed
 

‎library/alloc/src/collections/vec_deque/mod.rs

+30-2
Original file line numberDiff line numberDiff line change
@@ -418,6 +418,25 @@ impl<T, A: Allocator> VecDeque<T, A> {
418418
}
419419
}
420420

421+
/// Copies all values from `src` to `dst`, wrapping around if needed.
422+
/// Assumes capacity is sufficient.
423+
#[inline]
424+
unsafe fn copy_slice(&mut self, dst: usize, src: &[T]) {
425+
debug_assert!(src.len() <= self.cap());
426+
let head_room = self.cap() - dst;
427+
if src.len() <= head_room {
428+
unsafe {
429+
ptr::copy_nonoverlapping(src.as_ptr(), self.ptr().add(dst), src.len());
430+
}
431+
} else {
432+
let (left, right) = src.split_at(head_room);
433+
unsafe {
434+
ptr::copy_nonoverlapping(left.as_ptr(), self.ptr().add(dst), left.len());
435+
ptr::copy_nonoverlapping(right.as_ptr(), self.ptr(), right.len());
436+
}
437+
}
438+
}
439+
421440
/// Frobs the head and tail sections around to handle the fact that we
422441
/// just reallocated. Unsafe because it trusts old_capacity.
423442
#[inline]
@@ -2081,8 +2100,17 @@ impl<T, A: Allocator> VecDeque<T, A> {
20812100
#[inline]
20822101
#[stable(feature = "append", since = "1.4.0")]
20832102
pub fn append(&mut self, other: &mut Self) {
2084-
// naive impl
2085-
self.extend(other.drain(..));
2103+
self.reserve(other.len());
2104+
unsafe {
2105+
let (left, right) = other.as_slices();
2106+
self.copy_slice(self.head, left);
2107+
self.copy_slice(self.wrap_add(self.head, left.len()), right);
2108+
}
2109+
// SAFETY: Update pointers after copying to avoid leaving doppelganger
2110+
// in case of panics.
2111+
self.head = self.wrap_add(self.head, other.len());
2112+
// Silently drop values in `other`.
2113+
other.tail = other.head;
20862114
}
20872115

20882116
/// Retains only the elements specified by the predicate.

0 commit comments

Comments
 (0)
Please sign in to comment.