Skip to content

Commit 316b300

Browse files
committed
In-place growth for HashMap.
1 parent 7169114 commit 316b300

File tree

2 files changed

+96
-24
lines changed

2 files changed

+96
-24
lines changed

src/libstd/collections/hash/map.rs

+40-17
Original file line numberDiff line numberDiff line change
@@ -23,7 +23,7 @@ use iter::{Iterator, ExactSizeIterator, IntoIterator, IteratorExt, FromIterator,
2323
use marker::Sized;
2424
use mem::{self, replace};
2525
use num::{Int, UnsignedInt};
26-
use ops::{Drop, FnMut, Index, IndexMut};
26+
use ops::{Deref, DerefMut, Drop, FnMut, Index, IndexMut};
2727
use option::Option::{self, Some, None};
2828
use rand::{self, Rng};
2929
use result::Result::{self, Ok, Err};
@@ -445,7 +445,7 @@ fn robin_hood<'a, K: 'a, V: 'a>(bucket: FullBucketMut<'a, K, V>,
445445

446446
// Performs insertion with relaxed requirements.
447447
// The caller should ensure that invariants of Robin Hood linear probing hold.
448-
fn insert_hashed_ordered<M, K, V>(arg: M, h: SafeHash, k: K, v: V) -> M
448+
fn insert_hashed_ordered<M: Put, K, V>(arg: M, h: SafeHash, k: K, v: V) -> M
449449
where RawTable<K, V>: BorrowFromMut<M>
450450
{
451451
let table = TableRef(arg);
@@ -652,12 +652,20 @@ impl<K, V, S> HashMap<K, V, S>
652652
}
653653

654654
// Grow the table.
655-
let mut destination = RawTable::new(new_capacity);
655+
let is_inplace = self.table.grow_inplace(new_capacity);
656+
657+
let mut destination = if is_inplace {
658+
// Resizing in-place.
659+
None
660+
} else {
661+
// Borrow self.table in both branches to satisfy the checker.
662+
Some(RawTable::new(new_capacity))
663+
};
656664

657665
// Iterate over `old_capacity` buckets, which constitute half of
658666
// the table which was resized in-place, or the entire
659667
// `old_table`.
660-
let mut bucket = Bucket::at_index(&mut self.table, 0).ok().unwrap();
668+
let mut bucket = Bucket::at_index(&mut self.table, 0).ok().unwrap().iter_to(old_capacity);
661669

662670
// "So a few of the first shall be last: for many be called,
663671
// but few chosen."
@@ -703,20 +711,35 @@ impl<K, V, S> HashMap<K, V, S>
703711
// ^ exit once table.size == 0
704712
let idx_end = bucket.index() + old_capacity;
705713

706-
while bucket.index() != idx_end {
707-
bucket = match bucket.peek() {
708-
Full(bucket) => {
709-
let h = *bucket.read().0;
710-
let (b, k, v) = bucket.take();
711-
insert_hashed_ordered(&mut destination, h, k, v);
712-
b.into_bucket()
713-
}
714-
Empty(b) => b.into_bucket()
715-
};
716-
bucket.next(); // wraps at old_capacity
717-
}
714+
if let Some(mut dest) = destination {
715+
while bucket.index() != idx_end {
716+
bucket = match bucket.peek() {
717+
Full(bucket) => {
718+
let h = *bucket.read().0;
719+
let (b, k, v) = bucket.take();
720+
insert_hashed_ordered(&mut dest, h, k, v);
721+
b.into_bucket()
722+
}
723+
Empty(b) => b.into_bucket()
724+
};
725+
bucket.next(); // wraps at old_capacity
726+
}
718727

719-
replace(bucket.into_table(), destination);
728+
replace(bucket.into_table(), dest);
729+
} else {
730+
while bucket.index() != idx_end {
731+
bucket = match bucket.peek() {
732+
Full(bucket) => {
733+
let h = *bucket.read().0;
734+
let (b, k, v) = bucket.take();
735+
// Resizing in-place.
736+
insert_hashed_ordered(b.into_bucket(), h, k, v)
737+
}
738+
Empty(b) => b.into_bucket()
739+
};
740+
bucket.next(); // wraps at old_capacity
741+
}
742+
}
720743
}
721744

722745
/// Shrinks the capacity of the map as much as possible. It will drop

src/libstd/collections/hash/table.rs

+56-7
Original file line numberDiff line numberDiff line change
@@ -22,9 +22,9 @@ use mem::{self, min_align_of, size_of};
2222
use num::{Int, UnsignedInt};
2323
use ops::{Deref, DerefMut, Drop};
2424
use option::Option::{self, Some, None};
25-
use ptr::{self, Unique, PtrExt, copy_nonoverlapping_memory, zero_memory};
25+
use ptr::{self, Unique, PtrExt, copy_memory, copy_nonoverlapping_memory, zero_memory};
2626
use result::Result::{self, Ok, Err};
27-
use rt::heap::{allocate, deallocate, EMPTY};
27+
use rt::heap::{EMPTY, allocate, deallocate, reallocate_inplace};
2828
use collections::hash_state::HashState;
2929
use core::nonzero::NonZero;
3030

@@ -199,15 +199,15 @@ impl<K, V, M, S> Borrow<RawTable<K, V>> for Bucket<K, V, M, S>
199199
where M: Borrow<RawTable<K, V>>
200200
{
201201
fn borrow(&self) -> &RawTable<K, V> {
202-
bucket.table.0.borrow()
202+
self.table.0.borrow()
203203
}
204204
}
205205

206206
impl<K, V, M, S> BorrowMut<RawTable<K, V>> for Bucket<K, V, M, S>
207207
where M: Borrow<RawTable<K, V>>
208208
{
209209
fn borrow_mut(&mut self) -> &mut RawTable<K, V> {
210-
bucket.table.0.borrow_mut()
210+
self.table.0.borrow_mut()
211211
}
212212
}
213213

@@ -271,6 +271,14 @@ impl<K, V, M> Bucket<K, V, M> where M: Borrow<RawTable<K, V>> {
271271
Bucket::at_index(table, 0).map(|b| b.into_iter()).unwrap_or_else(|b| b.into_iter())
272272
}
273273

274+
/// Narrows down the range of iteration, which must be a power of 2.
275+
pub fn iter_to(mut self, limit: usize) -> Bucket<K, V, M> {
276+
assert!(limit <= self.table.capacity());
277+
assert!(limit.is_power_of_two());
278+
self.capacity = limit;
279+
self
280+
}
281+
274282
/// Reads a bucket at a given index, returning an enum indicating whether
275283
/// it's initialized or not. You need to match on this enum to get
276284
/// the appropriate types to call most of the other functions in
@@ -479,7 +487,7 @@ impl<K, V> RawTable<K, V> {
479487
RawTable {
480488
capacity: capacity,
481489
size: 0,
482-
middle: Unique((hashes as *mut (K, V)).offset(capacity as isize)),
490+
middle: Unique::new((hashes as *mut (K, V)).offset(capacity as isize)),
483491
}
484492
};
485493

@@ -514,6 +522,47 @@ impl<K, V> RawTable<K, V> {
514522
}
515523
}
516524

525+
pub fn grow_inplace(&mut self, capacity: uint) -> bool {
526+
assert!(capacity.is_power_of_two());
527+
assert!(capacity >= self.capacity);
528+
529+
if self.middle.ptr.is_null() {
530+
return false;
531+
}
532+
533+
let new_size = checked_size_generic::<K, V>(capacity);
534+
535+
unsafe {
536+
let ptr = self.middle.ptr.offset(-(self.capacity as isize)) as *mut u8;
537+
let is_inplace = reallocate_inplace(ptr,
538+
size_generic::<K, V>(self.capacity),
539+
new_size,
540+
align::<K, V>()) >= new_size;
541+
542+
if is_inplace {
543+
let cap_diff = (capacity - self.capacity) as isize;
544+
let hashes = self.middle.ptr.offset(cap_diff) as *mut Option<SafeHash>;
545+
// Copy the array of hashes. Maybe it's already in cache.
546+
if size_of::<(K, V)>() >= size_of::<Option<SafeHash>>() {
547+
// The regions of memory occupied by old and new hash arrays are disjoint.
548+
// before: [KVKVKVKV|h h h h ]
549+
// after: [KVKVKVKV|KVKVKVKV|h h h h h h h h ]
550+
copy_nonoverlapping_memory(hashes, self.middle.ptr as *const _, self.capacity);
551+
} else {
552+
// before: [KVKVKVKV|h h |h h ]
553+
// after: [KVKVKVKV|KVKVKVKV|h h h h h h h h ]
554+
copy_memory(hashes, self.middle.ptr as *const _, self.capacity);
555+
}
556+
zero_memory(hashes.offset(self.capacity as int), capacity - self.capacity);
557+
558+
self.middle = Unique::new(self.middle.ptr.offset(cap_diff));
559+
self.capacity = capacity;
560+
}
561+
562+
return is_inplace;
563+
}
564+
}
565+
517566
/// The hashtable's capacity, similar to a vector's.
518567
pub fn capacity(&self) -> usize {
519568
self.capacity
@@ -570,13 +619,13 @@ fn align<K, V>() -> usize {
570619
/// A newtyped RawBucket. Not copyable.
571620
pub struct RawFullBucket<K, V, M>(RawBucket<K, V>);
572621

573-
impl<'t, K, V, M: 't> RawFullBucket<K, V, M> where RawTable<K, V>: BorrowFrom<M> {
622+
impl<'t, K, V, M: 't> RawFullBucket<K, V, M> where M: Borrow<RawTable<K, V>> {
574623
pub fn into_refs(self) -> (&'t K, &'t V) {
575624
unsafe { (&(*self.0.kval).0, &(*self.0.kval).1) }
576625
}
577626
}
578627

579-
impl<'t, K, V, M: 't> RawFullBucket<K, V, M> where RawTable<K, V>: BorrowFromMut<M> {
628+
impl<'t, K, V, M: 't> RawFullBucket<K, V, M> where M: BorrowMut<RawTable<K, V>> {
580629
pub fn into_mut_refs(self) -> (&'t mut K, &'t mut V) {
581630
unsafe { (&mut (*self.0.kval).0, &mut (*self.0.kval).1) }
582631
}

0 commit comments

Comments
 (0)