Skip to content
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.

Commit 897896d

Browse files
committedApr 6, 2019
Auto merge of #59591 - kennytm:needle-api, r=<try>
[WIP] Implement Needle API (RFC 2500) cc #56345 ---- Insta-stable changes: * `impl Index<Range***> for OsStr` cannot be gated and is insta-stable. I'll add more comments after the crater run.
2 parents b025802 + d8bdeb6 commit 897896d

30 files changed

+7085
-3467
lines changed
 

‎src/liballoc/lib.rs

+1-1
Original file line numberDiff line numberDiff line change
@@ -93,7 +93,7 @@
9393
#![feature(needs_allocator)]
9494
#![feature(nll)]
9595
#![feature(optin_builtin_traits)]
96-
#![feature(pattern)]
96+
#![feature(needle)]
9797
#![feature(ptr_internals)]
9898
#![feature(ptr_offset_from)]
9999
#![feature(rustc_attrs)]

‎src/liballoc/slice.rs

+35
Original file line numberDiff line numberDiff line change
@@ -92,6 +92,7 @@ use core::cmp::Ordering::{self, Less};
9292
use core::mem::{self, size_of};
9393
use core::ptr;
9494
use core::{u8, u16, u32};
95+
use core::needle::{ext, Needle, Searcher, Consumer};
9596

9697
use crate::borrow::ToOwned;
9798
use crate::boxed::Box;
@@ -485,6 +486,40 @@ impl<T> [T] {
485486
}
486487
buf
487488
}
489+
490+
/// Replaces all matches of a predicate with another slice.
491+
#[unstable(feature = "slice_needle_methods", issue = "56345")]
492+
#[inline]
493+
#[must_use = "this returns the replaced slice as a new allocation, \
494+
without modifying the original"]
495+
pub fn replace<'s: 'a, 'a, F>(&'s self, from: F, to: &'a [T]) -> Vec<T>
496+
where
497+
T: Clone,
498+
F: Needle<&'a [T]>,
499+
F::Searcher: Searcher<[T]>, // FIXME: RFC 2089
500+
F::Consumer: Consumer<[T]>, // FIXME: RFC 2089
501+
{
502+
let mut result = Vec::with_capacity(self.len());
503+
ext::replace_with(self, from, |_| to, |s| result.extend_from_slice(s));
504+
result
505+
}
506+
507+
/// Replaces first N matches of a predicate with another slice.
508+
#[unstable(feature = "slice_needle_methods", issue = "56345")]
509+
#[inline]
510+
#[must_use = "this returns the replaced slice as a new allocation, \
511+
without modifying the original"]
512+
pub fn replacen<'s: 'a, 'a, F>(&'s self, from: F, to: &'a [T], count: usize) -> Vec<T>
513+
where
514+
T: Clone,
515+
F: Needle<&'a [T]>,
516+
F::Searcher: Searcher<[T]>, // FIXME: RFC 2089
517+
F::Consumer: Consumer<[T]>, // FIXME: RFC 2089
518+
{
519+
let mut result = Vec::with_capacity(self.len());
520+
ext::replacen_with(self, from, |_| to, count, |s| result.extend_from_slice(s));
521+
result
522+
}
488523
}
489524

490525
#[lang = "slice_u8_alloc"]

‎src/liballoc/str.rs

+19-23
Original file line numberDiff line numberDiff line change
@@ -28,14 +28,14 @@
2828
// It's cleaner to just turn off the unused_imports warning than to fix them.
2929
#![allow(unused_imports)]
3030

31-
use core::borrow::Borrow;
32-
use core::str::pattern::{Pattern, Searcher, ReverseSearcher, DoubleEndedSearcher};
31+
use core::fmt;
32+
use core::needle::{ext, Needle, Searcher, Consumer};
3333
use core::mem;
3434
use core::ptr;
3535
use core::iter::FusedIterator;
3636
use core::unicode::conversions;
3737

38-
use crate::borrow::ToOwned;
38+
use crate::borrow::{Borrow, ToOwned};
3939
use crate::boxed::Box;
4040
use crate::slice::{SliceConcatExt, SliceIndex};
4141
use crate::string::String;
@@ -62,8 +62,6 @@ pub use core::str::{from_utf8, from_utf8_mut, Chars, CharIndices, Bytes};
6262
pub use core::str::{from_utf8_unchecked, from_utf8_unchecked_mut, ParseBoolError};
6363
#[stable(feature = "rust1", since = "1.0.0")]
6464
pub use core::str::SplitWhitespace;
65-
#[stable(feature = "rust1", since = "1.0.0")]
66-
pub use core::str::pattern;
6765
#[stable(feature = "encode_utf16", since = "1.8.0")]
6866
pub use core::str::EncodeUtf16;
6967
#[stable(feature = "split_ascii_whitespace", since = "1.34.0")]
@@ -253,15 +251,14 @@ impl str {
253251
without modifying the original"]
254252
#[stable(feature = "rust1", since = "1.0.0")]
255253
#[inline]
256-
pub fn replace<'a, P: Pattern<'a>>(&'a self, from: P, to: &str) -> String {
257-
let mut result = String::new();
258-
let mut last_end = 0;
259-
for (start, part) in self.match_indices(from) {
260-
result.push_str(unsafe { self.get_unchecked(last_end..start) });
261-
result.push_str(to);
262-
last_end = start + part.len();
263-
}
264-
result.push_str(unsafe { self.get_unchecked(last_end..self.len()) });
254+
pub fn replace<'s: 'a, 'a, P>(&'s self, from: P, to: &'a str) -> String
255+
where
256+
P: Needle<&'a str>,
257+
P::Searcher: Searcher<str>, // FIXME: RFC 2089
258+
P::Consumer: Consumer<str>, // FIXME: RFC 2089
259+
{
260+
let mut result = String::with_capacity(self.len());
261+
ext::replace_with(self, from, |_| to, |s| result.push_str(s));
265262
result
266263
}
267264

@@ -293,16 +290,15 @@ impl str {
293290
#[must_use = "this returns the replaced string as a new allocation, \
294291
without modifying the original"]
295292
#[stable(feature = "str_replacen", since = "1.16.0")]
296-
pub fn replacen<'a, P: Pattern<'a>>(&'a self, pat: P, to: &str, count: usize) -> String {
293+
pub fn replacen<'s: 'a, 'a, P>(&'s self, pat: P, to: &'a str, count: usize) -> String
294+
where
295+
P: Needle<&'a str>,
296+
P::Searcher: Searcher<str>, // FIXME: RFC 2089
297+
P::Consumer: Consumer<str>, // FIXME: RFC 2089
298+
{
297299
// Hope to reduce the times of re-allocation
298-
let mut result = String::with_capacity(32);
299-
let mut last_end = 0;
300-
for (start, part) in self.match_indices(pat).take(count) {
301-
result.push_str(unsafe { self.get_unchecked(last_end..start) });
302-
result.push_str(to);
303-
last_end = start + part.len();
304-
}
305-
result.push_str(unsafe { self.get_unchecked(last_end..self.len()) });
300+
let mut result = String::with_capacity(self.len());
301+
ext::replacen_with(self, pat, |_| to, count, |s| result.push_str(s));
306302
result
307303
}
308304

‎src/liballoc/string.rs

+10-14
Original file line numberDiff line numberDiff line change
@@ -53,7 +53,8 @@ use core::iter::{FromIterator, FusedIterator};
5353
use core::ops::{self, Add, AddAssign, Index, IndexMut, RangeBounds};
5454
use core::ops::Bound::{Excluded, Included, Unbounded};
5555
use core::ptr;
56-
use core::str::{pattern::Pattern, lossy};
56+
use core::needle::Needle;
57+
use core::str::lossy;
5758

5859
use crate::borrow::{Cow, ToOwned};
5960
use crate::collections::CollectionAllocErr;
@@ -1792,24 +1793,19 @@ impl<'a> Extend<Cow<'a, str>> for String {
17921793
}
17931794

17941795
/// A convenience impl that delegates to the impl for `&str`
1795-
#[unstable(feature = "pattern",
1796-
reason = "API not fully fleshed out and ready to be stabilized",
1797-
issue = "27721")]
1798-
impl<'a, 'b> Pattern<'a> for &'b String {
1799-
type Searcher = <&'b str as Pattern<'a>>::Searcher;
1800-
1801-
fn into_searcher(self, haystack: &'a str) -> <&'b str as Pattern<'a>>::Searcher {
1802-
self[..].into_searcher(haystack)
1803-
}
1796+
#[unstable(feature = "needle", issue = "56345")]
1797+
impl<'a, 'b> Needle<&'a str> for &'b String {
1798+
type Searcher = <&'b str as Needle<&'a str>>::Searcher;
1799+
type Consumer = <&'b str as Needle<&'a str>>::Consumer;
18041800

18051801
#[inline]
1806-
fn is_contained_in(self, haystack: &'a str) -> bool {
1807-
self[..].is_contained_in(haystack)
1802+
fn into_searcher(self) -> Self::Searcher {
1803+
<&'b str as Needle<&'a str>>::into_searcher(&**self)
18081804
}
18091805

18101806
#[inline]
1811-
fn is_prefix_of(self, haystack: &'a str) -> bool {
1812-
self[..].is_prefix_of(haystack)
1807+
fn into_consumer(self) -> Self::Consumer {
1808+
<&'b str as Needle<&'a str>>::into_consumer(&**self)
18131809
}
18141810
}
18151811

‎src/liballoc/tests/lib.rs

+3-1
Original file line numberDiff line numberDiff line change
@@ -2,11 +2,13 @@
22
#![feature(box_syntax)]
33
#![feature(drain_filter)]
44
#![feature(exact_size_is_empty)]
5-
#![feature(pattern)]
65
#![feature(repeat_generic_slice)]
6+
#![feature(needle)]
77
#![feature(try_reserve)]
88
#![feature(unboxed_closures)]
99
#![feature(vecdeque_rotate)]
10+
#![feature(mut_str_needle_methods)]
11+
#![feature(slice_needle_methods)]
1012

1113
use std::hash::{Hash, Hasher};
1214
use std::collections::hash_map::DefaultHasher;

‎src/liballoc/tests/slice.rs

+82-28
Original file line numberDiff line numberDiff line change
@@ -5,6 +5,7 @@ use std::panic;
55
use std::rc::Rc;
66
use std::sync::atomic::{Ordering::Relaxed, AtomicUsize};
77
use std::thread;
8+
use std::f64::NAN;
89

910
use rand::{Rng, RngCore, thread_rng};
1011
use rand::seq::SliceRandom;
@@ -835,88 +836,88 @@ fn test_splitator() {
835836
let xs = &[1, 2, 3, 4, 5];
836837

837838
let splits: &[&[_]] = &[&[1], &[3], &[5]];
838-
assert_eq!(xs.split(|x| *x % 2 == 0).collect::<Vec<_>>(), splits);
839+
assert_eq!(xs.split(|x: &i32| *x % 2 == 0).collect::<Vec<_>>(), splits);
839840
let splits: &[&[_]] = &[&[], &[2, 3, 4, 5]];
840-
assert_eq!(xs.split(|x| *x == 1).collect::<Vec<_>>(), splits);
841+
assert_eq!(xs.split(|x: &i32| *x == 1).collect::<Vec<_>>(), splits);
841842
let splits: &[&[_]] = &[&[1, 2, 3, 4], &[]];
842-
assert_eq!(xs.split(|x| *x == 5).collect::<Vec<_>>(), splits);
843+
assert_eq!(xs.split(|x: &i32| *x == 5).collect::<Vec<_>>(), splits);
843844
let splits: &[&[_]] = &[&[1, 2, 3, 4, 5]];
844-
assert_eq!(xs.split(|x| *x == 10).collect::<Vec<_>>(), splits);
845+
assert_eq!(xs.split(|x: &i32| *x == 10).collect::<Vec<_>>(), splits);
845846
let splits: &[&[_]] = &[&[], &[], &[], &[], &[], &[]];
846-
assert_eq!(xs.split(|_| true).collect::<Vec<&[i32]>>(), splits);
847+
assert_eq!(xs.split(|_: &i32| true).collect::<Vec<&[i32]>>(), splits);
847848

848849
let xs: &[i32] = &[];
849850
let splits: &[&[i32]] = &[&[]];
850-
assert_eq!(xs.split(|x| *x == 5).collect::<Vec<&[i32]>>(), splits);
851+
assert_eq!(xs.split(|x: &i32| *x == 5).collect::<Vec<&[i32]>>(), splits);
851852
}
852853

853854
#[test]
854855
fn test_splitnator() {
855856
let xs = &[1, 2, 3, 4, 5];
856857

857858
let splits: &[&[_]] = &[&[1, 2, 3, 4, 5]];
858-
assert_eq!(xs.splitn(1, |x| *x % 2 == 0).collect::<Vec<_>>(), splits);
859+
assert_eq!(xs.splitn(1, |x: &i32| *x % 2 == 0).collect::<Vec<_>>(), splits);
859860
let splits: &[&[_]] = &[&[1], &[3, 4, 5]];
860-
assert_eq!(xs.splitn(2, |x| *x % 2 == 0).collect::<Vec<_>>(), splits);
861+
assert_eq!(xs.splitn(2, |x: &i32| *x % 2 == 0).collect::<Vec<_>>(), splits);
861862
let splits: &[&[_]] = &[&[], &[], &[], &[4, 5]];
862-
assert_eq!(xs.splitn(4, |_| true).collect::<Vec<_>>(), splits);
863+
assert_eq!(xs.splitn(4, |_: &i32| true).collect::<Vec<_>>(), splits);
863864

864865
let xs: &[i32] = &[];
865866
let splits: &[&[i32]] = &[&[]];
866-
assert_eq!(xs.splitn(2, |x| *x == 5).collect::<Vec<_>>(), splits);
867+
assert_eq!(xs.splitn(2, |x: &i32| *x == 5).collect::<Vec<_>>(), splits);
867868
}
868869

869870
#[test]
870871
fn test_splitnator_mut() {
871872
let xs = &mut [1, 2, 3, 4, 5];
872873

873874
let splits: &[&mut [_]] = &[&mut [1, 2, 3, 4, 5]];
874-
assert_eq!(xs.splitn_mut(1, |x| *x % 2 == 0).collect::<Vec<_>>(),
875+
assert_eq!(xs.splitn_mut(1, |x: &i32| *x % 2 == 0).collect::<Vec<_>>(),
875876
splits);
876877
let splits: &[&mut [_]] = &[&mut [1], &mut [3, 4, 5]];
877-
assert_eq!(xs.splitn_mut(2, |x| *x % 2 == 0).collect::<Vec<_>>(),
878+
assert_eq!(xs.splitn_mut(2, |x: &i32| *x % 2 == 0).collect::<Vec<_>>(),
878879
splits);
879880
let splits: &[&mut [_]] = &[&mut [], &mut [], &mut [], &mut [4, 5]];
880-
assert_eq!(xs.splitn_mut(4, |_| true).collect::<Vec<_>>(), splits);
881+
assert_eq!(xs.splitn_mut(4, |_: &i32| true).collect::<Vec<_>>(), splits);
881882

882883
let xs: &mut [i32] = &mut [];
883884
let splits: &[&mut [i32]] = &[&mut []];
884-
assert_eq!(xs.splitn_mut(2, |x| *x == 5).collect::<Vec<_>>(), splits);
885+
assert_eq!(xs.splitn_mut(2, |x: &i32| *x == 5).collect::<Vec<_>>(), splits);
885886
}
886887

887888
#[test]
888889
fn test_rsplitator() {
889890
let xs = &[1, 2, 3, 4, 5];
890891

891892
let splits: &[&[_]] = &[&[5], &[3], &[1]];
892-
assert_eq!(xs.split(|x| *x % 2 == 0).rev().collect::<Vec<_>>(), splits);
893+
assert_eq!(xs.split(|x: &i32| *x % 2 == 0).rev().collect::<Vec<_>>(), splits);
893894
let splits: &[&[_]] = &[&[2, 3, 4, 5], &[]];
894-
assert_eq!(xs.split(|x| *x == 1).rev().collect::<Vec<_>>(), splits);
895+
assert_eq!(xs.split(|x: &i32| *x == 1).rev().collect::<Vec<_>>(), splits);
895896
let splits: &[&[_]] = &[&[], &[1, 2, 3, 4]];
896-
assert_eq!(xs.split(|x| *x == 5).rev().collect::<Vec<_>>(), splits);
897+
assert_eq!(xs.split(|x: &i32| *x == 5).rev().collect::<Vec<_>>(), splits);
897898
let splits: &[&[_]] = &[&[1, 2, 3, 4, 5]];
898-
assert_eq!(xs.split(|x| *x == 10).rev().collect::<Vec<_>>(), splits);
899+
assert_eq!(xs.split(|x: &i32| *x == 10).rev().collect::<Vec<_>>(), splits);
899900

900901
let xs: &[i32] = &[];
901902
let splits: &[&[i32]] = &[&[]];
902-
assert_eq!(xs.split(|x| *x == 5).rev().collect::<Vec<&[i32]>>(), splits);
903+
assert_eq!(xs.split(|x: &i32| *x == 5).rev().collect::<Vec<&[i32]>>(), splits);
903904
}
904905

905906
#[test]
906907
fn test_rsplitnator() {
907908
let xs = &[1, 2, 3, 4, 5];
908909

909910
let splits: &[&[_]] = &[&[1, 2, 3, 4, 5]];
910-
assert_eq!(xs.rsplitn(1, |x| *x % 2 == 0).collect::<Vec<_>>(), splits);
911+
assert_eq!(xs.rsplitn(1, |x: &i32| *x % 2 == 0).collect::<Vec<_>>(), splits);
911912
let splits: &[&[_]] = &[&[5], &[1, 2, 3]];
912-
assert_eq!(xs.rsplitn(2, |x| *x % 2 == 0).collect::<Vec<_>>(), splits);
913+
assert_eq!(xs.rsplitn(2, |x: &i32| *x % 2 == 0).collect::<Vec<_>>(), splits);
913914
let splits: &[&[_]] = &[&[], &[], &[], &[1, 2]];
914-
assert_eq!(xs.rsplitn(4, |_| true).collect::<Vec<_>>(), splits);
915+
assert_eq!(xs.rsplitn(4, |_: &i32| true).collect::<Vec<_>>(), splits);
915916

916917
let xs: &[i32] = &[];
917918
let splits: &[&[i32]] = &[&[]];
918-
assert_eq!(xs.rsplitn(2, |x| *x == 5).collect::<Vec<&[i32]>>(), splits);
919-
assert!(xs.rsplitn(0, |x| *x % 2 == 0).next().is_none());
919+
assert_eq!(xs.rsplitn(2, |x: &i32| *x == 5).collect::<Vec<&[i32]>>(), splits);
920+
assert!(xs.rsplitn(0, |x: &i32| *x % 2 == 0).next().is_none());
920921
}
921922

922923
#[test]
@@ -1209,14 +1210,14 @@ fn test_ends_with() {
12091210
#[test]
12101211
fn test_mut_splitator() {
12111212
let mut xs = [0, 1, 0, 2, 3, 0, 0, 4, 5, 0];
1212-
assert_eq!(xs.split_mut(|x| *x == 0).count(), 6);
1213-
for slice in xs.split_mut(|x| *x == 0) {
1213+
assert_eq!(xs.split_mut(|x: &i32| *x == 0).count(), 6);
1214+
for slice in xs.split_mut(|x: &i32| *x == 0) {
12141215
slice.reverse();
12151216
}
12161217
assert!(xs == [0, 1, 0, 3, 2, 0, 0, 5, 4, 0]);
12171218

12181219
let mut xs = [0, 1, 0, 2, 3, 0, 0, 4, 5, 0, 6, 7];
1219-
for slice in xs.split_mut(|x| *x == 0).take(5) {
1220+
for slice in xs.split_mut(|x: &i32| *x == 0).take(5) {
12201221
slice.reverse();
12211222
}
12221223
assert!(xs == [0, 1, 0, 3, 2, 0, 0, 5, 4, 0, 6, 7]);
@@ -1225,7 +1226,7 @@ fn test_mut_splitator() {
12251226
#[test]
12261227
fn test_mut_splitator_rev() {
12271228
let mut xs = [1, 2, 0, 3, 4, 0, 0, 5, 6, 0];
1228-
for slice in xs.split_mut(|x| *x == 0).rev().take(4) {
1229+
for slice in xs.split_mut(|x: &i32| *x == 0).rev().take(4) {
12291230
slice.reverse();
12301231
}
12311232
assert!(xs == [1, 2, 0, 4, 3, 0, 0, 6, 5, 0]);
@@ -1646,3 +1647,56 @@ fn repeat_generic_slice() {
16461647
vec![1, 2, 3, 4, 1, 2, 3, 4, 1, 2, 3, 4]
16471648
);
16481649
}
1650+
1651+
#[test]
1652+
fn test_match_indices_simple() {
1653+
let haystack = &[1.0, 2.0, 3.0, 4.0, 5.0, 6.0, 7.0, 8.0, 2.0, 3.0, 2.0, 4.0, 8.0][..];
1654+
let needle = &[2.0, 3.0][..];
1655+
1656+
assert_eq!(haystack.match_indices(needle).collect::<Vec<_>>(), vec![
1657+
(1, needle),
1658+
(8, needle),
1659+
]);
1660+
}
1661+
1662+
#[test]
1663+
fn test_match_indices_nan_haystack() {
1664+
let haystack = &[1.0, 2.0, NAN, 1.0, 2.0, NAN, 1.0, NAN, NAN, NAN, 2.0, 1.0, 2.0][..];
1665+
let needle = &[1.0, 2.0][..];
1666+
1667+
assert_eq!(haystack.match_indices(needle).collect::<Vec<_>>(), vec![
1668+
(0, needle),
1669+
(3, needle),
1670+
(11, needle),
1671+
]);
1672+
}
1673+
1674+
#[test]
1675+
fn test_match_indices_nan_needle() {
1676+
let haystack = &[1.0, 2.0, NAN, 1.0, 2.0, NAN, 1.0, NAN, NAN, NAN, 2.0, 1.0, 2.0][..];
1677+
let needle = &[2.0, NAN][..];
1678+
1679+
assert_eq!(haystack.match_indices(needle).collect::<Vec<_>>(), vec![
1680+
]);
1681+
}
1682+
1683+
#[test]
1684+
fn test_match_indices_negative_zero() {
1685+
let haystack = &[-0.0, 0.0, 0.0, -0.0, 0.0][..];
1686+
let needle = &[0.0, -0.0][..];
1687+
1688+
assert_eq!(haystack.match_indices(needle).collect::<Vec<_>>(), vec![
1689+
(0, needle),
1690+
(2, needle),
1691+
]);
1692+
}
1693+
1694+
#[test]
1695+
fn test_replace() {
1696+
let haystack = &b" empowering everyone to build reliable and efficient software."[..];
1697+
1698+
assert_eq!(
1699+
haystack.replace(&b" e"[..], b" **E**"),
1700+
b" **E**mpowering **E**veryone to build reliable and **E**fficient software.".to_vec()
1701+
);
1702+
}

‎src/liballoc/tests/str.rs

+41-142
Original file line numberDiff line numberDiff line change
@@ -1606,145 +1606,6 @@ fn test_repeat() {
16061606
assert_eq!("α".repeat(3), "ααα");
16071607
}
16081608

1609-
mod pattern {
1610-
use std::str::pattern::{Pattern, Searcher, ReverseSearcher};
1611-
use std::str::pattern::SearchStep::{self, Match, Reject, Done};
1612-
1613-
macro_rules! make_test {
1614-
($name:ident, $p:expr, $h:expr, [$($e:expr,)*]) => {
1615-
#[allow(unused_imports)]
1616-
mod $name {
1617-
use std::str::pattern::SearchStep::{Match, Reject};
1618-
use super::{cmp_search_to_vec};
1619-
#[test]
1620-
fn fwd() {
1621-
cmp_search_to_vec(false, $p, $h, vec![$($e),*]);
1622-
}
1623-
#[test]
1624-
fn bwd() {
1625-
cmp_search_to_vec(true, $p, $h, vec![$($e),*]);
1626-
}
1627-
}
1628-
}
1629-
}
1630-
1631-
fn cmp_search_to_vec<'a, P: Pattern<'a>>(rev: bool, pat: P, haystack: &'a str,
1632-
right: Vec<SearchStep>)
1633-
where P::Searcher: ReverseSearcher<'a>
1634-
{
1635-
let mut searcher = pat.into_searcher(haystack);
1636-
let mut v = vec![];
1637-
loop {
1638-
match if !rev {searcher.next()} else {searcher.next_back()} {
1639-
Match(a, b) => v.push(Match(a, b)),
1640-
Reject(a, b) => v.push(Reject(a, b)),
1641-
Done => break,
1642-
}
1643-
}
1644-
if rev {
1645-
v.reverse();
1646-
}
1647-
1648-
let mut first_index = 0;
1649-
let mut err = None;
1650-
1651-
for (i, e) in right.iter().enumerate() {
1652-
match *e {
1653-
Match(a, b) | Reject(a, b)
1654-
if a <= b && a == first_index => {
1655-
first_index = b;
1656-
}
1657-
_ => {
1658-
err = Some(i);
1659-
break;
1660-
}
1661-
}
1662-
}
1663-
1664-
if let Some(err) = err {
1665-
panic!("Input skipped range at {}", err);
1666-
}
1667-
1668-
if first_index != haystack.len() {
1669-
panic!("Did not cover whole input");
1670-
}
1671-
1672-
assert_eq!(v, right);
1673-
}
1674-
1675-
make_test!(str_searcher_ascii_haystack, "bb", "abbcbbd", [
1676-
Reject(0, 1),
1677-
Match (1, 3),
1678-
Reject(3, 4),
1679-
Match (4, 6),
1680-
Reject(6, 7),
1681-
]);
1682-
make_test!(str_searcher_ascii_haystack_seq, "bb", "abbcbbbbd", [
1683-
Reject(0, 1),
1684-
Match (1, 3),
1685-
Reject(3, 4),
1686-
Match (4, 6),
1687-
Match (6, 8),
1688-
Reject(8, 9),
1689-
]);
1690-
make_test!(str_searcher_empty_needle_ascii_haystack, "", "abbcbbd", [
1691-
Match (0, 0),
1692-
Reject(0, 1),
1693-
Match (1, 1),
1694-
Reject(1, 2),
1695-
Match (2, 2),
1696-
Reject(2, 3),
1697-
Match (3, 3),
1698-
Reject(3, 4),
1699-
Match (4, 4),
1700-
Reject(4, 5),
1701-
Match (5, 5),
1702-
Reject(5, 6),
1703-
Match (6, 6),
1704-
Reject(6, 7),
1705-
Match (7, 7),
1706-
]);
1707-
make_test!(str_searcher_multibyte_haystack, " ", "├──", [
1708-
Reject(0, 3),
1709-
Reject(3, 6),
1710-
Reject(6, 9),
1711-
]);
1712-
make_test!(str_searcher_empty_needle_multibyte_haystack, "", "├──", [
1713-
Match (0, 0),
1714-
Reject(0, 3),
1715-
Match (3, 3),
1716-
Reject(3, 6),
1717-
Match (6, 6),
1718-
Reject(6, 9),
1719-
Match (9, 9),
1720-
]);
1721-
make_test!(str_searcher_empty_needle_empty_haystack, "", "", [
1722-
Match(0, 0),
1723-
]);
1724-
make_test!(str_searcher_nonempty_needle_empty_haystack, "├", "", [
1725-
]);
1726-
make_test!(char_searcher_ascii_haystack, 'b', "abbcbbd", [
1727-
Reject(0, 1),
1728-
Match (1, 2),
1729-
Match (2, 3),
1730-
Reject(3, 4),
1731-
Match (4, 5),
1732-
Match (5, 6),
1733-
Reject(6, 7),
1734-
]);
1735-
make_test!(char_searcher_multibyte_haystack, ' ', "├──", [
1736-
Reject(0, 3),
1737-
Reject(3, 6),
1738-
Reject(6, 9),
1739-
]);
1740-
make_test!(char_searcher_short_haystack, '\u{1F4A9}', "* \t", [
1741-
Reject(0, 1),
1742-
Reject(1, 2),
1743-
Reject(2, 3),
1744-
]);
1745-
1746-
}
1747-
17481609
macro_rules! generate_iterator_test {
17491610
{
17501611
$name:ident {
@@ -1837,13 +1698,51 @@ generate_iterator_test! {
18371698

18381699
#[test]
18391700
fn different_str_pattern_forwarding_lifetimes() {
1840-
use std::str::pattern::Pattern;
1701+
// FIXME: The generic form (see PR 31989) causes a strange "trait bound not satisfied" error.
1702+
// revisit this after RFC 2089 is implemented.
18411703

1842-
fn foo<'a, P>(p: P) where for<'b> &'b P: Pattern<'a> {
1704+
fn foo(p: &str) {
18431705
for _ in 0..3 {
18441706
"asdf".find(&p);
18451707
}
18461708
}
18471709

1848-
foo::<&str>("x");
1710+
foo("x");
1711+
}
1712+
1713+
#[test]
1714+
fn test_mut_str() {
1715+
use std::ops::Range;
1716+
1717+
let mut s = String::from("a1b2c3d4e");
1718+
{
1719+
let res: &mut str = s.trim_matches_mut(|c: char| c.is_ascii_alphabetic());
1720+
assert_eq!(res, "1b2c3d4");
1721+
}
1722+
{
1723+
let res: Vec<&mut str> = s.split_mut(|c: char| c.is_ascii_digit()).collect();
1724+
assert_eq!(res, vec!["a", "b", "c", "d", "e"]);
1725+
}
1726+
{
1727+
let res: Vec<(Range<usize>, &mut str)> =
1728+
s.match_ranges_mut(|c: char| c.is_ascii_digit()).collect();
1729+
let res = res.into_iter().map(|(r, ss)| (r, &*ss)).collect::<Vec<_>>();
1730+
assert_eq!(res, vec![
1731+
(1..2, "1"),
1732+
(3..4, "2"),
1733+
(5..6, "3"),
1734+
(7..8, "4"),
1735+
]);
1736+
}
1737+
{
1738+
let res: Vec<(Range<usize>, &mut str)> =
1739+
s.rmatch_ranges_mut(|c: char| c.is_ascii_digit()).collect();
1740+
let res = res.into_iter().map(|(r, ss)| (r, &*ss)).collect::<Vec<_>>();
1741+
assert_eq!(res, vec![
1742+
(7..8, "4"),
1743+
(5..6, "3"),
1744+
(3..4, "2"),
1745+
(1..2, "1"),
1746+
]);
1747+
}
18491748
}

‎src/liballoc/vec.rs

+33
Original file line numberDiff line numberDiff line change
@@ -67,6 +67,7 @@ use core::ops::{self, Index, IndexMut, RangeBounds};
6767
use core::ops::Bound::{Excluded, Included, Unbounded};
6868
use core::ptr::{self, NonNull};
6969
use core::slice::{self, SliceIndex};
70+
use core::needle::Needle;
7071

7172
use crate::borrow::{ToOwned, Cow};
7273
use crate::collections::CollectionAllocErr;
@@ -2724,3 +2725,35 @@ impl<T, F> Drop for DrainFilter<'_, T, F>
27242725
}
27252726
}
27262727
}
2728+
2729+
#[unstable(feature = "needle", issue = "56345")]
2730+
impl<'p, 'h, T: PartialEq + 'p + 'h> Needle<&'h [T]> for &'p Vec<T> {
2731+
type Searcher = <&'p [T] as Needle<&'h [T]>>::Searcher;
2732+
type Consumer = <&'p [T] as Needle<&'h [T]>>::Consumer;
2733+
2734+
#[inline]
2735+
fn into_searcher(self) -> Self::Searcher {
2736+
<&'p [T] as Needle<&'h [T]>>::into_searcher(&**self)
2737+
}
2738+
2739+
#[inline]
2740+
fn into_consumer(self) -> Self::Consumer {
2741+
<&'p [T] as Needle<&'h [T]>>::into_consumer(&**self)
2742+
}
2743+
}
2744+
2745+
#[unstable(feature = "needle", issue = "56345")]
2746+
impl<'p, 'h, T: PartialEq + 'p + 'h> Needle<&'h mut [T]> for &'p Vec<T> {
2747+
type Searcher = <&'p [T] as Needle<&'h mut [T]>>::Searcher;
2748+
type Consumer = <&'p [T] as Needle<&'h mut [T]>>::Consumer;
2749+
2750+
#[inline]
2751+
fn into_searcher(self) -> Self::Searcher {
2752+
<&'p [T] as Needle<&'h mut [T]>>::into_searcher(&**self)
2753+
}
2754+
2755+
#[inline]
2756+
fn into_consumer(self) -> Self::Consumer {
2757+
<&'p [T] as Needle<&'h mut [T]>>::into_consumer(&**self)
2758+
}
2759+
}

‎src/libcore/lib.rs

+1
Original file line numberDiff line numberDiff line change
@@ -208,6 +208,7 @@ pub mod fmt;
208208
pub mod time;
209209

210210
pub mod unicode;
211+
pub mod needle;
211212

212213
/* Async */
213214
pub mod future;

‎src/libcore/needle/ext.rs

+969
Large diffs are not rendered by default.

‎src/libcore/needle/haystack.rs

+726
Large diffs are not rendered by default.

‎src/libcore/needle/mod.rs

+39
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,39 @@
1+
#![unstable(feature = "needle", issue = "56345")]
2+
3+
//! The Needle API, support generalized searching on strings, arrays and more.
4+
//!
5+
//! This module provides traits to facilitate searching [`Needle`] in a [`Haystack`].
6+
//!
7+
//! [`Needle`]: trait.Needle.html
8+
//! [`Haystack`]: trait.Haystack.html
9+
//!
10+
//! Haystacks
11+
//! =========
12+
//!
13+
//! A *haystack* refers to any linear structure which can be split or sliced
14+
//! into smaller, non-overlapping parts. Examples are strings and vectors.
15+
//!
16+
//! ```rust
17+
//! let haystack: &str = "hello"; // a string slice (`&str`) is a haystack.
18+
//! let (a, b) = haystack.split_at(4); // it can be split into two strings.
19+
//! let c = &a[1..3]; // it can be sliced.
20+
//! ```
21+
//!
22+
//! The minimal haystack which cannot be further sliced is called a *codeword*.
23+
//! For instance, the codeword of a string would be a UTF-8 sequence. A haystack
24+
//! can therefore be viewed as a consecutive list of codewords.
25+
//!
26+
//! The boundary between codewords can be addressed using an *index*. The
27+
//! numbers 1, 3 and 4 in the snippet above are sample indices of a string. An
28+
//! index is usually a `usize`.
29+
//!
30+
//! An arbitrary number may point outside of a haystack, or in the interior of a
31+
//! codeword. These indices are invalid. A *valid index* of a certain haystack
32+
//! would only point to the boundaries.
33+
34+
mod haystack;
35+
mod needle;
36+
pub mod ext;
37+
38+
pub use self::haystack::*;
39+
pub use self::needle::*;

‎src/libcore/needle/needle.rs

+582
Large diffs are not rendered by default.

‎src/libcore/slice/mod.rs

+630-513
Large diffs are not rendered by default.

‎src/libcore/slice/needles.rs

+735
Large diffs are not rendered by default.

‎src/libcore/str/mod.rs

+587-555
Large diffs are not rendered by default.

‎src/libcore/str/needles.rs

+365
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,365 @@
1+
use needle::*;
2+
use ops::Range;
3+
use slice::needles::{SliceSearcher, NaiveSearcher, TwoWaySearcher};
4+
use slice::memchr::{memchr, memrchr};
5+
use fmt;
6+
7+
//------------------------------------------------------------------------------
8+
// Character function searcher
9+
//------------------------------------------------------------------------------
10+
11+
#[derive(Copy, Clone, Debug)]
12+
pub struct MultiCharEq<'p>(&'p [char]);
13+
14+
impl<'p> FnOnce<(char,)> for MultiCharEq<'p> {
15+
type Output = bool;
16+
#[inline]
17+
extern "rust-call" fn call_once(self, args: (char,)) -> bool {
18+
self.call(args)
19+
}
20+
}
21+
22+
impl<'p> FnMut<(char,)> for MultiCharEq<'p> {
23+
#[inline]
24+
extern "rust-call" fn call_mut(&mut self, args: (char,)) -> bool {
25+
self.call(args)
26+
}
27+
}
28+
29+
impl<'p> Fn<(char,)> for MultiCharEq<'p> {
30+
#[inline]
31+
extern "rust-call" fn call(&self, (c,): (char,)) -> bool {
32+
self.0.iter().any(|ch| *ch == c)
33+
}
34+
}
35+
36+
#[derive(Clone)]
37+
pub struct MultiCharSearcher<F> {
38+
predicate: F,
39+
}
40+
41+
// we need to impl Debug for everything due to stability guarantee.
42+
impl<F> fmt::Debug for MultiCharSearcher<F> {
43+
fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
44+
f.debug_struct("MultiCharSearcher").finish()
45+
}
46+
}
47+
48+
unsafe impl<F: FnMut(char) -> bool> Searcher<str> for MultiCharSearcher<F> {
49+
#[inline]
50+
fn search(&mut self, span: Span<&str>) -> Option<Range<usize>> {
51+
let (hay, range) = span.into_parts();
52+
let st = range.start;
53+
let h = &hay[range];
54+
let mut chars = h.chars();
55+
let c = chars.find(|c| (self.predicate)(*c))?;
56+
let end = chars.as_str().as_ptr();
57+
let end = unsafe { end.offset_from(h.as_ptr()) as usize } + st;
58+
Some((end - c.len_utf8())..end)
59+
}
60+
}
61+
62+
unsafe impl<F: FnMut(char) -> bool> Consumer<str> for MultiCharSearcher<F> {
63+
#[inline]
64+
fn consume(&mut self, hay: Span<&str>) -> Option<usize> {
65+
let (hay, range) = hay.into_parts();
66+
let start = range.start;
67+
if start == range.end {
68+
return None;
69+
}
70+
let c = unsafe { hay.get_unchecked(start..) }.chars().next().unwrap();
71+
if (self.predicate)(c) {
72+
Some(start + c.len_utf8())
73+
} else {
74+
None
75+
}
76+
}
77+
78+
#[inline]
79+
fn trim_start(&mut self, hay: &str) -> usize {
80+
let mut chars = hay.chars();
81+
let unconsume_amount = chars
82+
.find_map(|c| if !(self.predicate)(c) { Some(c.len_utf8()) } else { None })
83+
.unwrap_or(0);
84+
let consumed = unsafe { chars.as_str().as_ptr().offset_from(hay.as_ptr()) as usize };
85+
consumed.wrapping_sub(unconsume_amount)
86+
}
87+
}
88+
89+
unsafe impl<F: FnMut(char) -> bool> ReverseSearcher<str> for MultiCharSearcher<F> {
90+
#[inline]
91+
fn rsearch(&mut self, span: Span<&str>) -> Option<Range<usize>> {
92+
let (hay, range) = span.into_parts();
93+
let st = range.start;
94+
let h = &hay[range];
95+
let mut chars = h.chars();
96+
let c = chars.rfind(|c| (self.predicate)(*c))?;
97+
let start = chars.as_str().len() + st;
98+
Some(start..(start + c.len_utf8()))
99+
}
100+
}
101+
102+
unsafe impl<F: FnMut(char) -> bool> ReverseConsumer<str> for MultiCharSearcher<F> {
103+
#[inline]
104+
fn rconsume(&mut self, hay: Span<&str>) -> Option<usize> {
105+
let (hay, range) = hay.into_parts();
106+
let end = range.end;
107+
if range.start == end {
108+
return None;
109+
}
110+
let c = unsafe { hay.get_unchecked(..end) }.chars().next_back().unwrap();
111+
if (self.predicate)(c) {
112+
Some(end - c.len_utf8())
113+
} else {
114+
None
115+
}
116+
}
117+
118+
#[inline]
119+
fn trim_end(&mut self, hay: &str) -> usize {
120+
// `find.map_or` is faster in trim_end in the microbenchmark, while
121+
// `find.unwrap_or` is faster in trim_start. Don't ask me why.
122+
let mut chars = hay.chars();
123+
let unconsume_amount = chars
124+
.by_ref()
125+
.rev() // btw, `rev().find()` is faster than `rfind()`
126+
.find(|c| !(self.predicate)(*c))
127+
.map_or(0, |c| c.len_utf8());
128+
chars.as_str().len() + unconsume_amount
129+
}
130+
}
131+
132+
unsafe impl<F: FnMut(char) -> bool> DoubleEndedSearcher<str> for MultiCharSearcher<F> {}
133+
unsafe impl<F: FnMut(char) -> bool> DoubleEndedConsumer<str> for MultiCharSearcher<F> {}
134+
135+
macro_rules! impl_needle_with_multi_char_searcher {
136+
($ty:ty) => {
137+
impl<'h, F: FnMut(char) -> bool> Needle<$ty> for F {
138+
type Searcher = MultiCharSearcher<F>;
139+
type Consumer = MultiCharSearcher<F>;
140+
141+
#[inline]
142+
fn into_searcher(self) -> Self::Searcher {
143+
MultiCharSearcher { predicate: self }
144+
}
145+
146+
#[inline]
147+
fn into_consumer(self) -> Self::Consumer {
148+
MultiCharSearcher { predicate: self }
149+
}
150+
}
151+
152+
impl<'h, 'p> Needle<$ty> for &'p [char] {
153+
type Searcher = MultiCharSearcher<MultiCharEq<'p>>;
154+
type Consumer = MultiCharSearcher<MultiCharEq<'p>>;
155+
156+
#[inline]
157+
fn into_searcher(self) -> Self::Searcher {
158+
MultiCharSearcher { predicate: MultiCharEq(self) }
159+
}
160+
161+
#[inline]
162+
fn into_consumer(self) -> Self::Consumer {
163+
MultiCharSearcher { predicate: MultiCharEq(self) }
164+
}
165+
}
166+
}
167+
}
168+
169+
impl_needle_with_multi_char_searcher!(&'h str);
170+
impl_needle_with_multi_char_searcher!(&'h mut str);
171+
172+
//------------------------------------------------------------------------------
173+
// Character searcher
174+
//------------------------------------------------------------------------------
175+
176+
#[derive(Debug, Clone)]
177+
pub struct CharSearcher {
178+
// safety invariant: `utf8_size` must be less than 5
179+
utf8_size: usize,
180+
181+
/// A utf8 encoded copy of the `needle`
182+
utf8_encoded: [u8; 4],
183+
184+
/// The character currently being searched.
185+
c: char,
186+
}
187+
188+
impl CharSearcher {
189+
#[inline]
190+
fn as_bytes(&self) -> &[u8] {
191+
&self.utf8_encoded[..self.utf8_size]
192+
}
193+
194+
#[inline]
195+
fn last_byte(&self) -> u8 {
196+
self.utf8_encoded[self.utf8_size - 1]
197+
}
198+
199+
#[inline]
200+
fn new(c: char) -> Self {
201+
let mut utf8_encoded = [0u8; 4];
202+
let utf8_size = c.encode_utf8(&mut utf8_encoded).len();
203+
CharSearcher {
204+
utf8_size,
205+
utf8_encoded,
206+
c,
207+
}
208+
}
209+
}
210+
211+
unsafe impl Searcher<str> for CharSearcher {
212+
#[inline]
213+
fn search(&mut self, span: Span<&str>) -> Option<Range<usize>> {
214+
let (hay, range) = span.into_parts();
215+
let mut finger = range.start;
216+
let bytes = hay.as_bytes();
217+
loop {
218+
let index = memchr(self.last_byte(), &bytes[finger..range.end])?;
219+
finger += index + 1;
220+
if finger >= self.utf8_size {
221+
let found = &bytes[(finger - self.utf8_size)..finger];
222+
if found == self.as_bytes() {
223+
return Some((finger - self.utf8_size)..finger);
224+
}
225+
}
226+
}
227+
}
228+
}
229+
230+
unsafe impl Consumer<str> for CharSearcher {
231+
#[inline]
232+
fn consume(&mut self, span: Span<&str>) -> Option<usize> {
233+
let mut consumer = Needle::<&[u8]>::into_consumer(self.as_bytes());
234+
consumer.consume(span.as_bytes())
235+
}
236+
237+
#[inline]
238+
fn trim_start(&mut self, hay: &str) -> usize {
239+
let mut consumer = Needle::<&str>::into_consumer(|c: char| c == self.c);
240+
consumer.trim_start(hay)
241+
}
242+
}
243+
244+
unsafe impl ReverseSearcher<str> for CharSearcher {
245+
#[inline]
246+
fn rsearch(&mut self, span: Span<&str>) -> Option<Range<usize>> {
247+
let (hay, range) = span.into_parts();
248+
let start = range.start;
249+
let mut bytes = hay[range].as_bytes();
250+
loop {
251+
let index = memrchr(self.last_byte(), bytes)? + 1;
252+
if index >= self.utf8_size {
253+
let found = &bytes[(index - self.utf8_size)..index];
254+
if found == self.as_bytes() {
255+
let index = index + start;
256+
return Some((index - self.utf8_size)..index);
257+
}
258+
}
259+
bytes = &bytes[..(index - 1)];
260+
}
261+
}
262+
}
263+
264+
unsafe impl ReverseConsumer<str> for CharSearcher {
265+
#[inline]
266+
fn rconsume(&mut self, span: Span<&str>) -> Option<usize> {
267+
if self.utf8_size == 1 {
268+
let mut consumer = Needle::<&[u8]>::into_consumer(|b: &u8| *b == self.c as u8);
269+
consumer.rconsume(span.as_bytes())
270+
} else {
271+
let mut consumer = Needle::<&str>::into_consumer(|c: char| c == self.c);
272+
consumer.rconsume(span)
273+
}
274+
}
275+
276+
#[inline]
277+
fn trim_end(&mut self, haystack: &str) -> usize {
278+
let mut consumer = Needle::<&str>::into_consumer(|c: char| c == self.c);
279+
consumer.trim_end(haystack)
280+
}
281+
}
282+
283+
unsafe impl DoubleEndedSearcher<str> for CharSearcher {}
284+
unsafe impl DoubleEndedConsumer<str> for CharSearcher {}
285+
286+
impl<H: Haystack<Target = str>> Needle<H> for char {
287+
type Searcher = CharSearcher;
288+
type Consumer = CharSearcher;
289+
290+
#[inline]
291+
fn into_searcher(self) -> Self::Searcher {
292+
CharSearcher::new(self)
293+
}
294+
295+
#[inline]
296+
fn into_consumer(self) -> Self::Consumer {
297+
CharSearcher::new(self)
298+
}
299+
}
300+
301+
//------------------------------------------------------------------------------
302+
// String searcher
303+
//------------------------------------------------------------------------------
304+
305+
unsafe impl<'p> Searcher<str> for TwoWaySearcher<'p, u8> {
306+
#[inline]
307+
fn search(&mut self, span: Span<&str>) -> Option<Range<usize>> {
308+
let (hay, range) = span.into_parts();
309+
self.next(hay.as_bytes(), range)
310+
}
311+
}
312+
313+
unsafe impl<'p> ReverseSearcher<str> for TwoWaySearcher<'p, u8> {
314+
#[inline]
315+
fn rsearch(&mut self, span: Span<&str>) -> Option<Range<usize>> {
316+
let (hay, range) = span.into_parts();
317+
self.next_back(hay.as_bytes(), range)
318+
}
319+
}
320+
321+
unsafe impl<'p> Consumer<str> for NaiveSearcher<'p, u8> {
322+
#[inline]
323+
fn consume(&mut self, span: Span<&str>) -> Option<usize> {
324+
self.consume(span.as_bytes())
325+
}
326+
327+
#[inline]
328+
fn trim_start(&mut self, hay: &str) -> usize {
329+
self.trim_start(hay.as_bytes())
330+
}
331+
}
332+
333+
unsafe impl<'p> ReverseConsumer<str> for NaiveSearcher<'p, u8> {
334+
#[inline]
335+
fn rconsume(&mut self, span: Span<&str>) -> Option<usize> {
336+
self.rconsume(span.as_bytes())
337+
}
338+
339+
#[inline]
340+
fn trim_end(&mut self, hay: &str) -> usize {
341+
self.trim_end(hay.as_bytes())
342+
}
343+
}
344+
345+
macro_rules! impl_needle_for_str_searcher {
346+
(<[$($gen:tt)*]> for $pat:ty) => {
347+
impl<$($gen)*, H: Haystack<Target = str>> Needle<H> for $pat {
348+
type Searcher = SliceSearcher<'p, u8>;
349+
type Consumer = NaiveSearcher<'p, u8>;
350+
351+
#[inline]
352+
fn into_searcher(self) -> Self::Searcher {
353+
SliceSearcher::new(self.as_bytes())
354+
}
355+
356+
#[inline]
357+
fn into_consumer(self) -> Self::Consumer {
358+
NaiveSearcher::new(self.as_bytes())
359+
}
360+
}
361+
}
362+
}
363+
364+
impl_needle_for_str_searcher!(<['p]> for &'p str);
365+
impl_needle_for_str_searcher!(<['q, 'p]> for &'q &'p str);

‎src/libcore/str/pattern.rs

-1,402
This file was deleted.

‎src/libcore/tests/lib.rs

+1-1
Original file line numberDiff line numberDiff line change
@@ -13,7 +13,7 @@
1313
#![feature(iter_copied)]
1414
#![feature(iter_nth_back)]
1515
#![feature(iter_once_with)]
16-
#![feature(pattern)]
16+
#![feature(needle)]
1717
#![feature(range_is_empty)]
1818
#![feature(raw)]
1919
#![feature(slice_patterns)]

‎src/libcore/tests/pattern.rs

+272-253
Large diffs are not rendered by default.

‎src/libstd/ffi/os_str.rs

+806-14
Large diffs are not rendered by default.

‎src/libstd/lib.rs

+5
Original file line numberDiff line numberDiff line change
@@ -274,6 +274,7 @@
274274
#![feature(link_args)]
275275
#![feature(linkage)]
276276
#![feature(maybe_uninit)]
277+
#![feature(needle)]
277278
#![feature(needs_panic_runtime)]
278279
#![feature(never_type)]
279280
#![feature(nll)]
@@ -285,6 +286,7 @@
285286
#![feature(panic_unwind)]
286287
#![feature(prelude_import)]
287288
#![feature(ptr_internals)]
289+
#![feature(ptr_offset_from)]
288290
#![feature(raw)]
289291
#![feature(renamed_spin_loop)]
290292
#![feature(rustc_attrs)]
@@ -293,6 +295,7 @@
293295
#![feature(shrink_to)]
294296
#![feature(slice_concat_ext)]
295297
#![feature(slice_internals)]
298+
#![feature(slice_needle_methods)]
296299
#![feature(slice_patterns)]
297300
#![feature(staged_api)]
298301
#![feature(std_internals)]
@@ -436,6 +439,8 @@ pub use core::char;
436439
pub use core::u128;
437440
#[stable(feature = "core_hint", since = "1.27.0")]
438441
pub use core::hint;
442+
#[unstable(feature = "needle", issue = "56345")]
443+
pub use core::needle;
439444

440445
pub mod f32;
441446
pub mod f64;

‎src/libstd/path.rs

+2-2
Original file line numberDiff line numberDiff line change
@@ -315,7 +315,7 @@ unsafe fn u8_slice_as_os_str(s: &[u8]) -> &OsStr {
315315

316316
// Detect scheme on Redox
317317
fn has_redox_scheme(s: &[u8]) -> bool {
318-
cfg!(target_os = "redox") && s.split(|b| *b == b'/').next().unwrap_or(b"").contains(&b':')
318+
cfg!(target_os = "redox") && s.split_match(b"/").next().unwrap_or(b"").contains(&b':')
319319
}
320320

321321
////////////////////////////////////////////////////////////////////////////////
@@ -344,7 +344,7 @@ fn split_file_at_dot(file: &OsStr) -> (Option<&OsStr>, Option<&OsStr>) {
344344
// contents of the encoding and (2) new &OsStr values are produced
345345
// only from ASCII-bounded slices of existing &OsStr values.
346346

347-
let mut iter = os_str_as_u8_slice(file).rsplitn(2, |b| *b == b'.');
347+
let mut iter = os_str_as_u8_slice(file).rsplitn_match(2, b".");
348348
let after = iter.next();
349349
let before = iter.next();
350350
if before == Some(b"") {

‎src/libstd/sys/windows/args.rs

+2-2
Original file line numberDiff line numberDiff line change
@@ -64,7 +64,7 @@ unsafe fn parse_lp_cmd_line<F: Fn() -> OsString>(lp_cmd_line: *const u16, exe_na
6464
// no matter what.
6565
QUOTE => {
6666
let args = {
67-
let mut cut = cmd_line[1..].splitn(2, |&c| c == QUOTE);
67+
let mut cut = cmd_line[1..].splitn(2, |&c: &u16| c == QUOTE);
6868
if let Some(exe) = cut.next() {
6969
ret_val.push(OsString::from_wide(exe));
7070
}
@@ -89,7 +89,7 @@ unsafe fn parse_lp_cmd_line<F: Fn() -> OsString>(lp_cmd_line: *const u16, exe_na
8989
// no matter what.
9090
_ => {
9191
let args = {
92-
let mut cut = cmd_line.splitn(2, |&c| c > 0 && c <= SPACE);
92+
let mut cut = cmd_line.splitn(2, |&c: &u16| c > 0 && c <= SPACE);
9393
if let Some(exe) = cut.next() {
9494
ret_val.push(OsString::from_wide(exe));
9595
}

‎src/libstd/sys/windows/os_str.rs

+51-1
Original file line numberDiff line numberDiff line change
@@ -3,11 +3,14 @@
33
44
use crate::borrow::Cow;
55
use crate::fmt;
6-
use crate::sys_common::wtf8::{Wtf8, Wtf8Buf};
6+
use crate::sys_common::wtf8::{self, Wtf8, Wtf8Buf};
77
use crate::mem;
88
use crate::rc::Rc;
99
use crate::sync::Arc;
10+
use crate::ops::{Index, Range, RangeFrom, RangeTo};
1011
use crate::sys_common::{AsInner, IntoInner, FromInner};
12+
use core::slice::needles::{SliceSearcher, NaiveSearcher};
13+
use crate::needle::Hay;
1114

1215
#[derive(Clone, Hash)]
1316
pub struct Buf {
@@ -44,6 +47,7 @@ impl fmt::Display for Buf {
4447
}
4548
}
4649

50+
#[derive(PartialEq, Eq, PartialOrd, Ord, Hash)]
4751
pub struct Slice {
4852
pub inner: Wtf8
4953
}
@@ -60,6 +64,30 @@ impl fmt::Display for Slice {
6064
}
6165
}
6266

67+
impl Index<Range<usize>> for Slice {
68+
type Output = Slice;
69+
70+
fn index(&self, range: Range<usize>) -> &Slice {
71+
unsafe { mem::transmute(&self.inner[range]) }
72+
}
73+
}
74+
75+
impl Index<RangeFrom<usize>> for Slice {
76+
type Output = Slice;
77+
78+
fn index(&self, range: RangeFrom<usize>) -> &Slice {
79+
unsafe { mem::transmute(&self.inner[range]) }
80+
}
81+
}
82+
83+
impl Index<RangeTo<usize>> for Slice {
84+
type Output = Slice;
85+
86+
fn index(&self, range: RangeTo<usize>) -> &Slice {
87+
unsafe { mem::transmute(&self.inner[range]) }
88+
}
89+
}
90+
6391
impl Buf {
6492
pub fn with_capacity(capacity: usize) -> Buf {
6593
Buf {
@@ -169,4 +197,26 @@ impl Slice {
169197
let rc = self.inner.into_rc();
170198
unsafe { Rc::from_raw(Rc::into_raw(rc) as *const Slice) }
171199
}
200+
201+
pub unsafe fn next_index(&self, index: usize) -> usize {
202+
self.inner.next_index(index)
203+
}
204+
205+
pub unsafe fn prev_index(&self, index: usize) -> usize {
206+
self.inner.prev_index(index)
207+
}
208+
209+
pub fn into_searcher(&self) -> InnerSearcher<SliceSearcher<'_, u8>> {
210+
wtf8::new_wtf8_searcher(&self.inner)
211+
}
212+
213+
pub fn into_consumer(&self) -> InnerSearcher<NaiveSearcher<'_, u8>> {
214+
wtf8::new_wtf8_consumer(&self.inner)
215+
}
216+
217+
pub fn as_bytes_for_searcher(&self) -> &[u8] {
218+
self.inner.as_inner()
219+
}
172220
}
221+
222+
pub use crate::sys_common::wtf8::Wtf8Searcher as InnerSearcher;

‎src/libstd/sys_common/os_str_bytes.rs

+51
Original file line numberDiff line numberDiff line change
@@ -6,18 +6,22 @@ use crate::ffi::{OsStr, OsString};
66
use crate::fmt;
77
use crate::str;
88
use crate::mem;
9+
use crate::ops::{Index, Range, RangeFrom, RangeTo};
910
use crate::rc::Rc;
1011
use crate::sync::Arc;
1112
use crate::sys_common::{FromInner, IntoInner, AsInner};
1213
use crate::sys_common::bytestring::debug_fmt_bytestring;
1314

1415
use core::str::lossy::Utf8Lossy;
16+
use core::slice::needles::{SliceSearcher, NaiveSearcher};
17+
use crate::needle::Hay;
1518

1619
#[derive(Clone, Hash)]
1720
pub(crate) struct Buf {
1821
pub inner: Vec<u8>
1922
}
2023

24+
#[derive(PartialEq, Eq, PartialOrd, Ord, Hash)]
2125
pub(crate) struct Slice {
2226
pub inner: [u8]
2327
}
@@ -34,6 +38,30 @@ impl fmt::Display for Slice {
3438
}
3539
}
3640

41+
impl Index<Range<usize>> for Slice {
42+
type Output = Slice;
43+
44+
fn index(&self, range: Range<usize>) -> &Slice {
45+
Slice::from_u8_slice(&self.inner[range])
46+
}
47+
}
48+
49+
impl Index<RangeFrom<usize>> for Slice {
50+
type Output = Slice;
51+
52+
fn index(&self, range: RangeFrom<usize>) -> &Slice {
53+
Slice::from_u8_slice(&self.inner[range])
54+
}
55+
}
56+
57+
impl Index<RangeTo<usize>> for Slice {
58+
type Output = Slice;
59+
60+
fn index(&self, range: RangeTo<usize>) -> &Slice {
61+
Slice::from_u8_slice(&self.inner[range])
62+
}
63+
}
64+
3765
impl fmt::Debug for Buf {
3866
fn fmt(&self, formatter: &mut fmt::Formatter<'_>) -> fmt::Result {
3967
fmt::Debug::fmt(self.as_slice(), formatter)
@@ -178,8 +206,31 @@ impl Slice {
178206
let rc: Rc<[u8]> = Rc::from(&self.inner);
179207
unsafe { Rc::from_raw(Rc::into_raw(rc) as *const Slice) }
180208
}
209+
210+
pub unsafe fn next_index(&self, index: usize) -> usize {
211+
self.inner.next_index(index)
212+
}
213+
214+
pub unsafe fn prev_index(&self, index: usize) -> usize {
215+
self.inner.prev_index(index)
216+
}
217+
218+
pub fn into_searcher(&self) -> SliceSearcher<'_, u8> {
219+
SliceSearcher::new(&self.inner)
220+
}
221+
222+
pub fn into_consumer(&self) -> NaiveSearcher<'_, u8> {
223+
NaiveSearcher::new(&self.inner)
224+
}
225+
226+
pub fn as_bytes_for_searcher(&self) -> &[u8] {
227+
&self.inner
228+
}
181229
}
182230

231+
#[unstable(feature = "needle", issue = "56345")]
232+
pub type InnerSearcher<S> = S;
233+
183234
/// Platform-specific extensions to [`OsString`].
184235
///
185236
/// [`OsString`]: ../../../../std/ffi/struct.OsString.html

‎src/libstd/sys_common/wtf8.rs

+1,032-510
Large diffs are not rendered by default.

‎src/test/ui/issues/issue-2149.stderr

+1-1
Original file line numberDiff line numberDiff line change
@@ -10,7 +10,7 @@ error[E0599]: no method named `bind` found for type `[&str; 1]` in the current s
1010
--> $DIR/issue-2149.rs:13:12
1111
|
1212
LL | ["hi"].bind(|x| [x] );
13-
| ^^^^
13+
| ^^^^ help: did you mean: `find`
1414
|
1515
= help: items from traits can only be used if the trait is implemented and in scope
1616
= note: the following trait defines an item `bind`, perhaps you need to implement it:

‎src/test/ui/issues/issue-48364.rs

+1-1
Original file line numberDiff line numberDiff line change
@@ -1,5 +1,5 @@
11
fn foo() -> bool {
2-
b"".starts_with(stringify!(foo))
2+
b"".eq_ignore_ascii_case(stringify!(foo))
33
//~^ ERROR mismatched types
44
}
55

‎src/test/ui/issues/issue-48364.stderr

+3-3
Original file line numberDiff line numberDiff line change
@@ -1,8 +1,8 @@
11
error[E0308]: mismatched types
2-
--> $DIR/issue-48364.rs:2:21
2+
--> $DIR/issue-48364.rs:2:30
33
|
4-
LL | b"".starts_with(stringify!(foo))
5-
| ^^^^^^^^^^^^^^^ expected slice, found str
4+
LL | b"".eq_ignore_ascii_case(stringify!(foo))
5+
| ^^^^^^^^^^^^^^^ expected slice, found str
66
|
77
= note: expected type `&[u8]`
88
found type `&'static str`

0 commit comments

Comments
 (0)
Please sign in to comment.