Skip to content
Open
Show file tree
Hide file tree
Changes from 2 commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
58 changes: 58 additions & 0 deletions library/core/src/slice/ascii.rs
Original file line number Diff line number Diff line change
Expand Up @@ -60,6 +60,18 @@ impl [u8] {
return false;
}

#[cfg(all(target_arch = "x86_64", target_feature = "sse2"))]
if self.len() >= 16 {
return self.eq_ignore_ascii_case_chunks(other);
}

self.eq_ignore_ascii_case_simple(other)
}

/// ASCII case-insensitive equality check without chunk-at-a-time
/// optimization.
#[inline]
const fn eq_ignore_ascii_case_simple(&self, other: &[u8]) -> bool {
// FIXME(const-hack): This implementation can be reverted when
// `core::iter::zip` is allowed in const. The original implementation:
// self.len() == other.len() && iter::zip(self, other).all(|(a, b)| a.eq_ignore_ascii_case(b))
Expand All @@ -78,6 +90,52 @@ impl [u8] {
true
}

/// Optimized version of `eq_ignore_ascii_case` for byte lengths of at least
/// 16 bytes, which processes chunks at a time.
///
/// Platforms that have SIMD instructions may benefit from this
/// implementation over `eq_ignore_ascii_case_simple`.
///
/// Both slices are split into 16-byte chunks that are compared pairwise. If
/// `self` has a non-empty remainder, the last 16 bytes of each slice are
/// compared as one extra chunk instead of checking the tail byte by byte.
///
/// NOTE(review): nothing in this function compares the two lengths, and a
/// slice shorter than 16 bytes would have its tail skipped (`last_chunk`
/// returns `None`). The caller appears to reject differing lengths and to
/// dispatch here only for `len() >= 16` -- confirm before adding call sites.
#[cfg(all(target_arch = "x86_64", target_feature = "sse2"))]
#[inline]
const fn eq_ignore_ascii_case_chunks(&self, other: &[u8]) -> bool {
// Chunk width in bytes.
const N: usize = 16;
// `as_chunks` yields the full N-byte chunks plus a remainder shorter than N.
let (self_chunks, self_rem) = self.as_chunks::<N>();
// The remainder of `other` is not inspected here; only `self_rem` decides
// whether the tail comparison below runs.
let (other_chunks, _) = other.as_chunks::<N>();

// Branchless check to encourage auto-vectorization
// All N byte pairs are compared and folded together with `&=`; there is no
// early exit inside a chunk.
const fn eq_ignore_ascii_inner(lhs: &[u8; N], rhs: &[u8; N]) -> bool {
Copy link
Contributor

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

When I copied this code into compiler explorer with -C opt_level=3, the call to eq_ignore_ascii_inner did not get inlined. I would suggest to mark this function #[inline(always)] and add a CHECK-NOT: call in the codegen test.

Copy link
Contributor Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

I added the annotation and filecheck adaptation in a5ba248

let mut equal_ascii = true;
let mut j = 0;
// Index-based `while` loop -- presumably because iterator-based `for`
// loops are not usable in a `const fn`.
while j < N {
equal_ascii &= lhs[j].eq_ignore_ascii_case(&rhs[j]);
j += 1;
}

equal_ascii
}

// Process the chunks, returning early if an inequality is found
// The loop is bounded by both chunk counts, so indexing stays in range even
// if the two slices were to yield a different number of chunks.
let mut i = 0;
while i < self_chunks.len() && i < other_chunks.len() {
if !eq_ignore_ascii_inner(&self_chunks[i], &other_chunks[i]) {
return false;
}
i += 1;
}

// If there are remaining tails, load the last N bytes in the slices to
// avoid falling back to per-byte checking.
// The remainder is shorter than N, so this trailing window overlaps bytes
// that the chunk loop already compared; re-checking them cannot change the
// result.
if !self_rem.is_empty() {
if let (Some(a_rem), Some(b_rem)) = (self.last_chunk::<N>(), other.last_chunk::<N>()) {
if !eq_ignore_ascii_inner(a_rem, b_rem) {
return false;
}
}
}

true
}

/// Converts this slice to its ASCII upper case equivalent in-place.
///
/// ASCII letters 'a' to 'z' are mapped to 'A' to 'Z',
Expand Down
1 change: 1 addition & 0 deletions library/coretests/benches/ascii.rs
Original file line number Diff line number Diff line change
@@ -1,3 +1,4 @@
mod eq_ignore_ascii_case;
mod is_ascii;

// Lower-case ASCII 'a' is the first byte that has its highest bit set
Expand Down
56 changes: 56 additions & 0 deletions library/coretests/benches/ascii/eq_ignore_ascii_case.rs
Original file line number Diff line number Diff line change
@@ -0,0 +1,56 @@
use test::Bencher;

/// Benchmarks a matching case-insensitive comparison of two 3-byte strings.
///
/// Both operands are string literals, so they are passed through
/// `black_box` on every iteration; otherwise the optimizer is free to
/// evaluate the comparison at compile time and the benchmark would measure
/// nothing.
#[bench]
fn bench_str_under_8_bytes_eq(b: &mut Bencher) {
    let s = "foo";
    let other = "FOo";
    b.iter(|| {
        // Hide the constant inputs from the optimizer inside the timed closure.
        let (s, other) = (core::hint::black_box(s), core::hint::black_box(other));
        assert!(s.eq_ignore_ascii_case(other));
    })
}

/// Benchmarks a matching case-insensitive comparison of two 8-byte strings.
///
/// Both operands are string literals, so they are passed through
/// `black_box` on every iteration; otherwise the optimizer is free to
/// evaluate the comparison at compile time and the benchmark would measure
/// nothing.
#[bench]
fn bench_str_of_8_bytes_eq(b: &mut Bencher) {
    let s = "foobar78";
    let other = "FOObAr78";
    b.iter(|| {
        // Hide the constant inputs from the optimizer inside the timed closure.
        let (s, other) = (core::hint::black_box(s), core::hint::black_box(other));
        assert!(s.eq_ignore_ascii_case(other));
    })
}

/// Benchmarks a matching case-insensitive comparison of two 17-byte strings,
/// i.e. one full 16-byte chunk plus a single trailing byte.
///
/// Both operands are string literals, so they are passed through
/// `black_box` on every iteration; otherwise the optimizer is free to
/// evaluate the comparison at compile time and the benchmark would measure
/// nothing.
#[bench]
fn bench_str_17_bytes_eq(b: &mut Bencher) {
    let s = "performance-criti";
    let other = "performANce-cRIti";
    b.iter(|| {
        // Hide the constant inputs from the optimizer inside the timed closure.
        let (s, other) = (core::hint::black_box(s), core::hint::black_box(other));
        assert!(s.eq_ignore_ascii_case(other));
    })
}

/// Benchmarks a matching case-insensitive comparison of two 31-byte strings,
/// i.e. one full 16-byte chunk plus a 15-byte tail.
///
/// Both operands are string literals, so they are passed through
/// `black_box` on every iteration; otherwise the optimizer is free to
/// evaluate the comparison at compile time and the benchmark would measure
/// nothing.
#[bench]
fn bench_str_31_bytes_eq(b: &mut Bencher) {
    let s = "foobarbazquux02foobarbazquux025";
    let other = "fooBARbazQuuX02fooBARbazQuuX025";
    b.iter(|| {
        // Hide the constant inputs from the optimizer inside the timed closure.
        let (s, other) = (core::hint::black_box(s), core::hint::black_box(other));
        assert!(s.eq_ignore_ascii_case(other));
    })
}

/// Benchmarks a matching case-insensitive comparison of two multi-hundred-byte
/// strings that differ only in the case of a few words.
///
/// Both operands are string literals, so they are passed through
/// `black_box` on every iteration; otherwise the optimizer is free to
/// evaluate the comparison at compile time and the benchmark would measure
/// nothing.
#[bench]
fn bench_long_str_eq(b: &mut Bencher) {
    let s = "Lorem ipsum dolor sit amet, consectetur adipisicing elit, sed do eiusmod tempor \
             incididunt ut labore et dolore magna aliqua. Ut enim ad minim veniam, quis nostrud \
             exercitation ullamco laboris nisi ut aliquip ex ea commodo consequat. Duis aute \
             irure dolor in reprehenderit in voluptate velit esse cillum dolore eu fugiat nulla \
             pariatur. Excepteur sint occaecat cupidatat non proident, sunt in culpa qui \
             officia deserunt mollit anim id est laborum.";
    let other = "Lorem ipsum dolor sit amet, CONSECTETUR adipisicing elit, sed do eiusmod tempor \
                 incididunt ut labore et dolore MAGNA aliqua. Ut enim ad MINIM veniam, quis nostrud \
                 exercitation ullamco LABORIS nisi ut aliquip ex ea commodo consequat. Duis aute \
                 irure dolor in reprehenderit in voluptate velit esse cillum DOLORE eu fugiat nulla \
                 pariatur. Excepteur sint occaecat CUPIDATAT non proident, sunt in culpa qui \
                 officia deserunt mollit anim id est laborum.";
    b.iter(|| {
        // Hide the constant inputs from the optimizer inside the timed closure.
        let (s, other) = (core::hint::black_box(s), core::hint::black_box(other));
        assert!(s.eq_ignore_ascii_case(other));
    })
}
14 changes: 14 additions & 0 deletions tests/codegen-llvm/lib-optimizations/eq_ignore_ascii_case.rs
Original file line number Diff line number Diff line change
@@ -0,0 +1,14 @@
//@ compile-flags: -Copt-level=3
//@ only-x86_64
#![crate_type = "lib"]

// Ensure that the optimized variant of the function gets auto-vectorized.
// CHECK-LABEL: @eq_ignore_ascii_case_autovectorized
// Thin exported wrapper around `str::eq_ignore_ascii_case` so that the IR
// generated for the comparison can be inspected by the directives in the body.
// `#[no_mangle]` keeps the symbol name predictable for the label match.
#[no_mangle]
pub fn eq_ignore_ascii_case_autovectorized(s: &str, other: &str) -> bool {
// Expect two 16-byte vector loads -- presumably one per input string.
// CHECK: load <16 x i8>
// CHECK: load <16 x i8>
// Expect a 16-lane boolean vector to be bitcast -- presumably the per-byte
// comparison result being collapsed into a mask; confirm against the IR.
// CHECK: bitcast <16 x i1>
// No panic path may appear after the matches above.
// CHECK-NOT: panic
s.eq_ignore_ascii_case(other)
}
Loading