Skip to content

Commit 76e75ae

Browse files
authored
Rollup merge of rust-lang#130991 - LaihoE:vectorized_slice_contains, r=Noratrieb
Vectorized SliceContains Godbolt for the u32 case: https://rust.godbolt.org/z/exT9xYWGs Unsure about: - Should align_to be used? It didn't seem to matter in my benchmark but maybe I was lucky with alignment? - Should u8/i8 also be implemented? Currently uses memchr (SWAR) Some benchmarks on x86 (contains called on an array with no matches, worst case may be slightly worse): ## Large N ![large_n_contains](https://github.com/user-attachments/assets/5be79072-970b-44be-a56c-16dc677dee46) ## Small N ![small_n_contains](https://github.com/user-attachments/assets/b8a33790-c176-459f-84f4-05feee893cd0)
2 parents 054b256 + 01ed719 commit 76e75ae

File tree

1 file changed

+26
-0
lines changed

1 file changed

+26
-0
lines changed

core/src/slice/cmp.rs

+26
Original file line numberDiff line numberDiff line change
@@ -257,3 +257,29 @@ impl SliceContains for i8 {
257257
memchr::memchr(byte, bytes).is_some()
258258
}
259259
}
260+
261+
macro_rules! impl_slice_contains {
262+
($($t:ty),*) => {
263+
$(
264+
impl SliceContains for $t {
265+
#[inline]
266+
fn slice_contains(&self, arr: &[$t]) -> bool {
267+
// Make our LANE_COUNT 4x the normal lane count (aiming for 128 bit vectors).
268+
// The compiler will nicely unroll it.
269+
const LANE_COUNT: usize = 4 * (128 / (mem::size_of::<$t>() * 8));
270+
// SIMD
271+
let mut chunks = arr.chunks_exact(LANE_COUNT);
272+
for chunk in &mut chunks {
273+
if chunk.iter().fold(false, |acc, x| acc | (*x == *self)) {
274+
return true;
275+
}
276+
}
277+
// Scalar remainder
278+
return chunks.remainder().iter().any(|x| *x == *self);
279+
}
280+
}
281+
)*
282+
};
283+
}
284+
285+
impl_slice_contains!(u16, u32, u64, i16, i32, i64, f32, f64, usize, isize);

0 commit comments

Comments
 (0)