Skip to content

Commit 1a1e6b8

Browse files
committed
Auto merge of #28338 - erickt:str-cmp, r=bluss
LLVM seems to be having some trouble optimizing the iterator-based string comparison method into something equivalent to memcmp. This explicitly calls out to the memcmp intrinsic in order to allow LLVM to generate better code. In some manual benchmarking, this memcmp-based approach is about 20 times faster than the iterator approach.
2 parents 883b5cf + fbd91a7 commit 1a1e6b8

File tree

1 file changed

+20
-15
lines changed

1 file changed

+20
-15
lines changed

src/libcore/str/mod.rs

+20-15
Original file line numberDiff line numberDiff line change
@@ -896,14 +896,18 @@ Section: Comparing strings
896896
#[lang = "str_eq"]
897897
#[inline]
898898
fn eq_slice(a: &str, b: &str) -> bool {
899+
a.len() == b.len() && unsafe { cmp_slice(a, b, a.len()) == 0 }
900+
}
901+
902+
/// Bytewise slice comparison.
903+
/// NOTE: This uses the system's memcmp, which is currently dramatically
904+
/// faster than comparing each byte in a loop.
905+
#[inline]
906+
unsafe fn cmp_slice(a: &str, b: &str, len: usize) -> i32 {
899907
// NOTE: In theory n should be libc::size_t and not usize, but libc is not available here
900908
#[allow(improper_ctypes)]
901909
extern { fn memcmp(s1: *const i8, s2: *const i8, n: usize) -> i32; }
902-
a.len() == b.len() && unsafe {
903-
memcmp(a.as_ptr() as *const i8,
904-
b.as_ptr() as *const i8,
905-
a.len()) == 0
906-
}
910+
memcmp(a.as_ptr() as *const i8, b.as_ptr() as *const i8, len)
907911
}
908912

909913
/*
@@ -1039,8 +1043,8 @@ Section: Trait implementations
10391043
*/
10401044

10411045
mod traits {
1042-
use cmp::{Ordering, Ord, PartialEq, PartialOrd, Eq};
1043-
use cmp::Ordering::{Less, Equal, Greater};
1046+
use cmp::{self, Ordering, Ord, PartialEq, PartialOrd, Eq};
1047+
use cmp::Ordering::{Less, Greater};
10441048
use iter::Iterator;
10451049
use option::Option;
10461050
use option::Option::Some;
@@ -1051,15 +1055,16 @@ mod traits {
10511055
impl Ord for str {
10521056
#[inline]
10531057
fn cmp(&self, other: &str) -> Ordering {
1054-
for (s_b, o_b) in self.bytes().zip(other.bytes()) {
1055-
match s_b.cmp(&o_b) {
1056-
Greater => return Greater,
1057-
Less => return Less,
1058-
Equal => ()
1059-
}
1058+
let cmp = unsafe {
1059+
super::cmp_slice(self, other, cmp::min(self.len(), other.len()))
1060+
};
1061+
if cmp == 0 {
1062+
self.len().cmp(&other.len())
1063+
} else if cmp < 0 {
1064+
Less
1065+
} else {
1066+
Greater
10601067
}
1061-
1062-
self.len().cmp(&other.len())
10631068
}
10641069
}
10651070

0 commit comments

Comments
 (0)