Skip to content

Commit c87ef0a

Browse files
committed
Auto merge of #80749 - as-com:target-cpu-actually-native, r=nagisa
Make target-cpu=native detect individual features This PR makes target-cpu=native check for and enable/disable individual features instead of detecting and targeting a CPU by name. This brings the flag's behavior more in line with clang and gcc and ensures that the host actually supports each feature that we are compiling for. This should resolve issues with miscompilations on e.g. "Haswell" Pentiums and Celerons that lack support for AVX, and also enable support for `aes` on Broadwell processors that support it. It should also resolve issues with failing to detect feature support in newer CPUs that aren't yet known by LLVM (see: #80633). Fixes #54688 Fixes #48464 Fixes #38218
2 parents 26438b4 + 80ca198 commit c87ef0a

File tree

3 files changed

+38
-2
lines changed

3 files changed

+38
-2
lines changed

compiler/rustc_codegen_llvm/src/back/write.rs

+2-1
Original file line numberDiff line numberDiff line change
@@ -164,7 +164,8 @@ pub fn target_machine_factory(
164164

165165
let code_model = to_llvm_code_model(sess.code_model());
166166

167-
let features = attributes::llvm_target_features(sess).collect::<Vec<_>>();
167+
let mut features = llvm_util::handle_native_features(sess);
168+
features.extend(attributes::llvm_target_features(sess).map(|s| s.to_owned()));
168169
let mut singlethread = sess.target.singlethread;
169170

170171
// On the wasm target once the `atomics` feature is enabled that means that

compiler/rustc_codegen_llvm/src/llvm/ffi.rs

+4
Original file line numberDiff line numberDiff line change
@@ -1708,6 +1708,10 @@ extern "C" {
17081708
PM: &PassManager<'_>,
17091709
);
17101710

1711+
pub fn LLVMGetHostCPUFeatures() -> *mut c_char;
1712+
1713+
pub fn LLVMDisposeMessage(message: *mut c_char);
1714+
17111715
// Stuff that's in llvm-wrapper/ because it's not upstream yet.
17121716

17131717
/// Opens an object file.

compiler/rustc_codegen_llvm/src/llvm_util.rs

+32-1
Original file line numberDiff line numberDiff line change
@@ -8,7 +8,7 @@ use rustc_session::config::PrintRequest;
88
use rustc_session::Session;
99
use rustc_span::symbol::Symbol;
1010
use rustc_target::spec::{MergeFunctions, PanicStrategy};
11-
use std::ffi::CString;
11+
use std::ffi::{CStr, CString};
1212

1313
use std::slice;
1414
use std::str;
@@ -221,6 +221,37 @@ pub fn target_cpu(sess: &Session) -> &str {
221221
handle_native(name)
222222
}
223223

224+
pub fn handle_native_features(sess: &Session) -> Vec<String> {
225+
match sess.opts.cg.target_cpu {
226+
Some(ref s) => {
227+
if s != "native" {
228+
return vec![];
229+
}
230+
231+
let features_string = unsafe {
232+
let ptr = llvm::LLVMGetHostCPUFeatures();
233+
let features_string = if !ptr.is_null() {
234+
CStr::from_ptr(ptr)
235+
.to_str()
236+
.unwrap_or_else(|e| {
237+
bug!("LLVM returned a non-utf8 features string: {}", e);
238+
})
239+
.to_owned()
240+
} else {
241+
bug!("could not allocate host CPU features, LLVM returned a `null` string");
242+
};
243+
244+
llvm::LLVMDisposeMessage(ptr);
245+
246+
features_string
247+
};
248+
249+
features_string.split(",").map(|s| s.to_owned()).collect()
250+
}
251+
None => vec![],
252+
}
253+
}
254+
224255
pub fn tune_cpu(sess: &Session) -> Option<&str> {
225256
match sess.opts.debugging_opts.tune_cpu {
226257
Some(ref s) => Some(handle_native(&**s)),

0 commit comments

Comments
 (0)