1use std::collections::VecDeque;
2use std::ffi::{CStr, CString};
3use std::fmt::Write;
4use std::path::Path;
5use std::sync::Once;
6use std::{ptr, slice, str};
78use libc::c_int;
9use rustc_codegen_ssa::base::wants_wasm_eh;
10use rustc_codegen_ssa::target_features::cfg_target_feature;
11use rustc_codegen_ssa::{TargetConfig, target_features};
12use rustc_data_structures::fx::FxHashSet;
13use rustc_data_structures::small_c_str::SmallCStr;
14use rustc_fs_util::path_to_c_string;
15use rustc_middle::bug;
16use rustc_session::Session;
17use rustc_session::config::{PrintKind, PrintRequest};
18use rustc_target::spec::{
19Arch, CfgAbi, Env, MergeFunctions, Os, PanicStrategy, SmallDataThresholdSupport,
20};
21use smallvec::{SmallVec, smallvec};
2223use crate::back::write::create_informational_target_machine;
24use crate::{errors, llvm};
2526static INIT: Once = Once::new();
2728pub(crate) fn init(sess: &Session) {
29unsafe {
30// Before we touch LLVM, make sure that multithreading is enabled.
31if !llvm::LLVMIsMultithreaded().is_true() {
32::rustc_middle::util::bug::bug_fmt(format_args!("LLVM compiled without support for threads"));bug!("LLVM compiled without support for threads");
33 }
34INIT.call_once(|| {
35configure_llvm(sess);
36 });
37 }
38}
3940fn require_inited() {
41if !INIT.is_completed() {
42::rustc_middle::util::bug::bug_fmt(format_args!("LLVM is not initialized"));bug!("LLVM is not initialized");
43 }
44}
4546unsafe fn configure_llvm(sess: &Session) {
47let n_args = sess.opts.cg.llvm_args.len() + sess.target.llvm_args.len();
48let mut llvm_c_strs = Vec::with_capacity(n_args + 1);
49let mut llvm_args = Vec::with_capacity(n_args + 1);
5051unsafe {
52 llvm::LLVMRustInstallErrorHandlers();
53 }
54// On Windows, an LLVM assertion will open an Abort/Retry/Ignore dialog
55 // box for the purpose of launching a debugger. However, on CI this will
56 // cause it to hang until it times out, which can take several hours.
57if std::env::var_os("CI").is_some() {
58unsafe {
59 llvm::LLVMRustDisableSystemDialogsOnCrash();
60 }
61 }
6263fn llvm_arg_to_arg_name(full_arg: &str) -> &str {
64full_arg.trim().split(|c: char| c == '=' || c.is_whitespace()).next().unwrap_or("")
65 }
6667let cg_opts = sess.opts.cg.llvm_args.iter().map(AsRef::as_ref);
68let tg_opts = sess.target.llvm_args.iter().map(AsRef::as_ref);
69let sess_args = cg_opts.chain(tg_opts);
7071let user_specified_args: FxHashSet<_> =
72sess_args.clone().map(|s| llvm_arg_to_arg_name(s)).filter(|s| !s.is_empty()).collect();
7374 {
75// This adds the given argument to LLVM. Unless `force` is true
76 // user specified arguments are *not* overridden.
77let mut add = |arg: &str, force: bool| {
78if force || !user_specified_args.contains(llvm_arg_to_arg_name(arg)) {
79let s = CString::new(arg).unwrap();
80llvm_args.push(s.as_ptr());
81llvm_c_strs.push(s);
82 }
83 };
84// Set the llvm "program name" to make usage and invalid argument messages more clear.
85add("rustc -Cllvm-args=\"...\" with", true);
86if sess.opts.unstable_opts.time_llvm_passes {
87add("-time-passes", false);
88 }
89if sess.opts.unstable_opts.print_llvm_passes {
90add("-debug-pass=Structure", false);
91 }
92if sess.target.generate_arange_section
93 && !sess.opts.unstable_opts.no_generate_arange_section
94 {
95add("-generate-arange-section", false);
96 }
9798match sess.opts.unstable_opts.merge_functions.unwrap_or(sess.target.merge_functions) {
99 MergeFunctions::Disabled | MergeFunctions::Trampolines => {}
100 MergeFunctions::Aliases => {
101add("-mergefunc-use-aliases", false);
102 }
103 }
104105if wants_wasm_eh(sess) {
106add("-wasm-enable-eh", false);
107 }
108109if sess.target.os == Os::Emscripten110 && !sess.opts.unstable_opts.emscripten_wasm_eh
111 && sess.panic_strategy().unwinds()
112 {
113add("-enable-emscripten-cxx-exceptions", false);
114 }
115116// HACK(eddyb) LLVM inserts `llvm.assume` calls to preserve align attributes
117 // during inlining. Unfortunately these may block other optimizations.
118add("-preserve-alignment-assumptions-during-inlining=false", false);
119120// Use non-zero `import-instr-limit` multiplier for cold callsites.
121add("-import-cold-multiplier=0.1", false);
122123if sess.print_llvm_stats() {
124add("-stats", false);
125 }
126127for arg in sess_args {
128 add(&(*arg), true);
129 }
130131match (
132sess.opts.unstable_opts.small_data_threshold,
133sess.target.small_data_threshold_support(),
134 ) {
135// Set up the small-data optimization limit for architectures that use
136 // an LLVM argument to control this.
137(Some(threshold), SmallDataThresholdSupport::LlvmArg(arg)) => {
138add(&::alloc::__export::must_use({
::alloc::fmt::format(format_args!("--{0}={1}", arg, threshold))
})format!("--{arg}={threshold}"), false)
139 }
140_ => (),
141 };
142 }
143144if sess.opts.unstable_opts.llvm_time_trace {
145unsafe { llvm::LLVMRustTimeTraceProfilerInitialize() };
146 }
147148 rustc_llvm::initialize_available_targets();
149150unsafe { llvm::LLVMRustSetLLVMOptions(llvm_args.len() as c_int, llvm_args.as_ptr()) };
151}
152153pub(crate) fn time_trace_profiler_finish(file_name: &Path) {
154unsafe {
155let file_name = path_to_c_string(file_name);
156 llvm::LLVMRustTimeTraceProfilerFinish(file_name.as_ptr());
157 }
158}
159160enum TargetFeatureFoldStrength<'a> {
161// The feature is only tied when enabling the feature, disabling
162 // this feature shouldn't disable the tied feature.
163EnableOnly(&'a str),
164// The feature is tied for both enabling and disabling this feature.
165Both(&'a str),
166}
167168impl<'a> TargetFeatureFoldStrength<'a> {
169fn as_str(&self) -> &'a str {
170match self {
171 TargetFeatureFoldStrength::EnableOnly(feat) => feat,
172 TargetFeatureFoldStrength::Both(feat) => feat,
173 }
174 }
175}
176177pub(crate) struct LLVMFeature<'a> {
178 llvm_feature_name: &'a str,
179 dependencies: SmallVec<[TargetFeatureFoldStrength<'a>; 1]>,
180}
181182impl<'a> LLVMFeature<'a> {
183fn new(llvm_feature_name: &'a str) -> Self {
184Self { llvm_feature_name, dependencies: SmallVec::new() }
185 }
186187fn with_dependencies(
188 llvm_feature_name: &'a str,
189 dependencies: SmallVec<[TargetFeatureFoldStrength<'a>; 1]>,
190 ) -> Self {
191Self { llvm_feature_name, dependencies }
192 }
193}
194195impl<'a> IntoIteratorfor LLVMFeature<'a> {
196type Item = &'a str;
197type IntoIter = impl Iterator<Item = &'a str>;
198199fn into_iter(self) -> Self::IntoIter {
200let dependencies = self.dependencies.into_iter().map(|feat| feat.as_str());
201 std::iter::once(self.llvm_feature_name).chain(dependencies)
202 }
203}
204205/// Convert a Rust feature name to an LLVM feature name. Returning `None` means the
206/// feature should be skipped, usually because it is not supported by the current
207/// LLVM version.
208///
209/// WARNING: the features after applying `to_llvm_features` must be known
210/// to LLVM or the feature detection code will walk past the end of the feature
211/// array, leading to crashes.
212///
213/// To find a list of LLVM's names, see llvm-project/llvm/lib/Target/{ARCH}/*.td
214/// where `{ARCH}` is the architecture name. Look for instances of `SubtargetFeature`.
215///
216/// Check the current rustc fork of LLVM in the repo at
217/// <https://github.com/rust-lang/llvm-project/>. The commit in use can be found via the
218/// `llvm-project` submodule in <https://github.com/rust-lang/rust/tree/HEAD/src> Though note that
219/// Rust can also be build with an external precompiled version of LLVM which might lead to failures
220/// if the oldest tested / supported LLVM version doesn't yet support the relevant intrinsics.
221pub(crate) fn to_llvm_features<'a>(sess: &Session, s: &'a str) -> Option<LLVMFeature<'a>> {
222let (major, _, _) = get_version();
223match sess.target.arch {
224 Arch::AArch64 | Arch::Arm64EC => {
225match s {
226"rcpc2" => Some(LLVMFeature::new("rcpc-immo")),
227"dpb" => Some(LLVMFeature::new("ccpp")),
228"dpb2" => Some(LLVMFeature::new("ccdp")),
229"frintts" => Some(LLVMFeature::new("fptoint")),
230"fcma" => Some(LLVMFeature::new("complxnum")),
231"pmuv3" => Some(LLVMFeature::new("perfmon")),
232"paca" => Some(LLVMFeature::new("pauth")),
233"pacg" => Some(LLVMFeature::new("pauth")),
234"flagm2" => Some(LLVMFeature::new("altnzcv")),
235// Rust ties fp and neon together.
236"neon" => Some(LLVMFeature::with_dependencies(
237"neon",
238{
let count = 0usize + 1usize;
let mut vec = ::smallvec::SmallVec::new();
if count <= vec.inline_size() {
vec.push(TargetFeatureFoldStrength::Both("fp-armv8"));
vec
} else {
::smallvec::SmallVec::from_vec(::alloc::boxed::box_assume_init_into_vec_unsafe(::alloc::intrinsics::write_box_via_move(::alloc::boxed::Box::new_uninit(),
[TargetFeatureFoldStrength::Both("fp-armv8")])))
}
}smallvec![TargetFeatureFoldStrength::Both("fp-armv8")],
239 )),
240// In LLVM neon implicitly enables fp, but we manually enable
241 // neon when a feature only implicitly enables fp
242"fhm" => Some(LLVMFeature::new("fp16fml")),
243"fp16" => Some(LLVMFeature::new("fullfp16")),
244// Filter out features that are not supported by the current LLVM version
245"fpmr" => None, // only existed in 18
246 // Withdrawn by ARM; removed from LLVM in 22
247"tme" if major >= 22 => None,
248 s => Some(LLVMFeature::new(s)),
249 }
250 }
251 Arch::Arm => match s {
252"fp16" => Some(LLVMFeature::new("fullfp16")),
253 s => Some(LLVMFeature::new(s)),
254 },
255 Arch::Bpf => match s {
256"allows-misaligned-mem-access" if major < 22 => None,
257 s => Some(LLVMFeature::new(s)),
258 },
259// Filter out features that are not supported by the current LLVM version
260Arch::PowerPC | Arch::PowerPC64 => match s {
261"power8-crypto" => Some(LLVMFeature::new("crypto")),
262 s => Some(LLVMFeature::new(s)),
263 },
264 Arch::RiscV32 | Arch::RiscV64 => match s {
265// Filter out Rust-specific *virtual* target feature
266"zkne_or_zknd" => None,
267 s => Some(LLVMFeature::new(s)),
268 },
269 Arch::Sparc | Arch::Sparc64 => match s {
270"leoncasa" => Some(LLVMFeature::new("hasleoncasa")),
271 s => Some(LLVMFeature::new(s)),
272 },
273 Arch::Wasm32 | Arch::Wasm64 => match s {
274"gc" if major < 22 => None,
275 s => Some(LLVMFeature::new(s)),
276 },
277 Arch::X86 | Arch::X86_64 => {
278match s {
279"sse4.2" => Some(LLVMFeature::with_dependencies(
280"sse4.2",
281{
let count = 0usize + 1usize;
let mut vec = ::smallvec::SmallVec::new();
if count <= vec.inline_size() {
vec.push(TargetFeatureFoldStrength::EnableOnly("crc32"));
vec
} else {
::smallvec::SmallVec::from_vec(::alloc::boxed::box_assume_init_into_vec_unsafe(::alloc::intrinsics::write_box_via_move(::alloc::boxed::Box::new_uninit(),
[TargetFeatureFoldStrength::EnableOnly("crc32")])))
}
}smallvec![TargetFeatureFoldStrength::EnableOnly("crc32")],
282 )),
283"pclmulqdq" => Some(LLVMFeature::new("pclmul")),
284"rdrand" => Some(LLVMFeature::new("rdrnd")),
285"bmi1" => Some(LLVMFeature::new("bmi")),
286"cmpxchg16b" => Some(LLVMFeature::new("cx16")),
287"lahfsahf" => Some(LLVMFeature::new("sahf")),
288// Enable the evex512 target feature if an avx512 target feature is enabled.
289s if s.starts_with("avx512") && major < 22 => Some(LLVMFeature::with_dependencies(
290s,
291{
let count = 0usize + 1usize;
let mut vec = ::smallvec::SmallVec::new();
if count <= vec.inline_size() {
vec.push(TargetFeatureFoldStrength::EnableOnly("evex512"));
vec
} else {
::smallvec::SmallVec::from_vec(::alloc::boxed::box_assume_init_into_vec_unsafe(::alloc::intrinsics::write_box_via_move(::alloc::boxed::Box::new_uninit(),
[TargetFeatureFoldStrength::EnableOnly("evex512")])))
}
}smallvec![TargetFeatureFoldStrength::EnableOnly("evex512")],
292 )),
293"avx10.1" if major < 22 => Some(LLVMFeature::new("avx10.1-512")),
294"avx10.2" if major < 22 => Some(LLVMFeature::new("avx10.2-512")),
295"apxf" => Some(LLVMFeature::with_dependencies(
296"egpr",
297{
let count =
0usize + 1usize + 1usize + 1usize + 1usize + 1usize + 1usize + 1usize;
let mut vec = ::smallvec::SmallVec::new();
if count <= vec.inline_size() {
vec.push(TargetFeatureFoldStrength::Both("push2pop2"));
vec.push(TargetFeatureFoldStrength::Both("ppx"));
vec.push(TargetFeatureFoldStrength::Both("ndd"));
vec.push(TargetFeatureFoldStrength::Both("ccmp"));
vec.push(TargetFeatureFoldStrength::Both("cf"));
vec.push(TargetFeatureFoldStrength::Both("nf"));
vec.push(TargetFeatureFoldStrength::Both("zu"));
vec
} else {
::smallvec::SmallVec::from_vec(::alloc::boxed::box_assume_init_into_vec_unsafe(::alloc::intrinsics::write_box_via_move(::alloc::boxed::Box::new_uninit(),
[TargetFeatureFoldStrength::Both("push2pop2"),
TargetFeatureFoldStrength::Both("ppx"),
TargetFeatureFoldStrength::Both("ndd"),
TargetFeatureFoldStrength::Both("ccmp"),
TargetFeatureFoldStrength::Both("cf"),
TargetFeatureFoldStrength::Both("nf"),
TargetFeatureFoldStrength::Both("zu")])))
}
}smallvec![
298 TargetFeatureFoldStrength::Both("push2pop2"),
299 TargetFeatureFoldStrength::Both("ppx"),
300 TargetFeatureFoldStrength::Both("ndd"),
301 TargetFeatureFoldStrength::Both("ccmp"),
302 TargetFeatureFoldStrength::Both("cf"),
303 TargetFeatureFoldStrength::Both("nf"),
304 TargetFeatureFoldStrength::Both("zu"),
305 ],
306 )),
307 s => Some(LLVMFeature::new(s)),
308 }
309 }
310_ => Some(LLVMFeature::new(s)),
311 }
312}
313314/// Used to generate cfg variables and apply features.
315/// Must express features in the way Rust understands them.
316///
317/// We do not have to worry about RUSTC_SPECIFIC_FEATURES here, those are handled outside codegen.
318pub(crate) fn target_config(sess: &Session) -> TargetConfig {
319let target_machine = create_informational_target_machine(sess, true);
320321let (unstable_target_features, target_features) = cfg_target_feature(
322sess,
323 |feature| {
324to_llvm_features(sess, feature)
325 .map(|f| SmallVec::<[&str; 2]>::from_iter(f.into_iter()))
326 .unwrap_or_default()
327 },
328 |feature| {
329// This closure determines whether the target CPU has the feature according to LLVM. We do
330 // *not* consider the `-Ctarget-feature`s here, as that will be handled later in
331 // `cfg_target_feature`.
332if let Some(feat) = to_llvm_features(sess, feature) {
333// All the LLVM features this expands to must be enabled.
334for llvm_feature in feat {
335let cstr = SmallCStr::new(llvm_feature);
336// `LLVMRustHasFeature` is moderately expensive. On targets with many
337 // features (e.g. x86) these calls take a non-trivial fraction of runtime
338 // when compiling very small programs.
339if !unsafe { llvm::LLVMRustHasFeature(target_machine.raw(), cstr.as_ptr()) } {
340return false;
341 }
342 }
343true
344} else {
345false
346}
347 },
348 );
349350let mut cfg = TargetConfig {
351target_features,
352unstable_target_features,
353 has_reliable_f16: true,
354 has_reliable_f16_math: true,
355 has_reliable_f128: true,
356 has_reliable_f128_math: true,
357 };
358359update_target_reliable_float_cfg(sess, &mut cfg);
360cfg361}
362363/// Determine whether or not experimental float types are reliable based on known bugs.
364fn update_target_reliable_float_cfg(sess: &Session, cfg: &mut TargetConfig) {
365let target_arch = &sess.target.arch;
366let target_os = &sess.target.options.os;
367let target_env = &sess.target.options.env;
368let target_abi = &sess.target.options.cfg_abi;
369let target_pointer_width = sess.target.pointer_width;
370let version = get_version();
371let (major, _, _) = version;
372373cfg.has_reliable_f16 = match (target_arch, target_os) {
374// Unsupported <https://github.com/llvm/llvm-project/issues/94434> (fixed in llvm22)
375(Arch::Arm64EC, _) if major < 22 => false,
376// MinGW ABI bugs <https://gcc.gnu.org/bugzilla/show_bug.cgi?id=115054>
377(Arch::X86_64, Os::Windows) if *target_env == Env::Gnu && *target_abi != CfgAbi::Llvm => {
378false
379}
380// Infinite recursion <https://github.com/llvm/llvm-project/issues/97981>
381(Arch::CSky, _) if major < 22 => false, // (fixed in llvm22)
382(Arch::PowerPC | Arch::PowerPC64, _) if major < 22 => false, // (fixed in llvm22)
383(Arch::Sparc | Arch::Sparc64, _) if major < 22 => false, // (fixed in llvm22)
384(Arch::Wasm32 | Arch::Wasm64, _) if major < 22 => false, // (fixed in llvm22)
385 // `f16` support only requires that symbols converting to and from `f32` are available. We
386 // provide these in `compiler-builtins`, so `f16` should be available on all platforms that
387 // do not have other ABI issues or LLVM crashes.
388_ => true,
389 };
390391cfg.has_reliable_f128 = match (target_arch, target_os) {
392// Unsupported https://github.com/llvm/llvm-project/issues/121122
393(Arch::AmdGpu, _) => false,
394// Unsupported <https://github.com/llvm/llvm-project/issues/94434>
395(Arch::Arm64EC, _) => false,
396// Selection bug <https://github.com/llvm/llvm-project/issues/95471>. This issue is closed
397 // but basic math still does not work.
398(Arch::Nvptx64, _) => false,
399// ABI bugs <https://github.com/rust-lang/rust/issues/125109> et al. (full
400 // list at <https://github.com/rust-lang/rust/issues/116909>)
401(Arch::PowerPC | Arch::PowerPC64, _) => false,
402// ABI unsupported <https://github.com/llvm/llvm-project/issues/41838> (fixed in llvm22)
403(Arch::Sparc, _) if major < 22 => false,
404// MinGW ABI bugs <https://gcc.gnu.org/bugzilla/show_bug.cgi?id=115054>
405(Arch::X86_64, Os::Windows) if *target_env == Env::Gnu && *target_abi != CfgAbi::Llvm => {
406false
407}
408// There are no known problems on other platforms, so the only requirement is that symbols
409 // are available. `compiler-builtins` provides all symbols required for core `f128`
410 // support, so this should work for everything else.
411_ => true,
412 };
413414// Assume that working `f16` means working `f16` math for most platforms, since
415 // operations just go through `f32`.
416cfg.has_reliable_f16_math = cfg.has_reliable_f16;
417418cfg.has_reliable_f128_math = match (target_arch, target_os) {
419// LLVM lowers `fp128` math to `long double` symbols even on platforms where
420 // `long double` is not IEEE binary128. See
421 // <https://github.com/llvm/llvm-project/issues/44744>.
422 //
423 // This rules out anything that doesn't have `long double` = `binary128`; <= 32 bits
424 // (ld is `f64`), anything other than Linux (Windows and MacOS use `f64`), and `x86`
425 // (ld is 80-bit extended precision).
426 //
427 // musl does not implement the symbols required for f128 math at all.
428_ if *target_env == Env::Musl => false,
429 (Arch::X86_64, _) => false,
430 (_, Os::Linux) if target_pointer_width == 64 => true,
431_ => false,
432 } && cfg.has_reliable_f128;
433}
434435pub(crate) fn print_version() {
436let (major, minor, patch) = get_version();
437{
::std::io::_print(format_args!("LLVM version: {0}.{1}.{2}\n", major,
minor, patch));
};println!("LLVM version: {major}.{minor}.{patch}");
438}
439440pub(crate) fn get_version() -> (u32, u32, u32) {
441// Can be called without initializing LLVM
442unsafe {
443 (llvm::LLVMRustVersionMajor(), llvm::LLVMRustVersionMinor(), llvm::LLVMRustVersionPatch())
444 }
445}
446447pub(crate) fn print_passes() {
448// Can be called without initializing LLVM
449unsafe {
450 llvm::LLVMRustPrintPasses();
451 }
452}
453454fn llvm_target_features(tm: &llvm::TargetMachine) -> Vec<(&str, &str)> {
455let len = unsafe { llvm::LLVMRustGetTargetFeaturesCount(tm) };
456let mut ret = Vec::with_capacity(len);
457for i in 0..len {
458unsafe {
459let mut feature = ptr::null();
460let mut desc = ptr::null();
461 llvm::LLVMRustGetTargetFeature(tm, i, &mut feature, &mut desc);
462if feature.is_null() || desc.is_null() {
463::rustc_middle::util::bug::bug_fmt(format_args!("LLVM returned a `null` target feature string"));bug!("LLVM returned a `null` target feature string");
464 }
465let feature = CStr::from_ptr(feature).to_str().unwrap_or_else(|e| {
466::rustc_middle::util::bug::bug_fmt(format_args!("LLVM returned a non-utf8 feature string: {0}",
e));bug!("LLVM returned a non-utf8 feature string: {}", e);
467 });
468let desc = CStr::from_ptr(desc).to_str().unwrap_or_else(|e| {
469::rustc_middle::util::bug::bug_fmt(format_args!("LLVM returned a non-utf8 feature string: {0}",
e));bug!("LLVM returned a non-utf8 feature string: {}", e);
470 });
471 ret.push((feature, desc));
472 }
473 }
474ret475}
476477pub(crate) fn print(req: &PrintRequest, out: &mut String, sess: &Session) {
478require_inited();
479let tm = create_informational_target_machine(sess, false);
480match req.kind {
481 PrintKind::TargetCPUs => print_target_cpus(sess, tm.raw(), out),
482 PrintKind::TargetFeatures => print_target_features(sess, tm.raw(), out),
483_ => ::rustc_middle::util::bug::bug_fmt(format_args!("rustc_codegen_llvm can\'t handle print request: {0:?}",
req))bug!("rustc_codegen_llvm can't handle print request: {:?}", req),
484 }
485}
486487fn print_target_cpus(sess: &Session, tm: &llvm::TargetMachine, out: &mut String) {
488let cpu_names = llvm::build_string(|s| unsafe {
489 llvm::LLVMRustPrintTargetCPUs(&tm, s);
490 })
491 .unwrap();
492493struct Cpu<'a> {
494 cpu_name: &'a str,
495 remark: String,
496 }
497// Compare CPU against current target to label the default.
498let target_cpu = handle_native(&sess.target.cpu);
499let make_remark = |cpu_name| {
500if cpu_name == target_cpu {
501// FIXME(#132514): This prints the LLVM target string, which can be
502 // different from the Rust target string. Is that intended?
503let target = &sess.target.llvm_target;
504::alloc::__export::must_use({
::alloc::fmt::format(format_args!(" - This is the default target CPU for the current build target (currently {0}).",
target))
})format!(
505" - This is the default target CPU for the current build target (currently {target})."
506)507 } else {
508"".to_owned()
509 }
510 };
511let mut cpus = cpu_names512 .lines()
513 .map(|cpu_name| Cpu { cpu_name, remark: make_remark(cpu_name) })
514 .collect::<VecDeque<_>>();
515516// Only print the "native" entry when host and target are the same arch,
517 // since otherwise it could be wrong or misleading.
518if sess.host.arch == sess.target.arch {
519let host = get_host_cpu_name();
520cpus.push_front(Cpu {
521 cpu_name: "native",
522 remark: ::alloc::__export::must_use({
::alloc::fmt::format(format_args!(" - Select the CPU of the current host (currently {0}).",
host))
})format!(" - Select the CPU of the current host (currently {host})."),
523 });
524 }
525526let max_name_width = cpus.iter().map(|cpu| cpu.cpu_name.len()).max().unwrap_or(0);
527out.write_fmt(format_args!("Available CPUs for this target:\n"))writeln!(out, "Available CPUs for this target:").unwrap();
528for Cpu { cpu_name, remark } in cpus {
529// Only pad the CPU name if there's a remark to print after it.
530let width = if remark.is_empty() { 0 } else { max_name_width };
531out.write_fmt(format_args!(" {0:<1$}{2}\n", cpu_name, width, remark))writeln!(out, " {cpu_name:<width$}{remark}").unwrap();
532 }
533}
534535fn print_target_features(sess: &Session, tm: &llvm::TargetMachine, out: &mut String) {
536let mut llvm_target_features = llvm_target_features(tm);
537let mut known_llvm_target_features = FxHashSet::<&'static str>::default();
538let mut rustc_target_features = sess539 .target
540 .rust_target_features()
541 .iter()
542 .filter_map(|(feature, gate, _implied)| {
543if !gate.in_cfg() {
544// Only list (experimentally) supported features.
545return None;
546 }
547// LLVM asserts that these are sorted. LLVM and Rust both use byte comparison for these
548 // strings.
549let llvm_feature = to_llvm_features(sess, *feature)?.llvm_feature_name;
550let desc =
551match llvm_target_features.binary_search_by_key(&llvm_feature, |(f, _d)| f).ok() {
552Some(index) => {
553known_llvm_target_features.insert(llvm_feature);
554llvm_target_features[index].1
555}
556None => "",
557 };
558559Some((*feature, desc))
560 })
561 .collect::<Vec<_>>();
562563// Since we add this at the end ...
564rustc_target_features.extend_from_slice(&[(
565"crt-static",
566"Enables C Run-time Libraries to be statically linked",
567 )]);
568// ... we need to sort the list again.
569rustc_target_features.sort();
570571llvm_target_features.retain(|(f, _d)| !known_llvm_target_features.contains(f));
572573let max_feature_len = llvm_target_features574 .iter()
575 .chain(rustc_target_features.iter())
576 .map(|(feature, _desc)| feature.len())
577 .max()
578 .unwrap_or(0);
579580out.write_fmt(format_args!("Features supported by rustc for this target:\n"))writeln!(out, "Features supported by rustc for this target:").unwrap();
581for (feature, desc) in &rustc_target_features {
582out.write_fmt(format_args!(" {0:1$} - {2}.\n", feature, max_feature_len,
desc))writeln!(out, " {feature:max_feature_len$} - {desc}.").unwrap();
583 }
584out.write_fmt(format_args!("\nCode-generation features supported by LLVM for this target:\n"))writeln!(out, "\nCode-generation features supported by LLVM for this target:").unwrap();
585for (feature, desc) in &llvm_target_features {
586out.write_fmt(format_args!(" {0:1$} - {2}.\n", feature, max_feature_len,
desc))writeln!(out, " {feature:max_feature_len$} - {desc}.").unwrap();
587 }
588if llvm_target_features.is_empty() {
589out.write_fmt(format_args!(" Target features listing is not supported by this LLVM version.\n"))writeln!(out, " Target features listing is not supported by this LLVM version.")590 .unwrap();
591 }
592out.write_fmt(format_args!("\nUse +feature to enable a feature, or -feature to disable it.\n"))writeln!(out, "\nUse +feature to enable a feature, or -feature to disable it.").unwrap();
593out.write_fmt(format_args!("For example, rustc -C target-cpu=mycpu -C target-feature=+feature1,-feature2\n\n"))writeln!(out, "For example, rustc -C target-cpu=mycpu -C target-feature=+feature1,-feature2\n")594 .unwrap();
595out.write_fmt(format_args!("Code-generation features cannot be used in cfg or #[target_feature],\n"))writeln!(out, "Code-generation features cannot be used in cfg or #[target_feature],").unwrap();
596out.write_fmt(format_args!("and may be renamed or removed in a future version of LLVM or rustc.\n\n"))writeln!(out, "and may be renamed or removed in a future version of LLVM or rustc.\n").unwrap();
597}
598599/// Returns the host CPU name, according to LLVM.
600fn get_host_cpu_name() -> &'static str {
601let mut len = 0;
602// SAFETY: The underlying C++ global function returns a `StringRef` that
603 // isn't tied to any particular backing buffer, so it must be 'static.
604let slice: &'static [u8] = unsafe {
605let ptr = llvm::LLVMRustGetHostCPUName(&mut len);
606if !!ptr.is_null() {
::core::panicking::panic("assertion failed: !ptr.is_null()")
};assert!(!ptr.is_null());
607 slice::from_raw_parts(ptr, len)
608 };
609 str::from_utf8(slice).expect("host CPU name should be UTF-8")
610}
611612/// If the given string is `"native"`, returns the host CPU name according to
613/// LLVM. Otherwise, the string is returned as-is.
614fn handle_native(cpu_name: &str) -> &str {
615match cpu_name {
616"native" => get_host_cpu_name(),
617_ => cpu_name,
618 }
619}
620621pub(crate) fn target_cpu(sess: &Session) -> &str {
622let cpu_name = sess.opts.cg.target_cpu.as_deref().unwrap_or_else(|| &sess.target.cpu);
623handle_native(cpu_name)
624}
625626/// The target features for compiler flags other than `-Ctarget-features`.
627fn llvm_features_by_flags(sess: &Session, features: &mut Vec<String>) {
628if wants_wasm_eh(sess) && sess.panic_strategy() == PanicStrategy::Unwind {
629features.push("+exception-handling".into());
630 }
631632 target_features::retpoline_features_by_flags(sess, features);
633634// -Zfixed-x18
635if sess.opts.unstable_opts.fixed_x18 {
636if sess.target.arch != Arch::AArch64 {
637sess.dcx().emit_fatal(errors::FixedX18InvalidArch { arch: sess.target.arch.desc() });
638 } else {
639features.push("+reserve-x18".into());
640 }
641 }
642}
643644/// The list of LLVM features computed from CLI flags (`-Ctarget-cpu`, `-Ctarget-feature`,
645/// `--target` and similar).
646pub(crate) fn global_llvm_features(sess: &Session, only_base_features: bool) -> Vec<String> {
647// Features that come earlier are overridden by conflicting features later in the string.
648 // Typically we'll want more explicit settings to override the implicit ones, so:
649 //
650 // * Features from -Ctarget-cpu=*; are overridden by [^1]
651 // * Features implied by --target; are overridden by
652 // * Features from -Ctarget-feature; are overridden by
653 // * function specific features.
654 //
655 // [^1]: target-cpu=native is handled here, other target-cpu values are handled implicitly
656 // through LLVM TargetMachine implementation.
657 //
658 // FIXME(nagisa): it isn't clear what's the best interaction between features implied by
659 // `-Ctarget-cpu` and `--target` are. On one hand, you'd expect CLI arguments to always
660 // override anything that's implicit, so e.g. when there's no `--target` flag, features implied
661 // the host target are overridden by `-Ctarget-cpu=*`. On the other hand, what about when both
662 // `--target` and `-Ctarget-cpu=*` are specified? Both then imply some target features and both
663 // flags are specified by the user on the CLI. It isn't as clear-cut which order of precedence
664 // should be taken in cases like these.
665let mut features = ::alloc::vec::Vec::new()vec![];
666667// -Ctarget-cpu=native
668match sess.opts.cg.target_cpu {
669Some(ref s) if s == "native" => {
670// We have already figured out the actual CPU name with `LLVMRustGetHostCPUName` and set
671 // that for LLVM, so the features implied by that CPU name will be available everywhere.
672 // However, that is not sufficient: e.g. `skylake` alone is not sufficient to tell if
673 // some of the instructions are available or not. So we have to also explicitly ask for
674 // the exact set of features available on the host, and enable all of them.
675let features_string = unsafe {
676let ptr = llvm::LLVMGetHostCPUFeatures();
677let features_string = if !ptr.is_null() {
678CStr::from_ptr(ptr)
679 .to_str()
680 .unwrap_or_else(|e| {
681::rustc_middle::util::bug::bug_fmt(format_args!("LLVM returned a non-utf8 features string: {0}",
e));bug!("LLVM returned a non-utf8 features string: {}", e);
682 })
683 .to_owned()
684 } else {
685::rustc_middle::util::bug::bug_fmt(format_args!("could not allocate host CPU features, LLVM returned a `null` string"));bug!("could not allocate host CPU features, LLVM returned a `null` string");
686 };
687688 llvm::LLVMDisposeMessage(ptr);
689690features_string691 };
692if !features_string.is_empty() {
693features.extend(features_string.split(',').map(String::from));
694 }
695 }
696Some(_) | None => {}
697 };
698699let mut extend_backend_features = |feature: &str, enable: bool| {
700let enable_disable = if enable { '+' } else { '-' };
701// We run through `to_llvm_features` when
702 // passing requests down to LLVM. This means that all in-language
703 // features also work on the command line instead of having two
704 // different names when the LLVM name and the Rust name differ.
705let Some(llvm_feature) = to_llvm_features(sess, feature) else { return };
706707features.extend(
708 std::iter::once(::alloc::__export::must_use({
::alloc::fmt::format(format_args!("{0}{1}", enable_disable,
llvm_feature.llvm_feature_name))
})format!("{}{}", enable_disable, llvm_feature.llvm_feature_name)).chain(
709llvm_feature.dependencies.into_iter().filter_map(move |feat| {
710match (enable, feat) {
711 (_, TargetFeatureFoldStrength::Both(f))
712 | (true, TargetFeatureFoldStrength::EnableOnly(f)) => {
713Some(::alloc::__export::must_use({
::alloc::fmt::format(format_args!("{0}{1}", enable_disable, f))
})format!("{enable_disable}{f}"))
714 }
715_ => None,
716 }
717 }),
718 ),
719 );
720 };
721722// Features implied by an implicit or explicit `--target`.
723target_features::target_spec_to_backend_features(sess, &mut extend_backend_features);
724725// -Ctarget-features
726if !only_base_features {
727 target_features::flag_to_backend_features(sess, extend_backend_features);
728 }
729730// We add this in the "base target" so that these show up in `sess.unstable_target_features`.
731llvm_features_by_flags(sess, &mut features);
732733features734}
735736pub(crate) fn tune_cpu(sess: &Session) -> Option<&str> {
737let name = sess.opts.unstable_opts.tune_cpu.as_ref()?;
738Some(handle_native(name))
739}