1
Fork 0

Create a structure to define the features from to_llvm_features.

Rather than returning an array of features from to_llvm_features, return a structure that contains
the dependencies. This also contains metadata on how the features depend on each other to allow for
the correct enabling and disabling.
This commit is contained in:
Jamie Cunliffe 2023-05-22 14:46:40 +01:00
parent d51db4275b
commit a059e68d11
3 changed files with 133 additions and 70 deletions

View file

@ -10,6 +10,7 @@
#![feature(iter_intersperse)] #![feature(iter_intersperse)]
#![feature(let_chains)] #![feature(let_chains)]
#![feature(never_type)] #![feature(never_type)]
#![feature(impl_trait_in_assoc_type)]
#![recursion_limit = "256"] #![recursion_limit = "256"]
#![allow(rustc::potential_query_instability)] #![allow(rustc::potential_query_instability)]
#![deny(rustc::untranslatable_diagnostic)] #![deny(rustc::untranslatable_diagnostic)]

View file

@ -16,7 +16,6 @@ use rustc_session::config::PrintRequest;
use rustc_session::Session; use rustc_session::Session;
use rustc_span::symbol::Symbol; use rustc_span::symbol::Symbol;
use rustc_target::spec::{MergeFunctions, PanicStrategy}; use rustc_target::spec::{MergeFunctions, PanicStrategy};
use smallvec::{smallvec, SmallVec};
use std::ffi::{CStr, CString}; use std::ffi::{CStr, CString};
use std::path::Path; use std::path::Path;
@ -132,6 +131,60 @@ pub fn time_trace_profiler_finish(file_name: &Path) {
} }
} }
pub enum TargetFeatureFoldStrength<'a> {
// The feature is only tied when enabling the feature, disabling
// this feature shouldn't disable the tied feature.
EnableOnly(&'a str),
// The feature is tied for both enabling and disabling this feature.
Both(&'a str),
}
impl<'a> TargetFeatureFoldStrength<'a> {
fn as_str(&self) -> &'a str {
match self {
TargetFeatureFoldStrength::EnableOnly(feat) => feat,
TargetFeatureFoldStrength::Both(feat) => feat,
}
}
}
pub struct LLVMFeature<'a> {
pub llvm_feature_name: &'a str,
pub dependency: Option<TargetFeatureFoldStrength<'a>>,
}
impl<'a> LLVMFeature<'a> {
pub fn new(llvm_feature_name: &'a str) -> Self {
Self { llvm_feature_name, dependency: None }
}
pub fn with_dependency(
llvm_feature_name: &'a str,
dependency: TargetFeatureFoldStrength<'a>,
) -> Self {
Self { llvm_feature_name, dependency: Some(dependency) }
}
pub fn contains(&self, feat: &str) -> bool {
self.iter().any(|dep| dep == feat)
}
pub fn iter(&'a self) -> impl Iterator<Item = &'a str> {
let dependencies = self.dependency.iter().map(|feat| feat.as_str());
std::iter::once(self.llvm_feature_name).chain(dependencies)
}
}
impl<'a> IntoIterator for LLVMFeature<'a> {
type Item = &'a str;
type IntoIter = impl Iterator<Item = &'a str>;
fn into_iter(self) -> Self::IntoIter {
let dependencies = self.dependency.into_iter().map(|feat| feat.as_str());
std::iter::once(self.llvm_feature_name).chain(dependencies)
}
}
// WARNING: the features after applying `to_llvm_features` must be known // WARNING: the features after applying `to_llvm_features` must be known
// to LLVM or the feature detection code will walk past the end of the feature // to LLVM or the feature detection code will walk past the end of the feature
// array, leading to crashes. // array, leading to crashes.
@ -147,58 +200,65 @@ pub fn time_trace_profiler_finish(file_name: &Path) {
// Though note that Rust can also be build with an external precompiled version of LLVM // Though note that Rust can also be build with an external precompiled version of LLVM
// which might lead to failures if the oldest tested / supported LLVM version // which might lead to failures if the oldest tested / supported LLVM version
// doesn't yet support the relevant intrinsics // doesn't yet support the relevant intrinsics
// pub fn to_llvm_features<'a>(sess: &Session, s: &'a str) -> LLVMFeature<'a> {
// Note: The first feature in the list that is returned is the mapping to the feature that is
// provided from the `s` parameter.
pub fn to_llvm_features<'a>(sess: &Session, s: &'a str) -> SmallVec<[&'a str; 2]> {
let arch = if sess.target.arch == "x86_64" { "x86" } else { &*sess.target.arch }; let arch = if sess.target.arch == "x86_64" { "x86" } else { &*sess.target.arch };
match (arch, s) { match (arch, s) {
("x86", "sse4.2") => smallvec!["sse4.2", "crc32"], ("x86", "sse4.2") => {
("x86", "pclmulqdq") => smallvec!["pclmul"], LLVMFeature::with_dependency("sse4.2", TargetFeatureFoldStrength::EnableOnly("crc32"))
("x86", "rdrand") => smallvec!["rdrnd"], }
("x86", "bmi1") => smallvec!["bmi"], ("x86", "pclmulqdq") => LLVMFeature::new("pclmul"),
("x86", "cmpxchg16b") => smallvec!["cx16"], ("x86", "rdrand") => LLVMFeature::new("rdrnd"),
("aarch64", "rcpc2") => smallvec!["rcpc-immo"], ("x86", "bmi1") => LLVMFeature::new("bmi"),
("aarch64", "dpb") => smallvec!["ccpp"], ("x86", "cmpxchg16b") => LLVMFeature::new("cx16"),
("aarch64", "dpb2") => smallvec!["ccdp"], ("aarch64", "rcpc2") => LLVMFeature::new("rcpc-immo"),
("aarch64", "frintts") => smallvec!["fptoint"], ("aarch64", "dpb") => LLVMFeature::new("ccpp"),
("aarch64", "fcma") => smallvec!["complxnum"], ("aarch64", "dpb2") => LLVMFeature::new("ccdp"),
("aarch64", "pmuv3") => smallvec!["perfmon"], ("aarch64", "frintts") => LLVMFeature::new("fptoint"),
("aarch64", "paca") => smallvec!["pauth"], ("aarch64", "fcma") => LLVMFeature::new("complxnum"),
("aarch64", "pacg") => smallvec!["pauth"], ("aarch64", "pmuv3") => LLVMFeature::new("perfmon"),
("aarch64", "paca") => LLVMFeature::new("pauth"),
("aarch64", "pacg") => LLVMFeature::new("pauth"),
// Rust ties fp and neon together. // Rust ties fp and neon together.
("aarch64", "neon") => smallvec!["neon", "fp-armv8"], ("aarch64", "neon") => {
LLVMFeature::with_dependency("neon", TargetFeatureFoldStrength::Both("fp-armv8"))
}
// In LLVM neon implicitly enables fp, but we manually enable // In LLVM neon implicitly enables fp, but we manually enable
// neon when a feature only implicitly enables fp // neon when a feature only implicitly enables fp
("aarch64", "f32mm") => smallvec!["f32mm", "neon"], ("aarch64", "f32mm") => {
("aarch64", "f64mm") => smallvec!["f64mm", "neon"], LLVMFeature::with_dependency("f32mm", TargetFeatureFoldStrength::EnableOnly("neon"))
("aarch64", "fhm") => smallvec!["fp16fml", "neon"], }
("aarch64", "fp16") => smallvec!["fullfp16", "neon"], ("aarch64", "f64mm") => {
("aarch64", "jsconv") => smallvec!["jsconv", "neon"], LLVMFeature::with_dependency("f64mm", TargetFeatureFoldStrength::EnableOnly("neon"))
("aarch64", "sve") => smallvec!["sve", "neon"], }
("aarch64", "sve2") => smallvec!["sve2", "neon"], ("aarch64", "fhm") => {
("aarch64", "sve2-aes") => smallvec!["sve2-aes", "neon"], LLVMFeature::with_dependency("fp16fml", TargetFeatureFoldStrength::EnableOnly("neon"))
("aarch64", "sve2-sm4") => smallvec!["sve2-sm4", "neon"], }
("aarch64", "sve2-sha3") => smallvec!["sve2-sha3", "neon"], ("aarch64", "fp16") => {
("aarch64", "sve2-bitperm") => smallvec!["sve2-bitperm", "neon"], LLVMFeature::with_dependency("fullfp16", TargetFeatureFoldStrength::EnableOnly("neon"))
(_, s) => smallvec![s], }
} ("aarch64", "jsconv") => {
} LLVMFeature::with_dependency("jsconv", TargetFeatureFoldStrength::EnableOnly("neon"))
}
pub enum TargetFeatureFoldStrength { ("aarch64", "sve") => {
// The feature is only tied when enabling the feature, disabling LLVMFeature::with_dependency("sve", TargetFeatureFoldStrength::EnableOnly("neon"))
// this feature shouldn't disable the tied feature. }
EnableOnly, ("aarch64", "sve2") => {
// The feature is tied for both enabling and disabling this feature. LLVMFeature::with_dependency("sve2", TargetFeatureFoldStrength::EnableOnly("neon"))
Both, }
} ("aarch64", "sve2-aes") => {
LLVMFeature::with_dependency("sve2-aes", TargetFeatureFoldStrength::EnableOnly("neon"))
// Determines how the features are folded together, some features are }
// linked a lot more than some others. ("aarch64", "sve2-sm4") => {
pub fn feature_fold_strength<'a>(feats: &SmallVec<[&'a str; 2]>) -> TargetFeatureFoldStrength { LLVMFeature::with_dependency("sve2-sm4", TargetFeatureFoldStrength::EnableOnly("neon"))
match (feats.get(0), feats.get(1)) { }
(Some(&"neon"), Some(&"fp-armv8")) => TargetFeatureFoldStrength::Both, ("aarch64", "sve2-sha3") => {
_ => TargetFeatureFoldStrength::EnableOnly, LLVMFeature::with_dependency("sve2-sha3", TargetFeatureFoldStrength::EnableOnly("neon"))
}
("aarch64", "sve2-bitperm") => LLVMFeature::with_dependency(
"sve2-bitperm",
TargetFeatureFoldStrength::EnableOnly("neon"),
),
(_, s) => LLVMFeature::new(s),
} }
} }
@ -296,18 +356,17 @@ fn print_target_features(sess: &Session, tm: &llvm::TargetMachine) {
let mut rustc_target_features = supported_target_features(sess) let mut rustc_target_features = supported_target_features(sess)
.iter() .iter()
.map(|(feature, _gate)| { .map(|(feature, _gate)| {
let desc = if let Some(llvm_feature) = to_llvm_features(sess, *feature).first() { // LLVM asserts that these are sorted. LLVM and Rust both use byte comparison for these strings.
// LLVM asserts that these are sorted. LLVM and Rust both use byte comparison for these strings. let llvm_feature = to_llvm_features(sess, *feature).llvm_feature_name;
let desc =
match llvm_target_features.binary_search_by_key(&llvm_feature, |(f, _d)| f).ok() { match llvm_target_features.binary_search_by_key(&llvm_feature, |(f, _d)| f).ok() {
Some(index) => { Some(index) => {
known_llvm_target_features.insert(llvm_feature); known_llvm_target_features.insert(llvm_feature);
llvm_target_features[index].1 llvm_target_features[index].1
} }
None => "", None => "",
} };
} else {
""
};
(*feature, desc) (*feature, desc)
}) })
.collect::<Vec<_>>(); .collect::<Vec<_>>();
@ -491,17 +550,20 @@ pub(crate) fn global_llvm_features(sess: &Session, diagnostics: bool) -> Vec<Str
// passing requests down to LLVM. This means that all in-language // passing requests down to LLVM. This means that all in-language
// features also work on the command line instead of having two // features also work on the command line instead of having two
// different names when the LLVM name and the Rust name differ. // different names when the LLVM name and the Rust name differ.
let llvm_features = to_llvm_features(sess, feature); let llvm_feature = to_llvm_features(sess, feature);
Some(to_llvm_features(sess, feature).into_iter().enumerate().filter_map(
move |(idx, f)| match (enable_disable, feature_fold_strength(&llvm_features)) { Some(
('-' | '+', TargetFeatureFoldStrength::Both) std::iter::once(format!("{}{}", enable_disable, llvm_feature.llvm_feature_name))
| ('+', TargetFeatureFoldStrength::EnableOnly) => { .chain(llvm_feature.dependency.into_iter().filter_map(move |feat| {
Some(format!("{}{}", enable_disable, f)) match (enable_disable, feat) {
} ('-' | '+', TargetFeatureFoldStrength::Both(f))
_ if idx == 0 => Some(format!("{}{}", enable_disable, f)), | ('+', TargetFeatureFoldStrength::EnableOnly(f)) => {
_ => None, Some(format!("{}{}", enable_disable, f))
}, }
)) _ => None,
}
})),
)
}) })
.flatten(); .flatten();
features.extend(feats); features.extend(feats);

View file

@ -5,19 +5,19 @@
// The "+v8a" feature is matched as optional as it isn't added when we // The "+v8a" feature is matched as optional as it isn't added when we
// are targeting older LLVM versions. Once the min supported version // are targeting older LLVM versions. Once the min supported version
// is LLVM-14 we can remove the regex matching for this feature. // is LLVM-14 we can remove the optional regex matching for this feature.
// [ENABLE_SVE] compile-flags: -C target-feature=+sve // [ENABLE_SVE] compile-flags: -C target-feature=+sve
// ENABLE_SVE: attributes #0 = { {{.*}} "target-features"="+outline-atomics,+sve,+neon{{(,\+v8a)?}}" } // ENABLE_SVE: attributes #0 = { {{.*}} "target-features"="{{((\+outline-atomics,?)|(\+v8a,?)?|(\+sve,?)|(\+neon,?))*}}" }
// [DISABLE_SVE] compile-flags: -C target-feature=-sve // [DISABLE_SVE] compile-flags: -C target-feature=-sve
// DISABLE_SVE: attributes #0 = { {{.*}} "target-features"="+outline-atomics,-sve{{(,\+v8a)?}}" } // DISABLE_SVE: attributes #0 = { {{.*}} "target-features"="{{((\+outline-atomics,?)|(\+v8a,?)?|(-sve,?)|(\+neon,?))*}}" }
// [DISABLE_NEON] compile-flags: -C target-feature=-neon // [DISABLE_NEON] compile-flags: -C target-feature=-neon
// DISABLE_NEON: attributes #0 = { {{.*}} "target-features"="+outline-atomics,-neon,-fp-armv8{{(,\+v8a)?}}" } // DISABLE_NEON: attributes #0 = { {{.*}} "target-features"="{{((\+outline-atomics,?)|(\+v8a,?)?|(-fp-armv8,?)|(-neon,?))*}}" }
// [ENABLE_NEON] compile-flags: -C target-feature=+neon // [ENABLE_NEON] compile-flags: -C target-feature=+neon
// ENABLE_NEON: attributes #0 = { {{.*}} "target-features"="+outline-atomics,+neon,+fp-armv8{{(,\+v8a)?}}" } // ENABLE_NEON: attributes #0 = { {{.*}} "target-features"="{{((\+outline-atomics,?)|(\+v8a,?)?|(\+fp-armv8,?)|(\+neon,?))*}}" }
#![feature(no_core, lang_items)] #![feature(no_core, lang_items)]