Skip to content

Commit 67d6cc6

Browse files
authored
Rollup merge of #91608 - workingjubilee:fold-neon-fp, r=nagisa,Amanieu
Fold aarch64 feature +fp into +neon Arm's FEAT_FP and Feat_AdvSIMD describe the same thing on AArch64: The Neon unit, which handles both floating point and SIMD instructions. Moreover, a configuration for AArch64 must include both or neither. Arm says "entirely proprietary" toolchains may omit floating point: https://developer.arm.com/documentation/102374/0101/Data-processing---floating-point In the Programmer's Guide for Armv8-A, Arm says AArch64 can have both FP and Neon or neither in custom implementations: https://developer.arm.com/documentation/den0024/a/AArch64-Floating-point-and-NEON In "Bare metal boot code for Armv8-A", enabling Neon and FP is just disabling the same trap flag: https://developer.arm.com/documentation/dai0527/a In an unlikely future where "Neon and FP" become unrelated, we can add "[+-]fp" as its own feature flag. Until then, we can simplify programming with Rust on AArch64 by folding both into "[+-]neon", which is valid as it supersets both. "[+-]neon" is retained for niche uses such as firmware, kernels, "I just hate floats", and so on. I am... pretty sure no one is relying on this. An argument could be made that, as we are not an "entirely proprietary" toolchain, we should not support AArch64 without floats at all. I think that's a bit excessive. However, I want to recognize the intent: programming for AArch64 should be simplified where possible. For x86-64, programmers regularly set up illegal feature configurations because it's hard to understand them, see #89586. And per the above notes, plus the discussion in #86941, there should be no real use cases for leaving these features split: the two should in fact always go together. - Fixes #95002. - Fixes #95064. - Fixes #95122.
2 parents a4a5e79 + 6c19dc9 commit 67d6cc6

File tree

9 files changed

+155
-12
lines changed

9 files changed

+155
-12
lines changed

compiler/rustc_codegen_llvm/src/llvm_util.rs

+6-4
Original file line numberDiff line numberDiff line change
@@ -187,7 +187,6 @@ pub fn to_llvm_features<'a>(sess: &Session, s: &'a str) -> SmallVec<[&'a str; 2]
187187
("x86", "avx512vaes") => smallvec!["vaes"],
188188
("x86", "avx512gfni") => smallvec!["gfni"],
189189
("x86", "avx512vpclmulqdq") => smallvec!["vpclmulqdq"],
190-
("aarch64", "fp") => smallvec!["fp-armv8"],
191190
("aarch64", "rcpc2") => smallvec!["rcpc-immo"],
192191
("aarch64", "dpb") => smallvec!["ccpp"],
193192
("aarch64", "dpb2") => smallvec!["ccdp"],
@@ -230,6 +229,8 @@ pub fn check_tied_features(
230229
None
231230
}
232231

232+
// Used to generate cfg variables and apply features
233+
// Must express features in the way Rust understands them
233234
pub fn target_features(sess: &Session) -> Vec<Symbol> {
234235
let target_machine = create_informational_target_machine(sess);
235236
let mut features: Vec<Symbol> =
@@ -239,13 +240,14 @@ pub fn target_features(sess: &Session) -> Vec<Symbol> {
239240
if sess.is_nightly_build() || gate.is_none() { Some(feature) } else { None }
240241
})
241242
.filter(|feature| {
243+
// check that all features in a given smallvec are enabled
242244
for llvm_feature in to_llvm_features(sess, feature) {
243245
let cstr = SmallCStr::new(llvm_feature);
244-
if unsafe { llvm::LLVMRustHasFeature(target_machine, cstr.as_ptr()) } {
245-
return true;
246+
if !unsafe { llvm::LLVMRustHasFeature(target_machine, cstr.as_ptr()) } {
247+
return false;
246248
}
247249
}
248-
false
250+
true
249251
})
250252
.map(|feature| Symbol::intern(feature))
251253
.collect();

compiler/rustc_codegen_ssa/src/target_features.rs

+1-4
Original file line numberDiff line numberDiff line change
@@ -43,10 +43,8 @@ const ARM_ALLOWED_FEATURES: &[(&str, Option<Symbol>)] = &[
4343
];
4444

4545
const AARCH64_ALLOWED_FEATURES: &[(&str, Option<Symbol>)] = &[
46-
// FEAT_AdvSimd
46+
// FEAT_AdvSimd & FEAT_FP
4747
("neon", None),
48-
// FEAT_FP
49-
("fp", None),
5048
// FEAT_FP16
5149
("fp16", None),
5250
// FEAT_SVE
@@ -143,7 +141,6 @@ const AARCH64_ALLOWED_FEATURES: &[(&str, Option<Symbol>)] = &[
143141
];
144142

145143
const AARCH64_TIED_FEATURES: &[&[&str]] = &[
146-
&["fp", "neon"], // Silicon always has both, so avoid needless complications
147144
&["paca", "pacg"], // Together these represent `pauth` in LLVM
148145
];
149146

compiler/rustc_target/src/asm/aarch64.rs

+1-1
Original file line numberDiff line numberDiff line change
@@ -64,7 +64,7 @@ impl AArch64InlineAsmRegClass {
6464
match self {
6565
Self::reg => types! { _: I8, I16, I32, I64, F32, F64; },
6666
Self::vreg | Self::vreg_low16 => types! {
67-
fp: I8, I16, I32, I64, F32, F64,
67+
neon: I8, I16, I32, I64, F32, F64,
6868
VecI8(8), VecI16(4), VecI32(2), VecI64(1), VecF32(2), VecF64(1),
6969
VecI8(16), VecI16(8), VecI32(4), VecI64(2), VecF32(4), VecF64(2);
7070
},

library/std/tests/run-time-detect.rs

-1
Original file line numberDiff line numberDiff line change
@@ -29,7 +29,6 @@ fn aarch64_linux() {
2929
println!("neon: {}", is_aarch64_feature_detected!("neon"));
3030
println!("asimd: {}", is_aarch64_feature_detected!("asimd"));
3131
println!("pmull: {}", is_aarch64_feature_detected!("pmull"));
32-
println!("fp: {}", is_aarch64_feature_detected!("fp"));
3332
println!("fp16: {}", is_aarch64_feature_detected!("fp16"));
3433
println!("sve: {}", is_aarch64_feature_detected!("sve"));
3534
println!("crc: {}", is_aarch64_feature_detected!("crc"));

src/test/run-make-fulldeps/simd-ffi/Makefile

+1-1
Original file line numberDiff line numberDiff line change
@@ -41,7 +41,7 @@ define MK_TARGETS
4141
# now.
4242
$(1): simd.rs
4343
$$(RUSTC) --target=$(1) --emit=llvm-ir,asm simd.rs \
44-
-C target-feature='+fp,+neon,+sse2' -C extra-filename=-$(1)
44+
-C target-feature='+neon,+sse2' -C extra-filename=-$(1)
4545
endef
4646

4747
$(foreach targetxxx,$(TARGETS),$(eval $(call MK_TARGETS,$(targetxxx))))

src/test/ui/asm/aarch64/bad-reg.rs

+1-1
Original file line numberDiff line numberDiff line change
@@ -1,5 +1,5 @@
11
// only-aarch64
2-
// compile-flags: -C target-feature=+fp
2+
// compile-flags: -C target-feature=+neon
33

44
#![feature(asm_const, asm_sym)]
55

Original file line numberDiff line numberDiff line change
@@ -0,0 +1,23 @@
1+
// only-aarch64
2+
// run-pass
3+
#![allow(dead_code)]
4+
use std::arch::*;
5+
use std::arch::aarch64::*;
6+
7+
// Smoke test to verify aarch64 code that enables NEON compiles.
8+
fn main() {
9+
let _zero = if is_aarch64_feature_detected!("neon") {
10+
unsafe {
11+
let zeros = zero_vector();
12+
vgetq_lane_u8::<1>(zeros)
13+
}
14+
} else {
15+
0
16+
};
17+
}
18+
19+
20+
#[target_feature(enable = "neon")]
21+
unsafe fn zero_vector() -> uint8x16_t {
22+
vmovq_n_u8(0)
23+
}
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,58 @@
1+
// revisions: aarch64-neon aarch64-sve2
2+
// [aarch64-neon] compile-flags: -Ctarget-feature=+neon --target=aarch64-unknown-linux-gnu
3+
// [aarch64-neon] needs-llvm-components: aarch64
4+
// [aarch64-sve2] compile-flags: -Ctarget-feature=-neon,+sve2 --target=aarch64-unknown-linux-gnu
5+
// [aarch64-sve2] needs-llvm-components: aarch64
6+
// build-pass
7+
#![no_core]
8+
#![crate_type = "rlib"]
9+
#![feature(intrinsics, rustc_attrs, no_core, lang_items, staged_api)]
10+
#![stable(feature = "test", since = "1.0.0")]
11+
12+
// Tests vetting "feature hierarchies" in the cases where we impose them.
13+
14+
// Supporting minimal rust core code
15+
#[lang = "sized"]
16+
trait Sized {}
17+
#[lang = "copy"]
18+
trait Copy {}
19+
impl Copy for bool {}
20+
21+
extern "rust-intrinsic" {
22+
#[rustc_const_stable(feature = "test", since = "1.0.0")]
23+
fn unreachable() -> !;
24+
}
25+
26+
#[rustc_builtin_macro]
27+
macro_rules! cfg {
28+
($($cfg:tt)*) => {};
29+
}
30+
31+
// Test code
32+
const fn do_or_die(cond: bool) {
33+
if cond {
34+
} else {
35+
unsafe { unreachable() }
36+
}
37+
}
38+
39+
macro_rules! assert {
40+
($x:expr $(,)?) => {
41+
const _: () = do_or_die($x);
42+
};
43+
}
44+
45+
46+
#[cfg(aarch64_neon)]
47+
fn check_neon_not_sve2() {
48+
// This checks that a normal aarch64 target doesn't suddenly jump up the feature hierarchy.
49+
assert!(cfg!(target_feature = "neon"));
50+
assert!(cfg!(not(target_feature = "sve2")));
51+
}
52+
53+
#[cfg(aarch64_sve2)]
54+
fn check_sve2_includes_neon() {
55+
// This checks that aarch64's sve2 includes neon
56+
assert!(cfg!(target_feature = "neon"));
57+
assert!(cfg!(target_feature = "sve2"));
58+
}
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,64 @@
1+
// revisions: aarch64 x86-64
2+
// [aarch64] compile-flags: -Ctarget-feature=+neon,+fp16,+fhm --target=aarch64-unknown-linux-gnu
3+
// [aarch64] needs-llvm-components: aarch64
4+
// [x86-64] compile-flags: -Ctarget-feature=+sse4.2,+rdrand --target=x86_64-unknown-linux-gnu
5+
// [x86-64] needs-llvm-components: x86
6+
// build-pass
7+
#![no_core]
8+
#![crate_type = "rlib"]
9+
#![feature(intrinsics, rustc_attrs, no_core, lang_items, staged_api)]
10+
#![stable(feature = "test", since = "1.0.0")]
11+
12+
// Supporting minimal rust core code
13+
#[lang = "sized"]
14+
trait Sized {}
15+
#[lang = "copy"]
16+
trait Copy {}
17+
impl Copy for bool {}
18+
19+
extern "rust-intrinsic" {
20+
#[rustc_const_stable(feature = "test", since = "1.0.0")]
21+
fn unreachable() -> !;
22+
}
23+
24+
#[rustc_builtin_macro]
25+
macro_rules! cfg {
26+
($($cfg:tt)*) => {};
27+
}
28+
29+
// Test code
30+
const fn do_or_die(cond: bool) {
31+
if cond {
32+
} else {
33+
unsafe { unreachable() }
34+
}
35+
}
36+
37+
macro_rules! assert {
38+
($x:expr $(,)?) => {
39+
const _: () = do_or_die($x);
40+
};
41+
}
42+
43+
44+
#[cfg(target_arch = "aarch64")]
45+
fn check_aarch64() {
46+
// This checks that the rustc feature name is used, not the LLVM feature.
47+
assert!(cfg!(target_feature = "neon"));
48+
assert!(cfg!(not(target_feature = "fp-armv8")));
49+
assert!(cfg!(target_feature = "fhm"));
50+
assert!(cfg!(not(target_feature = "fp16fml")));
51+
assert!(cfg!(target_feature = "fp16"));
52+
assert!(cfg!(not(target_feature = "fullfp16")));
53+
}
54+
55+
#[cfg(target_arch = "x86_64")]
56+
fn check_x86_64() {
57+
// This checks that the rustc feature name is used, not the LLVM feature.
58+
assert!(cfg!(target_feature = "rdrand"));
59+
assert!(cfg!(not(target_feature = "rdrnd")));
60+
61+
// Likewise: We enable LLVM's crc32 feature with SSE4.2, but Rust says it's just SSE4.2
62+
assert!(cfg!(target_feature = "sse4.2"));
63+
assert!(cfg!(not(target_feature = "crc32")));
64+
}

0 commit comments

Comments
 (0)