Auto merge of #79801 - eddyb:scalar-transmute, r=nagisa
rustc_codegen_ssa: use bitcasts instead of type punning for scalar transmutes. This specifically helps with `f32` <-> `u32` (`from_bits`, `to_bits`) in Rust-GPU (`rustc_codegen_spirv`), where (AFAIK) we don't yet have enough infrastructure to turn type-punning memory accesses into SSA bitcasts. (There may be more instances, but the one I've seen myself is `f32::signum` from `num-traits`, which inspects e.g. the sign bit.) Sadly, I've had to make an exception for `transmute`s between pointers and non-pointers, as LLVM disallows using `bitcast` for them. r? `@nagisa` cc `@khyperia`
This commit is contained in:
commit
d7560e8968
2 changed files with 104 additions and 0 deletions
|
@ -1395,6 +1395,25 @@ impl<'a, 'tcx, Bx: BuilderMethods<'a, 'tcx>> FunctionCx<'a, 'tcx, Bx> {
|
||||||
dst: PlaceRef<'tcx, Bx::Value>,
|
dst: PlaceRef<'tcx, Bx::Value>,
|
||||||
) {
|
) {
|
||||||
let src = self.codegen_operand(bx, src);
|
let src = self.codegen_operand(bx, src);
|
||||||
|
|
||||||
|
// Special-case transmutes between scalars as simple bitcasts.
|
||||||
|
match (&src.layout.abi, &dst.layout.abi) {
|
||||||
|
(abi::Abi::Scalar(src_scalar), abi::Abi::Scalar(dst_scalar)) => {
|
||||||
|
// HACK(eddyb) LLVM doesn't like `bitcast`s between pointers and non-pointers.
|
||||||
|
if (src_scalar.value == abi::Pointer) == (dst_scalar.value == abi::Pointer) {
|
||||||
|
assert_eq!(src.layout.size, dst.layout.size);
|
||||||
|
|
||||||
|
// NOTE(eddyb) the `from_immediate` and `to_immediate_scalar`
|
||||||
|
// conversions allow handling `bool`s the same as `u8`s.
|
||||||
|
let src = bx.from_immediate(src.immediate());
|
||||||
|
let src_as_dst = bx.bitcast(src, bx.backend_type(dst.layout));
|
||||||
|
Immediate(bx.to_immediate_scalar(src_as_dst, dst_scalar)).store(bx, dst);
|
||||||
|
return;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
_ => {}
|
||||||
|
}
|
||||||
|
|
||||||
let llty = bx.backend_type(src.layout);
|
let llty = bx.backend_type(src.layout);
|
||||||
let cast_ptr = bx.pointercast(dst.llval, bx.type_ptr_to(llty));
|
let cast_ptr = bx.pointercast(dst.llval, bx.type_ptr_to(llty));
|
||||||
let align = src.layout.align.abi.min(dst.align);
|
let align = src.layout.align.abi.min(dst.align);
|
||||||
|
|
85
src/test/codegen/transmute-scalar.rs
Normal file
85
src/test/codegen/transmute-scalar.rs
Normal file
|
@ -0,0 +1,85 @@
|
||||||
|
// compile-flags: -O -C no-prepopulate-passes
|
||||||
|
|
||||||
|
#![crate_type = "lib"]
|
||||||
|
|
||||||
|
// FIXME(eddyb) all of these tests show memory stores and loads, even after a
|
||||||
|
// scalar `bitcast`; more special-casing is required to remove `alloca` usage.
|
||||||
|
|
||||||
|
// CHECK: define i32 @f32_to_bits(float %x)
|
||||||
|
// CHECK: %2 = bitcast float %x to i32
|
||||||
|
// CHECK-NEXT: store i32 %2, i32* %0
|
||||||
|
// CHECK-NEXT: %3 = load i32, i32* %0
|
||||||
|
// CHECK: ret i32 %3
|
||||||
|
// Transmutes an `f32` argument into a `u32` (scalar -> scalar, neither a pointer).
// The FileCheck directives above expect this to lower to a direct
// `bitcast float %x to i32`, followed by a store/load through the return slot.
// `#[no_mangle]` keeps the symbol name stable so the `define` line can match it.
#[no_mangle]
|
||||||
|
pub fn f32_to_bits(x: f32) -> u32 {
|
||||||
|
unsafe { std::mem::transmute(x) }
|
||||||
|
}
|
||||||
|
|
||||||
|
// CHECK: define i8 @bool_to_byte(i1 zeroext %b)
|
||||||
|
// CHECK: %1 = zext i1 %b to i8
|
||||||
|
// CHECK-NEXT: store i8 %1, i8* %0
|
||||||
|
// CHECK-NEXT: %2 = load i8, i8* %0
|
||||||
|
// CHECK: ret i8 %2
|
||||||
|
// Transmutes a `bool` argument into a `u8`.
// The FileCheck directives above expect the `i1` immediate to be widened with
// `zext i1 %b to i8` before being stored, i.e. the `bool` is handled like a `u8`.
// `#[no_mangle]` keeps the symbol name stable so the `define` line can match it.
#[no_mangle]
|
||||||
|
pub fn bool_to_byte(b: bool) -> u8 {
|
||||||
|
unsafe { std::mem::transmute(b) }
|
||||||
|
}
|
||||||
|
|
||||||
|
// CHECK: define zeroext i1 @byte_to_bool(i8 %byte)
|
||||||
|
// CHECK: %1 = trunc i8 %byte to i1
|
||||||
|
// CHECK-NEXT: %2 = zext i1 %1 to i8
|
||||||
|
// CHECK-NEXT: store i8 %2, i8* %0
|
||||||
|
// CHECK-NEXT: %3 = load i8, i8* %0
|
||||||
|
// CHECK-NEXT: %4 = trunc i8 %3 to i1
|
||||||
|
// CHECK: ret i1 %4
|
||||||
|
// Transmutes a `u8` argument into a `bool`.
// The FileCheck directives above expect a `trunc i8 %byte to i1`, a `zext` back
// to `i8` for the in-memory store, and a final `trunc` to `i1` for the return.
// NOTE(review): presumably declared `unsafe fn` because not every `u8` value is
// a valid `bool` -- confirm the intended caller contract.
#[no_mangle]
|
||||||
|
pub unsafe fn byte_to_bool(byte: u8) -> bool {
|
||||||
|
std::mem::transmute(byte)
|
||||||
|
}
|
||||||
|
|
||||||
|
// CHECK: define i8* @ptr_to_ptr(i16* %p)
|
||||||
|
// CHECK: %2 = bitcast i16* %p to i8*
|
||||||
|
// CHECK-NEXT: store i8* %2, i8** %0
|
||||||
|
// CHECK-NEXT: %3 = load i8*, i8** %0
|
||||||
|
// CHECK: ret i8* %3
|
||||||
|
// Transmutes a `*mut u16` argument into a `*mut u8` (pointer -> pointer).
// The FileCheck directives above expect a direct `bitcast i16* %p to i8*`,
// followed by a store/load through the return slot.
// `#[no_mangle]` keeps the symbol name stable so the `define` line can match it.
#[no_mangle]
|
||||||
|
pub fn ptr_to_ptr(p: *mut u16) -> *mut u8 {
|
||||||
|
unsafe { std::mem::transmute(p) }
|
||||||
|
}
|
||||||
|
|
||||||
|
// HACK(eddyb) scalar `transmute`s between pointers and non-pointers are
|
||||||
|
// currently not special-cased like other scalar `transmute`s, because
|
||||||
|
// LLVM requires specifically `ptrtoint`/`inttoptr` instead of `bitcast`.
|
||||||
|
//
|
||||||
|
// Tests below show the non-special-cased behavior (with the possible
|
||||||
|
// future special-cased instructions in the "NOTE(eddyb)" comments).
|
||||||
|
|
||||||
|
// CHECK: define [[USIZE:i[0-9]+]] @ptr_to_int(i16* %p)
|
||||||
|
|
||||||
|
// NOTE(eddyb) see above, the following two CHECK lines should ideally be this:
|
||||||
|
// %2 = ptrtoint i16* %p to [[USIZE]]
|
||||||
|
// store [[USIZE]] %2, [[USIZE]]* %0
|
||||||
|
// CHECK: %2 = bitcast [[USIZE]]* %0 to i16**
|
||||||
|
// CHECK-NEXT: store i16* %p, i16** %2
|
||||||
|
|
||||||
|
// CHECK-NEXT: %3 = load [[USIZE]], [[USIZE]]* %0
|
||||||
|
// CHECK: ret [[USIZE]] %3
|
||||||
|
// Transmutes a `*mut u16` argument into a `usize` (pointer -> non-pointer).
// This case is not special-cased: the FileCheck directives above expect the
// destination slot to be cast to `i16**` and the pointer stored through it,
// rather than a `ptrtoint` on the value itself.
#[no_mangle]
|
||||||
|
pub fn ptr_to_int(p: *mut u16) -> usize {
|
||||||
|
unsafe { std::mem::transmute(p) }
|
||||||
|
}
|
||||||
|
|
||||||
|
// CHECK: define i16* @int_to_ptr([[USIZE]] %i)
|
||||||
|
|
||||||
|
// NOTE(eddyb) see above, the following two CHECK lines should ideally be this:
|
||||||
|
// %2 = inttoptr [[USIZE]] %i to i16*
|
||||||
|
// store i16* %2, i16** %0
|
||||||
|
// CHECK: %2 = bitcast i16** %0 to [[USIZE]]*
|
||||||
|
// CHECK-NEXT: store [[USIZE]] %i, [[USIZE]]* %2
|
||||||
|
|
||||||
|
// CHECK-NEXT: %3 = load i16*, i16** %0
|
||||||
|
// CHECK: ret i16* %3
|
||||||
|
// Transmutes a `usize` argument into a `*mut u16` (non-pointer -> pointer).
// This case is not special-cased: the FileCheck directives above expect the
// destination slot to be cast to a `usize` pointer and the integer stored
// through it, rather than an `inttoptr` on the value itself.
#[no_mangle]
|
||||||
|
pub fn int_to_ptr(i: usize) -> *mut u16 {
|
||||||
|
unsafe { std::mem::transmute(i) }
|
||||||
|
}
|
Loading…
Add table
Add a link
Reference in a new issue