PR feedback
This commit is contained in:
parent
e30cb329d8
commit
4207c786e7
2 changed files with 20 additions and 14 deletions
|
@ -1,8 +1,16 @@
|
|||
//@ compile-flags: -Copt-level=3
|
||||
//@ revisions: host x86-64-v3
|
||||
//@ revisions: host x86-64 x86-64-v3
|
||||
//@ min-llvm-version: 20
|
||||
|
||||
// This particular CPU regressed in #131563
|
||||
//@[host] ignore-x86_64
|
||||
|
||||
// Set the base cpu explicitly, in case the default has been changed.
|
||||
//@[x86-64] only-x86_64
|
||||
//@[x86-64] compile-flags: -Ctarget-cpu=x86-64
|
||||
|
||||
// FIXME(cuviper) x86-64-v3 in particular regressed in #131563, and the workaround
|
||||
// at the time still sometimes fails, so only verify it for the power-of-two size
|
||||
// - https://github.com/llvm/llvm-project/issues/134735
|
||||
//@[x86-64-v3] only-x86_64
|
||||
//@[x86-64-v3] compile-flags: -Ctarget-cpu=x86-64-v3
|
||||
|
||||
|
@ -12,16 +20,14 @@
|
|||
pub fn test() -> usize {
|
||||
// CHECK-LABEL: @test(
|
||||
// host: ret {{i64|i32}} 165
|
||||
// x86-64: ret {{i64|i32}} 165
|
||||
|
||||
// FIXME: Now that this autovectorizes via a masked load, it doesn't actually
|
||||
// const-fold for certain widths. The `test_eight` case below shows that, yes,
|
||||
// what we're emitting *can* be const-folded, except that the way LLVM does it
|
||||
// for certain widths doesn't today. We should be able to put this back to
|
||||
// the same check after <https://github.com/llvm/llvm-project/issues/134513>
|
||||
// x86-64-v3: <i64 23, i64 16, i64 54, i64 3>
|
||||
// x86-64-v3: llvm.masked.load
|
||||
// x86-64-v3: %[[R:.+]] = {{.+}}llvm.vector.reduce.add.v4i64
|
||||
// x86-64-v3: ret i64 %[[R]]
|
||||
// x86-64-v3: masked.load
|
||||
|
||||
let values = [23, 16, 54, 3, 60, 9];
|
||||
let mut acc = 0;
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue