llvm-project/llvm/test/CodeGen/AMDGPU/schedule-amdgpu-tracker-physreg-crash.ll
Shilei Tian 75cf046f03 Re-apply "[AMDGPU] Fix test failures when expensive checks are enabled (#130644)"
As suggested on
5ec884e5d8 (commitcomment-153707488)
this seems to fix the following tests when building with -DLLVM_ENABLE_EXPENSIVE_CHECKS=ON:

  LLVM :: CodeGen/AMDGPU/materialize-frame-index-sgpr.gfx10.ll
  LLVM :: CodeGen/AMDGPU/materialize-frame-index-sgpr.ll
  LLVM :: CodeGen/AMDGPU/schedule-amdgpu-tracker-physreg-crash.ll

> This PR fixes test failures introduced in #127353 when expensive checks
> are enabled.
>
> For `llvm/test/CodeGen/AMDGPU/materialize-frame-index-sgpr.ll` and
> `llvm/test/CodeGen/AMDGPU/materialize-frame-index-sgpr.gfx10.ll`, `s59`
> is no longer in live-ins because it is caller saved. Switch to `s55` in
> this PR.
2025-03-14 09:49:20 +01:00

66 lines
2.7 KiB
LLVM

; RUN: not llc -mtriple=amdgcn-amd-amdhsa -mcpu=gfx900 -mattr=+xnack -amdgpu-use-amdgpu-trackers=1 2>&1 < %s | FileCheck -check-prefixes=ERR-GCNTRACKERS %s
; RUN: llc -mtriple=amdgcn-amd-amdhsa -mcpu=gfx900 -mattr=+xnack 2>&1 < %s | FileCheck -check-prefixes=GCN %s
%asm.output = type { <16 x i32>, <16 x i32>, <16 x i32>, <8 x i32>, <2 x i32>, i32, ; sgprs
<16 x i32>, <7 x i32>, ; vgprs
i64 ; vcc
}
%asm.output2 = type { <16 x i32>, <16 x i32>, <16 x i32>, <8 x i32>, <2 x i32>, i32, ; sgprs
<16 x i32>, <5 x i32>, ; vgprs
i64 ; vcc
}
%asm.output3 = type { <16 x i32>, <16 x i32>, <16 x i32>, <8 x i32>, <2 x i32>, ; sgprs
<16 x i32>, <6 x i32>, ; vgprs
i64 ; vcc
}
; ERR-GCNTRACKERS: ran out of registers during register allocation
; GCN-NOT: ran out of registers during register allocation
; FIXME: GCN Trackers do not track pressure from PhysRegs, so scheduling is actually worse
define void @scalar_mov_materializes_frame_index_no_live_scc_no_live_sgprs() #0 {
%alloca0 = alloca [4096 x i32], align 64, addrspace(5)
%alloca1 = alloca i32, align 4, addrspace(5)
call void asm sideeffect "; use alloca0 $0", "v"(ptr addrspace(5) %alloca0)
%asm = call %asm.output asm sideeffect
"; def $0, $1, $2, $3, $4, $5, $6, $7, $8",
"={s[0:15]},={s[16:31]},={s[32:47]},={s[48:55]},={s[56:57]},={s58},={v[0:15]},={v[16:22]},={vcc}"()
%s0 = extractvalue %asm.output %asm, 0
%s1 = extractvalue %asm.output %asm, 1
%s2 = extractvalue %asm.output %asm, 2
%s3 = extractvalue %asm.output %asm, 3
%s4 = extractvalue %asm.output %asm, 4
%s5 = extractvalue %asm.output %asm, 5
%v0 = extractvalue %asm.output %asm, 6
%v1 = extractvalue %asm.output %asm, 7
%vcc = extractvalue %asm.output %asm, 8
; scc is unavailable since it is live in
call void asm sideeffect "; use $0, $1, $2, $3, $4, $5, $6, $7, $8, $9, $10",
"{s[0:15]},{s[16:31]},{s[32:47]},{s[48:55]},{s[56:57]},{s58},{v[0:15]},{v[16:22]},{vcc},{s64},{scc}"(
<16 x i32> %s0,
<16 x i32> %s1,
<16 x i32> %s2,
<8 x i32> %s3,
<2 x i32> %s4,
i32 %s5,
<16 x i32> %v0,
<7 x i32> %v1,
i64 %vcc,
ptr addrspace(5) %alloca1,
i32 0) ; use of scc
ret void
}
attributes #0 = { nounwind alignstack=64 "amdgpu-no-workitem-id-x" "amdgpu-no-workitem-id-y" "amdgpu-no-workitem-id-z" "amdgpu-waves-per-eu"="10,10" "no-realign-stack" }
attributes #1 = { nounwind alignstack=16 "amdgpu-no-workitem-id-x" "amdgpu-no-workitem-id-y" "amdgpu-no-workitem-id-z" "amdgpu-waves-per-eu"="10,10" "no-realign-stack" }