Code Formatting
This commit is contained in:
parent
15b3c6682f
commit
460ec42cc1
@ -5257,12 +5257,9 @@ static uint32_t getIdentityValueFor32BitWaveReduction(unsigned Opc) {
|
||||
case AMDGPU::S_ADD_I32:
|
||||
case AMDGPU::S_SUB_I32:
|
||||
case AMDGPU::S_OR_B32:
|
||||
case AMDGPU::S_OR_B64:
|
||||
case AMDGPU::S_XOR_B32:
|
||||
case AMDGPU::S_XOR_B64:
|
||||
return std::numeric_limits<uint32_t>::min();
|
||||
case AMDGPU::S_AND_B32:
|
||||
case AMDGPU::S_AND_B64:
|
||||
return std::numeric_limits<uint32_t>::max();
|
||||
default:
|
||||
llvm_unreachable(
|
||||
@ -5282,7 +5279,11 @@ static uint64_t getIdentityValueFor64BitWaveReduction(unsigned Opc) {
|
||||
return std::numeric_limits<int64_t>::min();
|
||||
case AMDGPU::S_ADD_U64_PSEUDO:
|
||||
case AMDGPU::S_SUB_U64_PSEUDO:
|
||||
case AMDGPU::S_OR_B64:
|
||||
case AMDGPU::S_XOR_B64:
|
||||
return std::numeric_limits<uint64_t>::min();
|
||||
case AMDGPU::S_AND_B64:
|
||||
return std::numeric_limits<uint64_t>::max();
|
||||
default:
|
||||
llvm_unreachable(
|
||||
"Unexpected opcode in getIdentityValueFor64BitWaveReduction");
|
||||
@ -5601,9 +5602,9 @@ static MachineBasicBlock *lowerWaveReduce(MachineInstr &MI,
|
||||
.addReg(LaneValueHiReg)
|
||||
.addImm(AMDGPU::sub1);
|
||||
switch (Opc) {
|
||||
case ::AMDGPU::S_OR_B64:
|
||||
case ::AMDGPU::S_AND_B64:
|
||||
case ::AMDGPU::S_XOR_B64: {
|
||||
case AMDGPU::S_OR_B64:
|
||||
case AMDGPU::S_AND_B64:
|
||||
case AMDGPU::S_XOR_B64: {
|
||||
NewAccumulator = BuildMI(*ComputeLoop, I, DL, TII->get(Opc), DstReg)
|
||||
.addReg(Accumulator->getOperand(0).getReg())
|
||||
.addReg(LaneValue->getOperand(0).getReg())
|
||||
|
@ -1269,9 +1269,8 @@ define void @divergent_value_i64(ptr addrspace(1) %out, i64 %id.x) {
|
||||
; GFX8DAGISEL-LABEL: divergent_value_i64:
|
||||
; GFX8DAGISEL: ; %bb.0: ; %entry
|
||||
; GFX8DAGISEL-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
|
||||
; GFX8DAGISEL-NEXT: s_mov_b32 s4, -1
|
||||
; GFX8DAGISEL-NEXT: s_mov_b64 s[4:5], -1
|
||||
; GFX8DAGISEL-NEXT: s_mov_b64 s[6:7], exec
|
||||
; GFX8DAGISEL-NEXT: s_mov_b32 s5, s4
|
||||
; GFX8DAGISEL-NEXT: .LBB8_1: ; =>This Inner Loop Header: Depth=1
|
||||
; GFX8DAGISEL-NEXT: s_ff1_i32_b64 s10, s[6:7]
|
||||
; GFX8DAGISEL-NEXT: v_readlane_b32 s8, v2, s10
|
||||
@ -1290,9 +1289,8 @@ define void @divergent_value_i64(ptr addrspace(1) %out, i64 %id.x) {
|
||||
; GFX8GISEL-LABEL: divergent_value_i64:
|
||||
; GFX8GISEL: ; %bb.0: ; %entry
|
||||
; GFX8GISEL-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
|
||||
; GFX8GISEL-NEXT: s_mov_b32 s4, -1
|
||||
; GFX8GISEL-NEXT: s_mov_b64 s[4:5], -1
|
||||
; GFX8GISEL-NEXT: s_mov_b64 s[6:7], exec
|
||||
; GFX8GISEL-NEXT: s_mov_b32 s5, s4
|
||||
; GFX8GISEL-NEXT: .LBB8_1: ; =>This Inner Loop Header: Depth=1
|
||||
; GFX8GISEL-NEXT: s_ff1_i32_b64 s10, s[6:7]
|
||||
; GFX8GISEL-NEXT: v_readlane_b32 s8, v2, s10
|
||||
@ -1311,9 +1309,8 @@ define void @divergent_value_i64(ptr addrspace(1) %out, i64 %id.x) {
|
||||
; GFX9DAGISEL-LABEL: divergent_value_i64:
|
||||
; GFX9DAGISEL: ; %bb.0: ; %entry
|
||||
; GFX9DAGISEL-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
|
||||
; GFX9DAGISEL-NEXT: s_mov_b32 s4, -1
|
||||
; GFX9DAGISEL-NEXT: s_mov_b64 s[4:5], -1
|
||||
; GFX9DAGISEL-NEXT: s_mov_b64 s[6:7], exec
|
||||
; GFX9DAGISEL-NEXT: s_mov_b32 s5, s4
|
||||
; GFX9DAGISEL-NEXT: .LBB8_1: ; =>This Inner Loop Header: Depth=1
|
||||
; GFX9DAGISEL-NEXT: s_ff1_i32_b64 s10, s[6:7]
|
||||
; GFX9DAGISEL-NEXT: v_readlane_b32 s8, v2, s10
|
||||
@ -1332,9 +1329,8 @@ define void @divergent_value_i64(ptr addrspace(1) %out, i64 %id.x) {
|
||||
; GFX9GISEL-LABEL: divergent_value_i64:
|
||||
; GFX9GISEL: ; %bb.0: ; %entry
|
||||
; GFX9GISEL-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
|
||||
; GFX9GISEL-NEXT: s_mov_b32 s4, -1
|
||||
; GFX9GISEL-NEXT: s_mov_b64 s[4:5], -1
|
||||
; GFX9GISEL-NEXT: s_mov_b64 s[6:7], exec
|
||||
; GFX9GISEL-NEXT: s_mov_b32 s5, s4
|
||||
; GFX9GISEL-NEXT: .LBB8_1: ; =>This Inner Loop Header: Depth=1
|
||||
; GFX9GISEL-NEXT: s_ff1_i32_b64 s10, s[6:7]
|
||||
; GFX9GISEL-NEXT: v_readlane_b32 s8, v2, s10
|
||||
@ -1353,9 +1349,8 @@ define void @divergent_value_i64(ptr addrspace(1) %out, i64 %id.x) {
|
||||
; GFX1064DAGISEL-LABEL: divergent_value_i64:
|
||||
; GFX1064DAGISEL: ; %bb.0: ; %entry
|
||||
; GFX1064DAGISEL-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
|
||||
; GFX1064DAGISEL-NEXT: s_mov_b32 s4, -1
|
||||
; GFX1064DAGISEL-NEXT: s_mov_b64 s[4:5], -1
|
||||
; GFX1064DAGISEL-NEXT: s_mov_b64 s[6:7], exec
|
||||
; GFX1064DAGISEL-NEXT: s_mov_b32 s5, s4
|
||||
; GFX1064DAGISEL-NEXT: .LBB8_1: ; =>This Inner Loop Header: Depth=1
|
||||
; GFX1064DAGISEL-NEXT: s_ff1_i32_b64 s10, s[6:7]
|
||||
; GFX1064DAGISEL-NEXT: v_readlane_b32 s8, v2, s10
|
||||
@ -1373,9 +1368,8 @@ define void @divergent_value_i64(ptr addrspace(1) %out, i64 %id.x) {
|
||||
; GFX1064GISEL-LABEL: divergent_value_i64:
|
||||
; GFX1064GISEL: ; %bb.0: ; %entry
|
||||
; GFX1064GISEL-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
|
||||
; GFX1064GISEL-NEXT: s_mov_b32 s4, -1
|
||||
; GFX1064GISEL-NEXT: s_mov_b64 s[4:5], -1
|
||||
; GFX1064GISEL-NEXT: s_mov_b64 s[6:7], exec
|
||||
; GFX1064GISEL-NEXT: s_mov_b32 s5, s4
|
||||
; GFX1064GISEL-NEXT: .LBB8_1: ; =>This Inner Loop Header: Depth=1
|
||||
; GFX1064GISEL-NEXT: s_ff1_i32_b64 s10, s[6:7]
|
||||
; GFX1064GISEL-NEXT: v_readlane_b32 s8, v2, s10
|
||||
@ -1393,9 +1387,8 @@ define void @divergent_value_i64(ptr addrspace(1) %out, i64 %id.x) {
|
||||
; GFX1032DAGISEL-LABEL: divergent_value_i64:
|
||||
; GFX1032DAGISEL: ; %bb.0: ; %entry
|
||||
; GFX1032DAGISEL-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
|
||||
; GFX1032DAGISEL-NEXT: s_mov_b32 s4, -1
|
||||
; GFX1032DAGISEL-NEXT: s_mov_b64 s[4:5], -1
|
||||
; GFX1032DAGISEL-NEXT: s_mov_b32 s6, exec_lo
|
||||
; GFX1032DAGISEL-NEXT: s_mov_b32 s5, s4
|
||||
; GFX1032DAGISEL-NEXT: .LBB8_1: ; =>This Inner Loop Header: Depth=1
|
||||
; GFX1032DAGISEL-NEXT: s_ff1_i32_b32 s7, s6
|
||||
; GFX1032DAGISEL-NEXT: v_readlane_b32 s8, v2, s7
|
||||
@ -1413,9 +1406,8 @@ define void @divergent_value_i64(ptr addrspace(1) %out, i64 %id.x) {
|
||||
; GFX1032GISEL-LABEL: divergent_value_i64:
|
||||
; GFX1032GISEL: ; %bb.0: ; %entry
|
||||
; GFX1032GISEL-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
|
||||
; GFX1032GISEL-NEXT: s_mov_b32 s4, -1
|
||||
; GFX1032GISEL-NEXT: s_mov_b64 s[4:5], -1
|
||||
; GFX1032GISEL-NEXT: s_mov_b32 s6, exec_lo
|
||||
; GFX1032GISEL-NEXT: s_mov_b32 s5, s4
|
||||
; GFX1032GISEL-NEXT: .LBB8_1: ; =>This Inner Loop Header: Depth=1
|
||||
; GFX1032GISEL-NEXT: s_ff1_i32_b32 s7, s6
|
||||
; GFX1032GISEL-NEXT: v_readlane_b32 s8, v2, s7
|
||||
@ -1433,12 +1425,11 @@ define void @divergent_value_i64(ptr addrspace(1) %out, i64 %id.x) {
|
||||
; GFX1164DAGISEL-LABEL: divergent_value_i64:
|
||||
; GFX1164DAGISEL: ; %bb.0: ; %entry
|
||||
; GFX1164DAGISEL-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
|
||||
; GFX1164DAGISEL-NEXT: s_mov_b32 s0, -1
|
||||
; GFX1164DAGISEL-NEXT: s_mov_b64 s[0:1], -1
|
||||
; GFX1164DAGISEL-NEXT: s_mov_b64 s[2:3], exec
|
||||
; GFX1164DAGISEL-NEXT: s_mov_b32 s1, s0
|
||||
; GFX1164DAGISEL-NEXT: .LBB8_1: ; =>This Inner Loop Header: Depth=1
|
||||
; GFX1164DAGISEL-NEXT: s_delay_alu instid0(SALU_CYCLE_1) | instskip(NEXT) | instid1(SALU_CYCLE_1)
|
||||
; GFX1164DAGISEL-NEXT: s_ctz_i32_b64 s6, s[2:3]
|
||||
; GFX1164DAGISEL-NEXT: s_delay_alu instid0(SALU_CYCLE_1)
|
||||
; GFX1164DAGISEL-NEXT: v_readlane_b32 s4, v2, s6
|
||||
; GFX1164DAGISEL-NEXT: v_readlane_b32 s5, v3, s6
|
||||
; GFX1164DAGISEL-NEXT: s_bitset0_b64 s[2:3], s6
|
||||
@ -1454,12 +1445,11 @@ define void @divergent_value_i64(ptr addrspace(1) %out, i64 %id.x) {
|
||||
; GFX1164GISEL-LABEL: divergent_value_i64:
|
||||
; GFX1164GISEL: ; %bb.0: ; %entry
|
||||
; GFX1164GISEL-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
|
||||
; GFX1164GISEL-NEXT: s_mov_b32 s0, -1
|
||||
; GFX1164GISEL-NEXT: s_mov_b64 s[0:1], -1
|
||||
; GFX1164GISEL-NEXT: s_mov_b64 s[2:3], exec
|
||||
; GFX1164GISEL-NEXT: s_mov_b32 s1, s0
|
||||
; GFX1164GISEL-NEXT: .LBB8_1: ; =>This Inner Loop Header: Depth=1
|
||||
; GFX1164GISEL-NEXT: s_delay_alu instid0(SALU_CYCLE_1) | instskip(NEXT) | instid1(SALU_CYCLE_1)
|
||||
; GFX1164GISEL-NEXT: s_ctz_i32_b64 s6, s[2:3]
|
||||
; GFX1164GISEL-NEXT: s_delay_alu instid0(SALU_CYCLE_1)
|
||||
; GFX1164GISEL-NEXT: v_readlane_b32 s4, v2, s6
|
||||
; GFX1164GISEL-NEXT: v_readlane_b32 s5, v3, s6
|
||||
; GFX1164GISEL-NEXT: s_bitset0_b64 s[2:3], s6
|
||||
@ -1475,12 +1465,11 @@ define void @divergent_value_i64(ptr addrspace(1) %out, i64 %id.x) {
|
||||
; GFX1132DAGISEL-LABEL: divergent_value_i64:
|
||||
; GFX1132DAGISEL: ; %bb.0: ; %entry
|
||||
; GFX1132DAGISEL-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
|
||||
; GFX1132DAGISEL-NEXT: s_mov_b32 s0, -1
|
||||
; GFX1132DAGISEL-NEXT: s_mov_b64 s[0:1], -1
|
||||
; GFX1132DAGISEL-NEXT: s_mov_b32 s2, exec_lo
|
||||
; GFX1132DAGISEL-NEXT: s_mov_b32 s1, s0
|
||||
; GFX1132DAGISEL-NEXT: .LBB8_1: ; =>This Inner Loop Header: Depth=1
|
||||
; GFX1132DAGISEL-NEXT: s_delay_alu instid0(SALU_CYCLE_1) | instskip(NEXT) | instid1(SALU_CYCLE_1)
|
||||
; GFX1132DAGISEL-NEXT: s_ctz_i32_b32 s3, s2
|
||||
; GFX1132DAGISEL-NEXT: s_delay_alu instid0(SALU_CYCLE_1)
|
||||
; GFX1132DAGISEL-NEXT: v_readlane_b32 s4, v2, s3
|
||||
; GFX1132DAGISEL-NEXT: v_readlane_b32 s5, v3, s3
|
||||
; GFX1132DAGISEL-NEXT: s_bitset0_b32 s2, s3
|
||||
@ -1495,12 +1484,11 @@ define void @divergent_value_i64(ptr addrspace(1) %out, i64 %id.x) {
|
||||
; GFX1132GISEL-LABEL: divergent_value_i64:
|
||||
; GFX1132GISEL: ; %bb.0: ; %entry
|
||||
; GFX1132GISEL-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
|
||||
; GFX1132GISEL-NEXT: s_mov_b32 s0, -1
|
||||
; GFX1132GISEL-NEXT: s_mov_b64 s[0:1], -1
|
||||
; GFX1132GISEL-NEXT: s_mov_b32 s2, exec_lo
|
||||
; GFX1132GISEL-NEXT: s_mov_b32 s1, s0
|
||||
; GFX1132GISEL-NEXT: .LBB8_1: ; =>This Inner Loop Header: Depth=1
|
||||
; GFX1132GISEL-NEXT: s_delay_alu instid0(SALU_CYCLE_1) | instskip(NEXT) | instid1(SALU_CYCLE_1)
|
||||
; GFX1132GISEL-NEXT: s_ctz_i32_b32 s3, s2
|
||||
; GFX1132GISEL-NEXT: s_delay_alu instid0(SALU_CYCLE_1)
|
||||
; GFX1132GISEL-NEXT: v_readlane_b32 s4, v2, s3
|
||||
; GFX1132GISEL-NEXT: v_readlane_b32 s5, v3, s3
|
||||
; GFX1132GISEL-NEXT: s_bitset0_b32 s2, s3
|
||||
|
@ -1269,9 +1269,8 @@ define void @divergent_value_i64(ptr addrspace(1) %out, i64 %id.x) {
|
||||
; GFX8DAGISEL-LABEL: divergent_value_i64:
|
||||
; GFX8DAGISEL: ; %bb.0: ; %entry
|
||||
; GFX8DAGISEL-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
|
||||
; GFX8DAGISEL-NEXT: s_mov_b32 s4, 0
|
||||
; GFX8DAGISEL-NEXT: s_mov_b64 s[4:5], 0
|
||||
; GFX8DAGISEL-NEXT: s_mov_b64 s[6:7], exec
|
||||
; GFX8DAGISEL-NEXT: s_mov_b32 s5, s4
|
||||
; GFX8DAGISEL-NEXT: .LBB8_1: ; =>This Inner Loop Header: Depth=1
|
||||
; GFX8DAGISEL-NEXT: s_ff1_i32_b64 s10, s[6:7]
|
||||
; GFX8DAGISEL-NEXT: v_readlane_b32 s8, v2, s10
|
||||
@ -1290,9 +1289,8 @@ define void @divergent_value_i64(ptr addrspace(1) %out, i64 %id.x) {
|
||||
; GFX8GISEL-LABEL: divergent_value_i64:
|
||||
; GFX8GISEL: ; %bb.0: ; %entry
|
||||
; GFX8GISEL-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
|
||||
; GFX8GISEL-NEXT: s_mov_b32 s4, 0
|
||||
; GFX8GISEL-NEXT: s_mov_b64 s[4:5], 0
|
||||
; GFX8GISEL-NEXT: s_mov_b64 s[6:7], exec
|
||||
; GFX8GISEL-NEXT: s_mov_b32 s5, s4
|
||||
; GFX8GISEL-NEXT: .LBB8_1: ; =>This Inner Loop Header: Depth=1
|
||||
; GFX8GISEL-NEXT: s_ff1_i32_b64 s10, s[6:7]
|
||||
; GFX8GISEL-NEXT: v_readlane_b32 s8, v2, s10
|
||||
@ -1311,9 +1309,8 @@ define void @divergent_value_i64(ptr addrspace(1) %out, i64 %id.x) {
|
||||
; GFX9DAGISEL-LABEL: divergent_value_i64:
|
||||
; GFX9DAGISEL: ; %bb.0: ; %entry
|
||||
; GFX9DAGISEL-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
|
||||
; GFX9DAGISEL-NEXT: s_mov_b32 s4, 0
|
||||
; GFX9DAGISEL-NEXT: s_mov_b64 s[4:5], 0
|
||||
; GFX9DAGISEL-NEXT: s_mov_b64 s[6:7], exec
|
||||
; GFX9DAGISEL-NEXT: s_mov_b32 s5, s4
|
||||
; GFX9DAGISEL-NEXT: .LBB8_1: ; =>This Inner Loop Header: Depth=1
|
||||
; GFX9DAGISEL-NEXT: s_ff1_i32_b64 s10, s[6:7]
|
||||
; GFX9DAGISEL-NEXT: v_readlane_b32 s8, v2, s10
|
||||
@ -1332,9 +1329,8 @@ define void @divergent_value_i64(ptr addrspace(1) %out, i64 %id.x) {
|
||||
; GFX9GISEL-LABEL: divergent_value_i64:
|
||||
; GFX9GISEL: ; %bb.0: ; %entry
|
||||
; GFX9GISEL-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
|
||||
; GFX9GISEL-NEXT: s_mov_b32 s4, 0
|
||||
; GFX9GISEL-NEXT: s_mov_b64 s[4:5], 0
|
||||
; GFX9GISEL-NEXT: s_mov_b64 s[6:7], exec
|
||||
; GFX9GISEL-NEXT: s_mov_b32 s5, s4
|
||||
; GFX9GISEL-NEXT: .LBB8_1: ; =>This Inner Loop Header: Depth=1
|
||||
; GFX9GISEL-NEXT: s_ff1_i32_b64 s10, s[6:7]
|
||||
; GFX9GISEL-NEXT: v_readlane_b32 s8, v2, s10
|
||||
@ -1353,9 +1349,8 @@ define void @divergent_value_i64(ptr addrspace(1) %out, i64 %id.x) {
|
||||
; GFX1064DAGISEL-LABEL: divergent_value_i64:
|
||||
; GFX1064DAGISEL: ; %bb.0: ; %entry
|
||||
; GFX1064DAGISEL-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
|
||||
; GFX1064DAGISEL-NEXT: s_mov_b32 s4, 0
|
||||
; GFX1064DAGISEL-NEXT: s_mov_b64 s[4:5], 0
|
||||
; GFX1064DAGISEL-NEXT: s_mov_b64 s[6:7], exec
|
||||
; GFX1064DAGISEL-NEXT: s_mov_b32 s5, s4
|
||||
; GFX1064DAGISEL-NEXT: .LBB8_1: ; =>This Inner Loop Header: Depth=1
|
||||
; GFX1064DAGISEL-NEXT: s_ff1_i32_b64 s10, s[6:7]
|
||||
; GFX1064DAGISEL-NEXT: v_readlane_b32 s8, v2, s10
|
||||
@ -1373,9 +1368,8 @@ define void @divergent_value_i64(ptr addrspace(1) %out, i64 %id.x) {
|
||||
; GFX1064GISEL-LABEL: divergent_value_i64:
|
||||
; GFX1064GISEL: ; %bb.0: ; %entry
|
||||
; GFX1064GISEL-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
|
||||
; GFX1064GISEL-NEXT: s_mov_b32 s4, 0
|
||||
; GFX1064GISEL-NEXT: s_mov_b64 s[4:5], 0
|
||||
; GFX1064GISEL-NEXT: s_mov_b64 s[6:7], exec
|
||||
; GFX1064GISEL-NEXT: s_mov_b32 s5, s4
|
||||
; GFX1064GISEL-NEXT: .LBB8_1: ; =>This Inner Loop Header: Depth=1
|
||||
; GFX1064GISEL-NEXT: s_ff1_i32_b64 s10, s[6:7]
|
||||
; GFX1064GISEL-NEXT: v_readlane_b32 s8, v2, s10
|
||||
@ -1393,9 +1387,8 @@ define void @divergent_value_i64(ptr addrspace(1) %out, i64 %id.x) {
|
||||
; GFX1032DAGISEL-LABEL: divergent_value_i64:
|
||||
; GFX1032DAGISEL: ; %bb.0: ; %entry
|
||||
; GFX1032DAGISEL-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
|
||||
; GFX1032DAGISEL-NEXT: s_mov_b32 s4, 0
|
||||
; GFX1032DAGISEL-NEXT: s_mov_b64 s[4:5], 0
|
||||
; GFX1032DAGISEL-NEXT: s_mov_b32 s6, exec_lo
|
||||
; GFX1032DAGISEL-NEXT: s_mov_b32 s5, s4
|
||||
; GFX1032DAGISEL-NEXT: .LBB8_1: ; =>This Inner Loop Header: Depth=1
|
||||
; GFX1032DAGISEL-NEXT: s_ff1_i32_b32 s7, s6
|
||||
; GFX1032DAGISEL-NEXT: v_readlane_b32 s8, v2, s7
|
||||
@ -1413,9 +1406,8 @@ define void @divergent_value_i64(ptr addrspace(1) %out, i64 %id.x) {
|
||||
; GFX1032GISEL-LABEL: divergent_value_i64:
|
||||
; GFX1032GISEL: ; %bb.0: ; %entry
|
||||
; GFX1032GISEL-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
|
||||
; GFX1032GISEL-NEXT: s_mov_b32 s4, 0
|
||||
; GFX1032GISEL-NEXT: s_mov_b64 s[4:5], 0
|
||||
; GFX1032GISEL-NEXT: s_mov_b32 s6, exec_lo
|
||||
; GFX1032GISEL-NEXT: s_mov_b32 s5, s4
|
||||
; GFX1032GISEL-NEXT: .LBB8_1: ; =>This Inner Loop Header: Depth=1
|
||||
; GFX1032GISEL-NEXT: s_ff1_i32_b32 s7, s6
|
||||
; GFX1032GISEL-NEXT: v_readlane_b32 s8, v2, s7
|
||||
@ -1433,12 +1425,11 @@ define void @divergent_value_i64(ptr addrspace(1) %out, i64 %id.x) {
|
||||
; GFX1164DAGISEL-LABEL: divergent_value_i64:
|
||||
; GFX1164DAGISEL: ; %bb.0: ; %entry
|
||||
; GFX1164DAGISEL-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
|
||||
; GFX1164DAGISEL-NEXT: s_mov_b32 s0, 0
|
||||
; GFX1164DAGISEL-NEXT: s_mov_b64 s[0:1], 0
|
||||
; GFX1164DAGISEL-NEXT: s_mov_b64 s[2:3], exec
|
||||
; GFX1164DAGISEL-NEXT: s_mov_b32 s1, s0
|
||||
; GFX1164DAGISEL-NEXT: .LBB8_1: ; =>This Inner Loop Header: Depth=1
|
||||
; GFX1164DAGISEL-NEXT: s_delay_alu instid0(SALU_CYCLE_1) | instskip(NEXT) | instid1(SALU_CYCLE_1)
|
||||
; GFX1164DAGISEL-NEXT: s_ctz_i32_b64 s6, s[2:3]
|
||||
; GFX1164DAGISEL-NEXT: s_delay_alu instid0(SALU_CYCLE_1)
|
||||
; GFX1164DAGISEL-NEXT: v_readlane_b32 s4, v2, s6
|
||||
; GFX1164DAGISEL-NEXT: v_readlane_b32 s5, v3, s6
|
||||
; GFX1164DAGISEL-NEXT: s_bitset0_b64 s[2:3], s6
|
||||
@ -1454,12 +1445,11 @@ define void @divergent_value_i64(ptr addrspace(1) %out, i64 %id.x) {
|
||||
; GFX1164GISEL-LABEL: divergent_value_i64:
|
||||
; GFX1164GISEL: ; %bb.0: ; %entry
|
||||
; GFX1164GISEL-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
|
||||
; GFX1164GISEL-NEXT: s_mov_b32 s0, 0
|
||||
; GFX1164GISEL-NEXT: s_mov_b64 s[0:1], 0
|
||||
; GFX1164GISEL-NEXT: s_mov_b64 s[2:3], exec
|
||||
; GFX1164GISEL-NEXT: s_mov_b32 s1, s0
|
||||
; GFX1164GISEL-NEXT: .LBB8_1: ; =>This Inner Loop Header: Depth=1
|
||||
; GFX1164GISEL-NEXT: s_delay_alu instid0(SALU_CYCLE_1) | instskip(NEXT) | instid1(SALU_CYCLE_1)
|
||||
; GFX1164GISEL-NEXT: s_ctz_i32_b64 s6, s[2:3]
|
||||
; GFX1164GISEL-NEXT: s_delay_alu instid0(SALU_CYCLE_1)
|
||||
; GFX1164GISEL-NEXT: v_readlane_b32 s4, v2, s6
|
||||
; GFX1164GISEL-NEXT: v_readlane_b32 s5, v3, s6
|
||||
; GFX1164GISEL-NEXT: s_bitset0_b64 s[2:3], s6
|
||||
@ -1475,12 +1465,11 @@ define void @divergent_value_i64(ptr addrspace(1) %out, i64 %id.x) {
|
||||
; GFX1132DAGISEL-LABEL: divergent_value_i64:
|
||||
; GFX1132DAGISEL: ; %bb.0: ; %entry
|
||||
; GFX1132DAGISEL-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
|
||||
; GFX1132DAGISEL-NEXT: s_mov_b32 s0, 0
|
||||
; GFX1132DAGISEL-NEXT: s_mov_b64 s[0:1], 0
|
||||
; GFX1132DAGISEL-NEXT: s_mov_b32 s2, exec_lo
|
||||
; GFX1132DAGISEL-NEXT: s_mov_b32 s1, s0
|
||||
; GFX1132DAGISEL-NEXT: .LBB8_1: ; =>This Inner Loop Header: Depth=1
|
||||
; GFX1132DAGISEL-NEXT: s_delay_alu instid0(SALU_CYCLE_1) | instskip(NEXT) | instid1(SALU_CYCLE_1)
|
||||
; GFX1132DAGISEL-NEXT: s_ctz_i32_b32 s3, s2
|
||||
; GFX1132DAGISEL-NEXT: s_delay_alu instid0(SALU_CYCLE_1)
|
||||
; GFX1132DAGISEL-NEXT: v_readlane_b32 s4, v2, s3
|
||||
; GFX1132DAGISEL-NEXT: v_readlane_b32 s5, v3, s3
|
||||
; GFX1132DAGISEL-NEXT: s_bitset0_b32 s2, s3
|
||||
@ -1495,12 +1484,11 @@ define void @divergent_value_i64(ptr addrspace(1) %out, i64 %id.x) {
|
||||
; GFX1132GISEL-LABEL: divergent_value_i64:
|
||||
; GFX1132GISEL: ; %bb.0: ; %entry
|
||||
; GFX1132GISEL-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
|
||||
; GFX1132GISEL-NEXT: s_mov_b32 s0, 0
|
||||
; GFX1132GISEL-NEXT: s_mov_b64 s[0:1], 0
|
||||
; GFX1132GISEL-NEXT: s_mov_b32 s2, exec_lo
|
||||
; GFX1132GISEL-NEXT: s_mov_b32 s1, s0
|
||||
; GFX1132GISEL-NEXT: .LBB8_1: ; =>This Inner Loop Header: Depth=1
|
||||
; GFX1132GISEL-NEXT: s_delay_alu instid0(SALU_CYCLE_1) | instskip(NEXT) | instid1(SALU_CYCLE_1)
|
||||
; GFX1132GISEL-NEXT: s_ctz_i32_b32 s3, s2
|
||||
; GFX1132GISEL-NEXT: s_delay_alu instid0(SALU_CYCLE_1)
|
||||
; GFX1132GISEL-NEXT: v_readlane_b32 s4, v2, s3
|
||||
; GFX1132GISEL-NEXT: v_readlane_b32 s5, v3, s3
|
||||
; GFX1132GISEL-NEXT: s_bitset0_b32 s2, s3
|
||||
|
@ -1856,9 +1856,8 @@ define void @divergent_value_i64(ptr addrspace(1) %out, i64 %id.x) {
|
||||
; GFX8DAGISEL-LABEL: divergent_value_i64:
|
||||
; GFX8DAGISEL: ; %bb.0: ; %entry
|
||||
; GFX8DAGISEL-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
|
||||
; GFX8DAGISEL-NEXT: s_mov_b32 s4, 0
|
||||
; GFX8DAGISEL-NEXT: s_mov_b64 s[4:5], 0
|
||||
; GFX8DAGISEL-NEXT: s_mov_b64 s[6:7], exec
|
||||
; GFX8DAGISEL-NEXT: s_mov_b32 s5, s4
|
||||
; GFX8DAGISEL-NEXT: .LBB8_1: ; =>This Inner Loop Header: Depth=1
|
||||
; GFX8DAGISEL-NEXT: s_ff1_i32_b64 s10, s[6:7]
|
||||
; GFX8DAGISEL-NEXT: v_readlane_b32 s8, v2, s10
|
||||
@ -1877,9 +1876,8 @@ define void @divergent_value_i64(ptr addrspace(1) %out, i64 %id.x) {
|
||||
; GFX8GISEL-LABEL: divergent_value_i64:
|
||||
; GFX8GISEL: ; %bb.0: ; %entry
|
||||
; GFX8GISEL-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
|
||||
; GFX8GISEL-NEXT: s_mov_b32 s4, 0
|
||||
; GFX8GISEL-NEXT: s_mov_b64 s[4:5], 0
|
||||
; GFX8GISEL-NEXT: s_mov_b64 s[6:7], exec
|
||||
; GFX8GISEL-NEXT: s_mov_b32 s5, s4
|
||||
; GFX8GISEL-NEXT: .LBB8_1: ; =>This Inner Loop Header: Depth=1
|
||||
; GFX8GISEL-NEXT: s_ff1_i32_b64 s10, s[6:7]
|
||||
; GFX8GISEL-NEXT: v_readlane_b32 s8, v2, s10
|
||||
@ -1898,9 +1896,8 @@ define void @divergent_value_i64(ptr addrspace(1) %out, i64 %id.x) {
|
||||
; GFX9DAGISEL-LABEL: divergent_value_i64:
|
||||
; GFX9DAGISEL: ; %bb.0: ; %entry
|
||||
; GFX9DAGISEL-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
|
||||
; GFX9DAGISEL-NEXT: s_mov_b32 s4, 0
|
||||
; GFX9DAGISEL-NEXT: s_mov_b64 s[4:5], 0
|
||||
; GFX9DAGISEL-NEXT: s_mov_b64 s[6:7], exec
|
||||
; GFX9DAGISEL-NEXT: s_mov_b32 s5, s4
|
||||
; GFX9DAGISEL-NEXT: .LBB8_1: ; =>This Inner Loop Header: Depth=1
|
||||
; GFX9DAGISEL-NEXT: s_ff1_i32_b64 s10, s[6:7]
|
||||
; GFX9DAGISEL-NEXT: v_readlane_b32 s8, v2, s10
|
||||
@ -1919,9 +1916,8 @@ define void @divergent_value_i64(ptr addrspace(1) %out, i64 %id.x) {
|
||||
; GFX9GISEL-LABEL: divergent_value_i64:
|
||||
; GFX9GISEL: ; %bb.0: ; %entry
|
||||
; GFX9GISEL-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
|
||||
; GFX9GISEL-NEXT: s_mov_b32 s4, 0
|
||||
; GFX9GISEL-NEXT: s_mov_b64 s[4:5], 0
|
||||
; GFX9GISEL-NEXT: s_mov_b64 s[6:7], exec
|
||||
; GFX9GISEL-NEXT: s_mov_b32 s5, s4
|
||||
; GFX9GISEL-NEXT: .LBB8_1: ; =>This Inner Loop Header: Depth=1
|
||||
; GFX9GISEL-NEXT: s_ff1_i32_b64 s10, s[6:7]
|
||||
; GFX9GISEL-NEXT: v_readlane_b32 s8, v2, s10
|
||||
@ -1940,9 +1936,8 @@ define void @divergent_value_i64(ptr addrspace(1) %out, i64 %id.x) {
|
||||
; GFX1064DAGISEL-LABEL: divergent_value_i64:
|
||||
; GFX1064DAGISEL: ; %bb.0: ; %entry
|
||||
; GFX1064DAGISEL-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
|
||||
; GFX1064DAGISEL-NEXT: s_mov_b32 s4, 0
|
||||
; GFX1064DAGISEL-NEXT: s_mov_b64 s[4:5], 0
|
||||
; GFX1064DAGISEL-NEXT: s_mov_b64 s[6:7], exec
|
||||
; GFX1064DAGISEL-NEXT: s_mov_b32 s5, s4
|
||||
; GFX1064DAGISEL-NEXT: .LBB8_1: ; =>This Inner Loop Header: Depth=1
|
||||
; GFX1064DAGISEL-NEXT: s_ff1_i32_b64 s10, s[6:7]
|
||||
; GFX1064DAGISEL-NEXT: v_readlane_b32 s8, v2, s10
|
||||
@ -1960,9 +1955,8 @@ define void @divergent_value_i64(ptr addrspace(1) %out, i64 %id.x) {
|
||||
; GFX1064GISEL-LABEL: divergent_value_i64:
|
||||
; GFX1064GISEL: ; %bb.0: ; %entry
|
||||
; GFX1064GISEL-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
|
||||
; GFX1064GISEL-NEXT: s_mov_b32 s4, 0
|
||||
; GFX1064GISEL-NEXT: s_mov_b64 s[4:5], 0
|
||||
; GFX1064GISEL-NEXT: s_mov_b64 s[6:7], exec
|
||||
; GFX1064GISEL-NEXT: s_mov_b32 s5, s4
|
||||
; GFX1064GISEL-NEXT: .LBB8_1: ; =>This Inner Loop Header: Depth=1
|
||||
; GFX1064GISEL-NEXT: s_ff1_i32_b64 s10, s[6:7]
|
||||
; GFX1064GISEL-NEXT: v_readlane_b32 s8, v2, s10
|
||||
@ -1980,9 +1974,8 @@ define void @divergent_value_i64(ptr addrspace(1) %out, i64 %id.x) {
|
||||
; GFX1032DAGISEL-LABEL: divergent_value_i64:
|
||||
; GFX1032DAGISEL: ; %bb.0: ; %entry
|
||||
; GFX1032DAGISEL-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
|
||||
; GFX1032DAGISEL-NEXT: s_mov_b32 s4, 0
|
||||
; GFX1032DAGISEL-NEXT: s_mov_b64 s[4:5], 0
|
||||
; GFX1032DAGISEL-NEXT: s_mov_b32 s6, exec_lo
|
||||
; GFX1032DAGISEL-NEXT: s_mov_b32 s5, s4
|
||||
; GFX1032DAGISEL-NEXT: .LBB8_1: ; =>This Inner Loop Header: Depth=1
|
||||
; GFX1032DAGISEL-NEXT: s_ff1_i32_b32 s7, s6
|
||||
; GFX1032DAGISEL-NEXT: v_readlane_b32 s8, v2, s7
|
||||
@ -2000,9 +1993,8 @@ define void @divergent_value_i64(ptr addrspace(1) %out, i64 %id.x) {
|
||||
; GFX1032GISEL-LABEL: divergent_value_i64:
|
||||
; GFX1032GISEL: ; %bb.0: ; %entry
|
||||
; GFX1032GISEL-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
|
||||
; GFX1032GISEL-NEXT: s_mov_b32 s4, 0
|
||||
; GFX1032GISEL-NEXT: s_mov_b64 s[4:5], 0
|
||||
; GFX1032GISEL-NEXT: s_mov_b32 s6, exec_lo
|
||||
; GFX1032GISEL-NEXT: s_mov_b32 s5, s4
|
||||
; GFX1032GISEL-NEXT: .LBB8_1: ; =>This Inner Loop Header: Depth=1
|
||||
; GFX1032GISEL-NEXT: s_ff1_i32_b32 s7, s6
|
||||
; GFX1032GISEL-NEXT: v_readlane_b32 s8, v2, s7
|
||||
@ -2020,12 +2012,11 @@ define void @divergent_value_i64(ptr addrspace(1) %out, i64 %id.x) {
|
||||
; GFX1164DAGISEL-LABEL: divergent_value_i64:
|
||||
; GFX1164DAGISEL: ; %bb.0: ; %entry
|
||||
; GFX1164DAGISEL-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
|
||||
; GFX1164DAGISEL-NEXT: s_mov_b32 s0, 0
|
||||
; GFX1164DAGISEL-NEXT: s_mov_b64 s[0:1], 0
|
||||
; GFX1164DAGISEL-NEXT: s_mov_b64 s[2:3], exec
|
||||
; GFX1164DAGISEL-NEXT: s_mov_b32 s1, s0
|
||||
; GFX1164DAGISEL-NEXT: .LBB8_1: ; =>This Inner Loop Header: Depth=1
|
||||
; GFX1164DAGISEL-NEXT: s_delay_alu instid0(SALU_CYCLE_1) | instskip(NEXT) | instid1(SALU_CYCLE_1)
|
||||
; GFX1164DAGISEL-NEXT: s_ctz_i32_b64 s6, s[2:3]
|
||||
; GFX1164DAGISEL-NEXT: s_delay_alu instid0(SALU_CYCLE_1)
|
||||
; GFX1164DAGISEL-NEXT: v_readlane_b32 s4, v2, s6
|
||||
; GFX1164DAGISEL-NEXT: v_readlane_b32 s5, v3, s6
|
||||
; GFX1164DAGISEL-NEXT: s_bitset0_b64 s[2:3], s6
|
||||
@ -2041,12 +2032,11 @@ define void @divergent_value_i64(ptr addrspace(1) %out, i64 %id.x) {
|
||||
; GFX1164GISEL-LABEL: divergent_value_i64:
|
||||
; GFX1164GISEL: ; %bb.0: ; %entry
|
||||
; GFX1164GISEL-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
|
||||
; GFX1164GISEL-NEXT: s_mov_b32 s0, 0
|
||||
; GFX1164GISEL-NEXT: s_mov_b64 s[0:1], 0
|
||||
; GFX1164GISEL-NEXT: s_mov_b64 s[2:3], exec
|
||||
; GFX1164GISEL-NEXT: s_mov_b32 s1, s0
|
||||
; GFX1164GISEL-NEXT: .LBB8_1: ; =>This Inner Loop Header: Depth=1
|
||||
; GFX1164GISEL-NEXT: s_delay_alu instid0(SALU_CYCLE_1) | instskip(NEXT) | instid1(SALU_CYCLE_1)
|
||||
; GFX1164GISEL-NEXT: s_ctz_i32_b64 s6, s[2:3]
|
||||
; GFX1164GISEL-NEXT: s_delay_alu instid0(SALU_CYCLE_1)
|
||||
; GFX1164GISEL-NEXT: v_readlane_b32 s4, v2, s6
|
||||
; GFX1164GISEL-NEXT: v_readlane_b32 s5, v3, s6
|
||||
; GFX1164GISEL-NEXT: s_bitset0_b64 s[2:3], s6
|
||||
@ -2062,12 +2052,11 @@ define void @divergent_value_i64(ptr addrspace(1) %out, i64 %id.x) {
|
||||
; GFX1132DAGISEL-LABEL: divergent_value_i64:
|
||||
; GFX1132DAGISEL: ; %bb.0: ; %entry
|
||||
; GFX1132DAGISEL-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
|
||||
; GFX1132DAGISEL-NEXT: s_mov_b32 s0, 0
|
||||
; GFX1132DAGISEL-NEXT: s_mov_b64 s[0:1], 0
|
||||
; GFX1132DAGISEL-NEXT: s_mov_b32 s2, exec_lo
|
||||
; GFX1132DAGISEL-NEXT: s_mov_b32 s1, s0
|
||||
; GFX1132DAGISEL-NEXT: .LBB8_1: ; =>This Inner Loop Header: Depth=1
|
||||
; GFX1132DAGISEL-NEXT: s_delay_alu instid0(SALU_CYCLE_1) | instskip(NEXT) | instid1(SALU_CYCLE_1)
|
||||
; GFX1132DAGISEL-NEXT: s_ctz_i32_b32 s3, s2
|
||||
; GFX1132DAGISEL-NEXT: s_delay_alu instid0(SALU_CYCLE_1)
|
||||
; GFX1132DAGISEL-NEXT: v_readlane_b32 s4, v2, s3
|
||||
; GFX1132DAGISEL-NEXT: v_readlane_b32 s5, v3, s3
|
||||
; GFX1132DAGISEL-NEXT: s_bitset0_b32 s2, s3
|
||||
@ -2082,12 +2071,11 @@ define void @divergent_value_i64(ptr addrspace(1) %out, i64 %id.x) {
|
||||
; GFX1132GISEL-LABEL: divergent_value_i64:
|
||||
; GFX1132GISEL: ; %bb.0: ; %entry
|
||||
; GFX1132GISEL-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
|
||||
; GFX1132GISEL-NEXT: s_mov_b32 s0, 0
|
||||
; GFX1132GISEL-NEXT: s_mov_b64 s[0:1], 0
|
||||
; GFX1132GISEL-NEXT: s_mov_b32 s2, exec_lo
|
||||
; GFX1132GISEL-NEXT: s_mov_b32 s1, s0
|
||||
; GFX1132GISEL-NEXT: .LBB8_1: ; =>This Inner Loop Header: Depth=1
|
||||
; GFX1132GISEL-NEXT: s_delay_alu instid0(SALU_CYCLE_1) | instskip(NEXT) | instid1(SALU_CYCLE_1)
|
||||
; GFX1132GISEL-NEXT: s_ctz_i32_b32 s3, s2
|
||||
; GFX1132GISEL-NEXT: s_delay_alu instid0(SALU_CYCLE_1)
|
||||
; GFX1132GISEL-NEXT: v_readlane_b32 s4, v2, s3
|
||||
; GFX1132GISEL-NEXT: v_readlane_b32 s5, v3, s3
|
||||
; GFX1132GISEL-NEXT: s_bitset0_b32 s2, s3
|
||||
|
Loading…
x
Reference in New Issue
Block a user