[PowerPC] Fix ppc-reduce-cr-ops mishandling of subregister uses (#144405)
Corrects the erroneous assumption that CR-logical operation's operands are always defined by a subreg copy. Fixes https://github.com/llvm/llvm-project/issues/141643 Patch by Nemanja Ivanovic
This commit is contained in:
parent
1f7ba23422
commit
0a822f82de
@ -108,6 +108,8 @@ struct BlockSplitInfo {
|
|||||||
MachineInstr *OrigBranch;
|
MachineInstr *OrigBranch;
|
||||||
MachineInstr *SplitBefore;
|
MachineInstr *SplitBefore;
|
||||||
MachineInstr *SplitCond;
|
MachineInstr *SplitCond;
|
||||||
|
unsigned OrigSubreg;
|
||||||
|
unsigned SplitCondSubreg;
|
||||||
bool InvertNewBranch;
|
bool InvertNewBranch;
|
||||||
bool InvertOrigBranch;
|
bool InvertOrigBranch;
|
||||||
bool BranchToFallThrough;
|
bool BranchToFallThrough;
|
||||||
@ -220,7 +222,7 @@ static bool splitMBB(BlockSplitInfo &BSI) {
|
|||||||
// Add the branches to ThisMBB.
|
// Add the branches to ThisMBB.
|
||||||
BuildMI(*ThisMBB, ThisMBB->end(), BSI.SplitBefore->getDebugLoc(),
|
BuildMI(*ThisMBB, ThisMBB->end(), BSI.SplitBefore->getDebugLoc(),
|
||||||
TII->get(NewBROpcode))
|
TII->get(NewBROpcode))
|
||||||
.addReg(BSI.SplitCond->getOperand(0).getReg())
|
.addReg(BSI.SplitCond->getOperand(0).getReg(), 0, BSI.SplitCondSubreg)
|
||||||
.addMBB(NewBRTarget);
|
.addMBB(NewBRTarget);
|
||||||
BuildMI(*ThisMBB, ThisMBB->end(), BSI.SplitBefore->getDebugLoc(),
|
BuildMI(*ThisMBB, ThisMBB->end(), BSI.SplitBefore->getDebugLoc(),
|
||||||
TII->get(PPC::B))
|
TII->get(PPC::B))
|
||||||
@ -234,6 +236,7 @@ static bool splitMBB(BlockSplitInfo &BSI) {
|
|||||||
assert(FirstTerminator->getOperand(0).isReg() &&
|
assert(FirstTerminator->getOperand(0).isReg() &&
|
||||||
"Can't update condition of unconditional branch.");
|
"Can't update condition of unconditional branch.");
|
||||||
FirstTerminator->getOperand(0).setReg(BSI.NewCond->getOperand(0).getReg());
|
FirstTerminator->getOperand(0).setReg(BSI.NewCond->getOperand(0).getReg());
|
||||||
|
FirstTerminator->getOperand(0).setSubReg(BSI.OrigSubreg);
|
||||||
}
|
}
|
||||||
if (BSI.InvertOrigBranch)
|
if (BSI.InvertOrigBranch)
|
||||||
FirstTerminator->setDesc(TII->get(InvertedOpcode));
|
FirstTerminator->setDesc(TII->get(InvertedOpcode));
|
||||||
@ -471,6 +474,7 @@ PPCReduceCRLogicals::createCRLogicalOpInfo(MachineInstr &MIParam) {
|
|||||||
} else {
|
} else {
|
||||||
MachineInstr *Def1 = lookThroughCRCopy(MIParam.getOperand(1).getReg(),
|
MachineInstr *Def1 = lookThroughCRCopy(MIParam.getOperand(1).getReg(),
|
||||||
Ret.SubregDef1, Ret.CopyDefs.first);
|
Ret.SubregDef1, Ret.CopyDefs.first);
|
||||||
|
Ret.SubregDef1 = MIParam.getOperand(1).getSubReg();
|
||||||
assert(Def1 && "Must be able to find a definition of operand 1.");
|
assert(Def1 && "Must be able to find a definition of operand 1.");
|
||||||
Ret.DefsSingleUse &=
|
Ret.DefsSingleUse &=
|
||||||
MRI->hasOneNonDBGUse(Def1->getOperand(0).getReg());
|
MRI->hasOneNonDBGUse(Def1->getOperand(0).getReg());
|
||||||
@ -481,6 +485,7 @@ PPCReduceCRLogicals::createCRLogicalOpInfo(MachineInstr &MIParam) {
|
|||||||
MachineInstr *Def2 = lookThroughCRCopy(MIParam.getOperand(2).getReg(),
|
MachineInstr *Def2 = lookThroughCRCopy(MIParam.getOperand(2).getReg(),
|
||||||
Ret.SubregDef2,
|
Ret.SubregDef2,
|
||||||
Ret.CopyDefs.second);
|
Ret.CopyDefs.second);
|
||||||
|
Ret.SubregDef2 = MIParam.getOperand(2).getSubReg();
|
||||||
assert(Def2 && "Must be able to find a definition of operand 2.");
|
assert(Def2 && "Must be able to find a definition of operand 2.");
|
||||||
Ret.DefsSingleUse &=
|
Ret.DefsSingleUse &=
|
||||||
MRI->hasOneNonDBGUse(Def2->getOperand(0).getReg());
|
MRI->hasOneNonDBGUse(Def2->getOperand(0).getReg());
|
||||||
@ -535,7 +540,6 @@ PPCReduceCRLogicals::createCRLogicalOpInfo(MachineInstr &MIParam) {
|
|||||||
MachineInstr *PPCReduceCRLogicals::lookThroughCRCopy(unsigned Reg,
|
MachineInstr *PPCReduceCRLogicals::lookThroughCRCopy(unsigned Reg,
|
||||||
unsigned &Subreg,
|
unsigned &Subreg,
|
||||||
MachineInstr *&CpDef) {
|
MachineInstr *&CpDef) {
|
||||||
Subreg = -1;
|
|
||||||
if (!Register::isVirtualRegister(Reg))
|
if (!Register::isVirtualRegister(Reg))
|
||||||
return nullptr;
|
return nullptr;
|
||||||
MachineInstr *Copy = MRI->getVRegDef(Reg);
|
MachineInstr *Copy = MRI->getVRegDef(Reg);
|
||||||
@ -543,18 +547,8 @@ MachineInstr *PPCReduceCRLogicals::lookThroughCRCopy(unsigned Reg,
|
|||||||
if (!Copy->isCopy())
|
if (!Copy->isCopy())
|
||||||
return Copy;
|
return Copy;
|
||||||
Register CopySrc = Copy->getOperand(1).getReg();
|
Register CopySrc = Copy->getOperand(1).getReg();
|
||||||
Subreg = Copy->getOperand(1).getSubReg();
|
|
||||||
if (!CopySrc.isVirtual()) {
|
if (!CopySrc.isVirtual()) {
|
||||||
const TargetRegisterInfo *TRI = &TII->getRegisterInfo();
|
const TargetRegisterInfo *TRI = &TII->getRegisterInfo();
|
||||||
// Set the Subreg
|
|
||||||
if (CopySrc == PPC::CR0EQ || CopySrc == PPC::CR6EQ)
|
|
||||||
Subreg = PPC::sub_eq;
|
|
||||||
if (CopySrc == PPC::CR0LT || CopySrc == PPC::CR6LT)
|
|
||||||
Subreg = PPC::sub_lt;
|
|
||||||
if (CopySrc == PPC::CR0GT || CopySrc == PPC::CR6GT)
|
|
||||||
Subreg = PPC::sub_gt;
|
|
||||||
if (CopySrc == PPC::CR0UN || CopySrc == PPC::CR6UN)
|
|
||||||
Subreg = PPC::sub_un;
|
|
||||||
// Loop backwards and return the first MI that modifies the physical CR Reg.
|
// Loop backwards and return the first MI that modifies the physical CR Reg.
|
||||||
MachineBasicBlock::iterator Me = Copy, B = Copy->getParent()->begin();
|
MachineBasicBlock::iterator Me = Copy, B = Copy->getParent()->begin();
|
||||||
while (Me != B)
|
while (Me != B)
|
||||||
@ -682,16 +676,21 @@ bool PPCReduceCRLogicals::splitBlockOnBinaryCROp(CRLogicalOpInfo &CRI) {
|
|||||||
computeBranchTargetAndInversion(Opc, Branch->getOpcode(), UsingDef1,
|
computeBranchTargetAndInversion(Opc, Branch->getOpcode(), UsingDef1,
|
||||||
InvertNewBranch, InvertOrigBranch,
|
InvertNewBranch, InvertOrigBranch,
|
||||||
TargetIsFallThrough);
|
TargetIsFallThrough);
|
||||||
MachineInstr *SplitCond =
|
MachineInstr *NewCond = CRI.CopyDefs.first;
|
||||||
UsingDef1 ? CRI.CopyDefs.second : CRI.CopyDefs.first;
|
MachineInstr *SplitCond = CRI.CopyDefs.second;
|
||||||
|
if (!UsingDef1) {
|
||||||
|
std::swap(NewCond, SplitCond);
|
||||||
|
std::swap(CRI.SubregDef1, CRI.SubregDef2);
|
||||||
|
}
|
||||||
LLVM_DEBUG(dbgs() << "We will " << (InvertNewBranch ? "invert" : "copy"));
|
LLVM_DEBUG(dbgs() << "We will " << (InvertNewBranch ? "invert" : "copy"));
|
||||||
LLVM_DEBUG(dbgs() << " the original branch and the target is the "
|
LLVM_DEBUG(dbgs() << " the original branch and the target is the "
|
||||||
<< (TargetIsFallThrough ? "fallthrough block\n"
|
<< (TargetIsFallThrough ? "fallthrough block\n"
|
||||||
: "orig. target block\n"));
|
: "orig. target block\n"));
|
||||||
LLVM_DEBUG(dbgs() << "Original branch instruction: "; Branch->dump());
|
LLVM_DEBUG(dbgs() << "Original branch instruction: "; Branch->dump());
|
||||||
BlockSplitInfo BSI { Branch, SplitBefore, SplitCond, InvertNewBranch,
|
BlockSplitInfo BSI{
|
||||||
InvertOrigBranch, TargetIsFallThrough, MBPI, CRI.MI,
|
Branch, SplitBefore, SplitCond, CRI.SubregDef1,
|
||||||
UsingDef1 ? CRI.CopyDefs.first : CRI.CopyDefs.second };
|
CRI.SubregDef2, InvertNewBranch, InvertOrigBranch, TargetIsFallThrough,
|
||||||
|
MBPI, CRI.MI, NewCond};
|
||||||
bool Changed = splitMBB(BSI);
|
bool Changed = splitMBB(BSI);
|
||||||
// If we've split on a CR logical that is fed by a CR logical,
|
// If we've split on a CR logical that is fed by a CR logical,
|
||||||
// recompute the source CR logical as it may be usable for splitting.
|
// recompute the source CR logical as it may be usable for splitting.
|
||||||
|
66
llvm/test/CodeGen/PowerPC/crreduce-reg.mir
Normal file
66
llvm/test/CodeGen/PowerPC/crreduce-reg.mir
Normal file
@ -0,0 +1,66 @@
|
|||||||
|
# NOTE: Assertions have been autogenerated by utils/update_mir_test_checks.py UTC_ARGS: --version 5
|
||||||
|
# RUN: llc -mtriple=powerpc64-unknown-linux-gnu -run-pass=ppc-reduce-cr-ops \
|
||||||
|
# RUN: -verify-machineinstrs -o - %s | FileCheck %s
|
||||||
|
|
||||||
|
---
|
||||||
|
name: subreg_folding_regression
|
||||||
|
tracksRegLiveness: true
|
||||||
|
isSSA: true
|
||||||
|
body: |
|
||||||
|
; CHECK-LABEL: name: subreg_folding_regression
|
||||||
|
; CHECK: bb.0:
|
||||||
|
; CHECK-NEXT: successors: %bb.1(0x80000000)
|
||||||
|
; CHECK-NEXT: liveins: $x3
|
||||||
|
; CHECK-NEXT: {{ $}}
|
||||||
|
; CHECK-NEXT: [[COPY:%[0-9]+]]:g8rc_and_g8rc_nox0 = COPY $x3
|
||||||
|
; CHECK-NEXT: [[LD:%[0-9]+]]:g8rc = LD 0, [[COPY]] :: (load (s64))
|
||||||
|
; CHECK-NEXT: {{ $}}
|
||||||
|
; CHECK-NEXT: bb.1:
|
||||||
|
; CHECK-NEXT: successors: %bb.2(0x20000000), %bb.3(0x60000000)
|
||||||
|
; CHECK-NEXT: {{ $}}
|
||||||
|
; CHECK-NEXT: [[PHI:%[0-9]+]]:g8rc_and_g8rc_nox0 = PHI [[LD]], %bb.0, %3, %bb.3, %4, %bb.2
|
||||||
|
; CHECK-NEXT: [[LBZ:%[0-9]+]]:gprc = LBZ 0, [[PHI]] :: (load (s8))
|
||||||
|
; CHECK-NEXT: [[CMPWI:%[0-9]+]]:crrc = CMPWI killed [[LBZ]], 0
|
||||||
|
; CHECK-NEXT: [[ADDI8_:%[0-9]+]]:g8rc = nuw ADDI8 [[PHI]], 1
|
||||||
|
; CHECK-NEXT: STD [[ADDI8_]], 0, [[COPY]] :: (store (s64))
|
||||||
|
; CHECK-NEXT: [[LBZ1:%[0-9]+]]:gprc = LBZ 1, [[PHI]] :: (load (s8))
|
||||||
|
; CHECK-NEXT: BCn [[CMPWI]].sub_lt, %bb.2
|
||||||
|
; CHECK-NEXT: B %bb.3
|
||||||
|
; CHECK-NEXT: {{ $}}
|
||||||
|
; CHECK-NEXT: bb.3:
|
||||||
|
; CHECK-NEXT: successors: %bb.1(0x55555555), %bb.2(0x2aaaaaab)
|
||||||
|
; CHECK-NEXT: {{ $}}
|
||||||
|
; CHECK-NEXT: [[CMPWI1:%[0-9]+]]:crrc = CMPWI killed [[LBZ1]], 0
|
||||||
|
; CHECK-NEXT: BC killed [[CMPWI1]].sub_eq, %bb.1
|
||||||
|
; CHECK-NEXT: B %bb.2
|
||||||
|
; CHECK-NEXT: {{ $}}
|
||||||
|
; CHECK-NEXT: bb.2:
|
||||||
|
; CHECK-NEXT: successors: %bb.1(0x80000000)
|
||||||
|
; CHECK-NEXT: {{ $}}
|
||||||
|
; CHECK-NEXT: [[ADDI8_1:%[0-9]+]]:g8rc = nuw ADDI8 [[PHI]], 2
|
||||||
|
; CHECK-NEXT: STD [[ADDI8_1]], 0, [[COPY]] :: (store (s64))
|
||||||
|
; CHECK-NEXT: B %bb.1
|
||||||
|
bb.0:
|
||||||
|
liveins: $x3
|
||||||
|
|
||||||
|
%0:g8rc_and_g8rc_nox0 = COPY $x3
|
||||||
|
%1:g8rc = LD 0, %0 :: (load (s64))
|
||||||
|
|
||||||
|
bb.1:
|
||||||
|
%2:g8rc_and_g8rc_nox0 = PHI %1, %bb.0, %3, %bb.1, %4, %bb.2
|
||||||
|
%5:gprc = LBZ 0, %2 :: (load (s8))
|
||||||
|
%6:crrc = CMPWI killed %5, 0
|
||||||
|
%3:g8rc = nuw ADDI8 %2, 1
|
||||||
|
STD %3, 0, %0 :: (store (s64))
|
||||||
|
%7:gprc = LBZ 1, %2 :: (load (s8))
|
||||||
|
%8:crrc = CMPWI killed %7, 0
|
||||||
|
%9:crbitrc = CRAND %8.sub_eq, %6.sub_lt
|
||||||
|
BC killed %9, %bb.1
|
||||||
|
B %bb.2
|
||||||
|
|
||||||
|
bb.2:
|
||||||
|
%4:g8rc = nuw ADDI8 %2, 2
|
||||||
|
STD %4, 0, %0 :: (store (s64))
|
||||||
|
B %bb.1
|
||||||
|
|
||||||
|
...
|
Loading…
x
Reference in New Issue
Block a user