94#define DEBUG_TYPE "aarch64-condopt"
96STATISTIC(NumConditionsAdjusted,
"Number of conditions adjusted");
107class AArch64ConditionOptimizerImpl {
112 MachineInstr *CondMI;
116 unsigned getOpc()
const {
return CmpMI->getOpcode(); }
119 const TargetInstrInfo *TII;
120 const TargetRegisterInfo *TRI;
121 MachineDominatorTree *DomTree;
122 const MachineRegisterInfo *MRI;
125 bool run(MachineFunction &MF, MachineDominatorTree &MDT);
128 bool canAdjustCmp(MachineInstr &CmpMI);
129 bool registersMatch(MachineInstr *FirstMI, MachineInstr *SecondMI);
130 bool nzcvLivesOut(MachineBasicBlock *
MBB);
131 MachineInstr *getBccTerminator(MachineBasicBlock *
MBB);
132 MachineInstr *findAdjustableCmp(MachineInstr *CondMI);
134 void updateCmpInstr(MachineInstr *CmpMI,
int NewImm,
unsigned NewOpc);
136 void applyCmpAdjustment(CmpCondPair &Pair,
const CmpInfo &Info);
137 bool tryOptimizePair(CmpCondPair &
First, CmpCondPair &Second);
138 bool optimizeIntraBlock(MachineBasicBlock &
MBB);
139 bool optimizeCrossBlock(MachineBasicBlock &HBB);
145 AArch64ConditionOptimizerLegacy() : MachineFunctionPass(ID) {}
147 void getAnalysisUsage(AnalysisUsage &AU)
const override;
148 bool runOnMachineFunction(MachineFunction &MF)
override;
150 StringRef getPassName()
const override {
151 return "AArch64 Condition Optimizer";
157char AArch64ConditionOptimizerLegacy::ID = 0;
160 "AArch64 CondOpt Pass",
false,
false)
166 return new AArch64ConditionOptimizerLegacy();
169void AArch64ConditionOptimizerLegacy::getAnalysisUsage(
178bool AArch64ConditionOptimizerImpl::canAdjustCmp(MachineInstr &CmpMI) {
181 LLVM_DEBUG(
dbgs() <<
"Immediate of cmp is symbolic, " << CmpMI <<
'\n');
184 LLVM_DEBUG(
dbgs() <<
"Immediate of cmp may be out of range, " << CmpMI
188 LLVM_DEBUG(
dbgs() <<
"Destination of cmp is not dead, " << CmpMI <<
'\n');
196bool AArch64ConditionOptimizerImpl::registersMatch(MachineInstr *FirstMI,
197 MachineInstr *SecondMI) {
201 FirstReg.
isVirtual() ?
TRI->lookThruCopyLike(FirstReg, MRI) : FirstReg;
203 SecondReg.
isVirtual() ?
TRI->lookThruCopyLike(SecondReg, MRI) : SecondReg;
204 if (FirstCmpReg != SecondCmpReg) {
213bool AArch64ConditionOptimizerImpl::nzcvLivesOut(MachineBasicBlock *
MBB) {
215 if (SuccBB->isLiveIn(AArch64::NZCV)) {
229 case AArch64::SUBSWri:
230 case AArch64::SUBSXri:
232 case AArch64::ADDSWri:
233 case AArch64::ADDSXri:
241 return Opc == AArch64::CSINCWr ||
Opc == AArch64::CSINCXr;
246AArch64ConditionOptimizerImpl::getBccTerminator(MachineBasicBlock *
MBB) {
254 if (
Term->getOpcode() != AArch64::Bcc) {
268AArch64ConditionOptimizerImpl::findAdjustableCmp(MachineInstr *CondMI) {
269 assert(CondMI &&
"CondMI cannot be null");
278 MachineInstr &
I = *It;
279 assert(!
I.isTerminator() &&
"Spurious terminator");
281 if (
I.readsRegister(AArch64::NZCV,
nullptr))
285 if (!canAdjustCmp(
I)) {
291 if (
I.modifiesRegister(AArch64::NZCV,
nullptr))
302 case AArch64::ADDSWri:
return AArch64::SUBSWri;
303 case AArch64::ADDSXri:
return AArch64::SUBSXri;
304 case AArch64::SUBSWri:
return AArch64::ADDSWri;
305 case AArch64::SUBSXri:
return AArch64::ADDSXri;
338AArch64ConditionOptimizerImpl::getAdjustedCmpInfo(MachineInstr *CmpMI,
347 bool Negative = (
Opc == AArch64::ADDSWri ||
Opc == AArch64::ADDSXri);
352 Correction = -Correction;
356 const int NewImm = std::abs(OldImm + Correction);
360 if (OldImm == 0 && Negative)
361 return {OldImm,
Opc,
Cmp};
363 if ((OldImm == 1 && Negative && Correction == -1) ||
364 (OldImm == 0 && Correction == -1)) {
369 return {OldImm,
Opc,
Cmp};
377void AArch64ConditionOptimizerImpl::updateCmpInstr(MachineInstr *CmpMI,
385void AArch64ConditionOptimizerImpl::updateCondInstr(MachineInstr *CondMI,
393 case AArch64::CSINCWr:
394 case AArch64::CSINCXr:
401 ++NumConditionsAdjusted;
405void AArch64ConditionOptimizerImpl::applyCmpAdjustment(CmpCondPair &Pair,
406 const CmpInfo &Info) {
407 updateCmpInstr(Pair.CmpMI,
Info.Imm,
Info.Opc);
408 updateCondInstr(Pair.CondMI,
Info.CC);
414 assert(!
Cond.empty() &&
"Expected non-empty condition from analyzeBranch");
417 assert(
Cond.size() == 1 &&
"Unknown Cond array format");
431bool AArch64ConditionOptimizerImpl::tryOptimizePair(CmpCondPair &
First,
432 CmpCondPair &Second) {
437 int FirstImmTrueValue =
First.getImm();
438 int SecondImmTrueValue = Second.getImm();
441 if (
First.getOpc() == AArch64::ADDSWri ||
First.getOpc() == AArch64::ADDSXri)
442 FirstImmTrueValue = -FirstImmTrueValue;
443 if (Second.getOpc() == AArch64::ADDSWri ||
444 Second.getOpc() == AArch64::ADDSXri)
445 SecondImmTrueValue = -SecondImmTrueValue;
447 CmpInfo FirstAdj = getAdjustedCmpInfo(
First.CmpMI,
First.CC);
448 CmpInfo SecondAdj = getAdjustedCmpInfo(Second.CmpMI, Second.CC);
452 std::abs(SecondImmTrueValue - FirstImmTrueValue) == 2) {
465 if (FirstAdj.Imm != SecondAdj.Imm || FirstAdj.Opc != SecondAdj.Opc)
470 <<
First.getImm() <<
", "
472 << Second.getImm() <<
" -> "
474 << FirstAdj.Imm <<
", "
476 << SecondAdj.Imm <<
'\n');
477 applyCmpAdjustment(
First, FirstAdj);
478 applyCmpAdjustment(Second, SecondAdj);
483 std::abs(SecondImmTrueValue - FirstImmTrueValue) == 1) {
496 bool AdjustFirst = (FirstImmTrueValue < SecondImmTrueValue);
498 AdjustFirst = !AdjustFirst;
500 CmpCondPair &
Target = AdjustFirst ? Second :
First;
501 CmpCondPair &ToChange = AdjustFirst ?
First : Second;
502 CmpInfo &Adj = AdjustFirst ? FirstAdj : SecondAdj;
506 if (Adj.Imm !=
Target.getImm() || Adj.Opc !=
Target.getOpc())
511 << ToChange.getImm() <<
" -> "
514 applyCmpAdjustment(ToChange, Adj);
540bool AArch64ConditionOptimizerImpl::optimizeIntraBlock(MachineBasicBlock &
MBB) {
541 MachineInstr *FirstCSINC =
nullptr;
542 MachineInstr *SecondCSINC =
nullptr;
545 for (MachineInstr &
MI :
MBB) {
549 }
else if (!SecondCSINC) {
556 if (!FirstCSINC || !SecondCSINC) {
561 if (nzcvLivesOut(&
MBB))
565 MachineInstr *FirstCmpMI = findAdjustableCmp(FirstCSINC);
566 MachineInstr *SecondCmpMI = findAdjustableCmp(SecondCSINC);
567 if (!FirstCmpMI || !SecondCmpMI)
571 if (FirstCmpMI == SecondCmpMI) {
572 LLVM_DEBUG(
dbgs() <<
"Both CSINCs already controlled by same CMP\n");
576 if (!registersMatch(FirstCmpMI, SecondCmpMI))
583 if (&*It != SecondCmpMI &&
584 It->modifiesRegister(AArch64::NZCV,
nullptr)) {
585 LLVM_DEBUG(
dbgs() <<
"Flags modified between CMPs by: " << *It <<
'\n');
593 if (It->readsRegister(AArch64::NZCV,
nullptr)) {
594 LLVM_DEBUG(
dbgs() <<
"Flags read after second CSINC by: " << *It <<
'\n');
611 << SecondImm <<
'\n');
615 if (FirstCond == SecondCond &&
617 std::abs(SecondImm - FirstImm) == 1) {
621 bool adjustFirst = (FirstImm < SecondImm);
623 adjustFirst = !adjustFirst;
626 MachineInstr *CmpToAdjust = adjustFirst ? FirstCmpMI : SecondCmpMI;
627 MachineInstr *CSINCToAdjust = adjustFirst ? FirstCSINC : SecondCSINC;
629 int TargetImm = adjustFirst ? SecondImm : FirstImm;
631 CmpInfo Adj = getAdjustedCmpInfo(CmpToAdjust, CondToAdjust);
633 if (Adj.Imm == TargetImm &&
634 Adj.Opc == (adjustFirst ? SecondCmpMI : FirstCmpMI)->getOpcode()) {
635 LLVM_DEBUG(
dbgs() <<
"Successfully optimizing intra-block CSINC pair\n");
638 CmpCondPair ToChange{CmpToAdjust, CSINCToAdjust, CondToAdjust};
639 applyCmpAdjustment(ToChange, Adj);
649bool AArch64ConditionOptimizerImpl::optimizeCrossBlock(MachineBasicBlock &HBB) {
651 MachineBasicBlock *
TBB =
nullptr, *FBB =
nullptr;
657 if (!
TBB ||
TBB == &HBB) {
662 MachineBasicBlock *TBB_TBB =
nullptr, *TBB_FBB =
nullptr;
667 MachineInstr *HeadBrMI = getBccTerminator(&HBB);
668 MachineInstr *TrueBrMI = getBccTerminator(
TBB);
669 if (!HeadBrMI || !TrueBrMI)
673 if (nzcvLivesOut(&HBB) || nzcvLivesOut(
TBB))
677 MachineInstr *HeadCmpMI = findAdjustableCmp(HeadBrMI);
678 MachineInstr *TrueCmpMI = findAdjustableCmp(TrueBrMI);
679 if (!HeadCmpMI || !TrueCmpMI)
682 if (!registersMatch(HeadCmpMI, TrueCmpMI))
687 if (HeadCondCode == AArch64CC::CondCode::Invalid ||
688 TrueCondCode == AArch64CC::CondCode::Invalid) {
698 CmpCondPair Head{HeadCmpMI, HeadBrMI, HeadCondCode};
699 CmpCondPair True{TrueCmpMI, TrueBrMI, TrueCondCode};
701 return tryOptimizePair(Head, True);
704bool AArch64ConditionOptimizerLegacy::runOnMachineFunction(
705 MachineFunction &MF) {
708 MachineDominatorTree &MDT =
709 getAnalysis<MachineDominatorTreeWrapperPass>().getDomTree();
710 return AArch64ConditionOptimizerImpl().run(MF, MDT);
713bool AArch64ConditionOptimizerImpl::run(MachineFunction &MF,
714 MachineDominatorTree &MDT) {
715 LLVM_DEBUG(
dbgs() <<
"********** AArch64 Conditional Compares **********\n"
716 <<
"********** Function: " << MF.
getName() <<
'\n');
731 MachineBasicBlock *HBB =
I->getBlock();
732 Changed |= optimizeIntraBlock(*HBB);
733 Changed |= optimizeCrossBlock(*HBB);
743 bool Changed = AArch64ConditionOptimizerImpl().run(MF, MDT);
static AArch64CC::CondCode parseCondCode(ArrayRef< MachineOperand > Cond)
static int getComplementOpc(int Opc)
static bool isGreaterThan(AArch64CC::CondCode Cmp)
static AArch64CC::CondCode getAdjustedCmp(AArch64CC::CondCode Cmp)
static bool isCSINCInstruction(unsigned Opc)
static bool isLessThan(AArch64CC::CondCode Cmp)
static bool isCmpInstruction(unsigned Opc)
assert(UImm &&(UImm !=~static_cast< T >(0)) &&"Invalid immediate!")
static GCRegistry::Add< OcamlGC > B("ocaml", "ocaml 3.10-compatible GC")
This file builds on the ADT/GraphTraits.h file to build generic depth first graph iterator.
const HexagonInstrInfo * TII
Register const TargetRegisterInfo * TRI
Promote Memory to Register
#define INITIALIZE_PASS_DEPENDENCY(depName)
#define INITIALIZE_PASS_END(passName, arg, name, cfg, analysis)
#define INITIALIZE_PASS_BEGIN(passName, arg, name, cfg, analysis)
const SmallVectorImpl< MachineOperand > MachineBasicBlock * TBB
const SmallVectorImpl< MachineOperand > & Cond
This file defines the SmallVector class.
This file defines the 'Statistic' class, which is designed to be an easy way to expose various metric...
#define STATISTIC(VARNAME, DESC)
PreservedAnalyses run(MachineFunction &MF, MachineFunctionAnalysisManager &MFAM)
PassT::Result & getResult(IRUnitT &IR, ExtraArgTs... ExtraArgs)
Get the result of an analysis pass for a given IR unit.
Represent the analysis usage information of a pass.
AnalysisUsage & addRequired()
AnalysisUsage & addPreserved()
Add the specified Pass class to the set of analyses preserved by this pass.
ArrayRef - Represent a constant reference to an array (0 or more elements consecutively in memory),...
Represents analyses that only rely on functions' control flow.
FunctionPass class - This class is used to implement most global optimizations.
bool analyzeBranch(MachineBasicBlock &MBB, MachineBasicBlock *&TBB, MachineBasicBlock *&FBB, SmallVectorImpl< MachineOperand > &Cond, bool AllowModify) const override
Analyze the branching code at the end of MBB, returning true if it cannot be understood (e....
LLVM_ABI iterator getFirstTerminator()
Returns an iterator to the first terminator instruction of this basic block.
iterator_range< succ_iterator > successors()
MachineInstrBundleIterator< MachineInstr > iterator
Analysis pass which computes a MachineDominatorTree.
Analysis pass which computes a MachineDominatorTree.
MachineFunctionPass - This class adapts the FunctionPass interface to allow convenient creation of pa...
void getAnalysisUsage(AnalysisUsage &AU) const override
getAnalysisUsage - Subclasses that override getAnalysisUsage must call this.
const TargetSubtargetInfo & getSubtarget() const
getSubtarget - Return the subtarget for which this machine code is being compiled.
StringRef getName() const
getName - Return the name of the corresponding LLVM function.
MachineRegisterInfo & getRegInfo()
getRegInfo - Return information about the registers currently in use.
Function & getFunction()
Return the LLVM function that this machine code represents.
unsigned getOpcode() const
Returns the opcode of this MachineInstr.
const MachineBasicBlock * getParent() const
LLVM_ABI void setDesc(const MCInstrDesc &TID)
Replace the instruction descriptor (thus opcode) of the current instruction with a new one.
const MachineOperand & getOperand(unsigned i) const
void setImm(int64_t immVal)
bool isImm() const
isImm - Tests if this is a MO_Immediate operand.
Register getReg() const
getReg - Returns the register number.
bool use_nodbg_empty(Register RegNo) const
use_nodbg_empty - Return true if there are no non-Debug instructions using the specified register.
A set of analyses that are preserved following a run of a transformation pass.
static PreservedAnalyses all()
Construct a special preserved set that preserves all passes.
PreservedAnalyses & preserveSet()
Mark an analysis set as preserved.
constexpr bool isVirtual() const
Return true if the specified register number is in the virtual register namespace.
virtual const TargetInstrInfo * getInstrInfo() const
virtual const TargetRegisterInfo * getRegisterInfo() const =0
Return the target's register information.
#define llvm_unreachable(msg)
Marks that the current location is not supposed to be reachable.
static const char * getCondCodeName(CondCode Code)
static unsigned getShiftValue(unsigned Imm)
getShiftValue - Extract the shift value.
PointerTypeMap run(const Module &M)
Compute the PointerTypeMap for the module M.
This is an optimization pass for GlobalISel generic memory operations.
FunctionPass * createAArch64ConditionOptimizerLegacyPass()
AnalysisManager< MachineFunction > MachineFunctionAnalysisManager
LLVM_ABI PreservedAnalyses getMachineFunctionPassPreservedAnalyses()
Returns the minimum set of Analyses that all machine function passes must preserve.
MachineInstr * getImm(const MachineOperand &MO, const MachineRegisterInfo *MRI)
LLVM_ABI raw_ostream & dbgs()
dbgs() - This returns a reference to a raw_ostream for debugging messages.
class LLVM_GSL_OWNER SmallVector
Forward declaration of SmallVector so that calculateSmallVectorDefaultInlinedElements can reference s...
DomTreeNodeBase< MachineBasicBlock > MachineDomTreeNode
@ First
Helpers to iterate all locations in the MemoryEffectsBase class.
iterator_range< df_iterator< T > > depth_first(const T &G)
IterT prev_nodbg(IterT It, IterT Begin, bool SkipPseudoOp=true)
Decrement It, then continue decrementing it while it points to a debug instruction.
LLVM_ABI Printable printMBBReference(const MachineBasicBlock &MBB)
Prints a machine basic block reference.