63#define DEBUG_TYPE "regalloc"
65STATISTIC(numJoins ,
"Number of interval joins performed");
66STATISTIC(numCrossRCs ,
"Number of cross class joins performed");
67STATISTIC(numCommutes ,
"Number of instruction commuting performed");
69STATISTIC(NumReMats ,
"Number of instructions re-materialized");
70STATISTIC(NumInflated ,
"Number of register classes inflated");
71STATISTIC(NumLaneConflicts,
"Number of dead lane conflicts tested");
72STATISTIC(NumLaneResolves,
"Number of dead lane conflicts resolved");
73STATISTIC(NumShrinkToUses,
"Number of shrinkToUses called");
76 cl::desc(
"Coalesce copies (default=true)"),
91 cl::desc(
"Coalesce copies that span blocks (default=subtarget)"),
96 cl::desc(
"Verify machine instrs before and after register coalescing"),
101 cl::desc(
"During rematerialization for a copy, if the def instruction has "
102 "many other copy uses to be rematerialized, delay the multiple "
103 "separate live interval update work and do them all at once after "
104 "all those rematerialization are done. It will save a lot of "
110 cl::desc(
"If the valnos size of an interval is larger than the threshold, "
111 "it is regarded as a large interval. "),
116 cl::desc(
"For a large interval, if it is coalesed with other live "
117 "intervals many times more than the threshold, stop its "
118 "coalescing to control the compile time. "),
153 using DbgValueLoc = std::pair<SlotIndex, MachineInstr*>;
162 bool ShrinkMainRange =
false;
166 bool JoinGlobalCopies =
false;
170 bool JoinSplitEdges =
false;
202 void coalesceLocals();
205 void joinAllIntervals();
220 void lateLiveIntervalUpdate();
225 bool copyValueUndefInPredecessors(
LiveRange &S,
290 std::pair<bool,bool> removeCopyByCommutingDef(
const CoalescerPair &CP,
361 MI->eraseFromParent();
397char RegisterCoalescer::ID = 0;
402 "Register Coalescer",
false,
false)
415 Dst =
MI->getOperand(0).getReg();
416 DstSub =
MI->getOperand(0).getSubReg();
417 Src =
MI->getOperand(1).getReg();
418 SrcSub =
MI->getOperand(1).getSubReg();
419 }
else if (
MI->isSubregToReg()) {
420 Dst =
MI->getOperand(0).getReg();
421 DstSub = tri.composeSubRegIndices(
MI->getOperand(0).getSubReg(),
422 MI->getOperand(3).getImm());
423 Src =
MI->getOperand(2).getReg();
424 SrcSub =
MI->getOperand(2).getSubReg();
439 for (
const auto &
MI : *
MBB) {
440 if (!
MI.isCopyLike() && !
MI.isUnconditionalBranch())
450 Flipped = CrossClass =
false;
453 unsigned SrcSub = 0, DstSub = 0;
456 Partial = SrcSub || DstSub;
459 if (Src.isPhysical()) {
460 if (Dst.isPhysical())
469 if (Dst.isPhysical()) {
472 Dst =
TRI.getSubReg(Dst, DstSub);
473 if (!Dst)
return false;
479 Dst =
TRI.getMatchingSuperReg(Dst, SrcSub,
MRI.getRegClass(Src));
480 if (!Dst)
return false;
481 }
else if (!
MRI.getRegClass(Src)->contains(Dst)) {
490 if (SrcSub && DstSub) {
492 if (Src == Dst && SrcSub != DstSub)
495 NewRC =
TRI.getCommonSuperRegClass(SrcRC, SrcSub, DstRC, DstSub,
502 NewRC =
TRI.getMatchingSuperRegClass(DstRC, SrcRC, DstSub);
506 NewRC =
TRI.getMatchingSuperRegClass(SrcRC, DstRC, SrcSub);
509 NewRC =
TRI.getCommonSubClass(DstRC, SrcRC);
518 if (DstIdx && !SrcIdx) {
524 CrossClass = NewRC != DstRC || NewRC != SrcRC;
527 assert(Src.isVirtual() &&
"Src must be virtual");
528 assert(!(Dst.isPhysical() && DstSub) &&
"Cannot have a physical SubIdx");
547 unsigned SrcSub = 0, DstSub = 0;
555 }
else if (Src != SrcReg) {
561 if (!Dst.isPhysical())
563 assert(!DstIdx && !SrcIdx &&
"Inconsistent CoalescerPair state.");
566 Dst =
TRI.getSubReg(Dst, DstSub);
569 return DstReg == Dst;
571 return Register(
TRI.getSubReg(DstReg, SrcSub)) == Dst;
577 return TRI.composeSubRegIndices(SrcIdx, SrcSub) ==
578 TRI.composeSubRegIndices(DstIdx, DstSub);
582void RegisterCoalescer::getAnalysisUsage(
AnalysisUsage &AU)
const {
594void RegisterCoalescer::eliminateDeadDefs(
LiveRangeEdit *Edit) {
604void RegisterCoalescer::LRE_WillEraseInstruction(
MachineInstr *
MI) {
609bool RegisterCoalescer::adjustCopiesBackFrom(
const CoalescerPair &CP,
611 assert(!
CP.isPartial() &&
"This doesn't work for partial copies.");
612 assert(!
CP.isPhys() &&
"This doesn't work for physreg copies.");
637 if (BS == IntB.
end())
return false;
638 VNInfo *BValNo = BS->valno;
643 if (BValNo->
def != CopyIdx)
return false;
649 if (AS == IntA.
end())
return false;
650 VNInfo *AValNo = AS->valno;
656 if (!
CP.isCoalescable(ACopyMI) || !ACopyMI->
isFullCopy())
662 if (ValS == IntB.
end())
675 if (ValS+1 != BS)
return false;
679 SlotIndex FillerStart = ValS->end, FillerEnd = BS->start;
683 BValNo->
def = FillerStart;
691 if (BValNo != ValS->valno)
700 S.removeSegment(*SS,
true);
704 if (!S.getVNInfoAt(FillerStart)) {
707 S.extendInBlock(BBStart, FillerStart);
709 VNInfo *SubBValNo = S.getVNInfoAt(CopyIdx);
712 if (SubBValNo != SubValSNo)
713 S.MergeValueNumberInto(SubBValNo, SubValSNo);
729 bool RecomputeLiveRange = AS->end == CopyIdx;
730 if (!RecomputeLiveRange) {
733 if (SS != S.end() &&
SS->end == CopyIdx) {
734 RecomputeLiveRange =
true;
739 if (RecomputeLiveRange)
746bool RegisterCoalescer::hasOtherReachingDefs(
LiveInterval &IntA,
756 if (ASeg.
valno != AValNo)
continue;
758 if (BI != IntB.
begin())
760 for (; BI != IntB.
end() && ASeg.
end >= BI->start; ++BI) {
761 if (BI->valno == BValNo)
763 if (BI->start <= ASeg.
start && BI->end > ASeg.
start)
765 if (BI->start > ASeg.
start && BI->start < ASeg.
end)
774static std::pair<bool,bool>
777 bool Changed =
false;
778 bool MergedWithDead =
false;
780 if (S.
valno != SrcValNo)
791 MergedWithDead =
true;
794 return std::make_pair(Changed, MergedWithDead);
798RegisterCoalescer::removeCopyByCommutingDef(
const CoalescerPair &CP,
831 assert(BValNo !=
nullptr && BValNo->
def == CopyIdx);
837 return {
false,
false };
840 return {
false,
false };
842 return {
false,
false };
849 return {
false,
false };
861 if (!
TII->findCommutedOpIndices(*
DefMI, UseOpIdx, NewDstIdx))
862 return {
false,
false };
867 return {
false,
false };
871 if (hasOtherReachingDefs(IntA, IntB, AValNo, BValNo))
872 return {
false,
false };
881 if (US == IntA.
end() || US->valno != AValNo)
885 return {
false,
false };
895 TII->commuteInstruction(*
DefMI,
false, UseOpIdx, NewDstIdx);
897 return {
false,
false };
899 !
MRI->constrainRegClass(IntB.
reg(),
MRI->getRegClass(IntA.
reg())))
900 return {
false,
false };
901 if (NewMI !=
DefMI) {
926 UseMO.setReg(NewReg);
931 assert(US != IntA.
end() &&
"Use must be live");
932 if (US->valno != AValNo)
935 UseMO.setIsKill(
false);
937 UseMO.substPhysReg(NewReg, *
TRI);
939 UseMO.setReg(NewReg);
958 VNInfo *SubDVNI = S.getVNInfoAt(DefIdx);
961 VNInfo *SubBValNo = S.getVNInfoAt(CopyIdx);
963 S.MergeValueNumberInto(SubDVNI, SubBValNo);
971 bool ShrinkB =
false;
985 VNInfo *ASubValNo = SA.getVNInfoAt(AIdx);
994 MaskA |= SA.LaneMask;
997 Allocator, SA.LaneMask,
998 [&Allocator, &SA, CopyIdx, ASubValNo,
1000 VNInfo *BSubValNo = SR.empty() ? SR.getNextValue(CopyIdx, Allocator)
1001 : SR.getVNInfoAt(CopyIdx);
1002 assert(BSubValNo != nullptr);
1003 auto P = addSegmentsWithValNo(SR, BSubValNo, SA, ASubValNo);
1004 ShrinkB |= P.second;
1006 BSubValNo->def = ASubValNo->def;
1014 if ((SB.LaneMask & MaskA).any())
1018 SB.removeSegment(*S,
true);
1022 BValNo->
def = AValNo->
def;
1024 ShrinkB |=
P.second;
1031 return {
true, ShrinkB };
1081bool RegisterCoalescer::removePartialRedundancy(
const CoalescerPair &CP,
1114 bool FoundReverseCopy =
false;
1133 bool ValB_Changed =
false;
1134 for (
auto *VNI : IntB.
valnos) {
1135 if (VNI->isUnused())
1138 ValB_Changed =
true;
1146 FoundReverseCopy =
true;
1150 if (!FoundReverseCopy)
1160 if (CopyLeftBB && CopyLeftBB->
succ_size() > 1)
1171 if (InsPos != CopyLeftBB->
end()) {
1177 LLVM_DEBUG(
dbgs() <<
"\tremovePartialRedundancy: Move the copy to "
1182 TII->get(TargetOpcode::COPY), IntB.
reg())
1193 ErasedInstrs.
erase(NewCopyMI);
1195 LLVM_DEBUG(
dbgs() <<
"\tremovePartialRedundancy: Remove the copy from "
1204 deleteInstr(&CopyMI);
1218 VNInfo *BValNo = SR.Query(CopyIdx).valueOutOrDead();
1219 assert(BValNo &&
"All sublanes should be live");
1228 for (
unsigned I = 0;
I != EndPoints.
size(); ) {
1230 EndPoints[
I] = EndPoints.
back();
1252 assert(!Reg.isPhysical() &&
"This code cannot handle physreg aliasing");
1255 if (
Op.getReg() != Reg)
1259 if (
Op.getSubReg() == 0 ||
Op.isUndef())
1265bool RegisterCoalescer::reMaterializeTrivialDef(
const CoalescerPair &CP,
1269 Register SrcReg =
CP.isFlipped() ?
CP.getDstReg() :
CP.getSrcReg();
1270 unsigned SrcIdx =
CP.isFlipped() ?
CP.getDstIdx() :
CP.getSrcIdx();
1271 Register DstReg =
CP.isFlipped() ?
CP.getSrcReg() :
CP.getDstReg();
1272 unsigned DstIdx =
CP.isFlipped() ?
CP.getSrcIdx() :
CP.getDstIdx();
1294 LiveRangeEdit Edit(&SrcInt, NewRegs, *MF, *LIS,
nullptr,
this);
1300 bool SawStore =
false;
1317 if (SrcIdx && DstIdx)
1325 unsigned NewDstIdx =
TRI->composeSubRegIndices(
CP.getSrcIdx(),
1328 NewDstReg =
TRI->getSubReg(DstReg, NewDstIdx);
1338 "Only expect to deal with virtual or physical registers");
1364 assert(SrcIdx == 0 &&
CP.isFlipped()
1365 &&
"Shouldn't have SrcIdx+DstIdx at this point");
1368 TRI->getCommonSubClass(DefRC, DstRC);
1369 if (CommonRC !=
nullptr) {
1377 if (MO.isReg() && MO.getReg() == DstReg && MO.getSubReg() == DstIdx) {
1398 assert(MO.
isImplicit() &&
"No explicit operands after implicit operands.");
1405 ErasedInstrs.
insert(CopyMI);
1424 if (DefRC !=
nullptr) {
1426 NewRC =
TRI->getMatchingSuperRegClass(NewRC, DefRC, NewIdx);
1428 NewRC =
TRI->getCommonSubClass(NewRC, DefRC);
1429 assert(NewRC &&
"subreg chosen for remat incompatible with instruction");
1434 SR.LaneMask =
TRI->composeSubRegIndexLaneMask(DstIdx, SR.LaneMask);
1436 MRI->setRegClass(DstReg, NewRC);
1439 updateRegDefsUses(DstReg, DstReg, DstIdx);
1467 if (!SR.liveAt(DefIndex))
1468 SR.createDeadDef(DefIndex,
Alloc);
1469 MaxMask &= ~SR.LaneMask;
1471 if (MaxMask.
any()) {
1489 bool UpdatedSubRanges =
false;
1494 if ((SR.
LaneMask & DstMask).none()) {
1496 <<
"Removing undefined SubRange "
1509 UpdatedSubRanges =
true;
1520 if (UpdatedSubRanges)
1527 "Only expect virtual or physical registers in remat");
1530 CopyDstReg,
true ,
true ,
false ));
1561 for (
unsigned i = 0, e = NewMIImplDefs.
size(); i != e; ++i) {
1573 if (
MRI->use_nodbg_empty(SrcReg)) {
1579 UseMO.substPhysReg(DstReg, *
TRI);
1581 UseMO.setReg(DstReg);
1590 if (ToBeUpdated.
count(SrcReg))
1593 unsigned NumCopyUses = 0;
1595 if (UseMO.getParent()->isCopyLike())
1601 if (!DeadDefs.
empty())
1602 eliminateDeadDefs(&Edit);
1604 ToBeUpdated.
insert(SrcReg);
1622 unsigned SrcSubIdx = 0, DstSubIdx = 0;
1623 if(!
isMoveInstr(*
TRI, CopyMI, SrcReg, DstReg, SrcSubIdx, DstSubIdx))
1632 if ((SR.
LaneMask & SrcMask).none())
1645 assert(Seg !=
nullptr &&
"No segment for defining instruction");
1650 if (((V &&
V->isPHIDef()) || (!V && !DstLI.
liveAt(
Idx)))) {
1651 CopyMI->
setDesc(
TII->get(TargetOpcode::IMPLICIT_DEF));
1673 if ((SR.
LaneMask & DstMask).none())
1695 if ((SR.
LaneMask & UseMask).none())
1703 isLive = DstLI.
liveAt(UseIdx);
1716 if (MO.
getReg() == DstReg)
1728 bool IsUndef =
true;
1730 if ((S.LaneMask & Mask).none())
1732 if (S.liveAt(UseIdx)) {
1745 ShrinkMainRange =
true;
1754 if (DstInt && DstInt->
hasSubRanges() && DstReg != SrcReg) {
1760 if (
MI.isDebugInstr())
1763 addUndefFlag(*DstInt, UseIdx, MO,
SubReg);
1769 I =
MRI->reg_instr_begin(SrcReg),
E =
MRI->reg_instr_end();
1778 if (SrcReg == DstReg && !Visited.
insert(
UseMI).second)
1791 for (
unsigned i = 0, e = Ops.
size(); i != e; ++i) {
1797 if (SubIdx && MO.
isDef())
1802 if (MO.
isUse() && !DstIsPhys) {
1803 unsigned SubUseIdx =
TRI->composeSubRegIndices(SubIdx, MO.
getSubReg());
1804 if (SubUseIdx != 0 &&
MRI->shouldTrackSubRegLiveness(DstReg)) {
1821 addUndefFlag(*DstInt, UseIdx, MO, SubUseIdx);
1832 dbgs() <<
"\t\tupdated: ";
1840bool RegisterCoalescer::canJoinPhys(
const CoalescerPair &CP) {
1844 if (!
MRI->isReserved(
CP.getDstReg())) {
1845 LLVM_DEBUG(
dbgs() <<
"\tCan only merge into reserved registers.\n");
1854 dbgs() <<
"\tCannot join complex intervals into reserved register.\n");
1858bool RegisterCoalescer::copyValueUndefInPredecessors(
1872void RegisterCoalescer::setUndefOnPrunedSubRegUses(
LiveInterval &LI,
1879 if (SubRegIdx == 0 || MO.
isUndef())
1885 if (!S.
liveAt(Pos) && (PrunedLanes & SubRegMask).any()) {
1901bool RegisterCoalescer::joinCopy(
MachineInstr *CopyMI,
bool &Again) {
1906 if (!
CP.setRegisters(CopyMI)) {
1911 if (
CP.getNewRC()) {
1912 auto SrcRC =
MRI->getRegClass(
CP.getSrcReg());
1913 auto DstRC =
MRI->getRegClass(
CP.getDstReg());
1914 unsigned SrcIdx =
CP.getSrcIdx();
1915 unsigned DstIdx =
CP.getDstIdx();
1916 if (
CP.isFlipped()) {
1920 if (!
TRI->shouldCoalesce(CopyMI, SrcRC, SrcIdx, DstRC, DstIdx,
1921 CP.getNewRC(), *LIS)) {
1933 eliminateDeadDefs();
1940 if (
MachineInstr *UndefMI = eliminateUndefCopy(CopyMI)) {
1941 if (UndefMI->isImplicitDef())
1943 deleteInstr(CopyMI);
1951 if (
CP.getSrcReg() ==
CP.getDstReg()) {
1953 LLVM_DEBUG(
dbgs() <<
"\tCopy already coalesced: " << LI <<
'\n');
1958 assert(ReadVNI &&
"No value before copy and no <undef> flag.");
1959 assert(ReadVNI != DefVNI &&
"Cannot read and define the same value.");
1974 if (copyValueUndefInPredecessors(S,
MBB, SLRQ)) {
1975 LLVM_DEBUG(
dbgs() <<
"Incoming sublane value is undef at copy\n");
1976 PrunedLanes |= S.LaneMask;
1983 if (PrunedLanes.
any()) {
1985 << PrunedLanes <<
'\n');
1986 setUndefOnPrunedSubRegUses(LI,
CP.getSrcReg(), PrunedLanes);
1991 deleteInstr(CopyMI);
2000 if (!canJoinPhys(CP)) {
2003 bool IsDefCopy =
false;
2004 if (reMaterializeTrivialDef(CP, CopyMI, IsDefCopy))
2017 dbgs() <<
"\tConsidering merging to "
2018 <<
TRI->getRegClassName(
CP.getNewRC()) <<
" with ";
2019 if (
CP.getDstIdx() &&
CP.getSrcIdx())
2021 <<
TRI->getSubRegIndexName(
CP.getDstIdx()) <<
" and "
2023 <<
TRI->getSubRegIndexName(
CP.getSrcIdx()) <<
'\n';
2031 ShrinkMainRange =
false;
2037 if (!joinIntervals(CP)) {
2042 bool IsDefCopy =
false;
2043 if (reMaterializeTrivialDef(CP, CopyMI, IsDefCopy))
2048 if (!
CP.isPartial() && !
CP.isPhys()) {
2049 bool Changed = adjustCopiesBackFrom(CP, CopyMI);
2050 bool Shrink =
false;
2052 std::tie(Changed, Shrink) = removeCopyByCommutingDef(CP, CopyMI);
2054 deleteInstr(CopyMI);
2056 Register DstReg =
CP.isFlipped() ?
CP.getSrcReg() :
CP.getDstReg();
2068 if (!
CP.isPartial() && !
CP.isPhys())
2069 if (removePartialRedundancy(CP, *CopyMI))
2080 if (
CP.isCrossClass()) {
2082 MRI->setRegClass(
CP.getDstReg(),
CP.getNewRC());
2093 ErasedInstrs.
erase(CopyMI);
2098 updateRegDefsUses(
CP.getDstReg(),
CP.getDstReg(),
CP.getDstIdx());
2099 updateRegDefsUses(
CP.getSrcReg(),
CP.getDstReg(),
CP.getSrcIdx());
2102 if (ShrinkMask.
any()) {
2105 if ((S.LaneMask & ShrinkMask).none())
2110 ShrinkMainRange =
true;
2118 if (ToBeUpdated.
count(
CP.getSrcReg()))
2119 ShrinkMainRange =
true;
2121 if (ShrinkMainRange) {
2131 TRI->updateRegAllocHint(
CP.getSrcReg(),
CP.getDstReg(), *MF);
2136 dbgs() <<
"\tResult = ";
2148bool RegisterCoalescer::joinReservedPhysReg(
CoalescerPair &CP) {
2151 assert(
CP.isPhys() &&
"Must be a physreg copy");
2152 assert(
MRI->isReserved(DstReg) &&
"Not a reserved register");
2156 assert(
RHS.containsOneValue() &&
"Invalid join with reserved register");
2165 if (!
MRI->isConstantPhysReg(DstReg)) {
2169 if (!
MRI->isReserved(*RI))
2182 !RegMaskUsable.
test(DstReg)) {
2195 if (
CP.isFlipped()) {
2203 CopyMI =
MRI->getVRegDef(SrcReg);
2204 deleteInstr(CopyMI);
2213 if (!
MRI->hasOneNonDBGUse(SrcReg)) {
2224 CopyMI = &*
MRI->use_instr_nodbg_begin(SrcReg);
2228 if (!
MRI->isConstantPhysReg(DstReg)) {
2236 if (
MI->readsRegister(DstReg,
TRI)) {
2246 <<
printReg(DstReg,
TRI) <<
" at " << CopyRegIdx <<
"\n");
2249 deleteInstr(CopyMI);
2259 MRI->clearKillFlags(
CP.getSrcReg());
2344 const unsigned SubIdx;
2352 const bool SubRangeJoin;
2355 const bool TrackSubRegLiveness;
2371 enum ConflictResolution {
2403 ConflictResolution Resolution = CR_Keep;
2413 VNInfo *RedefVNI =
nullptr;
2416 VNInfo *OtherVNI =
nullptr;
2429 bool ErasableImplicitDef =
false;
2433 bool Pruned =
false;
2436 bool PrunedComputed =
false;
2443 bool Identical =
false;
2447 bool isAnalyzed()
const {
return WriteLanes.
any(); }
2454 ErasableImplicitDef =
false;
2468 std::pair<const VNInfo *, Register> followCopyChain(
const VNInfo *VNI)
const;
2470 bool valuesIdentical(
VNInfo *Value0,
VNInfo *Value1,
const JoinVals &
Other)
const;
2479 ConflictResolution analyzeValue(
unsigned ValNo, JoinVals &
Other);
2484 void computeAssignment(
unsigned ValNo, JoinVals &
Other);
2515 bool isPrunedValue(
unsigned ValNo, JoinVals &
Other);
2521 bool TrackSubRegLiveness)
2522 : LR(LR),
Reg(
Reg), SubIdx(SubIdx), LaneMask(LaneMask),
2523 SubRangeJoin(SubRangeJoin), TrackSubRegLiveness(TrackSubRegLiveness),
2524 NewVNInfo(newVNInfo),
CP(cp), LIS(lis), Indexes(LIS->getSlotIndexes()),
2525 TRI(
TRI), Assignments(LR.getNumValNums(), -1),
2526 Vals(LR.getNumValNums()) {}
2530 bool mapValues(JoinVals &
Other);
2534 bool resolveConflicts(JoinVals &
Other);
2554 void pruneMainSegments(
LiveInterval &LI,
bool &ShrinkMainRange);
2565 void removeImplicitDefs();
2568 const int *getAssignments()
const {
return Assignments.
data(); }
2571 ConflictResolution getResolution(
unsigned Num)
const {
2572 return Vals[Num].Resolution;
2584 L |=
TRI->getSubRegIndexLaneMask(
2592std::pair<const VNInfo *, Register>
2593JoinVals::followCopyChain(
const VNInfo *VNI)
const {
2599 assert(
MI &&
"No defining instruction");
2600 if (!
MI->isFullCopy())
2601 return std::make_pair(VNI, TrackReg);
2602 Register SrcReg =
MI->getOperand(1).getReg();
2604 return std::make_pair(VNI, TrackReg);
2618 LaneBitmask SMask =
TRI->composeSubRegIndexLaneMask(SubIdx, S.LaneMask);
2619 if ((SMask & LaneMask).
none())
2627 return std::make_pair(VNI, TrackReg);
2630 if (ValueIn ==
nullptr) {
2637 return std::make_pair(
nullptr, SrcReg);
2642 return std::make_pair(VNI, TrackReg);
2645bool JoinVals::valuesIdentical(
VNInfo *Value0,
VNInfo *Value1,
2646 const JoinVals &
Other)
const {
2649 std::tie(Orig0, Reg0) = followCopyChain(Value0);
2650 if (Orig0 == Value1 && Reg0 ==
Other.Reg)
2655 std::tie(Orig1, Reg1) =
Other.followCopyChain(Value1);
2659 if (Orig0 ==
nullptr || Orig1 ==
nullptr)
2660 return Orig0 == Orig1 && Reg0 == Reg1;
2666 return Orig0->
def == Orig1->
def && Reg0 == Reg1;
2669JoinVals::ConflictResolution
2670JoinVals::analyzeValue(
unsigned ValNo, JoinVals &
Other) {
2671 Val &
V = Vals[ValNo];
2672 assert(!
V.isAnalyzed() &&
"Value has already been analyzed!");
2684 :
TRI->getSubRegIndexLaneMask(SubIdx);
2685 V.ValidLanes =
V.WriteLanes = Lanes;
2694 V.ErasableImplicitDef =
true;
2698 V.ValidLanes =
V.WriteLanes = computeWriteLanes(
DefMI, Redef);
2717 assert((TrackSubRegLiveness ||
V.RedefVNI) &&
2718 "Instruction is reading nonexistent value");
2719 if (
V.RedefVNI !=
nullptr) {
2720 computeAssignment(
V.RedefVNI->id,
Other);
2721 V.ValidLanes |= Vals[
V.RedefVNI->id].ValidLanes;
2733 V.ErasableImplicitDef =
true;
2750 if (OtherVNI->
def < VNI->
def)
2751 Other.computeAssignment(OtherVNI->
id, *
this);
2756 return CR_Impossible;
2758 V.OtherVNI = OtherVNI;
2759 Val &OtherV =
Other.Vals[OtherVNI->
id];
2763 if (!OtherV.isAnalyzed() ||
Other.Assignments[OtherVNI->
id] == -1)
2770 if ((
V.ValidLanes & OtherV.ValidLanes).any())
2772 return CR_Impossible;
2787 Other.computeAssignment(
V.OtherVNI->id, *
this);
2788 Val &OtherV =
Other.Vals[
V.OtherVNI->id];
2790 if (OtherV.ErasableImplicitDef) {
2810 <<
", keeping it.\n");
2811 OtherV.mustKeepImplicitDef(*
TRI, *OtherImpDef);
2818 dbgs() <<
"IMPLICIT_DEF defined at " <<
V.OtherVNI->def
2819 <<
" may be live into EH pad successors, keeping it.\n");
2820 OtherV.mustKeepImplicitDef(*
TRI, *OtherImpDef);
2823 OtherV.ValidLanes &= ~OtherV.WriteLanes;
2838 if (
CP.isCoalescable(
DefMI)) {
2841 V.ValidLanes &= ~V.WriteLanes | OtherV.ValidLanes;
2856 valuesIdentical(VNI,
V.OtherVNI,
Other)) {
2879 if ((
V.WriteLanes & OtherV.ValidLanes).none())
2892 "Only early clobber defs can overlap a kill");
2893 return CR_Impossible;
2900 if ((
TRI->getSubRegIndexLaneMask(
Other.SubIdx) & ~
V.WriteLanes).none())
2901 return CR_Impossible;
2903 if (TrackSubRegLiveness) {
2908 if (!OtherLI.hasSubRanges()) {
2910 return (OtherMask &
V.WriteLanes).none() ? CR_Replace : CR_Impossible;
2918 TRI->composeSubRegIndexLaneMask(
Other.SubIdx, OtherSR.LaneMask);
2919 if ((OtherMask &
V.WriteLanes).none())
2922 auto OtherSRQ = OtherSR.Query(VNI->
def);
2923 if (OtherSRQ.valueIn() && OtherSRQ.endPoint() > VNI->
def) {
2925 return CR_Impossible;
2938 return CR_Impossible;
2947 return CR_Unresolved;
2950void JoinVals::computeAssignment(
unsigned ValNo, JoinVals &
Other) {
2951 Val &
V = Vals[ValNo];
2952 if (
V.isAnalyzed()) {
2955 assert(Assignments[ValNo] != -1 &&
"Bad recursion?");
2958 switch ((
V.Resolution = analyzeValue(ValNo,
Other))) {
2962 assert(
V.OtherVNI &&
"OtherVNI not assigned, can't merge.");
2963 assert(
Other.Vals[
V.OtherVNI->id].isAnalyzed() &&
"Missing recursion");
2964 Assignments[ValNo] =
Other.Assignments[
V.OtherVNI->id];
2968 <<
V.OtherVNI->def <<
" --> @"
2969 << NewVNInfo[Assignments[ValNo]]->def <<
'\n');
2972 case CR_Unresolved: {
2974 assert(
V.OtherVNI &&
"OtherVNI not assigned, can't prune");
2975 Val &OtherV =
Other.Vals[
V.OtherVNI->id];
2976 OtherV.Pruned =
true;
2981 Assignments[ValNo] = NewVNInfo.
size();
2987bool JoinVals::mapValues(JoinVals &
Other) {
2989 computeAssignment(i,
Other);
2990 if (Vals[i].Resolution == CR_Impossible) {
3008 assert(OtherI !=
Other.LR.end() &&
"No conflict?");
3013 if (
End >= MBBEnd) {
3015 << OtherI->valno->id <<
'@' << OtherI->start <<
'\n');
3019 << OtherI->valno->id <<
'@' << OtherI->start <<
" to "
3024 TaintExtent.push_back(std::make_pair(
End, TaintedLanes));
3027 if (++OtherI ==
Other.LR.end() || OtherI->start >= MBBEnd)
3031 const Val &OV =
Other.Vals[OtherI->valno->id];
3032 TaintedLanes &= ~OV.WriteLanes;
3035 }
while (TaintedLanes.
any());
3041 if (
MI.isDebugOrPseudoInstr())
3048 unsigned S =
TRI->composeSubRegIndices(SubIdx, MO.
getSubReg());
3049 if ((Lanes &
TRI->getSubRegIndexLaneMask(S)).any())
3055bool JoinVals::resolveConflicts(JoinVals &
Other) {
3058 assert(
V.Resolution != CR_Impossible &&
"Unresolvable conflict");
3059 if (
V.Resolution != CR_Unresolved)
3068 assert(
V.OtherVNI &&
"Inconsistent conflict resolution.");
3070 const Val &OtherV =
Other.Vals[
V.OtherVNI->id];
3075 LaneBitmask TaintedLanes =
V.WriteLanes & OtherV.ValidLanes;
3077 if (!taintExtent(i, TaintedLanes,
Other, TaintExtent))
3081 assert(!TaintExtent.
empty() &&
"There should be at least one conflict.");
3094 "Interference ends on VNI->def. Should have been handled earlier");
3097 assert(LastMI &&
"Range must end at a proper instruction");
3098 unsigned TaintNum = 0;
3101 if (usesLanes(*
MI,
Other.Reg,
Other.SubIdx, TaintedLanes)) {
3106 if (&*
MI == LastMI) {
3107 if (++TaintNum == TaintExtent.
size())
3110 assert(LastMI &&
"Range must end at a proper instruction");
3111 TaintedLanes = TaintExtent[TaintNum].second;
3117 V.Resolution = CR_Replace;
3123bool JoinVals::isPrunedValue(
unsigned ValNo, JoinVals &
Other) {
3124 Val &
V = Vals[ValNo];
3125 if (
V.Pruned ||
V.PrunedComputed)
3128 if (
V.Resolution != CR_Erase &&
V.Resolution != CR_Merge)
3133 V.PrunedComputed =
true;
3134 V.Pruned =
Other.isPrunedValue(
V.OtherVNI->id, *
this);
3138void JoinVals::pruneValues(JoinVals &
Other,
3140 bool changeInstrs) {
3143 switch (Vals[i].Resolution) {
3153 Val &OtherV =
Other.Vals[Vals[i].OtherVNI->id];
3154 bool EraseImpDef = OtherV.ErasableImplicitDef &&
3155 OtherV.Resolution == CR_Keep;
3156 if (!
Def.isBlock()) {
3176 <<
": " <<
Other.LR <<
'\n');
3181 if (isPrunedValue(i,
Other)) {
3188 << Def <<
": " << LR <<
'\n');
3246 bool DidPrune =
false;
3251 if (
V.Resolution != CR_Erase &&
3252 (
V.Resolution != CR_Keep || !
V.ErasableImplicitDef || !
V.Pruned))
3259 OtherDef =
V.OtherVNI->def;
3262 LLVM_DEBUG(
dbgs() <<
"\t\tExpecting instruction removal at " << Def
3270 if (ValueOut !=
nullptr && (Q.
valueIn() ==
nullptr ||
3271 (
V.Identical &&
V.Resolution == CR_Erase &&
3272 ValueOut->
def == Def))) {
3274 <<
" at " << Def <<
"\n");
3281 if (
V.Identical && S.Query(OtherDef).valueOutOrDead()) {
3291 ShrinkMask |= S.LaneMask;
3305 ShrinkMask |= S.LaneMask;
3317 if (VNI->
def == Def)
3323void JoinVals::pruneMainSegments(
LiveInterval &LI,
bool &ShrinkMainRange) {
3327 if (Vals[i].Resolution != CR_Keep)
3332 Vals[i].Pruned =
true;
3333 ShrinkMainRange =
true;
3337void JoinVals::removeImplicitDefs() {
3340 if (
V.Resolution != CR_Keep || !
V.ErasableImplicitDef || !
V.Pruned)
3356 switch (Vals[i].Resolution) {
3361 if (!Vals[i].ErasableImplicitDef || !Vals[i].Pruned)
3373 if (LI !=
nullptr) {
3398 ED = ED.
isValid() ? std::min(ED,
I->start) :
I->start;
3400 LE =
LE.isValid() ? std::max(LE,
I->end) :
I->
end;
3403 NewEnd = std::min(NewEnd, LE);
3405 NewEnd = std::min(NewEnd, ED);
3411 if (S != LR.
begin())
3412 std::prev(S)->end = NewEnd;
3416 dbgs() <<
"\t\tremoved " << i <<
'@' <<
Def <<
": " << LR <<
'\n';
3418 dbgs() <<
"\t\t LHS = " << *LI <<
'\n';
3425 assert(
MI &&
"No instruction to erase");
3428 if (
Reg.isVirtual() && Reg !=
CP.getSrcReg() && Reg !=
CP.getDstReg())
3434 MI->eraseFromParent();
3447 JoinVals RHSVals(RRange,
CP.getSrcReg(),
CP.getSrcIdx(), LaneMask,
3448 NewVNInfo, CP, LIS,
TRI,
true,
true);
3449 JoinVals LHSVals(LRange,
CP.getDstReg(),
CP.getDstIdx(), LaneMask,
3450 NewVNInfo, CP, LIS,
TRI,
true,
true);
3457 if (!LHSVals.mapValues(RHSVals) || !RHSVals.mapValues(LHSVals)) {
3462 if (!LHSVals.resolveConflicts(RHSVals) ||
3463 !RHSVals.resolveConflicts(LHSVals)) {
3474 LHSVals.pruneValues(RHSVals, EndPoints,
false);
3475 RHSVals.pruneValues(LHSVals, EndPoints,
false);
3477 LHSVals.removeImplicitDefs();
3478 RHSVals.removeImplicitDefs();
3484 LRange.
join(RRange, LHSVals.getAssignments(), RHSVals.getAssignments(),
3488 <<
' ' << LRange <<
"\n");
3489 if (EndPoints.
empty())
3495 dbgs() <<
"\t\trestoring liveness to " << EndPoints.
size() <<
" points: ";
3496 for (
unsigned i = 0, n = EndPoints.
size(); i != n; ++i) {
3497 dbgs() << EndPoints[i];
3501 dbgs() <<
": " << LRange <<
'\n';
3506void RegisterCoalescer::mergeSubRangeInto(
LiveInterval &LI,
3510 unsigned ComposeSubRegIdx) {
3513 Allocator, LaneMask,
3516 SR.assign(ToMerge, Allocator);
3519 LiveRange RangeCopy(ToMerge, Allocator);
3520 joinSubRegRanges(SR, RangeCopy, SR.LaneMask, CP);
3526bool RegisterCoalescer::isHighCostLiveInterval(
LiveInterval &LI) {
3529 auto &Counter = LargeLIVisitCounter[LI.
reg()];
3541 bool TrackSubRegLiveness =
MRI->shouldTrackSubRegLiveness(*
CP.getNewRC());
3543 NewVNInfo, CP, LIS,
TRI,
false, TrackSubRegLiveness);
3545 NewVNInfo, CP, LIS,
TRI,
false, TrackSubRegLiveness);
3547 LLVM_DEBUG(
dbgs() <<
"\t\tRHS = " << RHS <<
"\n\t\tLHS = " << LHS <<
'\n');
3549 if (isHighCostLiveInterval(LHS) || isHighCostLiveInterval(RHS))
3554 if (!LHSVals.mapValues(RHSVals) || !RHSVals.mapValues(LHSVals))
3558 if (!LHSVals.resolveConflicts(RHSVals) || !RHSVals.resolveConflicts(LHSVals))
3562 if (
RHS.hasSubRanges() ||
LHS.hasSubRanges()) {
3567 unsigned DstIdx =
CP.getDstIdx();
3568 if (!
LHS.hasSubRanges()) {
3570 :
TRI->getSubRegIndexLaneMask(DstIdx);
3573 LHS.createSubRangeFrom(Allocator, Mask, LHS);
3574 }
else if (DstIdx != 0) {
3585 unsigned SrcIdx =
CP.getSrcIdx();
3586 if (!
RHS.hasSubRanges()) {
3588 :
TRI->getSubRegIndexLaneMask(SrcIdx);
3589 mergeSubRangeInto(LHS, RHS, Mask, CP, DstIdx);
3594 mergeSubRangeInto(LHS, R, Mask, CP, DstIdx);
3601 LHSVals.pruneMainSegments(LHS, ShrinkMainRange);
3603 LHSVals.pruneSubRegValues(LHS, ShrinkMask);
3604 RHSVals.pruneSubRegValues(LHS, ShrinkMask);
3612 LHSVals.pruneValues(RHSVals, EndPoints,
true);
3613 RHSVals.pruneValues(LHSVals, EndPoints,
true);
3618 LHSVals.eraseInstrs(ErasedInstrs, ShrinkRegs, &LHS);
3619 RHSVals.eraseInstrs(ErasedInstrs, ShrinkRegs);
3620 while (!ShrinkRegs.
empty())
3624 checkMergingChangesDbgValues(CP, LHS, LHSVals, RHS, RHSVals);
3628 auto RegIt = RegToPHIIdx.
find(
CP.getSrcReg());
3629 if (RegIt != RegToPHIIdx.
end()) {
3631 for (
unsigned InstID : RegIt->second) {
3632 auto PHIIt = PHIValToPos.
find(InstID);
3637 auto LII =
RHS.find(SI);
3638 if (LII ==
RHS.end() || LII->start > SI)
3653 if (
CP.getSrcIdx() != 0 ||
CP.getDstIdx() != 0)
3656 if (PHIIt->second.SubReg && PHIIt->second.SubReg !=
CP.getSrcIdx())
3660 PHIIt->second.Reg =
CP.getDstReg();
3664 if (
CP.getSrcIdx() != 0)
3665 PHIIt->second.SubReg =
CP.getSrcIdx();
3671 auto InstrNums = RegIt->second;
3672 RegToPHIIdx.
erase(RegIt);
3676 RegIt = RegToPHIIdx.
find(
CP.getDstReg());
3677 if (RegIt != RegToPHIIdx.
end())
3678 RegIt->second.insert(RegIt->second.end(), InstrNums.begin(),
3681 RegToPHIIdx.
insert({
CP.getDstReg(), InstrNums});
3685 LHS.join(RHS, LHSVals.getAssignments(), RHSVals.getAssignments(), NewVNInfo);
3690 MRI->clearKillFlags(
LHS.reg());
3691 MRI->clearKillFlags(
RHS.reg());
3693 if (!EndPoints.
empty()) {
3697 dbgs() <<
"\t\trestoring liveness to " << EndPoints.
size() <<
" points: ";
3698 for (
unsigned i = 0, n = EndPoints.
size(); i != n; ++i) {
3699 dbgs() << EndPoints[i];
3703 dbgs() <<
": " <<
LHS <<
'\n';
3712 return CP.isPhys() ? joinReservedPhysReg(CP) : joinVirtRegs(
CP);
3723 for (
auto *
X : ToInsert) {
3724 for (
const auto &
Op :
X->debug_operands()) {
3725 if (
Op.isReg() &&
Op.getReg().isVirtual())
3736 for (
auto &
MBB : MF) {
3739 for (
auto &
MI :
MBB) {
3740 if (
MI.isDebugValue()) {
3742 return MO.isReg() && MO.getReg().isVirtual();
3744 ToInsert.push_back(&
MI);
3745 }
else if (!
MI.isDebugOrPseudoInstr()) {
3747 CloseNewDVRange(CurrentSlot);
3756 for (
auto &Pair : DbgVRegToValues)
3760void RegisterCoalescer::checkMergingChangesDbgValues(
CoalescerPair &CP,
3764 JoinVals &RHSVals) {
3766 checkMergingChangesDbgValuesImpl(Reg, RHS, LHS, LHSVals);
3770 checkMergingChangesDbgValuesImpl(Reg, LHS, RHS, RHSVals);
3774 ScanForSrcReg(
CP.getSrcReg());
3775 ScanForDstReg(
CP.getDstReg());
3778void RegisterCoalescer::checkMergingChangesDbgValuesImpl(
Register Reg,
3781 JoinVals &RegVals) {
3783 auto VRegMapIt = DbgVRegToValues.
find(Reg);
3784 if (VRegMapIt == DbgVRegToValues.
end())
3787 auto &DbgValueSet = VRegMapIt->second;
3788 auto DbgValueSetIt = DbgValueSet.begin();
3789 auto SegmentIt = OtherLR.
begin();
3791 bool LastUndefResult =
false;
3796 auto ShouldUndef = [&RegVals, &
RegLR, &LastUndefResult,
3801 if (LastUndefIdx ==
Idx)
3802 return LastUndefResult;
3809 if (OtherIt ==
RegLR.end())
3818 auto Resolution = RegVals.getResolution(OtherIt->valno->id);
3819 LastUndefResult = Resolution != JoinVals::CR_Keep &&
3820 Resolution != JoinVals::CR_Erase;
3822 return LastUndefResult;
3828 while (DbgValueSetIt != DbgValueSet.end() && SegmentIt != OtherLR.
end()) {
3829 if (DbgValueSetIt->first < SegmentIt->end) {
3832 if (DbgValueSetIt->first >= SegmentIt->start) {
3833 bool HasReg = DbgValueSetIt->second->hasDebugOperandForReg(Reg);
3834 bool ShouldUndefReg = ShouldUndef(DbgValueSetIt->first);
3835 if (HasReg && ShouldUndefReg) {
3837 DbgValueSetIt->second->setDebugValueUndef();
3851struct MBBPriorityInfo {
3857 :
MBB(mbb),
Depth(depth), IsSplit(issplit) {}
3867 const MBBPriorityInfo *RHS) {
3869 if (
LHS->Depth !=
RHS->Depth)
3870 return LHS->Depth >
RHS->Depth ? -1 : 1;
3873 if (
LHS->IsSplit !=
RHS->IsSplit)
3874 return LHS->IsSplit ? -1 : 1;
3878 unsigned cl =
LHS->MBB->pred_size() +
LHS->MBB->succ_size();
3879 unsigned cr =
RHS->MBB->pred_size() +
RHS->MBB->succ_size();
3881 return cl > cr ? -1 : 1;
3884 return LHS->MBB->getNumber() <
RHS->MBB->getNumber() ? -1 : 1;
3889 if (!Copy->isCopy())
3892 if (Copy->getOperand(1).isUndef())
3895 Register SrcReg = Copy->getOperand(1).getReg();
3896 Register DstReg = Copy->getOperand(0).getReg();
3904void RegisterCoalescer::lateLiveIntervalUpdate() {
3910 if (!DeadDefs.
empty())
3911 eliminateDeadDefs();
3913 ToBeUpdated.clear();
3916bool RegisterCoalescer::
3918 bool Progress =
false;
3941 assert(Copy.isCopyLike());
3944 if (&
MI != &Copy &&
MI.isCopyLike())
3949bool RegisterCoalescer::applyTerminalRule(
const MachineInstr &Copy)
const {
3954 unsigned SrcSubReg = 0, DstSubReg = 0;
3955 if (!
isMoveInstr(*
TRI, &Copy, SrcReg, DstReg, SrcSubReg, DstSubReg))
3976 if (&
MI == &Copy || !
MI.isCopyLike() ||
MI.getParent() != OrigBB)
3979 unsigned OtherSrcSubReg = 0, OtherSubReg = 0;
3980 if (!
isMoveInstr(*
TRI, &Copy, OtherSrcReg, OtherReg, OtherSrcSubReg,
3983 if (OtherReg == SrcReg)
3984 OtherReg = OtherSrcReg;
4004 const unsigned PrevSize = WorkList.
size();
4005 if (JoinGlobalCopies) {
4013 if (!
MI.isCopyLike())
4015 bool ApplyTerminalRule = applyTerminalRule(
MI);
4017 if (ApplyTerminalRule)
4022 if (ApplyTerminalRule)
4029 LocalWorkList.
append(LocalTerminals.
begin(), LocalTerminals.
end());
4035 if (MII.isCopyLike()) {
4036 if (applyTerminalRule(MII))
4048 CurrList(WorkList.
begin() + PrevSize, WorkList.
end());
4049 if (copyCoalesceWorkList(CurrList))
4050 WorkList.
erase(std::remove(WorkList.
begin() + PrevSize, WorkList.
end(),
4051 nullptr), WorkList.
end());
4054void RegisterCoalescer::coalesceLocals() {
4055 copyCoalesceWorkList(LocalWorkList);
4056 for (
unsigned j = 0, je = LocalWorkList.
size(); j != je; ++j) {
4057 if (LocalWorkList[j])
4060 LocalWorkList.
clear();
4063void RegisterCoalescer::joinAllIntervals() {
4064 LLVM_DEBUG(
dbgs() <<
"********** JOINING INTERVALS ***********\n");
4065 assert(WorkList.
empty() && LocalWorkList.
empty() &&
"Old data still around.");
4067 std::vector<MBBPriorityInfo> MBBs;
4068 MBBs.reserve(MF->size());
4070 MBBs.push_back(MBBPriorityInfo(&
MBB,
Loops->getLoopDepth(&
MBB),
4076 unsigned CurrDepth = std::numeric_limits<unsigned>::max();
4077 for (MBBPriorityInfo &
MBB : MBBs) {
4079 if (JoinGlobalCopies &&
MBB.Depth < CurrDepth) {
4081 CurrDepth =
MBB.Depth;
4083 copyCoalesceInMBB(
MBB.MBB);
4085 lateLiveIntervalUpdate();
4090 while (copyCoalesceWorkList(WorkList))
4092 lateLiveIntervalUpdate();
4095void RegisterCoalescer::releaseMemory() {
4096 ErasedInstrs.
clear();
4099 InflateRegs.
clear();
4100 LargeLIVisitCounter.
clear();
4104 LLVM_DEBUG(
dbgs() <<
"********** REGISTER COALESCER **********\n"
4105 <<
"********** Function: " << fn.
getName() <<
'\n');
4117 dbgs() <<
"* Skipped as it exposes functions that returns twice.\n");
4126 LIS = &getAnalysis<LiveIntervals>();
4127 AA = &getAnalysis<AAResultsWrapperPass>().getAAResults();
4128 Loops = &getAnalysis<MachineLoopInfo>();
4137 for (
const auto &DebugPHI : MF->DebugPHIPositions) {
4140 unsigned SubReg = DebugPHI.second.SubReg;
4143 PHIValToPos.
insert(std::make_pair(DebugPHI.first,
P));
4144 RegToPHIIdx[
Reg].push_back(DebugPHI.first);
4153 MF->verify(
this,
"Before register coalescing");
4155 DbgVRegToValues.
clear();
4168 InflateRegs.
erase(std::unique(InflateRegs.
begin(), InflateRegs.
end()),
4172 for (
unsigned i = 0, e = InflateRegs.
size(); i != e; ++i) {
4174 if (
MRI->reg_nodbg_empty(Reg))
4176 if (
MRI->recomputeRegClass(Reg)) {
4178 <<
TRI->getRegClassName(
MRI->getRegClass(Reg)) <<
'\n');
4185 if (!
MRI->shouldTrackSubRegLiveness(Reg)) {
4193 assert((S.LaneMask & ~MaxMask).none());
4203 for (
auto &p : MF->DebugPHIPositions) {
4204 auto it = PHIValToPos.
find(
p.first);
4206 p.second.Reg = it->second.Reg;
4207 p.second.SubReg = it->second.SubReg;
4210 PHIValToPos.
clear();
4211 RegToPHIIdx.
clear();
4215 MF->verify(
this,
"After register coalescing");
unsigned const MachineRegisterInfo * MRI
MachineInstrBuilder & UseMI
MachineInstrBuilder MachineInstrBuilder & DefMI
MachineBasicBlock MachineBasicBlock::iterator DebugLoc DL
This file implements the BitVector class.
static GCRegistry::Add< CoreCLRGC > E("coreclr", "CoreCLR-compatible GC")
Returns the sub type a function will return at a given Idx Should correspond to the result type of an ExtractValue instruction executed with just that one unsigned Idx
This file defines the DenseSet and SmallDenseSet classes.
std::optional< std::vector< StOtherPiece > > Other
SmallVector< uint32_t, 0 > Writes
static GCMetadataPrinterRegistry::Add< ErlangGCPrinter > X("erlang", "erlang-compatible garbage collector")
const HexagonInstrInfo * TII
A common definition of LaneBitmask for use in TableGen and CodeGen.
unsigned const TargetRegisterInfo * TRI
#define INITIALIZE_PASS_DEPENDENCY(depName)
#define INITIALIZE_PASS_END(passName, arg, name, cfg, analysis)
#define INITIALIZE_PASS_BEGIN(passName, arg, name, cfg, analysis)
static cl::opt< cl::boolOrDefault > EnableGlobalCopies("join-globalcopies", cl::desc("Coalesce copies that span blocks (default=subtarget)"), cl::init(cl::BOU_UNSET), cl::Hidden)
Temporary flag to test global copy optimization.
static bool isLocalCopy(MachineInstr *Copy, const LiveIntervals *LIS)
static bool isSplitEdge(const MachineBasicBlock *MBB)
Return true if this block should be vacated by the coalescer to eliminate branches.
static int compareMBBPriority(const MBBPriorityInfo *LHS, const MBBPriorityInfo *RHS)
C-style comparator that sorts first based on the loop depth of the basic block (the unsigned),...
register Register Coalescer
static cl::opt< unsigned > LargeIntervalSizeThreshold("large-interval-size-threshold", cl::Hidden, cl::desc("If the valnos size of an interval is larger than the threshold, " "it is regarded as a large interval. "), cl::init(100))
static bool isDefInSubRange(LiveInterval &LI, SlotIndex Def)
Check if any of the subranges of LI contain a definition at Def.
static cl::opt< unsigned > LargeIntervalFreqThreshold("large-interval-freq-threshold", cl::Hidden, cl::desc("For a large interval, if it is coalesed with other live " "intervals many times more than the threshold, stop its " "coalescing to control the compile time. "), cl::init(256))
static std::pair< bool, bool > addSegmentsWithValNo(LiveRange &Dst, VNInfo *DstValNo, const LiveRange &Src, const VNInfo *SrcValNo)
Copy segments with value number SrcValNo from liverange Src to live range @Dst and use value number D...
static bool isLiveThrough(const LiveQueryResult Q)
static bool isTerminalReg(Register DstReg, const MachineInstr &Copy, const MachineRegisterInfo *MRI)
Check if DstReg is a terminal node.
static cl::opt< bool > VerifyCoalescing("verify-coalescing", cl::desc("Verify machine instrs before and after register coalescing"), cl::Hidden)
register Register static false bool isMoveInstr(const TargetRegisterInfo &tri, const MachineInstr *MI, Register &Src, Register &Dst, unsigned &SrcSub, unsigned &DstSub)
static cl::opt< bool > EnableJoinSplits("join-splitedges", cl::desc("Coalesce copies on split edges (default=subtarget)"), cl::Hidden)
Temporary flag to test critical edge unsplitting.
static cl::opt< bool > EnableJoining("join-liveintervals", cl::desc("Coalesce copies (default=true)"), cl::init(true), cl::Hidden)
static bool definesFullReg(const MachineInstr &MI, Register Reg)
Returns true if MI defines the full vreg Reg, as opposed to just defining a subregister.
static cl::opt< unsigned > LateRematUpdateThreshold("late-remat-update-threshold", cl::Hidden, cl::desc("During rematerialization for a copy, if the def instruction has " "many other copy uses to be rematerialized, delay the multiple " "separate live interval update work and do them all at once after " "all those rematerialization are done. It will save a lot of " "repeated work. "), cl::init(100))
static cl::opt< bool > UseTerminalRule("terminal-rule", cl::desc("Apply the terminal rule"), cl::init(false), cl::Hidden)
assert(ImpDefSCC.getReg()==AMDGPU::SCC &&ImpDefSCC.isDef())
This file defines the SmallPtrSet class.
This file defines the SmallVector class.
This file defines the 'Statistic' class, which is designed to be an easy way to expose various metric...
#define STATISTIC(VARNAME, DESC)
static DenseMap< Register, std::vector< std::pair< SlotIndex, MachineInstr * > > > buildVRegToDbgValueMap(MachineFunction &MF, const LiveIntervals *Liveness)
static void shrinkToUses(LiveInterval &LI, LiveIntervals &LIS)
A wrapper pass to provide the legacy pass manager access to a suitably prepared AAResults object.
Represent the analysis usage information of a pass.
AnalysisUsage & addPreservedID(const void *ID)
AnalysisUsage & addRequired()
AnalysisUsage & addPreserved()
Add the specified Pass class to the set of analyses preserved by this pass.
void setPreservesCFG()
This function should be called by the pass, iff they do not:
bool test(unsigned Idx) const
Allocate memory in an ever growing pool, as if by bump-pointer.
A helper class for register coalescers.
bool flip()
Swap SrcReg and DstReg.
bool isCoalescable(const MachineInstr *) const
Return true if MI is a copy instruction that will become an identity copy after coalescing.
bool setRegisters(const MachineInstr *)
Set registers to match the copy instruction MI.
This class represents an Operation in the Expression.
The location of a single variable, composed of an expression and 0 or more DbgValueLocEntries.
iterator find(const_arg_type_t< KeyT > Val)
bool erase(const KeyT &Val)
std::pair< iterator, bool > insert(const std::pair< KeyT, ValueT > &KV)
Implements a dense probed hash-table based set.
bool isAsCheapAsAMove(const MachineInstr &MI) const override
A live range for subregisters.
LiveInterval - This class represents the liveness of a register, or stack slot.
void removeEmptySubRanges()
Removes all subranges without any segments (subranges without segments are not considered valid and s...
bool hasSubRanges() const
Returns true if subregister liveness information is available.
SubRange * createSubRangeFrom(BumpPtrAllocator &Allocator, LaneBitmask LaneMask, const LiveRange &CopyFrom)
Like createSubRange() but the new range is filled with a copy of the liveness information in CopyFrom...
iterator_range< subrange_iterator > subranges()
void refineSubRanges(BumpPtrAllocator &Allocator, LaneBitmask LaneMask, std::function< void(LiveInterval::SubRange &)> Apply, const SlotIndexes &Indexes, const TargetRegisterInfo &TRI, unsigned ComposeSubRegIdx=0)
Refines the subranges to support LaneMask.
void computeSubRangeUndefs(SmallVectorImpl< SlotIndex > &Undefs, LaneBitmask LaneMask, const MachineRegisterInfo &MRI, const SlotIndexes &Indexes) const
For a given lane mask LaneMask, compute indexes at which the lane is marked undefined by subregister ...
SubRange * createSubRange(BumpPtrAllocator &Allocator, LaneBitmask LaneMask)
Creates a new empty subregister live range.
void clearSubRanges()
Removes all subregister liveness information.
bool hasInterval(Register Reg) const
SlotIndex getMBBStartIdx(const MachineBasicBlock *mbb) const
Return the first index in the given basic block.
MachineInstr * getInstructionFromIndex(SlotIndex index) const
Returns the instruction associated with the given index.
bool hasPHIKill(const LiveInterval &LI, const VNInfo *VNI) const
Returns true if VNI is killed by any PHI-def values in LI.
SlotIndex InsertMachineInstrInMaps(MachineInstr &MI)
bool checkRegMaskInterference(const LiveInterval &LI, BitVector &UsableRegs)
Test if LI is live across any register mask instructions, and compute a bit mask of physical register...
SlotIndexes * getSlotIndexes() const
SlotIndex getInstructionIndex(const MachineInstr &Instr) const
Returns the base index of the given instruction.
void RemoveMachineInstrFromMaps(MachineInstr &MI)
VNInfo::Allocator & getVNInfoAllocator()
SlotIndex getMBBEndIdx(const MachineBasicBlock *mbb) const
Return the last index in the given basic block.
LiveRange & getRegUnit(unsigned Unit)
Return the live range for register unit Unit.
LiveRange * getCachedRegUnit(unsigned Unit)
Return the live range for register unit Unit if it has already been computed, or nullptr if it hasn't...
LiveInterval & getInterval(Register Reg)
void pruneValue(LiveRange &LR, SlotIndex Kill, SmallVectorImpl< SlotIndex > *EndPoints)
If LR has a live value at Kill, prune its live range by removing any liveness reachable from Kill.
void removeInterval(Register Reg)
Interval removal.
MachineBasicBlock * intervalIsInOneMBB(const LiveInterval &LI) const
If LI is confined to a single basic block, return a pointer to that block.
void removeVRegDefAt(LiveInterval &LI, SlotIndex Pos)
Remove value number and related live segments of LI and its subranges that start at position Pos.
bool shrinkToUses(LiveInterval *li, SmallVectorImpl< MachineInstr * > *dead=nullptr)
After removing some uses of a register, shrink its live range to just the remaining uses.
void extendToIndices(LiveRange &LR, ArrayRef< SlotIndex > Indices, ArrayRef< SlotIndex > Undefs)
Extend the live range LR to reach all points in Indices.
void removePhysRegDefAt(MCRegister Reg, SlotIndex Pos)
Remove value numbers and related live segments starting at position Pos that are part of any liverang...
void splitSeparateComponents(LiveInterval &LI, SmallVectorImpl< LiveInterval * > &SplitLIs)
Split separate components in LiveInterval LI into separate intervals.
MachineBasicBlock * getMBBFromIndex(SlotIndex index) const
bool isLiveInToMBB(const LiveRange &LR, const MachineBasicBlock *mbb) const
SlotIndex ReplaceMachineInstrInMaps(MachineInstr &MI, MachineInstr &NewMI)
void print(raw_ostream &O, const Module *=nullptr) const override
Implement the dump method.
Result of a LiveRange query.
VNInfo * valueOutOrDead() const
Returns the value alive at the end of the instruction, if any.
VNInfo * valueIn() const
Return the value that is live-in to the instruction.
VNInfo * valueOut() const
Return the value leaving the instruction, if any.
VNInfo * valueDefined() const
Return the value defined by this instruction, if any.
SlotIndex endPoint() const
Return the end point of the last live range segment to interact with the instruction,...
bool isKill() const
Return true if the live-in value is killed by this instruction.
Callback methods for LiveRangeEdit owners.
virtual void LRE_WillEraseInstruction(MachineInstr *MI)
Called immediately before erasing a dead machine instruction.
void eliminateDeadDefs(SmallVectorImpl< MachineInstr * > &Dead, ArrayRef< Register > RegsBeingSpilled=std::nullopt)
eliminateDeadDefs - Try to delete machine instructions that are now dead (allDefsAreDead returns true...
SlotIndex rematerializeAt(MachineBasicBlock &MBB, MachineBasicBlock::iterator MI, Register DestReg, const Remat &RM, const TargetRegisterInfo &, bool Late=false, unsigned SubIdx=0, MachineInstr *ReplaceIndexMI=nullptr)
rematerializeAt - Rematerialize RM.ParentVNI into DestReg by inserting an instruction into MBB before...
bool checkRematerializable(VNInfo *VNI, const MachineInstr *DefMI)
checkRematerializable - Manually add VNI to the list of rematerializable values if DefMI may be remat...
bool canRematerializeAt(Remat &RM, VNInfo *OrigVNI, SlotIndex UseIdx, bool cheapAsAMove)
canRematerializeAt - Determine if ParentVNI can be rematerialized at UseIdx.
This class represents the liveness of a register, stack slot, etc.
VNInfo * getValNumInfo(unsigned ValNo)
getValNumInfo - Returns pointer to the specified val#.
iterator addSegment(Segment S)
Add the specified Segment to this range, merging segments as appropriate.
const Segment * getSegmentContaining(SlotIndex Idx) const
Return the segment that contains the specified index, or null if there is none.
void join(LiveRange &Other, const int *ValNoAssignments, const int *RHSValNoAssignments, SmallVectorImpl< VNInfo * > &NewVNInfo)
join - Join two live ranges (this, and other) together.
bool liveAt(SlotIndex index) const
VNInfo * createDeadDef(SlotIndex Def, VNInfo::Allocator &VNIAlloc)
createDeadDef - Make sure the range has a value defined at Def.
void removeValNo(VNInfo *ValNo)
removeValNo - Remove all the segments defined by the specified value#.
void verify() const
Walk the range and assert if any invariants fail to hold.
bool overlaps(const LiveRange &other) const
overlaps - Return true if the intersection of the two live ranges is not empty.
LiveQueryResult Query(SlotIndex Idx) const
Query Liveness at Idx.
VNInfo * getVNInfoBefore(SlotIndex Idx) const
getVNInfoBefore - Return the VNInfo that is live up to but not necessarilly including Idx,...
VNInfo * MergeValueNumberInto(VNInfo *V1, VNInfo *V2)
MergeValueNumberInto - This method is called when two value numbers are found to be equivalent.
unsigned getNumValNums() const
bool containsOneValue() const
iterator FindSegmentContaining(SlotIndex Idx)
Return an iterator to the segment that contains the specified index, or end() if there is none.
VNInfo * getVNInfoAt(SlotIndex Idx) const
getVNInfoAt - Return the VNInfo that is live at Idx, or NULL.
iterator find(SlotIndex Pos)
find - Return an iterator pointing to the first segment that ends after Pos, or end().
Describe properties that are true of each instruction in the target description file.
unsigned getNumOperands() const
Return the number of declared MachineOperands for this MachineInstruction.
unsigned getNumDefs() const
Return the number of MachineOperands that are register definitions.
MCRegUnitRootIterator enumerates the root registers of a register unit.
bool isValid() const
Check if the iterator is at the end of the list.
Wrapper class representing physical registers. Should be passed by value.
bool isInlineAsmBrIndirectTarget() const
Returns true if this is the indirect dest of an INLINEASM_BR.
unsigned pred_size() const
bool hasEHPadSuccessor() const
bool isEHPad() const
Returns true if the block is a landing pad.
instr_iterator insert(instr_iterator I, MachineInstr *M)
Insert MI into the instruction list before I, possibly inside a bundle.
iterator getFirstTerminator()
Returns an iterator to the first terminator instruction of this basic block.
unsigned succ_size() const
instr_iterator erase(instr_iterator I)
Remove an instruction from the instruction list and delete it.
iterator_range< pred_iterator > predecessors()
void splice(iterator Where, MachineBasicBlock *Other, iterator From)
Take an instruction from MBB 'Other' at the position From, and insert it into this MBB right before '...
StringRef getName() const
Return the name of the corresponding LLVM basic block, or an empty string.
MachineFunctionPass - This class adapts the FunctionPass interface to allow convenient creation of pa...
void getAnalysisUsage(AnalysisUsage &AU) const override
getAnalysisUsage - Subclasses that override getAnalysisUsage must call this.
virtual bool runOnMachineFunction(MachineFunction &MF)=0
runOnMachineFunction - This method must be overloaded to perform the desired machine code transformat...
const TargetSubtargetInfo & getSubtarget() const
getSubtarget - Return the subtarget for which this machine code is being compiled.
StringRef getName() const
getName - Return the name of the corresponding LLVM function.
bool exposesReturnsTwice() const
exposesReturnsTwice - Returns true if the function calls setjmp or any other similar functions with a...
MachineRegisterInfo & getRegInfo()
getRegInfo - Return information about the registers currently in use.
const MachineInstrBuilder & addReg(Register RegNo, unsigned flags=0, unsigned SubReg=0) const
Add a new virtual register operand.
Representation of each machine instruction.
int findRegisterUseOperandIdx(Register Reg, bool isKill=false, const TargetRegisterInfo *TRI=nullptr) const
Returns the operand index that is a use of the specific register or -1 if it is not found.
bool isSafeToMove(AAResults *AA, bool &SawStore) const
Return true if it is safe to move this instruction.
bool isImplicitDef() const
const MachineBasicBlock * getParent() const
bool isCopyLike() const
Return true if the instruction behaves like a copy.
int findRegisterDefOperandIdx(Register Reg, bool isDead=false, bool Overlap=false, const TargetRegisterInfo *TRI=nullptr) const
Returns the operand index that is a def of the specified register or -1 if it is not found.
std::pair< bool, bool > readsWritesVirtualRegister(Register Reg, SmallVectorImpl< unsigned > *Ops=nullptr) const
Return a pair of bools (reads, writes) indicating if this instruction reads or writes Reg.
bool isRegTiedToDefOperand(unsigned UseOpIdx, unsigned *DefOpIdx=nullptr) const
Return true if the use operand of the specified index is tied to a def operand.
bool isDebugInstr() const
unsigned getNumOperands() const
Retuns the total number of operands.
void addOperand(MachineFunction &MF, const MachineOperand &Op)
Add the specified operand to the instruction.
bool isRegTiedToUseOperand(unsigned DefOpIdx, unsigned *UseOpIdx=nullptr) const
Given the index of a register def operand, check if the register def is tied to a source operand,...
const MCInstrDesc & getDesc() const
Returns the target instruction descriptor of this MachineInstr.
bool isCommutable(QueryType Type=IgnoreBundle) const
Return true if this may be a 2- or 3-address instruction (of the form "X = op Y, Z,...
iterator_range< mop_iterator > operands()
void substituteRegister(Register FromReg, Register ToReg, unsigned SubIdx, const TargetRegisterInfo &RegInfo)
Replace all occurrences of FromReg with ToReg:SubIdx, properly composing subreg indices where necessa...
const DebugLoc & getDebugLoc() const
Returns the debug location id of this MachineInstr.
void eraseFromParent()
Unlink 'this' from the containing basic block and delete it.
void removeOperand(unsigned OpNo)
Erase an operand from an instruction, leaving it with one fewer operand than it started with.
const MachineOperand & getOperand(unsigned i) const
iterator_range< filtered_mop_iterator > all_defs()
Returns an iterator range over all operands that are (explicit or implicit) register defs.
void setDesc(const MCInstrDesc &TID)
Replace the instruction descriptor (thus opcode) of the current instruction with a new one.
void setDebugLoc(DebugLoc DL)
Replace current source information with new such.
bool allDefsAreDead() const
Return true if all the defs of this instruction are dead.
MachineOperand class - Representation of each machine instruction operand.
void setSubReg(unsigned subReg)
unsigned getSubReg() const
void substVirtReg(Register Reg, unsigned SubIdx, const TargetRegisterInfo &)
substVirtReg - Substitute the current register with the virtual subregister Reg:SubReg.
bool readsReg() const
readsReg - Returns true if this operand reads the previous value of its register.
bool isReg() const
isReg - Tests if this is a MO_Register operand.
void setIsDead(bool Val=true)
void setIsKill(bool Val=true)
MachineInstr * getParent()
getParent - Return the instruction that this operand belongs to.
void substPhysReg(MCRegister Reg, const TargetRegisterInfo &)
substPhysReg - Substitute the current register with the physical register Reg, taking any existing Su...
void setIsUndef(bool Val=true)
bool isEarlyClobber() const
Register getReg() const
getReg - Returns the register number.
static MachineOperand CreateReg(Register Reg, bool isDef, bool isImp=false, bool isKill=false, bool isDead=false, bool isUndef=false, bool isEarlyClobber=false, unsigned SubReg=0, bool isDebug=false, bool isInternalRead=false, bool isRenamable=false)
defusechain_iterator - This class provides iterator support for machine operands in the function that...
MachineRegisterInfo - Keep track of information for virtual and physical registers,...
A Module instance is used to store all the information related to an LLVM module.
MutableArrayRef - Represent a mutable reference to an array (0 or more elements consecutively in memo...
static PassRegistry * getPassRegistry()
getPassRegistry - Access the global registry object, which is automatically initialized at applicatio...
virtual void print(raw_ostream &OS, const Module *M) const
print - Print out the internal state of the pass.
virtual void releaseMemory()
releaseMemory() - This member can be implemented by a pass if it wants to be able to release its memo...
bool isProperSubClass(const TargetRegisterClass *RC) const
isProperSubClass - Returns true if RC has a legal super-class with more allocatable registers.
void runOnMachineFunction(const MachineFunction &MF)
runOnFunction - Prepare to answer questions about MF.
Wrapper class representing virtual and physical registers.
MCRegister asMCReg() const
Utility to check-convert this value to a MCRegister.
constexpr bool isVirtual() const
Return true if the specified register number is in the virtual register namespace.
constexpr bool isPhysical() const
Return true if the specified register number is in the physical register namespace.
SlotIndex - An opaque wrapper around machine indexes.
static bool isSameInstr(SlotIndex A, SlotIndex B)
isSameInstr - Return true if A and B refer to the same instruction.
bool isEarlyClobber() const
isEarlyClobber - Returns true if this is an early-clobber slot.
bool isValid() const
Returns true if this is a valid index.
SlotIndex getBaseIndex() const
Returns the base index for associated with this index.
SlotIndex getPrevSlot() const
Returns the previous slot in the index list.
SlotIndex getRegSlot(bool EC=false) const
Returns the register use/def slot in the current instruction for a normal or early-clobber def.
bool isDead() const
isDead - Returns true if this is a dead def kill slot.
MachineBasicBlock * getMBBFromIndex(SlotIndex index) const
Returns the basic block which the given index falls in.
SlotIndex getMBBEndIdx(unsigned Num) const
Returns the last index in the given basic block number.
SlotIndex getNextNonNullIndex(SlotIndex Index)
Returns the next non-null index, if one exists.
SlotIndex getInstructionIndex(const MachineInstr &MI, bool IgnoreBundle=false) const
Returns the base index for the given instruction.
SlotIndex getMBBStartIdx(unsigned Num) const
Returns the first index in the given basic block number.
SlotIndex getIndexBefore(const MachineInstr &MI) const
getIndexBefore - Returns the index of the last indexed instruction before MI, or the start index of i...
MachineInstr * getInstructionFromIndex(SlotIndex index) const
Returns the instruction for the given index, or null if the given index has no instruction associated...
A templated base class for SmallPtrSet which provides the typesafe interface that is common across al...
bool erase(PtrType Ptr)
erase - If the set contains the specified pointer, remove it and return true, otherwise return false.
size_type count(ConstPtrType Ptr) const
count - Return 1 if the specified pointer is in the set, 0 otherwise.
std::pair< iterator, bool > insert(PtrType Ptr)
Inserts Ptr if and only if there is no element in the container equal to Ptr.
SmallPtrSet - This class implements a set which is optimized for holding SmallSize or less elements.
This class consists of common code factored out of the SmallVector class to reduce code duplication b...
void reserve(size_type N)
iterator erase(const_iterator CI)
void append(ItTy in_start, ItTy in_end)
Add the specified range to the end of the SmallVector.
void push_back(const T &Elt)
pointer data()
Return a pointer to the vector's buffer, even if empty().
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small.
TargetInstrInfo - Interface to description of machine instruction set.
static const unsigned CommuteAnyOperandIndex