Line data Source code
1 : //===- InterferenceCache.cpp - Caching per-block interference -------------===//
2 : //
3 : // The LLVM Compiler Infrastructure
4 : //
5 : // This file is distributed under the University of Illinois Open Source
6 : // License. See LICENSE.TXT for details.
7 : //
8 : //===----------------------------------------------------------------------===//
9 : //
10 : // InterferenceCache remembers per-block interference in LiveIntervalUnions.
11 : //
12 : //===----------------------------------------------------------------------===//
13 :
14 : #include "InterferenceCache.h"
15 : #include "llvm/ADT/ArrayRef.h"
16 : #include "llvm/CodeGen/LiveInterval.h"
17 : #include "llvm/CodeGen/LiveIntervalUnion.h"
18 : #include "llvm/CodeGen/LiveIntervals.h"
19 : #include "llvm/CodeGen/MachineBasicBlock.h"
20 : #include "llvm/CodeGen/MachineFunction.h"
21 : #include "llvm/CodeGen/MachineOperand.h"
22 : #include "llvm/CodeGen/SlotIndexes.h"
23 : #include "llvm/CodeGen/TargetRegisterInfo.h"
24 : #include "llvm/MC/MCRegisterInfo.h"
25 : #include "llvm/Support/ErrorHandling.h"
26 : #include <cassert>
27 : #include <cstdint>
28 : #include <cstdlib>
29 : #include <tuple>
30 :
31 : using namespace llvm;
32 :
33 : #define DEBUG_TYPE "regalloc"
34 :
35 : // Static member used for null interference cursors.
36 : const InterferenceCache::BlockInterference
37 : InterferenceCache::Cursor::NoInterference;
38 :
39 : // Initializes PhysRegEntries (instead of a SmallVector, PhysRegEntries is a
40 : // buffer of size NumPhysRegs to speed up alloc/clear for targets with large
41 : // reg files). Calloced memory is used for good form, and quites tools like
42 : // Valgrind too, but zero initialized memory is not required by the algorithm:
43 : // this is because PhysRegEntries works like a SparseSet and its entries are
44 : // only valid when there is a corresponding CacheEntries assignment. There is
45 : // also support for when pass managers are reused for targets with different
46 : // numbers of PhysRegs: in this case PhysRegEntries is freed and reinitialized.
47 193768 : void InterferenceCache::reinitPhysRegEntries() {
48 193768 : if (PhysRegEntriesCount == TRI->getNumRegs()) return;
49 18783 : free(PhysRegEntries);
50 18783 : PhysRegEntriesCount = TRI->getNumRegs();
51 18783 : PhysRegEntries = static_cast<unsigned char*>(
52 18783 : safe_calloc(PhysRegEntriesCount, sizeof(unsigned char)));
53 : }
54 :
55 193768 : void InterferenceCache::init(MachineFunction *mf,
56 : LiveIntervalUnion *liuarray,
57 : SlotIndexes *indexes,
58 : LiveIntervals *lis,
59 : const TargetRegisterInfo *tri) {
60 193768 : MF = mf;
61 193768 : LIUArray = liuarray;
62 193768 : TRI = tri;
63 193768 : reinitPhysRegEntries();
64 6394312 : for (unsigned i = 0; i != CacheEntries; ++i)
65 : Entries[i].clear(mf, indexes, lis);
66 193768 : }
67 :
68 320084 : InterferenceCache::Entry *InterferenceCache::get(unsigned PhysReg) {
69 320084 : unsigned E = PhysRegEntries[PhysReg];
70 320084 : if (E < CacheEntries && Entries[E].getPhysReg() == PhysReg) {
71 248768 : if (!Entries[E].valid(LIUArray, TRI))
72 28237 : Entries[E].revalidate(LIUArray, TRI);
73 248768 : return &Entries[E];
74 : }
75 : // No valid entry exists, pick the next round-robin entry.
76 71316 : E = RoundRobin;
77 71316 : if (++RoundRobin == CacheEntries)
78 2043 : RoundRobin = 0;
79 5510 : for (unsigned i = 0; i != CacheEntries; ++i) {
80 : // Skip entries that are in use.
81 76826 : if (Entries[E].hasRefs()) {
82 5510 : if (++E == CacheEntries)
83 : E = 0;
84 : continue;
85 : }
86 71316 : Entries[E].reset(PhysReg, LIUArray, TRI, MF);
87 71316 : PhysRegEntries[PhysReg] = E;
88 71316 : return &Entries[E];
89 : }
90 : llvm_unreachable("Ran out of interference cache entries.");
91 : }
92 :
93 : /// revalidate - LIU contents have changed, update tags.
94 28237 : void InterferenceCache::Entry::revalidate(LiveIntervalUnion *LIUArray,
95 : const TargetRegisterInfo *TRI) {
96 : // Invalidate all block entries.
97 28237 : ++Tag;
98 : // Invalidate all iterators.
99 28237 : PrevPos = SlotIndex();
100 : unsigned i = 0;
101 94963 : for (MCRegUnitIterator Units(PhysReg, TRI); Units.isValid(); ++Units, ++i)
102 133452 : RegUnits[i].VirtTag = LIUArray[*Units].getTag();
103 28237 : }
104 :
105 71316 : void InterferenceCache::Entry::reset(unsigned physReg,
106 : LiveIntervalUnion *LIUArray,
107 : const TargetRegisterInfo *TRI,
108 : const MachineFunction *MF) {
109 : assert(!hasRefs() && "Cannot reset cache entry with references");
110 : // LIU's changed, invalidate cache.
111 71316 : ++Tag;
112 71316 : PhysReg = physReg;
113 142632 : Blocks.resize(MF->getNumBlockIDs());
114 :
115 : // Reset iterators.
116 71316 : PrevPos = SlotIndex();
117 71316 : RegUnits.clear();
118 189871 : for (MCRegUnitIterator Units(PhysReg, TRI); Units.isValid(); ++Units) {
119 355665 : RegUnits.push_back(LIUArray[*Units]);
120 237110 : RegUnits.back().Fixed = &LIS->getRegUnit(*Units);
121 : }
122 71316 : }
123 :
124 248768 : bool InterferenceCache::Entry::valid(LiveIntervalUnion *LIUArray,
125 : const TargetRegisterInfo *TRI) {
126 248768 : unsigned i = 0, e = RegUnits.size();
127 737507 : for (MCRegUnitIterator Units(PhysReg, TRI); Units.isValid(); ++Units, ++i) {
128 516976 : if (i == e)
129 : return false;
130 1033952 : if (LIUArray[*Units].changedSince(RegUnits[i].VirtTag))
131 : return false;
132 : }
133 220531 : return i == e;
134 : }
135 :
136 1067350 : void InterferenceCache::Entry::update(unsigned MBBNum) {
137 : SlotIndex Start, Stop;
138 1067350 : std::tie(Start, Stop) = Indexes->getMBBRange(MBBNum);
139 :
140 : // Use advanceTo only when possible.
141 1067350 : if (PrevPos != Start) {
142 921234 : if (!PrevPos.isValid() || Start < PrevPos) {
143 1192324 : for (unsigned i = 0, e = RegUnits.size(); i != e; ++i) {
144 790455 : RegUnitInfo &RUI = RegUnits[i];
145 790455 : RUI.VirtI.find(Start);
146 790455 : RUI.FixedI = RUI.Fixed->find(Start);
147 : }
148 : } else {
149 1592208 : for (unsigned i = 0, e = RegUnits.size(); i != e; ++i) {
150 1072843 : RegUnitInfo &RUI = RegUnits[i];
151 1072843 : RUI.VirtI.advanceTo(Start);
152 2145686 : if (RUI.FixedI != RUI.Fixed->end())
153 394320 : RUI.FixedI = RUI.Fixed->advanceTo(RUI.FixedI, Start);
154 : }
155 : }
156 921234 : PrevPos = Start;
157 : }
158 :
159 : MachineFunction::const_iterator MFI =
160 2134700 : MF->getBlockNumbered(MBBNum)->getIterator();
161 : BlockInterference *BI = &Blocks[MBBNum];
162 : ArrayRef<SlotIndex> RegMaskSlots;
163 : ArrayRef<const uint32_t*> RegMaskBits;
164 : while (true) {
165 2287012 : BI->Tag = Tag;
166 2287012 : BI->First = BI->Last = SlotIndex();
167 :
168 : // Check for first interference from virtregs.
169 7175197 : for (unsigned i = 0, e = RegUnits.size(); i != e; ++i) {
170 4888185 : LiveIntervalUnion::SegmentIter &I = RegUnits[i].VirtI;
171 : if (!I.valid())
172 : continue;
173 3049303 : SlotIndex StartI = I.start();
174 3049303 : if (StartI >= Stop)
175 : continue;
176 927719 : if (!BI->First.isValid() || StartI < BI->First)
177 364075 : BI->First = StartI;
178 : }
179 :
180 : // Same thing for fixed interference.
181 7175197 : for (unsigned i = 0, e = RegUnits.size(); i != e; ++i) {
182 4888185 : LiveInterval::const_iterator I = RegUnits[i].FixedI;
183 4888185 : LiveInterval::const_iterator E = RegUnits[i].Fixed->end();
184 4888185 : if (I == E)
185 : continue;
186 1197789 : SlotIndex StartI = I->start;
187 1197789 : if (StartI >= Stop)
188 : continue;
189 286627 : if (!BI->First.isValid() || StartI < BI->First)
190 66359 : BI->First = StartI;
191 : }
192 :
193 : // Also check for register mask interference.
194 2287012 : RegMaskSlots = LIS->getRegMaskSlotsInBlock(MBBNum);
195 : RegMaskBits = LIS->getRegMaskBitsInBlock(MBBNum);
196 2287012 : SlotIndex Limit = BI->First.isValid() ? BI->First : Stop;
197 225035 : for (unsigned i = 0, e = RegMaskSlots.size();
198 2512047 : i != e && RegMaskSlots[i] < Limit; ++i)
199 2230149 : if (MachineOperand::clobbersPhysReg(RegMaskBits[i], PhysReg)) {
200 : // Register mask i clobbers PhysReg before the LIU interference.
201 518348 : BI->First = RegMaskSlots[i];
202 518348 : break;
203 : }
204 :
205 2287012 : PrevPos = Stop;
206 2287012 : if (BI->First.isValid())
207 : break;
208 :
209 : // No interference in this block? Go ahead and precompute the next block.
210 2727980 : if (++MFI == MF->end())
211 : return;
212 1348303 : MBBNum = MFI->getNumber();
213 1348303 : BI = &Blocks[MBBNum];
214 1348303 : if (BI->Tag == Tag)
215 : return;
216 1219662 : std::tie(Start, Stop) = Indexes->getMBBRange(MBBNum);
217 1219662 : }
218 :
219 : // Check for last interference in block.
220 2793830 : for (unsigned i = 0, e = RegUnits.size(); i != e; ++i) {
221 1870808 : LiveIntervalUnion::SegmentIter &I = RegUnits[i].VirtI;
222 1326364 : if (!I.valid() || I.start() >= Stop)
223 : continue;
224 927719 : I.advanceTo(Stop);
225 869747 : bool Backup = !I.valid() || I.start() >= Stop;
226 : if (Backup)
227 : --I;
228 927719 : SlotIndex StopI = I.stop();
229 927719 : if (!BI->Last.isValid() || StopI > BI->Last)
230 365325 : BI->Last = StopI;
231 927719 : if (Backup)
232 : ++I;
233 : }
234 :
235 : // Fixed interference.
236 2793830 : for (unsigned i = 0, e = RegUnits.size(); i != e; ++i) {
237 1870808 : LiveInterval::iterator &I = RegUnits[i].FixedI;
238 1870808 : LiveRange *LR = RegUnits[i].Fixed;
239 3741616 : if (I == LR->end() || I->start >= Stop)
240 : continue;
241 286627 : I = LR->advanceTo(I, Stop);
242 286627 : bool Backup = I == LR->end() || I->start >= Stop;
243 : if (Backup)
244 286627 : --I;
245 286627 : SlotIndex StopI = I->end;
246 286627 : if (!BI->Last.isValid() || StopI > BI->Last)
247 76453 : BI->Last = StopI;
248 286627 : if (Backup)
249 286627 : ++I;
250 : }
251 :
252 : // Also check for register mask interference.
253 923022 : SlotIndex Limit = BI->Last.isValid() ? BI->Last : Start;
254 : for (unsigned i = RegMaskSlots.size();
255 940659 : i && RegMaskSlots[i-1].getDeadSlot() > Limit; --i)
256 1834599 : if (MachineOperand::clobbersPhysReg(RegMaskBits[i-1], PhysReg)) {
257 : // Register mask i-1 clobbers PhysReg after the LIU interference.
258 : // Model the regmask clobber as a dead def.
259 593896 : BI->Last = RegMaskSlots[i-1].getDeadSlot();
260 593896 : break;
261 : }
262 : }
|