Bug Summary

File: llvm/lib/CodeGen/InlineSpiller.cpp
Warning: line 313, column 63
The left operand of '==' is a garbage value

Annotated Source Code

Press '?' to see keyboard shortcuts

clang -cc1 -cc1 -triple x86_64-pc-linux-gnu -analyze -disable-free -clear-ast-before-backend -disable-llvm-verifier -discard-value-names -main-file-name InlineSpiller.cpp -analyzer-store=region -analyzer-opt-analyze-nested-blocks -analyzer-checker=core -analyzer-checker=apiModeling -analyzer-checker=unix -analyzer-checker=deadcode -analyzer-checker=cplusplus -analyzer-checker=security.insecureAPI.UncheckedReturn -analyzer-checker=security.insecureAPI.getpw -analyzer-checker=security.insecureAPI.gets -analyzer-checker=security.insecureAPI.mktemp -analyzer-checker=security.insecureAPI.mkstemp -analyzer-checker=security.insecureAPI.vfork -analyzer-checker=nullability.NullPassedToNonnull -analyzer-checker=nullability.NullReturnedFromNonnull -analyzer-output plist -w -setup-static-analyzer -analyzer-config-compatibility-mode=true -mrelocation-model pic -pic-level 2 -mframe-pointer=none -fmath-errno -ffp-contract=on -fno-rounding-math -mconstructor-aliases -funwind-tables=2 -target-cpu x86-64 -tune-cpu generic -debugger-tuning=gdb -ffunction-sections -fdata-sections -fcoverage-compilation-dir=/build/llvm-toolchain-snapshot-14~++20220118101002+ec47dba1c8a2/build-llvm -resource-dir /usr/lib/llvm-14/lib/clang/14.0.0 -D _DEBUG -D _GNU_SOURCE -D __STDC_CONSTANT_MACROS -D __STDC_FORMAT_MACROS -D __STDC_LIMIT_MACROS -I lib/CodeGen -I /build/llvm-toolchain-snapshot-14~++20220118101002+ec47dba1c8a2/llvm/lib/CodeGen -I include -I /build/llvm-toolchain-snapshot-14~++20220118101002+ec47dba1c8a2/llvm/include -D _FORTIFY_SOURCE=2 -D NDEBUG -U NDEBUG -internal-isystem /usr/lib/gcc/x86_64-linux-gnu/10/../../../../include/c++/10 -internal-isystem /usr/lib/gcc/x86_64-linux-gnu/10/../../../../include/x86_64-linux-gnu/c++/10 -internal-isystem /usr/lib/gcc/x86_64-linux-gnu/10/../../../../include/c++/10/backward -internal-isystem /usr/lib/llvm-14/lib/clang/14.0.0/include -internal-isystem /usr/local/include -internal-isystem 
/usr/lib/gcc/x86_64-linux-gnu/10/../../../../x86_64-linux-gnu/include -internal-externc-isystem /usr/include/x86_64-linux-gnu -internal-externc-isystem /include -internal-externc-isystem /usr/include -fmacro-prefix-map=/build/llvm-toolchain-snapshot-14~++20220118101002+ec47dba1c8a2/build-llvm=build-llvm -fmacro-prefix-map=/build/llvm-toolchain-snapshot-14~++20220118101002+ec47dba1c8a2/= -fcoverage-prefix-map=/build/llvm-toolchain-snapshot-14~++20220118101002+ec47dba1c8a2/build-llvm=build-llvm -fcoverage-prefix-map=/build/llvm-toolchain-snapshot-14~++20220118101002+ec47dba1c8a2/= -O3 -Wno-unused-command-line-argument -Wno-unused-parameter -Wwrite-strings -Wno-missing-field-initializers -Wno-long-long -Wno-maybe-uninitialized -Wno-class-memaccess -Wno-redundant-move -Wno-pessimizing-move -Wno-noexcept-type -Wno-comment -std=c++14 -fdeprecated-macro -fdebug-compilation-dir=/build/llvm-toolchain-snapshot-14~++20220118101002+ec47dba1c8a2/build-llvm -fdebug-prefix-map=/build/llvm-toolchain-snapshot-14~++20220118101002+ec47dba1c8a2/build-llvm=build-llvm -fdebug-prefix-map=/build/llvm-toolchain-snapshot-14~++20220118101002+ec47dba1c8a2/= -ferror-limit 19 -fvisibility-inlines-hidden -stack-protector 2 -fgnuc-version=4.2.1 -fcolor-diagnostics -vectorize-loops -vectorize-slp -analyzer-output=html -analyzer-config stable-report-filename=true -faddrsig -D__GCC_HAVE_DWARF2_CFI_ASM=1 -o /tmp/scan-build-2022-01-19-001817-16337-1 -x c++ /build/llvm-toolchain-snapshot-14~++20220118101002+ec47dba1c8a2/llvm/lib/CodeGen/InlineSpiller.cpp

/build/llvm-toolchain-snapshot-14~++20220118101002+ec47dba1c8a2/llvm/lib/CodeGen/InlineSpiller.cpp

1//===- InlineSpiller.cpp - Insert spills and restores inline --------------===//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7//===----------------------------------------------------------------------===//
8//
9// The inline spiller modifies the machine function directly instead of
10// inserting spills and restores in VirtRegMap.
11//
12//===----------------------------------------------------------------------===//
13
14#include "SplitKit.h"
15#include "llvm/ADT/ArrayRef.h"
16#include "llvm/ADT/DenseMap.h"
17#include "llvm/ADT/MapVector.h"
18#include "llvm/ADT/None.h"
19#include "llvm/ADT/STLExtras.h"
20#include "llvm/ADT/SetVector.h"
21#include "llvm/ADT/SmallPtrSet.h"
22#include "llvm/ADT/SmallVector.h"
23#include "llvm/ADT/Statistic.h"
24#include "llvm/Analysis/AliasAnalysis.h"
25#include "llvm/CodeGen/LiveInterval.h"
26#include "llvm/CodeGen/LiveIntervalCalc.h"
27#include "llvm/CodeGen/LiveIntervals.h"
28#include "llvm/CodeGen/LiveRangeEdit.h"
29#include "llvm/CodeGen/LiveStacks.h"
30#include "llvm/CodeGen/MachineBasicBlock.h"
31#include "llvm/CodeGen/MachineBlockFrequencyInfo.h"
32#include "llvm/CodeGen/MachineDominators.h"
33#include "llvm/CodeGen/MachineFunction.h"
34#include "llvm/CodeGen/MachineFunctionPass.h"
35#include "llvm/CodeGen/MachineInstr.h"
36#include "llvm/CodeGen/MachineInstrBuilder.h"
37#include "llvm/CodeGen/MachineInstrBundle.h"
38#include "llvm/CodeGen/MachineLoopInfo.h"
39#include "llvm/CodeGen/MachineOperand.h"
40#include "llvm/CodeGen/MachineRegisterInfo.h"
41#include "llvm/CodeGen/SlotIndexes.h"
42#include "llvm/CodeGen/Spiller.h"
43#include "llvm/CodeGen/StackMaps.h"
44#include "llvm/CodeGen/TargetInstrInfo.h"
45#include "llvm/CodeGen/TargetOpcodes.h"
46#include "llvm/CodeGen/TargetRegisterInfo.h"
47#include "llvm/CodeGen/TargetSubtargetInfo.h"
48#include "llvm/CodeGen/VirtRegMap.h"
49#include "llvm/Config/llvm-config.h"
50#include "llvm/Support/BlockFrequency.h"
51#include "llvm/Support/BranchProbability.h"
52#include "llvm/Support/CommandLine.h"
53#include "llvm/Support/Compiler.h"
54#include "llvm/Support/Debug.h"
55#include "llvm/Support/ErrorHandling.h"
56#include "llvm/Support/raw_ostream.h"
57#include <cassert>
58#include <iterator>
59#include <tuple>
60#include <utility>
61#include <vector>
62
63using namespace llvm;
64
65#define DEBUG_TYPE"regalloc" "regalloc"
66
67STATISTIC(NumSpilledRanges, "Number of spilled live ranges")static llvm::Statistic NumSpilledRanges = {"regalloc", "NumSpilledRanges"
, "Number of spilled live ranges"}
;
68STATISTIC(NumSnippets, "Number of spilled snippets")static llvm::Statistic NumSnippets = {"regalloc", "NumSnippets"
, "Number of spilled snippets"}
;
69STATISTIC(NumSpills, "Number of spills inserted")static llvm::Statistic NumSpills = {"regalloc", "NumSpills", "Number of spills inserted"
}
;
70STATISTIC(NumSpillsRemoved, "Number of spills removed")static llvm::Statistic NumSpillsRemoved = {"regalloc", "NumSpillsRemoved"
, "Number of spills removed"}
;
71STATISTIC(NumReloads, "Number of reloads inserted")static llvm::Statistic NumReloads = {"regalloc", "NumReloads"
, "Number of reloads inserted"}
;
72STATISTIC(NumReloadsRemoved, "Number of reloads removed")static llvm::Statistic NumReloadsRemoved = {"regalloc", "NumReloadsRemoved"
, "Number of reloads removed"}
;
73STATISTIC(NumFolded, "Number of folded stack accesses")static llvm::Statistic NumFolded = {"regalloc", "NumFolded", "Number of folded stack accesses"
}
;
74STATISTIC(NumFoldedLoads, "Number of folded loads")static llvm::Statistic NumFoldedLoads = {"regalloc", "NumFoldedLoads"
, "Number of folded loads"}
;
75STATISTIC(NumRemats, "Number of rematerialized defs for spilling")static llvm::Statistic NumRemats = {"regalloc", "NumRemats", "Number of rematerialized defs for spilling"
}
;
76
77static cl::opt<bool> DisableHoisting("disable-spill-hoist", cl::Hidden,
78 cl::desc("Disable inline spill hoisting"));
79static cl::opt<bool>
80RestrictStatepointRemat("restrict-statepoint-remat",
81 cl::init(false), cl::Hidden,
82 cl::desc("Restrict remat for statepoint operands"));
83
84namespace {
85
86class HoistSpillHelper : private LiveRangeEdit::Delegate {
87 MachineFunction &MF;
88 LiveIntervals &LIS;
89 LiveStacks &LSS;
90 AliasAnalysis *AA;
91 MachineDominatorTree &MDT;
92 MachineLoopInfo &Loops;
93 VirtRegMap &VRM;
94 MachineRegisterInfo &MRI;
95 const TargetInstrInfo &TII;
96 const TargetRegisterInfo &TRI;
97 const MachineBlockFrequencyInfo &MBFI;
98
99 InsertPointAnalysis IPA;
100
101 // Map from StackSlot to the LiveInterval of the original register.
102 // Note the LiveInterval of the original register may have been deleted
103 // after it is spilled. We keep a copy here to track the range where
104 // spills can be moved.
105 DenseMap<int, std::unique_ptr<LiveInterval>> StackSlotToOrigLI;
106
107 // Map from pair of (StackSlot and Original VNI) to a set of spills which
108 // have the same stackslot and have equal values defined by Original VNI.
109 // These spills are mergeable and are hoist candiates.
110 using MergeableSpillsMap =
111 MapVector<std::pair<int, VNInfo *>, SmallPtrSet<MachineInstr *, 16>>;
112 MergeableSpillsMap MergeableSpills;
113
114 /// This is the map from original register to a set containing all its
115 /// siblings. To hoist a spill to another BB, we need to find out a live
116 /// sibling there and use it as the source of the new spill.
117 DenseMap<Register, SmallSetVector<Register, 16>> Virt2SiblingsMap;
118
119 bool isSpillCandBB(LiveInterval &OrigLI, VNInfo &OrigVNI,
120 MachineBasicBlock &BB, Register &LiveReg);
121
122 void rmRedundantSpills(
123 SmallPtrSet<MachineInstr *, 16> &Spills,
124 SmallVectorImpl<MachineInstr *> &SpillsToRm,
125 DenseMap<MachineDomTreeNode *, MachineInstr *> &SpillBBToSpill);
126
127 void getVisitOrders(
128 MachineBasicBlock *Root, SmallPtrSet<MachineInstr *, 16> &Spills,
129 SmallVectorImpl<MachineDomTreeNode *> &Orders,
130 SmallVectorImpl<MachineInstr *> &SpillsToRm,
131 DenseMap<MachineDomTreeNode *, unsigned> &SpillsToKeep,
132 DenseMap<MachineDomTreeNode *, MachineInstr *> &SpillBBToSpill);
133
134 void runHoistSpills(LiveInterval &OrigLI, VNInfo &OrigVNI,
135 SmallPtrSet<MachineInstr *, 16> &Spills,
136 SmallVectorImpl<MachineInstr *> &SpillsToRm,
137 DenseMap<MachineBasicBlock *, unsigned> &SpillsToIns);
138
139public:
140 HoistSpillHelper(MachineFunctionPass &pass, MachineFunction &mf,
141 VirtRegMap &vrm)
142 : MF(mf), LIS(pass.getAnalysis<LiveIntervals>()),
143 LSS(pass.getAnalysis<LiveStacks>()),
144 AA(&pass.getAnalysis<AAResultsWrapperPass>().getAAResults()),
145 MDT(pass.getAnalysis<MachineDominatorTree>()),
146 Loops(pass.getAnalysis<MachineLoopInfo>()), VRM(vrm),
147 MRI(mf.getRegInfo()), TII(*mf.getSubtarget().getInstrInfo()),
148 TRI(*mf.getSubtarget().getRegisterInfo()),
149 MBFI(pass.getAnalysis<MachineBlockFrequencyInfo>()),
150 IPA(LIS, mf.getNumBlockIDs()) {}
151
152 void addToMergeableSpills(MachineInstr &Spill, int StackSlot,
153 unsigned Original);
154 bool rmFromMergeableSpills(MachineInstr &Spill, int StackSlot);
155 void hoistAllSpills();
156 void LRE_DidCloneVirtReg(Register, Register) override;
157};
158
159class InlineSpiller : public Spiller {
160 MachineFunction &MF;
161 LiveIntervals &LIS;
162 LiveStacks &LSS;
163 AliasAnalysis *AA;
164 MachineDominatorTree &MDT;
165 MachineLoopInfo &Loops;
166 VirtRegMap &VRM;
167 MachineRegisterInfo &MRI;
168 const TargetInstrInfo &TII;
169 const TargetRegisterInfo &TRI;
170 const MachineBlockFrequencyInfo &MBFI;
171
172 // Variables that are valid during spill(), but used by multiple methods.
173 LiveRangeEdit *Edit;
174 LiveInterval *StackInt;
175 int StackSlot;
176 Register Original;
177
178 // All registers to spill to StackSlot, including the main register.
179 SmallVector<Register, 8> RegsToSpill;
180
181 // All COPY instructions to/from snippets.
182 // They are ignored since both operands refer to the same stack slot.
183 SmallPtrSet<MachineInstr*, 8> SnippetCopies;
184
185 // Values that failed to remat at some point.
186 SmallPtrSet<VNInfo*, 8> UsedValues;
187
188 // Dead defs generated during spilling.
189 SmallVector<MachineInstr*, 8> DeadDefs;
190
191 // Object records spills information and does the hoisting.
192 HoistSpillHelper HSpiller;
193
194 // Live range weight calculator.
195 VirtRegAuxInfo &VRAI;
196
197 ~InlineSpiller() override = default;
198
199public:
200 InlineSpiller(MachineFunctionPass &Pass, MachineFunction &MF, VirtRegMap &VRM,
201 VirtRegAuxInfo &VRAI)
202 : MF(MF), LIS(Pass.getAnalysis<LiveIntervals>()),
203 LSS(Pass.getAnalysis<LiveStacks>()),
204 AA(&Pass.getAnalysis<AAResultsWrapperPass>().getAAResults()),
205 MDT(Pass.getAnalysis<MachineDominatorTree>()),
206 Loops(Pass.getAnalysis<MachineLoopInfo>()), VRM(VRM),
207 MRI(MF.getRegInfo()), TII(*MF.getSubtarget().getInstrInfo()),
208 TRI(*MF.getSubtarget().getRegisterInfo()),
209 MBFI(Pass.getAnalysis<MachineBlockFrequencyInfo>()),
210 HSpiller(Pass, MF, VRM), VRAI(VRAI) {}
211
212 void spill(LiveRangeEdit &) override;
213 void postOptimization() override;
214
215private:
216 bool isSnippet(const LiveInterval &SnipLI);
217 void collectRegsToSpill();
218
219 bool isRegToSpill(Register Reg) { return is_contained(RegsToSpill, Reg); }
220
221 bool isSibling(Register Reg);
222 bool hoistSpillInsideBB(LiveInterval &SpillLI, MachineInstr &CopyMI);
223 void eliminateRedundantSpills(LiveInterval &LI, VNInfo *VNI);
224
225 void markValueUsed(LiveInterval*, VNInfo*);
226 bool canGuaranteeAssignmentAfterRemat(Register VReg, MachineInstr &MI);
227 bool reMaterializeFor(LiveInterval &, MachineInstr &MI);
228 void reMaterializeAll();
229
230 bool coalesceStackAccess(MachineInstr *MI, Register Reg);
231 bool foldMemoryOperand(ArrayRef<std::pair<MachineInstr *, unsigned>>,
232 MachineInstr *LoadMI = nullptr);
233 void insertReload(Register VReg, SlotIndex, MachineBasicBlock::iterator MI);
234 void insertSpill(Register VReg, bool isKill, MachineBasicBlock::iterator MI);
235
236 void spillAroundUses(Register Reg);
237 void spillAll();
238};
239
240} // end anonymous namespace
241
242Spiller::~Spiller() = default;
243
244void Spiller::anchor() {}
245
246Spiller *llvm::createInlineSpiller(MachineFunctionPass &Pass,
247 MachineFunction &MF, VirtRegMap &VRM,
248 VirtRegAuxInfo &VRAI) {
249 return new InlineSpiller(Pass, MF, VRM, VRAI);
250}
251
252//===----------------------------------------------------------------------===//
253// Snippets
254//===----------------------------------------------------------------------===//
255
256// When spilling a virtual register, we also spill any snippets it is connected
257// to. The snippets are small live ranges that only have a single real use,
258// leftovers from live range splitting. Spilling them enables memory operand
259// folding or tightens the live range around the single use.
260//
261// This minimizes register pressure and maximizes the store-to-load distance for
262// spill slots which can be important in tight loops.
263
264/// isFullCopyOf - If MI is a COPY to or from Reg, return the other register,
265/// otherwise return 0.
266static Register isFullCopyOf(const MachineInstr &MI, Register Reg) {
267 if (!MI.isFullCopy())
6
Calling 'MachineInstr::isFullCopy'
8
Returning from 'MachineInstr::isFullCopy'
9
Taking true branch
268 return Register();
269 if (MI.getOperand(0).getReg() == Reg)
270 return MI.getOperand(1).getReg();
271 if (MI.getOperand(1).getReg() == Reg)
272 return MI.getOperand(0).getReg();
273 return Register();
274}
275
276static void getVDefInterval(const MachineInstr &MI, LiveIntervals &LIS) {
277 for (const MachineOperand &MO : MI.operands())
278 if (MO.isReg() && MO.isDef() && Register::isVirtualRegister(MO.getReg()))
279 LIS.getInterval(MO.getReg());
280}
281
282/// isSnippet - Identify if a live interval is a snippet that should be spilled.
283/// It is assumed that SnipLI is a virtual register with the same original as
284/// Edit->getReg().
285bool InlineSpiller::isSnippet(const LiveInterval &SnipLI) {
286 Register Reg = Edit->getReg();
287
288 // A snippet is a tiny live range with only a single instruction using it
289 // besides copies to/from Reg or spills/fills. We accept:
290 //
291 // %snip = COPY %Reg / FILL fi#
292 // %snip = USE %snip
293 // %Reg = COPY %snip / SPILL %snip, fi#
294 //
295 if (SnipLI.getNumValNums() > 2 || !LIS.intervalIsInOneMBB(SnipLI))
1
Assuming the condition is false
2
Assuming the condition is false
3
Taking false branch
296 return false;
297
298 MachineInstr *UseMI = nullptr;
299
300 // Check that all uses satisfy our criteria.
301 for (MachineRegisterInfo::reg_instr_nodbg_iterator
4
Loop condition is true. Entering loop body
302 RI = MRI.reg_instr_nodbg_begin(SnipLI.reg()),
303 E = MRI.reg_instr_nodbg_end();
304 RI != E;) {
305 MachineInstr &MI = *RI++;
306
307 // Allow copies to/from Reg.
308 if (isFullCopyOf(MI, Reg))
5
Calling 'isFullCopyOf'
10
Returning from 'isFullCopyOf'
11
Calling 'Register::operator unsigned int'
13
Returning from 'Register::operator unsigned int'
14
Taking false branch
309 continue;
310
311 // Allow stack slot loads.
312 int FI;
15
'FI' declared without an initial value
313 if (SnipLI.reg() == TII.isLoadFromStackSlot(MI, FI) && FI == StackSlot)
16
Calling 'TargetInstrInfo::isLoadFromStackSlot'
18
Returning from 'TargetInstrInfo::isLoadFromStackSlot'
19
Calling 'Register::operator=='
22
Returning from 'Register::operator=='
23
The left operand of '==' is a garbage value
314 continue;
315
316 // Allow stack slot stores.
317 if (SnipLI.reg() == TII.isStoreToStackSlot(MI, FI) && FI == StackSlot)
318 continue;
319
320 // Allow a single additional instruction.
321 if (UseMI && &MI != UseMI)
322 return false;
323 UseMI = &MI;
324 }
325 return true;
326}
327
328/// collectRegsToSpill - Collect live range snippets that only have a single
329/// real use.
330void InlineSpiller::collectRegsToSpill() {
331 Register Reg = Edit->getReg();
332
333 // Main register always spills.
334 RegsToSpill.assign(1, Reg);
335 SnippetCopies.clear();
336
337 // Snippets all have the same original, so there can't be any for an original
338 // register.
339 if (Original == Reg)
340 return;
341
342 for (MachineInstr &MI :
343 llvm::make_early_inc_range(MRI.reg_instructions(Reg))) {
344 Register SnipReg = isFullCopyOf(MI, Reg);
345 if (!isSibling(SnipReg))
346 continue;
347 LiveInterval &SnipLI = LIS.getInterval(SnipReg);
348 if (!isSnippet(SnipLI))
349 continue;
350 SnippetCopies.insert(&MI);
351 if (isRegToSpill(SnipReg))
352 continue;
353 RegsToSpill.push_back(SnipReg);
354 LLVM_DEBUG(dbgs() << "\talso spill snippet " << SnipLI << '\n')do { if (::llvm::DebugFlag && ::llvm::isCurrentDebugType
("regalloc")) { dbgs() << "\talso spill snippet " <<
SnipLI << '\n'; } } while (false)
;
355 ++NumSnippets;
356 }
357}
358
359bool InlineSpiller::isSibling(Register Reg) {
360 return Reg.isVirtual() && VRM.getOriginal(Reg) == Original;
361}
362
363/// It is beneficial to spill to earlier place in the same BB in case
364/// as follows:
365/// There is an alternative def earlier in the same MBB.
366/// Hoist the spill as far as possible in SpillMBB. This can ease
367/// register pressure:
368///
369/// x = def
370/// y = use x
371/// s = copy x
372///
373/// Hoisting the spill of s to immediately after the def removes the
374/// interference between x and y:
375///
376/// x = def
377/// spill x
378/// y = use killed x
379///
380/// This hoist only helps when the copy kills its source.
381///
382bool InlineSpiller::hoistSpillInsideBB(LiveInterval &SpillLI,
383 MachineInstr &CopyMI) {
384 SlotIndex Idx = LIS.getInstructionIndex(CopyMI);
385#ifndef NDEBUG
386 VNInfo *VNI = SpillLI.getVNInfoAt(Idx.getRegSlot());
387 assert(VNI && VNI->def == Idx.getRegSlot() && "Not defined by copy")(static_cast <bool> (VNI && VNI->def == Idx.
getRegSlot() && "Not defined by copy") ? void (0) : __assert_fail
("VNI && VNI->def == Idx.getRegSlot() && \"Not defined by copy\""
, "llvm/lib/CodeGen/InlineSpiller.cpp", 387, __extension__ __PRETTY_FUNCTION__
))
;
388#endif
389
390 Register SrcReg = CopyMI.getOperand(1).getReg();
391 LiveInterval &SrcLI = LIS.getInterval(SrcReg);
392 VNInfo *SrcVNI = SrcLI.getVNInfoAt(Idx);
393 LiveQueryResult SrcQ = SrcLI.Query(Idx);
394 MachineBasicBlock *DefMBB = LIS.getMBBFromIndex(SrcVNI->def);
395 if (DefMBB != CopyMI.getParent() || !SrcQ.isKill())
396 return false;
397
398 // Conservatively extend the stack slot range to the range of the original
399 // value. We may be able to do better with stack slot coloring by being more
400 // careful here.
401 assert(StackInt && "No stack slot assigned yet.")(static_cast <bool> (StackInt && "No stack slot assigned yet."
) ? void (0) : __assert_fail ("StackInt && \"No stack slot assigned yet.\""
, "llvm/lib/CodeGen/InlineSpiller.cpp", 401, __extension__ __PRETTY_FUNCTION__
))
;
402 LiveInterval &OrigLI = LIS.getInterval(Original);
403 VNInfo *OrigVNI = OrigLI.getVNInfoAt(Idx);
404 StackInt->MergeValueInAsValue(OrigLI, OrigVNI, StackInt->getValNumInfo(0));
405 LLVM_DEBUG(dbgs() << "\tmerged orig valno " << OrigVNI->id << ": "do { if (::llvm::DebugFlag && ::llvm::isCurrentDebugType
("regalloc")) { dbgs() << "\tmerged orig valno " <<
OrigVNI->id << ": " << *StackInt << '\n'
; } } while (false)
406 << *StackInt << '\n')do { if (::llvm::DebugFlag && ::llvm::isCurrentDebugType
("regalloc")) { dbgs() << "\tmerged orig valno " <<
OrigVNI->id << ": " << *StackInt << '\n'
; } } while (false)
;
407
408 // We are going to spill SrcVNI immediately after its def, so clear out
409 // any later spills of the same value.
410 eliminateRedundantSpills(SrcLI, SrcVNI);
411
412 MachineBasicBlock *MBB = LIS.getMBBFromIndex(SrcVNI->def);
413 MachineBasicBlock::iterator MII;
414 if (SrcVNI->isPHIDef())
415 MII = MBB->SkipPHIsLabelsAndDebug(MBB->begin());
416 else {
417 MachineInstr *DefMI = LIS.getInstructionFromIndex(SrcVNI->def);
418 assert(DefMI && "Defining instruction disappeared")(static_cast <bool> (DefMI && "Defining instruction disappeared"
) ? void (0) : __assert_fail ("DefMI && \"Defining instruction disappeared\""
, "llvm/lib/CodeGen/InlineSpiller.cpp", 418, __extension__ __PRETTY_FUNCTION__
))
;
419 MII = DefMI;
420 ++MII;
421 }
422 MachineInstrSpan MIS(MII, MBB);
423 // Insert spill without kill flag immediately after def.
424 TII.storeRegToStackSlot(*MBB, MII, SrcReg, false, StackSlot,
425 MRI.getRegClass(SrcReg), &TRI);
426 LIS.InsertMachineInstrRangeInMaps(MIS.begin(), MII);
427 for (const MachineInstr &MI : make_range(MIS.begin(), MII))
428 getVDefInterval(MI, LIS);
429 --MII; // Point to store instruction.
430 LLVM_DEBUG(dbgs() << "\thoisted: " << SrcVNI->def << '\t' << *MII)do { if (::llvm::DebugFlag && ::llvm::isCurrentDebugType
("regalloc")) { dbgs() << "\thoisted: " << SrcVNI
->def << '\t' << *MII; } } while (false)
;
431
432 // If there is only 1 store instruction is required for spill, add it
433 // to mergeable list. In X86 AMX, 2 intructions are required to store.
434 // We disable the merge for this case.
435 if (MIS.begin() == MII)
436 HSpiller.addToMergeableSpills(*MII, StackSlot, Original);
437 ++NumSpills;
438 return true;
439}
440
441/// eliminateRedundantSpills - SLI:VNI is known to be on the stack. Remove any
442/// redundant spills of this value in SLI.reg and sibling copies.
443void InlineSpiller::eliminateRedundantSpills(LiveInterval &SLI, VNInfo *VNI) {
444 assert(VNI && "Missing value")(static_cast <bool> (VNI && "Missing value") ? void
(0) : __assert_fail ("VNI && \"Missing value\"", "llvm/lib/CodeGen/InlineSpiller.cpp"
, 444, __extension__ __PRETTY_FUNCTION__))
;
445 SmallVector<std::pair<LiveInterval*, VNInfo*>, 8> WorkList;
446 WorkList.push_back(std::make_pair(&SLI, VNI));
447 assert(StackInt && "No stack slot assigned yet.")(static_cast <bool> (StackInt && "No stack slot assigned yet."
) ? void (0) : __assert_fail ("StackInt && \"No stack slot assigned yet.\""
, "llvm/lib/CodeGen/InlineSpiller.cpp", 447, __extension__ __PRETTY_FUNCTION__
))
;
448
449 do {
450 LiveInterval *LI;
451 std::tie(LI, VNI) = WorkList.pop_back_val();
452 Register Reg = LI->reg();
453 LLVM_DEBUG(dbgs() << "Checking redundant spills for " << VNI->id << '@'do { if (::llvm::DebugFlag && ::llvm::isCurrentDebugType
("regalloc")) { dbgs() << "Checking redundant spills for "
<< VNI->id << '@' << VNI->def <<
" in " << *LI << '\n'; } } while (false)
454 << VNI->def << " in " << *LI << '\n')do { if (::llvm::DebugFlag && ::llvm::isCurrentDebugType
("regalloc")) { dbgs() << "Checking redundant spills for "
<< VNI->id << '@' << VNI->def <<
" in " << *LI << '\n'; } } while (false)
;
455
456 // Regs to spill are taken care of.
457 if (isRegToSpill(Reg))
458 continue;
459
460 // Add all of VNI's live range to StackInt.
461 StackInt->MergeValueInAsValue(*LI, VNI, StackInt->getValNumInfo(0));
462 LLVM_DEBUG(dbgs() << "Merged to stack int: " << *StackInt << '\n')do { if (::llvm::DebugFlag && ::llvm::isCurrentDebugType
("regalloc")) { dbgs() << "Merged to stack int: " <<
*StackInt << '\n'; } } while (false)
;
463
464 // Find all spills and copies of VNI.
465 for (MachineInstr &MI :
466 llvm::make_early_inc_range(MRI.use_nodbg_instructions(Reg))) {
467 if (!MI.isCopy() && !MI.mayStore())
468 continue;
469 SlotIndex Idx = LIS.getInstructionIndex(MI);
470 if (LI->getVNInfoAt(Idx) != VNI)
471 continue;
472
473 // Follow sibling copies down the dominator tree.
474 if (Register DstReg = isFullCopyOf(MI, Reg)) {
475 if (isSibling(DstReg)) {
476 LiveInterval &DstLI = LIS.getInterval(DstReg);
477 VNInfo *DstVNI = DstLI.getVNInfoAt(Idx.getRegSlot());
478 assert(DstVNI && "Missing defined value")(static_cast <bool> (DstVNI && "Missing defined value"
) ? void (0) : __assert_fail ("DstVNI && \"Missing defined value\""
, "llvm/lib/CodeGen/InlineSpiller.cpp", 478, __extension__ __PRETTY_FUNCTION__
))
;
479 assert(DstVNI->def == Idx.getRegSlot() && "Wrong copy def slot")(static_cast <bool> (DstVNI->def == Idx.getRegSlot()
&& "Wrong copy def slot") ? void (0) : __assert_fail
("DstVNI->def == Idx.getRegSlot() && \"Wrong copy def slot\""
, "llvm/lib/CodeGen/InlineSpiller.cpp", 479, __extension__ __PRETTY_FUNCTION__
))
;
480 WorkList.push_back(std::make_pair(&DstLI, DstVNI));
481 }
482 continue;
483 }
484
485 // Erase spills.
486 int FI;
487 if (Reg == TII.isStoreToStackSlot(MI, FI) && FI == StackSlot) {
488 LLVM_DEBUG(dbgs() << "Redundant spill " << Idx << '\t' << MI)do { if (::llvm::DebugFlag && ::llvm::isCurrentDebugType
("regalloc")) { dbgs() << "Redundant spill " << Idx
<< '\t' << MI; } } while (false)
;
489 // eliminateDeadDefs won't normally remove stores, so switch opcode.
490 MI.setDesc(TII.get(TargetOpcode::KILL));
491 DeadDefs.push_back(&MI);
492 ++NumSpillsRemoved;
493 if (HSpiller.rmFromMergeableSpills(MI, StackSlot))
494 --NumSpills;
495 }
496 }
497 } while (!WorkList.empty());
498}
499
500//===----------------------------------------------------------------------===//
501// Rematerialization
502//===----------------------------------------------------------------------===//
503
504/// markValueUsed - Remember that VNI failed to rematerialize, so its defining
505/// instruction cannot be eliminated. See through snippet copies
506void InlineSpiller::markValueUsed(LiveInterval *LI, VNInfo *VNI) {
507 SmallVector<std::pair<LiveInterval*, VNInfo*>, 8> WorkList;
508 WorkList.push_back(std::make_pair(LI, VNI));
509 do {
510 std::tie(LI, VNI) = WorkList.pop_back_val();
511 if (!UsedValues.insert(VNI).second)
512 continue;
513
514 if (VNI->isPHIDef()) {
515 MachineBasicBlock *MBB = LIS.getMBBFromIndex(VNI->def);
516 for (MachineBasicBlock *P : MBB->predecessors()) {
517 VNInfo *PVNI = LI->getVNInfoBefore(LIS.getMBBEndIdx(P));
518 if (PVNI)
519 WorkList.push_back(std::make_pair(LI, PVNI));
520 }
521 continue;
522 }
523
524 // Follow snippet copies.
525 MachineInstr *MI = LIS.getInstructionFromIndex(VNI->def);
526 if (!SnippetCopies.count(MI))
527 continue;
528 LiveInterval &SnipLI = LIS.getInterval(MI->getOperand(1).getReg());
529 assert(isRegToSpill(SnipLI.reg()) && "Unexpected register in copy")(static_cast <bool> (isRegToSpill(SnipLI.reg()) &&
"Unexpected register in copy") ? void (0) : __assert_fail ("isRegToSpill(SnipLI.reg()) && \"Unexpected register in copy\""
, "llvm/lib/CodeGen/InlineSpiller.cpp", 529, __extension__ __PRETTY_FUNCTION__
))
;
530 VNInfo *SnipVNI = SnipLI.getVNInfoAt(VNI->def.getRegSlot(true));
531 assert(SnipVNI && "Snippet undefined before copy")(static_cast <bool> (SnipVNI && "Snippet undefined before copy"
) ? void (0) : __assert_fail ("SnipVNI && \"Snippet undefined before copy\""
, "llvm/lib/CodeGen/InlineSpiller.cpp", 531, __extension__ __PRETTY_FUNCTION__
))
;
532 WorkList.push_back(std::make_pair(&SnipLI, SnipVNI));
533 } while (!WorkList.empty());
534}
535
536bool InlineSpiller::canGuaranteeAssignmentAfterRemat(Register VReg,
537 MachineInstr &MI) {
538 if (!RestrictStatepointRemat)
539 return true;
540 // Here's a quick explanation of the problem we're trying to handle here:
541 // * There are some pseudo instructions with more vreg uses than there are
542 // physical registers on the machine.
543 // * This is normally handled by spilling the vreg, and folding the reload
544 // into the user instruction. (Thus decreasing the number of used vregs
545 // until the remainder can be assigned to physregs.)
546 // * However, since we may try to spill vregs in any order, we can end up
547 // trying to spill each operand to the instruction, and then rematting it
548 // instead. When that happens, the new live intervals (for the remats) are
549 // expected to be trivially assignable (i.e. RS_Done). However, since we
550 // may have more remats than physregs, we're guaranteed to fail to assign
551 // one.
552 // At the moment, we only handle this for STATEPOINTs since they're the only
553 // pseudo op where we've seen this. If we start seeing other instructions
554 // with the same problem, we need to revisit this.
555 if (MI.getOpcode() != TargetOpcode::STATEPOINT)
556 return true;
557 // For STATEPOINTs we allow re-materialization for fixed arguments only hoping
558 // that number of physical registers is enough to cover all fixed arguments.
559 // If it is not true we need to revisit it.
560 for (unsigned Idx = StatepointOpers(&MI).getVarIdx(),
561 EndIdx = MI.getNumOperands();
562 Idx < EndIdx; ++Idx) {
563 MachineOperand &MO = MI.getOperand(Idx);
564 if (MO.isReg() && MO.getReg() == VReg)
565 return false;
566 }
567 return true;
568}
569
570/// reMaterializeFor - Attempt to rematerialize before MI instead of reloading.
571bool InlineSpiller::reMaterializeFor(LiveInterval &VirtReg, MachineInstr &MI) {
572 // Analyze instruction
573 SmallVector<std::pair<MachineInstr *, unsigned>, 8> Ops;
574 VirtRegInfo RI = AnalyzeVirtRegInBundle(MI, VirtReg.reg(), &Ops);
575
576 if (!RI.Reads)
577 return false;
578
579 SlotIndex UseIdx = LIS.getInstructionIndex(MI).getRegSlot(true);
580 VNInfo *ParentVNI = VirtReg.getVNInfoAt(UseIdx.getBaseIndex());
581
582 if (!ParentVNI) {
583 LLVM_DEBUG(dbgs() << "\tadding <undef> flags: ")do { if (::llvm::DebugFlag && ::llvm::isCurrentDebugType
("regalloc")) { dbgs() << "\tadding <undef> flags: "
; } } while (false)
;
584 for (MachineOperand &MO : MI.operands())
585 if (MO.isReg() && MO.isUse() && MO.getReg() == VirtReg.reg())
586 MO.setIsUndef();
587 LLVM_DEBUG(dbgs() << UseIdx << '\t' << MI)do { if (::llvm::DebugFlag && ::llvm::isCurrentDebugType
("regalloc")) { dbgs() << UseIdx << '\t' <<
MI; } } while (false)
;
588 return true;
589 }
590
591 if (SnippetCopies.count(&MI))
592 return false;
593
594 LiveInterval &OrigLI = LIS.getInterval(Original);
595 VNInfo *OrigVNI = OrigLI.getVNInfoAt(UseIdx);
596 LiveRangeEdit::Remat RM(ParentVNI);
597 RM.OrigMI = LIS.getInstructionFromIndex(OrigVNI->def);
598
599 if (!Edit->canRematerializeAt(RM, OrigVNI, UseIdx, false)) {
600 markValueUsed(&VirtReg, ParentVNI);
601 LLVM_DEBUG(dbgs() << "\tcannot remat for " << UseIdx << '\t' << MI)do { if (::llvm::DebugFlag && ::llvm::isCurrentDebugType
("regalloc")) { dbgs() << "\tcannot remat for " <<
UseIdx << '\t' << MI; } } while (false)
;
602 return false;
603 }
604
605 // If the instruction also writes VirtReg.reg, it had better not require the
606 // same register for uses and defs.
607 if (RI.Tied) {
608 markValueUsed(&VirtReg, ParentVNI);
609 LLVM_DEBUG(dbgs() << "\tcannot remat tied reg: " << UseIdx << '\t' << MI)do { if (::llvm::DebugFlag && ::llvm::isCurrentDebugType
("regalloc")) { dbgs() << "\tcannot remat tied reg: " <<
UseIdx << '\t' << MI; } } while (false)
;
610 return false;
611 }
612
613 // Before rematerializing into a register for a single instruction, try to
614 // fold a load into the instruction. That avoids allocating a new register.
615 if (RM.OrigMI->canFoldAsLoad() &&
616 foldMemoryOperand(Ops, RM.OrigMI)) {
617 Edit->markRematerialized(RM.ParentVNI);
618 ++NumFoldedLoads;
619 return true;
620 }
621
622 // If we can't guarantee that we'll be able to actually assign the new vreg,
623 // we can't remat.
624 if (!canGuaranteeAssignmentAfterRemat(VirtReg.reg(), MI)) {
625 markValueUsed(&VirtReg, ParentVNI);
626 LLVM_DEBUG(dbgs() << "\tcannot remat for " << UseIdx << '\t' << MI)do { if (::llvm::DebugFlag && ::llvm::isCurrentDebugType
("regalloc")) { dbgs() << "\tcannot remat for " <<
UseIdx << '\t' << MI; } } while (false)
;
627 return false;
628 }
629
630 // Allocate a new register for the remat.
631 Register NewVReg = Edit->createFrom(Original);
632
633 // Finally we can rematerialize OrigMI before MI.
634 SlotIndex DefIdx =
635 Edit->rematerializeAt(*MI.getParent(), MI, NewVReg, RM, TRI);
636
637 // We take the DebugLoc from MI, since OrigMI may be attributed to a
638 // different source location.
639 auto *NewMI = LIS.getInstructionFromIndex(DefIdx);
640 NewMI->setDebugLoc(MI.getDebugLoc());
641
642 (void)DefIdx;
643 LLVM_DEBUG(dbgs() << "\tremat: " << DefIdx << '\t'do { if (::llvm::DebugFlag && ::llvm::isCurrentDebugType
("regalloc")) { dbgs() << "\tremat: " << DefIdx <<
'\t' << *LIS.getInstructionFromIndex(DefIdx); } } while
(false)
644 << *LIS.getInstructionFromIndex(DefIdx))do { if (::llvm::DebugFlag && ::llvm::isCurrentDebugType
("regalloc")) { dbgs() << "\tremat: " << DefIdx <<
'\t' << *LIS.getInstructionFromIndex(DefIdx); } } while
(false)
;
645
646 // Replace operands
647 for (const auto &OpPair : Ops) {
648 MachineOperand &MO = OpPair.first->getOperand(OpPair.second);
649 if (MO.isReg() && MO.isUse() && MO.getReg() == VirtReg.reg()) {
650 MO.setReg(NewVReg);
651 MO.setIsKill();
652 }
653 }
654 LLVM_DEBUG(dbgs() << "\t " << UseIdx << '\t' << MI << '\n')do { if (::llvm::DebugFlag && ::llvm::isCurrentDebugType
("regalloc")) { dbgs() << "\t " << UseIdx <<
'\t' << MI << '\n'; } } while (false)
;
655
656 ++NumRemats;
657 return true;
658}
659
660/// reMaterializeAll - Try to rematerialize as many uses as possible,
661/// and trim the live ranges after.
662void InlineSpiller::reMaterializeAll() {
663 if (!Edit->anyRematerializable(AA))
664 return;
665
666 UsedValues.clear();
667
668 // Try to remat before all uses of snippets.
669 bool anyRemat = false;
670 for (Register Reg : RegsToSpill) {
671 LiveInterval &LI = LIS.getInterval(Reg);
672 for (MachineInstr &MI : llvm::make_early_inc_range(MRI.reg_bundles(Reg))) {
673 // Debug values are not allowed to affect codegen.
674 if (MI.isDebugValue())
675 continue;
676
677 assert(!MI.isDebugInstr() && "Did not expect to find a use in debug "(static_cast <bool> (!MI.isDebugInstr() && "Did not expect to find a use in debug "
"instruction that isn't a DBG_VALUE") ? void (0) : __assert_fail
("!MI.isDebugInstr() && \"Did not expect to find a use in debug \" \"instruction that isn't a DBG_VALUE\""
, "llvm/lib/CodeGen/InlineSpiller.cpp", 678, __extension__ __PRETTY_FUNCTION__
))
678 "instruction that isn't a DBG_VALUE")(static_cast <bool> (!MI.isDebugInstr() && "Did not expect to find a use in debug "
"instruction that isn't a DBG_VALUE") ? void (0) : __assert_fail
("!MI.isDebugInstr() && \"Did not expect to find a use in debug \" \"instruction that isn't a DBG_VALUE\""
, "llvm/lib/CodeGen/InlineSpiller.cpp", 678, __extension__ __PRETTY_FUNCTION__
))
;
679
680 anyRemat |= reMaterializeFor(LI, MI);
681 }
682 }
683 if (!anyRemat)
684 return;
685
686 // Remove any values that were completely rematted.
687 for (Register Reg : RegsToSpill) {
688 LiveInterval &LI = LIS.getInterval(Reg);
689 for (VNInfo *VNI : llvm::make_range(LI.vni_begin(), LI.vni_end())) {
690 if (VNI->isUnused() || VNI->isPHIDef() || UsedValues.count(VNI))
691 continue;
692 MachineInstr *MI = LIS.getInstructionFromIndex(VNI->def);
693 MI->addRegisterDead(Reg, &TRI);
694 if (!MI->allDefsAreDead())
695 continue;
696 LLVM_DEBUG(dbgs() << "All defs dead: " << *MI)do { if (::llvm::DebugFlag && ::llvm::isCurrentDebugType
("regalloc")) { dbgs() << "All defs dead: " << *MI
; } } while (false)
;
697 DeadDefs.push_back(MI);
698 }
699 }
700
701 // Eliminate dead code after remat. Note that some snippet copies may be
702 // deleted here.
703 if (DeadDefs.empty())
704 return;
705 LLVM_DEBUG(dbgs() << "Remat created " << DeadDefs.size() << " dead defs.\n")do { if (::llvm::DebugFlag && ::llvm::isCurrentDebugType
("regalloc")) { dbgs() << "Remat created " << DeadDefs
.size() << " dead defs.\n"; } } while (false)
;
706 Edit->eliminateDeadDefs(DeadDefs, RegsToSpill, AA);
707
708 // LiveRangeEdit::eliminateDeadDef is used to remove dead define instructions
709 // after rematerialization. To remove a VNI for a vreg from its LiveInterval,
710 // LiveIntervals::removeVRegDefAt is used. However, after non-PHI VNIs are all
711 // removed, PHI VNI are still left in the LiveInterval.
712 // So to get rid of unused reg, we need to check whether it has non-dbg
713 // reference instead of whether it has non-empty interval.
714 unsigned ResultPos = 0;
715 for (Register Reg : RegsToSpill) {
716 if (MRI.reg_nodbg_empty(Reg)) {
717 Edit->eraseVirtReg(Reg);
718 continue;
719 }
720
721 assert(LIS.hasInterval(Reg) &&(static_cast <bool> (LIS.hasInterval(Reg) && (!
LIS.getInterval(Reg).empty() || !MRI.reg_nodbg_empty(Reg)) &&
"Empty and not used live-range?!") ? void (0) : __assert_fail
("LIS.hasInterval(Reg) && (!LIS.getInterval(Reg).empty() || !MRI.reg_nodbg_empty(Reg)) && \"Empty and not used live-range?!\""
, "llvm/lib/CodeGen/InlineSpiller.cpp", 723, __extension__ __PRETTY_FUNCTION__
))
722 (!LIS.getInterval(Reg).empty() || !MRI.reg_nodbg_empty(Reg)) &&(static_cast <bool> (LIS.hasInterval(Reg) && (!
LIS.getInterval(Reg).empty() || !MRI.reg_nodbg_empty(Reg)) &&
"Empty and not used live-range?!") ? void (0) : __assert_fail
("LIS.hasInterval(Reg) && (!LIS.getInterval(Reg).empty() || !MRI.reg_nodbg_empty(Reg)) && \"Empty and not used live-range?!\""
, "llvm/lib/CodeGen/InlineSpiller.cpp", 723, __extension__ __PRETTY_FUNCTION__
))
723 "Empty and not used live-range?!")(static_cast <bool> (LIS.hasInterval(Reg) && (!
LIS.getInterval(Reg).empty() || !MRI.reg_nodbg_empty(Reg)) &&
"Empty and not used live-range?!") ? void (0) : __assert_fail
("LIS.hasInterval(Reg) && (!LIS.getInterval(Reg).empty() || !MRI.reg_nodbg_empty(Reg)) && \"Empty and not used live-range?!\""
, "llvm/lib/CodeGen/InlineSpiller.cpp", 723, __extension__ __PRETTY_FUNCTION__
))
;
724
725 RegsToSpill[ResultPos++] = Reg;
726 }
727 RegsToSpill.erase(RegsToSpill.begin() + ResultPos, RegsToSpill.end());
728 LLVM_DEBUG(dbgs() << RegsToSpill.size()do { if (::llvm::DebugFlag && ::llvm::isCurrentDebugType
("regalloc")) { dbgs() << RegsToSpill.size() << " registers to spill after remat.\n"
; } } while (false)
729 << " registers to spill after remat.\n")do { if (::llvm::DebugFlag && ::llvm::isCurrentDebugType
("regalloc")) { dbgs() << RegsToSpill.size() << " registers to spill after remat.\n"
; } } while (false)
;
730}
731
732//===----------------------------------------------------------------------===//
733// Spilling
734//===----------------------------------------------------------------------===//
735
736/// If MI is a load or store of StackSlot, it can be removed.
737bool InlineSpiller::coalesceStackAccess(MachineInstr *MI, Register Reg) {
738 int FI = 0;
739 Register InstrReg = TII.isLoadFromStackSlot(*MI, FI);
740 bool IsLoad = InstrReg;
741 if (!IsLoad)
742 InstrReg = TII.isStoreToStackSlot(*MI, FI);
743
744 // We have a stack access. Is it the right register and slot?
745 if (InstrReg != Reg || FI != StackSlot)
746 return false;
747
748 if (!IsLoad)
749 HSpiller.rmFromMergeableSpills(*MI, StackSlot);
750
751 LLVM_DEBUG(dbgs() << "Coalescing stack access: " << *MI)do { if (::llvm::DebugFlag && ::llvm::isCurrentDebugType
("regalloc")) { dbgs() << "Coalescing stack access: " <<
*MI; } } while (false)
;
752 LIS.RemoveMachineInstrFromMaps(*MI);
753 MI->eraseFromParent();
754
755 if (IsLoad) {
756 ++NumReloadsRemoved;
757 --NumReloads;
758 } else {
759 ++NumSpillsRemoved;
760 --NumSpills;
761 }
762
763 return true;
764}
765
766#if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP)
767LLVM_DUMP_METHOD__attribute__((noinline)) __attribute__((__used__))
768// Dump the range of instructions from B to E with their slot indexes.
769static void dumpMachineInstrRangeWithSlotIndex(MachineBasicBlock::iterator B,
770 MachineBasicBlock::iterator E,
771 LiveIntervals const &LIS,
772 const char *const header,
773 Register VReg = Register()) {
774 char NextLine = '\n';
775 char SlotIndent = '\t';
776
777 if (std::next(B) == E) {
778 NextLine = ' ';
779 SlotIndent = ' ';
780 }
781
782 dbgs() << '\t' << header << ": " << NextLine;
783
784 for (MachineBasicBlock::iterator I = B; I != E; ++I) {
785 SlotIndex Idx = LIS.getInstructionIndex(*I).getRegSlot();
786
787 // If a register was passed in and this instruction has it as a
788 // destination that is marked as an early clobber, print the
789 // early-clobber slot index.
790 if (VReg) {
791 MachineOperand *MO = I->findRegisterDefOperand(VReg);
792 if (MO && MO->isEarlyClobber())
793 Idx = Idx.getRegSlot(true);
794 }
795
796 dbgs() << SlotIndent << Idx << '\t' << *I;
797 }
798}
799#endif
800
801/// foldMemoryOperand - Try folding stack slot references in Ops into their
802/// instructions.
803///
804/// @param Ops Operand indices from AnalyzeVirtRegInBundle().
805/// @param LoadMI Load instruction to use instead of stack slot when non-null.
806/// @return True on success.
807bool InlineSpiller::
808foldMemoryOperand(ArrayRef<std::pair<MachineInstr *, unsigned>> Ops,
809 MachineInstr *LoadMI) {
810 if (Ops.empty())
811 return false;
812 // Don't attempt folding in bundles.
813 MachineInstr *MI = Ops.front().first;
814 if (Ops.back().first != MI || MI->isBundled())
815 return false;
816
817 bool WasCopy = MI->isCopy();
818 Register ImpReg;
819
820 // TII::foldMemoryOperand will do what we need here for statepoint
821 // (fold load into use and remove corresponding def). We will replace
822 // uses of removed def with loads (spillAroundUses).
823 // For that to work we need to untie def and use to pass it through
824 // foldMemoryOperand and signal foldPatchpoint that it is allowed to
825 // fold them.
826 bool UntieRegs = MI->getOpcode() == TargetOpcode::STATEPOINT;
827
828 // Spill subregs if the target allows it.
829 // We always want to spill subregs for stackmap/patchpoint pseudos.
830 bool SpillSubRegs = TII.isSubregFoldable() ||
831 MI->getOpcode() == TargetOpcode::STATEPOINT ||
832 MI->getOpcode() == TargetOpcode::PATCHPOINT ||
833 MI->getOpcode() == TargetOpcode::STACKMAP;
834
835 // TargetInstrInfo::foldMemoryOperand only expects explicit, non-tied
836 // operands.
837 SmallVector<unsigned, 8> FoldOps;
838 for (const auto &OpPair : Ops) {
839 unsigned Idx = OpPair.second;
840 assert(MI == OpPair.first && "Instruction conflict during operand folding")(static_cast <bool> (MI == OpPair.first && "Instruction conflict during operand folding"
) ? void (0) : __assert_fail ("MI == OpPair.first && \"Instruction conflict during operand folding\""
, "llvm/lib/CodeGen/InlineSpiller.cpp", 840, __extension__ __PRETTY_FUNCTION__
))
;
841 MachineOperand &MO = MI->getOperand(Idx);
842 if (MO.isImplicit()) {
843 ImpReg = MO.getReg();
844 continue;
845 }
846
847 if (!SpillSubRegs && MO.getSubReg())
848 return false;
849 // We cannot fold a load instruction into a def.
850 if (LoadMI && MO.isDef())
851 return false;
852 // Tied use operands should not be passed to foldMemoryOperand.
853 if (UntieRegs || !MI->isRegTiedToDefOperand(Idx))
854 FoldOps.push_back(Idx);
855 }
856
857 // If we only have implicit uses, we won't be able to fold that.
858 // Moreover, TargetInstrInfo::foldMemoryOperand will assert if we try!
859 if (FoldOps.empty())
860 return false;
861
862 MachineInstrSpan MIS(MI, MI->getParent());
863
864 SmallVector<std::pair<unsigned, unsigned> > TiedOps;
865 if (UntieRegs)
866 for (unsigned Idx : FoldOps) {
867 MachineOperand &MO = MI->getOperand(Idx);
868 if (!MO.isTied())
869 continue;
870 unsigned Tied = MI->findTiedOperandIdx(Idx);
871 if (MO.isUse())
872 TiedOps.emplace_back(Tied, Idx);
873 else {
874 assert(MO.isDef() && "Tied to not use and def?")(static_cast <bool> (MO.isDef() && "Tied to not use and def?"
) ? void (0) : __assert_fail ("MO.isDef() && \"Tied to not use and def?\""
, "llvm/lib/CodeGen/InlineSpiller.cpp", 874, __extension__ __PRETTY_FUNCTION__
))
;
875 TiedOps.emplace_back(Idx, Tied);
876 }
877 MI->untieRegOperand(Idx);
878 }
879
880 MachineInstr *FoldMI =
881 LoadMI ? TII.foldMemoryOperand(*MI, FoldOps, *LoadMI, &LIS)
882 : TII.foldMemoryOperand(*MI, FoldOps, StackSlot, &LIS, &VRM);
883 if (!FoldMI) {
884 // Re-tie operands.
885 for (auto Tied : TiedOps)
886 MI->tieOperands(Tied.first, Tied.second);
887 return false;
888 }
889
890 // Remove LIS for any dead defs in the original MI not in FoldMI.
891 for (MIBundleOperands MO(*MI); MO.isValid(); ++MO) {
892 if (!MO->isReg())
893 continue;
894 Register Reg = MO->getReg();
895 if (!Reg || Register::isVirtualRegister(Reg) || MRI.isReserved(Reg)) {
896 continue;
897 }
898 // Skip non-Defs, including undef uses and internal reads.
899 if (MO->isUse())
900 continue;
901 PhysRegInfo RI = AnalyzePhysRegInBundle(*FoldMI, Reg, &TRI);
902 if (RI.FullyDefined)
903 continue;
904 // FoldMI does not define this physreg. Remove the LI segment.
905 assert(MO->isDead() && "Cannot fold physreg def")(static_cast <bool> (MO->isDead() && "Cannot fold physreg def"
) ? void (0) : __assert_fail ("MO->isDead() && \"Cannot fold physreg def\""
, "llvm/lib/CodeGen/InlineSpiller.cpp", 905, __extension__ __PRETTY_FUNCTION__
))
;
906 SlotIndex Idx = LIS.getInstructionIndex(*MI).getRegSlot();
907 LIS.removePhysRegDefAt(Reg.asMCReg(), Idx);
908 }
909
910 int FI;
911 if (TII.isStoreToStackSlot(*MI, FI) &&
912 HSpiller.rmFromMergeableSpills(*MI, FI))
913 --NumSpills;
914 LIS.ReplaceMachineInstrInMaps(*MI, *FoldMI);
915 // Update the call site info.
916 if (MI->isCandidateForCallSiteEntry())
917 MI->getMF()->moveCallSiteInfo(MI, FoldMI);
918
919 // If we've folded a store into an instruction labelled with debug-info,
920 // record a substitution from the old operand to the memory operand. Handle
921 // the simple common case where operand 0 is the one being folded, plus when
922 // the destination operand is also a tied def. More values could be
923 // substituted / preserved with more analysis.
924 if (MI->peekDebugInstrNum() && Ops[0].second == 0) {
925 // Helper lambda.
926 auto MakeSubstitution = [this,FoldMI,MI,&Ops]() {
927 // Substitute old operand zero to the new instructions memory operand.
928 unsigned OldOperandNum = Ops[0].second;
929 unsigned NewNum = FoldMI->getDebugInstrNum();
930 unsigned OldNum = MI->getDebugInstrNum();
931 MF.makeDebugValueSubstitution({OldNum, OldOperandNum},
932 {NewNum, MachineFunction::DebugOperandMemNumber});
933 };
934
935 const MachineOperand &Op0 = MI->getOperand(Ops[0].second);
936 if (Ops.size() == 1 && Op0.isDef()) {
937 MakeSubstitution();
938 } else if (Ops.size() == 2 && Op0.isDef() && MI->getOperand(1).isTied() &&
939 Op0.getReg() == MI->getOperand(1).getReg()) {
940 MakeSubstitution();
941 }
942 } else if (MI->peekDebugInstrNum()) {
943 // This is a debug-labelled instruction, but the operand being folded isn't
944 // at operand zero. Most likely this means it's a load being folded in.
945 // Substitute any register defs from operand zero up to the one being
946 // folded -- past that point, we don't know what the new operand indexes
947 // will be.
948 MF.substituteDebugValuesForInst(*MI, *FoldMI, Ops[0].second);
949 }
950
951 MI->eraseFromParent();
952
953 // Insert any new instructions other than FoldMI into the LIS maps.
954 assert(!MIS.empty() && "Unexpected empty span of instructions!")(static_cast <bool> (!MIS.empty() && "Unexpected empty span of instructions!"
) ? void (0) : __assert_fail ("!MIS.empty() && \"Unexpected empty span of instructions!\""
, "llvm/lib/CodeGen/InlineSpiller.cpp", 954, __extension__ __PRETTY_FUNCTION__
))
;
955 for (MachineInstr &MI : MIS)
956 if (&MI != FoldMI)
957 LIS.InsertMachineInstrInMaps(MI);
958
959 // TII.foldMemoryOperand may have left some implicit operands on the
960 // instruction. Strip them.
961 if (ImpReg)
962 for (unsigned i = FoldMI->getNumOperands(); i; --i) {
963 MachineOperand &MO = FoldMI->getOperand(i - 1);
964 if (!MO.isReg() || !MO.isImplicit())
965 break;
966 if (MO.getReg() == ImpReg)
967 FoldMI->RemoveOperand(i - 1);
968 }
969
970 LLVM_DEBUG(dumpMachineInstrRangeWithSlotIndex(MIS.begin(), MIS.end(), LIS,do { if (::llvm::DebugFlag && ::llvm::isCurrentDebugType
("regalloc")) { dumpMachineInstrRangeWithSlotIndex(MIS.begin(
), MIS.end(), LIS, "folded"); } } while (false)
971 "folded"))do { if (::llvm::DebugFlag && ::llvm::isCurrentDebugType
("regalloc")) { dumpMachineInstrRangeWithSlotIndex(MIS.begin(
), MIS.end(), LIS, "folded"); } } while (false)
;
972
973 if (!WasCopy)
974 ++NumFolded;
975 else if (Ops.front().second == 0) {
976 ++NumSpills;
977 // If there is only 1 store instruction is required for spill, add it
978 // to mergeable list. In X86 AMX, 2 intructions are required to store.
979 // We disable the merge for this case.
980 if (std::distance(MIS.begin(), MIS.end()) <= 1)
981 HSpiller.addToMergeableSpills(*FoldMI, StackSlot, Original);
982 } else
983 ++NumReloads;
984 return true;
985}
986
987void InlineSpiller::insertReload(Register NewVReg,
988 SlotIndex Idx,
989 MachineBasicBlock::iterator MI) {
990 MachineBasicBlock &MBB = *MI->getParent();
991
992 MachineInstrSpan MIS(MI, &MBB);
993 TII.loadRegFromStackSlot(MBB, MI, NewVReg, StackSlot,
994 MRI.getRegClass(NewVReg), &TRI);
995
996 LIS.InsertMachineInstrRangeInMaps(MIS.begin(), MI);
997
998 LLVM_DEBUG(dumpMachineInstrRangeWithSlotIndex(MIS.begin(), MI, LIS, "reload",do { if (::llvm::DebugFlag && ::llvm::isCurrentDebugType
("regalloc")) { dumpMachineInstrRangeWithSlotIndex(MIS.begin(
), MI, LIS, "reload", NewVReg); } } while (false)
999 NewVReg))do { if (::llvm::DebugFlag && ::llvm::isCurrentDebugType
("regalloc")) { dumpMachineInstrRangeWithSlotIndex(MIS.begin(
), MI, LIS, "reload", NewVReg); } } while (false)
;
1000 ++NumReloads;
1001}
1002
1003/// Check if \p Def fully defines a VReg with an undefined value.
1004/// If that's the case, that means the value of VReg is actually
1005/// not relevant.
1006static bool isRealSpill(const MachineInstr &Def) {
1007 if (!Def.isImplicitDef())
1008 return true;
1009 assert(Def.getNumOperands() == 1 &&(static_cast <bool> (Def.getNumOperands() == 1 &&
"Implicit def with more than one definition") ? void (0) : __assert_fail
("Def.getNumOperands() == 1 && \"Implicit def with more than one definition\""
, "llvm/lib/CodeGen/InlineSpiller.cpp", 1010, __extension__ __PRETTY_FUNCTION__
))
1010 "Implicit def with more than one definition")(static_cast <bool> (Def.getNumOperands() == 1 &&
"Implicit def with more than one definition") ? void (0) : __assert_fail
("Def.getNumOperands() == 1 && \"Implicit def with more than one definition\""
, "llvm/lib/CodeGen/InlineSpiller.cpp", 1010, __extension__ __PRETTY_FUNCTION__
))
;
1011 // We can say that the VReg defined by Def is undef, only if it is
1012 // fully defined by Def. Otherwise, some of the lanes may not be
1013 // undef and the value of the VReg matters.
1014 return Def.getOperand(0).getSubReg();
1015}
1016
1017/// insertSpill - Insert a spill of NewVReg after MI.
1018void InlineSpiller::insertSpill(Register NewVReg, bool isKill,
1019 MachineBasicBlock::iterator MI) {
1020 // Spill are not terminators, so inserting spills after terminators will
1021 // violate invariants in MachineVerifier.
1022 assert(!MI->isTerminator() && "Inserting a spill after a terminator")(static_cast <bool> (!MI->isTerminator() && "Inserting a spill after a terminator"
) ? void (0) : __assert_fail ("!MI->isTerminator() && \"Inserting a spill after a terminator\""
, "llvm/lib/CodeGen/InlineSpiller.cpp", 1022, __extension__ __PRETTY_FUNCTION__
))
;
1023 MachineBasicBlock &MBB = *MI->getParent();
1024
1025 MachineInstrSpan MIS(MI, &MBB);
1026 MachineBasicBlock::iterator SpillBefore = std::next(MI);
1027 bool IsRealSpill = isRealSpill(*MI);
1028
1029 if (IsRealSpill)
1030 TII.storeRegToStackSlot(MBB, SpillBefore, NewVReg, isKill, StackSlot,
1031 MRI.getRegClass(NewVReg), &TRI);
1032 else
1033 // Don't spill undef value.
1034 // Anything works for undef, in particular keeping the memory
1035 // uninitialized is a viable option and it saves code size and
1036 // run time.
1037 BuildMI(MBB, SpillBefore, MI->getDebugLoc(), TII.get(TargetOpcode::KILL))
1038 .addReg(NewVReg, getKillRegState(isKill));
1039
1040 MachineBasicBlock::iterator Spill = std::next(MI);
1041 LIS.InsertMachineInstrRangeInMaps(Spill, MIS.end());
1042 for (const MachineInstr &MI : make_range(Spill, MIS.end()))
1043 getVDefInterval(MI, LIS);
1044
1045 LLVM_DEBUG(do { if (::llvm::DebugFlag && ::llvm::isCurrentDebugType
("regalloc")) { dumpMachineInstrRangeWithSlotIndex(Spill, MIS
.end(), LIS, "spill"); } } while (false)
1046 dumpMachineInstrRangeWithSlotIndex(Spill, MIS.end(), LIS, "spill"))do { if (::llvm::DebugFlag && ::llvm::isCurrentDebugType
("regalloc")) { dumpMachineInstrRangeWithSlotIndex(Spill, MIS
.end(), LIS, "spill"); } } while (false)
;
1047 ++NumSpills;
1048 // If there is only 1 store instruction is required for spill, add it
1049 // to mergeable list. In X86 AMX, 2 intructions are required to store.
1050 // We disable the merge for this case.
1051 if (IsRealSpill && std::distance(Spill, MIS.end()) <= 1)
1052 HSpiller.addToMergeableSpills(*Spill, StackSlot, Original);
1053}
1054
1055/// spillAroundUses - insert spill code around each use of Reg.
1056void InlineSpiller::spillAroundUses(Register Reg) {
1057 LLVM_DEBUG(dbgs() << "spillAroundUses " << printReg(Reg) << '\n')do { if (::llvm::DebugFlag && ::llvm::isCurrentDebugType
("regalloc")) { dbgs() << "spillAroundUses " << printReg
(Reg) << '\n'; } } while (false)
;
1058 LiveInterval &OldLI = LIS.getInterval(Reg);
1059
1060 // Iterate over instructions using Reg.
1061 for (MachineInstr &MI : llvm::make_early_inc_range(MRI.reg_bundles(Reg))) {
1062 // Debug values are not allowed to affect codegen.
1063 if (MI.isDebugValue()) {
1064 // Modify DBG_VALUE now that the value is in a spill slot.
1065 MachineBasicBlock *MBB = MI.getParent();
1066 LLVM_DEBUG(dbgs() << "Modifying debug info due to spill:\t" << MI)do { if (::llvm::DebugFlag && ::llvm::isCurrentDebugType
("regalloc")) { dbgs() << "Modifying debug info due to spill:\t"
<< MI; } } while (false)
;
1067 buildDbgValueForSpill(*MBB, &MI, MI, StackSlot, Reg);
1068 MBB->erase(MI);
1069 continue;
1070 }
1071
1072 assert(!MI.isDebugInstr() && "Did not expect to find a use in debug "(static_cast <bool> (!MI.isDebugInstr() && "Did not expect to find a use in debug "
"instruction that isn't a DBG_VALUE") ? void (0) : __assert_fail
("!MI.isDebugInstr() && \"Did not expect to find a use in debug \" \"instruction that isn't a DBG_VALUE\""
, "llvm/lib/CodeGen/InlineSpiller.cpp", 1073, __extension__ __PRETTY_FUNCTION__
))
1073 "instruction that isn't a DBG_VALUE")(static_cast <bool> (!MI.isDebugInstr() && "Did not expect to find a use in debug "
"instruction that isn't a DBG_VALUE") ? void (0) : __assert_fail
("!MI.isDebugInstr() && \"Did not expect to find a use in debug \" \"instruction that isn't a DBG_VALUE\""
, "llvm/lib/CodeGen/InlineSpiller.cpp", 1073, __extension__ __PRETTY_FUNCTION__
))
;
1074
1075 // Ignore copies to/from snippets. We'll delete them.
1076 if (SnippetCopies.count(&MI))
1077 continue;
1078
1079 // Stack slot accesses may coalesce away.
1080 if (coalesceStackAccess(&MI, Reg))
1081 continue;
1082
1083 // Analyze instruction.
1084 SmallVector<std::pair<MachineInstr*, unsigned>, 8> Ops;
1085 VirtRegInfo RI = AnalyzeVirtRegInBundle(MI, Reg, &Ops);
1086
1087 // Find the slot index where this instruction reads and writes OldLI.
1088 // This is usually the def slot, except for tied early clobbers.
1089 SlotIndex Idx = LIS.getInstructionIndex(MI).getRegSlot();
1090 if (VNInfo *VNI = OldLI.getVNInfoAt(Idx.getRegSlot(true)))
1091 if (SlotIndex::isSameInstr(Idx, VNI->def))
1092 Idx = VNI->def;
1093
1094 // Check for a sibling copy.
1095 Register SibReg = isFullCopyOf(MI, Reg);
1096 if (SibReg && isSibling(SibReg)) {
1097 // This may actually be a copy between snippets.
1098 if (isRegToSpill(SibReg)) {
1099 LLVM_DEBUG(dbgs() << "Found new snippet copy: " << MI)do { if (::llvm::DebugFlag && ::llvm::isCurrentDebugType
("regalloc")) { dbgs() << "Found new snippet copy: " <<
MI; } } while (false)
;
1100 SnippetCopies.insert(&MI);
1101 continue;
1102 }
1103 if (RI.Writes) {
1104 if (hoistSpillInsideBB(OldLI, MI)) {
1105 // This COPY is now dead, the value is already in the stack slot.
1106 MI.getOperand(0).setIsDead();
1107 DeadDefs.push_back(&MI);
1108 continue;
1109 }
1110 } else {
1111 // This is a reload for a sib-reg copy. Drop spills downstream.
1112 LiveInterval &SibLI = LIS.getInterval(SibReg);
1113 eliminateRedundantSpills(SibLI, SibLI.getVNInfoAt(Idx));
1114 // The COPY will fold to a reload below.
1115 }
1116 }
1117
1118 // Attempt to fold memory ops.
1119 if (foldMemoryOperand(Ops))
1120 continue;
1121
1122 // Create a new virtual register for spill/fill.
1123 // FIXME: Infer regclass from instruction alone.
1124 Register NewVReg = Edit->createFrom(Reg);
1125
1126 if (RI.Reads)
1127 insertReload(NewVReg, Idx, &MI);
1128
1129 // Rewrite instruction operands.
1130 bool hasLiveDef = false;
1131 for (const auto &OpPair : Ops) {
1132 MachineOperand &MO = OpPair.first->getOperand(OpPair.second);
1133 MO.setReg(NewVReg);
1134 if (MO.isUse()) {
1135 if (!OpPair.first->isRegTiedToDefOperand(OpPair.second))
1136 MO.setIsKill();
1137 } else {
1138 if (!MO.isDead())
1139 hasLiveDef = true;
1140 }
1141 }
1142 LLVM_DEBUG(dbgs() << "\trewrite: " << Idx << '\t' << MI << '\n')do { if (::llvm::DebugFlag && ::llvm::isCurrentDebugType
("regalloc")) { dbgs() << "\trewrite: " << Idx <<
'\t' << MI << '\n'; } } while (false)
;
1143
1144 // FIXME: Use a second vreg if instruction has no tied ops.
1145 if (RI.Writes)
1146 if (hasLiveDef)
1147 insertSpill(NewVReg, true, &MI);
1148 }
1149}
1150
1151/// spillAll - Spill all registers remaining after rematerialization.
1152void InlineSpiller::spillAll() {
1153 // Update LiveStacks now that we are committed to spilling.
1154 if (StackSlot == VirtRegMap::NO_STACK_SLOT) {
1155 StackSlot = VRM.assignVirt2StackSlot(Original);
1156 StackInt = &LSS.getOrCreateInterval(StackSlot, MRI.getRegClass(Original));
1157 StackInt->getNextValue(SlotIndex(), LSS.getVNInfoAllocator());
1158 } else
1159 StackInt = &LSS.getInterval(StackSlot);
1160
1161 if (Original != Edit->getReg())
1162 VRM.assignVirt2StackSlot(Edit->getReg(), StackSlot);
1163
1164 assert(StackInt->getNumValNums() == 1 && "Bad stack interval values")(static_cast <bool> (StackInt->getNumValNums() == 1 &&
"Bad stack interval values") ? void (0) : __assert_fail ("StackInt->getNumValNums() == 1 && \"Bad stack interval values\""
, "llvm/lib/CodeGen/InlineSpiller.cpp", 1164, __extension__ __PRETTY_FUNCTION__
))
;
1165 for (Register Reg : RegsToSpill)
1166 StackInt->MergeSegmentsInAsValue(LIS.getInterval(Reg),
1167 StackInt->getValNumInfo(0));
1168 LLVM_DEBUG(dbgs() << "Merged spilled regs: " << *StackInt << '\n')do { if (::llvm::DebugFlag && ::llvm::isCurrentDebugType
("regalloc")) { dbgs() << "Merged spilled regs: " <<
*StackInt << '\n'; } } while (false)
;
1169
1170 // Spill around uses of all RegsToSpill.
1171 for (Register Reg : RegsToSpill)
1172 spillAroundUses(Reg);
1173
1174 // Hoisted spills may cause dead code.
1175 if (!DeadDefs.empty()) {
1176 LLVM_DEBUG(dbgs() << "Eliminating " << DeadDefs.size() << " dead defs\n")do { if (::llvm::DebugFlag && ::llvm::isCurrentDebugType
("regalloc")) { dbgs() << "Eliminating " << DeadDefs
.size() << " dead defs\n"; } } while (false)
;
1177 Edit->eliminateDeadDefs(DeadDefs, RegsToSpill, AA);
1178 }
1179
1180 // Finally delete the SnippetCopies.
1181 for (Register Reg : RegsToSpill) {
1182 for (MachineInstr &MI :
1183 llvm::make_early_inc_range(MRI.reg_instructions(Reg))) {
1184 assert(SnippetCopies.count(&MI) && "Remaining use wasn't a snippet copy")(static_cast <bool> (SnippetCopies.count(&MI) &&
"Remaining use wasn't a snippet copy") ? void (0) : __assert_fail
("SnippetCopies.count(&MI) && \"Remaining use wasn't a snippet copy\""
, "llvm/lib/CodeGen/InlineSpiller.cpp", 1184, __extension__ __PRETTY_FUNCTION__
))
;
1185 // FIXME: Do this with a LiveRangeEdit callback.
1186 LIS.RemoveMachineInstrFromMaps(MI);
1187 MI.eraseFromParent();
1188 }
1189 }
1190
1191 // Delete all spilled registers.
1192 for (Register Reg : RegsToSpill)
1193 Edit->eraseVirtReg(Reg);
1194}
1195
1196void InlineSpiller::spill(LiveRangeEdit &edit) {
1197 ++NumSpilledRanges;
1198 Edit = &edit;
1199 assert(!Register::isStackSlot(edit.getReg()) &&(static_cast <bool> (!Register::isStackSlot(edit.getReg
()) && "Trying to spill a stack slot.") ? void (0) : __assert_fail
("!Register::isStackSlot(edit.getReg()) && \"Trying to spill a stack slot.\""
, "llvm/lib/CodeGen/InlineSpiller.cpp", 1200, __extension__ __PRETTY_FUNCTION__
))
1200 "Trying to spill a stack slot.")(static_cast <bool> (!Register::isStackSlot(edit.getReg
()) && "Trying to spill a stack slot.") ? void (0) : __assert_fail
("!Register::isStackSlot(edit.getReg()) && \"Trying to spill a stack slot.\""
, "llvm/lib/CodeGen/InlineSpiller.cpp", 1200, __extension__ __PRETTY_FUNCTION__
))
;
1201 // Share a stack slot among all descendants of Original.
1202 Original = VRM.getOriginal(edit.getReg());
1203 StackSlot = VRM.getStackSlot(Original);
1204 StackInt = nullptr;
1205
1206 LLVM_DEBUG(dbgs() << "Inline spilling "do { if (::llvm::DebugFlag && ::llvm::isCurrentDebugType
("regalloc")) { dbgs() << "Inline spilling " << TRI
.getRegClassName(MRI.getRegClass(edit.getReg())) << ':'
<< edit.getParent() << "\nFrom original " <<
printReg(Original) << '\n'; } } while (false)
1207 << TRI.getRegClassName(MRI.getRegClass(edit.getReg()))do { if (::llvm::DebugFlag && ::llvm::isCurrentDebugType
("regalloc")) { dbgs() << "Inline spilling " << TRI
.getRegClassName(MRI.getRegClass(edit.getReg())) << ':'
<< edit.getParent() << "\nFrom original " <<
printReg(Original) << '\n'; } } while (false)
1208 << ':' << edit.getParent() << "\nFrom original "do { if (::llvm::DebugFlag && ::llvm::isCurrentDebugType
("regalloc")) { dbgs() << "Inline spilling " << TRI
.getRegClassName(MRI.getRegClass(edit.getReg())) << ':'
<< edit.getParent() << "\nFrom original " <<
printReg(Original) << '\n'; } } while (false)
1209 << printReg(Original) << '\n')do { if (::llvm::DebugFlag && ::llvm::isCurrentDebugType
("regalloc")) { dbgs() << "Inline spilling " << TRI
.getRegClassName(MRI.getRegClass(edit.getReg())) << ':'
<< edit.getParent() << "\nFrom original " <<
printReg(Original) << '\n'; } } while (false)
;
1210 assert(edit.getParent().isSpillable() &&(static_cast <bool> (edit.getParent().isSpillable() &&
"Attempting to spill already spilled value.") ? void (0) : __assert_fail
("edit.getParent().isSpillable() && \"Attempting to spill already spilled value.\""
, "llvm/lib/CodeGen/InlineSpiller.cpp", 1211, __extension__ __PRETTY_FUNCTION__
))
1211 "Attempting to spill already spilled value.")(static_cast <bool> (edit.getParent().isSpillable() &&
"Attempting to spill already spilled value.") ? void (0) : __assert_fail
("edit.getParent().isSpillable() && \"Attempting to spill already spilled value.\""
, "llvm/lib/CodeGen/InlineSpiller.cpp", 1211, __extension__ __PRETTY_FUNCTION__
))
;
1212 assert(DeadDefs.empty() && "Previous spill didn't remove dead defs")(static_cast <bool> (DeadDefs.empty() && "Previous spill didn't remove dead defs"
) ? void (0) : __assert_fail ("DeadDefs.empty() && \"Previous spill didn't remove dead defs\""
, "llvm/lib/CodeGen/InlineSpiller.cpp", 1212, __extension__ __PRETTY_FUNCTION__
))
;
1213
1214 collectRegsToSpill();
1215 reMaterializeAll();
1216
1217 // Remat may handle everything.
1218 if (!RegsToSpill.empty())
1219 spillAll();
1220
1221 Edit->calculateRegClassAndHint(MF, VRAI);
1222}
1223
1224/// Optimizations after all the reg selections and spills are done.
1225void InlineSpiller::postOptimization() { HSpiller.hoistAllSpills(); }
1226
1227/// When a spill is inserted, add the spill to MergeableSpills map.
1228void HoistSpillHelper::addToMergeableSpills(MachineInstr &Spill, int StackSlot,
1229 unsigned Original) {
1230 BumpPtrAllocator &Allocator = LIS.getVNInfoAllocator();
1231 LiveInterval &OrigLI = LIS.getInterval(Original);
1232 // save a copy of LiveInterval in StackSlotToOrigLI because the original
1233 // LiveInterval may be cleared after all its references are spilled.
1234 if (StackSlotToOrigLI.find(StackSlot) == StackSlotToOrigLI.end()) {
1235 auto LI = std::make_unique<LiveInterval>(OrigLI.reg(), OrigLI.weight());
1236 LI->assign(OrigLI, Allocator);
1237 StackSlotToOrigLI[StackSlot] = std::move(LI);
1238 }
1239 SlotIndex Idx = LIS.getInstructionIndex(Spill);
1240 VNInfo *OrigVNI = StackSlotToOrigLI[StackSlot]->getVNInfoAt(Idx.getRegSlot());
1241 std::pair<int, VNInfo *> MIdx = std::make_pair(StackSlot, OrigVNI);
1242 MergeableSpills[MIdx].insert(&Spill);
1243}
1244
1245/// When a spill is removed, remove the spill from MergeableSpills map.
1246/// Return true if the spill is removed successfully.
1247bool HoistSpillHelper::rmFromMergeableSpills(MachineInstr &Spill,
1248 int StackSlot) {
1249 auto It = StackSlotToOrigLI.find(StackSlot);
1250 if (It == StackSlotToOrigLI.end())
1251 return false;
1252 SlotIndex Idx = LIS.getInstructionIndex(Spill);
1253 VNInfo *OrigVNI = It->second->getVNInfoAt(Idx.getRegSlot());
1254 std::pair<int, VNInfo *> MIdx = std::make_pair(StackSlot, OrigVNI);
1255 return MergeableSpills[MIdx].erase(&Spill);
1256}
1257
1258/// Check BB to see if it is a possible target BB to place a hoisted spill,
1259/// i.e., there should be a living sibling of OrigReg at the insert point.
1260bool HoistSpillHelper::isSpillCandBB(LiveInterval &OrigLI, VNInfo &OrigVNI,
1261 MachineBasicBlock &BB, Register &LiveReg) {
1262 SlotIndex Idx = IPA.getLastInsertPoint(OrigLI, BB);
1263 // The original def could be after the last insert point in the root block,
1264 // we can't hoist to here.
1265 if (Idx < OrigVNI.def) {
1266 // TODO: We could be better here. If LI is not alive in landing pad
1267 // we could hoist spill after LIP.
1268 LLVM_DEBUG(dbgs() << "can't spill in root block - def after LIP\n")do { if (::llvm::DebugFlag && ::llvm::isCurrentDebugType
("regalloc")) { dbgs() << "can't spill in root block - def after LIP\n"
; } } while (false)
;
1269 return false;
1270 }
1271 Register OrigReg = OrigLI.reg();
1272 SmallSetVector<Register, 16> &Siblings = Virt2SiblingsMap[OrigReg];
1273 assert(OrigLI.getVNInfoAt(Idx) == &OrigVNI && "Unexpected VNI")(static_cast <bool> (OrigLI.getVNInfoAt(Idx) == &OrigVNI
&& "Unexpected VNI") ? void (0) : __assert_fail ("OrigLI.getVNInfoAt(Idx) == &OrigVNI && \"Unexpected VNI\""
, "llvm/lib/CodeGen/InlineSpiller.cpp", 1273, __extension__ __PRETTY_FUNCTION__
))
;
1274
1275 for (const Register &SibReg : Siblings) {
1276 LiveInterval &LI = LIS.getInterval(SibReg);
1277 VNInfo *VNI = LI.getVNInfoAt(Idx);
1278 if (VNI) {
1279 LiveReg = SibReg;
1280 return true;
1281 }
1282 }
1283 return false;
1284}
1285
1286/// Remove redundant spills in the same BB. Save those redundant spills in
1287/// SpillsToRm, and save the spill to keep and its BB in SpillBBToSpill map.
1288void HoistSpillHelper::rmRedundantSpills(
1289 SmallPtrSet<MachineInstr *, 16> &Spills,
1290 SmallVectorImpl<MachineInstr *> &SpillsToRm,
1291 DenseMap<MachineDomTreeNode *, MachineInstr *> &SpillBBToSpill) {
1292 // For each spill saw, check SpillBBToSpill[] and see if its BB already has
1293 // another spill inside. If a BB contains more than one spill, only keep the
1294 // earlier spill with smaller SlotIndex.
1295 for (const auto CurrentSpill : Spills) {
1296 MachineBasicBlock *Block = CurrentSpill->getParent();
1297 MachineDomTreeNode *Node = MDT.getBase().getNode(Block);
1298 MachineInstr *PrevSpill = SpillBBToSpill[Node];
1299 if (PrevSpill) {
1300 SlotIndex PIdx = LIS.getInstructionIndex(*PrevSpill);
1301 SlotIndex CIdx = LIS.getInstructionIndex(*CurrentSpill);
1302 MachineInstr *SpillToRm = (CIdx > PIdx) ? CurrentSpill : PrevSpill;
1303 MachineInstr *SpillToKeep = (CIdx > PIdx) ? PrevSpill : CurrentSpill;
1304 SpillsToRm.push_back(SpillToRm);
1305 SpillBBToSpill[MDT.getBase().getNode(Block)] = SpillToKeep;
1306 } else {
1307 SpillBBToSpill[MDT.getBase().getNode(Block)] = CurrentSpill;
1308 }
1309 }
1310 for (const auto SpillToRm : SpillsToRm)
1311 Spills.erase(SpillToRm);
1312}
1313
1314/// Starting from \p Root find a top-down traversal order of the dominator
1315/// tree to visit all basic blocks containing the elements of \p Spills.
1316/// Redundant spills will be found and put into \p SpillsToRm at the same
1317/// time. \p SpillBBToSpill will be populated as part of the process and
1318/// maps a basic block to the first store occurring in the basic block.
1319/// \post SpillsToRm.union(Spills\@post) == Spills\@pre
1320void HoistSpillHelper::getVisitOrders(
1321 MachineBasicBlock *Root, SmallPtrSet<MachineInstr *, 16> &Spills,
1322 SmallVectorImpl<MachineDomTreeNode *> &Orders,
1323 SmallVectorImpl<MachineInstr *> &SpillsToRm,
1324 DenseMap<MachineDomTreeNode *, unsigned> &SpillsToKeep,
1325 DenseMap<MachineDomTreeNode *, MachineInstr *> &SpillBBToSpill) {
1326 // The set contains all the possible BB nodes to which we may hoist
1327 // original spills.
1328 SmallPtrSet<MachineDomTreeNode *, 8> WorkSet;
1329 // Save the BB nodes on the path from the first BB node containing
1330 // non-redundant spill to the Root node.
1331 SmallPtrSet<MachineDomTreeNode *, 8> NodesOnPath;
1332 // All the spills to be hoisted must originate from a single def instruction
1333 // to the OrigReg. It means the def instruction should dominate all the spills
1334 // to be hoisted. We choose the BB where the def instruction is located as
1335 // the Root.
1336 MachineDomTreeNode *RootIDomNode = MDT[Root]->getIDom();
1337 // For every node on the dominator tree with spill, walk up on the dominator
1338 // tree towards the Root node until it is reached. If there is other node
1339 // containing spill in the middle of the path, the previous spill saw will
1340 // be redundant and the node containing it will be removed. All the nodes on
1341 // the path starting from the first node with non-redundant spill to the Root
1342 // node will be added to the WorkSet, which will contain all the possible
1343 // locations where spills may be hoisted to after the loop below is done.
1344 for (const auto Spill : Spills) {
1345 MachineBasicBlock *Block = Spill->getParent();
1346 MachineDomTreeNode *Node = MDT[Block];
1347 MachineInstr *SpillToRm = nullptr;
1348 while (Node != RootIDomNode) {
1349 // If Node dominates Block, and it already contains a spill, the spill in
1350 // Block will be redundant.
1351 if (Node != MDT[Block] && SpillBBToSpill[Node]) {
1352 SpillToRm = SpillBBToSpill[MDT[Block]];
1353 break;
1354 /// If we see the Node already in WorkSet, the path from the Node to
1355 /// the Root node must already be traversed by another spill.
1356 /// Then no need to repeat.
1357 } else if (WorkSet.count(Node)) {
1358 break;
1359 } else {
1360 NodesOnPath.insert(Node);
1361 }
1362 Node = Node->getIDom();
1363 }
1364 if (SpillToRm) {
1365 SpillsToRm.push_back(SpillToRm);
1366 } else {
1367 // Add a BB containing the original spills to SpillsToKeep -- i.e.,
1368 // set the initial status before hoisting start. The value of BBs
1369 // containing original spills is set to 0, in order to descriminate
1370 // with BBs containing hoisted spills which will be inserted to
1371 // SpillsToKeep later during hoisting.
1372 SpillsToKeep[MDT[Block]] = 0;
1373 WorkSet.insert(NodesOnPath.begin(), NodesOnPath.end());
1374 }
1375 NodesOnPath.clear();
1376 }
1377
1378 // Sort the nodes in WorkSet in top-down order and save the nodes
1379 // in Orders. Orders will be used for hoisting in runHoistSpills.
1380 unsigned idx = 0;
1381 Orders.push_back(MDT.getBase().getNode(Root));
1382 do {
1383 MachineDomTreeNode *Node = Orders[idx++];
1384 for (MachineDomTreeNode *Child : Node->children()) {
1385 if (WorkSet.count(Child))
1386 Orders.push_back(Child);
1387 }
1388 } while (idx != Orders.size());
1389 assert(Orders.size() == WorkSet.size() &&(static_cast <bool> (Orders.size() == WorkSet.size() &&
"Orders have different size with WorkSet") ? void (0) : __assert_fail
("Orders.size() == WorkSet.size() && \"Orders have different size with WorkSet\""
, "llvm/lib/CodeGen/InlineSpiller.cpp", 1390, __extension__ __PRETTY_FUNCTION__
))
1390 "Orders have different size with WorkSet")(static_cast <bool> (Orders.size() == WorkSet.size() &&
"Orders have different size with WorkSet") ? void (0) : __assert_fail
("Orders.size() == WorkSet.size() && \"Orders have different size with WorkSet\""
, "llvm/lib/CodeGen/InlineSpiller.cpp", 1390, __extension__ __PRETTY_FUNCTION__
))
;
1391
1392#ifndef NDEBUG
1393 LLVM_DEBUG(dbgs() << "Orders size is " << Orders.size() << "\n")do { if (::llvm::DebugFlag && ::llvm::isCurrentDebugType
("regalloc")) { dbgs() << "Orders size is " << Orders
.size() << "\n"; } } while (false)
;
1394 SmallVector<MachineDomTreeNode *, 32>::reverse_iterator RIt = Orders.rbegin();
1395 for (; RIt != Orders.rend(); RIt++)
1396 LLVM_DEBUG(dbgs() << "BB" << (*RIt)->getBlock()->getNumber() << ",")do { if (::llvm::DebugFlag && ::llvm::isCurrentDebugType
("regalloc")) { dbgs() << "BB" << (*RIt)->getBlock
()->getNumber() << ","; } } while (false)
;
1397 LLVM_DEBUG(dbgs() << "\n")do { if (::llvm::DebugFlag && ::llvm::isCurrentDebugType
("regalloc")) { dbgs() << "\n"; } } while (false)
;
1398#endif
1399}
1400
1401/// Try to hoist spills according to BB hotness. The spills to be removed will
1402/// be saved in \p SpillsToRm. The spills to be inserted will be saved in
1403/// \p SpillsToIns.
///
/// \p OrigLI and \p OrigVNI are the original live interval and value number
/// whose equal-valued spills are in \p Spills. The block containing
/// \p OrigVNI's def is used as the root of the dominator-tree walk.
/// \p SpillsToIns maps each block chosen for a hoisted spill to the register
/// that is to be stored there.
1404void HoistSpillHelper::runHoistSpills(
1405 LiveInterval &OrigLI, VNInfo &OrigVNI,
1406 SmallPtrSet<MachineInstr *, 16> &Spills,
1407 SmallVectorImpl<MachineInstr *> &SpillsToRm,
1408 DenseMap<MachineBasicBlock *, unsigned> &SpillsToIns) {
1409 // Visit order of dominator tree nodes.
1410 SmallVector<MachineDomTreeNode *, 32> Orders;
1411 // SpillsToKeep contains all the nodes where spills are to be inserted
1412 // during hoisting. If the spill to be inserted is an original spill
1413 // (not a hoisted one), the value of the map entry is 0. If the spill
1414 // is a hoisted spill, the value of the map entry is the VReg to be used
1415 // as the source of the spill.
1416 DenseMap<MachineDomTreeNode *, unsigned> SpillsToKeep;
1417 // Map from BB to the first spill inside of it.
1418 DenseMap<MachineDomTreeNode *, MachineInstr *> SpillBBToSpill;
1419
// First keep at most one spill per basic block; the dropped ones go straight
// into SpillsToRm.
1420 rmRedundantSpills(Spills, SpillsToRm, SpillBBToSpill);
1421
// The block holding the original def is the root of the traversal.
1422 MachineBasicBlock *Root = LIS.getMBBFromIndex(OrigVNI.def);
1423 getVisitOrders(Root, Spills, Orders, SpillsToRm, SpillsToKeep,
1424 SpillBBToSpill);
1425
1426 // SpillsInSubTreeMap keeps the map from a dom tree node to a pair of
1427 // nodes set and the cost of all the spills inside those nodes.
1428 // The nodes set are the locations where spills are to be inserted
1429 // in the subtree of current node.
1430 using NodesCostPair =
1431 std::pair<SmallPtrSet<MachineDomTreeNode *, 16>, BlockFrequency>;
1432 DenseMap<MachineDomTreeNode *, NodesCostPair> SpillsInSubTreeMap;
1433
1434 // Iterate Orders set in reverse order, which will be a bottom-up order
1435 // in the dominator tree. Once we visit a dom tree node, we know its
1436 // children have already been visited and the spill locations in the
1437 // subtrees of all the children have been determined.
1438 SmallVector<MachineDomTreeNode *, 32>::reverse_iterator RIt = Orders.rbegin();
1439 for (; RIt != Orders.rend(); RIt++) {
1440 MachineBasicBlock *Block = (*RIt)->getBlock();
1441
1442 // If Block contains an original spill, simply continue.
1443 if (SpillsToKeep.find(*RIt) != SpillsToKeep.end() && !SpillsToKeep[*RIt]) {
1444 SpillsInSubTreeMap[*RIt].first.insert(*RIt);
1445 // SpillsInSubTreeMap[*RIt].second contains the cost of spill.
1446 SpillsInSubTreeMap[*RIt].second = MBFI.getBlockFreq(Block);
1447 continue;
1448 }
1449
1450 // Collect spills in subtree of current node (*RIt) to
1451 // SpillsInSubTreeMap[*RIt].first.
1452 for (MachineDomTreeNode *Child : (*RIt)->children()) {
1453 if (SpillsInSubTreeMap.find(Child) == SpillsInSubTreeMap.end())
1454 continue;
1455 // The stmt "SpillsInSubTree = SpillsInSubTreeMap[*RIt].first" below
1456 // should be placed before getting the begin and end iterators of
1457 // SpillsInSubTreeMap[Child].first, or else the iterators may be
1458 // invalidated when SpillsInSubTreeMap[*RIt] is seen the first time
1459 // and the map grows and then the original buckets in the map are moved.
1460 SmallPtrSet<MachineDomTreeNode *, 16> &SpillsInSubTree =
1461 SpillsInSubTreeMap[*RIt].first;
1462 BlockFrequency &SubTreeCost = SpillsInSubTreeMap[*RIt].second;
1463 SubTreeCost += SpillsInSubTreeMap[Child].second;
1464 auto BI = SpillsInSubTreeMap[Child].first.begin();
1465 auto EI = SpillsInSubTreeMap[Child].first.end();
1466 SpillsInSubTree.insert(BI, EI);
// The child's spill locations and cost are now folded into the parent entry.
1467 SpillsInSubTreeMap.erase(Child);
1468 }
1469
1470 SmallPtrSet<MachineDomTreeNode *, 16> &SpillsInSubTree =
1471 SpillsInSubTreeMap[*RIt].first;
1472 BlockFrequency &SubTreeCost = SpillsInSubTreeMap[*RIt].second;
1473 // No spills in subtree, simply continue.
1474 if (SpillsInSubTree.empty())
1475 continue;
1476
1477 // Check whether Block is a possible candidate to insert spill.
// LiveReg is written by isSpillCandBB only when it returns true.
1478 Register LiveReg;
1479 if (!isSpillCandBB(OrigLI, OrigVNI, *Block, LiveReg))
1480 continue;
1481
1482 // If there are multiple spills that could be merged, bias a little
1483 // to hoist the spill.
1484 BranchProbability MarginProb = (SpillsInSubTree.size() > 1)
1485 ? BranchProbability(9, 10)
1486 : BranchProbability(1, 1);
// Hoist only when the accumulated cost of the spills in the subtree exceeds
// the frequency of this block scaled by MarginProb.
1487 if (SubTreeCost > MBFI.getBlockFreq(Block) * MarginProb) {
1488 // Hoist: Move spills to current Block.
1489 for (const auto SpillBB : SpillsInSubTree) {
1490 // When SpillBB is a BB contains original spill, insert the spill
1491 // to SpillsToRm.
1492 if (SpillsToKeep.find(SpillBB) != SpillsToKeep.end() &&
1493 !SpillsToKeep[SpillBB]) {
1494 MachineInstr *SpillToRm = SpillBBToSpill[SpillBB];
1495 SpillsToRm.push_back(SpillToRm);
1496 }
1497 // SpillBB will not contain spill anymore, remove it from SpillsToKeep.
1498 SpillsToKeep.erase(SpillBB);
1499 }
1500 // Current Block is the BB containing the new hoisted spill. Add it to
1501 // SpillsToKeep. LiveReg is the source of the new spill.
1502 SpillsToKeep[*RIt] = LiveReg;
1503 LLVM_DEBUG({do { if (::llvm::DebugFlag && ::llvm::isCurrentDebugType
("regalloc")) { { dbgs() << "spills in BB: "; for (const
auto Rspill : SpillsInSubTree) dbgs() << Rspill->getBlock
()->getNumber() << " "; dbgs() << "were promoted to BB"
<< (*RIt)->getBlock()->getNumber() << "\n"
; }; } } while (false)
1504 dbgs() << "spills in BB: ";do { if (::llvm::DebugFlag && ::llvm::isCurrentDebugType
("regalloc")) { { dbgs() << "spills in BB: "; for (const
auto Rspill : SpillsInSubTree) dbgs() << Rspill->getBlock
()->getNumber() << " "; dbgs() << "were promoted to BB"
<< (*RIt)->getBlock()->getNumber() << "\n"
; }; } } while (false)
1505 for (const auto Rspill : SpillsInSubTree)do { if (::llvm::DebugFlag && ::llvm::isCurrentDebugType
("regalloc")) { { dbgs() << "spills in BB: "; for (const
auto Rspill : SpillsInSubTree) dbgs() << Rspill->getBlock
()->getNumber() << " "; dbgs() << "were promoted to BB"
<< (*RIt)->getBlock()->getNumber() << "\n"
; }; } } while (false)
1506 dbgs() << Rspill->getBlock()->getNumber() << " ";do { if (::llvm::DebugFlag && ::llvm::isCurrentDebugType
("regalloc")) { { dbgs() << "spills in BB: "; for (const
auto Rspill : SpillsInSubTree) dbgs() << Rspill->getBlock
()->getNumber() << " "; dbgs() << "were promoted to BB"
<< (*RIt)->getBlock()->getNumber() << "\n"
; }; } } while (false)
1507 dbgs() << "were promoted to BB" << (*RIt)->getBlock()->getNumber()do { if (::llvm::DebugFlag && ::llvm::isCurrentDebugType
("regalloc")) { { dbgs() << "spills in BB: "; for (const
auto Rspill : SpillsInSubTree) dbgs() << Rspill->getBlock
()->getNumber() << " "; dbgs() << "were promoted to BB"
<< (*RIt)->getBlock()->getNumber() << "\n"
; }; } } while (false)
1508 << "\n";do { if (::llvm::DebugFlag && ::llvm::isCurrentDebugType
("regalloc")) { { dbgs() << "spills in BB: "; for (const
auto Rspill : SpillsInSubTree) dbgs() << Rspill->getBlock
()->getNumber() << " "; dbgs() << "were promoted to BB"
<< (*RIt)->getBlock()->getNumber() << "\n"
; }; } } while (false)
1509 })do { if (::llvm::DebugFlag && ::llvm::isCurrentDebugType
("regalloc")) { { dbgs() << "spills in BB: "; for (const
auto Rspill : SpillsInSubTree) dbgs() << Rspill->getBlock
()->getNumber() << " "; dbgs() << "were promoted to BB"
<< (*RIt)->getBlock()->getNumber() << "\n"
; }; } } while (false)
;
// After hoisting, the subtree is represented by this block alone, at this
// block's own frequency.
1510 SpillsInSubTree.clear();
1511 SpillsInSubTree.insert(*RIt);
1512 SubTreeCost = MBFI.getBlockFreq(Block);
1513 }
1514 }
1515 // For spills in SpillsToKeep with LiveReg set (i.e., not original spill),
1516 // save them to SpillsToIns.
1517 for (const auto &Ent : SpillsToKeep) {
1518 if (Ent.second)
1519 SpillsToIns[Ent.first->getBlock()] = Ent.second;
1520 }
1521}
1522
1523/// For spills with equal values, remove redundant spills and hoist those left
1524/// to less hot spots.
1525///
1526/// Spills with equal values will be collected into the same set in
1527/// MergeableSpills when spill is inserted. These equal spills are originated
1528/// from the same defining instruction and are dominated by the instruction.
1529/// Before hoisting all the equal spills, redundant spills inside in the same
1530/// BB are first marked to be deleted. Then starting from the spills left, walk
1531/// up on the dominator tree towards the Root node where the define instruction
1532/// is located, mark the dominated spills to be deleted along the way and
1533/// collect the BB nodes on the path from non-dominated spills to the define
1534/// instruction into a WorkSet. The nodes in WorkSet are the candidate places
1535/// where we are considering to hoist the spills. We iterate the WorkSet in
1536/// bottom-up order, and for each node, we will decide whether to hoist spills
1537/// inside its subtree to that node. In this way, we can get benefit locally
1538/// even if hoisting all the equal spills to one cold place is impossible.
1539void HoistSpillHelper::hoistAllSpills() {
1540 SmallVector<Register, 4> NewVRegs;
1541 LiveRangeEdit Edit(nullptr, NewVRegs, MF, LIS, &VRM, this);
1542
1543 for (unsigned i = 0, e = MRI.getNumVirtRegs(); i != e; ++i) {
1544 Register Reg = Register::index2VirtReg(i);
1545 Register Original = VRM.getPreSplitReg(Reg);
1546 if (!MRI.def_empty(Reg))
1547 Virt2SiblingsMap[Original].insert(Reg);
1548 }
1549
1550 // Each entry in MergeableSpills contains a spill set with equal values.
1551 for (auto &Ent : MergeableSpills) {
1552 int Slot = Ent.first.first;
1553 LiveInterval &OrigLI = *StackSlotToOrigLI[Slot];
1554 VNInfo *OrigVNI = Ent.first.second;
1555 SmallPtrSet<MachineInstr *, 16> &EqValSpills = Ent.second;
1556 if (Ent.second.empty())
1557 continue;
1558
1559 LLVM_DEBUG({do { if (::llvm::DebugFlag && ::llvm::isCurrentDebugType
("regalloc")) { { dbgs() << "\nFor Slot" << Slot <<
" and VN" << OrigVNI->id << ":\n" << "Equal spills in BB: "
; for (const auto spill : EqValSpills) dbgs() << spill->
getParent()->getNumber() << " "; dbgs() << "\n"
; }; } } while (false)
1560 dbgs() << "\nFor Slot" << Slot << " and VN" << OrigVNI->id << ":\n"do { if (::llvm::DebugFlag && ::llvm::isCurrentDebugType
("regalloc")) { { dbgs() << "\nFor Slot" << Slot <<
" and VN" << OrigVNI->id << ":\n" << "Equal spills in BB: "
; for (const auto spill : EqValSpills) dbgs() << spill->
getParent()->getNumber() << " "; dbgs() << "\n"
; }; } } while (false)
1561 << "Equal spills in BB: ";do { if (::llvm::DebugFlag && ::llvm::isCurrentDebugType
("regalloc")) { { dbgs() << "\nFor Slot" << Slot <<
" and VN" << OrigVNI->id << ":\n" << "Equal spills in BB: "
; for (const auto spill : EqValSpills) dbgs() << spill->
getParent()->getNumber() << " "; dbgs() << "\n"
; }; } } while (false)
1562 for (const auto spill : EqValSpills)do { if (::llvm::DebugFlag && ::llvm::isCurrentDebugType
("regalloc")) { { dbgs() << "\nFor Slot" << Slot <<
" and VN" << OrigVNI->id << ":\n" << "Equal spills in BB: "
; for (const auto spill : EqValSpills) dbgs() << spill->
getParent()->getNumber() << " "; dbgs() << "\n"
; }; } } while (false)
1563 dbgs() << spill->getParent()->getNumber() << " ";do { if (::llvm::DebugFlag && ::llvm::isCurrentDebugType
("regalloc")) { { dbgs() << "\nFor Slot" << Slot <<
" and VN" << OrigVNI->id << ":\n" << "Equal spills in BB: "
; for (const auto spill : EqValSpills) dbgs() << spill->
getParent()->getNumber() << " "; dbgs() << "\n"
; }; } } while (false)
1564 dbgs() << "\n";do { if (::llvm::DebugFlag && ::llvm::isCurrentDebugType
("regalloc")) { { dbgs() << "\nFor Slot" << Slot <<
" and VN" << OrigVNI->id << ":\n" << "Equal spills in BB: "
; for (const auto spill : EqValSpills) dbgs() << spill->
getParent()->getNumber() << " "; dbgs() << "\n"
; }; } } while (false)
1565 })do { if (::llvm::DebugFlag && ::llvm::isCurrentDebugType
("regalloc")) { { dbgs() << "\nFor Slot" << Slot <<
" and VN" << OrigVNI->id << ":\n" << "Equal spills in BB: "
; for (const auto spill : EqValSpills) dbgs() << spill->
getParent()->getNumber() << " "; dbgs() << "\n"
; }; } } while (false)
;
1566
1567 // SpillsToRm is the spill set to be removed from EqValSpills.
1568 SmallVector<MachineInstr *, 16> SpillsToRm;
1569 // SpillsToIns is the spill set to be newly inserted after hoisting.
1570 DenseMap<MachineBasicBlock *, unsigned> SpillsToIns;
1571
1572 runHoistSpills(OrigLI, *OrigVNI, EqValSpills, SpillsToRm, SpillsToIns);
1573
1574 LLVM_DEBUG({do { if (::llvm::DebugFlag && ::llvm::isCurrentDebugType
("regalloc")) { { dbgs() << "Finally inserted spills in BB: "
; for (const auto &Ispill : SpillsToIns) dbgs() << Ispill
.first->getNumber() << " "; dbgs() << "\nFinally removed spills in BB: "
; for (const auto Rspill : SpillsToRm) dbgs() << Rspill
->getParent()->getNumber() << " "; dbgs() <<
"\n"; }; } } while (false)
1575 dbgs() << "Finally inserted spills in BB: ";do { if (::llvm::DebugFlag && ::llvm::isCurrentDebugType
("regalloc")) { { dbgs() << "Finally inserted spills in BB: "
; for (const auto &Ispill : SpillsToIns) dbgs() << Ispill
.first->getNumber() << " "; dbgs() << "\nFinally removed spills in BB: "
; for (const auto Rspill : SpillsToRm) dbgs() << Rspill
->getParent()->getNumber() << " "; dbgs() <<
"\n"; }; } } while (false)
1576 for (const auto &Ispill : SpillsToIns)do { if (::llvm::DebugFlag && ::llvm::isCurrentDebugType
("regalloc")) { { dbgs() << "Finally inserted spills in BB: "
; for (const auto &Ispill : SpillsToIns) dbgs() << Ispill
.first->getNumber() << " "; dbgs() << "\nFinally removed spills in BB: "
; for (const auto Rspill : SpillsToRm) dbgs() << Rspill
->getParent()->getNumber() << " "; dbgs() <<
"\n"; }; } } while (false)
1577 dbgs() << Ispill.first->getNumber() << " ";do { if (::llvm::DebugFlag && ::llvm::isCurrentDebugType
("regalloc")) { { dbgs() << "Finally inserted spills in BB: "
; for (const auto &Ispill : SpillsToIns) dbgs() << Ispill
.first->getNumber() << " "; dbgs() << "\nFinally removed spills in BB: "
; for (const auto Rspill : SpillsToRm) dbgs() << Rspill
->getParent()->getNumber() << " "; dbgs() <<
"\n"; }; } } while (false)
1578 dbgs() << "\nFinally removed spills in BB: ";do { if (::llvm::DebugFlag && ::llvm::isCurrentDebugType
("regalloc")) { { dbgs() << "Finally inserted spills in BB: "
; for (const auto &Ispill : SpillsToIns) dbgs() << Ispill
.first->getNumber() << " "; dbgs() << "\nFinally removed spills in BB: "
; for (const auto Rspill : SpillsToRm) dbgs() << Rspill
->getParent()->getNumber() << " "; dbgs() <<
"\n"; }; } } while (false)
1579 for (const auto Rspill : SpillsToRm)do { if (::llvm::DebugFlag && ::llvm::isCurrentDebugType
("regalloc")) { { dbgs() << "Finally inserted spills in BB: "
; for (const auto &Ispill : SpillsToIns) dbgs() << Ispill
.first->getNumber() << " "; dbgs() << "\nFinally removed spills in BB: "
; for (const auto Rspill : SpillsToRm) dbgs() << Rspill
->getParent()->getNumber() << " "; dbgs() <<
"\n"; }; } } while (false)
1580 dbgs() << Rspill->getParent()->getNumber() << " ";do { if (::llvm::DebugFlag && ::llvm::isCurrentDebugType
("regalloc")) { { dbgs() << "Finally inserted spills in BB: "
; for (const auto &Ispill : SpillsToIns) dbgs() << Ispill
.first->getNumber() << " "; dbgs() << "\nFinally removed spills in BB: "
; for (const auto Rspill : SpillsToRm) dbgs() << Rspill
->getParent()->getNumber() << " "; dbgs() <<
"\n"; }; } } while (false)
1581 dbgs() << "\n";do { if (::llvm::DebugFlag && ::llvm::isCurrentDebugType
("regalloc")) { { dbgs() << "Finally inserted spills in BB: "
; for (const auto &Ispill : SpillsToIns) dbgs() << Ispill
.first->getNumber() << " "; dbgs() << "\nFinally removed spills in BB: "
; for (const auto Rspill : SpillsToRm) dbgs() << Rspill
->getParent()->getNumber() << " "; dbgs() <<
"\n"; }; } } while (false)
1582 })do { if (::llvm::DebugFlag && ::llvm::isCurrentDebugType
("regalloc")) { { dbgs() << "Finally inserted spills in BB: "
; for (const auto &Ispill : SpillsToIns) dbgs() << Ispill
.first->getNumber() << " "; dbgs() << "\nFinally removed spills in BB: "
; for (const auto Rspill : SpillsToRm) dbgs() << Rspill
->getParent()->getNumber() << " "; dbgs() <<
"\n"; }; } } while (false)
;
1583
1584 // Stack live range update.
1585 LiveInterval &StackIntvl = LSS.getInterval(Slot);
1586 if (!SpillsToIns.empty() || !SpillsToRm.empty())
1587 StackIntvl.MergeValueInAsValue(OrigLI, OrigVNI,
1588 StackIntvl.getValNumInfo(0));
1589
1590 // Insert hoisted spills.
1591 for (auto const &Insert : SpillsToIns) {
1592 MachineBasicBlock *BB = Insert.first;
1593 Register LiveReg = Insert.second;
1594 MachineBasicBlock::iterator MII = IPA.getLastInsertPointIter(OrigLI, *BB);
1595 MachineInstrSpan MIS(MII, BB);
1596 TII.storeRegToStackSlot(*BB, MII, LiveReg, false, Slot,
1597 MRI.getRegClass(LiveReg), &TRI);
1598 LIS.InsertMachineInstrRangeInMaps(MIS.begin(), MII);
1599 for (const MachineInstr &MI : make_range(MIS.begin(), MII))
1600 getVDefInterval(MI, LIS);
1601 ++NumSpills;
1602 }
1603
1604 // Remove redundant spills or change them to dead instructions.
1605 NumSpills -= SpillsToRm.size();
1606 for (auto const RMEnt : SpillsToRm) {
1607 RMEnt->setDesc(TII.get(TargetOpcode::KILL));
1608 for (unsigned i = RMEnt->getNumOperands(); i; --i) {
1609 MachineOperand &MO = RMEnt->getOperand(i - 1);
1610 if (MO.isReg() && MO.isImplicit() && MO.isDef() && !MO.isDead())
1611 RMEnt->RemoveOperand(i - 1);
1612 }
1613 }
1614 Edit.eliminateDeadDefs(SpillsToRm, None, AA);
1615 }
1616}
1617
1618/// For VirtReg clone, the \p New register should have the same physreg or
1619/// stackslot as the \p old register.
1620void HoistSpillHelper::LRE_DidCloneVirtReg(Register New, Register Old) {
1621 if (VRM.hasPhys(Old))
1622 VRM.assignVirt2Phys(New, VRM.getPhys(Old));
1623 else if (VRM.getStackSlot(Old) != VirtRegMap::NO_STACK_SLOT)
1624 VRM.assignVirt2StackSlot(New, VRM.getStackSlot(Old));
1625 else
1626 llvm_unreachable("VReg should be assigned either physreg or stackslot")::llvm::llvm_unreachable_internal("VReg should be assigned either physreg or stackslot"
, "llvm/lib/CodeGen/InlineSpiller.cpp", 1626)
;
1627 if (VRM.hasShape(Old))
1628 VRM.assignVirt2Shape(New, VRM.getShape(Old));
1629}

/build/llvm-toolchain-snapshot-14~++20220118101002+ec47dba1c8a2/llvm/include/llvm/CodeGen/MachineInstr.h

1//===- llvm/CodeGen/MachineInstr.h - MachineInstr class ---------*- C++ -*-===//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7//===----------------------------------------------------------------------===//
8//
9// This file contains the declaration of the MachineInstr class, which is the
10// basic representation for all target dependent machine instructions used by
11// the back end.
12//
13//===----------------------------------------------------------------------===//
14
15#ifndef LLVM_CODEGEN_MACHINEINSTR_H
16#define LLVM_CODEGEN_MACHINEINSTR_H
17
18#include "llvm/ADT/DenseMapInfo.h"
19#include "llvm/ADT/PointerSumType.h"
20#include "llvm/ADT/SmallSet.h"
21#include "llvm/ADT/ilist.h"
22#include "llvm/ADT/ilist_node.h"
23#include "llvm/ADT/iterator_range.h"
24#include "llvm/CodeGen/MachineMemOperand.h"
25#include "llvm/CodeGen/MachineOperand.h"
26#include "llvm/CodeGen/TargetOpcodes.h"
27#include "llvm/IR/DebugLoc.h"
28#include "llvm/IR/InlineAsm.h"
29#include "llvm/IR/PseudoProbe.h"
30#include "llvm/MC/MCInstrDesc.h"
31#include "llvm/MC/MCSymbol.h"
32#include "llvm/Support/ArrayRecycler.h"
33#include "llvm/Support/TrailingObjects.h"
34#include <algorithm>
35#include <cassert>
36#include <cstdint>
37#include <utility>
38
39namespace llvm {
40
41class AAResults;
42template <typename T> class ArrayRef;
43class DIExpression;
44class DILocalVariable;
45class MachineBasicBlock;
46class MachineFunction;
47class MachineRegisterInfo;
48class ModuleSlotTracker;
49class raw_ostream;
50template <typename T> class SmallVectorImpl;
51class SmallBitVector;
52class StringRef;
53class TargetInstrInfo;
54class TargetRegisterClass;
55class TargetRegisterInfo;
56
57//===----------------------------------------------------------------------===//
58/// Representation of each machine instruction.
59///
60/// This class isn't a POD type, but it must have a trivial destructor. When a
61/// MachineFunction is deleted, all the contained MachineInstrs are deallocated
62/// without having their destructor called.
63///
64class MachineInstr
65 : public ilist_node_with_parent<MachineInstr, MachineBasicBlock,
66 ilist_sentinel_tracking<true>> {
67public:
68 using mmo_iterator = ArrayRef<MachineMemOperand *>::iterator;
69
70 /// Flags to specify different kinds of comments to output in
71 /// assembly code. These flags carry semantic information not
72 /// otherwise easily derivable from the IR text.
73 ///
74 enum CommentFlag {
75 ReloadReuse = 0x1, // higher bits are reserved for target dep comments.
76 NoSchedComment = 0x2,
77 TAsmComments = 0x4 // Target Asm comments should start from this value.
78 };
79
// Bit flags describing a machine instruction; each enumerator occupies one
// distinct bit, from bit 0 up to bit 15.
80 enum MIFlag {
81 NoFlags = 0,
82 FrameSetup = 1 << 0, // Instruction is used as a part of
83 // function frame setup code.
84 FrameDestroy = 1 << 1, // Instruction is used as a part of
85 // function frame destruction code.
86 BundledPred = 1 << 2, // Instruction has bundled predecessors.
87 BundledSucc = 1 << 3, // Instruction has bundled successors.
88 FmNoNans = 1 << 4, // Instruction does not support Fast
89 // math nan values.
90 FmNoInfs = 1 << 5, // Instruction does not support Fast
91 // math infinity values.
92 FmNsz = 1 << 6, // Instruction is not required to retain
93 // signed zero values.
94 FmArcp = 1 << 7, // Instruction supports Fast math
95 // reciprocal approximations.
96 FmContract = 1 << 8, // Instruction supports Fast math
97 // contraction operations like fma.
98 FmAfn = 1 << 9, // Instruction may map to Fast math
99 // intrinsic approximation.
100 FmReassoc = 1 << 10, // Instruction supports Fast math
101 // reassociation of operand order.
102 NoUWrap = 1 << 11, // Instruction supports binary operator
103 // no unsigned wrap.
104 NoSWrap = 1 << 12, // Instruction supports binary operator
105 // no signed wrap.
106 IsExact = 1 << 13, // Instruction's division is
107 // known to be exact.
108 NoFPExcept = 1 << 14, // Instruction does not raise
109 // floating-point exceptions.
110 NoMerge = 1 << 15, // Passes that drop source location info
111 // (e.g. branch folding) should skip
112 // this instruction.
113 };
114
115private:
116 const MCInstrDesc *MCID; // Instruction descriptor.
117 MachineBasicBlock *Parent = nullptr; // Pointer to the owning basic block.
118
119 // Operands are allocated by an ArrayRecycler.
120 MachineOperand *Operands = nullptr; // Pointer to the first operand.
121 unsigned NumOperands = 0; // Number of operands on instruction.
122
123 uint16_t Flags = 0; // Various bits of additional
124 // information about machine
125 // instruction.
126
127 uint8_t AsmPrinterFlags = 0; // Various bits of information used by
128 // the AsmPrinter to emit helpful
129 // comments. This is *not* semantic
130 // information. Do not use this for
131 // anything other than to convey comment
132 // information to AsmPrinter.
133
134 // OperandCapacity has uint8_t size, so it should be next to AsmPrinterFlags
135 // to properly pack.
136 using OperandCapacity = ArrayRecycler<MachineOperand>::Capacity;
137 OperandCapacity CapOperands; // Capacity of the Operands array.
138
139 /// Internal implementation detail class that provides out-of-line storage for
140 /// extra info used by the machine instruction when this info cannot be stored
141 /// in-line within the instruction itself.
142 ///
143 /// This has to be defined eagerly due to the implementation constraints of
144 /// `PointerSumType` where it is used.
145 class ExtraInfo final
146 : TrailingObjects<ExtraInfo, MachineMemOperand *, MCSymbol *, MDNode *> {
147 public:
148 static ExtraInfo *create(BumpPtrAllocator &Allocator,
149 ArrayRef<MachineMemOperand *> MMOs,
150 MCSymbol *PreInstrSymbol = nullptr,
151 MCSymbol *PostInstrSymbol = nullptr,
152 MDNode *HeapAllocMarker = nullptr) {
153 bool HasPreInstrSymbol = PreInstrSymbol != nullptr;
154 bool HasPostInstrSymbol = PostInstrSymbol != nullptr;
155 bool HasHeapAllocMarker = HeapAllocMarker != nullptr;
156 auto *Result = new (Allocator.Allocate(
157 totalSizeToAlloc<MachineMemOperand *, MCSymbol *, MDNode *>(
158 MMOs.size(), HasPreInstrSymbol + HasPostInstrSymbol,
159 HasHeapAllocMarker),
160 alignof(ExtraInfo)))
161 ExtraInfo(MMOs.size(), HasPreInstrSymbol, HasPostInstrSymbol,
162 HasHeapAllocMarker);
163
164 // Copy the actual data into the trailing objects.
165 std::copy(MMOs.begin(), MMOs.end(),
166 Result->getTrailingObjects<MachineMemOperand *>());
167
168 if (HasPreInstrSymbol)
169 Result->getTrailingObjects<MCSymbol *>()[0] = PreInstrSymbol;
170 if (HasPostInstrSymbol)
171 Result->getTrailingObjects<MCSymbol *>()[HasPreInstrSymbol] =
172 PostInstrSymbol;
173 if (HasHeapAllocMarker)
174 Result->getTrailingObjects<MDNode *>()[0] = HeapAllocMarker;
175
176 return Result;
177 }
178
179 ArrayRef<MachineMemOperand *> getMMOs() const {
180 return makeArrayRef(getTrailingObjects<MachineMemOperand *>(), NumMMOs);
181 }
182
183 MCSymbol *getPreInstrSymbol() const {
184 return HasPreInstrSymbol ? getTrailingObjects<MCSymbol *>()[0] : nullptr;
185 }
186
187 MCSymbol *getPostInstrSymbol() const {
188 return HasPostInstrSymbol
189 ? getTrailingObjects<MCSymbol *>()[HasPreInstrSymbol]
190 : nullptr;
191 }
192
193 MDNode *getHeapAllocMarker() const {
194 return HasHeapAllocMarker ? getTrailingObjects<MDNode *>()[0] : nullptr;
195 }
196
197 private:
198 friend TrailingObjects;
199
200 // Description of the extra info, used to interpret the actual optional
201 // data appended.
202 //
203 // Note that this is not terribly space optimized. This leaves a great deal
204 // of flexibility to fit more in here later.
205 const int NumMMOs;
206 const bool HasPreInstrSymbol;
207 const bool HasPostInstrSymbol;
208 const bool HasHeapAllocMarker;
209
210 // Implement the `TrailingObjects` internal API.
211 size_t numTrailingObjects(OverloadToken<MachineMemOperand *>) const {
212 return NumMMOs;
213 }
214 size_t numTrailingObjects(OverloadToken<MCSymbol *>) const {
215 return HasPreInstrSymbol + HasPostInstrSymbol;
216 }
217 size_t numTrailingObjects(OverloadToken<MDNode *>) const {
218 return HasHeapAllocMarker;
219 }
220
221 // Just a boring constructor to allow us to initialize the sizes. Always use
222 // the `create` routine above.
223 ExtraInfo(int NumMMOs, bool HasPreInstrSymbol, bool HasPostInstrSymbol,
224 bool HasHeapAllocMarker)
225 : NumMMOs(NumMMOs), HasPreInstrSymbol(HasPreInstrSymbol),
226 HasPostInstrSymbol(HasPostInstrSymbol),
227 HasHeapAllocMarker(HasHeapAllocMarker) {}
228 };
229
230 /// Enumeration of the kinds of inline extra info available. It is important
231 /// that the `MachineMemOperand` inline kind has a tag value of zero to make
232 /// it accessible as an `ArrayRef`.
233 enum ExtraInfoInlineKinds {
234 EIIK_MMO = 0, // Tag value is explicitly zero.
235 EIIK_PreInstrSymbol,
236 EIIK_PostInstrSymbol,
237 EIIK_OutOfLine
238 };
239
240 // We store extra information about the instruction here. The common case is
241 // expected to be nothing or a single pointer (typically a MMO or a symbol).
242 // We work to optimize this common case by storing it inline here rather than
243 // requiring a separate allocation, but we fall back to an allocation when
244 // multiple pointers are needed.
245 PointerSumType<ExtraInfoInlineKinds,
246 PointerSumTypeMember<EIIK_MMO, MachineMemOperand *>,
247 PointerSumTypeMember<EIIK_PreInstrSymbol, MCSymbol *>,
248 PointerSumTypeMember<EIIK_PostInstrSymbol, MCSymbol *>,
249 PointerSumTypeMember<EIIK_OutOfLine, ExtraInfo *>>
250 Info;
251
252 DebugLoc DbgLoc; // Source line information.
253
254 /// Unique instruction number. Used by DBG_INSTR_REFs to refer to the values
255 /// defined by this instruction.
256 unsigned DebugInstrNum;
257
258 // Intrusive list support
259 friend struct ilist_traits<MachineInstr>;
260 friend struct ilist_callback_traits<MachineBasicBlock>;
261 void setParent(MachineBasicBlock *P) { Parent = P; }
262
263 /// This constructor creates a copy of the given
264 /// MachineInstr in the given MachineFunction.
265 MachineInstr(MachineFunction &, const MachineInstr &);
266
267 /// This constructor creates a MachineInstr and adds the implicit operands.
268 /// It reserves space for number of operands specified by
269 /// MCInstrDesc. An explicit DebugLoc is supplied.
270 MachineInstr(MachineFunction &, const MCInstrDesc &TID, DebugLoc DL,
271 bool NoImp = false);
272
273 // MachineInstrs are pool-allocated and owned by MachineFunction.
274 friend class MachineFunction;
275
276 void
277 dumprImpl(const MachineRegisterInfo &MRI, unsigned Depth, unsigned MaxDepth,
278 SmallPtrSetImpl<const MachineInstr *> &AlreadySeenInstrs) const;
279
280public:
281 MachineInstr(const MachineInstr &) = delete;
282 MachineInstr &operator=(const MachineInstr &) = delete;
283 // Use MachineFunction::DeleteMachineInstr() instead.
284 ~MachineInstr() = delete;
285
286 const MachineBasicBlock* getParent() const { return Parent; }
287 MachineBasicBlock* getParent() { return Parent; }
288
289 /// Move the instruction before \p MovePos.
290 void moveBefore(MachineInstr *MovePos);
291
292 /// Return the function that contains the basic block that this instruction
293 /// belongs to.
294 ///
295 /// Note: this is undefined behaviour if the instruction does not have a
296 /// parent.
297 const MachineFunction *getMF() const;
298 MachineFunction *getMF() {
299 return const_cast<MachineFunction *>(
300 static_cast<const MachineInstr *>(this)->getMF());
301 }
302
303 /// Return the asm printer flags bitvector.
304 uint8_t getAsmPrinterFlags() const { return AsmPrinterFlags; }
305
306 /// Clear the AsmPrinter bitvector.
307 void clearAsmPrinterFlags() { AsmPrinterFlags = 0; }
308
309 /// Return whether an AsmPrinter flag is set.
310 bool getAsmPrinterFlag(CommentFlag Flag) const {
311 return AsmPrinterFlags & Flag;
312 }
313
314 /// Set a flag for the AsmPrinter.
315 void setAsmPrinterFlag(uint8_t Flag) {
316 AsmPrinterFlags |= Flag;
317 }
318
319 /// Clear specific AsmPrinter flags.
320 void clearAsmPrinterFlag(CommentFlag Flag) {
321 AsmPrinterFlags &= ~Flag;
322 }
323
324 /// Return the MI flags bitvector.
325 uint16_t getFlags() const {
326 return Flags;
327 }
328
329 /// Return whether an MI flag is set.
330 bool getFlag(MIFlag Flag) const {
331 return Flags & Flag;
332 }
333
334 /// Set a MI flag.
335 void setFlag(MIFlag Flag) {
336 Flags |= (uint16_t)Flag;
337 }
338
339 void setFlags(unsigned flags) {
340 // Filter out the automatically maintained flags.
341 unsigned Mask = BundledPred | BundledSucc;
342 Flags = (Flags & Mask) | (flags & ~Mask);
343 }
344
345 /// clearFlag - Clear a MI flag.
346 void clearFlag(MIFlag Flag) {
347 Flags &= ~((uint16_t)Flag);
348 }
349
350 /// Return true if MI is in a bundle (but not the first MI in a bundle).
351 ///
352 /// A bundle looks like this before it's finalized:
353 /// ----------------
354 /// | MI |
355 /// ----------------
356 /// |
357 /// ----------------
358 /// | MI * |
359 /// ----------------
360 /// |
361 /// ----------------
362 /// | MI * |
363 /// ----------------
364 /// In this case, the first MI starts a bundle but is not inside a bundle, the
365 /// next 2 MIs are considered "inside" the bundle.
366 ///
367 /// After a bundle is finalized, it looks like this:
368 /// ----------------
369 /// | Bundle |
370 /// ----------------
371 /// |
372 /// ----------------
373 /// | MI * |
374 /// ----------------
375 /// |
376 /// ----------------
377 /// | MI * |
378 /// ----------------
379 /// |
380 /// ----------------
381 /// | MI * |
382 /// ----------------
383 /// The first instruction has the special opcode "BUNDLE". It's not "inside"
384 /// a bundle, but the next three MIs are.
385 bool isInsideBundle() const {
386 return getFlag(BundledPred);
387 }
388
389 /// Return true if this instruction is part of a bundle. This is true
390 /// if either itself or its following instruction is marked "InsideBundle".
391 bool isBundled() const {
392 return isBundledWithPred() || isBundledWithSucc();
393 }
394
395 /// Return true if this instruction is part of a bundle, and it is not the
396 /// first instruction in the bundle.
397 bool isBundledWithPred() const { return getFlag(BundledPred); }
398
399 /// Return true if this instruction is part of a bundle, and it is not the
400 /// last instruction in the bundle.
401 bool isBundledWithSucc() const { return getFlag(BundledSucc); }
402
403 /// Bundle this instruction with its predecessor. This can be an unbundled
404 /// instruction, or it can be the first instruction in a bundle.
405 void bundleWithPred();
406
407 /// Bundle this instruction with its successor. This can be an unbundled
408 /// instruction, or it can be the last instruction in a bundle.
409 void bundleWithSucc();
410
411 /// Break bundle above this instruction.
412 void unbundleFromPred();
413
414 /// Break bundle below this instruction.
415 void unbundleFromSucc();
416
417 /// Returns the debug location id of this MachineInstr.
418 const DebugLoc &getDebugLoc() const { return DbgLoc; }
419
420 /// Return the operand containing the offset to be used if this DBG_VALUE
421 /// instruction is indirect; will be an invalid register if this value is
422 /// not indirect, and an immediate with value 0 otherwise.
423 const MachineOperand &getDebugOffset() const {
424 assert(isNonListDebugValue() && "not a DBG_VALUE")(static_cast <bool> (isNonListDebugValue() && "not a DBG_VALUE"
) ? void (0) : __assert_fail ("isNonListDebugValue() && \"not a DBG_VALUE\""
, "llvm/include/llvm/CodeGen/MachineInstr.h", 424, __extension__
__PRETTY_FUNCTION__))
;
425 return getOperand(1);
426 }
427 MachineOperand &getDebugOffset() {
428 assert(isNonListDebugValue() && "not a DBG_VALUE")(static_cast <bool> (isNonListDebugValue() && "not a DBG_VALUE"
) ? void (0) : __assert_fail ("isNonListDebugValue() && \"not a DBG_VALUE\""
, "llvm/include/llvm/CodeGen/MachineInstr.h", 428, __extension__
__PRETTY_FUNCTION__))
;
429 return getOperand(1);
430 }
431
432 /// Return the operand for the debug variable referenced by
433 /// this DBG_VALUE instruction.
434 const MachineOperand &getDebugVariableOp() const;
435 MachineOperand &getDebugVariableOp();
436
437 /// Return the debug variable referenced by
438 /// this DBG_VALUE instruction.
439 const DILocalVariable *getDebugVariable() const;
440
441 /// Return the operand for the complex address expression referenced by
442 /// this DBG_VALUE instruction.
443 const MachineOperand &getDebugExpressionOp() const;
444 MachineOperand &getDebugExpressionOp();
445
446 /// Return the complex address expression referenced by
447 /// this DBG_VALUE instruction.
448 const DIExpression *getDebugExpression() const;
449
450 /// Return the debug label referenced by
451 /// this DBG_LABEL instruction.
452 const DILabel *getDebugLabel() const;
453
454 /// Fetch the instruction number of this MachineInstr. If it does not have
455 /// one already, a new and unique number will be assigned.
456 unsigned getDebugInstrNum();
457
458 /// Fetch instruction number of this MachineInstr -- but before it's inserted
459 /// into \p MF. Needed for transformations that create an instruction but
460 /// don't immediately insert them.
461 unsigned getDebugInstrNum(MachineFunction &MF);
462
463 /// Examine the instruction number of this MachineInstr. May be zero if
464 /// it hasn't been assigned a number yet.
465 unsigned peekDebugInstrNum() const { return DebugInstrNum; }
466
467 /// Set instruction number of this MachineInstr. Avoid using unless you're
468 /// deserializing this information.
469 void setDebugInstrNum(unsigned Num) { DebugInstrNum = Num; }
470
471 /// Drop any variable location debugging information associated with this
472 /// instruction. Use when an instruction is modified in such a way that it no
473 /// longer defines the value it used to. Variable locations using that value
474 /// will be dropped.
475 void dropDebugNumber() { DebugInstrNum = 0; }
476
477 /// Emit an error referring to the source location of this instruction.
478 /// This should only be used for inline assembly that is somehow
479 /// impossible to compile. Other errors should have been handled much
480 /// earlier.
481 ///
482 /// If this method returns, the caller should try to recover from the error.
483 void emitError(StringRef Msg) const;
484
485 /// Returns the target instruction descriptor of this MachineInstr.
486 const MCInstrDesc &getDesc() const { return *MCID; }
487
488 /// Returns the opcode of this MachineInstr.
489 unsigned getOpcode() const { return MCID->Opcode; }
490
491 /// Returns the total number of operands.
492 unsigned getNumOperands() const { return NumOperands; }
493
494 /// Returns the total number of operands which are debug locations.
495 unsigned getNumDebugOperands() const {
496 return std::distance(debug_operands().begin(), debug_operands().end());
497 }
498
499 const MachineOperand& getOperand(unsigned i) const {
500 assert(i < getNumOperands() && "getOperand() out of range!")(static_cast <bool> (i < getNumOperands() &&
"getOperand() out of range!") ? void (0) : __assert_fail ("i < getNumOperands() && \"getOperand() out of range!\""
, "llvm/include/llvm/CodeGen/MachineInstr.h", 500, __extension__
__PRETTY_FUNCTION__))
;
501 return Operands[i];
502 }
503 MachineOperand& getOperand(unsigned i) {
504 assert(i < getNumOperands() && "getOperand() out of range!")(static_cast <bool> (i < getNumOperands() &&
"getOperand() out of range!") ? void (0) : __assert_fail ("i < getNumOperands() && \"getOperand() out of range!\""
, "llvm/include/llvm/CodeGen/MachineInstr.h", 504, __extension__
__PRETTY_FUNCTION__))
;
505 return Operands[i];
506 }
507
508 MachineOperand &getDebugOperand(unsigned Index) {
509 assert(Index < getNumDebugOperands() && "getDebugOperand() out of range!")(static_cast <bool> (Index < getNumDebugOperands() &&
"getDebugOperand() out of range!") ? void (0) : __assert_fail
("Index < getNumDebugOperands() && \"getDebugOperand() out of range!\""
, "llvm/include/llvm/CodeGen/MachineInstr.h", 509, __extension__
__PRETTY_FUNCTION__))
;
510 return *(debug_operands().begin() + Index);
511 }
512 const MachineOperand &getDebugOperand(unsigned Index) const {
513 assert(Index < getNumDebugOperands() && "getDebugOperand() out of range!")(static_cast <bool> (Index < getNumDebugOperands() &&
"getDebugOperand() out of range!") ? void (0) : __assert_fail
("Index < getNumDebugOperands() && \"getDebugOperand() out of range!\""
, "llvm/include/llvm/CodeGen/MachineInstr.h", 513, __extension__
__PRETTY_FUNCTION__))
;
514 return *(debug_operands().begin() + Index);
515 }
516
517 SmallSet<Register, 4> getUsedDebugRegs() const {
518 assert(isDebugValue() && "not a DBG_VALUE*")(static_cast <bool> (isDebugValue() && "not a DBG_VALUE*"
) ? void (0) : __assert_fail ("isDebugValue() && \"not a DBG_VALUE*\""
, "llvm/include/llvm/CodeGen/MachineInstr.h", 518, __extension__
__PRETTY_FUNCTION__))
;
519 SmallSet<Register, 4> UsedRegs;
520 for (const auto &MO : debug_operands())
521 if (MO.isReg() && MO.getReg())
522 UsedRegs.insert(MO.getReg());
523 return UsedRegs;
524 }
525
526 /// Returns whether this debug value has at least one debug operand with the
527 /// register \p Reg.
528 bool hasDebugOperandForReg(Register Reg) const {
529 return any_of(debug_operands(), [Reg](const MachineOperand &Op) {
530 return Op.isReg() && Op.getReg() == Reg;
531 });
532 }
533
534 /// Returns a range of all of the operands that correspond to a debug use of
535 /// \p Reg.
536 template <typename Operand, typename Instruction>
537 static iterator_range<
538 filter_iterator<Operand *, std::function<bool(Operand &Op)>>>
539 getDebugOperandsForReg(Instruction *MI, Register Reg) {
540 std::function<bool(Operand & Op)> OpUsesReg(
541 [Reg](Operand &Op) { return Op.isReg() && Op.getReg() == Reg; });
542 return make_filter_range(MI->debug_operands(), OpUsesReg);
543 }
544 iterator_range<filter_iterator<const MachineOperand *,
545 std::function<bool(const MachineOperand &Op)>>>
546 getDebugOperandsForReg(Register Reg) const {
547 return MachineInstr::getDebugOperandsForReg<const MachineOperand,
548 const MachineInstr>(this, Reg);
549 }
550 iterator_range<filter_iterator<MachineOperand *,
551 std::function<bool(MachineOperand &Op)>>>
552 getDebugOperandsForReg(Register Reg) {
553 return MachineInstr::getDebugOperandsForReg<MachineOperand, MachineInstr>(
554 this, Reg);
555 }
556
557 bool isDebugOperand(const MachineOperand *Op) const {
558 return Op >= adl_begin(debug_operands()) && Op <= adl_end(debug_operands());
559 }
560
561 unsigned getDebugOperandIndex(const MachineOperand *Op) const {
562 assert(isDebugOperand(Op) && "Expected a debug operand.")(static_cast <bool> (isDebugOperand(Op) && "Expected a debug operand."
) ? void (0) : __assert_fail ("isDebugOperand(Op) && \"Expected a debug operand.\""
, "llvm/include/llvm/CodeGen/MachineInstr.h", 562, __extension__
__PRETTY_FUNCTION__))
;
563 return std::distance(adl_begin(debug_operands()), Op);
564 }
565
566 /// Returns the total number of definitions.
567 unsigned getNumDefs() const {
568 return getNumExplicitDefs() + MCID->getNumImplicitDefs();
569 }
570
571 /// Returns true if the instruction has implicit definition.
572 bool hasImplicitDef() const {
573 for (unsigned I = getNumExplicitOperands(), E = getNumOperands();
574 I != E; ++I) {
575 const MachineOperand &MO = getOperand(I);
576 if (MO.isDef() && MO.isImplicit())
577 return true;
578 }
579 return false;
580 }
581
582 /// Returns the implicit operands number.
583 unsigned getNumImplicitOperands() const {
584 return getNumOperands() - getNumExplicitOperands();
585 }
586
587 /// Return true if operand \p OpIdx is a subregister index.
588 bool isOperandSubregIdx(unsigned OpIdx) const {
589 assert(getOperand(OpIdx).getType() == MachineOperand::MO_Immediate &&(static_cast <bool> (getOperand(OpIdx).getType() == MachineOperand
::MO_Immediate && "Expected MO_Immediate operand type."
) ? void (0) : __assert_fail ("getOperand(OpIdx).getType() == MachineOperand::MO_Immediate && \"Expected MO_Immediate operand type.\""
, "llvm/include/llvm/CodeGen/MachineInstr.h", 590, __extension__
__PRETTY_FUNCTION__))
590 "Expected MO_Immediate operand type.")(static_cast <bool> (getOperand(OpIdx).getType() == MachineOperand
::MO_Immediate && "Expected MO_Immediate operand type."
) ? void (0) : __assert_fail ("getOperand(OpIdx).getType() == MachineOperand::MO_Immediate && \"Expected MO_Immediate operand type.\""
, "llvm/include/llvm/CodeGen/MachineInstr.h", 590, __extension__
__PRETTY_FUNCTION__))
;
591 if (isExtractSubreg() && OpIdx == 2)
592 return true;
593 if (isInsertSubreg() && OpIdx == 3)
594 return true;
595 if (isRegSequence() && OpIdx > 1 && (OpIdx % 2) == 0)
596 return true;
597 if (isSubregToReg() && OpIdx == 3)
598 return true;
599 return false;
600 }
601
602 /// Returns the number of non-implicit operands.
603 unsigned getNumExplicitOperands() const;
604
605 /// Returns the number of non-implicit definitions.
606 unsigned getNumExplicitDefs() const;
607
608 /// iterator/begin/end - Iterate over all operands of a machine instruction.
609 using mop_iterator = MachineOperand *;
610 using const_mop_iterator = const MachineOperand *;
611
612 mop_iterator operands_begin() { return Operands; }
613 mop_iterator operands_end() { return Operands + NumOperands; }
614
615 const_mop_iterator operands_begin() const { return Operands; }
616 const_mop_iterator operands_end() const { return Operands + NumOperands; }
617
618 iterator_range<mop_iterator> operands() {
619 return make_range(operands_begin(), operands_end());
620 }
621 iterator_range<const_mop_iterator> operands() const {
622 return make_range(operands_begin(), operands_end());
623 }
624 iterator_range<mop_iterator> explicit_operands() {
625 return make_range(operands_begin(),
626 operands_begin() + getNumExplicitOperands());
627 }
628 iterator_range<const_mop_iterator> explicit_operands() const {
629 return make_range(operands_begin(),
630 operands_begin() + getNumExplicitOperands());
631 }
632 iterator_range<mop_iterator> implicit_operands() {
633 return make_range(explicit_operands().end(), operands_end());
634 }
635 iterator_range<const_mop_iterator> implicit_operands() const {
636 return make_range(explicit_operands().end(), operands_end());
637 }
638 /// Returns a range over all operands that are used to determine the variable
639 /// location for this DBG_VALUE instruction.
640 iterator_range<mop_iterator> debug_operands() {
641 assert(isDebugValue() && "Must be a debug value instruction.")(static_cast <bool> (isDebugValue() && "Must be a debug value instruction."
) ? void (0) : __assert_fail ("isDebugValue() && \"Must be a debug value instruction.\""
, "llvm/include/llvm/CodeGen/MachineInstr.h", 641, __extension__
__PRETTY_FUNCTION__))
;
642 return isDebugValueList()
643 ? make_range(operands_begin() + 2, operands_end())
644 : make_range(operands_begin(), operands_begin() + 1);
645 }
646 /// \copydoc debug_operands()
647 iterator_range<const_mop_iterator> debug_operands() const {
648 assert(isDebugValue() && "Must be a debug value instruction.")(static_cast <bool> (isDebugValue() && "Must be a debug value instruction."
) ? void (0) : __assert_fail ("isDebugValue() && \"Must be a debug value instruction.\""
, "llvm/include/llvm/CodeGen/MachineInstr.h", 648, __extension__
__PRETTY_FUNCTION__))
;
649 return isDebugValueList()
650 ? make_range(operands_begin() + 2, operands_end())
651 : make_range(operands_begin(), operands_begin() + 1);
652 }
653 /// Returns a range over all explicit operands that are register definitions.
654 /// Implicit definition are not included!
655 iterator_range<mop_iterator> defs() {
656 return make_range(operands_begin(),
657 operands_begin() + getNumExplicitDefs());
658 }
659 /// \copydoc defs()
660 iterator_range<const_mop_iterator> defs() const {
661 return make_range(operands_begin(),
662 operands_begin() + getNumExplicitDefs());
663 }
664 /// Returns a range that includes all operands that are register uses.
665 /// This may include unrelated operands which are not register uses.
666 iterator_range<mop_iterator> uses() {
667 return make_range(operands_begin() + getNumExplicitDefs(), operands_end());
668 }
669 /// \copydoc uses()
670 iterator_range<const_mop_iterator> uses() const {
671 return make_range(operands_begin() + getNumExplicitDefs(), operands_end());
672 }
673 iterator_range<mop_iterator> explicit_uses() {
674 return make_range(operands_begin() + getNumExplicitDefs(),
675 operands_begin() + getNumExplicitOperands());
676 }
677 iterator_range<const_mop_iterator> explicit_uses() const {
678 return make_range(operands_begin() + getNumExplicitDefs(),
679 operands_begin() + getNumExplicitOperands());
680 }
681
682 /// Returns the number of the operand iterator \p I points to.
683 unsigned getOperandNo(const_mop_iterator I) const {
684 return I - operands_begin();
685 }
686
687 /// Access to memory operands of the instruction. If there are none, that does
688 /// not imply anything about whether the function accesses memory. Instead,
689 /// the caller must behave conservatively.
690 ArrayRef<MachineMemOperand *> memoperands() const {
691 if (!Info)
692 return {};
693
694 if (Info.is<EIIK_MMO>())
695 return makeArrayRef(Info.getAddrOfZeroTagPointer(), 1);
696
697 if (ExtraInfo *EI = Info.get<EIIK_OutOfLine>())
698 return EI->getMMOs();
699
700 return {};
701 }
702
703 /// Access to memory operands of the instruction.
704 ///
705 /// If `memoperands_begin() == memoperands_end()`, that does not imply
706 /// anything about whether the function accesses memory. Instead, the caller
707 /// must behave conservatively.
708 mmo_iterator memoperands_begin() const { return memoperands().begin(); }
709
710 /// Access to memory operands of the instruction.
711 ///
712 /// If `memoperands_begin() == memoperands_end()`, that does not imply
713 /// anything about whether the function accesses memory. Instead, the caller
714 /// must behave conservatively.
715 mmo_iterator memoperands_end() const { return memoperands().end(); }
716
717 /// Return true if we don't have any memory operands that describe the
718 /// memory access done by this instruction. If this is true, calling code
719 /// must be conservative.
720 bool memoperands_empty() const { return memoperands().empty(); }
721
722 /// Return true if this instruction has exactly one MachineMemOperand.
723 bool hasOneMemOperand() const { return memoperands().size() == 1; }
724
725 /// Return the number of memory operands.
726 unsigned getNumMemOperands() const { return memoperands().size(); }
727
728 /// Helper to extract a pre-instruction symbol if one has been added.
729 MCSymbol *getPreInstrSymbol() const {
730 if (!Info)
731 return nullptr;
732 if (MCSymbol *S = Info.get<EIIK_PreInstrSymbol>())
733 return S;
734 if (ExtraInfo *EI = Info.get<EIIK_OutOfLine>())
735 return EI->getPreInstrSymbol();
736
737 return nullptr;
738 }
739
740 /// Helper to extract a post-instruction symbol if one has been added.
741 MCSymbol *getPostInstrSymbol() const {
742 if (!Info)
743 return nullptr;
744 if (MCSymbol *S = Info.get<EIIK_PostInstrSymbol>())
745 return S;
746 if (ExtraInfo *EI = Info.get<EIIK_OutOfLine>())
747 return EI->getPostInstrSymbol();
748
749 return nullptr;
750 }
751
752 /// Helper to extract a heap alloc marker if one has been added.
753 MDNode *getHeapAllocMarker() const {
754 if (!Info)
755 return nullptr;
756 if (ExtraInfo *EI = Info.get<EIIK_OutOfLine>())
757 return EI->getHeapAllocMarker();
758
759 return nullptr;
760 }
761
762 /// API for querying MachineInstr properties. They are the same as MCInstrDesc
763 /// queries but they are bundle aware.
764
// Selects how a property query treats instruction bundles.
765 enum QueryType {
766 IgnoreBundle, // Ignore bundles
767 AnyInBundle, // Return true if any instruction in bundle has property
768 AllInBundle // Return true if all instructions in bundle have property
769 };
770
771 /// Return true if the instruction (or in the case of a bundle,
772 /// the instructions inside the bundle) has the specified property.
773 /// The first argument is the property being queried.
774 /// The second argument indicates whether the query should look inside
775 /// instruction bundles.
776 bool hasProperty(unsigned MCFlag, QueryType Type = AnyInBundle) const {
777 assert(MCFlag < 64 &&(static_cast <bool> (MCFlag < 64 && "MCFlag out of range for bit mask in getFlags/hasPropertyInBundle."
) ? void (0) : __assert_fail ("MCFlag < 64 && \"MCFlag out of range for bit mask in getFlags/hasPropertyInBundle.\""
, "llvm/include/llvm/CodeGen/MachineInstr.h", 778, __extension__
__PRETTY_FUNCTION__))
778 "MCFlag out of range for bit mask in getFlags/hasPropertyInBundle.")(static_cast <bool> (MCFlag < 64 && "MCFlag out of range for bit mask in getFlags/hasPropertyInBundle."
) ? void (0) : __assert_fail ("MCFlag < 64 && \"MCFlag out of range for bit mask in getFlags/hasPropertyInBundle.\""
, "llvm/include/llvm/CodeGen/MachineInstr.h", 778, __extension__
__PRETTY_FUNCTION__))
;
779 // Inline the fast path for unbundled or bundle-internal instructions.
780 if (Type == IgnoreBundle || !isBundled() || isBundledWithPred())
781 return getDesc().getFlags() & (1ULL << MCFlag);
782
783 // If this is the first instruction in a bundle, take the slow path.
784 return hasPropertyInBundle(1ULL << MCFlag, Type);
785 }
786
787 /// Return true if this is an instruction that should go through the usual
788 /// legalization steps.
789 bool isPreISelOpcode(QueryType Type = IgnoreBundle) const {
790 return hasProperty(MCID::PreISelOpcode, Type);
791 }
792
793 /// Return true if this instruction can have a variable number of operands.
794 /// In this case, the variable operands will be after the normal
795 /// operands but before the implicit definitions and uses (if any are
796 /// present).
797 bool isVariadic(QueryType Type = IgnoreBundle) const {
798 return hasProperty(MCID::Variadic, Type);
799 }
800
801 /// Set if this instruction has an optional definition, e.g.
802 /// ARM instructions which can set condition code if 's' bit is set.
803 bool hasOptionalDef(QueryType Type = IgnoreBundle) const {
804 return hasProperty(MCID::HasOptionalDef, Type);
805 }
806
807 /// Return true if this is a pseudo instruction that doesn't
808 /// correspond to a real machine instruction.
809 bool isPseudo(QueryType Type = IgnoreBundle) const {
810 return hasProperty(MCID::Pseudo, Type);
811 }
812
813 bool isReturn(QueryType Type = AnyInBundle) const {
814 return hasProperty(MCID::Return, Type);
815 }
816
817 /// Return true if this is an instruction that marks the end of an EH scope,
818 /// i.e., a catchpad or a cleanuppad instruction.
819 bool isEHScopeReturn(QueryType Type = AnyInBundle) const {
820 return hasProperty(MCID::EHScopeReturn, Type);
821 }
822
823 bool isCall(QueryType Type = AnyInBundle) const {
824 return hasProperty(MCID::Call, Type);
825 }
826
827 /// Return true if this is a call instruction that may have an associated
828 /// call site entry in the debug info.
829 bool isCandidateForCallSiteEntry(QueryType Type = IgnoreBundle) const;
830 /// Return true if copying, moving, or erasing this instruction requires
831 /// updating Call Site Info (see \ref copyCallSiteInfo, \ref moveCallSiteInfo,
832 /// \ref eraseCallSiteInfo).
833 bool shouldUpdateCallSiteInfo() const;
834
835 /// Returns true if the specified instruction stops control flow
836 /// from executing the instruction immediately following it. Examples include
837 /// unconditional branches and return instructions.
838 bool isBarrier(QueryType Type = AnyInBundle) const {
839 return hasProperty(MCID::Barrier, Type);
840 }
841
842 /// Returns true if this instruction is part of the terminator for a basic block.
843 /// Typically this is things like return and branch instructions.
844 ///
845 /// Various passes use this to insert code into the bottom of a basic block,
846 /// but before control flow occurs.
847 bool isTerminator(QueryType Type = AnyInBundle) const {
848 return hasProperty(MCID::Terminator, Type);
849 }
850
851 /// Returns true if this is a conditional, unconditional, or indirect branch.
852 /// Predicates below can be used to discriminate between
853 /// these cases, and the TargetInstrInfo::analyzeBranch method can be used to
854 /// get more information.
855 bool isBranch(QueryType Type = AnyInBundle) const {
856 return hasProperty(MCID::Branch, Type);
857 }
858
859 /// Return true if this is an indirect branch, such as a
860 /// branch through a register.
861 bool isIndirectBranch(QueryType Type = AnyInBundle) const {
862 return hasProperty(MCID::IndirectBranch, Type);
863 }
864
865 /// Return true if this is a branch which may fall
866 /// through to the next instruction or may transfer control flow to some other
867 /// block. The TargetInstrInfo::analyzeBranch method can be used to get more
868 /// information about this branch.
869 bool isConditionalBranch(QueryType Type = AnyInBundle) const {
870 return isBranch(Type) && !isBarrier(Type) && !isIndirectBranch(Type);
871 }
872
873 /// Return true if this is a branch which always
874 /// transfers control flow to some other block. The
875 /// TargetInstrInfo::analyzeBranch method can be used to get more information
876 /// about this branch.
877 bool isUnconditionalBranch(QueryType Type = AnyInBundle) const {
878 return isBranch(Type) && isBarrier(Type) && !isIndirectBranch(Type);
879 }
880
881 /// Return true if this instruction has a predicate operand that
882 /// controls execution. It may be set to 'always', or may be set to other
883 /// values. There are various methods in TargetInstrInfo that can be used to
884 /// control and modify the predicate in this instruction.
885 bool isPredicable(QueryType Type = AllInBundle) const {
886 // If it's a bundle then all bundled instructions must be predicable for this
887 // to return true.
888 return hasProperty(MCID::Predicable, Type);
889 }
890
891 /// Return true if this instruction is a comparison.
892 bool isCompare(QueryType Type = IgnoreBundle) const {
893 return hasProperty(MCID::Compare, Type);
894 }
895
896 /// Return true if this instruction is a move immediate
897 /// (including conditional moves) instruction.
898 bool isMoveImmediate(QueryType Type = IgnoreBundle) const {
899 return hasProperty(MCID::MoveImm, Type);
900 }
901
902 /// Return true if this instruction is a register move.
903 /// (including moving values from subreg to reg)
904 bool isMoveReg(QueryType Type = IgnoreBundle) const {
905 return hasProperty(MCID::MoveReg, Type);
906 }
907
908 /// Return true if this instruction is a bitcast instruction.
909 bool isBitcast(QueryType Type = IgnoreBundle) const {
910 return hasProperty(MCID::Bitcast, Type);
911 }
912
913 /// Return true if this instruction is a select instruction.
914 bool isSelect(QueryType Type = IgnoreBundle) const {
915 return hasProperty(MCID::Select, Type);
916 }
917
918 /// Return true if this instruction cannot be safely duplicated.
919 /// For example, if the instruction has unique labels attached
920 /// to it, duplicating it would cause multiple definition errors.
921 bool isNotDuplicable(QueryType Type = AnyInBundle) const {
922 return hasProperty(MCID::NotDuplicable, Type);
923 }
924
925 /// Return true if this instruction is convergent.
926 /// Convergent instructions can not be made control-dependent on any
927 /// additional values.
928 bool isConvergent(QueryType Type = AnyInBundle) const {
929 // Inline asm records convergence in its extra-info immediate operand.
930 const bool AsmIsConvergent =
931 isInlineAsm() && (getOperand(InlineAsm::MIOp_ExtraInfo).getImm() &
932 InlineAsm::Extra_IsConvergent) != 0;
933 // Anything else is decided by the Convergent property.
934 return AsmIsConvergent || hasProperty(MCID::Convergent, Type);
935 }
936
937 /// Returns true if the specified instruction has a delay slot
938 /// which must be filled by the code generator.
939 bool hasDelaySlot(QueryType Type = AnyInBundle) const {
940 return hasProperty(MCID::DelaySlot, Type);
941 }
942
943 /// Return true for instructions that can be folded as
944 /// memory operands in other instructions. The most common use for this
945 /// is instructions that are simple loads from memory that don't modify
946 /// the loaded value in any way, but it can also be used for instructions
947 /// that can be expressed as constant-pool loads, such as V_SETALLONES
948 /// on x86, to allow them to be folded when it is beneficial.
949 /// This should only be set on instructions that return a value in their
950 /// only virtual register definition.
951 bool canFoldAsLoad(QueryType Type = IgnoreBundle) const {
952 return hasProperty(MCID::FoldableAsLoad, Type);
953 }
954
955 /// Return true if this instruction behaves
956 /// the same way as the generic REG_SEQUENCE instructions.
957 /// E.g., on ARM,
958 /// dX VMOVDRR rY, rZ
959 /// is equivalent to
960 /// dX = REG_SEQUENCE rY, ssub_0, rZ, ssub_1.
961 ///
962 /// Note that for the optimizers to be able to take advantage of
963 /// this property, TargetInstrInfo::getRegSequenceLikeInputs has to be
964 /// overridden accordingly.
965 bool isRegSequenceLike(QueryType Type = IgnoreBundle) const {
966 return hasProperty(MCID::RegSequence, Type);
967 }
968
969 /// Return true if this instruction behaves
970 /// the same way as the generic EXTRACT_SUBREG instructions.
971 /// E.g., on ARM,
972 /// rX, rY VMOVRRD dZ
973 /// is equivalent to two EXTRACT_SUBREG:
974 /// rX = EXTRACT_SUBREG dZ, ssub_0
975 /// rY = EXTRACT_SUBREG dZ, ssub_1
976 ///
977 /// Note that for the optimizers to be able to take advantage of
978 /// this property, TargetInstrInfo::getExtractSubregLikeInputs has to be
979 /// overridden accordingly.
980 bool isExtractSubregLike(QueryType Type = IgnoreBundle) const {
981 return hasProperty(MCID::ExtractSubreg, Type);
982 }
983
984 /// Return true if this instruction behaves
985 /// the same way as the generic INSERT_SUBREG instructions.
986 /// E.g., on ARM,
987 /// dX = VSETLNi32 dY, rZ, Imm
988 /// is equivalent to an INSERT_SUBREG:
989 /// dX = INSERT_SUBREG dY, rZ, translateImmToSubIdx(Imm)
990 ///
991 /// Note that for the optimizers to be able to take advantage of
992 /// this property, TargetInstrInfo::getInsertSubregLikeInputs has to be
993 /// overridden accordingly.
994 bool isInsertSubregLike(QueryType Type = IgnoreBundle) const {
995 return hasProperty(MCID::InsertSubreg, Type);
996 }
997
998 //===--------------------------------------------------------------------===//
999 // Side Effect Analysis
1000 //===--------------------------------------------------------------------===//
1001
1002 /// Return true if this instruction could possibly read memory.
1003 /// Instructions with this flag set are not necessarily simple load
1004 /// instructions, they may load a value and modify it, for example.
1005 bool mayLoad(QueryType Type = AnyInBundle) const {
1006 // Inline asm records whether it may load in its extra-info operand.
1007 const bool AsmMayLoad =
1008 isInlineAsm() && (getOperand(InlineAsm::MIOp_ExtraInfo).getImm() &
1009 InlineAsm::Extra_MayLoad) != 0;
1010 // Anything else is decided by the MayLoad property.
1011 return AsmMayLoad || hasProperty(MCID::MayLoad, Type);
1012 }
1013
1014 /// Return true if this instruction could possibly modify memory.
1015 /// Instructions with this flag set are not necessarily simple store
1016 /// instructions, they may store a modified value based on their operands, or
1017 /// may not actually modify anything, for example.
1018 bool mayStore(QueryType Type = AnyInBundle) const {
1019 // Inline asm records whether it may store in its extra-info operand.
1020 const bool AsmMayStore =
1021 isInlineAsm() && (getOperand(InlineAsm::MIOp_ExtraInfo).getImm() &
1022 InlineAsm::Extra_MayStore) != 0;
1023 // Anything else is decided by the MayStore property.
1024 return AsmMayStore || hasProperty(MCID::MayStore, Type);
1025 }
1026
1027 /// Return true if this instruction could possibly read or modify memory.
1028 bool mayLoadOrStore(QueryType Type = AnyInBundle) const {
1029 return mayLoad(Type) || mayStore(Type);
1030 }
1031
1032 /// Return true if this instruction could possibly raise a floating-point
1033 /// exception. This is the case if the instruction is a floating-point
1034 /// instruction that can in principle raise an exception, as indicated
1035 /// by the MCID::MayRaiseFPException property, *and* at the same time,
1036 /// the instruction is used in a context where we expect floating-point
1037 /// exceptions are not disabled, as indicated by the NoFPExcept MI flag.
1038 bool mayRaiseFPException() const {
1039 return hasProperty(MCID::MayRaiseFPException) &&
1040 !getFlag(MachineInstr::MIFlag::NoFPExcept);
1041 }
1042
1043 //===--------------------------------------------------------------------===//
1044 // Flags that indicate whether an instruction can be modified by a method.
1045 //===--------------------------------------------------------------------===//
1046
1047 /// Return true if this may be a 2- or 3-address
1048 /// instruction (of the form "X = op Y, Z, ..."), which produces the same
1049 /// result if Y and Z are exchanged. If this flag is set, then the
1050 /// TargetInstrInfo::commuteInstruction method may be used to hack on the
1051 /// instruction.
1052 ///
1053 /// Note that this flag may be set on instructions that are only commutable
1054 /// sometimes. In these cases, the call to commuteInstruction will fail.
1055 /// Also note that some instructions require non-trivial modification to
1056 /// commute them.
1057 bool isCommutable(QueryType Type = IgnoreBundle) const {
1058 return hasProperty(MCID::Commutable, Type);
1059 }
1060
1061 /// Return true if this is a 2-address instruction
1062 /// which can be changed into a 3-address instruction if needed. Doing this
1063 /// transformation can be profitable in the register allocator, because it
1064 /// means that the instruction can use a 2-address form if possible, but
1065 /// degrade into a less efficient form if the source and dest register cannot
1066 /// be assigned to the same register. For example, this allows the x86
1067 /// backend to turn a "shl reg, 3" instruction into an LEA instruction, which
1068 /// is the same speed as the shift but has bigger code size.
1069 ///
1070 /// If this returns true, then the target must implement the
1071 /// TargetInstrInfo::convertToThreeAddress method for this instruction, which
1072 /// is allowed to fail if the transformation isn't valid for this specific
1073 /// instruction (e.g. shl reg, 4 on x86).
1074 ///
1075 bool isConvertibleTo3Addr(QueryType Type = IgnoreBundle) const {
1076 return hasProperty(MCID::ConvertibleTo3Addr, Type);
1077 }
1078
1079 /// Return true if this instruction requires
1080 /// custom insertion support when the DAG scheduler is inserting it into a
1081 /// machine basic block. If this is true for the instruction, it basically
1082 /// means that it is a pseudo instruction used at SelectionDAG time that is
1083 /// expanded out into magic code by the target when MachineInstrs are formed.
1084 ///
1085 /// If this is true, the TargetLoweringInfo::InsertAtEndOfBasicBlock method
1086 /// is used to insert this into the MachineBasicBlock.
1087 bool usesCustomInsertionHook(QueryType Type = IgnoreBundle) const {
1088 return hasProperty(MCID::UsesCustomInserter, Type);
1089 }
1090
1091 /// Return true if this instruction requires *adjustment*
1092 /// after instruction selection by calling a target hook. For example, this
1093 /// can be used to fill in ARM 's' optional operand depending on whether
1094 /// the conditional flag register is used.
1095 bool hasPostISelHook(QueryType Type = IgnoreBundle) const {
1096 return hasProperty(MCID::HasPostISelHook, Type);
1097 }
1098
1099 /// Returns true if this instruction is a candidate for remat.
1100 /// This flag is deprecated, please don't use it anymore. If this
1101 /// flag is set, the isReallyTriviallyReMaterializable() method is called to
1102 /// verify the instruction is really rematable.
1103 bool isRematerializable(QueryType Type = AllInBundle) const {
1104 // It's only possible to re-mat a bundle if all bundled instructions are
1105 // re-materializable.
1106 return hasProperty(MCID::Rematerializable, Type);
1107 }
1108
1109 /// Returns true if this instruction has the same cost (or less) than a move
1110 /// instruction. This is useful during certain types of optimizations
1111 /// (e.g., remat during two-address conversion or machine licm)
1112 /// where we would like to remat or hoist the instruction, but not if it costs
1113 /// more than moving the instruction into the appropriate register. Note, we
1114 /// are not marking copies from and to the same register class with this flag.
1115 bool isAsCheapAsAMove(QueryType Type = AllInBundle) const {
1116 // Only returns true for a bundle if all bundled instructions are cheap.
1117 return hasProperty(MCID::CheapAsAMove, Type);
1118 }
1119
1120 /// Returns true if this instruction source operands
1121 /// have special register allocation requirements that are not captured by the
1122 /// operand register classes. e.g. ARM::STRD's two source registers must be an
1123 /// even / odd pair, ARM::STM registers have to be in ascending order.
1124 /// Post-register allocation passes should not attempt to change allocations
1125 /// for sources of instructions with this flag.
1126 bool hasExtraSrcRegAllocReq(QueryType Type = AnyInBundle) const {
1127 return hasProperty(MCID::ExtraSrcRegAllocReq, Type);
1128 }
1129
1130 /// Returns true if this instruction def operands
1131 /// have special register allocation requirements that are not captured by the
1132 /// operand register classes. e.g. ARM::LDRD's two def registers must be an
1133 /// even / odd pair, ARM::LDM registers have to be in ascending order.
1134 /// Post-register allocation passes should not attempt to change allocations
1135 /// for definitions of instructions with this flag.
1136 bool hasExtraDefRegAllocReq(QueryType Type = AnyInBundle) const {
1137 return hasProperty(MCID::ExtraDefRegAllocReq, Type);
1138 }
1139
1140 enum MICheckType { // Comparison mode accepted by isIdenticalTo().
1141 CheckDefs, // Check all operands for equality
1142 CheckKillDead, // Check all operands including kill / dead markers
1143 IgnoreDefs, // Ignore all definitions
1144 IgnoreVRegDefs // Ignore virtual register definitions
1145 };
1146
1147 /// Return true if this instruction is identical to \p Other.
1148 /// Two instructions are identical if they have the same opcode and all their
1149 /// operands are identical (with respect to MachineOperand::isIdenticalTo()).
1150 /// Note that this means liveness related flags (dead, undef, kill) do not
1151 /// affect the notion of identical.
1152 bool isIdenticalTo(const MachineInstr &Other,
1153 MICheckType Check = CheckDefs) const;
1154
1155 /// Unlink 'this' from the containing basic block, and return it without
1156 /// deleting it.
1157 ///
1158 /// This function can not be used on bundled instructions, use
1159 /// removeFromBundle() to remove individual instructions from a bundle.
1160 MachineInstr *removeFromParent();
1161
1162 /// Unlink this instruction from its basic block and return it without
1163 /// deleting it.
1164 ///
1165 /// If the instruction is part of a bundle, the other instructions in the
1166 /// bundle remain bundled.
1167 MachineInstr *removeFromBundle();
1168
1169 /// Unlink 'this' from the containing basic block and delete it.
1170 ///
1171 /// If this instruction is the header of a bundle, the whole bundle is erased.
1172 /// This function can not be used for instructions inside a bundle, use
1173 /// eraseFromBundle() to erase individual bundled instructions.
1174 void eraseFromParent();
1175
1176 /// Unlink 'this' from its basic block and delete it.
1177 ///
1178 /// If the instruction is part of a bundle, the other instructions in the
1179 /// bundle remain bundled.
1180 void eraseFromBundle();
1181
1182 bool isEHLabel() const { return getOpcode() == TargetOpcode::EH_LABEL; }
1183 bool isGCLabel() const { return getOpcode() == TargetOpcode::GC_LABEL; }
1184 bool isAnnotationLabel() const {
1185 return getOpcode() == TargetOpcode::ANNOTATION_LABEL;
1186 }
1187
1188 /// Returns true if the MachineInstr represents a label.
1189 bool isLabel() const {
1190 return isEHLabel() || isGCLabel() || isAnnotationLabel();
1191 }
1192
1193 bool isCFIInstruction() const {
1194 return getOpcode() == TargetOpcode::CFI_INSTRUCTION;
1195 }
1196
1197 bool isPseudoProbe() const {
1198 return getOpcode() == TargetOpcode::PSEUDO_PROBE;
1199 }
1200
1201 // True if the instruction represents a position in the function.
1202 bool isPosition() const { return isLabel() || isCFIInstruction(); }
1203
1204 bool isNonListDebugValue() const {
1205 return getOpcode() == TargetOpcode::DBG_VALUE;
1206 }
1207 bool isDebugValueList() const {
1208 return getOpcode() == TargetOpcode::DBG_VALUE_LIST;
1209 }
1210 bool isDebugValue() const {
1211 return isNonListDebugValue() || isDebugValueList();
1212 }
1213 bool isDebugLabel() const { return getOpcode() == TargetOpcode::DBG_LABEL; }
1214 bool isDebugRef() const { return getOpcode() == TargetOpcode::DBG_INSTR_REF; }
1215 bool isDebugPHI() const { return getOpcode() == TargetOpcode::DBG_PHI; }
1216 bool isDebugInstr() const {
1217 return isDebugValue() || isDebugLabel() || isDebugRef() || isDebugPHI();
1218 }
1219 bool isDebugOrPseudoInstr() const {
1220 return isDebugInstr() || isPseudoProbe();
1221 }
1222
1223 bool isDebugOffsetImm() const {
1224 return isNonListDebugValue() && getDebugOffset().isImm();
1225 }
1226
1227 /// A DBG_VALUE is indirect iff the location operand is a register and
1228 /// the offset operand is an immediate.
1229 bool isIndirectDebugValue() const {
1230 return isDebugOffsetImm() && getDebugOperand(0).isReg();
1231 }
1232
1233 /// A DBG_VALUE is an entry value iff its debug expression contains the
1234 /// DW_OP_LLVM_entry_value operation.
1235 bool isDebugEntryValue() const;
1236
1237 /// Return true if the instruction is a debug value which describes a part of
1238 /// a variable as unavailable.
1239 bool isUndefDebugValue() const {
1240 if (isDebugValue()) {
1241 // Any $noreg location operand makes this debug value undef.
1242 for (const MachineOperand &DbgOp : debug_operands())
1243 if (DbgOp.isReg() && !DbgOp.getReg().isValid())
1244 return true;
1245 }
1246 return false;
1247 }
1248
1249 bool isPHI() const {
1250 const auto Opc = getOpcode();
1251 return Opc == TargetOpcode::PHI || Opc == TargetOpcode::G_PHI;
1252 }
1253 bool isKill() const { return getOpcode() == TargetOpcode::KILL; }
1254 bool isImplicitDef() const { return getOpcode()==TargetOpcode::IMPLICIT_DEF; }
1255 bool isInlineAsm() const {
1256 const auto Opc = getOpcode();
1257 return Opc == TargetOpcode::INLINEASM || Opc == TargetOpcode::INLINEASM_BR;
1258 }
1259
1260 /// FIXME: Seems like a layering violation that the AsmDialect, which is X86
1261 /// specific, be attached to a generic MachineInstr.
1262 bool isMSInlineAsm() const {
1263 return isInlineAsm() && getInlineAsmDialect() == InlineAsm::AD_Intel;
1264 }
1265
1266 bool isStackAligningInlineAsm() const;
1267 InlineAsm::AsmDialect getInlineAsmDialect() const;
1268
1269 bool isInsertSubreg() const {
1270 return getOpcode() == TargetOpcode::INSERT_SUBREG;
1271 }
1272
1273 bool isSubregToReg() const {
1274 return getOpcode() == TargetOpcode::SUBREG_TO_REG;
1275 }
1276
1277 bool isRegSequence() const {
1278 return getOpcode() == TargetOpcode::REG_SEQUENCE;
1279 }
1280
1281 bool isBundle() const {
1282 return getOpcode() == TargetOpcode::BUNDLE;
1283 }
1284
1285 bool isCopy() const {
1286 return getOpcode() == TargetOpcode::COPY;
1287 }
1288
1289 bool isFullCopy() const { // True only for a COPY whose operands 0 and 1 both report a zero getSubReg().
1290 return isCopy() && !getOperand(0).getSubReg() && !getOperand(1).getSubReg();
7
Returning zero, which participates in a condition later
1291 }
1292
1293 bool isExtractSubreg() const {
1294 return getOpcode() == TargetOpcode::EXTRACT_SUBREG;
1295 }
1296
1297 /// Return true if the instruction behaves like a copy.
1298 /// This does not include native copy instructions.
1299 bool isCopyLike() const {
1300 return isCopy() || isSubregToReg();
1301 }
1302
1303 /// Return true if the instruction is an identity copy.
1304 bool isIdentityCopy() const {
1305 return isCopy() && getOperand(0).getReg() == getOperand(1).getReg() &&
1306 getOperand(0).getSubReg() == getOperand(1).getSubReg();
1307 }
1308
1309 /// Return true if this instruction doesn't produce any output in the form of
1310 /// executable instructions.
1311 bool isMetaInstruction() const {
1312 switch (getOpcode()) {
1313 case TargetOpcode::IMPLICIT_DEF:
1314 case TargetOpcode::KILL:
1315 case TargetOpcode::CFI_INSTRUCTION:
1316 case TargetOpcode::EH_LABEL:
1317 case TargetOpcode::GC_LABEL:
1318 case TargetOpcode::DBG_VALUE:
1319 case TargetOpcode::DBG_VALUE_LIST:
1320 case TargetOpcode::DBG_INSTR_REF:
1321 case TargetOpcode::DBG_PHI:
1322 case TargetOpcode::DBG_LABEL:
1323 case TargetOpcode::LIFETIME_START:
1324 case TargetOpcode::LIFETIME_END:
1325 case TargetOpcode::PSEUDO_PROBE:
1326 case TargetOpcode::ARITH_FENCE:
1327 return true;
1328 default:
1329 return false;
1330 }
1331 }
1332
1333 /// Return true if this is a transient instruction that is either very likely
1334 /// to be eliminated during register allocation (such as copy-like
1335 /// instructions), or if this instruction doesn't have an execution-time cost.
1336 bool isTransient() const {
1337 switch (getOpcode()) {
1338 // Copy-like instructions are usually eliminated during register allocation.
1339 case TargetOpcode::PHI:
1340 case TargetOpcode::G_PHI:
1341 case TargetOpcode::COPY:
1342 case TargetOpcode::INSERT_SUBREG:
1343 case TargetOpcode::SUBREG_TO_REG:
1344 case TargetOpcode::REG_SEQUENCE:
1345 return true;
1346 default:
1347 return isMetaInstruction();
1348 }
1349 }
1350
1351 /// Return the number of instructions inside the MI bundle, excluding the
1352 /// bundle header.
1353 ///
1354 /// This is the number of instructions that MachineBasicBlock::iterator
1355 /// skips, 0 for unbundled instructions.
1356 unsigned getBundleSize() const;
1357
1358 /// Return true if the MachineInstr reads the specified register.
1359 /// If TargetRegisterInfo is passed, then it also checks if there
1360 /// is a read of a super-register.
1361 /// This does not count partial redefines of virtual registers as reads:
1362 /// %reg1024:6 = OP.
1363 bool readsRegister(Register Reg,
1364 const TargetRegisterInfo *TRI = nullptr) const {
1365 return findRegisterUseOperandIdx(Reg, false, TRI) != -1;
1366 }
1367
1368 /// Return true if the MachineInstr reads the specified virtual register.
1369 /// Take into account that a partial define is a
1370 /// read-modify-write operation.
1371 bool readsVirtualRegister(Register Reg) const {
1372 return readsWritesVirtualRegister(Reg).first;
1373 }
1374
1375 /// Return a pair of bools (reads, writes) indicating if this instruction
1376 /// reads or writes Reg. This also considers partial defines.
1377 /// If Ops is not null, all operand indices for Reg are added.
1378 std::pair<bool,bool> readsWritesVirtualRegister(Register Reg,
1379 SmallVectorImpl<unsigned> *Ops = nullptr) const;
1380
1381 /// Return true if the MachineInstr kills the specified register.
1382 /// If TargetRegisterInfo is passed, then it also checks if there is
1383 /// a kill of a super-register.
1384 bool killsRegister(Register Reg,
1385 const TargetRegisterInfo *TRI = nullptr) const {
1386 return findRegisterUseOperandIdx(Reg, true, TRI) != -1;
1387 }
1388
1389 /// Return true if the MachineInstr fully defines the specified register.
1390 /// If TargetRegisterInfo is passed, then it also checks
1391 /// if there is a def of a super-register.
1392 /// NOTE: It's ignoring subreg indices on virtual registers.
1393 bool definesRegister(Register Reg,
1394 const TargetRegisterInfo *TRI = nullptr) const {
1395 return findRegisterDefOperandIdx(Reg, false, false, TRI) != -1;
1396 }
1397
1398 /// Return true if the MachineInstr modifies (fully define or partially
1399 /// define) the specified register.
1400 /// NOTE: It's ignoring subreg indices on virtual registers.
1401 bool modifiesRegister(Register Reg,
1402 const TargetRegisterInfo *TRI = nullptr) const {
1403 return findRegisterDefOperandIdx(Reg, false, true, TRI) != -1;
1404 }
1405
1406 /// Returns true if the register is dead in this machine instruction.
1407 /// If TargetRegisterInfo is passed, then it also checks
1408 /// if there is a dead def of a super-register.
1409 bool registerDefIsDead(Register Reg,
1410 const TargetRegisterInfo *TRI = nullptr) const {
1411 return findRegisterDefOperandIdx(Reg, true, false, TRI) != -1;
1412 }
1413
1414 /// Returns true if the MachineInstr has an implicit-use operand of exactly
1415 /// the given register (not considering sub/super-registers).
1416 bool hasRegisterImplicitUseOperand(Register Reg) const;
1417
1418 /// Returns the operand index that is a use of the specific register or -1
1419 /// if it is not found. It further tightens the search criteria to a use
1420 /// that kills the register if isKill is true.
1421 int findRegisterUseOperandIdx(Register Reg, bool isKill = false,
1422 const TargetRegisterInfo *TRI = nullptr) const;
1423
1424 /// Wrapper for findRegisterUseOperandIdx, it returns
1425 /// a pointer to the MachineOperand rather than an index.
1426 MachineOperand *findRegisterUseOperand(Register Reg, bool isKill = false,
1427 const TargetRegisterInfo *TRI = nullptr) {
1428 const int UseIdx = findRegisterUseOperandIdx(Reg, isKill, TRI);
1429 return UseIdx != -1 ? &getOperand(UseIdx) : nullptr;
1430 }
1431
1432 const MachineOperand *findRegisterUseOperand(
1433 Register Reg, bool isKill = false,
1434 const TargetRegisterInfo *TRI = nullptr) const {
1435 return const_cast<MachineInstr *>(this)->
1436 findRegisterUseOperand(Reg, isKill, TRI);
1437 }
1438
1439 /// Returns the operand index that is a def of the specified register or
1440 /// -1 if it is not found. If isDead is true, defs that are not dead are
1441 /// skipped. If Overlap is true, then it also looks for defs that merely
1442 /// overlap the specified register. If TargetRegisterInfo is non-null,
1443 /// then it also checks if there is a def of a super-register.
1444 /// This may also return a register mask operand when Overlap is true.
1445 int findRegisterDefOperandIdx(Register Reg,
1446 bool isDead = false, bool Overlap = false,
1447 const TargetRegisterInfo *TRI = nullptr) const;
1448
1449 /// Wrapper for findRegisterDefOperandIdx, it returns
1450 /// a pointer to the MachineOperand rather than an index.
1451 MachineOperand *
1452 findRegisterDefOperand(Register Reg, bool isDead = false,
1453 bool Overlap = false,
1454 const TargetRegisterInfo *TRI = nullptr) {
1455 const int DefIdx = findRegisterDefOperandIdx(Reg, isDead, Overlap, TRI);
1456 return DefIdx != -1 ? &getOperand(DefIdx) : nullptr;
1457 }
1458
1459 const MachineOperand *
1460 findRegisterDefOperand(Register Reg, bool isDead = false,
1461 bool Overlap = false,
1462 const TargetRegisterInfo *TRI = nullptr) const {
1463 return const_cast<MachineInstr *>(this)->findRegisterDefOperand(
1464 Reg, isDead, Overlap, TRI);
1465 }
1466
1467 /// Find the index of the first operand in the
1468 /// operand list that is used to represent the predicate. It returns -1 if
1469 /// none is found.
1470 int findFirstPredOperandIdx() const;
1471
1472 /// Find the index of the flag word operand that
1473 /// corresponds to operand OpIdx on an inline asm instruction. Returns -1 if
1474 /// getOperand(OpIdx) does not belong to an inline asm operand group.
1475 ///
1476 /// If GroupNo is not NULL, it will receive the number of the operand group
1477 /// containing OpIdx.
1478 int findInlineAsmFlagIdx(unsigned OpIdx, unsigned *GroupNo = nullptr) const;
1479
1480 /// Compute the static register class constraint for operand OpIdx.
1481 /// For normal instructions, this is derived from the MCInstrDesc.
1482 /// For inline assembly it is derived from the flag words.
1483 ///
1484 /// Returns NULL if the static register class constraint cannot be
1485 /// determined.
1486 const TargetRegisterClass*
1487 getRegClassConstraint(unsigned OpIdx,
1488 const TargetInstrInfo *TII,
1489 const TargetRegisterInfo *TRI) const;
1490
1491 /// Applies the constraints (def/use) implied by this MI on \p Reg to
1492 /// the given \p CurRC.
1493 /// If \p ExploreBundle is set and MI is part of a bundle, all the
1494 /// instructions inside the bundle will be taken into account. In other words,
1495 /// this method accumulates all the constraints of the operand of this MI and
1496 /// the related bundle if MI is a bundle or inside a bundle.
1497 ///
1498 /// Returns the register class that satisfies both \p CurRC and the
1499 /// constraints set by MI. Returns NULL if such a register class does not
1500 /// exist.
1501 ///
1502 /// \pre CurRC must not be NULL.
1503 const TargetRegisterClass *getRegClassConstraintEffectForVReg(
1504 Register Reg, const TargetRegisterClass *CurRC,
1505 const TargetInstrInfo *TII, const TargetRegisterInfo *TRI,
1506 bool ExploreBundle = false) const;
1507
1508 /// Applies the constraints (def/use) implied by the \p OpIdx operand
1509 /// to the given \p CurRC.
1510 ///
1511 /// Returns the register class that satisfies both \p CurRC and the
1512 /// constraints set by \p OpIdx MI. Returns NULL if such a register class
1513 /// does not exist.
1514 ///
1515 /// \pre CurRC must not be NULL.
1516 /// \pre The operand at \p OpIdx must be a register.
1517 const TargetRegisterClass *
1518 getRegClassConstraintEffect(unsigned OpIdx, const TargetRegisterClass *CurRC,
1519 const TargetInstrInfo *TII,
1520 const TargetRegisterInfo *TRI) const;
1521
1522 /// Add a tie between the register operands at DefIdx and UseIdx.
1523 /// The tie will cause the register allocator to ensure that the two
1524 /// operands are assigned the same physical register.
1525 ///
1526 /// Tied operands are managed automatically for explicit operands in the
1527 /// MCInstrDesc. This method is for exceptional cases like inline asm.
1528 void tieOperands(unsigned DefIdx, unsigned UseIdx);
1529
1530 /// Given the index of a tied register operand, find the
1531 /// operand it is tied to. Defs are tied to uses and vice versa. Returns the
1532 /// index of the tied operand which must exist.
1533 unsigned findTiedOperandIdx(unsigned OpIdx) const;
1534
1535 /// Given the index of a register def operand,
1536 /// check if the register def is tied to a source operand, due to either
1537 /// two-address elimination or inline assembly constraints. Returns the
1538 /// first tied use operand index by reference if UseOpIdx is not null.
1539 bool isRegTiedToUseOperand(unsigned DefOpIdx,
1540 unsigned *UseOpIdx = nullptr) const {
1541 const MachineOperand &DefMO = getOperand(DefOpIdx);
1542 const bool IsTiedDef = DefMO.isReg() && DefMO.isDef() && DefMO.isTied();
1543 // Report the tied use index only when the caller passed an out-pointer.
1544 if (IsTiedDef && UseOpIdx)
1545 *UseOpIdx = findTiedOperandIdx(DefOpIdx);
1546 return IsTiedDef;
1547 }
1548
1549 /// Return true if the use operand of the specified index is tied to a def
1550 /// operand. It also returns the def operand index by reference if DefOpIdx
1551 /// is not null.
1552 bool isRegTiedToDefOperand(unsigned UseOpIdx,
1553 unsigned *DefOpIdx = nullptr) const {
1554 const MachineOperand &UseMO = getOperand(UseOpIdx);
1555 const bool IsTiedUse = UseMO.isReg() && UseMO.isUse() && UseMO.isTied();
1556 // Report the tied def index only when the caller passed an out-pointer.
1557 if (IsTiedUse && DefOpIdx)
1558 *DefOpIdx = findTiedOperandIdx(UseOpIdx);
1559 return IsTiedUse;
1560 }
1561
1562 /// Clears kill flags on all operands.
1563 void clearKillInfo();
1564
1565 /// Replace all occurrences of FromReg with ToReg:SubIdx,
1566 /// properly composing subreg indices where necessary.
1567 void substituteRegister(Register FromReg, Register ToReg, unsigned SubIdx,
1568 const TargetRegisterInfo &RegInfo);
1569
1570 /// We have determined MI kills a register. Look for the
1571 /// operand that uses it and mark it as IsKill. If AddIfNotFound is true,
1572 /// add an implicit operand if it's not found. Returns true if the operand
1573 /// exists / is added.
1574 bool addRegisterKilled(Register IncomingReg,
1575 const TargetRegisterInfo *RegInfo,
1576 bool AddIfNotFound = false);
1577
1578 /// Clear all kill flags affecting Reg. If RegInfo is provided, this includes
1579 /// all aliasing registers.
1580 void clearRegisterKills(Register Reg, const TargetRegisterInfo *RegInfo);
1581
1582 /// We have determined MI defined a register without a use.
1583 /// Look for the operand that defines it and mark it as IsDead. If
1584 /// AddIfNotFound is true, add an implicit operand if it's not found. Returns
1585 /// true if the operand exists / is added.
1586 bool addRegisterDead(Register Reg, const TargetRegisterInfo *RegInfo,
1587 bool AddIfNotFound = false);
1588
1589 /// Clear all dead flags on operands defining register @p Reg.
1590 void clearRegisterDeads(Register Reg);
1591
1592 /// Mark all subregister defs of register @p Reg with the undef flag.
1593 /// This function is used when we determined to have a subregister def in an
1594 /// otherwise undefined super register.
1595 void setRegisterDefReadUndef(Register Reg, bool IsUndef = true);
1596
1597 /// We have determined MI defines a register. Make sure there is an operand
1598 /// defining Reg.
1599 void addRegisterDefined(Register Reg,
1600 const TargetRegisterInfo *RegInfo = nullptr);
1601
1602 /// Mark every physreg used by this instruction as
1603 /// dead except those in the UsedRegs list.
1604 ///
1605 /// On instructions with register mask operands, also add implicit-def
1606 /// operands for all registers in UsedRegs.
1607 void setPhysRegsDeadExcept(ArrayRef<Register> UsedRegs,
1608 const TargetRegisterInfo &TRI);
1609
1610 /// Return true if it is safe to move this instruction. If
1611 /// SawStore is set to true, it means that there is a store (or call) between
1612 /// the instruction's location and its intended destination.
1613 bool isSafeToMove(AAResults *AA, bool &SawStore) const;
1614
1615 /// Returns true if this instruction's memory access aliases the memory
1616 /// access of Other.
1617 ///
1618 /// Assumes any physical registers used to compute addresses
1619 /// have the same value for both instructions. Returns false if neither
1620 /// instruction writes to memory.
1621 ///
1622 /// @param AA Optional alias analysis, used to compare memory operands.
1623 /// @param Other MachineInstr to check aliasing against.
1624 /// @param UseTBAA Whether to pass TBAA information to alias analysis.
1625 bool mayAlias(AAResults *AA, const MachineInstr &Other, bool UseTBAA) const;
1626
1627 /// Return true if this instruction may have an ordered
1628 /// or volatile memory reference, or if the information describing the memory
1629 /// reference is not available. Return false if it is known to have no
1630 /// ordered or volatile memory references.
1631 bool hasOrderedMemoryRef() const;
1632
1633 /// Return true if this load instruction never traps and points to a memory
1634 /// location whose value doesn't change during the execution of this function.
1635 ///
1636 /// Examples include loading a value from the constant pool or from the
1637 /// argument area of a function (if it does not change). If the instruction
1638 /// does multiple loads, this returns true only if all of the loads are
1639 /// dereferenceable and invariant.
1640 bool isDereferenceableInvariantLoad(AAResults *AA) const;
1641
1642 /// If the specified instruction is a PHI that always merges together the
1643 /// same virtual register, return the register, otherwise return 0.
1644 unsigned isConstantValuePHI() const;
1645
1646 /// Return true if this instruction has side effects that are not modeled
1647 /// by mayLoad / mayStore, etc.
1648 /// For all instructions, the property is encoded in MCInstrDesc::Flags
1649 /// (see MCInstrDesc::hasUnmodeledSideEffects()). The only exception is
1650 /// INLINEASM instruction, in which case the side effect property is encoded
1651 /// in one of its operands (see InlineAsm::Extra_HasSideEffect).
1652 ///
1653 bool hasUnmodeledSideEffects() const;
1654
1655 /// Returns true if it is illegal to fold a load across this instruction.
1656 bool isLoadFoldBarrier() const;
1657
1658 /// Return true if all the defs of this instruction are dead.
1659 bool allDefsAreDead() const;
1660
1661 /// Return a valid size if the instruction is a spill instruction.
1662 Optional<unsigned> getSpillSize(const TargetInstrInfo *TII) const;
1663
1664 /// Return a valid size if the instruction is a folded spill instruction.
1665 Optional<unsigned> getFoldedSpillSize(const TargetInstrInfo *TII) const;
1666
1667 /// Return a valid size if the instruction is a restore instruction.
1668 Optional<unsigned> getRestoreSize(const TargetInstrInfo *TII) const;
1669
1670 /// Return a valid size if the instruction is a folded restore instruction.
1671 Optional<unsigned>
1672 getFoldedRestoreSize(const TargetInstrInfo *TII) const;
1673
1674 /// Copy implicit register operands from specified
1675 /// instruction to this instruction.
1676 void copyImplicitOps(MachineFunction &MF, const MachineInstr &MI);
1677
1678 /// Debugging support
1679 /// @{
1680 /// Determine the generic type to be printed (if needed) on uses and defs.
1681 LLT getTypeToPrint(unsigned OpIdx, SmallBitVector &PrintedTypes,
1682 const MachineRegisterInfo &MRI) const;
1683
1684 /// Return true when an instruction has tied register that can't be determined
1685 /// by the instruction's descriptor. This is useful for MIR printing, to
1686 /// determine whether we need to print the ties or not.
1687 bool hasComplexRegisterTies() const;
1688
1689 /// Print this MI to \p OS.
1690 /// Don't print information that can be inferred from other instructions if
1691 /// \p IsStandalone is false. It is usually true when only a fragment of the
1692 /// function is printed.
1693 /// Only print the defs and the opcode if \p SkipOpers is true.
1694 /// Otherwise, also print operands if \p SkipDebugLoc is true.
1695 /// Otherwise, also print the debug loc, with a terminating newline.
1696 /// \p TII is used to print the opcode name. If it's not present, but the
1697 /// MI is in a function, the opcode will be printed using the function's TII.
1698 void print(raw_ostream &OS, bool IsStandalone = true, bool SkipOpers = false,
1699 bool SkipDebugLoc = false, bool AddNewLine = true,
1700 const TargetInstrInfo *TII = nullptr) const;
1701 void print(raw_ostream &OS, ModuleSlotTracker &MST, bool IsStandalone = true,
1702 bool SkipOpers = false, bool SkipDebugLoc = false,
1703 bool AddNewLine = true,
1704 const TargetInstrInfo *TII = nullptr) const;
1705 void dump() const;
1706 /// Print on dbgs() the current instruction and the instructions defining its
1707 /// operands and so on until we reach \p MaxDepth.
1708 void dumpr(const MachineRegisterInfo &MRI,
1709 unsigned MaxDepth = UINT_MAX(2147483647 *2U +1U)) const;
1710 /// @}
1711
1712 //===--------------------------------------------------------------------===//
1713 // Accessors used to build up machine instructions.
1714
1715 /// Add the specified operand to the instruction. If it is an implicit
1716 /// operand, it is added to the end of the operand list. If it is an
1717 /// explicit operand it is added at the end of the explicit operand list
1718 /// (before the first implicit operand).
1719 ///
1720 /// MF must be the machine function that was used to allocate this
1721 /// instruction.
1722 ///
1723 /// MachineInstrBuilder provides a more convenient interface for creating
1724 /// instructions and adding operands.
1725 void addOperand(MachineFunction &MF, const MachineOperand &Op);
1726
1727 /// Add an operand without providing an MF reference. This only works for
1728 /// instructions that are inserted in a basic block.
1729 ///
1730 /// MachineInstrBuilder and the two-argument addOperand(MF, MO) should be
1731 /// preferred.
1732 void addOperand(const MachineOperand &Op);
1733
1734 /// Replace the instruction descriptor (thus opcode) of
1735 /// the current instruction with a new one.
1736 void setDesc(const MCInstrDesc &TID) { MCID = &TID; }
1737
1738 /// Replace current source information with new such.
1739 /// Avoid using this, the constructor argument is preferable.
1740 void setDebugLoc(DebugLoc DL) {
1741 DbgLoc = std::move(DL);
1742 assert(DbgLoc.hasTrivialDestructor() && "Expected trivial destructor")(static_cast <bool> (DbgLoc.hasTrivialDestructor() &&
"Expected trivial destructor") ? void (0) : __assert_fail ("DbgLoc.hasTrivialDestructor() && \"Expected trivial destructor\""
, "llvm/include/llvm/CodeGen/MachineInstr.h", 1742, __extension__
__PRETTY_FUNCTION__))
;
1743 }
1744
1745 /// Erase an operand from an instruction, leaving it with one
1746 /// fewer operand than it started with.
1747 void RemoveOperand(unsigned OpNo);
1748
1749 /// Clear this MachineInstr's memory reference descriptor list. This resets
1750 /// the memrefs to their most conservative state. This should be used only
1751 /// as a last resort since it greatly pessimizes our knowledge of the memory
1752 /// access performed by the instruction.
1753 void dropMemRefs(MachineFunction &MF);
1754
1755 /// Assign this MachineInstr's memory reference descriptor list.
1756 ///
1757 /// Unlike other methods, this *will* allocate them into a new array
1758 /// associated with the provided `MachineFunction`.
1759 void setMemRefs(MachineFunction &MF, ArrayRef<MachineMemOperand *> MemRefs);
1760
1761 /// Add a MachineMemOperand to the machine instruction.
1762 /// This function should be used only occasionally. The setMemRefs function
1763 /// is the primary method for setting up a MachineInstr's MemRefs list.
1764 void addMemOperand(MachineFunction &MF, MachineMemOperand *MO);
1765
1766 /// Clone another MachineInstr's memory reference descriptor list and replace
1767 /// ours with it.
1768 ///
1769 /// Note that `*this` may be the incoming MI!
1770 ///
1771 /// Prefer this API whenever possible as it can avoid allocations in common
1772 /// cases.
1773 void cloneMemRefs(MachineFunction &MF, const MachineInstr &MI);
1774
1775 /// Clone the merge of multiple MachineInstrs' memory reference descriptors
1776 /// list and replace ours with it.
1777 ///
1778 /// Note that `*this` may be one of the incoming MIs!
1779 ///
1780 /// Prefer this API whenever possible as it can avoid allocations in common
1781 /// cases.
1782 void cloneMergedMemRefs(MachineFunction &MF,
1783 ArrayRef<const MachineInstr *> MIs);
1784
1785 /// Set a symbol that will be emitted just prior to the instruction itself.
1786 ///
1787 /// Setting this to a null pointer will remove any such symbol.
1788 ///
1789 /// FIXME: This is not fully implemented yet.
1790 void setPreInstrSymbol(MachineFunction &MF, MCSymbol *Symbol);
1791
1792 /// Set a symbol that will be emitted just after the instruction itself.
1793 ///
1794 /// Setting this to a null pointer will remove any such symbol.
1795 ///
1796 /// FIXME: This is not fully implemented yet.
1797 void setPostInstrSymbol(MachineFunction &MF, MCSymbol *Symbol);
1798
1799 /// Clone another MachineInstr's pre- and post- instruction symbols and
1800 /// replace ours with it.
1801 void cloneInstrSymbols(MachineFunction &MF, const MachineInstr &MI);
1802
1803 /// Set a marker on instructions that denotes where we should create and emit
1804 /// heap alloc site labels. This waits until after instruction selection and
1805 /// optimizations to create the label, so it should still work if the
1806 /// instruction is removed or duplicated.
1807 void setHeapAllocMarker(MachineFunction &MF, MDNode *MD);
1808
1809 /// Return the MIFlags which represent both MachineInstrs. This
1810 /// should be used when merging two MachineInstrs into one. This routine does
1811 /// not modify the MIFlags of this MachineInstr.
1812 uint16_t mergeFlagsWith(const MachineInstr& Other) const;
1813
1814 static uint16_t copyFlagsFromInstruction(const Instruction &I);
1815
1816 /// Copy all flags to MachineInst MIFlags
1817 void copyIRFlags(const Instruction &I);
1818
1819 /// Break any tie involving OpIdx.
1820 void untieRegOperand(unsigned OpIdx) {
1821 MachineOperand &MO = getOperand(OpIdx);
1822 if (MO.isReg() && MO.isTied()) {
1823 getOperand(findTiedOperandIdx(OpIdx)).TiedTo = 0;
1824 MO.TiedTo = 0;
1825 }
1826 }
1827
1828 /// Add all implicit def and use operands to this instruction.
1829 void addImplicitDefUseOperands(MachineFunction &MF);
1830
1831 /// Scan instructions immediately following MI and collect any matching
1832 /// DBG_VALUEs.
1833 void collectDebugValues(SmallVectorImpl<MachineInstr *> &DbgValues);
1834
1835 /// Find all DBG_VALUEs that point to the register def in this instruction
1836 /// and point them to \p Reg instead.
1837 void changeDebugValuesDefReg(Register Reg);
1838
1839 /// Returns the Intrinsic::ID for this instruction.
1840 /// \pre Must have an intrinsic ID operand.
1841 unsigned getIntrinsicID() const {
1842 return getOperand(getNumExplicitDefs()).getIntrinsicID();
1843 }
1844
1845 /// Sets all register debug operands in this debug value instruction to be
1846 /// undef.
1847 void setDebugValueUndef() {
1848 assert(isDebugValue() && "Must be a debug value instruction.")(static_cast <bool> (isDebugValue() && "Must be a debug value instruction."
) ? void (0) : __assert_fail ("isDebugValue() && \"Must be a debug value instruction.\""
, "llvm/include/llvm/CodeGen/MachineInstr.h", 1848, __extension__
__PRETTY_FUNCTION__))
;
1849 for (MachineOperand &MO : debug_operands()) {
1850 if (MO.isReg()) {
1851 MO.setReg(0);
1852 MO.setSubReg(0);
1853 }
1854 }
1855 }
1856
1857private:
1858 /// If this instruction is embedded into a MachineFunction, return the
1859 /// MachineRegisterInfo object for the current function, otherwise
1860 /// return null.
1861 MachineRegisterInfo *getRegInfo();
1862
1863 /// Unlink all of the register operands in this instruction from their
1864 /// respective use lists. This requires that the operands already be on their
1865 /// use lists.
1866 void RemoveRegOperandsFromUseLists(MachineRegisterInfo&);
1867
1868 /// Add all of the register operands in this instruction to their
1869 /// respective use lists. This requires that the operands not be on their
1870 /// use lists yet.
1871 void AddRegOperandsToUseLists(MachineRegisterInfo&);
1872
1873 /// Slow path for hasProperty when we're dealing with a bundle.
1874 bool hasPropertyInBundle(uint64_t Mask, QueryType Type) const;
1875
1876 /// Implements the logic of getRegClassConstraintEffectForVReg for
1877 /// this MI and the given operand index \p OpIdx.
1878 /// If the related operand does not constrain Reg, this returns CurRC.
1879 const TargetRegisterClass *getRegClassConstraintEffectForVRegImpl(
1880 unsigned OpIdx, Register Reg, const TargetRegisterClass *CurRC,
1881 const TargetInstrInfo *TII, const TargetRegisterInfo *TRI) const;
1882
1883 /// Stores extra instruction information inline or allocates as ExtraInfo
1884 /// based on the number of pointers.
1885 void setExtraInfo(MachineFunction &MF, ArrayRef<MachineMemOperand *> MMOs,
1886 MCSymbol *PreInstrSymbol, MCSymbol *PostInstrSymbol,
1887 MDNode *HeapAllocMarker);
1888};
1889
1890/// Special DenseMapInfo traits to compare MachineInstr* by *value* of the
1891/// instruction rather than by pointer value.
1892/// The hashing and equality testing functions ignore definitions so this is
1893/// useful for CSE, etc.
1894struct MachineInstrExpressionTrait : DenseMapInfo<MachineInstr*> {
1895 static inline MachineInstr *getEmptyKey() {
1896 return nullptr;
1897 }
1898
1899 static inline MachineInstr *getTombstoneKey() {
1900 return reinterpret_cast<MachineInstr*>(-1);
1901 }
1902
1903 static unsigned getHashValue(const MachineInstr* const &MI);
1904
1905 static bool isEqual(const MachineInstr* const &LHS,
1906 const MachineInstr* const &RHS) {
1907 if (RHS == getEmptyKey() || RHS == getTombstoneKey() ||
1908 LHS == getEmptyKey() || LHS == getTombstoneKey())
1909 return LHS == RHS;
1910 return LHS->isIdenticalTo(*RHS, MachineInstr::IgnoreVRegDefs);
1911 }
1912};
1913
1914//===----------------------------------------------------------------------===//
1915// Debugging Support
1916
1917inline raw_ostream& operator<<(raw_ostream &OS, const MachineInstr &MI) {
1918 MI.print(OS);
1919 return OS;
1920}
1921
1922} // end namespace llvm
1923
1924#endif // LLVM_CODEGEN_MACHINEINSTR_H

/build/llvm-toolchain-snapshot-14~++20220118101002+ec47dba1c8a2/llvm/include/llvm/CodeGen/Register.h

1//===-- llvm/CodeGen/Register.h ---------------------------------*- C++ -*-===//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7//===----------------------------------------------------------------------===//
8
9#ifndef LLVM_CODEGEN_REGISTER_H
10#define LLVM_CODEGEN_REGISTER_H
11
12#include "llvm/MC/MCRegister.h"
13#include <cassert>
14
15namespace llvm {
16
17/// Wrapper class representing virtual and physical registers. Should be passed
18/// by value.
19class Register {
20 unsigned Reg;
21
22public:
23 constexpr Register(unsigned Val = 0): Reg(Val) {}
24 constexpr Register(MCRegister Val): Reg(Val) {}
25
26 // Register numbers can represent physical registers, virtual registers, and
27 // sometimes stack slots. The unsigned values are divided into these ranges:
28 //
29 // 0 Not a register, can be used as a sentinel.
30 // [1;2^30) Physical registers assigned by TableGen.
31 // [2^30;2^31) Stack slots. (Rarely used.)
32 // [2^31;2^32) Virtual registers assigned by MachineRegisterInfo.
33 //
34 // Further sentinels can be allocated from the small negative integers.
35 // DenseMapInfo<unsigned> uses -1u and -2u.
36 static_assert(std::numeric_limits<decltype(Reg)>::max() >= 0xFFFFFFFF,
37 "Reg isn't large enough to hold full range.");
38
39 /// isStackSlot - Sometimes it is useful the be able to store a non-negative
40 /// frame index in a variable that normally holds a register. isStackSlot()
41 /// returns true if Reg is in the range used for stack slots.
42 ///
43 /// FIXME: remove in favor of member.
44 static bool isStackSlot(unsigned Reg) {
45 return MCRegister::isStackSlot(Reg);
46 }
47
48 /// Return true if this is a stack slot.
49 bool isStack() const { return MCRegister::isStackSlot(Reg); }
50
51 /// Compute the frame index from a register value representing a stack slot.
52 static int stackSlot2Index(Register Reg) {
53 assert(Reg.isStack() && "Not a stack slot")(static_cast <bool> (Reg.isStack() && "Not a stack slot"
) ? void (0) : __assert_fail ("Reg.isStack() && \"Not a stack slot\""
, "llvm/include/llvm/CodeGen/Register.h", 53, __extension__ __PRETTY_FUNCTION__
))
;
54 return int(Reg - MCRegister::FirstStackSlot);
55 }
56
57 /// Convert a non-negative frame index to a stack slot register value.
58 static Register index2StackSlot(int FI) {
59 assert(FI >= 0 && "Cannot hold a negative frame index.")(static_cast <bool> (FI >= 0 && "Cannot hold a negative frame index."
) ? void (0) : __assert_fail ("FI >= 0 && \"Cannot hold a negative frame index.\""
, "llvm/include/llvm/CodeGen/Register.h", 59, __extension__ __PRETTY_FUNCTION__
))
;
60 return Register(FI + MCRegister::FirstStackSlot);
61 }
62
63 /// Return true if the specified register number is in
64 /// the physical register namespace.
65 static bool isPhysicalRegister(unsigned Reg) {
66 return MCRegister::isPhysicalRegister(Reg);
67 }
68
69 /// Return true if the specified register number is in
70 /// the virtual register namespace.
71 static bool isVirtualRegister(unsigned Reg) {
72 return Reg & MCRegister::VirtualRegFlag && !isStackSlot(Reg);
73 }
74
75 /// Convert a virtual register number to a 0-based index.
76 /// The first virtual register in a function will get the index 0.
77 static unsigned virtReg2Index(Register Reg) {
78 assert(isVirtualRegister(Reg) && "Not a virtual register")(static_cast <bool> (isVirtualRegister(Reg) && "Not a virtual register"
) ? void (0) : __assert_fail ("isVirtualRegister(Reg) && \"Not a virtual register\""
, "llvm/include/llvm/CodeGen/Register.h", 78, __extension__ __PRETTY_FUNCTION__
))
;
79 return Reg & ~MCRegister::VirtualRegFlag;
80 }
81
82 /// Convert a 0-based index to a virtual register number.
83 /// This is the inverse operation of VirtReg2IndexFunctor below.
84 static Register index2VirtReg(unsigned Index) {
85 assert(Index < (1u << 31) && "Index too large for virtual register range.")(static_cast <bool> (Index < (1u << 31) &&
"Index too large for virtual register range.") ? void (0) : __assert_fail
("Index < (1u << 31) && \"Index too large for virtual register range.\""
, "llvm/include/llvm/CodeGen/Register.h", 85, __extension__ __PRETTY_FUNCTION__
))
;
86 return Index | MCRegister::VirtualRegFlag;
87 }
88
89 /// Return true if the specified register number is in the virtual register
90 /// namespace.
91 bool isVirtual() const {
92 return isVirtualRegister(Reg);
93 }
94
95 /// Return true if the specified register number is in the physical register
96 /// namespace.
97 bool isPhysical() const {
98 return isPhysicalRegister(Reg);
99 }
100
101 /// Convert a virtual register number to a 0-based index. The first virtual
102 /// register in a function will get the index 0.
103 unsigned virtRegIndex() const {
104 return virtReg2Index(Reg);
105 }
106
107 constexpr operator unsigned() const {
108 return Reg;
12
Returning zero, which participates in a condition later
109 }
110
111 unsigned id() const { return Reg; }
112
113 operator MCRegister() const {
114 return MCRegister(Reg);
115 }
116
117 /// Utility to check-convert this value to a MCRegister. The caller is
118 /// expected to have already validated that this Register is, indeed,
119 /// physical.
120 MCRegister asMCReg() const {
121 assert(Reg == MCRegister::NoRegister ||(static_cast <bool> (Reg == MCRegister::NoRegister || MCRegister
::isPhysicalRegister(Reg)) ? void (0) : __assert_fail ("Reg == MCRegister::NoRegister || MCRegister::isPhysicalRegister(Reg)"
, "llvm/include/llvm/CodeGen/Register.h", 122, __extension__ __PRETTY_FUNCTION__
))
122 MCRegister::isPhysicalRegister(Reg))(static_cast <bool> (Reg == MCRegister::NoRegister || MCRegister
::isPhysicalRegister(Reg)) ? void (0) : __assert_fail ("Reg == MCRegister::NoRegister || MCRegister::isPhysicalRegister(Reg)"
, "llvm/include/llvm/CodeGen/Register.h", 122, __extension__ __PRETTY_FUNCTION__
))
;
123 return MCRegister(Reg);
124 }
125
126 bool isValid() const { return Reg != MCRegister::NoRegister; }
127
128 /// Comparisons between register objects
129 bool operator==(const Register &Other) const { return Reg == Other.Reg; }
130 bool operator!=(const Register &Other) const { return Reg != Other.Reg; }
131 bool operator==(const MCRegister &Other) const { return Reg == Other.id(); }
132 bool operator!=(const MCRegister &Other) const { return Reg != Other.id(); }
133
134 /// Comparisons against register constants. E.g.
135 /// * R == AArch64::WZR
136 /// * R == 0
137 /// * R == VirtRegMap::NO_PHYS_REG
138 bool operator==(unsigned Other) const { return Reg == Other; }
20
Assuming 'Other' is equal to field 'Reg'
21
Returning the value 1, which participates in a condition later
139 bool operator!=(unsigned Other) const { return Reg != Other; }
140 bool operator==(int Other) const { return Reg == unsigned(Other); }
141 bool operator!=(int Other) const { return Reg != unsigned(Other); }
142 // MSVC requires that we explicitly declare these two as well.
143 bool operator==(MCPhysReg Other) const { return Reg == unsigned(Other); }
144 bool operator!=(MCPhysReg Other) const { return Reg != unsigned(Other); }
145};
146
147// Provide DenseMapInfo for Register
148template<> struct DenseMapInfo<Register> {
149 static inline unsigned getEmptyKey() {
150 return DenseMapInfo<unsigned>::getEmptyKey();
151 }
152 static inline unsigned getTombstoneKey() {
153 return DenseMapInfo<unsigned>::getTombstoneKey();
154 }
155 static unsigned getHashValue(const Register &Val) {
156 return DenseMapInfo<unsigned>::getHashValue(Val.id());
157 }
158 static bool isEqual(const Register &LHS, const Register &RHS) {
159 return DenseMapInfo<unsigned>::isEqual(LHS.id(), RHS.id());
160 }
161};
162
163}
164
165#endif // LLVM_CODEGEN_REGISTER_H

/build/llvm-toolchain-snapshot-14~++20220118101002+ec47dba1c8a2/llvm/include/llvm/CodeGen/TargetInstrInfo.h

1//===- llvm/CodeGen/TargetInstrInfo.h - Instruction Info --------*- C++ -*-===//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7//===----------------------------------------------------------------------===//
8//
9// This file describes the target machine instruction set to the code generator.
10//
11//===----------------------------------------------------------------------===//
12
13#ifndef LLVM_CODEGEN_TARGETINSTRINFO_H
14#define LLVM_CODEGEN_TARGETINSTRINFO_H
15
16#include "llvm/ADT/ArrayRef.h"
17#include "llvm/ADT/DenseMap.h"
18#include "llvm/ADT/DenseMapInfo.h"
19#include "llvm/ADT/None.h"
20#include "llvm/CodeGen/MIRFormatter.h"
21#include "llvm/CodeGen/MachineBasicBlock.h"
22#include "llvm/CodeGen/MachineCombinerPattern.h"
23#include "llvm/CodeGen/MachineFunction.h"
24#include "llvm/CodeGen/MachineInstr.h"
25#include "llvm/CodeGen/MachineInstrBuilder.h"
26#include "llvm/CodeGen/MachineOperand.h"
27#include "llvm/CodeGen/MachineOutliner.h"
28#include "llvm/CodeGen/RegisterClassInfo.h"
29#include "llvm/CodeGen/VirtRegMap.h"
30#include "llvm/MC/MCInstrInfo.h"
31#include "llvm/Support/BranchProbability.h"
32#include "llvm/Support/ErrorHandling.h"
33#include <cassert>
34#include <cstddef>
35#include <cstdint>
36#include <utility>
37#include <vector>
38
39namespace llvm {
40
41class AAResults;
42class DFAPacketizer;
43class InstrItineraryData;
44class LiveIntervals;
45class LiveVariables;
46class MachineLoop;
47class MachineMemOperand;
48class MachineRegisterInfo;
49class MCAsmInfo;
50class MCInst;
51struct MCSchedModel;
52class Module;
53class ScheduleDAG;
54class ScheduleDAGMI;
55class ScheduleHazardRecognizer;
56class SDNode;
57class SelectionDAG;
58class RegScavenger;
59class TargetRegisterClass;
60class TargetRegisterInfo;
61class TargetSchedModel;
62class TargetSubtargetInfo;
63
64template <class T> class SmallVectorImpl;
65
66using ParamLoadedValue = std::pair<MachineOperand, DIExpression*>;
67
68struct DestSourcePair {
69 const MachineOperand *Destination;
70 const MachineOperand *Source;
71
72 DestSourcePair(const MachineOperand &Dest, const MachineOperand &Src)
73 : Destination(&Dest), Source(&Src) {}
74};
75
76/// Used to describe a register and immediate addition.
77struct RegImmPair {
78 Register Reg;
79 int64_t Imm;
80
81 RegImmPair(Register Reg, int64_t Imm) : Reg(Reg), Imm(Imm) {}
82};
83
84/// Used to describe addressing mode similar to ExtAddrMode in CodeGenPrepare.
85/// It holds the register values, the scale value and the displacement.
86struct ExtAddrMode {
87 Register BaseReg;
88 Register ScaledReg;
89 int64_t Scale;
90 int64_t Displacement;
91};
92
93//---------------------------------------------------------------------------
94///
95/// TargetInstrInfo - Interface to description of machine instruction set
96///
97class TargetInstrInfo : public MCInstrInfo {
98public:
99 TargetInstrInfo(unsigned CFSetupOpcode = ~0u, unsigned CFDestroyOpcode = ~0u,
100 unsigned CatchRetOpcode = ~0u, unsigned ReturnOpcode = ~0u)
101 : CallFrameSetupOpcode(CFSetupOpcode),
102 CallFrameDestroyOpcode(CFDestroyOpcode), CatchRetOpcode(CatchRetOpcode),
103 ReturnOpcode(ReturnOpcode) {}
104 TargetInstrInfo(const TargetInstrInfo &) = delete;
105 TargetInstrInfo &operator=(const TargetInstrInfo &) = delete;
106 virtual ~TargetInstrInfo();
107
108 static bool isGenericOpcode(unsigned Opc) {
109 return Opc <= TargetOpcode::GENERIC_OP_END;
110 }
111
112 /// Given a machine instruction descriptor, returns the register
113 /// class constraint for OpNum, or NULL.
114 virtual
115 const TargetRegisterClass *getRegClass(const MCInstrDesc &MCID, unsigned OpNum,
116 const TargetRegisterInfo *TRI,
117 const MachineFunction &MF) const;
118
119 /// Return true if the instruction is trivially rematerializable, meaning it
120 /// has no side effects and requires no operands that aren't always available.
121 /// This means the only allowed uses are constants and unallocatable physical
122 /// registers so that the instructions result is independent of the place
123 /// in the function.
124 bool isTriviallyReMaterializable(const MachineInstr &MI,
125 AAResults *AA = nullptr) const {
126 return MI.getOpcode() == TargetOpcode::IMPLICIT_DEF ||
127 (MI.getDesc().isRematerializable() &&
128 (isReallyTriviallyReMaterializable(MI, AA) ||
129 isReallyTriviallyReMaterializableGeneric(MI, AA)));
130 }
131
132 /// Given \p MO is a PhysReg use return if it can be ignored for the purpose
133 /// of instruction rematerialization or sinking.
134 virtual bool isIgnorableUse(const MachineOperand &MO) const {
135 return false;
136 }
137
138protected:
139 /// For instructions with opcodes for which the M_REMATERIALIZABLE flag is
140 /// set, this hook lets the target specify whether the instruction is actually
141 /// trivially rematerializable, taking into consideration its operands. This
142 /// predicate must return false if the instruction has any side effects other
143 /// than producing a value, or if it requres any address registers that are
144 /// not always available.
145 /// Requirements must be check as stated in isTriviallyReMaterializable() .
146 virtual bool isReallyTriviallyReMaterializable(const MachineInstr &MI,
147 AAResults *AA) const {
148 return false;
149 }
150
151 /// This method commutes the operands of the given machine instruction MI.
152 /// The operands to be commuted are specified by their indices OpIdx1 and
153 /// OpIdx2.
154 ///
155 /// If a target has any instructions that are commutable but require
156 /// converting to different instructions or making non-trivial changes
157 /// to commute them, this method can be overridden to do that.
158 /// The default implementation simply swaps the commutable operands.
159 ///
160 /// If NewMI is false, MI is modified in place and returned; otherwise, a
161 /// new machine instruction is created and returned.
162 ///
163 /// Do not call this method for a non-commutable instruction.
164 /// Even though the instruction is commutable, the method may still
165 /// fail to commute the operands, null pointer is returned in such cases.
166 virtual MachineInstr *commuteInstructionImpl(MachineInstr &MI, bool NewMI,
167 unsigned OpIdx1,
168 unsigned OpIdx2) const;
169
170 /// Assigns the (CommutableOpIdx1, CommutableOpIdx2) pair of commutable
171 /// operand indices to (ResultIdx1, ResultIdx2).
172 /// One or both input values of the pair: (ResultIdx1, ResultIdx2) may be
173 /// predefined to some indices or be undefined (designated by the special
174 /// value 'CommuteAnyOperandIndex').
175 /// The predefined result indices cannot be re-defined.
176 /// The function returns true iff after the result pair redefinition
177 /// the fixed result pair is equal to or equivalent to the source pair of
178 /// indices: (CommutableOpIdx1, CommutableOpIdx2). It is assumed here that
179 /// the pairs (x,y) and (y,x) are equivalent.
180 static bool fixCommutedOpIndices(unsigned &ResultIdx1, unsigned &ResultIdx2,
181 unsigned CommutableOpIdx1,
182 unsigned CommutableOpIdx2);
183
184private:
185 /// For instructions with opcodes for which the M_REMATERIALIZABLE flag is
186 /// set and the target hook isReallyTriviallyReMaterializable returns false,
187 /// this function does target-independent tests to determine if the
188 /// instruction is really trivially rematerializable.
189 bool isReallyTriviallyReMaterializableGeneric(const MachineInstr &MI,
190 AAResults *AA) const;
191
192public:
193 /// These methods return the opcode of the frame setup/destroy instructions
194 /// if they exist (-1 otherwise). Some targets use pseudo instructions in
195 /// order to abstract away the difference between operating with a frame
196 /// pointer and operating without, through the use of these two instructions.
197 ///
198 unsigned getCallFrameSetupOpcode() const { return CallFrameSetupOpcode; }
199 unsigned getCallFrameDestroyOpcode() const { return CallFrameDestroyOpcode; }
200
201 /// Returns true if the argument is a frame pseudo instruction.
202 bool isFrameInstr(const MachineInstr &I) const {
203 return I.getOpcode() == getCallFrameSetupOpcode() ||
204 I.getOpcode() == getCallFrameDestroyOpcode();
205 }
206
207 /// Returns true if the argument is a frame setup pseudo instruction.
208 bool isFrameSetup(const MachineInstr &I) const {
209 return I.getOpcode() == getCallFrameSetupOpcode();
210 }
211
212 /// Returns size of the frame associated with the given frame instruction.
213 /// For frame setup instruction this is frame that is set up space set up
214 /// after the instruction. For frame destroy instruction this is the frame
215 /// freed by the caller.
216 /// Note, in some cases a call frame (or a part of it) may be prepared prior
217 /// to the frame setup instruction. It occurs in the calls that involve
218 /// inalloca arguments. This function reports only the size of the frame part
219 /// that is set up between the frame setup and destroy pseudo instructions.
220 int64_t getFrameSize(const MachineInstr &I) const {
221 assert(isFrameInstr(I) && "Not a frame instruction")(static_cast <bool> (isFrameInstr(I) && "Not a frame instruction"
) ? void (0) : __assert_fail ("isFrameInstr(I) && \"Not a frame instruction\""
, "llvm/include/llvm/CodeGen/TargetInstrInfo.h", 221, __extension__
__PRETTY_FUNCTION__))
;
222 assert(I.getOperand(0).getImm() >= 0)(static_cast <bool> (I.getOperand(0).getImm() >= 0) ?
void (0) : __assert_fail ("I.getOperand(0).getImm() >= 0"
, "llvm/include/llvm/CodeGen/TargetInstrInfo.h", 222, __extension__
__PRETTY_FUNCTION__))
;
223 return I.getOperand(0).getImm();
224 }
225
226 /// Returns the total frame size, which is made up of the space set up inside
227 /// the pair of frame start-stop instructions and the space that is set up
228 /// prior to the pair.
229 int64_t getFrameTotalSize(const MachineInstr &I) const {
230 if (isFrameSetup(I)) {
231 assert(I.getOperand(1).getImm() >= 0 &&(static_cast <bool> (I.getOperand(1).getImm() >= 0 &&
"Frame size must not be negative") ? void (0) : __assert_fail
("I.getOperand(1).getImm() >= 0 && \"Frame size must not be negative\""
, "llvm/include/llvm/CodeGen/TargetInstrInfo.h", 232, __extension__
__PRETTY_FUNCTION__))
232 "Frame size must not be negative")(static_cast <bool> (I.getOperand(1).getImm() >= 0 &&
"Frame size must not be negative") ? void (0) : __assert_fail
("I.getOperand(1).getImm() >= 0 && \"Frame size must not be negative\""
, "llvm/include/llvm/CodeGen/TargetInstrInfo.h", 232, __extension__
__PRETTY_FUNCTION__))
;
233 return getFrameSize(I) + I.getOperand(1).getImm();
234 }
235 return getFrameSize(I);
236 }
237
238 unsigned getCatchReturnOpcode() const { return CatchRetOpcode; }
239 unsigned getReturnOpcode() const { return ReturnOpcode; }
240
241 /// Returns the actual stack pointer adjustment made by an instruction
242 /// as part of a call sequence. By default, only call frame setup/destroy
243 /// instructions adjust the stack, but targets may want to override this
244 /// to enable more fine-grained adjustment, or adjust by a different value.
245 virtual int getSPAdjust(const MachineInstr &MI) const;
246
247 /// Return true if the instruction is a "coalescable" extension instruction.
248 /// That is, it's like a copy where it's legal for the source to overlap the
249 /// destination. e.g. X86::MOVSX64rr32. If this returns true, then it's
250 /// expected the pre-extension value is available as a subreg of the result
251 /// register. This also returns the sub-register index in SubIdx.
252 virtual bool isCoalescableExtInstr(const MachineInstr &MI, Register &SrcReg,
253 Register &DstReg, unsigned &SubIdx) const {
254 return false;
255 }
256
257 /// If the specified machine instruction is a direct
258 /// load from a stack slot, return the virtual or physical register number of
259 /// the destination along with the FrameIndex of the loaded stack slot. If
260 /// not, return 0. This predicate must return 0 if the instruction has
261 /// any side effects other than loading from the stack slot.
262 virtual unsigned isLoadFromStackSlot(const MachineInstr &MI,
263 int &FrameIndex) const {
264 return 0;
17
Returning without writing to 'FrameIndex'
265 }
266
267 /// Optional extension of isLoadFromStackSlot that returns the number of
268 /// bytes loaded from the stack. This must be implemented if a backend
269 /// supports partial stack slot spills/loads to further disambiguate
270 /// what the load does.
271 virtual unsigned isLoadFromStackSlot(const MachineInstr &MI,
272 int &FrameIndex,
273 unsigned &MemBytes) const {
274 MemBytes = 0;
275 return isLoadFromStackSlot(MI, FrameIndex);
276 }
277
278 /// Check for post-frame ptr elimination stack locations as well.
279 /// This uses a heuristic so it isn't reliable for correctness.
280 virtual unsigned isLoadFromStackSlotPostFE(const MachineInstr &MI,
281 int &FrameIndex) const {
282 return 0;
283 }
284
285 /// If the specified machine instruction has a load from a stack slot,
286 /// return true along with the FrameIndices of the loaded stack slot and the
287 /// machine mem operands containing the reference.
288 /// If not, return false. Unlike isLoadFromStackSlot, this returns true for
289 /// any instruction that loads from the stack. This is just a hint, as some
290 /// cases may be missed.
291 virtual bool hasLoadFromStackSlot(
292 const MachineInstr &MI,
293 SmallVectorImpl<const MachineMemOperand *> &Accesses) const;
294
295 /// If the specified machine instruction is a direct
296 /// store to a stack slot, return the virtual or physical register number of
297 /// the source reg along with the FrameIndex of the stored stack slot. If
298 /// not, return 0. This predicate must return 0 if the instruction has
299 /// any side effects other than storing to the stack slot.
300 virtual unsigned isStoreToStackSlot(const MachineInstr &MI,
301 int &FrameIndex) const {
302 return 0;
303 }
304
305 /// Optional extension of isStoreToStackSlot that returns the number of
306 /// bytes stored to the stack. This must be implemented if a backend
307 /// supports partial stack slot spills/loads to further disambiguate
308 /// what the store does.
309 virtual unsigned isStoreToStackSlot(const MachineInstr &MI,
310 int &FrameIndex,
311 unsigned &MemBytes) const {
312 MemBytes = 0;
313 return isStoreToStackSlot(MI, FrameIndex);
314 }
315
316 /// Check for post-frame ptr elimination stack locations as well.
317 /// This uses a heuristic, so it isn't reliable for correctness.
318 virtual unsigned isStoreToStackSlotPostFE(const MachineInstr &MI,
319 int &FrameIndex) const {
320 return 0;
321 }
322
323 /// If the specified machine instruction has a store to a stack slot,
324 /// return true along with the FrameIndices of the stored stack slot and the
325 /// machine mem operands containing the reference.
326 /// If not, return false. Unlike isStoreToStackSlot,
327 /// this returns true for any instruction that stores to the
328 /// stack. This is just a hint, as some cases may be missed.
329 virtual bool hasStoreToStackSlot(
330 const MachineInstr &MI,
331 SmallVectorImpl<const MachineMemOperand *> &Accesses) const;
332
333 /// Return true if the specified machine instruction
334 /// is a copy of one stack slot to another and has no other effect.
335 /// Provide the identity of the two frame indices.
336 virtual bool isStackSlotCopy(const MachineInstr &MI, int &DestFrameIndex,
337 int &SrcFrameIndex) const {
338 return false;
339 }
340
341 /// Compute the size in bytes and offset within a stack slot of a spilled
342 /// register or subregister.
343 ///
344 /// \param [out] Size in bytes of the spilled value.
345 /// \param [out] Offset in bytes within the stack slot.
346 /// \returns true if both Size and Offset are successfully computed.
347 ///
348 /// Not all subregisters have computable spill slots. For example,
349 /// subregisters may not be byte-sized, and a pair of discontiguous
350 /// subregisters has no single offset.
351 ///
352 /// Targets with nontrivial bigendian implementations may need to override
353 /// this, particularly to support spilled vector registers.
354 virtual bool getStackSlotRange(const TargetRegisterClass *RC, unsigned SubIdx,
355 unsigned &Size, unsigned &Offset,
356 const MachineFunction &MF) const;
357
358 /// Return true if the given instruction is a terminator that is unspillable,
359 /// according to isUnspillableTerminatorImpl.
360 bool isUnspillableTerminator(const MachineInstr *MI) const {
361 return MI->isTerminator() && isUnspillableTerminatorImpl(MI);
362 }
363
364 /// Returns the size in bytes of the specified MachineInstr, or ~0U
365 /// when this function is not implemented by a target.
366 virtual unsigned getInstSizeInBytes(const MachineInstr &MI) const {
367 return ~0U;
368 }
369
370 /// Return true if the instruction is as cheap as a move instruction.
371 ///
372 /// Targets for different archs need to override this, and different
373 /// micro-architectures can also be finely tuned inside.
374 virtual bool isAsCheapAsAMove(const MachineInstr &MI) const {
375 return MI.isAsCheapAsAMove();
376 }
377
378 /// Return true if the instruction should be sunk by MachineSink.
379 ///
380 /// MachineSink determines on its own whether the instruction is safe to sink;
381 /// this gives the target a hook to override the default behavior with regards
382 /// to which instructions should be sunk.
383 virtual bool shouldSink(const MachineInstr &MI) const { return true; }
384
385 /// Re-issue the specified 'original' instruction at the
386 /// specific location targeting a new destination register.
387 /// The register in Orig->getOperand(0).getReg() will be substituted by
388 /// DestReg:SubIdx. Any existing subreg index is preserved or composed with
389 /// SubIdx.
390 virtual void reMaterialize(MachineBasicBlock &MBB,
391 MachineBasicBlock::iterator MI, Register DestReg,
392 unsigned SubIdx, const MachineInstr &Orig,
393 const TargetRegisterInfo &TRI) const;
394
395 /// Clones instruction or the whole instruction bundle \p Orig and
396 /// insert into \p MBB before \p InsertBefore. The target may update operands
397 /// that are required to be unique.
398 ///
399 /// \p Orig must not return true for MachineInstr::isNotDuplicable().
400 virtual MachineInstr &duplicate(MachineBasicBlock &MBB,
401 MachineBasicBlock::iterator InsertBefore,
402 const MachineInstr &Orig) const;
403
404 /// This method must be implemented by targets that
405 /// set the M_CONVERTIBLE_TO_3_ADDR flag. When this flag is set, the target
406 /// may be able to convert a two-address instruction into one or more true
407 /// three-address instructions on demand. This allows the X86 target (for
408 /// example) to convert ADD and SHL instructions into LEA instructions if they
409 /// would require register copies due to two-addressness.
410 ///
411 /// This method returns a null pointer if the transformation cannot be
412 /// performed, otherwise it returns the last new instruction.
413 ///
414 /// If \p LIS is not nullptr, the LiveIntervals info should be updated for
415 /// replacing \p MI with new instructions, even though this function does not
416 /// remove MI.
417 virtual MachineInstr *convertToThreeAddress(MachineInstr &MI,
418 LiveVariables *LV,
419 LiveIntervals *LIS) const {
420 return nullptr;
421 }
422
423 // This constant can be used as an input value of operand index passed to
424 // the method findCommutedOpIndices() to tell the method that the
425 // corresponding operand index is not pre-defined and that the method
426 // can pick any commutable operand.
427 static const unsigned CommuteAnyOperandIndex = ~0U;
428
429 /// This method commutes the operands of the given machine instruction MI.
430 ///
431 /// The operands to be commuted are specified by their indices OpIdx1 and
432 /// OpIdx2. OpIdx1 and OpIdx2 arguments may be set to a special value
433 /// 'CommuteAnyOperandIndex', which means that the method is free to choose
434 /// any arbitrarily chosen commutable operand. If both arguments are set to
435 /// 'CommuteAnyOperandIndex' then the method looks for 2 different commutable
436 /// operands; then commutes them if such operands could be found.
437 ///
438 /// If NewMI is false, MI is modified in place and returned; otherwise, a
439 /// new machine instruction is created and returned.
440 ///
441 /// Do not call this method for a non-commutable instruction or
442 /// for non-commutable operands.
443 /// Even though the instruction is commutable, the method may still
444 /// fail to commute the operands, null pointer is returned in such cases.
445 MachineInstr *
446 commuteInstruction(MachineInstr &MI, bool NewMI = false,
447 unsigned OpIdx1 = CommuteAnyOperandIndex,
448 unsigned OpIdx2 = CommuteAnyOperandIndex) const;
449
450 /// Returns true iff the routine could find two commutable operands in the
451 /// given machine instruction.
452 /// The 'SrcOpIdx1' and 'SrcOpIdx2' are INPUT and OUTPUT arguments.
453 /// If any of the INPUT values is set to the special value
454 /// 'CommuteAnyOperandIndex' then the method arbitrarily picks a commutable
455 /// operand, then returns its index in the corresponding argument.
456 /// If both of INPUT values are set to 'CommuteAnyOperandIndex' then method
457 /// looks for 2 commutable operands.
458 /// If INPUT values refer to some operands of MI, then the method simply
459 /// returns true if the corresponding operands are commutable and returns
460 /// false otherwise.
461 ///
462 /// For example, calling this method this way:
463 /// unsigned Op1 = 1, Op2 = CommuteAnyOperandIndex;
464 /// findCommutedOpIndices(MI, Op1, Op2);
465 /// can be interpreted as a query asking to find an operand that would be
466 /// commutable with the operand#1.
467 virtual bool findCommutedOpIndices(const MachineInstr &MI,
468 unsigned &SrcOpIdx1,
469 unsigned &SrcOpIdx2) const;
470
471 /// Returns true if the target has a preference on the operands order of
472 /// the given machine instruction. And specify if \p Commute is required to
473 /// get the desired operands order.
474 virtual bool hasCommutePreference(MachineInstr &MI, bool &Commute) const {
475 return false;
476 }
477
478 /// A pair composed of a register and a sub-register index.
479 /// Used to give some type checking when modeling Reg:SubReg.
480 struct RegSubRegPair {
481 Register Reg;
482 unsigned SubReg;
483
484 RegSubRegPair(Register Reg = Register(), unsigned SubReg = 0)
485 : Reg(Reg), SubReg(SubReg) {}
486
487 bool operator==(const RegSubRegPair& P) const {
488 return Reg == P.Reg && SubReg == P.SubReg;
489 }
490 bool operator!=(const RegSubRegPair& P) const {
491 return !(*this == P);
492 }
493 };
494
495 /// A pair composed of a pair of a register and a sub-register index,
496 /// and another sub-register index.
497 /// Used to give some type checking when modeling Reg:SubReg1, SubReg2.
498 struct RegSubRegPairAndIdx : RegSubRegPair {
499 unsigned SubIdx;
500
501 RegSubRegPairAndIdx(Register Reg = Register(), unsigned SubReg = 0,
502 unsigned SubIdx = 0)
503 : RegSubRegPair(Reg, SubReg), SubIdx(SubIdx) {}
504 };
505
506 /// Build the equivalent inputs of a REG_SEQUENCE for the given \p MI
507 /// and \p DefIdx.
508 /// \p [out] InputRegs of the equivalent REG_SEQUENCE. Each element of
509 /// the list is modeled as <Reg:SubReg, SubIdx>. Operands with the undef
510 /// flag are not added to this list.
511 /// E.g., REG_SEQUENCE %1:sub1, sub0, %2, sub1 would produce
512 /// two elements:
513 /// - %1:sub1, sub0
514 /// - %2<:0>, sub1
515 ///
516 /// \returns true if it is possible to build such an input sequence
517 /// with the pair \p MI, \p DefIdx. False otherwise.
518 ///
519 /// \pre MI.isRegSequence() or MI.isRegSequenceLike().
520 ///
521 /// \note The generic implementation does not provide any support for
522 /// MI.isRegSequenceLike(). In other words, one has to override
523 /// getRegSequenceLikeInputs for target specific instructions.
524 bool
525 getRegSequenceInputs(const MachineInstr &MI, unsigned DefIdx,
526 SmallVectorImpl<RegSubRegPairAndIdx> &InputRegs) const;
527
528 /// Build the equivalent inputs of an EXTRACT_SUBREG for the given \p MI
529 /// and \p DefIdx.
530 /// \p [out] InputReg of the equivalent EXTRACT_SUBREG.
531 /// E.g., EXTRACT_SUBREG %1:sub1, sub0, sub1 would produce:
532 /// - %1:sub1, sub0
533 ///
534 /// \returns true if it is possible to build such an input sequence
535 /// with the pair \p MI, \p DefIdx and the operand has no undef flag set.
536 /// False otherwise.
537 ///
538 /// \pre MI.isExtractSubreg() or MI.isExtractSubregLike().
539 ///
540 /// \note The generic implementation does not provide any support for
541 /// MI.isExtractSubregLike(). In other words, one has to override
542 /// getExtractSubregLikeInputs for target specific instructions.
543 bool getExtractSubregInputs(const MachineInstr &MI, unsigned DefIdx,
544 RegSubRegPairAndIdx &InputReg) const;
545
546 /// Build the equivalent inputs of an INSERT_SUBREG for the given \p MI
547 /// and \p DefIdx.
548 /// \p [out] BaseReg and \p [out] InsertedReg contain
549 /// the equivalent inputs of INSERT_SUBREG.
550 /// E.g., INSERT_SUBREG %0:sub0, %1:sub1, sub3 would produce:
551 /// - BaseReg: %0:sub0
552 /// - InsertedReg: %1:sub1, sub3
553 ///
554 /// \returns true if it is possible to build such an input sequence
555 /// with the pair \p MI, \p DefIdx and the operand has no undef flag set.
556 /// False otherwise.
557 ///
558 /// \pre MI.isInsertSubreg() or MI.isInsertSubregLike().
559 ///
560 /// \note The generic implementation does not provide any support for
561 /// MI.isInsertSubregLike(). In other words, one has to override
562 /// getInsertSubregLikeInputs for target specific instructions.
563 bool getInsertSubregInputs(const MachineInstr &MI, unsigned DefIdx,
564 RegSubRegPair &BaseReg,
565 RegSubRegPairAndIdx &InsertedReg) const;
566
567 /// Return true if two machine instructions would produce identical values.
568 /// By default, this is only true when the two instructions
569 /// are deemed identical except for defs. If this function is called when the
570 /// IR is still in SSA form, the caller can pass the MachineRegisterInfo for
571 /// aggressive checks.
572 virtual bool produceSameValue(const MachineInstr &MI0,
573 const MachineInstr &MI1,
574 const MachineRegisterInfo *MRI = nullptr) const;
575
576 /// \returns true if a branch from an instruction with opcode \p BranchOpc
577 /// is capable of jumping to a position \p BrOffset bytes away.
578 virtual bool isBranchOffsetInRange(unsigned BranchOpc,
579 int64_t BrOffset) const {
580 llvm_unreachable("target did not implement")::llvm::llvm_unreachable_internal("target did not implement",
"llvm/include/llvm/CodeGen/TargetInstrInfo.h", 580)
;
581 }
582
583 /// \returns The block that branch instruction \p MI jumps to.
584 virtual MachineBasicBlock *getBranchDestBlock(const MachineInstr &MI) const {
585 llvm_unreachable("target did not implement")::llvm::llvm_unreachable_internal("target did not implement",
"llvm/include/llvm/CodeGen/TargetInstrInfo.h", 585)
;
586 }
587
588 /// Insert an unconditional indirect branch at the end of \p MBB to \p
589 /// NewDestBB. Optionally, insert the clobbered register restoring in \p
590 /// RestoreBB. \p BrOffset indicates the offset of \p NewDestBB relative to
591 /// the offset of the position to insert the new branch.
592 virtual void insertIndirectBranch(MachineBasicBlock &MBB,
593 MachineBasicBlock &NewDestBB,
594 MachineBasicBlock &RestoreBB,
595 const DebugLoc &DL, int64_t BrOffset = 0,
596 RegScavenger *RS = nullptr) const {
597 llvm_unreachable("target did not implement")::llvm::llvm_unreachable_internal("target did not implement",
"llvm/include/llvm/CodeGen/TargetInstrInfo.h", 597)
;
598 }
599
600 /// Analyze the branching code at the end of MBB, returning
601 /// true if it cannot be understood (e.g. it's a switch dispatch or isn't
602 /// implemented for a target). Upon success, this returns false and returns
603 /// with the following information in various cases:
604 ///
605 /// 1. If this block ends with no branches (it just falls through to its succ)
606 /// just return false, leaving TBB/FBB null.
607 /// 2. If this block ends with only an unconditional branch, it sets TBB to be
608 /// the destination block.
609 /// 3. If this block ends with a conditional branch and it falls through to a
610 /// successor block, it sets TBB to be the branch destination block and a
611 /// list of operands that evaluate the condition. These operands can be
612 /// passed to other TargetInstrInfo methods to create new branches.
613 /// 4. If this block ends with a conditional branch followed by an
614 /// unconditional branch, it returns the 'true' destination in TBB, the
615 /// 'false' destination in FBB, and a list of operands that evaluate the
616 /// condition. These operands can be passed to other TargetInstrInfo
617 /// methods to create new branches.
618 ///
619 /// Note that removeBranch and insertBranch must be implemented to support
620 /// cases where this method returns success.
621 ///
622 /// If AllowModify is true, then this routine is allowed to modify the basic
623 /// block (e.g. delete instructions after the unconditional branch).
624 ///
625 /// The CFG information in MBB.Predecessors and MBB.Successors must be valid
626 /// before calling this function.
627 virtual bool analyzeBranch(MachineBasicBlock &MBB, MachineBasicBlock *&TBB,
628 MachineBasicBlock *&FBB,
629 SmallVectorImpl<MachineOperand> &Cond,
630 bool AllowModify = false) const {
631 return true;
632 }
633
634 /// Represents a predicate at the MachineFunction level. The control flow a
635 /// MachineBranchPredicate represents is:
636 ///
637 /// Reg = LHS `Predicate` RHS == ConditionDef
638 /// if Reg then goto TrueDest else goto FalseDest
639 ///
640 struct MachineBranchPredicate {
641 enum ComparePredicate {
642 PRED_EQ, // True if two values are equal
643 PRED_NE, // True if two values are not equal
644 PRED_INVALID // Sentinel value
645 };
646
647 ComparePredicate Predicate = PRED_INVALID;
648 MachineOperand LHS = MachineOperand::CreateImm(0);
649 MachineOperand RHS = MachineOperand::CreateImm(0);
650 MachineBasicBlock *TrueDest = nullptr;
651 MachineBasicBlock *FalseDest = nullptr;
652 MachineInstr *ConditionDef = nullptr;
653
654 /// SingleUseCondition is true if ConditionDef is dead except for the
655 /// branch(es) at the end of the basic block.
656 ///
657 bool SingleUseCondition = false;
658
659 explicit MachineBranchPredicate() = default;
660 };
661
662 /// Analyze the branching code at the end of MBB and parse it into the
663 /// MachineBranchPredicate structure if possible. Returns false on success
664 /// and true on failure.
665 ///
666 /// If AllowModify is true, then this routine is allowed to modify the basic
667 /// block (e.g. delete instructions after the unconditional branch).
668 ///
669 virtual bool analyzeBranchPredicate(MachineBasicBlock &MBB,
670 MachineBranchPredicate &MBP,
671 bool AllowModify = false) const {
672 return true;
673 }
674
675 /// Remove the branching code at the end of the specific MBB.
676 /// This is only invoked in cases where analyzeBranch returns success. It
677 /// returns the number of instructions that were removed.
678 /// If \p BytesRemoved is non-null, report the change in code size from the
679 /// removed instructions.
680 virtual unsigned removeBranch(MachineBasicBlock &MBB,
681 int *BytesRemoved = nullptr) const {
682 llvm_unreachable("Target didn't implement TargetInstrInfo::removeBranch!")::llvm::llvm_unreachable_internal("Target didn't implement TargetInstrInfo::removeBranch!"
, "llvm/include/llvm/CodeGen/TargetInstrInfo.h", 682)
;
683 }
684
685 /// Insert branch code into the end of the specified MachineBasicBlock. The
686 /// operands to this method are the same as those returned by analyzeBranch.
687 /// This is only invoked in cases where analyzeBranch returns success. It
688 /// returns the number of instructions inserted. If \p BytesAdded is non-null,
689 /// report the change in code size from the added instructions.
690 ///
691 /// It is also invoked by tail merging to add unconditional branches in
692 /// cases where analyzeBranch doesn't apply because there was no original
693 /// branch to analyze. At least this much must be implemented, else tail
694 /// merging needs to be disabled.
695 ///
696 /// The CFG information in MBB.Predecessors and MBB.Successors must be valid
697 /// before calling this function.
698 virtual unsigned insertBranch(MachineBasicBlock &MBB, MachineBasicBlock *TBB,
699 MachineBasicBlock *FBB,
700 ArrayRef<MachineOperand> Cond,
701 const DebugLoc &DL,
702 int *BytesAdded = nullptr) const {
703 llvm_unreachable("Target didn't implement TargetInstrInfo::insertBranch!")::llvm::llvm_unreachable_internal("Target didn't implement TargetInstrInfo::insertBranch!"
, "llvm/include/llvm/CodeGen/TargetInstrInfo.h", 703)
;
704 }
705
706 unsigned insertUnconditionalBranch(MachineBasicBlock &MBB,
707 MachineBasicBlock *DestBB,
708 const DebugLoc &DL,
709 int *BytesAdded = nullptr) const {
710 return insertBranch(MBB, DestBB, nullptr, ArrayRef<MachineOperand>(), DL,
711 BytesAdded);
712 }
713
714 /// Object returned by analyzeLoopForPipelining. Allows software pipelining
715 /// implementations to query attributes of the loop being pipelined and to
716 /// apply target-specific updates to the loop once pipelining is complete.
717 class PipelinerLoopInfo {
718 public:
719 virtual ~PipelinerLoopInfo();
720 /// Return true if the given instruction should not be pipelined and should
721 /// be ignored. An example could be a loop comparison, or induction variable
722 /// update with no users being pipelined.
723 virtual bool shouldIgnoreForPipelining(const MachineInstr *MI) const = 0;
724
725 /// Create a condition to determine if the trip count of the loop is greater
726 /// than TC.
727 ///
728 /// If the trip count is statically known to be greater than TC, return
729 /// true. If the trip count is statically known to be not greater than TC,
730 /// return false. Otherwise return nullopt and fill out Cond with the test
731 /// condition.
732 virtual Optional<bool>
733 createTripCountGreaterCondition(int TC, MachineBasicBlock &MBB,
734 SmallVectorImpl<MachineOperand> &Cond) = 0;
735
736 /// Modify the loop such that the trip count is
737 /// OriginalTC + TripCountAdjust.
738 virtual void adjustTripCount(int TripCountAdjust) = 0;
739
740 /// Called when the loop's preheader has been modified to NewPreheader.
741 virtual void setPreheader(MachineBasicBlock *NewPreheader) = 0;
742
743 /// Called when the loop is being removed. Any instructions in the preheader
744 /// should be removed.
745 ///
746 /// Once this function is called, no other functions on this object are
747 /// valid; the loop has been removed.
748 virtual void disposed() = 0;
749 };
750
751 /// Analyze loop L, which must be a single-basic-block loop, and if the
752 /// conditions can be understood enough produce a PipelinerLoopInfo object.
753 virtual std::unique_ptr<PipelinerLoopInfo>
754 analyzeLoopForPipelining(MachineBasicBlock *LoopBB) const {
755 return nullptr;
756 }
757
758 /// Analyze the loop code, return true if it cannot be understood. Upon
759 /// success, this function returns false and returns information about the
760 /// induction variable and compare instruction used at the end.
761 virtual bool analyzeLoop(MachineLoop &L, MachineInstr *&IndVarInst,
762 MachineInstr *&CmpInst) const {
763 return true;
764 }
765
766 /// Generate code to reduce the loop iteration by one and check if the loop
767 /// is finished. Return the value/register of the new loop count. We need
768 /// this function when peeling off one or more iterations of a loop. This
769 /// function assumes the nth iteration is peeled first.
770 virtual unsigned reduceLoopCount(MachineBasicBlock &MBB,
771 MachineBasicBlock &PreHeader,
772 MachineInstr *IndVar, MachineInstr &Cmp,
773 SmallVectorImpl<MachineOperand> &Cond,
774 SmallVectorImpl<MachineInstr *> &PrevInsts,
775 unsigned Iter, unsigned MaxIter) const {
776 llvm_unreachable("Target didn't implement ReduceLoopCount")::llvm::llvm_unreachable_internal("Target didn't implement ReduceLoopCount"
, "llvm/include/llvm/CodeGen/TargetInstrInfo.h", 776)
;
777 }
778
779 /// Delete the instruction OldInst and everything after it, replacing it with
780 /// an unconditional branch to NewDest. This is used by the tail merging pass.
781 virtual void ReplaceTailWithBranchTo(MachineBasicBlock::iterator Tail,
782 MachineBasicBlock *NewDest) const;
783
784 /// Return true if it's legal to split the given basic
785 /// block at the specified instruction (i.e. instruction would be the start
786 /// of a new basic block).
787 virtual bool isLegalToSplitMBBAt(MachineBasicBlock &MBB,
788 MachineBasicBlock::iterator MBBI) const {
789 return true;
790 }
791
792 /// Return true if it's profitable to predicate
793 /// instructions with accumulated instruction latency of "NumCycles"
794 /// of the specified basic block, where the probability of the instructions
795 /// being executed is given by Probability, and Confidence is a measure
796 /// of our confidence that it will be properly predicted.
797 virtual bool isProfitableToIfCvt(MachineBasicBlock &MBB, unsigned NumCycles,
798 unsigned ExtraPredCycles,
799 BranchProbability Probability) const {
800 return false;
801 }
802
803 /// Second variant of isProfitableToIfCvt. This one
804 /// checks for the case where two basic blocks from true and false path
805 /// of a if-then-else (diamond) are predicated on mutually exclusive
806 /// predicates, where the probability of the true path being taken is given
807 /// by Probability, and Confidence is a measure of our confidence that it
808 /// will be properly predicted.
809 virtual bool isProfitableToIfCvt(MachineBasicBlock &TMBB, unsigned NumTCycles,
810 unsigned ExtraTCycles,
811 MachineBasicBlock &FMBB, unsigned NumFCycles,
812 unsigned ExtraFCycles,
813 BranchProbability Probability) const {
814 return false;
815 }
816
817 /// Return true if it's profitable for if-converter to duplicate instructions
818 /// of specified accumulated instruction latencies in the specified MBB to
819 /// enable if-conversion.
820 /// The probability of the instructions being executed is given by
821 /// Probability, and Confidence is a measure of our confidence that it
822 /// will be properly predicted.
823 virtual bool isProfitableToDupForIfCvt(MachineBasicBlock &MBB,
824 unsigned NumCycles,
825 BranchProbability Probability) const {
826 return false;
827 }
828
829 /// Return the increase in code size needed to predicate a contiguous run of
830 /// NumInsts instructions.
831 virtual unsigned extraSizeToPredicateInstructions(const MachineFunction &MF,
832 unsigned NumInsts) const {
833 return 0;
834 }
835
836 /// Return an estimate for the code size reduction (in bytes) which will be
837 /// caused by removing the given branch instruction during if-conversion.
838 virtual unsigned predictBranchSizeForIfCvt(MachineInstr &MI) const {
839 return getInstSizeInBytes(MI);
840 }
841
842 /// Return true if it's profitable to unpredicate
843 /// one side of a 'diamond', i.e. two sides of if-else predicated on mutually
844 /// exclusive predicates.
845 /// e.g.
846 /// subeq r0, r1, #1
847 /// addne r0, r1, #1
848 /// =>
849 /// sub r0, r1, #1
850 /// addne r0, r1, #1
851 ///
852 /// This may be profitable if conditional instructions are always executed.
853 virtual bool isProfitableToUnpredicate(MachineBasicBlock &TMBB,
854 MachineBasicBlock &FMBB) const {
855 return false;
856 }
857
858 /// Return true if it is possible to insert a select
859 /// instruction that chooses between TrueReg and FalseReg based on the
860 /// condition code in Cond.
861 ///
862 /// When successful, also return the latency in cycles from TrueReg,
863 /// FalseReg, and Cond to the destination register. In most cases, a select
864 /// instruction will be 1 cycle, so CondCycles = TrueCycles = FalseCycles = 1
865 ///
866 /// Some x86 implementations have 2-cycle cmov instructions.
867 ///
868 /// @param MBB Block where select instruction would be inserted.
869 /// @param Cond Condition returned by analyzeBranch.
870 /// @param DstReg Virtual dest register that the result should write to.
871 /// @param TrueReg Virtual register to select when Cond is true.
872 /// @param FalseReg Virtual register to select when Cond is false.
873 /// @param CondCycles Latency from Cond+Branch to select output.
874 /// @param TrueCycles Latency from TrueReg to select output.
875 /// @param FalseCycles Latency from FalseReg to select output.
876 virtual bool canInsertSelect(const MachineBasicBlock &MBB,
877 ArrayRef<MachineOperand> Cond, Register DstReg,
878 Register TrueReg, Register FalseReg,
879 int &CondCycles, int &TrueCycles,
880 int &FalseCycles) const {
881 return false;
882 }
883
884 /// Insert a select instruction into MBB before I that will copy TrueReg to
885 /// DstReg when Cond is true, and FalseReg to DstReg when Cond is false.
886 ///
887 /// This function can only be called after canInsertSelect() returned true.
888 /// The condition in Cond comes from analyzeBranch, and it can be assumed
889 /// that the same flags or registers required by Cond are available at the
890 /// insertion point.
891 ///
892 /// @param MBB Block where select instruction should be inserted.
893 /// @param I Insertion point.
894 /// @param DL Source location for debugging.
895 /// @param DstReg Virtual register to be defined by select instruction.
896 /// @param Cond Condition as computed by analyzeBranch.
897 /// @param TrueReg Virtual register to copy when Cond is true.
898 /// @param FalseReg Virtual register to copy when Cond is false.
899 virtual void insertSelect(MachineBasicBlock &MBB,
900 MachineBasicBlock::iterator I, const DebugLoc &DL,
901 Register DstReg, ArrayRef<MachineOperand> Cond,
902 Register TrueReg, Register FalseReg) const {
903 llvm_unreachable("Target didn't implement TargetInstrInfo::insertSelect!")::llvm::llvm_unreachable_internal("Target didn't implement TargetInstrInfo::insertSelect!"
, "llvm/include/llvm/CodeGen/TargetInstrInfo.h", 903)
;
904 }
905
906 /// Analyze the given select instruction, returning true if
907 /// it cannot be understood. It is assumed that MI->isSelect() is true.
908 ///
909 /// When successful, return the controlling condition and the operands that
910 /// determine the true and false result values.
911 ///
912 /// Result = SELECT Cond, TrueOp, FalseOp
913 ///
914 /// Some targets can optimize select instructions, for example by predicating
915 /// the instruction defining one of the operands. Such targets should set
916 /// Optimizable.
917 ///
918 /// @param MI Select instruction to analyze.
919 /// @param Cond Condition controlling the select.
920 /// @param TrueOp Operand number of the value selected when Cond is true.
921 /// @param FalseOp Operand number of the value selected when Cond is false.
922 /// @param Optimizable Returned as true if MI is optimizable.
923 /// @returns False on success.
924 virtual bool analyzeSelect(const MachineInstr &MI,
925 SmallVectorImpl<MachineOperand> &Cond,
926 unsigned &TrueOp, unsigned &FalseOp,
927 bool &Optimizable) const {
928 assert(MI.getDesc().isSelect() && "MI must be a select instruction")(static_cast <bool> (MI.getDesc().isSelect() &&
"MI must be a select instruction") ? void (0) : __assert_fail
("MI.getDesc().isSelect() && \"MI must be a select instruction\""
, "llvm/include/llvm/CodeGen/TargetInstrInfo.h", 928, __extension__
__PRETTY_FUNCTION__))
;
929 return true;
930 }
931
932 /// Given a select instruction that was understood by
933 /// analyzeSelect and returned Optimizable = true, attempt to optimize MI by
934 /// merging it with one of its operands. Returns NULL on failure.
935 ///
936 /// When successful, returns the new select instruction. The client is
937 /// responsible for deleting MI.
938 ///
939 /// If both sides of the select can be optimized, PreferFalse is used to pick
940 /// a side.
941 ///
942 /// @param MI Optimizable select instruction.
943 /// @param NewMIs Set that records all MIs in the basic block up to \p
944 /// MI. Has to be updated with any newly created MI or deleted ones.
945 /// @param PreferFalse Try to optimize FalseOp instead of TrueOp.
946 /// @returns Optimized instruction or NULL.
947 virtual MachineInstr *optimizeSelect(MachineInstr &MI,
948 SmallPtrSetImpl<MachineInstr *> &NewMIs,
949 bool PreferFalse = false) const {
950 // This function must be implemented if Optimizable is ever set.
951 llvm_unreachable("Target must implement TargetInstrInfo::optimizeSelect!")::llvm::llvm_unreachable_internal("Target must implement TargetInstrInfo::optimizeSelect!"
, "llvm/include/llvm/CodeGen/TargetInstrInfo.h", 951)
;
952 }
953
954 /// Emit instructions to copy a pair of physical registers.
955 ///
956 /// This function should support copies within any legal register class as
957 /// well as any cross-class copies created during instruction selection.
958 ///
959 /// The source and destination registers may overlap, which may require a
960 /// careful implementation when multiple copy instructions are required for
961 /// large registers. See for example the ARM target.
962 virtual void copyPhysReg(MachineBasicBlock &MBB,
963 MachineBasicBlock::iterator MI, const DebugLoc &DL,
964 MCRegister DestReg, MCRegister SrcReg,
965 bool KillSrc) const {
966 llvm_unreachable("Target didn't implement TargetInstrInfo::copyPhysReg!")::llvm::llvm_unreachable_internal("Target didn't implement TargetInstrInfo::copyPhysReg!"
, "llvm/include/llvm/CodeGen/TargetInstrInfo.h", 966)
;
967 }
968
969 /// Allow targets to tell MachineVerifier whether a specific register
970 /// MachineOperand can be used as part of PC-relative addressing.
971 /// PC-relative addressing modes in many CISC architectures contain
972 /// (non-PC) registers as offsets or scaling values, which inherently
973 /// tags the corresponding MachineOperand with OPERAND_PCREL.
974 ///
975 /// @param MO The MachineOperand in question. MO.isReg() should always
976 /// be true.
977 /// @return Whether this operand is allowed to be used PC-relatively.
978 virtual bool isPCRelRegisterOperandLegal(const MachineOperand &MO) const {
979 return false;
980 }
981
982protected:
983 /// Target-dependent implementation for IsCopyInstr.
984 /// If the specific machine instruction is an instruction that moves/copies
985 /// a value from one register to another register, return the destination and
986 /// source registers as machine operands.
987 virtual Optional<DestSourcePair>
988 isCopyInstrImpl(const MachineInstr &MI) const {
989 return None;
990 }
991
992 /// Return true if the given terminator MI is not expected to spill. This
993 /// sets the live interval as not spillable and adjusts phi node lowering to
994 /// not introduce copies after the terminator. Use with care, these are
995 /// currently used for hardware loop intrinsics in very controlled situations,
996 /// created prior to register allocation in loops that only have single phi
997 /// users for the terminator's value. They may run out of registers if not used
998 /// carefully.
999 virtual bool isUnspillableTerminatorImpl(const MachineInstr *MI) const {
1000 return false;
1001 }
1002
1003public:
1004 /// If the specific machine instruction is an instruction that moves/copies
1005 /// a value from one register to another register, return the destination and
1006 /// source registers as machine operands.
1007 /// For a COPY instruction the method directly returns the destination and
1008 /// source registers as machine operands; for all other instructions it calls
1009 /// the target-dependent implementation.
1010 Optional<DestSourcePair> isCopyInstr(const MachineInstr &MI) const {
1011 if (MI.isCopy()) {
1012 return DestSourcePair{MI.getOperand(0), MI.getOperand(1)};
1013 }
1014 return isCopyInstrImpl(MI);
1015 }
1016
1017 /// If the specific machine instruction is an instruction that adds an
1018 /// immediate value and a physical register, and stores the result in
1019 /// the given physical register \c Reg, return a pair of the source
1020 /// register and the offset which has been added.
1021 virtual Optional<RegImmPair> isAddImmediate(const MachineInstr &MI,
1022 Register Reg) const {
1023 return None;
1024 }
1025
1026 /// Returns true if MI is an instruction that defines Reg to have a constant
1027 /// value and the value is recorded in ImmVal. The ImmVal is a result that
1028 /// should be interpreted as modulo size of Reg.
1029 virtual bool getConstValDefinedInReg(const MachineInstr &MI,
1030 const Register Reg,
1031 int64_t &ImmVal) const {
1032 return false;
1033 }
1034
1035 /// Store the specified register of the given register class to the specified
1036 /// stack frame index. The store instruction is to be added to the given
1037 /// machine basic block before the specified machine instruction. If isKill
1038 /// is true, the register operand is the last use and must be marked kill.
1039 virtual void storeRegToStackSlot(MachineBasicBlock &MBB,
1040 MachineBasicBlock::iterator MI,
1041 Register SrcReg, bool isKill, int FrameIndex,
1042 const TargetRegisterClass *RC,
1043 const TargetRegisterInfo *TRI) const {
1044 llvm_unreachable("Target didn't implement "::llvm::llvm_unreachable_internal("Target didn't implement " "TargetInstrInfo::storeRegToStackSlot!"
, "llvm/include/llvm/CodeGen/TargetInstrInfo.h", 1045)
1045 "TargetInstrInfo::storeRegToStackSlot!")::llvm::llvm_unreachable_internal("Target didn't implement " "TargetInstrInfo::storeRegToStackSlot!"
, "llvm/include/llvm/CodeGen/TargetInstrInfo.h", 1045)
;
1046 }
1047
1048 /// Load the specified register of the given register class from the specified
1049 /// stack frame index. The load instruction is to be added to the given
1050 /// machine basic block before the specified machine instruction.
1051 virtual void loadRegFromStackSlot(MachineBasicBlock &MBB,
1052 MachineBasicBlock::iterator MI,
1053 Register DestReg, int FrameIndex,
1054 const TargetRegisterClass *RC,
1055 const TargetRegisterInfo *TRI) const {
1056 llvm_unreachable("Target didn't implement "::llvm::llvm_unreachable_internal("Target didn't implement " "TargetInstrInfo::loadRegFromStackSlot!"
, "llvm/include/llvm/CodeGen/TargetInstrInfo.h", 1057)
1057 "TargetInstrInfo::loadRegFromStackSlot!")::llvm::llvm_unreachable_internal("Target didn't implement " "TargetInstrInfo::loadRegFromStackSlot!"
, "llvm/include/llvm/CodeGen/TargetInstrInfo.h", 1057)
;
1058 }
1059
1060 /// This function is called for all pseudo instructions
1061 /// that remain after register allocation. Many pseudo instructions are
1062 /// created to help register allocation. This is the place to convert them
1063 /// into real instructions. The target can edit MI in place, or it can insert
1064 /// new instructions and erase MI. The function should return true if
1065 /// anything was changed.
1066 virtual bool expandPostRAPseudo(MachineInstr &MI) const { return false; }
1067
1068 /// Check whether the target can fold a load that feeds a subreg operand
1069 /// (or a subreg operand that feeds a store).
1070 /// For example, X86 may want to return true if it can fold
1071 /// movl (%esp), %eax
1072 /// subb, %al, ...
1073 /// Into:
1074 /// subb (%esp), ...
1075 ///
1076 /// Ideally, we'd like the target implementation of foldMemoryOperand() to
1077 /// reject subregs - but since this behavior used to be enforced in the
1078 /// target-independent code, moving this responsibility to the targets
1079 /// has the potential of causing nasty silent breakage in out-of-tree targets.
1080 virtual bool isSubregFoldable() const { return false; }
1081
1082 /// For a patchpoint, stackmap, or statepoint intrinsic, return the range of
1083 /// operands which can't be folded into stack references. Operands outside
1084 /// of the range are most likely foldable but it is not guaranteed.
1085 /// These instructions are unique in that stack references for some operands
1086 /// have the same execution cost (e.g. none) as the unfolded register forms.
1087 /// The ranged return is guaranteed to include all operands which can't be
1088 /// folded at zero cost.
1089 virtual std::pair<unsigned, unsigned>
1090 getPatchpointUnfoldableRange(const MachineInstr &MI) const;
1091
1092 /// Attempt to fold a load or store of the specified stack
1093 /// slot into the specified machine instruction for the specified operand(s).
1094 /// If this is possible, a new instruction is returned with the specified
1095 /// operand folded, otherwise NULL is returned.
1096 /// The new instruction is inserted before MI, and the client is responsible
1097 /// for removing the old instruction.
1098 /// If VRM is passed, the assigned physregs can be inspected by target to
1099 /// decide on using an opcode (note that those assignments can still change).
1100 MachineInstr *foldMemoryOperand(MachineInstr &MI, ArrayRef<unsigned> Ops,
1101 int FI,
1102 LiveIntervals *LIS = nullptr,
1103 VirtRegMap *VRM = nullptr) const;
1104
1105 /// Same as the previous version except it allows folding of any load and
1106 /// store from / to any address, not just from a specific stack slot.
1107 MachineInstr *foldMemoryOperand(MachineInstr &MI, ArrayRef<unsigned> Ops,
1108 MachineInstr &LoadMI,
1109 LiveIntervals *LIS = nullptr) const;
1110
1111 /// Return true when there is potentially a faster code sequence
1112 /// for an instruction chain ending in \p Root. All potential patterns are
1113 /// returned in the \p Patterns vector. Patterns should be sorted in priority
1114 /// order since the pattern evaluator stops checking as soon as it finds a
1115 /// faster sequence.
1116 /// \param Root - Instruction that could be combined with one of its operands
1117 /// \param Patterns - Vector of possible combination patterns
1118 virtual bool
1119 getMachineCombinerPatterns(MachineInstr &Root,
1120 SmallVectorImpl<MachineCombinerPattern> &Patterns,
1121 bool DoRegPressureReduce) const;
1122
1123 /// Return true if target supports reassociation of instructions in machine
1124 /// combiner pass to reduce register pressure for a given BB.
1125 virtual bool
1126 shouldReduceRegisterPressure(MachineBasicBlock *MBB,
1127 RegisterClassInfo *RegClassInfo) const {
1128 return false;
1129 }
1130
1131 /// Fix up the placeholder we may add in genAlternativeCodeSequence().
1132 virtual void
1133 finalizeInsInstrs(MachineInstr &Root, MachineCombinerPattern &P,
1134 SmallVectorImpl<MachineInstr *> &InsInstrs) const {}
1135
1136 /// Return true when a code sequence can improve throughput. It
1137 /// should be called only for instructions in loops.
1138 /// \param Pattern - combiner pattern
1139 virtual bool isThroughputPattern(MachineCombinerPattern Pattern) const;
1140
1141 /// Return true if the input \p Inst is part of a chain of dependent ops
1142 /// that are suitable for reassociation, otherwise return false.
1143 /// If the instruction's operands must be commuted to have a previous
1144 /// instruction of the same type define the first source operand, \p Commuted
1145 /// will be set to true.
1146 bool isReassociationCandidate(const MachineInstr &Inst, bool &Commuted) const;
1147
1148 /// Return true when \p Inst is both associative and commutative.
1149 virtual bool isAssociativeAndCommutative(const MachineInstr &Inst) const {
1150 return false;
1151 }
1152
1153 /// Return true when \p Inst has reassociable operands in the same \p MBB.
1154 virtual bool hasReassociableOperands(const MachineInstr &Inst,
1155 const MachineBasicBlock *MBB) const;
1156
1157 /// Return true when \p Inst has a reassociable sibling.
1158 bool hasReassociableSibling(const MachineInstr &Inst, bool &Commuted) const;
1159
1160 /// When getMachineCombinerPatterns() finds patterns, this function generates
1161 /// the instructions that could replace the original code sequence. The client
1162 /// has to decide whether the actual replacement is beneficial or not.
1163 /// \param Root - Instruction that could be combined with one of its operands
1164 /// \param Pattern - Combination pattern for Root
1165 /// \param InsInstrs - Vector of new instructions that implement Pattern
1166 /// \param DelInstrs - Old instructions, including Root, that could be
1167 /// replaced by InsInstrs
1168 /// \param InstIdxForVirtReg - map of virtual register to instruction in
1169 /// InsInstrs that defines it
1170 virtual void genAlternativeCodeSequence(
1171 MachineInstr &Root, MachineCombinerPattern Pattern,
1172 SmallVectorImpl<MachineInstr *> &InsInstrs,
1173 SmallVectorImpl<MachineInstr *> &DelInstrs,
1174 DenseMap<unsigned, unsigned> &InstIdxForVirtReg) const;
1175
1176 /// Attempt to reassociate \p Root and \p Prev according to \p Pattern to
1177 /// reduce critical path length.
1178 void reassociateOps(MachineInstr &Root, MachineInstr &Prev,
1179 MachineCombinerPattern Pattern,
1180 SmallVectorImpl<MachineInstr *> &InsInstrs,
1181 SmallVectorImpl<MachineInstr *> &DelInstrs,
1182 DenseMap<unsigned, unsigned> &InstrIdxForVirtReg) const;
1183
1184 /// The limit on resource length extension we accept in MachineCombiner Pass.
1185 virtual int getExtendResourceLenLimit() const { return 0; }
1186
1187 /// This is an architecture-specific helper function of reassociateOps.
1188 /// Set special operand attributes for new instructions after reassociation.
1189 virtual void setSpecialOperandAttr(MachineInstr &OldMI1, MachineInstr &OldMI2,
1190 MachineInstr &NewMI1,
1191 MachineInstr &NewMI2) const {}
1192
1193 /// Return true when a target supports MachineCombiner.
1194 virtual bool useMachineCombiner() const { return false; }
1195
1196 /// Return true if the given SDNode can be copied during scheduling
1197 /// even if it has glue.
1198 virtual bool canCopyGluedNodeDuringSchedule(SDNode *N) const { return false; }
1199
1200protected:
1201 /// Target-dependent implementation for foldMemoryOperand.
1202 /// Target-independent code in foldMemoryOperand will
1203 /// take care of adding a MachineMemOperand to the newly created instruction.
1204 /// The instruction and any auxiliary instructions necessary will be inserted
1205 /// at InsertPt.
1206 virtual MachineInstr *
1207 foldMemoryOperandImpl(MachineFunction &MF, MachineInstr &MI,
1208 ArrayRef<unsigned> Ops,
1209 MachineBasicBlock::iterator InsertPt, int FrameIndex,
1210 LiveIntervals *LIS = nullptr,
1211 VirtRegMap *VRM = nullptr) const {
1212 return nullptr;
1213 }
1214
1215 /// Target-dependent implementation for foldMemoryOperand.
1216 /// Target-independent code in foldMemoryOperand will
1217 /// take care of adding a MachineMemOperand to the newly created instruction.
1218 /// The instruction and any auxiliary instructions necessary will be inserted
1219 /// at InsertPt.
1220 virtual MachineInstr *foldMemoryOperandImpl(
1221 MachineFunction &MF, MachineInstr &MI, ArrayRef<unsigned> Ops,
1222 MachineBasicBlock::iterator InsertPt, MachineInstr &LoadMI,
1223 LiveIntervals *LIS = nullptr) const {
1224 return nullptr;
1225 }
1226
1227 /// Target-dependent implementation of getRegSequenceInputs.
1228 ///
1229 /// \returns true if it is possible to build the equivalent
1230 /// REG_SEQUENCE inputs with the pair \p MI, \p DefIdx. False otherwise.
1231 ///
1232 /// \pre MI.isRegSequenceLike().
1233 ///
1234 /// \see TargetInstrInfo::getRegSequenceInputs.
1235 virtual bool getRegSequenceLikeInputs(
1236 const MachineInstr &MI, unsigned DefIdx,
1237 SmallVectorImpl<RegSubRegPairAndIdx> &InputRegs) const {
1238 return false;
1239 }
1240
1241 /// Target-dependent implementation of getExtractSubregInputs.
1242 ///
1243 /// \returns true if it is possible to build the equivalent
1244 /// EXTRACT_SUBREG inputs with the pair \p MI, \p DefIdx. False otherwise.
1245 ///
1246 /// \pre MI.isExtractSubregLike().
1247 ///
1248 /// \see TargetInstrInfo::getExtractSubregInputs.
1249 virtual bool getExtractSubregLikeInputs(const MachineInstr &MI,
1250 unsigned DefIdx,
1251 RegSubRegPairAndIdx &InputReg) const {
1252 return false;
1253 }
1254
1255 /// Target-dependent implementation of getInsertSubregInputs.
1256 ///
1257 /// \returns true if it is possible to build the equivalent
1258 /// INSERT_SUBREG inputs with the pair \p MI, \p DefIdx. False otherwise.
1259 ///
1260 /// \pre MI.isInsertSubregLike().
1261 ///
1262 /// \see TargetInstrInfo::getInsertSubregInputs.
1263 virtual bool
1264 getInsertSubregLikeInputs(const MachineInstr &MI, unsigned DefIdx,
1265 RegSubRegPair &BaseReg,
1266 RegSubRegPairAndIdx &InsertedReg) const {
1267 return false;
1268 }
1269
1270public:
1271 /// getAddressSpaceForPseudoSourceKind - Given the kind of memory
1272 /// (e.g. stack) the target returns the corresponding address space.
1273 virtual unsigned
1274 getAddressSpaceForPseudoSourceKind(unsigned Kind) const {
1275 return 0;
1276 }
1277
1278 /// unfoldMemoryOperand - Separate a single instruction which folded a load or
1279 /// a store or a load and a store into two or more instructions. If this is
1280 /// possible, returns true as well as the new instructions by reference.
1281 virtual bool
1282 unfoldMemoryOperand(MachineFunction &MF, MachineInstr &MI, unsigned Reg,
1283 bool UnfoldLoad, bool UnfoldStore,
1284 SmallVectorImpl<MachineInstr *> &NewMIs) const {
1285 return false;
1286 }
1287
1288 virtual bool unfoldMemoryOperand(SelectionDAG &DAG, SDNode *N,
1289 SmallVectorImpl<SDNode *> &NewNodes) const {
1290 return false;
1291 }
1292
1293 /// Returns the opcode of the would be new
1294 /// instruction after load / store are unfolded from an instruction of the
1295 /// specified opcode. It returns zero if the specified unfolding is not
1296 /// possible. If LoadRegIndex is non-null, it is filled in with the operand
1297 /// index of the operand which will hold the register holding the loaded
1298 /// value.
1299 virtual unsigned
1300 getOpcodeAfterMemoryUnfold(unsigned Opc, bool UnfoldLoad, bool UnfoldStore,
1301 unsigned *LoadRegIndex = nullptr) const {
1302 return 0;
1303 }
1304
1305 /// This is used by the pre-regalloc scheduler to determine if two loads are
1306 /// loading from the same base address. It should only return true if the base
1307 /// pointers are the same and the only difference between the two addresses
1308 /// is the offset. It also returns the offsets by reference.
1309 virtual bool areLoadsFromSameBasePtr(SDNode *Load1, SDNode *Load2,
1310 int64_t &Offset1,
1311 int64_t &Offset2) const {
1312 return false;
1313 }
1314
1315 /// This is used by the pre-regalloc scheduler to determine (in conjunction
1316 /// with areLoadsFromSameBasePtr) if two loads should be scheduled together.
1317 /// On some targets if two loads are loading from
1318 /// addresses in the same cache line, it's better if they are scheduled
1319 /// together. This function takes two integers that represent the load offsets
1320 /// from the common base address. It returns true if it decides it's desirable
1321 /// to schedule the two loads together. "NumLoads" is the number of loads that
1322 /// have already been scheduled after Load1.
1323 virtual bool shouldScheduleLoadsNear(SDNode *Load1, SDNode *Load2,
1324 int64_t Offset1, int64_t Offset2,
1325 unsigned NumLoads) const {
1326 return false;
1327 }
1328
1329 /// Get the base operand and byte offset of an instruction that reads/writes
1330 /// memory. This is a convenience function for callers that are only prepared
1331 /// to handle a single base operand.
1332 bool getMemOperandWithOffset(const MachineInstr &MI,
1333 const MachineOperand *&BaseOp, int64_t &Offset,
1334 bool &OffsetIsScalable,
1335 const TargetRegisterInfo *TRI) const;
1336
1337 /// Get zero or more base operands and the byte offset of an instruction that
1338 /// reads/writes memory. Note that there may be zero base operands if the
1339 /// instruction accesses a constant address.
1340 /// It returns false if MI does not read/write memory.
1341 /// It returns false if base operands and offset could not be determined.
1342 /// It is not guaranteed to always recognize base operands and offsets in all
1343 /// cases.
1344 virtual bool getMemOperandsWithOffsetWidth(
1345 const MachineInstr &MI, SmallVectorImpl<const MachineOperand *> &BaseOps,
1346 int64_t &Offset, bool &OffsetIsScalable, unsigned &Width,
1347 const TargetRegisterInfo *TRI) const {
1348 return false;
1349 }
1350
1351 /// Return true if the instruction contains a base register and offset. If
1352 /// true, the function also sets the operand position in the instruction
1353 /// for the base register and offset.
1354 virtual bool getBaseAndOffsetPosition(const MachineInstr &MI,
1355 unsigned &BasePos,
1356 unsigned &OffsetPos) const {
1357 return false;
1358 }
1359
1360 /// Target dependent implementation to get the values constituting the address
1361 /// MachineInstr that is accessing memory. These values are returned as a
1362 /// struct ExtAddrMode which contains all relevant information to make up the
1363 /// address.
1364 virtual Optional<ExtAddrMode>
1365 getAddrModeFromMemoryOp(const MachineInstr &MemI,
1366 const TargetRegisterInfo *TRI) const {
1367 return None;
1368 }
1369
1370 /// Returns true if MI's Def is NullValueReg, and the MI
1371 /// does not change the Zero value. i.e. cases such as rax = shr rax, X where
1372 /// NullValueReg = rax. Note that if the NullValueReg is non-zero, this
1373 /// function can return true even if it becomes zero. Specifically cases such as
1374 /// NullValueReg = shl NullValueReg, 63.
1375 virtual bool preservesZeroValueInReg(const MachineInstr *MI,
1376 const Register NullValueReg,
1377 const TargetRegisterInfo *TRI) const {
1378 return false;
1379 }
1380
1381 /// If the instruction is an increment of a constant value, return the amount.
1382 virtual bool getIncrementValue(const MachineInstr &MI, int &Value) const {
1383 return false;
1384 }
1385
1386 /// Returns true if the two given memory operations should be scheduled
1387 /// adjacent. Note that you have to add:
1388 /// DAG->addMutation(createLoadClusterDAGMutation(DAG->TII, DAG->TRI));
1389 /// or
1390 /// DAG->addMutation(createStoreClusterDAGMutation(DAG->TII, DAG->TRI));
1391 /// to TargetPassConfig::createMachineScheduler() to have an effect.
1392 ///
1393 /// \p BaseOps1 and \p BaseOps2 are memory operands of two memory operations.
1394 /// \p NumLoads is the number of loads that will be in the cluster if this
1395 /// hook returns true.
1396 /// \p NumBytes is the number of bytes that will be loaded from all the
1397 /// clustered loads if this hook returns true.
1398 virtual bool shouldClusterMemOps(ArrayRef<const MachineOperand *> BaseOps1,
1399 ArrayRef<const MachineOperand *> BaseOps2,
1400 unsigned NumLoads, unsigned NumBytes) const {
1401 llvm_unreachable("target did not implement shouldClusterMemOps()")::llvm::llvm_unreachable_internal("target did not implement shouldClusterMemOps()"
, "llvm/include/llvm/CodeGen/TargetInstrInfo.h", 1401)
;
1402 }
1403
1404 /// Reverses the branch condition of the specified condition list,
1405 /// returning false on success and true if it cannot be reversed.
1406 virtual bool
1407 reverseBranchCondition(SmallVectorImpl<MachineOperand> &Cond) const {
1408 return true;
1409 }
1410
1411 /// Insert a noop into the instruction stream at the specified point.
1412 virtual void insertNoop(MachineBasicBlock &MBB,
1413 MachineBasicBlock::iterator MI) const;
1414
1415 /// Insert noops into the instruction stream at the specified point.
1416 virtual void insertNoops(MachineBasicBlock &MBB,
1417 MachineBasicBlock::iterator MI,
1418 unsigned Quantity) const;
1419
1420 /// Return the noop instruction to use for a noop.
1421 virtual MCInst getNop() const;
1422
1423 /// Return true for post-incremented instructions.
1424 virtual bool isPostIncrement(const MachineInstr &MI) const { return false; }
1425
1426 /// Returns true if the instruction is already predicated.
1427 virtual bool isPredicated(const MachineInstr &MI) const { return false; }
1428
1429 /// Returns a MIRPrinter comment for this machine operand.
1430 virtual std::string
1431 createMIROperandComment(const MachineInstr &MI, const MachineOperand &Op,
1432 unsigned OpIdx, const TargetRegisterInfo *TRI) const;
1433
1434 /// Returns true if the instruction is a
1435 /// terminator instruction that has not been predicated.
1436 bool isUnpredicatedTerminator(const MachineInstr &MI) const;
1437
1438 /// Returns true if MI is an unconditional tail call.
1439 virtual bool isUnconditionalTailCall(const MachineInstr &MI) const {
1440 return false;
1441 }
1442
1443 /// Returns true if the tail call can be made conditional on BranchCond.
1444 virtual bool canMakeTailCallConditional(SmallVectorImpl<MachineOperand> &Cond,
1445 const MachineInstr &TailCall) const {
1446 return false;
1447 }
1448
1449 /// Replace the conditional branch in MBB with a conditional tail call.
1450 virtual void replaceBranchWithTailCall(MachineBasicBlock &MBB,
1451 SmallVectorImpl<MachineOperand> &Cond,
1452 const MachineInstr &TailCall) const {
1453 llvm_unreachable("Target didn't implement replaceBranchWithTailCall!")::llvm::llvm_unreachable_internal("Target didn't implement replaceBranchWithTailCall!"
, "llvm/include/llvm/CodeGen/TargetInstrInfo.h", 1453)
;
1454 }
1455
1456 /// Convert the instruction into a predicated instruction.
1457 /// It returns true if the operation was successful.
1458 virtual bool PredicateInstruction(MachineInstr &MI,
1459 ArrayRef<MachineOperand> Pred) const;
1460
1461 /// Returns true if the first specified predicate
1462 /// subsumes the second, e.g. GE subsumes GT.
1463 virtual bool SubsumesPredicate(ArrayRef<MachineOperand> Pred1,
1464 ArrayRef<MachineOperand> Pred2) const {
1465 return false;
1466 }
1467
1468 /// If the specified instruction defines any predicate
1469 /// or condition code register(s) used for predication, returns true as well
1470 /// as the definition predicate(s) by reference.
1471 /// SkipDead should be set to false at any point that dead
1472 /// predicate instructions should be considered as being defined.
1473 /// A dead predicate instruction is one that is guaranteed to be removed
1474 /// after a call to PredicateInstruction.
1475 virtual bool ClobbersPredicate(MachineInstr &MI,
1476 std::vector<MachineOperand> &Pred,
1477 bool SkipDead) const {
1478 return false;
1479 }
1480
1481 /// Return true if the specified instruction can be predicated.
1482 /// By default, this returns true for every instruction with a
1483 /// PredicateOperand.
1484 virtual bool isPredicable(const MachineInstr &MI) const {
1485 return MI.getDesc().isPredicable();
1486 }
1487
1488 /// Return true if it's safe to move a machine
1489 /// instruction that defines the specified register class.
1490 virtual bool isSafeToMoveRegClassDefs(const TargetRegisterClass *RC) const {
1491 return true;
1492 }
1493
1494 /// Test if the given instruction should be considered a scheduling boundary.
1495 /// This primarily includes labels and terminators.
1496 virtual bool isSchedulingBoundary(const MachineInstr &MI,
1497 const MachineBasicBlock *MBB,
1498 const MachineFunction &MF) const;
1499
1500 /// Measure the specified inline asm to determine an approximation of its
1501 /// length.
1502 virtual unsigned getInlineAsmLength(
1503 const char *Str, const MCAsmInfo &MAI,
1504 const TargetSubtargetInfo *STI = nullptr) const;
1505
1506 /// Allocate and return a hazard recognizer to use for this target when
1507 /// scheduling the machine instructions before register allocation.
1508 virtual ScheduleHazardRecognizer *
1509 CreateTargetHazardRecognizer(const TargetSubtargetInfo *STI,
1510 const ScheduleDAG *DAG) const;
1511
1512 /// Allocate and return a hazard recognizer to use for this target when
1513 /// scheduling the machine instructions before register allocation.
1514 virtual ScheduleHazardRecognizer *
1515 CreateTargetMIHazardRecognizer(const InstrItineraryData *,
1516 const ScheduleDAGMI *DAG) const;
1517
1518 /// Allocate and return a hazard recognizer to use for this target when
1519 /// scheduling the machine instructions after register allocation.
1520 virtual ScheduleHazardRecognizer *
1521 CreateTargetPostRAHazardRecognizer(const InstrItineraryData *,
1522 const ScheduleDAG *DAG) const;
1523
1524 /// Allocate and return a hazard recognizer for use by non-scheduling
1525 /// passes.
1526 virtual ScheduleHazardRecognizer *
1527 CreateTargetPostRAHazardRecognizer(const MachineFunction &MF) const {
1528 return nullptr;
1529 }
1530
1531 /// Provide a global flag for disabling the PreRA hazard recognizer that
1532 /// targets may choose to honor.
1533 bool usePreRAHazardRecognizer() const;
1534
1535 /// For a comparison instruction, return the source registers
1536 /// in SrcReg and SrcReg2 if having two register operands, and the value it
1537 /// compares against in Value. Return true if the comparison instruction
1538 /// can be analyzed.
1539 virtual bool analyzeCompare(const MachineInstr &MI, Register &SrcReg,
1540 Register &SrcReg2, int64_t &Mask,
1541 int64_t &Value) const {
1542 return false;
1543 }
1544
1545 /// See if the comparison instruction can be converted
1546 /// into something more efficient. E.g., on ARM most instructions can set the
1547 /// flags register, obviating the need for a separate CMP.
1548 virtual bool optimizeCompareInstr(MachineInstr &CmpInstr, Register SrcReg,
1549 Register SrcReg2, int64_t Mask,
1550 int64_t Value,
1551 const MachineRegisterInfo *MRI) const {
1552 return false; // Default implementation: CmpInstr is left untouched.
1553 }
1554 virtual bool optimizeCondBranch(MachineInstr &MI) const { return false; } // NOTE(review): undocumented hook; presumably lets a target optimize the conditional branch MI - confirm. Default returns false without touching MI.
1555
1556 /// Try to remove the load by folding it to a register operand at the use.
1557 /// We fold the load instructions if and only if the
1558 /// def and use are in the same BB. We only look at one load and see
1559 /// whether it can be folded into MI. FoldAsLoadDefReg is the virtual register
1560 /// defined by the load we are trying to fold. DefMI returns the machine
1561 /// instruction that defines FoldAsLoadDefReg, and the function returns
1562 /// the machine instruction generated due to folding.
1563 virtual MachineInstr *optimizeLoadInstr(MachineInstr &MI,
1564 const MachineRegisterInfo *MRI,
1565 Register &FoldAsLoadDefReg,
1566 MachineInstr *&DefMI) const {
1567 return nullptr; // Default implementation: nothing is folded; FoldAsLoadDefReg and DefMI are not written.
1568 }
1569
1570 /// 'Reg' is known to be defined by a move immediate instruction,
1571 /// try to fold the immediate into the use instruction.
1572 /// If MRI->hasOneNonDBGUse(Reg) is true, and this function returns true,
1573 /// then the caller may assume that DefMI has been erased from its parent
1574 /// block. The caller may assume that it will not be erased by this
1575 /// function otherwise.
1576 virtual bool FoldImmediate(MachineInstr &UseMI, MachineInstr &DefMI,
1577 Register Reg, MachineRegisterInfo *MRI) const {
1578 return false; // Default implementation: no folding is attempted, so DefMI is never erased here.
1579 }
1580
1581 /// Return the number of micro-operations (u-ops) the given machine
1582 /// instruction will be decoded to on the target cpu. The itinerary's
1583 /// IssueWidth is the number of microops that can be dispatched each
1584 /// cycle. An instruction with zero microops takes no dispatch resources.
1585 virtual unsigned getNumMicroOps(const InstrItineraryData *ItinData,
1586 const MachineInstr &MI) const;
1587
1588 /// Return true for pseudo instructions that don't consume any
1589 /// machine resources in their current form. These are common cases that the
1590 /// scheduler should consider free, rather than conservatively handling them
1591 /// as instructions with no itinerary.
1592 bool isZeroCost(unsigned Opcode) const {
1593 return Opcode <= TargetOpcode::COPY; // Every opcode numbered up to and including COPY counts as free.
1594 }
1595
1596 virtual int getOperandLatency(const InstrItineraryData *ItinData,
1597 SDNode *DefNode, unsigned DefIdx,
1598 SDNode *UseNode, unsigned UseIdx) const; // NOTE(review): undocumented SDNode-based overload; presumably the SelectionDAG counterpart of the MachineInstr overload - confirm.
1599
1600 /// Compute and return the use operand latency of a given pair of def and use.
1601 /// In most cases, the static scheduling itinerary is enough to determine the
1602 /// operand latency. But that may not be possible for instructions with a
1603 /// variable number of defs / uses.
1604 ///
1605 /// This is a raw interface to the itinerary that may be directly overridden
1606 /// by a target. Use computeOperandLatency to get the best estimate of
1607 /// latency.
1608 virtual int getOperandLatency(const InstrItineraryData *ItinData,
1609 const MachineInstr &DefMI, unsigned DefIdx,
1610 const MachineInstr &UseMI,
1611 unsigned UseIdx) const;
1612
1613 /// Compute the instruction latency of a given instruction.
1614 /// If the instruction has higher cost when predicated, it's returned via
1615 /// PredCost, which defaults to nullptr.
1616 virtual unsigned getInstrLatency(const InstrItineraryData *ItinData,
1617 const MachineInstr &MI,
1618 unsigned *PredCost = nullptr) const;
1619
1620 virtual unsigned getPredicationCost(const MachineInstr &MI) const; // NOTE(review): undocumented; presumably the extra cost of MI when predicated (cf. PredCost of getInstrLatency) - confirm.
1621
1622 virtual int getInstrLatency(const InstrItineraryData *ItinData,
1623 SDNode *Node) const; // NOTE(review): undocumented SDNode overload; returns int, whereas the MachineInstr overload returns unsigned.
1624
1625 /// Return the default expected latency for a def (the instruction DefMI) based on its opcode.
1626 unsigned defaultDefLatency(const MCSchedModel &SchedModel,
1627 const MachineInstr &DefMI) const;
1628
1629 /// Return true if this opcode has high latency to its result. The default implementation returns false for every opcode.
1630 virtual bool isHighLatencyDef(int opc) const { return false; }
1631
1632 /// Compute operand latency between a def of 'Reg'
1633 /// and a use in the current loop. Return true if the target considered
1634 /// it 'high'. This is used by optimization passes such as machine LICM to
1635 /// determine whether it makes sense to hoist an instruction out even in a
1636 /// high register pressure situation. NOTE(review): 'Reg' is not a parameter; presumably it is operand DefIdx of DefMI - confirm.
1637 virtual bool hasHighOperandLatency(const TargetSchedModel &SchedModel,
1638 const MachineRegisterInfo *MRI,
1639 const MachineInstr &DefMI, unsigned DefIdx,
1640 const MachineInstr &UseMI,
1641 unsigned UseIdx) const {
1642 return false; // Default implementation: no def/use pair is ever reported as high latency.
1643 }
1644
1645 /// Compute operand latency of a def of 'Reg'. Return true
1646 /// if the target considered it 'low'. NOTE(review): 'Reg' is not a parameter; presumably it is operand DefIdx of DefMI - confirm.
1647 virtual bool hasLowDefLatency(const TargetSchedModel &SchedModel,
1648 const MachineInstr &DefMI,
1649 unsigned DefIdx) const;
1650
1651 /// Perform target-specific instruction verification. The default implementation returns true and leaves ErrInfo unmodified.
1652 virtual bool verifyInstruction(const MachineInstr &MI,
1653 StringRef &ErrInfo) const {
1654 return true;
1655 }
1656
1657 /// Return the current execution domain and bit mask of
1658 /// possible domains for instruction.
1659 ///
1660 /// Some micro-architectures have multiple execution domains, and multiple
1661 /// opcodes that perform the same operation in different domains. For
1662 /// example, the x86 architecture provides the por, orps, and orpd
1663 /// instructions that all do the same thing. There is a latency penalty if a
1664 /// register is written in one domain and read in another.
1665 ///
1666 /// This function returns a pair (domain, mask) containing the execution
1667 /// domain of MI, and a bit mask of possible domains. The setExecutionDomain
1668 /// function can be used to change the opcode to one of the domains in the
1669 /// bit mask. Instructions whose execution domain can't be changed should
1670 /// return a 0 mask.
1671 ///
1672 /// The execution domain numbers don't have any special meaning except domain
1673 /// 0 is used for instructions that are not associated with any interesting
1674 /// execution domain.
1675 ///
1676 virtual std::pair<uint16_t, uint16_t>
1677 getExecutionDomain(const MachineInstr &MI) const {
1678 return std::make_pair(0, 0); // Default: domain 0 (no interesting domain) with a 0 mask (domain can't be changed).
1679 }
1680
1681 /// Change the opcode of MI to execute in Domain.
1682 ///
1683 /// The bit (1 << Domain) must be set in the mask returned from
1684 /// getExecutionDomain(MI). The default implementation has an empty body and leaves MI unchanged.
1685 virtual void setExecutionDomain(MachineInstr &MI, unsigned Domain) const {}
1686
1687 /// Returns the preferred minimum clearance
1688 /// before an instruction with an unwanted partial register update.
1689 ///
1690 /// Some instructions only write part of a register, and implicitly need to
1691 /// read the other parts of the register. This may cause unwanted stalls
1692 /// preventing otherwise unrelated instructions from executing in parallel in
1693 /// an out-of-order CPU.
1694 ///
1695 /// For example, the x86 instruction cvtsi2ss writes its result to bits
1696 /// [31:0] of the destination xmm register. Bits [127:32] are unaffected, so
1697 /// the instruction needs to wait for the old value of the register to become
1698 /// available:
1699 ///
1700 /// addps %xmm1, %xmm0
1701 /// movaps %xmm0, (%rax)
1702 /// cvtsi2ss %rbx, %xmm0
1703 ///
1704 /// In the code above, the cvtsi2ss instruction needs to wait for the addps
1705 /// instruction before it can issue, even though the high bits of %xmm0
1706 /// probably aren't needed.
1707 ///
1708 /// This hook returns the preferred clearance before MI, measured in
1709 /// instructions. Other defs of MI's operand OpNum are avoided in the last N
1710 /// instructions before MI (N presumably being the returned clearance). It should only return a positive value for
1711 /// unwanted dependencies. If the old bits of the defined register have
1712 /// useful values, or if MI is determined to otherwise read the dependency,
1713 /// the hook should return 0.
1714 ///
1715 /// The unwanted dependency may be handled by:
1716 ///
1717 /// 1. Allocating the same register for an MI def and use. That makes the
1718 /// unwanted dependency identical to a required dependency.
1719 ///
1720 /// 2. Allocating a register for the def that has no defs in the previous N
1721 /// instructions.
1722 ///
1723 /// 3. Calling breakPartialRegDependency() with the same arguments. This
1724 /// allows the target to insert a dependency breaking instruction.
1725 ///
1726 virtual unsigned
1727 getPartialRegUpdateClearance(const MachineInstr &MI, unsigned OpNum,
1728 const TargetRegisterInfo *TRI) const {
1729 // The default implementation returns 0 for no partial register dependency.
1730 return 0;
1731 }
1732
1733