LLVM 23.0.0git
JumpTableToSwitch.cpp
Go to the documentation of this file.
1//===- JumpTableToSwitch.cpp ----------------------------------------------===//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7//===----------------------------------------------------------------------===//
8
10#include "llvm/ADT/DenseSet.h"
11#include "llvm/ADT/STLExtras.h"
13#include "llvm/ADT/Statistic.h"
19#include "llvm/IR/IRBuilder.h"
20#include "llvm/IR/LLVMContext.h"
24#include "llvm/Support/Error.h"
26#include <limits>
27
28using namespace llvm;
29
31 JumpTableSizeThreshold("jump-table-to-switch-size-threshold", cl::Hidden,
32 cl::desc("Only split jump tables with size less or "
33 "equal than JumpTableSizeThreshold."),
34 cl::init(10));
35
36// TODO: Consider adding a cost model for profitability analysis of this
37// transformation. Currently we replace a jump table with a switch if all the
38// functions in the jump table are smaller than the provided threshold.
40 "jump-table-to-switch-function-size-threshold", cl::Hidden,
41 cl::desc("Only split jump tables containing functions whose sizes are less "
42 "or equal than this threshold."),
43 cl::init(50));
44
45namespace llvm {
47} // end namespace llvm
48
49#define DEBUG_TYPE "jump-table-to-switch"
50
51STATISTIC(NumEligibleJumpTables, "The number of jump tables seen by the pass "
52 "that can be converted if deemed profitable.");
53STATISTIC(NumJumpTablesConverted,
54 "The number of jump tables converted into switches.");
55
56namespace {
57struct JumpTableTy {
58 Value *Index;
60};
61} // anonymous namespace
62
63static std::optional<JumpTableTy> parseJumpTable(GetElementPtrInst *GEP,
64 PointerType *PtrTy) {
65 Constant *Ptr = dyn_cast<Constant>(GEP->getPointerOperand());
66 if (!Ptr)
67 return std::nullopt;
68
70 if (!GV || !GV->isConstant() || !GV->hasDefinitiveInitializer())
71 return std::nullopt;
72
73 Function &F = *GEP->getParent()->getParent();
74 const DataLayout &DL = F.getDataLayout();
75 const unsigned BitWidth =
76 DL.getIndexSizeInBits(GEP->getPointerAddressSpace());
78 APInt ConstantOffset(BitWidth, 0);
79 if (!GEP->collectOffset(DL, BitWidth, VariableOffsets, ConstantOffset))
80 return std::nullopt;
81 if (VariableOffsets.size() != 1)
82 return std::nullopt;
83 // TODO: consider supporting more general patterns
84 if (!ConstantOffset.isZero())
85 return std::nullopt;
86 APInt StrideBytes = VariableOffsets.front().second;
87 const uint64_t JumpTableSizeBytes = GV->getGlobalSize(DL);
88 if (JumpTableSizeBytes % StrideBytes.getZExtValue() != 0)
89 return std::nullopt;
90 ++NumEligibleJumpTables;
91 const uint64_t N = JumpTableSizeBytes / StrideBytes.getZExtValue();
93 return std::nullopt;
94
95 JumpTableTy JumpTable;
96 JumpTable.Index = VariableOffsets.front().first;
97 JumpTable.Funcs.reserve(N);
98 for (uint64_t Index = 0; Index < N; ++Index) {
99 // ConstantOffset is zero.
100 APInt Offset = Index * StrideBytes;
101 Constant *C =
103 auto *Func = dyn_cast_or_null<Function>(C);
104 if (!Func || Func->isDeclaration() ||
105 Func->getInstructionCount() > FunctionSizeThreshold)
106 return std::nullopt;
107 JumpTable.Funcs.push_back(Func);
108 }
109 return JumpTable;
110}
111
112static BasicBlock *
113expandToSwitch(CallBase *CB, const JumpTableTy &JT, DomTreeUpdater &DTU,
116 GetGuidForFunction) {
117 ++NumJumpTablesConverted;
118 const bool IsVoid = CB->getType() == Type::getVoidTy(CB->getContext());
119
121 BasicBlock *BB = CB->getParent();
122 BasicBlock *Tail = SplitBlock(BB, CB, &DTU, nullptr, nullptr,
123 BB->getName() + Twine(".tail"));
124 DTUpdates.push_back({DominatorTree::Delete, BB, Tail});
126
127 Function &F = *BB->getParent();
128 BasicBlock *BBUnreachable = BasicBlock::Create(
129 F.getContext(), "default.switch.case.unreachable", &F, Tail);
130 IRBuilder<> BuilderUnreachable(BBUnreachable);
131 BuilderUnreachable.CreateUnreachable();
132
133 IRBuilder<> Builder(BB);
134 SwitchInst *Switch = Builder.CreateSwitch(JT.Index, BBUnreachable);
135 DTUpdates.push_back({DominatorTree::Insert, BB, BBUnreachable});
136
137 IRBuilder<> BuilderTail(CB);
138 PHINode *PHI =
139 IsVoid ? nullptr : BuilderTail.CreatePHI(CB->getType(), JT.Funcs.size());
140 const auto *ProfMD = CB->getMetadata(LLVMContext::MD_prof);
141
142 SmallVector<uint64_t> BranchWeights;
144 const bool HadProfile = isValueProfileMD(ProfMD);
145 if (HadProfile) {
146 // The assumptions, coming in, are that the functions in JT.Funcs are
147 // defined in this module (from parseJumpTable).
149 JT.Funcs, [](const Function *F) { return F && !F->isDeclaration(); }));
150 BranchWeights.reserve(JT.Funcs.size() + 1);
151 // The first is the default target, which is the unreachable block created
152 // above.
153 BranchWeights.push_back(0U);
154 uint64_t TotalCount = 0;
155 auto Targets = getValueProfDataFromInst(
156 *CB, InstrProfValueKind::IPVK_IndirectCallTarget,
157 std::numeric_limits<uint32_t>::max(), TotalCount);
158
159 for (const auto &[G, C] : Targets) {
160 [[maybe_unused]] auto It = GuidToCounter.insert({G, C});
161 assert(It.second);
162 }
163 }
164 for (auto [Index, Func] : llvm::enumerate(JT.Funcs)) {
165 BasicBlock *B = BasicBlock::Create(Func->getContext(),
166 "call." + Twine(Index), &F, Tail);
167 DTUpdates.push_back({DominatorTree::Insert, BB, B});
168 DTUpdates.push_back({DominatorTree::Insert, B, Tail});
169
171 // The MD_prof metadata (VP kind), if it existed, can be dropped, it doesn't
172 // make sense on a direct call. Note that the values are used for the branch
173 // weights of the switch.
174 Call->setMetadata(LLVMContext::MD_prof, nullptr);
175 Call->setCalledFunction(Func);
176 Call->insertInto(B, B->end());
177 Switch->addCase(
178 cast<ConstantInt>(ConstantInt::get(JT.Index->getType(), Index)), B);
179 GlobalValue::GUID FctID = GetGuidForFunction(*Func);
180 // It'd be OK to _not_ find target functions in GuidToCounter, e.g. suppose
181 // just some of the jump targets are taken (for the given profile).
182 BranchWeights.push_back(FctID == 0U ? 0U
183 : GuidToCounter.lookup_or(FctID, 0U));
185 if (PHI)
186 PHI->addIncoming(Call, B);
187 }
188 DTU.applyUpdates(DTUpdates);
189 ORE.emit([&]() {
190 return OptimizationRemark(DEBUG_TYPE, "ReplacedJumpTableWithSwitch", CB)
191 << "expanded indirect call into switch";
192 });
193 if (HadProfile && !ProfcheckDisableMetadataFixes) {
194 // At least one of the targets must've been taken.
195 assert(llvm::any_of(BranchWeights, not_equal_to(0)));
196 setBranchWeights(*Switch, downscaleWeights(BranchWeights),
197 /*IsExpected=*/false);
198 } else
200 if (PHI)
202 CB->eraseFromParent();
203 return Tail;
204}
205
212 DomTreeUpdater DTU(DT, PDT, DomTreeUpdater::UpdateStrategy::Lazy);
213 bool Changed = false;
214 auto FuncToGuid = [&](const Function &Fct) {
215 if (Fct.getMetadata(AssignGUIDPass::GUIDMetadataName))
216 return AssignGUIDPass::getGUID(Fct);
217
219 };
220
221 for (BasicBlock &BB : make_early_inc_range(F)) {
222 BasicBlock *CurrentBB = &BB;
223 while (CurrentBB) {
224 BasicBlock *SplittedOutTail = nullptr;
225 for (Instruction &I : make_early_inc_range(*CurrentBB)) {
226 auto *Call = dyn_cast<CallInst>(&I);
227 if (!Call || Call->getCalledFunction() || Call->isMustTailCall())
228 continue;
229 auto *L = dyn_cast<LoadInst>(Call->getCalledOperand());
230 // Skip atomic or volatile loads.
231 if (!L || !L->isSimple())
232 continue;
233 auto *GEP = dyn_cast<GetElementPtrInst>(L->getPointerOperand());
234 if (!GEP)
235 continue;
236 auto *PtrTy = dyn_cast<PointerType>(L->getType());
237 assert(PtrTy && "call operand must be a pointer");
238 std::optional<JumpTableTy> JumpTable = parseJumpTable(GEP, PtrTy);
239 if (!JumpTable)
240 continue;
241 SplittedOutTail =
242 expandToSwitch(Call, *JumpTable, DTU, ORE, FuncToGuid);
243 Changed = true;
244 break;
245 }
246 CurrentBB = SplittedOutTail ? SplittedOutTail : nullptr;
247 }
248 }
249
250 if (!Changed)
251 return PreservedAnalyses::all();
252
254 if (DT)
256 if (PDT)
258 return PA;
259}
assert(UImm &&(UImm !=~static_cast< T >(0)) &&"Invalid immediate!")
Rewrite undef for PHI
MachineBasicBlock MachineBasicBlock::iterator DebugLoc DL
static GCRegistry::Add< OcamlGC > B("ocaml", "ocaml 3.10-compatible GC")
This file defines the DenseSet and SmallDenseSet classes.
#define DEBUG_TYPE
Hexagon Common GEP
static cl::opt< unsigned > FunctionSizeThreshold("jump-table-to-switch-function-size-threshold", cl::Hidden, cl::desc("Only split jump tables containing functions whose sizes are less " "or equal than this threshold."), cl::init(50))
static BasicBlock * expandToSwitch(CallBase *CB, const JumpTableTy &JT, DomTreeUpdater &DTU, OptimizationRemarkEmitter &ORE, llvm::function_ref< GlobalValue::GUID(const Function &)> GetGuidForFunction)
static cl::opt< unsigned > JumpTableSizeThreshold("jump-table-to-switch-size-threshold", cl::Hidden, cl::desc("Only split jump tables with size less or " "equal than JumpTableSizeThreshold."), cl::init(10))
static std::optional< JumpTableTy > parseJumpTable(GetElementPtrInst *GEP, PointerType *PtrTy)
#define F(x, y, z)
Definition MD5.cpp:54
#define I(x, y, z)
Definition MD5.cpp:57
#define G(x, y, z)
Definition MD5.cpp:55
This file contains the declarations for profiling metadata utility functions.
This file contains some templates that are useful if you are working with the STL at all.
This file defines the SmallVector class.
This file defines the 'Statistic' class, which is designed to be an easy way to expose various metric...
#define STATISTIC(VARNAME, DESC)
Definition Statistic.h:171
Class for arbitrary precision integers.
Definition APInt.h:78
uint64_t getZExtValue() const
Get zero extended value.
Definition APInt.h:1555
bool isZero() const
Determine if this value is zero, i.e. all bits are clear.
Definition APInt.h:381
PassT::Result * getCachedResult(IRUnitT &IR) const
Get the cached result of an analysis pass for a given IR unit.
PassT::Result & getResult(IRUnitT &IR, ExtraArgTs... ExtraArgs)
Get the result of an analysis pass for a given IR unit.
static LLVM_ABI uint64_t getGUID(const Function &F)
static LLVM_ABI const char * GUIDMetadataName
LLVM Basic Block Representation.
Definition BasicBlock.h:62
const Function * getParent() const
Return the enclosing method, or null if none.
Definition BasicBlock.h:213
static BasicBlock * Create(LLVMContext &Context, const Twine &Name="", Function *Parent=nullptr, BasicBlock *InsertBefore=nullptr)
Creates a new BasicBlock.
Definition BasicBlock.h:206
const Instruction * getTerminator() const LLVM_READONLY
Returns the terminator instruction if the block is well formed or null if the block is not well forme...
Definition BasicBlock.h:233
static BranchInst * Create(BasicBlock *IfTrue, InsertPosition InsertBefore=nullptr)
Base class for all callable instructions (InvokeInst and CallInst) Holds everything related to callin...
This is an important base class in LLVM.
Definition Constant.h:43
A parsed version of the target data layout string in and methods for querying it.
Definition DataLayout.h:64
ValueT lookup_or(const_arg_type_t< KeyT > Val, U &&Default) const
Definition DenseMap.h:215
std::pair< iterator, bool > insert(const std::pair< KeyT, ValueT > &KV)
Definition DenseMap.h:241
Analysis pass which computes a DominatorTree.
Definition Dominators.h:283
Concrete subclass of DominatorTreeBase that is used to compute a normal dominator tree.
Definition Dominators.h:164
void applyUpdates(ArrayRef< UpdateT > Updates)
Submit updates to all available trees.
an instruction for type-safe pointer arithmetic to access elements of arrays and structs
static LLVM_ABI GUID getGUIDAssumingExternalLinkage(StringRef GlobalName)
Return a 64-bit global unique ID constructed from the name of a global symbol.
Definition Globals.cpp:78
uint64_t GUID
Declare a type to represent a global unique identifier for a global value.
const Constant * getInitializer() const
getInitializer - Return the initializer for this global variable.
LLVM_ABI uint64_t getGlobalSize(const DataLayout &DL) const
Get the size of this global variable in bytes.
Definition Globals.cpp:561
bool isConstant() const
If the value is a global constant, its value is immutable throughout the runtime execution of the pro...
bool hasDefinitiveInitializer() const
hasDefinitiveInitializer - Whether the global variable has an initializer, and any other instances of...
UnreachableInst * CreateUnreachable()
Definition IRBuilder.h:1342
PHINode * CreatePHI(Type *Ty, unsigned NumReservedValues, const Twine &Name="")
Definition IRBuilder.h:2473
This provides a uniform API for creating instructions and inserting them into a basic block: either a...
Definition IRBuilder.h:2787
LLVM_ABI Instruction * clone() const
Create a copy of 'this' instruction that is identical in all ways except the following:
LLVM_ABI InstListType::iterator eraseFromParent()
This method unlinks 'this' from the containing basic block and deletes it.
MDNode * getMetadata(unsigned KindID) const
Get the metadata of given kind attached to this Instruction.
PreservedAnalyses run(Function &F, FunctionAnalysisManager &AM)
Run the pass over the function.
size_type size() const
Definition MapVector.h:56
std::pair< KeyT, ValueT > & front()
Definition MapVector.h:79
The optimization diagnostic interface.
LLVM_ABI void emit(DiagnosticInfoOptimizationBase &OptDiag)
Output the remark via the diagnostic handler and to the optimization record file.
Diagnostic information for applied optimization remarks.
Analysis pass which computes a PostDominatorTree.
PostDominatorTree Class - Concrete subclass of DominatorTree that is used to compute the post-dominat...
A set of analyses that are preserved following a run of a transformation pass.
Definition Analysis.h:112
static PreservedAnalyses all()
Construct a special preserved set that preserves all passes.
Definition Analysis.h:118
PreservedAnalyses & preserve()
Mark an analysis as preserved.
Definition Analysis.h:132
void reserve(size_type N)
void push_back(const T &Elt)
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small.
Multiway switch.
Twine - A lightweight data structure for efficiently representing the concatenation of temporary valu...
Definition Twine.h:82
static LLVM_ABI Type * getVoidTy(LLVMContext &C)
Definition Type.cpp:280
LLVM Value Representation.
Definition Value.h:75
Type * getType() const
All values are typed, get the type of this value.
Definition Value.h:256
LLVM_ABI void replaceAllUsesWith(Value *V)
Change all uses of this to point to a new Value.
Definition Value.cpp:553
LLVMContext & getContext() const
All values hold a context through their type.
Definition Value.h:259
LLVM_ABI StringRef getName() const
Return a constant reference to the value's name.
Definition Value.cpp:322
An efficient, type-erasing, non-owning reference to a callable.
const ParentTy * getParent() const
Definition ilist_node.h:34
CallInst * Call
Changed
@ Tail
Attemps to make calls as fast as possible while guaranteeing that tail call optimization can always b...
Definition CallingConv.h:76
@ C
The default llvm calling convention, compatible with C.
Definition CallingConv.h:34
initializer< Ty > init(const Ty &Val)
This is an optimization pass for GlobalISel generic memory operations.
Definition Types.h:26
@ Offset
Definition DWP.cpp:532
constexpr auto not_equal_to(T &&Arg)
Functor variant of std::not_equal_to that can be used as a UnaryPredicate in functional algorithms li...
Definition STLExtras.h:2180
bool all_of(R &&range, UnaryPredicate P)
Provide wrappers to std::all_of which take ranges instead of having to pass begin/end explicitly.
Definition STLExtras.h:1739
LLVM_ABI std::string getIRPGOFuncName(const Function &F, bool InLTO=false)
auto enumerate(FirstRange &&First, RestRanges &&...Rest)
Given two or more input ranges, returns a new range whose values are tuples (A, B,...
Definition STLExtras.h:2554
decltype(auto) dyn_cast(const From &Val)
dyn_cast<X> - Return the argument parameter cast to the specified type.
Definition Casting.h:643
iterator_range< early_inc_iterator_impl< detail::IterOfRange< RangeT > > > make_early_inc_range(RangeT &&Range)
Make a range that does early increment to allow mutation of the underlying range without disrupting i...
Definition STLExtras.h:634
LLVM_ABI void setExplicitlyUnknownBranchWeights(Instruction &I, StringRef PassName)
Specify that the branch weights for this terminator cannot be known at compile time.
LLVM_ABI void setBranchWeights(Instruction &I, ArrayRef< uint32_t > Weights, bool IsExpected, bool ElideAllZero=false)
Create a new branch_weights metadata node and add or overwrite a prof metadata reference to instructi...
auto dyn_cast_or_null(const Y &Val)
Definition Casting.h:753
bool any_of(R &&range, UnaryPredicate P)
Provide wrappers to std::any_of which take ranges instead of having to pass begin/end explicitly.
Definition STLExtras.h:1746
LLVM_ABI Constant * ConstantFoldLoadFromConst(Constant *C, Type *Ty, const APInt &Offset, const DataLayout &DL)
Extract value of C at the given Offset reinterpreted as Ty.
LLVM_ABI SmallVector< InstrProfValueData, 4 > getValueProfDataFromInst(const Instruction &Inst, InstrProfValueKind ValueKind, uint32_t MaxNumValueData, uint64_t &TotalC, bool GetNoICPValue=false)
Extract the value profile data from Inst and returns them if Inst is annotated with value profile dat...
LLVM_ABI bool isValueProfileMD(const MDNode *ProfileData)
Checks if an MDNode contains value profiling Metadata.
LLVM_ABI BasicBlock * SplitBlock(BasicBlock *Old, BasicBlock::iterator SplitPt, DominatorTree *DT, LoopInfo *LI=nullptr, MemorySSAUpdater *MSSAU=nullptr, const Twine &BBName="")
Split the specified block at the specified instruction.
constexpr unsigned BitWidth
decltype(auto) cast(const From &Val)
cast<X> - Return the argument parameter cast to the specified type.
Definition Casting.h:559
cl::opt< bool > ProfcheckDisableMetadataFixes("profcheck-disable-metadata-fixes", cl::Hidden, cl::init(false), cl::desc("Disable metadata propagation fixes discovered through Issue #147390"))
Definition Metadata.cpp:64
AnalysisManager< Function > FunctionAnalysisManager
Convenience typedef for the Function analysis manager.
LLVM_ABI SmallVector< uint32_t > downscaleWeights(ArrayRef< uint64_t > Weights, std::optional< uint64_t > KnownMaxCount=std::nullopt)
downscale the given weights preserving the ratio.
#define N
A MapVector that performs no allocations if smaller than a certain size.
Definition MapVector.h:276