LLVM 23.0.0git
VPlanUtils.h
Go to the documentation of this file.
1//===- VPlanUtils.h - VPlan-related utilities -------------------*- C++ -*-===//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7//===----------------------------------------------------------------------===//
8
9#ifndef LLVM_TRANSFORMS_VECTORIZE_VPLANUTILS_H
10#define LLVM_TRANSFORMS_VECTORIZE_VPLANUTILS_H
11
12#include "VPlan.h"
13#include "VPlanPatternMatch.h"
15
16namespace llvm {
17class MemoryLocation;
18class ScalarEvolution;
19class SCEV;
21} // namespace llvm
22
23namespace llvm {
24
25namespace vputils {
26/// Returns true if only the first lane of \p Def is used.
27bool onlyFirstLaneUsed(const VPValue *Def);
28
29/// Returns true if only the first part of \p Def is used.
30bool onlyFirstPartUsed(const VPValue *Def);
31
32/// Returns true if only scalar values of \p Def are used by all users.
33bool onlyScalarValuesUsed(const VPValue *Def);
34
35/// Get or create a VPValue that corresponds to the expansion of \p Expr. If \p
36/// Expr is a SCEVConstant or SCEVUnknown, return a VPValue wrapping the live-in
37/// value. Otherwise return a VPExpandSCEVRecipe to expand \p Expr. If \p Plan's
38/// pre-header already contains a recipe expanding \p Expr, return it. If not,
39/// create a new one.
41
42/// Return the SCEV expression for \p V. Returns SCEVCouldNotCompute if no
43/// SCEV expression could be constructed.
44const SCEV *getSCEVExprForVPValue(const VPValue *V,
46 const Loop *L = nullptr);
47
48/// Returns true if \p Addr is an address SCEV that can be passed to
49/// TTI::getAddressComputationCost, i.e. the address SCEV is loop invariant, an
50/// affine AddRec (i.e. induction ), or an add expression of such operands or a
51/// sign-extended AddRec.
52bool isAddressSCEVForCost(const SCEV *Addr, ScalarEvolution &SE, const Loop *L);
53
54/// Returns true if \p VPV is a single scalar, either because it produces the
55/// same value for all lanes or only has its first lane used.
56bool isSingleScalar(const VPValue *VPV);
57
58/// Return true if \p V is a header mask in \p Plan.
59bool isHeaderMask(const VPValue *V, const VPlan &Plan);
60
61/// Checks if \p V is uniform across all VF lanes and UF parts. It is considered
62/// as such if it is either loop invariant (defined outside the vector region)
63/// or its operand is known to be uniform across all VFs and UFs (e.g.
64/// VPDerivedIV or VPCanonicalIVPHI).
66
67/// Returns the header block of the first, top-level loop, or null if none
68/// exist.
70
71/// Get the VF scaling factor applied to the recipe's output, if the recipe has
72/// one.
74
75/// Returns the VPValue representing the uncountable exit comparison used by
76/// AnyOf if the recipes it depends on can be traced back to live-ins and
77/// the addresses (in GEP/PtrAdd form) of any (non-masked) load used in
78/// generating the values for the comparison. The recipes are stored in
79/// \p Recipes, and recipes forming an address for a load are also added to
80/// \p GEPs.
82std::optional<VPValue *>
86
87/// Return a MemoryLocation for \p R with noalias metadata populated from
88/// \p R, if the recipe is supported and std::nullopt otherwise. The pointer of
89/// the location is conservatively set to nullptr.
90std::optional<MemoryLocation> getMemoryLocation(const VPRecipeBase &R);
91
92/// Extracts and returns NoWrap and FastMath flags from the induction binop in
93/// \p ID.
96 return ID.getInductionBinOp()->getFastMathFlags();
97
99 ID.getInductionBinOp()))
100 return VPIRFlags::WrapFlagsTy(OBO->hasNoUnsignedWrap(),
101 OBO->hasNoSignedWrap());
102
104 "Expected int induction");
105 return VPIRFlags::WrapFlagsTy(false, false);
106}
107
108/// Search \p Start's users for a recipe satisfying \p Pred, looking through
109/// recipes with definitions.
110template <typename PredT>
111inline VPRecipeBase *findRecipe(VPValue *Start, PredT Pred) {
112 SetVector<VPValue *> Worklist;
113 Worklist.insert(Start);
114 for (unsigned I = 0; I != Worklist.size(); ++I) {
115 VPValue *Cur = Worklist[I];
116 auto *R = Cur->getDefiningRecipe();
117 if (!R)
118 continue;
119 if (Pred(R))
120 return R;
121 for (VPUser *U : Cur->users()) {
122 for (VPValue *V : cast<VPRecipeBase>(U)->definedValues())
123 Worklist.insert(V);
124 }
125 }
126 return nullptr;
127}
128
129/// If \p V is used by a recipe matching pattern \p P, return it. Otherwise
130/// return nullptr;
131template <typename MatchT>
132static VPRecipeBase *findUserOf(VPValue *V, const MatchT &P) {
133 auto It = find_if(V->users(), match_fn(P));
134 return It == V->user_end() ? nullptr : cast<VPRecipeBase>(*It);
135}
136
137/// If \p V is used by a VPInstruction with \p Opcode, return it. Otherwise
138/// return nullptr.
139template <unsigned Opcode> static VPInstruction *findUserOf(VPValue *V) {
140 using namespace llvm::VPlanPatternMatch;
142}
143
144/// Find the ComputeReductionResult recipe for \p PhiR, looking through selects
145/// inserted for predicated reductions or tail folding.
147
148/// Collect the header mask with the pattern:
149/// (ICMP_ULE, WideCanonicalIV, backedge-taken-count)
150/// TODO: Introduce explicit recipe for header-mask instead of searching
151/// the header-mask pattern manually.
153
154} // namespace vputils
155
156//===----------------------------------------------------------------------===//
157// Utilities for modifying predecessors and successors of VPlan blocks.
158//===----------------------------------------------------------------------===//
159
160/// Class that provides utilities for VPBlockBases in VPlan.
162public:
163 VPBlockUtils() = delete;
164
165 /// Insert disconnected VPBlockBase \p NewBlock after \p BlockPtr. Add \p
166 /// NewBlock as successor of \p BlockPtr and \p BlockPtr as predecessor of \p
167 /// NewBlock, and propagate \p BlockPtr parent to \p NewBlock. \p BlockPtr's
168 /// successors are moved from \p BlockPtr to \p NewBlock. \p NewBlock must
169 /// have neither successors nor predecessors.
170 static void insertBlockAfter(VPBlockBase *NewBlock, VPBlockBase *BlockPtr) {
171 assert(!NewBlock->hasSuccessors() && !NewBlock->hasPredecessors() &&
172 "Can't insert new block with predecessors or successors.");
173 NewBlock->setParent(BlockPtr->getParent());
174 transferSuccessors(BlockPtr, NewBlock);
175 connectBlocks(BlockPtr, NewBlock);
176 }
177
178 /// Insert disconnected block \p NewBlock before \p Blockptr. First
179 /// disconnects all predecessors of \p BlockPtr and connects them to \p
180 /// NewBlock. Add \p NewBlock as predecessor of \p BlockPtr and \p BlockPtr as
181 /// successor of \p NewBlock.
182 static void insertBlockBefore(VPBlockBase *NewBlock, VPBlockBase *BlockPtr) {
183 assert(!NewBlock->hasSuccessors() && !NewBlock->hasPredecessors() &&
184 "Can't insert new block with predecessors or successors.");
185 NewBlock->setParent(BlockPtr->getParent());
186 for (VPBlockBase *Pred : to_vector(BlockPtr->predecessors())) {
187 Pred->replaceSuccessor(BlockPtr, NewBlock);
188 NewBlock->appendPredecessor(Pred);
189 }
190 BlockPtr->clearPredecessors();
191 connectBlocks(NewBlock, BlockPtr);
192 }
193
194 /// Insert disconnected VPBlockBases \p IfTrue and \p IfFalse after \p
195 /// BlockPtr. Add \p IfTrue and \p IfFalse as succesors of \p BlockPtr and \p
196 /// BlockPtr as predecessor of \p IfTrue and \p IfFalse. Propagate \p BlockPtr
197 /// parent to \p IfTrue and \p IfFalse. \p BlockPtr must have no successors
198 /// and \p IfTrue and \p IfFalse must have neither successors nor
199 /// predecessors.
200 static void insertTwoBlocksAfter(VPBlockBase *IfTrue, VPBlockBase *IfFalse,
201 VPBlockBase *BlockPtr) {
202 assert(!IfTrue->hasSuccessors() && "Can't insert IfTrue with successors.");
203 assert(!IfFalse->hasSuccessors() &&
204 "Can't insert IfFalse with successors.");
205 BlockPtr->setTwoSuccessors(IfTrue, IfFalse);
206 IfTrue->setPredecessors({BlockPtr});
207 IfFalse->setPredecessors({BlockPtr});
208 IfTrue->setParent(BlockPtr->getParent());
209 IfFalse->setParent(BlockPtr->getParent());
210 }
211
212 /// Connect VPBlockBases \p From and \p To bi-directionally. If \p PredIdx is
213 /// -1, append \p From to the predecessors of \p To, otherwise set \p To's
214 /// predecessor at \p PredIdx to \p From. If \p SuccIdx is -1, append \p To to
215 /// the successors of \p From, otherwise set \p From's successor at \p SuccIdx
216 /// to \p To. Both VPBlockBases must have the same parent, which can be null.
217 /// Both VPBlockBases can be already connected to other VPBlockBases.
218 static void connectBlocks(VPBlockBase *From, VPBlockBase *To,
219 unsigned PredIdx = -1u, unsigned SuccIdx = -1u) {
220 assert((From->getParent() == To->getParent()) &&
221 "Can't connect two block with different parents");
222
223 if (SuccIdx == -1u)
224 From->appendSuccessor(To);
225 else
226 From->getSuccessors()[SuccIdx] = To;
227
228 if (PredIdx == -1u)
229 To->appendPredecessor(From);
230 else
231 To->getPredecessors()[PredIdx] = From;
232 }
233
234 /// Disconnect VPBlockBases \p From and \p To bi-directionally. Remove \p To
235 /// from the successors of \p From and \p From from the predecessors of \p To.
236 static void disconnectBlocks(VPBlockBase *From, VPBlockBase *To) {
237 assert(To && "Successor to disconnect is null.");
238 From->removeSuccessor(To);
239 To->removePredecessor(From);
240 }
241
242 /// Reassociate all the blocks connected to \p Old so that they now point to
243 /// \p New.
244 static void reassociateBlocks(VPBlockBase *Old, VPBlockBase *New) {
245 for (auto *Pred : to_vector(Old->getPredecessors()))
246 Pred->replaceSuccessor(Old, New);
247 for (auto *Succ : to_vector(Old->getSuccessors()))
248 Succ->replacePredecessor(Old, New);
249 New->setPredecessors(Old->getPredecessors());
250 New->setSuccessors(Old->getSuccessors());
251 Old->clearPredecessors();
252 Old->clearSuccessors();
253 }
254
255 /// Transfer successors from \p Old to \p New. \p New must have no successors.
257 for (auto *Succ : Old->getSuccessors())
258 Succ->replacePredecessor(Old, New);
259 New->setSuccessors(Old->getSuccessors());
260 Old->clearSuccessors();
261 }
262
263 /// Return an iterator range over \p Range which only includes \p BlockTy
264 /// blocks. The accesses are casted to \p BlockTy.
265 template <typename BlockTy, typename T>
266 static auto blocksOnly(const T &Range) {
267 // Create BaseTy with correct const-ness based on BlockTy.
268 using BaseTy = std::conditional_t<std::is_const<BlockTy>::value,
269 const VPBlockBase, VPBlockBase>;
270
271 // We need to first create an iterator range over (const) BlocktTy & instead
272 // of (const) BlockTy * for filter_range to work properly.
273 auto Mapped =
274 map_range(Range, [](BaseTy *Block) -> BaseTy & { return *Block; });
276 Mapped, [](BaseTy &Block) { return isa<BlockTy>(&Block); });
277 return map_range(Filter, [](BaseTy &Block) -> BlockTy * {
278 return cast<BlockTy>(&Block);
279 });
280 }
281
282 /// Inserts \p BlockPtr on the edge between \p From and \p To. That is, update
283 /// \p From's successor to \p To to point to \p BlockPtr and \p To's
284 /// predecessor from \p From to \p BlockPtr. \p From and \p To are added to \p
285 /// BlockPtr's predecessors and successors respectively. There must be a
286 /// single edge between \p From and \p To.
287 static void insertOnEdge(VPBlockBase *From, VPBlockBase *To,
288 VPBlockBase *BlockPtr) {
289 unsigned SuccIdx = From->getIndexForSuccessor(To);
290 unsigned PredIx = To->getIndexForPredecessor(From);
291 VPBlockUtils::connectBlocks(From, BlockPtr, -1, SuccIdx);
292 VPBlockUtils::connectBlocks(BlockPtr, To, PredIx, -1);
293 }
294
295 /// Returns true if \p VPB is a loop header, based on regions or \p VPDT in
296 /// their absence.
297 static bool isHeader(const VPBlockBase *VPB, const VPDominatorTree &VPDT);
298
299 /// Returns true if \p VPB is a loop latch, using isHeader().
300 static bool isLatch(const VPBlockBase *VPB, const VPDominatorTree &VPDT);
301};
302
303} // namespace llvm
304
305#endif
assert(UImm &&(UImm !=~static_cast< T >(0)) &&"Invalid immediate!")
#define LLVM_ABI_FOR_TEST
Definition Compiler.h:218
std::pair< BasicBlock *, unsigned > BlockTy
A pair of (basic block, score).
#define I(x, y, z)
Definition MD5.cpp:57
#define T
ConstantRange Range(APInt(BitWidth, Low), APInt(BitWidth, High))
#define P(N)
This file contains the declarations of the Vectorization Plan base classes:
A struct for saving information about induction variables.
@ IK_FpInduction
Floating point induction variable.
@ IK_IntInduction
Integer induction variable. Step = C.
Represents a single loop in the control flow graph.
Definition LoopInfo.h:40
Representation for a specific memory location.
An interface layer with SCEV used to manage how we see SCEV expressions for values in the context of ...
This class represents an analyzed expression in the program.
The main scalar evolution driver.
A vector that has set insertion semantics.
Definition SetVector.h:57
size_type size() const
Determine the number of elements in the SetVector.
Definition SetVector.h:103
bool insert(const value_type &X)
Insert a new element into the SetVector.
Definition SetVector.h:151
This class consists of common code factored out of the SmallVector class to reduce code duplication b...
VPBasicBlock serves as the leaf of the Hierarchical Control-Flow Graph.
Definition VPlan.h:4239
VPBlockBase is the building block of the Hierarchical Control-Flow Graph.
Definition VPlan.h:82
VPRegionBlock * getParent()
Definition VPlan.h:174
iterator_range< VPBlockBase ** > predecessors()
Definition VPlan.h:208
bool hasPredecessors() const
Returns true if this block has any predecessors.
Definition VPlan.h:205
unsigned getIndexForSuccessor(const VPBlockBase *Succ) const
Returns the index for Succ in the blocks successor list.
Definition VPlan.h:338
void setPredecessors(ArrayRef< VPBlockBase * > NewPreds)
Set each VPBasicBlock in NewPreds as predecessor of this VPBlockBase.
Definition VPlan.h:294
unsigned getIndexForPredecessor(const VPBlockBase *Pred) const
Returns the index for Pred in the blocks predecessors list.
Definition VPlan.h:331
bool hasSuccessors() const
Returns true if this block has any successors.
Definition VPlan.h:203
const VPBlocksTy & getPredecessors() const
Definition VPlan.h:210
void clearSuccessors()
Remove all the successors of this block.
Definition VPlan.h:313
void setTwoSuccessors(VPBlockBase *IfTrue, VPBlockBase *IfFalse)
Set two given VPBlockBases IfTrue and IfFalse to be the two successors of this VPBlockBase.
Definition VPlan.h:285
void clearPredecessors()
Remove all the predecessor of this block.
Definition VPlan.h:310
void setParent(VPRegionBlock *P)
Definition VPlan.h:185
const VPBlocksTy & getSuccessors() const
Definition VPlan.h:199
static auto blocksOnly(const T &Range)
Return an iterator range over Range which only includes BlockTy blocks.
Definition VPlanUtils.h:266
static void insertBlockAfter(VPBlockBase *NewBlock, VPBlockBase *BlockPtr)
Insert disconnected VPBlockBase NewBlock after BlockPtr.
Definition VPlanUtils.h:170
static void insertOnEdge(VPBlockBase *From, VPBlockBase *To, VPBlockBase *BlockPtr)
Inserts BlockPtr on the edge between From and To.
Definition VPlanUtils.h:287
static bool isLatch(const VPBlockBase *VPB, const VPDominatorTree &VPDT)
Returns true if VPB is a loop latch, using isHeader().
static bool isHeader(const VPBlockBase *VPB, const VPDominatorTree &VPDT)
Returns true if VPB is a loop header, based on regions or VPDT in their absence.
static void insertTwoBlocksAfter(VPBlockBase *IfTrue, VPBlockBase *IfFalse, VPBlockBase *BlockPtr)
Insert disconnected VPBlockBases IfTrue and IfFalse after BlockPtr.
Definition VPlanUtils.h:200
static void connectBlocks(VPBlockBase *From, VPBlockBase *To, unsigned PredIdx=-1u, unsigned SuccIdx=-1u)
Connect VPBlockBases From and To bi-directionally.
Definition VPlanUtils.h:218
static void disconnectBlocks(VPBlockBase *From, VPBlockBase *To)
Disconnect VPBlockBases From and To bi-directionally.
Definition VPlanUtils.h:236
static void reassociateBlocks(VPBlockBase *Old, VPBlockBase *New)
Reassociate all the blocks connected to Old so that they now point to New.
Definition VPlanUtils.h:244
static void insertBlockBefore(VPBlockBase *NewBlock, VPBlockBase *BlockPtr)
Insert disconnected block NewBlock before Blockptr.
Definition VPlanUtils.h:182
static void transferSuccessors(VPBlockBase *Old, VPBlockBase *New)
Transfer successors from Old to New. New must have no successors.
Definition VPlanUtils.h:256
Template specialization of the standard LLVM dominator tree utility for VPBlockBases.
Class to record and manage LLVM IR flags.
Definition VPlan.h:674
This is a concrete Recipe that models a single VPlan-level instruction.
Definition VPlan.h:1195
VPRecipeBase is a base class modeling a sequence of one or more output IR instructions.
Definition VPlan.h:390
A recipe for handling reduction phis.
Definition VPlan.h:2670
VPSingleDef is a base class for recipes for modeling a sequence of one or more output IR that define ...
Definition VPlan.h:591
This class augments VPValue with operands which provide the inverse def-use edges from VPValue's user...
Definition VPlanValue.h:297
This is the base class of the VPlan Def/Use graph, used for modeling the data flow into,...
Definition VPlanValue.h:46
VPRecipeBase * getDefiningRecipe()
Returns the recipe defining this VPValue or nullptr if it is not defined by a recipe,...
Definition VPlan.cpp:127
user_range users()
Definition VPlanValue.h:150
VPlan models a candidate for vectorization, encoding various decisions take to produce efficient outp...
Definition VPlan.h:4557
unsigned ID
LLVM IR allows to use arbitrary numbers as calling convention identifiers.
Definition CallingConv.h:24
auto match_fn(const Pattern &P)
A match functor that can be used as a UnaryPredicate in functional algorithms like all_of.
bind_ty< VPInstruction > m_VPInstruction(VPInstruction *&V)
Match a VPInstruction, capturing if we match.
bool isSingleScalar(const VPValue *VPV)
Returns true if VPV is a single scalar, either because it produces the same value for all lanes or on...
bool isUniformAcrossVFsAndUFs(VPValue *V)
Checks if V is uniform across all VF lanes and UF parts.
VPValue * getOrCreateVPValueForSCEVExpr(VPlan &Plan, const SCEV *Expr)
Get or create a VPValue that corresponds to the expansion of Expr.
VPBasicBlock * getFirstLoopHeader(VPlan &Plan, VPDominatorTree &VPDT)
Returns the header block of the first, top-level loop, or null if none exist.
bool isAddressSCEVForCost(const SCEV *Addr, ScalarEvolution &SE, const Loop *L)
Returns true if Addr is an address SCEV that can be passed to TTI::getAddressComputationCost,...
bool onlyFirstPartUsed(const VPValue *Def)
Returns true if only the first part of Def is used.
VPInstruction * findComputeReductionResult(VPReductionPHIRecipe *PhiR)
Find the ComputeReductionResult recipe for PhiR, looking through selects inserted for predicated redu...
std::optional< MemoryLocation > getMemoryLocation(const VPRecipeBase &R)
Return a MemoryLocation for R with noalias metadata populated from R, if the recipe is supported and ...
bool onlyFirstLaneUsed(const VPValue *Def)
Returns true if only the first lane of Def is used.
VPIRFlags getFlagsFromIndDesc(const InductionDescriptor &ID)
Extracts and returns NoWrap and FastMath flags from the induction binop in ID.
Definition VPlanUtils.h:94
VPRecipeBase * findRecipe(VPValue *Start, PredT Pred)
Search Start's users for a recipe satisfying Pred, looking through recipes with definitions.
Definition VPlanUtils.h:111
VPSingleDefRecipe * findHeaderMask(VPlan &Plan)
Collect the header mask with the pattern: (ICMP_ULE, WideCanonicalIV, backedge-taken-count) TODO: Int...
bool onlyScalarValuesUsed(const VPValue *Def)
Returns true if only scalar values of Def are used by all users.
static VPRecipeBase * findUserOf(VPValue *V, const MatchT &P)
If V is used by a recipe matching pattern P, return it.
Definition VPlanUtils.h:132
const SCEV * getSCEVExprForVPValue(const VPValue *V, PredicatedScalarEvolution &PSE, const Loop *L=nullptr)
Return the SCEV expression for V.
unsigned getVFScaleFactor(VPRecipeBase *R)
Get the VF scaling factor applied to the recipe's output, if the recipe has one.
bool isHeaderMask(const VPValue *V, const VPlan &Plan)
Return true if V is a header mask in Plan.
LLVM_ABI_FOR_TEST std::optional< VPValue * > getRecipesForUncountableExit(VPlan &Plan, SmallVectorImpl< VPRecipeBase * > &Recipes, SmallVectorImpl< VPRecipeBase * > &GEPs)
Returns the VPValue representing the uncountable exit comparison used by AnyOf if the recipes it depe...
This is an optimization pass for GlobalISel generic memory operations.
Definition Types.h:26
auto dyn_cast_if_present(const Y &Val)
dyn_cast_if_present<X> - Functionally identical to dyn_cast, except that a null (or none in the case ...
Definition Casting.h:732
auto cast_or_null(const Y &Val)
Definition Casting.h:714
auto map_range(ContainerTy &&C, FuncTy F)
Return a range that applies F to the elements of C.
Definition STLExtras.h:366
SmallVector< ValueTypeFromRangeType< R >, Size > to_vector(R &&Range)
Given a range of type R, iterate the entire range and return a SmallVector with elements of the vecto...
iterator_range< filter_iterator< detail::IterOfRange< RangeT >, PredicateT > > make_filter_range(RangeT &&Range, PredicateT Pred)
Convenience function that takes a range of elements and a predicate, and return a new filter_iterator...
Definition STLExtras.h:552
bool isa(const From &Val)
isa<X> - Return true if the parameter to the template is an instance of one of the template type argu...
Definition Casting.h:547
decltype(auto) cast(const From &Val)
cast<X> - Return the argument parameter cast to the specified type.
Definition Casting.h:559
auto find_if(R &&Range, UnaryPredicate P)
Provide wrappers to std::find_if which take ranges instead of having to pass begin/end explicitly.
Definition STLExtras.h:1772