LLVM 20.0.0git
VPRecipeBuilder.h
Go to the documentation of this file.
1//===- VPRecipeBuilder.h - Helper class to build recipes --------*- C++ -*-===//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7//===----------------------------------------------------------------------===//
8
9#ifndef LLVM_TRANSFORMS_VECTORIZE_VPRECIPEBUILDER_H
10#define LLVM_TRANSFORMS_VECTORIZE_VPRECIPEBUILDER_H
11
13#include "VPlan.h"
14#include "llvm/ADT/DenseMap.h"
17#include "llvm/IR/IRBuilder.h"
18
19namespace llvm {
20
21class LoopVectorizationLegality;
22class LoopVectorizationCostModel;
23class TargetLibraryInfo;
24class TargetTransformInfo;
25struct HistogramInfo;
26
27/// A chain of instructions that form a partial reduction.
28/// Designed to match: reduction_bin_op (bin_op (extend (A), (extend (B))),
29/// accumulator).
34 }
35 /// The top-level binary operation that forms the reduction to a scalar
36 /// after the loop body.
38 /// The extension of each of the inner binary operation's operands.
41
42 /// The binary operation using the extends that is then reduced.
44};
45
46/// Helper class to create VPRecipies from IR instructions.
48 /// The VPlan new recipes are added to.
49 VPlan &Plan;
50
51 /// The loop that we evaluate.
52 Loop *OrigLoop;
53
54 /// Target Library Info.
55 const TargetLibraryInfo *TLI;
56
57 // Target Transform Info.
59
60 /// The legality analysis.
62
63 /// The profitablity analysis.
65
67
68 VPBuilder &Builder;
69
70 /// When we if-convert we need to create edge masks. We have to cache values
71 /// so that we don't end up with exponential recursion/IR. Note that
72 /// if-conversion currently takes place during VPlan-construction, so these
73 /// caches are only used at that stage.
74 using EdgeMaskCacheTy =
77 EdgeMaskCacheTy EdgeMaskCache;
78 BlockMaskCacheTy BlockMaskCache;
79
80 // VPlan construction support: Hold a mapping from ingredients to
81 // their recipe.
83
84 /// Cross-iteration reduction & first-order recurrence phis for which we need
85 /// to add the incoming value from the backedge after all recipes have been
86 /// created.
88
89 /// The set of reduction exit instructions that will be scaled to
90 /// a smaller VF via partial reductions, paired with the scaling factor.
92 ScaledReductionExitInstrs;
93
94 /// Check if \p I can be widened at the start of \p Range and possibly
95 /// decrease the range such that the returned value holds for the entire \p
96 /// Range. The function should not be called for memory instructions or calls.
97 bool shouldWiden(Instruction *I, VFRange &Range) const;
98
99 /// Check if the load or store instruction \p I should widened for \p
100 /// Range.Start and potentially masked. Such instructions are handled by a
101 /// recipe that takes an additional VPInstruction for the mask.
102 VPWidenMemoryRecipe *tryToWidenMemory(Instruction *I,
104 VFRange &Range);
105
106 /// Check if an induction recipe should be constructed for \p Phi. If so build
107 /// and return it. If not, return null.
108 VPHeaderPHIRecipe *tryToOptimizeInductionPHI(PHINode *Phi,
110 VFRange &Range);
111
112 /// Optimize the special case where the operand of \p I is a constant integer
113 /// induction variable.
115 tryToOptimizeInductionTruncate(TruncInst *I, ArrayRef<VPValue *> Operands,
116 VFRange &Range);
117
118 /// Handle non-loop phi nodes. Return a new VPBlendRecipe otherwise. Currently
119 /// all such phi nodes are turned into a sequence of select instructions as
120 /// the vectorizer currently performs full if-conversion.
122
123 /// Handle call instructions. If \p CI can be widened for \p Range.Start,
124 /// return a new VPWidenCallRecipe or VPWidenIntrinsicRecipe. Range.End may be
125 /// decreased to ensure same decision from \p Range.Start to \p Range.End.
127 VFRange &Range);
128
129 /// Check if \p I has an opcode that can be widened and return a VPWidenRecipe
130 /// if it can. The function should only be called if the cost-model indicates
131 /// that widening should be performed.
133 VPBasicBlock *VPBB);
134
135 /// Makes Histogram count operations safe for vectorization, by emitting a
136 /// llvm.experimental.vector.histogram.add intrinsic in place of the
137 /// Load + Add|Sub + Store operations that perform the histogram in the
138 /// original scalar loop.
139 VPHistogramRecipe *tryToWidenHistogram(const HistogramInfo *HI,
141
142 /// Examines reduction operations to see if the target can use a cheaper
143 /// operation with a wider per-iteration input VF and narrower PHI VF.
144 /// Returns null if no scaled reduction was found, otherwise a pair with a
145 /// struct containing reduction information and the scaling factor between the
146 /// number of elements in the input and output.
147 std::optional<std::pair<PartialReductionChain, unsigned>>
148 getScaledReduction(PHINode *PHI, const RecurrenceDescriptor &Rdx,
149 VFRange &Range);
150
151public:
152 VPRecipeBuilder(VPlan &Plan, Loop *OrigLoop, const TargetLibraryInfo *TLI,
157 : Plan(Plan), OrigLoop(OrigLoop), TLI(TLI), TTI(TTI), Legal(Legal),
158 CM(CM), PSE(PSE), Builder(Builder) {}
159
160 std::optional<std::pair<PartialReductionChain, unsigned>>
162 auto It = ScaledReductionExitInstrs.find(ExitInst);
163 return It == ScaledReductionExitInstrs.end()
164 ? std::nullopt
165 : std::make_optional(It->second);
166 }
167
168 /// Find all possible partial reductions in the loop and track all of those
169 /// that are valid so recipes can be formed later.
171
172 /// Create and return a widened recipe for \p I if one can be created within
173 /// the given VF \p Range.
176 VFRange &Range, VPBasicBlock *VPBB);
177
178 /// Create and return a partial reduction recipe for a reduction instruction
179 /// along with binary operation and reduction phi operands.
182
183 /// Set the recipe created for given ingredient.
185 assert(!Ingredient2Recipe.contains(I) &&
186 "Cannot reset recipe for instruction.");
187 Ingredient2Recipe[I] = R;
188 }
189
190 /// Create the mask for the vector loop header block.
191 void createHeaderMask();
192
193 /// A helper function that computes the predicate of the block BB, assuming
194 /// that the header block of the loop is set to True or the loop mask when
195 /// tail folding.
197
198 /// Returns the *entry* mask for the block \p BB.
200
201 /// Create an edge mask for every destination of cases and/or default.
203
204 /// A helper function that computes the predicate of the edge between SRC
205 /// and DST.
207
208 /// A helper that returns the previously computed predicate of the edge
209 /// between SRC and DST.
210 VPValue *getEdgeMask(BasicBlock *Src, BasicBlock *Dst) const;
211
212 /// Return the recipe created for given ingredient.
214 assert(Ingredient2Recipe.count(I) &&
215 "Recording this ingredients recipe was not requested");
216 assert(Ingredient2Recipe[I] != nullptr &&
217 "Ingredient doesn't have a recipe");
218 return Ingredient2Recipe[I];
219 }
220
221 /// Build a VPReplicationRecipe for \p I. If it is predicated, add the mask as
222 /// last operand. Range.End may be decreased to ensure same recipe behavior
223 /// from \p Range.Start to \p Range.End.
225
226 /// Add the incoming values from the backedge to reduction & first-order
227 /// recurrence cross-iteration phis.
228 void fixHeaderPhis();
229
230 /// Returns a range mapping the values of the range \p Operands to their
231 /// corresponding VPValues.
232 iterator_range<mapped_iterator<Use *, std::function<VPValue *(Value *)>>>
234
236 if (auto *I = dyn_cast<Instruction>(V)) {
237 if (auto *R = Ingredient2Recipe.lookup(I))
238 return R->getVPSingleValue();
239 }
240 return Plan.getOrAddLiveIn(V);
241 }
242};
243} // end namespace llvm
244
245#endif // LLVM_TRANSFORMS_VECTORIZE_VPRECIPEBUILDER_H
Rewrite undef for PHI
This file defines the DenseMap class.
This file provides a LoopVectorizationPlanner class.
#define I(x, y, z)
Definition: MD5.cpp:58
mir Rename Register Operands
ConstantRange Range(APInt(BitWidth, Low), APInt(BitWidth, High))
This file defines the PointerUnion class, which is a discriminated union of pointer types.
assert(ImpDefSCC.getReg()==AMDGPU::SCC &&ImpDefSCC.isDef())
This file contains the declarations of the Vectorization Plan base classes:
ArrayRef - Represent a constant reference to an array (0 or more elements consecutively in memory),...
Definition: ArrayRef.h:41
LLVM Basic Block Representation.
Definition: BasicBlock.h:61
This class represents a function call, abstracting a target machine's calling convention.
ValueT lookup(const_arg_type_t< KeyT > Val) const
lookup - Return the entry for the specified key, or a default constructed value if no such entry exis...
Definition: DenseMap.h:194
iterator find(const_arg_type_t< KeyT > Val)
Definition: DenseMap.h:156
size_type count(const_arg_type_t< KeyT > Val) const
Return 1 if the specified key is in the map, 0 otherwise.
Definition: DenseMap.h:152
iterator end()
Definition: DenseMap.h:84
bool contains(const_arg_type_t< KeyT > Val) const
Return true if the specified key is in the map, false otherwise.
Definition: DenseMap.h:147
LoopVectorizationCostModel - estimates the expected speedups due to vectorization.
LoopVectorizationLegality checks if it is legal to vectorize a loop, and to what vectorization factor...
Represents a single loop in the control flow graph.
Definition: LoopInfo.h:39
An interface layer with SCEV used to manage how we see SCEV expressions for values in the context of ...
The RecurrenceDescriptor is used to identify recurrences variables in a loop.
Definition: IVDescriptors.h:77
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small.
Definition: SmallVector.h:1196
Multiway switch.
Provides information about what library functions are available for the current target.
This pass provides access to the codegen interfaces that are needed for IR-level transformations.
This class represents a truncation of integer types.
A Use represents the edge between a Value definition and its users.
Definition: Use.h:43
VPBasicBlock serves as the leaf of the Hierarchical Control-Flow Graph.
Definition: VPlan.h:3529
A recipe for vectorizing a phi-node as a sequence of mask-based select instructions.
Definition: VPlan.h:2487
VPlan-based builder utility analogous to IRBuilder.
A pure virtual base class for all recipes modeling header phis, including phis for first order recurr...
Definition: VPlan.h:2026
A recipe representing a sequence of load -> update -> store as part of a histogram operation.
Definition: VPlan.h:1775
VPRecipeBase is a base class modeling a sequence of one or more output IR instructions.
Definition: VPlan.h:714
Helper class to create VPRecipies from IR instructions.
VPRecipeBase * tryToCreatePartialReduction(Instruction *Reduction, ArrayRef< VPValue * > Operands)
Create and return a partial reduction recipe for a reduction instruction along with binary operation ...
VPValue * createEdgeMask(BasicBlock *Src, BasicBlock *Dst)
A helper function that computes the predicate of the edge between SRC and DST.
VPReplicateRecipe * handleReplication(Instruction *I, VFRange &Range)
Build a VPReplicationRecipe for I.
void createSwitchEdgeMasks(SwitchInst *SI)
Create an edge mask for every destination of cases and/or default.
std::optional< std::pair< PartialReductionChain, unsigned > > getScaledReductionForInstr(const Instruction *ExitInst)
VPValue * getBlockInMask(BasicBlock *BB) const
Returns the entry mask for the block BB.
VPValue * getEdgeMask(BasicBlock *Src, BasicBlock *Dst) const
A helper that returns the previously computed predicate of the edge between SRC and DST.
iterator_range< mapped_iterator< Use *, std::function< VPValue *(Value *)> > > mapToVPValues(User::op_range Operands)
Returns a range mapping the values of the range Operands to their corresponding VPValues.
void fixHeaderPhis()
Add the incoming values from the backedge to reduction & first-order recurrence cross-iteration phis.
VPRecipeBase * tryToCreateWidenRecipe(Instruction *Instr, ArrayRef< VPValue * > Operands, VFRange &Range, VPBasicBlock *VPBB)
Create and return a widened recipe for I if one can be created within the given VF Range.
VPValue * getVPValueOrAddLiveIn(Value *V)
void createHeaderMask()
Create the mask for the vector loop header block.
void createBlockInMask(BasicBlock *BB)
A helper function that computes the predicate of the block BB, assuming that the header block of the ...
void collectScaledReductions(VFRange &Range)
Find all possible partial reductions in the loop and track all of those that are valid so recipes can...
void setRecipe(Instruction *I, VPRecipeBase *R)
Set the recipe created for given ingredient.
VPRecipeBase * getRecipe(Instruction *I)
Return the recipe created for given ingredient.
VPRecipeBuilder(VPlan &Plan, Loop *OrigLoop, const TargetLibraryInfo *TLI, const TargetTransformInfo *TTI, LoopVectorizationLegality *Legal, LoopVectorizationCostModel &CM, PredicatedScalarEvolution &PSE, VPBuilder &Builder)
VPReplicateRecipe replicates a given instruction producing multiple scalar copies of the original sca...
Definition: VPlan.h:2770
VPSingleDef is a base class for recipes for modeling a sequence of one or more output IR that define ...
Definition: VPlan.h:841
A recipe for handling phi nodes of integer and floating-point inductions, producing their vector valu...
Definition: VPlan.h:2141
A common base class for widening memory operations.
Definition: VPlan.h:2943
VPWidenRecipe is a recipe for producing a widened instruction using the opcode and operands of the re...
Definition: VPlan.h:1429
VPlan models a candidate for vectorization, encoding various decisions take to produce efficient outp...
Definition: VPlan.h:3796
VPValue * getOrAddLiveIn(Value *V)
Gets the live-in VPValue for V or adds a new live-in (if none exists yet) for V.
Definition: VPlan.h:4020
LLVM Value Representation.
Definition: Value.h:74
A range adaptor for a pair of iterators.
This is an optimization pass for GlobalISel generic memory operations.
Definition: AddressRanges.h:18
This holds details about a histogram operation – a load -> update -> store sequence where each lane i...
A chain of instructions that form a partial reduction.
Instruction * BinOp
The binary operation using the extends that is then reduced.
PartialReductionChain(Instruction *Reduction, Instruction *ExtendA, Instruction *ExtendB, Instruction *BinOp)
Instruction * Reduction
The top-level binary operation that forms the reduction to a scalar after the loop body.
Instruction * ExtendA
The extension of each of the inner binary operation's operands.
A range of powers-of-2 vectorization factors with fixed start and adjustable end.
Definition: VPlan.h:97