LLVM 22.0.0git
VPRecipeBuilder.h
Go to the documentation of this file.
1//===- VPRecipeBuilder.h - Helper class to build recipes --------*- C++ -*-===//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7//===----------------------------------------------------------------------===//
8
9#ifndef LLVM_TRANSFORMS_VECTORIZE_VPRECIPEBUILDER_H
10#define LLVM_TRANSFORMS_VECTORIZE_VPRECIPEBUILDER_H
11
13#include "VPlan.h"
14#include "llvm/ADT/DenseMap.h"
16
17namespace llvm {
18
23struct HistogramInfo;
24struct VFRange;
25
26/// A chain of instructions that form a partial reduction.
27/// Designed to match either:
28/// reduction_bin_op (extend (A), accumulator), or
29/// reduction_bin_op (bin_op (extend (A), (extend (B))), accumulator).
35 /// The top-level binary operation that forms the reduction to a scalar
36 /// after the loop body.
38 /// The extension of each of the inner binary operation's operands.
41
42 /// The user of the extends that is then reduced.
44};
45
46/// Helper class to create VPRecipies from IR instructions.
48 /// The VPlan new recipes are added to.
49 VPlan &Plan;
50
51 /// The loop that we evaluate.
52 Loop *OrigLoop;
53
54 /// Target Library Info.
55 const TargetLibraryInfo *TLI;
56
57 // Target Transform Info.
58 const TargetTransformInfo *TTI;
59
60 /// The legality analysis.
62
63 /// The profitablity analysis.
65
67
68 VPBuilder &Builder;
69
70 /// The mask of each VPBB, generated earlier and used for predicating recipes
71 /// in VPBB.
72 /// TODO: remove by applying predication when generating the masks.
74
75 // VPlan construction support: Hold a mapping from ingredients to
76 // their recipe.
78
79 /// Cross-iteration reduction & first-order recurrence phis for which we need
80 /// to add the incoming value from the backedge after all recipes have been
81 /// created.
83
84 /// A mapping of partial reduction exit instructions to their scaling factor.
86
87 /// Check if \p I can be widened at the start of \p Range and possibly
88 /// decrease the range such that the returned value holds for the entire \p
89 /// Range. The function should not be called for memory instructions or calls.
90 bool shouldWiden(Instruction *I, VFRange &Range) const;
91
92 /// Check if the load or store instruction \p VPI should widened for \p
93 /// Range.Start and potentially masked. Such instructions are handled by a
94 /// recipe that takes an additional VPInstruction for the mask.
95 VPWidenMemoryRecipe *tryToWidenMemory(VPInstruction *VPI, VFRange &Range);
96
97 /// Check if an induction recipe should be constructed for \p VPI. If so build
98 /// and return it. If not, return null.
99 VPHeaderPHIRecipe *tryToOptimizeInductionPHI(VPInstruction *VPI);
100
101 /// Optimize the special case where the operand of \p VPI is a constant
102 /// integer induction variable.
104 tryToOptimizeInductionTruncate(VPInstruction *VPI, VFRange &Range);
105
106 /// Handle call instructions. If \p VPI can be widened for \p Range.Start,
107 /// return a new VPWidenCallRecipe or VPWidenIntrinsicRecipe. Range.End may be
108 /// decreased to ensure same decision from \p Range.Start to \p Range.End.
109 VPSingleDefRecipe *tryToWidenCall(VPInstruction *VPI, VFRange &Range);
110
111 /// Check if \p VPI has an opcode that can be widened and return a
112 /// VPWidenRecipe if it can. The function should only be called if the
113 /// cost-model indicates that widening should be performed.
114 VPWidenRecipe *tryToWiden(VPInstruction *VPI);
115
116 /// Makes Histogram count operations safe for vectorization, by emitting a
117 /// llvm.experimental.vector.histogram.add intrinsic in place of the
118 /// Load + Add|Sub + Store operations that perform the histogram in the
119 /// original scalar loop.
120 VPHistogramRecipe *tryToWidenHistogram(const HistogramInfo *HI,
121 VPInstruction *VPI);
122
123 /// Examines reduction operations to see if the target can use a cheaper
124 /// operation with a wider per-iteration input VF and narrower PHI VF.
125 /// Each element within Chains is a pair with a struct containing reduction
126 /// information and the scaling factor between the number of elements in
127 /// the input and output.
128 /// Recursively calls itself to identify chained scaled reductions.
129 /// Returns true if this invocation added an entry to Chains, otherwise false.
130 /// i.e. returns false in the case that a subcall adds an entry to Chains,
131 /// but the top-level call does not.
132 bool getScaledReductions(
133 Instruction *PHI, Instruction *RdxExitInstr, VFRange &Range,
134 SmallVectorImpl<std::pair<PartialReductionChain, unsigned>> &Chains);
135
136public:
137 VPRecipeBuilder(VPlan &Plan, Loop *OrigLoop, const TargetLibraryInfo *TLI,
138 const TargetTransformInfo *TTI,
143 : Plan(Plan), OrigLoop(OrigLoop), TLI(TLI), TTI(TTI), Legal(Legal),
144 CM(CM), PSE(PSE), Builder(Builder), BlockMaskCache(BlockMaskCache) {}
145
146 std::optional<unsigned> getScalingForReduction(const Instruction *ExitInst) {
147 auto It = ScaledReductionMap.find(ExitInst);
148 return It == ScaledReductionMap.end() ? std::nullopt
149 : std::make_optional(It->second);
150 }
151
152 /// Find all possible partial reductions in the loop and track all of those
153 /// that are valid so recipes can be formed later.
155
156 /// Create and return a widened recipe for \p R if one can be created within
157 /// the given VF \p Range.
159
160 /// Create and return a partial reduction recipe for a reduction instruction
161 /// along with binary operation and reduction phi operands.
163 unsigned ScaleFactor);
164
165 /// Set the recipe created for given ingredient.
167 assert(!Ingredient2Recipe.contains(I) &&
168 "Cannot reset recipe for instruction.");
169 Ingredient2Recipe[I] = R;
170 }
171
172 /// Returns the *entry* mask for block \p VPBB or null if the mask is
173 /// all-true.
175 return BlockMaskCache.lookup(VPBB);
176 }
177
178 /// Return the recipe created for given ingredient.
180 assert(Ingredient2Recipe.count(I) &&
181 "Recording this ingredients recipe was not requested");
182 assert(Ingredient2Recipe[I] != nullptr &&
183 "Ingredient doesn't have a recipe");
184 return Ingredient2Recipe[I];
185 }
186
187 /// Build a VPReplicationRecipe for \p VPI. If it is predicated, add the mask
188 /// as last operand. Range.End may be decreased to ensure same recipe behavior
189 /// from \p Range.Start to \p Range.End.
191
193 if (auto *I = dyn_cast<Instruction>(V)) {
194 if (auto *R = Ingredient2Recipe.lookup(I))
195 return R->getVPSingleValue();
196 }
197 return Plan.getOrAddLiveIn(V);
198 }
199
201 for (auto &[_, V] : BlockMaskCache) {
202 if (auto *New = Old2New.lookup(V)) {
203 V->replaceAllUsesWith(New);
204 V = New;
205 }
206 }
207 }
208};
209} // end namespace llvm
210
211#endif // LLVM_TRANSFORMS_VECTORIZE_VPRECIPEBUILDER_H
assert(UImm &&(UImm !=~static_cast< T >(0)) &&"Invalid immediate!")
Rewrite undef for PHI
This file defines the DenseMap class.
#define _
This file provides a LoopVectorizationPlanner class.
#define I(x, y, z)
Definition MD5.cpp:57
ConstantRange Range(APInt(BitWidth, Low), APInt(BitWidth, High))
This file contains the declarations of the Vectorization Plan base classes:
ValueT lookup(const_arg_type_t< KeyT > Val) const
lookup - Return the entry for the specified key, or a default constructed value if no such entry exis...
Definition DenseMap.h:205
LoopVectorizationCostModel - estimates the expected speedups due to vectorization.
LoopVectorizationLegality checks if it is legal to vectorize a loop, and to what vectorization factor...
Represents a single loop in the control flow graph.
Definition LoopInfo.h:40
An interface layer with SCEV used to manage how we see SCEV expressions for values in the context of ...
This class consists of common code factored out of the SmallVector class to reduce code duplication b...
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small.
Provides information about what library functions are available for the current target.
This pass provides access to the codegen interfaces that are needed for IR-level transformations.
VPBasicBlock serves as the leaf of the Hierarchical Control-Flow Graph.
Definition VPlan.h:3971
VPlan-based builder utility analogous to IRBuilder.
A pure virtual base class for all recipes modeling header phis, including phis for first order recurr...
Definition VPlan.h:2054
A recipe representing a sequence of load -> update -> store as part of a histogram operation.
Definition VPlan.h:1762
This is a concrete Recipe that models a single VPlan-level instruction.
Definition VPlan.h:1031
VPRecipeBase is a base class modeling a sequence of one or more output IR instructions.
Definition VPlan.h:387
VPRecipeBase * tryToCreateWidenRecipe(VPSingleDefRecipe *R, VFRange &Range)
Create and return a widened recipe for R if one can be created within the given VF Range.
VPValue * getBlockInMask(VPBasicBlock *VPBB) const
Returns the entry mask for block VPBB or null if the mask is all-true.
VPRecipeBuilder(VPlan &Plan, Loop *OrigLoop, const TargetLibraryInfo *TLI, const TargetTransformInfo *TTI, LoopVectorizationLegality *Legal, LoopVectorizationCostModel &CM, PredicatedScalarEvolution &PSE, VPBuilder &Builder, DenseMap< VPBasicBlock *, VPValue * > &BlockMaskCache)
VPValue * getVPValueOrAddLiveIn(Value *V)
VPRecipeBase * tryToCreatePartialReduction(VPInstruction *Reduction, unsigned ScaleFactor)
Create and return a partial reduction recipe for a reduction instruction along with binary operation ...
std::optional< unsigned > getScalingForReduction(const Instruction *ExitInst)
void collectScaledReductions(VFRange &Range)
Find all possible partial reductions in the loop and track all of those that are valid so recipes can...
void setRecipe(Instruction *I, VPRecipeBase *R)
Set the recipe created for given ingredient.
VPReplicateRecipe * handleReplication(VPInstruction *VPI, VFRange &Range)
Build a VPReplicationRecipe for VPI.
VPRecipeBase * getRecipe(Instruction *I)
Return the recipe created for given ingredient.
void updateBlockMaskCache(DenseMap< VPValue *, VPValue * > &Old2New)
VPReplicateRecipe replicates a given instruction producing multiple scalar copies of the original sca...
Definition VPlan.h:2940
VPSingleDef is a base class for recipes for modeling a sequence of one or more output IR that define ...
Definition VPlan.h:531
This is the base class of the VPlan Def/Use graph, used for modeling the data flow into,...
Definition VPlanValue.h:48
A recipe for handling phi nodes of integer and floating-point inductions, producing their vector valu...
Definition VPlan.h:2197
A common base class for widening memory operations.
Definition VPlan.h:3251
VPWidenRecipe is a recipe for producing a widened instruction using the opcode and operands of the re...
Definition VPlan.h:1509
VPlan models a candidate for vectorization, encoding various decisions take to produce efficient outp...
Definition VPlan.h:4289
LLVM Value Representation.
Definition Value.h:75
This is an optimization pass for GlobalISel generic memory operations.
decltype(auto) dyn_cast(const From &Val)
dyn_cast<X> - Return the argument parameter cast to the specified type.
Definition Casting.h:643
This holds details about a histogram operation – a load -> update -> store sequence where each lane i...
PartialReductionChain(Instruction *Reduction, Instruction *ExtendA, Instruction *ExtendB, Instruction *ExtendUser)
Instruction * ExtendUser
The user of the extends that is then reduced.
Instruction * Reduction
The top-level binary operation that forms the reduction to a scalar after the loop body.
Instruction * ExtendA
The extension of each of the inner binary operation's operands.
A range of powers-of-2 vectorization factors with fixed start and adjustable end.