LLVM 20.0.0git
LoopVectorizationLegality.h
Go to the documentation of this file.
1//===- llvm/Transforms/Vectorize/LoopVectorizationLegality.h ----*- C++ -*-===//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7//===----------------------------------------------------------------------===//
8//
9/// \file
10/// This file defines the LoopVectorizationLegality class. Original code
11/// in Loop Vectorizer has been moved out to its own file for modularity
12/// and reusability.
13///
14/// Currently, it works for innermost loop vectorization. Extending this to
15/// outer loop vectorization is a TODO item.
16///
17/// Also provides:
18/// 1) LoopVectorizeHints class which keeps a number of loop annotations
19/// locally for easy look up. It has the ability to write them back as
20/// loop metadata, upon request.
21/// 2) LoopVectorizationRequirements class for lazy bail out for the purpose
22/// of reporting useful failure to vectorize message.
23//
24//===----------------------------------------------------------------------===//
25
26#ifndef LLVM_TRANSFORMS_VECTORIZE_LOOPVECTORIZATIONLEGALITY_H
27#define LLVM_TRANSFORMS_VECTORIZE_LOOPVECTORIZATIONLEGALITY_H
28
29#include "llvm/ADT/MapVector.h"
33
34namespace llvm {
35class AssumptionCache;
36class BasicBlock;
37class BlockFrequencyInfo;
38class DemandedBits;
39class DominatorTree;
40class Function;
41class Loop;
42class LoopInfo;
43class Metadata;
44class OptimizationRemarkEmitter;
45class PredicatedScalarEvolution;
46class ProfileSummaryInfo;
47class TargetLibraryInfo;
48class TargetTransformInfo;
49class Type;
50
51/// Utility class for getting and setting loop vectorizer hints in the form
52/// of loop metadata.
53/// This class keeps a number of loop annotations locally (as member variables)
54/// and can, upon request, write them back as metadata on the loop. It will
55/// initially scan the loop for existing metadata, and will update the local
56/// values based on information in the loop.
57/// We cannot write all values to metadata, as the mere presence of some info,
58/// for example 'force', means a decision has been made. So, we need to be
59/// careful NOT to add them if the user hasn't specifically asked so.
61 enum HintKind {
62 HK_WIDTH,
63 HK_INTERLEAVE,
64 HK_FORCE,
65 HK_ISVECTORIZED,
66 HK_PREDICATE,
67 HK_SCALABLE
68 };
69
70 /// Hint - associates name and validation with the hint value.
71 struct Hint {
72 const char *Name;
73 unsigned Value; // This may have to change for non-numeric values.
74 HintKind Kind;
75
76 Hint(const char *Name, unsigned Value, HintKind Kind)
77 : Name(Name), Value(Value), Kind(Kind) {}
78
79 bool validate(unsigned Val);
80 };
81
82 /// Vectorization width.
83 Hint Width;
84
85 /// Vectorization interleave factor.
86 Hint Interleave;
87
88 /// Vectorization forced
89 Hint Force;
90
91 /// Already Vectorized
92 Hint IsVectorized;
93
94 /// Vector Predicate
95 Hint Predicate;
96
97 /// Says whether we should use fixed width or scalable vectorization.
98 Hint Scalable;
99
100 /// Return the loop metadata prefix.
101 static StringRef Prefix() { return "llvm.loop."; }
102
103 /// True if there is any unsafe math in the loop.
104 bool PotentiallyUnsafe = false;
105
106public:
108 FK_Undefined = -1, ///< Not selected.
109 FK_Disabled = 0, ///< Forcing disabled.
110 FK_Enabled = 1, ///< Forcing enabled.
111 };
112
114 /// Not selected.
116 /// Disables vectorization with scalable vectors.
118 /// Vectorize loops using scalable vectors or fixed-width vectors, but favor
119 /// scalable vectors when the cost-model is inconclusive. This is the
120 /// default when the scalable.enable hint is enabled through a pragma.
122 };
123
124 LoopVectorizeHints(const Loop *L, bool InterleaveOnlyWhenForced,
126 const TargetTransformInfo *TTI = nullptr);
127
128 /// Mark the loop L as already vectorized by setting the width to 1.
130
132 bool VectorizeOnlyWhenForced) const;
133
134 /// Dumps all the hint information.
135 void emitRemarkWithHints() const;
136
138 return ElementCount::get(Width.Value, (ScalableForceKind)Scalable.Value ==
140 }
141
142 unsigned getInterleave() const {
143 if (Interleave.Value)
144 return Interleave.Value;
145 // If interleaving is not explicitly set, assume that if we do not want
146 // unrolling, we also don't want any interleaving.
148 return 1;
149 return 0;
150 }
151 unsigned getIsVectorized() const { return IsVectorized.Value; }
152 unsigned getPredicate() const { return Predicate.Value; }
153 enum ForceKind getForce() const {
154 if ((ForceKind)Force.Value == FK_Undefined &&
156 return FK_Disabled;
157 return (ForceKind)Force.Value;
158 }
159
160 /// \return true if scalable vectorization has been explicitly disabled.
162 return (ScalableForceKind)Scalable.Value == SK_FixedWidthOnly;
163 }
164
165 /// If hints are provided that force vectorization, use the AlwaysPrint
166 /// pass name to force the frontend to print the diagnostic.
167 const char *vectorizeAnalysisPassName() const;
168
169 /// When enabling loop hints are provided we allow the vectorizer to change
170 /// the order of operations that is given by the scalar loop. This is not
171 /// enabled by default because can be unsafe or inefficient. For example,
172 /// reordering floating-point operations will change the way round-off
173 /// error accumulates in the loop.
174 bool allowReordering() const;
175
176 bool isPotentiallyUnsafe() const {
177 // Avoid FP vectorization if the target is unsure about proper support.
178 // This may be related to the SIMD unit in the target not handling
179 // IEEE 754 FP ops properly, or bad single-to-double promotions.
180 // Otherwise, a sequence of vectorized loops, even without reduction,
181 // could lead to different end results on the destination vectors.
182 return getForce() != LoopVectorizeHints::FK_Enabled && PotentiallyUnsafe;
183 }
184
185 void setPotentiallyUnsafe() { PotentiallyUnsafe = true; }
186
187private:
188 /// Find hints specified in the loop metadata and update local values.
189 void getHintsFromMetadata();
190
191 /// Checks string hint with one operand and set value if valid.
192 void setHint(StringRef Name, Metadata *Arg);
193
194 /// The loop these hints belong to.
195 const Loop *TheLoop;
196
197 /// Interface to emit optimization remarks.
199};
200
201/// This holds vectorization requirements that must be verified late in
202/// the process. The requirements are set by legalize and costmodel. Once
203/// vectorization has been determined to be possible and profitable the
204/// requirements can be verified by looking for metadata or compiler options.
205/// For example, some loops require FP commutativity which is only allowed if
206/// vectorization is explicitly specified or if the fast-math compiler option
207/// has been provided.
208/// Late evaluation of these requirements allows helpful diagnostics to be
209/// composed that tells the user what need to be done to vectorize the loop. For
210/// example, by specifying #pragma clang loop vectorize or -ffast-math. Late
211/// evaluation should be used only when diagnostics can generated that can be
212/// followed by a non-expert user.
214public:
215 /// Track the 1st floating-point instruction that can not be reassociated.
217 if (I && !ExactFPMathInst)
218 ExactFPMathInst = I;
219 }
220
221 Instruction *getExactFPInst() { return ExactFPMathInst; }
222
223private:
224 Instruction *ExactFPMathInst = nullptr;
225};
226
227/// This holds details about a histogram operation -- a load -> update -> store
228/// sequence where each lane in a vector might be updating the same element as
229/// another lane.
234
236 : Load(Load), Update(Update), Store(Store) {}
237};
238
239/// LoopVectorizationLegality checks if it is legal to vectorize a loop, and
240/// to what vectorization factor.
241/// This class does not look at the profitability of vectorization, only the
242/// legality. This class has two main kinds of checks:
243/// * Memory checks - The code in canVectorizeMemory checks if vectorization
244/// will change the order of memory accesses in a way that will change the
245/// correctness of the program.
246/// * Scalars checks - The code in canVectorizeInstrs and canVectorizeMemory
247/// checks for a number of different conditions, such as the availability of a
248/// single induction variable, that all types are supported and vectorize-able,
249/// etc. This code reflects the capabilities of InnerLoopVectorizer.
250/// This class is also used by InnerLoopVectorizer for identifying
251/// induction variable and the different reduction variables.
253public:
260 : TheLoop(L), LI(LI), PSE(PSE), TTI(TTI), TLI(TLI), DT(DT), LAIs(LAIs),
261 ORE(ORE), Requirements(R), Hints(H), DB(DB), AC(AC), BFI(BFI),
262 PSI(PSI) {}
263
264 /// ReductionList contains the reduction descriptors for all
265 /// of the reductions that were found in the loop.
267
268 /// InductionList saves induction variables and maps them to the
269 /// induction descriptor.
271
272 /// RecurrenceSet contains the phi nodes that are recurrences other than
273 /// inductions and reductions.
275
276 /// Returns true if it is legal to vectorize this loop.
277 /// This does not mean that it is profitable to vectorize this
278 /// loop, only that it is legal to do so.
279 /// Temporarily taking UseVPlanNativePath parameter. If true, take
280 /// the new code path being implemented for outer loop vectorization
281 /// (should be functional for inner loop vectorization) based on VPlan.
282 /// If false, good old LV code.
283 bool canVectorize(bool UseVPlanNativePath);
284
285 /// Returns true if it is legal to vectorize the FP math operations in this
286 /// loop. Vectorizing is legal if we allow reordering of FP operations, or if
287 /// we can use in-order reductions.
288 bool canVectorizeFPMath(bool EnableStrictReductions);
289
290 /// Return true if we can vectorize this loop while folding its tail by
291 /// masking.
292 bool canFoldTailByMasking() const;
293
294 /// Mark all respective loads/stores for masking. Must only be called when
295 /// tail-folding is possible.
297
298 /// Returns the primary induction variable.
299 PHINode *getPrimaryInduction() { return PrimaryInduction; }
300
301 /// Returns the reduction variables found in the loop.
302 const ReductionList &getReductionVars() const { return Reductions; }
303
304 /// Returns the induction variables found in the loop.
305 const InductionList &getInductionVars() const { return Inductions; }
306
307 /// Return the fixed-order recurrences found in the loop.
308 RecurrenceSet &getFixedOrderRecurrences() { return FixedOrderRecurrences; }
309
310 /// Returns the widest induction type.
311 Type *getWidestInductionType() { return WidestIndTy; }
312
313 /// Returns True if given store is a final invariant store of one of the
314 /// reductions found in the loop.
316
317 /// Returns True if given address is invariant and is used to store recurrent
318 /// expression
320
321 /// Returns True if V is a Phi node of an induction variable in this loop.
322 bool isInductionPhi(const Value *V) const;
323
324 /// Returns a pointer to the induction descriptor, if \p Phi is an integer or
325 /// floating point induction.
327
328 /// Returns a pointer to the induction descriptor, if \p Phi is pointer
329 /// induction.
331
332 /// Returns True if V is a cast that is part of an induction def-use chain,
333 /// and had been proven to be redundant under a runtime guard (in other
334 /// words, the cast has the same SCEV expression as the induction phi).
335 bool isCastedInductionVariable(const Value *V) const;
336
337 /// Returns True if V can be considered as an induction variable in this
338 /// loop. V can be the induction phi, or some redundant cast in the def-use
339 /// chain of the inducion phi.
340 bool isInductionVariable(const Value *V) const;
341
342 /// Returns True if PN is a reduction variable in this loop.
343 bool isReductionVariable(PHINode *PN) const { return Reductions.count(PN); }
344
345 /// Returns True if Phi is a fixed-order recurrence in this loop.
346 bool isFixedOrderRecurrence(const PHINode *Phi) const;
347
348 /// Return true if the block BB needs to be predicated in order for the loop
349 /// to be vectorized.
350 bool blockNeedsPredication(BasicBlock *BB) const;
351
352 /// Check if this pointer is consecutive when vectorizing. This happens
353 /// when the last index of the GEP is the induction variable, or that the
354 /// pointer itself is an induction variable.
355 /// This check allows us to vectorize A[idx] into a wide load/store.
356 /// Returns:
357 /// 0 - Stride is unknown or non-consecutive.
358 /// 1 - Address is consecutive.
359 /// -1 - Address is consecutive, and decreasing.
360 /// NOTE: This method must only be used before modifying the original scalar
361 /// loop. Do not use after invoking 'createVectorizedLoopSkeleton' (PR34965).
362 int isConsecutivePtr(Type *AccessTy, Value *Ptr) const;
363
364 /// Returns true if \p V is invariant across all loop iterations according to
365 /// SCEV.
366 bool isInvariant(Value *V) const;
367
368 /// Returns true if value V is uniform across \p VF lanes, when \p VF is
369 /// provided, and otherwise if \p V is invariant across all loop iterations.
370 bool isUniform(Value *V, ElementCount VF) const;
371
372 /// A uniform memory op is a load or store which accesses the same memory
373 /// location on all \p VF lanes, if \p VF is provided and otherwise if the
374 /// memory location is invariant.
375 bool isUniformMemOp(Instruction &I, ElementCount VF) const;
376
377 /// Returns the information that we collected about runtime memory check.
379 return LAI->getRuntimePointerChecking();
380 }
381
382 const LoopAccessInfo *getLAI() const { return LAI; }
383
386 }
387
390 }
391
392 /// Returns true if the loop has an uncountable early exit, i.e. an
393 /// uncountable exit that isn't the latch block.
394 bool hasUncountableEarlyExit() const { return HasUncountableEarlyExit; }
395
396 /// Returns the uncountable early exiting block.
398 if (!HasUncountableEarlyExit) {
400 "Expected no uncountable exiting blocks");
401 return nullptr;
402 }
404 "Expected only a single uncountable exiting block");
405 return getUncountableExitingBlocks()[0];
406 }
407
408 /// Returns the destination of an uncountable early exiting block.
411 "Expected only a single uncountable exit block");
412 return getUncountableExitBlocks()[0];
413 }
414
415 /// Returns true if vector representation of the instruction \p I
416 /// requires mask.
417 bool isMaskRequired(const Instruction *I) const {
418 return MaskedOp.contains(I);
419 }
420
421 /// Returns true if there is at least one function call in the loop which
422 /// has a vectorized variant available.
423 bool hasVectorCallVariants() const { return VecCallVariantsFound; }
424
425 /// Returns true if there is at least one function call in the loop which
426 /// returns a struct type and needs to be vectorized.
427 bool hasStructVectorCall() const { return StructVecCallFound; }
428
429 unsigned getNumStores() const { return LAI->getNumStores(); }
430 unsigned getNumLoads() const { return LAI->getNumLoads(); }
431
432 /// Returns a HistogramInfo* for the given instruction if it was determined
433 /// to be part of a load -> update -> store sequence where multiple lanes
434 /// may be working on the same memory address.
435 std::optional<const HistogramInfo *> getHistogramInfo(Instruction *I) const {
436 for (const HistogramInfo &HGram : Histograms)
437 if (HGram.Load == I || HGram.Update == I || HGram.Store == I)
438 return &HGram;
439
440 return std::nullopt;
441 }
442
443 /// Returns a list of all known histogram operations in the loop.
444 bool hasHistograms() const { return !Histograms.empty(); }
445
447 return &PSE;
448 }
449
450 Loop *getLoop() const { return TheLoop; }
451
452 LoopInfo *getLoopInfo() const { return LI; }
453
454 AssumptionCache *getAssumptionCache() const { return AC; }
455
456 ScalarEvolution *getScalarEvolution() const { return PSE.getSE(); }
457
458 DominatorTree *getDominatorTree() const { return DT; }
459
460 /// Returns all exiting blocks with a countable exit, i.e. the
461 /// exit-not-taken count is known exactly at compile time.
463 return CountableExitingBlocks;
464 }
465
466 /// Returns all the exiting blocks with an uncountable exit.
468 return UncountableExitingBlocks;
469 }
470
471 /// Returns all the exit blocks from uncountable exiting blocks.
473 return UncountableExitBlocks;
474 }
475
476private:
477 /// Return true if the pre-header, exiting and latch blocks of \p Lp and all
478 /// its nested loops are considered legal for vectorization. These legal
479 /// checks are common for inner and outer loop vectorization.
480 /// Temporarily taking UseVPlanNativePath parameter. If true, take
481 /// the new code path being implemented for outer loop vectorization
482 /// (should be functional for inner loop vectorization) based on VPlan.
483 /// If false, good old LV code.
484 bool canVectorizeLoopNestCFG(Loop *Lp, bool UseVPlanNativePath);
485
486 /// Set up outer loop inductions by checking Phis in outer loop header for
487 /// supported inductions (int inductions). Return false if any of these Phis
488 /// is not a supported induction or if we fail to find an induction.
489 bool setupOuterLoopInductions();
490
491 /// Return true if the pre-header, exiting and latch blocks of \p Lp
492 /// (non-recursive) are considered legal for vectorization.
493 /// Temporarily taking UseVPlanNativePath parameter. If true, take
494 /// the new code path being implemented for outer loop vectorization
495 /// (should be functional for inner loop vectorization) based on VPlan.
496 /// If false, good old LV code.
497 bool canVectorizeLoopCFG(Loop *Lp, bool UseVPlanNativePath);
498
499 /// Check if a single basic block loop is vectorizable.
500 /// At this point we know that this is a loop with a constant trip count
501 /// and we only need to check individual instructions.
502 bool canVectorizeInstrs();
503
504 /// When we vectorize loops we may change the order in which
505 /// we read and write from memory. This method checks if it is
506 /// legal to vectorize the code, considering only memory constrains.
507 /// Returns true if the loop is vectorizable
508 bool canVectorizeMemory();
509
510 /// If LAA cannot determine whether all dependences are safe, we may be able
511 /// to further analyse some IndirectUnsafe dependences and if they match a
512 /// certain pattern (like a histogram) then we may still be able to vectorize.
513 bool canVectorizeIndirectUnsafeDependences();
514
515 /// Return true if we can vectorize this loop using the IF-conversion
516 /// transformation.
517 bool canVectorizeWithIfConvert();
518
519 /// Return true if we can vectorize this outer loop. The method performs
520 /// specific checks for outer loop vectorization.
521 bool canVectorizeOuterLoop();
522
523 /// Returns true if this is an early exit loop that can be vectorized.
524 /// Currently, a loop with an uncountable early exit is considered
525 /// vectorizable if:
526 /// 1. There are no writes to memory in the loop.
527 /// 2. The loop has only one early uncountable exit
528 /// 3. The early exit block dominates the latch block.
529 /// 4. The latch block has an exact exit count.
530 /// 5. The loop does not contain reductions or recurrences.
531 /// 6. We can prove at compile-time that loops will not contain faulting
532 /// loads.
533 /// 7. It is safe to speculatively execute instructions such as divide or
534 /// call instructions.
535 /// The list above is not based on theoretical limitations of vectorization,
536 /// but simply a statement that more work is needed to support these
537 /// additional cases safely.
538 bool isVectorizableEarlyExitLoop();
539
540 /// Return true if all of the instructions in the block can be speculatively
541 /// executed, and record the loads/stores that require masking.
542 /// \p SafePtrs is a list of addresses that are known to be legal and we know
543 /// that we can read from them without segfault.
544 /// \p MaskedOp is a list of instructions that have to be transformed into
545 /// calls to the appropriate masked intrinsic when the loop is vectorized
546 /// or dropped if the instruction is a conditional assume intrinsic.
547 bool
548 blockCanBePredicated(BasicBlock *BB, SmallPtrSetImpl<Value *> &SafePtrs,
550
551 /// Updates the vectorization state by adding \p Phi to the inductions list.
552 /// This can set \p Phi as the main induction of the loop if \p Phi is a
553 /// better choice for the main induction than the existing one.
554 void addInductionPhi(PHINode *Phi, const InductionDescriptor &ID,
555 SmallPtrSetImpl<Value *> &AllowedExit);
556
557 /// The loop that we evaluate.
558 Loop *TheLoop;
559
560 /// Loop Info analysis.
561 LoopInfo *LI;
562
563 /// A wrapper around ScalarEvolution used to add runtime SCEV checks.
564 /// Applies dynamic knowledge to simplify SCEV expressions in the context
565 /// of existing SCEV assumptions. The analysis will also add a minimal set
566 /// of new predicates if this is required to enable vectorization and
567 /// unrolling.
569
570 /// Target Transform Info.
572
573 /// Target Library Info.
575
576 /// Dominator Tree.
577 DominatorTree *DT;
578
579 // LoopAccess analysis.
581
582 const LoopAccessInfo *LAI = nullptr;
583
584 /// Interface to emit optimization remarks.
586
587 // --- vectorization state --- //
588
589 /// Holds the primary induction variable. This is the counter of the
590 /// loop.
591 PHINode *PrimaryInduction = nullptr;
592
593 /// Holds the reduction variables.
594 ReductionList Reductions;
595
596 /// Holds all of the induction variables that we found in the loop.
597 /// Notice that inductions don't need to start at zero and that induction
598 /// variables can be pointers.
599 InductionList Inductions;
600
601 /// Holds all the casts that participate in the update chain of the induction
602 /// variables, and that have been proven to be redundant (possibly under a
603 /// runtime guard). These casts can be ignored when creating the vectorized
604 /// loop body.
605 SmallPtrSet<Instruction *, 4> InductionCastsToIgnore;
606
607 /// Holds the phi nodes that are fixed-order recurrences.
608 RecurrenceSet FixedOrderRecurrences;
609
610 /// Holds the widest induction type encountered.
611 Type *WidestIndTy = nullptr;
612
613 /// Allowed outside users. This holds the variables that can be accessed from
614 /// outside the loop.
615 SmallPtrSet<Value *, 4> AllowedExit;
616
617 /// Vectorization requirements that will go through late-evaluation.
618 LoopVectorizationRequirements *Requirements;
619
620 /// Used to emit an analysis of any legality issues.
621 LoopVectorizeHints *Hints;
622
623 /// The demanded bits analysis is used to compute the minimum type size in
624 /// which a reduction can be computed.
625 DemandedBits *DB;
626
627 /// The assumption cache analysis is used to compute the minimum type size in
628 /// which a reduction can be computed.
629 AssumptionCache *AC;
630
631 /// While vectorizing these instructions we have to generate a
632 /// call to the appropriate masked intrinsic or drop them in case of
633 /// conditional assumes.
635
636 /// Contains all identified histogram operations, which are sequences of
637 /// load -> update -> store instructions where multiple lanes in a vector
638 /// may work on the same memory location.
640
641 /// BFI and PSI are used to check for profile guided size optimizations.
644
645 /// If we discover function calls within the loop which have a valid
646 /// vectorized variant, record that fact so that LoopVectorize can
647 /// (potentially) make a better decision on the maximum VF and enable
648 /// the use of those function variants.
649 bool VecCallVariantsFound = false;
650
651 /// If we find a call (to be vectorized) that returns a struct type, record
652 /// that so we can bail out until this is supported.
653 /// TODO: Remove this flag once vectorizing calls with struct returns is
654 /// supported.
655 bool StructVecCallFound = false;
656
657 /// Indicates whether this loop has an uncountable early exit, i.e. an
658 /// uncountable exiting block that is not the latch.
659 bool HasUncountableEarlyExit = false;
660
661 /// Keep track of all the countable and uncountable exiting blocks if
662 /// the exact backedge taken count is not computable.
663 SmallVector<BasicBlock *, 4> CountableExitingBlocks;
664 SmallVector<BasicBlock *, 4> UncountableExitingBlocks;
665
666 /// Keep track of the destinations of all uncountable exits if the
667 /// exact backedge taken count is not computable.
668 SmallVector<BasicBlock *, 4> UncountableExitBlocks;
669};
670
671} // namespace llvm
672
673#endif // LLVM_TRANSFORMS_VECTORIZE_LOOPVECTORIZATIONLEGALITY_H
RelocType Type
Definition: COFFYAML.cpp:410
dxil translate DXIL Translate Metadata
std::string Name
#define F(x, y, z)
Definition: MD5.cpp:55
#define I(x, y, z)
Definition: MD5.cpp:58
#define H(x, y, z)
Definition: MD5.cpp:57
This file implements a map that provides insertion order iteration.
assert(ImpDefSCC.getReg()==AMDGPU::SCC &&ImpDefSCC.isDef())
A cache of @llvm.assume calls within a function.
LLVM Basic Block Representation.
Definition: BasicBlock.h:61
BlockFrequencyInfo pass uses BlockFrequencyInfoImpl implementation to estimate IR basic block frequen...
Concrete subclass of DominatorTreeBase that is used to compute a normal dominator tree.
Definition: Dominators.h:162
static constexpr ElementCount get(ScalarTy MinVal, bool Scalable)
Definition: TypeSize.h:317
A struct for saving information about induction variables.
An instruction for reading from memory.
Definition: Instructions.h:176
Drive the analysis of memory accesses in the loop.
const MemoryDepChecker & getDepChecker() const
the Memory Dependence Checker which can determine the loop-independent and loop-carried dependences b...
const RuntimePointerChecking * getRuntimePointerChecking() const
unsigned getNumLoads() const
unsigned getNumStores() const
LoopVectorizationLegality checks if it is legal to vectorize a loop, and to what vectorization factor...
MapVector< PHINode *, InductionDescriptor > InductionList
InductionList saves induction variables and maps them to the induction descriptor.
SmallVector< BasicBlock *, 4 > getUncountableExitBlocks() const
Returns all the exit blocks from uncountable exiting blocks.
const SmallVector< BasicBlock *, 4 > & getUncountableExitingBlocks() const
Returns all the exiting blocks with an uncountable exit.
bool isInvariantStoreOfReduction(StoreInst *SI)
Returns True if given store is a final invariant store of one of the reductions found in the loop.
bool hasVectorCallVariants() const
Returns true if there is at least one function call in the loop which has a vectorized variant availa...
RecurrenceSet & getFixedOrderRecurrences()
Return the fixed-order recurrences found in the loop.
bool isInvariantAddressOfReduction(Value *V)
Returns True if given address is invariant and is used to store recurrent expression.
bool blockNeedsPredication(BasicBlock *BB) const
Return true if the block BB needs to be predicated in order for the loop to be vectorized.
bool canVectorize(bool UseVPlanNativePath)
Returns true if it is legal to vectorize this loop.
PredicatedScalarEvolution * getPredicatedScalarEvolution() const
int isConsecutivePtr(Type *AccessTy, Value *Ptr) const
Check if this pointer is consecutive when vectorizing.
AssumptionCache * getAssumptionCache() const
std::optional< const HistogramInfo * > getHistogramInfo(Instruction *I) const
Returns a HistogramInfo* for the given instruction if it was determined to be part of a load -> updat...
SmallPtrSet< const PHINode *, 8 > RecurrenceSet
RecurrenceSet contains the phi nodes that are recurrences other than inductions and reductions.
bool canVectorizeFPMath(bool EnableStrictReductions)
Returns true if it is legal to vectorize the FP math operations in this loop.
LoopVectorizationLegality(Loop *L, PredicatedScalarEvolution &PSE, DominatorTree *DT, TargetTransformInfo *TTI, TargetLibraryInfo *TLI, Function *F, LoopAccessInfoManager &LAIs, LoopInfo *LI, OptimizationRemarkEmitter *ORE, LoopVectorizationRequirements *R, LoopVectorizeHints *H, DemandedBits *DB, AssumptionCache *AC, BlockFrequencyInfo *BFI, ProfileSummaryInfo *PSI)
bool isReductionVariable(PHINode *PN) const
Returns True if PN is a reduction variable in this loop.
bool isFixedOrderRecurrence(const PHINode *Phi) const
Returns True if Phi is a fixed-order recurrence in this loop.
BasicBlock * getUncountableEarlyExitBlock() const
Returns the destination of an uncountable early exiting block.
const InductionDescriptor * getPointerInductionDescriptor(PHINode *Phi) const
Returns a pointer to the induction descriptor, if Phi is pointer induction.
const InductionDescriptor * getIntOrFpInductionDescriptor(PHINode *Phi) const
Returns a pointer to the induction descriptor, if Phi is an integer or floating point induction.
bool isInductionPhi(const Value *V) const
Returns True if V is a Phi node of an induction variable in this loop.
PHINode * getPrimaryInduction()
Returns the primary induction variable.
const SmallVector< BasicBlock *, 4 > & getCountableExitingBlocks() const
Returns all exiting blocks with a countable exit, i.e.
bool isUniform(Value *V, ElementCount VF) const
Returns true if value V is uniform across VF lanes, when VF is provided, and otherwise if V is invari...
const InductionList & getInductionVars() const
Returns the induction variables found in the loop.
bool hasStructVectorCall() const
Returns true if there is at least one function call in the loop which returns a struct type and needs...
bool isInvariant(Value *V) const
Returns true if V is invariant across all loop iterations according to SCEV.
const ReductionList & getReductionVars() const
Returns the reduction variables found in the loop.
bool canFoldTailByMasking() const
Return true if we can vectorize this loop while folding its tail by masking.
void prepareToFoldTailByMasking()
Mark all respective loads/stores for masking.
Type * getWidestInductionType()
Returns the widest induction type.
bool hasUncountableEarlyExit() const
Returns true if the loop has an uncountable early exit, i.e.
bool hasHistograms() const
Returns a list of all known histogram operations in the loop.
const LoopAccessInfo * getLAI() const
MapVector< PHINode *, RecurrenceDescriptor > ReductionList
ReductionList contains the reduction descriptors for all of the reductions that were found in the loo...
ScalarEvolution * getScalarEvolution() const
bool isUniformMemOp(Instruction &I, ElementCount VF) const
A uniform memory op is a load or store which accesses the same memory location on all VF lanes,...
BasicBlock * getUncountableEarlyExitingBlock() const
Returns the uncountable early exiting block.
bool isMaskRequired(const Instruction *I) const
Returns true if vector representation of the instruction I requires mask.
const RuntimePointerChecking * getRuntimePointerChecking() const
Returns the information that we collected about runtime memory check.
bool isInductionVariable(const Value *V) const
Returns True if V can be considered as an induction variable in this loop.
bool isCastedInductionVariable(const Value *V) const
Returns True if V is a cast that is part of an induction def-use chain, and had been proven to be red...
This holds vectorization requirements that must be verified late in the process.
void addExactFPMathInst(Instruction *I)
Track the 1st floating-point instruction that can not be reassociated.
Utility class for getting and setting loop vectorizer hints in the form of loop metadata.
@ SK_PreferScalable
Vectorize loops using scalable vectors or fixed-width vectors, but favor scalable vectors when the co...
@ SK_FixedWidthOnly
Disables vectorization with scalable vectors.
bool allowVectorization(Function *F, Loop *L, bool VectorizeOnlyWhenForced) const
bool allowReordering() const
When enabling loop hints are provided we allow the vectorizer to change the order of operations that ...
void emitRemarkWithHints() const
Dumps all the hint information.
void setAlreadyVectorized()
Mark the loop L as already vectorized by setting the width to 1.
const char * vectorizeAnalysisPassName() const
If hints are provided that force vectorization, use the AlwaysPrint pass name to force the frontend t...
Represents a single loop in the control flow graph.
Definition: LoopInfo.h:39
size_type count(const KeyT &Key) const
Definition: MapVector.h:165
bool isSafeForAnyVectorWidth() const
Return true if the number of elements that are safe to operate on simultaneously is not bounded.
uint64_t getMaxSafeVectorWidthInBits() const
Return the number of elements that are safe to operate on simultaneously, multiplied by the size of t...
Root of the metadata hierarchy.
Definition: Metadata.h:62
The optimization diagnostic interface.
An interface layer with SCEV used to manage how we see SCEV expressions for values in the context of ...
ScalarEvolution * getSE() const
Returns the ScalarEvolution analysis used.
Analysis providing profile information.
Holds information about the memory runtime legality checks to verify that a group of pointers do not ...
The main scalar evolution driver.
A templated base class for SmallPtrSet which provides the typesafe interface that is common across al...
Definition: SmallPtrSet.h:363
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small.
Definition: SmallVector.h:1196
An instruction for storing to memory.
Definition: Instructions.h:292
StringRef - Represent a constant reference to a string, i.e.
Definition: StringRef.h:51
Provides information about what library functions are available for the current target.
This pass provides access to the codegen interfaces that are needed for IR-level transformations.
The instances of the Type class are immutable: once they are created, they are never changed.
Definition: Type.h:45
LLVM Value Representation.
Definition: Value.h:74
@ BasicBlock
Various leaf nodes.
Definition: ISDOpcodes.h:71
This is an optimization pass for GlobalISel generic memory operations.
Definition: AddressRanges.h:18
auto size(R &&Range, std::enable_if_t< std::is_base_of< std::random_access_iterator_tag, typename std::iterator_traits< decltype(Range.begin())>::iterator_category >::value, void > *=nullptr)
Get the size of a range.
Definition: STLExtras.h:1697
bool hasDisableAllTransformsHint(const Loop *L)
Look for the loop attribute that disables all transformation heuristic.
Definition: LoopUtils.cpp:344
TransformationMode hasUnrollTransformation(const Loop *L)
Definition: LoopUtils.cpp:352
@ TM_Disable
The transformation should not be applied.
Definition: LoopUtils.h:286
This holds details about a histogram operation – a load -> update -> store sequence where each lane i...
HistogramInfo(LoadInst *Load, Instruction *Update, StoreInst *Store)