25#define DEBUG_TYPE "loop-vectorize"
49 bool verifyLastActiveLaneRecipe(
const VPInstruction &LastActiveLane)
const;
72 : VPDT(VPDT), TypeInfo(TypeInfo), VerifyLate(VerifyLate) {}
78bool VPlanVerifier::verifyPhiRecipes(
const VPBasicBlock *VPBB) {
79 auto RecipeI = VPBB->
begin();
80 auto End = VPBB->
end();
81 unsigned NumActiveLaneMaskPhiRecipes = 0;
83 while (RecipeI != End && RecipeI->isPhi()) {
85 NumActiveLaneMaskPhiRecipes++;
89 errs() <<
"Found non-header PHI recipe in header VPBB";
90#if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP)
98 errs() <<
"Found header PHI recipe in non-header VPBB";
99#if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP)
110 errs() <<
"Phi-like recipe with different number of operands and "
121 if (!VerifyLate && NumActiveLaneMaskPhiRecipes > 1) {
122 errs() <<
"There should be no more than one VPActiveLaneMaskPHIRecipe";
126 while (RecipeI != End) {
128 errs() <<
"Found phi-like recipe after non-phi recipe";
130#if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP)
134 std::prev(RecipeI)->dump();
143bool VPlanVerifier::verifyEVLRecipe(
const VPInstruction &EVL)
const {
145 errs() <<
"verifyEVLRecipe should only be called on "
146 "VPInstruction::ExplicitVectorLength\n";
149 auto VerifyEVLUse = [&](
const VPRecipeBase &
R,
150 const unsigned ExpectedIdx) ->
bool {
152 unsigned UseCount =
count(
Ops, &EVL);
153 if (UseCount != 1 ||
Ops[ExpectedIdx] != &EVL) {
154 errs() <<
"EVL is used as non-last operand in EVL-based recipe\n";
159 return all_of(EVL.
users(), [
this, &VerifyEVLUse](VPUser *U) {
160 return TypeSwitch<const VPUser *, bool>(U)
161 .Case<VPWidenIntrinsicRecipe>([&](const VPWidenIntrinsicRecipe *S) {
162 return VerifyEVLUse(*S, S->getNumOperands() - 1);
164 .Case<VPWidenStoreEVLRecipe, VPReductionEVLRecipe,
165 VPWidenIntOrFpInductionRecipe, VPWidenPointerInductionRecipe>(
166 [&](
const VPRecipeBase *S) {
return VerifyEVLUse(*S, 2); })
167 .Case<VPScalarIVStepsRecipe>([&](
auto *R) {
168 if (
R->getNumOperands() != 3) {
169 errs() <<
"Unrolling with EVL tail folding not yet supported\n";
172 return VerifyEVLUse(*R, 2);
174 .Case<VPWidenLoadEVLRecipe, VPVectorEndPointerRecipe,
175 VPInterleaveEVLRecipe>(
176 [&](
const VPRecipeBase *R) {
return VerifyEVLUse(*R, 1); })
177 .Case<VPInstructionWithType>(
178 [&](
const VPInstructionWithType *S) {
return VerifyEVLUse(*S, 0); })
179 .Case<VPInstruction>([&](
const VPInstruction *
I) {
180 if (
I->getOpcode() == Instruction::PHI ||
181 I->getOpcode() == Instruction::ICmp ||
182 I->getOpcode() == Instruction::Sub)
183 return VerifyEVLUse(*
I, 1);
184 switch (
I->getOpcode()) {
185 case Instruction::Add:
187 case Instruction::UIToFP:
188 case Instruction::Trunc:
189 case Instruction::ZExt:
190 case Instruction::Mul:
191 case Instruction::Shl:
192 case Instruction::FMul:
198 errs() <<
"EVL used by unexpected VPInstruction\n";
203 errs() <<
"EVL used by unexpected VPInstruction\n";
207 errs() <<
"Result of VPInstruction::Add with EVL operand is "
208 "not used by VPEVLBasedIVPHIRecipe\n";
213 .
Default([&](
const VPUser *U) {
214 errs() <<
"EVL has unexpected user\n";
220bool VPlanVerifier::verifyLastActiveLaneRecipe(
221 const VPInstruction &LastActiveLane)
const {
223 "must be called with VPInstruction::LastActiveLane");
226 errs() <<
"LastActiveLane must have at least one operand\n";
234 for (VPValue *
Op : LastActiveLane.
operands()) {
239 auto BroadcastOrEVL =
245 errs() <<
"LastActiveLane operand ";
246#if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP)
247 VPSlotTracker Tracker(&Plan);
248 Op->printAsOperand(
errs(), Tracker);
250 errs() <<
" must be prefix mask (a header mask or an "
251 "EVL-derived mask currently)\n";
258bool VPlanVerifier::verifyVPBasicBlock(
const VPBasicBlock *VPBB) {
259 if (!verifyPhiRecipes(VPBB))
263 DenseMap<const VPRecipeBase *, unsigned> RecipeNumbering;
265 for (
const VPRecipeBase &R : *VPBB)
266 RecipeNumbering[&
R] = Cnt++;
268 for (
const VPRecipeBase &R : *VPBB) {
270 errs() <<
"VPIRInstructions ";
271#if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP)
275 errs() <<
"not in a VPIRBasicBlock!\n";
278 for (
const VPValue *V :
R.definedValues()) {
283 errs() <<
"Failed to infer scalar type!\n";
287 for (
const VPUser *U :
V->users()) {
290 UI->getNumOperands() != UI->getParent()->getNumPredecessors()) {
291 errs() <<
"Phi-like recipe with different number of operands and "
297 for (
const auto &[IncomingVPV, IncomingVPBB] :
298 Phi->incoming_values_and_blocks()) {
299 if (IncomingVPV != V)
305 errs() <<
"Incoming def does not dominate incoming block!\n";
306#if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP)
307 VPSlotTracker Tracker(VPBB->getPlan());
308 IncomingVPV->getDefiningRecipe()->print(
errs(),
" ", Tracker);
309 errs() <<
"\n does not dominate " << IncomingVPBB->getName()
311 UI->print(
errs(),
" ", Tracker);
323 if (UI->getParent() == VPBB) {
324 if (RecipeNumbering[UI] >= RecipeNumbering[&R])
327 if (VPDT.
dominates(VPBB, UI->getParent()))
331 errs() <<
"Use before def!\n";
332#if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP)
333 VPSlotTracker Tracker(VPBB->getPlan());
334 UI->print(
errs(),
" ", Tracker);
335 errs() <<
"\n before\n";
336 R.print(
errs(),
" ", Tracker);
343 switch (VPI->getOpcode()) {
345 if (!verifyEVLRecipe(*VPI)) {
346 errs() <<
"EVL VPValue is not used correctly\n";
351 if (!verifyLastActiveLaneRecipe(*VPI))
364 if (!WrappedIRBBs.
insert(IRBB->getIRBasicBlock()).second) {
365 errs() <<
"Same IR basic block used by multiple wrapper blocks!\n";
376 for (
const auto *
Block : VPBlockVec) {
383bool VPlanVerifier::verifyBlock(
const VPBlockBase *VPB) {
388 (VPBB->getParent() && VPBB->isExiting() &&
389 !VPBB->getParent()->isReplicator())) {
390 if (!VPBB->getTerminator()) {
391 errs() <<
"Block has multiple successors but doesn't "
392 "have a proper branch recipe!\n";
395 }
else if (VPBB->getTerminator()) {
396 errs() <<
"Unexpected branch recipe!\n";
406 errs() <<
"Multiple instances of the same successor.\n";
410 for (
const VPBlockBase *Succ : Successors) {
412 const auto &SuccPreds = Succ->getPredecessors();
414 errs() <<
"Missing predecessor link.\n";
425 errs() <<
"Multiple instances of the same predecessor.\n";
429 for (
const VPBlockBase *Pred : Predecessors) {
431 if (Pred->getParent() != VPB->
getParent()) {
432 errs() <<
"Predecessor is not in the same region.\n";
437 const auto &PredSuccs = Pred->getSuccessors();
439 errs() <<
"Missing successor link.\n";
443 return !VPBB || verifyVPBasicBlock(VPBB);
446bool VPlanVerifier::verifyBlocksInRegion(
const VPRegionBlock *Region) {
450 errs() <<
"VPBlockBase has wrong parent\n";
454 if (!verifyBlock(VPB))
460bool VPlanVerifier::verifyRegion(
const VPRegionBlock *Region) {
462 const VPBlockBase *Exiting =
Region->getExiting();
465 if (
Entry->hasPredecessors()) {
466 errs() <<
"region entry block has predecessors\n";
470 errs() <<
"region exiting block has successors\n";
474 return verifyBlocksInRegion(Region);
477bool VPlanVerifier::verifyRegionRec(
const VPRegionBlock *Region) {
479 return verifyRegion(Region) &&
481 [
this](
const VPBlockBase *VPB) {
482 const auto *SubRegion = dyn_cast<VPRegionBlock>(VPB);
483 return !SubRegion || verifyRegionRec(SubRegion);
487bool VPlanVerifier::verify(
const VPlan &Plan) {
489 [
this](
const VPBlockBase *VPB) { return !verifyBlock(VPB); }))
497 if (!verifyRegionRec(TopRegion))
501 errs() <<
"VPlan Top Region should have no parent.\n";
507 errs() <<
"VPlan entry block is not a VPBasicBlock\n";
512 errs() <<
"VPlan vector loop header does not start with a "
513 "VPCanonicalIVPHIRecipe\n";
519 errs() <<
"VPlan exiting block is not a VPBasicBlock\n";
523 if (Exiting->
empty()) {
524 errs() <<
"VPlan vector loop exiting block must end with BranchOnCount, "
525 "BranchOnCond, or BranchOnTwoConds VPInstruction but is empty\n";
533 errs() <<
"VPlan vector loop exit must end with BranchOnCount, "
534 "BranchOnCond, or BranchOnTwoConds VPInstruction\n";
544 VPlanVerifier
Verifier(VPDT, TypeInfo, VerifyLate);
545 return Verifier.verify(Plan);
assert(UImm &&(UImm !=~static_cast< T >(0)) &&"Invalid immediate!")
const AbstractManglingParser< Derived, Alloc >::OperatorInfo AbstractManglingParser< Derived, Alloc >::Ops[]
verify safepoint Safepoint IR Verifier
This file defines the SmallPtrSet class.
This file implements the TypeSwitch template, which mimics a switch() statement whose cases are type ...
This file implements dominator tree analysis for a single level of a VPlan's H-CFG.
This file contains the declarations of different VPlan-related auxiliary helpers.
static bool hasDuplicates(const SmallVectorImpl< VPBlockBase * > &VPBlockVec)
Utility function that checks whether VPBlockVec has duplicate VPBlockBases.
This file declares the class VPlanVerifier, which contains utility functions to check the consistency...
This file contains the declarations of the Vectorization Plan base classes:
bool dominates(const DomTreeNodeBase< NodeT > *A, const DomTreeNodeBase< NodeT > *B) const
dominates - Returns true iff A dominates B.
Implements a dense probed hash-table based set with some number of buckets stored inline.
std::pair< iterator, bool > insert(PtrType Ptr)
Inserts Ptr if and only if there is no element in the container equal to Ptr.
SmallPtrSet - This class implements a set which is optimized for holding SmallSize or fewer elements.
This class consists of common code factored out of the SmallVector class to reduce code duplication b...
VPBasicBlock serves as the leaf of the Hierarchical Control-Flow Graph.
iterator begin()
Recipe iterator methods.
VPBlockBase is the building block of the Hierarchical Control-Flow Graph.
VPRegionBlock * getParent()
size_t getNumSuccessors() const
size_t getNumPredecessors() const
const VPBlocksTy & getPredecessors() const
const VPBlocksTy & getSuccessors() const
static bool isHeader(const VPBlockBase *VPB, const VPDominatorTree &VPDT)
Returns true if VPB is a loop header, based on regions or VPDT in their absence.
Template specialization of the standard LLVM dominator tree utility for VPBlockBases.
This is a concrete Recipe that models a single VPlan-level instruction.
unsigned getOpcode() const
VPBasicBlock * getParent()
VPRegionBlock represents a collection of VPBasicBlocks and VPRegionBlocks which form a Single-Entry-S...
const VPBlockBase * getEntry() const
const VPBlockBase * getExiting() const
An analysis for type-inference for VPValues.
Type * inferScalarType(const VPValue *V)
Infer the type of V. Returns the scalar type of V.
unsigned getNumOperands() const
VPlan models a candidate for vectorization, encoding various decisions taken to produce efficient outp...
VPBasicBlock * getEntry()
LLVM_ABI_FOR_TEST VPRegionBlock * getVectorLoopRegion()
Returns the VPRegionBlock of the vector loop.
std::pair< iterator, bool > insert(const ValueT &V)
bool match(Val *V, const Pattern &P)
CmpClass_match< LHS, RHS, ICmpInst > m_ICmp(CmpPredicate &Pred, const LHS &L, const RHS &R)
match_combine_or< LTy, RTy > m_CombineOr(const LTy &L, const RTy &R)
Combine two pattern matchers matching L || R.
VPInstruction_match< VPInstruction::StepVector > m_StepVector()
VPInstruction_match< VPInstruction::BranchOnTwoConds > m_BranchOnTwoConds()
VPInstruction_match< VPInstruction::BranchOnCount > m_BranchOnCount()
VPInstruction_match< VPInstruction::Broadcast, Op0_t > m_Broadcast(const Op0_t &Op0)
class_match< VPValue > m_VPValue()
Match an arbitrary VPValue and ignore it.
VPInstruction_match< VPInstruction::ExplicitVectorLength, Op0_t > m_EVL(const Op0_t &Op0)
VPInstruction_match< VPInstruction::BranchOnCond > m_BranchOnCond()
NodeAddr< PhiNode * > Phi
bool isHeaderMask(const VPValue *V, const VPlan &Plan)
Return true if V is a header mask in Plan.
This is an optimization pass for GlobalISel generic memory operations.
bool all_of(R &&range, UnaryPredicate P)
Provide wrappers to std::all_of which take ranges instead of having to pass begin/end explicitly.
LLVM_ABI_FOR_TEST bool verifyVPlanIsValid(const VPlan &Plan, bool VerifyLate=false)
Verify invariants for general VPlans.
decltype(auto) dyn_cast(const From &Val)
dyn_cast<X> - Return the argument parameter cast to the specified type.
iterator_range< df_iterator< VPBlockShallowTraversalWrapper< VPBlockBase * > > > vp_depth_first_shallow(VPBlockBase *G)
Returns an iterator range to traverse the graph starting at G in depth-first order.
bool any_of(R &&range, UnaryPredicate P)
Provide wrappers to std::any_of which take ranges instead of having to pass begin/end explicitly.
class LLVM_GSL_OWNER SmallVector
Forward declaration of SmallVector so that calculateSmallVectorDefaultInlinedElements can reference s...
bool isa(const From &Val)
isa<X> - Return true if the parameter to the template is an instance of one of the template type argu...
LLVM_ABI raw_fd_ostream & errs()
This returns a reference to a raw_ostream for standard error.
auto count(R &&Range, const E &Element)
Wrapper function around std::count to count the number of times an element Element occurs in the give...
DWARFExpression::Operation Op
decltype(auto) cast(const From &Val)
cast<X> - Return the argument parameter cast to the specified type.
bool is_contained(R &&Range, const E &Element)
Returns true if Element is found in Range.