doxygen/SVEShuffleOpts_8cpp_source.html

//===------- SVEShuffleOpts - SVE Shuffle Optimization --------------------===//

//

// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.

// See https://llvm.org/LICENSE.txt for license information.

// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception

//

//===----------------------------------------------------------------------===//

//

// Tries to pattern match and combine scalable vector shuffles that could

// be more efficiently performed by tbl instructions.

//

// An example would be a loop with 4 multiply-accumulate reductions, where the

// new data in each vector iteration comes from a 4-way deinterleaving of

// smaller datatypes loaded from memory which are then zero extended.

//

// Something like the following:

//   %bgra = call ... @llvm.masked.load

//   %deinterleave = call ... @llvm.vector.deinterleave4(%bgra)

// If the load was of a <vscale x 8 x i16>, we now have 4 deinterleaved

// <vscale x 2 x i16> values.

//   %b.i16 = extractvalue %deinterleave, 0

//   %b.i64 = zext <vscale x 2 x i16> %b.i16 to <vscale x 2 x i64>

//   %acc.b.next = add <vscale x 2 x i64> %acc.b, %b.i64

//   <repeat for the other 3 subvectors>

//

// If the initial load is a legal vector rather than 4x the size (generating a

// structured ld4 instead), we would see multiple uunpkhi/lo instructions for

// the extensions, followed by uzp1/2 instructions for the deinterleave.

// Instead, we can replace all of those with 4 tbl instructions. The tradeoff,

// of course, is that we now have 4 mask values to maintain which may increase

// register pressure.

//

// This basic transform could be performed in CodeGenPrepare (as the equivalent

// for NEON is), or in a DAG Combine. However, we hope to extend it to detect

// other shuffles that we can fold into the tbl. Extending the above example,

// if instead of directly adding to the accumulator we multiplied it by a

// common term for all 4 components that had been reversed:

//   %common.load = call @llvm.masked.load

//   %common.reverse = call @llvm.vector.reverse

// These would be loaded at the extended size, <vscale x 2 x i64> in our

// example.

//   %b.mul = mul <vscale x 2 x i64> %b.i64, %common.reverse

//   %acc.b.next = add <vscale x 2 x i64> %acc.b, %b.mul

//   <repeat for the other 3 subvectors, using %common.reverse for each>

//

// In this case, the reverse isn't applied to the deinterleaved data in the

// original IR, but to the common term multiplied by the individual bgra

// elements. If the order of the elements in the accumulator is important, we

// cannot change that. If, however, we know that the accumulator is reduced to

// a single scalar after the loop and the data is either integers or floating

// point with reassociation allowed, we could instead choose a different mask

// for the tbls to reverse the individual bgra elements instead, removing an

// additional instruction from the loop. This does require looking beyond the

// blocks in the loop, so DAGCombine won't help.

//

// We should also be able to introduce new shuffles in order to balance out

// SVE's bottom/top instruction pairs, which act on even/odd lanes instead of

// the high or low half of a register.

//

// This pass may end up being a temporary solution that is removed if we can

// create a generic vector shuffle intrinsic and move this feature to

// LoopVectorize itself, as that would allow for better cost modelling.

//

//===----------------------------------------------------------------------===//


#include "AArch64.h"

#include "AArch64Subtarget.h"

#include "AArch64TargetMachine.h"

#include "llvm/Analysis/AssumptionCache.h"

#include "llvm/Analysis/LoopInfo.h"

#include "llvm/Analysis/LoopPass.h"

#include "llvm/Analysis/MemorySSA.h"

#include "llvm/Analysis/TargetTransformInfo.h"

#include "llvm/Analysis/ValueTracking.h"

#include "llvm/CodeGen/TargetLowering.h"

#include "llvm/CodeGen/TargetPassConfig.h"

#include "llvm/CodeGen/TargetSubtargetInfo.h"

#include "llvm/IR/Constants.h"

#include "llvm/IR/IRBuilder.h"

#include "llvm/IR/Instructions.h"

#include "llvm/IR/IntrinsicInst.h"

#include "llvm/IR/IntrinsicsAArch64.h"

#include "llvm/IR/LLVMContext.h"

#include "llvm/IR/PassManager.h"

#include "llvm/IR/PatternMatch.h"

#include "llvm/InitializePasses.h"

#include <array>


using namespace llvm;

using namespace llvm::PatternMatch;


#define DEBUG_TYPE "aarch64-sve-shuffle-opts"


/// A mapping between a vector_deinterleaveN intrinsic and extending cast

/// instructions used on the resulting subvectors.

using DeinterleaveMap = SmallDenseMap<CallInst *, std::array<CastInst *, 4>>;


/// Inspect a vector.deinterleave4 call and decide whether its results can be
/// produced by tbl shuffles instead.
///
/// A deinterleave qualifies when its operand is a legal scalable vector type
/// and every user is a single-use extractvalue feeding a zext or uitofp inside
/// \p L, with all casts sharing one opcode and one destination type whose
/// total size equals the size of the deinterleave operand. Each field may be
/// extracted at most once. Qualifying calls are recorded in \p Candidates
/// together with their casts, indexed by the extracted field; fields that are
/// never extracted stay null.
///
/// \param I          The vector.deinterleave4 intrinsic call to inspect.
/// \param Candidates Map that receives \p I and its casts on success.
/// \param L          Loop that all casts must belong to.
/// \param TL         Target lowering used to query type legality.
/// \param DL         Data layout used to map IR types to EVTs.
static void evaluateDeinterleave(IntrinsicInst *I, DeinterleaveMap &Candidates,
                                 Loop &L, const AArch64TargetLowering &TL,
                                 const DataLayout &DL) {
  assert(I->getIntrinsicID() == Intrinsic::vector_deinterleave4 &&
         "Only deinterleave4 supported currently");

  ConstantRange VScaleRange = getVScaleRange(I->getFunction(), 64);
  // TBL zeroes elements with an out-of-bounds index, but for the largest
  // possible SVE vector (2048b) the maximum value for i8 elements (255) is not
  // large enough to encode an 'out of bounds' value. So we can only perform
  // this optimization for i8 elements if we know vscale is < 16.
  EVT InputVT = TL.getValueType(DL, I->getOperand(0)->getType());
  if (!InputVT.isScalableVector() ||
      (InputVT.getScalarSizeInBits() < 16 &&
       (!VScaleRange.getUpper().ult(16) || VScaleRange.isUpperWrapped())) ||
      TL.getTypeConversion(I->getContext(), InputVT).first !=
          TargetLoweringBase::TypeLegal)
    return;

  std::array<CastInst *, 4> Extends = {};
  unsigned Opcode = 0;
  Type *DestTy = nullptr;
  for (User *U : I->users()) {
    auto *Extract = dyn_cast<ExtractValueInst>(U);
    if (!Extract || !Extract->hasOneUse())
      return;

    // We expect only a single cast instruction as a user for the extract.
    auto *Extend = dyn_cast_if_present<CastInst>(*Extract->users().begin());
    if (!Extend || (!isa<ZExtInst>(Extend) && !isa<UIToFPInst>(Extend)))
      return;

    // We're only interested if the uses are in the loop. This is almost
    // certainly the case.
    if (!L.contains(Extend))
      return;

    Opcode = Extend->getOpcode();
    DestTy = Extend->getDestTy();

    // Make sure DestTy matches the input size.
    if (DestTy->getPrimitiveSizeInBits() != InputVT.getSizeInBits())
      return;

    // Only one cast can be tracked per field. If the same field is extracted
    // more than once, the untracked cast would keep using an extractvalue
    // that gets erased during the rewrite, so give up on such deinterleaves.
    CastInst *&Slot = Extends[Extract->getIndices().front()];
    if (Slot)
      return;
    Slot = Extend;
  }

  // A deinterleave without any users leaves nothing to rewrite, and the
  // rewrite needs at least one cast to derive its types from.
  if (!DestTy)
    return;

  // Check that all extracted values are being extended the same way. Fields
  // that were never extracted are null and are allowed.
  if (!all_of(Extends, [DestTy, Opcode](CastInst *CI) {
        return !CI || (CI->getDestTy() == DestTy && CI->getOpcode() == Opcode);
      }))
    return;

  Candidates.try_emplace(I, Extends);
}


/// Given a map of deinterleaves to zext or uitofp casts, remove the operations
/// and replace them with tbl shuffles.
///
/// For every recorded cast a tbl on the deinterleave's operand is emitted
/// right before the cast, the cast's uses are redirected to the new value and
/// the cast is erased. Afterwards the extractvalues and the deinterleave are
/// erased, provided nothing else uses them any more.
///
/// \param Deinterleaves Map from a deinterleave call to the casts applied to
///                      its extracted fields, indexed by field. Entries may be
///                      null for fields that are not extracted.
static void optimizeSVEDeinterleavedExtends(DeinterleaveMap Deinterleaves) {
  for (auto &[Deinterleave, Extends] : Deinterleaves) {
    // Fields may be missing (including field 0), so take the types from
    // whichever cast is present rather than assuming Extends[0] exists.
    CastInst *FirstExtend = nullptr;
    for (CastInst *CI : Extends) {
      if (CI) {
        FirstExtend = CI;
        break;
      }
    }
    // Nothing was recorded for this deinterleave; leave the IR untouched.
    if (!FirstExtend)
      continue;

    VectorType *DestTy = cast<VectorType>(FirstExtend->getDestTy());
    VectorType *SrcTy = cast<VectorType>(FirstExtend->getSrcTy());
    unsigned DstBits = DestTy->getScalarSizeInBits();
    unsigned SrcBits = SrcTy->getScalarSizeInBits();
    bool IsUIToFP = isa<UIToFPInst>(FirstExtend);
    VectorType *StepVecTy = VectorType::getInteger(DestTy);
    Value *Input = Deinterleave->getOperand(0);
    Type *InputTy = Input->getType();

    APInt Invalid = APInt::getAllOnes(DstBits);
    for (auto [Idx, Extend] : enumerate(Extends)) {
      // If not all lanes were extracted, we can have gaps. Skip over them.
      if (!Extend)
        continue;
      // Build the mask using stepvectors and casting.
      // We want to select the Idx'th element, and every 4 elements after that.
      // Each element needs to be zero extended; we can do that by providing
      // tbl index values that are out of range. We can't do that nicely with
      // a stepvector of the same element type as the input type, but we can
      // do it with elements the size of the output type.
      // E.g. for element 0 of a 16b -> 64b zext, we would start with a mask of
      // 0xFFFF_FFFF_FFFF_0000 + Idx for the start of the stepvector, and use a
      // step of 4. We then cast that back to an element size of 16b, yielding
      // <0x0000 + Idx, 0xFFFF, 0xFFFF, 0xFFFF, 0x0004 + Idx, 0xFFFF...>.
      APInt StartIdx = Invalid << SrcBits;
      StartIdx += Idx;
      IRBuilder<> Builder(Extend);
      Value *StepVector = Builder.CreateStepVector(StepVecTy);
      Value *ScaledSteps =
          Builder.CreateNUWMul(StepVector, ConstantInt::get(StepVecTy, 4));
      Value *ZextTbl = Builder.CreateNUWAdd(
          ScaledSteps, ConstantInt::get(StepVecTy, StartIdx));
      Value *FinalMask = Builder.CreateBitCast(ZextTbl, InputTy);

      // Replace the deinterleave, extractvalue, and extension chain with
      // a tbl directly on the input value.
      Value *Tbl = Builder.CreateIntrinsic(Intrinsic::aarch64_sve_tbl,
                                           {InputTy}, {Input, FinalMask});
      Value *Widen = Builder.CreateBitCast(Tbl, StepVecTy);
      if (IsUIToFP)
        Widen = Builder.CreateUIToFP(Widen, DestTy);
      LLVM_DEBUG(dbgs() << "SVETBLOPT: Replaced " << *Extend << " with "
                        << *Widen << "\n");
      Extend->replaceAllUsesWith(Widen);
      Extend->eraseFromParent();
    }

    // Delete the now unused extracts and the deinterleave. Only erase
    // instructions that really are dead: an extract whose cast was not
    // recorded in the map still has a user and must be kept alive.
    for (User *U : make_early_inc_range(Deinterleave->users())) {
      auto *Extract = cast<Instruction>(U);
      if (Extract->use_empty())
        Extract->eraseFromParent();
    }
    if (Deinterleave->use_empty())
      Deinterleave->eraseFromParent();
  }
}


/// Scan the blocks of \p L for vector.deinterleave4 calls and rewrite the
/// qualifying ones into tbl shuffles.
///
/// \param L  Loop to process; only innermost loops are considered.
/// \param ST Subtarget, used to check SVE availability and to obtain the
///           target lowering.
/// \param DL Data layout of the target.
/// \returns true if at least one deinterleave was selected and handed to the
///          rewrite, false if the loop was left untouched.
static bool processLoop(Loop &L, const AArch64Subtarget &ST, DataLayout DL) {
  // At present, we only want to do this for innermost loops when SVE
  // is available.
  if (!L.isInnermost() || !ST.isSVEorStreamingSVEAvailable())
    return false;

  // The tbl index masks are built assuming little-endian lane order. Bail
  // out instead of asserting so that builds without assertions cannot emit
  // the little-endian masks for a big-endian target.
  if (!DL.isLittleEndian())
    return false;

  // TODO: Pull other shuffles into the tbl where possible.
  // TODO: Add more advanced cases, such as introducing shuffles so that
  //       the SVE odd/even BT narrowing instructions can be used.
  // TODO: Support other deinterleaves.
  const AArch64TargetLowering &TL = *ST.getTargetLowering();
  DeinterleaveMap Candidates;
  for (auto *BB : L.blocks())
    for (auto &I : *BB)
      if (match(&I, m_Intrinsic<Intrinsic::vector_deinterleave4>(m_Value())))
        evaluateDeinterleave(cast<IntrinsicInst>(&I), Candidates, L, TL, DL);

  if (Candidates.empty())
    return false;

  optimizeSVEDeinterleavedExtends(Candidates);
  return true;
}


namespace {

struct SVEShuffleOpts : public LoopPass {

  static char ID; // Pass identification, replacement for typeid

  SVEShuffleOpts() : LoopPass(ID) {}


  bool runOnLoop(Loop *L, LPPassManager &PM) override {

    if (skipLoop(L))

      return false;


    TargetPassConfig &TPC = getAnalysis<TargetPassConfig>();

    const AArch64TargetMachine &TM = TPC.getTM<AArch64TargetMachine>();

    const AArch64Subtarget &ST =

        *TM.getSubtargetImpl(*L->getHeader()->getParent());


    return processLoop(*L, ST, TM.createDataLayout());

  }


  void getAnalysisUsage(AnalysisUsage &AU) const override {

    AU.addRequired<TargetPassConfig>();

    AU.setPreservesCFG();

  }


  StringRef getPassName() const override { return "SVE Shuffle Optimizations"; }

};

} // end anonymous namespace


// Storage for the legacy pass ID declared in SVEShuffleOpts.
char SVEShuffleOpts::ID = 0;

// Human-readable pass name handed to the registration macros below; it is the
// same string that SVEShuffleOpts::getPassName() returns.
static const char *name = "SVE Shuffle Optimizations";

// Register the legacy pass under DEBUG_TYPE and declare its dependency on
// TargetPassConfig.
INITIALIZE_PASS_BEGIN(SVEShuffleOpts, DEBUG_TYPE, name, false, false)

INITIALIZE_PASS_DEPENDENCY(TargetPassConfig)

INITIALIZE_PASS_END(SVEShuffleOpts, DEBUG_TYPE, name, false, false)


/// Create a new instance of the legacy SVE shuffle optimization pass.
Pass *llvm::createSVEShuffleOptsPass() { return new SVEShuffleOpts(); }


/// New pass manager entry point: run the SVE shuffle optimization on \p L.
///
/// When the loop was changed, the CFG analyses together with
/// TargetIRAnalysis, AssumptionAnalysis and MemorySSAAnalysis are reported as
/// preserved; when nothing changed, everything is preserved.
PreservedAnalyses
AArch64SVEShuffleOptsPass::run(Loop &L, LoopAnalysisManager &AM,
                               LoopStandardAnalysisResults &AR, LPMUpdater &U) {
  const Function &F = *L.getHeader()->getParent();
  const AArch64Subtarget &ST = *TM.getSubtargetImpl(F);

  // Nothing was rewritten, so every analysis is still valid.
  if (!processLoop(L, ST, TM.createDataLayout()))
    return PreservedAnalyses::all();

  PreservedAnalyses Preserved;
  Preserved.preserveSet<CFGAnalyses>();
  Preserved.preserve<TargetIRAnalysis>();
  Preserved.preserve<AssumptionAnalysis>();
  Preserved.preserve<MemorySSAAnalysis>();
  return Preserved;
}


Widen
static SDValue Widen(SelectionDAG *CurDAG, SDValue N)
Definition AArch64ISelDAGToDAG.cpp:1412

assert
assert(UImm &&(UImm !=~static_cast< T >(0)) &&"Invalid immediate!")

AArch64Subtarget.h

AArch64TargetMachine.h

AArch64.h

DL
MachineBasicBlock MachineBasicBlock::iterator DebugLoc DL
Definition ARMSLSHardening.cpp:73

AssumptionCache.h

Constants.h
This file contains the declarations for the subclasses of Constant, which represent the different fla...

DEBUG_TYPE
#define DEBUG_TYPE
Definition GenericCycleImpl.h:34

IRBuilder.h

IntrinsicInst.h

PassManager.h
This header defines various interfaces for pass management in LLVM.

InitializePasses.h

Instructions.h

LLVMContext.h

LoopInfo.h

LoopPass.h

I
#define I(x, y, z)
Definition MD5.cpp:57

MemorySSA.h
This file exposes an interface to building/using memory SSA to walk memory instructions using a use/d...

INITIALIZE_PASS_DEPENDENCY
#define INITIALIZE_PASS_DEPENDENCY(depName)
Definition PassSupport.h:42

INITIALIZE_PASS_END
#define INITIALIZE_PASS_END(passName, arg, name, cfg, analysis)
Definition PassSupport.h:44

INITIALIZE_PASS_BEGIN
#define INITIALIZE_PASS_BEGIN(passName, arg, name, cfg, analysis)
Definition PassSupport.h:39

PatternMatch.h

DeinterleaveMap
SmallDenseMap< CallInst *, std::array< CastInst *, 4 > > DeinterleaveMap
A mapping between a vector_deinterleaveN intrinsic and extending cast instructions used on the result...
Definition SVEShuffleOpts.cpp:96

processLoop
static bool processLoop(Loop &L, const AArch64Subtarget &ST, DataLayout DL)
Definition SVEShuffleOpts.cpp:216

optimizeSVEDeinterleavedExtends
static void optimizeSVEDeinterleavedExtends(DeinterleaveMap Deinterleaves)
Given a map of deinterleaves to zext or uitofp casts, remove the operations and replace them with tbl...
Definition SVEShuffleOpts.cpp:160

name
static const char * name
Definition SVEShuffleOpts.cpp:269

evaluateDeinterleave
static void evaluateDeinterleave(IntrinsicInst *I, DeinterleaveMap &Candidates, Loop &L, const AArch64TargetLowering &TL, const DataLayout DL)
Evaluate a deinterleave and see what the uses are.
Definition SVEShuffleOpts.cpp:101

LLVM_DEBUG
#define LLVM_DEBUG(...)
Definition Debug.h:119

TargetLowering.h
This file describes how to lower LLVM code to machine code.

TargetPassConfig.h
Target-Independent Code Generator Pass Configuration Options pass.

TargetSubtargetInfo.h

TargetTransformInfo.h
This pass exposes codegen information to IR-level passes.

ValueTracking.h

Input
The Input class is used to parse a yaml document into in-memory structs and vectors.
Definition YAMLTraits.h:1314

VectorType
Definition ItaniumDemangle.h:1189

llvm::AArch64SVEShuffleOptsPass::run
LLVM_ABI PreservedAnalyses run(Loop &L, LoopAnalysisManager &AM, LoopStandardAnalysisResults &AR, LPMUpdater &U)
Definition SVEShuffleOpts.cpp:277

llvm::AArch64Subtarget
Definition AArch64Subtarget.h:38

llvm::AArch64TargetLowering
Definition AArch64ISelLowering.h:64

llvm::AArch64TargetMachine::getSubtargetImpl
const AArch64Subtarget * getSubtargetImpl(const Function &F) const override
Virtual method implemented by subclasses that returns a reference to that target's TargetSubtargetInf...
Definition AArch64TargetMachine.cpp:437

llvm::APInt
Class for arbitrary precision integers.
Definition APInt.h:78

llvm::APInt::getAllOnes
static APInt getAllOnes(unsigned numBits)
Return an APInt of a specified width with all bits set.
Definition APInt.h:235

llvm::APInt::ult
bool ult(const APInt &RHS) const
Unsigned less than comparison.
Definition APInt.h:1120

llvm::AnalysisUsage::addRequired
AnalysisUsage & addRequired()
Definition PassAnalysisSupport.h:76

llvm::AnalysisUsage::setPreservesCFG
LLVM_ABI void setPreservesCFG()
This function should be called by the pass, iff they do not:
Definition Pass.cpp:275

llvm::AssumptionAnalysis
A function analysis which provides an AssumptionCache.
Definition AssumptionCache.h:187

llvm::CFGAnalyses
Represents analyses that only rely on functions' control flow.
Definition Analysis.h:73

llvm::CastInst
This is the base class for all instructions that perform data casts.
Definition InstrTypes.h:512

llvm::CastInst::getOpcode
Instruction::CastOps getOpcode() const
Return the opcode of this CastInst.
Definition InstrTypes.h:674

llvm::CastInst::getDestTy
Type * getDestTy() const
Return the destination type, as a convenience.
Definition InstrTypes.h:681

llvm::ConstantRange
This class represents a range of values.
Definition ConstantRange.h:48

llvm::ConstantRange::getUpper
const APInt & getUpper() const
Return the upper value for this range.
Definition ConstantRange.h:220

llvm::ConstantRange::isUpperWrapped
LLVM_ABI bool isUpperWrapped() const
Return true if the exclusive upper bound wraps around the unsigned domain.
Definition ConstantRange.cpp:446

llvm::DataLayout
A parsed version of the target data layout string in and methods for querying it.
Definition DataLayout.h:64

llvm::IRBuilder
This provides a uniform API for creating instructions and inserting them into a basic block: either a...
Definition IRBuilder.h:2893

llvm::IntrinsicInst
A wrapper class for inspecting calls to intrinsic functions.
Definition IntrinsicInst.h:49

llvm::LPMUpdater
This class provides an interface for updating the loop pass manager based on mutations to the loop ne...
Definition LoopPassManager.h:218

llvm::LoopPass
Definition LoopPass.h:29

llvm::Loop
Represents a single loop in the control flow graph.
Definition LoopInfo.h:40

llvm::MemorySSAAnalysis
An analysis that produces MemorySSA for a function.
Definition MemorySSA.h:922

llvm::Pass
Pass interface - Implemented by all 'passes'.
Definition Pass.h:99

llvm::PreservedAnalyses
A set of analyses that are preserved following a run of a transformation pass.
Definition Analysis.h:112

llvm::PreservedAnalyses::all
static PreservedAnalyses all()
Construct a special preserved set that preserves all passes.
Definition Analysis.h:118

llvm::PreservedAnalyses::preserveSet
PreservedAnalyses & preserveSet()
Mark an analysis set as preserved.
Definition Analysis.h:151

llvm::PreservedAnalyses::preserve
PreservedAnalyses & preserve()
Mark an analysis as preserved.
Definition Analysis.h:132

llvm::SmallDenseMap
Definition DenseMap.h:975

llvm::TargetIRAnalysis
Analysis pass providing the TargetTransformInfo.
Definition TargetTransformInfo.h:2135

llvm::TargetLoweringBase::getValueType
EVT getValueType(const DataLayout &DL, Type *Ty, bool AllowUnknown=false) const
Return the EVT corresponding to this LLVM type.
Definition TargetLowering.h:1797

llvm::TargetLoweringBase::TypeLegal
@ TypeLegal
Definition TargetLowering.h:232

llvm::TargetLoweringBase::getTypeConversion
LegalizeKind getTypeConversion(LLVMContext &Context, EVT VT) const
Return pair that represents the legalization kind (first) that needs to happen to EVT (second) in ord...
Definition TargetLoweringBase.cpp:1393

llvm::TargetMachine::createDataLayout
const DataLayout createDataLayout() const
Create a DataLayout.
Definition TargetMachine.h:208

llvm::TargetPassConfig
Target-Independent Code Generator Pass Configuration Options.
Definition TargetPassConfig.h:84

llvm::TargetPassConfig::getTM
TMC & getTM() const
Get the right type of TargetMachine for this target.
Definition TargetPassConfig.h:159

llvm::Type
The instances of the Type class are immutable: once they are created, they are never changed.
Definition Type.h:46

llvm::Type::getPrimitiveSizeInBits
LLVM_ABI TypeSize getPrimitiveSizeInBits() const LLVM_READONLY
Return the basic size of this type if it is a primitive type.
Definition Type.cpp:197

llvm::User
Definition User.h:44

llvm::Value
LLVM Value Representation.
Definition Value.h:75

llvm::VectorType::getInteger
static VectorType * getInteger(VectorType *VTy)
This static method gets a VectorType with the same number of elements as the input type,...
Definition DerivedTypes.h:541

false
Definition MachinePipeliner.cpp:244

llvm::ARM_MB::ST
@ ST
Definition ARMBaseInfo.h:73

llvm::M68k::MemAddrModeKind::L
@ L
Definition M68kBaseInfo.h:69

llvm::PatternMatch
Definition PatternMatch.h:50

llvm::PatternMatch::match
bool match(Val *V, const Pattern &P)
Definition PatternMatch.h:54

llvm::PatternMatch::m_Value
auto m_Value()
Match an arbitrary value and ignore it.
Definition PatternMatch.h:136

llvm::PatternMatch::m_Intrinsic
auto m_Intrinsic(const Ts &...Ops)
Match intrinsic calls like this: m_Intrinsic<Intrinsic::fabs>(m_Value(X))
Definition PatternMatch.h:2804

llvm
This is an optimization pass for GlobalISel generic memory operations.
Definition FunctionInfo.h:25

llvm::all_of
bool all_of(R &&range, UnaryPredicate P)
Provide wrappers to std::all_of which take ranges instead of having to pass begin/end explicitly.
Definition STLExtras.h:1739

llvm::enumerate
auto enumerate(FirstRange &&First, RestRanges &&...Rest)
Given two or more input ranges, returns a new range whose values are tuples (A, B,...
Definition STLExtras.h:2554

llvm::dyn_cast
decltype(auto) dyn_cast(const From &Val)
dyn_cast<X> - Return the argument parameter cast to the specified type.
Definition Casting.h:643

llvm::dyn_cast_if_present
auto dyn_cast_if_present(const Y &Val)
dyn_cast_if_present<X> - Functionally identical to dyn_cast, except that a null (or none in the case ...
Definition Casting.h:732

llvm::make_early_inc_range
iterator_range< early_inc_iterator_impl< detail::IterOfRange< RangeT > > > make_early_inc_range(RangeT &&Range)
Make a range that does early increment to allow mutation of the underlying range without disrupting i...
Definition STLExtras.h:633

llvm::LoopAnalysisManager
AnalysisManager< Loop, LoopStandardAnalysisResults & > LoopAnalysisManager
The loop analysis manager.
Definition LoopAnalysisManager.h:75

llvm::ComplexDeinterleavingOperation::Deinterleave
@ Deinterleave
Definition ComplexDeinterleavingPass.h:41

llvm::dbgs
LLVM_ABI raw_ostream & dbgs()
dbgs() - This returns a reference to a raw_ostream for debugging messages.
Definition Debug.cpp:209

llvm::getVScaleRange
LLVM_ABI ConstantRange getVScaleRange(const Function *F, unsigned BitWidth)
Determine the possible constant range of vscale with the given bit width, based on the vscale_range f...
Definition ValueTracking.cpp:1301

llvm::isa
bool isa(const From &Val)
isa<X> - Return true if the parameter to the template is an instance of one of the template type argu...
Definition Casting.h:547

llvm::cast
decltype(auto) cast(const From &Val)
cast<X> - Return the argument parameter cast to the specified type.
Definition Casting.h:559

llvm::createSVEShuffleOptsPass
Pass * createSVEShuffleOptsPass()
Definition SVEShuffleOpts.cpp:274

llvm::Invalid
@ Invalid
Definition PGOCtxProfWriter.h:24

llvm::EVT
Extended Value Type.
Definition ValueTypes.h:35

llvm::EVT::getSizeInBits
TypeSize getSizeInBits() const
Return the size of the specified value type in bits.
Definition ValueTypes.h:396

llvm::EVT::getScalarSizeInBits
uint64_t getScalarSizeInBits() const
Definition ValueTypes.h:408

llvm::EVT::isScalableVector
bool isScalableVector() const
Return true if this is a vector type where the runtime length is machine dependent.
Definition ValueTypes.h:187

llvm::LoopStandardAnalysisResults
The adaptor from a function pass to a loop pass computes these analyses and makes them available to t...
Definition LoopAnalysisManager.h:52