doxygen/RISCVGatherScatterLowering_8cpp_source.html

//===- RISCVGatherScatterLowering.cpp - Gather/Scatter lowering -----------===//

//

// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.

// See https://llvm.org/LICENSE.txt for license information.

// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception

//

//===----------------------------------------------------------------------===//

//

// This pass custom lowers llvm.gather and llvm.scatter instructions to

// RISC-V intrinsics.

//

//===----------------------------------------------------------------------===//


#include "RISCV.h"

#include "RISCVTargetMachine.h"

#include "llvm/Analysis/InstSimplifyFolder.h"

#include "llvm/Analysis/LoopInfo.h"

#include "llvm/Analysis/ValueTracking.h"

#include "llvm/Analysis/VectorUtils.h"

#include "llvm/CodeGen/TargetPassConfig.h"

#include "llvm/IR/GetElementPtrTypeIterator.h"

#include "llvm/IR/IRBuilder.h"

#include "llvm/IR/IntrinsicInst.h"

#include "llvm/IR/PatternMatch.h"

#include "llvm/Transforms/Utils/Local.h"

#include <optional>


using namespace llvm;

using namespace PatternMatch;


#define DEBUG_TYPE "riscv-gather-scatter-lowering"


namespace {


// Function pass that looks for gather/scatter intrinsics whose pointer operand
// can be described as a scalar base plus a stride, and rewrites them into
// strided load/store intrinsics.
class RISCVGatherScatterLowering : public FunctionPass {
public:
  static char ID; // Pass identification, replacement for typeid

  RISCVGatherScatterLowering() : FunctionPass(ID) {}

  bool runOnFunction(Function &F) override;

  StringRef getPassName() const override {
    return "RISC-V gather/scatter lowering";
  }

  // The pass needs the target configuration and loop information, and it
  // declares that it leaves the CFG intact.
  void getAnalysisUsage(AnalysisUsage &AU) const override {
    AU.setPreservesCFG();
    AU.addRequired<TargetPassConfig>();
    AU.addRequired<LoopInfoWrapperPass>();
  }

private:
  // Attempt to replace a single gather/scatter intrinsic call. Returns true
  // if the call was rewritten.
  bool tryCreateStridedLoadStore(IntrinsicInst *II);

  // Compute a (scalar base pointer, stride) pair for the address vector Ptr,
  // or a pair of null pointers if no such description was found.
  std::pair<Value *, Value *> determineBaseAndStride(Instruction *Ptr,
                                                     IRBuilderBase &Builder);

  // Match a vector induction feeding Index inside loop L and build the
  // matching scalar recurrence; results come back through the reference
  // parameters.
  bool matchStridedRecurrence(Value *Index, Loop *L, Value *&Stride,
                              PHINode *&BasePtr, BinaryOperator *&Inc,
                              IRBuilderBase &Builder);

  // Per-function state, refreshed at the start of runOnFunction.
  const RISCVSubtarget *ST = nullptr;
  const RISCVTargetLowering *TLI = nullptr;
  LoopInfo *LI = nullptr;
  const DataLayout *DL = nullptr;

  // Vector phis that were replaced by a scalar recurrence and may now be dead.
  // Tracked through value handles so entries deleted elsewhere become null.
  SmallVector<WeakTrackingVH> MaybeDeadPHIs;

  // Cache of the BasePtr and Stride determined from a GEP. When a GEP is used
  // by multiple gathers/scatters, this allows us to reuse the scalar
  // instructions created for the first gather/scatter for the others.
  DenseMap<GetElementPtrInst *, std::pair<Value *, Value *>> StridedAddrs;
};


} // end anonymous namespace


// Out-of-class definition of the pass identification member declared in the
// class; it is the value handed to the FunctionPass constructor.
char RISCVGatherScatterLowering::ID = 0;


// Register the pass under the DEBUG_TYPE argument string with the given
// human-readable name. The two trailing `false` values are the macro's `cfg`
// and `analysis` arguments.
INITIALIZE_PASS(RISCVGatherScatterLowering, DEBUG_TYPE,

                "RISC-V gather/scatter lowering pass", false, false)


// Factory entry point: allocate a fresh instance of the gather/scatter
// lowering pass and hand it to the caller as a generic FunctionPass.
FunctionPass *llvm::createRISCVGatherScatterLoweringPass() {
  FunctionPass *NewPass = new RISCVGatherScatterLowering();
  return NewPass;
}


// TODO: Should we consider the mask when looking for a stride?
//
// Check whether the fixed-length constant vector StartC is an arithmetic
// sequence of integer constants. On success return (element 0, common
// difference between consecutive elements); otherwise return a pair of null
// pointers. A one-element vector matches with a stride of zero.
static std::pair<Value *, Value *> matchStridedConstant(Constant *StartC) {
  const std::pair<Value *, Value *> NoMatch(nullptr, nullptr);

  auto *VecTy = dyn_cast<FixedVectorType>(StartC->getType());
  if (!VecTy)
    return NoMatch;
  const unsigned NumElts = VecTy->getNumElements();

  // Every lane, beginning with the first one, has to be a plain ConstantInt.
  auto *First = dyn_cast_or_null<ConstantInt>(StartC->getAggregateElement(0U));
  if (!First)
    return NoMatch;

  APInt CommonDiff(First->getValue().getBitWidth(), 0);
  ConstantInt *Previous = First;
  for (unsigned Lane = 1; Lane != NumElts; ++Lane) {
    auto *Current =
        dyn_cast_or_null<ConstantInt>(StartC->getAggregateElement(Lane));
    if (!Current)
      return NoMatch;

    // The first pair of lanes defines the stride; all later pairs must agree.
    APInt Diff = Current->getValue() - Previous->getValue();
    if (Lane == 1)
      CommonDiff = Diff;
    else if (CommonDiff != Diff)
      return NoMatch;

    Previous = Current;
  }

  Value *Stride = ConstantInt::get(First->getType(), CommonDiff);
  return std::make_pair(First, Stride);
}


// Try to describe the vector value Start as "scalar start + lane * stride".
// Handles strided constants, stepvector, and add / disjoint-or / mul / shl of
// such a value with a splat. Scalar arithmetic that mirrors the vector
// arithmetic is emitted through Builder right before the matched binary
// operator. Returns (start, stride), or a pair of null pointers on failure.
static std::pair<Value *, Value *> matchStridedStart(Value *Start,
                                                     IRBuilderBase &Builder) {
  const std::pair<Value *, Value *> NoMatch(nullptr, nullptr);

  // Base case, start is a strided constant.
  if (auto *StartC = dyn_cast<Constant>(Start))
    return matchStridedConstant(StartC);

  // Base case, start is a stepvector: lanes are 0, 1, 2, ...
  if (match(Start, m_Intrinsic<Intrinsic::stepvector>())) {
    auto *EltTy = Start->getType()->getScalarType();
    return std::make_pair(ConstantInt::get(EltTy, 0),
                          ConstantInt::get(EltTy, 1));
  }

  // Not a constant, maybe it's a strided value with a splat added or
  // multiplied.
  auto *BO = dyn_cast<BinaryOperator>(Start);
  if (!BO)
    return NoMatch;

  const auto Opc = BO->getOpcode();
  switch (Opc) {
  case Instruction::Add:
  case Instruction::Shl:
  case Instruction::Mul:
    break;
  case Instruction::Or:
    // An or is only usable when it is known to behave like an add.
    if (!cast<PossiblyDisjointInst>(BO)->isDisjoint())
      return NoMatch;
    break;
  default:
    return NoMatch;
  }

  // Look for an operand that is splatted. The right-hand side is tried first;
  // the left-hand side is only eligible for commutative opcodes.
  unsigned StridedOpIdx = 0;
  Value *Splat = getSplatValue(BO->getOperand(1));
  if (!Splat && Instruction::isCommutative(Opc)) {
    Splat = getSplatValue(BO->getOperand(0));
    StridedOpIdx = 1;
  }
  if (!Splat)
    return NoMatch;

  // The remaining operand must itself be strided.
  Value *Stride;
  std::tie(Start, Stride) =
      matchStridedStart(BO->getOperand(StridedOpIdx), Builder);
  if (!Start)
    return NoMatch;

  Builder.SetInsertPoint(BO);
  Builder.SetCurrentDebugLocation(DebugLoc());

  // Add the splat value to the start or multiply the start and stride by the
  // splat.
  if (Opc == Instruction::Mul) {
    Start = Builder.CreateMul(Start, Splat);
    Stride = Builder.CreateMul(Stride, Splat);
  } else if (Opc == Instruction::Shl) {
    Start = Builder.CreateShl(Start, Splat);
    Stride = Builder.CreateShl(Stride, Splat);
  } else {
    assert((Opc == Instruction::Add || Opc == Instruction::Or) &&
           "Unexpected opcode");
    // TODO: We'd be better off creating disjoint or for the Or case, but we
    // don't yet have an IRBuilder API for that.
    Start = Builder.CreateAdd(Start, Splat);
  }

  return std::make_pair(Start, Stride);
}


// Recursively walk up the use-def chain until we find a Phi with a strided
// start value. Build and update a scalar recurrence as we unwind the
// recursion. We also update the Stride as we unwind. Our goal is to move all
// of the arithmetic out of the loop.
//
// On success, BasePtr is the new scalar phi, Inc is its scalar increment and
// Stride is the per-lane stride of the matched vector index.
bool RISCVGatherScatterLowering::matchStridedRecurrence(Value *Index, Loop *L,
                                                        Value *&Stride,
                                                        PHINode *&BasePtr,
                                                        BinaryOperator *&Inc,
                                                        IRBuilderBase &Builder) {
  // Our base case is a Phi.
  if (auto *VecPhi = dyn_cast<PHINode>(Index)) {
    // A phi node we want to perform this function on should be from the
    // loop header.
    if (VecPhi->getParent() != L->getHeader())
      return false;

    // The phi must be a simple recurrence updated by an add.
    Value *VecStep, *VecStart;
    if (!matchSimpleRecurrence(VecPhi, Inc, VecStart, VecStep))
      return false;
    if (Inc->getOpcode() != Instruction::Add)
      return false;

    assert(VecPhi->getNumIncomingValues() == 2 && "Expected 2 operand phi.");
    const unsigned BackedgeIdx = VecPhi->getIncomingValue(0) == Inc ? 0 : 1;
    assert(VecPhi->getIncomingValue(BackedgeIdx) == Inc &&
           "Expected one operand of phi to be Inc");

    // Only proceed if the step is loop invariant.
    if (!L->isLoopInvariant(VecStep))
      return false;

    // Step should be a splat.
    Value *ScalarStep = getSplatValue(VecStep);
    if (!ScalarStep)
      return false;

    Value *ScalarStart;
    std::tie(ScalarStart, Stride) = matchStridedStart(VecStart, Builder);
    if (!ScalarStart)
      return false;
    assert(Stride != nullptr);

    // Build scalar phi and increment next to their vector counterparts.
    BinaryOperator *VecInc = Inc;
    BasePtr = PHINode::Create(ScalarStart->getType(), 2,
                              VecPhi->getName() + ".scalar",
                              VecPhi->getIterator());
    Inc = BinaryOperator::CreateAdd(BasePtr, ScalarStep,
                                    VecInc->getName() + ".scalar",
                                    VecInc->getIterator());
    BasePtr->addIncoming(ScalarStart,
                         VecPhi->getIncomingBlock(1 - BackedgeIdx));
    BasePtr->addIncoming(Inc, VecPhi->getIncomingBlock(BackedgeIdx));

    // Note that this Phi might be eligible for removal.
    MaybeDeadPHIs.push_back(VecPhi);
    return true;
  }

  // Otherwise look for binary operator.
  auto *BO = dyn_cast<BinaryOperator>(Index);
  if (!BO)
    return false;

  // Accept add, shl, mul, and an or that can be treated as an add.
  const auto Opc = BO->getOpcode();
  const bool IsAddLike =
      Opc == Instruction::Add ||
      (Opc == Instruction::Or && cast<PossiblyDisjointInst>(BO)->isDisjoint());
  if (!IsAddLike && Opc != Instruction::Shl && Opc != Instruction::Mul)
    return false;

  // We should have one operand in the loop and one splat. The in-loop operand
  // may only sit on the right-hand side for commutative opcodes.
  auto IsDefinedInLoop = [L](Value *V) {
    auto *I = dyn_cast<Instruction>(V);
    return I && L->contains(I);
  };

  Value *OtherOp;
  if (IsDefinedInLoop(BO->getOperand(0))) {
    Index = BO->getOperand(0);
    OtherOp = BO->getOperand(1);
  } else if (Instruction::isCommutative(Opc) &&
             IsDefinedInLoop(BO->getOperand(1))) {
    Index = BO->getOperand(1);
    OtherOp = BO->getOperand(0);
  } else {
    return false;
  }

  // Make sure other op is loop invariant.
  if (!L->isLoopInvariant(OtherOp))
    return false;

  // Make sure we have a splat.
  Value *SplatOp = getSplatValue(OtherOp);
  if (!SplatOp)
    return false;

  // Recurse up the use-def chain.
  if (!matchStridedRecurrence(Index, L, Stride, BasePtr, Inc, Builder))
    return false;

  // Locate the Step and Start values from the recurrence.
  const unsigned StepIndex = Inc->getOperand(0) == BasePtr ? 1 : 0;
  const unsigned StartBlock = BasePtr->getOperand(0) == Inc ? 1 : 0;
  Value *Step = Inc->getOperand(StepIndex);
  Value *Start = BasePtr->getOperand(StartBlock);

  // We need to adjust the start value in the preheader.
  Builder.SetInsertPoint(
      BasePtr->getIncomingBlock(StartBlock)->getTerminator());
  Builder.SetCurrentDebugLocation(DebugLoc());

  if (Opc == Instruction::Mul) {
    Start = Builder.CreateMul(Start, SplatOp, "start");
    Step = Builder.CreateMul(Step, SplatOp, "step");
    Stride = Builder.CreateMul(Stride, SplatOp, "stride");
  } else if (Opc == Instruction::Shl) {
    Start = Builder.CreateShl(Start, SplatOp, "start");
    Step = Builder.CreateShl(Step, SplatOp, "step");
    Stride = Builder.CreateShl(Stride, SplatOp, "stride");
  } else {
    assert(IsAddLike && "Unexpected opcode!");
    // An add only affects the start value. It's ok to do this for Or because
    // we already checked that there are no common set bits.
    Start = Builder.CreateAdd(Start, SplatOp, "start");
  }

  Inc->setOperand(StepIndex, Step);
  BasePtr->setIncomingValue(StartBlock, Start);
  return true;
}


// Try to describe the vector of addresses Ptr as a scalar base pointer plus a
// stride between consecutive lanes.
//
// Recognized forms:
//  * Ptr is a splat: the base is the splatted pointer and the stride is 0.
//  * Ptr is a GEP with a strided vector base and only scalar indices: the
//    scalar indices are applied to the base's base pointer.
//  * Ptr is a GEP with a scalar (or splat) base and exactly one vector index
//    that is either a strided value (see matchStridedStart) or a strided
//    recurrence in a loop with a preheader and a latch (see
//    matchStridedRecurrence).
//
// New scalar instructions are emitted through Builder. Results for the last
// two GEP forms are cached in StridedAddrs. Returns (base, stride), with the
// stride scaled by the sequential element stride of the indexed type, or a
// pair of null pointers when no strided form was found.
std::pair<Value *, Value *>
RISCVGatherScatterLowering::determineBaseAndStride(Instruction *Ptr,
                                                   IRBuilderBase &Builder) {

  // A gather/scatter of a splat is a zero strided load/store.
  if (auto *BasePtr = getSplatValue(Ptr)) {
    Type *IntPtrTy = DL->getIntPtrType(BasePtr->getType());
    return std::make_pair(BasePtr, ConstantInt::get(IntPtrTy, 0));
  }

  auto *GEP = dyn_cast<GetElementPtrInst>(Ptr);
  if (!GEP)
    return std::make_pair(nullptr, nullptr);

  // Reuse a previously computed answer for this GEP if there is one.
  auto I = StridedAddrs.find(GEP);
  if (I != StridedAddrs.end())
    return I->second;

  SmallVector<Value *, 2> Ops(GEP->operands());

  // If the base pointer is a vector, check if it's strided.
  Value *Base = GEP->getPointerOperand();
  if (auto *BaseInst = dyn_cast<Instruction>(Base);
      BaseInst && BaseInst->getType()->isVectorTy()) {
    // If GEP's offset is scalar then we can add it to the base pointer's base.
    auto IsScalar = [](Value *Idx) { return !Idx->getType()->isVectorTy(); };
    if (all_of(GEP->indices(), IsScalar)) {
      auto [BaseBase, Stride] = determineBaseAndStride(BaseInst, Builder);
      if (BaseBase) {
        Builder.SetInsertPoint(GEP);
        SmallVector<Value *> Indices(GEP->indices());
        Value *OffsetBase =
            Builder.CreateGEP(GEP->getSourceElementType(), BaseBase, Indices,
                              GEP->getName() + "offset", GEP->isInBounds());
        return {OffsetBase, Stride};
      }
    }
  }

  // Base pointer needs to be a scalar.
  Value *ScalarBase = Base;
  if (ScalarBase->getType()->isVectorTy()) {
    ScalarBase = getSplatValue(ScalarBase);
    if (!ScalarBase)
      return std::make_pair(nullptr, nullptr);
  }

  std::optional<unsigned> VecOperand;
  unsigned TypeScale = 0;

  // Look for a vector operand and scale. Only a single vector index is
  // supported, and the element stride it indexes must have a fixed size.
  gep_type_iterator GTI = gep_type_begin(GEP);
  for (unsigned i = 1, e = GEP->getNumOperands(); i != e; ++i, ++GTI) {
    if (!Ops[i]->getType()->isVectorTy())
      continue;

    if (VecOperand)
      return std::make_pair(nullptr, nullptr);

    VecOperand = i;

    TypeSize TS = GTI.getSequentialElementStride(*DL);
    if (TS.isScalable())
      return std::make_pair(nullptr, nullptr);

    TypeScale = TS.getFixedValue();
  }

  // We need to find a vector index to simplify.
  if (!VecOperand)
    return std::make_pair(nullptr, nullptr);

  // We can't extract the stride if the arithmetic is done at a different size
  // than the pointer type. Adding the stride later may not wrap correctly.
  // Technically we could handle wider indices, but I don't expect that in
  // practice.  Handle one special case here - constants.  This simplifies
  // writing test cases.
  Value *VecIndex = Ops[*VecOperand];
  Type *VecIntPtrTy = DL->getIntPtrType(GEP->getType());
  if (VecIndex->getType() != VecIntPtrTy) {
    auto *VecIndexC = dyn_cast<Constant>(VecIndex);
    if (!VecIndexC)
      return std::make_pair(nullptr, nullptr);
    if (VecIndex->getType()->getScalarSizeInBits() >
        VecIntPtrTy->getScalarSizeInBits())
      VecIndex = ConstantFoldCastInstruction(Instruction::Trunc, VecIndexC,
                                             VecIntPtrTy);
    else
      VecIndex = ConstantFoldCastInstruction(Instruction::SExt, VecIndexC,
                                             VecIntPtrTy);

    // The constant folder returns null when it cannot fold the cast (for
    // example when an element is a constant expression). Give up instead of
    // passing a null value to the matchers below.
    if (!VecIndex)
      return std::make_pair(nullptr, nullptr);
  }

  // Handle the non-recursive case.  This is what we see if the vectorizer
  // decides to use a scalar IV + vid on demand instead of a vector IV.
  auto [Start, Stride] = matchStridedStart(VecIndex, Builder);
  if (Start) {
    assert(Stride);
    Builder.SetInsertPoint(GEP);

    // Replace the vector index with the scalar start and build a scalar GEP.
    Ops[*VecOperand] = Start;
    Type *SourceTy = GEP->getSourceElementType();
    Value *BasePtr =
        Builder.CreateGEP(SourceTy, ScalarBase, ArrayRef(Ops).drop_front());

    // The stride is expected to already have pointer-sized integer type.
    Type *IntPtrTy = DL->getIntPtrType(BasePtr->getType());
    assert(Stride->getType() == IntPtrTy && "Unexpected type");

    // Scale the stride by the size of the indexed type.
    if (TypeScale != 1)
      Stride = Builder.CreateMul(Stride, ConstantInt::get(IntPtrTy, TypeScale));

    auto P = std::make_pair(BasePtr, Stride);
    StridedAddrs[GEP] = P;
    return P;
  }

  // Make sure we're in a loop and that has a pre-header and a single latch.
  Loop *L = LI->getLoopFor(GEP->getParent());
  if (!L || !L->getLoopPreheader() || !L->getLoopLatch())
    return std::make_pair(nullptr, nullptr);

  BinaryOperator *Inc;
  PHINode *BasePhi;
  if (!matchStridedRecurrence(VecIndex, L, Stride, BasePhi, Inc, Builder))
    return std::make_pair(nullptr, nullptr);

  assert(BasePhi->getNumIncomingValues() == 2 && "Expected 2 operand phi.");
  unsigned IncrementingBlock = BasePhi->getOperand(0) == Inc ? 0 : 1;
  assert(BasePhi->getIncomingValue(IncrementingBlock) == Inc &&
         "Expected one operand of phi to be Inc");

  Builder.SetInsertPoint(GEP);

  // Replace the vector index with the scalar phi and build a scalar GEP.
  Ops[*VecOperand] = BasePhi;
  Type *SourceTy = GEP->getSourceElementType();
  Value *BasePtr =
      Builder.CreateGEP(SourceTy, ScalarBase, ArrayRef(Ops).drop_front());

  // Final adjustments to stride should go in the start block.
  Builder.SetInsertPoint(
      BasePhi->getIncomingBlock(1 - IncrementingBlock)->getTerminator());

  // The stride is expected to already have pointer-sized integer type.
  Type *IntPtrTy = DL->getIntPtrType(BasePtr->getType());
  assert(Stride->getType() == IntPtrTy && "Unexpected type");

  // Scale the stride by the size of the indexed type.
  if (TypeScale != 1)
    Stride = Builder.CreateMul(Stride, ConstantInt::get(IntPtrTy, TypeScale));

  auto P = std::make_pair(BasePtr, Stride);
  StridedAddrs[GEP] = P;
  return P;
}


// Try to turn the gather/scatter call II (masked or VP flavour) into a call to
// the corresponding experimental VP strided load/store intrinsic. Returns true
// if II was replaced and erased, false if it was left untouched.
bool RISCVGatherScatterLowering::tryCreateStridedLoadStore(IntrinsicInst *II) {
  // Classify the intrinsic along two axes: gather vs. scatter and masked vs.
  // vector-predicated.
  bool IsScatter = false;
  bool IsVP = false;
  switch (II->getIntrinsicID()) {
  case Intrinsic::masked_gather:
    break;
  case Intrinsic::vp_gather:
    IsVP = true;
    break;
  case Intrinsic::masked_scatter:
    IsScatter = true;
    break;
  case Intrinsic::vp_scatter:
    IsScatter = true;
    IsVP = true;
    break;
  default:
    llvm_unreachable("Unexpected intrinsic");
  }

  // Scatters carry the stored value as operand 0, which shifts every other
  // operand up by one compared with the matching gather.
  const unsigned PtrIdx = IsScatter ? 1 : 0;
  Value *StoreVal = IsScatter ? II->getArgOperand(0) : nullptr;
  auto *DataType =
      cast<VectorType>(IsScatter ? StoreVal->getType() : II->getType());
  Value *Ptr = II->getArgOperand(PtrIdx);

  Value *Mask;
  Value *EVL = nullptr;
  MaybeAlign MA;
  if (IsVP) {
    // VP form: (..., ptrs, mask, evl); alignment is a parameter attribute on
    // the pointer operand and falls back to the element's ABI alignment.
    MA = II->getParamAlign(PtrIdx).value_or(
        DL->getABITypeAlign(DataType->getElementType()));
    Mask = II->getArgOperand(PtrIdx + 1);
    EVL = II->getArgOperand(PtrIdx + 2);
  } else {
    // Masked form: (..., ptrs, align, mask[, passthru]).
    MA = cast<ConstantInt>(II->getArgOperand(PtrIdx + 1))->getMaybeAlignValue();
    Mask = II->getArgOperand(PtrIdx + 2);
  }

  // Make sure the operation will be supported by the backend.
  EVT DataTypeVT = TLI->getValueType(*DL, DataType);
  if (!MA || !TLI->isLegalStridedLoadStore(DataTypeVT, *MA))
    return false;

  // FIXME: Let the backend type legalize by splitting/widening?
  if (!TLI->isTypeLegal(DataTypeVT))
    return false;

  // Pointer should be an instruction.
  auto *PtrI = dyn_cast<Instruction>(Ptr);
  if (!PtrI)
    return false;

  LLVMContext &Ctx = PtrI->getContext();
  IRBuilder Builder(Ctx, InstSimplifyFolder(*DL));
  Builder.SetInsertPoint(PtrI);

  auto [BasePtr, Stride] = determineBaseAndStride(PtrI, Builder);
  if (!BasePtr)
    return false;
  assert(Stride != nullptr);

  Builder.SetInsertPoint(II);

  // The masked intrinsics have no explicit vector length; use the full
  // element count of the data type.
  if (!EVL)
    EVL = Builder.CreateElementCount(Builder.getInt32Ty(),
                                     DataType->getElementCount());

  CallInst *Call;
  if (StoreVal) {
    Call = Builder.CreateIntrinsic(
        Intrinsic::experimental_vp_strided_store,
        {DataType, BasePtr->getType(), Stride->getType()},
        {StoreVal, BasePtr, Stride, Mask, EVL});
  } else {
    Call = Builder.CreateIntrinsic(
        Intrinsic::experimental_vp_strided_load,
        {DataType, BasePtr->getType(), Stride->getType()},
        {BasePtr, Stride, Mask, EVL});

    // Merge llvm.masked.gather's passthru
    if (!IsVP)
      Call = Builder.CreateIntrinsic(Intrinsic::vp_select, {DataType},
                                     {Mask, Call, II->getArgOperand(3), EVL});
  }

  // Swap the new call in for the original intrinsic.
  Call->takeName(II);
  II->replaceAllUsesWith(Call);
  II->eraseFromParent();

  // The old address computation may have become dead.
  if (PtrI->use_empty())
    RecursivelyDeleteTriviallyDeadInstructions(PtrI);

  return true;
}


// Pass entry point: collect every masked/VP gather and scatter in F, try to
// rewrite each one as a strided access, then clean up vector phis that the
// rewrites may have left dead. Returns true if any intrinsic was rewritten.
bool RISCVGatherScatterLowering::runOnFunction(Function &F) {
  if (skipFunction(F))
    return false;

  auto &TM = getAnalysis<TargetPassConfig>().getTM<RISCVTargetMachine>();
  ST = &TM.getSubtarget<RISCVSubtarget>(F);

  // Nothing to do without vector instructions or when RVV is not used for
  // fixed-length vectors.
  if (!ST->hasVInstructions())
    return false;
  if (!ST->useRVVForFixedLengthVectors())
    return false;

  TLI = ST->getTargetLowering();
  DL = &F.getDataLayout();
  LI = &getAnalysis<LoopInfoWrapperPass>().getLoopInfo();

  // Cached addresses belong to the previously processed function.
  StridedAddrs.clear();

  auto IsGatherOrScatter = [](Intrinsic::ID IID) {
    return IID == Intrinsic::masked_gather ||
           IID == Intrinsic::masked_scatter || IID == Intrinsic::vp_gather ||
           IID == Intrinsic::vp_scatter;
  };

  // Gather the candidates up front so the rewrite below does not modify the
  // instruction lists while they are being walked.
  SmallVector<IntrinsicInst *, 4> Worklist;
  for (BasicBlock &BB : F)
    for (Instruction &I : BB)
      if (auto *II = dyn_cast<IntrinsicInst>(&I))
        if (IsGatherOrScatter(II->getIntrinsicID()))
          Worklist.push_back(II);

  // Rewrite gather/scatter to form strided load/store if possible.
  bool Changed = false;
  for (IntrinsicInst *II : Worklist)
    if (tryCreateStridedLoadStore(II))
      Changed = true;

  // Remove any dead phis. Handles whose phi has already been deleted read
  // back as null and are skipped.
  while (!MaybeDeadPHIs.empty()) {
    Value *Candidate = MaybeDeadPHIs.pop_back_val();
    if (auto *Phi = dyn_cast_or_null<PHINode>(Candidate))
      RecursivelyDeleteDeadPHINode(Phi);
  }

  return Changed;
}

DL
MachineBasicBlock MachineBasicBlock::iterator DebugLoc DL
Definition: ARMSLSHardening.cpp:73

Idx
Returns the sub type a function will return at a given Idx Should correspond to the result type of an ExtractValue instruction executed with just that one unsigned Idx
Definition: DeadArgumentElimination.cpp:353

GetElementPtrTypeIterator.h

GEP
Hexagon Common GEP
Definition: HexagonCommonGEP.cpp:170

IRBuilder.h

IntrinsicInst.h

InstSimplifyFolder.h

LoopInfo.h

F
#define F(x, y, z)
Definition: MD5.cpp:55

I
#define I(x, y, z)
Definition: MD5.cpp:58

II
uint64_t IntrinsicInst * II
Definition: NVVMIntrRange.cpp:51

P
#define P(N)

INITIALIZE_PASS
#define INITIALIZE_PASS(passName, arg, name, cfg, analysis)
Definition: PassSupport.h:38

PatternMatch.h

matchStridedStart
static std::pair< Value *, Value * > matchStridedStart(Value *Start, IRBuilderBase &Builder)
Definition: RISCVGatherScatterLowering.cpp:120

matchStridedConstant
static std::pair< Value *, Value * > matchStridedConstant(Constant *StartC)
Definition: RISCVGatherScatterLowering.cpp:88

DEBUG_TYPE
#define DEBUG_TYPE
Definition: RISCVGatherScatterLowering.cpp:31

RISCVTargetMachine.h

RISCV.h

assert
assert(ImpDefSCC.getReg()==AMDGPU::SCC &&ImpDefSCC.isDef())

getType
static SymbolRef::Type getType(const Symbol *Sym)
Definition: TapiFile.cpp:39

Ptr
@ Ptr
Definition: TargetLibraryInfo.cpp:77

TargetPassConfig.h
Target-Independent Code Generator Pass Configuration Options pass.

Local.h

ValueTracking.h

VectorUtils.h

VectorType
Definition: ItaniumDemangle.h:1173

llvm::APInt
Class for arbitrary precision integers.
Definition: APInt.h:78

llvm::AnalysisUsage
Represent the analysis usage information of a pass.
Definition: PassAnalysisSupport.h:47

llvm::AnalysisUsage::addRequired
AnalysisUsage & addRequired()
Definition: PassAnalysisSupport.h:75

llvm::AnalysisUsage::setPreservesCFG
void setPreservesCFG()
This function should be called by the pass, iff they do not:
Definition: Pass.cpp:256

llvm::ArrayRef
ArrayRef - Represent a constant reference to an array (0 or more elements consecutively in memory),...
Definition: ArrayRef.h:41

llvm::BasicBlock
LLVM Basic Block Representation.
Definition: BasicBlock.h:61

llvm::BasicBlock::getTerminator
const Instruction * getTerminator() const LLVM_READONLY
Returns the terminator instruction if the block is well formed or null if the block is not well forme...
Definition: BasicBlock.h:239

llvm::BinaryOperator
Definition: InstrTypes.h:170

llvm::BinaryOperator::getOpcode
BinaryOps getOpcode() const
Definition: InstrTypes.h:370

llvm::CallInst
This class represents a function call, abstracting a target machine's calling convention.
Definition: Instructions.h:1479

llvm::ConstantInt
This is the shared class of boolean and integer constants.
Definition: Constants.h:83

llvm::ConstantInt::getValue
const APInt & getValue() const
Return the constant as an APInt value reference.
Definition: Constants.h:148

llvm::Constant
This is an important base class in LLVM.
Definition: Constant.h:42

llvm::Constant::getAggregateElement
Constant * getAggregateElement(unsigned Elt) const
For aggregates (struct/array/vector) return the constant that corresponds to the specified element if...
Definition: Constants.cpp:435

llvm::DataLayout
A parsed version of the target data layout string in and methods for querying it.
Definition: DataLayout.h:63

llvm::DebugLoc
A debug info location.
Definition: DebugLoc.h:33

llvm::DenseMap
Definition: DenseMap.h:727

llvm::FunctionPass
FunctionPass class - This class is used to implement most global optimizations.
Definition: Pass.h:310

llvm::FunctionPass::runOnFunction
virtual bool runOnFunction(Function &F)=0
runOnFunction - Virtual method overridden by subclasses to do the per-function processing of the pass.

llvm::Function
Definition: Function.h:63

llvm::IRBuilderBase
Common base class shared among various IRBuilders.
Definition: IRBuilder.h:113

llvm::IRBuilderBase::getInt32Ty
IntegerType * getInt32Ty()
Fetch the type representing a 32-bit integer.
Definition: IRBuilder.h:545

llvm::IRBuilderBase::SetCurrentDebugLocation
void SetCurrentDebugLocation(DebugLoc L)
Set location information used by debugging information.
Definition: IRBuilder.h:239

llvm::IRBuilderBase::CreateGEP
Value * CreateGEP(Type *Ty, Value *Ptr, ArrayRef< Value * > IdxList, const Twine &Name="", GEPNoWrapFlags NW=GEPNoWrapFlags::none())
Definition: IRBuilder.h:1874

llvm::IRBuilderBase::CreateIntrinsic
CallInst * CreateIntrinsic(Intrinsic::ID ID, ArrayRef< Type * > Types, ArrayRef< Value * > Args, FMFSource FMFSource={}, const Twine &Name="")
Create a call to intrinsic ID with Args, mangled using Types.
Definition: IRBuilder.cpp:900

llvm::IRBuilderBase::CreateShl
Value * CreateShl(Value *LHS, Value *RHS, const Twine &Name="", bool HasNUW=false, bool HasNSW=false)
Definition: IRBuilder.h:1459

llvm::IRBuilderBase::CreateAdd
Value * CreateAdd(Value *LHS, Value *RHS, const Twine &Name="", bool HasNUW=false, bool HasNSW=false)
Definition: IRBuilder.h:1370

llvm::IRBuilderBase::CreateElementCount
Value * CreateElementCount(Type *DstType, ElementCount EC)
Create an expression which evaluates to the number of elements in EC at runtime.
Definition: IRBuilder.cpp:98

llvm::IRBuilderBase::SetInsertPoint
void SetInsertPoint(BasicBlock *TheBB)
This specifies that created instructions should be appended to the end of the specified block.
Definition: IRBuilder.h:199

llvm::IRBuilderBase::CreateMul
Value * CreateMul(Value *LHS, Value *RHS, const Twine &Name="", bool HasNUW=false, bool HasNSW=false)
Definition: IRBuilder.h:1404

llvm::IRBuilder
This provides a uniform API for creating instructions and inserting them into a basic block: either a...
Definition: IRBuilder.h:2705

llvm::InstSimplifyFolder
InstSimplifyFolder - Use InstructionSimplify to fold operations to existing values.
Definition: InstSimplifyFolder.h:35

llvm::Instruction
Definition: Instruction.h:68

llvm::Instruction::isCommutative
bool isCommutative() const LLVM_READONLY
Return true if the instruction is commutative:
Definition: Instruction.cpp:1256

llvm::IntrinsicInst
A wrapper class for inspecting calls to intrinsic functions.
Definition: IntrinsicInst.h:48

llvm::LLVMContext
This is an important class for using LLVM in a threaded context.
Definition: LLVMContext.h:67

llvm::LoopInfoWrapperPass
The legacy pass manager's analysis pass to compute loop information.
Definition: LoopInfo.h:593

llvm::LoopInfo
Definition: LoopInfo.h:407

llvm::Loop
Represents a single loop in the control flow graph.
Definition: LoopInfo.h:39

llvm::PHINode
Definition: Instructions.h:2600

llvm::PHINode::getIncomingBlock
BasicBlock * getIncomingBlock(unsigned i) const
Return incoming basic block number i.
Definition: Instructions.h:2695

llvm::PHINode::getIncomingValue
Value * getIncomingValue(unsigned i) const
Return incoming value number x.
Definition: Instructions.h:2675

llvm::PHINode::getNumIncomingValues
unsigned getNumIncomingValues() const
Return the number of incoming edges.
Definition: Instructions.h:2671

llvm::PHINode::Create
static PHINode * Create(Type *Ty, unsigned NumReservedValues, const Twine &NameStr="", InsertPosition InsertBefore=nullptr)
Constructors - NumReservedValues is a hint for the number of incoming edges that this phi node will h...
Definition: Instructions.h:2635

llvm::Pass::getAnalysisUsage
virtual void getAnalysisUsage(AnalysisUsage &) const
getAnalysisUsage - This function should be overridden by passes that need analysis information to do t...
Definition: Pass.cpp:98

llvm::Pass::getPassName
virtual StringRef getPassName() const
getPassName - Return a nice clean name for a pass.
Definition: Pass.cpp:81

llvm::RISCVSubtarget
Definition: RISCVSubtarget.h:78

llvm::RISCVTargetLowering
Definition: RISCVISelLowering.h:506

llvm::RISCVTargetMachine
Definition: RISCVTargetMachine.h:23

llvm::SmallVectorTemplateBase::push_back
void push_back(const T &Elt)
Definition: SmallVector.h:413

llvm::SmallVector
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small.
Definition: SmallVector.h:1196

llvm::StringRef
StringRef - Represent a constant reference to a string, i.e.
Definition: StringRef.h:51

llvm::TargetPassConfig
Target-Independent Code Generator Pass Configuration Options.
Definition: TargetPassConfig.h:85

llvm::TypeSize
Definition: TypeSize.h:334

llvm::Type
The instances of the Type class are immutable: once they are created, they are never changed.
Definition: Type.h:45

llvm::Type::isVectorTy
bool isVectorTy() const
True if this is an instance of VectorType.
Definition: Type.h:270

llvm::Type::getScalarSizeInBits
unsigned getScalarSizeInBits() const LLVM_READONLY
If this is a vector type, return the getPrimitiveSizeInBits value for the element type.

llvm::User::setOperand
void setOperand(unsigned i, Value *Val)
Definition: User.h:233

llvm::User::getOperand
Value * getOperand(unsigned i) const
Definition: User.h:228

llvm::Value
LLVM Value Representation.
Definition: Value.h:74

llvm::Value::getType
Type * getType() const
All values are typed, get the type of this value.
Definition: Value.h:255

llvm::Value::getName
StringRef getName() const
Return a constant reference to the value's name.
Definition: Value.cpp:309

llvm::details::FixedOrScalableQuantity::getFixedValue
constexpr ScalarTy getFixedValue() const
Definition: TypeSize.h:202

llvm::details::FixedOrScalableQuantity::isScalable
constexpr bool isScalable() const
Returns whether the quantity is scaled by a runtime quantity (vscale).
Definition: TypeSize.h:171

llvm::generic_gep_type_iterator
Definition: GetElementPtrTypeIterator.h:31

llvm::generic_gep_type_iterator::getSequentialElementStride
TypeSize getSequentialElementStride(const DataLayout &DL) const
Definition: GetElementPtrTypeIterator.h:154

llvm::ilist_node_impl::getIterator
self_iterator getIterator()
Definition: ilist_node.h:132

unsigned

llvm_unreachable
#define llvm_unreachable(msg)
Marks that the current location is not supposed to be reachable.
Definition: ErrorHandling.h:143

llvm::ARM_MB::ST
@ ST
Definition: ARMBaseInfo.h:73

llvm::BitmaskEnumDetail::Mask
constexpr std::underlying_type_t< E > Mask()
Get a bitmask with 1s in all places up to the high-order bit of E's largest value.
Definition: BitmaskEnum.h:125

llvm::CallingConv::C
@ C
The default llvm calling convention, compatible with C.
Definition: CallingConv.h:34

llvm::CallingConv::ID
unsigned ID
LLVM IR allows to use arbitrary numbers as calling convention identifiers.
Definition: CallingConv.h:24

llvm::M68k::MemAddrModeKind::L
@ L

llvm::MCID::Call
@ Call
Definition: MCInstrDesc.h:156

llvm::PatternMatch::match
bool match(Val *V, const Pattern &P)
Definition: PatternMatch.h:49

llvm::SystemZISD::TM
@ TM
Definition: SystemZISelLowering.h:66

llvm::codeview::EncodedFramePtrReg::BasePtr
@ BasePtr

llvm::dwarf::Index
Index
Definition: Dwarf.h:882

llvm::rdf::Phi
NodeAddr< PhiNode * > Phi
Definition: RDFGraph.h:390

llvm::sampleprof::Base
@ Base
Definition: Discriminator.h:58

llvm
This is an optimization pass for GlobalISel generic memory operations.
Definition: AddressRanges.h:18

llvm::all_of
bool all_of(R &&range, UnaryPredicate P)
Provide wrappers to std::all_of which take ranges instead of having to pass begin/end explicitly.
Definition: STLExtras.h:1739

llvm::RecursivelyDeleteTriviallyDeadInstructions
bool RecursivelyDeleteTriviallyDeadInstructions(Value *V, const TargetLibraryInfo *TLI=nullptr, MemorySSAUpdater *MSSAU=nullptr, std::function< void(Value *)> AboutToDeleteCallback=std::function< void(Value *)>())
If the specified value is a trivially dead instruction, delete it.
Definition: Local.cpp:546

llvm::getSplatValue
Value * getSplatValue(const Value *V)
Get splat value if the input is a splat vector or return nullptr.
Definition: VectorUtils.cpp:312

llvm::createRISCVGatherScatterLoweringPass
FunctionPass * createRISCVGatherScatterLoweringPass()

llvm::matchSimpleRecurrence
bool matchSimpleRecurrence(const PHINode *P, BinaryOperator *&BO, Value *&Start, Value *&Step)
Attempt to match a simple first order recurrence cycle of the form: iv = phi Ty [Start,...
Definition: ValueTracking.cpp:9200

llvm::ComplexDeinterleavingOperation::Splat
@ Splat

llvm::gep_type_begin
gep_type_iterator gep_type_begin(const User *GEP)
Definition: GetElementPtrTypeIterator.h:173

llvm::RecursivelyDeleteDeadPHINode
bool RecursivelyDeleteDeadPHINode(PHINode *PN, const TargetLibraryInfo *TLI=nullptr, MemorySSAUpdater *MSSAU=nullptr)
If the specified value is an effectively dead PHI node, due to being a def-use chain of single-use no...
Definition: Local.cpp:657

llvm::ConstantFoldCastInstruction
Constant * ConstantFoldCastInstruction(unsigned opcode, Constant *V, Type *DestTy)
Definition: ConstantFold.cpp:131

llvm::EVT
Extended Value Type.
Definition: ValueTypes.h:35

llvm::MaybeAlign
This struct is a compact representation of a valid (power of two) or undefined (0) alignment.
Definition: Alignment.h:117