doxygen/RISCVCodeGenPrepare_8cpp_source.html

//===----- RISCVCodeGenPrepare.cpp ----------------------------------------===//

//

// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.

// See https://llvm.org/LICENSE.txt for license information.

// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception

//

//===----------------------------------------------------------------------===//

//

// This is a RISC-V specific version of CodeGenPrepare.

// It munges the code in the input function to better prepare it for

// SelectionDAG-based code generation. This works around limitations in its

// basic-block-at-a-time approach.

//

//===----------------------------------------------------------------------===//


#include "RISCV.h"

#include "RISCVTargetMachine.h"

#include "llvm/ADT/Statistic.h"

#include "llvm/Analysis/ValueTracking.h"

#include "llvm/CodeGen/TargetPassConfig.h"

#include "llvm/IR/Dominators.h"

#include "llvm/IR/IRBuilder.h"

#include "llvm/IR/InstVisitor.h"

#include "llvm/IR/Intrinsics.h"

#include "llvm/IR/PatternMatch.h"

#include "llvm/InitializePasses.h"

#include "llvm/Pass.h"


using namespace llvm;


#define DEBUG_TYPE "riscv-codegenprepare"

#define PASS_NAME "RISC-V CodeGenPrepare"


namespace {


/// Legacy-pass-manager function pass that rewrites selected IR patterns.
///
/// The pass is also an InstVisitor returning bool: each visit* hook reports
/// whether it modified the IR, and runOnFunction ORs those results together.
class RISCVCodeGenPrepare : public FunctionPass,
                            public InstVisitor<RISCVCodeGenPrepare, bool> {
  // Per-function state, assigned at the top of runOnFunction before any
  // instruction is visited. Default to null so the members never hold an
  // indeterminate value between construction and the first run.
  const DataLayout *DL = nullptr;
  const DominatorTree *DT = nullptr;
  const RISCVSubtarget *ST = nullptr;

public:
  static char ID;

  RISCVCodeGenPrepare() : FunctionPass(ID) {}

  /// Visits every instruction of \p F; returns true if any visitor changed
  /// the IR.
  bool runOnFunction(Function &F) override;

  StringRef getPassName() const override { return PASS_NAME; }

  /// Declares that the CFG is preserved and that the dominator tree and the
  /// target pass configuration are required.
  void getAnalysisUsage(AnalysisUsage &AU) const override {
    AU.setPreservesCFG();
    AU.addRequired<DominatorTreeWrapperPass>();
    AU.addRequired<TargetPassConfig>();
  }

  /// Fallback for instructions without a dedicated visitor: no change.
  bool visitInstruction(Instruction &I) { return false; }
  /// Rewrites the constant operand of a qualifying i64 'and'.
  bool visitAnd(BinaryOperator &BO);
  /// Handles zero-strided VP loads and fadd reductions fed by a scalar phi.
  bool visitIntrinsicInst(IntrinsicInst &I);
  /// Replaces a zero-strided VP load with a scalar load plus a VP splat.
  bool expandVPStrideLoad(IntrinsicInst &I);
};


} // end anonymous namespace


// Try to optimize (i64 (and (zext/sext (i32 X), C1))) if C1 has bit 31 set,

// but bits 63:32 are zero. If we know that bit 31 of X is 0, we can fill

// the upper 32 bits with ones.

bool RISCVCodeGenPrepare::visitAnd(BinaryOperator &BO) {
  using namespace PatternMatch;

  // Only i64 'and' instructions on a 64-bit subtarget are of interest.
  if (!ST->is64Bit() || !BO.getType()->isIntegerTy(64))
    return false;

  // Operand 0 must be a 'zext nneg' whose source is an i32.
  Value *Narrow;
  if (!match(BO.getOperand(0), m_NNegZExt(m_Value(Narrow))) ||
      !Narrow->getType()->isIntegerTy(32))
    return false;

  // Operand 1 must be a constant integer mask.
  Value *MaskOp = BO.getOperand(1);
  auto *MaskCI = dyn_cast<ConstantInt>(MaskOp);
  if (!MaskCI)
    return false;

  const uint64_t Mask = MaskCI->getZExtValue();
  const int64_t SExtMask = SignExtend64<32>(Mask);

  // Accept only masks that fit in 32 bits, are not already a simm12, and
  // become a simm12 once bit 31 is sign extended. Such a mask can then be
  // materialised as an ANDI immediate.
  // TODO: Is it worth handling simm32 as well?
  if (!isUInt<32>(Mask) || isInt<12>(Mask) || !isInt<12>(SExtMask))
    return false;

  // Swap in the sign-extended mask as the new 'and' operand.
  BO.setOperand(
      1, ConstantInt::get(MaskOp->getType(), static_cast<uint64_t>(SExtMask)));
  return true;
}


// LLVM vector reduction intrinsics return a scalar result, but on RISC-V vector

// reduction instructions write the result in the first element of a vector

// register. So when a reduction in a loop uses a scalar phi, we end up with

// unnecessary scalar moves:

//

// loop:

// vfmv.s.f v10, fa0

// vfredosum.vs v8, v8, v10

// vfmv.f.s fa0, v8

//

// This mainly affects ordered fadd reductions, since other types of reduction

// typically use element-wise vectorisation in the loop body. This tries to

// vectorize any scalar phis that feed into a fadd reduction:

//

// loop:

// %phi = phi float [ ..., %entry ], [ %acc, %loop ]

// %acc = call float @llvm.vector.reduce.fadd.nxv2f32(float %phi,

//                                                    <vscale x 2 x float> %vec)

//

// ->

//

// loop:

// %phi = phi <vscale x 2 x float> [ ..., %entry ], [ %acc.vec, %loop ]

// %phi.scalar = extractelement <vscale x 2 x float> %phi, i64 0

// %acc = call float @llvm.vector.reduce.fadd.nxv2f32(float %phi.scalar,

//                                                    <vscale x 2 x float> %vec)

// %acc.vec = insertelement <vscale x 2 x float> poison, float %acc, i64 0

//

// Which eliminates the scalar -> vector -> scalar crossing during instruction

// selection.

bool RISCVCodeGenPrepare::visitIntrinsicInst(IntrinsicInst &I) {
  // Give the zero-strided VP load expansion the first shot; if it fired, the
  // intrinsic has been replaced and there is nothing left to do here.
  if (expandVPStrideLoad(I))
    return true;

  // Everything below only concerns fadd reductions.
  if (I.getIntrinsicID() != Intrinsic::vector_reduce_fadd)
    return false;

  // The start value must be a phi whose only user is a reduction and which
  // receives this reduction's result along one of its incoming edges.
  auto *ScalarPHI = dyn_cast<PHINode>(I.getOperand(0));
  if (!ScalarPHI)
    return false;
  if (!ScalarPHI->hasOneUse())
    return false;
  if (!llvm::is_contained(ScalarPHI->incoming_values(), &I))
    return false;

  // Create the vector-typed phi next to the scalar one.
  Type *VecTy = I.getOperand(1)->getType();
  IRBuilder<> Builder(ScalarPHI);
  PHINode *VecPHI = Builder.CreatePHI(VecTy, ScalarPHI->getNumIncomingValues());

  // For each incoming block, place the scalar incoming value into element 0
  // of a vector just before that block's terminator and feed it to the new
  // phi.
  for (BasicBlock *Pred : ScalarPHI->blocks()) {
    Builder.SetInsertPoint(Pred->getTerminator());
    Value *Incoming = ScalarPHI->getIncomingValueForBlock(Pred);
    Value *Widened =
        Builder.CreateInsertElement(VecTy, Incoming, static_cast<uint64_t>(0));
    VecPHI->addIncoming(Widened, Pred);
  }

  // The reduction now takes its start value from element 0 of the vector phi.
  Builder.SetInsertPoint(&I);
  Value *Start =
      Builder.CreateExtractElement(VecPHI, static_cast<uint64_t>(0));
  I.setOperand(0, Start);

  // The scalar phi has lost its only user and can go away.
  ScalarPHI->eraseFromParent();
  return true;
}


// Always expand zero strided loads so we match more .vx splat patterns, even if

// we have +optimized-zero-stride-loads. RISCVDAGToDAGISel::Select will convert

// it back to a strided load if it's optimized.

bool RISCVCodeGenPrepare::expandVPStrideLoad(IntrinsicInst &II) {
  using namespace PatternMatch;

  // Match a VP strided load whose second operand is zero and whose third
  // operand is all-ones, capturing the pointer and the trailing VL operand.
  Value *Addr;
  Value *EVL;
  const bool IsZeroStrideLoad =
      match(&II, m_Intrinsic<Intrinsic::experimental_vp_strided_load>(
                     m_Value(Addr), m_Zero(), m_AllOnes(), m_Value(EVL)));
  if (!IsZeroStrideLoad)
    return false;

  // With SEW>XLEN a splat is lowered as a zero strided load anyway, so there
  // is nothing to gain from expanding.
  Type *ResultTy = II.getType();
  if (ResultTy->getScalarSizeInBits() > ST->getXLen())
    return false;

  // Only proceed when VL is provably non-zero at this instruction.
  if (!isKnownNonZero(EVL, {*DL, DT, /*AC=*/nullptr, /*CxtI=*/&II}))
    return false;

  auto *VecTy = cast<VectorType>(ResultTy);

  // Emit a scalar load of the element followed by a VP splat that reuses the
  // original third operand and VL.
  IRBuilder<> Builder(&II);
  Value *Scalar = Builder.CreateLoad(VecTy->getElementType(), Addr);
  Value *Splat =
      Builder.CreateIntrinsic(Intrinsic::experimental_vp_splat, {VecTy},
                              {Scalar, II.getOperand(2), EVL});

  II.replaceAllUsesWith(Splat);
  II.eraseFromParent();
  return true;
}


bool RISCVCodeGenPrepare::runOnFunction(Function &F) {
  if (skipFunction(F))
    return false;

  // Refresh the per-function state used by the visitors.
  auto &TM = getAnalysis<TargetPassConfig>().getTM<RISCVTargetMachine>();
  ST = &TM.getSubtarget<RISCVSubtarget>(F);
  DT = &getAnalysis<DominatorTreeWrapperPass>().getDomTree();
  DL = &F.getDataLayout();

  // Visit every instruction. The early-increment range keeps iteration valid
  // when a visitor erases the instruction it was handed.
  bool Changed = false;
  for (auto &Block : F) {
    for (Instruction &Inst : llvm::make_early_inc_range(Block)) {
      if (visit(Inst))
        Changed = true;
    }
  }
  return Changed;
}


// Register the pass and list every analysis requested in getAnalysisUsage()
// as an initialization dependency, so each is registered before this pass.
INITIALIZE_PASS_BEGIN(RISCVCodeGenPrepare, DEBUG_TYPE, PASS_NAME, false, false)
INITIALIZE_PASS_DEPENDENCY(DominatorTreeWrapperPass)
INITIALIZE_PASS_DEPENDENCY(TargetPassConfig)
INITIALIZE_PASS_END(RISCVCodeGenPrepare, DEBUG_TYPE, PASS_NAME, false, false)


// Definition of the static pass ID member that the constructor hands to
// FunctionPass.
char RISCVCodeGenPrepare::ID = 0;


// Factory for the pass: returns a newly heap-allocated RISCVCodeGenPrepare
// instance through its FunctionPass base pointer.
FunctionPass *llvm::createRISCVCodeGenPreparePass() {

  return new RISCVCodeGenPrepare();

}

PHI
Rewrite undef for PHI
Definition: AMDGPURewriteUndefForPHI.cpp:100

DL
MachineBasicBlock MachineBasicBlock::iterator DebugLoc DL
Definition: ARMSLSHardening.cpp:73

Dominators.h

IRBuilder.h

InitializePasses.h

InstVisitor.h

Intrinsics.h

F
#define F(x, y, z)
Definition: MD5.cpp:55

I
#define I(x, y, z)
Definition: MD5.cpp:58

II
uint64_t IntrinsicInst * II
Definition: NVVMIntrRange.cpp:51

INITIALIZE_PASS_DEPENDENCY
#define INITIALIZE_PASS_DEPENDENCY(depName)
Definition: PassSupport.h:55

INITIALIZE_PASS_END
#define INITIALIZE_PASS_END(passName, arg, name, cfg, analysis)
Definition: PassSupport.h:57

INITIALIZE_PASS_BEGIN
#define INITIALIZE_PASS_BEGIN(passName, arg, name, cfg, analysis)
Definition: PassSupport.h:52

Pass.h

PatternMatch.h

PASS_NAME
#define PASS_NAME
Definition: RISCVCodeGenPrepare.cpp:32

DEBUG_TYPE
#define DEBUG_TYPE
Definition: RISCVCodeGenPrepare.cpp:31

RISCVTargetMachine.h

RISCV.h

visit
void visit(MachineFunction &MF, MachineBasicBlock &Start, std::function< void(MachineBasicBlock *)> op)
Definition: SPIRVPostLegalizer.cpp:132

Statistic.h
This file defines the 'Statistic' class, which is designed to be an easy way to expose various metric...

TargetPassConfig.h
Target-Independent Code Generator Pass Configuration Options pass.

PASS_NAME
#define PASS_NAME
Definition: TypePromotion.cpp:43

ValueTracking.h

RHS
Value * RHS
Definition: X86PartialReduction.cpp:74

llvm::AnalysisUsage
Represent the analysis usage information of a pass.
Definition: PassAnalysisSupport.h:47

llvm::AnalysisUsage::addRequired
AnalysisUsage & addRequired()
Definition: PassAnalysisSupport.h:75

llvm::AnalysisUsage::setPreservesCFG
void setPreservesCFG()
This function should be called by the pass, iff they do not:
Definition: Pass.cpp:256

llvm::BinaryOperator
Definition: InstrTypes.h:170

llvm::DataLayout
A parsed version of the target data layout string in and methods for querying it.
Definition: DataLayout.h:63

llvm::DominatorTreeWrapperPass
Legacy analysis pass which computes a DominatorTree.
Definition: Dominators.h:317

llvm::DominatorTree
Concrete subclass of DominatorTreeBase that is used to compute a normal dominator tree.
Definition: Dominators.h:162

llvm::FunctionPass
FunctionPass class - This class is used to implement most global optimizations.
Definition: Pass.h:310

llvm::FunctionPass::runOnFunction
virtual bool runOnFunction(Function &F)=0
runOnFunction - Virtual method overriden by subclasses to do the per-function processing of the pass.

llvm::Function
Definition: Function.h:63

llvm::IRBuilder
This provides a uniform API for creating instructions and inserting them into a basic block: either a...
Definition: IRBuilder.h:2697

llvm::InstVisitor
Base class for instruction visitors.
Definition: InstVisitor.h:78

llvm::InstVisitor::visitIntrinsicInst
RetTy visitIntrinsicInst(IntrinsicInst &I)
Definition: InstVisitor.h:222

llvm::InstVisitor::visitInstruction
void visitInstruction(Instruction &I)
Definition: InstVisitor.h:283

llvm::Instruction
Definition: Instruction.h:68

llvm::IntrinsicInst
A wrapper class for inspecting calls to intrinsic functions.
Definition: IntrinsicInst.h:48

llvm::Pass::getAnalysisUsage
virtual void getAnalysisUsage(AnalysisUsage &) const
getAnalysisUsage - This function should be overriden by passes that need analysis information to do t...
Definition: Pass.cpp:98

llvm::Pass::getPassName
virtual StringRef getPassName() const
getPassName - Return a nice clean name for a pass.
Definition: Pass.cpp:81

llvm::RISCVSubtarget
Definition: RISCVSubtarget.h:78

llvm::RISCVTargetMachine
Definition: RISCVTargetMachine.h:23

llvm::StringRef
StringRef - Represent a constant reference to a string, i.e.
Definition: StringRef.h:51

llvm::TargetPassConfig
Target-Independent Code Generator Pass Configuration Options.
Definition: TargetPassConfig.h:85

llvm::Type
The instances of the Type class are immutable: once they are created, they are never changed.
Definition: Type.h:45

llvm::Type::isIntegerTy
bool isIntegerTy() const
True if this is an instance of IntegerType.
Definition: Type.h:237

llvm::User::setOperand
void setOperand(unsigned i, Value *Val)
Definition: User.h:233

llvm::User::getOperand
Value * getOperand(unsigned i) const
Definition: User.h:228

llvm::Value
LLVM Value Representation.
Definition: Value.h:74

llvm::Value::getType
Type * getType() const
All values are typed, get the type of this value.
Definition: Value.h:255

uint64_t

unsigned

false
Definition: StackSlotColoring.cpp:193

llvm::ARM_MB::ST
@ ST
Definition: ARMBaseInfo.h:73

llvm::CallingConv::C
@ C
The default llvm calling convention, compatible with C.
Definition: CallingConv.h:34

llvm::CallingConv::ID
unsigned ID
LLVM IR allows to use arbitrary numbers as calling convention identifiers.
Definition: CallingConv.h:24

llvm::PatternMatch::m_AllOnes
cst_pred_ty< is_all_ones > m_AllOnes()
Match an integer or vector with all bits set.
Definition: PatternMatch.h:524

llvm::PatternMatch::match
bool match(Val *V, const Pattern &P)
Definition: PatternMatch.h:49

llvm::PatternMatch::m_NNegZExt
NNegZExt_match< OpTy > m_NNegZExt(const OpTy &Op)
Definition: PatternMatch.h:2084

llvm::PatternMatch::m_Value
class_match< Value > m_Value()
Match an arbitrary value and ignore it.
Definition: PatternMatch.h:92

llvm::PatternMatch::m_Zero
is_zero m_Zero()
Match any null constant or a vector with all elements equal to 0.
Definition: PatternMatch.h:612

llvm::SystemZISD::TM
@ TM
Definition: SystemZISelLowering.h:66

llvm::codeview::EncodedFramePtrReg::BasePtr
@ BasePtr

llvm
This is an optimization pass for GlobalISel generic memory operations.
Definition: AddressRanges.h:18

llvm::make_early_inc_range
iterator_range< early_inc_iterator_impl< detail::IterOfRange< RangeT > > > make_early_inc_range(RangeT &&Range)
Make a range that does early increment to allow mutation of the underlying range without disrupting i...
Definition: STLExtras.h:657

llvm::isKnownNonZero
bool isKnownNonZero(const Value *V, const SimplifyQuery &Q, unsigned Depth=0)
Return true if the given value is known to be non-zero when defined.
Definition: ValueTracking.cpp:3390

llvm::createRISCVCodeGenPreparePass
FunctionPass * createRISCVCodeGenPreparePass()
Definition: RISCVCodeGenPrepare.cpp:224

llvm::is_contained
bool is_contained(R &&Range, const E &Element)
Returns true if Element is found in Range.
Definition: STLExtras.h:1903