doxygen/ExpandLargeDivRem_8cpp_source.html

//===--- ExpandLargeDivRem.cpp - Expand large div/rem ---------------------===//

//

// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.

// See https://llvm.org/LICENSE.txt for license information.

// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception

//

//===----------------------------------------------------------------------===//

//

// This pass expands div/rem instructions with a bitwidth above a threshold

// into a call to auto-generated functions.

// This is useful for targets like x86_64 that cannot lower divisions

// with more than 128 bits or targets like x86_32 that cannot lower divisions

// with more than 64 bits.

//

//===----------------------------------------------------------------------===//


#include "llvm/CodeGen/ExpandLargeDivRem.h"

#include "llvm/ADT/SmallVector.h"

#include "llvm/Analysis/GlobalsModRef.h"

#include "llvm/CodeGen/Passes.h"

#include "llvm/CodeGen/TargetLowering.h"

#include "llvm/CodeGen/TargetPassConfig.h"

#include "llvm/CodeGen/TargetSubtargetInfo.h"

#include "llvm/IR/IRBuilder.h"

#include "llvm/IR/InstIterator.h"

#include "llvm/IR/PassManager.h"

#include "llvm/InitializePasses.h"

#include "llvm/Pass.h"

#include "llvm/Support/CommandLine.h"

#include "llvm/Target/TargetMachine.h"

#include "llvm/Transforms/Utils/IntegerDivision.h"


using namespace llvm;


// Hidden command-line option "expand-div-rem-bits": div/rem instructions on
// integers wider than this many bits are expanded by this pass.
// The default is IntegerType::MAX_INT_BITS; runImpl() only lets this option
// override the target-provided limit when it differs from that default.
static cl::opt<unsigned>

    ExpandDivRemBits("expand-div-rem-bits", cl::Hidden,

                     cl::init(llvm::IntegerType::MAX_INT_BITS),

                     cl::desc("div and rem instructions on integers with "

                              "more than <N> bits are expanded."));


/// Return true if \p V is a ConstantInt whose value is a power of two.
///
/// When \p SignedOp is set and the constant is negative, the negated value is
/// tested instead. Anything that is not a ConstantInt yields false.
static bool isConstantPowerOfTwo(llvm::Value *V, bool SignedOp) {
  if (auto *CI = dyn_cast<ConstantInt>(V)) {
    const APInt &Raw = CI->getValue();
    // For signed operations, look at the negation of a negative divisor.
    if (SignedOp && Raw.isNegative())
      return (-Raw).isPowerOf2();
    return Raw.isPowerOf2();
  }
  return false;
}


/// Return true if \p Opcode is one of the signed division/remainder opcodes
/// (Instruction::SDiv or Instruction::SRem).
static bool isSigned(unsigned int Opcode) {
  switch (Opcode) {
  case Instruction::SDiv:
  case Instruction::SRem:
    return true;
  default:
    return false;
  }
}


/// Replace the fixed-width vector div/rem \p BO with one scalar operation per
/// element and rebuild the vector result from those scalars.
///
/// For each element the two operands are extracted, combined with the same
/// opcode as \p BO, and the scalar result is inserted into the result vector
/// (which starts out as poison). Every scalar operation that is a
/// BinaryOperator is appended to \p Replace so the caller can expand it.
/// \p BO has all its uses replaced and is erased before returning.
///
/// \param BO      Vector binary operator to split; must have FixedVectorType.
/// \param Replace Worklist receiving the newly created scalar operators.
static void scalarize(BinaryOperator *BO,
                      SmallVectorImpl<BinaryOperator *> &Replace) {
  VectorType *VTy = cast<FixedVectorType>(BO->getType());

  // New instructions are inserted right before the vector operation.
  IRBuilder<> Builder(BO);

  unsigned NumElements = VTy->getElementCount().getFixedValue();
  Value *Result = PoisonValue::get(VTy);
  for (unsigned Idx = 0; Idx < NumElements; ++Idx) {
    Value *LHS = Builder.CreateExtractElement(BO->getOperand(0), Idx);
    Value *RHS = Builder.CreateExtractElement(BO->getOperand(1), Idx);
    Value *Op = Builder.CreateBinOp(BO->getOpcode(), LHS, RHS);
    Result = Builder.CreateInsertElement(Result, Op, Idx);
    // CreateBinOp returns a plain Value; only queue it when it really is a
    // BinaryOperator instruction.
    if (auto *NewBO = dyn_cast<BinaryOperator>(Op)) {
      // Propagate the IR flags of the original vector operation to the scalar
      // one. The source must be BO: copying from Op (which is NewBO itself)
      // would be a no-op and silently drop the flags.
      NewBO->copyIRFlags(BO, true);
      Replace.push_back(NewBO);
    }
  }
  BO->replaceAllUsesWith(Result);
  BO->dropAllReferences();
  BO->eraseFromParent();
}


/// Expand every div/rem instruction in \p F whose integer bit width exceeds
/// the supported maximum.
///
/// The limit comes from \p TLI unless the "expand-div-rem-bits" option was
/// given a non-default value. Scalable-vector operations and divisions by a
/// constant power of two are skipped. Fixed-vector operations are scalarized
/// first; the resulting scalar operations are then expanded together with the
/// scalar ones found directly.
///
/// \returns true if the function was changed.
static bool runImpl(Function &F, const TargetLowering &TLI) {
  SmallVector<BinaryOperator *, 4> Replace;
  SmallVector<BinaryOperator *, 4> ReplaceVector;
  bool Modified = false;

  unsigned MaxLegalDivRemBitWidth = TLI.getMaxDivRemBitWidthSupported();
  if (ExpandDivRemBits != llvm::IntegerType::MAX_INT_BITS)
    MaxLegalDivRemBitWidth = ExpandDivRemBits;

  // No integer type can be wider than MAX_INT_BITS, so nothing would qualify.
  if (MaxLegalDivRemBitWidth >= llvm::IntegerType::MAX_INT_BITS)
    return false;

  // Only collect candidates here; the IR is rewritten after the walk so the
  // instruction iterator is never invalidated.
  for (auto &I : instructions(F)) {
    switch (I.getOpcode()) {
    case Instruction::UDiv:
    case Instruction::SDiv:
    case Instruction::URem:
    case Instruction::SRem: {
      // TODO: This pass doesn't handle scalable vectors.
      if (I.getOperand(0)->getType()->isScalableTy())
        continue;

      auto *IntTy = dyn_cast<IntegerType>(I.getType()->getScalarType());
      if (!IntTy || IntTy->getIntegerBitWidth() <= MaxLegalDivRemBitWidth)
        continue;

      // The backend has peephole optimizations for powers of two.
      // TODO: We don't consider vectors here.
      if (isConstantPowerOfTwo(I.getOperand(1), isSigned(I.getOpcode())))
        continue;

      if (I.getOperand(0)->getType()->isVectorTy())
        ReplaceVector.push_back(&cast<BinaryOperator>(I));
      else
        Replace.push_back(&cast<BinaryOperator>(I));
      Modified = true;
      break;
    }
    default:
      break;
    }
  }

  // Split vector operations into scalar ones; this already rewrites the IR
  // and may add new entries to Replace.
  while (!ReplaceVector.empty()) {
    BinaryOperator *BO = ReplaceVector.pop_back_val();
    scalarize(BO, Replace);
  }

  // Deliberately no "return false" when Replace is empty at this point:
  // scalarize() may have erased vector instructions without queueing any
  // scalar BinaryOperator, and that change must still be reported through
  // Modified.
  while (!Replace.empty()) {
    BinaryOperator *I = Replace.pop_back_val();

    if (I->getOpcode() == Instruction::UDiv ||
        I->getOpcode() == Instruction::SDiv) {
      expandDivision(I);
    } else {
      expandRemainder(I);
    }
  }

  return Modified;
}


namespace {

class ExpandLargeDivRemLegacyPass : public FunctionPass {

public:

  static char ID;


  ExpandLargeDivRemLegacyPass() : FunctionPass(ID) {

    initializeExpandLargeDivRemLegacyPassPass(*PassRegistry::getPassRegistry());

  }


  bool runOnFunction(Function &F) override {

    auto *TM = &getAnalysis<TargetPassConfig>().getTM<TargetMachine>();

    auto *TLI = TM->getSubtargetImpl(F)->getTargetLowering();

    return runImpl(F, *TLI);

  }


  void getAnalysisUsage(AnalysisUsage &AU) const override {

    AU.addRequired<TargetPassConfig>();

    AU.addPreserved<AAResultsWrapperPass>();

    AU.addPreserved<GlobalsAAWrapperPass>();

  }

};

} // namespace


/// New pass manager entry point: runs the expansion on \p F and reports no
/// analyses as preserved when runImpl() changed the function, all otherwise.
PreservedAnalyses ExpandLargeDivRemPass::run(Function &F,
                                             FunctionAnalysisManager &FAM) {
  const TargetLowering &Lowering =
      *TM->getSubtargetImpl(F)->getTargetLowering();
  if (!runImpl(F, Lowering))
    return PreservedAnalyses::all();
  return PreservedAnalyses::none();
}


// Definition of the static pass ID member that the legacy pass hands to the
// FunctionPass constructor.
char ExpandLargeDivRemLegacyPass::ID = 0;

// Legacy pass registration under the argument "expand-large-div-rem" with the
// display name "Expand large div/rem"; the two trailing `false` arguments are
// the macro's `cfg` and `analysis` parameters.
// NOTE(review): presumably these macros also define
// initializeExpandLargeDivRemLegacyPassPass(), which the constructor calls --
// confirm against PassSupport.h.
INITIALIZE_PASS_BEGIN(ExpandLargeDivRemLegacyPass, "expand-large-div-rem",

                      "Expand large div/rem", false, false)

INITIALIZE_PASS_END(ExpandLargeDivRemLegacyPass, "expand-large-div-rem",

                    "Expand large div/rem", false, false)


/// Factory for the legacy pass: returns a newly allocated
/// ExpandLargeDivRemLegacyPass. The caller receives the raw pointer
/// (presumably a pass manager takes ownership -- confirm at call sites).
FunctionPass *llvm::createExpandLargeDivRemPass() {
  FunctionPass *LegacyPass = new ExpandLargeDivRemLegacyPass();
  return LegacyPass;
}

instructions
Expand Atomic instructions
Definition: AtomicExpandPass.cpp:172

Passes.h

CommandLine.h

Idx
Returns the sub type a function will return at a given Idx Should correspond to the result type of an ExtractValue instruction executed with just that one unsigned Idx
Definition: DeadArgumentElimination.cpp:353

ExpandDivRemBits
static cl::opt< unsigned > ExpandDivRemBits("expand-div-rem-bits", cl::Hidden, cl::init(llvm::IntegerType::MAX_INT_BITS), cl::desc("div and rem instructions on integers with " "more than <N> bits are expanded."))

isSigned
static bool isSigned(unsigned int Opcode)
Definition: ExpandLargeDivRem.cpp:52

scalarize
static void scalarize(BinaryOperator *BO, SmallVectorImpl< BinaryOperator * > &Replace)
Definition: ExpandLargeDivRem.cpp:56

rem
expand large div rem
Definition: ExpandLargeDivRem.cpp:177

runImpl
static bool runImpl(Function &F, const TargetLowering &TLI)
Definition: ExpandLargeDivRem.cpp:79

isConstantPowerOfTwo
static bool isConstantPowerOfTwo(llvm::Value *V, bool SignedOp)
Definition: ExpandLargeDivRem.cpp:41

ExpandLargeDivRem.h

expand
static Expected< BitVector > expand(StringRef S, StringRef Original)
Definition: GlobPattern.cpp:21

GlobalsModRef.h
This is the interface for a simple mod/ref and alias analysis over globals.

IRBuilder.h

PassManager.h
This header defines various interfaces for pass management in LLVM.

InitializePasses.h

InstIterator.h

IntegerDivision.h

LoopDeletionResult::Modified
@ Modified

F
#define F(x, y, z)
Definition: MD5.cpp:55

I
#define I(x, y, z)
Definition: MD5.cpp:58

FAM
FunctionAnalysisManager FAM
Definition: PassBuilderBindings.cpp:61

INITIALIZE_PASS_END
#define INITIALIZE_PASS_END(passName, arg, name, cfg, analysis)
Definition: PassSupport.h:57

INITIALIZE_PASS_BEGIN
#define INITIALIZE_PASS_BEGIN(passName, arg, name, cfg, analysis)
Definition: PassSupport.h:52

Pass.h

SmallVector.h
This file defines the SmallVector class.

TargetLowering.h
This file describes how to lower LLVM code to machine code.

TargetPassConfig.h
Target-Independent Code Generator Pass Configuration Options pass.

TargetSubtargetInfo.h

RHS
Value * RHS
Definition: X86PartialReduction.cpp:74

LHS
Value * LHS
Definition: X86PartialReduction.cpp:73

VectorType
Definition: ItaniumDemangle.h:1173

llvm::AAResultsWrapperPass
A wrapper pass to provide the legacy pass manager access to a suitably prepared AAResults object.
Definition: AliasAnalysis.h:981

llvm::APInt
Class for arbitrary precision integers.
Definition: APInt.h:78

llvm::APInt::isNegative
bool isNegative() const
Determine sign of this APInt.
Definition: APInt.h:329

llvm::APInt::isPowerOf2
bool isPowerOf2() const
Check if this APInt's value is a power of two greater than zero.
Definition: APInt.h:440

llvm::AnalysisManager
A container for analyses that lazily runs them and caches their results.
Definition: PassManager.h:253

llvm::AnalysisUsage
Represent the analysis usage information of a pass.
Definition: PassAnalysisSupport.h:47

llvm::AnalysisUsage::addRequired
AnalysisUsage & addRequired()
Definition: PassAnalysisSupport.h:75

llvm::AnalysisUsage::addPreserved
AnalysisUsage & addPreserved()
Add the specified Pass class to the set of analyses preserved by this pass.
Definition: PassAnalysisSupport.h:98

llvm::BinaryOperator
Definition: InstrTypes.h:170

llvm::BinaryOperator::getOpcode
BinaryOps getOpcode() const
Definition: InstrTypes.h:370

llvm::DWARFExpression::Operation
This class represents an Operation in the Expression.
Definition: DWARFExpression.h:32

llvm::ExpandLargeDivRemPass::run
PreservedAnalyses run(Function &F, FunctionAnalysisManager &AM)
Definition: ExpandLargeDivRem.cpp:167

llvm::FunctionPass
FunctionPass class - This class is used to implement most global optimizations.
Definition: Pass.h:310

llvm::FunctionPass::runOnFunction
virtual bool runOnFunction(Function &F)=0
runOnFunction - Virtual method overridden by subclasses to do the per-function processing of the pass.

llvm::Function
Definition: Function.h:63

llvm::GlobalsAAWrapperPass
Legacy wrapper pass to provide the GlobalsAAResult object.
Definition: GlobalsModRef.h:142

llvm::IRBuilderBase::CreateInsertElement
Value * CreateInsertElement(Type *VecTy, Value *NewElt, Value *Idx, const Twine &Name="")
Definition: IRBuilder.h:2511

llvm::IRBuilderBase::CreateExtractElement
Value * CreateExtractElement(Value *Vec, Value *Idx, const Twine &Name="")
Definition: IRBuilder.h:2499

llvm::IRBuilderBase::CreateBinOp
Value * CreateBinOp(Instruction::BinaryOps Opc, Value *LHS, Value *RHS, const Twine &Name="", MDNode *FPMathTag=nullptr)
Definition: IRBuilder.h:1671

llvm::IRBuilder
This provides a uniform API for creating instructions and inserting them into a basic block: either a...
Definition: IRBuilder.h:2705

llvm::Instruction::eraseFromParent
InstListType::iterator eraseFromParent()
This method unlinks 'this' from the containing basic block and deletes it.
Definition: Instruction.cpp:94

llvm::IntegerType::MAX_INT_BITS
@ MAX_INT_BITS
Maximum number of bits that can be specified.
Definition: DerivedTypes.h:54

llvm::PassRegistry::getPassRegistry
static PassRegistry * getPassRegistry()
getPassRegistry - Access the global registry object, which is automatically initialized at applicatio...
Definition: PassRegistry.cpp:24

llvm::Pass::getAnalysisUsage
virtual void getAnalysisUsage(AnalysisUsage &) const
getAnalysisUsage - This function should be overridden by passes that need analysis information to do t...
Definition: Pass.cpp:98

llvm::PoisonValue::get
static PoisonValue * get(Type *T)
Static factory methods - Return an 'poison' object of the specified type.
Definition: Constants.cpp:1878

llvm::PreservedAnalyses
A set of analyses that are preserved following a run of a transformation pass.
Definition: Analysis.h:111

llvm::PreservedAnalyses::none
static PreservedAnalyses none()
Convenience factory function for the empty preserved set.
Definition: Analysis.h:114

llvm::PreservedAnalyses::all
static PreservedAnalyses all()
Construct a special preserved set that preserves all passes.
Definition: Analysis.h:117

llvm::SmallVectorBase::empty
bool empty() const
Definition: SmallVector.h:81

llvm::SmallVectorImpl
This class consists of common code factored out of the SmallVector class to reduce code duplication b...
Definition: SmallVector.h:573

llvm::SmallVectorImpl::pop_back_val
T pop_back_val()
Definition: SmallVector.h:673

llvm::SmallVectorTemplateBase::push_back
void push_back(const T &Elt)
Definition: SmallVector.h:413

llvm::SmallVector
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small.
Definition: SmallVector.h:1196

llvm::TargetLoweringBase::getMaxDivRemBitWidthSupported
unsigned getMaxDivRemBitWidthSupported() const
Returns the size in bits of the maximum div/rem the backend supports.
Definition: TargetLowering.h:2142

llvm::TargetLowering
This class defines information used to lower LLVM code to legal SelectionDAG operators that the targe...
Definition: TargetLowering.h:3776

llvm::TargetMachine
Primary interface to the complete machine description for the target machine.
Definition: TargetMachine.h:77

llvm::TargetMachine::getSubtargetImpl
virtual const TargetSubtargetInfo * getSubtargetImpl(const Function &) const
Virtual method implemented by subclasses that returns a reference to that target's TargetSubtargetInf...
Definition: TargetMachine.h:133

llvm::TargetPassConfig
Target-Independent Code Generator Pass Configuration Options.
Definition: TargetPassConfig.h:85

llvm::TargetSubtargetInfo
TargetSubtargetInfo - Generic base class for all target subtargets.
Definition: TargetSubtargetInfo.h:63

llvm::TargetSubtargetInfo::getTargetLowering
virtual const TargetLowering * getTargetLowering() const
Definition: TargetSubtargetInfo.h:101

llvm::User::dropAllReferences
void dropAllReferences()
Drop all references to operands.
Definition: User.h:345

llvm::User::getOperand
Value * getOperand(unsigned i) const
Definition: User.h:228

llvm::Value
LLVM Value Representation.
Definition: Value.h:74

llvm::Value::getType
Type * getType() const
All values are typed, get the type of this value.
Definition: Value.h:255

llvm::Value::replaceAllUsesWith
void replaceAllUsesWith(Value *V)
Change all uses of this to point to a new Value.
Definition: Value.cpp:534

llvm::cl::opt
Definition: CommandLine.h:1423

unsigned

TargetMachine.h

false
Definition: StackSlotColoring.cpp:193

llvm::CallingConv::C
@ C
The default llvm calling convention, compatible with C.
Definition: CallingConv.h:34

llvm::CallingConv::ID
unsigned ID
LLVM IR allows to use arbitrary numbers as calling convention identifiers.
Definition: CallingConv.h:24

llvm::SystemZISD::TM
@ TM
Definition: SystemZISelLowering.h:66

llvm::cl::Hidden
@ Hidden
Definition: CommandLine.h:137

llvm::cl::init
initializer< Ty > init(const Ty &Val)
Definition: CommandLine.h:443

llvm
This is an optimization pass for GlobalISel generic memory operations.
Definition: AddressRanges.h:18

llvm::expandDivision
bool expandDivision(BinaryOperator *Div)
Generate code to divide two integers, replacing Div with the generated code.
Definition: IntegerDivision.cpp:406

llvm::initializeExpandLargeDivRemLegacyPassPass
void initializeExpandLargeDivRemLegacyPassPass(PassRegistry &)

llvm::createExpandLargeDivRemPass
FunctionPass * createExpandLargeDivRemPass()
Definition: ExpandLargeDivRem.cpp:180

llvm::expandRemainder
bool expandRemainder(BinaryOperator *Rem)
Generate code to calculate the remainder of two integers, replacing Rem with the generated code.
Definition: IntegerDivision.cpp:354

llvm::cl::desc
Definition: CommandLine.h:409