docs/doxygen/ExpandLargeFpConvert_8cpp_source.html

//===--- ExpandLargeFpConvert.cpp - Expand large fp convert----------------===//

//

// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.

// See https://llvm.org/LICENSE.txt for license information.

// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception

//

//===----------------------------------------------------------------------===//

//


// This pass expands ‘fptoui .. to’, ‘fptosi .. to’, ‘uitofp .. to’,

// ‘sitofp .. to’ instructions with a bitwidth above a threshold into

// auto-generated functions. This is useful for targets like x86_64 that cannot

// lower fp conversions with more than 128 bits.

//

//===----------------------------------------------------------------------===//


#include "llvm/CodeGen/ExpandLargeFpConvert.h"

#include "llvm/ADT/SmallVector.h"

#include "llvm/Analysis/GlobalsModRef.h"

#include "llvm/CodeGen/Passes.h"

#include "llvm/CodeGen/TargetLowering.h"

#include "llvm/CodeGen/TargetPassConfig.h"

#include "llvm/CodeGen/TargetSubtargetInfo.h"

#include "llvm/IR/IRBuilder.h"

#include "llvm/IR/InstIterator.h"

#include "llvm/IR/PassManager.h"

#include "llvm/InitializePasses.h"

#include "llvm/Pass.h"

#include "llvm/Support/CommandLine.h"

#include "llvm/Target/TargetMachine.h"


using namespace llvm;


// Hidden command-line override for the expansion threshold. It defaults to
// IntegerType::MAX_INT_BITS; runImpl() only substitutes it for the target's
// reported maximum when it has been set to a different value.
static cl::opt<unsigned>

    ExpandFpConvertBits("expand-fp-convert-bits", cl::Hidden,

                     cl::init(llvm::IntegerType::MAX_INT_BITS),

                     cl::desc("fp convert instructions on integers with "

                              "more than <N> bits are expanded."));


/// Generate code to convert a fp number to integer, replacing FPToS(U)I with

/// the generated code. This currently generates code similarly to compiler-rt's

/// implementations.

///

/// An example IR generated from compiler-rt/fixsfdi.c looks like below:

/// define dso_local i64 @foo(float noundef %a) local_unnamed_addr #0 {

/// entry:

///   %0 = bitcast float %a to i32

///   %conv.i = zext i32 %0 to i64

///   %tobool.not = icmp sgt i32 %0, -1

///   %conv = select i1 %tobool.not, i64 1, i64 -1

///   %and = lshr i64 %conv.i, 23

///   %shr = and i64 %and, 255

///   %and2 = and i64 %conv.i, 8388607

///   %or = or i64 %and2, 8388608

///   %cmp = icmp ult i64 %shr, 127

///   br i1 %cmp, label %cleanup, label %if.end

///

/// if.end:                                           ; preds = %entry

///   %sub = add nuw nsw i64 %shr, 4294967169

///   %conv5 = and i64 %sub, 4294967232

///   %cmp6.not = icmp eq i64 %conv5, 0

///   br i1 %cmp6.not, label %if.end12, label %if.then8

///

/// if.then8:                                         ; preds = %if.end

///   %cond11 = select i1 %tobool.not, i64 9223372036854775807, i64 -9223372036854775808

///   br label %cleanup

///

/// if.end12:                                         ; preds = %if.end

///   %cmp13 = icmp ult i64 %shr, 150

///   br i1 %cmp13, label %if.then15, label %if.else

///

/// if.then15:                                        ; preds = %if.end12

///   %sub16 = sub nuw nsw i64 150, %shr

///   %shr17 = lshr i64 %or, %sub16

///   %mul = mul nsw i64 %shr17, %conv

///   br label %cleanup

///

/// if.else:                                          ; preds = %if.end12

///   %sub18 = add nsw i64 %shr, -150

///   %shl = shl i64 %or, %sub18

///   %mul19 = mul nsw i64 %shl, %conv

///   br label %cleanup

///

/// cleanup:                                          ; preds = %entry, %if.else, %if.then15, %if.then8

///   %retval.0 = phi i64 [ %cond11, %if.then8 ], [ %mul, %if.then15 ], [ %mul19, %if.else ], [ 0, %entry ]

///   ret i64 %retval.0

/// }

///

/// Replace fp to integer with generated code.

static void expandFPToI(Instruction *FPToI) {
  // Replaces the fptoui/fptosi instruction \p FPToI with an explicit
  // bit-manipulation sequence spread over several new basic blocks, then
  // erases the original instruction.
  IRBuilder<> Builder(FPToI);
  Value *Src = FPToI->getOperand(0);
  Type *SrcTy = Src->getType();
  Type *DstTy = FPToI->getType();
  IntegerType *IntTy = cast<IntegerType>(DstTy);

  const unsigned BitWidth = DstTy->getIntegerBitWidth();
  unsigned FPMantissaWidth = SrcTy->getFPMantissaWidth() - 1;

  // FIXME: half is handled by converting to i32 first and then widening
  // with zext/sext to the requested integer type.
  if (SrcTy->isHalfTy()) {
    Type *I32Ty = Builder.getIntNTy(32);
    Value *Widened;
    if (FPToI->getOpcode() == Instruction::FPToUI)
      Widened = Builder.CreateZExt(Builder.CreateFPToUI(Src, I32Ty), IntTy);
    else // FPToSI
      Widened = Builder.CreateSExt(Builder.CreateFPToSI(Src, I32Ty), IntTy);
    FPToI->replaceAllUsesWith(Widened);
    FPToI->dropAllReferences();
    FPToI->eraseFromParent();
    return;
  }

  // x86_fp80 is extended to fp128 below, so use the fp128 layout for it.
  if (FPMantissaWidth == 63)
    FPMantissaWidth = 112;
  const unsigned FloatWidth = PowerOf2Ceil(SrcTy->getScalarSizeInBits());
  const unsigned ExponentWidth = FloatWidth - FPMantissaWidth - 1;
  const unsigned ExponentBias = (1 << (ExponentWidth - 1)) - 1;

  // Constants expressed in the destination integer type.
  Value *ImplicitBit = Builder.CreateShl(
      Builder.getIntN(BitWidth, 1), Builder.getIntN(BitWidth, FPMantissaWidth));
  Value *SignificandMask =
      Builder.CreateSub(ImplicitBit, Builder.getIntN(BitWidth, 1));
  Value *AllOnes = Builder.CreateSExt(
      ConstantInt::getSigned(Builder.getInt32Ty(), -1), IntTy);
  Value *MinValue =
      Builder.CreateShl(ConstantInt::getSigned(IntTy, 1),
                        ConstantInt::getSigned(IntTy, BitWidth - 1));

  // Split the current block at the conversion and create the new blocks, all
  // placed in front of the continuation block.
  BasicBlock *Entry = Builder.GetInsertBlock();
  Function *F = Entry->getParent();
  Entry->setName(Entry->getName() + "fp-to-i-entry");
  BasicBlock *End =
      Entry->splitBasicBlock(Builder.GetInsertPoint(), "fp-to-i-cleanup");
  auto NewBlock = [&](const char *Name) {
    return BasicBlock::Create(Builder.getContext(), Name, F, End);
  };
  BasicBlock *IfEnd = NewBlock("fp-to-i-if-end");
  BasicBlock *IfThen5 = NewBlock("fp-to-i-if-then5");
  BasicBlock *IfEnd9 = NewBlock("fp-to-i-if-end9");
  BasicBlock *IfThen12 = NewBlock("fp-to-i-if-then12");
  BasicBlock *IfElse = NewBlock("fp-to-i-if-else");

  // splitBasicBlock left a branch in Entry; it is replaced by the conditional
  // branch built below.
  Entry->getTerminator()->eraseFromParent();

  // entry: split the raw bits into sign, biased exponent and significand.
  Builder.SetInsertPoint(Entry);
  Value *WideSrc = Src;
  if (SrcTy->isX86_FP80Ty())
    WideSrc =
        Builder.CreateFPExt(Src, Type::getFP128Ty(Builder.getContext()));
  Value *RawBits =
      Builder.CreateBitCast(WideSrc, Builder.getIntNTy(FloatWidth));
  Value *Bits = Builder.CreateZExt(RawBits, DstTy);
  Value *SignBitClear = Builder.CreateICmpSGT(
      RawBits, ConstantInt::getSigned(Builder.getIntNTy(FloatWidth), -1));
  Value *Sign =
      Builder.CreateSelect(SignBitClear, ConstantInt::getSigned(IntTy, 1),
                           ConstantInt::getSigned(IntTy, -1));
  Value *ShiftedBits =
      Builder.CreateLShr(Bits, Builder.getIntN(BitWidth, FPMantissaWidth));
  Value *BiasedExp = Builder.CreateAnd(
      ShiftedBits, Builder.getIntN(BitWidth, (1 << ExponentWidth) - 1));
  Value *Fraction = Builder.CreateAnd(Bits, SignificandMask);
  Value *Significand = Builder.CreateOr(Fraction, ImplicitBit);
  // A biased exponent below the bias goes straight to the cleanup block,
  // where the phi supplies 0 for this edge.
  Value *ExpBelowBias =
      Builder.CreateICmpULT(BiasedExp, Builder.getIntN(BitWidth, ExponentBias));
  Builder.CreateCondBr(ExpBelowBias, End, IfEnd);

  // if.end: decide whether the value is too large for the destination.
  Builder.SetInsertPoint(IfEnd);
  Value *ExpMinusLimit = Builder.CreateAdd(
      BiasedExp, ConstantInt::getSigned(
                     IntTy, -static_cast<int64_t>(ExponentBias + BitWidth)));
  Value *Overflows = Builder.CreateICmpULT(
      ExpMinusLimit,
      ConstantInt::getSigned(IntTy, -static_cast<int64_t>(BitWidth)));
  Builder.CreateCondBr(Overflows, IfThen5, IfEnd9);

  // if.then5: saturate to the largest or smallest signed value by sign.
  Builder.SetInsertPoint(IfThen5);
  Value *MaxValue = Builder.CreateXor(AllOnes, MinValue);
  Value *Saturated = Builder.CreateSelect(SignBitClear, MaxValue, MinValue);
  Builder.CreateBr(End);

  // if.end9: pick the shift direction for the significand.
  Builder.SetInsertPoint(IfEnd9);
  Value *NeedsRightShift = Builder.CreateICmpULT(
      BiasedExp, Builder.getIntN(BitWidth, ExponentBias + FPMantissaWidth));
  Builder.CreateCondBr(NeedsRightShift, IfThen12, IfElse);

  // if.then12: shift the significand right, then apply the sign.
  Builder.SetInsertPoint(IfThen12);
  Value *RightAmount = Builder.CreateSub(
      Builder.getIntN(BitWidth, ExponentBias + FPMantissaWidth), BiasedExp);
  Value *RightShifted = Builder.CreateLShr(Significand, RightAmount);
  Value *RightResult = Builder.CreateMul(RightShifted, Sign);
  Builder.CreateBr(End);

  // if.else: shift the significand left, then apply the sign.
  Builder.SetInsertPoint(IfElse);
  Value *LeftAmount = Builder.CreateAdd(
      BiasedExp,
      ConstantInt::getSigned(
          IntTy, -static_cast<int64_t>(ExponentBias + FPMantissaWidth)));
  Value *LeftShifted = Builder.CreateShl(Significand, LeftAmount);
  Value *LeftResult = Builder.CreateMul(LeftShifted, Sign);
  Builder.CreateBr(End);

  // cleanup: merge the four possible results.
  Builder.SetInsertPoint(End, End->begin());
  PHINode *Result = Builder.CreatePHI(FPToI->getType(), 4);

  Result->addIncoming(Saturated, IfThen5);
  Result->addIncoming(RightResult, IfThen12);
  Result->addIncoming(LeftResult, IfElse);
  Result->addIncoming(Builder.getIntN(BitWidth, 0), Entry);

  FPToI->replaceAllUsesWith(Result);
  FPToI->dropAllReferences();
  FPToI->eraseFromParent();
}


/// Generate code to convert an integer to a fp number, replacing S(U)IToFP with

/// the generated code. This currently generates code similarly to compiler-rt's

/// implementations. This implementation has an implicit assumption that integer

/// width is larger than fp.

///

/// An example IR generated from compiler-rt/floatdisf.c looks like below:

/// define dso_local float @__floatdisf(i64 noundef %a) local_unnamed_addr #0 {

/// entry:

///   %cmp = icmp eq i64 %a, 0

///   br i1 %cmp, label %return, label %if.end

///

/// if.end:                                           ; preds = %entry

///   %shr = ashr i64 %a, 63

///   %xor = xor i64 %shr, %a

///   %sub = sub nsw i64 %xor, %shr

///   %0 = tail call i64 @llvm.ctlz.i64(i64 %sub, i1 true), !range !5

///   %cast = trunc i64 %0 to i32

///   %sub1 = sub nuw nsw i32 64, %cast

///   %sub2 = xor i32 %cast, 63

///   %cmp3 = icmp ult i32 %cast, 40

///   br i1 %cmp3, label %if.then4, label %if.else

///

/// if.then4:                                         ; preds = %if.end

///   switch i32 %sub1, label %sw.default [

///     i32 25, label %sw.bb

///     i32 26, label %sw.epilog

///   ]

///

/// sw.bb:                                            ; preds = %if.then4

///   %shl = shl i64 %sub, 1

///   br label %sw.epilog

///

/// sw.default:                                       ; preds = %if.then4

///   %sub5 = sub nsw i64 38, %0

///   %sh_prom = and i64 %sub5, 4294967295

///   %shr6 = lshr i64 %sub, %sh_prom

///   %shr9 = lshr i64 274877906943, %0

///   %and = and i64 %shr9, %sub

///   %cmp10 = icmp ne i64 %and, 0

///   %conv11 = zext i1 %cmp10 to i64

///   %or = or i64 %shr6, %conv11

///   br label %sw.epilog

///

/// sw.epilog:                                        ; preds = %sw.default, %if.then4, %sw.bb

///   %a.addr.0 = phi i64 [ %or, %sw.default ], [ %sub, %if.then4 ], [ %shl, %sw.bb ]

///   %1 = lshr i64 %a.addr.0, 2

///   %2 = and i64 %1, 1

///   %or16 = or i64 %2, %a.addr.0

///   %inc = add nsw i64 %or16, 1

///   %3 = and i64 %inc, 67108864

///   %tobool.not = icmp eq i64 %3, 0

///   %spec.select.v = select i1 %tobool.not, i64 2, i64 3

///   %spec.select = ashr i64 %inc, %spec.select.v

///   %spec.select56 = select i1 %tobool.not, i32 %sub2, i32 %sub1

///   br label %if.end26

///

/// if.else:                                          ; preds = %if.end

///   %sub23 = add nuw nsw i64 %0, 4294967256

///   %sh_prom24 = and i64 %sub23, 4294967295

///   %shl25 = shl i64 %sub, %sh_prom24

///   br label %if.end26

///

/// if.end26:                                         ; preds = %sw.epilog, %if.else

///   %a.addr.1 = phi i64 [ %shl25, %if.else ], [ %spec.select, %sw.epilog ]

///   %e.0 = phi i32 [ %sub2, %if.else ], [ %spec.select56, %sw.epilog ]

///   %conv27 = trunc i64 %shr to i32

///   %and28 = and i32 %conv27, -2147483648

///   %add = shl nuw nsw i32 %e.0, 23

///   %shl29 = add nuw nsw i32 %add, 1065353216

///   %conv31 = trunc i64 %a.addr.1 to i32

///   %and32 = and i32 %conv31, 8388607

///   %or30 = or i32 %and32, %and28

///   %or33 = or i32 %or30, %shl29

///   %4 = bitcast i32 %or33 to float

///   br label %return

///

/// return:                                           ; preds = %entry, %if.end26

///   %retval.0 = phi float [ %4, %if.end26 ], [ 0.000000e+00, %entry ]

///   ret float %retval.0

/// }

///

/// Replace integer to fp with generated code.

static void expandIToFP(Instruction *IToFP) {
  // Replaces the uitofp/sitofp instruction \p IToFP with an explicit
  // normalize/round/pack sequence spread over several new basic blocks, then
  // erases the original instruction. The integer operand must be wider than
  // the (power-of-two rounded) floating-point layout used for packing.
  IRBuilder<> Builder(IToFP);
  auto *IntVal = IToFP->getOperand(0);
  IntegerType *IntTy = cast<IntegerType>(IntVal->getType());

  unsigned BitWidth = IntVal->getType()->getIntegerBitWidth();
  unsigned FPMantissaWidth = IToFP->getType()->getFPMantissaWidth() - 1;
  // fp80 conversion is implemented by conversion to fp128 first, followed by
  // a fptrunc to fp80.
  FPMantissaWidth = FPMantissaWidth == 63 ? 112 : FPMantissaWidth;
  // FIXME: As there are no related builtins in compiler-rt, half and bfloat
  // are currently produced by building a float and truncating it.
  FPMantissaWidth = FPMantissaWidth == 10 ? 23 : FPMantissaWidth;
  FPMantissaWidth = FPMantissaWidth == 7 ? 23 : FPMantissaWidth;
  unsigned FloatWidth = PowerOf2Ceil(FPMantissaWidth);
  bool IsSigned = IToFP->getOpcode() == Instruction::SIToFP;

  assert(BitWidth > FloatWidth && "Unexpected conversion. expandIToFP() "
                                  "assumes integer width is larger than fp.");

  // Bit that becomes set in the rounded value when rounding carried out of
  // the mantissa (tested in sw.epilog).
  Value *Temp1 =
      Builder.CreateShl(Builder.getIntN(BitWidth, 1),
                        Builder.getIntN(BitWidth, FPMantissaWidth + 3));

  BasicBlock *Entry = Builder.GetInsertBlock();
  Function *F = Entry->getParent();
  Entry->setName(Twine(Entry->getName(), "itofp-entry"));
  BasicBlock *End =
      Entry->splitBasicBlock(Builder.GetInsertPoint(), "itofp-return");
  BasicBlock *IfEnd =
      BasicBlock::Create(Builder.getContext(), "itofp-if-end", F, End);
  BasicBlock *IfThen4 =
      BasicBlock::Create(Builder.getContext(), "itofp-if-then4", F, End);
  BasicBlock *SwBB =
      BasicBlock::Create(Builder.getContext(), "itofp-sw-bb", F, End);
  BasicBlock *SwDefault =
      BasicBlock::Create(Builder.getContext(), "itofp-sw-default", F, End);
  BasicBlock *SwEpilog =
      BasicBlock::Create(Builder.getContext(), "itofp-sw-epilog", F, End);
  BasicBlock *IfThen20 =
      BasicBlock::Create(Builder.getContext(), "itofp-if-then20", F, End);
  BasicBlock *IfElse =
      BasicBlock::Create(Builder.getContext(), "itofp-if-else", F, End);
  BasicBlock *IfEnd26 =
      BasicBlock::Create(Builder.getContext(), "itofp-if-end26", F, End);

  // splitBasicBlock left a branch in Entry; it is replaced by the conditional
  // branch built below.
  Entry->getTerminator()->eraseFromParent();

  Function *CTLZ =
      Intrinsic::getOrInsertDeclaration(F->getParent(), Intrinsic::ctlz, IntTy);
  ConstantInt *True = Builder.getTrue();

  // entry: a zero input goes straight to the return block (phi supplies +0.0).
  Builder.SetInsertPoint(Entry);
  Value *Cmp = Builder.CreateICmpEQ(IntVal, ConstantInt::getSigned(IntTy, 0));
  Builder.CreateCondBr(Cmp, End, IfEnd);

  // if.end: compute the sign mask (Shr), the magnitude (Sub) and the number
  // of significant bits (Sub1) / the unbiased exponent (Sub2).
  Builder.SetInsertPoint(IfEnd);
  Value *Shr =
      Builder.CreateAShr(IntVal, Builder.getIntN(BitWidth, BitWidth - 1));
  Value *Xor = Builder.CreateXor(Shr, IntVal);
  Value *Sub = Builder.CreateSub(Xor, Shr);
  Value *Call = Builder.CreateCall(CTLZ, {IsSigned ? Sub : IntVal, True});
  Value *Cast = Builder.CreateTrunc(Call, Builder.getInt32Ty());
  // Bookkeeping arithmetic is done in i32, except for the fp128 layout where
  // it is done in the full integer width.
  int BitWidthNew = FloatWidth == 128 ? BitWidth : 32;
  Value *Sub1 = Builder.CreateSub(Builder.getIntN(BitWidthNew, BitWidth),
                                  FloatWidth == 128 ? Call : Cast);
  Value *Sub2 = Builder.CreateSub(Builder.getIntN(BitWidthNew, BitWidth - 1),
                                  FloatWidth == 128 ? Call : Cast);
  Value *Cmp3 = Builder.CreateICmpSGT(
      Sub1, Builder.getIntN(BitWidthNew, FPMantissaWidth + 1));
  Builder.CreateCondBr(Cmp3, IfThen4, IfElse);

  // if.then4: more significant bits than the mantissa holds; dispatch on the
  // exact count to position the value for rounding.
  Builder.SetInsertPoint(IfThen4);
  llvm::SwitchInst *SI = Builder.CreateSwitch(Sub1, SwDefault);
  SI->addCase(Builder.getIntN(BitWidthNew, FPMantissaWidth + 2), SwBB);
  SI->addCase(Builder.getIntN(BitWidthNew, FPMantissaWidth + 3), SwEpilog);

  // sw.bb:
  Builder.SetInsertPoint(SwBB);
  Value *Shl =
      Builder.CreateShl(IsSigned ? Sub : IntVal, Builder.getIntN(BitWidth, 1));
  Builder.CreateBr(SwEpilog);

  // sw.default: shift right and fold all shifted-out bits into a sticky bit.
  Builder.SetInsertPoint(SwDefault);
  Value *Sub5 = Builder.CreateSub(
      Builder.getIntN(BitWidthNew, BitWidth - FPMantissaWidth - 3),
      FloatWidth == 128 ? Call : Cast);
  Value *ShProm = Builder.CreateZExt(Sub5, IntTy);
  Value *Shr6 = Builder.CreateLShr(IsSigned ? Sub : IntVal,
                                   FloatWidth == 128 ? Sub5 : ShProm);
  Value *Sub8 =
      Builder.CreateAdd(FloatWidth == 128 ? Call : Cast,
                        Builder.getIntN(BitWidthNew, FPMantissaWidth + 3));
  Value *ShProm9 = Builder.CreateZExt(Sub8, IntTy);
  Value *Shr9 = Builder.CreateLShr(ConstantInt::getSigned(IntTy, -1),
                                   FloatWidth == 128 ? Sub8 : ShProm9);
  Value *And = Builder.CreateAnd(Shr9, IsSigned ? Sub : IntVal);
  Value *Cmp10 = Builder.CreateICmpNE(And, Builder.getIntN(BitWidth, 0));
  Value *Conv11 = Builder.CreateZExt(Cmp10, IntTy);
  Value *Or = Builder.CreateOr(Shr6, Conv11);
  Builder.CreateBr(SwEpilog);

  // sw.epilog: round (or in bit 2, add 1) and check for a carry into Temp1's
  // bit position.
  Builder.SetInsertPoint(SwEpilog);
  PHINode *AAddr0 = Builder.CreatePHI(IntTy, 3);
  AAddr0->addIncoming(Or, SwDefault);
  AAddr0->addIncoming(IsSigned ? Sub : IntVal, IfThen4);
  AAddr0->addIncoming(Shl, SwBB);
  Value *A0 = Builder.CreateTrunc(AAddr0, Builder.getInt32Ty());
  Value *A1 = Builder.CreateLShr(A0, Builder.getIntN(32, 2));
  Value *A2 = Builder.CreateAnd(A1, Builder.getIntN(32, 1));
  Value *Conv16 = Builder.CreateZExt(A2, IntTy);
  Value *Or17 = Builder.CreateOr(AAddr0, Conv16);
  Value *Inc = Builder.CreateAdd(Or17, Builder.getIntN(BitWidth, 1));
  Value *Shr18 = nullptr;
  if (IsSigned)
    Shr18 = Builder.CreateAShr(Inc, Builder.getIntN(BitWidth, 2));
  else
    Shr18 = Builder.CreateLShr(Inc, Builder.getIntN(BitWidth, 2));
  Value *A3 = Builder.CreateAnd(Inc, Temp1, "a3");
  Value *PosOrNeg = Builder.CreateICmpEQ(A3, Builder.getIntN(BitWidth, 0));
  Value *ExtractT60 = Builder.CreateTrunc(Shr18, Builder.getIntNTy(FloatWidth));
  Value *Extract63 = Builder.CreateLShr(Shr18, Builder.getIntN(BitWidth, 32));
  Value *ExtractT64 = nullptr;
  if (FloatWidth > 80)
    ExtractT64 = Builder.CreateTrunc(Sub2, Builder.getInt64Ty());
  else
    ExtractT64 = Builder.CreateTrunc(Extract63, Builder.getInt32Ty());
  Builder.CreateCondBr(PosOrNeg, IfEnd26, IfThen20);

  // if.then20: rounding carried; shift one bit further and use Sub1 as the
  // exponent.
  Builder.SetInsertPoint(IfThen20);
  Value *Shr21 = nullptr;
  if (IsSigned)
    Shr21 = Builder.CreateAShr(Inc, Builder.getIntN(BitWidth, 3));
  else
    Shr21 = Builder.CreateLShr(Inc, Builder.getIntN(BitWidth, 3));
  Value *ExtractT = Builder.CreateTrunc(Shr21, Builder.getIntNTy(FloatWidth));
  Value *Extract = Builder.CreateLShr(Shr21, Builder.getIntN(BitWidth, 32));
  Value *ExtractT62 = nullptr;
  if (FloatWidth > 80)
    ExtractT62 = Builder.CreateTrunc(Sub1, Builder.getIntNTy(64));
  else
    ExtractT62 = Builder.CreateTrunc(Extract, Builder.getIntNTy(32));
  Builder.CreateBr(IfEnd26);

  // if.else: the value fits in the mantissa; shift it left into position.
  Builder.SetInsertPoint(IfElse);
  // The offset must be negated as a signed 64-bit value. Negating the
  // unsigned expression directly yields a positive number close to 2^32,
  // which only happens to truncate correctly for i32; on the fp128 path the
  // constant is wider than 64 bits and would become an out-of-range shift
  // amount.
  Value *Sub24 = Builder.CreateAdd(
      FloatWidth == 128 ? Call : Cast,
      ConstantInt::getSigned(
          Builder.getIntNTy(BitWidthNew),
          -static_cast<int64_t>(BitWidth - FPMantissaWidth - 1)));
  Value *ShProm25 = Builder.CreateZExt(Sub24, IntTy);
  Value *Shl26 = Builder.CreateShl(IsSigned ? Sub : IntVal,
                                   FloatWidth == 128 ? Sub24 : ShProm25);
  Value *ExtractT61 = Builder.CreateTrunc(Shl26, Builder.getIntNTy(FloatWidth));
  Value *Extract65 = Builder.CreateLShr(Shl26, Builder.getIntN(BitWidth, 32));
  Value *ExtractT66 = nullptr;
  if (FloatWidth > 80)
    ExtractT66 = Builder.CreateTrunc(Sub2, Builder.getIntNTy(64));
  else
    ExtractT66 = Builder.CreateTrunc(Extract65, Builder.getInt32Ty());
  Builder.CreateBr(IfEnd26);

  // if.end26: merge the three paths and assemble sign, exponent and mantissa.
  Builder.SetInsertPoint(IfEnd26);
  PHINode *AAddr1Off0 = Builder.CreatePHI(Builder.getIntNTy(FloatWidth), 3);
  AAddr1Off0->addIncoming(ExtractT, IfThen20);
  AAddr1Off0->addIncoming(ExtractT60, SwEpilog);
  AAddr1Off0->addIncoming(ExtractT61, IfElse);
  // For the 64-bit layout this phi carries bits 32.. of the shifted value;
  // for the 128-bit layout it carries the exponent (Sub1/Sub2) as i64.
  PHINode *AAddr1Off32 = nullptr;
  if (FloatWidth > 32) {
    AAddr1Off32 =
        Builder.CreatePHI(Builder.getIntNTy(FloatWidth > 80 ? 64 : 32), 3);
    AAddr1Off32->addIncoming(ExtractT62, IfThen20);
    AAddr1Off32->addIncoming(ExtractT64, SwEpilog);
    AAddr1Off32->addIncoming(ExtractT66, IfElse);
  }
  PHINode *E0 = nullptr;
  if (FloatWidth <= 80) {
    E0 = Builder.CreatePHI(Builder.getIntNTy(BitWidthNew), 3);
    E0->addIncoming(Sub1, IfThen20);
    E0->addIncoming(Sub2, SwEpilog);
    E0->addIncoming(Sub2, IfElse);
  }
  // Sign bit, taken from the arithmetic-shift sign mask.
  Value *And29 = nullptr;
  if (FloatWidth > 80) {
    Value *Temp2 = Builder.CreateShl(Builder.getIntN(BitWidth, 1),
                                     Builder.getIntN(BitWidth, 63));
    And29 = Builder.CreateAnd(Shr, Temp2, "and29");
  } else {
    Value *Conv28 = Builder.CreateTrunc(Shr, Builder.getIntNTy(32));
    And29 = Builder.CreateAnd(
        Conv28, ConstantInt::getSigned(Builder.getIntNTy(32), 0x80000000));
  }
  // Position of the exponent field within the upper word.
  unsigned TempMod = FPMantissaWidth % 32;
  Value *And34 = nullptr;
  Value *Shl30 = nullptr;
  if (FloatWidth > 80) {
    TempMod += 32;
    Value *Add = Builder.CreateShl(AAddr1Off32, Builder.getIntN(64, TempMod));
    Shl30 = Builder.CreateAdd(
        Add,
        Builder.getIntN(64, ((1ull << (62ull - TempMod)) - 1ull) << TempMod));
    And34 = Builder.CreateZExt(Shl30, Builder.getIntNTy(128));
  } else {
    Value *Add = Builder.CreateShl(E0, Builder.getIntN(32, TempMod));
    Shl30 = Builder.CreateAdd(
        Add, Builder.getIntN(32, ((1 << (30 - TempMod)) - 1) << TempMod));
    And34 = Builder.CreateAnd(FloatWidth > 32 ? AAddr1Off32 : AAddr1Off0,
                              Builder.getIntN(32, (1 << TempMod) - 1));
  }
  Value *Or35 = nullptr;
  if (FloatWidth > 80) {
    Value *And29Trunc = Builder.CreateTrunc(And29, Builder.getIntNTy(128));
    Value *Or31 = Builder.CreateOr(And29Trunc, And34);
    // Only a signed conversion may set the sign bit. For uitofp an operand
    // with its top bit set makes And29 non-zero, which would otherwise
    // produce a negative result. This mirrors the IsSigned guard in the
    // narrower branch below.
    Value *Or34 =
        Builder.CreateShl(IsSigned ? Or31 : And34, Builder.getIntN(128, 64));
    Value *Temp3 = Builder.CreateShl(Builder.getIntN(128, 1),
                                     Builder.getIntN(128, FPMantissaWidth));
    Value *Temp4 = Builder.CreateSub(Temp3, Builder.getIntN(128, 1));
    Value *A6 = Builder.CreateAnd(AAddr1Off0, Temp4);
    Or35 = Builder.CreateOr(Or34, A6);
  } else {
    Value *Or31 = Builder.CreateOr(And34, And29);
    Or35 = Builder.CreateOr(IsSigned ? Or31 : And34, Shl30);
  }
  // Reinterpret the assembled bits as the requested floating-point type.
  Value *A4 = nullptr;
  if (IToFP->getType()->isDoubleTy()) {
    // Or35 is the upper 32 bits; the lower 32 bits come from AAddr1Off0.
    Value *ZExt1 = Builder.CreateZExt(Or35, Builder.getIntNTy(FloatWidth));
    Value *Shl1 = Builder.CreateShl(ZExt1, Builder.getIntN(FloatWidth, 32));
    Value *And1 =
        Builder.CreateAnd(AAddr1Off0, Builder.getIntN(FloatWidth, 0xFFFFFFFF));
    Value *Or1 = Builder.CreateOr(Shl1, And1);
    A4 = Builder.CreateBitCast(Or1, IToFP->getType());
  } else if (IToFP->getType()->isX86_FP80Ty()) {
    Value *A40 =
        Builder.CreateBitCast(Or35, Type::getFP128Ty(Builder.getContext()));
    A4 = Builder.CreateFPTrunc(A40, IToFP->getType());
  } else if (IToFP->getType()->isHalfTy() || IToFP->getType()->isBFloatTy()) {
    // Workaround for half/bfloat: build a float and truncate it, since there
    // is no floattihf.c in compiler-rt to mirror.
    Value *A40 =
        Builder.CreateBitCast(Or35, Type::getFloatTy(Builder.getContext()));
    A4 = Builder.CreateFPTrunc(A40, IToFP->getType());
  } else // float type
    A4 = Builder.CreateBitCast(Or35, IToFP->getType());
  Builder.CreateBr(End);

  // return:
  Builder.SetInsertPoint(End, End->begin());
  PHINode *Retval0 = Builder.CreatePHI(IToFP->getType(), 2);
  Retval0->addIncoming(A4, IfEnd26);
  Retval0->addIncoming(ConstantFP::getZero(IToFP->getType(), false), Entry);

  IToFP->replaceAllUsesWith(Retval0);
  IToFP->dropAllReferences();
  IToFP->eraseFromParent();
}


static void scalarize(Instruction *I, SmallVectorImpl<Instruction *> &Replace) {
  // Rewrites the fixed-width vector cast \p I as one scalar cast per lane and
  // reassembles the results into a vector. Every scalar cast that
  // materialises as an instruction is appended to \p Replace.
  auto *VecTy = cast<FixedVectorType>(I->getType());
  const Instruction::CastOps Opcode = cast<CastInst>(I)->getOpcode();
  Type *LaneTy = I->getType()->getScalarType();
  Value *Source = I->getOperand(0);

  IRBuilder<> Builder(I);

  Value *Rebuilt = PoisonValue::get(VecTy);
  const unsigned LaneCount = VecTy->getElementCount().getFixedValue();
  for (unsigned Lane = 0; Lane != LaneCount; ++Lane) {
    Value *Element = Builder.CreateExtractElement(Source, Lane);
    Value *ScalarCast = Builder.CreateCast(Opcode, Element, LaneTy);
    Rebuilt = Builder.CreateInsertElement(Rebuilt, ScalarCast, Lane);
    // The builder may hand back a non-instruction value; only instructions
    // are queued.
    if (auto *CastInstr = dyn_cast<Instruction>(ScalarCast))
      Replace.push_back(CastInstr);
  }

  I->replaceAllUsesWith(Rebuilt);
  I->dropAllReferences();
  I->eraseFromParent();
}


static bool runImpl(Function &F, const TargetLowering &TLI) {
  // Expands every fp<->int conversion in \p F whose integer side is wider
  // than the legal maximum. Returns true if the function was changed.
  SmallVector<Instruction *, 4> Replace;
  SmallVector<Instruction *, 4> ReplaceVector;
  bool Modified = false;

  // The target's limit applies unless the command-line option was moved away
  // from its default.
  unsigned MaxLegalFpConvertBitWidth =
      TLI.getMaxLargeFPConvertBitWidthSupported();
  if (ExpandFpConvertBits != llvm::IntegerType::MAX_INT_BITS)
    MaxLegalFpConvertBitWidth = ExpandFpConvertBits;

  // Nothing can exceed the limit, so there is nothing to expand.
  if (MaxLegalFpConvertBitWidth >= llvm::IntegerType::MAX_INT_BITS)
    return false;

  // Collect candidates first; the expansion splits blocks and erases
  // instructions, so it runs after the walk over the function.
  for (auto &I : instructions(F)) {
    // Pick the side of the conversion that carries the integer type.
    Type *IntSideTy = nullptr;
    switch (I.getOpcode()) {
    case Instruction::FPToUI:
    case Instruction::FPToSI:
      IntSideTy = I.getType();
      break;
    case Instruction::UIToFP:
    case Instruction::SIToFP:
      IntSideTy = I.getOperand(0)->getType();
      break;
    default:
      continue;
    }

    Type *OperandTy = I.getOperand(0)->getType();
    // TODO: This pass doesn't handle scalable vectors.
    if (OperandTy->isScalableTy())
      continue;

    auto *IntTy = cast<IntegerType>(IntSideTy->getScalarType());
    if (IntTy->getIntegerBitWidth() <= MaxLegalFpConvertBitWidth)
      continue;

    if (OperandTy->isVectorTy())
      ReplaceVector.push_back(&I);
    else
      Replace.push_back(&I);
    Modified = true;
  }

  // Vector conversions are split into scalar ones, which are appended to
  // Replace.
  while (!ReplaceVector.empty()) {
    Instruction *I = ReplaceVector.pop_back_val();
    scalarize(I, Replace);
  }

  while (!Replace.empty()) {
    Instruction *I = Replace.pop_back_val();
    if (I->getOpcode() == Instruction::FPToUI ||
        I->getOpcode() == Instruction::FPToSI) {
      expandFPToI(I);
    } else {
      expandIToFP(I);
    }
  }

  // Report Modified rather than returning false when Replace is empty:
  // scalarize() has already rewritten the IR even if none of the scalar casts
  // it produced needed queuing.
  return Modified;
}


namespace {

class ExpandLargeFpConvertLegacyPass : public FunctionPass {

public:

  static char ID;


  ExpandLargeFpConvertLegacyPass() : FunctionPass(ID) {

    initializeExpandLargeFpConvertLegacyPassPass(

        *PassRegistry::getPassRegistry());

  }


  bool runOnFunction(Function &F) override {

    auto *TM = &getAnalysis<TargetPassConfig>().getTM<TargetMachine>();

    auto *TLI = TM->getSubtargetImpl(F)->getTargetLowering();

    return runImpl(F, *TLI);

  }


  void getAnalysisUsage(AnalysisUsage &AU) const override {

    AU.addRequired<TargetPassConfig>();

    AU.addPreserved<AAResultsWrapperPass>();

    AU.addPreserved<GlobalsAAWrapperPass>();

  }

};

} // namespace


PreservedAnalyses ExpandLargeFpConvertPass::run(Function &F,
                                                FunctionAnalysisManager &FAM) {
  // New pass-manager entry point. No analysis is reported as preserved when
  // runImpl() changed the function; FAM is not consulted.
  const TargetLowering &Lowering =
      *TM->getSubtargetImpl(F)->getTargetLowering();
  if (runImpl(F, Lowering))
    return PreservedAnalyses::none();
  return PreservedAnalyses::all();
}


// Out-of-class definition of the static ID member that the legacy pass hands
// to the FunctionPass constructor.
char ExpandLargeFpConvertLegacyPass::ID = 0;

// Registration of the legacy pass under the argument string
// "expand-large-fp-convert" with the description "Expand large fp convert".
// No dependency entries are listed between BEGIN and END.
INITIALIZE_PASS_BEGIN(ExpandLargeFpConvertLegacyPass, "expand-large-fp-convert",

                      "Expand large fp convert", false, false)

INITIALIZE_PASS_END(ExpandLargeFpConvertLegacyPass, "expand-large-fp-convert",

                    "Expand large fp convert", false, false)


// Factory for the legacy pass: returns a newly heap-allocated
// ExpandLargeFpConvertLegacyPass as a raw FunctionPass pointer.
FunctionPass *llvm::createExpandLargeFpConvertPass() {

  return new ExpandLargeFpConvertLegacyPass();

}

instructions
Expand Atomic instructions
Definition: AtomicExpandPass.cpp:172

Passes.h

CommandLine.h

Idx
Returns the sub type a function will return at a given Idx Should correspond to the result type of an ExtractValue instruction executed with just that one unsigned Idx
Definition: DeadArgumentElimination.cpp:353

End
bool End
Definition: ELF_riscv.cpp:480

runImpl
static bool runImpl(Function &F, const TargetLowering &TLI)
Definition: ExpandLargeDivRem.cpp:79

expandIToFP
static void expandIToFP(Instruction *IToFP)
Generate code to convert a fp number to integer, replacing S(U)IToFP with the generated code.
Definition: ExpandLargeFpConvert.cpp:309

expandFPToI
static void expandFPToI(Instruction *FPToI)
Generate code to convert a fp number to integer, replacing FPToS(U)I with the generated code.
Definition: ExpandLargeFpConvert.cpp:90

scalarize
static void scalarize(Instruction *I, SmallVectorImpl< Instruction * > &Replace)
Definition: ExpandLargeFpConvert.cpp:572

convert
expand large fp convert
Definition: ExpandLargeFpConvert.cpp:702

ExpandFpConvertBits
static cl::opt< unsigned > ExpandFpConvertBits("expand-fp-convert-bits", cl::Hidden, cl::init(llvm::IntegerType::MAX_INT_BITS), cl::desc("fp convert instructions on integers with " "more than <N> bits are expanded."))

runImpl
static bool runImpl(Function &F, const TargetLowering &TLI)
Definition: ExpandLargeFpConvert.cpp:592

ExpandLargeFpConvert.h

expand
static Expected< BitVector > expand(StringRef S, StringRef Original)
Definition: GlobPattern.cpp:21

GlobalsModRef.h
This is the interface for a simple mod/ref and alias analysis over globals.

IRBuilder.h

PassManager.h
This header defines various interfaces for pass management in LLVM.

InitializePasses.h

InstIterator.h

LoopDeletionResult::Modified
@ Modified

F
#define F(x, y, z)
Definition: MD5.cpp:55

I
#define I(x, y, z)
Definition: MD5.cpp:58

FAM
FunctionAnalysisManager FAM
Definition: PassBuilderBindings.cpp:61

INITIALIZE_PASS_END
#define INITIALIZE_PASS_END(passName, arg, name, cfg, analysis)
Definition: PassSupport.h:57

INITIALIZE_PASS_BEGIN
#define INITIALIZE_PASS_BEGIN(passName, arg, name, cfg, analysis)
Definition: PassSupport.h:52

Pass.h

assert
assert(ImpDefSCC.getReg()==AMDGPU::SCC &&ImpDefSCC.isDef())

SmallVector.h
This file defines the SmallVector class.

TargetLowering.h
This file describes how to lower LLVM code to machine code.

TargetPassConfig.h
Target-Independent Code Generator Pass Configuration Options pass.

TargetSubtargetInfo.h

getOpcode
static std::optional< unsigned > getOpcode(ArrayRef< VPValue * > Values)
Returns the opcode of Values or ~0 if they do not all agree.
Definition: VPlanSLP.cpp:191

Mul
BinaryOperator * Mul
Definition: X86PartialReduction.cpp:68

VectorType
Definition: ItaniumDemangle.h:1173

llvm::AAResultsWrapperPass
A wrapper pass to provide the legacy pass manager access to a suitably prepared AAResults object.
Definition: AliasAnalysis.h:975

llvm::AnalysisManager
A container for analyses that lazily runs them and caches their results.
Definition: PassManager.h:253

llvm::AnalysisUsage
Represent the analysis usage information of a pass.
Definition: PassAnalysisSupport.h:47

llvm::AnalysisUsage::addRequired
AnalysisUsage & addRequired()
Definition: PassAnalysisSupport.h:75

llvm::AnalysisUsage::addPreserved
AnalysisUsage & addPreserved()
Add the specified Pass class to the set of analyses preserved by this pass.
Definition: PassAnalysisSupport.h:98

llvm::BasicBlock
LLVM Basic Block Representation.
Definition: BasicBlock.h:61

llvm::BasicBlock::Create
static BasicBlock * Create(LLVMContext &Context, const Twine &Name="", Function *Parent=nullptr, BasicBlock *InsertBefore=nullptr)
Creates a new BasicBlock.
Definition: BasicBlock.h:212

llvm::ConstantFP::getZero
static Constant * getZero(Type *Ty, bool Negative=false)
Definition: Constants.cpp:1057

llvm::ConstantInt
This is the shared class of boolean and integer constants.
Definition: Constants.h:83

llvm::ConstantInt::getSigned
static ConstantInt * getSigned(IntegerType *Ty, int64_t V)
Return a ConstantInt with the specified value for the specified type.
Definition: Constants.h:126

llvm::ExpandLargeFpConvertPass::run
PreservedAnalyses run(Function &F, FunctionAnalysisManager &AM)
Definition: ExpandLargeFpConvert.cpp:692

llvm::FunctionPass
FunctionPass class - This class is used to implement most global optimizations.
Definition: Pass.h:310

llvm::FunctionPass::runOnFunction
virtual bool runOnFunction(Function &F)=0
runOnFunction - Virtual method overridden by subclasses to do the per-function processing of the pass.

llvm::Function
Definition: Function.h:63

llvm::GlobalsAAWrapperPass
Legacy wrapper pass to provide the GlobalsAAResult object.
Definition: GlobalsModRef.h:142

llvm::IRBuilderBase::CreateICmpULT
Value * CreateICmpULT(Value *LHS, Value *RHS, const Twine &Name="")
Definition: IRBuilder.h:2286

llvm::IRBuilderBase::CreateInsertElement
Value * CreateInsertElement(Type *VecTy, Value *NewElt, Value *Idx, const Twine &Name="")
Definition: IRBuilder.h:2511

llvm::IRBuilderBase::CreateExtractElement
Value * CreateExtractElement(Value *Vec, Value *Idx, const Twine &Name="")
Definition: IRBuilder.h:2499

llvm::IRBuilderBase::getIntNTy
IntegerType * getIntNTy(unsigned N)
Fetch the type representing an N-bit integer.
Definition: IRBuilder.h:558

llvm::IRBuilderBase::CreateICmpSGT
Value * CreateICmpSGT(Value *LHS, Value *RHS, const Twine &Name="")
Definition: IRBuilder.h:2294

llvm::IRBuilderBase::CreateFPTrunc
Value * CreateFPTrunc(Value *V, Type *DestTy, const Twine &Name="", MDNode *FPMathTag=nullptr)
Definition: IRBuilder.h:2113

llvm::IRBuilderBase::getTrue
ConstantInt * getTrue()
Get the constant value for i1 true.
Definition: IRBuilder.h:485

llvm::IRBuilderBase::CreateSelect
Value * CreateSelect(Value *C, Value *True, Value *False, const Twine &Name="", Instruction *MDFrom=nullptr)
Definition: IRBuilder.cpp:1053

llvm::IRBuilderBase::CreateFPToUI
Value * CreateFPToUI(Value *V, Type *DestTy, const Twine &Name="")
Definition: IRBuilder.h:2079

llvm::IRBuilderBase::GetInsertPoint
BasicBlock::iterator GetInsertPoint() const
Definition: IRBuilder.h:194

llvm::IRBuilderBase::CreateSExt
Value * CreateSExt(Value *V, Type *DestTy, const Twine &Name="")
Definition: IRBuilder.h:2045

llvm::IRBuilderBase::CreateLShr
Value * CreateLShr(Value *LHS, Value *RHS, const Twine &Name="", bool isExact=false)
Definition: IRBuilder.h:1480

llvm::IRBuilderBase::getInt32Ty
IntegerType * getInt32Ty()
Fetch the type representing a 32-bit integer.
Definition: IRBuilder.h:545

llvm::IRBuilderBase::CreateCast
Value * CreateCast(Instruction::CastOps Op, Value *V, Type *DestTy, const Twine &Name="", MDNode *FPMathTag=nullptr, FMFSource FMFSource={})
Definition: IRBuilder.h:2186

llvm::IRBuilderBase::GetInsertBlock
BasicBlock * GetInsertBlock() const
Definition: IRBuilder.h:193

llvm::IRBuilderBase::getInt64Ty
IntegerType * getInt64Ty()
Fetch the type representing a 64-bit integer.
Definition: IRBuilder.h:550

llvm::IRBuilderBase::CreateICmpNE
Value * CreateICmpNE(Value *LHS, Value *RHS, const Twine &Name="")
Definition: IRBuilder.h:2274

llvm::IRBuilderBase::CreatePHI
PHINode * CreatePHI(Type *Ty, unsigned NumReservedValues, const Twine &Name="")
Definition: IRBuilder.h:2435

llvm::IRBuilderBase::CreateSwitch
SwitchInst * CreateSwitch(Value *V, BasicBlock *Dest, unsigned NumCases=10, MDNode *BranchWeights=nullptr, MDNode *Unpredictable=nullptr)
Create a switch instruction with the specified value, default dest, and with a hint for the number of...
Definition: IRBuilder.h:1187

llvm::IRBuilderBase::CreateICmpEQ
Value * CreateICmpEQ(Value *LHS, Value *RHS, const Twine &Name="")
Definition: IRBuilder.h:2270

llvm::IRBuilderBase::CreateSub
Value * CreateSub(Value *LHS, Value *RHS, const Twine &Name="", bool HasNUW=false, bool HasNSW=false)
Definition: IRBuilder.h:1387

llvm::IRBuilderBase::CreateBitCast
Value * CreateBitCast(Value *V, Type *DestTy, const Twine &Name="")
Definition: IRBuilder.h:2152

llvm::IRBuilderBase::getIntN
ConstantInt * getIntN(unsigned N, uint64_t C)
Get a constant N-bit value, zero extended or truncated from a 64-bit value.
Definition: IRBuilder.h:516

llvm::IRBuilderBase::CreateCondBr
BranchInst * CreateCondBr(Value *Cond, BasicBlock *True, BasicBlock *False, MDNode *BranchWeights=nullptr, MDNode *Unpredictable=nullptr)
Create a conditional 'br Cond, TrueDest, FalseDest' instruction.
Definition: IRBuilder.h:1164

llvm::IRBuilderBase::CreateShl
Value * CreateShl(Value *LHS, Value *RHS, const Twine &Name="", bool HasNUW=false, bool HasNSW=false)
Definition: IRBuilder.h:1459

llvm::IRBuilderBase::CreateZExt
Value * CreateZExt(Value *V, Type *DestTy, const Twine &Name="", bool IsNonNeg=false)
Definition: IRBuilder.h:2033

llvm::IRBuilderBase::getContext
LLVMContext & getContext() const
Definition: IRBuilder.h:195

llvm::IRBuilderBase::CreateAnd
Value * CreateAnd(Value *LHS, Value *RHS, const Twine &Name="")
Definition: IRBuilder.h:1518

llvm::IRBuilderBase::CreateAdd
Value * CreateAdd(Value *LHS, Value *RHS, const Twine &Name="", bool HasNUW=false, bool HasNSW=false)
Definition: IRBuilder.h:1370

llvm::IRBuilderBase::CreateCall
CallInst * CreateCall(FunctionType *FTy, Value *Callee, ArrayRef< Value * > Args={}, const Twine &Name="", MDNode *FPMathTag=nullptr)
Definition: IRBuilder.h:2449

llvm::IRBuilderBase::CreateTrunc
Value * CreateTrunc(Value *V, Type *DestTy, const Twine &Name="", bool IsNUW=false, bool IsNSW=false)
Definition: IRBuilder.h:2019

llvm::IRBuilderBase::CreateOr
Value * CreateOr(Value *LHS, Value *RHS, const Twine &Name="")
Definition: IRBuilder.h:1540

llvm::IRBuilderBase::CreateBr
BranchInst * CreateBr(BasicBlock *Dest)
Create an unconditional 'br label X' instruction.
Definition: IRBuilder.h:1158

llvm::IRBuilderBase::SetInsertPoint
void SetInsertPoint(BasicBlock *TheBB)
This specifies that created instructions should be appended to the end of the specified block.
Definition: IRBuilder.h:199

llvm::IRBuilderBase::CreateFPExt
Value * CreateFPExt(Value *V, Type *DestTy, const Twine &Name="", MDNode *FPMathTag=nullptr)
Definition: IRBuilder.h:2128

llvm::IRBuilderBase::CreateAShr
Value * CreateAShr(Value *LHS, Value *RHS, const Twine &Name="", bool isExact=false)
Definition: IRBuilder.h:1499

llvm::IRBuilderBase::CreateXor
Value * CreateXor(Value *LHS, Value *RHS, const Twine &Name="")
Definition: IRBuilder.h:1562

llvm::IRBuilderBase::CreateMul
Value * CreateMul(Value *LHS, Value *RHS, const Twine &Name="", bool HasNUW=false, bool HasNSW=false)
Definition: IRBuilder.h:1404

llvm::IRBuilderBase::CreateFPToSI
Value * CreateFPToSI(Value *V, Type *DestTy, const Twine &Name="")
Definition: IRBuilder.h:2086

llvm::IRBuilder
This provides a uniform API for creating instructions and inserting them into a basic block: either a...
Definition: IRBuilder.h:2705

llvm::Instruction
Definition: Instruction.h:68

llvm::Instruction::eraseFromParent
InstListType::iterator eraseFromParent()
This method unlinks 'this' from the containing basic block and deletes it.
Definition: Instruction.cpp:94

llvm::Instruction::getOpcode
unsigned getOpcode() const
Returns a member of one of the enums like Instruction::Add.
Definition: Instruction.h:274

llvm::IntegerType
Class to represent integer types.
Definition: DerivedTypes.h:42

llvm::IntegerType::MAX_INT_BITS
@ MAX_INT_BITS
Maximum number of bits that can be specified.
Definition: DerivedTypes.h:54

llvm::PHINode
Definition: Instructions.h:2600

llvm::PHINode::addIncoming
void addIncoming(Value *V, BasicBlock *BB)
Add an incoming value to the end of the PHI list.
Definition: Instructions.h:2735

llvm::PassRegistry::getPassRegistry
static PassRegistry * getPassRegistry()
getPassRegistry - Access the global registry object, which is automatically initialized at applicatio...
Definition: PassRegistry.cpp:24

llvm::Pass::getAnalysisUsage
virtual void getAnalysisUsage(AnalysisUsage &) const
getAnalysisUsage - This function should be overridden by passes that need analysis information to do t...
Definition: Pass.cpp:98

llvm::PoisonValue::get
static PoisonValue * get(Type *T)
Static factory methods - Return a 'poison' object of the specified type.
Definition: Constants.cpp:1878

llvm::PreservedAnalyses
A set of analyses that are preserved following a run of a transformation pass.
Definition: Analysis.h:111

llvm::PreservedAnalyses::none
static PreservedAnalyses none()
Convenience factory function for the empty preserved set.
Definition: Analysis.h:114

llvm::PreservedAnalyses::all
static PreservedAnalyses all()
Construct a special preserved set that preserves all passes.
Definition: Analysis.h:117

llvm::SmallVectorBase::empty
bool empty() const
Definition: SmallVector.h:81

llvm::SmallVectorImpl
This class consists of common code factored out of the SmallVector class to reduce code duplication b...
Definition: SmallVector.h:573

llvm::SmallVectorImpl::pop_back_val
T pop_back_val()
Definition: SmallVector.h:673

llvm::SmallVectorTemplateBase::push_back
void push_back(const T &Elt)
Definition: SmallVector.h:413

llvm::SmallVector
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small.
Definition: SmallVector.h:1196

llvm::SwitchInst
Multiway switch.
Definition: Instructions.h:3154

llvm::TargetLoweringBase::getMaxLargeFPConvertBitWidthSupported
unsigned getMaxLargeFPConvertBitWidthSupported() const
Returns the size in bits of the largest fp convert the backend supports.
Definition: TargetLowering.h:2148

llvm::TargetLowering
This class defines information used to lower LLVM code to legal SelectionDAG operators that the targe...
Definition: TargetLowering.h:3780

llvm::TargetMachine
Primary interface to the complete machine description for the target machine.
Definition: TargetMachine.h:77

llvm::TargetMachine::getSubtargetImpl
virtual const TargetSubtargetInfo * getSubtargetImpl(const Function &) const
Virtual method implemented by subclasses that returns a reference to that target's TargetSubtargetInf...
Definition: TargetMachine.h:133

llvm::TargetPassConfig
Target-Independent Code Generator Pass Configuration Options.
Definition: TargetPassConfig.h:85

llvm::TargetSubtargetInfo
TargetSubtargetInfo - Generic base class for all target subtargets.
Definition: TargetSubtargetInfo.h:63

llvm::TargetSubtargetInfo::getTargetLowering
virtual const TargetLowering * getTargetLowering() const
Definition: TargetSubtargetInfo.h:101

llvm::Twine
Twine - A lightweight data structure for efficiently representing the concatenation of temporary valu...
Definition: Twine.h:81

llvm::Type::getIntegerBitWidth
unsigned getIntegerBitWidth() const

llvm::Type::isX86_FP80Ty
bool isX86_FP80Ty() const
Return true if this is x86 long double.
Definition: Type.h:159

llvm::Type::isBFloatTy
bool isBFloatTy() const
Return true if this is 'bfloat', a 16-bit bfloat type.
Definition: Type.h:145

llvm::Type::getFP128Ty
static Type * getFP128Ty(LLVMContext &C)

llvm::Type::isHalfTy
bool isHalfTy() const
Return true if this is 'half', a 16-bit IEEE fp type.
Definition: Type.h:142

llvm::Type::getFPMantissaWidth
int getFPMantissaWidth() const
Return the width of the mantissa of this type.

llvm::Type::isDoubleTy
bool isDoubleTy() const
Return true if this is 'double', a 64-bit IEEE fp type.
Definition: Type.h:156

llvm::Type::getFloatTy
static Type * getFloatTy(LLVMContext &C)

llvm::User::dropAllReferences
void dropAllReferences()
Drop all references to operands.
Definition: User.h:345

llvm::User::getOperand
Value * getOperand(unsigned i) const
Definition: User.h:228

llvm::Value
LLVM Value Representation.
Definition: Value.h:74

llvm::Value::getType
Type * getType() const
All values are typed, get the type of this value.
Definition: Value.h:255

llvm::Value::replaceAllUsesWith
void replaceAllUsesWith(Value *V)
Change all uses of this to point to a new Value.
Definition: Value.cpp:534

llvm::cl::opt
Definition: CommandLine.h:1423

unsigned

TargetMachine.h

false
Definition: StackSlotColoring.cpp:193

llvm::CallingConv::ID
unsigned ID
LLVM IR allows arbitrary numbers to be used as calling convention identifiers.
Definition: CallingConv.h:24

llvm::Intrinsic::getOrInsertDeclaration
Function * getOrInsertDeclaration(Module *M, ID id, ArrayRef< Type * > Tys={})
Look up the Function declaration of the intrinsic id in the Module M.
Definition: Intrinsics.cpp:731

llvm::SystemZISD::TM
@ TM
Definition: SystemZISelLowering.h:66

llvm::cl::Hidden
@ Hidden
Definition: CommandLine.h:137

llvm::cl::init
initializer< Ty > init(const Ty &Val)
Definition: CommandLine.h:443

llvm
This is an optimization pass for GlobalISel generic memory operations.
Definition: AddressRanges.h:18

llvm::PowerOf2Ceil
uint64_t PowerOf2Ceil(uint64_t A)
Returns the power of two which is greater than or equal to the given value.
Definition: MathExtras.h:396

llvm::createExpandLargeFpConvertPass
FunctionPass * createExpandLargeFpConvertPass()
Definition: ExpandLargeFpConvert.cpp:705

llvm::initializeExpandLargeFpConvertLegacyPassPass
void initializeExpandLargeFpConvertLegacyPassPass(PassRegistry &)

llvm::RecurKind::Or
@ Or
Bitwise or logical OR of integers.

llvm::RecurKind::Xor
@ Xor
Bitwise or logical XOR of integers.

llvm::RecurKind::And
@ And
Bitwise or logical AND of integers.

llvm::RecurKind::Add
@ Add
Sum of integers.

llvm::BitWidth
constexpr unsigned BitWidth
Definition: BitmaskEnum.h:217

llvm::cl::desc
Definition: CommandLine.h:409