doxygen/ExpandLargeFpConvert_8cpp_source.html

//===--- ExpandLargeFpConvert.cpp - Expand large fp convert----------------===//

//

// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.

// See https://llvm.org/LICENSE.txt for license information.

// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception

//

//===----------------------------------------------------------------------===//

//


// This pass expands ‘fptoui .. to’, ‘fptosi .. to’, ‘uitofp .. to’,

// ‘sitofp .. to’ instructions with a bitwidth above a threshold into

// auto-generated functions. This is useful for targets like x86_64 that cannot

// lower fp conversions with more than 128 bits.

//

//===----------------------------------------------------------------------===//


#include "llvm/CodeGen/ExpandLargeFpConvert.h"

#include "llvm/ADT/SmallVector.h"

#include "llvm/ADT/StringExtras.h"

#include "llvm/Analysis/GlobalsModRef.h"

#include "llvm/CodeGen/Passes.h"

#include "llvm/CodeGen/TargetLowering.h"

#include "llvm/CodeGen/TargetPassConfig.h"

#include "llvm/CodeGen/TargetSubtargetInfo.h"

#include "llvm/IR/IRBuilder.h"

#include "llvm/IR/InstIterator.h"

#include "llvm/IR/PassManager.h"

#include "llvm/InitializePasses.h"

#include "llvm/Pass.h"

#include "llvm/Support/CommandLine.h"

#include "llvm/Target/TargetMachine.h"


using namespace llvm;


// Hidden command-line override for the expansion threshold. It defaults to
// IntegerType::MAX_INT_BITS; runImpl() only lets it replace the target's own
// limit when it has been set to something other than that default.
static cl::opt<unsigned> ExpandFpConvertBits(
    "expand-fp-convert-bits", cl::Hidden,
    cl::desc("fp convert instructions on integers with "
             "more than <N> bits are expanded."),
    cl::init(llvm::IntegerType::MAX_INT_BITS));


/// Generate code to convert a fp number to integer, replacing FPToS(U)I with

/// the generated code. This currently generates code similarly to compiler-rt's

/// implementations.

///

/// An example IR generated from compiler-rt/fixsfdi.c looks like below:

/// define dso_local i64 @foo(float noundef %a) local_unnamed_addr #0 {

/// entry:

///   %0 = bitcast float %a to i32

///   %conv.i = zext i32 %0 to i64

///   %tobool.not = icmp sgt i32 %0, -1

///   %conv = select i1 %tobool.not, i64 1, i64 -1

///   %and = lshr i64 %conv.i, 23

///   %shr = and i64 %and, 255

///   %and2 = and i64 %conv.i, 8388607

///   %or = or i64 %and2, 8388608

///   %cmp = icmp ult i64 %shr, 127

///   br i1 %cmp, label %cleanup, label %if.end

///

/// if.end:                                           ; preds = %entry

///   %sub = add nuw nsw i64 %shr, 4294967169

///   %conv5 = and i64 %sub, 4294967232

///   %cmp6.not = icmp eq i64 %conv5, 0

///   br i1 %cmp6.not, label %if.end12, label %if.then8

///

/// if.then8:                                         ; preds = %if.end

///   %cond11 = select i1 %tobool.not, i64 9223372036854775807, i64 -9223372036854775808

///   br label %cleanup

///

/// if.end12:                                         ; preds = %if.end

///   %cmp13 = icmp ult i64 %shr, 150

///   br i1 %cmp13, label %if.then15, label %if.else

///

/// if.then15:                                        ; preds = %if.end12

///   %sub16 = sub nuw nsw i64 150, %shr

///   %shr17 = lshr i64 %or, %sub16

///   %mul = mul nsw i64 %shr17, %conv

///   br label %cleanup

///

/// if.else:                                          ; preds = %if.end12

///   %sub18 = add nsw i64 %shr, -150

///   %shl = shl i64 %or, %sub18

///   %mul19 = mul nsw i64 %shl, %conv

///   br label %cleanup

///

/// cleanup:                                          ; preds = %entry, %if.else, %if.then15, %if.then8

///   %retval.0 = phi i64 [ %cond11, %if.then8 ], [ %mul, %if.then15 ], [ %mul19, %if.else ], [ 0, %entry ]

///   ret i64 %retval.0

/// }

///

/// Replace fp to integer with generated code.

static void expandFPToI(Instruction *FPToI) {

  // Expands a single scalar fptoui/fptosi in place. The block containing
  // FPToI is split at the instruction, five helper blocks are inserted in
  // between, and every use of FPToI is redirected to a PHI at the top of the
  // continuation block. FPToI itself is erased before returning.
  IRBuilder<> Builder(FPToI);

  auto *FloatVal = FPToI->getOperand(0);

  IntegerType *IntTy = cast<IntegerType>(FPToI->getType());


  unsigned BitWidth = FPToI->getType()->getIntegerBitWidth();

  // Number of fraction bits used below as the position of the implicit
  // leading one (presumably getFPMantissaWidth() counts that bit, hence the
  // -1 -- confirm against the Type documentation).
  unsigned FPMantissaWidth = FloatVal->getType()->getFPMantissaWidth() - 1;


  // FIXME: fp16's range is covered by i32. So `fptoi half` can convert

  // to i32 first following a sext/zext to target integer type.

  // Half inputs take a shortcut: convert to i32 with an ordinary
  // fptoui/fptosi, widen with zext/sext to the requested type, and return
  // without building any control flow.
  Value *A1 = nullptr;

  if (FloatVal->getType()->isHalfTy()) {

    if (FPToI->getOpcode() == Instruction::FPToUI) {

      Value *A0 = Builder.CreateFPToUI(FloatVal, Builder.getIntNTy(32));

      A1 = Builder.CreateZExt(A0, IntTy);

    } else { // FPToSI

      Value *A0 = Builder.CreateFPToSI(FloatVal, Builder.getIntNTy(32));

      A1 = Builder.CreateSExt(A0, IntTy);

    }

    FPToI->replaceAllUsesWith(A1);

    FPToI->dropAllReferences();

    FPToI->eraseFromParent();

    return;

  }


  // fp80 conversion is implemented by fpext to fp128 first then do the

  // conversion.

  // A fraction width of 63 identifies x86_fp80 here; it is treated as having
  // the 112-bit fraction of fp128 because the value is fpext'ed below.
  FPMantissaWidth = FPMantissaWidth == 63 ? 112 : FPMantissaWidth;

  // Width of the integer the float is bitcast to (80 is rounded up to 128).
  unsigned FloatWidth =

      PowerOf2Ceil(FloatVal->getType()->getScalarSizeInBits());

  // Whatever is left after the fraction and the sign bit is the exponent.
  unsigned ExponentWidth = FloatWidth - FPMantissaWidth - 1;

  unsigned ExponentBias = (1 << (ExponentWidth - 1)) - 1;

  // ImplicitBit = 1 << FPMantissaWidth, expressed in the result type.
  Value *ImplicitBit = Builder.CreateShl(

      Builder.getIntN(BitWidth, 1), Builder.getIntN(BitWidth, FPMantissaWidth));

  // SignificandMask = ImplicitBit - 1, i.e. all fraction bits set.
  Value *SignificandMask =

      Builder.CreateSub(ImplicitBit, Builder.getIntN(BitWidth, 1));

  // All-ones value of the result type.
  Value *NegOne = Builder.CreateSExt(

      ConstantInt::getSigned(Builder.getInt32Ty(), -1), IntTy);

  // 1 << (BitWidth - 1): only the sign bit set, i.e. the most negative value
  // of the result type. Used as the negative saturation value.
  Value *NegInf =

      Builder.CreateShl(ConstantInt::getSigned(IntTy, 1),

                        ConstantInt::getSigned(IntTy, BitWidth - 1));


  // Split the current block at FPToI. Everything from FPToI onwards moves to
  // "fp-to-i-cleanup"; the new blocks are placed in front of it.
  BasicBlock *Entry = Builder.GetInsertBlock();

  Function *F = Entry->getParent();

  Entry->setName(Twine(Entry->getName(), "fp-to-i-entry"));

  BasicBlock *End =

      Entry->splitBasicBlock(Builder.GetInsertPoint(), "fp-to-i-cleanup");

  BasicBlock *IfEnd =

      BasicBlock::Create(Builder.getContext(), "fp-to-i-if-end", F, End);

  BasicBlock *IfThen5 =

      BasicBlock::Create(Builder.getContext(), "fp-to-i-if-then5", F, End);

  BasicBlock *IfEnd9 =

      BasicBlock::Create(Builder.getContext(), "fp-to-i-if-end9", F, End);

  BasicBlock *IfThen12 =

      BasicBlock::Create(Builder.getContext(), "fp-to-i-if-then12", F, End);

  BasicBlock *IfElse =

      BasicBlock::Create(Builder.getContext(), "fp-to-i-if-else", F, End);


  // Drop the terminator that splitBasicBlock left at the end of Entry; a
  // conditional branch is emitted in its place below.
  Entry->getTerminator()->eraseFromParent();


  // entry:

  Builder.SetInsertPoint(Entry);

  Value *FloatVal0 = FloatVal;

  // fp80 conversion is implemented by fpext to fp128 first then do the

  // conversion.

  if (FloatVal->getType()->isX86_FP80Ty())

    FloatVal0 =

        Builder.CreateFPExt(FloatVal, Type::getFP128Ty(Builder.getContext()));

  // Raw bit pattern of the float, first at its own width (ARep0) and then
  // zero-extended to the result type (ARep).
  Value *ARep0 =

      Builder.CreateBitCast(FloatVal0, Builder.getIntNTy(FloatWidth));

  Value *ARep = Builder.CreateZExt(ARep0, FPToI->getType());

  // True when the sign bit of the float is clear (bit pattern > -1 as signed).
  Value *PosOrNeg = Builder.CreateICmpSGT(

      ARep0, ConstantInt::getSigned(Builder.getIntNTy(FloatWidth), -1));

  // +1 or -1 in the result type; multiplied into the magnitude later.
  Value *Sign = Builder.CreateSelect(PosOrNeg, ConstantInt::getSigned(IntTy, 1),

                                     ConstantInt::getSigned(IntTy, -1));

  // And2 = biased exponent field: shift the fraction away, mask off the sign.
  Value *And =

      Builder.CreateLShr(ARep, Builder.getIntN(BitWidth, FPMantissaWidth));

  Value *And2 = Builder.CreateAnd(

      And, Builder.getIntN(BitWidth, (1 << ExponentWidth) - 1));

  // Or = fraction bits with the implicit leading one put back.
  Value *Abs = Builder.CreateAnd(ARep, SignificandMask);

  Value *Or = Builder.CreateOr(Abs, ImplicitBit);

  // Biased exponent below the bias: jump straight to the cleanup block,
  // where the PHI supplies 0 for the edge coming from Entry.
  Value *Cmp =

      Builder.CreateICmpULT(And2, Builder.getIntN(BitWidth, ExponentBias));

  Builder.CreateCondBr(Cmp, End, IfEnd);


  // if.end:

  Builder.SetInsertPoint(IfEnd);

  // Range check. Add1 = exponent - (bias + BitWidth), computed modulo
  // 2^BitWidth. Since exponent >= bias on this path, the unsigned compare
  // against -BitWidth is true exactly when (exponent - bias) >= BitWidth,
  // in which case the saturating block is taken.
  Value *Add1 = Builder.CreateAdd(

      And2, ConstantInt::getSigned(

                IntTy, -static_cast<int64_t>(ExponentBias + BitWidth)));

  Value *Cmp3 = Builder.CreateICmpULT(

      Add1, ConstantInt::getSigned(IntTy, -static_cast<int64_t>(BitWidth)));

  Builder.CreateCondBr(Cmp3, IfThen5, IfEnd9);


  // if.then5:

  Builder.SetInsertPoint(IfThen5);

  // PosInf = ~NegInf: every bit set except the sign bit. The result is
  // PosInf for a non-negative input and NegInf otherwise.
  Value *PosInf = Builder.CreateXor(NegOne, NegInf);

  Value *Cond8 = Builder.CreateSelect(PosOrNeg, PosInf, NegInf);

  Builder.CreateBr(End);


  // if.end9:

  Builder.SetInsertPoint(IfEnd9);

  // Decide the shift direction: an exponent below bias + FPMantissaWidth
  // means the significand has to be shifted right, otherwise left.
  Value *Cmp10 = Builder.CreateICmpULT(

      And2, Builder.getIntN(BitWidth, ExponentBias + FPMantissaWidth));

  Builder.CreateCondBr(Cmp10, IfThen12, IfElse);


  // if.then12:

  Builder.SetInsertPoint(IfThen12);

  // result = (significand >> (bias + FPMantissaWidth - exponent)) * sign
  Value *Sub13 = Builder.CreateSub(

      Builder.getIntN(BitWidth, ExponentBias + FPMantissaWidth), And2);

  Value *Shr14 = Builder.CreateLShr(Or, Sub13);

  Value *Mul = Builder.CreateMul(Shr14, Sign);

  Builder.CreateBr(End);


  // if.else:

  Builder.SetInsertPoint(IfElse);

  // result = (significand << (exponent - bias - FPMantissaWidth)) * sign
  Value *Sub15 = Builder.CreateAdd(

      And2, ConstantInt::getSigned(

                IntTy, -static_cast<int64_t>(ExponentBias + FPMantissaWidth)));

  Value *Shl = Builder.CreateShl(Or, Sub15);

  Value *Mul16 = Builder.CreateMul(Shl, Sign);

  Builder.CreateBr(End);


  // cleanup:

  // Merge the four possible results at the top of the continuation block.
  Builder.SetInsertPoint(End, End->begin());

  PHINode *Retval0 = Builder.CreatePHI(FPToI->getType(), 4);


  Retval0->addIncoming(Cond8, IfThen5);

  Retval0->addIncoming(Mul, IfThen12);

  Retval0->addIncoming(Mul16, IfElse);

  Retval0->addIncoming(Builder.getIntN(BitWidth, 0), Entry);


  // The original conversion is now dead: forward its uses to the PHI and
  // delete it.
  FPToI->replaceAllUsesWith(Retval0);

  FPToI->dropAllReferences();

  FPToI->eraseFromParent();

}


/// Generate code to convert an integer to a fp number, replacing S(U)IToFP with

/// the generated code. This currently generates code similarly to compiler-rt's

/// implementations. This implementation has an implicit assumption that integer

/// width is larger than fp.

///

/// An example IR generated from compiler-rt/floatdisf.c looks like below:

/// define dso_local float @__floatdisf(i64 noundef %a) local_unnamed_addr #0 {

/// entry:

///   %cmp = icmp eq i64 %a, 0

///   br i1 %cmp, label %return, label %if.end

///

/// if.end:                                           ; preds = %entry

///   %shr = ashr i64 %a, 63

///   %xor = xor i64 %shr, %a

///   %sub = sub nsw i64 %xor, %shr

///   %0 = tail call i64 @llvm.ctlz.i64(i64 %sub, i1 true), !range !5

///   %cast = trunc i64 %0 to i32

///   %sub1 = sub nuw nsw i32 64, %cast

///   %sub2 = xor i32 %cast, 63

///   %cmp3 = icmp ult i32 %cast, 40

///   br i1 %cmp3, label %if.then4, label %if.else

///

/// if.then4:                                         ; preds = %if.end

///   switch i32 %sub1, label %sw.default [

///     i32 25, label %sw.bb

///     i32 26, label %sw.epilog

///   ]

///

/// sw.bb:                                            ; preds = %if.then4

///   %shl = shl i64 %sub, 1

///   br label %sw.epilog

///

/// sw.default:                                       ; preds = %if.then4

///   %sub5 = sub nsw i64 38, %0

///   %sh_prom = and i64 %sub5, 4294967295

///   %shr6 = lshr i64 %sub, %sh_prom

///   %shr9 = lshr i64 274877906943, %0

///   %and = and i64 %shr9, %sub

///   %cmp10 = icmp ne i64 %and, 0

///   %conv11 = zext i1 %cmp10 to i64

///   %or = or i64 %shr6, %conv11

///   br label %sw.epilog

///

/// sw.epilog:                                        ; preds = %sw.default, %if.then4, %sw.bb

///   %a.addr.0 = phi i64 [ %or, %sw.default ], [ %sub, %if.then4 ], [ %shl, %sw.bb ]

///   %1 = lshr i64 %a.addr.0, 2

///   %2 = and i64 %1, 1

///   %or16 = or i64 %2, %a.addr.0

///   %inc = add nsw i64 %or16, 1

///   %3 = and i64 %inc, 67108864

///   %tobool.not = icmp eq i64 %3, 0

///   %spec.select.v = select i1 %tobool.not, i64 2, i64 3

///   %spec.select = ashr i64 %inc, %spec.select.v

///   %spec.select56 = select i1 %tobool.not, i32 %sub2, i32 %sub1

///   br label %if.end26

///

/// if.else:                                          ; preds = %if.end

///   %sub23 = add nuw nsw i64 %0, 4294967256

///   %sh_prom24 = and i64 %sub23, 4294967295

///   %shl25 = shl i64 %sub, %sh_prom24

///   br label %if.end26

///

/// if.end26:                                         ; preds = %sw.epilog, %if.else

///   %a.addr.1 = phi i64 [ %shl25, %if.else ], [ %spec.select, %sw.epilog ]

///   %e.0 = phi i32 [ %sub2, %if.else ], [ %spec.select56, %sw.epilog ]

///   %conv27 = trunc i64 %shr to i32

///   %and28 = and i32 %conv27, -2147483648

///   %add = shl nuw nsw i32 %e.0, 23

///   %shl29 = add nuw nsw i32 %add, 1065353216

///   %conv31 = trunc i64 %a.addr.1 to i32

///   %and32 = and i32 %conv31, 8388607

///   %or30 = or i32 %and32, %and28

///   %or33 = or i32 %or30, %shl29

///   %4 = bitcast i32 %or33 to float

///   br label %return

///

/// return:                                           ; preds = %entry, %if.end26

///   %retval.0 = phi float [ %4, %if.end26 ], [ 0.000000e+00, %entry ]

///   ret float %retval.0

/// }

///

/// Replace integer to fp with generated code.

static void expandIToFP(Instruction *IToFP) {
  // Expands a single scalar uitofp/sitofp in place. The block containing
  // IToFP is split at the instruction, the conversion is built from integer
  // operations spread over eight helper blocks, and every use of IToFP is
  // redirected to a PHI at the top of the continuation block. IToFP itself
  // is erased before returning.
  //
  // The integer operand must be wider than the (power-of-two rounded)
  // floating-point format; this is asserted below.
  IRBuilder<> Builder(IToFP);
  auto *IntVal = IToFP->getOperand(0);
  IntegerType *IntTy = cast<IntegerType>(IntVal->getType());

  unsigned BitWidth = IntVal->getType()->getIntegerBitWidth();
  // Number of fraction bits of the destination format (presumably
  // getFPMantissaWidth() counts the implicit leading bit, hence the -1).
  unsigned FPMantissaWidth = IToFP->getType()->getFPMantissaWidth() - 1;
  // fp80 conversion is implemented by conversion to fp128 first following
  // a fptrunc to fp80.
  FPMantissaWidth = FPMantissaWidth == 63 ? 112 : FPMantissaWidth;
  // FIXME: As there is no related builtins added in compiler-rt,
  // here currently utilized the fp32 <-> fp16 lib calls to implement.
  // Fraction widths 10 and 7 are both handled as 23 bits, i.e. the value is
  // built as a float and fptrunc'ed at the end (see the isHalfTy/isBFloatTy
  // case below).
  FPMantissaWidth = FPMantissaWidth == 10 ? 23 : FPMantissaWidth;
  FPMantissaWidth = FPMantissaWidth == 7 ? 23 : FPMantissaWidth;
  // 23 -> 32, 52 -> 64, 112 -> 128.
  unsigned FloatWidth = PowerOf2Ceil(FPMantissaWidth);
  bool IsSigned = IToFP->getOpcode() == Instruction::SIToFP;

  assert(BitWidth > FloatWidth && "Unexpected conversion. expandIToFP() "
                                  "assumes integer width is larger than fp.");

  // 1 << (FPMantissaWidth + 3): the bit tested after rounding to detect a
  // carry out of the significand.
  Value *Temp1 =
      Builder.CreateShl(Builder.getIntN(BitWidth, 1),
                        Builder.getIntN(BitWidth, FPMantissaWidth + 3));

  // Split the current block at IToFP. Everything from IToFP onwards moves
  // to "itofp-return"; the new blocks are placed in front of it.
  BasicBlock *Entry = Builder.GetInsertBlock();
  Function *F = Entry->getParent();
  Entry->setName(Twine(Entry->getName(), "itofp-entry"));
  BasicBlock *End =
      Entry->splitBasicBlock(Builder.GetInsertPoint(), "itofp-return");
  BasicBlock *IfEnd =
      BasicBlock::Create(Builder.getContext(), "itofp-if-end", F, End);
  BasicBlock *IfThen4 =
      BasicBlock::Create(Builder.getContext(), "itofp-if-then4", F, End);
  BasicBlock *SwBB =
      BasicBlock::Create(Builder.getContext(), "itofp-sw-bb", F, End);
  BasicBlock *SwDefault =
      BasicBlock::Create(Builder.getContext(), "itofp-sw-default", F, End);
  BasicBlock *SwEpilog =
      BasicBlock::Create(Builder.getContext(), "itofp-sw-epilog", F, End);
  BasicBlock *IfThen20 =
      BasicBlock::Create(Builder.getContext(), "itofp-if-then20", F, End);
  BasicBlock *IfElse =
      BasicBlock::Create(Builder.getContext(), "itofp-if-else", F, End);
  BasicBlock *IfEnd26 =
      BasicBlock::Create(Builder.getContext(), "itofp-if-end26", F, End);

  // Drop the terminator that splitBasicBlock left at the end of Entry; a
  // conditional branch is emitted in its place below.
  Entry->getTerminator()->eraseFromParent();

  Function *CTLZ =
      Intrinsic::getDeclaration(F->getParent(), Intrinsic::ctlz, IntTy);
  ConstantInt *True = Builder.getTrue();

  // entry:
  // A zero input goes straight to the return block, where the PHI supplies
  // +0.0 for the edge coming from Entry.
  Builder.SetInsertPoint(Entry);
  Value *Cmp = Builder.CreateICmpEQ(IntVal, ConstantInt::getSigned(IntTy, 0));
  Builder.CreateCondBr(Cmp, End, IfEnd);

  // if.end:
  Builder.SetInsertPoint(IfEnd);
  // Shr is the sign of the input smeared over every bit, and
  // Sub = (IntVal ^ Shr) - Shr is the absolute value. For unsigned
  // conversions IntVal itself is used as the magnitude from here on.
  Value *Shr =
      Builder.CreateAShr(IntVal, Builder.getIntN(BitWidth, BitWidth - 1));
  Value *Xor = Builder.CreateXor(Shr, IntVal);
  Value *Sub = Builder.CreateSub(Xor, Shr);
  Value *Call = Builder.CreateCall(CTLZ, {IsSigned ? Sub : IntVal, True});
  Value *Cast = Builder.CreateTrunc(Call, Builder.getInt32Ty());
  // Exponent arithmetic is done in i32, except on the 128-bit path where it
  // stays in the full integer width (and uses Call instead of Cast).
  int BitWidthNew = FloatWidth == 128 ? BitWidth : 32;
  // Sub1 = BitWidth - ctlz: number of significant bits in the magnitude.
  Value *Sub1 = Builder.CreateSub(Builder.getIntN(BitWidthNew, BitWidth),
                                  FloatWidth == 128 ? Call : Cast);
  // Sub2 = Sub1 - 1: the unbiased exponent.
  Value *Sub2 = Builder.CreateSub(Builder.getIntN(BitWidthNew, BitWidth - 1),
                                  FloatWidth == 128 ? Call : Cast);
  // More significant bits than the significand can hold: rounding needed.
  Value *Cmp3 = Builder.CreateICmpSGT(
      Sub1, Builder.getIntN(BitWidthNew, FPMantissaWidth + 1));
  Builder.CreateCondBr(Cmp3, IfThen4, IfElse);

  // if.then4:
  // Normalise the magnitude to FPMantissaWidth + 3 significant bits: one
  // bit short -> shift left by one (sw.bb), exact -> pass through, anything
  // longer -> shift right with a sticky bit (sw.default).
  Builder.SetInsertPoint(IfThen4);
  llvm::SwitchInst *SI = Builder.CreateSwitch(Sub1, SwDefault);
  SI->addCase(Builder.getIntN(BitWidthNew, FPMantissaWidth + 2), SwBB);
  SI->addCase(Builder.getIntN(BitWidthNew, FPMantissaWidth + 3), SwEpilog);

  // sw.bb:
  Builder.SetInsertPoint(SwBB);
  Value *Shl =
      Builder.CreateShl(IsSigned ? Sub : IntVal, Builder.getIntN(BitWidth, 1));
  Builder.CreateBr(SwEpilog);

  // sw.default:
  Builder.SetInsertPoint(SwDefault);
  // Shr6 = magnitude >> (BitWidth - FPMantissaWidth - 3 - ctlz)
  Value *Sub5 = Builder.CreateSub(
      Builder.getIntN(BitWidthNew, BitWidth - FPMantissaWidth - 3),
      FloatWidth == 128 ? Call : Cast);
  Value *ShProm = Builder.CreateZExt(Sub5, IntTy);
  Value *Shr6 = Builder.CreateLShr(IsSigned ? Sub : IntVal,
                                   FloatWidth == 128 ? Sub5 : ShProm);
  // Shr9 is a mask of the bits shifted out above; if any of them is set in
  // the magnitude, bit 0 of the shifted value is set as a sticky bit.
  Value *Sub8 =
      Builder.CreateAdd(FloatWidth == 128 ? Call : Cast,
                        Builder.getIntN(BitWidthNew, FPMantissaWidth + 3));
  Value *ShProm9 = Builder.CreateZExt(Sub8, IntTy);
  Value *Shr9 = Builder.CreateLShr(ConstantInt::getSigned(IntTy, -1),
                                   FloatWidth == 128 ? Sub8 : ShProm9);
  Value *And = Builder.CreateAnd(Shr9, IsSigned ? Sub : IntVal);
  Value *Cmp10 = Builder.CreateICmpNE(And, Builder.getIntN(BitWidth, 0));
  Value *Conv11 = Builder.CreateZExt(Cmp10, IntTy);
  Value *Or = Builder.CreateOr(Shr6, Conv11);
  Builder.CreateBr(SwEpilog);

  // sw.epilog:
  Builder.SetInsertPoint(SwEpilog);
  PHINode *AAddr0 = Builder.CreatePHI(IntTy, 3);
  AAddr0->addIncoming(Or, SwDefault);
  AAddr0->addIncoming(IsSigned ? Sub : IntVal, IfThen4);
  AAddr0->addIncoming(Shl, SwBB);
  // Rounding step: OR bit 2 of the value into bit 0, add one, and later
  // drop the two low bits.
  Value *A0 = Builder.CreateTrunc(AAddr0, Builder.getInt32Ty());
  Value *A1 = Builder.CreateLShr(A0, Builder.getIntN(32, 2));
  Value *A2 = Builder.CreateAnd(A1, Builder.getIntN(32, 1));
  Value *Conv16 = Builder.CreateZExt(A2, IntTy);
  Value *Or17 = Builder.CreateOr(AAddr0, Conv16);
  Value *Inc = Builder.CreateAdd(Or17, Builder.getIntN(BitWidth, 1));
  Value *Shr18 = nullptr;
  if (IsSigned)
    Shr18 = Builder.CreateAShr(Inc, Builder.getIntN(BitWidth, 2));
  else
    Shr18 = Builder.CreateLShr(Inc, Builder.getIntN(BitWidth, 2));
  // PosOrNeg is true when the increment did NOT carry into bit
  // FPMantissaWidth + 3; in that case Shr18 / Sub2 are final. Otherwise
  // if.then20 shifts by one more bit and uses the larger exponent Sub1.
  Value *A3 = Builder.CreateAnd(Inc, Temp1, "a3");
  Value *PosOrNeg = Builder.CreateICmpEQ(A3, Builder.getIntN(BitWidth, 0));
  // ExtractT60: low FloatWidth bits of the significand. ExtractT64: bits
  // 32.. of the significand (<= 64-bit formats) or the exponent (128-bit).
  Value *ExtractT60 = Builder.CreateTrunc(Shr18, Builder.getIntNTy(FloatWidth));
  Value *Extract63 = Builder.CreateLShr(Shr18, Builder.getIntN(BitWidth, 32));
  Value *ExtractT64 = nullptr;
  if (FloatWidth > 80)
    ExtractT64 = Builder.CreateTrunc(Sub2, Builder.getInt64Ty());
  else
    ExtractT64 = Builder.CreateTrunc(Extract63, Builder.getInt32Ty());
  Builder.CreateCondBr(PosOrNeg, IfEnd26, IfThen20);

  // if.then20
  // Rounding carried out: drop three low bits instead of two.
  Builder.SetInsertPoint(IfThen20);
  Value *Shr21 = nullptr;
  if (IsSigned)
    Shr21 = Builder.CreateAShr(Inc, Builder.getIntN(BitWidth, 3));
  else
    Shr21 = Builder.CreateLShr(Inc, Builder.getIntN(BitWidth, 3));
  Value *ExtractT = Builder.CreateTrunc(Shr21, Builder.getIntNTy(FloatWidth));
  Value *Extract = Builder.CreateLShr(Shr21, Builder.getIntN(BitWidth, 32));
  Value *ExtractT62 = nullptr;
  if (FloatWidth > 80)
    ExtractT62 = Builder.CreateTrunc(Sub1, Builder.getIntNTy(64));
  else
    ExtractT62 = Builder.CreateTrunc(Extract, Builder.getIntNTy(32));
  Builder.CreateBr(IfEnd26);

  // if.else:
  // The magnitude fits in the significand: shift it left so that its top
  // bit lands on the implicit-one position. No rounding is required.
  Builder.SetInsertPoint(IfElse);
  // Shift amount = ctlz - (BitWidth - FPMantissaWidth - 1). The constant
  // must be negated as a signed 64-bit value: negating the `unsigned`
  // expression directly wraps to 2^32 - k, which only happens to be right
  // after truncation to i32. On the 128-bit path the arithmetic is done in
  // the full integer width, where that wrapped value would give an
  // out-of-range shift amount.
  Value *Sub24 = Builder.CreateAdd(
      FloatWidth == 128 ? Call : Cast,
      ConstantInt::getSigned(
          Builder.getIntNTy(BitWidthNew),
          -static_cast<int64_t>(BitWidth - FPMantissaWidth - 1)));
  Value *ShProm25 = Builder.CreateZExt(Sub24, IntTy);
  Value *Shl26 = Builder.CreateShl(IsSigned ? Sub : IntVal,
                                   FloatWidth == 128 ? Sub24 : ShProm25);
  Value *ExtractT61 = Builder.CreateTrunc(Shl26, Builder.getIntNTy(FloatWidth));
  Value *Extract65 = Builder.CreateLShr(Shl26, Builder.getIntN(BitWidth, 32));
  Value *ExtractT66 = nullptr;
  if (FloatWidth > 80)
    ExtractT66 = Builder.CreateTrunc(Sub2, Builder.getIntNTy(64));
  else
    ExtractT66 = Builder.CreateTrunc(Extract65, Builder.getInt32Ty());
  Builder.CreateBr(IfEnd26);

  // if.end26:
  // Assemble sign, exponent and fraction into the bit pattern of the float.
  Builder.SetInsertPoint(IfEnd26);
  // Low FloatWidth bits of the significand from each predecessor.
  PHINode *AAddr1Off0 = Builder.CreatePHI(Builder.getIntNTy(FloatWidth), 3);
  AAddr1Off0->addIncoming(ExtractT, IfThen20);
  AAddr1Off0->addIncoming(ExtractT60, SwEpilog);
  AAddr1Off0->addIncoming(ExtractT61, IfElse);
  // For 64-bit formats: significand bits 32 and up (i32).
  // For 128-bit formats: the unbiased exponent (i64).
  PHINode *AAddr1Off32 = nullptr;
  if (FloatWidth > 32) {
    AAddr1Off32 =
        Builder.CreatePHI(Builder.getIntNTy(FloatWidth > 80 ? 64 : 32), 3);
    AAddr1Off32->addIncoming(ExtractT62, IfThen20);
    AAddr1Off32->addIncoming(ExtractT64, SwEpilog);
    AAddr1Off32->addIncoming(ExtractT66, IfElse);
  }
  // Unbiased exponent for the 32- and 64-bit formats.
  PHINode *E0 = nullptr;
  if (FloatWidth <= 80) {
    E0 = Builder.CreatePHI(Builder.getIntNTy(BitWidthNew), 3);
    E0->addIncoming(Sub1, IfThen20);
    E0->addIncoming(Sub2, SwEpilog);
    E0->addIncoming(Sub2, IfElse);
  }
  // And29: the sign bit, positioned at the top of the upper word (bit 63 of
  // the upper 64 bits for 128-bit formats, bit 31 of an i32 otherwise).
  Value *And29 = nullptr;
  if (FloatWidth > 80) {
    Value *Temp2 = Builder.CreateShl(Builder.getIntN(BitWidth, 1),
                                     Builder.getIntN(BitWidth, 63));
    And29 = Builder.CreateAnd(Shr, Temp2, "and29");
  } else {
    Value *Conv28 = Builder.CreateTrunc(Shr, Builder.getIntNTy(32));
    // 0x80000000 does not fit a signed 32-bit value, so build the mask from
    // its unsigned representation rather than through getSigned().
    And29 = Builder.CreateAnd(Conv28, Builder.getInt32(0x80000000));
  }
  // TempMod: bit position of the exponent field inside the upper word.
  unsigned TempMod = FPMantissaWidth % 32;
  Value *And34 = nullptr;
  Value *Shl30 = nullptr;
  if (FloatWidth > 80) {
    TempMod += 32;
    // (exponent + bias) << TempMod, in the upper 64-bit word.
    Value *Add = Builder.CreateShl(AAddr1Off32, Builder.getIntN(64, TempMod));
    Shl30 = Builder.CreateAdd(
        Add,
        Builder.getIntN(64, ((1ull << (62ull - TempMod)) - 1ull) << TempMod));
    And34 = Builder.CreateZExt(Shl30, Builder.getIntNTy(128));
  } else {
    // Shl30 = (exponent + bias) << TempMod; And34 = fraction bits that share
    // the upper 32-bit word with the exponent.
    Value *Add = Builder.CreateShl(E0, Builder.getIntN(32, TempMod));
    Shl30 = Builder.CreateAdd(
        Add, Builder.getIntN(32, ((1 << (30 - TempMod)) - 1) << TempMod));
    And34 = Builder.CreateAnd(FloatWidth > 32 ? AAddr1Off32 : AAddr1Off0,
                              Builder.getIntN(32, (1 << TempMod) - 1));
  }
  Value *Or35 = nullptr;
  if (FloatWidth > 80) {
    Value *And29Trunc = Builder.CreateTrunc(And29, Builder.getIntNTy(128));
    Value *Or31 = Builder.CreateOr(And29Trunc, And34);
    // Only signed conversions may carry a sign bit. Shr is computed with an
    // arithmetic shift, so for an unsigned input with its top bit set And29
    // would otherwise mark the result negative. This mirrors the IsSigned
    // guard in the <= 64-bit branch below.
    Value *Or34 =
        Builder.CreateShl(IsSigned ? Or31 : And34, Builder.getIntN(128, 64));
    // Low FPMantissaWidth bits of the significand form the fraction.
    Value *Temp3 = Builder.CreateShl(Builder.getIntN(128, 1),
                                     Builder.getIntN(128, FPMantissaWidth));
    Value *Temp4 = Builder.CreateSub(Temp3, Builder.getIntN(128, 1));
    Value *A6 = Builder.CreateAnd(AAddr1Off0, Temp4);
    Or35 = Builder.CreateOr(Or34, A6);
  } else {
    Value *Or31 = Builder.CreateOr(And34, And29);
    Or35 = Builder.CreateOr(IsSigned ? Or31 : And34, Shl30);
  }
  // Reinterpret the assembled bits as the requested floating-point type.
  Value *A4 = nullptr;
  if (IToFP->getType()->isDoubleTy()) {
    // Or35 holds the upper 32 bits; glue it onto the low 32 fraction bits.
    Value *ZExt1 = Builder.CreateZExt(Or35, Builder.getIntNTy(FloatWidth));
    Value *Shl1 = Builder.CreateShl(ZExt1, Builder.getIntN(FloatWidth, 32));
    Value *And1 =
        Builder.CreateAnd(AAddr1Off0, Builder.getIntN(FloatWidth, 0xFFFFFFFF));
    Value *Or1 = Builder.CreateOr(Shl1, And1);
    A4 = Builder.CreateBitCast(Or1, IToFP->getType());
  } else if (IToFP->getType()->isX86_FP80Ty()) {
    // Built as fp128, then truncated to fp80.
    Value *A40 =
        Builder.CreateBitCast(Or35, Type::getFP128Ty(Builder.getContext()));
    A4 = Builder.CreateFPTrunc(A40, IToFP->getType());
  } else if (IToFP->getType()->isHalfTy() || IToFP->getType()->isBFloatTy()) {
    // Deal with "half" situation. This is a workaround since we don't have
    // floattihf.c currently as referring.
    Value *A40 =
        Builder.CreateBitCast(Or35, Type::getFloatTy(Builder.getContext()));
    A4 = Builder.CreateFPTrunc(A40, IToFP->getType());
  } else // float type
    A4 = Builder.CreateBitCast(Or35, IToFP->getType());
  Builder.CreateBr(End);

  // return:
  // Merge the computed value with the +0.0 produced for a zero input.
  Builder.SetInsertPoint(End, End->begin());
  PHINode *Retval0 = Builder.CreatePHI(IToFP->getType(), 2);
  Retval0->addIncoming(A4, IfEnd26);
  Retval0->addIncoming(ConstantFP::getZero(IToFP->getType(), false), Entry);

  // The original conversion is now dead: forward its uses to the PHI and
  // delete it.
  IToFP->replaceAllUsesWith(Retval0);
  IToFP->dropAllReferences();
  IToFP->eraseFromParent();
}


/// Break a fixed-width vector cast \p I into one scalar cast per element and
/// rebuild the vector result with insertelement. Scalar casts that remain
/// instructions (i.e. were not folded away by the builder) are appended to
/// \p Replace so the caller can expand them; \p I itself is erased.
static void scalarize(Instruction *I, SmallVectorImpl<Instruction *> &Replace) {
  VectorType *VecTy = cast<FixedVectorType>(I->getType());
  Type *ElemTy = I->getType()->getScalarType();
  const unsigned LaneCount = VecTy->getElementCount().getFixedValue();

  IRBuilder<> Builder(I);

  // Start from poison and fill in one lane at a time.
  Value *Accum = PoisonValue::get(VecTy);
  for (unsigned Lane = 0; Lane != LaneCount; ++Lane) {
    Value *Elem = Builder.CreateExtractElement(I->getOperand(0), Lane);
    Value *Converted =
        Builder.CreateCast(cast<CastInst>(I)->getOpcode(), Elem, ElemTy);
    Accum = Builder.CreateInsertElement(Accum, Converted, Lane);
    if (auto *ConvertedInst = dyn_cast<Instruction>(Converted))
      Replace.push_back(ConvertedInst);
  }

  I->replaceAllUsesWith(Accum);
  I->dropAllReferences();
  I->eraseFromParent();
}


/// Find every fp<->int conversion in \p F whose integer side is wider than
/// the supported limit and expand it inline.
///
/// The limit comes from \p TLI unless -expand-fp-convert-bits was given a
/// non-default value. Vector conversions are scalarized first; the resulting
/// scalar conversions are then expanded with expandFPToI() / expandIToFP().
/// Conversions on scalable vectors are skipped.
///
/// \returns true if the function was changed.
static bool runImpl(Function &F, const TargetLowering &TLI) {
  SmallVector<Instruction *, 4> Replace;
  SmallVector<Instruction *, 4> ReplaceVector;
  bool Modified = false;

  unsigned MaxLegalFpConvertBitWidth =
      TLI.getMaxLargeFPConvertBitWidthSupported();
  if (ExpandFpConvertBits != llvm::IntegerType::MAX_INT_BITS)
    MaxLegalFpConvertBitWidth = ExpandFpConvertBits;

  // No integer type can exceed MAX_INT_BITS, so nothing would be expanded.
  if (MaxLegalFpConvertBitWidth >= llvm::IntegerType::MAX_INT_BITS)
    return false;

  // Collect first and rewrite afterwards: the expansions split blocks and
  // erase instructions, which must not happen while iterating.
  for (auto &I : instructions(F)) {
    // Pick the integer side of the conversion: the result for fp->int, the
    // operand for int->fp.
    Type *IntSideTy = nullptr;
    switch (I.getOpcode()) {
    case Instruction::FPToUI:
    case Instruction::FPToSI:
      IntSideTy = I.getType();
      break;
    case Instruction::UIToFP:
    case Instruction::SIToFP:
      IntSideTy = I.getOperand(0)->getType();
      break;
    default:
      continue;
    }

    // TODO: This pass doesn't handle scalable vectors.
    if (I.getOperand(0)->getType()->isScalableTy())
      continue;

    // The integer side of these opcodes is always an integer (or vector of
    // integer) type, so use cast<> rather than an unchecked dyn_cast<>.
    auto *IntTy = cast<IntegerType>(IntSideTy->getScalarType());
    if (IntTy->getIntegerBitWidth() <= MaxLegalFpConvertBitWidth)
      continue;

    if (I.getOperand(0)->getType()->isVectorTy())
      ReplaceVector.push_back(&I);
    else
      Replace.push_back(&I);
    Modified = true;
  }

  while (!ReplaceVector.empty()) {
    Instruction *I = ReplaceVector.pop_back_val();
    scalarize(I, Replace);
  }

  // Note: there is deliberately no early "return false" when Replace is
  // empty here. scalarize() has already rewritten the IR at this point, and
  // it only queues scalar casts that are still instructions, so Replace can
  // be empty even though the function changed.
  while (!Replace.empty()) {
    Instruction *I = Replace.pop_back_val();
    if (I->getOpcode() == Instruction::FPToUI ||
        I->getOpcode() == Instruction::FPToSI) {
      expandFPToI(I);
    } else {
      expandIToFP(I);
    }
  }

  return Modified;
}


namespace {

class ExpandLargeFpConvertLegacyPass : public FunctionPass {

public:

  static char ID;


  ExpandLargeFpConvertLegacyPass() : FunctionPass(ID) {

    initializeExpandLargeFpConvertLegacyPassPass(

        *PassRegistry::getPassRegistry());

  }


  bool runOnFunction(Function &F) override {

    auto *TM = &getAnalysis<TargetPassConfig>().getTM<TargetMachine>();

    auto *TLI = TM->getSubtargetImpl(F)->getTargetLowering();

    return runImpl(F, *TLI);

  }


  void getAnalysisUsage(AnalysisUsage &AU) const override {

    AU.addRequired<TargetPassConfig>();

    AU.addPreserved<AAResultsWrapperPass>();

    AU.addPreserved<GlobalsAAWrapperPass>();

  }

};

} // namespace


/// New pass-manager entry point. Runs the expansion with the lowering info
/// of F's subtarget and reports every analysis as invalidated if anything
/// changed, or all as preserved otherwise. \p FAM is not consulted.
PreservedAnalyses ExpandLargeFpConvertPass::run(Function &F,
                                                FunctionAnalysisManager &FAM) {
  const TargetSubtargetInfo *Subtarget = TM->getSubtargetImpl(F);
  const bool Changed = runImpl(F, *Subtarget->getTargetLowering());
  if (!Changed)
    return PreservedAnalyses::all();
  return PreservedAnalyses::none();
}


// Definition of the static ID member that the legacy pass hands to the
// FunctionPass constructor.
char ExpandLargeFpConvertLegacyPass::ID = 0;

// Legacy pass registration boilerplate. The macro arguments are, in order:
// the pass class, the "arg" string "expand-large-fp-convert", the
// descriptive name, and the cfg / analysis flags (both false). No
// dependencies are listed between BEGIN and END.
INITIALIZE_PASS_BEGIN(ExpandLargeFpConvertLegacyPass, "expand-large-fp-convert",

                      "Expand large fp convert", false, false)

INITIALIZE_PASS_END(ExpandLargeFpConvertLegacyPass, "expand-large-fp-convert",

                    "Expand large fp convert", false, false)


/// Factory for the legacy pass-manager version of this pass. Returns a newly
/// heap-allocated ExpandLargeFpConvertLegacyPass.
FunctionPass *llvm::createExpandLargeFpConvertPass() {
  FunctionPass *LegacyPass = new ExpandLargeFpConvertLegacyPass();
  return LegacyPass;
}

instructions
Expand Atomic instructions
Definition: AtomicExpandPass.cpp:171

Passes.h

CommandLine.h

Idx
Returns the sub type a function will return at a given Idx Should correspond to the result type of an ExtractValue instruction executed with just that one unsigned Idx
Definition: DeadArgumentElimination.cpp:354

End
bool End
Definition: ELF_riscv.cpp:480

runImpl
static bool runImpl(Function &F, const TargetLowering &TLI)
Definition: ExpandLargeDivRem.cpp:80

expandIToFP
static void expandIToFP(Instruction *IToFP)
Generate code to convert an integer to a fp number, replacing S(U)IToFP with the generated code.
Definition: ExpandLargeFpConvert.cpp:310

expandFPToI
static void expandFPToI(Instruction *FPToI)
Generate code to convert a fp number to integer, replacing FPToS(U)I with the generated code.
Definition: ExpandLargeFpConvert.cpp:91

scalarize
static void scalarize(Instruction *I, SmallVectorImpl< Instruction * > &Replace)
Definition: ExpandLargeFpConvert.cpp:573

convert
expand large fp convert
Definition: ExpandLargeFpConvert.cpp:703

ExpandFpConvertBits
static cl::opt< unsigned > ExpandFpConvertBits("expand-fp-convert-bits", cl::Hidden, cl::init(llvm::IntegerType::MAX_INT_BITS), cl::desc("fp convert instructions on integers with " "more than <N> bits are expanded."))

runImpl
static bool runImpl(Function &F, const TargetLowering &TLI)
Definition: ExpandLargeFpConvert.cpp:593

ExpandLargeFpConvert.h

expand
static Expected< BitVector > expand(StringRef S, StringRef Original)
Definition: GlobPattern.cpp:21

GlobalsModRef.h
This is the interface for a simple mod/ref and alias analysis over globals.

IRBuilder.h

InitializePasses.h

InstIterator.h

LoopDeletionResult::Modified
@ Modified

F
#define F(x, y, z)
Definition: MD5.cpp:55

I
#define I(x, y, z)
Definition: MD5.cpp:58

FAM
FunctionAnalysisManager FAM
Definition: PassBuilderBindings.cpp:59

TM
const char LLVMTargetMachineRef TM
Definition: PassBuilderBindings.cpp:47

PassManager.h
This header defines various interfaces for pass management in LLVM.

INITIALIZE_PASS_END
#define INITIALIZE_PASS_END(passName, arg, name, cfg, analysis)
Definition: PassSupport.h:59

INITIALIZE_PASS_BEGIN
#define INITIALIZE_PASS_BEGIN(passName, arg, name, cfg, analysis)
Definition: PassSupport.h:52

Pass.h

assert
assert(ImpDefSCC.getReg()==AMDGPU::SCC &&ImpDefSCC.isDef())

SmallVector.h
This file defines the SmallVector class.

StringExtras.h
This file contains some functions that are useful when dealing with strings.

TargetLowering.h
This file describes how to lower LLVM code to machine code.

TargetPassConfig.h
Target-Independent Code Generator Pass Configuration Options pass.

TargetSubtargetInfo.h

getOpcode
static std::optional< unsigned > getOpcode(ArrayRef< VPValue * > Values)
Returns the opcode of Values or ~0 if they do not all agree.
Definition: VPlanSLP.cpp:191

Mul
BinaryOperator * Mul
Definition: X86PartialReduction.cpp:70

VectorType
Definition: ItaniumDemangle.h:1149

llvm::AAResultsWrapperPass
A wrapper pass to provide the legacy pass manager access to a suitably prepared AAResults object.
Definition: AliasAnalysis.h:960

llvm::AnalysisManager
A container for analyses that lazily runs them and caches their results.
Definition: PassManager.h:321

llvm::AnalysisUsage
Represent the analysis usage information of a pass.
Definition: PassAnalysisSupport.h:47

llvm::AnalysisUsage::addRequired
AnalysisUsage & addRequired()
Definition: PassAnalysisSupport.h:75

llvm::AnalysisUsage::addPreserved
AnalysisUsage & addPreserved()
Add the specified Pass class to the set of analyses preserved by this pass.
Definition: PassAnalysisSupport.h:98

llvm::BasicBlock
LLVM Basic Block Representation.
Definition: BasicBlock.h:60

llvm::BasicBlock::Create
static BasicBlock * Create(LLVMContext &Context, const Twine &Name="", Function *Parent=nullptr, BasicBlock *InsertBefore=nullptr)
Creates a new BasicBlock.
Definition: BasicBlock.h:199

llvm::ConstantFP::getZero
static Constant * getZero(Type *Ty, bool Negative=false)
Definition: Constants.cpp:1037

llvm::ConstantInt
This is the shared class of boolean and integer constants.
Definition: Constants.h:80

llvm::ConstantInt::getSigned
static ConstantInt * getSigned(IntegerType *Ty, int64_t V)
Return a ConstantInt with the specified value for the specified type.
Definition: Constants.h:123

llvm::ExpandLargeFpConvertPass::run
PreservedAnalyses run(Function &F, FunctionAnalysisManager &AM)
Definition: ExpandLargeFpConvert.cpp:693

llvm::FunctionPass
FunctionPass class - This class is used to implement most global optimizations.
Definition: Pass.h:311

llvm::FunctionPass::runOnFunction
virtual bool runOnFunction(Function &F)=0
runOnFunction - Virtual method overridden by subclasses to do the per-function processing of the pass.

llvm::Function
Definition: Function.h:63

llvm::GlobalsAAWrapperPass
Legacy wrapper pass to provide the GlobalsAAResult object.
Definition: GlobalsModRef.h:142

llvm::IRBuilderBase::CreateICmpULT
Value * CreateICmpULT(Value *LHS, Value *RHS, const Twine &Name="")
Definition: IRBuilder.h:2257

llvm::IRBuilderBase::CreateInsertElement
Value * CreateInsertElement(Type *VecTy, Value *NewElt, Value *Idx, const Twine &Name="")
Definition: IRBuilder.h:2472

llvm::IRBuilderBase::CreateExtractElement
Value * CreateExtractElement(Value *Vec, Value *Idx, const Twine &Name="")
Definition: IRBuilder.h:2460

llvm::IRBuilderBase::getIntNTy
IntegerType * getIntNTy(unsigned N)
Fetch the type representing an N-bit integer.
Definition: IRBuilder.h:539

llvm::IRBuilderBase::CreateICmpSGT
Value * CreateICmpSGT(Value *LHS, Value *RHS, const Twine &Name="")
Definition: IRBuilder.h:2265

llvm::IRBuilderBase::CreateFPTrunc
Value * CreateFPTrunc(Value *V, Type *DestTy, const Twine &Name="")
Definition: IRBuilder.h:2101

llvm::IRBuilderBase::getTrue
ConstantInt * getTrue()
Get the constant value for i1 true.
Definition: IRBuilder.h:466

llvm::IRBuilderBase::CreateSelect
Value * CreateSelect(Value *C, Value *True, Value *False, const Twine &Name="", Instruction *MDFrom=nullptr)
Definition: IRBuilder.cpp:1110

llvm::IRBuilderBase::CreateFPToUI
Value * CreateFPToUI(Value *V, Type *DestTy, const Twine &Name="")
Definition: IRBuilder.h:2067

llvm::IRBuilderBase::GetInsertPoint
BasicBlock::iterator GetInsertPoint() const
Definition: IRBuilder.h:175

llvm::IRBuilderBase::CreateSExt
Value * CreateSExt(Value *V, Type *DestTy, const Twine &Name="")
Definition: IRBuilder.h:2033

llvm::IRBuilderBase::CreateLShr
Value * CreateLShr(Value *LHS, Value *RHS, const Twine &Name="", bool isExact=false)
Definition: IRBuilder.h:1437

llvm::IRBuilderBase::getInt32Ty
IntegerType * getInt32Ty()
Fetch the type representing a 32-bit integer.
Definition: IRBuilder.h:526

llvm::IRBuilderBase::GetInsertBlock
BasicBlock * GetInsertBlock() const
Definition: IRBuilder.h:174

llvm::IRBuilderBase::getInt64Ty
IntegerType * getInt64Ty()
Fetch the type representing a 64-bit integer.
Definition: IRBuilder.h:531

llvm::IRBuilderBase::CreateICmpNE
Value * CreateICmpNE(Value *LHS, Value *RHS, const Twine &Name="")
Definition: IRBuilder.h:2245

llvm::IRBuilderBase::CreatePHI
PHINode * CreatePHI(Type *Ty, unsigned NumReservedValues, const Twine &Name="")
Definition: IRBuilder.h:2397

llvm::IRBuilderBase::CreateSwitch
SwitchInst * CreateSwitch(Value *V, BasicBlock *Dest, unsigned NumCases=10, MDNode *BranchWeights=nullptr, MDNode *Unpredictable=nullptr)
Create a switch instruction with the specified value, default dest, and with a hint for the number of...
Definition: IRBuilder.h:1143

llvm::IRBuilderBase::CreateICmpEQ
Value * CreateICmpEQ(Value *LHS, Value *RHS, const Twine &Name="")
Definition: IRBuilder.h:2241

llvm::IRBuilderBase::CreateSub
Value * CreateSub(Value *LHS, Value *RHS, const Twine &Name="", bool HasNUW=false, bool HasNSW=false)
Definition: IRBuilder.h:1344

llvm::IRBuilderBase::CreateBitCast
Value * CreateBitCast(Value *V, Type *DestTy, const Twine &Name="")
Definition: IRBuilder.h:2127

llvm::IRBuilderBase::getIntN
ConstantInt * getIntN(unsigned N, uint64_t C)
Get a constant N-bit value, zero extended or truncated from a 64-bit value.
Definition: IRBuilder.h:497

llvm::IRBuilderBase::CreateCondBr
BranchInst * CreateCondBr(Value *Cond, BasicBlock *True, BasicBlock *False, MDNode *BranchWeights=nullptr, MDNode *Unpredictable=nullptr)
Create a conditional 'br Cond, TrueDest, FalseDest' instruction.
Definition: IRBuilder.h:1120

llvm::IRBuilderBase::CreateShl
Value * CreateShl(Value *LHS, Value *RHS, const Twine &Name="", bool HasNUW=false, bool HasNSW=false)
Definition: IRBuilder.h:1416

llvm::IRBuilderBase::CreateZExt
Value * CreateZExt(Value *V, Type *DestTy, const Twine &Name="", bool IsNonNeg=false)
Definition: IRBuilder.h:2021

llvm::IRBuilderBase::getContext
LLVMContext & getContext() const
Definition: IRBuilder.h:176

llvm::IRBuilderBase::CreateAnd
Value * CreateAnd(Value *LHS, Value *RHS, const Twine &Name="")
Definition: IRBuilder.h:1475

llvm::IRBuilderBase::CreateAdd
Value * CreateAdd(Value *LHS, Value *RHS, const Twine &Name="", bool HasNUW=false, bool HasNSW=false)
Definition: IRBuilder.h:1327

llvm::IRBuilderBase::CreateTrunc
Value * CreateTrunc(Value *V, Type *DestTy, const Twine &Name="", bool IsNUW=false, bool IsNSW=false)
Definition: IRBuilder.h:2007

llvm::IRBuilderBase::CreateOr
Value * CreateOr(Value *LHS, Value *RHS, const Twine &Name="")
Definition: IRBuilder.h:1497

llvm::IRBuilderBase::CreateBr
BranchInst * CreateBr(BasicBlock *Dest)
Create an unconditional 'br label X' instruction.
Definition: IRBuilder.h:1114

llvm::IRBuilderBase::CreateCast
Value * CreateCast(Instruction::CastOps Op, Value *V, Type *DestTy, const Twine &Name="")
Definition: IRBuilder.h:2161

llvm::IRBuilderBase::SetInsertPoint
void SetInsertPoint(BasicBlock *TheBB)
This specifies that created instructions should be appended to the end of the specified block.
Definition: IRBuilder.h:180

llvm::IRBuilderBase::CreateCall
CallInst * CreateCall(FunctionType *FTy, Value *Callee, ArrayRef< Value * > Args=std::nullopt, const Twine &Name="", MDNode *FPMathTag=nullptr)
Definition: IRBuilder.h:2412

llvm::IRBuilderBase::CreateAShr
Value * CreateAShr(Value *LHS, Value *RHS, const Twine &Name="", bool isExact=false)
Definition: IRBuilder.h:1456

llvm::IRBuilderBase::CreateFPExt
Value * CreateFPExt(Value *V, Type *DestTy, const Twine &Name="")
Definition: IRBuilder.h:2110

llvm::IRBuilderBase::CreateXor
Value * CreateXor(Value *LHS, Value *RHS, const Twine &Name="")
Definition: IRBuilder.h:1519

llvm::IRBuilderBase::CreateMul
Value * CreateMul(Value *LHS, Value *RHS, const Twine &Name="", bool HasNUW=false, bool HasNSW=false)
Definition: IRBuilder.h:1361

llvm::IRBuilderBase::CreateFPToSI
Value * CreateFPToSI(Value *V, Type *DestTy, const Twine &Name="")
Definition: IRBuilder.h:2074

llvm::IRBuilder
This provides a uniform API for creating instructions and inserting them into a basic block: either a...
Definition: IRBuilder.h:2666

llvm::Instruction
Definition: Instruction.h:49

llvm::Instruction::eraseFromParent
InstListType::iterator eraseFromParent()
This method unlinks 'this' from the containing basic block and deletes it.
Definition: Instruction.cpp:105

llvm::Instruction::getOpcode
unsigned getOpcode() const
Returns a member of one of the enums like Instruction::Add.
Definition: Instruction.h:252

llvm::IntegerType
Class to represent integer types.
Definition: DerivedTypes.h:40

llvm::IntegerType::MAX_INT_BITS
@ MAX_INT_BITS
Maximum number of bits that can be specified.
Definition: DerivedTypes.h:52

llvm::PHINode
Definition: Instructions.h:2973

llvm::PHINode::addIncoming
void addIncoming(Value *V, BasicBlock *BB)
Add an incoming value to the end of the PHI list.
Definition: Instructions.h:3134

llvm::PassRegistry::getPassRegistry
static PassRegistry * getPassRegistry()
getPassRegistry - Access the global registry object, which is automatically initialized at applicatio...
Definition: PassRegistry.cpp:24

llvm::Pass::getAnalysisUsage
virtual void getAnalysisUsage(AnalysisUsage &) const
getAnalysisUsage - This function should be overridden by passes that need analysis information to do t...
Definition: Pass.cpp:98

llvm::PoisonValue::get
static PoisonValue * get(Type *T)
Static factory methods - Return a 'poison' object of the specified type.
Definition: Constants.cpp:1827

llvm::PreservedAnalyses
A set of analyses that are preserved following a run of a transformation pass.
Definition: Analysis.h:109

llvm::PreservedAnalyses::none
static PreservedAnalyses none()
Convenience factory function for the empty preserved set.
Definition: Analysis.h:112

llvm::PreservedAnalyses::all
static PreservedAnalyses all()
Construct a special preserved set that preserves all passes.
Definition: Analysis.h:115

llvm::SmallVectorBase::empty
bool empty() const
Definition: SmallVector.h:94

llvm::SmallVectorImpl
This class consists of common code factored out of the SmallVector class to reduce code duplication b...
Definition: SmallVector.h:586

llvm::SmallVectorImpl::pop_back_val
T pop_back_val()
Definition: SmallVector.h:686

llvm::SmallVectorTemplateBase::push_back
void push_back(const T &Elt)
Definition: SmallVector.h:426

llvm::SmallVector
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small.
Definition: SmallVector.h:1209

llvm::SwitchInst
Multiway switch.
Definition: Instructions.h:3598

llvm::TargetLoweringBase::getMaxLargeFPConvertBitWidthSupported
unsigned getMaxLargeFPConvertBitWidthSupported() const
Returns the size in bits of the largest fp convert the backend supports.
Definition: TargetLowering.h:2126

llvm::TargetLowering
This class defines information used to lower LLVM code to legal SelectionDAG operators that the targe...
Definition: TargetLowering.h:3765

llvm::TargetMachine
Primary interface to the complete machine description for the target machine.
Definition: TargetMachine.h:76

llvm::TargetMachine::getSubtargetImpl
virtual const TargetSubtargetInfo * getSubtargetImpl(const Function &) const
Virtual method implemented by subclasses that returns a reference to that target's TargetSubtargetInf...
Definition: TargetMachine.h:132

llvm::TargetPassConfig
Target-Independent Code Generator Pass Configuration Options.
Definition: TargetPassConfig.h:85

llvm::TargetSubtargetInfo
TargetSubtargetInfo - Generic base class for all target subtargets.
Definition: TargetSubtargetInfo.h:63

llvm::TargetSubtargetInfo::getTargetLowering
virtual const TargetLowering * getTargetLowering() const
Definition: TargetSubtargetInfo.h:100

llvm::Twine
Twine - A lightweight data structure for efficiently representing the concatenation of temporary valu...
Definition: Twine.h:81

llvm::Type::getIntegerBitWidth
unsigned getIntegerBitWidth() const

llvm::Type::isX86_FP80Ty
bool isX86_FP80Ty() const
Return true if this is x86 long double.
Definition: Type.h:160

llvm::Type::isBFloatTy
bool isBFloatTy() const
Return true if this is 'bfloat', a 16-bit bfloat type.
Definition: Type.h:146

llvm::Type::getFP128Ty
static Type * getFP128Ty(LLVMContext &C)

llvm::Type::isHalfTy
bool isHalfTy() const
Return true if this is 'half', a 16-bit IEEE fp type.
Definition: Type.h:143

llvm::Type::getFPMantissaWidth
int getFPMantissaWidth() const
Return the width of the mantissa of this type.

llvm::Type::isDoubleTy
bool isDoubleTy() const
Return true if this is 'double', a 64-bit IEEE fp type.
Definition: Type.h:157

llvm::Type::getFloatTy
static Type * getFloatTy(LLVMContext &C)

llvm::User::dropAllReferences
void dropAllReferences()
Drop all references to operands.
Definition: User.h:299

llvm::User::getOperand
Value * getOperand(unsigned i) const
Definition: User.h:169

llvm::Value
LLVM Value Representation.
Definition: Value.h:74

llvm::Value::getType
Type * getType() const
All values are typed, get the type of this value.
Definition: Value.h:255

llvm::Value::replaceAllUsesWith
void replaceAllUsesWith(Value *V)
Change all uses of this to point to a new Value.
Definition: Value.cpp:534

llvm::cl::opt
Definition: CommandLine.h:1430

unsigned

TargetMachine.h

false
Definition: StackSlotColoring.cpp:184

llvm::CallingConv::ID
unsigned ID
LLVM IR allows the use of arbitrary numbers as calling convention identifiers.
Definition: CallingConv.h:24

llvm::Intrinsic::getDeclaration
Function * getDeclaration(Module *M, ID id, ArrayRef< Type * > Tys=std::nullopt)
Create or insert an LLVM Function declaration for an intrinsic, and return it.
Definition: Function.cpp:1469

llvm::cl::Hidden
@ Hidden
Definition: CommandLine.h:138

llvm::cl::init
initializer< Ty > init(const Ty &Val)
Definition: CommandLine.h:450

llvm
This is an optimization pass for GlobalISel generic memory operations.
Definition: AddressRanges.h:18

llvm::PowerOf2Ceil
uint64_t PowerOf2Ceil(uint64_t A)
Returns the power of two which is greater than or equal to the given value.
Definition: MathExtras.h:372

llvm::createExpandLargeFpConvertPass
FunctionPass * createExpandLargeFpConvertPass()
Definition: ExpandLargeFpConvert.cpp:706

llvm::initializeExpandLargeFpConvertLegacyPassPass
void initializeExpandLargeFpConvertLegacyPassPass(PassRegistry &)

llvm::RecurKind::Or
@ Or
Bitwise or logical OR of integers.

llvm::RecurKind::Xor
@ Xor
Bitwise or logical XOR of integers.

llvm::RecurKind::And
@ And
Bitwise or logical AND of integers.

llvm::RecurKind::Add
@ Add
Sum of integers.

llvm::BitWidth
constexpr unsigned BitWidth
Definition: BitmaskEnum.h:191

llvm::cl::desc
Definition: CommandLine.h:416