doxygen/html/LoongArchISelLowering_8cpp_source.html

//=- LoongArchISelLowering.cpp - LoongArch DAG Lowering Implementation  ---===//

//

// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.

// See https://llvm.org/LICENSE.txt for license information.

// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception

//

//===----------------------------------------------------------------------===//

//

// This file defines the interfaces that LoongArch uses to lower LLVM code into

// a selection DAG.

//

//===----------------------------------------------------------------------===//


#include "LoongArchISelLowering.h"

#include "LoongArch.h"

#include "LoongArchMachineFunctionInfo.h"

#include "LoongArchRegisterInfo.h"

#include "LoongArchSubtarget.h"

#include "MCTargetDesc/LoongArchBaseInfo.h"

#include "MCTargetDesc/LoongArchMCTargetDesc.h"

#include "llvm/ADT/Statistic.h"

#include "llvm/ADT/StringExtras.h"

#include "llvm/CodeGen/ISDOpcodes.h"

#include "llvm/CodeGen/RuntimeLibcallUtil.h"

#include "llvm/CodeGen/SelectionDAGNodes.h"

#include "llvm/IR/IRBuilder.h"

#include "llvm/IR/IntrinsicInst.h"

#include "llvm/IR/IntrinsicsLoongArch.h"

#include "llvm/Support/CodeGen.h"

#include "llvm/Support/Debug.h"

#include "llvm/Support/ErrorHandling.h"

#include "llvm/Support/KnownBits.h"

#include "llvm/Support/MathExtras.h"


using namespace llvm;


#define DEBUG_TYPE "loongarch-isel-lowering"


STATISTIC(NumTailCalls, "Number of tail calls");


static cl::opt<bool> ZeroDivCheck("loongarch-check-zero-division", cl::Hidden,

                                  cl::desc("Trap on integer division by zero."),

                                  cl::init(false));


LoongArchTargetLowering::LoongArchTargetLowering(const TargetMachine &TM,

                                                 const LoongArchSubtarget &STI)

    : TargetLowering(TM), Subtarget(STI) {


  MVT GRLenVT = Subtarget.getGRLenVT();


  // Set up the register classes.


  addRegisterClass(GRLenVT, &LoongArch::GPRRegClass);

  if (Subtarget.hasBasicF())

    addRegisterClass(MVT::f32, &LoongArch::FPR32RegClass);

  if (Subtarget.hasBasicD())

    addRegisterClass(MVT::f64, &LoongArch::FPR64RegClass);


  static const MVT::SimpleValueType LSXVTs[] = {

      MVT::v16i8, MVT::v8i16, MVT::v4i32, MVT::v2i64, MVT::v4f32, MVT::v2f64};

  static const MVT::SimpleValueType LASXVTs[] = {

      MVT::v32i8, MVT::v16i16, MVT::v8i32, MVT::v4i64, MVT::v8f32, MVT::v4f64};


  if (Subtarget.hasExtLSX())

    for (MVT VT : LSXVTs)

      addRegisterClass(VT, &LoongArch::LSX128RegClass);


  if (Subtarget.hasExtLASX())

    for (MVT VT : LASXVTs)

      addRegisterClass(VT, &LoongArch::LASX256RegClass);


  // Set operations for LA32 and LA64.


  setLoadExtAction({ISD::EXTLOAD, ISD::SEXTLOAD, ISD::ZEXTLOAD}, GRLenVT,

                   MVT::i1, Promote);


  setOperationAction(ISD::SHL_PARTS, GRLenVT, Custom);

  setOperationAction(ISD::SRA_PARTS, GRLenVT, Custom);

  setOperationAction(ISD::SRL_PARTS, GRLenVT, Custom);

  setOperationAction(ISD::FP_TO_SINT, GRLenVT, Custom);

  setOperationAction(ISD::ROTL, GRLenVT, Expand);

  setOperationAction(ISD::CTPOP, GRLenVT, Expand);


  setOperationAction({ISD::GlobalAddress, ISD::BlockAddress, ISD::ConstantPool,

                      ISD::JumpTable, ISD::GlobalTLSAddress},

                     GRLenVT, Custom);


  setOperationAction(ISD::EH_DWARF_CFA, GRLenVT, Custom);


  setOperationAction(ISD::DYNAMIC_STACKALLOC, GRLenVT, Expand);

  setOperationAction({ISD::STACKSAVE, ISD::STACKRESTORE}, MVT::Other, Expand);

  setOperationAction(ISD::VASTART, MVT::Other, Custom);

  setOperationAction({ISD::VAARG, ISD::VACOPY, ISD::VAEND}, MVT::Other, Expand);


  setOperationAction(ISD::DEBUGTRAP, MVT::Other, Legal);

  setOperationAction(ISD::TRAP, MVT::Other, Legal);


  setOperationAction(ISD::INTRINSIC_VOID, MVT::Other, Custom);

  setOperationAction(ISD::INTRINSIC_W_CHAIN, MVT::Other, Custom);

  setOperationAction(ISD::INTRINSIC_WO_CHAIN, MVT::Other, Custom);


  setOperationAction(ISD::PREFETCH, MVT::Other, Legal);


  // Expand bitreverse.i16 with native-width bitrev and shift for now, before

  // we get to know which of sll and revb.2h is faster.

  setOperationAction(ISD::BITREVERSE, MVT::i8, Custom);

  setOperationAction(ISD::BITREVERSE, GRLenVT, Legal);


  // LA32 does not have REVB.2W and REVB.D due to the 64-bit operands, and

  // the narrower REVB.W does not exist. But LA32 does have REVB.2H, so i16

  // and i32 could still be byte-swapped relatively cheaply.

  setOperationAction(ISD::BSWAP, MVT::i16, Custom);


  setOperationAction(ISD::BR_JT, MVT::Other, Expand);

  setOperationAction(ISD::BR_CC, GRLenVT, Expand);

  setOperationAction(ISD::SELECT_CC, GRLenVT, Expand);

  setOperationAction(ISD::SIGN_EXTEND_INREG, MVT::i1, Expand);

  setOperationAction({ISD::SMUL_LOHI, ISD::UMUL_LOHI}, GRLenVT, Expand);


  setOperationAction(ISD::FP_TO_UINT, GRLenVT, Custom);

  setOperationAction(ISD::UINT_TO_FP, GRLenVT, Expand);


  // Set operations for LA64 only.


  if (Subtarget.is64Bit()) {

    setOperationAction(ISD::ADD, MVT::i32, Custom);

    setOperationAction(ISD::SUB, MVT::i32, Custom);

    setOperationAction(ISD::SHL, MVT::i32, Custom);

    setOperationAction(ISD::SRA, MVT::i32, Custom);

    setOperationAction(ISD::SRL, MVT::i32, Custom);

    setOperationAction(ISD::FP_TO_SINT, MVT::i32, Custom);

    setOperationAction(ISD::BITCAST, MVT::i32, Custom);

    setOperationAction(ISD::ROTR, MVT::i32, Custom);

    setOperationAction(ISD::ROTL, MVT::i32, Custom);

    setOperationAction(ISD::CTTZ, MVT::i32, Custom);

    setOperationAction(ISD::CTLZ, MVT::i32, Custom);

    setOperationAction(ISD::EH_DWARF_CFA, MVT::i32, Custom);

    setOperationAction(ISD::READ_REGISTER, MVT::i32, Custom);

    setOperationAction(ISD::WRITE_REGISTER, MVT::i32, Custom);

    setOperationAction(ISD::INTRINSIC_VOID, MVT::i32, Custom);

    setOperationAction(ISD::INTRINSIC_WO_CHAIN, MVT::i32, Custom);

    setOperationAction(ISD::INTRINSIC_W_CHAIN, MVT::i32, Custom);


    setOperationAction(ISD::BITREVERSE, MVT::i32, Custom);

    setOperationAction(ISD::BSWAP, MVT::i32, Custom);

    setOperationAction({ISD::SDIV, ISD::UDIV, ISD::SREM, ISD::UREM}, MVT::i32,

                       Custom);

    setOperationAction(ISD::LROUND, MVT::i32, Custom);

  }


  // Set operations for LA32 only.


  if (!Subtarget.is64Bit()) {

    setOperationAction(ISD::READ_REGISTER, MVT::i64, Custom);

    setOperationAction(ISD::WRITE_REGISTER, MVT::i64, Custom);

    setOperationAction(ISD::INTRINSIC_VOID, MVT::i64, Custom);

    setOperationAction(ISD::INTRINSIC_WO_CHAIN, MVT::i64, Custom);

    setOperationAction(ISD::INTRINSIC_W_CHAIN, MVT::i64, Custom);

  }


  setOperationAction(ISD::ATOMIC_FENCE, MVT::Other, Custom);


  static const ISD::CondCode FPCCToExpand[] = {

      ISD::SETOGT, ISD::SETOGE, ISD::SETUGT, ISD::SETUGE,

      ISD::SETGE,  ISD::SETNE,  ISD::SETGT};


  // Set operations for 'F' feature.


  if (Subtarget.hasBasicF()) {

    setLoadExtAction(ISD::EXTLOAD, MVT::f32, MVT::f16, Expand);

    setTruncStoreAction(MVT::f32, MVT::f16, Expand);

    setCondCodeAction(FPCCToExpand, MVT::f32, Expand);


    setOperationAction(ISD::SELECT_CC, MVT::f32, Expand);

    setOperationAction(ISD::BR_CC, MVT::f32, Expand);

    setOperationAction(ISD::FMA, MVT::f32, Legal);

    setOperationAction(ISD::FMINNUM_IEEE, MVT::f32, Legal);

    setOperationAction(ISD::FMAXNUM_IEEE, MVT::f32, Legal);

    setOperationAction(ISD::STRICT_FSETCCS, MVT::f32, Legal);

    setOperationAction(ISD::STRICT_FSETCC, MVT::f32, Legal);

    setOperationAction(ISD::IS_FPCLASS, MVT::f32, Legal);

    setOperationAction(ISD::FSIN, MVT::f32, Expand);

    setOperationAction(ISD::FCOS, MVT::f32, Expand);

    setOperationAction(ISD::FSINCOS, MVT::f32, Expand);

    setOperationAction(ISD::FPOW, MVT::f32, Expand);

    setOperationAction(ISD::FREM, MVT::f32, Expand);

    setOperationAction(ISD::FP16_TO_FP, MVT::f32, Expand);

    setOperationAction(ISD::FP_TO_FP16, MVT::f32, Expand);


    if (Subtarget.is64Bit())

      setOperationAction(ISD::FRINT, MVT::f32, Legal);


    if (!Subtarget.hasBasicD()) {

      setOperationAction(ISD::FP_TO_UINT, MVT::i32, Custom);

      if (Subtarget.is64Bit()) {

        setOperationAction(ISD::SINT_TO_FP, MVT::i64, Custom);

        setOperationAction(ISD::UINT_TO_FP, MVT::i64, Custom);

      }

    }

  }


  // Set operations for 'D' feature.


  if (Subtarget.hasBasicD()) {

    setLoadExtAction(ISD::EXTLOAD, MVT::f64, MVT::f16, Expand);

    setLoadExtAction(ISD::EXTLOAD, MVT::f64, MVT::f32, Expand);

    setTruncStoreAction(MVT::f64, MVT::f16, Expand);

    setTruncStoreAction(MVT::f64, MVT::f32, Expand);

    setCondCodeAction(FPCCToExpand, MVT::f64, Expand);


    setOperationAction(ISD::SELECT_CC, MVT::f64, Expand);

    setOperationAction(ISD::BR_CC, MVT::f64, Expand);

    setOperationAction(ISD::STRICT_FSETCCS, MVT::f64, Legal);

    setOperationAction(ISD::STRICT_FSETCC, MVT::f64, Legal);

    setOperationAction(ISD::FMA, MVT::f64, Legal);

    setOperationAction(ISD::FMINNUM_IEEE, MVT::f64, Legal);

    setOperationAction(ISD::FMAXNUM_IEEE, MVT::f64, Legal);

    setOperationAction(ISD::IS_FPCLASS, MVT::f64, Legal);

    setOperationAction(ISD::FSIN, MVT::f64, Expand);

    setOperationAction(ISD::FCOS, MVT::f64, Expand);

    setOperationAction(ISD::FSINCOS, MVT::f64, Expand);

    setOperationAction(ISD::FPOW, MVT::f64, Expand);

    setOperationAction(ISD::FREM, MVT::f64, Expand);

    setOperationAction(ISD::FP16_TO_FP, MVT::f64, Expand);

    setOperationAction(ISD::FP_TO_FP16, MVT::f64, Expand);


    if (Subtarget.is64Bit())

      setOperationAction(ISD::FRINT, MVT::f64, Legal);

  }


  // Set operations for 'LSX' feature.


  if (Subtarget.hasExtLSX()) {

    for (MVT VT : MVT::fixedlen_vector_valuetypes()) {

      // Expand all truncating stores and extending loads.

      for (MVT InnerVT : MVT::fixedlen_vector_valuetypes()) {

        setTruncStoreAction(VT, InnerVT, Expand);

        setLoadExtAction(ISD::SEXTLOAD, VT, InnerVT, Expand);

        setLoadExtAction(ISD::ZEXTLOAD, VT, InnerVT, Expand);

        setLoadExtAction(ISD::EXTLOAD, VT, InnerVT, Expand);

      }

      // By default everything must be expanded. Then we will selectively turn

      // on ones that can be effectively codegen'd.

      for (unsigned Op = 0; Op < ISD::BUILTIN_OP_END; ++Op)

        setOperationAction(Op, VT, Expand);

    }


    for (MVT VT : LSXVTs) {

      setOperationAction({ISD::LOAD, ISD::STORE}, VT, Legal);

      setOperationAction(ISD::BITCAST, VT, Legal);

      setOperationAction(ISD::UNDEF, VT, Legal);


      setOperationAction(ISD::INSERT_VECTOR_ELT, VT, Custom);

      setOperationAction(ISD::EXTRACT_VECTOR_ELT, VT, Legal);

      setOperationAction(ISD::BUILD_VECTOR, VT, Custom);


      setOperationAction(ISD::SETCC, VT, Legal);

      setOperationAction(ISD::VSELECT, VT, Legal);

      setOperationAction(ISD::VECTOR_SHUFFLE, VT, Custom);

    }

    for (MVT VT : {MVT::v16i8, MVT::v8i16, MVT::v4i32, MVT::v2i64}) {

      setOperationAction({ISD::ADD, ISD::SUB}, VT, Legal);

      setOperationAction({ISD::UMAX, ISD::UMIN, ISD::SMAX, ISD::SMIN}, VT,

                         Legal);

      setOperationAction({ISD::MUL, ISD::SDIV, ISD::SREM, ISD::UDIV, ISD::UREM},

                         VT, Legal);

      setOperationAction({ISD::AND, ISD::OR, ISD::XOR}, VT, Legal);

      setOperationAction({ISD::SHL, ISD::SRA, ISD::SRL}, VT, Legal);

      setOperationAction({ISD::CTPOP, ISD::CTLZ}, VT, Legal);

      setOperationAction({ISD::MULHS, ISD::MULHU}, VT, Legal);

      setCondCodeAction(

          {ISD::SETNE, ISD::SETGE, ISD::SETGT, ISD::SETUGE, ISD::SETUGT}, VT,

          Expand);

      setOperationAction(ISD::SCALAR_TO_VECTOR, VT, Custom);

    }

    for (MVT VT : {MVT::v16i8, MVT::v8i16, MVT::v4i32})

      setOperationAction(ISD::BITREVERSE, VT, Custom);

    for (MVT VT : {MVT::v8i16, MVT::v4i32, MVT::v2i64})

      setOperationAction(ISD::BSWAP, VT, Legal);

    for (MVT VT : {MVT::v4i32, MVT::v2i64}) {

      setOperationAction({ISD::SINT_TO_FP, ISD::UINT_TO_FP}, VT, Legal);

      setOperationAction({ISD::FP_TO_SINT, ISD::FP_TO_UINT}, VT, Legal);

    }

    for (MVT VT : {MVT::v4f32, MVT::v2f64}) {

      setOperationAction({ISD::FADD, ISD::FSUB}, VT, Legal);

      setOperationAction({ISD::FMUL, ISD::FDIV}, VT, Legal);

      setOperationAction(ISD::FMA, VT, Legal);

      setOperationAction(ISD::FSQRT, VT, Legal);

      setOperationAction(ISD::FNEG, VT, Legal);

      setCondCodeAction({ISD::SETGE, ISD::SETGT, ISD::SETOGE, ISD::SETOGT,

                         ISD::SETUGE, ISD::SETUGT},

                        VT, Expand);

      setOperationAction(ISD::SCALAR_TO_VECTOR, VT, Legal);

    }

    setOperationAction(ISD::CTPOP, GRLenVT, Legal);

    setOperationAction(ISD::FCEIL, {MVT::f32, MVT::f64}, Legal);

    setOperationAction(ISD::FFLOOR, {MVT::f32, MVT::f64}, Legal);

    setOperationAction(ISD::FTRUNC, {MVT::f32, MVT::f64}, Legal);

    setOperationAction(ISD::FROUNDEVEN, {MVT::f32, MVT::f64}, Legal);

  }


  // Set operations for 'LASX' feature.


  if (Subtarget.hasExtLASX()) {

    for (MVT VT : LASXVTs) {

      setOperationAction({ISD::LOAD, ISD::STORE}, VT, Legal);

      setOperationAction(ISD::BITCAST, VT, Legal);

      setOperationAction(ISD::UNDEF, VT, Legal);


      setOperationAction(ISD::INSERT_VECTOR_ELT, VT, Custom);

      setOperationAction(ISD::EXTRACT_VECTOR_ELT, VT, Custom);

      setOperationAction(ISD::BUILD_VECTOR, VT, Custom);

      setOperationAction(ISD::CONCAT_VECTORS, VT, Legal);


      setOperationAction(ISD::SETCC, VT, Legal);

      setOperationAction(ISD::VSELECT, VT, Legal);

      setOperationAction(ISD::VECTOR_SHUFFLE, VT, Custom);

    }

    for (MVT VT : {MVT::v4i64, MVT::v8i32, MVT::v16i16, MVT::v32i8}) {

      setOperationAction({ISD::ADD, ISD::SUB}, VT, Legal);

      setOperationAction({ISD::UMAX, ISD::UMIN, ISD::SMAX, ISD::SMIN}, VT,

                         Legal);

      setOperationAction({ISD::MUL, ISD::SDIV, ISD::SREM, ISD::UDIV, ISD::UREM},

                         VT, Legal);

      setOperationAction({ISD::AND, ISD::OR, ISD::XOR}, VT, Legal);

      setOperationAction({ISD::SHL, ISD::SRA, ISD::SRL}, VT, Legal);

      setOperationAction({ISD::CTPOP, ISD::CTLZ}, VT, Legal);

      setOperationAction({ISD::MULHS, ISD::MULHU}, VT, Legal);

      setCondCodeAction(

          {ISD::SETNE, ISD::SETGE, ISD::SETGT, ISD::SETUGE, ISD::SETUGT}, VT,

          Expand);

      setOperationAction(ISD::SCALAR_TO_VECTOR, VT, Custom);

    }

    for (MVT VT : {MVT::v32i8, MVT::v16i16, MVT::v8i32})

      setOperationAction(ISD::BITREVERSE, VT, Custom);

    for (MVT VT : {MVT::v16i16, MVT::v8i32, MVT::v4i64})

      setOperationAction(ISD::BSWAP, VT, Legal);

    for (MVT VT : {MVT::v8i32, MVT::v4i32, MVT::v4i64}) {

      setOperationAction({ISD::SINT_TO_FP, ISD::UINT_TO_FP}, VT, Legal);

      setOperationAction({ISD::FP_TO_SINT, ISD::FP_TO_UINT}, VT, Legal);

    }

    for (MVT VT : {MVT::v8f32, MVT::v4f64}) {

      setOperationAction({ISD::FADD, ISD::FSUB}, VT, Legal);

      setOperationAction({ISD::FMUL, ISD::FDIV}, VT, Legal);

      setOperationAction(ISD::FMA, VT, Legal);

      setOperationAction(ISD::FSQRT, VT, Legal);

      setOperationAction(ISD::FNEG, VT, Legal);

      setCondCodeAction({ISD::SETGE, ISD::SETGT, ISD::SETOGE, ISD::SETOGT,

                         ISD::SETUGE, ISD::SETUGT},

                        VT, Expand);

      setOperationAction(ISD::SCALAR_TO_VECTOR, VT, Legal);

    }

  }


  // Set DAG combine for LA32 and LA64.


  setTargetDAGCombine(ISD::AND);

  setTargetDAGCombine(ISD::OR);

  setTargetDAGCombine(ISD::SRL);

  setTargetDAGCombine(ISD::SETCC);


  // Set DAG combine for 'LSX' feature.


  if (Subtarget.hasExtLSX())

    setTargetDAGCombine(ISD::INTRINSIC_WO_CHAIN);


  // Compute derived properties from the register classes.

  computeRegisterProperties(Subtarget.getRegisterInfo());


  setStackPointerRegisterToSaveRestore(LoongArch::R3);


  setBooleanContents(ZeroOrOneBooleanContent);

  setBooleanVectorContents(ZeroOrNegativeOneBooleanContent);


  setMaxAtomicSizeInBitsSupported(Subtarget.getGRLen());


  setMinCmpXchgSizeInBits(32);


  // Function alignments.

  setMinFunctionAlignment(Align(4));

  // Set preferred alignments.

  setPrefFunctionAlignment(Subtarget.getPrefFunctionAlignment());

  setPrefLoopAlignment(Subtarget.getPrefLoopAlignment());

  setMaxBytesForAlignment(Subtarget.getMaxBytesForAlignment());


  // cmpxchg sizes down to 8 bits become legal if LAMCAS is available.

  if (Subtarget.hasLAMCAS())

    setMinCmpXchgSizeInBits(8);


  if (Subtarget.hasSCQ()) {

    setMaxAtomicSizeInBitsSupported(128);

    setOperationAction(ISD::ATOMIC_CMP_SWAP, MVT::i128, Custom);

  }

}


bool LoongArchTargetLowering::isOffsetFoldingLegal(

    const GlobalAddressSDNode *GA) const {

  // In order to maximise the opportunity for common subexpression elimination,

  // keep a separate ADD node for the global address offset instead of folding

  // it in the global address node. Later peephole optimisations may choose to

  // fold it back in when profitable.

  return false;

}


SDValue LoongArchTargetLowering::LowerOperation(SDValue Op,

                                                SelectionDAG &DAG) const {

  switch (Op.getOpcode()) {

  case ISD::ATOMIC_FENCE:

    return lowerATOMIC_FENCE(Op, DAG);

  case ISD::EH_DWARF_CFA:

    return lowerEH_DWARF_CFA(Op, DAG);

  case ISD::GlobalAddress:

    return lowerGlobalAddress(Op, DAG);

  case ISD::GlobalTLSAddress:

    return lowerGlobalTLSAddress(Op, DAG);

  case ISD::INTRINSIC_WO_CHAIN:

    return lowerINTRINSIC_WO_CHAIN(Op, DAG);

  case ISD::INTRINSIC_W_CHAIN:

    return lowerINTRINSIC_W_CHAIN(Op, DAG);

  case ISD::INTRINSIC_VOID:

    return lowerINTRINSIC_VOID(Op, DAG);

  case ISD::BlockAddress:

    return lowerBlockAddress(Op, DAG);

  case ISD::JumpTable:

    return lowerJumpTable(Op, DAG);

  case ISD::SHL_PARTS:

    return lowerShiftLeftParts(Op, DAG);

  case ISD::SRA_PARTS:

    return lowerShiftRightParts(Op, DAG, true);

  case ISD::SRL_PARTS:

    return lowerShiftRightParts(Op, DAG, false);

  case ISD::ConstantPool:

    return lowerConstantPool(Op, DAG);

  case ISD::FP_TO_SINT:

    return lowerFP_TO_SINT(Op, DAG);

  case ISD::BITCAST:

    return lowerBITCAST(Op, DAG);

  case ISD::UINT_TO_FP:

    return lowerUINT_TO_FP(Op, DAG);

  case ISD::SINT_TO_FP:

    return lowerSINT_TO_FP(Op, DAG);

  case ISD::VASTART:

    return lowerVASTART(Op, DAG);

  case ISD::FRAMEADDR:

    return lowerFRAMEADDR(Op, DAG);

  case ISD::RETURNADDR:

    return lowerRETURNADDR(Op, DAG);

  case ISD::WRITE_REGISTER:

    return lowerWRITE_REGISTER(Op, DAG);

  case ISD::INSERT_VECTOR_ELT:

    return lowerINSERT_VECTOR_ELT(Op, DAG);

  case ISD::EXTRACT_VECTOR_ELT:

    return lowerEXTRACT_VECTOR_ELT(Op, DAG);

  case ISD::BUILD_VECTOR:

    return lowerBUILD_VECTOR(Op, DAG);

  case ISD::VECTOR_SHUFFLE:

    return lowerVECTOR_SHUFFLE(Op, DAG);

  case ISD::BITREVERSE:

    return lowerBITREVERSE(Op, DAG);

  case ISD::SCALAR_TO_VECTOR:

    return lowerSCALAR_TO_VECTOR(Op, DAG);

  }

  return SDValue();

}


SDValue

LoongArchTargetLowering::lowerSCALAR_TO_VECTOR(SDValue Op,

                                               SelectionDAG &DAG) const {

  SDLoc DL(Op);

  MVT OpVT = Op.getSimpleValueType();


  SDValue Vector = DAG.getUNDEF(OpVT);

  SDValue Val = Op.getOperand(0);

  SDValue Idx = DAG.getConstant(0, DL, Subtarget.getGRLenVT());


  return DAG.getNode(ISD::INSERT_VECTOR_ELT, DL, OpVT, Vector, Val, Idx);

}


SDValue LoongArchTargetLowering::lowerBITREVERSE(SDValue Op,

                                                 SelectionDAG &DAG) const {

  EVT ResTy = Op->getValueType(0);

  SDValue Src = Op->getOperand(0);

  SDLoc DL(Op);


  EVT NewVT = ResTy.is128BitVector() ? MVT::v2i64 : MVT::v4i64;

  unsigned int OrigEltNum = ResTy.getVectorNumElements();

  unsigned int NewEltNum = NewVT.getVectorNumElements();


  SDValue NewSrc = DAG.getNode(ISD::BITCAST, DL, NewVT, Src);


  SmallVector<SDValue, 8> Ops;

  for (unsigned int i = 0; i < NewEltNum; i++) {

    SDValue Op = DAG.getNode(ISD::EXTRACT_VECTOR_ELT, DL, MVT::i64, NewSrc,

                             DAG.getConstant(i, DL, MVT::i64));

    unsigned RevOp = (ResTy == MVT::v16i8 || ResTy == MVT::v32i8)

                         ? (unsigned)LoongArchISD::BITREV_8B

                         : (unsigned)ISD::BITREVERSE;

    Ops.push_back(DAG.getNode(RevOp, DL, MVT::i64, Op));

  }

  SDValue Res =

      DAG.getNode(ISD::BITCAST, DL, ResTy, DAG.getBuildVector(NewVT, DL, Ops));


  switch (ResTy.getSimpleVT().SimpleTy) {

  default:

    return SDValue();

  case MVT::v16i8:

  case MVT::v32i8:

    return Res;

  case MVT::v8i16:

  case MVT::v16i16:

  case MVT::v4i32:

  case MVT::v8i32: {

    SmallVector<int, 32> Mask;

    for (unsigned int i = 0; i < NewEltNum; i++)

      for (int j = OrigEltNum / NewEltNum - 1; j >= 0; j--)

        Mask.push_back(j + (OrigEltNum / NewEltNum) * i);

    return DAG.getVectorShuffle(ResTy, DL, Res, DAG.getUNDEF(ResTy), Mask);

  }

  }

}


/// Determine whether a range fits a regular pattern of values.

/// This function accounts for the possibility of jumping over the End iterator.

template <typename ValType>

static bool

fitsRegularPattern(typename SmallVectorImpl<ValType>::const_iterator Begin,

                   unsigned CheckStride,

                   typename SmallVectorImpl<ValType>::const_iterator End,

                   ValType ExpectedIndex, unsigned ExpectedIndexStride) {

  auto &I = Begin;


  while (I != End) {

    if (*I != -1 && *I != ExpectedIndex)

      return false;

    ExpectedIndex += ExpectedIndexStride;


    // Incrementing past End is undefined behaviour so we must increment one

    // step at a time and check for End at each step.

    for (unsigned n = 0; n < CheckStride && I != End; ++n, ++I)

      ; // Empty loop body.

  }

  return true;

}


/// Lower VECTOR_SHUFFLE into VREPLVEI (if possible).

///

/// VREPLVEI performs vector broadcast based on an element specified by an

/// integer immediate, with its mask being similar to:

///   <x, x, x, ...>

/// where x is any valid index.

///

/// When undef's appear in the mask they are treated as if they were whatever

/// value is necessary in order to fit the above form.

static SDValue lowerVECTOR_SHUFFLE_VREPLVEI(const SDLoc &DL, ArrayRef<int> Mask,

                                            MVT VT, SDValue V1, SDValue V2,

                                            SelectionDAG &DAG) {

  int SplatIndex = -1;

  for (const auto &M : Mask) {

    if (M != -1) {

      SplatIndex = M;

      break;

    }

  }


  if (SplatIndex == -1)

    return DAG.getUNDEF(VT);


  assert(SplatIndex < (int)Mask.size() && "Out of bounds mask index");

  if (fitsRegularPattern<int>(Mask.begin(), 1, Mask.end(), SplatIndex, 0)) {

    APInt Imm(64, SplatIndex);

    return DAG.getNode(LoongArchISD::VREPLVEI, DL, VT, V1,

                       DAG.getConstant(Imm, DL, MVT::i64));

  }


  return SDValue();

}


/// Lower VECTOR_SHUFFLE into VSHUF4I (if possible).

///

/// VSHUF4I splits the vector into blocks of four elements, then shuffles these

/// elements according to a <4 x i2> constant (encoded as an integer immediate).

///

/// It is therefore possible to lower into VSHUF4I when the mask takes the form:

///   <a, b, c, d, a+4, b+4, c+4, d+4, a+8, b+8, c+8, d+8, ...>

/// When undef's appear they are treated as if they were whatever value is

/// necessary in order to fit the above forms.

///

/// For example:

///   %2 = shufflevector <8 x i16> %0, <8 x i16> undef,

///                      <8 x i32> <i32 3, i32 2, i32 1, i32 0,

///                                 i32 7, i32 6, i32 5, i32 4>

/// is lowered to:

///   (VSHUF4I_H $v0, $v1, 27)

/// where the 27 comes from:

///   3 + (2 << 2) + (1 << 4) + (0 << 6)

static SDValue lowerVECTOR_SHUFFLE_VSHUF4I(const SDLoc &DL, ArrayRef<int> Mask,

                                           MVT VT, SDValue V1, SDValue V2,

                                           SelectionDAG &DAG) {


  // When the size is less than 4, lower cost instructions may be used.

  if (Mask.size() < 4)

    return SDValue();


  int SubMask[4] = {-1, -1, -1, -1};

  for (unsigned i = 0; i < 4; ++i) {

    for (unsigned j = i; j < Mask.size(); j += 4) {

      int Idx = Mask[j];


      // Convert from vector index to 4-element subvector index

      // If an index refers to an element outside of the subvector then give up

      if (Idx != -1) {

        Idx -= 4 * (j / 4);

        if (Idx < 0 || Idx >= 4)

          return SDValue();

      }


      // If the mask has an undef, replace it with the current index.

      // Note that it might still be undef if the current index is also undef

      if (SubMask[i] == -1)

        SubMask[i] = Idx;

      // Check that non-undef values are the same as in the mask. If they

      // aren't then give up

      else if (Idx != -1 && Idx != SubMask[i])

        return SDValue();

    }

  }


  // Calculate the immediate. Replace any remaining undefs with zero

  APInt Imm(64, 0);

  for (int i = 3; i >= 0; --i) {

    int Idx = SubMask[i];


    if (Idx == -1)

      Idx = 0;


    Imm <<= 2;

    Imm |= Idx & 0x3;

  }


  return DAG.getNode(LoongArchISD::VSHUF4I, DL, VT, V1,

                     DAG.getConstant(Imm, DL, MVT::i64));

}


/// Lower VECTOR_SHUFFLE into VPACKEV (if possible).

///

/// VPACKEV interleaves the even elements from each vector.

///

/// It is possible to lower into VPACKEV when the mask consists of two of the

/// following forms interleaved:

///   <0, 2, 4, ...>

///   <n, n+2, n+4, ...>

/// where n is the number of elements in the vector.

/// For example:

///   <0, 0, 2, 2, 4, 4, ...>

///   <0, n, 2, n+2, 4, n+4, ...>

///

/// When undef's appear in the mask they are treated as if they were whatever

/// value is necessary in order to fit the above forms.

static SDValue lowerVECTOR_SHUFFLE_VPACKEV(const SDLoc &DL, ArrayRef<int> Mask,

                                           MVT VT, SDValue V1, SDValue V2,

                                           SelectionDAG &DAG) {


  const auto &Begin = Mask.begin();

  const auto &End = Mask.end();

  SDValue OriV1 = V1, OriV2 = V2;


  if (fitsRegularPattern<int>(Begin, 2, End, 0, 2))

    V1 = OriV1;

  else if (fitsRegularPattern<int>(Begin, 2, End, Mask.size(), 2))

    V1 = OriV2;

  else

    return SDValue();


  if (fitsRegularPattern<int>(Begin + 1, 2, End, 0, 2))

    V2 = OriV1;

  else if (fitsRegularPattern<int>(Begin + 1, 2, End, Mask.size(), 2))

    V2 = OriV2;

  else

    return SDValue();


  return DAG.getNode(LoongArchISD::VPACKEV, DL, VT, V2, V1);

}


/// Lower VECTOR_SHUFFLE into VPACKOD (if possible).

///

/// VPACKOD interleaves the odd elements from each vector.

///

/// It is possible to lower into VPACKOD when the mask consists of two of the

/// following forms interleaved:

///   <1, 3, 5, ...>

///   <n+1, n+3, n+5, ...>

/// where n is the number of elements in the vector.

/// For example:

///   <1, 1, 3, 3, 5, 5, ...>

///   <1, n+1, 3, n+3, 5, n+5, ...>

///

/// When undef's appear in the mask they are treated as if they were whatever

/// value is necessary in order to fit the above forms.

static SDValue lowerVECTOR_SHUFFLE_VPACKOD(const SDLoc &DL, ArrayRef<int> Mask,

                                           MVT VT, SDValue V1, SDValue V2,

                                           SelectionDAG &DAG) {


  const auto &Begin = Mask.begin();

  const auto &End = Mask.end();

  SDValue OriV1 = V1, OriV2 = V2;


  if (fitsRegularPattern<int>(Begin, 2, End, 1, 2))

    V1 = OriV1;

  else if (fitsRegularPattern<int>(Begin, 2, End, Mask.size() + 1, 2))

    V1 = OriV2;

  else

    return SDValue();


  if (fitsRegularPattern<int>(Begin + 1, 2, End, 1, 2))

    V2 = OriV1;

  else if (fitsRegularPattern<int>(Begin + 1, 2, End, Mask.size() + 1, 2))

    V2 = OriV2;

  else

    return SDValue();


  return DAG.getNode(LoongArchISD::VPACKOD, DL, VT, V2, V1);

}


/// Lower VECTOR_SHUFFLE into VILVH (if possible).

///

/// VILVH interleaves consecutive elements from the left (highest-indexed) half

/// of each vector.

///

/// It is possible to lower into VILVH when the mask consists of two of the

/// following forms interleaved:

///   <x, x+1, x+2, ...>

///   <n+x, n+x+1, n+x+2, ...>

/// where n is the number of elements in the vector and x is half n.

/// For example:

///   <x, x, x+1, x+1, x+2, x+2, ...>

///   <x, n+x, x+1, n+x+1, x+2, n+x+2, ...>

///

/// When undef's appear in the mask they are treated as if they were whatever

/// value is necessary in order to fit the above forms.

static SDValue lowerVECTOR_SHUFFLE_VILVH(const SDLoc &DL, ArrayRef<int> Mask,

                                         MVT VT, SDValue V1, SDValue V2,

                                         SelectionDAG &DAG) {


  const auto &Begin = Mask.begin();

  const auto &End = Mask.end();

  unsigned HalfSize = Mask.size() / 2;

  SDValue OriV1 = V1, OriV2 = V2;


  if (fitsRegularPattern<int>(Begin, 2, End, HalfSize, 1))

    V1 = OriV1;

  else if (fitsRegularPattern<int>(Begin, 2, End, Mask.size() + HalfSize, 1))

    V1 = OriV2;

  else

    return SDValue();


  if (fitsRegularPattern<int>(Begin + 1, 2, End, HalfSize, 1))

    V2 = OriV1;

  else if (fitsRegularPattern<int>(Begin + 1, 2, End, Mask.size() + HalfSize,

                                   1))

    V2 = OriV2;

  else

    return SDValue();


  return DAG.getNode(LoongArchISD::VILVH, DL, VT, V2, V1);

}


/// Lower VECTOR_SHUFFLE into VILVL (if possible).

///

/// VILVL interleaves consecutive elements from the right (lowest-indexed) half

/// of each vector.

///

/// It is possible to lower into VILVL when the mask consists of two of the

/// following forms interleaved:

///   <0, 1, 2, ...>

///   <n, n+1, n+2, ...>

/// where n is the number of elements in the vector.

/// For example:

///   <0, 0, 1, 1, 2, 2, ...>

///   <0, n, 1, n+1, 2, n+2, ...>

///

/// When undef's appear in the mask they are treated as if they were whatever

/// value is necessary in order to fit the above forms.

static SDValue lowerVECTOR_SHUFFLE_VILVL(const SDLoc &DL, ArrayRef<int> Mask,

                                         MVT VT, SDValue V1, SDValue V2,

                                         SelectionDAG &DAG) {


  const auto &Begin = Mask.begin();

  const auto &End = Mask.end();

  SDValue OriV1 = V1, OriV2 = V2;


  if (fitsRegularPattern<int>(Begin, 2, End, 0, 1))

    V1 = OriV1;

  else if (fitsRegularPattern<int>(Begin, 2, End, Mask.size(), 1))

    V1 = OriV2;

  else

    return SDValue();


  if (fitsRegularPattern<int>(Begin + 1, 2, End, 0, 1))

    V2 = OriV1;

  else if (fitsRegularPattern<int>(Begin + 1, 2, End, Mask.size(), 1))

    V2 = OriV2;

  else

    return SDValue();


  return DAG.getNode(LoongArchISD::VILVL, DL, VT, V2, V1);

}


/// Lower VECTOR_SHUFFLE into VPICKEV (if possible).

///

/// VPICKEV copies the even elements of each vector into the result vector.

///

/// It is possible to lower into VPICKEV when the mask consists of two of the

/// following forms concatenated:

///   <0, 2, 4, ...>

///   <n, n+2, n+4, ...>

/// where n is the number of elements in the vector.

/// For example:

///   <0, 2, 4, ..., 0, 2, 4, ...>

///   <0, 2, 4, ..., n, n+2, n+4, ...>

///

/// When undef's appear in the mask they are treated as if they were whatever

/// value is necessary in order to fit the above forms.

static SDValue lowerVECTOR_SHUFFLE_VPICKEV(const SDLoc &DL, ArrayRef<int> Mask,

                                           MVT VT, SDValue V1, SDValue V2,

                                           SelectionDAG &DAG) {


  const auto &Begin = Mask.begin();

  const auto &Mid = Mask.begin() + Mask.size() / 2;

  const auto &End = Mask.end();

  SDValue OriV1 = V1, OriV2 = V2;


  if (fitsRegularPattern<int>(Begin, 1, Mid, 0, 2))

    V1 = OriV1;

  else if (fitsRegularPattern<int>(Begin, 1, Mid, Mask.size(), 2))

    V1 = OriV2;

  else

    return SDValue();


  if (fitsRegularPattern<int>(Mid, 1, End, 0, 2))

    V2 = OriV1;

  else if (fitsRegularPattern<int>(Mid, 1, End, Mask.size(), 2))

    V2 = OriV2;


  else

    return SDValue();


  return DAG.getNode(LoongArchISD::VPICKEV, DL, VT, V2, V1);

}


/// Lower VECTOR_SHUFFLE into VPICKOD (if possible).

///

/// VPICKOD copies the odd elements of each vector into the result vector.

///

/// It is possible to lower into VPICKOD when the mask consists of two of the

/// following forms concatenated:

///   <1, 3, 5, ...>

///   <n+1, n+3, n+5, ...>

/// where n is the number of elements in the vector.

/// For example:

///   <1, 3, 5, ..., 1, 3, 5, ...>

///   <1, 3, 5, ..., n+1, n+3, n+5, ...>

///

/// When undef's appear in the mask they are treated as if they were whatever

/// value is necessary in order to fit the above forms.

static SDValue lowerVECTOR_SHUFFLE_VPICKOD(const SDLoc &DL, ArrayRef<int> Mask,

                                           MVT VT, SDValue V1, SDValue V2,

                                           SelectionDAG &DAG) {


  const auto &Begin = Mask.begin();

  const auto &Mid = Mask.begin() + Mask.size() / 2;

  const auto &End = Mask.end();

  SDValue OriV1 = V1, OriV2 = V2;


  if (fitsRegularPattern<int>(Begin, 1, Mid, 1, 2))

    V1 = OriV1;

  else if (fitsRegularPattern<int>(Begin, 1, Mid, Mask.size() + 1, 2))

    V1 = OriV2;

  else

    return SDValue();


  if (fitsRegularPattern<int>(Mid, 1, End, 1, 2))

    V2 = OriV1;

  else if (fitsRegularPattern<int>(Mid, 1, End, Mask.size() + 1, 2))

    V2 = OriV2;

  else

    return SDValue();


  return DAG.getNode(LoongArchISD::VPICKOD, DL, VT, V2, V1);

}


/// Lower VECTOR_SHUFFLE into VSHUF.

///

/// This mostly consists of converting the shuffle mask into a BUILD_VECTOR and

/// adding it as an operand to the resulting VSHUF.

static SDValue lowerVECTOR_SHUFFLE_VSHUF(const SDLoc &DL, ArrayRef<int> Mask,

                                         MVT VT, SDValue V1, SDValue V2,

                                         SelectionDAG &DAG) {


  SmallVector<SDValue, 16> Ops;

  for (auto M : Mask)

    Ops.push_back(DAG.getConstant(M, DL, MVT::i64));


  EVT MaskVecTy = VT.changeVectorElementTypeToInteger();

  SDValue MaskVec = DAG.getBuildVector(MaskVecTy, DL, Ops);


  // VECTOR_SHUFFLE concatenates the vectors in an vectorwise fashion.

  // <0b00, 0b01> + <0b10, 0b11> -> <0b00, 0b01, 0b10, 0b11>

  // VSHF concatenates the vectors in a bitwise fashion:

  // <0b00, 0b01> + <0b10, 0b11> ->

  // 0b0100       + 0b1110       -> 0b01001110

  //                                <0b10, 0b11, 0b00, 0b01>

  // We must therefore swap the operands to get the correct result.

  return DAG.getNode(LoongArchISD::VSHUF, DL, VT, MaskVec, V2, V1);

}


/// Dispatching routine to lower various 128-bit LoongArch vector shuffles.

///

/// This routine breaks down the specific type of 128-bit shuffle and

/// dispatches to the lowering routines accordingly.

static SDValue lower128BitShuffle(const SDLoc &DL, ArrayRef<int> Mask, MVT VT,

                                  SDValue V1, SDValue V2, SelectionDAG &DAG) {

  assert((VT.SimpleTy == MVT::v16i8 || VT.SimpleTy == MVT::v8i16 ||

          VT.SimpleTy == MVT::v4i32 || VT.SimpleTy == MVT::v2i64 ||

          VT.SimpleTy == MVT::v4f32 || VT.SimpleTy == MVT::v2f64) &&

         "Vector type is unsupported for lsx!");

  assert(V1.getSimpleValueType() == V2.getSimpleValueType() &&

         "Two operands have different types!");

  assert(VT.getVectorNumElements() == Mask.size() &&

         "Unexpected mask size for shuffle!");

  assert(Mask.size() % 2 == 0 && "Expected even mask size.");


  SDValue Result;

  // TODO: Add more comparison patterns.

  if (V2.isUndef()) {

    if ((Result = lowerVECTOR_SHUFFLE_VREPLVEI(DL, Mask, VT, V1, V2, DAG)))

      return Result;

    if ((Result = lowerVECTOR_SHUFFLE_VSHUF4I(DL, Mask, VT, V1, V2, DAG)))

      return Result;


    // TODO: This comment may be enabled in the future to better match the

    // pattern for instruction selection.

    /* V2 = V1; */

  }


  // It is recommended not to change the pattern comparison order for better

  // performance.

  if ((Result = lowerVECTOR_SHUFFLE_VPACKEV(DL, Mask, VT, V1, V2, DAG)))

    return Result;

  if ((Result = lowerVECTOR_SHUFFLE_VPACKOD(DL, Mask, VT, V1, V2, DAG)))

    return Result;

  if ((Result = lowerVECTOR_SHUFFLE_VILVH(DL, Mask, VT, V1, V2, DAG)))

    return Result;

  if ((Result = lowerVECTOR_SHUFFLE_VILVL(DL, Mask, VT, V1, V2, DAG)))

    return Result;

  if ((Result = lowerVECTOR_SHUFFLE_VPICKEV(DL, Mask, VT, V1, V2, DAG)))

    return Result;

  if ((Result = lowerVECTOR_SHUFFLE_VPICKOD(DL, Mask, VT, V1, V2, DAG)))

    return Result;

  if ((Result = lowerVECTOR_SHUFFLE_VSHUF(DL, Mask, VT, V1, V2, DAG)))

    return Result;


  return SDValue();

}


/// Lower VECTOR_SHUFFLE into XVREPLVEI (if possible).

///

/// It is a XVREPLVEI when the mask is:

///   <x, x, x, ..., x+n, x+n, x+n, ...>

/// where the number of x is equal to n and n is half the length of vector.

///

/// When undef's appear in the mask they are treated as if they were whatever

/// value is necessary in order to fit the above form.

static SDValue lowerVECTOR_SHUFFLE_XVREPLVEI(const SDLoc &DL,

                                             ArrayRef<int> Mask, MVT VT,

                                             SDValue V1, SDValue V2,

                                             SelectionDAG &DAG) {

  int SplatIndex = -1;

  for (const auto &M : Mask) {

    if (M != -1) {

      SplatIndex = M;

      break;

    }

  }


  if (SplatIndex == -1)

    return DAG.getUNDEF(VT);


  const auto &Begin = Mask.begin();

  const auto &End = Mask.end();

  unsigned HalfSize = Mask.size() / 2;


  assert(SplatIndex < (int)Mask.size() && "Out of bounds mask index");

  if (fitsRegularPattern<int>(Begin, 1, End - HalfSize, SplatIndex, 0) &&

      fitsRegularPattern<int>(Begin + HalfSize, 1, End, SplatIndex + HalfSize,

                              0)) {

    APInt Imm(64, SplatIndex);

    return DAG.getNode(LoongArchISD::VREPLVEI, DL, VT, V1,

                       DAG.getConstant(Imm, DL, MVT::i64));

  }


  return SDValue();

}


/// Lower VECTOR_SHUFFLE into XVSHUF4I (if possible).

static SDValue lowerVECTOR_SHUFFLE_XVSHUF4I(const SDLoc &DL, ArrayRef<int> Mask,

                                            MVT VT, SDValue V1, SDValue V2,

                                            SelectionDAG &DAG) {

  // When the size is less than or equal to 4, lower cost instructions may be

  // used.

  if (Mask.size() <= 4)

    return SDValue();

  return lowerVECTOR_SHUFFLE_VSHUF4I(DL, Mask, VT, V1, V2, DAG);

}


/// Lower VECTOR_SHUFFLE into XVPACKEV (if possible).

static SDValue lowerVECTOR_SHUFFLE_XVPACKEV(const SDLoc &DL, ArrayRef<int> Mask,

                                            MVT VT, SDValue V1, SDValue V2,

                                            SelectionDAG &DAG) {

  return lowerVECTOR_SHUFFLE_VPACKEV(DL, Mask, VT, V1, V2, DAG);

}


/// Lower VECTOR_SHUFFLE into XVPACKOD (if possible).

static SDValue lowerVECTOR_SHUFFLE_XVPACKOD(const SDLoc &DL, ArrayRef<int> Mask,

                                            MVT VT, SDValue V1, SDValue V2,

                                            SelectionDAG &DAG) {

  return lowerVECTOR_SHUFFLE_VPACKOD(DL, Mask, VT, V1, V2, DAG);

}


/// Lower VECTOR_SHUFFLE into XVILVH (if possible).

static SDValue lowerVECTOR_SHUFFLE_XVILVH(const SDLoc &DL, ArrayRef<int> Mask,

                                          MVT VT, SDValue V1, SDValue V2,

                                          SelectionDAG &DAG) {


  const auto &Begin = Mask.begin();

  const auto &End = Mask.end();

  unsigned HalfSize = Mask.size() / 2;

  unsigned LeftSize = HalfSize / 2;

  SDValue OriV1 = V1, OriV2 = V2;


  if (fitsRegularPattern<int>(Begin, 2, End - HalfSize, HalfSize - LeftSize,

                              1) &&

      fitsRegularPattern<int>(Begin + HalfSize, 2, End, HalfSize + LeftSize, 1))

    V1 = OriV1;

  else if (fitsRegularPattern<int>(Begin, 2, End - HalfSize,

                                   Mask.size() + HalfSize - LeftSize, 1) &&

           fitsRegularPattern<int>(Begin + HalfSize, 2, End,

                                   Mask.size() + HalfSize + LeftSize, 1))

    V1 = OriV2;

  else

    return SDValue();


  if (fitsRegularPattern<int>(Begin + 1, 2, End - HalfSize, HalfSize - LeftSize,

                              1) &&

      fitsRegularPattern<int>(Begin + 1 + HalfSize, 2, End, HalfSize + LeftSize,

                              1))

    V2 = OriV1;

  else if (fitsRegularPattern<int>(Begin + 1, 2, End - HalfSize,

                                   Mask.size() + HalfSize - LeftSize, 1) &&

           fitsRegularPattern<int>(Begin + 1 + HalfSize, 2, End,

                                   Mask.size() + HalfSize + LeftSize, 1))

    V2 = OriV2;

  else

    return SDValue();


  return DAG.getNode(LoongArchISD::VILVH, DL, VT, V2, V1);

}


/// Lower VECTOR_SHUFFLE into XVILVL (if possible).

static SDValue lowerVECTOR_SHUFFLE_XVILVL(const SDLoc &DL, ArrayRef<int> Mask,

                                          MVT VT, SDValue V1, SDValue V2,

                                          SelectionDAG &DAG) {


  const auto &Begin = Mask.begin();

  const auto &End = Mask.end();

  unsigned HalfSize = Mask.size() / 2;

  SDValue OriV1 = V1, OriV2 = V2;


  if (fitsRegularPattern<int>(Begin, 2, End - HalfSize, 0, 1) &&

      fitsRegularPattern<int>(Begin + HalfSize, 2, End, HalfSize, 1))

    V1 = OriV1;

  else if (fitsRegularPattern<int>(Begin, 2, End - HalfSize, Mask.size(), 1) &&

           fitsRegularPattern<int>(Begin + HalfSize, 2, End,

                                   Mask.size() + HalfSize, 1))

    V1 = OriV2;

  else

    return SDValue();


  if (fitsRegularPattern<int>(Begin + 1, 2, End - HalfSize, 0, 1) &&

      fitsRegularPattern<int>(Begin + 1 + HalfSize, 2, End, HalfSize, 1))

    V2 = OriV1;

  else if (fitsRegularPattern<int>(Begin + 1, 2, End - HalfSize, Mask.size(),

                                   1) &&

           fitsRegularPattern<int>(Begin + 1 + HalfSize, 2, End,

                                   Mask.size() + HalfSize, 1))

    V2 = OriV2;

  else

    return SDValue();


  return DAG.getNode(LoongArchISD::VILVL, DL, VT, V2, V1);

}


/// Lower VECTOR_SHUFFLE into XVPICKEV (if possible).

static SDValue lowerVECTOR_SHUFFLE_XVPICKEV(const SDLoc &DL, ArrayRef<int> Mask,

                                            MVT VT, SDValue V1, SDValue V2,

                                            SelectionDAG &DAG) {


  const auto &Begin = Mask.begin();

  const auto &LeftMid = Mask.begin() + Mask.size() / 4;

  const auto &Mid = Mask.begin() + Mask.size() / 2;

  const auto &RightMid = Mask.end() - Mask.size() / 4;

  const auto &End = Mask.end();

  unsigned HalfSize = Mask.size() / 2;

  SDValue OriV1 = V1, OriV2 = V2;


  if (fitsRegularPattern<int>(Begin, 1, LeftMid, 0, 2) &&

      fitsRegularPattern<int>(Mid, 1, RightMid, HalfSize, 2))

    V1 = OriV1;

  else if (fitsRegularPattern<int>(Begin, 1, LeftMid, Mask.size(), 2) &&

           fitsRegularPattern<int>(Mid, 1, RightMid, Mask.size() + HalfSize, 2))

    V1 = OriV2;

  else

    return SDValue();


  if (fitsRegularPattern<int>(LeftMid, 1, Mid, 0, 2) &&

      fitsRegularPattern<int>(RightMid, 1, End, HalfSize, 2))

    V2 = OriV1;

  else if (fitsRegularPattern<int>(LeftMid, 1, Mid, Mask.size(), 2) &&

           fitsRegularPattern<int>(RightMid, 1, End, Mask.size() + HalfSize, 2))

    V2 = OriV2;


  else

    return SDValue();


  return DAG.getNode(LoongArchISD::VPICKEV, DL, VT, V2, V1);

}


/// Lower VECTOR_SHUFFLE into XVPICKOD (if possible).

static SDValue lowerVECTOR_SHUFFLE_XVPICKOD(const SDLoc &DL, ArrayRef<int> Mask,

                                            MVT VT, SDValue V1, SDValue V2,

                                            SelectionDAG &DAG) {


  const auto &Begin = Mask.begin();

  const auto &LeftMid = Mask.begin() + Mask.size() / 4;

  const auto &Mid = Mask.begin() + Mask.size() / 2;

  const auto &RightMid = Mask.end() - Mask.size() / 4;

  const auto &End = Mask.end();

  unsigned HalfSize = Mask.size() / 2;

  SDValue OriV1 = V1, OriV2 = V2;


  if (fitsRegularPattern<int>(Begin, 1, LeftMid, 1, 2) &&

      fitsRegularPattern<int>(Mid, 1, RightMid, HalfSize + 1, 2))

    V1 = OriV1;

  else if (fitsRegularPattern<int>(Begin, 1, LeftMid, Mask.size() + 1, 2) &&

           fitsRegularPattern<int>(Mid, 1, RightMid, Mask.size() + HalfSize + 1,

                                   2))

    V1 = OriV2;

  else

    return SDValue();


  if (fitsRegularPattern<int>(LeftMid, 1, Mid, 1, 2) &&

      fitsRegularPattern<int>(RightMid, 1, End, HalfSize + 1, 2))

    V2 = OriV1;

  else if (fitsRegularPattern<int>(LeftMid, 1, Mid, Mask.size() + 1, 2) &&

           fitsRegularPattern<int>(RightMid, 1, End, Mask.size() + HalfSize + 1,

                                   2))

    V2 = OriV2;

  else

    return SDValue();


  return DAG.getNode(LoongArchISD::VPICKOD, DL, VT, V2, V1);

}


/// Lower VECTOR_SHUFFLE into XVSHUF (if possible).

static SDValue lowerVECTOR_SHUFFLE_XVSHUF(const SDLoc &DL, ArrayRef<int> Mask,

                                          MVT VT, SDValue V1, SDValue V2,

                                          SelectionDAG &DAG) {


  int MaskSize = Mask.size();

  int HalfSize = Mask.size() / 2;

  const auto &Begin = Mask.begin();

  const auto &Mid = Mask.begin() + HalfSize;

  const auto &End = Mask.end();


  // VECTOR_SHUFFLE concatenates the vectors:

  //  <0, 1, 2, 3, 4, 5, 6, 7> + <8, 9, 10, 11, 12, 13, 14, 15>

  //  shuffling ->

  //  <0, 1, 2, 3, 8, 9, 10, 11> <4, 5, 6, 7, 12, 13, 14, 15>

  //

  // XVSHUF concatenates the vectors:

  //  <a0, a1, a2, a3, b0, b1, b2, b3> + <a4, a5, a6, a7, b4, b5, b6, b7>

  //  shuffling ->

  //  <a0, a1, a2, a3, a4, a5, a6, a7> + <b0, b1, b2, b3, b4, b5, b6, b7>

  SmallVector<SDValue, 8> MaskAlloc;

  for (auto it = Begin; it < Mid; it++) {

    if (*it < 0) // UNDEF

      MaskAlloc.push_back(DAG.getTargetConstant(0, DL, MVT::i64));

    else if ((*it >= 0 && *it < HalfSize) ||

             (*it >= MaskSize && *it <= MaskSize + HalfSize)) {

      int M = *it < HalfSize ? *it : *it - HalfSize;

      MaskAlloc.push_back(DAG.getTargetConstant(M, DL, MVT::i64));

    } else

      return SDValue();

  }

  assert((int)MaskAlloc.size() == HalfSize && "xvshuf convert failed!");


  for (auto it = Mid; it < End; it++) {

    if (*it < 0) // UNDEF

      MaskAlloc.push_back(DAG.getTargetConstant(0, DL, MVT::i64));

    else if ((*it >= HalfSize && *it < MaskSize) ||

             (*it >= MaskSize + HalfSize && *it < MaskSize * 2)) {

      int M = *it < MaskSize ? *it - HalfSize : *it - MaskSize;

      MaskAlloc.push_back(DAG.getTargetConstant(M, DL, MVT::i64));

    } else

      return SDValue();

  }

  assert((int)MaskAlloc.size() == MaskSize && "xvshuf convert failed!");


  EVT MaskVecTy = VT.changeVectorElementTypeToInteger();

  SDValue MaskVec = DAG.getBuildVector(MaskVecTy, DL, MaskAlloc);

  return DAG.getNode(LoongArchISD::VSHUF, DL, VT, MaskVec, V2, V1);

}


/// Shuffle vectors by lane to generate more optimized instructions.

/// 256-bit shuffles are always considered as 2-lane 128-bit shuffles.

///

/// Therefore, except for the following four cases, other cases are regarded

/// as cross-lane shuffles, where optimization is relatively limited.

///

/// - Shuffle high, low lanes of two inputs vector

///   <0, 1, 2, 3> + <4, 5, 6, 7> --- <0, 5, 3, 6>

/// - Shuffle low, high lanes of two inputs vector

///   <0, 1, 2, 3> + <4, 5, 6, 7> --- <3, 6, 0, 5>

/// - Shuffle low, low lanes of two inputs vector

///   <0, 1, 2, 3> + <4, 5, 6, 7> --- <3, 6, 3, 6>

/// - Shuffle high, high lanes of two inputs vector

///   <0, 1, 2, 3> + <4, 5, 6, 7> --- <0, 5, 0, 5>

///

/// The first case is the closest to LoongArch instructions and the other

/// cases need to be converted to it for processing.

///

/// This function may modify V1, V2 and Mask

static void canonicalizeShuffleVectorByLane(const SDLoc &DL,

                                            MutableArrayRef<int> Mask, MVT VT,

                                            SDValue &V1, SDValue &V2,

                                            SelectionDAG &DAG) {


  enum HalfMaskType { HighLaneTy, LowLaneTy, None };


  int MaskSize = Mask.size();

  int HalfSize = Mask.size() / 2;


  HalfMaskType preMask = None, postMask = None;


  if (std::all_of(Mask.begin(), Mask.begin() + HalfSize, [&](int M) {

        return M < 0 || (M >= 0 && M < HalfSize) ||

               (M >= MaskSize && M < MaskSize + HalfSize);

      }))

    preMask = HighLaneTy;

  else if (std::all_of(Mask.begin(), Mask.begin() + HalfSize, [&](int M) {

             return M < 0 || (M >= HalfSize && M < MaskSize) ||

                    (M >= MaskSize + HalfSize && M < MaskSize * 2);

           }))

    preMask = LowLaneTy;


  if (std::all_of(Mask.begin() + HalfSize, Mask.end(), [&](int M) {

        return M < 0 || (M >= 0 && M < HalfSize) ||

               (M >= MaskSize && M < MaskSize + HalfSize);

      }))

    postMask = HighLaneTy;

  else if (std::all_of(Mask.begin() + HalfSize, Mask.end(), [&](int M) {

             return M < 0 || (M >= HalfSize && M < MaskSize) ||

                    (M >= MaskSize + HalfSize && M < MaskSize * 2);

           }))

    postMask = LowLaneTy;


  // The pre-half of mask is high lane type, and the post-half of mask

  // is low lane type, which is closest to the LoongArch instructions.

  //

  // Note: In the LoongArch architecture, the high lane of mask corresponds

  // to the lower 128-bit of vector register, and the low lane of mask

  // corresponds the higher 128-bit of vector register.

  if (preMask == HighLaneTy && postMask == LowLaneTy) {

    return;

  }

  if (preMask == LowLaneTy && postMask == HighLaneTy) {

    V1 = DAG.getBitcast(MVT::v4i64, V1);

    V1 = DAG.getNode(LoongArchISD::XVPERMI, DL, MVT::v4i64, V1,

                     DAG.getConstant(0b01001110, DL, MVT::i64));

    V1 = DAG.getBitcast(VT, V1);


    if (!V2.isUndef()) {

      V2 = DAG.getBitcast(MVT::v4i64, V2);

      V2 = DAG.getNode(LoongArchISD::XVPERMI, DL, MVT::v4i64, V2,

                       DAG.getConstant(0b01001110, DL, MVT::i64));

      V2 = DAG.getBitcast(VT, V2);

    }


    for (auto it = Mask.begin(); it < Mask.begin() + HalfSize; it++) {

      *it = *it < 0 ? *it : *it - HalfSize;

    }

    for (auto it = Mask.begin() + HalfSize; it < Mask.end(); it++) {

      *it = *it < 0 ? *it : *it + HalfSize;

    }

  } else if (preMask == LowLaneTy && postMask == LowLaneTy) {

    V1 = DAG.getBitcast(MVT::v4i64, V1);

    V1 = DAG.getNode(LoongArchISD::XVPERMI, DL, MVT::v4i64, V1,

                     DAG.getConstant(0b11101110, DL, MVT::i64));

    V1 = DAG.getBitcast(VT, V1);


    if (!V2.isUndef()) {

      V2 = DAG.getBitcast(MVT::v4i64, V2);

      V2 = DAG.getNode(LoongArchISD::XVPERMI, DL, MVT::v4i64, V2,

                       DAG.getConstant(0b11101110, DL, MVT::i64));

      V2 = DAG.getBitcast(VT, V2);

    }


    for (auto it = Mask.begin(); it < Mask.begin() + HalfSize; it++) {

      *it = *it < 0 ? *it : *it - HalfSize;

    }

  } else if (preMask == HighLaneTy && postMask == HighLaneTy) {

    V1 = DAG.getBitcast(MVT::v4i64, V1);

    V1 = DAG.getNode(LoongArchISD::XVPERMI, DL, MVT::v4i64, V1,

                     DAG.getConstant(0b01000100, DL, MVT::i64));

    V1 = DAG.getBitcast(VT, V1);


    if (!V2.isUndef()) {

      V2 = DAG.getBitcast(MVT::v4i64, V2);

      V2 = DAG.getNode(LoongArchISD::XVPERMI, DL, MVT::v4i64, V2,

                       DAG.getConstant(0b01000100, DL, MVT::i64));

      V2 = DAG.getBitcast(VT, V2);

    }


    for (auto it = Mask.begin() + HalfSize; it < Mask.end(); it++) {

      *it = *it < 0 ? *it : *it + HalfSize;

    }

  } else { // cross-lane

    return;

  }

}


/// Dispatching routine to lower various 256-bit LoongArch vector shuffles.

///

/// This routine breaks down the specific type of 256-bit shuffle and

/// dispatches to the lowering routines accordingly.

static SDValue lower256BitShuffle(const SDLoc &DL, ArrayRef<int> Mask, MVT VT,

                                  SDValue V1, SDValue V2, SelectionDAG &DAG) {

  assert((VT.SimpleTy == MVT::v32i8 || VT.SimpleTy == MVT::v16i16 ||

          VT.SimpleTy == MVT::v8i32 || VT.SimpleTy == MVT::v4i64 ||

          VT.SimpleTy == MVT::v8f32 || VT.SimpleTy == MVT::v4f64) &&

         "Vector type is unsupported for lasx!");

  assert(V1.getSimpleValueType() == V2.getSimpleValueType() &&

         "Two operands have different types!");

  assert(VT.getVectorNumElements() == Mask.size() &&

         "Unexpected mask size for shuffle!");

  assert(Mask.size() % 2 == 0 && "Expected even mask size.");

  assert(Mask.size() >= 4 && "Mask size is less than 4.");


  // canonicalize non cross-lane shuffle vector

  SmallVector<int> NewMask(Mask);

  canonicalizeShuffleVectorByLane(DL, NewMask, VT, V1, V2, DAG);


  SDValue Result;

  // TODO: Add more comparison patterns.

  if (V2.isUndef()) {

    if ((Result = lowerVECTOR_SHUFFLE_XVREPLVEI(DL, NewMask, VT, V1, V2, DAG)))

      return Result;

    if ((Result = lowerVECTOR_SHUFFLE_XVSHUF4I(DL, NewMask, VT, V1, V2, DAG)))

      return Result;


    // TODO: This comment may be enabled in the future to better match the

    // pattern for instruction selection.

    /* V2 = V1; */

  }


  // It is recommended not to change the pattern comparison order for better

  // performance.

  if ((Result = lowerVECTOR_SHUFFLE_XVPACKEV(DL, NewMask, VT, V1, V2, DAG)))

    return Result;

  if ((Result = lowerVECTOR_SHUFFLE_XVPACKOD(DL, NewMask, VT, V1, V2, DAG)))

    return Result;

  if ((Result = lowerVECTOR_SHUFFLE_XVILVH(DL, NewMask, VT, V1, V2, DAG)))

    return Result;

  if ((Result = lowerVECTOR_SHUFFLE_XVILVL(DL, NewMask, VT, V1, V2, DAG)))

    return Result;

  if ((Result = lowerVECTOR_SHUFFLE_XVPICKEV(DL, NewMask, VT, V1, V2, DAG)))

    return Result;

  if ((Result = lowerVECTOR_SHUFFLE_XVPICKOD(DL, NewMask, VT, V1, V2, DAG)))

    return Result;

  if ((Result = lowerVECTOR_SHUFFLE_XVSHUF(DL, NewMask, VT, V1, V2, DAG)))

    return Result;


  return SDValue();

}


SDValue LoongArchTargetLowering::lowerVECTOR_SHUFFLE(SDValue Op,

                                                     SelectionDAG &DAG) const {

  ShuffleVectorSDNode *SVOp = cast<ShuffleVectorSDNode>(Op);

  ArrayRef<int> OrigMask = SVOp->getMask();

  SDValue V1 = Op.getOperand(0);

  SDValue V2 = Op.getOperand(1);

  MVT VT = Op.getSimpleValueType();

  int NumElements = VT.getVectorNumElements();

  SDLoc DL(Op);


  bool V1IsUndef = V1.isUndef();

  bool V2IsUndef = V2.isUndef();

  if (V1IsUndef && V2IsUndef)

    return DAG.getUNDEF(VT);


  // When we create a shuffle node we put the UNDEF node to second operand,

  // but in some cases the first operand may be transformed to UNDEF.

  // In this case we should just commute the node.

  if (V1IsUndef)

    return DAG.getCommutedVectorShuffle(*SVOp);


  // Check for non-undef masks pointing at an undef vector and make the masks

  // undef as well. This makes it easier to match the shuffle based solely on

  // the mask.

  if (V2IsUndef &&

      any_of(OrigMask, [NumElements](int M) { return M >= NumElements; })) {

    SmallVector<int, 8> NewMask(OrigMask);

    for (int &M : NewMask)

      if (M >= NumElements)

        M = -1;

    return DAG.getVectorShuffle(VT, DL, V1, V2, NewMask);

  }


  // Check for illegal shuffle mask element index values.

  int MaskUpperLimit = OrigMask.size() * (V2IsUndef ? 1 : 2);

  (void)MaskUpperLimit;

  assert(llvm::all_of(OrigMask,

                      [&](int M) { return -1 <= M && M < MaskUpperLimit; }) &&

         "Out of bounds shuffle index");


  // For each vector width, delegate to a specialized lowering routine.

  if (VT.is128BitVector())

    return lower128BitShuffle(DL, OrigMask, VT, V1, V2, DAG);


  if (VT.is256BitVector())

    return lower256BitShuffle(DL, OrigMask, VT, V1, V2, DAG);


  return SDValue();

}


static bool isConstantOrUndef(const SDValue Op) {

  if (Op->isUndef())

    return true;

  if (isa<ConstantSDNode>(Op))

    return true;

  if (isa<ConstantFPSDNode>(Op))

    return true;

  return false;

}


static bool isConstantOrUndefBUILD_VECTOR(const BuildVectorSDNode *Op) {

  for (unsigned i = 0; i < Op->getNumOperands(); ++i)

    if (isConstantOrUndef(Op->getOperand(i)))

      return true;

  return false;

}


SDValue LoongArchTargetLowering::lowerBUILD_VECTOR(SDValue Op,

                                                   SelectionDAG &DAG) const {

  BuildVectorSDNode *Node = cast<BuildVectorSDNode>(Op);

  EVT ResTy = Op->getValueType(0);

  SDLoc DL(Op);

  APInt SplatValue, SplatUndef;

  unsigned SplatBitSize;

  bool HasAnyUndefs;

  bool Is128Vec = ResTy.is128BitVector();

  bool Is256Vec = ResTy.is256BitVector();


  if ((!Subtarget.hasExtLSX() || !Is128Vec) &&

      (!Subtarget.hasExtLASX() || !Is256Vec))

    return SDValue();


  if (Node->isConstantSplat(SplatValue, SplatUndef, SplatBitSize, HasAnyUndefs,

                            /*MinSplatBits=*/8) &&

      SplatBitSize <= 64) {

    // We can only cope with 8, 16, 32, or 64-bit elements.

    if (SplatBitSize != 8 && SplatBitSize != 16 && SplatBitSize != 32 &&

        SplatBitSize != 64)

      return SDValue();


    EVT ViaVecTy;


    switch (SplatBitSize) {

    default:

      return SDValue();

    case 8:

      ViaVecTy = Is128Vec ? MVT::v16i8 : MVT::v32i8;

      break;

    case 16:

      ViaVecTy = Is128Vec ? MVT::v8i16 : MVT::v16i16;

      break;

    case 32:

      ViaVecTy = Is128Vec ? MVT::v4i32 : MVT::v8i32;

      break;

    case 64:

      ViaVecTy = Is128Vec ? MVT::v2i64 : MVT::v4i64;

      break;

    }


    // SelectionDAG::getConstant will promote SplatValue appropriately.

    SDValue Result = DAG.getConstant(SplatValue, DL, ViaVecTy);


    // Bitcast to the type we originally wanted.

    if (ViaVecTy != ResTy)

      Result = DAG.getNode(ISD::BITCAST, SDLoc(Node), ResTy, Result);


    return Result;

  }


  if (DAG.isSplatValue(Op, /*AllowUndefs=*/false))

    return Op;


  if (!isConstantOrUndefBUILD_VECTOR(Node)) {

    // Use INSERT_VECTOR_ELT operations rather than expand to stores.

    // The resulting code is the same length as the expansion, but it doesn't

    // use memory operations.

    EVT ResTy = Node->getValueType(0);


    assert(ResTy.isVector());


    unsigned NumElts = ResTy.getVectorNumElements();

    SDValue Vector = DAG.getUNDEF(ResTy);

    for (unsigned i = 0; i < NumElts; ++i) {

      Vector = DAG.getNode(ISD::INSERT_VECTOR_ELT, DL, ResTy, Vector,

                           Node->getOperand(i),

                           DAG.getConstant(i, DL, Subtarget.getGRLenVT()));

    }

    return Vector;

  }


  return SDValue();

}


SDValue

LoongArchTargetLowering::lowerEXTRACT_VECTOR_ELT(SDValue Op,

                                                 SelectionDAG &DAG) const {

  EVT VecTy = Op->getOperand(0)->getValueType(0);

  SDValue Idx = Op->getOperand(1);

  EVT EltTy = VecTy.getVectorElementType();

  unsigned NumElts = VecTy.getVectorNumElements();


  if (isa<ConstantSDNode>(Idx) &&

      (EltTy == MVT::i32 || EltTy == MVT::i64 || EltTy == MVT::f32 ||

       EltTy == MVT::f64 || Idx->getAsZExtVal() < NumElts / 2))

    return Op;


  return SDValue();

}


SDValue

LoongArchTargetLowering::lowerINSERT_VECTOR_ELT(SDValue Op,

                                                SelectionDAG &DAG) const {

  if (isa<ConstantSDNode>(Op->getOperand(2)))

    return Op;

  return SDValue();

}


SDValue LoongArchTargetLowering::lowerATOMIC_FENCE(SDValue Op,

                                                   SelectionDAG &DAG) const {

  SDLoc DL(Op);

  SyncScope::ID FenceSSID =

      static_cast<SyncScope::ID>(Op.getConstantOperandVal(2));


  // singlethread fences only synchronize with signal handlers on the same

  // thread and thus only need to preserve instruction order, not actually

  // enforce memory ordering.

  if (FenceSSID == SyncScope::SingleThread)

    // MEMBARRIER is a compiler barrier; it codegens to a no-op.

    return DAG.getNode(ISD::MEMBARRIER, DL, MVT::Other, Op.getOperand(0));


  return Op;

}


SDValue LoongArchTargetLowering::lowerWRITE_REGISTER(SDValue Op,

                                                     SelectionDAG &DAG) const {


  if (Subtarget.is64Bit() && Op.getOperand(2).getValueType() == MVT::i32) {

    DAG.getContext()->emitError(

        "On LA64, only 64-bit registers can be written.");

    return Op.getOperand(0);

  }


  if (!Subtarget.is64Bit() && Op.getOperand(2).getValueType() == MVT::i64) {

    DAG.getContext()->emitError(

        "On LA32, only 32-bit registers can be written.");

    return Op.getOperand(0);

  }


  return Op;

}


SDValue LoongArchTargetLowering::lowerFRAMEADDR(SDValue Op,

                                                SelectionDAG &DAG) const {

  if (!isa<ConstantSDNode>(Op.getOperand(0))) {

    DAG.getContext()->emitError("argument to '__builtin_frame_address' must "

                                "be a constant integer");

    return SDValue();

  }


  MachineFunction &MF = DAG.getMachineFunction();

  MF.getFrameInfo().setFrameAddressIsTaken(true);

  Register FrameReg = Subtarget.getRegisterInfo()->getFrameRegister(MF);

  EVT VT = Op.getValueType();

  SDLoc DL(Op);

  SDValue FrameAddr = DAG.getCopyFromReg(DAG.getEntryNode(), DL, FrameReg, VT);

  unsigned Depth = Op.getConstantOperandVal(0);

  int GRLenInBytes = Subtarget.getGRLen() / 8;


  while (Depth--) {

    int Offset = -(GRLenInBytes * 2);

    SDValue Ptr = DAG.getNode(ISD::ADD, DL, VT, FrameAddr,

                              DAG.getSignedConstant(Offset, DL, VT));

    FrameAddr =

        DAG.getLoad(VT, DL, DAG.getEntryNode(), Ptr, MachinePointerInfo());

  }

  return FrameAddr;

}


SDValue LoongArchTargetLowering::lowerRETURNADDR(SDValue Op,

                                                 SelectionDAG &DAG) const {

  if (verifyReturnAddressArgumentIsConstant(Op, DAG))

    return SDValue();


  // Currently only support lowering return address for current frame.

  if (Op.getConstantOperandVal(0) != 0) {

    DAG.getContext()->emitError(

        "return address can only be determined for the current frame");

    return SDValue();

  }


  MachineFunction &MF = DAG.getMachineFunction();

  MF.getFrameInfo().setReturnAddressIsTaken(true);

  MVT GRLenVT = Subtarget.getGRLenVT();


  // Return the value of the return address register, marking it an implicit

  // live-in.

  Register Reg = MF.addLiveIn(Subtarget.getRegisterInfo()->getRARegister(),

                              getRegClassFor(GRLenVT));

  return DAG.getCopyFromReg(DAG.getEntryNode(), SDLoc(Op), Reg, GRLenVT);

}


SDValue LoongArchTargetLowering::lowerEH_DWARF_CFA(SDValue Op,

                                                   SelectionDAG &DAG) const {

  MachineFunction &MF = DAG.getMachineFunction();

  auto Size = Subtarget.getGRLen() / 8;

  auto FI = MF.getFrameInfo().CreateFixedObject(Size, 0, false);

  return DAG.getFrameIndex(FI, getPointerTy(DAG.getDataLayout()));

}


SDValue LoongArchTargetLowering::lowerVASTART(SDValue Op,

                                              SelectionDAG &DAG) const {

  MachineFunction &MF = DAG.getMachineFunction();

  auto *FuncInfo = MF.getInfo<LoongArchMachineFunctionInfo>();


  SDLoc DL(Op);

  SDValue FI = DAG.getFrameIndex(FuncInfo->getVarArgsFrameIndex(),

                                 getPointerTy(MF.getDataLayout()));


  // vastart just stores the address of the VarArgsFrameIndex slot into the

  // memory location argument.

  const Value *SV = cast<SrcValueSDNode>(Op.getOperand(2))->getValue();

  return DAG.getStore(Op.getOperand(0), DL, FI, Op.getOperand(1),

                      MachinePointerInfo(SV));

}


SDValue LoongArchTargetLowering::lowerUINT_TO_FP(SDValue Op,

                                                 SelectionDAG &DAG) const {

  assert(Subtarget.is64Bit() && Subtarget.hasBasicF() &&

         !Subtarget.hasBasicD() && "unexpected target features");


  SDLoc DL(Op);

  SDValue Op0 = Op.getOperand(0);

  if (Op0->getOpcode() == ISD::AND) {

    auto *C = dyn_cast<ConstantSDNode>(Op0.getOperand(1));

    if (C && C->getZExtValue() < UINT64_C(0xFFFFFFFF))

      return Op;

  }


  if (Op0->getOpcode() == LoongArchISD::BSTRPICK &&

      Op0.getConstantOperandVal(1) < UINT64_C(0X1F) &&

      Op0.getConstantOperandVal(2) == UINT64_C(0))

    return Op;


  if (Op0.getOpcode() == ISD::AssertZext &&

      dyn_cast<VTSDNode>(Op0.getOperand(1))->getVT().bitsLT(MVT::i32))

    return Op;


  EVT OpVT = Op0.getValueType();

  EVT RetVT = Op.getValueType();

  RTLIB::Libcall LC = RTLIB::getUINTTOFP(OpVT, RetVT);

  MakeLibCallOptions CallOptions;

  CallOptions.setTypeListBeforeSoften(OpVT, RetVT, true);

  SDValue Chain = SDValue();

  SDValue Result;

  std::tie(Result, Chain) =

      makeLibCall(DAG, LC, Op.getValueType(), Op0, CallOptions, DL, Chain);

  return Result;

}


SDValue LoongArchTargetLowering::lowerSINT_TO_FP(SDValue Op,

                                                 SelectionDAG &DAG) const {

  assert(Subtarget.is64Bit() && Subtarget.hasBasicF() &&

         !Subtarget.hasBasicD() && "unexpected target features");


  SDLoc DL(Op);

  SDValue Op0 = Op.getOperand(0);


  if ((Op0.getOpcode() == ISD::AssertSext ||

       Op0.getOpcode() == ISD::SIGN_EXTEND_INREG) &&

      dyn_cast<VTSDNode>(Op0.getOperand(1))->getVT().bitsLE(MVT::i32))

    return Op;


  EVT OpVT = Op0.getValueType();

  EVT RetVT = Op.getValueType();

  RTLIB::Libcall LC = RTLIB::getSINTTOFP(OpVT, RetVT);

  MakeLibCallOptions CallOptions;

  CallOptions.setTypeListBeforeSoften(OpVT, RetVT, true);

  SDValue Chain = SDValue();

  SDValue Result;

  std::tie(Result, Chain) =

      makeLibCall(DAG, LC, Op.getValueType(), Op0, CallOptions, DL, Chain);

  return Result;

}


SDValue LoongArchTargetLowering::lowerBITCAST(SDValue Op,

                                              SelectionDAG &DAG) const {


  SDLoc DL(Op);

  SDValue Op0 = Op.getOperand(0);


  if (Op.getValueType() == MVT::f32 && Op0.getValueType() == MVT::i32 &&

      Subtarget.is64Bit() && Subtarget.hasBasicF()) {

    SDValue NewOp0 = DAG.getNode(ISD::ANY_EXTEND, DL, MVT::i64, Op0);

    return DAG.getNode(LoongArchISD::MOVGR2FR_W_LA64, DL, MVT::f32, NewOp0);

  }

  return Op;

}


SDValue LoongArchTargetLowering::lowerFP_TO_SINT(SDValue Op,

                                                 SelectionDAG &DAG) const {


  SDLoc DL(Op);

  SDValue Op0 = Op.getOperand(0);


  if (Op0.getValueType() == MVT::f16)

    Op0 = DAG.getNode(ISD::FP_EXTEND, DL, MVT::f32, Op0);


  if (Op.getValueSizeInBits() > 32 && Subtarget.hasBasicF() &&

      !Subtarget.hasBasicD()) {

    SDValue Dst = DAG.getNode(LoongArchISD::FTINT, DL, MVT::f32, Op0);

    return DAG.getNode(LoongArchISD::MOVFR2GR_S_LA64, DL, MVT::i64, Dst);

  }


  EVT FPTy = EVT::getFloatingPointVT(Op.getValueSizeInBits());

  SDValue Trunc = DAG.getNode(LoongArchISD::FTINT, DL, FPTy, Op0);

  return DAG.getNode(ISD::BITCAST, DL, Op.getValueType(), Trunc);

}


static SDValue getTargetNode(GlobalAddressSDNode *N, SDLoc DL, EVT Ty,

                             SelectionDAG &DAG, unsigned Flags) {

  return DAG.getTargetGlobalAddress(N->getGlobal(), DL, Ty, 0, Flags);

}


static SDValue getTargetNode(BlockAddressSDNode *N, SDLoc DL, EVT Ty,

                             SelectionDAG &DAG, unsigned Flags) {

  return DAG.getTargetBlockAddress(N->getBlockAddress(), Ty, N->getOffset(),

                                   Flags);

}


static SDValue getTargetNode(ConstantPoolSDNode *N, SDLoc DL, EVT Ty,

                             SelectionDAG &DAG, unsigned Flags) {

  return DAG.getTargetConstantPool(N->getConstVal(), Ty, N->getAlign(),

                                   N->getOffset(), Flags);

}


static SDValue getTargetNode(JumpTableSDNode *N, SDLoc DL, EVT Ty,

                             SelectionDAG &DAG, unsigned Flags) {

  return DAG.getTargetJumpTable(N->getIndex(), Ty, Flags);

}


template <class NodeTy>

SDValue LoongArchTargetLowering::getAddr(NodeTy *N, SelectionDAG &DAG,

                                         CodeModel::Model M,

                                         bool IsLocal) const {

  SDLoc DL(N);

  EVT Ty = getPointerTy(DAG.getDataLayout());

  SDValue Addr = getTargetNode(N, DL, Ty, DAG, 0);

  SDValue Load;


  switch (M) {

  default:

    report_fatal_error("Unsupported code model");


  case CodeModel::Large: {

    assert(Subtarget.is64Bit() && "Large code model requires LA64");


    // This is not actually used, but is necessary for successfully matching

    // the PseudoLA_*_LARGE nodes.

    SDValue Tmp = DAG.getConstant(0, DL, Ty);

    if (IsLocal) {

      // This generates the pattern (PseudoLA_PCREL_LARGE tmp sym), that

      // eventually becomes the desired 5-insn code sequence.

      Load = SDValue(DAG.getMachineNode(LoongArch::PseudoLA_PCREL_LARGE, DL, Ty,

                                        Tmp, Addr),

                     0);

    } else {

      // This generates the pattern (PseudoLA_GOT_LARGE tmp sym), that

      // eventually becomes the desired 5-insn code sequence.

      Load = SDValue(

          DAG.getMachineNode(LoongArch::PseudoLA_GOT_LARGE, DL, Ty, Tmp, Addr),

          0);

    }

    break;

  }


  case CodeModel::Small:

  case CodeModel::Medium:

    if (IsLocal) {

      // This generates the pattern (PseudoLA_PCREL sym), which expands to

      // (addi.w/d (pcalau12i %pc_hi20(sym)) %pc_lo12(sym)).

      Load = SDValue(

          DAG.getMachineNode(LoongArch::PseudoLA_PCREL, DL, Ty, Addr), 0);

    } else {

      // This generates the pattern (PseudoLA_GOT sym), which expands to (ld.w/d

      // (pcalau12i %got_pc_hi20(sym)) %got_pc_lo12(sym)).

      Load =

          SDValue(DAG.getMachineNode(LoongArch::PseudoLA_GOT, DL, Ty, Addr), 0);

    }

  }


  if (!IsLocal) {

    // Mark the load instruction as invariant to enable hoisting in MachineLICM.

    MachineFunction &MF = DAG.getMachineFunction();

    MachineMemOperand *MemOp = MF.getMachineMemOperand(

        MachinePointerInfo::getGOT(MF),

        MachineMemOperand::MOLoad | MachineMemOperand::MODereferenceable |

            MachineMemOperand::MOInvariant,

        LLT(Ty.getSimpleVT()), Align(Ty.getFixedSizeInBits() / 8));

    DAG.setNodeMemRefs(cast<MachineSDNode>(Load.getNode()), {MemOp});

  }


  return Load;

}


SDValue LoongArchTargetLowering::lowerBlockAddress(SDValue Op,

                                                   SelectionDAG &DAG) const {

  return getAddr(cast<BlockAddressSDNode>(Op), DAG,

                 DAG.getTarget().getCodeModel());

}


SDValue LoongArchTargetLowering::lowerJumpTable(SDValue Op,

                                                SelectionDAG &DAG) const {

  return getAddr(cast<JumpTableSDNode>(Op), DAG,

                 DAG.getTarget().getCodeModel());

}


SDValue LoongArchTargetLowering::lowerConstantPool(SDValue Op,

                                                   SelectionDAG &DAG) const {

  return getAddr(cast<ConstantPoolSDNode>(Op), DAG,

                 DAG.getTarget().getCodeModel());

}


SDValue LoongArchTargetLowering::lowerGlobalAddress(SDValue Op,

                                                    SelectionDAG &DAG) const {

  GlobalAddressSDNode *N = cast<GlobalAddressSDNode>(Op);

  assert(N->getOffset() == 0 && "unexpected offset in global node");

  auto CM = DAG.getTarget().getCodeModel();

  const GlobalValue *GV = N->getGlobal();


  if (GV->isDSOLocal() && isa<GlobalVariable>(GV)) {

    if (auto GCM = dyn_cast<GlobalVariable>(GV)->getCodeModel())

      CM = *GCM;

  }


  return getAddr(N, DAG, CM, GV->isDSOLocal());

}


SDValue LoongArchTargetLowering::getStaticTLSAddr(GlobalAddressSDNode *N,

                                                  SelectionDAG &DAG,

                                                  unsigned Opc, bool UseGOT,

                                                  bool Large) const {

  SDLoc DL(N);

  EVT Ty = getPointerTy(DAG.getDataLayout());

  MVT GRLenVT = Subtarget.getGRLenVT();


  // This is not actually used, but is necessary for successfully matching the

  // PseudoLA_*_LARGE nodes.

  SDValue Tmp = DAG.getConstant(0, DL, Ty);

  SDValue Addr = DAG.getTargetGlobalAddress(N->getGlobal(), DL, Ty, 0, 0);


  // Only IE needs an extra argument for large code model.

  SDValue Offset = Opc == LoongArch::PseudoLA_TLS_IE_LARGE

                       ? SDValue(DAG.getMachineNode(Opc, DL, Ty, Tmp, Addr), 0)

                       : SDValue(DAG.getMachineNode(Opc, DL, Ty, Addr), 0);


  // If it is LE for normal/medium code model, the add tp operation will occur

  // during the pseudo-instruction expansion.

  if (Opc == LoongArch::PseudoLA_TLS_LE && !Large)

    return Offset;


  if (UseGOT) {

    // Mark the load instruction as invariant to enable hoisting in MachineLICM.

    MachineFunction &MF = DAG.getMachineFunction();

    MachineMemOperand *MemOp = MF.getMachineMemOperand(

        MachinePointerInfo::getGOT(MF),

        MachineMemOperand::MOLoad | MachineMemOperand::MODereferenceable |

            MachineMemOperand::MOInvariant,

        LLT(Ty.getSimpleVT()), Align(Ty.getFixedSizeInBits() / 8));

    DAG.setNodeMemRefs(cast<MachineSDNode>(Offset.getNode()), {MemOp});

  }


  // Add the thread pointer.

  return DAG.getNode(ISD::ADD, DL, Ty, Offset,

                     DAG.getRegister(LoongArch::R2, GRLenVT));

}


SDValue LoongArchTargetLowering::getDynamicTLSAddr(GlobalAddressSDNode *N,

                                                   SelectionDAG &DAG,

                                                   unsigned Opc,

                                                   bool Large) const {

  SDLoc DL(N);

  EVT Ty = getPointerTy(DAG.getDataLayout());

  IntegerType *CallTy = Type::getIntNTy(*DAG.getContext(), Ty.getSizeInBits());


  // This is not actually used, but is necessary for successfully matching the

  // PseudoLA_*_LARGE nodes.

  SDValue Tmp = DAG.getConstant(0, DL, Ty);


  // Use a PC-relative addressing mode to access the dynamic GOT address.

  SDValue Addr = DAG.getTargetGlobalAddress(N->getGlobal(), DL, Ty, 0, 0);

  SDValue Load = Large ? SDValue(DAG.getMachineNode(Opc, DL, Ty, Tmp, Addr), 0)

                       : SDValue(DAG.getMachineNode(Opc, DL, Ty, Addr), 0);


  // Prepare argument list to generate call.

  ArgListTy Args;

  ArgListEntry Entry;

  Entry.Node = Load;

  Entry.Ty = CallTy;

  Args.push_back(Entry);


  // Setup call to __tls_get_addr.

  TargetLowering::CallLoweringInfo CLI(DAG);

  CLI.setDebugLoc(DL)

      .setChain(DAG.getEntryNode())

      .setLibCallee(CallingConv::C, CallTy,

                    DAG.getExternalSymbol("__tls_get_addr", Ty),

                    std::move(Args));


  return LowerCallTo(CLI).first;

}


SDValue LoongArchTargetLowering::getTLSDescAddr(GlobalAddressSDNode *N,

                                                SelectionDAG &DAG, unsigned Opc,

                                                bool Large) const {

  SDLoc DL(N);

  EVT Ty = getPointerTy(DAG.getDataLayout());

  const GlobalValue *GV = N->getGlobal();


  // This is not actually used, but is necessary for successfully matching the

  // PseudoLA_*_LARGE nodes.

  SDValue Tmp = DAG.getConstant(0, DL, Ty);


  // Use a PC-relative addressing mode to access the global dynamic GOT address.

  // This generates the pattern (PseudoLA_TLS_DESC_PC{,LARGE} sym).

  SDValue Addr = DAG.getTargetGlobalAddress(GV, DL, Ty, 0, 0);

  return Large ? SDValue(DAG.getMachineNode(Opc, DL, Ty, Tmp, Addr), 0)

               : SDValue(DAG.getMachineNode(Opc, DL, Ty, Addr), 0);

}


SDValue

LoongArchTargetLowering::lowerGlobalTLSAddress(SDValue Op,

                                               SelectionDAG &DAG) const {

  if (DAG.getMachineFunction().getFunction().getCallingConv() ==

      CallingConv::GHC)

    report_fatal_error("In GHC calling convention TLS is not supported");


  bool Large = DAG.getTarget().getCodeModel() == CodeModel::Large;

  assert((!Large || Subtarget.is64Bit()) && "Large code model requires LA64");


  GlobalAddressSDNode *N = cast<GlobalAddressSDNode>(Op);

  assert(N->getOffset() == 0 && "unexpected offset in global node");


  if (DAG.getTarget().useEmulatedTLS())

    report_fatal_error("the emulated TLS is prohibited",

                       /*GenCrashDiag=*/false);


  bool IsDesc = DAG.getTarget().useTLSDESC();


  switch (getTargetMachine().getTLSModel(N->getGlobal())) {

  case TLSModel::GeneralDynamic:

    // In this model, application code calls the dynamic linker function

    // __tls_get_addr to locate TLS offsets into the dynamic thread vector at

    // runtime.

    if (!IsDesc)

      return getDynamicTLSAddr(N, DAG,

                               Large ? LoongArch::PseudoLA_TLS_GD_LARGE

                                     : LoongArch::PseudoLA_TLS_GD,

                               Large);

    break;

  case TLSModel::LocalDynamic:

    // Same as GeneralDynamic, except for assembly modifiers and relocation

    // records.

    if (!IsDesc)

      return getDynamicTLSAddr(N, DAG,

                               Large ? LoongArch::PseudoLA_TLS_LD_LARGE

                                     : LoongArch::PseudoLA_TLS_LD,

                               Large);

    break;

  case TLSModel::InitialExec:

    // This model uses the GOT to resolve TLS offsets.

    return getStaticTLSAddr(N, DAG,

                            Large ? LoongArch::PseudoLA_TLS_IE_LARGE

                                  : LoongArch::PseudoLA_TLS_IE,

                            /*UseGOT=*/true, Large);

  case TLSModel::LocalExec:

    // This model is used when static linking as the TLS offsets are resolved

    // during program linking.

    //

    // This node doesn't need an extra argument for the large code model.

    return getStaticTLSAddr(N, DAG, LoongArch::PseudoLA_TLS_LE,

                            /*UseGOT=*/false, Large);

  }


  return getTLSDescAddr(N, DAG,

                        Large ? LoongArch::PseudoLA_TLS_DESC_LARGE

                              : LoongArch::PseudoLA_TLS_DESC,

                        Large);

}


template <unsigned N>

static SDValue checkIntrinsicImmArg(SDValue Op, unsigned ImmOp,

                                    SelectionDAG &DAG, bool IsSigned = false) {

  auto *CImm = cast<ConstantSDNode>(Op->getOperand(ImmOp));

  // Check the ImmArg.

  if ((IsSigned && !isInt<N>(CImm->getSExtValue())) ||

      (!IsSigned && !isUInt<N>(CImm->getZExtValue()))) {

    DAG.getContext()->emitError(Op->getOperationName(0) +

                                ": argument out of range.");

    return DAG.getNode(ISD::UNDEF, SDLoc(Op), Op.getValueType());

  }

  return SDValue();

}


SDValue

LoongArchTargetLowering::lowerINTRINSIC_WO_CHAIN(SDValue Op,

                                                 SelectionDAG &DAG) const {

  SDLoc DL(Op);

  switch (Op.getConstantOperandVal(0)) {

  default:

    return SDValue(); // Don't custom lower most intrinsics.

  case Intrinsic::thread_pointer: {

    EVT PtrVT = getPointerTy(DAG.getDataLayout());

    return DAG.getRegister(LoongArch::R2, PtrVT);

  }

  case Intrinsic::loongarch_lsx_vpickve2gr_d:

  case Intrinsic::loongarch_lsx_vpickve2gr_du:

  case Intrinsic::loongarch_lsx_vreplvei_d:

  case Intrinsic::loongarch_lasx_xvrepl128vei_d:

    return checkIntrinsicImmArg<1>(Op, 2, DAG);

  case Intrinsic::loongarch_lsx_vreplvei_w:

  case Intrinsic::loongarch_lasx_xvrepl128vei_w:

  case Intrinsic::loongarch_lasx_xvpickve2gr_d:

  case Intrinsic::loongarch_lasx_xvpickve2gr_du:

  case Intrinsic::loongarch_lasx_xvpickve_d:

  case Intrinsic::loongarch_lasx_xvpickve_d_f:

    return checkIntrinsicImmArg<2>(Op, 2, DAG);

  case Intrinsic::loongarch_lasx_xvinsve0_d:

    return checkIntrinsicImmArg<2>(Op, 3, DAG);

  case Intrinsic::loongarch_lsx_vsat_b:

  case Intrinsic::loongarch_lsx_vsat_bu:

  case Intrinsic::loongarch_lsx_vrotri_b:

  case Intrinsic::loongarch_lsx_vsllwil_h_b:

  case Intrinsic::loongarch_lsx_vsllwil_hu_bu:

  case Intrinsic::loongarch_lsx_vsrlri_b:

  case Intrinsic::loongarch_lsx_vsrari_b:

  case Intrinsic::loongarch_lsx_vreplvei_h:

  case Intrinsic::loongarch_lasx_xvsat_b:

  case Intrinsic::loongarch_lasx_xvsat_bu:

  case Intrinsic::loongarch_lasx_xvrotri_b:

  case Intrinsic::loongarch_lasx_xvsllwil_h_b:

  case Intrinsic::loongarch_lasx_xvsllwil_hu_bu:

  case Intrinsic::loongarch_lasx_xvsrlri_b:

  case Intrinsic::loongarch_lasx_xvsrari_b:

  case Intrinsic::loongarch_lasx_xvrepl128vei_h:

  case Intrinsic::loongarch_lasx_xvpickve_w:

  case Intrinsic::loongarch_lasx_xvpickve_w_f:

    return checkIntrinsicImmArg<3>(Op, 2, DAG);

  case Intrinsic::loongarch_lasx_xvinsve0_w:

    return checkIntrinsicImmArg<3>(Op, 3, DAG);

  case Intrinsic::loongarch_lsx_vsat_h:

  case Intrinsic::loongarch_lsx_vsat_hu:

  case Intrinsic::loongarch_lsx_vrotri_h:

  case Intrinsic::loongarch_lsx_vsllwil_w_h:

  case Intrinsic::loongarch_lsx_vsllwil_wu_hu:

  case Intrinsic::loongarch_lsx_vsrlri_h:

  case Intrinsic::loongarch_lsx_vsrari_h:

  case Intrinsic::loongarch_lsx_vreplvei_b:

  case Intrinsic::loongarch_lasx_xvsat_h:

  case Intrinsic::loongarch_lasx_xvsat_hu:

  case Intrinsic::loongarch_lasx_xvrotri_h:

  case Intrinsic::loongarch_lasx_xvsllwil_w_h:

  case Intrinsic::loongarch_lasx_xvsllwil_wu_hu:

  case Intrinsic::loongarch_lasx_xvsrlri_h:

  case Intrinsic::loongarch_lasx_xvsrari_h:

  case Intrinsic::loongarch_lasx_xvrepl128vei_b:

    return checkIntrinsicImmArg<4>(Op, 2, DAG);

  case Intrinsic::loongarch_lsx_vsrlni_b_h:

  case Intrinsic::loongarch_lsx_vsrani_b_h:

  case Intrinsic::loongarch_lsx_vsrlrni_b_h:

  case Intrinsic::loongarch_lsx_vsrarni_b_h:

  case Intrinsic::loongarch_lsx_vssrlni_b_h:

  case Intrinsic::loongarch_lsx_vssrani_b_h:

  case Intrinsic::loongarch_lsx_vssrlni_bu_h:

  case Intrinsic::loongarch_lsx_vssrani_bu_h:

  case Intrinsic::loongarch_lsx_vssrlrni_b_h:

  case Intrinsic::loongarch_lsx_vssrarni_b_h:

  case Intrinsic::loongarch_lsx_vssrlrni_bu_h:

  case Intrinsic::loongarch_lsx_vssrarni_bu_h:

  case Intrinsic::loongarch_lasx_xvsrlni_b_h:

  case Intrinsic::loongarch_lasx_xvsrani_b_h:

  case Intrinsic::loongarch_lasx_xvsrlrni_b_h:

  case Intrinsic::loongarch_lasx_xvsrarni_b_h:

  case Intrinsic::loongarch_lasx_xvssrlni_b_h:

  case Intrinsic::loongarch_lasx_xvssrani_b_h:

  case Intrinsic::loongarch_lasx_xvssrlni_bu_h:

  case Intrinsic::loongarch_lasx_xvssrani_bu_h:

  case Intrinsic::loongarch_lasx_xvssrlrni_b_h:

  case Intrinsic::loongarch_lasx_xvssrarni_b_h:

  case Intrinsic::loongarch_lasx_xvssrlrni_bu_h:

  case Intrinsic::loongarch_lasx_xvssrarni_bu_h:

    return checkIntrinsicImmArg<4>(Op, 3, DAG);

  case Intrinsic::loongarch_lsx_vsat_w:

  case Intrinsic::loongarch_lsx_vsat_wu:

  case Intrinsic::loongarch_lsx_vrotri_w:

  case Intrinsic::loongarch_lsx_vsllwil_d_w:

  case Intrinsic::loongarch_lsx_vsllwil_du_wu:

  case Intrinsic::loongarch_lsx_vsrlri_w:

  case Intrinsic::loongarch_lsx_vsrari_w:

  case Intrinsic::loongarch_lsx_vslei_bu:

  case Intrinsic::loongarch_lsx_vslei_hu:

  case Intrinsic::loongarch_lsx_vslei_wu:

  case Intrinsic::loongarch_lsx_vslei_du:

  case Intrinsic::loongarch_lsx_vslti_bu:

  case Intrinsic::loongarch_lsx_vslti_hu:

  case Intrinsic::loongarch_lsx_vslti_wu:

  case Intrinsic::loongarch_lsx_vslti_du:

  case Intrinsic::loongarch_lsx_vbsll_v:

  case Intrinsic::loongarch_lsx_vbsrl_v:

  case Intrinsic::loongarch_lasx_xvsat_w:

  case Intrinsic::loongarch_lasx_xvsat_wu:

  case Intrinsic::loongarch_lasx_xvrotri_w:

  case Intrinsic::loongarch_lasx_xvsllwil_d_w:

  case Intrinsic::loongarch_lasx_xvsllwil_du_wu:

  case Intrinsic::loongarch_lasx_xvsrlri_w:

  case Intrinsic::loongarch_lasx_xvsrari_w:

  case Intrinsic::loongarch_lasx_xvslei_bu:

  case Intrinsic::loongarch_lasx_xvslei_hu:

  case Intrinsic::loongarch_lasx_xvslei_wu:

  case Intrinsic::loongarch_lasx_xvslei_du:

  case Intrinsic::loongarch_lasx_xvslti_bu:

  case Intrinsic::loongarch_lasx_xvslti_hu:

  case Intrinsic::loongarch_lasx_xvslti_wu:

  case Intrinsic::loongarch_lasx_xvslti_du:

  case Intrinsic::loongarch_lasx_xvbsll_v:

  case Intrinsic::loongarch_lasx_xvbsrl_v:

    return checkIntrinsicImmArg<5>(Op, 2, DAG);

  case Intrinsic::loongarch_lsx_vseqi_b:

  case Intrinsic::loongarch_lsx_vseqi_h:

  case Intrinsic::loongarch_lsx_vseqi_w:

  case Intrinsic::loongarch_lsx_vseqi_d:

  case Intrinsic::loongarch_lsx_vslei_b:

  case Intrinsic::loongarch_lsx_vslei_h:

  case Intrinsic::loongarch_lsx_vslei_w:

  case Intrinsic::loongarch_lsx_vslei_d:

  case Intrinsic::loongarch_lsx_vslti_b:

  case Intrinsic::loongarch_lsx_vslti_h:

  case Intrinsic::loongarch_lsx_vslti_w:

  case Intrinsic::loongarch_lsx_vslti_d:

  case Intrinsic::loongarch_lasx_xvseqi_b:

  case Intrinsic::loongarch_lasx_xvseqi_h:

  case Intrinsic::loongarch_lasx_xvseqi_w:

  case Intrinsic::loongarch_lasx_xvseqi_d:

  case Intrinsic::loongarch_lasx_xvslei_b:

  case Intrinsic::loongarch_lasx_xvslei_h:

  case Intrinsic::loongarch_lasx_xvslei_w:

  case Intrinsic::loongarch_lasx_xvslei_d:

  case Intrinsic::loongarch_lasx_xvslti_b:

  case Intrinsic::loongarch_lasx_xvslti_h:

  case Intrinsic::loongarch_lasx_xvslti_w:

  case Intrinsic::loongarch_lasx_xvslti_d:

    return checkIntrinsicImmArg<5>(Op, 2, DAG, /*IsSigned=*/true);

  case Intrinsic::loongarch_lsx_vsrlni_h_w:

  case Intrinsic::loongarch_lsx_vsrani_h_w:

  case Intrinsic::loongarch_lsx_vsrlrni_h_w:

  case Intrinsic::loongarch_lsx_vsrarni_h_w:

  case Intrinsic::loongarch_lsx_vssrlni_h_w:

  case Intrinsic::loongarch_lsx_vssrani_h_w:

  case Intrinsic::loongarch_lsx_vssrlni_hu_w:

  case Intrinsic::loongarch_lsx_vssrani_hu_w:

  case Intrinsic::loongarch_lsx_vssrlrni_h_w:

  case Intrinsic::loongarch_lsx_vssrarni_h_w:

  case Intrinsic::loongarch_lsx_vssrlrni_hu_w:

  case Intrinsic::loongarch_lsx_vssrarni_hu_w:

  case Intrinsic::loongarch_lsx_vfrstpi_b:

  case Intrinsic::loongarch_lsx_vfrstpi_h:

  case Intrinsic::loongarch_lasx_xvsrlni_h_w:

  case Intrinsic::loongarch_lasx_xvsrani_h_w:

  case Intrinsic::loongarch_lasx_xvsrlrni_h_w:

  case Intrinsic::loongarch_lasx_xvsrarni_h_w:

  case Intrinsic::loongarch_lasx_xvssrlni_h_w:

  case Intrinsic::loongarch_lasx_xvssrani_h_w:

  case Intrinsic::loongarch_lasx_xvssrlni_hu_w:

  case Intrinsic::loongarch_lasx_xvssrani_hu_w:

  case Intrinsic::loongarch_lasx_xvssrlrni_h_w:

  case Intrinsic::loongarch_lasx_xvssrarni_h_w:

  case Intrinsic::loongarch_lasx_xvssrlrni_hu_w:

  case Intrinsic::loongarch_lasx_xvssrarni_hu_w:

  case Intrinsic::loongarch_lasx_xvfrstpi_b:

  case Intrinsic::loongarch_lasx_xvfrstpi_h:

    return checkIntrinsicImmArg<5>(Op, 3, DAG);

  case Intrinsic::loongarch_lsx_vsat_d:

  case Intrinsic::loongarch_lsx_vsat_du:

  case Intrinsic::loongarch_lsx_vrotri_d:

  case Intrinsic::loongarch_lsx_vsrlri_d:

  case Intrinsic::loongarch_lsx_vsrari_d:

  case Intrinsic::loongarch_lasx_xvsat_d:

  case Intrinsic::loongarch_lasx_xvsat_du:

  case Intrinsic::loongarch_lasx_xvrotri_d:

  case Intrinsic::loongarch_lasx_xvsrlri_d:

  case Intrinsic::loongarch_lasx_xvsrari_d:

    return checkIntrinsicImmArg<6>(Op, 2, DAG);

  case Intrinsic::loongarch_lsx_vsrlni_w_d:

  case Intrinsic::loongarch_lsx_vsrani_w_d:

  case Intrinsic::loongarch_lsx_vsrlrni_w_d:

  case Intrinsic::loongarch_lsx_vsrarni_w_d:

  case Intrinsic::loongarch_lsx_vssrlni_w_d:

  case Intrinsic::loongarch_lsx_vssrani_w_d:

  case Intrinsic::loongarch_lsx_vssrlni_wu_d:

  case Intrinsic::loongarch_lsx_vssrani_wu_d:

  case Intrinsic::loongarch_lsx_vssrlrni_w_d:

  case Intrinsic::loongarch_lsx_vssrarni_w_d:

  case Intrinsic::loongarch_lsx_vssrlrni_wu_d:

  case Intrinsic::loongarch_lsx_vssrarni_wu_d:

  case Intrinsic::loongarch_lasx_xvsrlni_w_d:

  case Intrinsic::loongarch_lasx_xvsrani_w_d:

  case Intrinsic::loongarch_lasx_xvsrlrni_w_d:

  case Intrinsic::loongarch_lasx_xvsrarni_w_d:

  case Intrinsic::loongarch_lasx_xvssrlni_w_d:

  case Intrinsic::loongarch_lasx_xvssrani_w_d:

  case Intrinsic::loongarch_lasx_xvssrlni_wu_d:

  case Intrinsic::loongarch_lasx_xvssrani_wu_d:

  case Intrinsic::loongarch_lasx_xvssrlrni_w_d:

  case Intrinsic::loongarch_lasx_xvssrarni_w_d:

  case Intrinsic::loongarch_lasx_xvssrlrni_wu_d:

  case Intrinsic::loongarch_lasx_xvssrarni_wu_d:

    return checkIntrinsicImmArg<6>(Op, 3, DAG);

  case Intrinsic::loongarch_lsx_vsrlni_d_q:

  case Intrinsic::loongarch_lsx_vsrani_d_q:

  case Intrinsic::loongarch_lsx_vsrlrni_d_q:

  case Intrinsic::loongarch_lsx_vsrarni_d_q:

  case Intrinsic::loongarch_lsx_vssrlni_d_q:

  case Intrinsic::loongarch_lsx_vssrani_d_q:

  case Intrinsic::loongarch_lsx_vssrlni_du_q:

  case Intrinsic::loongarch_lsx_vssrani_du_q:

  case Intrinsic::loongarch_lsx_vssrlrni_d_q:

  case Intrinsic::loongarch_lsx_vssrarni_d_q:

  case Intrinsic::loongarch_lsx_vssrlrni_du_q:

  case Intrinsic::loongarch_lsx_vssrarni_du_q:

  case Intrinsic::loongarch_lasx_xvsrlni_d_q:

  case Intrinsic::loongarch_lasx_xvsrani_d_q:

  case Intrinsic::loongarch_lasx_xvsrlrni_d_q:

  case Intrinsic::loongarch_lasx_xvsrarni_d_q:

  case Intrinsic::loongarch_lasx_xvssrlni_d_q:

  case Intrinsic::loongarch_lasx_xvssrani_d_q:

  case Intrinsic::loongarch_lasx_xvssrlni_du_q:

  case Intrinsic::loongarch_lasx_xvssrani_du_q:

  case Intrinsic::loongarch_lasx_xvssrlrni_d_q:

  case Intrinsic::loongarch_lasx_xvssrarni_d_q:

  case Intrinsic::loongarch_lasx_xvssrlrni_du_q:

  case Intrinsic::loongarch_lasx_xvssrarni_du_q:

    return checkIntrinsicImmArg<7>(Op, 3, DAG);

  case Intrinsic::loongarch_lsx_vnori_b:

  case Intrinsic::loongarch_lsx_vshuf4i_b:

  case Intrinsic::loongarch_lsx_vshuf4i_h:

  case Intrinsic::loongarch_lsx_vshuf4i_w:

  case Intrinsic::loongarch_lasx_xvnori_b:

  case Intrinsic::loongarch_lasx_xvshuf4i_b:

  case Intrinsic::loongarch_lasx_xvshuf4i_h:

  case Intrinsic::loongarch_lasx_xvshuf4i_w:

  case Intrinsic::loongarch_lasx_xvpermi_d:

    return checkIntrinsicImmArg<8>(Op, 2, DAG);

  case Intrinsic::loongarch_lsx_vshuf4i_d:

  case Intrinsic::loongarch_lsx_vpermi_w:

  case Intrinsic::loongarch_lsx_vbitseli_b:

  case Intrinsic::loongarch_lsx_vextrins_b:

  case Intrinsic::loongarch_lsx_vextrins_h:

  case Intrinsic::loongarch_lsx_vextrins_w:

  case Intrinsic::loongarch_lsx_vextrins_d:

  case Intrinsic::loongarch_lasx_xvshuf4i_d:

  case Intrinsic::loongarch_lasx_xvpermi_w:

  case Intrinsic::loongarch_lasx_xvpermi_q:

  case Intrinsic::loongarch_lasx_xvbitseli_b:

  case Intrinsic::loongarch_lasx_xvextrins_b:

  case Intrinsic::loongarch_lasx_xvextrins_h:

  case Intrinsic::loongarch_lasx_xvextrins_w:

  case Intrinsic::loongarch_lasx_xvextrins_d:

    return checkIntrinsicImmArg<8>(Op, 3, DAG);

  case Intrinsic::loongarch_lsx_vrepli_b:

  case Intrinsic::loongarch_lsx_vrepli_h:

  case Intrinsic::loongarch_lsx_vrepli_w:

  case Intrinsic::loongarch_lsx_vrepli_d:

  case Intrinsic::loongarch_lasx_xvrepli_b:

  case Intrinsic::loongarch_lasx_xvrepli_h:

  case Intrinsic::loongarch_lasx_xvrepli_w:

  case Intrinsic::loongarch_lasx_xvrepli_d:

    return checkIntrinsicImmArg<10>(Op, 1, DAG, /*IsSigned=*/true);

  case Intrinsic::loongarch_lsx_vldi:

  case Intrinsic::loongarch_lasx_xvldi:

    return checkIntrinsicImmArg<13>(Op, 1, DAG, /*IsSigned=*/true);

  }

}


// Helper function that emits error message for intrinsics with chain and return

// merge values of a UNDEF and the chain.

static SDValue emitIntrinsicWithChainErrorMessage(SDValue Op,

                                                  StringRef ErrorMsg,

                                                  SelectionDAG &DAG) {

  DAG.getContext()->emitError(Op->getOperationName(0) + ": " + ErrorMsg + ".");

  return DAG.getMergeValues({DAG.getUNDEF(Op.getValueType()), Op.getOperand(0)},

                            SDLoc(Op));

}


SDValue

LoongArchTargetLowering::lowerINTRINSIC_W_CHAIN(SDValue Op,

                                                SelectionDAG &DAG) const {

  SDLoc DL(Op);

  MVT GRLenVT = Subtarget.getGRLenVT();

  EVT VT = Op.getValueType();

  SDValue Chain = Op.getOperand(0);

  const StringRef ErrorMsgOOR = "argument out of range";

  const StringRef ErrorMsgReqLA64 = "requires loongarch64";

  const StringRef ErrorMsgReqF = "requires basic 'f' target feature";


  switch (Op.getConstantOperandVal(1)) {

  default:

    return Op;

  case Intrinsic::loongarch_crc_w_b_w:

  case Intrinsic::loongarch_crc_w_h_w:

  case Intrinsic::loongarch_crc_w_w_w:

  case Intrinsic::loongarch_crc_w_d_w:

  case Intrinsic::loongarch_crcc_w_b_w:

  case Intrinsic::loongarch_crcc_w_h_w:

  case Intrinsic::loongarch_crcc_w_w_w:

  case Intrinsic::loongarch_crcc_w_d_w:

    return emitIntrinsicWithChainErrorMessage(Op, ErrorMsgReqLA64, DAG);

  case Intrinsic::loongarch_csrrd_w:

  case Intrinsic::loongarch_csrrd_d: {

    unsigned Imm = Op.getConstantOperandVal(2);

    return !isUInt<14>(Imm)

               ? emitIntrinsicWithChainErrorMessage(Op, ErrorMsgOOR, DAG)

               : DAG.getNode(LoongArchISD::CSRRD, DL, {GRLenVT, MVT::Other},

                             {Chain, DAG.getConstant(Imm, DL, GRLenVT)});

  }

  case Intrinsic::loongarch_csrwr_w:

  case Intrinsic::loongarch_csrwr_d: {

    unsigned Imm = Op.getConstantOperandVal(3);

    return !isUInt<14>(Imm)

               ? emitIntrinsicWithChainErrorMessage(Op, ErrorMsgOOR, DAG)

               : DAG.getNode(LoongArchISD::CSRWR, DL, {GRLenVT, MVT::Other},

                             {Chain, Op.getOperand(2),

                              DAG.getConstant(Imm, DL, GRLenVT)});

  }

  case Intrinsic::loongarch_csrxchg_w:

  case Intrinsic::loongarch_csrxchg_d: {

    unsigned Imm = Op.getConstantOperandVal(4);

    return !isUInt<14>(Imm)

               ? emitIntrinsicWithChainErrorMessage(Op, ErrorMsgOOR, DAG)

               : DAG.getNode(LoongArchISD::CSRXCHG, DL, {GRLenVT, MVT::Other},

                             {Chain, Op.getOperand(2), Op.getOperand(3),

                              DAG.getConstant(Imm, DL, GRLenVT)});

  }

  case Intrinsic::loongarch_iocsrrd_d: {

    return DAG.getNode(

        LoongArchISD::IOCSRRD_D, DL, {GRLenVT, MVT::Other},

        {Chain, DAG.getNode(ISD::ANY_EXTEND, DL, MVT::i64, Op.getOperand(2))});

  }

#define IOCSRRD_CASE(NAME, NODE)                                               \

  case Intrinsic::loongarch_##NAME: {                                          \

    return DAG.getNode(LoongArchISD::NODE, DL, {GRLenVT, MVT::Other},          \

                       {Chain, Op.getOperand(2)});                             \

  }

    IOCSRRD_CASE(iocsrrd_b, IOCSRRD_B);

    IOCSRRD_CASE(iocsrrd_h, IOCSRRD_H);

    IOCSRRD_CASE(iocsrrd_w, IOCSRRD_W);

#undef IOCSRRD_CASE

  case Intrinsic::loongarch_cpucfg: {

    return DAG.getNode(LoongArchISD::CPUCFG, DL, {GRLenVT, MVT::Other},

                       {Chain, Op.getOperand(2)});

  }

  case Intrinsic::loongarch_lddir_d: {

    unsigned Imm = Op.getConstantOperandVal(3);

    return !isUInt<8>(Imm)

               ? emitIntrinsicWithChainErrorMessage(Op, ErrorMsgOOR, DAG)

               : Op;

  }

  case Intrinsic::loongarch_movfcsr2gr: {

    if (!Subtarget.hasBasicF())

      return emitIntrinsicWithChainErrorMessage(Op, ErrorMsgReqF, DAG);

    unsigned Imm = Op.getConstantOperandVal(2);

    return !isUInt<2>(Imm)

               ? emitIntrinsicWithChainErrorMessage(Op, ErrorMsgOOR, DAG)

               : DAG.getNode(LoongArchISD::MOVFCSR2GR, DL, {VT, MVT::Other},

                             {Chain, DAG.getConstant(Imm, DL, GRLenVT)});

  }

  case Intrinsic::loongarch_lsx_vld:

  case Intrinsic::loongarch_lsx_vldrepl_b:

  case Intrinsic::loongarch_lasx_xvld:

  case Intrinsic::loongarch_lasx_xvldrepl_b:

    return !isInt<12>(cast<ConstantSDNode>(Op.getOperand(3))->getSExtValue())

               ? emitIntrinsicWithChainErrorMessage(Op, ErrorMsgOOR, DAG)

               : SDValue();

  case Intrinsic::loongarch_lsx_vldrepl_h:

  case Intrinsic::loongarch_lasx_xvldrepl_h:

    return !isShiftedInt<11, 1>(

               cast<ConstantSDNode>(Op.getOperand(3))->getSExtValue())

               ? emitIntrinsicWithChainErrorMessage(

                     Op, "argument out of range or not a multiple of 2", DAG)

               : SDValue();

  case Intrinsic::loongarch_lsx_vldrepl_w:

  case Intrinsic::loongarch_lasx_xvldrepl_w:

    return !isShiftedInt<10, 2>(

               cast<ConstantSDNode>(Op.getOperand(3))->getSExtValue())

               ? emitIntrinsicWithChainErrorMessage(

                     Op, "argument out of range or not a multiple of 4", DAG)

               : SDValue();

  case Intrinsic::loongarch_lsx_vldrepl_d:

  case Intrinsic::loongarch_lasx_xvldrepl_d:

    return !isShiftedInt<9, 3>(

               cast<ConstantSDNode>(Op.getOperand(3))->getSExtValue())

               ? emitIntrinsicWithChainErrorMessage(

                     Op, "argument out of range or not a multiple of 8", DAG)

               : SDValue();

  }

}


// Helper function that emits error message for intrinsics with void return

// value and return the chain.

static SDValue emitIntrinsicErrorMessage(SDValue Op, StringRef ErrorMsg,

                                         SelectionDAG &DAG) {


  DAG.getContext()->emitError(Op->getOperationName(0) + ": " + ErrorMsg + ".");

  return Op.getOperand(0);

}


SDValue LoongArchTargetLowering::lowerINTRINSIC_VOID(SDValue Op,

                                                     SelectionDAG &DAG) const {

  SDLoc DL(Op);

  MVT GRLenVT = Subtarget.getGRLenVT();

  SDValue Chain = Op.getOperand(0);

  uint64_t IntrinsicEnum = Op.getConstantOperandVal(1);

  SDValue Op2 = Op.getOperand(2);

  const StringRef ErrorMsgOOR = "argument out of range";

  const StringRef ErrorMsgReqLA64 = "requires loongarch64";

  const StringRef ErrorMsgReqLA32 = "requires loongarch32";

  const StringRef ErrorMsgReqF = "requires basic 'f' target feature";


  switch (IntrinsicEnum) {

  default:

    // TODO: Add more Intrinsics.

    return SDValue();

  case Intrinsic::loongarch_cacop_d:

  case Intrinsic::loongarch_cacop_w: {

    if (IntrinsicEnum == Intrinsic::loongarch_cacop_d && !Subtarget.is64Bit())

      return emitIntrinsicErrorMessage(Op, ErrorMsgReqLA64, DAG);

    if (IntrinsicEnum == Intrinsic::loongarch_cacop_w && Subtarget.is64Bit())

      return emitIntrinsicErrorMessage(Op, ErrorMsgReqLA32, DAG);

    // call void @llvm.loongarch.cacop.[d/w](uimm5, rj, simm12)

    unsigned Imm1 = Op2->getAsZExtVal();

    int Imm2 = cast<ConstantSDNode>(Op.getOperand(4))->getSExtValue();

    if (!isUInt<5>(Imm1) || !isInt<12>(Imm2))

      return emitIntrinsicErrorMessage(Op, ErrorMsgOOR, DAG);

    return Op;

  }

  case Intrinsic::loongarch_dbar: {

    unsigned Imm = Op2->getAsZExtVal();

    return !isUInt<15>(Imm)

               ? emitIntrinsicErrorMessage(Op, ErrorMsgOOR, DAG)

               : DAG.getNode(LoongArchISD::DBAR, DL, MVT::Other, Chain,

                             DAG.getConstant(Imm, DL, GRLenVT));

  }

  case Intrinsic::loongarch_ibar: {

    unsigned Imm = Op2->getAsZExtVal();

    return !isUInt<15>(Imm)

               ? emitIntrinsicErrorMessage(Op, ErrorMsgOOR, DAG)

               : DAG.getNode(LoongArchISD::IBAR, DL, MVT::Other, Chain,

                             DAG.getConstant(Imm, DL, GRLenVT));

  }

  case Intrinsic::loongarch_break: {

    unsigned Imm = Op2->getAsZExtVal();

    return !isUInt<15>(Imm)

               ? emitIntrinsicErrorMessage(Op, ErrorMsgOOR, DAG)

               : DAG.getNode(LoongArchISD::BREAK, DL, MVT::Other, Chain,

                             DAG.getConstant(Imm, DL, GRLenVT));

  }

  case Intrinsic::loongarch_movgr2fcsr: {

    if (!Subtarget.hasBasicF())

      return emitIntrinsicErrorMessage(Op, ErrorMsgReqF, DAG);

    unsigned Imm = Op2->getAsZExtVal();

    return !isUInt<2>(Imm)

               ? emitIntrinsicErrorMessage(Op, ErrorMsgOOR, DAG)

               : DAG.getNode(LoongArchISD::MOVGR2FCSR, DL, MVT::Other, Chain,

                             DAG.getConstant(Imm, DL, GRLenVT),

                             DAG.getNode(ISD::ANY_EXTEND, DL, GRLenVT,

                                         Op.getOperand(3)));

  }

  case Intrinsic::loongarch_syscall: {

    unsigned Imm = Op2->getAsZExtVal();

    return !isUInt<15>(Imm)

               ? emitIntrinsicErrorMessage(Op, ErrorMsgOOR, DAG)

               : DAG.getNode(LoongArchISD::SYSCALL, DL, MVT::Other, Chain,

                             DAG.getConstant(Imm, DL, GRLenVT));

  }

#define IOCSRWR_CASE(NAME, NODE)                                               \

  case Intrinsic::loongarch_##NAME: {                                          \

    SDValue Op3 = Op.getOperand(3);                                            \

    return Subtarget.is64Bit()                                                 \

               ? DAG.getNode(LoongArchISD::NODE, DL, MVT::Other, Chain,        \

                             DAG.getNode(ISD::ANY_EXTEND, DL, MVT::i64, Op2),  \

                             DAG.getNode(ISD::ANY_EXTEND, DL, MVT::i64, Op3))  \

               : DAG.getNode(LoongArchISD::NODE, DL, MVT::Other, Chain, Op2,   \

                             Op3);                                             \

  }

    IOCSRWR_CASE(iocsrwr_b, IOCSRWR_B);

    IOCSRWR_CASE(iocsrwr_h, IOCSRWR_H);

    IOCSRWR_CASE(iocsrwr_w, IOCSRWR_W);

#undef IOCSRWR_CASE

  case Intrinsic::loongarch_iocsrwr_d: {

    return !Subtarget.is64Bit()

               ? emitIntrinsicErrorMessage(Op, ErrorMsgReqLA64, DAG)

               : DAG.getNode(LoongArchISD::IOCSRWR_D, DL, MVT::Other, Chain,

                             Op2,

                             DAG.getNode(ISD::ANY_EXTEND, DL, MVT::i64,

                                         Op.getOperand(3)));

  }

#define ASRT_LE_GT_CASE(NAME)                                                  \

  case Intrinsic::loongarch_##NAME: {                                          \

    return !Subtarget.is64Bit()                                                \

               ? emitIntrinsicErrorMessage(Op, ErrorMsgReqLA64, DAG)           \

               : Op;                                                           \

  }

    ASRT_LE_GT_CASE(asrtle_d)

    ASRT_LE_GT_CASE(asrtgt_d)

#undef ASRT_LE_GT_CASE

  case Intrinsic::loongarch_ldpte_d: {

    unsigned Imm = Op.getConstantOperandVal(3);

    return !Subtarget.is64Bit()

               ? emitIntrinsicErrorMessage(Op, ErrorMsgReqLA64, DAG)

           : !isUInt<8>(Imm) ? emitIntrinsicErrorMessage(Op, ErrorMsgOOR, DAG)

                             : Op;

  }

  case Intrinsic::loongarch_lsx_vst:

  case Intrinsic::loongarch_lasx_xvst:

    return !isInt<12>(cast<ConstantSDNode>(Op.getOperand(4))->getSExtValue())

               ? emitIntrinsicErrorMessage(Op, ErrorMsgOOR, DAG)

               : SDValue();

  case Intrinsic::loongarch_lasx_xvstelm_b:

    return (!isInt<8>(cast<ConstantSDNode>(Op.getOperand(4))->getSExtValue()) ||

            !isUInt<5>(Op.getConstantOperandVal(5)))

               ? emitIntrinsicErrorMessage(Op, ErrorMsgOOR, DAG)

               : SDValue();

  case Intrinsic::loongarch_lsx_vstelm_b:

    return (!isInt<8>(cast<ConstantSDNode>(Op.getOperand(4))->getSExtValue()) ||

            !isUInt<4>(Op.getConstantOperandVal(5)))

               ? emitIntrinsicErrorMessage(Op, ErrorMsgOOR, DAG)

               : SDValue();

  case Intrinsic::loongarch_lasx_xvstelm_h:

    return (!isShiftedInt<8, 1>(

                cast<ConstantSDNode>(Op.getOperand(4))->getSExtValue()) ||

            !isUInt<4>(Op.getConstantOperandVal(5)))

               ? emitIntrinsicErrorMessage(

                     Op, "argument out of range or not a multiple of 2", DAG)

               : SDValue();

  case Intrinsic::loongarch_lsx_vstelm_h:

    return (!isShiftedInt<8, 1>(

                cast<ConstantSDNode>(Op.getOperand(4))->getSExtValue()) ||

            !isUInt<3>(Op.getConstantOperandVal(5)))

               ? emitIntrinsicErrorMessage(

                     Op, "argument out of range or not a multiple of 2", DAG)

               : SDValue();

  case Intrinsic::loongarch_lasx_xvstelm_w:

    return (!isShiftedInt<8, 2>(

                cast<ConstantSDNode>(Op.getOperand(4))->getSExtValue()) ||

            !isUInt<3>(Op.getConstantOperandVal(5)))

               ? emitIntrinsicErrorMessage(

                     Op, "argument out of range or not a multiple of 4", DAG)

               : SDValue();

  case Intrinsic::loongarch_lsx_vstelm_w:

    return (!isShiftedInt<8, 2>(

                cast<ConstantSDNode>(Op.getOperand(4))->getSExtValue()) ||

            !isUInt<2>(Op.getConstantOperandVal(5)))

               ? emitIntrinsicErrorMessage(

                     Op, "argument out of range or not a multiple of 4", DAG)

               : SDValue();

  case Intrinsic::loongarch_lasx_xvstelm_d:

    return (!isShiftedInt<8, 3>(

                cast<ConstantSDNode>(Op.getOperand(4))->getSExtValue()) ||

            !isUInt<2>(Op.getConstantOperandVal(5)))

               ? emitIntrinsicErrorMessage(

                     Op, "argument out of range or not a multiple of 8", DAG)

               : SDValue();

  case Intrinsic::loongarch_lsx_vstelm_d:

    return (!isShiftedInt<8, 3>(

                cast<ConstantSDNode>(Op.getOperand(4))->getSExtValue()) ||

            !isUInt<1>(Op.getConstantOperandVal(5)))

               ? emitIntrinsicErrorMessage(

                     Op, "argument out of range or not a multiple of 8", DAG)

               : SDValue();

  }

}


SDValue LoongArchTargetLowering::lowerShiftLeftParts(SDValue Op,

                                                     SelectionDAG &DAG) const {

  SDLoc DL(Op);

  SDValue Lo = Op.getOperand(0);

  SDValue Hi = Op.getOperand(1);

  SDValue Shamt = Op.getOperand(2);

  EVT VT = Lo.getValueType();


  // if Shamt-GRLen < 0: // Shamt < GRLen

  //   Lo = Lo << Shamt

  //   Hi = (Hi << Shamt) | ((Lo >>u 1) >>u (GRLen-1 ^ Shamt))

  // else:

  //   Lo = 0

  //   Hi = Lo << (Shamt-GRLen)


  SDValue Zero = DAG.getConstant(0, DL, VT);

  SDValue One = DAG.getConstant(1, DL, VT);

  SDValue MinusGRLen =

      DAG.getSignedConstant(-(int)Subtarget.getGRLen(), DL, VT);

  SDValue GRLenMinus1 = DAG.getConstant(Subtarget.getGRLen() - 1, DL, VT);

  SDValue ShamtMinusGRLen = DAG.getNode(ISD::ADD, DL, VT, Shamt, MinusGRLen);

  SDValue GRLenMinus1Shamt = DAG.getNode(ISD::XOR, DL, VT, Shamt, GRLenMinus1);


  SDValue LoTrue = DAG.getNode(ISD::SHL, DL, VT, Lo, Shamt);

  SDValue ShiftRight1Lo = DAG.getNode(ISD::SRL, DL, VT, Lo, One);

  SDValue ShiftRightLo =

      DAG.getNode(ISD::SRL, DL, VT, ShiftRight1Lo, GRLenMinus1Shamt);

  SDValue ShiftLeftHi = DAG.getNode(ISD::SHL, DL, VT, Hi, Shamt);

  SDValue HiTrue = DAG.getNode(ISD::OR, DL, VT, ShiftLeftHi, ShiftRightLo);

  SDValue HiFalse = DAG.getNode(ISD::SHL, DL, VT, Lo, ShamtMinusGRLen);


  SDValue CC = DAG.getSetCC(DL, VT, ShamtMinusGRLen, Zero, ISD::SETLT);


  Lo = DAG.getNode(ISD::SELECT, DL, VT, CC, LoTrue, Zero);

  Hi = DAG.getNode(ISD::SELECT, DL, VT, CC, HiTrue, HiFalse);


  SDValue Parts[2] = {Lo, Hi};

  return DAG.getMergeValues(Parts, DL);

}


SDValue LoongArchTargetLowering::lowerShiftRightParts(SDValue Op,

                                                      SelectionDAG &DAG,

                                                      bool IsSRA) const {

  SDLoc DL(Op);

  SDValue Lo = Op.getOperand(0);

  SDValue Hi = Op.getOperand(1);

  SDValue Shamt = Op.getOperand(2);

  EVT VT = Lo.getValueType();


  // SRA expansion:

  //   if Shamt-GRLen < 0: // Shamt < GRLen

  //     Lo = (Lo >>u Shamt) | ((Hi << 1) << (ShAmt ^ GRLen-1))

  //     Hi = Hi >>s Shamt

  //   else:

  //     Lo = Hi >>s (Shamt-GRLen);

  //     Hi = Hi >>s (GRLen-1)

  //

  // SRL expansion:

  //   if Shamt-GRLen < 0: // Shamt < GRLen

  //     Lo = (Lo >>u Shamt) | ((Hi << 1) << (ShAmt ^ GRLen-1))

  //     Hi = Hi >>u Shamt

  //   else:

  //     Lo = Hi >>u (Shamt-GRLen);

  //     Hi = 0;


  unsigned ShiftRightOp = IsSRA ? ISD::SRA : ISD::SRL;


  SDValue Zero = DAG.getConstant(0, DL, VT);

  SDValue One = DAG.getConstant(1, DL, VT);

  SDValue MinusGRLen =

      DAG.getSignedConstant(-(int)Subtarget.getGRLen(), DL, VT);

  SDValue GRLenMinus1 = DAG.getConstant(Subtarget.getGRLen() - 1, DL, VT);

  SDValue ShamtMinusGRLen = DAG.getNode(ISD::ADD, DL, VT, Shamt, MinusGRLen);

  SDValue GRLenMinus1Shamt = DAG.getNode(ISD::XOR, DL, VT, Shamt, GRLenMinus1);


  SDValue ShiftRightLo = DAG.getNode(ISD::SRL, DL, VT, Lo, Shamt);

  SDValue ShiftLeftHi1 = DAG.getNode(ISD::SHL, DL, VT, Hi, One);

  SDValue ShiftLeftHi =

      DAG.getNode(ISD::SHL, DL, VT, ShiftLeftHi1, GRLenMinus1Shamt);

  SDValue LoTrue = DAG.getNode(ISD::OR, DL, VT, ShiftRightLo, ShiftLeftHi);

  SDValue HiTrue = DAG.getNode(ShiftRightOp, DL, VT, Hi, Shamt);

  SDValue LoFalse = DAG.getNode(ShiftRightOp, DL, VT, Hi, ShamtMinusGRLen);

  SDValue HiFalse =

      IsSRA ? DAG.getNode(ISD::SRA, DL, VT, Hi, GRLenMinus1) : Zero;


  SDValue CC = DAG.getSetCC(DL, VT, ShamtMinusGRLen, Zero, ISD::SETLT);


  Lo = DAG.getNode(ISD::SELECT, DL, VT, CC, LoTrue, LoFalse);

  Hi = DAG.getNode(ISD::SELECT, DL, VT, CC, HiTrue, HiFalse);


  SDValue Parts[2] = {Lo, Hi};

  return DAG.getMergeValues(Parts, DL);

}


// Returns the opcode of the target-specific SDNode that implements the 32-bit

// form of the given Opcode.

static LoongArchISD::NodeType getLoongArchWOpcode(unsigned Opcode) {

  switch (Opcode) {

  default:

    llvm_unreachable("Unexpected opcode");

  case ISD::SDIV:

    return LoongArchISD::DIV_W;

  case ISD::UDIV:

    return LoongArchISD::DIV_WU;

  case ISD::SREM:

    return LoongArchISD::MOD_W;

  case ISD::UREM:

    return LoongArchISD::MOD_WU;

  case ISD::SHL:

    return LoongArchISD::SLL_W;

  case ISD::SRA:

    return LoongArchISD::SRA_W;

  case ISD::SRL:

    return LoongArchISD::SRL_W;

  case ISD::ROTL:

  case ISD::ROTR:

    return LoongArchISD::ROTR_W;

  case ISD::CTTZ:

    return LoongArchISD::CTZ_W;

  case ISD::CTLZ:

    return LoongArchISD::CLZ_W;

  }

}


// Converts the given i8/i16/i32 operation to a target-specific SelectionDAG

// node. Because i8/i16/i32 isn't a legal type for LA64, these operations would

// otherwise be promoted to i64, making it difficult to select the

// SLL_W/.../*W later one because the fact the operation was originally of

// type i8/i16/i32 is lost.

static SDValue customLegalizeToWOp(SDNode *N, SelectionDAG &DAG, int NumOp,

                                   unsigned ExtOpc = ISD::ANY_EXTEND) {

  SDLoc DL(N);

  LoongArchISD::NodeType WOpcode = getLoongArchWOpcode(N->getOpcode());

  SDValue NewOp0, NewRes;


  switch (NumOp) {

  default:

    llvm_unreachable("Unexpected NumOp");

  case 1: {

    NewOp0 = DAG.getNode(ExtOpc, DL, MVT::i64, N->getOperand(0));

    NewRes = DAG.getNode(WOpcode, DL, MVT::i64, NewOp0);

    break;

  }

  case 2: {

    NewOp0 = DAG.getNode(ExtOpc, DL, MVT::i64, N->getOperand(0));

    SDValue NewOp1 = DAG.getNode(ExtOpc, DL, MVT::i64, N->getOperand(1));

    if (N->getOpcode() == ISD::ROTL) {

      SDValue TmpOp = DAG.getConstant(32, DL, MVT::i64);

      NewOp1 = DAG.getNode(ISD::SUB, DL, MVT::i64, TmpOp, NewOp1);

    }

    NewRes = DAG.getNode(WOpcode, DL, MVT::i64, NewOp0, NewOp1);

    break;

  }

    // TODO:Handle more NumOp.

  }


  // ReplaceNodeResults requires we maintain the same type for the return

  // value.

  return DAG.getNode(ISD::TRUNCATE, DL, N->getValueType(0), NewRes);

}


// Converts the given 32-bit operation to a i64 operation with signed extension

// semantic to reduce the signed extension instructions.

static SDValue customLegalizeToWOpWithSExt(SDNode *N, SelectionDAG &DAG) {

  SDLoc DL(N);

  SDValue NewOp0 = DAG.getNode(ISD::ANY_EXTEND, DL, MVT::i64, N->getOperand(0));

  SDValue NewOp1 = DAG.getNode(ISD::ANY_EXTEND, DL, MVT::i64, N->getOperand(1));

  SDValue NewWOp = DAG.getNode(N->getOpcode(), DL, MVT::i64, NewOp0, NewOp1);

  SDValue NewRes = DAG.getNode(ISD::SIGN_EXTEND_INREG, DL, MVT::i64, NewWOp,

                               DAG.getValueType(MVT::i32));

  return DAG.getNode(ISD::TRUNCATE, DL, MVT::i32, NewRes);

}


// Helper function that emits error message for intrinsics with/without chain

// and return a UNDEF or and the chain as the results.

static void emitErrorAndReplaceIntrinsicResults(

    SDNode *N, SmallVectorImpl<SDValue> &Results, SelectionDAG &DAG,

    StringRef ErrorMsg, bool WithChain = true) {

  DAG.getContext()->emitError(N->getOperationName(0) + ": " + ErrorMsg + ".");

  Results.push_back(DAG.getUNDEF(N->getValueType(0)));

  if (!WithChain)

    return;

  Results.push_back(N->getOperand(0));

}


template <unsigned N>

static void

replaceVPICKVE2GRResults(SDNode *Node, SmallVectorImpl<SDValue> &Results,

                         SelectionDAG &DAG, const LoongArchSubtarget &Subtarget,

                         unsigned ResOp) {

  const StringRef ErrorMsgOOR = "argument out of range";

  unsigned Imm = Node->getConstantOperandVal(2);

  if (!isUInt<N>(Imm)) {

    emitErrorAndReplaceIntrinsicResults(Node, Results, DAG, ErrorMsgOOR,

                                        /*WithChain=*/false);

    return;

  }

  SDLoc DL(Node);

  SDValue Vec = Node->getOperand(1);


  SDValue PickElt =

      DAG.getNode(ResOp, DL, Subtarget.getGRLenVT(), Vec,

                  DAG.getConstant(Imm, DL, Subtarget.getGRLenVT()),

                  DAG.getValueType(Vec.getValueType().getVectorElementType()));

  Results.push_back(DAG.getNode(ISD::TRUNCATE, DL, Node->getValueType(0),

                                PickElt.getValue(0)));

}


static void replaceVecCondBranchResults(SDNode *N,

                                        SmallVectorImpl<SDValue> &Results,

                                        SelectionDAG &DAG,

                                        const LoongArchSubtarget &Subtarget,

                                        unsigned ResOp) {

  SDLoc DL(N);

  SDValue Vec = N->getOperand(1);


  SDValue CB = DAG.getNode(ResOp, DL, Subtarget.getGRLenVT(), Vec);

  Results.push_back(

      DAG.getNode(ISD::TRUNCATE, DL, N->getValueType(0), CB.getValue(0)));

}


static void

replaceINTRINSIC_WO_CHAINResults(SDNode *N, SmallVectorImpl<SDValue> &Results,

                                 SelectionDAG &DAG,

                                 const LoongArchSubtarget &Subtarget) {

  switch (N->getConstantOperandVal(0)) {

  default:

    llvm_unreachable("Unexpected Intrinsic.");

  case Intrinsic::loongarch_lsx_vpickve2gr_b:

    replaceVPICKVE2GRResults<4>(N, Results, DAG, Subtarget,

                                LoongArchISD::VPICK_SEXT_ELT);

    break;

  case Intrinsic::loongarch_lsx_vpickve2gr_h:

  case Intrinsic::loongarch_lasx_xvpickve2gr_w:

    replaceVPICKVE2GRResults<3>(N, Results, DAG, Subtarget,

                                LoongArchISD::VPICK_SEXT_ELT);

    break;

  case Intrinsic::loongarch_lsx_vpickve2gr_w:

    replaceVPICKVE2GRResults<2>(N, Results, DAG, Subtarget,

                                LoongArchISD::VPICK_SEXT_ELT);

    break;

  case Intrinsic::loongarch_lsx_vpickve2gr_bu:

    replaceVPICKVE2GRResults<4>(N, Results, DAG, Subtarget,

                                LoongArchISD::VPICK_ZEXT_ELT);

    break;

  case Intrinsic::loongarch_lsx_vpickve2gr_hu:

  case Intrinsic::loongarch_lasx_xvpickve2gr_wu:

    replaceVPICKVE2GRResults<3>(N, Results, DAG, Subtarget,

                                LoongArchISD::VPICK_ZEXT_ELT);

    break;

  case Intrinsic::loongarch_lsx_vpickve2gr_wu:

    replaceVPICKVE2GRResults<2>(N, Results, DAG, Subtarget,

                                LoongArchISD::VPICK_ZEXT_ELT);

    break;

  case Intrinsic::loongarch_lsx_bz_b:

  case Intrinsic::loongarch_lsx_bz_h:

  case Intrinsic::loongarch_lsx_bz_w:

  case Intrinsic::loongarch_lsx_bz_d:

  case Intrinsic::loongarch_lasx_xbz_b:

  case Intrinsic::loongarch_lasx_xbz_h:

  case Intrinsic::loongarch_lasx_xbz_w:

  case Intrinsic::loongarch_lasx_xbz_d:

    replaceVecCondBranchResults(N, Results, DAG, Subtarget,

                                LoongArchISD::VALL_ZERO);

    break;

  case Intrinsic::loongarch_lsx_bz_v:

  case Intrinsic::loongarch_lasx_xbz_v:

    replaceVecCondBranchResults(N, Results, DAG, Subtarget,

                                LoongArchISD::VANY_ZERO);

    break;

  case Intrinsic::loongarch_lsx_bnz_b:

  case Intrinsic::loongarch_lsx_bnz_h:

  case Intrinsic::loongarch_lsx_bnz_w:

  case Intrinsic::loongarch_lsx_bnz_d:

  case Intrinsic::loongarch_lasx_xbnz_b:

  case Intrinsic::loongarch_lasx_xbnz_h:

  case Intrinsic::loongarch_lasx_xbnz_w:

  case Intrinsic::loongarch_lasx_xbnz_d:

    replaceVecCondBranchResults(N, Results, DAG, Subtarget,

                                LoongArchISD::VALL_NONZERO);

    break;

  case Intrinsic::loongarch_lsx_bnz_v:

  case Intrinsic::loongarch_lasx_xbnz_v:

    replaceVecCondBranchResults(N, Results, DAG, Subtarget,

                                LoongArchISD::VANY_NONZERO);

    break;

  }

}


static void replaceCMP_XCHG_128Results(SDNode *N,

                                       SmallVectorImpl<SDValue> &Results,

                                       SelectionDAG &DAG) {

  assert(N->getValueType(0) == MVT::i128 &&

         "AtomicCmpSwap on types less than 128 should be legal");

  MachineMemOperand *MemOp = cast<MemSDNode>(N)->getMemOperand();


  unsigned Opcode;

  switch (MemOp->getMergedOrdering()) {

  case AtomicOrdering::Acquire:

  case AtomicOrdering::AcquireRelease:

  case AtomicOrdering::SequentiallyConsistent:

    Opcode = LoongArch::PseudoCmpXchg128Acquire;

    break;

  case AtomicOrdering::Monotonic:

  case AtomicOrdering::Release:

    Opcode = LoongArch::PseudoCmpXchg128;

    break;

  default:

    llvm_unreachable("Unexpected ordering!");

  }


  SDLoc DL(N);

  auto CmpVal = DAG.SplitScalar(N->getOperand(2), DL, MVT::i64, MVT::i64);

  auto NewVal = DAG.SplitScalar(N->getOperand(3), DL, MVT::i64, MVT::i64);

  SDValue Ops[] = {N->getOperand(1), CmpVal.first,  CmpVal.second,

                   NewVal.first,     NewVal.second, N->getOperand(0)};


  SDNode *CmpSwap = DAG.getMachineNode(

      Opcode, SDLoc(N), DAG.getVTList(MVT::i64, MVT::i64, MVT::i64, MVT::Other),

      Ops);

  DAG.setNodeMemRefs(cast<MachineSDNode>(CmpSwap), {MemOp});

  Results.push_back(DAG.getNode(ISD::BUILD_PAIR, DL, MVT::i128,

                                SDValue(CmpSwap, 0), SDValue(CmpSwap, 1)));

  Results.push_back(SDValue(CmpSwap, 3));

}


void LoongArchTargetLowering::ReplaceNodeResults(

    SDNode *N, SmallVectorImpl<SDValue> &Results, SelectionDAG &DAG) const {

  SDLoc DL(N);

  EVT VT = N->getValueType(0);

  switch (N->getOpcode()) {

  default:

    llvm_unreachable("Don't know how to legalize this operation");

  case ISD::ADD:

  case ISD::SUB:

    assert(N->getValueType(0) == MVT::i32 && Subtarget.is64Bit() &&

           "Unexpected custom legalisation");

    Results.push_back(customLegalizeToWOpWithSExt(N, DAG));

    break;

  case ISD::SDIV:

  case ISD::UDIV:

  case ISD::SREM:

  case ISD::UREM:

    assert(VT == MVT::i32 && Subtarget.is64Bit() &&

           "Unexpected custom legalisation");

    Results.push_back(customLegalizeToWOp(N, DAG, 2,

                                          Subtarget.hasDiv32() && VT == MVT::i32

                                              ? ISD::ANY_EXTEND

                                              : ISD::SIGN_EXTEND));

    break;

  case ISD::SHL:

  case ISD::SRA:

  case ISD::SRL:

    assert(VT == MVT::i32 && Subtarget.is64Bit() &&

           "Unexpected custom legalisation");

    if (N->getOperand(1).getOpcode() != ISD::Constant) {

      Results.push_back(customLegalizeToWOp(N, DAG, 2));

      break;

    }

    break;

  case ISD::ROTL:

  case ISD::ROTR:

    assert(VT == MVT::i32 && Subtarget.is64Bit() &&

           "Unexpected custom legalisation");

    Results.push_back(customLegalizeToWOp(N, DAG, 2));

    break;

  case ISD::FP_TO_SINT: {

    assert(VT == MVT::i32 && Subtarget.is64Bit() &&

           "Unexpected custom legalisation");

    SDValue Src = N->getOperand(0);

    EVT FVT = EVT::getFloatingPointVT(N->getValueSizeInBits(0));

    if (getTypeAction(*DAG.getContext(), Src.getValueType()) !=

        TargetLowering::TypeSoftenFloat) {

      if (Src.getValueType() == MVT::f16)

        Src = DAG.getNode(ISD::FP_EXTEND, DL, MVT::f32, Src);

      SDValue Dst = DAG.getNode(LoongArchISD::FTINT, DL, FVT, Src);

      Results.push_back(DAG.getNode(ISD::BITCAST, DL, VT, Dst));

      return;

    }

    // If the FP type needs to be softened, emit a library call using the 'si'

    // version. If we left it to default legalization we'd end up with 'di'.

    RTLIB::Libcall LC;

    LC = RTLIB::getFPTOSINT(Src.getValueType(), VT);

    MakeLibCallOptions CallOptions;

    EVT OpVT = Src.getValueType();

    CallOptions.setTypeListBeforeSoften(OpVT, VT, true);

    SDValue Chain = SDValue();

    SDValue Result;

    std::tie(Result, Chain) =

        makeLibCall(DAG, LC, VT, Src, CallOptions, DL, Chain);

    Results.push_back(Result);

    break;

  }

  case ISD::BITCAST: {

    SDValue Src = N->getOperand(0);

    EVT SrcVT = Src.getValueType();

    if (VT == MVT::i32 && SrcVT == MVT::f32 && Subtarget.is64Bit() &&

        Subtarget.hasBasicF()) {

      SDValue Dst =

          DAG.getNode(LoongArchISD::MOVFR2GR_S_LA64, DL, MVT::i64, Src);

      Results.push_back(DAG.getNode(ISD::TRUNCATE, DL, MVT::i32, Dst));

    }

    break;

  }

  case ISD::FP_TO_UINT: {

    assert(VT == MVT::i32 && Subtarget.is64Bit() &&

           "Unexpected custom legalisation");

    auto &TLI = DAG.getTargetLoweringInfo();

    SDValue Tmp1, Tmp2;

    TLI.expandFP_TO_UINT(N, Tmp1, Tmp2, DAG);

    Results.push_back(DAG.getNode(ISD::TRUNCATE, DL, MVT::i32, Tmp1));

    break;

  }

  case ISD::BSWAP: {

    SDValue Src = N->getOperand(0);

    assert((VT == MVT::i16 || VT == MVT::i32) &&

           "Unexpected custom legalization");

    MVT GRLenVT = Subtarget.getGRLenVT();

    SDValue NewSrc = DAG.getNode(ISD::ANY_EXTEND, DL, GRLenVT, Src);

    SDValue Tmp;

    switch (VT.getSizeInBits()) {

    default:

      llvm_unreachable("Unexpected operand width");

    case 16:

      Tmp = DAG.getNode(LoongArchISD::REVB_2H, DL, GRLenVT, NewSrc);

      break;

    case 32:

      // Only LA64 will get to here due to the size mismatch between VT and

      // GRLenVT, LA32 lowering is directly defined in LoongArchInstrInfo.

      Tmp = DAG.getNode(LoongArchISD::REVB_2W, DL, GRLenVT, NewSrc);

      break;

    }

    Results.push_back(DAG.getNode(ISD::TRUNCATE, DL, VT, Tmp));

    break;

  }

  case ISD::BITREVERSE: {

    SDValue Src = N->getOperand(0);

    assert((VT == MVT::i8 || (VT == MVT::i32 && Subtarget.is64Bit())) &&

           "Unexpected custom legalization");

    MVT GRLenVT = Subtarget.getGRLenVT();

    SDValue NewSrc = DAG.getNode(ISD::ANY_EXTEND, DL, GRLenVT, Src);

    SDValue Tmp;

    switch (VT.getSizeInBits()) {

    default:

      llvm_unreachable("Unexpected operand width");

    case 8:

      Tmp = DAG.getNode(LoongArchISD::BITREV_4B, DL, GRLenVT, NewSrc);

      break;

    case 32:

      Tmp = DAG.getNode(LoongArchISD::BITREV_W, DL, GRLenVT, NewSrc);

      break;

    }

    Results.push_back(DAG.getNode(ISD::TRUNCATE, DL, VT, Tmp));

    break;

  }

  case ISD::CTLZ:

  case ISD::CTTZ: {

    assert(VT == MVT::i32 && Subtarget.is64Bit() &&

           "Unexpected custom legalisation");

    Results.push_back(customLegalizeToWOp(N, DAG, 1));

    break;

  }

  case ISD::INTRINSIC_W_CHAIN: {

    SDValue Chain = N->getOperand(0);

    SDValue Op2 = N->getOperand(2);

    MVT GRLenVT = Subtarget.getGRLenVT();

    const StringRef ErrorMsgOOR = "argument out of range";

    const StringRef ErrorMsgReqLA64 = "requires loongarch64";

    const StringRef ErrorMsgReqF = "requires basic 'f' target feature";


    switch (N->getConstantOperandVal(1)) {

    default:

      llvm_unreachable("Unexpected Intrinsic.");

    case Intrinsic::loongarch_movfcsr2gr: {

      if (!Subtarget.hasBasicF()) {

        emitErrorAndReplaceIntrinsicResults(N, Results, DAG, ErrorMsgReqF);

        return;

      }

      unsigned Imm = Op2->getAsZExtVal();

      if (!isUInt<2>(Imm)) {

        emitErrorAndReplaceIntrinsicResults(N, Results, DAG, ErrorMsgOOR);

        return;

      }

      SDValue MOVFCSR2GRResults = DAG.getNode(

          LoongArchISD::MOVFCSR2GR, SDLoc(N), {MVT::i64, MVT::Other},

          {Chain, DAG.getConstant(Imm, DL, GRLenVT)});

      Results.push_back(

          DAG.getNode(ISD::TRUNCATE, DL, VT, MOVFCSR2GRResults.getValue(0)));

      Results.push_back(MOVFCSR2GRResults.getValue(1));

      break;

    }

#define CRC_CASE_EXT_BINARYOP(NAME, NODE)                                      \

  case Intrinsic::loongarch_##NAME: {                                          \

    SDValue NODE = DAG.getNode(                                                \

        LoongArchISD::NODE, DL, {MVT::i64, MVT::Other},                        \

        {Chain, DAG.getNode(ISD::ANY_EXTEND, DL, MVT::i64, Op2),               \

         DAG.getNode(ISD::ANY_EXTEND, DL, MVT::i64, N->getOperand(3))});       \

    Results.push_back(DAG.getNode(ISD::TRUNCATE, DL, VT, NODE.getValue(0)));   \

    Results.push_back(NODE.getValue(1));                                       \

    break;                                                                     \

  }

      CRC_CASE_EXT_BINARYOP(crc_w_b_w, CRC_W_B_W)

      CRC_CASE_EXT_BINARYOP(crc_w_h_w, CRC_W_H_W)

      CRC_CASE_EXT_BINARYOP(crc_w_w_w, CRC_W_W_W)

      CRC_CASE_EXT_BINARYOP(crcc_w_b_w, CRCC_W_B_W)

      CRC_CASE_EXT_BINARYOP(crcc_w_h_w, CRCC_W_H_W)

      CRC_CASE_EXT_BINARYOP(crcc_w_w_w, CRCC_W_W_W)

#undef CRC_CASE_EXT_BINARYOP


#define CRC_CASE_EXT_UNARYOP(NAME, NODE)                                       \

  case Intrinsic::loongarch_##NAME: {                                          \

    SDValue NODE = DAG.getNode(                                                \

        LoongArchISD::NODE, DL, {MVT::i64, MVT::Other},                        \

        {Chain, Op2,                                                           \

         DAG.getNode(ISD::ANY_EXTEND, DL, MVT::i64, N->getOperand(3))});       \

    Results.push_back(DAG.getNode(ISD::TRUNCATE, DL, VT, NODE.getValue(0)));   \

    Results.push_back(NODE.getValue(1));                                       \

    break;                                                                     \

  }

      CRC_CASE_EXT_UNARYOP(crc_w_d_w, CRC_W_D_W)

      CRC_CASE_EXT_UNARYOP(crcc_w_d_w, CRCC_W_D_W)

#undef CRC_CASE_EXT_UNARYOP

#define CSR_CASE(ID)                                                           \

  case Intrinsic::loongarch_##ID: {                                            \

    if (!Subtarget.is64Bit())                                                  \

      emitErrorAndReplaceIntrinsicResults(N, Results, DAG, ErrorMsgReqLA64);   \

    break;                                                                     \

  }

      CSR_CASE(csrrd_d);

      CSR_CASE(csrwr_d);

      CSR_CASE(csrxchg_d);

      CSR_CASE(iocsrrd_d);

#undef CSR_CASE

    case Intrinsic::loongarch_csrrd_w: {

      unsigned Imm = Op2->getAsZExtVal();

      if (!isUInt<14>(Imm)) {

        emitErrorAndReplaceIntrinsicResults(N, Results, DAG, ErrorMsgOOR);

        return;

      }

      SDValue CSRRDResults =

          DAG.getNode(LoongArchISD::CSRRD, DL, {GRLenVT, MVT::Other},

                      {Chain, DAG.getConstant(Imm, DL, GRLenVT)});

      Results.push_back(

          DAG.getNode(ISD::TRUNCATE, DL, VT, CSRRDResults.getValue(0)));

      Results.push_back(CSRRDResults.getValue(1));

      break;

    }

    case Intrinsic::loongarch_csrwr_w: {

      unsigned Imm = N->getConstantOperandVal(3);

      if (!isUInt<14>(Imm)) {

        emitErrorAndReplaceIntrinsicResults(N, Results, DAG, ErrorMsgOOR);

        return;

      }

      SDValue CSRWRResults =

          DAG.getNode(LoongArchISD::CSRWR, DL, {GRLenVT, MVT::Other},

                      {Chain, DAG.getNode(ISD::ANY_EXTEND, DL, MVT::i64, Op2),

                       DAG.getConstant(Imm, DL, GRLenVT)});

      Results.push_back(

          DAG.getNode(ISD::TRUNCATE, DL, VT, CSRWRResults.getValue(0)));

      Results.push_back(CSRWRResults.getValue(1));

      break;

    }

    case Intrinsic::loongarch_csrxchg_w: {

      unsigned Imm = N->getConstantOperandVal(4);

      if (!isUInt<14>(Imm)) {

        emitErrorAndReplaceIntrinsicResults(N, Results, DAG, ErrorMsgOOR);

        return;

      }

      SDValue CSRXCHGResults = DAG.getNode(

          LoongArchISD::CSRXCHG, DL, {GRLenVT, MVT::Other},

          {Chain, DAG.getNode(ISD::ANY_EXTEND, DL, MVT::i64, Op2),

           DAG.getNode(ISD::ANY_EXTEND, DL, MVT::i64, N->getOperand(3)),

           DAG.getConstant(Imm, DL, GRLenVT)});

      Results.push_back(

          DAG.getNode(ISD::TRUNCATE, DL, VT, CSRXCHGResults.getValue(0)));

      Results.push_back(CSRXCHGResults.getValue(1));

      break;

    }

#define IOCSRRD_CASE(NAME, NODE)                                               \

  case Intrinsic::loongarch_##NAME: {                                          \

    SDValue IOCSRRDResults =                                                   \

        DAG.getNode(LoongArchISD::NODE, DL, {MVT::i64, MVT::Other},            \

                    {Chain, DAG.getNode(ISD::ANY_EXTEND, DL, MVT::i64, Op2)}); \

    Results.push_back(                                                         \

        DAG.getNode(ISD::TRUNCATE, DL, VT, IOCSRRDResults.getValue(0)));       \

    Results.push_back(IOCSRRDResults.getValue(1));                             \

    break;                                                                     \

  }

      IOCSRRD_CASE(iocsrrd_b, IOCSRRD_B);

      IOCSRRD_CASE(iocsrrd_h, IOCSRRD_H);

      IOCSRRD_CASE(iocsrrd_w, IOCSRRD_W);

#undef IOCSRRD_CASE

    case Intrinsic::loongarch_cpucfg: {

      SDValue CPUCFGResults =

          DAG.getNode(LoongArchISD::CPUCFG, DL, {GRLenVT, MVT::Other},

                      {Chain, DAG.getNode(ISD::ANY_EXTEND, DL, MVT::i64, Op2)});

      Results.push_back(

          DAG.getNode(ISD::TRUNCATE, DL, VT, CPUCFGResults.getValue(0)));

      Results.push_back(CPUCFGResults.getValue(1));

      break;

    }

    case Intrinsic::loongarch_lddir_d: {

      if (!Subtarget.is64Bit()) {

        emitErrorAndReplaceIntrinsicResults(N, Results, DAG, ErrorMsgReqLA64);

        return;

      }

      break;

    }

    }

    break;

  }

  case ISD::READ_REGISTER: {

    if (Subtarget.is64Bit())

      DAG.getContext()->emitError(

          "On LA64, only 64-bit registers can be read.");

    else

      DAG.getContext()->emitError(

          "On LA32, only 32-bit registers can be read.");

    Results.push_back(DAG.getUNDEF(VT));

    Results.push_back(N->getOperand(0));

    break;

  }

  case ISD::INTRINSIC_WO_CHAIN: {

    replaceINTRINSIC_WO_CHAINResults(N, Results, DAG, Subtarget);

    break;

  }

  case ISD::LROUND: {

    SDValue Op0 = N->getOperand(0);

    EVT OpVT = Op0.getValueType();

    RTLIB::Libcall LC =

        OpVT == MVT::f64 ? RTLIB::LROUND_F64 : RTLIB::LROUND_F32;

    MakeLibCallOptions CallOptions;

    CallOptions.setTypeListBeforeSoften(OpVT, MVT::i64, true);

    SDValue Result = makeLibCall(DAG, LC, MVT::i64, Op0, CallOptions, DL).first;

    Result = DAG.getNode(ISD::TRUNCATE, DL, MVT::i32, Result);

    Results.push_back(Result);

    break;

  }

  case ISD::ATOMIC_CMP_SWAP: {

    replaceCMP_XCHG_128Results(N, Results, DAG);

    break;

  }

  }

}


static SDValue performANDCombine(SDNode *N, SelectionDAG &DAG,

                                 TargetLowering::DAGCombinerInfo &DCI,

                                 const LoongArchSubtarget &Subtarget) {

  if (DCI.isBeforeLegalizeOps())

    return SDValue();


  SDValue FirstOperand = N->getOperand(0);

  SDValue SecondOperand = N->getOperand(1);

  unsigned FirstOperandOpc = FirstOperand.getOpcode();

  EVT ValTy = N->getValueType(0);

  SDLoc DL(N);

  uint64_t lsb, msb;

  unsigned SMIdx, SMLen;

  ConstantSDNode *CN;

  SDValue NewOperand;

  MVT GRLenVT = Subtarget.getGRLenVT();


  // Op's second operand must be a shifted mask.

  if (!(CN = dyn_cast<ConstantSDNode>(SecondOperand)) ||

      !isShiftedMask_64(CN->getZExtValue(), SMIdx, SMLen))

    return SDValue();


  if (FirstOperandOpc == ISD::SRA || FirstOperandOpc == ISD::SRL) {

    // Pattern match BSTRPICK.

    //  $dst = and ((sra or srl) $src , lsb), (2**len - 1)

    //  => BSTRPICK $dst, $src, msb, lsb

    //  where msb = lsb + len - 1


    // The second operand of the shift must be an immediate.

    if (!(CN = dyn_cast<ConstantSDNode>(FirstOperand.getOperand(1))))

      return SDValue();


    lsb = CN->getZExtValue();


    // Return if the shifted mask does not start at bit 0 or the sum of its

    // length and lsb exceeds the word's size.

    if (SMIdx != 0 || lsb + SMLen > ValTy.getSizeInBits())

      return SDValue();


    NewOperand = FirstOperand.getOperand(0);

  } else {

    // Pattern match BSTRPICK.

    //  $dst = and $src, (2**len- 1) , if len > 12

    //  => BSTRPICK $dst, $src, msb, lsb

    //  where lsb = 0 and msb = len - 1


    // If the mask is <= 0xfff, andi can be used instead.

    if (CN->getZExtValue() <= 0xfff)

      return SDValue();


    // Return if the MSB exceeds.

    if (SMIdx + SMLen > ValTy.getSizeInBits())

      return SDValue();


    if (SMIdx > 0) {

      // Omit if the constant has more than 2 uses. This a conservative

      // decision. Whether it is a win depends on the HW microarchitecture.

      // However it should always be better for 1 and 2 uses.

      if (CN->use_size() > 2)

        return SDValue();

      // Return if the constant can be composed by a single LU12I.W.

      if ((CN->getZExtValue() & 0xfff) == 0)

        return SDValue();

      // Return if the constand can be composed by a single ADDI with

      // the zero register.

      if (CN->getSExtValue() >= -2048 && CN->getSExtValue() < 0)

        return SDValue();

    }


    lsb = SMIdx;

    NewOperand = FirstOperand;

  }


  msb = lsb + SMLen - 1;

  SDValue NR0 = DAG.getNode(LoongArchISD::BSTRPICK, DL, ValTy, NewOperand,

                            DAG.getConstant(msb, DL, GRLenVT),

                            DAG.getConstant(lsb, DL, GRLenVT));

  if (FirstOperandOpc == ISD::SRA || FirstOperandOpc == ISD::SRL || lsb == 0)

    return NR0;

  // Try to optimize to

  //   bstrpick $Rd, $Rs, msb, lsb

  //   slli     $Rd, $Rd, lsb

  return DAG.getNode(ISD::SHL, DL, ValTy, NR0,

                     DAG.getConstant(lsb, DL, GRLenVT));

}


static SDValue performSRLCombine(SDNode *N, SelectionDAG &DAG,

                                 TargetLowering::DAGCombinerInfo &DCI,

                                 const LoongArchSubtarget &Subtarget) {

  if (DCI.isBeforeLegalizeOps())

    return SDValue();


  // $dst = srl (and $src, Mask), Shamt

  // =>

  // BSTRPICK $dst, $src, MaskIdx+MaskLen-1, Shamt

  // when Mask is a shifted mask, and MaskIdx <= Shamt <= MaskIdx+MaskLen-1

  //


  SDValue FirstOperand = N->getOperand(0);

  ConstantSDNode *CN;

  EVT ValTy = N->getValueType(0);

  SDLoc DL(N);

  MVT GRLenVT = Subtarget.getGRLenVT();

  unsigned MaskIdx, MaskLen;

  uint64_t Shamt;


  // The first operand must be an AND and the second operand of the AND must be

  // a shifted mask.

  if (FirstOperand.getOpcode() != ISD::AND ||

      !(CN = dyn_cast<ConstantSDNode>(FirstOperand.getOperand(1))) ||

      !isShiftedMask_64(CN->getZExtValue(), MaskIdx, MaskLen))

    return SDValue();


  // The second operand (shift amount) must be an immediate.

  if (!(CN = dyn_cast<ConstantSDNode>(N->getOperand(1))))

    return SDValue();


  Shamt = CN->getZExtValue();

  if (MaskIdx <= Shamt && Shamt <= MaskIdx + MaskLen - 1)

    return DAG.getNode(LoongArchISD::BSTRPICK, DL, ValTy,

                       FirstOperand->getOperand(0),

                       DAG.getConstant(MaskIdx + MaskLen - 1, DL, GRLenVT),

                       DAG.getConstant(Shamt, DL, GRLenVT));


  return SDValue();

}


static SDValue performORCombine(SDNode *N, SelectionDAG &DAG,

                                TargetLowering::DAGCombinerInfo &DCI,

                                const LoongArchSubtarget &Subtarget) {

  MVT GRLenVT = Subtarget.getGRLenVT();

  EVT ValTy = N->getValueType(0);

  SDValue N0 = N->getOperand(0), N1 = N->getOperand(1);

  ConstantSDNode *CN0, *CN1;

  SDLoc DL(N);

  unsigned ValBits = ValTy.getSizeInBits();

  unsigned MaskIdx0, MaskLen0, MaskIdx1, MaskLen1;

  unsigned Shamt;

  bool SwapAndRetried = false;


  if (DCI.isBeforeLegalizeOps())

    return SDValue();


  if (ValBits != 32 && ValBits != 64)

    return SDValue();


Retry:

  // 1st pattern to match BSTRINS:

  //  R = or (and X, mask0), (and (shl Y, lsb), mask1)

  //  where mask1 = (2**size - 1) << lsb, mask0 = ~mask1

  //  =>

  //  R = BSTRINS X, Y, msb, lsb (where msb = lsb + size - 1)

  if (N0.getOpcode() == ISD::AND &&

      (CN0 = dyn_cast<ConstantSDNode>(N0.getOperand(1))) &&

      isShiftedMask_64(~CN0->getSExtValue(), MaskIdx0, MaskLen0) &&

      N1.getOpcode() == ISD::AND && N1.getOperand(0).getOpcode() == ISD::SHL &&

      (CN1 = dyn_cast<ConstantSDNode>(N1.getOperand(1))) &&

      isShiftedMask_64(CN1->getZExtValue(), MaskIdx1, MaskLen1) &&

      MaskIdx0 == MaskIdx1 && MaskLen0 == MaskLen1 &&

      (CN1 = dyn_cast<ConstantSDNode>(N1.getOperand(0).getOperand(1))) &&

      (Shamt = CN1->getZExtValue()) == MaskIdx0 &&

      (MaskIdx0 + MaskLen0 <= ValBits)) {

    LLVM_DEBUG(dbgs() << "Perform OR combine: match pattern 1\n");

    return DAG.getNode(LoongArchISD::BSTRINS, DL, ValTy, N0.getOperand(0),

                       N1.getOperand(0).getOperand(0),

                       DAG.getConstant((MaskIdx0 + MaskLen0 - 1), DL, GRLenVT),

                       DAG.getConstant(MaskIdx0, DL, GRLenVT));

  }


  // 2nd pattern to match BSTRINS:

  //  R = or (and X, mask0), (shl (and Y, mask1), lsb)

  //  where mask1 = (2**size - 1), mask0 = ~(mask1 << lsb)

  //  =>

  //  R = BSTRINS X, Y, msb, lsb (where msb = lsb + size - 1)

  if (N0.getOpcode() == ISD::AND &&

      (CN0 = dyn_cast<ConstantSDNode>(N0.getOperand(1))) &&

      isShiftedMask_64(~CN0->getSExtValue(), MaskIdx0, MaskLen0) &&

      N1.getOpcode() == ISD::SHL && N1.getOperand(0).getOpcode() == ISD::AND &&

      (CN1 = dyn_cast<ConstantSDNode>(N1.getOperand(1))) &&

      (Shamt = CN1->getZExtValue()) == MaskIdx0 &&

      (CN1 = dyn_cast<ConstantSDNode>(N1.getOperand(0).getOperand(1))) &&

      isShiftedMask_64(CN1->getZExtValue(), MaskIdx1, MaskLen1) &&

      MaskLen0 == MaskLen1 && MaskIdx1 == 0 &&

      (MaskIdx0 + MaskLen0 <= ValBits)) {

    LLVM_DEBUG(dbgs() << "Perform OR combine: match pattern 2\n");

    return DAG.getNode(LoongArchISD::BSTRINS, DL, ValTy, N0.getOperand(0),

                       N1.getOperand(0).getOperand(0),

                       DAG.getConstant((MaskIdx0 + MaskLen0 - 1), DL, GRLenVT),

                       DAG.getConstant(MaskIdx0, DL, GRLenVT));

  }


  // 3rd pattern to match BSTRINS:

  //  R = or (and X, mask0), (and Y, mask1)

  //  where ~mask0 = (2**size - 1) << lsb, mask0 & mask1 = 0

  //  =>

  //  R = BSTRINS X, (shr (and Y, mask1), lsb), msb, lsb

  //  where msb = lsb + size - 1

  if (N0.getOpcode() == ISD::AND && N1.getOpcode() == ISD::AND &&

      (CN0 = dyn_cast<ConstantSDNode>(N0.getOperand(1))) &&

      isShiftedMask_64(~CN0->getSExtValue(), MaskIdx0, MaskLen0) &&

      (MaskIdx0 + MaskLen0 <= 64) &&

      (CN1 = dyn_cast<ConstantSDNode>(N1->getOperand(1))) &&

      (CN1->getSExtValue() & CN0->getSExtValue()) == 0) {

    LLVM_DEBUG(dbgs() << "Perform OR combine: match pattern 3\n");

    return DAG.getNode(LoongArchISD::BSTRINS, DL, ValTy, N0.getOperand(0),

                       DAG.getNode(ISD::SRL, DL, N1->getValueType(0), N1,

                                   DAG.getConstant(MaskIdx0, DL, GRLenVT)),

                       DAG.getConstant(ValBits == 32

                                           ? (MaskIdx0 + (MaskLen0 & 31) - 1)

                                           : (MaskIdx0 + MaskLen0 - 1),

                                       DL, GRLenVT),

                       DAG.getConstant(MaskIdx0, DL, GRLenVT));

  }


  // 4th pattern to match BSTRINS:

  //  R = or (and X, mask), (shl Y, shamt)

  //  where mask = (2**shamt - 1)

  //  =>

  //  R = BSTRINS X, Y, ValBits - 1, shamt

  //  where ValBits = 32 or 64

  if (N0.getOpcode() == ISD::AND && N1.getOpcode() == ISD::SHL &&

      (CN0 = dyn_cast<ConstantSDNode>(N0.getOperand(1))) &&

      isShiftedMask_64(CN0->getZExtValue(), MaskIdx0, MaskLen0) &&

      MaskIdx0 == 0 && (CN1 = dyn_cast<ConstantSDNode>(N1.getOperand(1))) &&

      (Shamt = CN1->getZExtValue()) == MaskLen0 &&

      (MaskIdx0 + MaskLen0 <= ValBits)) {

    LLVM_DEBUG(dbgs() << "Perform OR combine: match pattern 4\n");

    return DAG.getNode(LoongArchISD::BSTRINS, DL, ValTy, N0.getOperand(0),

                       N1.getOperand(0),

                       DAG.getConstant((ValBits - 1), DL, GRLenVT),

                       DAG.getConstant(Shamt, DL, GRLenVT));

  }


  // 5th pattern to match BSTRINS:

  //  R = or (and X, mask), const

  //  where ~mask = (2**size - 1) << lsb, mask & const = 0

  //  =>

  //  R = BSTRINS X, (const >> lsb), msb, lsb

  //  where msb = lsb + size - 1

  if (N0.getOpcode() == ISD::AND &&

      (CN0 = dyn_cast<ConstantSDNode>(N0.getOperand(1))) &&

      isShiftedMask_64(~CN0->getSExtValue(), MaskIdx0, MaskLen0) &&

      (CN1 = dyn_cast<ConstantSDNode>(N1)) &&

      (CN1->getSExtValue() & CN0->getSExtValue()) == 0) {

    LLVM_DEBUG(dbgs() << "Perform OR combine: match pattern 5\n");

    return DAG.getNode(

        LoongArchISD::BSTRINS, DL, ValTy, N0.getOperand(0),

        DAG.getConstant(CN1->getSExtValue() >> MaskIdx0, DL, ValTy),

        DAG.getConstant(ValBits == 32 ? (MaskIdx0 + (MaskLen0 & 31) - 1)

                                      : (MaskIdx0 + MaskLen0 - 1),

                        DL, GRLenVT),

        DAG.getConstant(MaskIdx0, DL, GRLenVT));

  }


  // 6th pattern.

  // a = b | ((c & mask) << shamt), where all positions in b to be overwritten

  // by the incoming bits are known to be zero.

  // =>

  // a = BSTRINS b, c, shamt + MaskLen - 1, shamt

  //

  // Note that the 1st pattern is a special situation of the 6th, i.e. the 6th

  // pattern is more common than the 1st. So we put the 1st before the 6th in

  // order to match as many nodes as possible.

  ConstantSDNode *CNMask, *CNShamt;

  unsigned MaskIdx, MaskLen;

  if (N1.getOpcode() == ISD::SHL && N1.getOperand(0).getOpcode() == ISD::AND &&

      (CNMask = dyn_cast<ConstantSDNode>(N1.getOperand(0).getOperand(1))) &&

      isShiftedMask_64(CNMask->getZExtValue(), MaskIdx, MaskLen) &&

      MaskIdx == 0 && (CNShamt = dyn_cast<ConstantSDNode>(N1.getOperand(1))) &&

      CNShamt->getZExtValue() + MaskLen <= ValBits) {

    Shamt = CNShamt->getZExtValue();

    APInt ShMask(ValBits, CNMask->getZExtValue() << Shamt);

    if (ShMask.isSubsetOf(DAG.computeKnownBits(N0).Zero)) {

      LLVM_DEBUG(dbgs() << "Perform OR combine: match pattern 6\n");

      return DAG.getNode(LoongArchISD::BSTRINS, DL, ValTy, N0,

                         N1.getOperand(0).getOperand(0),

                         DAG.getConstant(Shamt + MaskLen - 1, DL, GRLenVT),

                         DAG.getConstant(Shamt, DL, GRLenVT));

    }

  }


  // 7th pattern.

  // a = b | ((c << shamt) & shifted_mask), where all positions in b to be

  // overwritten by the incoming bits are known to be zero.

  // =>

  // a = BSTRINS b, c, MaskIdx + MaskLen - 1, MaskIdx

  //

  // Similarly, the 7th pattern is more common than the 2nd. So we put the 2nd

  // before the 7th in order to match as many nodes as possible.

  if (N1.getOpcode() == ISD::AND &&

      (CNMask = dyn_cast<ConstantSDNode>(N1.getOperand(1))) &&

      isShiftedMask_64(CNMask->getZExtValue(), MaskIdx, MaskLen) &&

      N1.getOperand(0).getOpcode() == ISD::SHL &&

      (CNShamt = dyn_cast<ConstantSDNode>(N1.getOperand(0).getOperand(1))) &&

      CNShamt->getZExtValue() == MaskIdx) {

    APInt ShMask(ValBits, CNMask->getZExtValue());

    if (ShMask.isSubsetOf(DAG.computeKnownBits(N0).Zero)) {

      LLVM_DEBUG(dbgs() << "Perform OR combine: match pattern 7\n");

      return DAG.getNode(LoongArchISD::BSTRINS, DL, ValTy, N0,

                         N1.getOperand(0).getOperand(0),

                         DAG.getConstant(MaskIdx + MaskLen - 1, DL, GRLenVT),

                         DAG.getConstant(MaskIdx, DL, GRLenVT));

    }

  }


  // (or a, b) and (or b, a) are equivalent, so swap the operands and retry.

  if (!SwapAndRetried) {

    std::swap(N0, N1);

    SwapAndRetried = true;

    goto Retry;

  }


  SwapAndRetried = false;

Retry2:

  // 8th pattern.

  // a = b | (c & shifted_mask), where all positions in b to be overwritten by

  // the incoming bits are known to be zero.

  // =>

  // a = BSTRINS b, c >> MaskIdx, MaskIdx + MaskLen - 1, MaskIdx

  //

  // Similarly, the 8th pattern is more common than the 4th and 5th patterns. So

  // we put it here in order to match as many nodes as possible or generate less

  // instructions.

  if (N1.getOpcode() == ISD::AND &&

      (CNMask = dyn_cast<ConstantSDNode>(N1.getOperand(1))) &&

      isShiftedMask_64(CNMask->getZExtValue(), MaskIdx, MaskLen)) {

    APInt ShMask(ValBits, CNMask->getZExtValue());

    if (ShMask.isSubsetOf(DAG.computeKnownBits(N0).Zero)) {

      LLVM_DEBUG(dbgs() << "Perform OR combine: match pattern 8\n");

      return DAG.getNode(LoongArchISD::BSTRINS, DL, ValTy, N0,

                         DAG.getNode(ISD::SRL, DL, N1->getValueType(0),

                                     N1->getOperand(0),

                                     DAG.getConstant(MaskIdx, DL, GRLenVT)),

                         DAG.getConstant(MaskIdx + MaskLen - 1, DL, GRLenVT),

                         DAG.getConstant(MaskIdx, DL, GRLenVT));

    }

  }

  // Swap N0/N1 and retry.

  if (!SwapAndRetried) {

    std::swap(N0, N1);

    SwapAndRetried = true;

    goto Retry2;

  }


  return SDValue();

}


static bool checkValueWidth(SDValue V, ISD::LoadExtType &ExtType) {

  ExtType = ISD::NON_EXTLOAD;


  switch (V.getNode()->getOpcode()) {

  case ISD::LOAD: {

    LoadSDNode *LoadNode = cast<LoadSDNode>(V.getNode());

    if ((LoadNode->getMemoryVT() == MVT::i8) ||

        (LoadNode->getMemoryVT() == MVT::i16)) {

      ExtType = LoadNode->getExtensionType();

      return true;

    }

    return false;

  }

  case ISD::AssertSext: {

    VTSDNode *TypeNode = cast<VTSDNode>(V.getNode()->getOperand(1));

    if ((TypeNode->getVT() == MVT::i8) || (TypeNode->getVT() == MVT::i16)) {

      ExtType = ISD::SEXTLOAD;

      return true;

    }

    return false;

  }

  case ISD::AssertZext: {

    VTSDNode *TypeNode = cast<VTSDNode>(V.getNode()->getOperand(1));

    if ((TypeNode->getVT() == MVT::i8) || (TypeNode->getVT() == MVT::i16)) {

      ExtType = ISD::ZEXTLOAD;

      return true;

    }

    return false;

  }

  default:

    return false;

  }


  return false;

}


// Eliminate redundant truncation and zero-extension nodes.

// * Case 1:

//  +------------+ +------------+ +------------+

//  |   Input1   | |   Input2   | |     CC     |

//  +------------+ +------------+ +------------+

//         |              |              |

//         V              V              +----+

//  +------------+ +------------+             |

//  |  TRUNCATE  | |  TRUNCATE  |             |

//  +------------+ +------------+             |

//         |              |                   |

//         V              V                   |

//  +------------+ +------------+             |

//  |  ZERO_EXT  | |  ZERO_EXT  |             |

//  +------------+ +------------+             |

//         |              |                   |

//         |              +-------------+     |

//         V              V             |     |

//        +----------------+            |     |

//        |      AND       |            |     |

//        +----------------+            |     |

//                |                     |     |

//                +---------------+     |     |

//                                |     |     |

//                                V     V     V

//                               +-------------+

//                               |     CMP     |

//                               +-------------+

// * Case 2:

//  +------------+ +------------+ +-------------+ +------------+ +------------+

//  |   Input1   | |   Input2   | | Constant -1 | | Constant 0 | |     CC     |

//  +------------+ +------------+ +-------------+ +------------+ +------------+

//         |              |             |               |               |

//         V              |             |               |               |

//  +------------+        |             |               |               |

//  |     XOR    |<---------------------+               |               |

//  +------------+        |                             |               |

//         |              |                             |               |

//         V              V             +---------------+               |

//  +------------+ +------------+       |                               |

//  |  TRUNCATE  | |  TRUNCATE  |       |     +-------------------------+

//  +------------+ +------------+       |     |

//         |              |             |     |

//         V              V             |     |

//  +------------+ +------------+       |     |

//  |  ZERO_EXT  | |  ZERO_EXT  |       |     |

//  +------------+ +------------+       |     |

//         |              |             |     |

//         V              V             |     |

//        +----------------+            |     |

//        |      AND       |            |     |

//        +----------------+            |     |

//                |                     |     |

//                +---------------+     |     |

//                                |     |     |

//                                V     V     V

//                               +-------------+

//                               |     CMP     |

//                               +-------------+

static SDValue performSETCCCombine(SDNode *N, SelectionDAG &DAG,

                                   TargetLowering::DAGCombinerInfo &DCI,

                                   const LoongArchSubtarget &Subtarget) {

  ISD::CondCode CC = cast<CondCodeSDNode>(N->getOperand(2))->get();


  SDNode *AndNode = N->getOperand(0).getNode();

  if (AndNode->getOpcode() != ISD::AND)

    return SDValue();


  SDValue AndInputValue2 = AndNode->getOperand(1);

  if (AndInputValue2.getOpcode() != ISD::ZERO_EXTEND)

    return SDValue();


  SDValue CmpInputValue = N->getOperand(1);

  SDValue AndInputValue1 = AndNode->getOperand(0);

  if (AndInputValue1.getOpcode() == ISD::XOR) {

    if (CC != ISD::SETEQ && CC != ISD::SETNE)

      return SDValue();

    ConstantSDNode *CN = dyn_cast<ConstantSDNode>(AndInputValue1.getOperand(1));

    if (!CN || CN->getSExtValue() != -1)

      return SDValue();

    CN = dyn_cast<ConstantSDNode>(CmpInputValue);

    if (!CN || CN->getSExtValue() != 0)

      return SDValue();

    AndInputValue1 = AndInputValue1.getOperand(0);

    if (AndInputValue1.getOpcode() != ISD::ZERO_EXTEND)

      return SDValue();

  } else if (AndInputValue1.getOpcode() == ISD::ZERO_EXTEND) {

    if (AndInputValue2 != CmpInputValue)

      return SDValue();

  } else {

    return SDValue();

  }


  SDValue TruncValue1 = AndInputValue1.getNode()->getOperand(0);

  if (TruncValue1.getOpcode() != ISD::TRUNCATE)

    return SDValue();


  SDValue TruncValue2 = AndInputValue2.getNode()->getOperand(0);

  if (TruncValue2.getOpcode() != ISD::TRUNCATE)

    return SDValue();


  SDValue TruncInputValue1 = TruncValue1.getNode()->getOperand(0);

  SDValue TruncInputValue2 = TruncValue2.getNode()->getOperand(0);

  ISD::LoadExtType ExtType1;

  ISD::LoadExtType ExtType2;


  if (!checkValueWidth(TruncInputValue1, ExtType1) ||

      !checkValueWidth(TruncInputValue2, ExtType2))

    return SDValue();


  if (TruncInputValue1->getValueType(0) != TruncInputValue2->getValueType(0) ||

      AndNode->getValueType(0) != TruncInputValue1->getValueType(0))

    return SDValue();


  if ((ExtType2 != ISD::ZEXTLOAD) &&

      ((ExtType2 != ISD::SEXTLOAD) && (ExtType1 != ISD::SEXTLOAD)))

    return SDValue();


  // These truncation and zero-extension nodes are not necessary, remove them.

  SDValue NewAnd = DAG.getNode(ISD::AND, SDLoc(N), AndNode->getValueType(0),

                               TruncInputValue1, TruncInputValue2);

  SDValue NewSetCC =

      DAG.getSetCC(SDLoc(N), N->getValueType(0), NewAnd, TruncInputValue2, CC);

  DAG.ReplaceAllUsesWith(N, NewSetCC.getNode());

  return SDValue(N, 0);

}


// Combine (loongarch_bitrev_w (loongarch_revb_2w X)) to loongarch_bitrev_4b.

static SDValue performBITREV_WCombine(SDNode *N, SelectionDAG &DAG,

                                      TargetLowering::DAGCombinerInfo &DCI,

                                      const LoongArchSubtarget &Subtarget) {

  if (DCI.isBeforeLegalizeOps())

    return SDValue();


  SDValue Src = N->getOperand(0);

  if (Src.getOpcode() != LoongArchISD::REVB_2W)

    return SDValue();


  return DAG.getNode(LoongArchISD::BITREV_4B, SDLoc(N), N->getValueType(0),

                     Src.getOperand(0));

}


template <unsigned N>

static SDValue legalizeIntrinsicImmArg(SDNode *Node, unsigned ImmOp,

                                       SelectionDAG &DAG,

                                       const LoongArchSubtarget &Subtarget,

                                       bool IsSigned = false) {

  SDLoc DL(Node);

  auto *CImm = cast<ConstantSDNode>(Node->getOperand(ImmOp));

  // Check the ImmArg.

  if ((IsSigned && !isInt<N>(CImm->getSExtValue())) ||

      (!IsSigned && !isUInt<N>(CImm->getZExtValue()))) {

    DAG.getContext()->emitError(Node->getOperationName(0) +

                                ": argument out of range.");

    return DAG.getNode(ISD::UNDEF, DL, Subtarget.getGRLenVT());

  }

  return DAG.getConstant(CImm->getZExtValue(), DL, Subtarget.getGRLenVT());

}


template <unsigned N>

static SDValue lowerVectorSplatImm(SDNode *Node, unsigned ImmOp,

                                   SelectionDAG &DAG, bool IsSigned = false) {

  SDLoc DL(Node);

  EVT ResTy = Node->getValueType(0);

  auto *CImm = cast<ConstantSDNode>(Node->getOperand(ImmOp));


  // Check the ImmArg.

  if ((IsSigned && !isInt<N>(CImm->getSExtValue())) ||

      (!IsSigned && !isUInt<N>(CImm->getZExtValue()))) {

    DAG.getContext()->emitError(Node->getOperationName(0) +

                                ": argument out of range.");

    return DAG.getNode(ISD::UNDEF, DL, ResTy);

  }

  return DAG.getConstant(

      APInt(ResTy.getScalarType().getSizeInBits(),

            IsSigned ? CImm->getSExtValue() : CImm->getZExtValue(), IsSigned),

      DL, ResTy);

}


static SDValue truncateVecElts(SDNode *Node, SelectionDAG &DAG) {

  SDLoc DL(Node);

  EVT ResTy = Node->getValueType(0);

  SDValue Vec = Node->getOperand(2);

  SDValue Mask = DAG.getConstant(Vec.getScalarValueSizeInBits() - 1, DL, ResTy);

  return DAG.getNode(ISD::AND, DL, ResTy, Vec, Mask);

}


static SDValue lowerVectorBitClear(SDNode *Node, SelectionDAG &DAG) {

  SDLoc DL(Node);

  EVT ResTy = Node->getValueType(0);

  SDValue One = DAG.getConstant(1, DL, ResTy);

  SDValue Bit =

      DAG.getNode(ISD::SHL, DL, ResTy, One, truncateVecElts(Node, DAG));


  return DAG.getNode(ISD::AND, DL, ResTy, Node->getOperand(1),

                     DAG.getNOT(DL, Bit, ResTy));

}


template <unsigned N>

static SDValue lowerVectorBitClearImm(SDNode *Node, SelectionDAG &DAG) {

  SDLoc DL(Node);

  EVT ResTy = Node->getValueType(0);

  auto *CImm = cast<ConstantSDNode>(Node->getOperand(2));

  // Check the unsigned ImmArg.

  if (!isUInt<N>(CImm->getZExtValue())) {

    DAG.getContext()->emitError(Node->getOperationName(0) +

                                ": argument out of range.");

    return DAG.getNode(ISD::UNDEF, DL, ResTy);

  }


  APInt BitImm = APInt(ResTy.getScalarSizeInBits(), 1) << CImm->getAPIntValue();

  SDValue Mask = DAG.getConstant(~BitImm, DL, ResTy);


  return DAG.getNode(ISD::AND, DL, ResTy, Node->getOperand(1), Mask);

}


template <unsigned N>

static SDValue lowerVectorBitSetImm(SDNode *Node, SelectionDAG &DAG) {

  SDLoc DL(Node);

  EVT ResTy = Node->getValueType(0);

  auto *CImm = cast<ConstantSDNode>(Node->getOperand(2));

  // Check the unsigned ImmArg.

  if (!isUInt<N>(CImm->getZExtValue())) {

    DAG.getContext()->emitError(Node->getOperationName(0) +

                                ": argument out of range.");

    return DAG.getNode(ISD::UNDEF, DL, ResTy);

  }


  APInt Imm = APInt(ResTy.getScalarSizeInBits(), 1) << CImm->getAPIntValue();

  SDValue BitImm = DAG.getConstant(Imm, DL, ResTy);

  return DAG.getNode(ISD::OR, DL, ResTy, Node->getOperand(1), BitImm);

}


template <unsigned N>

static SDValue lowerVectorBitRevImm(SDNode *Node, SelectionDAG &DAG) {

  SDLoc DL(Node);

  EVT ResTy = Node->getValueType(0);

  auto *CImm = cast<ConstantSDNode>(Node->getOperand(2));

  // Check the unsigned ImmArg.

  if (!isUInt<N>(CImm->getZExtValue())) {

    DAG.getContext()->emitError(Node->getOperationName(0) +

                                ": argument out of range.");

    return DAG.getNode(ISD::UNDEF, DL, ResTy);

  }


  APInt Imm = APInt(ResTy.getScalarSizeInBits(), 1) << CImm->getAPIntValue();

  SDValue BitImm = DAG.getConstant(Imm, DL, ResTy);

  return DAG.getNode(ISD::XOR, DL, ResTy, Node->getOperand(1), BitImm);

}


static SDValue

performINTRINSIC_WO_CHAINCombine(SDNode *N, SelectionDAG &DAG,

                                 TargetLowering::DAGCombinerInfo &DCI,

                                 const LoongArchSubtarget &Subtarget) {

  SDLoc DL(N);

  switch (N->getConstantOperandVal(0)) {

  default:

    break;

  case Intrinsic::loongarch_lsx_vadd_b:

  case Intrinsic::loongarch_lsx_vadd_h:

  case Intrinsic::loongarch_lsx_vadd_w:

  case Intrinsic::loongarch_lsx_vadd_d:

  case Intrinsic::loongarch_lasx_xvadd_b:

  case Intrinsic::loongarch_lasx_xvadd_h:

  case Intrinsic::loongarch_lasx_xvadd_w:

  case Intrinsic::loongarch_lasx_xvadd_d:

    return DAG.getNode(ISD::ADD, DL, N->getValueType(0), N->getOperand(1),

                       N->getOperand(2));

  case Intrinsic::loongarch_lsx_vaddi_bu:

  case Intrinsic::loongarch_lsx_vaddi_hu:

  case Intrinsic::loongarch_lsx_vaddi_wu:

  case Intrinsic::loongarch_lsx_vaddi_du:

  case Intrinsic::loongarch_lasx_xvaddi_bu:

  case Intrinsic::loongarch_lasx_xvaddi_hu:

  case Intrinsic::loongarch_lasx_xvaddi_wu:

  case Intrinsic::loongarch_lasx_xvaddi_du:

    return DAG.getNode(ISD::ADD, DL, N->getValueType(0), N->getOperand(1),

                       lowerVectorSplatImm<5>(N, 2, DAG));

  case Intrinsic::loongarch_lsx_vsub_b:

  case Intrinsic::loongarch_lsx_vsub_h:

  case Intrinsic::loongarch_lsx_vsub_w:

  case Intrinsic::loongarch_lsx_vsub_d:

  case Intrinsic::loongarch_lasx_xvsub_b:

  case Intrinsic::loongarch_lasx_xvsub_h:

  case Intrinsic::loongarch_lasx_xvsub_w:

  case Intrinsic::loongarch_lasx_xvsub_d:

    return DAG.getNode(ISD::SUB, DL, N->getValueType(0), N->getOperand(1),

                       N->getOperand(2));

  case Intrinsic::loongarch_lsx_vsubi_bu:

  case Intrinsic::loongarch_lsx_vsubi_hu:

  case Intrinsic::loongarch_lsx_vsubi_wu:

  case Intrinsic::loongarch_lsx_vsubi_du:

  case Intrinsic::loongarch_lasx_xvsubi_bu:

  case Intrinsic::loongarch_lasx_xvsubi_hu:

  case Intrinsic::loongarch_lasx_xvsubi_wu:

  case Intrinsic::loongarch_lasx_xvsubi_du:

    return DAG.getNode(ISD::SUB, DL, N->getValueType(0), N->getOperand(1),

                       lowerVectorSplatImm<5>(N, 2, DAG));

  case Intrinsic::loongarch_lsx_vneg_b:

  case Intrinsic::loongarch_lsx_vneg_h:

  case Intrinsic::loongarch_lsx_vneg_w:

  case Intrinsic::loongarch_lsx_vneg_d:

  case Intrinsic::loongarch_lasx_xvneg_b:

  case Intrinsic::loongarch_lasx_xvneg_h:

  case Intrinsic::loongarch_lasx_xvneg_w:

  case Intrinsic::loongarch_lasx_xvneg_d:

    return DAG.getNode(

        ISD::SUB, DL, N->getValueType(0),

        DAG.getConstant(

            APInt(N->getValueType(0).getScalarType().getSizeInBits(), 0,

                  /*isSigned=*/true),

            SDLoc(N), N->getValueType(0)),

        N->getOperand(1));

  case Intrinsic::loongarch_lsx_vmax_b:

  case Intrinsic::loongarch_lsx_vmax_h:

  case Intrinsic::loongarch_lsx_vmax_w:

  case Intrinsic::loongarch_lsx_vmax_d:

  case Intrinsic::loongarch_lasx_xvmax_b:

  case Intrinsic::loongarch_lasx_xvmax_h:

  case Intrinsic::loongarch_lasx_xvmax_w:

  case Intrinsic::loongarch_lasx_xvmax_d:

    return DAG.getNode(ISD::SMAX, DL, N->getValueType(0), N->getOperand(1),

                       N->getOperand(2));

  case Intrinsic::loongarch_lsx_vmax_bu:

  case Intrinsic::loongarch_lsx_vmax_hu:

  case Intrinsic::loongarch_lsx_vmax_wu:

  case Intrinsic::loongarch_lsx_vmax_du:

  case Intrinsic::loongarch_lasx_xvmax_bu:

  case Intrinsic::loongarch_lasx_xvmax_hu:

  case Intrinsic::loongarch_lasx_xvmax_wu:

  case Intrinsic::loongarch_lasx_xvmax_du:

    return DAG.getNode(ISD::UMAX, DL, N->getValueType(0), N->getOperand(1),

                       N->getOperand(2));

  case Intrinsic::loongarch_lsx_vmaxi_b:

  case Intrinsic::loongarch_lsx_vmaxi_h:

  case Intrinsic::loongarch_lsx_vmaxi_w:

  case Intrinsic::loongarch_lsx_vmaxi_d:

  case Intrinsic::loongarch_lasx_xvmaxi_b:

  case Intrinsic::loongarch_lasx_xvmaxi_h:

  case Intrinsic::loongarch_lasx_xvmaxi_w:

  case Intrinsic::loongarch_lasx_xvmaxi_d:

    return DAG.getNode(ISD::SMAX, DL, N->getValueType(0), N->getOperand(1),

                       lowerVectorSplatImm<5>(N, 2, DAG, /*IsSigned=*/true));

  case Intrinsic::loongarch_lsx_vmaxi_bu:

  case Intrinsic::loongarch_lsx_vmaxi_hu:

  case Intrinsic::loongarch_lsx_vmaxi_wu:

  case Intrinsic::loongarch_lsx_vmaxi_du:

  case Intrinsic::loongarch_lasx_xvmaxi_bu:

  case Intrinsic::loongarch_lasx_xvmaxi_hu:

  case Intrinsic::loongarch_lasx_xvmaxi_wu:

  case Intrinsic::loongarch_lasx_xvmaxi_du:

    return DAG.getNode(ISD::UMAX, DL, N->getValueType(0), N->getOperand(1),

                       lowerVectorSplatImm<5>(N, 2, DAG));

  case Intrinsic::loongarch_lsx_vmin_b:

  case Intrinsic::loongarch_lsx_vmin_h:

  case Intrinsic::loongarch_lsx_vmin_w:

  case Intrinsic::loongarch_lsx_vmin_d:

  case Intrinsic::loongarch_lasx_xvmin_b:

  case Intrinsic::loongarch_lasx_xvmin_h:

  case Intrinsic::loongarch_lasx_xvmin_w:

  case Intrinsic::loongarch_lasx_xvmin_d:

    return DAG.getNode(ISD::SMIN, DL, N->getValueType(0), N->getOperand(1),

                       N->getOperand(2));

  case Intrinsic::loongarch_lsx_vmin_bu:

  case Intrinsic::loongarch_lsx_vmin_hu:

  case Intrinsic::loongarch_lsx_vmin_wu:

  case Intrinsic::loongarch_lsx_vmin_du:

  case Intrinsic::loongarch_lasx_xvmin_bu:

  case Intrinsic::loongarch_lasx_xvmin_hu:

  case Intrinsic::loongarch_lasx_xvmin_wu:

  case Intrinsic::loongarch_lasx_xvmin_du:

    return DAG.getNode(ISD::UMIN, DL, N->getValueType(0), N->getOperand(1),

                       N->getOperand(2));

  case Intrinsic::loongarch_lsx_vmini_b:

  case Intrinsic::loongarch_lsx_vmini_h:

  case Intrinsic::loongarch_lsx_vmini_w:

  case Intrinsic::loongarch_lsx_vmini_d:

  case Intrinsic::loongarch_lasx_xvmini_b:

  case Intrinsic::loongarch_lasx_xvmini_h:

  case Intrinsic::loongarch_lasx_xvmini_w:

  case Intrinsic::loongarch_lasx_xvmini_d:

    return DAG.getNode(ISD::SMIN, DL, N->getValueType(0), N->getOperand(1),

                       lowerVectorSplatImm<5>(N, 2, DAG, /*IsSigned=*/true));

  case Intrinsic::loongarch_lsx_vmini_bu:

  case Intrinsic::loongarch_lsx_vmini_hu:

  case Intrinsic::loongarch_lsx_vmini_wu:

  case Intrinsic::loongarch_lsx_vmini_du:

  case Intrinsic::loongarch_lasx_xvmini_bu:

  case Intrinsic::loongarch_lasx_xvmini_hu:

  case Intrinsic::loongarch_lasx_xvmini_wu:

  case Intrinsic::loongarch_lasx_xvmini_du:

    return DAG.getNode(ISD::UMIN, DL, N->getValueType(0), N->getOperand(1),

                       lowerVectorSplatImm<5>(N, 2, DAG));

  case Intrinsic::loongarch_lsx_vmul_b:

  case Intrinsic::loongarch_lsx_vmul_h:

  case Intrinsic::loongarch_lsx_vmul_w:

  case Intrinsic::loongarch_lsx_vmul_d:

  case Intrinsic::loongarch_lasx_xvmul_b:

  case Intrinsic::loongarch_lasx_xvmul_h:

  case Intrinsic::loongarch_lasx_xvmul_w:

  case Intrinsic::loongarch_lasx_xvmul_d:

    return DAG.getNode(ISD::MUL, DL, N->getValueType(0), N->getOperand(1),

                       N->getOperand(2));

  case Intrinsic::loongarch_lsx_vmadd_b:

  case Intrinsic::loongarch_lsx_vmadd_h:

  case Intrinsic::loongarch_lsx_vmadd_w:

  case Intrinsic::loongarch_lsx_vmadd_d:

  case Intrinsic::loongarch_lasx_xvmadd_b:

  case Intrinsic::loongarch_lasx_xvmadd_h:

  case Intrinsic::loongarch_lasx_xvmadd_w:

  case Intrinsic::loongarch_lasx_xvmadd_d: {

    EVT ResTy = N->getValueType(0);

    return DAG.getNode(ISD::ADD, SDLoc(N), ResTy, N->getOperand(1),

                       DAG.getNode(ISD::MUL, SDLoc(N), ResTy, N->getOperand(2),

                                   N->getOperand(3)));

  }

  case Intrinsic::loongarch_lsx_vmsub_b:

  case Intrinsic::loongarch_lsx_vmsub_h:

  case Intrinsic::loongarch_lsx_vmsub_w:

  case Intrinsic::loongarch_lsx_vmsub_d:

  case Intrinsic::loongarch_lasx_xvmsub_b:

  case Intrinsic::loongarch_lasx_xvmsub_h:

  case Intrinsic::loongarch_lasx_xvmsub_w:

  case Intrinsic::loongarch_lasx_xvmsub_d: {

    EVT ResTy = N->getValueType(0);

    return DAG.getNode(ISD::SUB, SDLoc(N), ResTy, N->getOperand(1),

                       DAG.getNode(ISD::MUL, SDLoc(N), ResTy, N->getOperand(2),

                                   N->getOperand(3)));

  }

  case Intrinsic::loongarch_lsx_vdiv_b:

  case Intrinsic::loongarch_lsx_vdiv_h:

  case Intrinsic::loongarch_lsx_vdiv_w:

  case Intrinsic::loongarch_lsx_vdiv_d:

  case Intrinsic::loongarch_lasx_xvdiv_b:

  case Intrinsic::loongarch_lasx_xvdiv_h:

  case Intrinsic::loongarch_lasx_xvdiv_w:

  case Intrinsic::loongarch_lasx_xvdiv_d:

    return DAG.getNode(ISD::SDIV, DL, N->getValueType(0), N->getOperand(1),

                       N->getOperand(2));

  case Intrinsic::loongarch_lsx_vdiv_bu:

  case Intrinsic::loongarch_lsx_vdiv_hu:

  case Intrinsic::loongarch_lsx_vdiv_wu:

  case Intrinsic::loongarch_lsx_vdiv_du:

  case Intrinsic::loongarch_lasx_xvdiv_bu:

  case Intrinsic::loongarch_lasx_xvdiv_hu:

  case Intrinsic::loongarch_lasx_xvdiv_wu:

  case Intrinsic::loongarch_lasx_xvdiv_du:

    return DAG.getNode(ISD::UDIV, DL, N->getValueType(0), N->getOperand(1),

                       N->getOperand(2));

  case Intrinsic::loongarch_lsx_vmod_b:

  case Intrinsic::loongarch_lsx_vmod_h:

  case Intrinsic::loongarch_lsx_vmod_w:

  case Intrinsic::loongarch_lsx_vmod_d:

  case Intrinsic::loongarch_lasx_xvmod_b:

  case Intrinsic::loongarch_lasx_xvmod_h:

  case Intrinsic::loongarch_lasx_xvmod_w:

  case Intrinsic::loongarch_lasx_xvmod_d:

    return DAG.getNode(ISD::SREM, DL, N->getValueType(0), N->getOperand(1),

                       N->getOperand(2));

  case Intrinsic::loongarch_lsx_vmod_bu:

  case Intrinsic::loongarch_lsx_vmod_hu:

  case Intrinsic::loongarch_lsx_vmod_wu:

  case Intrinsic::loongarch_lsx_vmod_du:

  case Intrinsic::loongarch_lasx_xvmod_bu:

  case Intrinsic::loongarch_lasx_xvmod_hu:

  case Intrinsic::loongarch_lasx_xvmod_wu:

  case Intrinsic::loongarch_lasx_xvmod_du:

    return DAG.getNode(ISD::UREM, DL, N->getValueType(0), N->getOperand(1),

                       N->getOperand(2));

  case Intrinsic::loongarch_lsx_vand_v:

  case Intrinsic::loongarch_lasx_xvand_v:

    return DAG.getNode(ISD::AND, DL, N->getValueType(0), N->getOperand(1),

                       N->getOperand(2));

  case Intrinsic::loongarch_lsx_vor_v:

  case Intrinsic::loongarch_lasx_xvor_v:

    return DAG.getNode(ISD::OR, DL, N->getValueType(0), N->getOperand(1),

                       N->getOperand(2));

  case Intrinsic::loongarch_lsx_vxor_v:

  case Intrinsic::loongarch_lasx_xvxor_v:

    return DAG.getNode(ISD::XOR, DL, N->getValueType(0), N->getOperand(1),

                       N->getOperand(2));

  case Intrinsic::loongarch_lsx_vnor_v:

  case Intrinsic::loongarch_lasx_xvnor_v: {

    SDValue Res = DAG.getNode(ISD::OR, DL, N->getValueType(0), N->getOperand(1),

                              N->getOperand(2));

    return DAG.getNOT(DL, Res, Res->getValueType(0));

  }

  case Intrinsic::loongarch_lsx_vandi_b:

  case Intrinsic::loongarch_lasx_xvandi_b:

    return DAG.getNode(ISD::AND, DL, N->getValueType(0), N->getOperand(1),

                       lowerVectorSplatImm<8>(N, 2, DAG));

  case Intrinsic::loongarch_lsx_vori_b:

  case Intrinsic::loongarch_lasx_xvori_b:

    return DAG.getNode(ISD::OR, DL, N->getValueType(0), N->getOperand(1),

                       lowerVectorSplatImm<8>(N, 2, DAG));

  case Intrinsic::loongarch_lsx_vxori_b:

  case Intrinsic::loongarch_lasx_xvxori_b:

    return DAG.getNode(ISD::XOR, DL, N->getValueType(0), N->getOperand(1),

                       lowerVectorSplatImm<8>(N, 2, DAG));

  case Intrinsic::loongarch_lsx_vsll_b:

  case Intrinsic::loongarch_lsx_vsll_h:

  case Intrinsic::loongarch_lsx_vsll_w:

  case Intrinsic::loongarch_lsx_vsll_d:

  case Intrinsic::loongarch_lasx_xvsll_b:

  case Intrinsic::loongarch_lasx_xvsll_h:

  case Intrinsic::loongarch_lasx_xvsll_w:

  case Intrinsic::loongarch_lasx_xvsll_d:

    return DAG.getNode(ISD::SHL, DL, N->getValueType(0), N->getOperand(1),

                       truncateVecElts(N, DAG));

  case Intrinsic::loongarch_lsx_vslli_b:

  case Intrinsic::loongarch_lasx_xvslli_b:

    return DAG.getNode(ISD::SHL, DL, N->getValueType(0), N->getOperand(1),

                       lowerVectorSplatImm<3>(N, 2, DAG));

  case Intrinsic::loongarch_lsx_vslli_h:

  case Intrinsic::loongarch_lasx_xvslli_h:

    return DAG.getNode(ISD::SHL, DL, N->getValueType(0), N->getOperand(1),

                       lowerVectorSplatImm<4>(N, 2, DAG));

  case Intrinsic::loongarch_lsx_vslli_w:

  case Intrinsic::loongarch_lasx_xvslli_w:

    return DAG.getNode(ISD::SHL, DL, N->getValueType(0), N->getOperand(1),

                       lowerVectorSplatImm<5>(N, 2, DAG));

  case Intrinsic::loongarch_lsx_vslli_d:

  case Intrinsic::loongarch_lasx_xvslli_d:

    return DAG.getNode(ISD::SHL, DL, N->getValueType(0), N->getOperand(1),

                       lowerVectorSplatImm<6>(N, 2, DAG));

  case Intrinsic::loongarch_lsx_vsrl_b:

  case Intrinsic::loongarch_lsx_vsrl_h:

  case Intrinsic::loongarch_lsx_vsrl_w:

  case Intrinsic::loongarch_lsx_vsrl_d:

  case Intrinsic::loongarch_lasx_xvsrl_b:

  case Intrinsic::loongarch_lasx_xvsrl_h:

  case Intrinsic::loongarch_lasx_xvsrl_w:

  case Intrinsic::loongarch_lasx_xvsrl_d:

    return DAG.getNode(ISD::SRL, DL, N->getValueType(0), N->getOperand(1),

                       truncateVecElts(N, DAG));

  case Intrinsic::loongarch_lsx_vsrli_b:

  case Intrinsic::loongarch_lasx_xvsrli_b:

    return DAG.getNode(ISD::SRL, DL, N->getValueType(0), N->getOperand(1),

                       lowerVectorSplatImm<3>(N, 2, DAG));

  case Intrinsic::loongarch_lsx_vsrli_h:

  case Intrinsic::loongarch_lasx_xvsrli_h:

    return DAG.getNode(ISD::SRL, DL, N->getValueType(0), N->getOperand(1),

                       lowerVectorSplatImm<4>(N, 2, DAG));

  case Intrinsic::loongarch_lsx_vsrli_w:

  case Intrinsic::loongarch_lasx_xvsrli_w:

    return DAG.getNode(ISD::SRL, DL, N->getValueType(0), N->getOperand(1),

                       lowerVectorSplatImm<5>(N, 2, DAG));

  case Intrinsic::loongarch_lsx_vsrli_d:

  case Intrinsic::loongarch_lasx_xvsrli_d:

    return DAG.getNode(ISD::SRL, DL, N->getValueType(0), N->getOperand(1),

                       lowerVectorSplatImm<6>(N, 2, DAG));

  case Intrinsic::loongarch_lsx_vsra_b:

  case Intrinsic::loongarch_lsx_vsra_h:

  case Intrinsic::loongarch_lsx_vsra_w:

  case Intrinsic::loongarch_lsx_vsra_d:

  case Intrinsic::loongarch_lasx_xvsra_b:

  case Intrinsic::loongarch_lasx_xvsra_h:

  case Intrinsic::loongarch_lasx_xvsra_w:

  case Intrinsic::loongarch_lasx_xvsra_d:

    return DAG.getNode(ISD::SRA, DL, N->getValueType(0), N->getOperand(1),

                       truncateVecElts(N, DAG));

  case Intrinsic::loongarch_lsx_vsrai_b:

  case Intrinsic::loongarch_lasx_xvsrai_b:

    return DAG.getNode(ISD::SRA, DL, N->getValueType(0), N->getOperand(1),

                       lowerVectorSplatImm<3>(N, 2, DAG));

  case Intrinsic::loongarch_lsx_vsrai_h:

  case Intrinsic::loongarch_lasx_xvsrai_h:

    return DAG.getNode(ISD::SRA, DL, N->getValueType(0), N->getOperand(1),

                       lowerVectorSplatImm<4>(N, 2, DAG));

  case Intrinsic::loongarch_lsx_vsrai_w:

  case Intrinsic::loongarch_lasx_xvsrai_w:

    return DAG.getNode(ISD::SRA, DL, N->getValueType(0), N->getOperand(1),

                       lowerVectorSplatImm<5>(N, 2, DAG));

  case Intrinsic::loongarch_lsx_vsrai_d:

  case Intrinsic::loongarch_lasx_xvsrai_d:

    return DAG.getNode(ISD::SRA, DL, N->getValueType(0), N->getOperand(1),

                       lowerVectorSplatImm<6>(N, 2, DAG));

  case Intrinsic::loongarch_lsx_vclz_b:

  case Intrinsic::loongarch_lsx_vclz_h:

  case Intrinsic::loongarch_lsx_vclz_w:

  case Intrinsic::loongarch_lsx_vclz_d:

  case Intrinsic::loongarch_lasx_xvclz_b:

  case Intrinsic::loongarch_lasx_xvclz_h:

  case Intrinsic::loongarch_lasx_xvclz_w:

  case Intrinsic::loongarch_lasx_xvclz_d:

    return DAG.getNode(ISD::CTLZ, DL, N->getValueType(0), N->getOperand(1));

  case Intrinsic::loongarch_lsx_vpcnt_b:

  case Intrinsic::loongarch_lsx_vpcnt_h:

  case Intrinsic::loongarch_lsx_vpcnt_w:

  case Intrinsic::loongarch_lsx_vpcnt_d:

  case Intrinsic::loongarch_lasx_xvpcnt_b:

  case Intrinsic::loongarch_lasx_xvpcnt_h:

  case Intrinsic::loongarch_lasx_xvpcnt_w:

  case Intrinsic::loongarch_lasx_xvpcnt_d:

    return DAG.getNode(ISD::CTPOP, DL, N->getValueType(0), N->getOperand(1));

  case Intrinsic::loongarch_lsx_vbitclr_b:

  case Intrinsic::loongarch_lsx_vbitclr_h:

  case Intrinsic::loongarch_lsx_vbitclr_w:

  case Intrinsic::loongarch_lsx_vbitclr_d:

  case Intrinsic::loongarch_lasx_xvbitclr_b:

  case Intrinsic::loongarch_lasx_xvbitclr_h:

  case Intrinsic::loongarch_lasx_xvbitclr_w:

  case Intrinsic::loongarch_lasx_xvbitclr_d:

    return lowerVectorBitClear(N, DAG);

  case Intrinsic::loongarch_lsx_vbitclri_b:

  case Intrinsic::loongarch_lasx_xvbitclri_b:

    return lowerVectorBitClearImm<3>(N, DAG);

  case Intrinsic::loongarch_lsx_vbitclri_h:

  case Intrinsic::loongarch_lasx_xvbitclri_h:

    return lowerVectorBitClearImm<4>(N, DAG);

  case Intrinsic::loongarch_lsx_vbitclri_w:

  case Intrinsic::loongarch_lasx_xvbitclri_w:

    return lowerVectorBitClearImm<5>(N, DAG);

  case Intrinsic::loongarch_lsx_vbitclri_d:

  case Intrinsic::loongarch_lasx_xvbitclri_d:

    return lowerVectorBitClearImm<6>(N, DAG);

  case Intrinsic::loongarch_lsx_vbitset_b:

  case Intrinsic::loongarch_lsx_vbitset_h:

  case Intrinsic::loongarch_lsx_vbitset_w:

  case Intrinsic::loongarch_lsx_vbitset_d:

  case Intrinsic::loongarch_lasx_xvbitset_b:

  case Intrinsic::loongarch_lasx_xvbitset_h:

  case Intrinsic::loongarch_lasx_xvbitset_w:

  case Intrinsic::loongarch_lasx_xvbitset_d: {

    EVT VecTy = N->getValueType(0);

    SDValue One = DAG.getConstant(1, DL, VecTy);

    return DAG.getNode(

        ISD::OR, DL, VecTy, N->getOperand(1),

        DAG.getNode(ISD::SHL, DL, VecTy, One, truncateVecElts(N, DAG)));

  }

  case Intrinsic::loongarch_lsx_vbitseti_b:

  case Intrinsic::loongarch_lasx_xvbitseti_b:

    return lowerVectorBitSetImm<3>(N, DAG);

  case Intrinsic::loongarch_lsx_vbitseti_h:

  case Intrinsic::loongarch_lasx_xvbitseti_h:

    return lowerVectorBitSetImm<4>(N, DAG);

  case Intrinsic::loongarch_lsx_vbitseti_w:

  case Intrinsic::loongarch_lasx_xvbitseti_w:

    return lowerVectorBitSetImm<5>(N, DAG);

  case Intrinsic::loongarch_lsx_vbitseti_d:

  case Intrinsic::loongarch_lasx_xvbitseti_d:

    return lowerVectorBitSetImm<6>(N, DAG);

  case Intrinsic::loongarch_lsx_vbitrev_b:

  case Intrinsic::loongarch_lsx_vbitrev_h:

  case Intrinsic::loongarch_lsx_vbitrev_w:

  case Intrinsic::loongarch_lsx_vbitrev_d:

  case Intrinsic::loongarch_lasx_xvbitrev_b:

  case Intrinsic::loongarch_lasx_xvbitrev_h:

  case Intrinsic::loongarch_lasx_xvbitrev_w:

  case Intrinsic::loongarch_lasx_xvbitrev_d: {

    EVT VecTy = N->getValueType(0);

    SDValue One = DAG.getConstant(1, DL, VecTy);

    return DAG.getNode(

        ISD::XOR, DL, VecTy, N->getOperand(1),

        DAG.getNode(ISD::SHL, DL, VecTy, One, truncateVecElts(N, DAG)));

  }

  case Intrinsic::loongarch_lsx_vbitrevi_b:

  case Intrinsic::loongarch_lasx_xvbitrevi_b:

    return lowerVectorBitRevImm<3>(N, DAG);

  case Intrinsic::loongarch_lsx_vbitrevi_h:

  case Intrinsic::loongarch_lasx_xvbitrevi_h:

    return lowerVectorBitRevImm<4>(N, DAG);

  case Intrinsic::loongarch_lsx_vbitrevi_w:

  case Intrinsic::loongarch_lasx_xvbitrevi_w:

    return lowerVectorBitRevImm<5>(N, DAG);

  case Intrinsic::loongarch_lsx_vbitrevi_d:

  case Intrinsic::loongarch_lasx_xvbitrevi_d:

    return lowerVectorBitRevImm<6>(N, DAG);

  case Intrinsic::loongarch_lsx_vfadd_s:

  case Intrinsic::loongarch_lsx_vfadd_d:

  case Intrinsic::loongarch_lasx_xvfadd_s:

  case Intrinsic::loongarch_lasx_xvfadd_d:

    return DAG.getNode(ISD::FADD, DL, N->getValueType(0), N->getOperand(1),

                       N->getOperand(2));

  case Intrinsic::loongarch_lsx_vfsub_s:

  case Intrinsic::loongarch_lsx_vfsub_d:

  case Intrinsic::loongarch_lasx_xvfsub_s:

  case Intrinsic::loongarch_lasx_xvfsub_d:

    return DAG.getNode(ISD::FSUB, DL, N->getValueType(0), N->getOperand(1),

                       N->getOperand(2));

  case Intrinsic::loongarch_lsx_vfmul_s:

  case Intrinsic::loongarch_lsx_vfmul_d:

  case Intrinsic::loongarch_lasx_xvfmul_s:

  case Intrinsic::loongarch_lasx_xvfmul_d:

    return DAG.getNode(ISD::FMUL, DL, N->getValueType(0), N->getOperand(1),

                       N->getOperand(2));

  case Intrinsic::loongarch_lsx_vfdiv_s:

  case Intrinsic::loongarch_lsx_vfdiv_d:

  case Intrinsic::loongarch_lasx_xvfdiv_s:

  case Intrinsic::loongarch_lasx_xvfdiv_d:

    return DAG.getNode(ISD::FDIV, DL, N->getValueType(0), N->getOperand(1),

                       N->getOperand(2));

  case Intrinsic::loongarch_lsx_vfmadd_s:

  case Intrinsic::loongarch_lsx_vfmadd_d:

  case Intrinsic::loongarch_lasx_xvfmadd_s:

  case Intrinsic::loongarch_lasx_xvfmadd_d:

    return DAG.getNode(ISD::FMA, DL, N->getValueType(0), N->getOperand(1),

                       N->getOperand(2), N->getOperand(3));

  case Intrinsic::loongarch_lsx_vinsgr2vr_b:

    return DAG.getNode(ISD::INSERT_VECTOR_ELT, SDLoc(N), N->getValueType(0),

                       N->getOperand(1), N->getOperand(2),

                       legalizeIntrinsicImmArg<4>(N, 3, DAG, Subtarget));

  case Intrinsic::loongarch_lsx_vinsgr2vr_h:

  case Intrinsic::loongarch_lasx_xvinsgr2vr_w:

    return DAG.getNode(ISD::INSERT_VECTOR_ELT, SDLoc(N), N->getValueType(0),

                       N->getOperand(1), N->getOperand(2),

                       legalizeIntrinsicImmArg<3>(N, 3, DAG, Subtarget));

  case Intrinsic::loongarch_lsx_vinsgr2vr_w:

  case Intrinsic::loongarch_lasx_xvinsgr2vr_d:

    return DAG.getNode(ISD::INSERT_VECTOR_ELT, SDLoc(N), N->getValueType(0),

                       N->getOperand(1), N->getOperand(2),

                       legalizeIntrinsicImmArg<2>(N, 3, DAG, Subtarget));

  case Intrinsic::loongarch_lsx_vinsgr2vr_d:

    return DAG.getNode(ISD::INSERT_VECTOR_ELT, SDLoc(N), N->getValueType(0),

                       N->getOperand(1), N->getOperand(2),

                       legalizeIntrinsicImmArg<1>(N, 3, DAG, Subtarget));

  case Intrinsic::loongarch_lsx_vreplgr2vr_b:

  case Intrinsic::loongarch_lsx_vreplgr2vr_h:

  case Intrinsic::loongarch_lsx_vreplgr2vr_w:

  case Intrinsic::loongarch_lsx_vreplgr2vr_d:

  case Intrinsic::loongarch_lasx_xvreplgr2vr_b:

  case Intrinsic::loongarch_lasx_xvreplgr2vr_h:

  case Intrinsic::loongarch_lasx_xvreplgr2vr_w:

  case Intrinsic::loongarch_lasx_xvreplgr2vr_d:

    return DAG.getNode(LoongArchISD::VREPLGR2VR, DL, N->getValueType(0),

                       DAG.getNode(ISD::ANY_EXTEND, DL, Subtarget.getGRLenVT(),

                                   N->getOperand(1)));

  case Intrinsic::loongarch_lsx_vreplve_b:

  case Intrinsic::loongarch_lsx_vreplve_h:

  case Intrinsic::loongarch_lsx_vreplve_w:

  case Intrinsic::loongarch_lsx_vreplve_d:

  case Intrinsic::loongarch_lasx_xvreplve_b:

  case Intrinsic::loongarch_lasx_xvreplve_h:

  case Intrinsic::loongarch_lasx_xvreplve_w:

  case Intrinsic::loongarch_lasx_xvreplve_d:

    return DAG.getNode(LoongArchISD::VREPLVE, DL, N->getValueType(0),

                       N->getOperand(1),

                       DAG.getNode(ISD::ANY_EXTEND, DL, Subtarget.getGRLenVT(),

                                   N->getOperand(2)));

  }

  return SDValue();

}


SDValue LoongArchTargetLowering::PerformDAGCombine(SDNode *N,

                                                   DAGCombinerInfo &DCI) const {

  SelectionDAG &DAG = DCI.DAG;

  switch (N->getOpcode()) {

  default:

    break;

  case ISD::AND:

    return performANDCombine(N, DAG, DCI, Subtarget);

  case ISD::OR:

    return performORCombine(N, DAG, DCI, Subtarget);

  case ISD::SETCC:

    return performSETCCCombine(N, DAG, DCI, Subtarget);

  case ISD::SRL:

    return performSRLCombine(N, DAG, DCI, Subtarget);

  case LoongArchISD::BITREV_W:

    return performBITREV_WCombine(N, DAG, DCI, Subtarget);

  case ISD::INTRINSIC_WO_CHAIN:

    return performINTRINSIC_WO_CHAINCombine(N, DAG, DCI, Subtarget);

  }

  return SDValue();

}


static MachineBasicBlock *insertDivByZeroTrap(MachineInstr &MI,

                                              MachineBasicBlock *MBB) {

  if (!ZeroDivCheck)

    return MBB;


  // Build instructions:

  // MBB:

  //   div(or mod)   $dst, $dividend, $divisor

  //   bnez          $divisor, SinkMBB

  // BreakMBB:

  //   break         7 // BRK_DIVZERO

  // SinkMBB:

  //   fallthrough

  const BasicBlock *LLVM_BB = MBB->getBasicBlock();

  MachineFunction::iterator It = ++MBB->getIterator();

  MachineFunction *MF = MBB->getParent();

  auto BreakMBB = MF->CreateMachineBasicBlock(LLVM_BB);

  auto SinkMBB = MF->CreateMachineBasicBlock(LLVM_BB);

  MF->insert(It, BreakMBB);

  MF->insert(It, SinkMBB);


  // Transfer the remainder of MBB and its successor edges to SinkMBB.

  SinkMBB->splice(SinkMBB->end(), MBB, std::next(MI.getIterator()), MBB->end());

  SinkMBB->transferSuccessorsAndUpdatePHIs(MBB);


  const TargetInstrInfo &TII = *MF->getSubtarget().getInstrInfo();

  DebugLoc DL = MI.getDebugLoc();

  MachineOperand &Divisor = MI.getOperand(2);

  Register DivisorReg = Divisor.getReg();


  // MBB:

  BuildMI(MBB, DL, TII.get(LoongArch::BNEZ))

      .addReg(DivisorReg, getKillRegState(Divisor.isKill()))

      .addMBB(SinkMBB);

  MBB->addSuccessor(BreakMBB);

  MBB->addSuccessor(SinkMBB);


  // BreakMBB:

  // See linux header file arch/loongarch/include/uapi/asm/break.h for the

  // definition of BRK_DIVZERO.

  BuildMI(BreakMBB, DL, TII.get(LoongArch::BREAK)).addImm(7 /*BRK_DIVZERO*/);

  BreakMBB->addSuccessor(SinkMBB);


  // Clear Divisor's kill flag.

  Divisor.setIsKill(false);


  return SinkMBB;

}


static MachineBasicBlock *

emitVecCondBranchPseudo(MachineInstr &MI, MachineBasicBlock *BB,

                        const LoongArchSubtarget &Subtarget) {

  unsigned CondOpc;

  switch (MI.getOpcode()) {

  default:

    llvm_unreachable("Unexpected opcode");

  case LoongArch::PseudoVBZ:

    CondOpc = LoongArch::VSETEQZ_V;

    break;

  case LoongArch::PseudoVBZ_B:

    CondOpc = LoongArch::VSETANYEQZ_B;

    break;

  case LoongArch::PseudoVBZ_H:

    CondOpc = LoongArch::VSETANYEQZ_H;

    break;

  case LoongArch::PseudoVBZ_W:

    CondOpc = LoongArch::VSETANYEQZ_W;

    break;

  case LoongArch::PseudoVBZ_D:

    CondOpc = LoongArch::VSETANYEQZ_D;

    break;

  case LoongArch::PseudoVBNZ:

    CondOpc = LoongArch::VSETNEZ_V;

    break;

  case LoongArch::PseudoVBNZ_B:

    CondOpc = LoongArch::VSETALLNEZ_B;

    break;

  case LoongArch::PseudoVBNZ_H:

    CondOpc = LoongArch::VSETALLNEZ_H;

    break;

  case LoongArch::PseudoVBNZ_W:

    CondOpc = LoongArch::VSETALLNEZ_W;

    break;

  case LoongArch::PseudoVBNZ_D:

    CondOpc = LoongArch::VSETALLNEZ_D;

    break;

  case LoongArch::PseudoXVBZ:

    CondOpc = LoongArch::XVSETEQZ_V;

    break;

  case LoongArch::PseudoXVBZ_B:

    CondOpc = LoongArch::XVSETANYEQZ_B;

    break;

  case LoongArch::PseudoXVBZ_H:

    CondOpc = LoongArch::XVSETANYEQZ_H;

    break;

  case LoongArch::PseudoXVBZ_W:

    CondOpc = LoongArch::XVSETANYEQZ_W;

    break;

  case LoongArch::PseudoXVBZ_D:

    CondOpc = LoongArch::XVSETANYEQZ_D;

    break;

  case LoongArch::PseudoXVBNZ:

    CondOpc = LoongArch::XVSETNEZ_V;

    break;

  case LoongArch::PseudoXVBNZ_B:

    CondOpc = LoongArch::XVSETALLNEZ_B;

    break;

  case LoongArch::PseudoXVBNZ_H:

    CondOpc = LoongArch::XVSETALLNEZ_H;

    break;

  case LoongArch::PseudoXVBNZ_W:

    CondOpc = LoongArch::XVSETALLNEZ_W;

    break;

  case LoongArch::PseudoXVBNZ_D:

    CondOpc = LoongArch::XVSETALLNEZ_D;

    break;

  }


  const TargetInstrInfo *TII = Subtarget.getInstrInfo();

  const BasicBlock *LLVM_BB = BB->getBasicBlock();

  DebugLoc DL = MI.getDebugLoc();

  MachineRegisterInfo &MRI = BB->getParent()->getRegInfo();

  MachineFunction::iterator It = ++BB->getIterator();


  MachineFunction *F = BB->getParent();

  MachineBasicBlock *FalseBB = F->CreateMachineBasicBlock(LLVM_BB);

  MachineBasicBlock *TrueBB = F->CreateMachineBasicBlock(LLVM_BB);

  MachineBasicBlock *SinkBB = F->CreateMachineBasicBlock(LLVM_BB);


  F->insert(It, FalseBB);

  F->insert(It, TrueBB);

  F->insert(It, SinkBB);


  // Transfer the remainder of MBB and its successor edges to Sink.

  SinkBB->splice(SinkBB->end(), BB, std::next(MI.getIterator()), BB->end());

  SinkBB->transferSuccessorsAndUpdatePHIs(BB);


  // Insert the real instruction to BB.

  Register FCC = MRI.createVirtualRegister(&LoongArch::CFRRegClass);

  BuildMI(BB, DL, TII->get(CondOpc), FCC).addReg(MI.getOperand(1).getReg());


  // Insert branch.

  BuildMI(BB, DL, TII->get(LoongArch::BCNEZ)).addReg(FCC).addMBB(TrueBB);

  BB->addSuccessor(FalseBB);

  BB->addSuccessor(TrueBB);


  // FalseBB.

  Register RD1 = MRI.createVirtualRegister(&LoongArch::GPRRegClass);

  BuildMI(FalseBB, DL, TII->get(LoongArch::ADDI_W), RD1)

      .addReg(LoongArch::R0)

      .addImm(0);

  BuildMI(FalseBB, DL, TII->get(LoongArch::PseudoBR)).addMBB(SinkBB);

  FalseBB->addSuccessor(SinkBB);


  // TrueBB.

  Register RD2 = MRI.createVirtualRegister(&LoongArch::GPRRegClass);

  BuildMI(TrueBB, DL, TII->get(LoongArch::ADDI_W), RD2)

      .addReg(LoongArch::R0)

      .addImm(1);

  TrueBB->addSuccessor(SinkBB);


  // SinkBB: merge the results.

  BuildMI(*SinkBB, SinkBB->begin(), DL, TII->get(LoongArch::PHI),

          MI.getOperand(0).getReg())

      .addReg(RD1)

      .addMBB(FalseBB)

      .addReg(RD2)

      .addMBB(TrueBB);


  // The pseudo instruction is gone now.

  MI.eraseFromParent();

  return SinkBB;

}


static MachineBasicBlock *

emitPseudoXVINSGR2VR(MachineInstr &MI, MachineBasicBlock *BB,

                     const LoongArchSubtarget &Subtarget) {

  unsigned InsOp;

  unsigned HalfSize;

  switch (MI.getOpcode()) {

  default:

    llvm_unreachable("Unexpected opcode");

  case LoongArch::PseudoXVINSGR2VR_B:

    HalfSize = 16;

    InsOp = LoongArch::VINSGR2VR_B;

    break;

  case LoongArch::PseudoXVINSGR2VR_H:

    HalfSize = 8;

    InsOp = LoongArch::VINSGR2VR_H;

    break;

  }

  const TargetInstrInfo *TII = Subtarget.getInstrInfo();

  const TargetRegisterClass *RC = &LoongArch::LASX256RegClass;

  const TargetRegisterClass *SubRC = &LoongArch::LSX128RegClass;

  DebugLoc DL = MI.getDebugLoc();

  MachineRegisterInfo &MRI = BB->getParent()->getRegInfo();

  // XDst = vector_insert XSrc, Elt, Idx

  Register XDst = MI.getOperand(0).getReg();

  Register XSrc = MI.getOperand(1).getReg();

  Register Elt = MI.getOperand(2).getReg();

  unsigned Idx = MI.getOperand(3).getImm();


  Register ScratchReg1 = XSrc;

  if (Idx >= HalfSize) {

    ScratchReg1 = MRI.createVirtualRegister(RC);

    BuildMI(*BB, MI, DL, TII->get(LoongArch::XVPERMI_Q), ScratchReg1)

        .addReg(XSrc)

        .addReg(XSrc)

        .addImm(1);

  }


  Register ScratchSubReg1 = MRI.createVirtualRegister(SubRC);

  Register ScratchSubReg2 = MRI.createVirtualRegister(SubRC);

  BuildMI(*BB, MI, DL, TII->get(LoongArch::COPY), ScratchSubReg1)

      .addReg(ScratchReg1, 0, LoongArch::sub_128);

  BuildMI(*BB, MI, DL, TII->get(InsOp), ScratchSubReg2)

      .addReg(ScratchSubReg1)

      .addReg(Elt)

      .addImm(Idx >= HalfSize ? Idx - HalfSize : Idx);


  Register ScratchReg2 = XDst;

  if (Idx >= HalfSize)

    ScratchReg2 = MRI.createVirtualRegister(RC);


  BuildMI(*BB, MI, DL, TII->get(LoongArch::SUBREG_TO_REG), ScratchReg2)

      .addImm(0)

      .addReg(ScratchSubReg2)

      .addImm(LoongArch::sub_128);


  if (Idx >= HalfSize)

    BuildMI(*BB, MI, DL, TII->get(LoongArch::XVPERMI_Q), XDst)

        .addReg(XSrc)

        .addReg(ScratchReg2)

        .addImm(2);


  MI.eraseFromParent();

  return BB;

}


static MachineBasicBlock *emitPseudoCTPOP(MachineInstr &MI,

                                          MachineBasicBlock *BB,

                                          const LoongArchSubtarget &Subtarget) {

  assert(Subtarget.hasExtLSX());

  const TargetInstrInfo *TII = Subtarget.getInstrInfo();

  const TargetRegisterClass *RC = &LoongArch::LSX128RegClass;

  DebugLoc DL = MI.getDebugLoc();

  MachineRegisterInfo &MRI = BB->getParent()->getRegInfo();

  Register Dst = MI.getOperand(0).getReg();

  Register Src = MI.getOperand(1).getReg();

  Register ScratchReg1 = MRI.createVirtualRegister(RC);

  Register ScratchReg2 = MRI.createVirtualRegister(RC);

  Register ScratchReg3 = MRI.createVirtualRegister(RC);


  BuildMI(*BB, MI, DL, TII->get(LoongArch::VLDI), ScratchReg1).addImm(0);

  BuildMI(*BB, MI, DL,

          TII->get(Subtarget.is64Bit() ? LoongArch::VINSGR2VR_D

                                       : LoongArch::VINSGR2VR_W),

          ScratchReg2)

      .addReg(ScratchReg1)

      .addReg(Src)

      .addImm(0);

  BuildMI(

      *BB, MI, DL,

      TII->get(Subtarget.is64Bit() ? LoongArch::VPCNT_D : LoongArch::VPCNT_W),

      ScratchReg3)

      .addReg(ScratchReg2);

  BuildMI(*BB, MI, DL,

          TII->get(Subtarget.is64Bit() ? LoongArch::VPICKVE2GR_D

                                       : LoongArch::VPICKVE2GR_W),

          Dst)

      .addReg(ScratchReg3)

      .addImm(0);


  MI.eraseFromParent();

  return BB;

}


MachineBasicBlock *LoongArchTargetLowering::EmitInstrWithCustomInserter(

    MachineInstr &MI, MachineBasicBlock *BB) const {

  const TargetInstrInfo *TII = Subtarget.getInstrInfo();

  DebugLoc DL = MI.getDebugLoc();


  switch (MI.getOpcode()) {

  default:

    llvm_unreachable("Unexpected instr type to insert");

  case LoongArch::DIV_W:

  case LoongArch::DIV_WU:

  case LoongArch::MOD_W:

  case LoongArch::MOD_WU:

  case LoongArch::DIV_D:

  case LoongArch::DIV_DU:

  case LoongArch::MOD_D:

  case LoongArch::MOD_DU:

    return insertDivByZeroTrap(MI, BB);

    break;

  case LoongArch::WRFCSR: {

    BuildMI(*BB, MI, DL, TII->get(LoongArch::MOVGR2FCSR),

            LoongArch::FCSR0 + MI.getOperand(0).getImm())

        .addReg(MI.getOperand(1).getReg());

    MI.eraseFromParent();

    return BB;

  }

  case LoongArch::RDFCSR: {

    MachineInstr *ReadFCSR =

        BuildMI(*BB, MI, DL, TII->get(LoongArch::MOVFCSR2GR),

                MI.getOperand(0).getReg())

            .addReg(LoongArch::FCSR0 + MI.getOperand(1).getImm());

    ReadFCSR->getOperand(1).setIsUndef();

    MI.eraseFromParent();

    return BB;

  }

  case LoongArch::PseudoVBZ:

  case LoongArch::PseudoVBZ_B:

  case LoongArch::PseudoVBZ_H:

  case LoongArch::PseudoVBZ_W:

  case LoongArch::PseudoVBZ_D:

  case LoongArch::PseudoVBNZ:

  case LoongArch::PseudoVBNZ_B:

  case LoongArch::PseudoVBNZ_H:

  case LoongArch::PseudoVBNZ_W:

  case LoongArch::PseudoVBNZ_D:

  case LoongArch::PseudoXVBZ:

  case LoongArch::PseudoXVBZ_B:

  case LoongArch::PseudoXVBZ_H:

  case LoongArch::PseudoXVBZ_W:

  case LoongArch::PseudoXVBZ_D:

  case LoongArch::PseudoXVBNZ:

  case LoongArch::PseudoXVBNZ_B:

  case LoongArch::PseudoXVBNZ_H:

  case LoongArch::PseudoXVBNZ_W:

  case LoongArch::PseudoXVBNZ_D:

    return emitVecCondBranchPseudo(MI, BB, Subtarget);

  case LoongArch::PseudoXVINSGR2VR_B:

  case LoongArch::PseudoXVINSGR2VR_H:

    return emitPseudoXVINSGR2VR(MI, BB, Subtarget);

  case LoongArch::PseudoCTPOP:

    return emitPseudoCTPOP(MI, BB, Subtarget);

  case TargetOpcode::STATEPOINT:

    // STATEPOINT is a pseudo instruction which has no implicit defs/uses

    // while bl call instruction (where statepoint will be lowered at the

    // end) has implicit def. This def is early-clobber as it will be set at

    // the moment of the call and earlier than any use is read.

    // Add this implicit dead def here as a workaround.

    MI.addOperand(*MI.getMF(),

                  MachineOperand::CreateReg(

                      LoongArch::R1, /*isDef*/ true,

                      /*isImp*/ true, /*isKill*/ false, /*isDead*/ true,

                      /*isUndef*/ false, /*isEarlyClobber*/ true));

    if (!Subtarget.is64Bit())

      report_fatal_error("STATEPOINT is only supported on 64-bit targets");

    return emitPatchPoint(MI, BB);

  }

}


bool LoongArchTargetLowering::allowsMisalignedMemoryAccesses(

    EVT VT, unsigned AddrSpace, Align Alignment, MachineMemOperand::Flags Flags,

    unsigned *Fast) const {

  if (!Subtarget.hasUAL())

    return false;


  // TODO: set reasonable speed number.

  if (Fast)

    *Fast = 1;

  return true;

}


const char *LoongArchTargetLowering::getTargetNodeName(unsigned Opcode) const {

  switch ((LoongArchISD::NodeType)Opcode) {

  case LoongArchISD::FIRST_NUMBER:

    break;


#define NODE_NAME_CASE(node)                                                   \

  case LoongArchISD::node:                                                     \

    return "LoongArchISD::" #node;


    // TODO: Add more target-dependent nodes later.

    NODE_NAME_CASE(CALL)

    NODE_NAME_CASE(CALL_MEDIUM)

    NODE_NAME_CASE(CALL_LARGE)

    NODE_NAME_CASE(RET)

    NODE_NAME_CASE(TAIL)

    NODE_NAME_CASE(TAIL_MEDIUM)

    NODE_NAME_CASE(TAIL_LARGE)

    NODE_NAME_CASE(SLL_W)

    NODE_NAME_CASE(SRA_W)

    NODE_NAME_CASE(SRL_W)

    NODE_NAME_CASE(BSTRINS)

    NODE_NAME_CASE(BSTRPICK)

    NODE_NAME_CASE(MOVGR2FR_W_LA64)

    NODE_NAME_CASE(MOVFR2GR_S_LA64)

    NODE_NAME_CASE(FTINT)

    NODE_NAME_CASE(REVB_2H)

    NODE_NAME_CASE(REVB_2W)

    NODE_NAME_CASE(BITREV_4B)

    NODE_NAME_CASE(BITREV_8B)

    NODE_NAME_CASE(BITREV_W)

    NODE_NAME_CASE(ROTR_W)

    NODE_NAME_CASE(ROTL_W)

    NODE_NAME_CASE(DIV_W)

    NODE_NAME_CASE(DIV_WU)

    NODE_NAME_CASE(MOD_W)

    NODE_NAME_CASE(MOD_WU)

    NODE_NAME_CASE(CLZ_W)

    NODE_NAME_CASE(CTZ_W)

    NODE_NAME_CASE(DBAR)

    NODE_NAME_CASE(IBAR)

    NODE_NAME_CASE(BREAK)

    NODE_NAME_CASE(SYSCALL)

    NODE_NAME_CASE(CRC_W_B_W)

    NODE_NAME_CASE(CRC_W_H_W)

    NODE_NAME_CASE(CRC_W_W_W)

    NODE_NAME_CASE(CRC_W_D_W)

    NODE_NAME_CASE(CRCC_W_B_W)

    NODE_NAME_CASE(CRCC_W_H_W)

    NODE_NAME_CASE(CRCC_W_W_W)

    NODE_NAME_CASE(CRCC_W_D_W)

    NODE_NAME_CASE(CSRRD)

    NODE_NAME_CASE(CSRWR)

    NODE_NAME_CASE(CSRXCHG)

    NODE_NAME_CASE(IOCSRRD_B)

    NODE_NAME_CASE(IOCSRRD_H)

    NODE_NAME_CASE(IOCSRRD_W)

    NODE_NAME_CASE(IOCSRRD_D)

    NODE_NAME_CASE(IOCSRWR_B)

    NODE_NAME_CASE(IOCSRWR_H)

    NODE_NAME_CASE(IOCSRWR_W)

    NODE_NAME_CASE(IOCSRWR_D)

    NODE_NAME_CASE(CPUCFG)

    NODE_NAME_CASE(MOVGR2FCSR)

    NODE_NAME_CASE(MOVFCSR2GR)

    NODE_NAME_CASE(CACOP_D)

    NODE_NAME_CASE(CACOP_W)

    NODE_NAME_CASE(VSHUF)

    NODE_NAME_CASE(VPICKEV)

    NODE_NAME_CASE(VPICKOD)

    NODE_NAME_CASE(VPACKEV)

    NODE_NAME_CASE(VPACKOD)

    NODE_NAME_CASE(VILVL)

    NODE_NAME_CASE(VILVH)

    NODE_NAME_CASE(VSHUF4I)

    NODE_NAME_CASE(VREPLVEI)

    NODE_NAME_CASE(VREPLGR2VR)

    NODE_NAME_CASE(XVPERMI)

    NODE_NAME_CASE(VPICK_SEXT_ELT)

    NODE_NAME_CASE(VPICK_ZEXT_ELT)

    NODE_NAME_CASE(VREPLVE)

    NODE_NAME_CASE(VALL_ZERO)

    NODE_NAME_CASE(VANY_ZERO)

    NODE_NAME_CASE(VALL_NONZERO)

    NODE_NAME_CASE(VANY_NONZERO)

    NODE_NAME_CASE(FRECIPE)

    NODE_NAME_CASE(FRSQRTE)

  }

#undef NODE_NAME_CASE

  return nullptr;

}


//===----------------------------------------------------------------------===//

//                     Calling Convention Implementation

//===----------------------------------------------------------------------===//


// Eight general-purpose registers a0-a7 used for passing integer arguments,

// with a0-a1 reused to return values. Generally, the GPRs are used to pass

// fixed-point arguments, and floating-point arguments when no FPR is available

// or with soft float ABI.

const MCPhysReg ArgGPRs[] = {LoongArch::R4,  LoongArch::R5, LoongArch::R6,

                             LoongArch::R7,  LoongArch::R8, LoongArch::R9,

                             LoongArch::R10, LoongArch::R11};

// Eight floating-point registers fa0-fa7 used for passing floating-point

// arguments, and fa0-fa1 are also used to return values.

const MCPhysReg ArgFPR32s[] = {LoongArch::F0, LoongArch::F1, LoongArch::F2,

                               LoongArch::F3, LoongArch::F4, LoongArch::F5,

                               LoongArch::F6, LoongArch::F7};

// FPR32 and FPR64 alias each other.

const MCPhysReg ArgFPR64s[] = {

    LoongArch::F0_64, LoongArch::F1_64, LoongArch::F2_64, LoongArch::F3_64,

    LoongArch::F4_64, LoongArch::F5_64, LoongArch::F6_64, LoongArch::F7_64};


const MCPhysReg ArgVRs[] = {LoongArch::VR0, LoongArch::VR1, LoongArch::VR2,

                            LoongArch::VR3, LoongArch::VR4, LoongArch::VR5,

                            LoongArch::VR6, LoongArch::VR7};


const MCPhysReg ArgXRs[] = {LoongArch::XR0, LoongArch::XR1, LoongArch::XR2,

                            LoongArch::XR3, LoongArch::XR4, LoongArch::XR5,

                            LoongArch::XR6, LoongArch::XR7};


// Pass a 2*GRLen argument that has been split into two GRLen values through

// registers or the stack as necessary.

static bool CC_LoongArchAssign2GRLen(unsigned GRLen, CCState &State,

                                     CCValAssign VA1, ISD::ArgFlagsTy ArgFlags1,

                                     unsigned ValNo2, MVT ValVT2, MVT LocVT2,

                                     ISD::ArgFlagsTy ArgFlags2) {

  unsigned GRLenInBytes = GRLen / 8;

  if (Register Reg = State.AllocateReg(ArgGPRs)) {

    // At least one half can be passed via register.

    State.addLoc(CCValAssign::getReg(VA1.getValNo(), VA1.getValVT(), Reg,

                                     VA1.getLocVT(), CCValAssign::Full));

  } else {

    // Both halves must be passed on the stack, with proper alignment.

    Align StackAlign =

        std::max(Align(GRLenInBytes), ArgFlags1.getNonZeroOrigAlign());

    State.addLoc(

        CCValAssign::getMem(VA1.getValNo(), VA1.getValVT(),

                            State.AllocateStack(GRLenInBytes, StackAlign),

                            VA1.getLocVT(), CCValAssign::Full));

    State.addLoc(CCValAssign::getMem(

        ValNo2, ValVT2, State.AllocateStack(GRLenInBytes, Align(GRLenInBytes)),

        LocVT2, CCValAssign::Full));

    return false;

  }

  if (Register Reg = State.AllocateReg(ArgGPRs)) {

    // The second half can also be passed via register.

    State.addLoc(

        CCValAssign::getReg(ValNo2, ValVT2, Reg, LocVT2, CCValAssign::Full));

  } else {

    // The second half is passed via the stack, without additional alignment.

    State.addLoc(CCValAssign::getMem(

        ValNo2, ValVT2, State.AllocateStack(GRLenInBytes, Align(GRLenInBytes)),

        LocVT2, CCValAssign::Full));

  }

  return false;

}


// Implements the LoongArch calling convention. Returns true upon failure.

static bool CC_LoongArch(const DataLayout &DL, LoongArchABI::ABI ABI,

                         unsigned ValNo, MVT ValVT,

                         CCValAssign::LocInfo LocInfo, ISD::ArgFlagsTy ArgFlags,

                         CCState &State, bool IsFixed, bool IsRet,

                         Type *OrigTy) {

  unsigned GRLen = DL.getLargestLegalIntTypeSizeInBits();

  assert((GRLen == 32 || GRLen == 64) && "Unspport GRLen");

  MVT GRLenVT = GRLen == 32 ? MVT::i32 : MVT::i64;

  MVT LocVT = ValVT;


  // Any return value split into more than two values can't be returned

  // directly.

  if (IsRet && ValNo > 1)

    return true;


  // If passing a variadic argument, or if no FPR is available.

  bool UseGPRForFloat = true;


  switch (ABI) {

  default:

    llvm_unreachable("Unexpected ABI");

    break;

  case LoongArchABI::ABI_ILP32F:

  case LoongArchABI::ABI_LP64F:

  case LoongArchABI::ABI_ILP32D:

  case LoongArchABI::ABI_LP64D:

    UseGPRForFloat = !IsFixed;

    break;

  case LoongArchABI::ABI_ILP32S:

  case LoongArchABI::ABI_LP64S:

    break;

  }


  // FPR32 and FPR64 alias each other.

  if (State.getFirstUnallocated(ArgFPR32s) == std::size(ArgFPR32s))

    UseGPRForFloat = true;


  if (UseGPRForFloat && ValVT == MVT::f32) {

    LocVT = GRLenVT;

    LocInfo = CCValAssign::BCvt;

  } else if (UseGPRForFloat && GRLen == 64 && ValVT == MVT::f64) {

    LocVT = MVT::i64;

    LocInfo = CCValAssign::BCvt;

  } else if (UseGPRForFloat && GRLen == 32 && ValVT == MVT::f64) {

    // TODO: Handle passing f64 on LA32 with D feature.

    report_fatal_error("Passing f64 with GPR on LA32 is undefined");

  }


  // If this is a variadic argument, the LoongArch calling convention requires

  // that it is assigned an 'even' or 'aligned' register if it has (2*GRLen)/8

  // byte alignment. An aligned register should be used regardless of whether

  // the original argument was split during legalisation or not. The argument

  // will not be passed by registers if the original type is larger than

  // 2*GRLen, so the register alignment rule does not apply.

  unsigned TwoGRLenInBytes = (2 * GRLen) / 8;

  if (!IsFixed && ArgFlags.getNonZeroOrigAlign() == TwoGRLenInBytes &&

      DL.getTypeAllocSize(OrigTy) == TwoGRLenInBytes) {

    unsigned RegIdx = State.getFirstUnallocated(ArgGPRs);

    // Skip 'odd' register if necessary.

    if (RegIdx != std::size(ArgGPRs) && RegIdx % 2 == 1)

      State.AllocateReg(ArgGPRs);

  }


  SmallVectorImpl<CCValAssign> &PendingLocs = State.getPendingLocs();

  SmallVectorImpl<ISD::ArgFlagsTy> &PendingArgFlags =

      State.getPendingArgFlags();


  assert(PendingLocs.size() == PendingArgFlags.size() &&

         "PendingLocs and PendingArgFlags out of sync");


  // Split arguments might be passed indirectly, so keep track of the pending

  // values.

  if (ValVT.isScalarInteger() && (ArgFlags.isSplit() || !PendingLocs.empty())) {

    LocVT = GRLenVT;

    LocInfo = CCValAssign::Indirect;

    PendingLocs.push_back(

        CCValAssign::getPending(ValNo, ValVT, LocVT, LocInfo));

    PendingArgFlags.push_back(ArgFlags);

    if (!ArgFlags.isSplitEnd()) {

      return false;

    }

  }


  // If the split argument only had two elements, it should be passed directly

  // in registers or on the stack.

  if (ValVT.isScalarInteger() && ArgFlags.isSplitEnd() &&

      PendingLocs.size() <= 2) {

    assert(PendingLocs.size() == 2 && "Unexpected PendingLocs.size()");

    // Apply the normal calling convention rules to the first half of the

    // split argument.

    CCValAssign VA = PendingLocs[0];

    ISD::ArgFlagsTy AF = PendingArgFlags[0];

    PendingLocs.clear();

    PendingArgFlags.clear();

    return CC_LoongArchAssign2GRLen(GRLen, State, VA, AF, ValNo, ValVT, LocVT,

                                    ArgFlags);

  }


  // Allocate to a register if possible, or else a stack slot.

  Register Reg;

  unsigned StoreSizeBytes = GRLen / 8;

  Align StackAlign = Align(GRLen / 8);


  if (ValVT == MVT::f32 && !UseGPRForFloat)

    Reg = State.AllocateReg(ArgFPR32s);

  else if (ValVT == MVT::f64 && !UseGPRForFloat)

    Reg = State.AllocateReg(ArgFPR64s);

  else if (ValVT.is128BitVector())

    Reg = State.AllocateReg(ArgVRs);

  else if (ValVT.is256BitVector())

    Reg = State.AllocateReg(ArgXRs);

  else

    Reg = State.AllocateReg(ArgGPRs);


  unsigned StackOffset =

      Reg ? 0 : State.AllocateStack(StoreSizeBytes, StackAlign);


  // If we reach this point and PendingLocs is non-empty, we must be at the

  // end of a split argument that must be passed indirectly.

  if (!PendingLocs.empty()) {

    assert(ArgFlags.isSplitEnd() && "Expected ArgFlags.isSplitEnd()");

    assert(PendingLocs.size() > 2 && "Unexpected PendingLocs.size()");

    for (auto &It : PendingLocs) {

      if (Reg)

        It.convertToReg(Reg);

      else

        It.convertToMem(StackOffset);

      State.addLoc(It);

    }

    PendingLocs.clear();

    PendingArgFlags.clear();

    return false;

  }

  assert((!UseGPRForFloat || LocVT == GRLenVT) &&

         "Expected an GRLenVT at this stage");


  if (Reg) {

    State.addLoc(CCValAssign::getReg(ValNo, ValVT, Reg, LocVT, LocInfo));

    return false;

  }


  // When a floating-point value is passed on the stack, no bit-cast is needed.

  if (ValVT.isFloatingPoint()) {

    LocVT = ValVT;

    LocInfo = CCValAssign::Full;

  }


  State.addLoc(CCValAssign::getMem(ValNo, ValVT, StackOffset, LocVT, LocInfo));

  return false;

}


void LoongArchTargetLowering::analyzeInputArgs(

    MachineFunction &MF, CCState &CCInfo,

    const SmallVectorImpl<ISD::InputArg> &Ins, bool IsRet,

    LoongArchCCAssignFn Fn) const {

  FunctionType *FType = MF.getFunction().getFunctionType();

  for (unsigned i = 0, e = Ins.size(); i != e; ++i) {

    MVT ArgVT = Ins[i].VT;

    Type *ArgTy = nullptr;

    if (IsRet)

      ArgTy = FType->getReturnType();

    else if (Ins[i].isOrigArg())

      ArgTy = FType->getParamType(Ins[i].getOrigArgIndex());

    LoongArchABI::ABI ABI =

        MF.getSubtarget<LoongArchSubtarget>().getTargetABI();

    if (Fn(MF.getDataLayout(), ABI, i, ArgVT, CCValAssign::Full, Ins[i].Flags,

           CCInfo, /*IsFixed=*/true, IsRet, ArgTy)) {

      LLVM_DEBUG(dbgs() << "InputArg #" << i << " has unhandled type " << ArgVT

                        << '\n');

      llvm_unreachable("");

    }

  }

}


void LoongArchTargetLowering::analyzeOutputArgs(

    MachineFunction &MF, CCState &CCInfo,

    const SmallVectorImpl<ISD::OutputArg> &Outs, bool IsRet,

    CallLoweringInfo *CLI, LoongArchCCAssignFn Fn) const {

  for (unsigned i = 0, e = Outs.size(); i != e; ++i) {

    MVT ArgVT = Outs[i].VT;

    Type *OrigTy = CLI ? CLI->getArgs()[Outs[i].OrigArgIndex].Ty : nullptr;

    LoongArchABI::ABI ABI =

        MF.getSubtarget<LoongArchSubtarget>().getTargetABI();

    if (Fn(MF.getDataLayout(), ABI, i, ArgVT, CCValAssign::Full, Outs[i].Flags,

           CCInfo, Outs[i].IsFixed, IsRet, OrigTy)) {

      LLVM_DEBUG(dbgs() << "OutputArg #" << i << " has unhandled type " << ArgVT

                        << "\n");

      llvm_unreachable("");

    }

  }

}


// Convert Val to a ValVT. Should not be called for CCValAssign::Indirect

// values.

static SDValue convertLocVTToValVT(SelectionDAG &DAG, SDValue Val,

                                   const CCValAssign &VA, const SDLoc &DL) {

  switch (VA.getLocInfo()) {

  default:

    llvm_unreachable("Unexpected CCValAssign::LocInfo");

  case CCValAssign::Full:

  case CCValAssign::Indirect:

    break;

  case CCValAssign::BCvt:

    if (VA.getLocVT() == MVT::i64 && VA.getValVT() == MVT::f32)

      Val = DAG.getNode(LoongArchISD::MOVGR2FR_W_LA64, DL, MVT::f32, Val);

    else

      Val = DAG.getNode(ISD::BITCAST, DL, VA.getValVT(), Val);

    break;

  }

  return Val;

}


static SDValue unpackFromRegLoc(SelectionDAG &DAG, SDValue Chain,

                                const CCValAssign &VA, const SDLoc &DL,

                                const ISD::InputArg &In,

                                const LoongArchTargetLowering &TLI) {

  MachineFunction &MF = DAG.getMachineFunction();

  MachineRegisterInfo &RegInfo = MF.getRegInfo();

  EVT LocVT = VA.getLocVT();

  SDValue Val;

  const TargetRegisterClass *RC = TLI.getRegClassFor(LocVT.getSimpleVT());

  Register VReg = RegInfo.createVirtualRegister(RC);

  RegInfo.addLiveIn(VA.getLocReg(), VReg);

  Val = DAG.getCopyFromReg(Chain, DL, VReg, LocVT);


  // If input is sign extended from 32 bits, note it for the OptW pass.

  if (In.isOrigArg()) {

    Argument *OrigArg = MF.getFunction().getArg(In.getOrigArgIndex());

    if (OrigArg->getType()->isIntegerTy()) {

      unsigned BitWidth = OrigArg->getType()->getIntegerBitWidth();

      // An input zero extended from i31 can also be considered sign extended.

      if ((BitWidth <= 32 && In.Flags.isSExt()) ||

          (BitWidth < 32 && In.Flags.isZExt())) {

        LoongArchMachineFunctionInfo *LAFI =

            MF.getInfo<LoongArchMachineFunctionInfo>();

        LAFI->addSExt32Register(VReg);

      }

    }

  }


  return convertLocVTToValVT(DAG, Val, VA, DL);

}


// The caller is responsible for loading the full value if the argument is

// passed with CCValAssign::Indirect.

static SDValue unpackFromMemLoc(SelectionDAG &DAG, SDValue Chain,

                                const CCValAssign &VA, const SDLoc &DL) {

  MachineFunction &MF = DAG.getMachineFunction();

  MachineFrameInfo &MFI = MF.getFrameInfo();

  EVT ValVT = VA.getValVT();

  int FI = MFI.CreateFixedObject(ValVT.getStoreSize(), VA.getLocMemOffset(),

                                 /*IsImmutable=*/true);

  SDValue FIN = DAG.getFrameIndex(

      FI, MVT::getIntegerVT(DAG.getDataLayout().getPointerSizeInBits(0)));


  ISD::LoadExtType ExtType;

  switch (VA.getLocInfo()) {

  default:

    llvm_unreachable("Unexpected CCValAssign::LocInfo");

  case CCValAssign::Full:

  case CCValAssign::Indirect:

  case CCValAssign::BCvt:

    ExtType = ISD::NON_EXTLOAD;

    break;

  }

  return DAG.getExtLoad(

      ExtType, DL, VA.getLocVT(), Chain, FIN,

      MachinePointerInfo::getFixedStack(DAG.getMachineFunction(), FI), ValVT);

}


static SDValue convertValVTToLocVT(SelectionDAG &DAG, SDValue Val,

                                   const CCValAssign &VA, const SDLoc &DL) {

  EVT LocVT = VA.getLocVT();


  switch (VA.getLocInfo()) {

  default:

    llvm_unreachable("Unexpected CCValAssign::LocInfo");

  case CCValAssign::Full:

    break;

  case CCValAssign::BCvt:

    if (VA.getLocVT() == MVT::i64 && VA.getValVT() == MVT::f32)

      Val = DAG.getNode(LoongArchISD::MOVFR2GR_S_LA64, DL, MVT::i64, Val);

    else

      Val = DAG.getNode(ISD::BITCAST, DL, LocVT, Val);

    break;

  }

  return Val;

}


static bool CC_LoongArch_GHC(unsigned ValNo, MVT ValVT, MVT LocVT,

                             CCValAssign::LocInfo LocInfo,

                             ISD::ArgFlagsTy ArgFlags, CCState &State) {

  if (LocVT == MVT::i32 || LocVT == MVT::i64) {

    // Pass in STG registers: Base, Sp, Hp, R1, R2, R3, R4, R5, SpLim

    //                        s0    s1  s2  s3  s4  s5  s6  s7  s8

    static const MCPhysReg GPRList[] = {

        LoongArch::R23, LoongArch::R24, LoongArch::R25,

        LoongArch::R26, LoongArch::R27, LoongArch::R28,

        LoongArch::R29, LoongArch::R30, LoongArch::R31};

    if (MCRegister Reg = State.AllocateReg(GPRList)) {

      State.addLoc(CCValAssign::getReg(ValNo, ValVT, Reg, LocVT, LocInfo));

      return false;

    }

  }


  if (LocVT == MVT::f32) {

    // Pass in STG registers: F1, F2, F3, F4

    //                        fs0,fs1,fs2,fs3

    static const MCPhysReg FPR32List[] = {LoongArch::F24, LoongArch::F25,

                                          LoongArch::F26, LoongArch::F27};

    if (MCRegister Reg = State.AllocateReg(FPR32List)) {

      State.addLoc(CCValAssign::getReg(ValNo, ValVT, Reg, LocVT, LocInfo));

      return false;

    }

  }


  if (LocVT == MVT::f64) {

    // Pass in STG registers: D1, D2, D3, D4

    //                        fs4,fs5,fs6,fs7

    static const MCPhysReg FPR64List[] = {LoongArch::F28_64, LoongArch::F29_64,

                                          LoongArch::F30_64, LoongArch::F31_64};

    if (MCRegister Reg = State.AllocateReg(FPR64List)) {

      State.addLoc(CCValAssign::getReg(ValNo, ValVT, Reg, LocVT, LocInfo));

      return false;

    }

  }


  report_fatal_error("No registers left in GHC calling convention");

  return true;

}


// Transform physical registers into virtual registers.

SDValue LoongArchTargetLowering::LowerFormalArguments(

    SDValue Chain, CallingConv::ID CallConv, bool IsVarArg,

    const SmallVectorImpl<ISD::InputArg> &Ins, const SDLoc &DL,

    SelectionDAG &DAG, SmallVectorImpl<SDValue> &InVals) const {


  MachineFunction &MF = DAG.getMachineFunction();


  switch (CallConv) {

  default:

    llvm_unreachable("Unsupported calling convention");

  case CallingConv::C:

  case CallingConv::Fast:

    break;

  case CallingConv::GHC:

    if (!MF.getSubtarget().hasFeature(LoongArch::FeatureBasicF) ||

        !MF.getSubtarget().hasFeature(LoongArch::FeatureBasicD))

      report_fatal_error(

          "GHC calling convention requires the F and D extensions");

  }


  EVT PtrVT = getPointerTy(DAG.getDataLayout());

  MVT GRLenVT = Subtarget.getGRLenVT();

  unsigned GRLenInBytes = Subtarget.getGRLen() / 8;

  // Used with varargs to acumulate store chains.

  std::vector<SDValue> OutChains;


  // Assign locations to all of the incoming arguments.

  SmallVector<CCValAssign> ArgLocs;

  CCState CCInfo(CallConv, IsVarArg, MF, ArgLocs, *DAG.getContext());


  if (CallConv == CallingConv::GHC)

    CCInfo.AnalyzeFormalArguments(Ins, CC_LoongArch_GHC);

  else

    analyzeInputArgs(MF, CCInfo, Ins, /*IsRet=*/false, CC_LoongArch);


  for (unsigned i = 0, e = ArgLocs.size(); i != e; ++i) {

    CCValAssign &VA = ArgLocs[i];

    SDValue ArgValue;

    if (VA.isRegLoc())

      ArgValue = unpackFromRegLoc(DAG, Chain, VA, DL, Ins[i], *this);

    else

      ArgValue = unpackFromMemLoc(DAG, Chain, VA, DL);

    if (VA.getLocInfo() == CCValAssign::Indirect) {

      // If the original argument was split and passed by reference, we need to

      // load all parts of it here (using the same address).

      InVals.push_back(DAG.getLoad(VA.getValVT(), DL, Chain, ArgValue,

                                   MachinePointerInfo()));

      unsigned ArgIndex = Ins[i].OrigArgIndex;

      unsigned ArgPartOffset = Ins[i].PartOffset;

      assert(ArgPartOffset == 0);

      while (i + 1 != e && Ins[i + 1].OrigArgIndex == ArgIndex) {

        CCValAssign &PartVA = ArgLocs[i + 1];

        unsigned PartOffset = Ins[i + 1].PartOffset - ArgPartOffset;

        SDValue Offset = DAG.getIntPtrConstant(PartOffset, DL);

        SDValue Address = DAG.getNode(ISD::ADD, DL, PtrVT, ArgValue, Offset);

        InVals.push_back(DAG.getLoad(PartVA.getValVT(), DL, Chain, Address,

                                     MachinePointerInfo()));

        ++i;

      }

      continue;

    }

    InVals.push_back(ArgValue);

  }


  if (IsVarArg) {

    ArrayRef<MCPhysReg> ArgRegs = ArrayRef(ArgGPRs);

    unsigned Idx = CCInfo.getFirstUnallocated(ArgRegs);

    const TargetRegisterClass *RC = &LoongArch::GPRRegClass;

    MachineFrameInfo &MFI = MF.getFrameInfo();

    MachineRegisterInfo &RegInfo = MF.getRegInfo();

    auto *LoongArchFI = MF.getInfo<LoongArchMachineFunctionInfo>();


    // Offset of the first variable argument from stack pointer, and size of

    // the vararg save area. For now, the varargs save area is either zero or

    // large enough to hold a0-a7.

    int VaArgOffset, VarArgsSaveSize;


    // If all registers are allocated, then all varargs must be passed on the

    // stack and we don't need to save any argregs.

    if (ArgRegs.size() == Idx) {

      VaArgOffset = CCInfo.getStackSize();

      VarArgsSaveSize = 0;

    } else {

      VarArgsSaveSize = GRLenInBytes * (ArgRegs.size() - Idx);

      VaArgOffset = -VarArgsSaveSize;

    }


    // Record the frame index of the first variable argument

    // which is a value necessary to VASTART.

    int FI = MFI.CreateFixedObject(GRLenInBytes, VaArgOffset, true);

    LoongArchFI->setVarArgsFrameIndex(FI);


    // If saving an odd number of registers then create an extra stack slot to

    // ensure that the frame pointer is 2*GRLen-aligned, which in turn ensures

    // offsets to even-numbered registered remain 2*GRLen-aligned.

    if (Idx % 2) {

      MFI.CreateFixedObject(GRLenInBytes, VaArgOffset - (int)GRLenInBytes,

                            true);

      VarArgsSaveSize += GRLenInBytes;

    }


    // Copy the integer registers that may have been used for passing varargs

    // to the vararg save area.

    for (unsigned I = Idx; I < ArgRegs.size();

         ++I, VaArgOffset += GRLenInBytes) {

      const Register Reg = RegInfo.createVirtualRegister(RC);

      RegInfo.addLiveIn(ArgRegs[I], Reg);

      SDValue ArgValue = DAG.getCopyFromReg(Chain, DL, Reg, GRLenVT);

      FI = MFI.CreateFixedObject(GRLenInBytes, VaArgOffset, true);

      SDValue PtrOff = DAG.getFrameIndex(FI, getPointerTy(DAG.getDataLayout()));

      SDValue Store = DAG.getStore(Chain, DL, ArgValue, PtrOff,

                                   MachinePointerInfo::getFixedStack(MF, FI));

      cast<StoreSDNode>(Store.getNode())

          ->getMemOperand()

          ->setValue((Value *)nullptr);

      OutChains.push_back(Store);

    }

    LoongArchFI->setVarArgsSaveSize(VarArgsSaveSize);

  }


  // All stores are grouped in one node to allow the matching between

  // the size of Ins and InVals. This only happens for vararg functions.

  if (!OutChains.empty()) {

    OutChains.push_back(Chain);

    Chain = DAG.getNode(ISD::TokenFactor, DL, MVT::Other, OutChains);

  }


  return Chain;

}


bool LoongArchTargetLowering::mayBeEmittedAsTailCall(const CallInst *CI) const {

  return CI->isTailCall();

}


// Check if the return value is used as only a return value, as otherwise

// we can't perform a tail-call.

bool LoongArchTargetLowering::isUsedByReturnOnly(SDNode *N,

                                                 SDValue &Chain) const {

  if (N->getNumValues() != 1)

    return false;

  if (!N->hasNUsesOfValue(1, 0))

    return false;


  SDNode *Copy = *N->user_begin();

  if (Copy->getOpcode() != ISD::CopyToReg)

    return false;


  // If the ISD::CopyToReg has a glue operand, we conservatively assume it

  // isn't safe to perform a tail call.

  if (Copy->getGluedNode())

    return false;


  // The copy must be used by a LoongArchISD::RET, and nothing else.

  bool HasRet = false;

  for (SDNode *Node : Copy->users()) {

    if (Node->getOpcode() != LoongArchISD::RET)

      return false;

    HasRet = true;

  }


  if (!HasRet)

    return false;


  Chain = Copy->getOperand(0);

  return true;

}


// Check whether the call is eligible for tail call optimization.

bool LoongArchTargetLowering::isEligibleForTailCallOptimization(

    CCState &CCInfo, CallLoweringInfo &CLI, MachineFunction &MF,

    const SmallVectorImpl<CCValAssign> &ArgLocs) const {


  auto CalleeCC = CLI.CallConv;

  auto &Outs = CLI.Outs;

  auto &Caller = MF.getFunction();

  auto CallerCC = Caller.getCallingConv();


  // Do not tail call opt if the stack is used to pass parameters.

  if (CCInfo.getStackSize() != 0)

    return false;


  // Do not tail call opt if any parameters need to be passed indirectly.

  for (auto &VA : ArgLocs)

    if (VA.getLocInfo() == CCValAssign::Indirect)

      return false;


  // Do not tail call opt if either caller or callee uses struct return

  // semantics.

  auto IsCallerStructRet = Caller.hasStructRetAttr();

  auto IsCalleeStructRet = Outs.empty() ? false : Outs[0].Flags.isSRet();

  if (IsCallerStructRet || IsCalleeStructRet)

    return false;


  // Do not tail call opt if either the callee or caller has a byval argument.

  for (auto &Arg : Outs)

    if (Arg.Flags.isByVal())

      return false;


  // The callee has to preserve all registers the caller needs to preserve.

  const LoongArchRegisterInfo *TRI = Subtarget.getRegisterInfo();

  const uint32_t *CallerPreserved = TRI->getCallPreservedMask(MF, CallerCC);

  if (CalleeCC != CallerCC) {

    const uint32_t *CalleePreserved = TRI->getCallPreservedMask(MF, CalleeCC);

    if (!TRI->regmaskSubsetEqual(CallerPreserved, CalleePreserved))

      return false;

  }

  return true;

}


static Align getPrefTypeAlign(EVT VT, SelectionDAG &DAG) {

  return DAG.getDataLayout().getPrefTypeAlign(

      VT.getTypeForEVT(*DAG.getContext()));

}


// Lower a call to a callseq_start + CALL + callseq_end chain, and add input

// and output parameter nodes.

SDValue

LoongArchTargetLowering::LowerCall(CallLoweringInfo &CLI,

                                   SmallVectorImpl<SDValue> &InVals) const {

  SelectionDAG &DAG = CLI.DAG;

  SDLoc &DL = CLI.DL;

  SmallVectorImpl<ISD::OutputArg> &Outs = CLI.Outs;

  SmallVectorImpl<SDValue> &OutVals = CLI.OutVals;

  SmallVectorImpl<ISD::InputArg> &Ins = CLI.Ins;

  SDValue Chain = CLI.Chain;

  SDValue Callee = CLI.Callee;

  CallingConv::ID CallConv = CLI.CallConv;

  bool IsVarArg = CLI.IsVarArg;

  EVT PtrVT = getPointerTy(DAG.getDataLayout());

  MVT GRLenVT = Subtarget.getGRLenVT();

  bool &IsTailCall = CLI.IsTailCall;


  MachineFunction &MF = DAG.getMachineFunction();


  // Analyze the operands of the call, assigning locations to each operand.

  SmallVector<CCValAssign> ArgLocs;

  CCState ArgCCInfo(CallConv, IsVarArg, MF, ArgLocs, *DAG.getContext());


  if (CallConv == CallingConv::GHC)

    ArgCCInfo.AnalyzeCallOperands(Outs, CC_LoongArch_GHC);

  else

    analyzeOutputArgs(MF, ArgCCInfo, Outs, /*IsRet=*/false, &CLI, CC_LoongArch);


  // Check if it's really possible to do a tail call.

  if (IsTailCall)

    IsTailCall = isEligibleForTailCallOptimization(ArgCCInfo, CLI, MF, ArgLocs);


  if (IsTailCall)

    ++NumTailCalls;

  else if (CLI.CB && CLI.CB->isMustTailCall())

    report_fatal_error("failed to perform tail call elimination on a call "

                       "site marked musttail");


  // Get a count of how many bytes are to be pushed on the stack.

  unsigned NumBytes = ArgCCInfo.getStackSize();


  // Create local copies for byval args.

  SmallVector<SDValue> ByValArgs;

  for (unsigned i = 0, e = Outs.size(); i != e; ++i) {

    ISD::ArgFlagsTy Flags = Outs[i].Flags;

    if (!Flags.isByVal())

      continue;


    SDValue Arg = OutVals[i];

    unsigned Size = Flags.getByValSize();

    Align Alignment = Flags.getNonZeroByValAlign();


    int FI =

        MF.getFrameInfo().CreateStackObject(Size, Alignment, /*isSS=*/false);

    SDValue FIPtr = DAG.getFrameIndex(FI, getPointerTy(DAG.getDataLayout()));

    SDValue SizeNode = DAG.getConstant(Size, DL, GRLenVT);


    Chain = DAG.getMemcpy(Chain, DL, FIPtr, Arg, SizeNode, Alignment,

                          /*IsVolatile=*/false,

                          /*AlwaysInline=*/false, /*CI=*/nullptr, std::nullopt,

                          MachinePointerInfo(), MachinePointerInfo());

    ByValArgs.push_back(FIPtr);

  }


  if (!IsTailCall)

    Chain = DAG.getCALLSEQ_START(Chain, NumBytes, 0, CLI.DL);


  // Copy argument values to their designated locations.

  SmallVector<std::pair<Register, SDValue>> RegsToPass;

  SmallVector<SDValue> MemOpChains;

  SDValue StackPtr;

  for (unsigned i = 0, j = 0, e = ArgLocs.size(); i != e; ++i) {

    CCValAssign &VA = ArgLocs[i];

    SDValue ArgValue = OutVals[i];

    ISD::ArgFlagsTy Flags = Outs[i].Flags;


    // Promote the value if needed.

    // For now, only handle fully promoted and indirect arguments.

    if (VA.getLocInfo() == CCValAssign::Indirect) {

      // Store the argument in a stack slot and pass its address.

      Align StackAlign =

          std::max(getPrefTypeAlign(Outs[i].ArgVT, DAG),

                   getPrefTypeAlign(ArgValue.getValueType(), DAG));

      TypeSize StoredSize = ArgValue.getValueType().getStoreSize();

      // If the original argument was split and passed by reference, we need to

      // store the required parts of it here (and pass just one address).

      unsigned ArgIndex = Outs[i].OrigArgIndex;

      unsigned ArgPartOffset = Outs[i].PartOffset;

      assert(ArgPartOffset == 0);

      // Calculate the total size to store. We don't have access to what we're

      // actually storing other than performing the loop and collecting the

      // info.

      SmallVector<std::pair<SDValue, SDValue>> Parts;

      while (i + 1 != e && Outs[i + 1].OrigArgIndex == ArgIndex) {

        SDValue PartValue = OutVals[i + 1];

        unsigned PartOffset = Outs[i + 1].PartOffset - ArgPartOffset;

        SDValue Offset = DAG.getIntPtrConstant(PartOffset, DL);

        EVT PartVT = PartValue.getValueType();


        StoredSize += PartVT.getStoreSize();

        StackAlign = std::max(StackAlign, getPrefTypeAlign(PartVT, DAG));

        Parts.push_back(std::make_pair(PartValue, Offset));

        ++i;

      }

      SDValue SpillSlot = DAG.CreateStackTemporary(StoredSize, StackAlign);

      int FI = cast<FrameIndexSDNode>(SpillSlot)->getIndex();

      MemOpChains.push_back(

          DAG.getStore(Chain, DL, ArgValue, SpillSlot,

                       MachinePointerInfo::getFixedStack(MF, FI)));

      for (const auto &Part : Parts) {

        SDValue PartValue = Part.first;

        SDValue PartOffset = Part.second;

        SDValue Address =

            DAG.getNode(ISD::ADD, DL, PtrVT, SpillSlot, PartOffset);

        MemOpChains.push_back(

            DAG.getStore(Chain, DL, PartValue, Address,

                         MachinePointerInfo::getFixedStack(MF, FI)));

      }

      ArgValue = SpillSlot;

    } else {

      ArgValue = convertValVTToLocVT(DAG, ArgValue, VA, DL);

    }


    // Use local copy if it is a byval arg.

    if (Flags.isByVal())

      ArgValue = ByValArgs[j++];


    if (VA.isRegLoc()) {

      // Queue up the argument copies and emit them at the end.

      RegsToPass.push_back(std::make_pair(VA.getLocReg(), ArgValue));

    } else {

      assert(VA.isMemLoc() && "Argument not register or memory");

      assert(!IsTailCall && "Tail call not allowed if stack is used "

                            "for passing parameters");


      // Work out the address of the stack slot.

      if (!StackPtr.getNode())

        StackPtr = DAG.getCopyFromReg(Chain, DL, LoongArch::R3, PtrVT);

      SDValue Address =

          DAG.getNode(ISD::ADD, DL, PtrVT, StackPtr,

                      DAG.getIntPtrConstant(VA.getLocMemOffset(), DL));


      // Emit the store.

      MemOpChains.push_back(

          DAG.getStore(Chain, DL, ArgValue, Address, MachinePointerInfo()));

    }

  }


  // Join the stores, which are independent of one another.

  if (!MemOpChains.empty())

    Chain = DAG.getNode(ISD::TokenFactor, DL, MVT::Other, MemOpChains);


  SDValue Glue;


  // Build a sequence of copy-to-reg nodes, chained and glued together.

  for (auto &Reg : RegsToPass) {

    Chain = DAG.getCopyToReg(Chain, DL, Reg.first, Reg.second, Glue);

    Glue = Chain.getValue(1);

  }


  // If the callee is a GlobalAddress/ExternalSymbol node, turn it into a

  // TargetGlobalAddress/TargetExternalSymbol node so that legalize won't

  // split it and then direct call can be matched by PseudoCALL.

  if (GlobalAddressSDNode *S = dyn_cast<GlobalAddressSDNode>(Callee)) {

    const GlobalValue *GV = S->getGlobal();

    unsigned OpFlags = getTargetMachine().shouldAssumeDSOLocal(GV)

                           ? LoongArchII::MO_CALL

                           : LoongArchII::MO_CALL_PLT;

    Callee = DAG.getTargetGlobalAddress(S->getGlobal(), DL, PtrVT, 0, OpFlags);

  } else if (ExternalSymbolSDNode *S = dyn_cast<ExternalSymbolSDNode>(Callee)) {

    unsigned OpFlags = getTargetMachine().shouldAssumeDSOLocal(nullptr)

                           ? LoongArchII::MO_CALL

                           : LoongArchII::MO_CALL_PLT;

    Callee = DAG.getTargetExternalSymbol(S->getSymbol(), PtrVT, OpFlags);

  }


  // The first call operand is the chain and the second is the target address.

  SmallVector<SDValue> Ops;

  Ops.push_back(Chain);

  Ops.push_back(Callee);


  // Add argument registers to the end of the list so that they are

  // known live into the call.

  for (auto &Reg : RegsToPass)

    Ops.push_back(DAG.getRegister(Reg.first, Reg.second.getValueType()));


  if (!IsTailCall) {

    // Add a register mask operand representing the call-preserved registers.

    const TargetRegisterInfo *TRI = Subtarget.getRegisterInfo();

    const uint32_t *Mask = TRI->getCallPreservedMask(MF, CallConv);

    assert(Mask && "Missing call preserved mask for calling convention");

    Ops.push_back(DAG.getRegisterMask(Mask));

  }


  // Glue the call to the argument copies, if any.

  if (Glue.getNode())

    Ops.push_back(Glue);


  // Emit the call.

  SDVTList NodeTys = DAG.getVTList(MVT::Other, MVT::Glue);

  unsigned Op;

  switch (DAG.getTarget().getCodeModel()) {

  default:

    report_fatal_error("Unsupported code model");

  case CodeModel::Small:

    Op = IsTailCall ? LoongArchISD::TAIL : LoongArchISD::CALL;

    break;

  case CodeModel::Medium:

    assert(Subtarget.is64Bit() && "Medium code model requires LA64");

    Op = IsTailCall ? LoongArchISD::TAIL_MEDIUM : LoongArchISD::CALL_MEDIUM;

    break;

  case CodeModel::Large:

    assert(Subtarget.is64Bit() && "Large code model requires LA64");

    Op = IsTailCall ? LoongArchISD::TAIL_LARGE : LoongArchISD::CALL_LARGE;

    break;

  }


  if (IsTailCall) {

    MF.getFrameInfo().setHasTailCall();

    SDValue Ret = DAG.getNode(Op, DL, NodeTys, Ops);

    DAG.addNoMergeSiteInfo(Ret.getNode(), CLI.NoMerge);

    return Ret;

  }


  Chain = DAG.getNode(Op, DL, NodeTys, Ops);

  DAG.addNoMergeSiteInfo(Chain.getNode(), CLI.NoMerge);

  Glue = Chain.getValue(1);


  // Mark the end of the call, which is glued to the call itself.

  Chain = DAG.getCALLSEQ_END(Chain, NumBytes, 0, Glue, DL);

  Glue = Chain.getValue(1);


  // Assign locations to each value returned by this call.

  SmallVector<CCValAssign> RVLocs;

  CCState RetCCInfo(CallConv, IsVarArg, MF, RVLocs, *DAG.getContext());

  analyzeInputArgs(MF, RetCCInfo, Ins, /*IsRet=*/true, CC_LoongArch);


  // Copy all of the result registers out of their specified physreg.

  for (auto &VA : RVLocs) {

    // Copy the value out.

    SDValue RetValue =

        DAG.getCopyFromReg(Chain, DL, VA.getLocReg(), VA.getLocVT(), Glue);

    // Glue the RetValue to the end of the call sequence.

    Chain = RetValue.getValue(1);

    Glue = RetValue.getValue(2);


    RetValue = convertLocVTToValVT(DAG, RetValue, VA, DL);


    InVals.push_back(RetValue);

  }


  return Chain;

}


bool LoongArchTargetLowering::CanLowerReturn(

    CallingConv::ID CallConv, MachineFunction &MF, bool IsVarArg,

    const SmallVectorImpl<ISD::OutputArg> &Outs, LLVMContext &Context,

    const Type *RetTy) const {

  SmallVector<CCValAssign> RVLocs;

  CCState CCInfo(CallConv, IsVarArg, MF, RVLocs, Context);


  for (unsigned i = 0, e = Outs.size(); i != e; ++i) {

    LoongArchABI::ABI ABI =

        MF.getSubtarget<LoongArchSubtarget>().getTargetABI();

    if (CC_LoongArch(MF.getDataLayout(), ABI, i, Outs[i].VT, CCValAssign::Full,

                     Outs[i].Flags, CCInfo, /*IsFixed=*/true, /*IsRet=*/true,

                     nullptr))

      return false;

  }

  return true;

}


SDValue LoongArchTargetLowering::LowerReturn(

    SDValue Chain, CallingConv::ID CallConv, bool IsVarArg,

    const SmallVectorImpl<ISD::OutputArg> &Outs,

    const SmallVectorImpl<SDValue> &OutVals, const SDLoc &DL,

    SelectionDAG &DAG) const {

  // Stores the assignment of the return value to a location.

  SmallVector<CCValAssign> RVLocs;


  // Info about the registers and stack slot.

  CCState CCInfo(CallConv, IsVarArg, DAG.getMachineFunction(), RVLocs,

                 *DAG.getContext());


  analyzeOutputArgs(DAG.getMachineFunction(), CCInfo, Outs, /*IsRet=*/true,

                    nullptr, CC_LoongArch);

  if (CallConv == CallingConv::GHC && !RVLocs.empty())

    report_fatal_error("GHC functions return void only");

  SDValue Glue;

  SmallVector<SDValue, 4> RetOps(1, Chain);


  // Copy the result values into the output registers.

  for (unsigned i = 0, e = RVLocs.size(); i < e; ++i) {

    CCValAssign &VA = RVLocs[i];

    assert(VA.isRegLoc() && "Can only return in registers!");


    // Handle a 'normal' return.

    SDValue Val = convertValVTToLocVT(DAG, OutVals[i], VA, DL);

    Chain = DAG.getCopyToReg(Chain, DL, VA.getLocReg(), Val, Glue);


    // Guarantee that all emitted copies are stuck together.

    Glue = Chain.getValue(1);

    RetOps.push_back(DAG.getRegister(VA.getLocReg(), VA.getLocVT()));

  }


  RetOps[0] = Chain; // Update chain.


  // Add the glue node if we have it.

  if (Glue.getNode())

    RetOps.push_back(Glue);


  return DAG.getNode(LoongArchISD::RET, DL, MVT::Other, RetOps);

}


bool LoongArchTargetLowering::isFPImmVLDILegal(const APFloat &Imm,

                                               EVT VT) const {

  if (!Subtarget.hasExtLSX())

    return false;


  if (VT == MVT::f32) {

    uint64_t masked = Imm.bitcastToAPInt().getZExtValue() & 0x7e07ffff;

    return (masked == 0x3e000000 || masked == 0x40000000);

  }


  if (VT == MVT::f64) {

    uint64_t masked = Imm.bitcastToAPInt().getZExtValue() & 0x7fc0ffffffffffff;

    return (masked == 0x3fc0000000000000 || masked == 0x4000000000000000);

  }


  return false;

}


bool LoongArchTargetLowering::isFPImmLegal(const APFloat &Imm, EVT VT,

                                           bool ForCodeSize) const {

  // TODO: Maybe need more checks here after vector extension is supported.

  if (VT == MVT::f32 && !Subtarget.hasBasicF())

    return false;

  if (VT == MVT::f64 && !Subtarget.hasBasicD())

    return false;

  return (Imm.isZero() || Imm.isExactlyValue(1.0) || isFPImmVLDILegal(Imm, VT));

}


bool LoongArchTargetLowering::isCheapToSpeculateCttz(Type *) const {

  return true;

}


bool LoongArchTargetLowering::isCheapToSpeculateCtlz(Type *) const {

  return true;

}


bool LoongArchTargetLowering::shouldInsertFencesForAtomic(

    const Instruction *I) const {

  if (!Subtarget.is64Bit())

    return isa<LoadInst>(I) || isa<StoreInst>(I);


  if (isa<LoadInst>(I))

    return true;


  // On LA64, atomic store operations with IntegerBitWidth of 32 and 64 do not

  // require fences beacuse we can use amswap_db.[w/d].

  Type *Ty = I->getOperand(0)->getType();

  if (isa<StoreInst>(I) && Ty->isIntegerTy()) {

    unsigned Size = Ty->getIntegerBitWidth();

    return (Size == 8 || Size == 16);

  }


  return false;

}


EVT LoongArchTargetLowering::getSetCCResultType(const DataLayout &DL,

                                                LLVMContext &Context,

                                                EVT VT) const {

  if (!VT.isVector())

    return getPointerTy(DL);

  return VT.changeVectorElementTypeToInteger();

}


bool LoongArchTargetLowering::hasAndNot(SDValue Y) const {

  // TODO: Support vectors.

  return Y.getValueType().isScalarInteger() && !isa<ConstantSDNode>(Y);

}


bool LoongArchTargetLowering::getTgtMemIntrinsic(IntrinsicInfo &Info,

                                                 const CallInst &I,

                                                 MachineFunction &MF,

                                                 unsigned Intrinsic) const {

  switch (Intrinsic) {

  default:

    return false;

  case Intrinsic::loongarch_masked_atomicrmw_xchg_i32:

  case Intrinsic::loongarch_masked_atomicrmw_add_i32:

  case Intrinsic::loongarch_masked_atomicrmw_sub_i32:

  case Intrinsic::loongarch_masked_atomicrmw_nand_i32:

    Info.opc = ISD::INTRINSIC_W_CHAIN;

    Info.memVT = MVT::i32;

    Info.ptrVal = I.getArgOperand(0);

    Info.offset = 0;

    Info.align = Align(4);

    Info.flags = MachineMemOperand::MOLoad | MachineMemOperand::MOStore |

                 MachineMemOperand::MOVolatile;

    return true;

    // TODO: Add more Intrinsics later.

  }

}


// When -mlamcas is enabled, MinCmpXchgSizeInBits will be set to 8,

// atomicrmw and/or/xor operations with operands less than 32 bits cannot be

// expanded to am{and/or/xor}[_db].w through AtomicExpandPass. To prevent

// regression, we need to implement it manually.

void LoongArchTargetLowering::emitExpandAtomicRMW(AtomicRMWInst *AI) const {

  AtomicRMWInst::BinOp Op = AI->getOperation();


  assert((Op == AtomicRMWInst::Or || Op == AtomicRMWInst::Xor ||

          Op == AtomicRMWInst::And) &&

         "Unable to expand");

  unsigned MinWordSize = 4;


  IRBuilder<> Builder(AI);

  LLVMContext &Ctx = Builder.getContext();

  const DataLayout &DL = AI->getDataLayout();

  Type *ValueType = AI->getType();

  Type *WordType = Type::getIntNTy(Ctx, MinWordSize * 8);


  Value *Addr = AI->getPointerOperand();

  PointerType *PtrTy = cast<PointerType>(Addr->getType());

  IntegerType *IntTy = DL.getIndexType(Ctx, PtrTy->getAddressSpace());


  Value *AlignedAddr = Builder.CreateIntrinsic(

      Intrinsic::ptrmask, {PtrTy, IntTy},

      {Addr, ConstantInt::get(IntTy, ~(uint64_t)(MinWordSize - 1))}, nullptr,

      "AlignedAddr");


  Value *AddrInt = Builder.CreatePtrToInt(Addr, IntTy);

  Value *PtrLSB = Builder.CreateAnd(AddrInt, MinWordSize - 1, "PtrLSB");

  Value *ShiftAmt = Builder.CreateShl(PtrLSB, 3);

  ShiftAmt = Builder.CreateTrunc(ShiftAmt, WordType, "ShiftAmt");

  Value *Mask = Builder.CreateShl(

      ConstantInt::get(WordType,

                       (1 << (DL.getTypeStoreSize(ValueType) * 8)) - 1),

      ShiftAmt, "Mask");

  Value *Inv_Mask = Builder.CreateNot(Mask, "Inv_Mask");

  Value *ValOperand_Shifted =

      Builder.CreateShl(Builder.CreateZExt(AI->getValOperand(), WordType),

                        ShiftAmt, "ValOperand_Shifted");

  Value *NewOperand;

  if (Op == AtomicRMWInst::And)

    NewOperand = Builder.CreateOr(ValOperand_Shifted, Inv_Mask, "AndOperand");

  else

    NewOperand = ValOperand_Shifted;


  AtomicRMWInst *NewAI =

      Builder.CreateAtomicRMW(Op, AlignedAddr, NewOperand, Align(MinWordSize),

                              AI->getOrdering(), AI->getSyncScopeID());


  Value *Shift = Builder.CreateLShr(NewAI, ShiftAmt, "shifted");

  Value *Trunc = Builder.CreateTrunc(Shift, ValueType, "extracted");

  Value *FinalOldResult = Builder.CreateBitCast(Trunc, ValueType);

  AI->replaceAllUsesWith(FinalOldResult);

  AI->eraseFromParent();

}


TargetLowering::AtomicExpansionKind

LoongArchTargetLowering::shouldExpandAtomicRMWInIR(AtomicRMWInst *AI) const {

  // TODO: Add more AtomicRMWInst that needs to be extended.


  // Since floating-point operation requires a non-trivial set of data

  // operations, use CmpXChg to expand.

  if (AI->isFloatingPointOperation() ||

      AI->getOperation() == AtomicRMWInst::UIncWrap ||

      AI->getOperation() == AtomicRMWInst::UDecWrap ||

      AI->getOperation() == AtomicRMWInst::USubCond ||

      AI->getOperation() == AtomicRMWInst::USubSat)

    return AtomicExpansionKind::CmpXChg;


  if (Subtarget.hasLAM_BH() && Subtarget.is64Bit() &&

      (AI->getOperation() == AtomicRMWInst::Xchg ||

       AI->getOperation() == AtomicRMWInst::Add ||

       AI->getOperation() == AtomicRMWInst::Sub)) {

    return AtomicExpansionKind::None;

  }


  unsigned Size = AI->getType()->getPrimitiveSizeInBits();

  if (Subtarget.hasLAMCAS()) {

    if (Size < 32 && (AI->getOperation() == AtomicRMWInst::And ||

                      AI->getOperation() == AtomicRMWInst::Or ||

                      AI->getOperation() == AtomicRMWInst::Xor))

      return AtomicExpansionKind::Expand;

    if (AI->getOperation() == AtomicRMWInst::Nand || Size < 32)

      return AtomicExpansionKind::CmpXChg;

  }


  if (Size == 8 || Size == 16)

    return AtomicExpansionKind::MaskedIntrinsic;

  return AtomicExpansionKind::None;

}


static Intrinsic::ID

getIntrinsicForMaskedAtomicRMWBinOp(unsigned GRLen,

                                    AtomicRMWInst::BinOp BinOp) {

  if (GRLen == 64) {

    switch (BinOp) {

    default:

      llvm_unreachable("Unexpected AtomicRMW BinOp");

    case AtomicRMWInst::Xchg:

      return Intrinsic::loongarch_masked_atomicrmw_xchg_i64;

    case AtomicRMWInst::Add:

      return Intrinsic::loongarch_masked_atomicrmw_add_i64;

    case AtomicRMWInst::Sub:

      return Intrinsic::loongarch_masked_atomicrmw_sub_i64;

    case AtomicRMWInst::Nand:

      return Intrinsic::loongarch_masked_atomicrmw_nand_i64;

    case AtomicRMWInst::UMax:

      return Intrinsic::loongarch_masked_atomicrmw_umax_i64;

    case AtomicRMWInst::UMin:

      return Intrinsic::loongarch_masked_atomicrmw_umin_i64;

    case AtomicRMWInst::Max:

      return Intrinsic::loongarch_masked_atomicrmw_max_i64;

    case AtomicRMWInst::Min:

      return Intrinsic::loongarch_masked_atomicrmw_min_i64;

      // TODO: support other AtomicRMWInst.

    }

  }


  if (GRLen == 32) {

    switch (BinOp) {

    default:

      llvm_unreachable("Unexpected AtomicRMW BinOp");

    case AtomicRMWInst::Xchg:

      return Intrinsic::loongarch_masked_atomicrmw_xchg_i32;

    case AtomicRMWInst::Add:

      return Intrinsic::loongarch_masked_atomicrmw_add_i32;

    case AtomicRMWInst::Sub:

      return Intrinsic::loongarch_masked_atomicrmw_sub_i32;

    case AtomicRMWInst::Nand:

      return Intrinsic::loongarch_masked_atomicrmw_nand_i32;

      // TODO: support other AtomicRMWInst.

    }

  }


  llvm_unreachable("Unexpected GRLen\n");

}


TargetLowering::AtomicExpansionKind

LoongArchTargetLowering::shouldExpandAtomicCmpXchgInIR(

    AtomicCmpXchgInst *CI) const {


  if (Subtarget.hasLAMCAS())

    return AtomicExpansionKind::None;


  unsigned Size = CI->getCompareOperand()->getType()->getPrimitiveSizeInBits();

  if (Size == 8 || Size == 16)

    return AtomicExpansionKind::MaskedIntrinsic;

  return AtomicExpansionKind::None;

}


Value *LoongArchTargetLowering::emitMaskedAtomicCmpXchgIntrinsic(

    IRBuilderBase &Builder, AtomicCmpXchgInst *CI, Value *AlignedAddr,

    Value *CmpVal, Value *NewVal, Value *Mask, AtomicOrdering Ord) const {

  AtomicOrdering FailOrd = CI->getFailureOrdering();

  Value *FailureOrdering =

      Builder.getIntN(Subtarget.getGRLen(), static_cast<uint64_t>(FailOrd));


  // TODO: Support cmpxchg on LA32.

  Intrinsic::ID CmpXchgIntrID = Intrinsic::loongarch_masked_cmpxchg_i64;

  CmpVal = Builder.CreateSExt(CmpVal, Builder.getInt64Ty());

  NewVal = Builder.CreateSExt(NewVal, Builder.getInt64Ty());

  Mask = Builder.CreateSExt(Mask, Builder.getInt64Ty());

  Type *Tys[] = {AlignedAddr->getType()};

  Value *Result = Builder.CreateIntrinsic(

      CmpXchgIntrID, Tys, {AlignedAddr, CmpVal, NewVal, Mask, FailureOrdering});

  Result = Builder.CreateTrunc(Result, Builder.getInt32Ty());

  return Result;

}


Value *LoongArchTargetLowering::emitMaskedAtomicRMWIntrinsic(

    IRBuilderBase &Builder, AtomicRMWInst *AI, Value *AlignedAddr, Value *Incr,

    Value *Mask, Value *ShiftAmt, AtomicOrdering Ord) const {

  // In the case of an atomicrmw xchg with a constant 0/-1 operand, replace

  // the atomic instruction with an AtomicRMWInst::And/Or with appropriate

  // mask, as this produces better code than the LL/SC loop emitted by

  // int_loongarch_masked_atomicrmw_xchg.

  if (AI->getOperation() == AtomicRMWInst::Xchg &&

      isa<ConstantInt>(AI->getValOperand())) {

    ConstantInt *CVal = cast<ConstantInt>(AI->getValOperand());

    if (CVal->isZero())

      return Builder.CreateAtomicRMW(AtomicRMWInst::And, AlignedAddr,

                                     Builder.CreateNot(Mask, "Inv_Mask"),

                                     AI->getAlign(), Ord);

    if (CVal->isMinusOne())

      return Builder.CreateAtomicRMW(AtomicRMWInst::Or, AlignedAddr, Mask,

                                     AI->getAlign(), Ord);

  }


  unsigned GRLen = Subtarget.getGRLen();

  Value *Ordering =

      Builder.getIntN(GRLen, static_cast<uint64_t>(AI->getOrdering()));

  Type *Tys[] = {AlignedAddr->getType()};

  Function *LlwOpScwLoop = Intrinsic::getOrInsertDeclaration(

      AI->getModule(),

      getIntrinsicForMaskedAtomicRMWBinOp(GRLen, AI->getOperation()), Tys);


  if (GRLen == 64) {

    Incr = Builder.CreateSExt(Incr, Builder.getInt64Ty());

    Mask = Builder.CreateSExt(Mask, Builder.getInt64Ty());

    ShiftAmt = Builder.CreateSExt(ShiftAmt, Builder.getInt64Ty());

  }


  Value *Result;


  // Must pass the shift amount needed to sign extend the loaded value prior

  // to performing a signed comparison for min/max. ShiftAmt is the number of

  // bits to shift the value into position. Pass GRLen-ShiftAmt-ValWidth, which

  // is the number of bits to left+right shift the value in order to

  // sign-extend.

  if (AI->getOperation() == AtomicRMWInst::Min ||

      AI->getOperation() == AtomicRMWInst::Max) {

    const DataLayout &DL = AI->getDataLayout();

    unsigned ValWidth =

        DL.getTypeStoreSizeInBits(AI->getValOperand()->getType());

    Value *SextShamt =

        Builder.CreateSub(Builder.getIntN(GRLen, GRLen - ValWidth), ShiftAmt);

    Result = Builder.CreateCall(LlwOpScwLoop,

                                {AlignedAddr, Incr, Mask, SextShamt, Ordering});

  } else {

    Result =

        Builder.CreateCall(LlwOpScwLoop, {AlignedAddr, Incr, Mask, Ordering});

  }


  if (GRLen == 64)

    Result = Builder.CreateTrunc(Result, Builder.getInt32Ty());

  return Result;

}


bool LoongArchTargetLowering::isFMAFasterThanFMulAndFAdd(

    const MachineFunction &MF, EVT VT) const {

  VT = VT.getScalarType();


  if (!VT.isSimple())

    return false;


  switch (VT.getSimpleVT().SimpleTy) {

  case MVT::f32:

  case MVT::f64:

    return true;

  default:

    break;

  }


  return false;

}


Register LoongArchTargetLowering::getExceptionPointerRegister(

    const Constant *PersonalityFn) const {

  return LoongArch::R4;

}


Register LoongArchTargetLowering::getExceptionSelectorRegister(

    const Constant *PersonalityFn) const {

  return LoongArch::R5;

}


//===----------------------------------------------------------------------===//

// Target Optimization Hooks

//===----------------------------------------------------------------------===//


static int getEstimateRefinementSteps(EVT VT,

                                      const LoongArchSubtarget &Subtarget) {

  // Feature FRECIPE instrucions relative accuracy is 2^-14.

  // IEEE float has 23 digits and double has 52 digits.

  int RefinementSteps = VT.getScalarType() == MVT::f64 ? 2 : 1;

  return RefinementSteps;

}


SDValue LoongArchTargetLowering::getSqrtEstimate(SDValue Operand,

                                                 SelectionDAG &DAG, int Enabled,

                                                 int &RefinementSteps,

                                                 bool &UseOneConstNR,

                                                 bool Reciprocal) const {

  if (Subtarget.hasFrecipe()) {

    SDLoc DL(Operand);

    EVT VT = Operand.getValueType();


    if (VT == MVT::f32 || (VT == MVT::f64 && Subtarget.hasBasicD()) ||

        (VT == MVT::v4f32 && Subtarget.hasExtLSX()) ||

        (VT == MVT::v2f64 && Subtarget.hasExtLSX()) ||

        (VT == MVT::v8f32 && Subtarget.hasExtLASX()) ||

        (VT == MVT::v4f64 && Subtarget.hasExtLASX())) {


      if (RefinementSteps == ReciprocalEstimate::Unspecified)

        RefinementSteps = getEstimateRefinementSteps(VT, Subtarget);


      SDValue Estimate = DAG.getNode(LoongArchISD::FRSQRTE, DL, VT, Operand);

      if (Reciprocal)

        Estimate = DAG.getNode(ISD::FMUL, DL, VT, Operand, Estimate);


      return Estimate;

    }

  }


  return SDValue();

}


SDValue LoongArchTargetLowering::getRecipEstimate(SDValue Operand,

                                                  SelectionDAG &DAG,

                                                  int Enabled,

                                                  int &RefinementSteps) const {

  if (Subtarget.hasFrecipe()) {

    SDLoc DL(Operand);

    EVT VT = Operand.getValueType();


    if (VT == MVT::f32 || (VT == MVT::f64 && Subtarget.hasBasicD()) ||

        (VT == MVT::v4f32 && Subtarget.hasExtLSX()) ||

        (VT == MVT::v2f64 && Subtarget.hasExtLSX()) ||

        (VT == MVT::v8f32 && Subtarget.hasExtLASX()) ||

        (VT == MVT::v4f64 && Subtarget.hasExtLASX())) {


      if (RefinementSteps == ReciprocalEstimate::Unspecified)

        RefinementSteps = getEstimateRefinementSteps(VT, Subtarget);


      return DAG.getNode(LoongArchISD::FRECIPE, DL, VT, Operand);

    }

  }


  return SDValue();

}


//===----------------------------------------------------------------------===//

//                           LoongArch Inline Assembly Support

//===----------------------------------------------------------------------===//


LoongArchTargetLowering::ConstraintType

LoongArchTargetLowering::getConstraintType(StringRef Constraint) const {

  // LoongArch specific constraints in GCC: config/loongarch/constraints.md

  //

  // 'f':  A floating-point register (if available).

  // 'k':  A memory operand whose address is formed by a base register and

  //       (optionally scaled) index register.

  // 'l':  A signed 16-bit constant.

  // 'm':  A memory operand whose address is formed by a base register and

  //       offset that is suitable for use in instructions with the same

  //       addressing mode as st.w and ld.w.

  // 'I':  A signed 12-bit constant (for arithmetic instructions).

  // 'J':  Integer zero.

  // 'K':  An unsigned 12-bit constant (for logic instructions).

  // "ZB": An address that is held in a general-purpose register. The offset is

  //       zero.

  // "ZC": A memory operand whose address is formed by a base register and

  //       offset that is suitable for use in instructions with the same

  //       addressing mode as ll.w and sc.w.

  if (Constraint.size() == 1) {

    switch (Constraint[0]) {

    default:

      break;

    case 'f':

      return C_RegisterClass;

    case 'l':

    case 'I':

    case 'J':

    case 'K':

      return C_Immediate;

    case 'k':

      return C_Memory;

    }

  }


  if (Constraint == "ZC" || Constraint == "ZB")

    return C_Memory;


  // 'm' is handled here.

  return TargetLowering::getConstraintType(Constraint);

}


InlineAsm::ConstraintCode LoongArchTargetLowering::getInlineAsmMemConstraint(

    StringRef ConstraintCode) const {

  return StringSwitch<InlineAsm::ConstraintCode>(ConstraintCode)

      .Case("k", InlineAsm::ConstraintCode::k)

      .Case("ZB", InlineAsm::ConstraintCode::ZB)

      .Case("ZC", InlineAsm::ConstraintCode::ZC)

      .Default(TargetLowering::getInlineAsmMemConstraint(ConstraintCode));

}


std::pair<unsigned, const TargetRegisterClass *>

LoongArchTargetLowering::getRegForInlineAsmConstraint(

    const TargetRegisterInfo *TRI, StringRef Constraint, MVT VT) const {

  // First, see if this is a constraint that directly corresponds to a LoongArch

  // register class.

  if (Constraint.size() == 1) {

    switch (Constraint[0]) {

    case 'r':

      // TODO: Support fixed vectors up to GRLen?

      if (VT.isVector())

        break;

      return std::make_pair(0U, &LoongArch::GPRRegClass);

    case 'f':

      if (Subtarget.hasBasicF() && VT == MVT::f32)

        return std::make_pair(0U, &LoongArch::FPR32RegClass);

      if (Subtarget.hasBasicD() && VT == MVT::f64)

        return std::make_pair(0U, &LoongArch::FPR64RegClass);

      if (Subtarget.hasExtLSX() &&

          TRI->isTypeLegalForClass(LoongArch::LSX128RegClass, VT))

        return std::make_pair(0U, &LoongArch::LSX128RegClass);

      if (Subtarget.hasExtLASX() &&

          TRI->isTypeLegalForClass(LoongArch::LASX256RegClass, VT))

        return std::make_pair(0U, &LoongArch::LASX256RegClass);

      break;

    default:

      break;

    }

  }


  // TargetLowering::getRegForInlineAsmConstraint uses the name of the TableGen

  // record (e.g. the "R0" in `def R0`) to choose registers for InlineAsm

  // constraints while the official register name is prefixed with a '$'. So we

  // clip the '$' from the original constraint string (e.g. {$r0} to {r0}.)

  // before it being parsed. And TargetLowering::getRegForInlineAsmConstraint is

  // case insensitive, so no need to convert the constraint to upper case here.

  //

  // For now, no need to support ABI names (e.g. `$a0`) as clang will correctly

  // decode the usage of register name aliases into their official names. And

  // AFAIK, the not yet upstreamed `rustc` for LoongArch will always use

  // official register names.

  if (Constraint.starts_with("{$r") || Constraint.starts_with("{$f") ||

      Constraint.starts_with("{$vr") || Constraint.starts_with("{$xr")) {

    bool IsFP = Constraint[2] == 'f';

    std::pair<StringRef, StringRef> Temp = Constraint.split('$');

    std::pair<unsigned, const TargetRegisterClass *> R;

    R = TargetLowering::getRegForInlineAsmConstraint(

        TRI, join_items("", Temp.first, Temp.second), VT);

    // Match those names to the widest floating point register type available.

    if (IsFP) {

      unsigned RegNo = R.first;

      if (LoongArch::F0 <= RegNo && RegNo <= LoongArch::F31) {

        if (Subtarget.hasBasicD() && (VT == MVT::f64 || VT == MVT::Other)) {

          unsigned DReg = RegNo - LoongArch::F0 + LoongArch::F0_64;

          return std::make_pair(DReg, &LoongArch::FPR64RegClass);

        }

      }

    }

    return R;

  }


  return TargetLowering::getRegForInlineAsmConstraint(TRI, Constraint, VT);

}


void LoongArchTargetLowering::LowerAsmOperandForConstraint(

    SDValue Op, StringRef Constraint, std::vector<SDValue> &Ops,

    SelectionDAG &DAG) const {

  // Currently only support length 1 constraints.

  if (Constraint.size() == 1) {

    switch (Constraint[0]) {

    case 'l':

      // Validate & create a 16-bit signed immediate operand.

      if (auto *C = dyn_cast<ConstantSDNode>(Op)) {

        uint64_t CVal = C->getSExtValue();

        if (isInt<16>(CVal))

          Ops.push_back(DAG.getSignedTargetConstant(CVal, SDLoc(Op),

                                                    Subtarget.getGRLenVT()));

      }

      return;

    case 'I':

      // Validate & create a 12-bit signed immediate operand.

      if (auto *C = dyn_cast<ConstantSDNode>(Op)) {

        uint64_t CVal = C->getSExtValue();

        if (isInt<12>(CVal))

          Ops.push_back(DAG.getSignedTargetConstant(CVal, SDLoc(Op),

                                                    Subtarget.getGRLenVT()));

      }

      return;

    case 'J':

      // Validate & create an integer zero operand.

      if (auto *C = dyn_cast<ConstantSDNode>(Op))

        if (C->getZExtValue() == 0)

          Ops.push_back(

              DAG.getTargetConstant(0, SDLoc(Op), Subtarget.getGRLenVT()));

      return;

    case 'K':

      // Validate & create a 12-bit unsigned immediate operand.

      if (auto *C = dyn_cast<ConstantSDNode>(Op)) {

        uint64_t CVal = C->getZExtValue();

        if (isUInt<12>(CVal))

          Ops.push_back(

              DAG.getTargetConstant(CVal, SDLoc(Op), Subtarget.getGRLenVT()));

      }

      return;

    default:

      break;

    }

  }

  TargetLowering::LowerAsmOperandForConstraint(Op, Constraint, Ops, DAG);

}


#define GET_REGISTER_MATCHER

#include "LoongArchGenAsmMatcher.inc"


Register

LoongArchTargetLowering::getRegisterByName(const char *RegName, LLT VT,

                                           const MachineFunction &MF) const {

  std::pair<StringRef, StringRef> Name = StringRef(RegName).split('$');

  std::string NewRegName = Name.second.str();

  Register Reg = MatchRegisterAltName(NewRegName);

  if (Reg == LoongArch::NoRegister)

    Reg = MatchRegisterName(NewRegName);

  if (Reg == LoongArch::NoRegister)

    report_fatal_error(

        Twine("Invalid register name \"" + StringRef(RegName) + "\"."));

  BitVector ReservedRegs = Subtarget.getRegisterInfo()->getReservedRegs(MF);

  if (!ReservedRegs.test(Reg))

    report_fatal_error(Twine("Trying to obtain non-reserved register \"" +

                             StringRef(RegName) + "\"."));

  return Reg;

}


bool LoongArchTargetLowering::decomposeMulByConstant(LLVMContext &Context,

                                                     EVT VT, SDValue C) const {

  // TODO: Support vectors.

  if (!VT.isScalarInteger())

    return false;


  // Omit the optimization if the data size exceeds GRLen.

  if (VT.getSizeInBits() > Subtarget.getGRLen())

    return false;


  if (auto *ConstNode = dyn_cast<ConstantSDNode>(C.getNode())) {

    const APInt &Imm = ConstNode->getAPIntValue();

    // Break MUL into (SLLI + ADD/SUB) or ALSL.

    if ((Imm + 1).isPowerOf2() || (Imm - 1).isPowerOf2() ||

        (1 - Imm).isPowerOf2() || (-1 - Imm).isPowerOf2())

      return true;

    // Break MUL into (ALSL x, (SLLI x, imm0), imm1).

    if (ConstNode->hasOneUse() &&

        ((Imm - 2).isPowerOf2() || (Imm - 4).isPowerOf2() ||

         (Imm - 8).isPowerOf2() || (Imm - 16).isPowerOf2()))

      return true;

    // Break (MUL x, imm) into (ADD (SLLI x, s0), (SLLI x, s1)),

    // in which the immediate has two set bits. Or Break (MUL x, imm)

    // into (SUB (SLLI x, s0), (SLLI x, s1)), in which the immediate

    // equals to (1 << s0) - (1 << s1).

    if (ConstNode->hasOneUse() && !(Imm.sge(-2048) && Imm.sle(4095))) {

      unsigned Shifts = Imm.countr_zero();

      // Reject immediates which can be composed via a single LUI.

      if (Shifts >= 12)

        return false;

      // Reject multiplications can be optimized to

      // (SLLI (ALSL x, x, 1/2/3/4), s).

      APInt ImmPop = Imm.ashr(Shifts);

      if (ImmPop == 3 || ImmPop == 5 || ImmPop == 9 || ImmPop == 17)

        return false;

      // We do not consider the case `(-Imm - ImmSmall).isPowerOf2()`,

      // since it needs one more instruction than other 3 cases.

      APInt ImmSmall = APInt(Imm.getBitWidth(), 1ULL << Shifts, true);

      if ((Imm - ImmSmall).isPowerOf2() || (Imm + ImmSmall).isPowerOf2() ||

          (ImmSmall - Imm).isPowerOf2())

        return true;

    }

  }


  return false;

}


bool LoongArchTargetLowering::isLegalAddressingMode(const DataLayout &DL,

                                                    const AddrMode &AM,

                                                    Type *Ty, unsigned AS,

                                                    Instruction *I) const {

  // LoongArch has four basic addressing modes:

  //  1. reg

  //  2. reg + 12-bit signed offset

  //  3. reg + 14-bit signed offset left-shifted by 2

  //  4. reg1 + reg2

  // TODO: Add more checks after support vector extension.


  // No global is ever allowed as a base.

  if (AM.BaseGV)

    return false;


  // Require a 12-bit signed offset or 14-bit signed offset left-shifted by 2

  // with `UAL` feature.

  if (!isInt<12>(AM.BaseOffs) &&

      !(isShiftedInt<14, 2>(AM.BaseOffs) && Subtarget.hasUAL()))

    return false;


  switch (AM.Scale) {

  case 0:

    // "r+i" or just "i", depending on HasBaseReg.

    break;

  case 1:

    // "r+r+i" is not allowed.

    if (AM.HasBaseReg && AM.BaseOffs)

      return false;

    // Otherwise we have "r+r" or "r+i".

    break;

  case 2:

    // "2*r+r" or "2*r+i" is not allowed.

    if (AM.HasBaseReg || AM.BaseOffs)

      return false;

    // Allow "2*r" as "r+r".

    break;

  default:

    return false;

  }


  return true;

}


bool LoongArchTargetLowering::isLegalICmpImmediate(int64_t Imm) const {

  return isInt<12>(Imm);

}


bool LoongArchTargetLowering::isLegalAddImmediate(int64_t Imm) const {

  return isInt<12>(Imm);

}


bool LoongArchTargetLowering::isZExtFree(SDValue Val, EVT VT2) const {

  // Zexts are free if they can be combined with a load.

  // Don't advertise i32->i64 zextload as being free for LA64. It interacts

  // poorly with type legalization of compares preferring sext.

  if (auto *LD = dyn_cast<LoadSDNode>(Val)) {

    EVT MemVT = LD->getMemoryVT();

    if ((MemVT == MVT::i8 || MemVT == MVT::i16) &&

        (LD->getExtensionType() == ISD::NON_EXTLOAD ||

         LD->getExtensionType() == ISD::ZEXTLOAD))

      return true;

  }


  return TargetLowering::isZExtFree(Val, VT2);

}


bool LoongArchTargetLowering::isSExtCheaperThanZExt(EVT SrcVT,

                                                    EVT DstVT) const {

  return Subtarget.is64Bit() && SrcVT == MVT::i32 && DstVT == MVT::i64;

}


bool LoongArchTargetLowering::signExtendConstant(const ConstantInt *CI) const {

  return Subtarget.is64Bit() && CI->getType()->isIntegerTy(32);

}


bool LoongArchTargetLowering::hasAndNotCompare(SDValue Y) const {

  // TODO: Support vectors.

  if (Y.getValueType().isVector())

    return false;


  return !isa<ConstantSDNode>(Y);

}


ISD::NodeType LoongArchTargetLowering::getExtendForAtomicCmpSwapArg() const {

  // LAMCAS will use amcas[_DB].{b/h/w/d} which does not require extension.

  return Subtarget.hasLAMCAS() ? ISD::ANY_EXTEND : ISD::SIGN_EXTEND;

}


bool LoongArchTargetLowering::shouldSignExtendTypeInLibCall(

    Type *Ty, bool IsSigned) const {

  if (Subtarget.is64Bit() && Ty->isIntegerTy(32))

    return true;


  return IsSigned;

}


bool LoongArchTargetLowering::shouldExtendTypeInLibCall(EVT Type) const {

  // Return false to suppress the unnecessary extensions if the LibCall

  // arguments or return value is a float narrower than GRLEN on a soft FP ABI.

  if (Subtarget.isSoftFPABI() && (Type.isFloatingPoint() && !Type.isVector() &&

                                  Type.getSizeInBits() < Subtarget.getGRLen()))

    return false;

  return true;

}


// memcpy, and other memory intrinsics, typically tries to use wider load/store

// if the source/dest is aligned and the copy size is large enough. We therefore

// want to align such objects passed to memory intrinsics.

bool LoongArchTargetLowering::shouldAlignPointerArgs(CallInst *CI,

                                                     unsigned &MinSize,

                                                     Align &PrefAlign) const {

  if (!isa<MemIntrinsic>(CI))

    return false;


  if (Subtarget.is64Bit()) {

    MinSize = 8;

    PrefAlign = Align(8);

  } else {

    MinSize = 4;

    PrefAlign = Align(4);

  }


  return true;

}

MRI
unsigned const MachineRegisterInfo * MRI
Definition: AArch64AdvSIMDScalarPass.cpp:105

MatchRegisterName
static MCRegister MatchRegisterName(StringRef Name)

checkValueWidth
static bool checkValueWidth(SDValue V, unsigned width, ISD::LoadExtType &ExtType)
Definition: AArch64ISelLowering.cpp:24242

performORCombine
static SDValue performORCombine(SDNode *N, TargetLowering::DAGCombinerInfo &DCI, const AArch64Subtarget *Subtarget, const AArch64TargetLowering &TLI)
Definition: AArch64ISelLowering.cpp:19359

performANDCombine
static SDValue performANDCombine(SDNode *N, TargetLowering::DAGCombinerInfo &DCI)
Definition: AArch64ISelLowering.cpp:19567

performSETCCCombine
static SDValue performSETCCCombine(SDNode *N, TargetLowering::DAGCombinerInfo &DCI, SelectionDAG &DAG)
Definition: AArch64ISelLowering.cpp:24965

getNode
static msgpack::DocNode getNode(msgpack::DocNode DN, msgpack::Type Type, MCValue Val)
Definition: AMDGPUDelayedMCExpr.cpp:15

NODE_NAME_CASE
#define NODE_NAME_CASE(node)
Definition: AMDGPUISelLowering.cpp:5459

MBB
MachineBasicBlock & MBB
Definition: ARMSLSHardening.cpp:71

DL
MachineBasicBlock MachineBasicBlock::iterator DebugLoc DL
Definition: ARMSLSHardening.cpp:73

MatchRegisterAltName
static MCRegister MatchRegisterAltName(StringRef Name)
Maps from the set of all alternative registernames to a register number.

Results
Function Alias Analysis Results
Definition: AliasAnalysis.cpp:731

getConstant
static uint64_t getConstant(const Value *IndexValue)
Definition: BPFAbstractMemberAccess.cpp:319

getTargetNode
static SDValue getTargetNode(GlobalAddressSDNode *N, const SDLoc &DL, EVT Ty, SelectionDAG &DAG, unsigned Flags)
Definition: BPFISelLowering.cpp:724

Info
Analysis containing CSE Info
Definition: CSEInfo.cpp:27

convertValVTToLocVT
static SDValue convertValVTToLocVT(SelectionDAG &DAG, SDValue Val, const CCValAssign &VA, const SDLoc &DL)
Definition: CSKYISelLowering.cpp:199

unpackFromMemLoc
static SDValue unpackFromMemLoc(SelectionDAG &DAG, SDValue Chain, const CCValAssign &VA, const SDLoc &DL)
Definition: CSKYISelLowering.cpp:261

convertLocVTToValVT
static SDValue convertLocVTToValVT(SelectionDAG &DAG, SDValue Val, const CCValAssign &VA, const SDLoc &DL)
Definition: CSKYISelLowering.cpp:215

unpackFromRegLoc
static SDValue unpackFromRegLoc(const CSKYSubtarget &Subtarget, SelectionDAG &DAG, SDValue Chain, const CCValAssign &VA, const SDLoc &DL)
Definition: CSKYISelLowering.cpp:229

CodeGen.h

RetTy
return RetTy
Definition: DeadArgumentElimination.cpp:361

Idx
Returns the sub type a function will return at a given Idx Should correspond to the result type of an ExtractValue instruction executed with just that one unsigned Idx
Definition: DeadArgumentElimination.cpp:353

Debug.h

LLVM_DEBUG
#define LLVM_DEBUG(...)
Definition: Debug.h:106

Addr
uint64_t Addr
Definition: ELFObjHandler.cpp:79

Name
std::string Name
Definition: ELFObjHandler.cpp:77

Size
uint64_t Size
Definition: ELFObjHandler.cpp:81

End
bool End
Definition: ELF_riscv.cpp:480

TII
const HexagonInstrInfo * TII
Definition: HexagonCopyToCombine.cpp:125

IRBuilder.h

MI
IRTranslator LLVM IR MI
Definition: IRTranslator.cpp:112

IntrinsicInst.h

ISDOpcodes.h

KnownBits.h

RegName
#define RegName(no)

LoongArchBaseInfo.h

performINTRINSIC_WO_CHAINCombine
static SDValue performINTRINSIC_WO_CHAINCombine(SDNode *N, SelectionDAG &DAG, TargetLowering::DAGCombinerInfo &DCI, const LoongArchSubtarget &Subtarget)
Definition: LoongArchISelLowering.cpp:3904

lowerVECTOR_SHUFFLE_VREPLVEI
static SDValue lowerVECTOR_SHUFFLE_VREPLVEI(const SDLoc &DL, ArrayRef< int > Mask, MVT VT, SDValue V1, SDValue V2, SelectionDAG &DAG)
Lower VECTOR_SHUFFLE into VREPLVEI (if possible).
Definition: LoongArchISelLowering.cpp:554

ArgFPR32s
const MCPhysReg ArgFPR32s[]
Definition: LoongArchISelLowering.cpp:4888

lowerVECTOR_SHUFFLE_VSHUF4I
static SDValue lowerVECTOR_SHUFFLE_VSHUF4I(const SDLoc &DL, ArrayRef< int > Mask, MVT VT, SDValue V1, SDValue V2, SelectionDAG &DAG)
Lower VECTOR_SHUFFLE into VSHUF4I (if possible).
Definition: LoongArchISelLowering.cpp:596

ArgVRs
const MCPhysReg ArgVRs[]
Definition: LoongArchISelLowering.cpp:4896

lowerVECTOR_SHUFFLE_VPICKEV
static SDValue lowerVECTOR_SHUFFLE_VPICKEV(const SDLoc &DL, ArrayRef< int > Mask, MVT VT, SDValue V1, SDValue V2, SelectionDAG &DAG)
Lower VECTOR_SHUFFLE into VPICKEV (if possible).
Definition: LoongArchISelLowering.cpp:823

lowerVECTOR_SHUFFLE_XVPICKOD
static SDValue lowerVECTOR_SHUFFLE_XVPICKOD(const SDLoc &DL, ArrayRef< int > Mask, MVT VT, SDValue V1, SDValue V2, SelectionDAG &DAG)
Lower VECTOR_SHUFFLE into XVPICKOD (if possible).
Definition: LoongArchISelLowering.cpp:1138

fitsRegularPattern
static bool fitsRegularPattern(typename SmallVectorImpl< ValType >::const_iterator Begin, unsigned CheckStride, typename SmallVectorImpl< ValType >::const_iterator End, ValType ExpectedIndex, unsigned ExpectedIndexStride)
Determine whether a range fits a regular pattern of values.
Definition: LoongArchISelLowering.cpp:526

canonicalizeShuffleVectorByLane
static void canonicalizeShuffleVectorByLane(const SDLoc &DL, MutableArrayRef< int > Mask, MVT VT, SDValue &V1, SDValue &V2, SelectionDAG &DAG)
Shuffle vectors by lane to generate more optimized instructions.
Definition: LoongArchISelLowering.cpp:1242

emitIntrinsicErrorMessage
static SDValue emitIntrinsicErrorMessage(SDValue Op, StringRef ErrorMsg, SelectionDAG &DAG)
Definition: LoongArchISelLowering.cpp:2452

ZeroDivCheck
static cl::opt< bool > ZeroDivCheck("loongarch-check-zero-division", cl::Hidden, cl::desc("Trap on integer division by zero."), cl::init(false))

lower256BitShuffle
static SDValue lower256BitShuffle(const SDLoc &DL, ArrayRef< int > Mask, MVT VT, SDValue V1, SDValue V2, SelectionDAG &DAG)
Dispatching routine to lower various 256-bit LoongArch vector shuffles.
Definition: LoongArchISelLowering.cpp:1345

getEstimateRefinementSteps
static int getEstimateRefinementSteps(EVT VT, const LoongArchSubtarget &Subtarget)
Definition: LoongArchISelLowering.cpp:6154

emitErrorAndReplaceIntrinsicResults
static void emitErrorAndReplaceIntrinsicResults(SDNode *N, SmallVectorImpl< SDValue > &Results, SelectionDAG &DAG, StringRef ErrorMsg, bool WithChain=true)
Definition: LoongArchISelLowering.cpp:2800

checkIntrinsicImmArg
static SDValue checkIntrinsicImmArg(SDValue Op, unsigned ImmOp, SelectionDAG &DAG, bool IsSigned=false)
Definition: LoongArchISelLowering.cpp:2035

lowerVECTOR_SHUFFLE_XVSHUF4I
static SDValue lowerVECTOR_SHUFFLE_XVSHUF4I(const SDLoc &DL, ArrayRef< int > Mask, MVT VT, SDValue V1, SDValue V2, SelectionDAG &DAG)
Lower VECTOR_SHUFFLE into XVSHUF4I (if possible).
Definition: LoongArchISelLowering.cpp:1005

lowerVECTOR_SHUFFLE_VILVH
static SDValue lowerVECTOR_SHUFFLE_VILVH(const SDLoc &DL, ArrayRef< int > Mask, MVT VT, SDValue V1, SDValue V2, SelectionDAG &DAG)
Lower VECTOR_SHUFFLE into VILVH (if possible).
Definition: LoongArchISelLowering.cpp:740

getPrefTypeAlign
static Align getPrefTypeAlign(EVT VT, SelectionDAG &DAG)
Definition: LoongArchISelLowering.cpp:5483

CC_LoongArch
static bool CC_LoongArch(const DataLayout &DL, LoongArchABI::ABI ABI, unsigned ValNo, MVT ValVT, CCValAssign::LocInfo LocInfo, ISD::ArgFlagsTy ArgFlags, CCState &State, bool IsFixed, bool IsRet, Type *OrigTy)
Definition: LoongArchISelLowering.cpp:4942

performSRLCombine
static SDValue performSRLCombine(SDNode *N, SelectionDAG &DAG, TargetLowering::DAGCombinerInfo &DCI, const LoongArchSubtarget &Subtarget)
Definition: LoongArchISelLowering.cpp:3356

lowerVectorBitSetImm
static SDValue lowerVectorBitSetImm(SDNode *Node, SelectionDAG &DAG)
Definition: LoongArchISelLowering.cpp:3870

lowerVECTOR_SHUFFLE_XVPACKOD
static SDValue lowerVECTOR_SHUFFLE_XVPACKOD(const SDLoc &DL, ArrayRef< int > Mask, MVT VT, SDValue V1, SDValue V2, SelectionDAG &DAG)
Lower VECTOR_SHUFFLE into XVPACKOD (if possible).
Definition: LoongArchISelLowering.cpp:1023

CRC_CASE_EXT_BINARYOP
#define CRC_CASE_EXT_BINARYOP(NAME, NODE)

lowerVectorBitRevImm
static SDValue lowerVectorBitRevImm(SDNode *Node, SelectionDAG &DAG)
Definition: LoongArchISelLowering.cpp:3887

truncateVecElts
static SDValue truncateVecElts(SDNode *Node, SelectionDAG &DAG)
Definition: LoongArchISelLowering.cpp:3832

insertDivByZeroTrap
static MachineBasicBlock * insertDivByZeroTrap(MachineInstr &MI, MachineBasicBlock *MBB)
Definition: LoongArchISelLowering.cpp:4418

customLegalizeToWOpWithSExt
static SDValue customLegalizeToWOpWithSExt(SDNode *N, SelectionDAG &DAG)
Definition: LoongArchISelLowering.cpp:2788

lowerVectorBitClear
static SDValue lowerVectorBitClear(SDNode *Node, SelectionDAG &DAG)
Definition: LoongArchISelLowering.cpp:3840

CC_LoongArch_GHC
static bool CC_LoongArch_GHC(unsigned ValNo, MVT ValVT, MVT LocVT, CCValAssign::LocInfo LocInfo, ISD::ArgFlagsTy ArgFlags, CCState &State)
Definition: LoongArchISelLowering.cpp:5231

lowerVECTOR_SHUFFLE_VPACKEV
static SDValue lowerVECTOR_SHUFFLE_VPACKEV(const SDLoc &DL, ArrayRef< int > Mask, MVT VT, SDValue V1, SDValue V2, SelectionDAG &DAG)
Lower VECTOR_SHUFFLE into VPACKEV (if possible).
Definition: LoongArchISelLowering.cpp:659

replaceVPICKVE2GRResults
static void replaceVPICKVE2GRResults(SDNode *Node, SmallVectorImpl< SDValue > &Results, SelectionDAG &DAG, const LoongArchSubtarget &Subtarget, unsigned ResOp)
Definition: LoongArchISelLowering.cpp:2812

legalizeIntrinsicImmArg
static SDValue legalizeIntrinsicImmArg(SDNode *Node, unsigned ImmOp, SelectionDAG &DAG, const LoongArchSubtarget &Subtarget, bool IsSigned=false)
Definition: LoongArchISelLowering.cpp:3796

emitIntrinsicWithChainErrorMessage
static SDValue emitIntrinsicWithChainErrorMessage(SDValue Op, StringRef ErrorMsg, SelectionDAG &DAG)
Definition: LoongArchISelLowering.cpp:2329

ArgXRs
const MCPhysReg ArgXRs[]
Definition: LoongArchISelLowering.cpp:4900

CC_LoongArchAssign2GRLen
static bool CC_LoongArchAssign2GRLen(unsigned GRLen, CCState &State, CCValAssign VA1, ISD::ArgFlagsTy ArgFlags1, unsigned ValNo2, MVT ValVT2, MVT LocVT2, ISD::ArgFlagsTy ArgFlags2)
Definition: LoongArchISelLowering.cpp:4906

ArgFPR64s
const MCPhysReg ArgFPR64s[]
Definition: LoongArchISelLowering.cpp:4892

emitPseudoCTPOP
static MachineBasicBlock * emitPseudoCTPOP(MachineInstr &MI, MachineBasicBlock *BB, const LoongArchSubtarget &Subtarget)
Definition: LoongArchISelLowering.cpp:4657

IOCSRWR_CASE
#define IOCSRWR_CASE(NAME, NODE)

CRC_CASE_EXT_UNARYOP
#define CRC_CASE_EXT_UNARYOP(NAME, NODE)

lowerVECTOR_SHUFFLE_VPACKOD
static SDValue lowerVECTOR_SHUFFLE_VPACKOD(const SDLoc &DL, ArrayRef< int > Mask, MVT VT, SDValue V1, SDValue V2, SelectionDAG &DAG)
Lower VECTOR_SHUFFLE into VPACKOD (if possible).
Definition: LoongArchISelLowering.cpp:699

emitPseudoXVINSGR2VR
static MachineBasicBlock * emitPseudoXVINSGR2VR(MachineInstr &MI, MachineBasicBlock *BB, const LoongArchSubtarget &Subtarget)
Definition: LoongArchISelLowering.cpp:4593

lowerVectorSplatImm
static SDValue lowerVectorSplatImm(SDNode *Node, unsigned ImmOp, SelectionDAG &DAG, bool IsSigned=false)
Definition: LoongArchISelLowering.cpp:3813

ArgGPRs
const MCPhysReg ArgGPRs[]
Definition: LoongArchISelLowering.cpp:4883

lowerVECTOR_SHUFFLE_XVILVL
static SDValue lowerVECTOR_SHUFFLE_XVILVL(const SDLoc &DL, ArrayRef< int > Mask, MVT VT, SDValue V1, SDValue V2, SelectionDAG &DAG)
Lower VECTOR_SHUFFLE into XVILVL (if possible).
Definition: LoongArchISelLowering.cpp:1069

customLegalizeToWOp
static SDValue customLegalizeToWOp(SDNode *N, SelectionDAG &DAG, int NumOp, unsigned ExtOpc=ISD::ANY_EXTEND)
Definition: LoongArchISelLowering.cpp:2754

replaceVecCondBranchResults
static void replaceVecCondBranchResults(SDNode *N, SmallVectorImpl< SDValue > &Results, SelectionDAG &DAG, const LoongArchSubtarget &Subtarget, unsigned ResOp)
Definition: LoongArchISelLowering.cpp:2833

ASRT_LE_GT_CASE
#define ASRT_LE_GT_CASE(NAME)

isConstantOrUndef
static bool isConstantOrUndef(const SDValue Op)
Definition: LoongArchISelLowering.cpp:1445

lowerVECTOR_SHUFFLE_XVPACKEV
static SDValue lowerVECTOR_SHUFFLE_XVPACKEV(const SDLoc &DL, ArrayRef< int > Mask, MVT VT, SDValue V1, SDValue V2, SelectionDAG &DAG)
Lower VECTOR_SHUFFLE into XVPACKEV (if possible).
Definition: LoongArchISelLowering.cpp:1016

emitVecCondBranchPseudo
static MachineBasicBlock * emitVecCondBranchPseudo(MachineInstr &MI, MachineBasicBlock *BB, const LoongArchSubtarget &Subtarget)
Definition: LoongArchISelLowering.cpp:4468

lowerVECTOR_SHUFFLE_XVILVH
static SDValue lowerVECTOR_SHUFFLE_XVILVH(const SDLoc &DL, ArrayRef< int > Mask, MVT VT, SDValue V1, SDValue V2, SelectionDAG &DAG)
Lower VECTOR_SHUFFLE into XVILVH (if possible).
Definition: LoongArchISelLowering.cpp:1030

lowerVECTOR_SHUFFLE_XVSHUF
static SDValue lowerVECTOR_SHUFFLE_XVSHUF(const SDLoc &DL, ArrayRef< int > Mask, MVT VT, SDValue V1, SDValue V2, SelectionDAG &DAG)
Lower VECTOR_SHUFFLE into XVSHUF (if possible).
Definition: LoongArchISelLowering.cpp:1174

replaceCMP_XCHG_128Results
static void replaceCMP_XCHG_128Results(SDNode *N, SmallVectorImpl< SDValue > &Results, SelectionDAG &DAG)
Definition: LoongArchISelLowering.cpp:2914

performBITREV_WCombine
static SDValue performBITREV_WCombine(SDNode *N, SelectionDAG &DAG, TargetLowering::DAGCombinerInfo &DCI, const LoongArchSubtarget &Subtarget)
Definition: LoongArchISelLowering.cpp:3781

IOCSRRD_CASE
#define IOCSRRD_CASE(NAME, NODE)

lower128BitShuffle
static SDValue lower128BitShuffle(const SDLoc &DL, ArrayRef< int > Mask, MVT VT, SDValue V1, SDValue V2, SelectionDAG &DAG)
Dispatching routine to lower various 128-bit LoongArch vector shuffles.
Definition: LoongArchISelLowering.cpp:920

lowerVECTOR_SHUFFLE_XVPICKEV
static SDValue lowerVECTOR_SHUFFLE_XVPICKEV(const SDLoc &DL, ArrayRef< int > Mask, MVT VT, SDValue V1, SDValue V2, SelectionDAG &DAG)
Lower VECTOR_SHUFFLE into XVPICKEV (if possible).
Definition: LoongArchISelLowering.cpp:1103

lowerVECTOR_SHUFFLE_VILVL
static SDValue lowerVECTOR_SHUFFLE_VILVL(const SDLoc &DL, ArrayRef< int > Mask, MVT VT, SDValue V1, SDValue V2, SelectionDAG &DAG)
Lower VECTOR_SHUFFLE into VILVL (if possible).
Definition: LoongArchISelLowering.cpp:783

lowerVectorBitClearImm
static SDValue lowerVectorBitClearImm(SDNode *Node, SelectionDAG &DAG)
Definition: LoongArchISelLowering.cpp:3852

isConstantOrUndefBUILD_VECTOR
static bool isConstantOrUndefBUILD_VECTOR(const BuildVectorSDNode *Op)
Definition: LoongArchISelLowering.cpp:1455

replaceINTRINSIC_WO_CHAINResults
static void replaceINTRINSIC_WO_CHAINResults(SDNode *N, SmallVectorImpl< SDValue > &Results, SelectionDAG &DAG, const LoongArchSubtarget &Subtarget)
Definition: LoongArchISelLowering.cpp:2847

lowerVECTOR_SHUFFLE_XVREPLVEI
static SDValue lowerVECTOR_SHUFFLE_XVREPLVEI(const SDLoc &DL, ArrayRef< int > Mask, MVT VT, SDValue V1, SDValue V2, SelectionDAG &DAG)
Lower VECTOR_SHUFFLE into XVREPLVEI (if possible).
Definition: LoongArchISelLowering.cpp:973

CSR_CASE
#define CSR_CASE(ID)

lowerVECTOR_SHUFFLE_VPICKOD
static SDValue lowerVECTOR_SHUFFLE_VPICKOD(const SDLoc &DL, ArrayRef< int > Mask, MVT VT, SDValue V1, SDValue V2, SelectionDAG &DAG)
Lower VECTOR_SHUFFLE into VPICKOD (if possible).
Definition: LoongArchISelLowering.cpp:865

getIntrinsicForMaskedAtomicRMWBinOp
static Intrinsic::ID getIntrinsicForMaskedAtomicRMWBinOp(unsigned GRLen, AtomicRMWInst::BinOp BinOp)
Definition: LoongArchISelLowering.cpp:5986

lowerVECTOR_SHUFFLE_VSHUF
static SDValue lowerVECTOR_SHUFFLE_VSHUF(const SDLoc &DL, ArrayRef< int > Mask, MVT VT, SDValue V1, SDValue V2, SelectionDAG &DAG)
Lower VECTOR_SHUFFLE into VSHUF.
Definition: LoongArchISelLowering.cpp:895

getLoongArchWOpcode
static LoongArchISD::NodeType getLoongArchWOpcode(unsigned Opcode)
Definition: LoongArchISelLowering.cpp:2721

LoongArchISelLowering.h

LoongArchMCTargetDesc.h

LoongArchMachineFunctionInfo.h

LoongArchRegisterInfo.h

LoongArchSubtarget.h

LoongArch.h

F
#define F(x, y, z)
Definition: MD5.cpp:55

I
#define I(x, y, z)
Definition: MD5.cpp:58

TRI
unsigned const TargetRegisterInfo * TRI
Definition: MachineSink.cpp:2029

MathExtras.h

Y
static GCMetadataPrinterRegistry::Add< OcamlGCMetadataPrinter > Y("ocaml", "ocaml 3.10-compatible collector")

getCodeModel
static CodeModel::Model getCodeModel(const PPCSubtarget &S, const TargetMachine &TM, const MachineOperand &MO)
Definition: PPCAsmPrinter.cpp:479

CC
auto CC
Definition: RISCVRedundantCopyElimination.cpp:79

RuntimeLibcallUtil.h

assert
assert(ImpDefSCC.getReg()==AMDGPU::SCC &&ImpDefSCC.isDef())

SelectionDAGNodes.h

Enabled
static bool Enabled
Definition: Statistic.cpp:46

Statistic.h
This file defines the 'Statistic' class, which is designed to be an easy way to expose various metric...

STATISTIC
#define STATISTIC(VARNAME, DESC)
Definition: Statistic.h:166

StringExtras.h
This file contains some functions that are useful when dealing with strings.

Ptr
@ Ptr
Definition: TargetLibraryInfo.cpp:77

FunctionType
Definition: ItaniumDemangle.h:823

Node
Definition: ItaniumDemangle.h:163

T

llvm::APFloat
Definition: APFloat.h:904

llvm::APInt
Class for arbitrary precision integers.
Definition: APInt.h:78

llvm::APInt::isSubsetOf
bool isSubsetOf(const APInt &RHS) const
This operation checks that all bits set in this APInt are also set in RHS.
Definition: APInt.h:1257

llvm::Argument
This class represents an incoming formal argument to a Function.
Definition: Argument.h:31

llvm::ArrayRef
ArrayRef - Represent a constant reference to an array (0 or more elements consecutively in memory),...
Definition: ArrayRef.h:41

llvm::ArrayRef::size
size_t size() const
size - Get the array size.
Definition: ArrayRef.h:168

llvm::AtomicCmpXchgInst
An instruction that atomically checks whether a specified value is in a memory location,...
Definition: Instructions.h:501

llvm::AtomicCmpXchgInst::getCompareOperand
Value * getCompareOperand()
Definition: Instructions.h:633

llvm::AtomicCmpXchgInst::getFailureOrdering
AtomicOrdering getFailureOrdering() const
Returns the failure ordering constraint of this cmpxchg instruction.
Definition: Instructions.h:594

llvm::AtomicRMWInst
an instruction that atomically reads a memory location, combines it with another value,...
Definition: Instructions.h:704

llvm::AtomicRMWInst::getAlign
Align getAlign() const
Return the alignment of the memory that is being allocated by the instruction.
Definition: Instructions.h:827

llvm::AtomicRMWInst::BinOp
BinOp
This enumeration lists the possible modifications atomicrmw can make.
Definition: Instructions.h:716

llvm::AtomicRMWInst::Add
@ Add
*p = old + v
Definition: Instructions.h:720

llvm::AtomicRMWInst::USubCond
@ USubCond
Subtract only if no unsigned overflow.
Definition: Instructions.h:764

llvm::AtomicRMWInst::Min
@ Min
*p = old <signed v ? old : v
Definition: Instructions.h:734

llvm::AtomicRMWInst::Or
@ Or
*p = old | v
Definition: Instructions.h:728

llvm::AtomicRMWInst::Sub
@ Sub
*p = old - v
Definition: Instructions.h:722

llvm::AtomicRMWInst::And
@ And
*p = old & v
Definition: Instructions.h:724

llvm::AtomicRMWInst::Xor
@ Xor
*p = old ^ v
Definition: Instructions.h:730

llvm::AtomicRMWInst::USubSat
@ USubSat
*p = usub.sat(old, v) usub.sat matches the behavior of llvm.usub.sat.
Definition: Instructions.h:768

llvm::AtomicRMWInst::UIncWrap
@ UIncWrap
Increment one up to a maximum value.
Definition: Instructions.h:756

llvm::AtomicRMWInst::Max
@ Max
*p = old >signed v ? old : v
Definition: Instructions.h:732

llvm::AtomicRMWInst::UMin
@ UMin
*p = old <unsigned v ? old : v
Definition: Instructions.h:738

llvm::AtomicRMWInst::UMax
@ UMax
*p = old >unsigned v ? old : v
Definition: Instructions.h:736

llvm::AtomicRMWInst::UDecWrap
@ UDecWrap
Decrement one until a minimum value or zero.
Definition: Instructions.h:760

llvm::AtomicRMWInst::Xchg
@ Xchg
*p = v
Definition: Instructions.h:718

llvm::AtomicRMWInst::Nand
@ Nand
*p = ~(old & v)
Definition: Instructions.h:726

llvm::AtomicRMWInst::getPointerOperand
Value * getPointerOperand()
Definition: Instructions.h:870

llvm::AtomicRMWInst::isFloatingPointOperation
bool isFloatingPointOperation() const
Definition: Instructions.h:882

llvm::AtomicRMWInst::getOperation
BinOp getOperation() const
Definition: Instructions.h:805

llvm::AtomicRMWInst::getSyncScopeID
SyncScope::ID getSyncScopeID() const
Returns the synchronization scope ID of this rmw instruction.
Definition: Instructions.h:861

llvm::AtomicRMWInst::getValOperand
Value * getValOperand()
Definition: Instructions.h:874

llvm::AtomicRMWInst::getOrdering
AtomicOrdering getOrdering() const
Returns the ordering constraint of this rmw instruction.
Definition: Instructions.h:847

llvm::BasicBlock
LLVM Basic Block Representation.
Definition: BasicBlock.h:61

llvm::BitVector
Definition: BitVector.h:82

llvm::BitVector::test
bool test(unsigned Idx) const
Definition: BitVector.h:461

llvm::BlockAddressSDNode
Definition: SelectionDAGNodes.h:2314

llvm::BuildVectorSDNode
A "pseudo-class" with methods for operating on BUILD_VECTORs.
Definition: SelectionDAGNodes.h:2107

llvm::CCState
CCState - This class holds information needed while lowering arguments and return values.
Definition: CallingConvLower.h:170

llvm::CCState::getFirstUnallocated
unsigned getFirstUnallocated(ArrayRef< MCPhysReg > Regs) const
getFirstUnallocated - Return the index of the first unallocated register in the set,...
Definition: CallingConvLower.h:315

llvm::CCState::getPendingArgFlags
SmallVectorImpl< ISD::ArgFlagsTy > & getPendingArgFlags()
Definition: CallingConvLower.h:488

llvm::CCState::AllocateReg
MCRegister AllocateReg(MCPhysReg Reg)
AllocateReg - Attempt to allocate one register.
Definition: CallingConvLower.h:330

llvm::CCState::AllocateStack
int64_t AllocateStack(unsigned Size, Align Alignment)
AllocateStack - Allocate a chunk of stack space with the specified size and alignment.
Definition: CallingConvLower.h:405

llvm::CCState::AnalyzeCallOperands
void AnalyzeCallOperands(const SmallVectorImpl< ISD::OutputArg > &Outs, CCAssignFn Fn)
AnalyzeCallOperands - Analyze the outgoing arguments to a call, incorporating info about the passed v...
Definition: CallingConvLower.cpp:126

llvm::CCState::getStackSize
uint64_t getStackSize() const
Returns the size of the currently allocated portion of the stack.
Definition: CallingConvLower.h:245

llvm::CCState::getPendingLocs
SmallVectorImpl< CCValAssign > & getPendingLocs()
Definition: CallingConvLower.h:483

llvm::CCState::AnalyzeFormalArguments
void AnalyzeFormalArguments(const SmallVectorImpl< ISD::InputArg > &Ins, CCAssignFn Fn)
AnalyzeFormalArguments - Analyze an array of argument values, incorporating info about the formals in...
Definition: CallingConvLower.cpp:85

llvm::CCState::addLoc
void addLoc(const CCValAssign &V)
Definition: CallingConvLower.h:235

llvm::CCValAssign
CCValAssign - Represent assignment of one arg/retval to a location.
Definition: CallingConvLower.h:33

llvm::CCValAssign::isRegLoc
bool isRegLoc() const
Definition: CallingConvLower.h:122

llvm::CCValAssign::getPending
static CCValAssign getPending(unsigned ValNo, MVT ValVT, MVT LocVT, LocInfo HTP, unsigned ExtraInfo=0)
Definition: CallingConvLower.h:108

llvm::CCValAssign::getLocReg
Register getLocReg() const
Definition: CallingConvLower.h:128

llvm::CCValAssign::getLocInfo
LocInfo getLocInfo() const
Definition: CallingConvLower.h:134

llvm::CCValAssign::getReg
static CCValAssign getReg(unsigned ValNo, MVT ValVT, MCRegister Reg, MVT LocVT, LocInfo HTP, bool IsCustom=false)
Definition: CallingConvLower.h:84

llvm::CCValAssign::LocInfo
LocInfo
Definition: CallingConvLower.h:35

llvm::CCValAssign::BCvt
@ BCvt
Definition: CallingConvLower.h:46

llvm::CCValAssign::Full
@ Full
Definition: CallingConvLower.h:36

llvm::CCValAssign::Indirect
@ Indirect
Definition: CallingConvLower.h:52

llvm::CCValAssign::getMem
static CCValAssign getMem(unsigned ValNo, MVT ValVT, int64_t Offset, MVT LocVT, LocInfo HTP, bool IsCustom=false)
Definition: CallingConvLower.h:96

llvm::CCValAssign::getValVT
MVT getValVT() const
Definition: CallingConvLower.h:120

llvm::CCValAssign::isMemLoc
bool isMemLoc() const
Definition: CallingConvLower.h:123

llvm::CCValAssign::getLocMemOffset
int64_t getLocMemOffset() const
Definition: CallingConvLower.h:129

llvm::CCValAssign::getValNo
unsigned getValNo() const
Definition: CallingConvLower.h:119

llvm::CCValAssign::getLocVT
MVT getLocVT() const
Definition: CallingConvLower.h:132

llvm::CallBase::isMustTailCall
bool isMustTailCall() const
Tests if this call site must be tail call optimized.
Definition: Instructions.cpp:343

llvm::CallInst
This class represents a function call, abstracting a target machine's calling convention.
Definition: Instructions.h:1479

llvm::CallInst::isTailCall
bool isTailCall() const
Definition: Instructions.h:1589

llvm::ConstantInt
This is the shared class of boolean and integer constants.
Definition: Constants.h:83

llvm::ConstantInt::isMinusOne
bool isMinusOne() const
This function will return true iff every bit in this constant is set to true.
Definition: Constants.h:220

llvm::ConstantInt::isZero
bool isZero() const
This is just a convenience method to make client code smaller for a common code.
Definition: Constants.h:208

llvm::ConstantPoolSDNode
Definition: SelectionDAGNodes.h:2002

llvm::ConstantSDNode
Definition: SelectionDAGNodes.h:1684

llvm::ConstantSDNode::getZExtValue
uint64_t getZExtValue() const
Definition: SelectionDAGNodes.h:1701

llvm::ConstantSDNode::getSExtValue
int64_t getSExtValue() const
Definition: SelectionDAGNodes.h:1702

llvm::Constant
This is an important base class in LLVM.
Definition: Constant.h:42

llvm::DWARFExpression::Operation
This class represents an Operation in the Expression.
Definition: DWARFExpression.h:32

llvm::DWARFExpression::Operation::getNumOperands
uint64_t getNumOperands() const
Definition: DWARFExpression.h:90

llvm::DataLayout
A parsed version of the target data layout string in and methods for querying it.
Definition: DataLayout.h:63

llvm::DataLayout::getPointerSizeInBits
unsigned getPointerSizeInBits(unsigned AS=0) const
Layout pointer size, in bits FIXME: The defaults need to be removed once all of the backends/clients ...
Definition: DataLayout.h:364

llvm::DataLayout::getPrefTypeAlign
Align getPrefTypeAlign(Type *Ty) const
Returns the preferred stack/global alignment for the specified type.
Definition: DataLayout.cpp:847

llvm::DebugLoc
A debug info location.
Definition: DebugLoc.h:33

llvm::ExternalSymbolSDNode
Definition: SelectionDAGNodes.h:2356

llvm::Function
Definition: Function.h:63

llvm::Function::getFunctionType
FunctionType * getFunctionType() const
Returns the FunctionType for me.
Definition: Function.h:216

llvm::Function::getCallingConv
CallingConv::ID getCallingConv() const
getCallingConv()/setCallingConv(CC) - These method get and set the calling convention of this functio...
Definition: Function.h:277

llvm::Function::getArg
Argument * getArg(unsigned i) const
Definition: Function.h:886

llvm::GlobalAddressSDNode
Definition: SelectionDAGNodes.h:1876

llvm::GlobalValue
Definition: GlobalValue.h:48

llvm::GlobalValue::isDSOLocal
bool isDSOLocal() const
Definition: GlobalValue.h:306

llvm::IRBuilderBase
Common base class shared among various IRBuilders.
Definition: IRBuilder.h:113

llvm::IRBuilderBase::CreateSExt
Value * CreateSExt(Value *V, Type *DestTy, const Twine &Name="")
Definition: IRBuilder.h:2045

llvm::IRBuilderBase::CreateLShr
Value * CreateLShr(Value *LHS, Value *RHS, const Twine &Name="", bool isExact=false)
Definition: IRBuilder.h:1480

llvm::IRBuilderBase::getInt32Ty
IntegerType * getInt32Ty()
Fetch the type representing a 32-bit integer.
Definition: IRBuilder.h:545

llvm::IRBuilderBase::getInt64Ty
IntegerType * getInt64Ty()
Fetch the type representing a 64-bit integer.
Definition: IRBuilder.h:550

llvm::IRBuilderBase::CreateIntrinsic
CallInst * CreateIntrinsic(Intrinsic::ID ID, ArrayRef< Type * > Types, ArrayRef< Value * > Args, FMFSource FMFSource={}, const Twine &Name="")
Create a call to intrinsic ID with Args, mangled using Types.
Definition: IRBuilder.cpp:900

llvm::IRBuilderBase::CreateNot
Value * CreateNot(Value *V, const Twine &Name="")
Definition: IRBuilder.h:1757

llvm::IRBuilderBase::CreateSub
Value * CreateSub(Value *LHS, Value *RHS, const Twine &Name="", bool HasNUW=false, bool HasNSW=false)
Definition: IRBuilder.h:1387

llvm::IRBuilderBase::CreateBitCast
Value * CreateBitCast(Value *V, Type *DestTy, const Twine &Name="")
Definition: IRBuilder.h:2152

llvm::IRBuilderBase::getIntN
ConstantInt * getIntN(unsigned N, uint64_t C)
Get a constant N-bit value, zero extended or truncated from a 64-bit value.
Definition: IRBuilder.h:516

llvm::IRBuilderBase::CreateShl
Value * CreateShl(Value *LHS, Value *RHS, const Twine &Name="", bool HasNUW=false, bool HasNSW=false)
Definition: IRBuilder.h:1459

llvm::IRBuilderBase::CreateZExt
Value * CreateZExt(Value *V, Type *DestTy, const Twine &Name="", bool IsNonNeg=false)
Definition: IRBuilder.h:2033

llvm::IRBuilderBase::getContext
LLVMContext & getContext() const
Definition: IRBuilder.h:195

llvm::IRBuilderBase::CreateAnd
Value * CreateAnd(Value *LHS, Value *RHS, const Twine &Name="")
Definition: IRBuilder.h:1518

llvm::IRBuilderBase::CreatePtrToInt
Value * CreatePtrToInt(Value *V, Type *DestTy, const Twine &Name="")
Definition: IRBuilder.h:2142

llvm::IRBuilderBase::CreateCall
CallInst * CreateCall(FunctionType *FTy, Value *Callee, ArrayRef< Value * > Args={}, const Twine &Name="", MDNode *FPMathTag=nullptr)
Definition: IRBuilder.h:2449

llvm::IRBuilderBase::CreateAtomicRMW
AtomicRMWInst * CreateAtomicRMW(AtomicRMWInst::BinOp Op, Value *Ptr, Value *Val, MaybeAlign Align, AtomicOrdering Ordering, SyncScope::ID SSID=SyncScope::System)
Definition: IRBuilder.h:1862

llvm::IRBuilderBase::CreateTrunc
Value * CreateTrunc(Value *V, Type *DestTy, const Twine &Name="", bool IsNUW=false, bool IsNSW=false)
Definition: IRBuilder.h:2019

llvm::IRBuilderBase::CreateOr
Value * CreateOr(Value *LHS, Value *RHS, const Twine &Name="")
Definition: IRBuilder.h:1540

llvm::IRBuilder
This provides a uniform API for creating instructions and inserting them into a basic block: either a...
Definition: IRBuilder.h:2705

llvm::InlineAsm::ConstraintCode
ConstraintCode
Definition: InlineAsm.h:239

llvm::InlineAsm::ConstraintCode::k
@ k

llvm::InlineAsm::ConstraintCode::ZB
@ ZB

llvm::InlineAsm::ConstraintCode::ZC
@ ZC

llvm::Instruction
Definition: Instruction.h:68

llvm::Instruction::getModule
const Module * getModule() const
Return the module owning the function this instruction belongs to or nullptr it the function does not...
Definition: Instruction.cpp:68

llvm::Instruction::eraseFromParent
InstListType::iterator eraseFromParent()
This method unlinks 'this' from the containing basic block and deletes it.
Definition: Instruction.cpp:94

llvm::Instruction::getDataLayout
const DataLayout & getDataLayout() const
Get the data layout of the module this instruction belongs to.
Definition: Instruction.cpp:76

llvm::IntegerType
Class to represent integer types.
Definition: DerivedTypes.h:42

llvm::JumpTableSDNode
Definition: SelectionDAGNodes.h:1981

llvm::LLT
Definition: LowLevelType.h:39

llvm::LLVMContext
This is an important class for using LLVM in a threaded context.
Definition: LLVMContext.h:67

llvm::LLVMContext::emitError
void emitError(const Instruction *I, const Twine &ErrorStr)
emitError - Emit an error message to the currently installed error handler with optional location inf...
Definition: LLVMContext.cpp:210

llvm::LoadSDNode
This class is used to represent ISD::LOAD nodes.
Definition: SelectionDAGNodes.h:2464

llvm::LoadSDNode::getExtensionType
ISD::LoadExtType getExtensionType() const
Return whether this is a plain node, or one of the varieties of value-extending loads.
Definition: SelectionDAGNodes.h:2479

llvm::LoongArchMachineFunctionInfo
LoongArchMachineFunctionInfo - This class is derived from MachineFunctionInfo and contains private Lo...
Definition: LoongArchMachineFunctionInfo.h:25

llvm::LoongArchMachineFunctionInfo::addSExt32Register
void addSExt32Register(Register Reg)
Definition: LoongArchMachineFunctionInfo.h:73

llvm::LoongArchSubtarget
Definition: LoongArchSubtarget.h:32

llvm::LoongArchSubtarget::getRegisterInfo
const LoongArchRegisterInfo * getRegisterInfo() const override
Definition: LoongArchSubtarget.h:80

llvm::LoongArchSubtarget::getGRLenVT
MVT getGRLenVT() const
Definition: LoongArchSubtarget.h:95

llvm::LoongArchSubtarget::is64Bit
bool is64Bit() const
Definition: LoongArchSubtarget.h:94

llvm::LoongArchSubtarget::isSoftFPABI
bool isSoftFPABI() const
Definition: LoongArchSubtarget.h:98

llvm::LoongArchSubtarget::getInstrInfo
const LoongArchInstrInfo * getInstrInfo() const override
Definition: LoongArchSubtarget.h:79

llvm::LoongArchSubtarget::getMaxBytesForAlignment
unsigned getMaxBytesForAlignment() const
Definition: LoongArchSubtarget.h:105

llvm::LoongArchSubtarget::getPrefFunctionAlignment
Align getPrefFunctionAlignment() const
Definition: LoongArchSubtarget.h:103

llvm::LoongArchSubtarget::getGRLen
unsigned getGRLen() const
Definition: LoongArchSubtarget.h:96

llvm::LoongArchSubtarget::getPrefLoopAlignment
Align getPrefLoopAlignment() const
Definition: LoongArchSubtarget.h:104

llvm::LoongArchTargetLowering
Definition: LoongArchISelLowering.h:156

llvm::LoongArchTargetLowering::isUsedByReturnOnly
bool isUsedByReturnOnly(SDNode *N, SDValue &Chain) const override
Return true if result of the specified node is used by a return node only.
Definition: LoongArchISelLowering.cpp:5410

llvm::LoongArchTargetLowering::PerformDAGCombine
SDValue PerformDAGCombine(SDNode *N, DAGCombinerInfo &DCI) const override
This method will be invoked for all target nodes and for any target-independent nodes that the target...
Definition: LoongArchISelLowering.cpp:4396

llvm::LoongArchTargetLowering::getSqrtEstimate
SDValue getSqrtEstimate(SDValue Operand, SelectionDAG &DAG, int Enabled, int &RefinementSteps, bool &UseOneConstNR, bool Reciprocal) const override
Hooks for building estimates in place of slower divisions and square roots.
Definition: LoongArchISelLowering.cpp:6162

llvm::LoongArchTargetLowering::isLegalICmpImmediate
bool isLegalICmpImmediate(int64_t Imm) const override
Return true if the specified immediate is legal icmp immediate, that is the target has icmp instructi...
Definition: LoongArchISelLowering.cpp:6492

llvm::LoongArchTargetLowering::shouldExpandAtomicCmpXchgInIR
TargetLowering::AtomicExpansionKind shouldExpandAtomicCmpXchgInIR(AtomicCmpXchgInst *CI) const override
Returns how the given atomic cmpxchg should be expanded by the IR-level AtomicExpand pass.
Definition: LoongArchISelLowering.cpp:6032

llvm::LoongArchTargetLowering::emitMaskedAtomicCmpXchgIntrinsic
Value * emitMaskedAtomicCmpXchgIntrinsic(IRBuilderBase &Builder, AtomicCmpXchgInst *CI, Value *AlignedAddr, Value *CmpVal, Value *NewVal, Value *Mask, AtomicOrdering Ord) const override
Perform a masked cmpxchg using a target-specific intrinsic.
Definition: LoongArchISelLowering.cpp:6044

llvm::LoongArchTargetLowering::getSetCCResultType
EVT getSetCCResultType(const DataLayout &DL, LLVMContext &Context, EVT VT) const override
Return the ValueType of the result of SETCC operations.
Definition: LoongArchISelLowering.cpp:5858

llvm::LoongArchTargetLowering::isFMAFasterThanFMulAndFAdd
bool isFMAFasterThanFMulAndFAdd(const MachineFunction &MF, EVT VT) const override
Return true if an FMA operation is faster than a pair of fmul and fadd instructions.
Definition: LoongArchISelLowering.cpp:6122

llvm::LoongArchTargetLowering::LowerCall
SDValue LowerCall(TargetLowering::CallLoweringInfo &CLI, SmallVectorImpl< SDValue > &InVals) const override
This hook must be implemented to lower calls into the specified DAG.
Definition: LoongArchISelLowering.cpp:5491

llvm::LoongArchTargetLowering::decomposeMulByConstant
bool decomposeMulByConstant(LLVMContext &Context, EVT VT, SDValue C) const override
Return true if it is profitable to transform an integer multiplication-by-constant into simpler opera...
Definition: LoongArchISelLowering.cpp:6401

llvm::LoongArchTargetLowering::isSExtCheaperThanZExt
bool isSExtCheaperThanZExt(EVT SrcVT, EVT DstVT) const override
Return true if sign-extension from FromTy to ToTy is cheaper than zero-extension.
Definition: LoongArchISelLowering.cpp:6515

llvm::LoongArchTargetLowering::shouldExpandAtomicRMWInIR
TargetLowering::AtomicExpansionKind shouldExpandAtomicRMWInIR(AtomicRMWInst *AI) const override
Returns how the IR-level AtomicExpand pass should expand the given AtomicRMW, if at all.
Definition: LoongArchISelLowering.cpp:5951

llvm::LoongArchTargetLowering::allowsMisalignedMemoryAccesses
bool allowsMisalignedMemoryAccesses(EVT VT, unsigned AddrSpace=0, Align Alignment=Align(1), MachineMemOperand::Flags Flags=MachineMemOperand::MONone, unsigned *Fast=nullptr) const override
Determine if the target supports unaligned memory accesses.
Definition: LoongArchISelLowering.cpp:4772

llvm::LoongArchTargetLowering::isCheapToSpeculateCtlz
bool isCheapToSpeculateCtlz(Type *Ty) const override
Return true if it is cheap to speculate a call to intrinsic ctlz.
Definition: LoongArchISelLowering.cpp:5835

llvm::LoongArchTargetLowering::LowerOperation
SDValue LowerOperation(SDValue Op, SelectionDAG &DAG) const override
This callback is invoked for operations that are unsupported by the target, which are registered to u...
Definition: LoongArchISelLowering.cpp:405

llvm::LoongArchTargetLowering::shouldAlignPointerArgs
bool shouldAlignPointerArgs(CallInst *CI, unsigned &MinSize, Align &PrefAlign) const override
Return true if the pointer arguments to CI should be aligned by aligning the object whose address is ...
Definition: LoongArchISelLowering.cpp:6557

llvm::LoongArchTargetLowering::emitMaskedAtomicRMWIntrinsic
Value * emitMaskedAtomicRMWIntrinsic(IRBuilderBase &Builder, AtomicRMWInst *AI, Value *AlignedAddr, Value *Incr, Value *Mask, Value *ShiftAmt, AtomicOrdering Ord) const override
Perform a masked atomicrmw using a target-specific intrinsic.
Definition: LoongArchISelLowering.cpp:6063

llvm::LoongArchTargetLowering::isZExtFree
bool isZExtFree(SDValue Val, EVT VT2) const override
Return true if zero-extending the specific node Val to type VT2 is free (either because it's implicit...
Definition: LoongArchISelLowering.cpp:6500

llvm::LoongArchTargetLowering::getExceptionPointerRegister
Register getExceptionPointerRegister(const Constant *PersonalityFn) const override
If a physical register, this returns the register that receives the exception address on entry to an ...
Definition: LoongArchISelLowering.cpp:6140

llvm::LoongArchTargetLowering::signExtendConstant
bool signExtendConstant(const ConstantInt *CI) const override
Return true if this constant should be sign extended when promoting to a larger type.
Definition: LoongArchISelLowering.cpp:6520

llvm::LoongArchTargetLowering::getTargetNodeName
const char * getTargetNodeName(unsigned Opcode) const override
This method returns the name of a target specific DAG node.
Definition: LoongArchISelLowering.cpp:4784

llvm::LoongArchTargetLowering::getTgtMemIntrinsic
bool getTgtMemIntrinsic(IntrinsicInfo &Info, const CallInst &I, MachineFunction &MF, unsigned Intrinsic) const override
Given an intrinsic, checks if on the target the intrinsic will need to map to a MemIntrinsicNode (tou...
Definition: LoongArchISelLowering.cpp:5871

llvm::LoongArchTargetLowering::isLegalAddImmediate
bool isLegalAddImmediate(int64_t Imm) const override
Return true if the specified immediate is legal add immediate, that is the target has add instruction...
Definition: LoongArchISelLowering.cpp:6496

llvm::LoongArchTargetLowering::isCheapToSpeculateCttz
bool isCheapToSpeculateCttz(Type *Ty) const override
Return true if it is cheap to speculate a call to intrinsic cttz.
Definition: LoongArchISelLowering.cpp:5831

llvm::LoongArchTargetLowering::isLegalAddressingMode
bool isLegalAddressingMode(const DataLayout &DL, const AddrMode &AM, Type *Ty, unsigned AS, Instruction *I=nullptr) const override
Return true if the addressing mode represented by AM is legal for this target, for a load/store of th...
Definition: LoongArchISelLowering.cpp:6448

llvm::LoongArchTargetLowering::shouldSignExtendTypeInLibCall
bool shouldSignExtendTypeInLibCall(Type *Ty, bool IsSigned) const override
Returns true if arguments should be sign-extended in lib calls.
Definition: LoongArchISelLowering.cpp:6537

llvm::LoongArchTargetLowering::isFPImmVLDILegal
bool isFPImmVLDILegal(const APFloat &Imm, EVT VT) const
Definition: LoongArchISelLowering.cpp:5803

llvm::LoongArchTargetLowering::shouldExtendTypeInLibCall
bool shouldExtendTypeInLibCall(EVT Type) const override
Returns true if arguments should be extended in lib calls.
Definition: LoongArchISelLowering.cpp:6545

llvm::LoongArchTargetLowering::getRegisterByName
Register getRegisterByName(const char *RegName, LLT VT, const MachineFunction &MF) const override
Return the register ID of the name passed in.
Definition: LoongArchISelLowering.cpp:6384

llvm::LoongArchTargetLowering::hasAndNot
bool hasAndNot(SDValue Y) const override
Return true if the target has a bitwise and-not operation: X = ~A & B This can be used to simplify se...
Definition: LoongArchISelLowering.cpp:5866

llvm::LoongArchTargetLowering::isOffsetFoldingLegal
bool isOffsetFoldingLegal(const GlobalAddressSDNode *GA) const override
Return true if folding a constant offset with the given GlobalAddress is legal.
Definition: LoongArchISelLowering.cpp:396

llvm::LoongArchTargetLowering::getExceptionSelectorRegister
Register getExceptionSelectorRegister(const Constant *PersonalityFn) const override
If a physical register, this returns the register that receives the exception typeid on entry to a la...
Definition: LoongArchISelLowering.cpp:6145

llvm::LoongArchTargetLowering::ReplaceNodeResults
void ReplaceNodeResults(SDNode *N, SmallVectorImpl< SDValue > &Results, SelectionDAG &DAG) const override
This callback is invoked when a node result type is illegal for the target, and the operation was reg...
Definition: LoongArchISelLowering.cpp:2951

llvm::LoongArchTargetLowering::emitExpandAtomicRMW
void emitExpandAtomicRMW(AtomicRMWInst *AI) const override
Perform a atomicrmw expansion using a target-specific way.
Definition: LoongArchISelLowering.cpp:5898

llvm::LoongArchTargetLowering::getExtendForAtomicCmpSwapArg
ISD::NodeType getExtendForAtomicCmpSwapArg() const override
Returns how the platform's atomic compare and swap expects its comparison value to be extended (ZERO_...
Definition: LoongArchISelLowering.cpp:6532

llvm::LoongArchTargetLowering::LoongArchTargetLowering
LoongArchTargetLowering(const TargetMachine &TM, const LoongArchSubtarget &STI)
Definition: LoongArchISelLowering.cpp:45

llvm::LoongArchTargetLowering::LowerReturn
SDValue LowerReturn(SDValue Chain, CallingConv::ID CallConv, bool IsVarArg, const SmallVectorImpl< ISD::OutputArg > &Outs, const SmallVectorImpl< SDValue > &OutVals, const SDLoc &DL, SelectionDAG &DAG) const override
This hook must be implemented to lower outgoing return values, described by the Outs array,...
Definition: LoongArchISelLowering.cpp:5761

llvm::LoongArchTargetLowering::hasAndNotCompare
bool hasAndNotCompare(SDValue Y) const override
Return true if the target should transform: (X & Y) == Y —> (~X & Y) == 0 (X & Y) !...
Definition: LoongArchISelLowering.cpp:6524

llvm::LoongArchTargetLowering::getRecipEstimate
SDValue getRecipEstimate(SDValue Operand, SelectionDAG &DAG, int Enabled, int &RefinementSteps) const override
Return a reciprocal estimate value for the input operand.
Definition: LoongArchISelLowering.cpp:6191

llvm::LoongArchTargetLowering::CanLowerReturn
bool CanLowerReturn(CallingConv::ID CallConv, MachineFunction &MF, bool IsVarArg, const SmallVectorImpl< ISD::OutputArg > &Outs, LLVMContext &Context, const Type *RetTy) const override
This hook should be implemented to check whether the return values described by the Outs array can fi...
Definition: LoongArchISelLowering.cpp:5743

llvm::LoongArchTargetLowering::LowerFormalArguments
SDValue LowerFormalArguments(SDValue Chain, CallingConv::ID CallConv, bool IsVarArg, const SmallVectorImpl< ISD::InputArg > &Ins, const SDLoc &DL, SelectionDAG &DAG, SmallVectorImpl< SDValue > &InVals) const override
This hook must be implemented to lower the incoming (formal) arguments, described by the Ins array,...
Definition: LoongArchISelLowering.cpp:5274

llvm::LoongArchTargetLowering::mayBeEmittedAsTailCall
bool mayBeEmittedAsTailCall(const CallInst *CI) const override
Return true if the target may be able emit the call instruction as a tail call.
Definition: LoongArchISelLowering.cpp:5404

llvm::MCRegister
Wrapper class representing physical registers. Should be passed by value.
Definition: MCRegister.h:33

llvm::MCSubtargetInfo::hasFeature
bool hasFeature(unsigned Feature) const
Definition: MCSubtargetInfo.h:121

llvm::MVT
Machine Value Type.
Definition: MachineValueType.h:35

llvm::MVT::is128BitVector
bool is128BitVector() const
Return true if this is a 128-bit vector type.
Definition: MachineValueType.h:156

llvm::MVT::SimpleValueType
SimpleValueType
Definition: MachineValueType.h:37

llvm::MVT::SimpleTy
SimpleValueType SimpleTy
Definition: MachineValueType.h:55

llvm::MVT::getVectorNumElements
unsigned getVectorNumElements() const
Definition: MachineValueType.h:294

llvm::MVT::isVector
bool isVector() const
Return true if this is a vector value type.
Definition: MachineValueType.h:106

llvm::MVT::fixedlen_vector_valuetypes
static auto fixedlen_vector_valuetypes()
Definition: MachineValueType.h:542

llvm::MVT::is256BitVector
bool is256BitVector() const
Return true if this is a 256-bit vector type.
Definition: MachineValueType.h:161

llvm::MVT::isScalarInteger
bool isScalarInteger() const
Return true if this is an integer, not including vectors.
Definition: MachineValueType.h:100

llvm::MVT::isFloatingPoint
bool isFloatingPoint() const
Return true if this is a FP or a vector FP type.
Definition: MachineValueType.h:80

llvm::MVT::getIntegerVT
static MVT getIntegerVT(unsigned BitWidth)
Definition: MachineValueType.h:441

llvm::MVT::changeVectorElementTypeToInteger
MVT changeVectorElementTypeToInteger() const
Return a vector with the same number of elements as this vector, but with the element type converted ...
Definition: MachineValueType.h:196

llvm::MachineBasicBlock
Definition: MachineBasicBlock.h:125

llvm::MachineBasicBlock::transferSuccessorsAndUpdatePHIs
void transferSuccessorsAndUpdatePHIs(MachineBasicBlock *FromMBB)
Transfers all the successors, as in transferSuccessors, and update PHI operands in the successor bloc...
Definition: MachineBasicBlock.cpp:937

llvm::MachineBasicBlock::getBasicBlock
const BasicBlock * getBasicBlock() const
Return the LLVM basic block that this instance corresponded to originally.
Definition: MachineBasicBlock.h:256

llvm::MachineBasicBlock::addSuccessor
void addSuccessor(MachineBasicBlock *Succ, BranchProbability Prob=BranchProbability::getUnknown())
Add Succ as a successor of this MachineBasicBlock.
Definition: MachineBasicBlock.cpp:798

llvm::MachineBasicBlock::begin
iterator begin()
Definition: MachineBasicBlock.h:355

llvm::MachineBasicBlock::end
iterator end()
Definition: MachineBasicBlock.h:357

llvm::MachineBasicBlock::getParent
const MachineFunction * getParent() const
Return the MachineFunction containing this basic block.
Definition: MachineBasicBlock.h:311

llvm::MachineBasicBlock::splice
void splice(iterator Where, MachineBasicBlock *Other, iterator From)
Take an instruction from MBB 'Other' at the position From, and insert it into this MBB right before '...
Definition: MachineBasicBlock.h:1109

llvm::MachineFrameInfo
The MachineFrameInfo class represents an abstract stack frame until prolog/epilog code is inserted.
Definition: MachineFrameInfo.h:106

llvm::MachineFrameInfo::CreateFixedObject
int CreateFixedObject(uint64_t Size, int64_t SPOffset, bool IsImmutable, bool isAliased=false)
Create a new object at a fixed location on the stack.
Definition: MachineFrameInfo.cpp:83

llvm::MachineFrameInfo::CreateStackObject
int CreateStackObject(uint64_t Size, Align Alignment, bool isSpillSlot, const AllocaInst *Alloca=nullptr, uint8_t ID=0)
Create a new statically sized stack object, returning a nonnegative identifier to represent it.
Definition: MachineFrameInfo.cpp:51

llvm::MachineFrameInfo::setFrameAddressIsTaken
void setFrameAddressIsTaken(bool T)
Definition: MachineFrameInfo.h:374

llvm::MachineFrameInfo::setHasTailCall
void setHasTailCall(bool V=true)
Definition: MachineFrameInfo.h:647

llvm::MachineFrameInfo::setReturnAddressIsTaken
void setReturnAddressIsTaken(bool s)
Definition: MachineFrameInfo.h:380

llvm::MachineFunction
Definition: MachineFunction.h:267

llvm::MachineFunction::getSubtarget
const TargetSubtargetInfo & getSubtarget() const
getSubtarget - Return the subtarget for which this machine code is being compiled.
Definition: MachineFunction.h:733

llvm::MachineFunction::getMachineMemOperand
MachineMemOperand * getMachineMemOperand(MachinePointerInfo PtrInfo, MachineMemOperand::Flags f, LLT MemTy, Align base_alignment, const AAMDNodes &AAInfo=AAMDNodes(), const MDNode *Ranges=nullptr, SyncScope::ID SSID=SyncScope::System, AtomicOrdering Ordering=AtomicOrdering::NotAtomic, AtomicOrdering FailureOrdering=AtomicOrdering::NotAtomic)
getMachineMemOperand - Allocate a new MachineMemOperand.
Definition: MachineFunction.cpp:536

llvm::MachineFunction::getFrameInfo
MachineFrameInfo & getFrameInfo()
getFrameInfo - Return the frame info object for the current function.
Definition: MachineFunction.h:749

llvm::MachineFunction::getRegInfo
MachineRegisterInfo & getRegInfo()
getRegInfo - Return information about the registers currently in use.
Definition: MachineFunction.h:743

llvm::MachineFunction::getDataLayout
const DataLayout & getDataLayout() const
Return the DataLayout attached to the Module associated to this MF.
Definition: MachineFunction.cpp:309

llvm::MachineFunction::getFunction
Function & getFunction()
Return the LLVM function that this machine code represents.
Definition: MachineFunction.h:704

llvm::MachineFunction::getInfo
Ty * getInfo()
getInfo - Keep track of various per-function pieces of information for backends that would like to do...
Definition: MachineFunction.h:831

llvm::MachineFunction::addLiveIn
Register addLiveIn(MCRegister PReg, const TargetRegisterClass *RC)
addLiveIn - Add the specified physical register as a live-in value and create a corresponding virtual...
Definition: MachineFunction.cpp:762

llvm::MachineFunction::CreateMachineBasicBlock
MachineBasicBlock * CreateMachineBasicBlock(const BasicBlock *BB=nullptr, std::optional< UniqueBBID > BBID=std::nullopt)
CreateMachineBasicBlock - Allocate a new MachineBasicBlock.
Definition: MachineFunction.cpp:499

llvm::MachineFunction::insert
void insert(iterator MBBI, MachineBasicBlock *MBB)
Definition: MachineFunction.h:966

llvm::MachineInstrBuilder::addImm
const MachineInstrBuilder & addImm(int64_t Val) const
Add a new immediate operand.
Definition: MachineInstrBuilder.h:133

llvm::MachineInstrBuilder::addReg
const MachineInstrBuilder & addReg(Register RegNo, unsigned flags=0, unsigned SubReg=0) const
Add a new virtual register operand.
Definition: MachineInstrBuilder.h:99

llvm::MachineInstrBuilder::addMBB
const MachineInstrBuilder & addMBB(MachineBasicBlock *MBB, unsigned TargetFlags=0) const
Definition: MachineInstrBuilder.h:148

llvm::MachineInstr
Representation of each machine instruction.
Definition: MachineInstr.h:71

llvm::MachineInstr::getOperand
const MachineOperand & getOperand(unsigned i) const
Definition: MachineInstr.h:587

llvm::MachineMemOperand
A description of a memory reference used in the backend.
Definition: MachineMemOperand.h:129

llvm::MachineMemOperand::Flags
Flags
Flags values. These may be or'd together.
Definition: MachineMemOperand.h:132

llvm::MachineMemOperand::MOVolatile
@ MOVolatile
The memory access is volatile.
Definition: MachineMemOperand.h:140

llvm::MachineMemOperand::MODereferenceable
@ MODereferenceable
The memory access is dereferenceable (i.e., doesn't trap).
Definition: MachineMemOperand.h:144

llvm::MachineMemOperand::MOLoad
@ MOLoad
The memory access reads data.
Definition: MachineMemOperand.h:136

llvm::MachineMemOperand::MOInvariant
@ MOInvariant
The memory access always returns the same value (or traps).
Definition: MachineMemOperand.h:146

llvm::MachineMemOperand::MOStore
@ MOStore
The memory access writes data.
Definition: MachineMemOperand.h:138

llvm::MachineOperand
MachineOperand class - Representation of each machine instruction operand.
Definition: MachineOperand.h:48

llvm::MachineOperand::isKill
bool isKill() const
Definition: MachineOperand.h:399

llvm::MachineOperand::setIsKill
void setIsKill(bool Val=true)
Definition: MachineOperand.h:519

llvm::MachineOperand::setIsUndef
void setIsUndef(bool Val=true)
Definition: MachineOperand.h:530

llvm::MachineOperand::getReg
Register getReg() const
getReg - Returns the register number.
Definition: MachineOperand.h:369

llvm::MachineOperand::CreateReg
static MachineOperand CreateReg(Register Reg, bool isDef, bool isImp=false, bool isKill=false, bool isDead=false, bool isUndef=false, bool isEarlyClobber=false, unsigned SubReg=0, bool isDebug=false, bool isInternalRead=false, bool isRenamable=false)
Definition: MachineOperand.h:838

llvm::MachineRegisterInfo
MachineRegisterInfo - Keep track of information for virtual and physical registers,...
Definition: MachineRegisterInfo.h:51

llvm::MachineRegisterInfo::createVirtualRegister
Register createVirtualRegister(const TargetRegisterClass *RegClass, StringRef Name="")
createVirtualRegister - Create and return a new virtual register in the function with the specified r...
Definition: MachineRegisterInfo.cpp:156

llvm::MachineRegisterInfo::addLiveIn
void addLiveIn(MCRegister Reg, Register vreg=Register())
addLiveIn - Add the specified register as a live-in.
Definition: MachineRegisterInfo.h:1006

llvm::MemSDNode::getMemoryVT
EVT getMemoryVT() const
Return the type of the in-memory value.
Definition: SelectionDAGNodes.h:1432

llvm::MutableArrayRef
MutableArrayRef - Represent a mutable reference to an array (0 or more elements consecutively in memo...
Definition: ArrayRef.h:310

llvm::PointerType
Class to represent pointers.
Definition: DerivedTypes.h:670

llvm::PointerType::getAddressSpace
unsigned getAddressSpace() const
Return the address space of the Pointer type.
Definition: DerivedTypes.h:703

llvm::PointerUnion< const Value *, const PseudoSourceValue * >

llvm::Register
Wrapper class representing virtual and physical registers.
Definition: Register.h:19

llvm::SDLoc
Wrapper class for IR location info (IR ordering and DebugLoc) to be passed into SDNode creation funct...
Definition: SelectionDAGNodes.h:1182

llvm::SDNode
Represents one node in the SelectionDAG.
Definition: SelectionDAGNodes.h:496

llvm::SDNode::getOpcode
unsigned getOpcode() const
Return the SelectionDAG opcode value for this node.
Definition: SelectionDAGNodes.h:687

llvm::SDNode::use_size
size_t use_size() const
Return the number of uses of this node.
Definition: SelectionDAGNodes.h:743

llvm::SDNode::getAsZExtVal
uint64_t getAsZExtVal() const
Helper method returns the zero-extended integer value of a ConstantSDNode.
Definition: SelectionDAGNodes.h:1727

llvm::SDNode::getOperand
const SDValue & getOperand(unsigned Num) const
Definition: SelectionDAGNodes.h:992

llvm::SDNode::getValueType
EVT getValueType(unsigned ResNo) const
Return the type of a specified result.
Definition: SelectionDAGNodes.h:1062

llvm::SDValue
Unlike LLVM values, Selection DAG nodes may return multiple values as the result of a computation.
Definition: SelectionDAGNodes.h:145

llvm::SDValue::isUndef
bool isUndef() const
Definition: SelectionDAGNodes.h:1249

llvm::SDValue::getNode
SDNode * getNode() const
get the SDNode which holds the desired result
Definition: SelectionDAGNodes.h:159

llvm::SDValue::getValue
SDValue getValue(unsigned R) const
Definition: SelectionDAGNodes.h:179

llvm::SDValue::getValueType
EVT getValueType() const
Return the ValueType of the referenced return value.
Definition: SelectionDAGNodes.h:1217

llvm::SDValue::getOperand
const SDValue & getOperand(unsigned i) const
Definition: SelectionDAGNodes.h:1225

llvm::SDValue::getScalarValueSizeInBits
uint64_t getScalarValueSizeInBits() const
Definition: SelectionDAGNodes.h:203

llvm::SDValue::getConstantOperandVal
uint64_t getConstantOperandVal(unsigned i) const
Definition: SelectionDAGNodes.h:1229

llvm::SDValue::getSimpleValueType
MVT getSimpleValueType() const
Return the simple ValueType of the referenced return value.
Definition: SelectionDAGNodes.h:190

llvm::SDValue::getOpcode
unsigned getOpcode() const
Definition: SelectionDAGNodes.h:1213

llvm::SelectionDAG
This is used to represent a portion of an LLVM function in a low-level Data Dependence DAG representa...
Definition: SelectionDAG.h:228

llvm::SelectionDAG::getExtLoad
SDValue getExtLoad(ISD::LoadExtType ExtType, const SDLoc &dl, EVT VT, SDValue Chain, SDValue Ptr, MachinePointerInfo PtrInfo, EVT MemVT, MaybeAlign Alignment=MaybeAlign(), MachineMemOperand::Flags MMOFlags=MachineMemOperand::MONone, const AAMDNodes &AAInfo=AAMDNodes())
Definition: SelectionDAG.cpp:9287

llvm::SelectionDAG::getTargetGlobalAddress
SDValue getTargetGlobalAddress(const GlobalValue *GV, const SDLoc &DL, EVT VT, int64_t offset=0, unsigned TargetFlags=0)
Definition: SelectionDAG.h:751

llvm::SelectionDAG::getCopyToReg
SDValue getCopyToReg(SDValue Chain, const SDLoc &dl, Register Reg, SDValue N)
Definition: SelectionDAG.h:802

llvm::SelectionDAG::getMergeValues
SDValue getMergeValues(ArrayRef< SDValue > Ops, const SDLoc &dl)
Create a MERGE_VALUES node from the given operands.
Definition: SelectionDAG.cpp:9034

llvm::SelectionDAG::getVTList
SDVTList getVTList(EVT VT)
Return an SDVTList that represents the list of values specified.
Definition: SelectionDAG.cpp:10708

llvm::SelectionDAG::getMachineNode
MachineSDNode * getMachineNode(unsigned Opcode, const SDLoc &dl, EVT VT)
These are used for target selectors to create a new node with specified return type(s),...
Definition: SelectionDAG.cpp:11149

llvm::SelectionDAG::getSetCC
SDValue getSetCC(const SDLoc &DL, EVT VT, SDValue LHS, SDValue RHS, ISD::CondCode Cond, SDValue Chain=SDValue(), bool IsSignaling=false)
Helper function to make it easier to build SetCC's if you just have an ISD::CondCode instead of an SD...
Definition: SelectionDAG.h:1251

llvm::SelectionDAG::getRegister
SDValue getRegister(Register Reg, EVT VT)
Definition: SelectionDAG.cpp:2328

llvm::SelectionDAG::getLoad
SDValue getLoad(EVT VT, const SDLoc &dl, SDValue Chain, SDValue Ptr, MachinePointerInfo PtrInfo, MaybeAlign Alignment=MaybeAlign(), MachineMemOperand::Flags MMOFlags=MachineMemOperand::MONone, const AAMDNodes &AAInfo=AAMDNodes(), const MDNode *Ranges=nullptr)
Loads are not normal binary operators: their result type is not determined by their operands,...
Definition: SelectionDAG.cpp:9270

llvm::SelectionDAG::getMemcpy
SDValue getMemcpy(SDValue Chain, const SDLoc &dl, SDValue Dst, SDValue Src, SDValue Size, Align Alignment, bool isVol, bool AlwaysInline, const CallInst *CI, std::optional< bool > OverrideTailCall, MachinePointerInfo DstPtrInfo, MachinePointerInfo SrcPtrInfo, const AAMDNodes &AAInfo=AAMDNodes(), BatchAAResults *BatchAA=nullptr)
Definition: SelectionDAG.cpp:8581

llvm::SelectionDAG::addNoMergeSiteInfo
void addNoMergeSiteInfo(const SDNode *Node, bool NoMerge)
Set NoMergeSiteInfo to be associated with Node if NoMerge is true.
Definition: SelectionDAG.h:2394

llvm::SelectionDAG::getNOT
SDValue getNOT(const SDLoc &DL, SDValue Val, EVT VT)
Create a bitwise NOT operation as (XOR Val, -1).
Definition: SelectionDAG.cpp:1622

llvm::SelectionDAG::getTargetLoweringInfo
const TargetLowering & getTargetLoweringInfo() const
Definition: SelectionDAG.h:503

llvm::SelectionDAG::getTargetJumpTable
SDValue getTargetJumpTable(int JTI, EVT VT, unsigned TargetFlags=0)
Definition: SelectionDAG.h:761

llvm::SelectionDAG::getUNDEF
SDValue getUNDEF(EVT VT)
Return an UNDEF node. UNDEF does not have a useful SDLoc.
Definition: SelectionDAG.h:1129

llvm::SelectionDAG::getCALLSEQ_END
SDValue getCALLSEQ_END(SDValue Chain, SDValue Op1, SDValue Op2, SDValue InGlue, const SDLoc &DL)
Return a new CALLSEQ_END node, which always must have a glue result (to ensure it's not CSE'd).
Definition: SelectionDAG.h:1106

llvm::SelectionDAG::getBuildVector
SDValue getBuildVector(EVT VT, const SDLoc &DL, ArrayRef< SDValue > Ops)
Return an ISD::BUILD_VECTOR node.
Definition: SelectionDAG.h:857

llvm::SelectionDAG::isSplatValue
bool isSplatValue(SDValue V, const APInt &DemandedElts, APInt &UndefElts, unsigned Depth=0) const
Test whether V has a splatted value for all the demanded elements.
Definition: SelectionDAG.cpp:3029

llvm::SelectionDAG::getBitcast
SDValue getBitcast(EVT VT, SDValue V)
Return a bitcast using the SDLoc of the value operand, and casting to the provided type.
Definition: SelectionDAG.cpp:2433

llvm::SelectionDAG::getCopyFromReg
SDValue getCopyFromReg(SDValue Chain, const SDLoc &dl, Register Reg, EVT VT)
Definition: SelectionDAG.h:828

llvm::SelectionDAG::setNodeMemRefs
void setNodeMemRefs(MachineSDNode *N, ArrayRef< MachineMemOperand * > NewMemRefs)
Mutate the specified machine node's memory references to the provided list.
Definition: SelectionDAG.cpp:10917

llvm::SelectionDAG::getDataLayout
const DataLayout & getDataLayout() const
Definition: SelectionDAG.h:497

llvm::SelectionDAG::getConstant
SDValue getConstant(uint64_t Val, const SDLoc &DL, EVT VT, bool isTarget=false, bool isOpaque=false)
Create a ConstantSDNode wrapping a constant value.
Definition: SelectionDAG.cpp:1666

llvm::SelectionDAG::getSignedTargetConstant
SDValue getSignedTargetConstant(int64_t Val, const SDLoc &DL, EVT VT, bool isOpaque=false)
Definition: SelectionDAG.h:713

llvm::SelectionDAG::ReplaceAllUsesWith
void ReplaceAllUsesWith(SDValue From, SDValue To)
Modify anything using 'From' to use 'To' instead.
Definition: SelectionDAG.cpp:11653

llvm::SelectionDAG::getCommutedVectorShuffle
SDValue getCommutedVectorShuffle(const ShuffleVectorSDNode &SV)
Returns an ISD::VECTOR_SHUFFLE node semantically equivalent to the shuffle node in input but with swa...
Definition: SelectionDAG.cpp:2318

llvm::SelectionDAG::getStore
SDValue getStore(SDValue Chain, const SDLoc &dl, SDValue Val, SDValue Ptr, MachinePointerInfo PtrInfo, Align Alignment, MachineMemOperand::Flags MMOFlags=MachineMemOperand::MONone, const AAMDNodes &AAInfo=AAMDNodes())
Helper function to build ISD::STORE nodes.
Definition: SelectionDAG.cpp:9320

llvm::SelectionDAG::getSignedConstant
SDValue getSignedConstant(int64_t Val, const SDLoc &DL, EVT VT, bool isTarget=false, bool isOpaque=false)
Definition: SelectionDAG.cpp:1794

llvm::SelectionDAG::getCALLSEQ_START
SDValue getCALLSEQ_START(SDValue Chain, uint64_t InSize, uint64_t OutSize, const SDLoc &DL)
Return a new CALLSEQ_START node, that starts new call frame, in which InSize bytes are set up inside ...
Definition: SelectionDAG.h:1094

llvm::SelectionDAG::getExternalSymbol
SDValue getExternalSymbol(const char *Sym, EVT VT)
Definition: SelectionDAG.cpp:2052

llvm::SelectionDAG::getTarget
const TargetMachine & getTarget() const
Definition: SelectionDAG.h:498

llvm::SelectionDAG::getIntPtrConstant
SDValue getIntPtrConstant(uint64_t Val, const SDLoc &DL, bool isTarget=false)
Definition: SelectionDAG.cpp:1806

llvm::SelectionDAG::getValueType
SDValue getValueType(EVT)
Definition: SelectionDAG.cpp:2038

llvm::SelectionDAG::getNode
SDValue getNode(unsigned Opcode, const SDLoc &DL, EVT VT, ArrayRef< SDUse > Ops)
Gets or creates the specified node.
Definition: SelectionDAG.cpp:10327

llvm::SelectionDAG::getTargetConstant
SDValue getTargetConstant(uint64_t Val, const SDLoc &DL, EVT VT, bool isOpaque=false)
Definition: SelectionDAG.h:701

llvm::SelectionDAG::getTargetBlockAddress
SDValue getTargetBlockAddress(const BlockAddress *BA, EVT VT, int64_t Offset=0, unsigned TargetFlags=0)
Definition: SelectionDAG.h:797

llvm::SelectionDAG::getMachineFunction
MachineFunction & getMachineFunction() const
Definition: SelectionDAG.h:492

llvm::SelectionDAG::getFrameIndex
SDValue getFrameIndex(int FI, EVT VT, bool isTarget=false)
Definition: SelectionDAG.cpp:1925

llvm::SelectionDAG::computeKnownBits
KnownBits computeKnownBits(SDValue Op, unsigned Depth=0) const
Determine which bits of Op are known to be either zero or one and return them in Known.
Definition: SelectionDAG.cpp:3415

llvm::SelectionDAG::getRegisterMask
SDValue getRegisterMask(const uint32_t *RegMask)
Definition: SelectionDAG.cpp:2344

llvm::SelectionDAG::getContext
LLVMContext * getContext() const
Definition: SelectionDAG.h:510

llvm::SelectionDAG::getTargetExternalSymbol
SDValue getTargetExternalSymbol(const char *Sym, EVT VT, unsigned TargetFlags=0)
Definition: SelectionDAG.cpp:2069

llvm::SelectionDAG::CreateStackTemporary
SDValue CreateStackTemporary(TypeSize Bytes, Align Alignment)
Create a stack temporary based on the size in bytes and the alignment.
Definition: SelectionDAG.cpp:2776

llvm::SelectionDAG::getTargetConstantPool
SDValue getTargetConstantPool(const Constant *C, EVT VT, MaybeAlign Align=std::nullopt, int Offset=0, unsigned TargetFlags=0)
Definition: SelectionDAG.h:768

llvm::SelectionDAG::getEntryNode
SDValue getEntryNode() const
Return the token chain corresponding to the entry of the function.
Definition: SelectionDAG.h:580

llvm::SelectionDAG::SplitScalar
std::pair< SDValue, SDValue > SplitScalar(const SDValue &N, const SDLoc &DL, const EVT &LoVT, const EVT &HiVT)
Split the scalar node with EXTRACT_ELEMENT using the provided VTs and return the low/high part.
Definition: SelectionDAG.cpp:12946

llvm::SelectionDAG::getVectorShuffle
SDValue getVectorShuffle(EVT VT, const SDLoc &dl, SDValue N1, SDValue N2, ArrayRef< int > Mask)
Return an ISD::VECTOR_SHUFFLE node.
Definition: SelectionDAG.cpp:2147

llvm::ShuffleVectorSDNode
This SDNode is used to implement the code generator support for the llvm IR shufflevector instruction...
Definition: SelectionDAGNodes.h:1625

llvm::ShuffleVectorSDNode::getMask
ArrayRef< int > getMask() const
Definition: SelectionDAGNodes.h:1638

llvm::SmallVectorBase::empty
bool empty() const
Definition: SmallVector.h:81

llvm::SmallVectorBase::size
size_t size() const
Definition: SmallVector.h:78

llvm::SmallVectorImpl
This class consists of common code factored out of the SmallVector class to reduce code duplication b...
Definition: SmallVector.h:573

llvm::SmallVectorImpl::const_iterator
typename SuperClass::const_iterator const_iterator
Definition: SmallVector.h:578

llvm::SmallVectorImpl::clear
void clear()
Definition: SmallVector.h:610

llvm::SmallVectorTemplateBase::push_back
void push_back(const T &Elt)
Definition: SmallVector.h:413

llvm::SmallVector
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small.
Definition: SmallVector.h:1196

llvm::StackOffset
StackOffset holds a fixed and a scalable offset in bytes.
Definition: TypeSize.h:33

llvm::StringRef
StringRef - Represent a constant reference to a string, i.e.
Definition: StringRef.h:51

llvm::StringRef::split
std::pair< StringRef, StringRef > split(char Separator) const
Split into two substrings around the first occurrence of a separator character.
Definition: StringRef.h:700

llvm::StringRef::starts_with
bool starts_with(StringRef Prefix) const
Check if this string starts with the given Prefix.
Definition: StringRef.h:265

llvm::StringRef::size
constexpr size_t size() const
size - Get the string size.
Definition: StringRef.h:150

llvm::StringSwitch
A switch()-like statement whose cases are string literals.
Definition: StringSwitch.h:44

llvm::StringSwitch::Case
StringSwitch & Case(StringLiteral S, T Value)
Definition: StringSwitch.h:69

llvm::StringSwitch::Default
R Default(T Value)
Definition: StringSwitch.h:182

llvm::TargetInstrInfo
TargetInstrInfo - Interface to description of machine instruction set.
Definition: TargetInstrInfo.h:112

llvm::TargetLoweringBase::setBooleanVectorContents
void setBooleanVectorContents(BooleanContent Ty)
Specify how the target extends the result of a vector boolean value from a vector of i1 to a wider ty...
Definition: TargetLowering.h:2493

llvm::TargetLoweringBase::setOperationAction
void setOperationAction(unsigned Op, MVT VT, LegalizeAction Action)
Indicate that the specified operation does not work with the specified type and indicate what to do a...
Definition: TargetLowering.h:2562

llvm::TargetLoweringBase::Unspecified
@ Unspecified
Definition: TargetLowering.h:574

llvm::TargetLoweringBase::Custom
@ Custom
Definition: TargetLowering.h:204

llvm::TargetLoweringBase::Expand
@ Expand
Definition: TargetLowering.h:202

llvm::TargetLoweringBase::Promote
@ Promote
Definition: TargetLowering.h:201

llvm::TargetLoweringBase::emitPatchPoint
MachineBasicBlock * emitPatchPoint(MachineInstr &MI, MachineBasicBlock *MBB) const
Replace/modify any TargetFrameIndex operands with a targte-dependent sequence of memory operands that...
Definition: TargetLoweringBase.cpp:1155

llvm::TargetLoweringBase::getRegClassFor
virtual const TargetRegisterClass * getRegClassFor(MVT VT, bool isDivergent=false) const
Return the register class that should be used for the specified value type.
Definition: TargetLowering.h:1042

llvm::TargetLoweringBase::getTargetMachine
const TargetMachine & getTargetMachine() const
Definition: TargetLowering.h:364

llvm::TargetLoweringBase::isZExtFree
virtual bool isZExtFree(Type *FromTy, Type *ToTy) const
Return true if any actual instruction that defines a value of type FromTy implicitly zero-extends the...
Definition: TargetLowering.h:3066

llvm::TargetLoweringBase::TypeSoftenFloat
@ TypeSoftenFloat
Definition: TargetLowering.h:213

llvm::TargetLoweringBase::setMaxBytesForAlignment
void setMaxBytesForAlignment(unsigned MaxBytes)
Definition: TargetLowering.h:2753

llvm::TargetLoweringBase::setPrefLoopAlignment
void setPrefLoopAlignment(Align Alignment)
Set the target's preferred loop alignment.
Definition: TargetLowering.h:2752

llvm::TargetLoweringBase::setMaxAtomicSizeInBitsSupported
void setMaxAtomicSizeInBitsSupported(unsigned SizeInBits)
Set the maximum atomic operation size supported by the backend.
Definition: TargetLowering.h:2766

llvm::TargetLoweringBase::setMinFunctionAlignment
void setMinFunctionAlignment(Align Alignment)
Set the target's minimum function alignment.
Definition: TargetLowering.h:2739

llvm::TargetLoweringBase::setBooleanContents
void setBooleanContents(BooleanContent Ty)
Specify how the target extends the result of integer and floating point boolean values from i1 to a w...
Definition: TargetLowering.h:2479

llvm::TargetLoweringBase::computeRegisterProperties
void computeRegisterProperties(const TargetRegisterInfo *TRI)
Once all of the register classes are added, this allows us to compute derived properties we expose.
Definition: TargetLoweringBase.cpp:1275

llvm::TargetLoweringBase::addRegisterClass
void addRegisterClass(MVT VT, const TargetRegisterClass *RC)
Add the specified register class as an available regclass for the specified value type.
Definition: TargetLowering.h:2545

llvm::TargetLoweringBase::getPointerTy
virtual MVT getPointerTy(const DataLayout &DL, uint32_t AS=0) const
Return the pointer type for the given address space, defaults to the pointer type from the data layou...
Definition: TargetLowering.h:371

llvm::TargetLoweringBase::setPrefFunctionAlignment
void setPrefFunctionAlignment(Align Alignment)
Set the target's preferred function alignment.
Definition: TargetLowering.h:2745

llvm::TargetLoweringBase::setTruncStoreAction
void setTruncStoreAction(MVT ValVT, MVT MemVT, LegalizeAction Action)
Indicate that the specified truncating store does not work with the specified type and indicate what ...
Definition: TargetLowering.h:2625

llvm::TargetLoweringBase::ZeroOrOneBooleanContent
@ ZeroOrOneBooleanContent
Definition: TargetLowering.h:236

llvm::TargetLoweringBase::ZeroOrNegativeOneBooleanContent
@ ZeroOrNegativeOneBooleanContent
Definition: TargetLowering.h:237

llvm::TargetLoweringBase::setMinCmpXchgSizeInBits
void setMinCmpXchgSizeInBits(unsigned SizeInBits)
Sets the minimum cmpxchg or ll/sc size supported by the backend.
Definition: TargetLowering.h:2783

llvm::TargetLoweringBase::setStackPointerRegisterToSaveRestore
void setStackPointerRegisterToSaveRestore(Register R)
If set to a physical register, this specifies the register that llvm.savestack/llvm....
Definition: TargetLowering.h:2511

llvm::TargetLoweringBase::AtomicExpansionKind
AtomicExpansionKind
Enum that specifies what an atomic load/AtomicRMWInst is expanded to, if at all.
Definition: TargetLowering.h:253

llvm::TargetLoweringBase::AtomicExpansionKind::CmpXChg
@ CmpXChg

llvm::TargetLoweringBase::AtomicExpansionKind::None
@ None

llvm::TargetLoweringBase::AtomicExpansionKind::Expand
@ Expand

llvm::TargetLoweringBase::AtomicExpansionKind::MaskedIntrinsic
@ MaskedIntrinsic

llvm::TargetLoweringBase::setCondCodeAction
void setCondCodeAction(ArrayRef< ISD::CondCode > CCs, MVT VT, LegalizeAction Action)
Indicate that the specified condition code is or isn't supported on the target and indicate what to d...
Definition: TargetLowering.h:2686

llvm::TargetLoweringBase::setTargetDAGCombine
void setTargetDAGCombine(ArrayRef< ISD::NodeType > NTs)
Targets should invoke this method for each target independent node that they want to provide a custom...
Definition: TargetLowering.h:2731

llvm::TargetLoweringBase::setLoadExtAction
void setLoadExtAction(unsigned ExtType, MVT ValVT, MVT MemVT, LegalizeAction Action)
Indicate that the specified load with extension does not work with the specified type and indicate wh...
Definition: TargetLowering.h:2579

llvm::TargetLoweringBase::getTypeAction
LegalizeTypeAction getTypeAction(LLVMContext &Context, EVT VT) const
Return how we should legalize values of this type, either it is already legal (return 'Legal') or we ...
Definition: TargetLowering.h:1143

llvm::TargetLoweringBase::ArgListTy
std::vector< ArgListEntry > ArgListTy
Definition: TargetLowering.h:329

llvm::TargetLowering
This class defines information used to lower LLVM code to legal SelectionDAG operators that the targe...
Definition: TargetLowering.h:3780

llvm::TargetLowering::ConstraintType
ConstraintType
Definition: TargetLowering.h:4950

llvm::TargetLowering::C_RegisterClass
@ C_RegisterClass
Definition: TargetLowering.h:4952

llvm::TargetLowering::C_Memory
@ C_Memory
Definition: TargetLowering.h:4953

llvm::TargetLowering::C_Immediate
@ C_Immediate
Definition: TargetLowering.h:4955

llvm::TargetLowering::makeLibCall
std::pair< SDValue, SDValue > makeLibCall(SelectionDAG &DAG, RTLIB::Libcall LC, EVT RetVT, ArrayRef< SDValue > Ops, MakeLibCallOptions CallOptions, const SDLoc &dl, SDValue Chain=SDValue()) const
Returns a pair of (return value, chain).
Definition: TargetLowering.cpp:147

llvm::TargetLowering::getInlineAsmMemConstraint
virtual InlineAsm::ConstraintCode getInlineAsmMemConstraint(StringRef ConstraintCode) const
Definition: TargetLowering.h:5062

llvm::TargetLowering::getConstraintType
virtual ConstraintType getConstraintType(StringRef Constraint) const
Given a constraint, return the type of constraint it is for this target.
Definition: TargetLowering.cpp:5525

llvm::TargetLowering::LowerCallTo
std::pair< SDValue, SDValue > LowerCallTo(CallLoweringInfo &CLI) const
This function lowers an abstract call to a function into an actual call.
Definition: SelectionDAGBuilder.cpp:10958

llvm::TargetLowering::getRegForInlineAsmConstraint
virtual std::pair< unsigned, const TargetRegisterClass * > getRegForInlineAsmConstraint(const TargetRegisterInfo *TRI, StringRef Constraint, MVT VT) const
Given a physical register constraint (e.g.
Definition: TargetLowering.cpp:5669

llvm::TargetLowering::verifyReturnAddressArgumentIsConstant
bool verifyReturnAddressArgumentIsConstant(SDValue Op, SelectionDAG &DAG) const
Definition: TargetLowering.cpp:7260

llvm::TargetLowering::LowerAsmOperandForConstraint
virtual void LowerAsmOperandForConstraint(SDValue Op, StringRef Constraint, std::vector< SDValue > &Ops, SelectionDAG &DAG) const
Lower the specified operand into the Ops vector.
Definition: TargetLowering.cpp:5587

llvm::TargetMachine
Primary interface to the complete machine description for the target machine.
Definition: TargetMachine.h:77

llvm::TargetMachine::useTLSDESC
bool useTLSDESC() const
Returns true if this target uses TLS Descriptors.
Definition: TargetMachine.cpp:236

llvm::TargetMachine::useEmulatedTLS
bool useEmulatedTLS() const
Returns true if this target uses emulated TLS.
Definition: TargetMachine.cpp:235

llvm::TargetMachine::shouldAssumeDSOLocal
bool shouldAssumeDSOLocal(const GlobalValue *GV) const
Definition: TargetMachine.cpp:178

llvm::TargetMachine::getCodeModel
CodeModel::Model getCodeModel() const
Returns the code model.
Definition: TargetMachine.h:232

llvm::TargetRegisterClass
Definition: TargetRegisterInfo.h:44

llvm::TargetRegisterInfo
TargetRegisterInfo base class - We assume that the target defines a static array of TargetRegisterDes...
Definition: TargetRegisterInfo.h:235

llvm::TargetSubtargetInfo::getInstrInfo
virtual const TargetInstrInfo * getInstrInfo() const
Definition: TargetSubtargetInfo.h:97

llvm::Twine
Twine - A lightweight data structure for efficiently representing the concatenation of temporary valu...
Definition: Twine.h:81

llvm::TypeSize
Definition: TypeSize.h:334

llvm::Type
The instances of the Type class are immutable: once they are created, they are never changed.
Definition: Type.h:45

llvm::Type::getIntegerBitWidth
unsigned getIntegerBitWidth() const

llvm::Type::getIntNTy
static IntegerType * getIntNTy(LLVMContext &C, unsigned N)

llvm::Type::isIntegerTy
bool isIntegerTy() const
True if this is an instance of IntegerType.
Definition: Type.h:237

llvm::Type::getPrimitiveSizeInBits
TypeSize getPrimitiveSizeInBits() const LLVM_READONLY
Return the basic size of this type if it is a primitive type.

llvm::VTSDNode
This class is used to represent EVT's, which are used to parameterize some operations.
Definition: SelectionDAGNodes.h:2413

llvm::VTSDNode::getVT
EVT getVT() const
Definition: SelectionDAGNodes.h:2423

llvm::Value
LLVM Value Representation.
Definition: Value.h:74

llvm::Value::getType
Type * getType() const
All values are typed, get the type of this value.
Definition: Value.h:255

llvm::Value::replaceAllUsesWith
void replaceAllUsesWith(Value *V)
Change all uses of this to point to a new Value.
Definition: Value.cpp:534

llvm::cl::opt
Definition: CommandLine.h:1423

llvm::ilist_node_impl::getIterator
self_iterator getIterator()
Definition: ilist_node.h:132

uint16_t

uint32_t

uint64_t

uint8_t

unsigned

ErrorHandling.h

llvm_unreachable
#define llvm_unreachable(msg)
Marks that the current location is not supposed to be reachable.
Definition: ErrorHandling.h:143

false
Definition: StackSlotColoring.cpp:193

llvm::AMDGPU::HSAMD::Kernel::Key::Args
constexpr char Args[]
Key for Kernel::Metadata::mArgs.
Definition: AMDGPUMetadata.h:395

llvm::AMDGPU::Imm
@ Imm
Definition: AMDGPURegBankLegalizeRules.h:105

llvm::ARM::ProfileKind::M
@ M

llvm::BitmaskEnumDetail::Mask
constexpr std::underlying_type_t< E > Mask()
Get a bitmask with 1s in all places up to the high-order bit of E's largest value.
Definition: BitmaskEnum.h:125

llvm::COFF::Entry
@ Entry
Definition: COFF.h:844

llvm::CallingConv::GHC
@ GHC
Used by the Glasgow Haskell Compiler (GHC).
Definition: CallingConv.h:50

llvm::CallingConv::Fast
@ Fast
Attempts to make calls as fast as possible (e.g.
Definition: CallingConv.h:41

llvm::CallingConv::C
@ C
The default llvm calling convention, compatible with C.
Definition: CallingConv.h:34

llvm::CodeModel::Model
Model
Definition: CodeGen.h:31

llvm::CodeModel::Medium
@ Medium
Definition: CodeGen.h:31

llvm::CodeModel::Large
@ Large
Definition: CodeGen.h:31

llvm::CodeModel::Small
@ Small
Definition: CodeGen.h:31

llvm::IRSimilarity::Legal
@ Legal
Definition: IRSimilarityIdentifier.h:76

llvm::ISD::NodeType
NodeType
ISD::NodeType enum - This enum defines the target-independent operators for a SelectionDAG.
Definition: ISDOpcodes.h:40

llvm::ISD::SETCC
@ SETCC
SetCC operator - This evaluates to a true value iff the condition is true.
Definition: ISDOpcodes.h:780

llvm::ISD::STACKRESTORE
@ STACKRESTORE
STACKRESTORE has two operands, an input chain and a pointer to restore to it returns an output chain.
Definition: ISDOpcodes.h:1197

llvm::ISD::STACKSAVE
@ STACKSAVE
STACKSAVE - STACKSAVE has one operand, an input chain.
Definition: ISDOpcodes.h:1193

llvm::ISD::STRICT_FSETCC
@ STRICT_FSETCC
STRICT_FSETCC/STRICT_FSETCCS - Constrained versions of SETCC, used for floating-point operands only.
Definition: ISDOpcodes.h:491

llvm::ISD::STORE
@ STORE
Definition: ISDOpcodes.h:1103

llvm::ISD::JumpTable
@ JumpTable
Definition: ISDOpcodes.h:81

llvm::ISD::SREM
@ SREM
Definition: ISDOpcodes.h:251

llvm::ISD::SMUL_LOHI
@ SMUL_LOHI
SMUL_LOHI/UMUL_LOHI - Multiply two integers of type iN, producing a signed/unsigned value of type i[2...
Definition: ISDOpcodes.h:257

llvm::ISD::UDIV
@ UDIV
Definition: ISDOpcodes.h:250

llvm::ISD::UINT_TO_FP
@ UINT_TO_FP
Definition: ISDOpcodes.h:842

llvm::ISD::UMIN
@ UMIN
Definition: ISDOpcodes.h:699

llvm::ISD::BSWAP
@ BSWAP
Byte Swap and Counting operators.
Definition: ISDOpcodes.h:744

llvm::ISD::ROTR
@ ROTR
Definition: ISDOpcodes.h:739

llvm::ISD::FPOW
@ FPOW
Definition: ISDOpcodes.h:994

llvm::ISD::VAEND
@ VAEND
VAEND, VASTART - VAEND and VASTART have three operands: an input chain, pointer, and a SRCVALUE.
Definition: ISDOpcodes.h:1226

llvm::ISD::FTRUNC
@ FTRUNC
Definition: ISDOpcodes.h:1013

llvm::ISD::SDIV
@ SDIV
Definition: ISDOpcodes.h:249

llvm::ISD::FMAXNUM_IEEE
@ FMAXNUM_IEEE
Definition: ISDOpcodes.h:1045

llvm::ISD::ADD
@ ADD
Simple integer binary arithmetic operators.
Definition: ISDOpcodes.h:246

llvm::ISD::LOAD
@ LOAD
LOAD and STORE have token chains as their first operand, then the same operands as an LLVM load/store...
Definition: ISDOpcodes.h:1102

llvm::ISD::ANY_EXTEND
@ ANY_EXTEND
ANY_EXTEND - Used for integer types. The high bits are undefined.
Definition: ISDOpcodes.h:814

llvm::ISD::FSUB
@ FSUB
Definition: ISDOpcodes.h:398

llvm::ISD::FMA
@ FMA
FMA - Perform a * b + c with no intermediate rounding step.
Definition: ISDOpcodes.h:498

llvm::ISD::INTRINSIC_VOID
@ INTRINSIC_VOID
OUTCHAIN = INTRINSIC_VOID(INCHAIN, INTRINSICID, arg1, arg2, ...) This node represents a target intrin...
Definition: ISDOpcodes.h:205

llvm::ISD::RETURNADDR
@ RETURNADDR
Definition: ISDOpcodes.h:101

llvm::ISD::GlobalAddress
@ GlobalAddress
Definition: ISDOpcodes.h:78

llvm::ISD::SINT_TO_FP
@ SINT_TO_FP
[SU]INT_TO_FP - These operators convert integers (whose interpreted sign depends on the first letter)...
Definition: ISDOpcodes.h:841

llvm::ISD::CONCAT_VECTORS
@ CONCAT_VECTORS
CONCAT_VECTORS(VECTOR0, VECTOR1, ...) - Given a number of values of vector type with the same length ...
Definition: ISDOpcodes.h:558

llvm::ISD::FADD
@ FADD
Simple binary floating point operators.
Definition: ISDOpcodes.h:397

llvm::ISD::MEMBARRIER
@ MEMBARRIER
MEMBARRIER - Compiler barrier only; generate a no-op.
Definition: ISDOpcodes.h:1299

llvm::ISD::ATOMIC_FENCE
@ ATOMIC_FENCE
OUTCHAIN = ATOMIC_FENCE(INCHAIN, ordering, scope) This corresponds to the fence instruction.
Definition: ISDOpcodes.h:1304

llvm::ISD::FP_TO_FP16
@ FP_TO_FP16
Definition: ISDOpcodes.h:965

llvm::ISD::SRL
@ SRL
Definition: ISDOpcodes.h:737

llvm::ISD::STRICT_FSETCCS
@ STRICT_FSETCCS
Definition: ISDOpcodes.h:492

llvm::ISD::FP16_TO_FP
@ FP16_TO_FP
FP16_TO_FP, FP_TO_FP16 - These operators are used to perform promotions and truncation for half-preci...
Definition: ISDOpcodes.h:964

llvm::ISD::BITCAST
@ BITCAST
BITCAST - This operator converts between integer, vector and FP values, as if the value was stored to...
Definition: ISDOpcodes.h:954

llvm::ISD::BUILD_PAIR
@ BUILD_PAIR
BUILD_PAIR - This is the opposite of EXTRACT_ELEMENT in some ways.
Definition: ISDOpcodes.h:236

llvm::ISD::FFLOOR
@ FFLOOR
Definition: ISDOpcodes.h:1018

llvm::ISD::BUILTIN_OP_END
@ BUILTIN_OP_END
BUILTIN_OP_END - This must be the last enum value in this list.
Definition: ISDOpcodes.h:1494

llvm::ISD::GlobalTLSAddress
@ GlobalTLSAddress
Definition: ISDOpcodes.h:79

llvm::ISD::SRA
@ SRA
Definition: ISDOpcodes.h:736

llvm::ISD::SIGN_EXTEND
@ SIGN_EXTEND
Conversion operators.
Definition: ISDOpcodes.h:805

llvm::ISD::SCALAR_TO_VECTOR
@ SCALAR_TO_VECTOR
SCALAR_TO_VECTOR(VAL) - This represents the operation of loading a scalar value into element 0 of the...
Definition: ISDOpcodes.h:635

llvm::ISD::WRITE_REGISTER
@ WRITE_REGISTER
Definition: ISDOpcodes.h:125

llvm::ISD::FRINT
@ FRINT
Definition: ISDOpcodes.h:1014

llvm::ISD::PREFETCH
@ PREFETCH
PREFETCH - This corresponds to a prefetch intrinsic.
Definition: ISDOpcodes.h:1292

llvm::ISD::FSINCOS
@ FSINCOS
FSINCOS - Compute both fsin and fcos as a single operation.
Definition: ISDOpcodes.h:1059

llvm::ISD::FNEG
@ FNEG
Perform various unary floating-point operations inspired by libm.
Definition: ISDOpcodes.h:981

llvm::ISD::BR_CC
@ BR_CC
BR_CC - Conditional branch.
Definition: ISDOpcodes.h:1148

llvm::ISD::CTTZ
@ CTTZ
Definition: ISDOpcodes.h:745

llvm::ISD::FP_TO_UINT
@ FP_TO_UINT
Definition: ISDOpcodes.h:888

llvm::ISD::BR_JT
@ BR_JT
BR_JT - Jumptable branch.
Definition: ISDOpcodes.h:1127

llvm::ISD::OR
@ OR
Definition: ISDOpcodes.h:710

llvm::ISD::IS_FPCLASS
@ IS_FPCLASS
Performs a check of floating point class property, defined by IEEE-754.
Definition: ISDOpcodes.h:522

llvm::ISD::SRA_PARTS
@ SRA_PARTS
Definition: ISDOpcodes.h:795

llvm::ISD::SELECT
@ SELECT
Select(COND, TRUEVAL, FALSEVAL).
Definition: ISDOpcodes.h:757

llvm::ISD::UMUL_LOHI
@ UMUL_LOHI
Definition: ISDOpcodes.h:258

llvm::ISD::UNDEF
@ UNDEF
UNDEF - An undefined node.
Definition: ISDOpcodes.h:218

llvm::ISD::VACOPY
@ VACOPY
VACOPY - VACOPY has 5 operands: an input chain, a destination pointer, a source pointer,...
Definition: ISDOpcodes.h:1222

llvm::ISD::MULHU
@ MULHU
MULHU/MULHS - Multiply high - Multiply two integers of type iN, producing an unsigned/signed value of...
Definition: ISDOpcodes.h:674

llvm::ISD::SHL
@ SHL
Shift and rotation operations.
Definition: ISDOpcodes.h:735

llvm::ISD::VECTOR_SHUFFLE
@ VECTOR_SHUFFLE
VECTOR_SHUFFLE(VEC1, VEC2) - Returns a vector, of the same type as VEC1/VEC2.
Definition: ISDOpcodes.h:615

llvm::ISD::FMINNUM_IEEE
@ FMINNUM_IEEE
FMINNUM_IEEE/FMAXNUM_IEEE - Perform floating-point minimumNumber or maximumNumber on two values,...
Definition: ISDOpcodes.h:1044

llvm::ISD::FCOS
@ FCOS
Definition: ISDOpcodes.h:986

llvm::ISD::READ_REGISTER
@ READ_REGISTER
READ_REGISTER, WRITE_REGISTER - This node represents llvm.register on the DAG, which implements the n...
Definition: ISDOpcodes.h:124

llvm::ISD::XOR
@ XOR
Definition: ISDOpcodes.h:711

llvm::ISD::EXTRACT_VECTOR_ELT
@ EXTRACT_VECTOR_ELT
EXTRACT_VECTOR_ELT(VECTOR, IDX) - Returns a single element from VECTOR identified by the (potentially...
Definition: ISDOpcodes.h:550

llvm::ISD::CopyToReg
@ CopyToReg
CopyToReg - This node has three operands: a chain, a register number to set to this value,...
Definition: ISDOpcodes.h:209

llvm::ISD::ZERO_EXTEND
@ ZERO_EXTEND
ZERO_EXTEND - Used for integer types, zeroing the new bits.
Definition: ISDOpcodes.h:811

llvm::ISD::DEBUGTRAP
@ DEBUGTRAP
DEBUGTRAP - Trap intended to get the attention of a debugger.
Definition: ISDOpcodes.h:1282

llvm::ISD::CTPOP
@ CTPOP
Definition: ISDOpcodes.h:747

llvm::ISD::SELECT_CC
@ SELECT_CC
Select with condition operator - This selects between a true value and a false value (ops #2 and #3) ...
Definition: ISDOpcodes.h:772

llvm::ISD::FMUL
@ FMUL
Definition: ISDOpcodes.h:399

llvm::ISD::ATOMIC_CMP_SWAP
@ ATOMIC_CMP_SWAP
Val, OUTCHAIN = ATOMIC_CMP_SWAP(INCHAIN, ptr, cmp, swap) For double-word atomic operations: ValLo,...
Definition: ISDOpcodes.h:1319

llvm::ISD::SRL_PARTS
@ SRL_PARTS
Definition: ISDOpcodes.h:796

llvm::ISD::SUB
@ SUB
Definition: ISDOpcodes.h:247

llvm::ISD::MULHS
@ MULHS
Definition: ISDOpcodes.h:675

llvm::ISD::DYNAMIC_STACKALLOC
@ DYNAMIC_STACKALLOC
DYNAMIC_STACKALLOC - Allocate some number of bytes on the stack aligned to a specified boundary.
Definition: ISDOpcodes.h:1112

llvm::ISD::ConstantPool
@ ConstantPool
Definition: ISDOpcodes.h:82

llvm::ISD::SIGN_EXTEND_INREG
@ SIGN_EXTEND_INREG
SIGN_EXTEND_INREG - This operator atomically performs a SHL/SRA pair to sign extend a small value in ...
Definition: ISDOpcodes.h:849

llvm::ISD::SMIN
@ SMIN
[US]{MIN/MAX} - Binary minimum or maximum of signed or unsigned integers.
Definition: ISDOpcodes.h:697

llvm::ISD::Constant
@ Constant
Definition: ISDOpcodes.h:76

llvm::ISD::FP_EXTEND
@ FP_EXTEND
X = FP_EXTEND(Y) - Extend a smaller FP type into a larger FP type.
Definition: ISDOpcodes.h:939

llvm::ISD::VSELECT
@ VSELECT
Select with a vector condition (op #0) and two vector operands (ops #1 and #2), returning a vector re...
Definition: ISDOpcodes.h:766

llvm::ISD::FROUNDEVEN
@ FROUNDEVEN
Definition: ISDOpcodes.h:1017

llvm::ISD::EH_DWARF_CFA
@ EH_DWARF_CFA
EH_DWARF_CFA - This node represents the pointer to the DWARF Canonical Frame Address (CFA),...
Definition: ISDOpcodes.h:135

llvm::ISD::FDIV
@ FDIV
Definition: ISDOpcodes.h:400

llvm::ISD::FRAMEADDR
@ FRAMEADDR
FRAMEADDR, RETURNADDR - These nodes represent llvm.frameaddress and llvm.returnaddress on the DAG.
Definition: ISDOpcodes.h:100

llvm::ISD::FREM
@ FREM
Definition: ISDOpcodes.h:401

llvm::ISD::FP_TO_SINT
@ FP_TO_SINT
FP_TO_[US]INT - Convert a floating point value to a signed or unsigned integer.
Definition: ISDOpcodes.h:887

llvm::ISD::AND
@ AND
Bitwise operators - logical and, logical or, logical xor.
Definition: ISDOpcodes.h:709

llvm::ISD::TRAP
@ TRAP
TRAP - Trapping instruction.
Definition: ISDOpcodes.h:1279

llvm::ISD::INTRINSIC_WO_CHAIN
@ INTRINSIC_WO_CHAIN
RESULT = INTRINSIC_WO_CHAIN(INTRINSICID, arg1, arg2, ...) This node represents a target intrinsic fun...
Definition: ISDOpcodes.h:190

llvm::ISD::UREM
@ UREM
Definition: ISDOpcodes.h:252

llvm::ISD::INSERT_VECTOR_ELT
@ INSERT_VECTOR_ELT
INSERT_VECTOR_ELT(VECTOR, VAL, IDX) - Returns VECTOR with the element at IDX replaced with VAL.
Definition: ISDOpcodes.h:539

llvm::ISD::TokenFactor
@ TokenFactor
TokenFactor - This node takes multiple tokens as input and produces a single token result.
Definition: ISDOpcodes.h:52

llvm::ISD::FSIN
@ FSIN
Definition: ISDOpcodes.h:985

llvm::ISD::FCEIL
@ FCEIL
Definition: ISDOpcodes.h:1012

llvm::ISD::MUL
@ MUL
Definition: ISDOpcodes.h:248

llvm::ISD::LROUND
@ LROUND
Definition: ISDOpcodes.h:1019

llvm::ISD::CTLZ
@ CTLZ
Definition: ISDOpcodes.h:746

llvm::ISD::VASTART
@ VASTART
Definition: ISDOpcodes.h:1227

llvm::ISD::FSQRT
@ FSQRT
Definition: ISDOpcodes.h:983

llvm::ISD::TRUNCATE
@ TRUNCATE
TRUNCATE - Completely drop the high bits.
Definition: ISDOpcodes.h:817

llvm::ISD::VAARG
@ VAARG
VAARG - VAARG has four operands: an input chain, a pointer, a SRCVALUE, and the alignment.
Definition: ISDOpcodes.h:1217

llvm::ISD::ROTL
@ ROTL
Definition: ISDOpcodes.h:738

llvm::ISD::BlockAddress
@ BlockAddress
Definition: ISDOpcodes.h:84

llvm::ISD::SHL_PARTS
@ SHL_PARTS
SHL_PARTS/SRA_PARTS/SRL_PARTS - These operators are used for expanded integer shift operations.
Definition: ISDOpcodes.h:794

llvm::ISD::AssertSext
@ AssertSext
AssertSext, AssertZext - These nodes record if a register contains a value that has already been zero...
Definition: ISDOpcodes.h:61

llvm::ISD::BITREVERSE
@ BITREVERSE
Definition: ISDOpcodes.h:748

llvm::ISD::AssertZext
@ AssertZext
Definition: ISDOpcodes.h:62

llvm::ISD::SMAX
@ SMAX
Definition: ISDOpcodes.h:698

llvm::ISD::UMAX
@ UMAX
Definition: ISDOpcodes.h:700

llvm::ISD::INTRINSIC_W_CHAIN
@ INTRINSIC_W_CHAIN
RESULT,OUTCHAIN = INTRINSIC_W_CHAIN(INCHAIN, INTRINSICID, arg1, ...) This node represents a target in...
Definition: ISDOpcodes.h:198

llvm::ISD::BUILD_VECTOR
@ BUILD_VECTOR
BUILD_VECTOR(ELT0, ELT1, ELT2, ELT3,...) - Return a fixed-width vector with the specified,...
Definition: ISDOpcodes.h:530

llvm::ISD::CondCode
CondCode
ISD::CondCode enum - These are ordered carefully to make the bitfields below work out,...
Definition: ISDOpcodes.h:1610

llvm::ISD::SETNE
@ SETNE
Definition: ISDOpcodes.h:1635

llvm::ISD::SETUGT
@ SETUGT
Definition: ISDOpcodes.h:1622

llvm::ISD::SETOGT
@ SETOGT
Definition: ISDOpcodes.h:1614

llvm::ISD::SETGT
@ SETGT
Definition: ISDOpcodes.h:1631

llvm::ISD::SETLT
@ SETLT
Definition: ISDOpcodes.h:1633

llvm::ISD::SETGE
@ SETGE
Definition: ISDOpcodes.h:1632

llvm::ISD::SETUGE
@ SETUGE
Definition: ISDOpcodes.h:1623

llvm::ISD::SETOGE
@ SETOGE
Definition: ISDOpcodes.h:1615

llvm::ISD::SETEQ
@ SETEQ
Definition: ISDOpcodes.h:1630

llvm::ISD::LoadExtType
LoadExtType
LoadExtType enum - This enum defines the three variants of LOADEXT (load with extension).
Definition: ISDOpcodes.h:1590

llvm::ISD::NON_EXTLOAD
@ NON_EXTLOAD
Definition: ISDOpcodes.h:1590

llvm::ISD::SEXTLOAD
@ SEXTLOAD
Definition: ISDOpcodes.h:1590

llvm::ISD::ZEXTLOAD
@ ZEXTLOAD
Definition: ISDOpcodes.h:1590

llvm::ISD::EXTLOAD
@ EXTLOAD
Definition: ISDOpcodes.h:1590

llvm::Intrinsic::getOrInsertDeclaration
Function * getOrInsertDeclaration(Module *M, ID id, ArrayRef< Type * > Tys={})
Look up the Function declaration of the intrinsic id in the Module M.
Definition: Intrinsics.cpp:732

llvm::LoongArchABI::ABI
ABI
Definition: LoongArchBaseInfo.h:119

llvm::LoongArchABI::ABI_LP64F
@ ABI_LP64F
Definition: LoongArchBaseInfo.h:124

llvm::LoongArchABI::ABI_LP64S
@ ABI_LP64S
Definition: LoongArchBaseInfo.h:123

llvm::LoongArchABI::ABI_ILP32S
@ ABI_ILP32S
Definition: LoongArchBaseInfo.h:120

llvm::LoongArchABI::ABI_ILP32F
@ ABI_ILP32F
Definition: LoongArchBaseInfo.h:121

llvm::LoongArchABI::ABI_ILP32D
@ ABI_ILP32D
Definition: LoongArchBaseInfo.h:122

llvm::LoongArchABI::ABI_LP64D
@ ABI_LP64D
Definition: LoongArchBaseInfo.h:125

llvm::LoongArchABI::getTargetABI
ABI getTargetABI(StringRef ABIName)
Definition: LoongArchBaseInfo.cpp:176

llvm::LoongArchII::MO_CALL
@ MO_CALL
Definition: LoongArchBaseInfo.h:31

llvm::LoongArchII::MO_CALL_PLT
@ MO_CALL_PLT
Definition: LoongArchBaseInfo.h:32

llvm::LoongArchISD::NodeType
NodeType
Definition: LoongArchISelLowering.h:25

llvm::LoongArchISD::BSTRPICK
@ BSTRPICK
Definition: LoongArchISelLowering.h:65

llvm::LoongArchISD::VPACKEV
@ VPACKEV
Definition: LoongArchISelLowering.h:129

llvm::LoongArchISD::VPACKOD
@ VPACKOD
Definition: LoongArchISelLowering.h:130

llvm::LoongArchISD::REVB_2H
@ REVB_2H
Definition: LoongArchISelLowering.h:68

llvm::LoongArchISD::CSRWR
@ CSRWR
Definition: LoongArchISelLowering.h:100

llvm::LoongArchISD::IBAR
@ IBAR
Definition: LoongArchISelLowering.h:79

llvm::LoongArchISD::CLZ_W
@ CLZ_W
Definition: LoongArchISelLowering.h:61

llvm::LoongArchISD::MOVFCSR2GR
@ MOVFCSR2GR
Definition: LoongArchISelLowering.h:55

llvm::LoongArchISD::SLL_W
@ SLL_W
Definition: LoongArchISelLowering.h:39

llvm::LoongArchISD::BITREV_8B
@ BITREV_8B
Definition: LoongArchISelLowering.h:71

llvm::LoongArchISD::VREPLVEI
@ VREPLVEI
Definition: LoongArchISelLowering.h:134

llvm::LoongArchISD::FRECIPE
@ FRECIPE
Definition: LoongArchISelLowering.h:149

llvm::LoongArchISD::VREPLVE
@ VREPLVE
Definition: LoongArchISelLowering.h:125

llvm::LoongArchISD::TAIL
@ TAIL
Definition: LoongArchISelLowering.h:33

llvm::LoongArchISD::VPICK_SEXT_ELT
@ VPICK_SEXT_ELT
Definition: LoongArchISelLowering.h:139

llvm::LoongArchISD::VILVH
@ VILVH
Definition: LoongArchISelLowering.h:132

llvm::LoongArchISD::BSTRINS
@ BSTRINS
Definition: LoongArchISelLowering.h:64

llvm::LoongArchISD::TAIL_LARGE
@ TAIL_LARGE
Definition: LoongArchISelLowering.h:35

llvm::LoongArchISD::REVB_2W
@ REVB_2W
Definition: LoongArchISelLowering.h:69

llvm::LoongArchISD::BITREV_4B
@ BITREV_4B
Definition: LoongArchISelLowering.h:70

llvm::LoongArchISD::VPICKOD
@ VPICKOD
Definition: LoongArchISelLowering.h:128

llvm::LoongArchISD::VREPLGR2VR
@ VREPLGR2VR
Definition: LoongArchISelLowering.h:135

llvm::LoongArchISD::CTZ_W
@ CTZ_W
Definition: LoongArchISelLowering.h:62

llvm::LoongArchISD::MOD_W
@ MOD_W
Definition: LoongArchISelLowering.h:48

llvm::LoongArchISD::SRA_W
@ SRA_W
Definition: LoongArchISelLowering.h:40

llvm::LoongArchISD::IOCSRWR_D
@ IOCSRWR_D
Definition: LoongArchISelLowering.h:119

llvm::LoongArchISD::FTINT
@ FTINT
Definition: LoongArchISelLowering.h:58

llvm::LoongArchISD::ROTR_W
@ ROTR_W
Definition: LoongArchISelLowering.h:44

llvm::LoongArchISD::CSRXCHG
@ CSRXCHG
Definition: LoongArchISelLowering.h:109

llvm::LoongArchISD::DBAR
@ DBAR
Definition: LoongArchISelLowering.h:78

llvm::LoongArchISD::VALL_ZERO
@ VALL_ZERO
Definition: LoongArchISelLowering.h:143

llvm::LoongArchISD::SRL_W
@ SRL_W
Definition: LoongArchISelLowering.h:41

llvm::LoongArchISD::CPUCFG
@ CPUCFG
Definition: LoongArchISelLowering.h:122

llvm::LoongArchISD::VSHUF4I
@ VSHUF4I
Definition: LoongArchISelLowering.h:133

llvm::LoongArchISD::BREAK
@ BREAK
Definition: LoongArchISelLowering.h:75

llvm::LoongArchISD::IOCSRRD_D
@ IOCSRRD_D
Definition: LoongArchISelLowering.h:115

llvm::LoongArchISD::CALL_LARGE
@ CALL_LARGE
Definition: LoongArchISelLowering.h:31

llvm::LoongArchISD::CALL_MEDIUM
@ CALL_MEDIUM
Definition: LoongArchISelLowering.h:30

llvm::LoongArchISD::MOVGR2FCSR
@ MOVGR2FCSR
Definition: LoongArchISelLowering.h:56

llvm::LoongArchISD::FRSQRTE
@ FRSQRTE
Definition: LoongArchISelLowering.h:150

llvm::LoongArchISD::FIRST_NUMBER
@ FIRST_NUMBER
Definition: LoongArchISelLowering.h:26

llvm::LoongArchISD::VANY_NONZERO
@ VANY_NONZERO
Definition: LoongArchISelLowering.h:146

llvm::LoongArchISD::XVPERMI
@ XVPERMI
Definition: LoongArchISelLowering.h:136

llvm::LoongArchISD::MOVFR2GR_S_LA64
@ MOVFR2GR_S_LA64
Definition: LoongArchISelLowering.h:54

llvm::LoongArchISD::MOVGR2FR_W_LA64
@ MOVGR2FR_W_LA64
Definition: LoongArchISelLowering.h:53

llvm::LoongArchISD::DIV_W
@ DIV_W
Definition: LoongArchISelLowering.h:47

llvm::LoongArchISD::VALL_NONZERO
@ VALL_NONZERO
Definition: LoongArchISelLowering.h:145

llvm::LoongArchISD::SYSCALL
@ SYSCALL
Definition: LoongArchISelLowering.h:80

llvm::LoongArchISD::VPICKEV
@ VPICKEV
Definition: LoongArchISelLowering.h:127

llvm::LoongArchISD::TAIL_MEDIUM
@ TAIL_MEDIUM
Definition: LoongArchISelLowering.h:34

llvm::LoongArchISD::VILVL
@ VILVL
Definition: LoongArchISelLowering.h:131

llvm::LoongArchISD::VPICK_ZEXT_ELT
@ VPICK_ZEXT_ELT
Definition: LoongArchISelLowering.h:140

llvm::LoongArchISD::VANY_ZERO
@ VANY_ZERO
Definition: LoongArchISelLowering.h:144

llvm::LoongArchISD::CALL
@ CALL
Definition: LoongArchISelLowering.h:29

llvm::LoongArchISD::RET
@ RET
Definition: LoongArchISelLowering.h:32

llvm::LoongArchISD::VSHUF
@ VSHUF
Definition: LoongArchISelLowering.h:126

llvm::LoongArchISD::CSRRD
@ CSRRD
Definition: LoongArchISelLowering.h:92

llvm::LoongArchISD::DIV_WU
@ DIV_WU
Definition: LoongArchISelLowering.h:49

llvm::LoongArchISD::MOD_WU
@ MOD_WU
Definition: LoongArchISelLowering.h:50

llvm::LoongArchISD::BITREV_W
@ BITREV_W
Definition: LoongArchISelLowering.h:72

llvm::M68kBeads::DReg
@ DReg
Definition: M68kBaseInfo.h:106

llvm::M68k::MemAddrModeKind::j
@ j

llvm::MipsISD::Ins
@ Ins
Definition: MipsISelLowering.h:158

llvm::NVPTX::PTXLdStInstCode::V2
@ V2
Definition: NVPTX.h:163

llvm::RISCVFenceField::R
@ R
Definition: RISCVBaseInfo.h:373

llvm::RTLIB::getSINTTOFP
Libcall getSINTTOFP(EVT OpVT, EVT RetVT)
getSINTTOFP - Return the SINTTOFP_*_* value for the given types, or UNKNOWN_LIBCALL if there is none.
Definition: TargetLoweringBase.cpp:300

llvm::RTLIB::getUINTTOFP
Libcall getUINTTOFP(EVT OpVT, EVT RetVT)
getUINTTOFP - Return the UINTTOFP_*_* value for the given types, or UNKNOWN_LIBCALL if there is none.
Definition: TargetLoweringBase.cpp:346

llvm::RTLIB::Libcall
Libcall
RTLIB::Libcall enum - This enum defines all of the runtime library calls the backend can emit.
Definition: RuntimeLibcalls.h:33

llvm::RTLIB::getFPTOSINT
Libcall getFPTOSINT(EVT OpVT, EVT RetVT)
getFPTOSINT - Return the FPTOSINT_*_* value for the given types, or UNKNOWN_LIBCALL if there is none.
Definition: TargetLoweringBase.cpp:202

llvm::SPII::Load
@ Load
Definition: SparcInstrInfo.h:32

llvm::SyncScope::SingleThread
@ SingleThread
Synchronized with respect to signal handlers executing in the same thread.
Definition: LLVMContext.h:54

llvm::TLSModel::LocalDynamic
@ LocalDynamic
Definition: CodeGen.h:47

llvm::TLSModel::InitialExec
@ InitialExec
Definition: CodeGen.h:48

llvm::TLSModel::GeneralDynamic
@ GeneralDynamic
Definition: CodeGen.h:46

llvm::TLSModel::LocalExec
@ LocalExec
Definition: CodeGen.h:49

llvm::X86Disassembler::Reg
Reg
All possible values of the reg field in the ModR/M byte.
Definition: X86DisassemblerDecoder.h:621

llvm::cl::Hidden
@ Hidden
Definition: CommandLine.h:137

llvm::cl::init
initializer< Ty > init(const Ty &Val)
Definition: CommandLine.h:443

llvm::coro::ABI
ABI
Definition: CoroShape.h:25

llvm::logicalview::LVAttributeKind::Zero
@ Zero

llvm::ms_demangle::QualifierMangleMode::Result
@ Result

llvm
This is an optimization pass for GlobalISel generic memory operations.
Definition: AddressRanges.h:18

llvm::Offset
@ Offset
Definition: DWP.cpp:480

llvm::all_of
bool all_of(R &&range, UnaryPredicate P)
Provide wrappers to std::all_of which take ranges instead of having to pass begin/end explicitly.
Definition: STLExtras.h:1739

llvm::BuildMI
MachineInstrBuilder BuildMI(MachineFunction &MF, const MIMetadata &MIMD, const MCInstrDesc &MCID)
Builder interface. Specify how to create the initial instruction itself.
Definition: MachineInstrBuilder.h:373

llvm::Depth
@ Depth
Definition: SIMachineScheduler.h:36

llvm::isShiftedMask_64
constexpr bool isShiftedMask_64(uint64_t Value)
Return true if the argument contains a non-empty sequence of ones with the remainder zero (64 bit ver...
Definition: MathExtras.h:286

llvm::any_of
bool any_of(R &&range, UnaryPredicate P)
Provide wrappers to std::any_of which take ranges instead of having to pass begin/end explicitly.
Definition: STLExtras.h:1746

llvm::None
@ None
Definition: CodeGenData.h:106

llvm::dbgs
raw_ostream & dbgs()
dbgs() - This returns a reference to a raw_ostream for debugging messages.
Definition: Debug.cpp:163

llvm::report_fatal_error
void report_fatal_error(Error Err, bool gen_crash_diag=true)
Report a serious error, calling any installed error handler.
Definition: Error.cpp:167

llvm::isUInt
constexpr bool isUInt(uint64_t x)
Checks if an unsigned integer fits into the given bit width.
Definition: MathExtras.h:194

llvm::CaptureComponents::Address
@ Address

llvm::PackElem::Hi
@ Hi

llvm::PackElem::Lo
@ Lo

llvm::AtomicOrdering
AtomicOrdering
Atomic ordering for LLVM's memory model.
Definition: AtomicOrdering.h:56

llvm::AtomicOrdering::Monotonic
@ Monotonic

llvm::AtomicOrdering::AcquireRelease
@ AcquireRelease

llvm::AtomicOrdering::Acquire
@ Acquire

llvm::AtomicOrdering::Release
@ Release

llvm::AtomicOrdering::SequentiallyConsistent
@ SequentiallyConsistent

llvm::IRMemLocation::Other
@ Other
Any other memory.

llvm::getKillRegState
unsigned getKillRegState(bool B)
Definition: MachineInstrBuilder.h:555

llvm::Op
DWARFExpression::Operation Op
Definition: DWARFExpression.cpp:22

llvm::BitWidth
constexpr unsigned BitWidth
Definition: BitmaskEnum.h:217

llvm::VFParamKind::Vector
@ Vector

std::swap
void swap(llvm::BitVector &LHS, llvm::BitVector &RHS)
Implement std::swap in terms of BitVector swap.
Definition: BitVector.h:860

N
#define N

RegInfo
Definition: AMDGPUAsmParser.cpp:2770

llvm::Align
This struct is a compact representation of a valid (non-zero power of two) alignment.
Definition: Alignment.h:39

llvm::EVT
Extended Value Type.
Definition: ValueTypes.h:35

llvm::EVT::changeVectorElementTypeToInteger
EVT changeVectorElementTypeToInteger() const
Return a vector with the same number of elements as this vector, but with the element type converted ...
Definition: ValueTypes.h:94

llvm::EVT::getStoreSize
TypeSize getStoreSize() const
Return the number of bytes overwritten by a store of the specified value type.
Definition: ValueTypes.h:390

llvm::EVT::isSimple
bool isSimple() const
Test if the given EVT is simple (as opposed to being extended).
Definition: ValueTypes.h:137

llvm::EVT::getSizeInBits
TypeSize getSizeInBits() const
Return the size of the specified value type in bits.
Definition: ValueTypes.h:368

llvm::EVT::getScalarSizeInBits
uint64_t getScalarSizeInBits() const
Definition: ValueTypes.h:380

llvm::EVT::getSimpleVT
MVT getSimpleVT() const
Return the SimpleValueType held in the specified simple EVT.
Definition: ValueTypes.h:311

llvm::EVT::is128BitVector
bool is128BitVector() const
Return true if this is a 128-bit vector type.
Definition: ValueTypes.h:207

llvm::EVT::getFixedSizeInBits
uint64_t getFixedSizeInBits() const
Return the size of the specified fixed width value type in bits.
Definition: ValueTypes.h:376

llvm::EVT::getFloatingPointVT
static EVT getFloatingPointVT(unsigned BitWidth)
Returns the EVT that represents a floating-point type with the given number of bits.
Definition: ValueTypes.h:59

llvm::EVT::isVector
bool isVector() const
Return true if this is a vector value type.
Definition: ValueTypes.h:168

llvm::EVT::getScalarType
EVT getScalarType() const
If this is a vector type, return the element type, otherwise return this.
Definition: ValueTypes.h:318

llvm::EVT::is256BitVector
bool is256BitVector() const
Return true if this is a 256-bit vector type.
Definition: ValueTypes.h:212

llvm::EVT::getTypeForEVT
Type * getTypeForEVT(LLVMContext &Context) const
This method returns an LLVM type corresponding to the specified EVT.
Definition: ValueTypes.cpp:210

llvm::EVT::getVectorElementType
EVT getVectorElementType() const
Given a vector type, return the type of each element.
Definition: ValueTypes.h:323

llvm::EVT::isScalarInteger
bool isScalarInteger() const
Return true if this is an integer, but not a vector.
Definition: ValueTypes.h:157

llvm::EVT::getVectorNumElements
unsigned getVectorNumElements() const
Given a vector type, return the number of elements it contains.
Definition: ValueTypes.h:331

llvm::ISD::ArgFlagsTy
Definition: TargetCallingConv.h:27

llvm::ISD::ArgFlagsTy::isSplitEnd
bool isSplitEnd() const
Definition: TargetCallingConv.h:139

llvm::ISD::ArgFlagsTy::getNonZeroOrigAlign
Align getNonZeroOrigAlign() const
Definition: TargetCallingConv.h:164

llvm::ISD::ArgFlagsTy::isSplit
bool isSplit() const
Definition: TargetCallingConv.h:136

llvm::ISD::InputArg
InputArg - This struct carries flags and type information about a single incoming (formal) argument o...
Definition: TargetCallingConv.h:199

llvm::KnownBits::Zero
APInt Zero
Definition: KnownBits.h:24

llvm::LoongArchRegisterInfo
Definition: LoongArchRegisterInfo.h:24

llvm::LoongArchRegisterInfo::getFrameRegister
Register getFrameRegister(const MachineFunction &MF) const override
Definition: LoongArchRegisterInfo.cpp:107

llvm::LoongArchRegisterInfo::getReservedRegs
BitVector getReservedRegs(const MachineFunction &MF) const override
Definition: LoongArchRegisterInfo.cpp:86

llvm::MachinePointerInfo
This class contains a discriminated union of information about pointers in memory operands,...
Definition: MachineMemOperand.h:41

llvm::MachinePointerInfo::getGOT
static MachinePointerInfo getGOT(MachineFunction &MF)
Return a MachinePointerInfo record that refers to a GOT entry.
Definition: MachineOperand.cpp:1081

llvm::MachinePointerInfo::getFixedStack
static MachinePointerInfo getFixedStack(MachineFunction &MF, int FI, int64_t Offset=0)
Return a MachinePointerInfo record that refers to the specified FrameIndex.
Definition: MachineOperand.cpp:1072

llvm::MemOp
Definition: TargetLowering.h:115

llvm::SDVTList
This represents a list of ValueType's that has been intern'd by a SelectionDAG.
Definition: SelectionDAGNodes.h:79

llvm::TargetLoweringBase::AddrMode
This represents an addressing mode of: BaseGV + BaseOffs + BaseReg + Scale*ScaleReg + ScalableOffset*...
Definition: TargetLowering.h:2816

llvm::TargetLoweringBase::AddrMode::BaseOffs
int64_t BaseOffs
Definition: TargetLowering.h:2818

llvm::TargetLoweringBase::AddrMode::BaseGV
GlobalValue * BaseGV
Definition: TargetLowering.h:2817

llvm::TargetLoweringBase::AddrMode::HasBaseReg
bool HasBaseReg
Definition: TargetLowering.h:2819

llvm::TargetLoweringBase::AddrMode::Scale
int64_t Scale
Definition: TargetLowering.h:2820

llvm::TargetLoweringBase::IntrinsicInfo
Definition: TargetLowering.h:1202

llvm::TargetLowering::CallLoweringInfo
This structure contains all information that is necessary for lowering calls.
Definition: TargetLowering.h:4529

llvm::TargetLowering::CallLoweringInfo::IsTailCall
bool IsTailCall
Definition: TargetLowering.h:4545

llvm::TargetLowering::CallLoweringInfo::Callee
SDValue Callee
Definition: TargetLowering.h:4552

llvm::TargetLowering::CallLoweringInfo::DL
SDLoc DL
Definition: TargetLowering.h:4555

llvm::TargetLowering::CallLoweringInfo::IsVarArg
bool IsVarArg
Definition: TargetLowering.h:4534

llvm::TargetLowering::CallLoweringInfo::Ins
SmallVector< ISD::InputArg, 32 > Ins
Definition: TargetLowering.h:4559

llvm::TargetLowering::CallLoweringInfo::Chain
SDValue Chain
Definition: TargetLowering.h:4530

llvm::TargetLowering::CallLoweringInfo::NoMerge
bool NoMerge
Definition: TargetLowering.h:4541

llvm::TargetLowering::CallLoweringInfo::CB
const CallBase * CB
Definition: TargetLowering.h:4556

llvm::TargetLowering::CallLoweringInfo::Outs
SmallVector< ISD::OutputArg, 32 > Outs
Definition: TargetLowering.h:4557

llvm::TargetLowering::CallLoweringInfo::OutVals
SmallVector< SDValue, 32 > OutVals
Definition: TargetLowering.h:4558

llvm::TargetLowering::CallLoweringInfo::CallConv
CallingConv::ID CallConv
Definition: TargetLowering.h:4551

llvm::TargetLowering::CallLoweringInfo::DAG
SelectionDAG & DAG
Definition: TargetLowering.h:4554

llvm::TargetLowering::DAGCombinerInfo
Definition: TargetLowering.h:4228

llvm::TargetLowering::DAGCombinerInfo::isBeforeLegalizeOps
bool isBeforeLegalizeOps() const
Definition: TargetLowering.h:4240

llvm::TargetLowering::DAGCombinerInfo::DAG
SelectionDAG & DAG
Definition: TargetLowering.h:4234

llvm::TargetLowering::MakeLibCallOptions
This structure is used to pass arguments to makeLibCall function.
Definition: TargetLowering.h:4714

llvm::TargetLowering::MakeLibCallOptions::setTypeListBeforeSoften
MakeLibCallOptions & setTypeListBeforeSoften(ArrayRef< EVT > OpsVT, EVT RetVT, bool Value=true)
Definition: TargetLowering.h:4749

llvm::cl::desc
Definition: CommandLine.h:409