/build/llvm-toolchain-snapshot-13~++20210621111111+acefe0eaaf82/llvm/lib/Target/AArch64/GISel/AArch64LegalizerInfo.cpp

Bug Summary

File:	llvm/lib/Target/AArch64/GISel/AArch64LegalizerInfo.cpp
Warning:	line 602, column 40 Division by zero

Annotated Source Code

Press '?' to see keyboard shortcuts

Show analyzer invocation

clang -cc1 -cc1 -triple x86_64-pc-linux-gnu -analyze -disable-free -disable-llvm-verifier -discard-value-names -main-file-name AArch64LegalizerInfo.cpp -analyzer-store=region -analyzer-opt-analyze-nested-blocks -analyzer-checker=core -analyzer-checker=apiModeling -analyzer-checker=unix -analyzer-checker=deadcode -analyzer-checker=cplusplus -analyzer-checker=security.insecureAPI.UncheckedReturn -analyzer-checker=security.insecureAPI.getpw -analyzer-checker=security.insecureAPI.gets -analyzer-checker=security.insecureAPI.mktemp -analyzer-checker=security.insecureAPI.mkstemp -analyzer-checker=security.insecureAPI.vfork -analyzer-checker=nullability.NullPassedToNonnull -analyzer-checker=nullability.NullReturnedFromNonnull -analyzer-output plist -w -setup-static-analyzer -analyzer-config-compatibility-mode=true -mrelocation-model pic -pic-level 2 -mframe-pointer=none -fmath-errno -fno-rounding-math -mconstructor-aliases -munwind-tables -target-cpu x86-64 -tune-cpu generic -debugger-tuning=gdb -ffunction-sections -fdata-sections -fcoverage-compilation-dir=/build/llvm-toolchain-snapshot-13~++20210621111111+acefe0eaaf82/build-llvm/lib/Target/AArch64 -resource-dir /usr/lib/llvm-13/lib/clang/13.0.0 -D _DEBUG -D _GNU_SOURCE -D __STDC_CONSTANT_MACROS -D __STDC_FORMAT_MACROS -D __STDC_LIMIT_MACROS -I /build/llvm-toolchain-snapshot-13~++20210621111111+acefe0eaaf82/build-llvm/lib/Target/AArch64 -I /build/llvm-toolchain-snapshot-13~++20210621111111+acefe0eaaf82/llvm/lib/Target/AArch64 -I /build/llvm-toolchain-snapshot-13~++20210621111111+acefe0eaaf82/build-llvm/include -I /build/llvm-toolchain-snapshot-13~++20210621111111+acefe0eaaf82/llvm/include -D NDEBUG -U NDEBUG -internal-isystem /usr/lib/gcc/x86_64-linux-gnu/10/../../../../include/c++/10 -internal-isystem /usr/lib/gcc/x86_64-linux-gnu/10/../../../../include/x86_64-linux-gnu/c++/10 -internal-isystem /usr/lib/gcc/x86_64-linux-gnu/10/../../../../include/c++/10/backward -internal-isystem /usr/lib/llvm-13/lib/clang/13.0.0/include 
-internal-isystem /usr/local/include -internal-isystem /usr/lib/gcc/x86_64-linux-gnu/10/../../../../x86_64-linux-gnu/include -internal-externc-isystem /usr/include/x86_64-linux-gnu -internal-externc-isystem /include -internal-externc-isystem /usr/include -O2 -Wno-unused-parameter -Wwrite-strings -Wno-missing-field-initializers -Wno-long-long -Wno-maybe-uninitialized -Wno-class-memaccess -Wno-redundant-move -Wno-pessimizing-move -Wno-noexcept-type -Wno-comment -std=c++14 -fdeprecated-macro -fdebug-compilation-dir=/build/llvm-toolchain-snapshot-13~++20210621111111+acefe0eaaf82/build-llvm/lib/Target/AArch64 -fdebug-prefix-map=/build/llvm-toolchain-snapshot-13~++20210621111111+acefe0eaaf82=. -ferror-limit 19 -fvisibility hidden -fvisibility-inlines-hidden -stack-protector 2 -fgnuc-version=4.2.1 -vectorize-loops -vectorize-slp -analyzer-output=html -analyzer-config stable-report-filename=true -faddrsig -D__GCC_HAVE_DWARF2_CFI_ASM=1 -o /tmp/scan-build-2021-06-21-164211-33944-1 -x c++ /build/llvm-toolchain-snapshot-13~++20210621111111+acefe0eaaf82/llvm/lib/Target/AArch64/GISel/AArch64LegalizerInfo.cpp

/build/llvm-toolchain-snapshot-13~++20210621111111+acefe0eaaf82/llvm/lib/Target/AArch64/GISel/AArch64LegalizerInfo.cpp

→

1//===- AArch64LegalizerInfo.cpp ----------------------------------*- C++ -*-==//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7//===----------------------------------------------------------------------===//
8/// \file
9/// This file implements the targeting of the Machinelegalizer class for
10/// AArch64.
11/// \todo This should be generated by TableGen.
12//===----------------------------------------------------------------------===//

14#include "AArch64LegalizerInfo.h"
15#include "AArch64RegisterBankInfo.h"
16#include "AArch64Subtarget.h"
17#include "llvm/CodeGen/GlobalISel/LegalizerHelper.h"
18#include "llvm/CodeGen/GlobalISel/LegalizerInfo.h"
19#include "llvm/CodeGen/GlobalISel/MachineIRBuilder.h"
20#include "llvm/CodeGen/GlobalISel/Utils.h"
21#include "llvm/CodeGen/MachineInstr.h"
22#include "llvm/CodeGen/MachineRegisterInfo.h"
23#include "llvm/CodeGen/TargetOpcodes.h"
24#include "llvm/CodeGen/ValueTypes.h"
25#include "llvm/IR/DerivedTypes.h"
26#include "llvm/IR/IntrinsicsAArch64.h"
27#include "llvm/IR/Type.h"
28#include "llvm/Support/MathExtras.h"
29#include <initializer_list>

31#define DEBUG_TYPE "aarch64-legalinfo"

33using namespace llvm;
34using namespace LegalizeActions;
35using namespace LegalizeMutations;
36using namespace LegalityPredicates;

38AArch64LegalizerInfo::AArch64LegalizerInfo(const AArch64Subtarget &ST)
  : ST(&ST) {
using namespace TargetOpcode;
const LLT p0 = LLT::pointer(0, 64);
const LLT s1 = LLT::scalar(1);
const LLT s8 = LLT::scalar(8);
const LLT s16 = LLT::scalar(16);
const LLT s32 = LLT::scalar(32);
const LLT s64 = LLT::scalar(64);
const LLT s128 = LLT::scalar(128);
const LLT s256 = LLT::scalar(256);
const LLT s512 = LLT::scalar(512);
const LLT v16s8 = LLT::vector(16, 8);
const LLT v8s8 = LLT::vector(8, 8);
const LLT v4s8 = LLT::vector(4, 8);
const LLT v8s16 = LLT::vector(8, 16);
const LLT v4s16 = LLT::vector(4, 16);
const LLT v2s16 = LLT::vector(2, 16);
const LLT v2s32 = LLT::vector(2, 32);
const LLT v4s32 = LLT::vector(4, 32);
const LLT v2s64 = LLT::vector(2, 64);
const LLT v2p0 = LLT::vector(2, p0);

std::initializer_list<LLT> PackedVectorAllTypeList = {/* Begin 128bit types */
                                                      v16s8, v8s16, v4s32,
                                                      v2s64, v2p0,
                                                      /* End 128bit types */
                                                      /* Begin 64bit types */
                                                      v8s8, v4s16, v2s32};

const TargetMachine &TM = ST.getTargetLowering()->getTargetMachine();

// FIXME: support subtargets which have neon/fp-armv8 disabled.
if (!ST.hasNEON() || !ST.hasFPARMv8()) {
  getLegacyLegalizerInfo().computeTables();
  return;
}

// Some instructions only support s16 if the subtarget has full 16-bit FP
// support.
const bool HasFP16 = ST.hasFullFP16();
const LLT &MinFPScalar = HasFP16 ? s16 : s32;

getActionDefinitionsBuilder({G_IMPLICIT_DEF, G_FREEZE})
    .legalFor({p0, s1, s8, s16, s32, s64})
    .legalFor(PackedVectorAllTypeList)
    .clampScalar(0, s1, s64)
    .widenScalarToNextPow2(0, 8)
    .fewerElementsIf(
        [=](const LegalityQuery &Query) {
          return Query.Types[0].isVector() &&
                 (Query.Types[0].getElementType() != s64 ||
                  Query.Types[0].getNumElements() != 2);
        },
        [=](const LegalityQuery &Query) {
          LLT EltTy = Query.Types[0].getElementType();
          if (EltTy == s64)
            return std::make_pair(0, LLT::vector(2, 64));
          return std::make_pair(0, EltTy);
        });

getActionDefinitionsBuilder(G_PHI).legalFor({p0, s16, s32, s64})
    .legalFor(PackedVectorAllTypeList)
    .clampScalar(0, s16, s64)
    .widenScalarToNextPow2(0);

getActionDefinitionsBuilder(G_BSWAP)
    .legalFor({s32, s64, v4s32, v2s32, v2s64})
    .clampScalar(0, s32, s64)
    .widenScalarToNextPow2(0);

getActionDefinitionsBuilder({G_ADD, G_SUB, G_MUL, G_AND, G_OR, G_XOR})
    .legalFor({s32, s64, v2s32, v4s32, v4s16, v8s16, v16s8, v8s8})
    .scalarizeIf(
        [=](const LegalityQuery &Query) {
          return Query.Opcode == G_MUL && Query.Types[0] == v2s64;
        },
        0)
    .legalFor({v2s64})
    .clampScalar(0, s32, s64)
    .widenScalarToNextPow2(0)
    .clampNumElements(0, v2s32, v4s32)
    .clampNumElements(0, v2s64, v2s64)
    .moreElementsToNextPow2(0);

getActionDefinitionsBuilder({G_SHL, G_ASHR, G_LSHR})
    .customIf([=](const LegalityQuery &Query) {
      const auto &SrcTy = Query.Types[0];
      const auto &AmtTy = Query.Types[1];
      return !SrcTy.isVector() && SrcTy.getSizeInBits() == 32 &&
             AmtTy.getSizeInBits() == 32;
    })
    .legalFor({
        {s32, s32},
        {s32, s64},
        {s64, s64},
        {v8s8, v8s8},
        {v16s8, v16s8},
        {v4s16, v4s16},
        {v8s16, v8s16},
        {v2s32, v2s32},
        {v4s32, v4s32},
        {v2s64, v2s64},
    })
    .clampScalar(1, s32, s64)
    .clampScalar(0, s32, s64)
    .widenScalarToNextPow2(0)
    .clampNumElements(0, v2s32, v4s32)
    .clampNumElements(0, v2s64, v2s64)
    .moreElementsToNextPow2(0)
    .minScalarSameAs(1, 0);

getActionDefinitionsBuilder(G_PTR_ADD)
    .legalFor({{p0, s64}, {v2p0, v2s64}})
    .clampScalar(1, s64, s64);

getActionDefinitionsBuilder(G_PTRMASK).legalFor({{p0, s64}});

getActionDefinitionsBuilder({G_SDIV, G_UDIV})
    .legalFor({s32, s64})
    .libcallFor({s128})
    .clampScalar(0, s32, s64)
    .widenScalarToNextPow2(0)
    .scalarize(0);

getActionDefinitionsBuilder({G_SREM, G_UREM, G_SDIVREM, G_UDIVREM})
    .lowerFor({s1, s8, s16, s32, s64});

getActionDefinitionsBuilder({G_SMULO, G_UMULO}).lowerFor({{s64, s1}});

getActionDefinitionsBuilder({G_SMULH, G_UMULH}).legalFor({s32, s64});

getActionDefinitionsBuilder({G_SMIN, G_SMAX, G_UMIN, G_UMAX})
    .lowerIf([=](const LegalityQuery &Q) { return Q.Types[0].isScalar(); });

getActionDefinitionsBuilder(
    {G_SADDE, G_SSUBE, G_UADDE, G_USUBE, G_SADDO, G_SSUBO, G_UADDO, G_USUBO})
    .legalFor({{s32, s1}, {s64, s1}})
    .clampScalar(0, s32, s64)
    .widenScalarToNextPow2(0);

getActionDefinitionsBuilder({G_FADD, G_FSUB, G_FMUL, G_FDIV, G_FNEG})
    .legalFor({s32, s64, v2s64, v4s32, v2s32})
    .clampNumElements(0, v2s32, v4s32)
    .clampNumElements(0, v2s64, v2s64);

getActionDefinitionsBuilder(G_FREM).libcallFor({s32, s64});

getActionDefinitionsBuilder({G_FCEIL, G_FABS, G_FSQRT, G_FFLOOR, G_FRINT,
                             G_FMA, G_INTRINSIC_TRUNC, G_INTRINSIC_ROUND,
                             G_FNEARBYINT, G_INTRINSIC_LRINT})
    // If we don't have full FP16 support, then scalarize the elements of
    // vectors containing fp16 types.
    .fewerElementsIf(
        [=, &ST](const LegalityQuery &Query) {
          const auto &Ty = Query.Types[0];
          return Ty.isVector() && Ty.getElementType() == s16 &&
                 !ST.hasFullFP16();
        },
        [=](const LegalityQuery &Query) { return std::make_pair(0, s16); })
    // If we don't have full FP16 support, then widen s16 to s32 if we
    // encounter it.
    .widenScalarIf(
        [=, &ST](const LegalityQuery &Query) {
          return Query.Types[0] == s16 && !ST.hasFullFP16();
        },
        [=](const LegalityQuery &Query) { return std::make_pair(0, s32); })
    .legalFor({s16, s32, s64, v2s32, v4s32, v2s64, v2s16, v4s16, v8s16});

getActionDefinitionsBuilder(
    {G_FCOS, G_FSIN, G_FLOG10, G_FLOG, G_FLOG2, G_FEXP, G_FEXP2, G_FPOW})
    // We need a call for these, so we always need to scalarize.
    .scalarize(0)
    // Regardless of FP16 support, widen 16-bit elements to 32-bits.
    .minScalar(0, s32)
    .libcallFor({s32, s64, v2s32, v4s32, v2s64});

getActionDefinitionsBuilder(G_INSERT)
    .unsupportedIf([=](const LegalityQuery &Query) {
      return Query.Types[0].getSizeInBits() <= Query.Types[1].getSizeInBits();
    })
    .legalIf([=](const LegalityQuery &Query) {
      const LLT &Ty0 = Query.Types[0];
      const LLT &Ty1 = Query.Types[1];
      if (Ty0 != s32 && Ty0 != s64 && Ty0 != p0)
        return false;
      return isPowerOf2_32(Ty1.getSizeInBits()) &&
             (Ty1.getSizeInBits() == 1 || Ty1.getSizeInBits() >= 8);
    })
    .clampScalar(0, s32, s64)
    .widenScalarToNextPow2(0)
    .maxScalarIf(typeInSet(0, {s32}), 1, s16)
    .maxScalarIf(typeInSet(0, {s64}), 1, s32)
    .widenScalarToNextPow2(1);

getActionDefinitionsBuilder(G_EXTRACT)
    .unsupportedIf([=](const LegalityQuery &Query) {
      return Query.Types[0].getSizeInBits() >= Query.Types[1].getSizeInBits();
    })
    .legalIf([=](const LegalityQuery &Query) {
      const LLT &Ty0 = Query.Types[0];
      const LLT &Ty1 = Query.Types[1];
      if (Ty1 != s32 && Ty1 != s64 && Ty1 != s128)
        return false;
      if (Ty1 == p0)
        return true;
      return isPowerOf2_32(Ty0.getSizeInBits()) &&
             (Ty0.getSizeInBits() == 1 || Ty0.getSizeInBits() >= 8);
    })
    .clampScalar(1, s32, s128)
    .widenScalarToNextPow2(1)
    .maxScalarIf(typeInSet(1, {s32}), 0, s16)
    .maxScalarIf(typeInSet(1, {s64}), 0, s32)
    .widenScalarToNextPow2(0);

getActionDefinitionsBuilder({G_SEXTLOAD, G_ZEXTLOAD})
    .lowerIf(atomicOrderingAtLeastOrStrongerThan(0, AtomicOrdering::Unordered))
    .legalForTypesWithMemDesc({{s32, p0, 8, 8},
                               {s32, p0, 16, 8},
                               {s32, p0, 32, 8},
                               {s64, p0, 8, 2},
                               {s64, p0, 16, 2},
                               {s64, p0, 32, 4},
                               {s64, p0, 64, 8},
                               {p0, p0, 64, 8},
                               {v2s32, p0, 64, 8}})
    .clampScalar(0, s32, s64)
    .widenScalarToNextPow2(0)
    // TODO: We could support sum-of-pow2's but the lowering code doesn't know
    //       how to do that yet.
    .unsupportedIfMemSizeNotPow2()
    // Lower anything left over into G_*EXT and G_LOAD
    .lower();

auto IsPtrVecPred = [=](const LegalityQuery &Query) {
  const LLT &ValTy = Query.Types[0];
  if (!ValTy.isVector())
    return false;
  const LLT EltTy = ValTy.getElementType();
  return EltTy.isPointer() && EltTy.getAddressSpace() == 0;
};

getActionDefinitionsBuilder(G_LOAD)
    .legalForTypesWithMemDesc({{s8, p0, 8, 8},
                               {s16, p0, 16, 8},
                               {s32, p0, 32, 8},
                               {s64, p0, 64, 8},
                               {p0, p0, 64, 8},
                               {s128, p0, 128, 8},
                               {v8s8, p0, 64, 8},
                               {v16s8, p0, 128, 8},
                               {v4s16, p0, 64, 8},
                               {v8s16, p0, 128, 8},
                               {v2s32, p0, 64, 8},
                               {v4s32, p0, 128, 8},
                               {v2s64, p0, 128, 8}})
    // These extends are also legal
    .legalForTypesWithMemDesc({{s32, p0, 8, 8}, {s32, p0, 16, 8}})
    .clampScalar(0, s8, s64)
    .lowerIfMemSizeNotPow2()
    .widenScalarToNextPow2(0)
    .narrowScalarIf([=](const LegalityQuery &Query) {
      // Clamp extending load results to 32-bits.
      return Query.Types[0].isScalar() &&
             Query.Types[0].getSizeInBits() != Query.MMODescrs[0].SizeInBits &&
             Query.Types[0].getSizeInBits() > 32;
      },
      changeTo(0, s32))
    // Lower any any-extending loads left into G_ANYEXT and G_LOAD
    .lowerIf([=](const LegalityQuery &Query) {
      return Query.Types[0].getSizeInBits() != Query.MMODescrs[0].SizeInBits;
    })
    .clampMaxNumElements(0, s8, 16)
    .clampMaxNumElements(0, s16, 8)
    .clampMaxNumElements(0, s32, 4)
    .clampMaxNumElements(0, s64, 2)
    .customIf(IsPtrVecPred);

getActionDefinitionsBuilder(G_STORE)
    .legalForTypesWithMemDesc({{s8, p0, 8, 8},
                               {s16, p0, 8, 8}, // truncstorei8 from s16
                               {s32, p0, 8, 8}, // truncstorei8 from s32
                               {s64, p0, 8, 8}, // truncstorei8 from s64
                               {s16, p0, 16, 8},
                               {s32, p0, 16, 8}, // truncstorei16 from s32
                               {s64, p0, 16, 8}, // truncstorei16 from s64
                               {s32, p0, 8, 8},
                               {s32, p0, 16, 8},
                               {s32, p0, 32, 8},
                               {s64, p0, 64, 8},
                               {s64, p0, 32, 8}, // truncstorei32 from s64
                               {p0, p0, 64, 8},
                               {s128, p0, 128, 8},
                               {v16s8, p0, 128, 8},
                               {v8s8, p0, 64, 8},
                               {v4s16, p0, 64, 8},
                               {v8s16, p0, 128, 8},
                               {v2s32, p0, 64, 8},
                               {v4s32, p0, 128, 8},
                               {v2s64, p0, 128, 8}})
    .clampScalar(0, s8, s64)
    .lowerIf([=](const LegalityQuery &Query) {
      return Query.Types[0].isScalar() &&
             Query.Types[0].getSizeInBits() != Query.MMODescrs[0].SizeInBits;
    })
    // Maximum: sN * k = 128
    .clampMaxNumElements(0, s8, 16)
    .clampMaxNumElements(0, s16, 8)
    .clampMaxNumElements(0, s32, 4)
    .clampMaxNumElements(0, s64, 2)
    .lowerIfMemSizeNotPow2()
    .customIf(IsPtrVecPred);

// Constants
getActionDefinitionsBuilder(G_CONSTANT)
    .legalFor({p0, s8, s16, s32, s64})
    .clampScalar(0, s8, s64)
    .widenScalarToNextPow2(0);
getActionDefinitionsBuilder(G_FCONSTANT)
    .legalIf([=](const LegalityQuery &Query) {
      const auto &Ty = Query.Types[0];
      if (HasFP16 && Ty == s16)
        return true;
      return Ty == s32 || Ty == s64 || Ty == s128;
    })
    .clampScalar(0, MinFPScalar, s128);

getActionDefinitionsBuilder({G_ICMP, G_FCMP})
    .legalFor({{s32, s32},
               {s32, s64},
               {s32, p0},
               {v4s32, v4s32},
               {v2s32, v2s32},
               {v2s64, v2s64},
               {v2s64, v2p0},
               {v4s16, v4s16},
               {v8s16, v8s16},
               {v8s8, v8s8},
               {v16s8, v16s8}})
    .clampScalar(1, s32, s64)
    .clampScalar(0, s32, s32)
    .minScalarEltSameAsIf(
        [=](const LegalityQuery &Query) {
          const LLT &Ty = Query.Types[0];
          const LLT &SrcTy = Query.Types[1];
          return Ty.isVector() && !SrcTy.getElementType().isPointer() &&
                 Ty.getElementType() != SrcTy.getElementType();
        },
        0, 1)
    .minScalarOrEltIf(
        [=](const LegalityQuery &Query) { return Query.Types[1] == v2s16; },
        1, s32)
    .minScalarOrEltIf(
        [=](const LegalityQuery &Query) { return Query.Types[1] == v2p0; }, 0,
        s64)
    .widenScalarOrEltToNextPow2(1)
    .clampNumElements(0, v2s32, v4s32);

// Extensions
auto ExtLegalFunc = [=](const LegalityQuery &Query) {
  unsigned DstSize = Query.Types[0].getSizeInBits();

  if (DstSize == 128 && !Query.Types[0].isVector())
    return false; // Extending to a scalar s128 needs narrowing.

  // Make sure that we have something that will fit in a register, and
  // make sure it's a power of 2.
  if (DstSize < 8 || DstSize > 128 || !isPowerOf2_32(DstSize))
    return false;

  const LLT &SrcTy = Query.Types[1];

  // Special case for s1.
  if (SrcTy == s1)
    return true;

  // Make sure we fit in a register otherwise. Don't bother checking that
  // the source type is below 128 bits. We shouldn't be allowing anything
  // through which is wider than the destination in the first place.
  unsigned SrcSize = SrcTy.getSizeInBits();
  if (SrcSize < 8 || !isPowerOf2_32(SrcSize))
    return false;

  return true;
};
getActionDefinitionsBuilder({G_ZEXT, G_SEXT, G_ANYEXT})
    .legalIf(ExtLegalFunc)
    .clampScalar(0, s64, s64); // Just for s128, others are handled above.

getActionDefinitionsBuilder(G_TRUNC)
    .minScalarOrEltIf(
        [=](const LegalityQuery &Query) { return Query.Types[0].isVector(); },
        0, s8)
    .customIf([=](const LegalityQuery &Query) {
      LLT DstTy = Query.Types[0];
      LLT SrcTy = Query.Types[1];
      return DstTy == v8s8 && SrcTy.getSizeInBits() > 128;
    })
    .alwaysLegal();

getActionDefinitionsBuilder(G_SEXT_INREG).legalFor({s32, s64}).lower();

// FP conversions
getActionDefinitionsBuilder(G_FPTRUNC)
    .legalFor(
        {{s16, s32}, {s16, s64}, {s32, s64}, {v4s16, v4s32}, {v2s32, v2s64}})
    .clampMaxNumElements(0, s32, 2);
getActionDefinitionsBuilder(G_FPEXT)
    .legalFor(
        {{s32, s16}, {s64, s16}, {s64, s32}, {v4s32, v4s16}, {v2s64, v2s32}})
    .clampMaxNumElements(0, s64, 2);

// Conversions
getActionDefinitionsBuilder({G_FPTOSI, G_FPTOUI})
    .legalForCartesianProduct({s32, s64, v2s64, v4s32, v2s32})
    .clampScalar(0, s32, s64)
    .widenScalarToNextPow2(0)
    .clampScalar(1, s32, s64)
    .widenScalarToNextPow2(1);

getActionDefinitionsBuilder({G_SITOFP, G_UITOFP})
    .legalForCartesianProduct({s32, s64, v2s64, v4s32, v2s32})
    .clampScalar(1, s32, s64)
    .minScalarSameAs(1, 0)
    .clampScalar(0, s32, s64)
    .widenScalarToNextPow2(0);

// Control-flow
getActionDefinitionsBuilder(G_BRCOND).legalFor({s1, s8, s16, s32});
getActionDefinitionsBuilder(G_BRINDIRECT).legalFor({p0});

getActionDefinitionsBuilder(G_SELECT)
    .legalFor({{s32, s1}, {s64, s1}, {p0, s1}})
    .clampScalar(0, s32, s64)
    .widenScalarToNextPow2(0)
    .minScalarEltSameAsIf(all(isVector(0), isVector(1)), 1, 0)
    .lowerIf(isVector(0));

// Pointer-handling
getActionDefinitionsBuilder(G_FRAME_INDEX).legalFor({p0});

if (TM.getCodeModel() == CodeModel::Small)
  getActionDefinitionsBuilder(G_GLOBAL_VALUE).custom();
else
  getActionDefinitionsBuilder(G_GLOBAL_VALUE).legalFor({p0});

getActionDefinitionsBuilder(G_PTRTOINT)
    .legalForCartesianProduct({s1, s8, s16, s32, s64}, {p0})
    .maxScalar(0, s64)
    .widenScalarToNextPow2(0, /*Min*/ 8);

getActionDefinitionsBuilder(G_INTTOPTR)
    .unsupportedIf([&](const LegalityQuery &Query) {
      return Query.Types[0].getSizeInBits() != Query.Types[1].getSizeInBits();
    })
    .legalFor({{p0, s64}});

// Casts for 32 and 64-bit width type are just copies.
// Same for 128-bit width type, except they are on the FPR bank.
getActionDefinitionsBuilder(G_BITCAST)
    // FIXME: This is wrong since G_BITCAST is not allowed to change the
    // number of bits but it's what the previous code described and fixing
    // it breaks tests.
    .legalForCartesianProduct({s1, s8, s16, s32, s64, s128, v16s8, v8s8, v4s8,
                               v8s16, v4s16, v2s16, v4s32, v2s32, v2s64,
                               v2p0});

getActionDefinitionsBuilder(G_VASTART).legalFor({p0});

// va_list must be a pointer, but most sized types are pretty easy to handle
// as the destination.
getActionDefinitionsBuilder(G_VAARG)
    .customForCartesianProduct({s8, s16, s32, s64, p0}, {p0})
    .clampScalar(0, s8, s64)
    .widenScalarToNextPow2(0, /*Min*/ 8);

getActionDefinitionsBuilder(G_ATOMIC_CMPXCHG_WITH_SUCCESS)
    .lowerIf(
        all(typeInSet(0, {s8, s16, s32, s64, s128}), typeIs(1, s1), typeIs(2, p0)));

getActionDefinitionsBuilder(G_ATOMIC_CMPXCHG)
    .legalIf(all(typeInSet(0, {s8, s16, s32, s64}), typeIs(1, p0)))
    .customIf([](const LegalityQuery &Query) {
      return Query.Types[0].getSizeInBits() == 128;
    });

getActionDefinitionsBuilder(
    {G_ATOMICRMW_XCHG, G_ATOMICRMW_ADD, G_ATOMICRMW_SUB, G_ATOMICRMW_AND,
     G_ATOMICRMW_OR, G_ATOMICRMW_XOR, G_ATOMICRMW_MIN, G_ATOMICRMW_MAX,
     G_ATOMICRMW_UMIN, G_ATOMICRMW_UMAX})
    .legalIf(all(typeInSet(0, {s8, s16, s32, s64}), typeIs(1, p0)));

getActionDefinitionsBuilder(G_BLOCK_ADDR).legalFor({p0});

// Merge/Unmerge
for (unsigned Op : {G_MERGE_VALUES, G_UNMERGE_VALUES}) {
  unsigned BigTyIdx = Op == G_MERGE_VALUES ? 0 : 1;
  unsigned LitTyIdx = Op == G_MERGE_VALUES ? 1 : 0;

  auto notValidElt = [](const LegalityQuery &Query, unsigned TypeIdx) {
    const LLT &Ty = Query.Types[TypeIdx];
    if (Ty.isVector()) {
      const LLT &EltTy = Ty.getElementType();
      if (EltTy.getSizeInBits() < 8 || EltTy.getSizeInBits() > 64)
        return true;
      if (!isPowerOf2_32(EltTy.getSizeInBits()))
        return true;
    }
    return false;
  };

  // FIXME: This rule is horrible, but specifies the same as what we had
  // before with the particularly strange definitions removed (e.g.
  // s8 = G_MERGE_VALUES s32, s32).
  // Part of the complexity comes from these ops being extremely flexible. For
  // example, you can build/decompose vectors with it, concatenate vectors,
  // etc. and in addition to this you can also bitcast with it at the same
  // time. We've been considering breaking it up into multiple ops to make it
  // more manageable throughout the backend.
  getActionDefinitionsBuilder(Op)
      // Break up vectors with weird elements into scalars
      .fewerElementsIf(
          [=](const LegalityQuery &Query) { return notValidElt(Query, 0); },
          scalarize(0))
      .fewerElementsIf(
          [=](const LegalityQuery &Query) { return notValidElt(Query, 1); },
          scalarize(1))
      // Clamp the big scalar to s8-s512 and make it either a power of 2, 192,
      // or 384.
      .clampScalar(BigTyIdx, s8, s512)
      .widenScalarIf(
          [=](const LegalityQuery &Query) {
            const LLT &Ty = Query.Types[BigTyIdx];
            return !isPowerOf2_32(Ty.getSizeInBits()) &&
                   Ty.getSizeInBits() % 64 != 0;
          },
          [=](const LegalityQuery &Query) {
            // Pick the next power of 2, or a multiple of 64 over 128.
            // Whichever is smaller.
            const LLT &Ty = Query.Types[BigTyIdx];
            unsigned NewSizeInBits = 1
                                     << Log2_32_Ceil(Ty.getSizeInBits() + 1);
            if (NewSizeInBits >= 256) {
              unsigned RoundedTo = alignTo<64>(Ty.getSizeInBits() + 1);
              if (RoundedTo < NewSizeInBits)
                NewSizeInBits = RoundedTo;
            }
            return std::make_pair(BigTyIdx, LLT::scalar(NewSizeInBits));
          })
      // Clamp the little scalar to s8-s256 and make it a power of 2. It's not
      // worth considering the multiples of 64 since 2*192 and 2*384 are not
      // valid.
      .clampScalar(LitTyIdx, s8, s256)
      .widenScalarToNextPow2(LitTyIdx, /*Min*/ 8)
      // So at this point, we have s8, s16, s32, s64, s128, s192, s256, s384,
      // s512, <X x s8>, <X x s16>, <X x s32>, or <X x s64>.
      // At this point it's simple enough to accept the legal types.
      .legalIf([=](const LegalityQuery &Query) {
        const LLT &BigTy = Query.Types[BigTyIdx];
        const LLT &LitTy = Query.Types[LitTyIdx];
        if (BigTy.isVector() && BigTy.getSizeInBits() < 32)
1
Calling 'LLT::isVector'→
3
←
Returning from 'LLT::isVector'→
4
←
Assuming the condition is false→
          return false;
        if (LitTy.isVector() && LitTy.getSizeInBits() < 32)
5
←
Calling 'LLT::isVector'→
7
←
Returning from 'LLT::isVector'→
          return false;
        return BigTy.getSizeInBits() % LitTy.getSizeInBits() == 0;
8
←
Calling 'LLT::getSizeInBits'→
11
←
Returning from 'LLT::getSizeInBits'→
12
←
Division by zero
      })
      // Any vectors left are the wrong size. Scalarize them.
      .scalarize(0)
      .scalarize(1);
}

getActionDefinitionsBuilder(G_EXTRACT_VECTOR_ELT)
    .unsupportedIf([=](const LegalityQuery &Query) {
      const LLT &EltTy = Query.Types[1].getElementType();
      return Query.Types[0] != EltTy;
    })
    .minScalar(2, s64)
    .legalIf([=](const LegalityQuery &Query) {
      const LLT &VecTy = Query.Types[1];
      return VecTy == v2s16 || VecTy == v4s16 || VecTy == v8s16 ||
             VecTy == v4s32 || VecTy == v2s64 || VecTy == v2s32 ||
             VecTy == v16s8 || VecTy == v2s32 || VecTy == v2p0;
    })
    .minScalarOrEltIf(
        [=](const LegalityQuery &Query) {
          // We want to promote to <M x s1> to <M x s64> if that wouldn't
          // cause the total vec size to be > 128b.
          return Query.Types[1].getNumElements() <= 2;
        },
        0, s64)
    .minScalarOrEltIf(
        [=](const LegalityQuery &Query) {
          return Query.Types[1].getNumElements() <= 4;
        },
        0, s32)
    .minScalarOrEltIf(
        [=](const LegalityQuery &Query) {
          return Query.Types[1].getNumElements() <= 8;
        },
        0, s16)
    .minScalarOrEltIf(
        [=](const LegalityQuery &Query) {
          return Query.Types[1].getNumElements() <= 16;
        },
        0, s8)
    .minScalarOrElt(0, s8) // Worst case, we need at least s8.
    .clampMaxNumElements(1, s64, 2)
    .clampMaxNumElements(1, s32, 4)
    .clampMaxNumElements(1, s16, 8);

getActionDefinitionsBuilder(G_INSERT_VECTOR_ELT)
    .legalIf(typeInSet(0, {v8s16, v2s32, v4s32, v2s64}));

getActionDefinitionsBuilder(G_BUILD_VECTOR)
    .legalFor({{v8s8, s8},
               {v16s8, s8},
               {v4s16, s16},
               {v8s16, s16},
               {v2s32, s32},
               {v4s32, s32},
               {v2p0, p0},
               {v2s64, s64}})
    .clampNumElements(0, v4s32, v4s32)
    .clampNumElements(0, v2s64, v2s64)
    .minScalarSameAs(1, 0);

getActionDefinitionsBuilder(G_BUILD_VECTOR_TRUNC).lower();

getActionDefinitionsBuilder(G_CTLZ)
    .legalForCartesianProduct(
        {s32, s64, v8s8, v16s8, v4s16, v8s16, v2s32, v4s32})
    .scalarize(1);
getActionDefinitionsBuilder(G_CTLZ_ZERO_UNDEF).lower();

// TODO: Custom lowering for v2s32, v4s32, v2s64.
getActionDefinitionsBuilder(G_BITREVERSE).legalFor({s32, s64, v8s8, v16s8});

getActionDefinitionsBuilder(G_CTTZ_ZERO_UNDEF).lower();

// TODO: Handle vector types.
getActionDefinitionsBuilder(G_CTTZ)
    .clampScalar(0, s32, s64)
    .scalarSameSizeAs(1, 0)
    .customFor({s32, s64});

getActionDefinitionsBuilder(G_SHUFFLE_VECTOR)
    .legalIf([=](const LegalityQuery &Query) {
      const LLT &DstTy = Query.Types[0];
      const LLT &SrcTy = Query.Types[1];
      // For now just support the TBL2 variant which needs the source vectors
      // to be the same size as the dest.
      if (DstTy != SrcTy)
        return false;
      for (auto &Ty : {v2s32, v4s32, v2s64, v2p0, v16s8, v8s16}) {
        if (DstTy == Ty)
          return true;
      }
      return false;
    })
    // G_SHUFFLE_VECTOR can have scalar sources (from 1 x s vectors), we
    // just want those lowered into G_BUILD_VECTOR
    .lowerIf([=](const LegalityQuery &Query) {
      return !Query.Types[1].isVector();
    })
    .clampNumElements(0, v4s32, v4s32)
    .clampNumElements(0, v2s64, v2s64);

getActionDefinitionsBuilder(G_CONCAT_VECTORS)
    .legalFor({{v4s32, v2s32}, {v8s16, v4s16}});

getActionDefinitionsBuilder(G_JUMP_TABLE).legalFor({{p0}, {s64}});

getActionDefinitionsBuilder(G_BRJT).legalIf([=](const LegalityQuery &Query) {
  return Query.Types[0] == p0 && Query.Types[1] == s64;
});

getActionDefinitionsBuilder(G_DYN_STACKALLOC).lower();

getActionDefinitionsBuilder({G_BZERO, G_MEMCPY, G_MEMMOVE, G_MEMSET})
    .libcall();

// FIXME: Legal types are only legal with NEON.
getActionDefinitionsBuilder(G_ABS)
    .lowerIf(isScalar(0))
    .legalFor(PackedVectorAllTypeList);

getActionDefinitionsBuilder(G_VECREDUCE_FADD)
    // We only have FADDP to do reduction-like operations. Lower the rest.
    .legalFor({{s32, v2s32}, {s64, v2s64}})
    .clampMaxNumElements(1, s64, 2)
    .clampMaxNumElements(1, s32, 2)
    .lower();

getActionDefinitionsBuilder(G_VECREDUCE_ADD)
    .legalFor(
        {{s8, v16s8}, {s16, v8s16}, {s32, v4s32}, {s32, v2s32}, {s64, v2s64}})
    .clampMaxNumElements(1, s64, 2)
    .clampMaxNumElements(1, s32, 4)
    .lower();

getActionDefinitionsBuilder({G_UADDSAT, G_USUBSAT})
    .lowerIf([=](const LegalityQuery &Q) { return Q.Types[0].isScalar(); });

getActionDefinitionsBuilder({G_FSHL, G_FSHR}).lower();

getActionDefinitionsBuilder(G_ROTR)
    .legalFor({{s32, s64}, {s64, s64}})
    .customIf([=](const LegalityQuery &Q) {
      return Q.Types[0].isScalar() && Q.Types[1].getScalarSizeInBits() < 64;
    })
    .lower();
getActionDefinitionsBuilder(G_ROTL).lower();

getActionDefinitionsBuilder({G_SBFX, G_UBFX})
    .customFor({{s32, s32}, {s64, s64}});

// TODO: Custom legalization for s128
// TODO: v2s64, v2s32, v4s32, v4s16, v8s16
// TODO: Use generic lowering when custom lowering is not possible.
auto always = [=](const LegalityQuery &Q) { return true; };
getActionDefinitionsBuilder(G_CTPOP)
    .legalFor({{v8s8, v8s8}, {v16s8, v16s8}})
    .clampScalar(0, s32, s128)
    .widenScalarToNextPow2(0)
    .minScalarEltSameAsIf(always, 1, 0)
    .maxScalarEltSameAsIf(always, 1, 0)
    .customFor({{s32, s32}, {s64, s64}});

getLegacyLegalizerInfo().computeTables();
verify(*ST.getInstrInfo());
768}

/// Dispatches custom legalization of \p MI to the matching legalize* helper
/// based on MI's opcode and forwards that helper's result.
///
/// \param Helper supplies the MachineIRBuilder and change observer that the
///        helpers use.
/// \param MI the instruction to legalize.
/// \returns the selected helper's result, or false when the opcode has no
///          case in the switch.
770bool AArch64LegalizerInfo::legalizeCustom(LegalizerHelper &Helper,
                                        MachineInstr &MI) const {
MachineIRBuilder &MIRBuilder = Helper.MIRBuilder;
MachineRegisterInfo &MRI = *MIRBuilder.getMRI();
GISelChangeObserver &Observer = Helper.Observer;
switch (MI.getOpcode()) {
default:
  // No idea what to do.
  return false;
case TargetOpcode::G_VAARG:
  return legalizeVaArg(MI, MRI, MIRBuilder);
// Loads and stores share one helper.
case TargetOpcode::G_LOAD:
case TargetOpcode::G_STORE:
  return legalizeLoadStore(MI, MRI, MIRBuilder, Observer);
// All three shift opcodes share one helper.
case TargetOpcode::G_SHL:
case TargetOpcode::G_ASHR:
case TargetOpcode::G_LSHR:
  return legalizeShlAshrLshr(MI, MRI, MIRBuilder, Observer);
case TargetOpcode::G_GLOBAL_VALUE:
  return legalizeSmallCMGlobalValue(MI, MRI, MIRBuilder, Observer);
case TargetOpcode::G_TRUNC:
  return legalizeVectorTrunc(MI, Helper);
// Signed and unsigned bitfield extracts share one helper.
case TargetOpcode::G_SBFX:
case TargetOpcode::G_UBFX:
  return legalizeBitfieldExtract(MI, MRI, Helper);
case TargetOpcode::G_ROTR:
  return legalizeRotate(MI, MRI, Helper);
case TargetOpcode::G_CTPOP:
  return legalizeCTPOP(MI, MRI, Helper);
case TargetOpcode::G_ATOMIC_CMPXCHG:
  return legalizeAtomicCmpxchg128(MI, MRI, Helper);
case TargetOpcode::G_CTTZ:
  return legalizeCTTZ(MI, Helper);
}

// Every arm of the switch above returns, so control is not expected to get
// here.
llvm_unreachable("expected switch to return")::llvm::llvm_unreachable_internal("expected switch to return"
, "/build/llvm-toolchain-snapshot-13~++20210621111111+acefe0eaaf82/llvm/lib/Target/AArch64/GISel/AArch64LegalizerInfo.cpp"
, 805);
806}

/// Rewrites the rotate-amount operand (operand 2) of \p MI so that it is a
/// 64-bit value produced by sign-extending the original amount register.
///
/// \param MI the rotate instruction; it is modified in place, not erased.
/// \param MRI used to look up the type of the amount register.
/// \param Helper supplies the builder and the observer notified of the change.
/// \returns true unconditionally.
808bool AArch64LegalizerInfo::legalizeRotate(MachineInstr &MI,
                                        MachineRegisterInfo &MRI,
                                        LegalizerHelper &Helper) const {
// To allow for imported patterns to match, we ensure that the rotate amount
// is 64b with an extension.
Register AmtReg = MI.getOperand(2).getReg();
LLT AmtTy = MRI.getType(AmtReg);
// AmtTy is only read by the asserts below; the cast silences the
// unused-variable warning when asserts are compiled out.
(void)AmtTy;
assert(AmtTy.isScalar() && "Expected a scalar rotate")(static_cast <bool> (AmtTy.isScalar() && "Expected a scalar rotate"
) ? void (0) : __assert_fail ("AmtTy.isScalar() && \"Expected a scalar rotate\""
, "/build/llvm-toolchain-snapshot-13~++20210621111111+acefe0eaaf82/llvm/lib/Target/AArch64/GISel/AArch64LegalizerInfo.cpp"
, 816, __extension__ __PRETTY_FUNCTION__));
assert(AmtTy.getSizeInBits() < 64 && "Expected this rotate to be legal")(static_cast <bool> (AmtTy.getSizeInBits() < 64 &&
 "Expected this rotate to be legal") ? void (0) : __assert_fail
 ("AmtTy.getSizeInBits() < 64 && \"Expected this rotate to be legal\""
, "/build/llvm-toolchain-snapshot-13~++20210621111111+acefe0eaaf82/llvm/lib/Target/AArch64/GISel/AArch64LegalizerInfo.cpp"
, 817, __extension__ __PRETTY_FUNCTION__));
auto NewAmt = Helper.MIRBuilder.buildSExt(LLT::scalar(64), AmtReg);
// Bracket the operand rewrite with observer notifications.
Helper.Observer.changingInstr(MI);
MI.getOperand(2).setReg(NewAmt.getReg(0));
Helper.Observer.changedInstr(MI);
return true;
823}

/// Appends \p NumParts freshly created generic virtual registers of type
/// \p Ty to \p VRegs, then emits one unmerge of \p Reg that defines every
/// register held in \p VRegs.
825static void extractParts(Register Reg, MachineRegisterInfo &MRI,
                       MachineIRBuilder &MIRBuilder, LLT Ty, int NumParts,
                       SmallVectorImpl<Register> &VRegs) {
// One destination register per requested part.
for (int Remaining = NumParts; Remaining > 0; --Remaining) {
  Register PartReg = MRI.createGenericVirtualRegister(Ty);
  VRegs.push_back(PartReg);
}
// A single unmerge defines all of the collected registers from Reg.
MIRBuilder.buildUnmerge(VRegs, Reg);
831}

/// Inserts an intermediate truncation step in front of a vector G_TRUNC.
///
/// The source of \p MI is unmerged into two halves, each half is truncated to
/// elements twice as wide as the destination's, the halves are concatenated,
/// and \p MI's source operand is redirected to the concatenation. \p MI
/// itself is kept and performs the final truncation.
///
/// \returns true unconditionally.
833bool AArch64LegalizerInfo::legalizeVectorTrunc(
  MachineInstr &MI, LegalizerHelper &Helper) const {
MachineIRBuilder &MIRBuilder = Helper.MIRBuilder;
MachineRegisterInfo &MRI = *MIRBuilder.getMRI();
// Similar to how operand splitting is done in SelectionDAG, we can handle
// %res(v8s8) = G_TRUNC %in(v8s32) by generating:
//   %inlo(<4x s32>), %inhi(<4 x s32>) = G_UNMERGE %in(<8 x s32>)
//   %lo16(<4 x s16>) = G_TRUNC %inlo
//   %hi16(<4 x s16>) = G_TRUNC %inhi
//   %in16(<8 x s16>) = G_CONCAT_VECTORS %lo16, %hi16
//   %res(<8 x s8>) = G_TRUNC %in16

Register DstReg = MI.getOperand(0).getReg();
Register SrcReg = MI.getOperand(1).getReg();
LLT DstTy = MRI.getType(DstReg);
LLT SrcTy = MRI.getType(SrcReg);
// Both total sizes are asserted to be powers of two.
assert(isPowerOf2_32(DstTy.getSizeInBits()) &&(static_cast <bool> (isPowerOf2_32(DstTy.getSizeInBits(
)) && isPowerOf2_32(SrcTy.getSizeInBits())) ? void (0
) : __assert_fail ("isPowerOf2_32(DstTy.getSizeInBits()) && isPowerOf2_32(SrcTy.getSizeInBits())"
, "/build/llvm-toolchain-snapshot-13~++20210621111111+acefe0eaaf82/llvm/lib/Target/AArch64/GISel/AArch64LegalizerInfo.cpp"
, 850, __extension__ __PRETTY_FUNCTION__))
       isPowerOf2_32(SrcTy.getSizeInBits()))(static_cast <bool> (isPowerOf2_32(DstTy.getSizeInBits(
)) && isPowerOf2_32(SrcTy.getSizeInBits())) ? void (0
) : __assert_fail ("isPowerOf2_32(DstTy.getSizeInBits()) && isPowerOf2_32(SrcTy.getSizeInBits())"
, "/build/llvm-toolchain-snapshot-13~++20210621111111+acefe0eaaf82/llvm/lib/Target/AArch64/GISel/AArch64LegalizerInfo.cpp"
, 850, __extension__ __PRETTY_FUNCTION__));

// Split input type.
LLT SplitSrcTy = SrcTy.changeNumElements(SrcTy.getNumElements() / 2);
// First, split the source into two smaller vectors.
SmallVector<Register, 2> SplitSrcs;
extractParts(SrcReg, MRI, MIRBuilder, SplitSrcTy, 2, SplitSrcs);

// Truncate the splits into intermediate narrower elements.
LLT InterTy = SplitSrcTy.changeElementSize(DstTy.getScalarSizeInBits() * 2);
for (unsigned I = 0; I < SplitSrcs.size(); ++I)
  SplitSrcs[I] = MIRBuilder.buildTrunc(InterTy, SplitSrcs[I]).getReg(0);

// Rejoin the truncated halves: destination element count, elements twice the
// destination element width.
auto Concat = MIRBuilder.buildConcatVectors(
    DstTy.changeElementSize(DstTy.getScalarSizeInBits() * 2), SplitSrcs);

// Point the original G_TRUNC at the intermediate vector, notifying the
// observer around the operand change.
Helper.Observer.changingInstr(MI);
MI.getOperand(1).setReg(Concat.getReg(0));
Helper.Observer.changedInstr(MI);
return true;
870}

/// Replaces a G_GLOBAL_VALUE with an ADRP followed by G_ADD_LOW, inserting a
/// MOVKXi between them when the reference is classified as MO_TAGGED.
///
/// Thread-local globals and references classified as MO_GOT are left
/// untouched; the function still returns true for them.
///
/// \param MI the G_GLOBAL_VALUE instruction; erased when it is expanded.
/// \param MRI used to assign register classes to the new ADRP/MOVK results.
/// \param MIRBuilder builder used to emit the replacement instructions.
/// \param Observer not used by this function.
/// \returns true unconditionally.
872bool AArch64LegalizerInfo::legalizeSmallCMGlobalValue(
  MachineInstr &MI, MachineRegisterInfo &MRI, MachineIRBuilder &MIRBuilder,
  GISelChangeObserver &Observer) const {
assert(MI.getOpcode() == TargetOpcode::G_GLOBAL_VALUE)(static_cast <bool> (MI.getOpcode() == TargetOpcode::G_GLOBAL_VALUE
) ? void (0) : __assert_fail ("MI.getOpcode() == TargetOpcode::G_GLOBAL_VALUE"
, "/build/llvm-toolchain-snapshot-13~++20210621111111+acefe0eaaf82/llvm/lib/Target/AArch64/GISel/AArch64LegalizerInfo.cpp"
, 875, __extension__ __PRETTY_FUNCTION__));
// We do this custom legalization to convert G_GLOBAL_VALUE into target ADRP +
// G_ADD_LOW instructions.
// By splitting this here, we can optimize accesses in the small code model by
// folding in the G_ADD_LOW into the load/store offset.
auto &GlobalOp = MI.getOperand(1);
const auto* GV = GlobalOp.getGlobal();
if (GV->isThreadLocal())
  return true; // Don't want to modify TLS vars.

auto &TM = ST->getTargetLowering()->getTargetMachine();
unsigned OpFlags = ST->ClassifyGlobalReference(GV, TM);

// GOT-classified references are left as they are.
if (OpFlags & AArch64II::MO_GOT)
  return true;

auto Offset = GlobalOp.getOffset();
Register DstReg = MI.getOperand(0).getReg();
auto ADRP = MIRBuilder.buildInstr(AArch64::ADRP, {LLT::pointer(0, 64)}, {})
                .addGlobalAddress(GV, Offset, OpFlags | AArch64II::MO_PAGE);
// Set the regclass on the dest reg too.
MRI.setRegClass(ADRP.getReg(0), &AArch64::GPR64RegClass);

// MO_TAGGED on the page indicates a tagged address. Set the tag now. We do so
// by creating a MOVK that sets bits 48-63 of the register to (global address
// + 0x100000000 - PC) >> 48. The additional 0x100000000 offset here is to
// prevent an incorrect tag being generated during relocation when the
// global appears before the code section. Without the offset, a global at
// `0x0f00'0000'0000'1000` (i.e. at `0x1000` with tag `0xf`) that's referenced
// by code at `0x2000` would result in `0x0f00'0000'0000'1000 - 0x2000 =
// 0x0eff'ffff'ffff'f000`, meaning the tag would be incorrectly set to `0xe`
// instead of `0xf`.
// This assumes that we're in the small code model so we can assume a binary
// size of <= 4GB, which makes the untagged PC relative offset positive. The
// binary must also be loaded into address range [0, 2^48). Both of these
// properties need to be ensured at runtime when using tagged addresses.
if (OpFlags & AArch64II::MO_TAGGED) {
  assert(!Offset &&(static_cast <bool> (!Offset && "Should not have folded in an offset for a tagged global!"
) ? void (0) : __assert_fail ("!Offset && \"Should not have folded in an offset for a tagged global!\""
, "/build/llvm-toolchain-snapshot-13~++20210621111111+acefe0eaaf82/llvm/lib/Target/AArch64/GISel/AArch64LegalizerInfo.cpp"
, 913, __extension__ __PRETTY_FUNCTION__))
         "Should not have folded in an offset for a tagged global!")(static_cast <bool> (!Offset && "Should not have folded in an offset for a tagged global!"
) ? void (0) : __assert_fail ("!Offset && \"Should not have folded in an offset for a tagged global!\""
, "/build/llvm-toolchain-snapshot-13~++20210621111111+acefe0eaaf82/llvm/lib/Target/AArch64/GISel/AArch64LegalizerInfo.cpp"
, 913, __extension__ __PRETTY_FUNCTION__));
  // ADRP is rebound to the MOVK result so the G_ADD_LOW below consumes the
  // tagged value.
  ADRP = MIRBuilder.buildInstr(AArch64::MOVKXi, {LLT::pointer(0, 64)}, {ADRP})
             .addGlobalAddress(GV, 0x100000000,
                               AArch64II::MO_PREL | AArch64II::MO_G3)
             .addImm(48);
  MRI.setRegClass(ADRP.getReg(0), &AArch64::GPR64RegClass);
}

// G_ADD_LOW defines the original destination register.
MIRBuilder.buildInstr(AArch64::G_ADD_LOW, {DstReg}, {ADRP})
    .addGlobalAddress(GV, Offset,
                      OpFlags | AArch64II::MO_PAGEOFF | AArch64II::MO_NC);
MI.eraseFromParent();
return true;
926}

/// Intrinsic legalization hook. This implementation inspects neither
/// \p Helper nor \p MI and returns true unconditionally.
928bool AArch64LegalizerInfo::legalizeIntrinsic(LegalizerHelper &Helper,
                                           MachineInstr &MI) const {
return true;
931}

/// For G_SHL / G_ASHR / G_LSHR with a constant shift amount of at most 31,
/// replaces the amount operand (operand 2) with a new 64-bit G_CONSTANT of
/// the same value. All other shifts are left unchanged.
///
/// \param MI the shift instruction; modified in place, never erased.
/// \param MRI used to look through to a constant shift amount.
/// \param MIRBuilder builder used to emit the widened constant.
/// \param Observer notified around the operand rewrite.
/// \returns true unconditionally.
933bool AArch64LegalizerInfo::legalizeShlAshrLshr(
  MachineInstr &MI, MachineRegisterInfo &MRI, MachineIRBuilder &MIRBuilder,
  GISelChangeObserver &Observer) const {
assert(MI.getOpcode() == TargetOpcode::G_ASHR ||(static_cast <bool> (MI.getOpcode() == TargetOpcode::G_ASHR
 || MI.getOpcode() == TargetOpcode::G_LSHR || MI.getOpcode() ==
 TargetOpcode::G_SHL) ? void (0) : __assert_fail ("MI.getOpcode() == TargetOpcode::G_ASHR || MI.getOpcode() == TargetOpcode::G_LSHR || MI.getOpcode() == TargetOpcode::G_SHL"
, "/build/llvm-toolchain-snapshot-13~++20210621111111+acefe0eaaf82/llvm/lib/Target/AArch64/GISel/AArch64LegalizerInfo.cpp"
, 938, __extension__ __PRETTY_FUNCTION__))
       MI.getOpcode() == TargetOpcode::G_LSHR ||(static_cast <bool> (MI.getOpcode() == TargetOpcode::G_ASHR
 || MI.getOpcode() == TargetOpcode::G_LSHR || MI.getOpcode() ==
 TargetOpcode::G_SHL) ? void (0) : __assert_fail ("MI.getOpcode() == TargetOpcode::G_ASHR || MI.getOpcode() == TargetOpcode::G_LSHR || MI.getOpcode() == TargetOpcode::G_SHL"
, "/build/llvm-toolchain-snapshot-13~++20210621111111+acefe0eaaf82/llvm/lib/Target/AArch64/GISel/AArch64LegalizerInfo.cpp"
, 938, __extension__ __PRETTY_FUNCTION__))
       MI.getOpcode() == TargetOpcode::G_SHL)(static_cast <bool> (MI.getOpcode() == TargetOpcode::G_ASHR
 || MI.getOpcode() == TargetOpcode::G_LSHR || MI.getOpcode() ==
 TargetOpcode::G_SHL) ? void (0) : __assert_fail ("MI.getOpcode() == TargetOpcode::G_ASHR || MI.getOpcode() == TargetOpcode::G_LSHR || MI.getOpcode() == TargetOpcode::G_SHL"
, "/build/llvm-toolchain-snapshot-13~++20210621111111+acefe0eaaf82/llvm/lib/Target/AArch64/GISel/AArch64LegalizerInfo.cpp"
, 938, __extension__ __PRETTY_FUNCTION__));
// If the shift amount is a G_CONSTANT, promote it to a 64 bit type so the
// imported patterns can select it later. Either way, it will be legal.
Register AmtReg = MI.getOperand(2).getReg();
auto VRegAndVal = getConstantVRegValWithLookThrough(AmtReg, MRI);
// Non-constant amount: nothing to rewrite.
if (!VRegAndVal)
  return true;
// Check the shift amount is in range for an immediate form.
int64_t Amount = VRegAndVal->Value.getSExtValue();
if (Amount > 31)
  return true; // This will have to remain a register variant.
auto ExtCst = MIRBuilder.buildConstant(LLT::scalar(64), Amount);
// Swap in the 64-bit constant, notifying the observer around the change.
Observer.changingInstr(MI);
MI.getOperand(2).setReg(ExtCst.getReg(0));
Observer.changedInstr(MI);
return true;
954}

/// Rewrites a G_LOAD / G_STORE whose value type is a vector of address-space-0
/// pointers into the same access on a vector of equally sized scalars, with a
/// bitcast between the two value types. The original instruction is erased.
///
/// \param MI the load or store to rewrite.
/// \param MRI used to query the value register's type.
/// \param MIRBuilder builder used to emit the replacement instructions.
/// \param Observer not used by this function.
/// \returns false when the value type is not a vector of address-space-0
///          pointers; true after the rewrite.
956bool AArch64LegalizerInfo::legalizeLoadStore(
  MachineInstr &MI, MachineRegisterInfo &MRI, MachineIRBuilder &MIRBuilder,
  GISelChangeObserver &Observer) const {
assert(MI.getOpcode() == TargetOpcode::G_STORE ||(static_cast <bool> (MI.getOpcode() == TargetOpcode::G_STORE
 || MI.getOpcode() == TargetOpcode::G_LOAD) ? void (0) : __assert_fail
 ("MI.getOpcode() == TargetOpcode::G_STORE || MI.getOpcode() == TargetOpcode::G_LOAD"
, "/build/llvm-toolchain-snapshot-13~++20210621111111+acefe0eaaf82/llvm/lib/Target/AArch64/GISel/AArch64LegalizerInfo.cpp"
, 960, __extension__ __PRETTY_FUNCTION__))
       MI.getOpcode() == TargetOpcode::G_LOAD)(static_cast <bool> (MI.getOpcode() == TargetOpcode::G_STORE
 || MI.getOpcode() == TargetOpcode::G_LOAD) ? void (0) : __assert_fail
 ("MI.getOpcode() == TargetOpcode::G_STORE || MI.getOpcode() == TargetOpcode::G_LOAD"
, "/build/llvm-toolchain-snapshot-13~++20210621111111+acefe0eaaf82/llvm/lib/Target/AArch64/GISel/AArch64LegalizerInfo.cpp"
, 960, __extension__ __PRETTY_FUNCTION__));
// Here we just try to handle vector loads/stores where our value type might
// have pointer elements, which the SelectionDAG importer can't handle. To
// allow the existing patterns for s64 to fire for p0, we just try to bitcast
// the value to use s64 types.

// Custom legalization requires the instruction, if not deleted, must be fully
// legalized. In order to allow further legalization of the inst, we create
// a new instruction and erase the existing one.

Register ValReg = MI.getOperand(0).getReg();
const LLT ValTy = MRI.getType(ValReg);

// Only vectors of address-space-0 pointers are handled here.
if (!ValTy.isVector() || !ValTy.getElementType().isPointer() ||
    ValTy.getElementType().getAddressSpace() != 0) {
  LLVM_DEBUG(dbgs() << "Tried to do custom legalization on wrong load/store")do { if (::llvm::DebugFlag && ::llvm::isCurrentDebugType
("aarch64-legalinfo")) { dbgs() << "Tried to do custom legalization on wrong load/store"
; } } while (false);
  return false;
}

// Scalar vector with the same element count and element width as the
// pointer vector.
unsigned PtrSize = ValTy.getElementType().getSizeInBits();
const LLT NewTy = LLT::vector(ValTy.getNumElements(), PtrSize);
// The first memory operand is dereferenced unconditionally and reused for
// the replacement access.
auto &MMO = **MI.memoperands_begin();
if (MI.getOpcode() == TargetOpcode::G_STORE) {
  // Store: bitcast the value first, then store the scalar vector.
  auto Bitcast = MIRBuilder.buildBitcast(NewTy, ValReg);
  MIRBuilder.buildStore(Bitcast.getReg(0), MI.getOperand(1), MMO);
} else {
  // Load: load the scalar vector, then bitcast into the original register.
  auto NewLoad = MIRBuilder.buildLoad(NewTy, MI.getOperand(1), MMO);
  MIRBuilder.buildBitcast(ValReg, NewLoad);
}
MI.eraseFromParent();
return true;
991}

/// Expands the va_arg instruction \p MI into explicit memory operations.
///
/// The current list pointer is loaded from the address in operand 1. If the
/// alignment immediate in operand 2 is greater than the pointer's own
/// alignment, the pointer is rounded up to that alignment. The argument is
/// then loaded into operand 0, and the list pointer, advanced by the argument
/// size rounded up to pointer alignment, is stored back. \p MI is erased.
///
/// \returns true unconditionally.
993bool AArch64LegalizerInfo::legalizeVaArg(MachineInstr &MI,
                                       MachineRegisterInfo &MRI,
                                       MachineIRBuilder &MIRBuilder) const {
MachineFunction &MF = MIRBuilder.getMF();
Align ArgAlign(MI.getOperand(2).getImm());
Register ValDst = MI.getOperand(0).getReg();
Register VAListAddr = MI.getOperand(1).getReg();

// Types and sizes derived from the va_list address operand.
LLT ListPtrTy = MRI.getType(VAListAddr);
LLT PtrWideIntTy = LLT::scalar(ListPtrTy.getSizeInBits());
const unsigned PtrBytes = ListPtrTy.getSizeInBits() / 8;
const Align PtrAlign = Align(PtrBytes);

// Fetch the current list pointer.
MachineMemOperand *ListLoadMMO = MF.getMachineMemOperand(
    MachinePointerInfo(), MachineMemOperand::MOLoad, PtrBytes, PtrAlign);
auto CurList = MIRBuilder.buildLoad(ListPtrTy, VAListAddr, *ListLoadMMO);

// By default the argument lives right at the list pointer; over-aligned
// arguments need the pointer rounded up first.
MachineInstrBuilder ArgPtr = CurList;
if (ArgAlign > PtrAlign) {
  auto Bias = MIRBuilder.buildConstant(PtrWideIntTy, ArgAlign.value() - 1);
  auto Bumped = MIRBuilder.buildPtrAdd(ListPtrTy, CurList, Bias.getReg(0));
  ArgPtr = MIRBuilder.buildMaskLowPtrBits(ListPtrTy, Bumped, Log2(ArgAlign));
}

// Read the argument itself.
uint64_t ValBytes = MRI.getType(ValDst).getSizeInBits() / 8;
MachineMemOperand *ArgLoadMMO = MF.getMachineMemOperand(
    MachinePointerInfo(), MachineMemOperand::MOLoad, ValBytes,
    std::max(ArgAlign, PtrAlign));
MIRBuilder.buildLoad(ValDst, ArgPtr, *ArgLoadMMO);

// Step over the argument slot (size rounded up to pointer alignment).
auto SlotBytes =
    MIRBuilder.buildConstant(PtrWideIntTy, alignTo(ValBytes, PtrAlign));
auto NextList = MIRBuilder.buildPtrAdd(ListPtrTy, ArgPtr, SlotBytes.getReg(0));

// Write the advanced list pointer back.
MachineMemOperand *ListStoreMMO = MF.getMachineMemOperand(
    MachinePointerInfo(), MachineMemOperand::MOStore, PtrBytes, PtrAlign);
MIRBuilder.buildStore(NextList, VAListAddr, *ListStoreMMO);

MI.eraseFromParent();
return true;
1038}

/// Reports whether the bitfield extract \p MI can keep its current form:
/// true only when both operand 2 and operand 3 resolve to constants.
/// \p MI is not modified and \p Helper is not used.
1040bool AArch64LegalizerInfo::legalizeBitfieldExtract(
  MachineInstr &MI, MachineRegisterInfo &MRI, LegalizerHelper &Helper) const {
// Only legal if we can select immediate forms.
// TODO: Lower this otherwise.
if (!getConstantVRegValWithLookThrough(MI.getOperand(2).getReg(), MRI))
  return false;
// Operand 3 is only examined once operand 2 is known to be constant.
if (!getConstantVRegValWithLookThrough(MI.getOperand(3).getReg(), MRI))
  return false;
return true;
1046}

/// Expands a 32- or 64-bit scalar G_CTPOP into a v8s8 G_CTPOP followed by the
/// aarch64_neon_uaddlv intrinsic that sums the per-byte counts.
///
/// \param MI the G_CTPOP instruction; erased on success.
/// \param MRI used to query the operand types.
/// \param Helper supplies the MachineIRBuilder.
/// \returns false when the subtarget lacks NEON or the function carries the
///          NoImplicitFloat attribute; true after the expansion.
1048bool AArch64LegalizerInfo::legalizeCTPOP(MachineInstr &MI,
                                       MachineRegisterInfo &MRI,
                                       LegalizerHelper &Helper) const {
// While there is no integer popcount instruction, it can
// be more efficiently lowered to the following sequence that uses
// AdvSIMD registers/instructions as long as the copies to/from
// the AdvSIMD registers are cheap.
//  FMOV    D0, X0        // copy 64-bit int to vector, high bits zero'd
//  CNT     V0.8B, V0.8B  // 8xbyte pop-counts
//  ADDV    B0, V0.8B     // sum 8xbyte pop-counts
//  UMOV    X0, V0.B[0]   // copy byte result back to integer reg
if (!ST->hasNEON() ||
    MI.getMF()->getFunction().hasFnAttribute(Attribute::NoImplicitFloat))
  return false;
MachineIRBuilder &MIRBuilder = Helper.MIRBuilder;
Register Dst = MI.getOperand(0).getReg();
Register Val = MI.getOperand(1).getReg();
LLT Ty = MRI.getType(Val);

// TODO: Handle vector types.
assert(!Ty.isVector() && "Vector types not handled yet!")(static_cast <bool> (!Ty.isVector() && "Vector types not handled yet!"
) ? void (0) : __assert_fail ("!Ty.isVector() && \"Vector types not handled yet!\""
, "/build/llvm-toolchain-snapshot-13~++20210621111111+acefe0eaaf82/llvm/lib/Target/AArch64/GISel/AArch64LegalizerInfo.cpp"
, 1068, __extension__ __PRETTY_FUNCTION__));
assert(Ty == MRI.getType(Dst) &&(static_cast <bool> (Ty == MRI.getType(Dst) && "Expected src and dst to have the same type!"
) ? void (0) : __assert_fail ("Ty == MRI.getType(Dst) && \"Expected src and dst to have the same type!\""
, "/build/llvm-toolchain-snapshot-13~++20210621111111+acefe0eaaf82/llvm/lib/Target/AArch64/GISel/AArch64LegalizerInfo.cpp"
, 1070, __extension__ __PRETTY_FUNCTION__))
       "Expected src and dst to have the same type!")(static_cast <bool> (Ty == MRI.getType(Dst) && "Expected src and dst to have the same type!"
) ? void (0) : __assert_fail ("Ty == MRI.getType(Dst) && \"Expected src and dst to have the same type!\""
, "/build/llvm-toolchain-snapshot-13~++20210621111111+acefe0eaaf82/llvm/lib/Target/AArch64/GISel/AArch64LegalizerInfo.cpp"
, 1070, __extension__ __PRETTY_FUNCTION__));
// TODO: Handle s128.
unsigned Size = Ty.getSizeInBits();
assert((Size == 32 || Size == 64) && "Expected only 32 or 64 bit scalars!")(static_cast <bool> ((Size == 32 || Size == 64) &&
 "Expected only 32 or 64 bit scalars!") ? void (0) : __assert_fail
 ("(Size == 32 || Size == 64) && \"Expected only 32 or 64 bit scalars!\""
, "/build/llvm-toolchain-snapshot-13~++20210621111111+acefe0eaaf82/llvm/lib/Target/AArch64/GISel/AArch64LegalizerInfo.cpp"
, 1073, __extension__ __PRETTY_FUNCTION__));
// A 32-bit input is zero-extended to 64 bits so it can be bitcast to v8s8.
if (Size == 32)
  Val = MIRBuilder.buildZExt(LLT::scalar(64), Val).getReg(0);
const LLT V8S8 = LLT::vector(8, LLT::scalar(8));
Val = MIRBuilder.buildBitcast(V8S8, Val).getReg(0);
// Per-byte population counts.
auto CTPOP = MIRBuilder.buildCTPOP(V8S8, Val);
// Sum the eight byte counts; the intrinsic is built with an s32 result.
auto UADDLV =
    MIRBuilder
        .buildIntrinsic(Intrinsic::aarch64_neon_uaddlv, {LLT::scalar(32)},
                        /*HasSideEffects = */ false)
        .addUse(CTPOP.getReg(0));
// 64-bit destination: zero-extend the s32 sum into Dst. 32-bit destination:
// make the intrinsic define Dst directly.
if (Size == 64)
  MIRBuilder.buildZExt(Dst, UADDLV);
else
  UADDLV->getOperand(0).setReg(Dst);
MI.eraseFromParent();
return true;
1090}

/// Expands a G_ATOMIC_CMPXCHG whose operands are split here into s64 halves.
///
/// With LSE the expansion is a CASP* instruction chosen by the merged memory
/// ordering, bracketed by REG_SEQUENCE / G_EXTRACT; without LSE it is the
/// CMP_SWAP_128 pseudo. In both cases the two s64 result halves are merged
/// back into \p MI's destination and \p MI is erased.
///
/// \param MI the cmpxchg instruction; operand 1 is the address, operands 2
///        and 3 are unmerged into the "desired" and "new" halves.
/// \param MRI used to create the intermediate virtual registers.
/// \param Helper supplies the MachineIRBuilder.
/// \returns true unconditionally.
1092bool AArch64LegalizerInfo::legalizeAtomicCmpxchg128(
  MachineInstr &MI, MachineRegisterInfo &MRI, LegalizerHelper &Helper) const {
MachineIRBuilder &MIRBuilder = Helper.MIRBuilder;
LLT s64 = LLT::scalar(64);
auto Addr = MI.getOperand(1).getReg();
// Split both value operands into two s64 halves each.
auto DesiredI = MIRBuilder.buildUnmerge({s64, s64}, MI.getOperand(2));
auto NewI = MIRBuilder.buildUnmerge({s64, s64}, MI.getOperand(3));
// Registers that will receive the two halves of the result.
auto DstLo = MRI.createGenericVirtualRegister(s64);
auto DstHi = MRI.createGenericVirtualRegister(s64);

MachineInstrBuilder CAS;
if (ST->hasLSE()) {
  // We have 128-bit CASP instructions taking XSeqPair registers, which are
  // s128. We need the merge/unmerge to bracket the expansion and pair up with
  // the rest of the MIR so we must reassemble the extracted registers into a
  // 128-bit known-regclass one with code like this:
  //
  //     %in1 = REG_SEQUENCE Lo, Hi    ; One for each input
  //     %out = CASP %in1, ...
  //     %OldLo = G_EXTRACT %out, 0
  //     %OldHi = G_EXTRACT %out, 64
  auto Ordering = (*MI.memoperands_begin())->getMergedOrdering();
  // Choose the CASP variant matching the ordering; any ordering not listed
  // explicitly uses plain CASPX.
  unsigned Opcode;
  switch (Ordering) {
  case AtomicOrdering::Acquire:
    Opcode = AArch64::CASPAX;
    break;
  case AtomicOrdering::Release:
    Opcode = AArch64::CASPLX;
    break;
  case AtomicOrdering::AcquireRelease:
  case AtomicOrdering::SequentiallyConsistent:
    Opcode = AArch64::CASPALX;
    break;
  default:
    Opcode = AArch64::CASPX;
    break;
  }

  LLT s128 = LLT::scalar(128);
  auto CASDst = MRI.createGenericVirtualRegister(s128);
  auto CASDesired = MRI.createGenericVirtualRegister(s128);
  auto CASNew = MRI.createGenericVirtualRegister(s128);
  // Pair the halves up: first half in sube64, second half in subo64.
  MIRBuilder.buildInstr(TargetOpcode::REG_SEQUENCE, {CASDesired}, {})
      .addUse(DesiredI->getOperand(0).getReg())
      .addImm(AArch64::sube64)
      .addUse(DesiredI->getOperand(1).getReg())
      .addImm(AArch64::subo64);
  MIRBuilder.buildInstr(TargetOpcode::REG_SEQUENCE, {CASNew}, {})
      .addUse(NewI->getOperand(0).getReg())
      .addImm(AArch64::sube64)
      .addUse(NewI->getOperand(1).getReg())
      .addImm(AArch64::subo64);

  CAS = MIRBuilder.buildInstr(Opcode, {CASDst}, {CASDesired, CASNew, Addr});

  // Split the 128-bit result at bit offsets 0 and 64.
  MIRBuilder.buildExtract({DstLo}, {CASDst}, 0);
  MIRBuilder.buildExtract({DstHi}, {CASDst}, 64);
} else {
  // The -O0 CMP_SWAP_128 is friendlier to generate code for because LDXP/STXP
  // can take arbitrary registers so it just has the normal GPR64 operands the
  // rest of AArch64 is expecting.
  auto Scratch = MRI.createVirtualRegister(&AArch64::GPR64RegClass);
  CAS = MIRBuilder.buildInstr(AArch64::CMP_SWAP_128, {DstLo, DstHi, Scratch},
                              {Addr, DesiredI->getOperand(0),
                               DesiredI->getOperand(1), NewI->getOperand(0),
                               NewI->getOperand(1)});
}

// Carry the original memory operands over and constrain the new
// instruction's register operands.
CAS.cloneMemRefs(MI);
constrainSelectedInstRegOperands(*CAS, *ST->getInstrInfo(),
                                 *MRI.getTargetRegisterInfo(),
                                 *ST->getRegBankInfo());

// Reassemble the result into the original destination.
MIRBuilder.buildMerge(MI.getOperand(0), {DstLo, DstHi});
MI.eraseFromParent();
return true;
1169}

/// Replaces the count-trailing-zeros instruction \p MI with a bit-reverse of
/// its source followed by a count-leading-zeros into its destination.
/// \p MI is erased.
///
/// \returns true unconditionally.
1171bool AArch64LegalizerInfo::legalizeCTTZ(MachineInstr &MI,
                                      LegalizerHelper &Helper) const {
MachineIRBuilder &Builder = Helper.MIRBuilder;
MachineRegisterInfo &RegInfo = *Builder.getMRI();

// The reversed value has the same type as the source operand.
LLT SrcTy = RegInfo.getType(MI.getOperand(1).getReg());
auto Reversed = Builder.buildBitReverse(SrcTy, MI.getOperand(1));

// Leading zeros of the reversed value, written to the original destination.
Builder.buildCTLZ(MI.getOperand(0).getReg(), Reversed);

MI.eraseFromParent();
return true;
1180}

←

/build/llvm-toolchain-snapshot-13~++20210621111111+acefe0eaaf82/llvm/include/llvm/Support/LowLevelTypeImpl.h

1//== llvm/Support/LowLevelTypeImpl.h --------------------------- -*- C++ -*-==//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7//===----------------------------------------------------------------------===//
8/// \file
9/// Implement a low-level type suitable for MachineInstr level instruction
10/// selection.
11///
12/// For a type attached to a MachineInstr, we only care about 2 details: total
13/// size and the number of vector lanes (if any). Accordingly, there are 4
14/// possible valid type-kinds:
15///
16///    * `sN` for scalars and aggregates
17///    * `<N x sM>` and `<N x pM>` for vectors, which must have at least 2 elements.
18///    * `pN` for pointers
19///
20/// Other information required for correct selection is expected to be carried
21/// by the opcode, or non-type flags. For example the distinction between G_ADD
22/// and G_FADD for int/float or fast-math flags.
23///
24//===----------------------------------------------------------------------===//

26#ifndef LLVM_SUPPORT_LOWLEVELTYPEIMPL_H
27#define LLVM_SUPPORT_LOWLEVELTYPEIMPL_H

29#include "llvm/ADT/DenseMapInfo.h"
30#include "llvm/Support/Debug.h"
31#include "llvm/Support/MachineValueType.h"
32#include <cassert>

34namespace llvm {

36class DataLayout;
37class Type;
38class raw_ostream;

40class LLT {
41public:
/// Get a low-level scalar or aggregate "bag of bits".
/// \p SizeInBits is the width of the type and must be greater than zero
/// (asserted). The result is neither a pointer nor a vector.
static LLT scalar(unsigned SizeInBits) {
  assert(SizeInBits > 0 && "invalid scalar size")(static_cast <bool> (SizeInBits > 0 && "invalid scalar size"
) ? void (0) : __assert_fail ("SizeInBits > 0 && \"invalid scalar size\""
, "/build/llvm-toolchain-snapshot-13~++20210621111111+acefe0eaaf82/llvm/include/llvm/Support/LowLevelTypeImpl.h"
, 44, __extension__ __PRETTY_FUNCTION__));
  return LLT{/*isPointer=*/false, /*isVector=*/false, /*NumElements=*/0,
             SizeInBits, /*AddressSpace=*/0};
}

/// Get a low-level pointer in the given address space.
/// \p SizeInBits is the pointer width and must be greater than zero
/// (asserted). The result is a non-vector pointer type.
static LLT pointer(unsigned AddressSpace, unsigned SizeInBits) {
  assert(SizeInBits > 0 && "invalid pointer size")(static_cast <bool> (SizeInBits > 0 && "invalid pointer size"
) ? void (0) : __assert_fail ("SizeInBits > 0 && \"invalid pointer size\""
, "/build/llvm-toolchain-snapshot-13~++20210621111111+acefe0eaaf82/llvm/include/llvm/Support/LowLevelTypeImpl.h"
, 51, __extension__ __PRETTY_FUNCTION__));
  return LLT{/*isPointer=*/true, /*isVector=*/false, /*NumElements=*/0,
             SizeInBits, AddressSpace};
}

/// Get a low-level vector of some number of elements and element width.
/// \p NumElements must be at least 2.
/// \p ScalarSizeInBits must be greater than zero. Both requirements are
/// asserted. The elements of the result are non-pointer scalars.
static LLT vector(uint16_t NumElements, unsigned ScalarSizeInBits) {
  assert(NumElements > 1 && "invalid number of vector elements")(static_cast <bool> (NumElements > 1 && "invalid number of vector elements"
) ? void (0) : __assert_fail ("NumElements > 1 && \"invalid number of vector elements\""
, "/build/llvm-toolchain-snapshot-13~++20210621111111+acefe0eaaf82/llvm/include/llvm/Support/LowLevelTypeImpl.h"
, 59, __extension__ __PRETTY_FUNCTION__));
  assert(ScalarSizeInBits > 0 && "invalid vector element size")(static_cast <bool> (ScalarSizeInBits > 0 &&
 "invalid vector element size") ? void (0) : __assert_fail ("ScalarSizeInBits > 0 && \"invalid vector element size\""
, "/build/llvm-toolchain-snapshot-13~++20210621111111+acefe0eaaf82/llvm/include/llvm/Support/LowLevelTypeImpl.h"
, 60, __extension__ __PRETTY_FUNCTION__));
  return LLT{/*isPointer=*/false, /*isVector=*/true, NumElements,
             ScalarSizeInBits, /*AddressSpace=*/0};
}

/// Get a low-level vector of some number of elements and element type.
/// \p NumElements must be at least 2 and \p ScalarTy must not itself be a
/// vector (both asserted). When \p ScalarTy is a pointer, the result is a
/// vector of pointers that keeps its address space; otherwise the address
/// space is 0.
static LLT vector(uint16_t NumElements, LLT ScalarTy) {
  assert(NumElements > 1 && "invalid number of vector elements")(static_cast <bool> (NumElements > 1 && "invalid number of vector elements"
) ? void (0) : __assert_fail ("NumElements > 1 && \"invalid number of vector elements\""
, "/build/llvm-toolchain-snapshot-13~++20210621111111+acefe0eaaf82/llvm/include/llvm/Support/LowLevelTypeImpl.h"
, 67, __extension__ __PRETTY_FUNCTION__));
  assert(!ScalarTy.isVector() && "invalid vector element type")(static_cast <bool> (!ScalarTy.isVector() && "invalid vector element type"
) ? void (0) : __assert_fail ("!ScalarTy.isVector() && \"invalid vector element type\""
, "/build/llvm-toolchain-snapshot-13~++20210621111111+acefe0eaaf82/llvm/include/llvm/Support/LowLevelTypeImpl.h"
, 68, __extension__ __PRETTY_FUNCTION__));
  return LLT{ScalarTy.isPointer(), /*isVector=*/true, NumElements,
             ScalarTy.getSizeInBits(),
             ScalarTy.isPointer() ? ScalarTy.getAddressSpace() : 0};
}

/// Returns \p ScalarTy itself when \p NumElements is 1; otherwise returns a
/// vector of \p NumElements elements of type \p ScalarTy.
static LLT scalarOrVector(uint16_t NumElements, LLT ScalarTy) {
  if (NumElements == 1)
    return ScalarTy;
  return LLT::vector(NumElements, ScalarTy);
}

/// Convenience overload: builds a scalar of \p ScalarSize bits and forwards
/// it, with \p NumElements, to the LLT-typed overload.
static LLT scalarOrVector(uint16_t NumElements, unsigned ScalarSize) {
  LLT EltTy = LLT::scalar(ScalarSize);
  return scalarOrVector(NumElements, EltTy);
}

/// Constructs a type from its raw description by forwarding every argument
/// to init().
explicit LLT(bool isPointer, bool isVector, uint16_t NumElements,
             unsigned SizeInBits, unsigned AddressSpace) {
  init(isPointer, isVector, NumElements, SizeInBits, AddressSpace);
}
/// Constructs a type with RawData == 0, which isValid() reports as invalid.
explicit LLT() : IsPointer(false), IsVector(false), RawData(0) {}

/// Constructs a type from a machine value type; defined outside this class
/// body.
explicit LLT(MVT VT);

/// True when the type carries any data (RawData is non-zero).
bool isValid() const { return RawData != 0; }

/// True for a valid type that is neither a pointer nor a vector.
bool isScalar() const { return isValid() && !IsPointer && !IsVector; }

/// True for a valid non-vector pointer type; false for vectors of pointers.
bool isPointer() const { return isValid() && IsPointer && !IsVector; }

/// True for a valid vector type, whatever its element kind.
bool isVector() const { return isValid() && IsVector; }
2
←
Returning value, which participates in a condition later→
6
←
Returning zero, which participates in a condition later→

/// Returns the number of elements in a vector LLT. Must only be called on
/// vector types.
/// The count is read from a different field depending on whether the vector's
/// elements are pointers.
uint16_t getNumElements() const {
  assert(IsVector && "cannot get number of elements on scalar/aggregate")(static_cast <bool> (IsVector && "cannot get number of elements on scalar/aggregate"
) ? void (0) : __assert_fail ("IsVector && \"cannot get number of elements on scalar/aggregate\""
, "/build/llvm-toolchain-snapshot-13~++20210621111111+acefe0eaaf82/llvm/include/llvm/Support/LowLevelTypeImpl.h"
, 101, __extension__ __PRETTY_FUNCTION__));
  if (!IsPointer)
    return getFieldValue(VectorElementsFieldInfo);
  else
    return getFieldValue(PointerVectorElementsFieldInfo);
}

/// Returns the total size of the type. Must only be called on sized types.
/// For scalars and non-vector pointers this is the scalar size; for every
/// other type it is the scalar size multiplied by the element count.
/// Note that isPointer() and isScalar() are both false for an invalid type,
/// so such a type takes the multiplication path.
unsigned getSizeInBits() const {
  if (isPointer() || isScalar())
9
←
Taking false branch→
    return getScalarSizeInBits();
  return getScalarSizeInBits() * getNumElements();
10
←
Returning zero→
}

/// Returns the size of the type in whole bytes: the bit size rounded up to
/// the next multiple of eight, divided by eight. Must only be called on sized
/// types.
unsigned getSizeInBytes() const {
  const unsigned Bits = getSizeInBits();
  return (Bits + 7) / 8;
}

/// Returns the element type of a vector, or the type itself when it is not a
/// vector.
LLT getScalarType() const {
  if (isVector())
    return getElementType();
  return *this;
}

/// For a vector, returns a vector with the same element count whose elements
/// are \p NewEltTy. For any other type, returns \p NewEltTy itself.
LLT changeElementType(LLT NewEltTy) const {
  if (!isVector())
    return NewEltTy;
  return LLT::vector(getNumElements(), NewEltTy);
}

/// If this type is a vector, return a vector with the same number of elements
/// but the new element size. Otherwise, return the new element type. Invalid
/// for pointer types. For pointer types, use changeElementType.
/// The pointer restriction is asserted on the scalar type, so it also covers
/// vectors of pointers.
LLT changeElementSize(unsigned NewEltSize) const {
  assert(!getScalarType().isPointer() &&(static_cast <bool> (!getScalarType().isPointer() &&
 "invalid to directly change element size for pointers") ? void
 (0) : __assert_fail ("!getScalarType().isPointer() && \"invalid to directly change element size for pointers\""
, "/build/llvm-toolchain-snapshot-13~++20210621111111+acefe0eaaf82/llvm/include/llvm/Support/LowLevelTypeImpl.h"
, 136, __extension__ __PRETTY_FUNCTION__))
         "invalid to directly change element size for pointers")(static_cast <bool> (!getScalarType().isPointer() &&
 "invalid to directly change element size for pointers") ? void
 (0) : __assert_fail ("!getScalarType().isPointer() && \"invalid to directly change element size for pointers\""
, "/build/llvm-toolchain-snapshot-13~++20210621111111+acefe0eaaf82/llvm/include/llvm/Support/LowLevelTypeImpl.h"
, 136, __extension__ __PRETTY_FUNCTION__));
  return isVector() ? LLT::vector(getNumElements(), NewEltSize)
                    : LLT::scalar(NewEltSize);
}

/// Builds a type with this type's scalar (element) type and \p NewNumElts
/// elements, delegating the scalar-vs-vector choice to scalarOrVector.
LLT changeNumElements(unsigned NewNumElts) const {
  const LLT EltTy = getScalarType();
  return LLT::scalarOrVector(NewNumElts, EltTy);
}

/// Return a type that is \p Factor times smaller. Reduces the number of
/// elements if this is a vector, or the bitwidth for scalar/pointers. Does
/// not attempt to handle cases that aren't evenly divisible: divisibility is
/// only asserted, and \p Factor must not be 1.
LLT divide(int Factor) const {
  assert(Factor != 1);
  if (isVector()) {
    // Vectors shrink by element count; the element type is preserved.
    assert(getNumElements() % Factor == 0);
    return scalarOrVector(getNumElements() / Factor, getElementType());
  }

  // Non-vectors shrink by bit width and always come back as a plain scalar.
  assert(getSizeInBits() % Factor == 0);
  return scalar(getSizeInBits() / Factor);
}

/// True when the size in bits is an exact multiple of eight.
bool isByteSized() const {
  return getSizeInBits() % 8 == 0;
}

/// Returns the size field stored for this type: the size in bits for a scalar
/// or pointer, or the per-element size for a vector. Which bitfield is read
/// depends on the IsVector/IsPointer combination. Asserts that the type is
/// valid (RawData != 0).
unsigned getScalarSizeInBits() const {
  assert(RawData != 0 && "Invalid Type");
  if (!IsVector) {
    if (!IsPointer)
      return getFieldValue(ScalarSizeFieldInfo);
    else
      return getFieldValue(PointerSizeFieldInfo);
  } else {
    if (!IsPointer)
      return getFieldValue(VectorSizeFieldInfo);
    else
      return getFieldValue(PointerVectorSizeFieldInfo);
  }
}

/// Returns the address space stored for a pointer or vector-of-pointers type.
/// Asserts that the type is valid (RawData != 0) and that IsPointer is set.
unsigned getAddressSpace() const {
  assert(RawData != 0 && "Invalid Type");
  assert(IsPointer && "cannot get address space of non-pointer type");
  // The address-space field sits at a different offset for vectors.
  if (!IsVector)
    return getFieldValue(PointerAddressSpaceFieldInfo);
  else
    return getFieldValue(PointerVectorAddressSpaceFieldInfo);
}

/// Returns the vector's element type. Only valid for vector types (asserted).
///
/// When IsPointer is set the element is rebuilt as a pointer with this type's
/// address space and element size; otherwise it is a scalar of the element
/// size.
LLT getElementType() const {
  assert(isVector() && "cannot get element type of scalar/aggregate");
  if (IsPointer)
    return pointer(getAddressSpace(), getScalarSizeInBits());
  else
    return scalar(getScalarSizeInBits());
}

/// Prints this type to \p OS. Only declared here; the definition is not part
/// of this section of the file.
void print(raw_ostream &OS) const;

198#if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP)
LLVM_DUMP_METHOD__attribute__((noinline)) __attribute__((__used__)) void dump() const {
  print(dbgs());
  dbgs() << '\n';
}
203#endif

/// Two LLTs compare equal when the pointer flag, the vector flag and the raw
/// payload all match.
bool operator==(const LLT &RHS) const {
  if (IsPointer != RHS.IsPointer || IsVector != RHS.IsVector)
    return false;
  return RawData == RHS.RawData;
}

/// Negation of operator==.
bool operator!=(const LLT &RHS) const {
  const bool Same = (*this == RHS);
  return !Same;
}

// DenseMapInfo<LLT> needs private access: it sets IsPointer/IsVector directly
// to build its sentinel keys and hashes through getUniqueRAWLLTData().
friend struct DenseMapInfo<LLT>;
// NOTE(review): GISelInstProfileBuilder is not visible in this section;
// presumably it needs the raw encoding — confirm against its definition.
friend class GISelInstProfileBuilder;

215private:
/// An LLT occupies 64 bits:
/// isPointer : 1
/// isVector  : 1
/// leaving 62 bits of Kind-specific data, which are packed as bitfields as
/// described below. Because there is no simple portable way to pack bits into
/// bitfields, the individual fields of the packed structure are described by
/// the static const *FieldInfo variables. Each of those variables is a
/// 2-element array: element 0 is the bitfield size and element 1 is the
/// bitfield offset.
using BitFieldInfo = int[2];
///
/// Bitfield packing for each Kind ({size, offset} pairs):
/// * Invalid:
///   encoded as RawData == 0. This can never collide with a valid encoding,
///   because valid encodings have SizeInBits/SizeOfElement larger than 0.
/// * Non-pointer scalar (isPointer == 0 && isVector == 0):
///   SizeInBits: 32;
static constexpr BitFieldInfo ScalarSizeFieldInfo{32, 0};
/// * Pointer (isPointer == 1 && isVector == 0):
///   SizeInBits: 16;
///   AddressSpace: 24;
static constexpr BitFieldInfo PointerSizeFieldInfo{16, 0};
// Each following field starts where the previous one ends (offset + size).
static constexpr BitFieldInfo PointerAddressSpaceFieldInfo{
    24, PointerSizeFieldInfo[1] + PointerSizeFieldInfo[0]};
/// * Vector-of-non-pointer (isPointer == 0 && isVector == 1):
///   NumElements: 16;
///   SizeOfElement: 32;
static constexpr BitFieldInfo VectorElementsFieldInfo{16, 0};
static constexpr BitFieldInfo VectorSizeFieldInfo{
    32, VectorElementsFieldInfo[1] + VectorElementsFieldInfo[0]};
/// * Vector-of-pointer (isPointer == 1 && isVector == 1):
///   NumElements: 16;
///   SizeOfElement: 16;
///   AddressSpace: 24;
static constexpr BitFieldInfo PointerVectorElementsFieldInfo{16, 0};
static constexpr BitFieldInfo PointerVectorSizeFieldInfo{
    16,
    PointerVectorElementsFieldInfo[1] + PointerVectorElementsFieldInfo[0]};
static constexpr BitFieldInfo PointerVectorAddressSpaceFieldInfo{
    24, PointerVectorSizeFieldInfo[1] + PointerVectorSizeFieldInfo[0]};

// Storage: two 1-bit kind flags plus a 62-bit Kind-specific payload (the
// declared bit widths sum to 64). RawData == 0 is treated as the invalid type
// by the accessors that assert on it.
uint64_t IsPointer : 1;
uint64_t IsVector : 1;
uint64_t RawData : 62;

/// Returns a mask with the low FieldInfo[0] bits set, i.e. a right-aligned
/// mask as wide as the field.
static uint64_t getMask(const BitFieldInfo FieldInfo) {
  const int Width = FieldInfo[0];
  const uint64_t OnePastMax = static_cast<uint64_t>(1) << Width;
  return OnePastMax - 1;
}
/// Places \p Val into a field: masks it with \p Mask (a right-aligned field
/// mask) and shifts the result left by \p Shift bits. Asserts that \p Val
/// does not exceed \p Mask, i.e. that it fits in the field.
static uint64_t maskAndShift(uint64_t Val, uint64_t Mask, uint8_t Shift) {
  assert(Val <= Mask && "Value too large for field");
  return (Val & Mask) << Shift;
}
static uint64_t maskAndShift(uint64_t Val, const BitFieldInfo FieldInfo) {
  return maskAndShift(Val, getMask(FieldInfo), FieldInfo[1]);
}
/// Extracts one field from RawData: shifts the payload right by the field
/// offset (FieldInfo[1]) and keeps only the field's bits.
uint64_t getFieldValue(const BitFieldInfo FieldInfo) const {
  const uint64_t Shifted = RawData >> FieldInfo[1];
  return Shifted & getMask(FieldInfo);
}

/// Sets the IsPointer/IsVector flags and packs the remaining components into
/// RawData using the field layout that matches the flag combination.
///
/// \p NumElements is only stored for vectors and must then be greater than 1
/// (asserted). \p AddressSpace is only stored for pointers and vectors of
/// pointers. Each stored value must fit its field (asserted in maskAndShift).
void init(bool IsPointer, bool IsVector, uint16_t NumElements,
          unsigned SizeInBits, unsigned AddressSpace) {
  // The parameters shadow the members, hence the explicit this->.
  this->IsPointer = IsPointer;
  this->IsVector = IsVector;
  if (!IsVector) {
    if (!IsPointer)
      RawData = maskAndShift(SizeInBits, ScalarSizeFieldInfo);
    else
      RawData = maskAndShift(SizeInBits, PointerSizeFieldInfo) |
                maskAndShift(AddressSpace, PointerAddressSpaceFieldInfo);
  } else {
    assert(NumElements > 1 && "invalid number of vector elements");
    if (!IsPointer)
      RawData = maskAndShift(NumElements, VectorElementsFieldInfo) |
                maskAndShift(SizeInBits, VectorSizeFieldInfo);
    else
      RawData =
          maskAndShift(NumElements, PointerVectorElementsFieldInfo) |
          maskAndShift(SizeInBits, PointerVectorSizeFieldInfo) |
          maskAndShift(AddressSpace, PointerVectorAddressSpaceFieldInfo);
  }
}

/// Combines the whole type into one 64-bit value: RawData in bits 2 and up,
/// IsPointer in bit 1 and IsVector in bit 0.
uint64_t getUniqueRAWLLTData() const {
  const uint64_t DataBits = static_cast<uint64_t>(RawData) << 2;
  const uint64_t PointerBit = static_cast<uint64_t>(IsPointer) << 1;
  const uint64_t VectorBit = static_cast<uint64_t>(IsVector);
  return DataBits | PointerBit | VectorBit;
}
303};

305inline raw_ostream& operator<<(raw_ostream &OS, const LLT &Ty) {
Ty.print(OS);
return OS;
308}

310template<> struct DenseMapInfo<LLT> {
static inline LLT getEmptyKey() {
  LLT Invalid;
  Invalid.IsPointer = true;
  return Invalid;
}
static inline LLT getTombstoneKey() {
  LLT Invalid;
  Invalid.IsVector = true;
  return Invalid;
}
static inline unsigned getHashValue(const LLT &Ty) {
  uint64_t Val = Ty.getUniqueRAWLLTData();
  return DenseMapInfo<uint64_t>::getHashValue(Val);
}
static bool isEqual(const LLT &LHS, const LLT &RHS) {
  return LHS == RHS;
}
328};

330}

332#endif // LLVM_SUPPORT_LOWLEVELTYPEIMPL_H