doxygen/NVPTXSubtarget_8cpp_source.html

//===- NVPTXSubtarget.cpp - NVPTX Subtarget Information -------------------===//

//

// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.

// See https://llvm.org/LICENSE.txt for license information.

// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception

//

//===----------------------------------------------------------------------===//

//

// This file implements the NVPTX specific subclass of TargetSubtarget.

//

//===----------------------------------------------------------------------===//


#include "NVPTXSubtarget.h"

#include "NVPTXTargetMachine.h"


using namespace llvm;


#define DEBUG_TYPE "nvptx-subtarget"


#define GET_SUBTARGETINFO_ENUM

#define GET_SUBTARGETINFO_TARGET_DESC

#define GET_SUBTARGETINFO_CTOR

#include "NVPTXGenSubtargetInfo.inc"


// Hidden command-line option "nvptx-no-f16-math"; it defaults to false.
// NVPTXSubtarget::allowFP16Math() consults this flag: when it is set, that
// query returns false regardless of what hasFP16Math() reports.
static cl::opt<bool>

    NoF16Math("nvptx-no-f16-math", cl::Hidden,

              cl::desc("NVPTX Specific: Disable generation of f16 math ops."),

              cl::init(false));

// Intentionally empty out-of-line definition: its only job is to pin the
// class's vtable to this file.
void NVPTXSubtarget::anchor() {
}


// Resolves the target name, parses the subtarget feature string and fills in
// the version fields that depend on it. Returns *this so the call can be used
// inline as a constructor argument.
NVPTXSubtarget &NVPTXSubtarget::initializeSubtargetDependencies(StringRef CPU,
                                                                StringRef FS) {
  // An empty CPU name falls back to the default, sm_30.
  const StringRef EffectiveCPU = CPU.empty() ? StringRef("sm_30") : CPU;
  TargetName = std::string(EffectiveCPU);

  // The resolved target name serves as both the CPU and the tuning CPU.
  ParseSubtargetFeatures(TargetName, /*TuneCPU*/ TargetName, FS);

  // Refresh SmVersion now that features have been parsed. SmVersion holds the
  // regular SM number, which has a relative order; FullSmVersion additionally
  // tells sm_90 apart from sm_90a, which would *not* be a subset of sm_91.
  SmVersion = getSmVersion();

  // If no PTX version has been selected, default to PTX 6.0 (CUDA 9.0).
  if (PTXVersion == 0)
    PTXVersion = 60;

  return *this;
}


// Builds the subtarget for the given triple, CPU name and feature string.
//
// PTXVersion and FullSmVersion are first given placeholder values (0 and 200).
// The argument expression for TLInfo then calls
// initializeSubtargetDependencies(CPU, FS), which resolves the target name,
// runs ParseSubtargetFeatures, recomputes SmVersion and applies the PTX
// version default; its return value (*this) is what gets passed to TLInfo.
//
// NOTE(review): this depends on the members being initialized in the order
// written here, i.e. on their declaration order in NVPTXSubtarget.h -- confirm
// before reordering any of them.
NVPTXSubtarget::NVPTXSubtarget(const Triple &TT, const std::string &CPU,

                               const std::string &FS,

                               const NVPTXTargetMachine &TM)

    // The CPU name is passed as the tuning CPU as well.
    : NVPTXGenSubtargetInfo(TT, CPU, /*TuneCPU*/ CPU, FS), PTXVersion(0),

      FullSmVersion(200), SmVersion(getSmVersion()), TM(TM),

      TLInfo(TM, initializeSubtargetDependencies(CPU, FS)) {}


// Reports whether image handles are enabled for this subtarget.
bool NVPTXSubtarget::hasImageHandles() const {
  // Handles stay disabled for every driver interface other than CUDA.
  if (TM.getDrvInterface() != NVPTX::CUDA)
    return false;

  // Under CUDA, handles are enabled for Kepler+ (SmVersion >= 30), where
  // indirect surfaces and textures are supported.
  return SmVersion >= 30;
}


// Returns true only when the subtarget has FP16 math and the
// "nvptx-no-f16-math" option has not been set.
bool NVPTXSubtarget::allowFP16Math() const {
  // Without FP16 math support the option is never consulted.
  if (!hasFP16Math())
    return false;

  return !NoF16Math;
}

NoF16Math
static cl::opt< bool > NoF16Math("nvptx-no-f16-math", cl::Hidden, cl::desc("NVPTX Specific: Disable generation of f16 math ops."), cl::init(false))

NVPTXSubtarget.h

NVPTXTargetMachine.h

SmVersion
unsigned SmVersion
Definition: NVVMReflect.cpp:81

TM
const char LLVMTargetMachineRef TM
Definition: PassBuilderBindings.cpp:47

NVPTXGenSubtargetInfo

llvm::NVPTXSubtarget
Definition: NVPTXSubtarget.h:31

llvm::NVPTXSubtarget::hasImageHandles
bool hasImageHandles() const
Definition: NVPTXSubtarget.cpp:59

llvm::NVPTXSubtarget::ParseSubtargetFeatures
void ParseSubtargetFeatures(StringRef CPU, StringRef TuneCPU, StringRef FS)

llvm::NVPTXSubtarget::getSmVersion
unsigned int getSmVersion() const
Definition: NVPTXSubtarget.h:89

llvm::NVPTXSubtarget::allowFP16Math
bool allowFP16Math() const
Definition: NVPTXSubtarget.cpp:69

llvm::NVPTXSubtarget::NVPTXSubtarget
NVPTXSubtarget(const Triple &TT, const std::string &CPU, const std::string &FS, const NVPTXTargetMachine &TM)
This constructor initializes the data members to match that of the specified module.
Definition: NVPTXSubtarget.cpp:52

llvm::NVPTXSubtarget::initializeSubtargetDependencies
NVPTXSubtarget & initializeSubtargetDependencies(StringRef CPU, StringRef FS)
Definition: NVPTXSubtarget.cpp:32

llvm::NVPTXSubtarget::hasFP16Math
bool hasFP16Math() const
Definition: NVPTXSubtarget.h:83

llvm::NVPTXTargetMachine
NVPTXTargetMachine.
Definition: NVPTXTargetMachine.h:25

llvm::NVPTXTargetMachine::getDrvInterface
NVPTX::DrvInterface getDrvInterface() const
Definition: NVPTXTargetMachine.h:47

llvm::StringRef
StringRef - Represent a constant reference to a string, i.e.
Definition: StringRef.h:50

llvm::StringRef::empty
constexpr bool empty() const
empty - Check if the string is empty.
Definition: StringRef.h:134

llvm::Triple
Triple - Helper class for working with autoconf configuration names.
Definition: Triple.h:44

llvm::cl::opt
Definition: CommandLine.h:1430

llvm::NVPTX::CUDA
@ CUDA
Definition: NVPTX.h:80

llvm::cl::Hidden
@ Hidden
Definition: CommandLine.h:138

llvm::cl::init
initializer< Ty > init(const Ty &Val)
Definition: CommandLine.h:450

llvm
This is an optimization pass for GlobalISel generic memory operations.
Definition: AddressRanges.h:18

llvm::cl::desc
Definition: CommandLine.h:416