96 cl::desc(
"Lower GPU ctor / dtors to globals on the device."),
99#define DEPOTNAME "__local_depot"
109 if (
const User *U = dyn_cast<User>(V)) {
110 for (
unsigned i = 0, e = U->getNumOperands(); i != e; ++i) {
126 if (Visited.
count(GV))
130 if (!Visiting.
insert(GV).second)
148 NVPTX_MC::verifyInstructionPredicates(
MI->getOpcode(),
152 lowerToMCInst(
MI, Inst);
157bool NVPTXAsmPrinter::lowerImageHandleOperand(
const MachineInstr *
MI,
165 if (OpNo == 4 && MO.
isImm()) {
166 lowerImageHandleSymbol(MO.
getImm(), MCOp);
170 lowerImageHandleSymbol(MO.
getImm(), MCOp);
180 if (OpNo == VecSize && MO.
isImm()) {
181 lowerImageHandleSymbol(MO.
getImm(), MCOp);
188 if (OpNo == 0 && MO.
isImm()) {
189 lowerImageHandleSymbol(MO.
getImm(), MCOp);
196 if (OpNo == 1 && MO.
isImm()) {
197 lowerImageHandleSymbol(MO.
getImm(), MCOp);
207void NVPTXAsmPrinter::lowerImageHandleSymbol(
unsigned Index,
MCOperand &MCOp) {
220 if (
MI->getOpcode() == NVPTX::CALL_PROTOTYPE) {
227 for (
unsigned i = 0, e =
MI->getNumOperands(); i != e; ++i) {
231 if (lowerImageHandleOperand(
MI, i, MCOp)) {
236 if (lowerOperand(MO, MCOp))
290unsigned NVPTXAsmPrinter::encodeVirtualRegister(
unsigned Reg) {
295 unsigned RegNum = RegMap[
Reg];
300 if (RC == &NVPTX::Int1RegsRegClass) {
302 }
else if (RC == &NVPTX::Int16RegsRegClass) {
304 }
else if (RC == &NVPTX::Int32RegsRegClass) {
306 }
else if (RC == &NVPTX::Int64RegsRegClass) {
308 }
else if (RC == &NVPTX::Float32RegsRegClass) {
310 }
else if (RC == &NVPTX::Float64RegsRegClass) {
312 }
else if (RC == &NVPTX::Int128RegsRegClass) {
319 Ret |= (RegNum & 0x0FFFFFFF);
324 return Reg & 0x0FFFFFFF;
345 Type *Ty =
F->getReturnType();
357 if (
auto *ITy = dyn_cast<IntegerType>(Ty)) {
358 size = ITy->getBitWidth();
364 O <<
".param .b" <<
size <<
" func_retval0";
365 }
else if (isa<PointerType>(Ty)) {
366 O <<
".param .b" << TLI->getPointerTy(
DL).getSizeInBits()
369 unsigned totalsz =
DL.getTypeAllocSize(Ty);
370 Align RetAlignment = TLI->getFunctionArgumentAlignment(
372 O <<
".param .align " << RetAlignment.
value() <<
" .b8 func_retval0["
380 for (
unsigned i = 0, e = vtparts.
size(); i != e; ++i) {
382 EVT elemtype = vtparts[i];
384 elems = vtparts[i].getVectorNumElements();
385 elemtype = vtparts[i].getVectorElementType();
388 for (
unsigned j = 0, je = elems;
j != je; ++
j) {
392 O <<
".reg .b" << sz <<
" func_retval" << idx;
407 printReturnValStr(&F, O);
412bool NVPTXAsmPrinter::isLoopHeaderOfNoUnroll(
414 MachineLoopInfo &LI = getAnalysis<MachineLoopInfoWrapperPass>().getLI();
427 if (
const BasicBlock *PBB = PMBB->getBasicBlock()) {
429 PBB->getTerminator()->getMetadata(LLVMContext::MD_loop)) {
432 if (
MDNode *UnrollCountMD =
434 if (mdconst::extract<ConstantInt>(UnrollCountMD->getOperand(1))
446 if (isLoopHeaderOfNoUnroll(
MBB))
450void NVPTXAsmPrinter::emitFunctionEntryLabel() {
454 if (!GlobalsEmitted) {
456 GlobalsEmitted =
true;
462 emitLinkageDirective(F, O);
467 printReturnValStr(*
MF, O);
472 emitFunctionParamList(F, O);
476 emitKernelFunctionDirectives(*F, O);
486 setAndEmitFunctionVirtualRegisters(*
MF);
487 encodeDebugInfoRegisterNumbers(*
MF);
491 if (!SP->getUnit()->isDebugDirectivesOnly())
507void NVPTXAsmPrinter::emitFunctionBodyStart() {
514void NVPTXAsmPrinter::emitFunctionBodyEnd() {
524void NVPTXAsmPrinter::emitImplicitDef(
const MachineInstr *
MI)
const {
537void NVPTXAsmPrinter::emitKernelFunctionDirectives(
const Function &
F,
546 if (Reqntidx || Reqntidy || Reqntidz)
547 O <<
".reqntid " << Reqntidx.value_or(1) <<
", " << Reqntidy.value_or(1)
548 <<
", " << Reqntidz.value_or(1) <<
"\n";
557 if (Maxntidx || Maxntidy || Maxntidz)
558 O <<
".maxntid " << Maxntidx.value_or(1) <<
", " << Maxntidy.value_or(1)
559 <<
", " << Maxntidz.value_or(1) <<
"\n";
562 O <<
".minnctapersm " << *Mincta <<
"\n";
565 O <<
".maxnreg " << *Maxnreg <<
"\n";
577 if (ClusterX || ClusterY || ClusterZ) {
578 O <<
".explicitcluster\n";
579 if (ClusterX.value_or(1) != 0) {
580 assert(ClusterY.value_or(1) && ClusterZ.value_or(1) &&
581 "cluster_dim_x != 0 implies cluster_dim_y and cluster_dim_z "
582 "should be non-zero as well");
584 O <<
".reqnctapercluster " << ClusterX.value_or(1) <<
", "
585 << ClusterY.value_or(1) <<
", " << ClusterZ.value_or(1) <<
"\n";
587 assert(!ClusterY.value_or(1) && !ClusterZ.value_or(1) &&
588 "cluster_dim_x == 0 implies cluster_dim_y and cluster_dim_z "
589 "should be 0 as well");
593 O <<
".maxclusterrank " << *Maxclusterrank <<
"\n";
604 assert(
I != VRegMapping.
end() &&
"Bad register class");
608 assert(VI != RegMap.
end() &&
"Bad virtual register");
609 unsigned MappedVR = VI->second;
616void NVPTXAsmPrinter::emitVirtualRegister(
unsigned int vr,
621void NVPTXAsmPrinter::emitAliasDeclaration(
const GlobalAlias *GA,
626 "NVPTX aliasee must be a non-kernel function definition");
632 emitDeclarationWithName(F,
getSymbol(GA), O);
636 emitDeclarationWithName(F,
getSymbol(F), O);
641 emitLinkageDirective(F, O);
646 printReturnValStr(F, O);
649 emitFunctionParamList(F, O);
661 return GV->getName() !=
"llvm.used";
664 for (
const User *U :
C->users())
665 if (
const Constant *
C = dyn_cast<Constant>(U))
673 if (
const GlobalVariable *othergv = dyn_cast<GlobalVariable>(U)) {
674 if (othergv->getName() ==
"llvm.used")
679 if (
instr->getParent() &&
instr->getParent()->getParent()) {
681 if (oneFunc && (curFunc != oneFunc))
689 for (
const User *UU : U->users())
723 for (
const User *U :
C->users()) {
724 if (
const Constant *cu = dyn_cast<Constant>(U)) {
727 }
else if (
const Instruction *
I = dyn_cast<Instruction>(U)) {
744 if (
F.getAttributes().hasFnAttr(
"nvptx-libcall-callee")) {
745 emitDeclaration(&F, O);
749 if (
F.isDeclaration()) {
752 if (
F.getIntrinsicID())
754 emitDeclaration(&F, O);
757 for (
const User *U :
F.users()) {
758 if (
const Constant *
C = dyn_cast<Constant>(U)) {
763 emitDeclaration(&F, O);
769 emitDeclaration(&F, O);
774 if (!isa<Instruction>(U))
788 emitDeclaration(&F, O);
795 emitAliasDeclaration(&GA, O);
799 if (!GV)
return true;
801 if (!InitList)
return true;
805void NVPTXAsmPrinter::emitStartOfAsmFile(
Module &M) {
815 emitHeader(M, OS1, *STI);
827 bool IsOpenMP = M.getModuleFlag(
"openmp") !=
nullptr;
832 "Module has a nontrivial global ctor, which NVPTX does not support.");
838 "Module has a nontrivial global dtor, which NVPTX does not support.");
845 GlobalsEmitted =
false;
850void NVPTXAsmPrinter::emitGlobals(
const Module &M) {
854 emitDeclarations(M, OS2);
869 assert(GVVisited.
size() == M.global_size() &&
"Missed a global variable");
870 assert(GVVisiting.
size() == 0 &&
"Did not fully process a global variable");
878 printModuleLevelGV(GV, OS2,
false, STI);
900 O <<
"// Generated by LLVM NVPTX Back-End\n";
905 O <<
".version " << (PTXVersion / 10) <<
"." << (PTXVersion % 10) <<
"\n";
912 O <<
", texmode_independent";
914 bool HasFullDebugInfo =
false;
916 switch(
CU->getEmissionKind()) {
922 HasFullDebugInfo =
true;
925 if (HasFullDebugInfo)
928 if (HasFullDebugInfo)
933 O <<
".address_size ";
946 if (!GlobalsEmitted) {
948 GlobalsEmitted =
true;
962 OutStreamer->emitRawText(
"\t.section\t.debug_macinfo\t{\t}");
966 TS->outputDwarfFileDirectives();
984void NVPTXAsmPrinter::emitLinkageDirective(
const GlobalValue *V,
987 if (V->hasExternalLinkage()) {
988 if (isa<GlobalVariable>(V)) {
996 }
else if (
V->isDeclaration())
1000 }
else if (
V->hasAppendingLinkage()) {
1002 msg.append(
"Error: ");
1003 msg.append(
"Symbol ");
1005 msg.append(std::string(
V->getName()));
1006 msg.append(
"has unsupported appending linkage type");
1008 }
else if (!
V->hasInternalLinkage() &&
1009 !
V->hasPrivateLinkage()) {
1015void NVPTXAsmPrinter::printModuleLevelGV(
const GlobalVariable *GVar,
1062 emitPTXGlobalVariable(GVar, O, STI);
1070 const Constant *Initializer =
nullptr;
1075 CI = dyn_cast<ConstantInt>(Initializer);
1084 O <<
"addr_mode_" << i <<
" = ";
1090 O <<
"clamp_to_border";
1093 O <<
"clamp_to_edge";
1104 O <<
"filter_mode = ";
1119 O <<
", force_unnormalized_coords = 1";
1129 if (strncmp(GVar->
getName().
data(),
"unrollpragma", 12) == 0)
1133 if (strncmp(GVar->
getName().
data(),
"filename", 8) == 0)
1139 const Function *demotedFunc =
nullptr;
1141 O <<
"// " << GVar->
getName() <<
" has been demoted\n";
1142 localDecls[demotedFunc].push_back(GVar);
1152 ".attribute(.managed) requires PTX version >= 4.0 and sm_30");
1154 O <<
" .attribute(.managed)";
1158 O <<
" .align " <<
A->value();
1160 O <<
" .align " << (int)
DL.getPrefTypeAlign(ETy).value();
1169 O << getPTXFundamentalTypeStr(ETy,
false);
1180 if (!Initializer->
isNullValue() && !isa<UndefValue>(Initializer)) {
1182 printScalarConstant(Initializer, O);
1191 "' is not allowed in addrspace(" +
1208 ElementSize =
DL.getTypeStoreSize(ETy);
1215 if (!isa<UndefValue>(Initializer) && !Initializer->
isNullValue()) {
1216 AggBuffer aggBuffer(ElementSize, *
this);
1217 bufferAggregateConstant(Initializer, &aggBuffer);
1218 if (aggBuffer.numSymbols()) {
1220 if (ElementSize % ptrSize ||
1221 !aggBuffer.allSymbolsAligned(ptrSize)) {
1225 "initialized packed aggregate with pointers '" +
1227 "' requires at least PTX ISA version 7.1");
1230 O <<
"[" << ElementSize <<
"] = {";
1231 aggBuffer.printBytes(O);
1234 O <<
" .u" << ptrSize * 8 <<
" ";
1236 O <<
"[" << ElementSize / ptrSize <<
"] = {";
1237 aggBuffer.printWords(O);
1243 O <<
"[" << ElementSize <<
"] = {";
1244 aggBuffer.printBytes(O);
1273void NVPTXAsmPrinter::AggBuffer::printSymbol(
unsigned nSym,
raw_ostream &os) {
1274 const Value *
v = Symbols[nSym];
1275 const Value *v0 = SymbolsBeforeStripping[nSym];
1276 if (
const GlobalValue *GVar = dyn_cast<GlobalValue>(v)) {
1280 bool isGenericPointer = PTy && PTy->getAddressSpace() == 0;
1281 if (EmitGeneric && isGenericPointer && !isa<Function>(v)) {
1283 Name->print(os, AP.MAI);
1286 Name->print(os, AP.MAI);
1288 }
else if (
const ConstantExpr *CExpr = dyn_cast<ConstantExpr>(v0)) {
1289 const MCExpr *Expr = AP.lowerConstantForGV(cast<Constant>(CExpr),
false);
1290 AP.printMCExpr(*Expr, os);
1295void NVPTXAsmPrinter::AggBuffer::printBytes(
raw_ostream &os) {
1296 unsigned int ptrSize = AP.MAI->getCodePointerSize();
1301 unsigned int InitializerCount =
size;
1304 if (numSymbols() == 0)
1305 while (InitializerCount >= 1 && !buffer[InitializerCount - 1])
1308 symbolPosInBuffer.push_back(InitializerCount);
1309 unsigned int nSym = 0;
1310 unsigned int nextSymbolPos = symbolPosInBuffer[nSym];
1311 for (
unsigned int pos = 0; pos < InitializerCount;) {
1314 if (pos != nextSymbolPos) {
1315 os << (
unsigned int)buffer[pos];
1322 std::string symText;
1324 printSymbol(nSym, oss);
1325 for (
unsigned i = 0; i < ptrSize; ++i) {
1329 os <<
"(" << symText <<
")";
1332 nextSymbolPos = symbolPosInBuffer[++nSym];
1333 assert(nextSymbolPos >= pos);
1337void NVPTXAsmPrinter::AggBuffer::printWords(
raw_ostream &os) {
1338 unsigned int ptrSize = AP.MAI->getCodePointerSize();
1339 symbolPosInBuffer.push_back(size);
1340 unsigned int nSym = 0;
1341 unsigned int nextSymbolPos = symbolPosInBuffer[nSym];
1342 assert(nextSymbolPos % ptrSize == 0);
1343 for (
unsigned int pos = 0; pos <
size; pos += ptrSize) {
1346 if (pos == nextSymbolPos) {
1347 printSymbol(nSym, os);
1348 nextSymbolPos = symbolPosInBuffer[++nSym];
1349 assert(nextSymbolPos % ptrSize == 0);
1350 assert(nextSymbolPos >= pos + ptrSize);
1351 }
else if (ptrSize == 4)
1359 auto It = localDecls.find(f);
1360 if (It == localDecls.end())
1363 std::vector<const GlobalVariable *> &gvars = It->second;
1370 O <<
"\t// demoted variable\n\t";
1371 printModuleLevelGV(GV, O,
true, STI);
1375void NVPTXAsmPrinter::emitPTXAddressSpace(
unsigned int AddressSpace,
1398NVPTXAsmPrinter::getPTXFundamentalTypeStr(
Type *Ty,
bool useB4PTR)
const {
1401 unsigned NumBits = cast<IntegerType>(Ty)->getBitWidth();
1404 else if (NumBits <= 64) {
1405 std::string
name =
"u";
1406 return name + utostr(NumBits);
1424 assert((PtrSize == 64 || PtrSize == 32) &&
"Unexpected pointer size");
1442void NVPTXAsmPrinter::emitPTXGlobalVariable(
const GlobalVariable *GVar,
1455 ".attribute(.managed) requires PTX version >= 4.0 and sm_30");
1457 O <<
" .attribute(.managed)";
1460 O <<
" .align " <<
A->value();
1462 O <<
" .align " << (int)
DL.getPrefTypeAlign(ETy).value();
1474 O << getPTXFundamentalTypeStr(ETy);
1480 int64_t ElementSize = 0;
1490 ElementSize =
DL.getTypeStoreSize(ETy);
1513 unsigned paramIndex = 0;
1518 if (
F->arg_empty() && !
F->isVarArg()) {
1525 for (
I =
F->arg_begin(), E =
F->arg_end();
I != E; ++
I, paramIndex++) {
1526 Type *Ty =
I->getType();
1536 std::string ParamSym;
1538 ParamStr <<
F->getName() <<
"_param_" << paramIndex;
1544 O <<
"\t.param .u64 .ptr .surfref ";
1546 O <<
"\t.param .surfref ";
1547 O << TLI->getParamName(F, paramIndex);
1551 O <<
"\t.param .u64 .ptr .texref ";
1553 O <<
"\t.param .texref ";
1554 O << TLI->getParamName(F, paramIndex);
1558 O <<
"\t.param .u64 .ptr .samplerref ";
1560 O <<
"\t.param .samplerref ";
1561 O << TLI->getParamName(F, paramIndex);
1567 auto getOptimalAlignForParam = [TLI, &
DL, &PAL,
F,
1571 return StackAlign.
value();
1573 Align TypeAlign = TLI->getFunctionParamOptimizedAlign(F, Ty,
DL);
1574 MaybeAlign ParamAlign = PAL.getParamAlignment(paramIndex);
1575 return std::max(TypeAlign, ParamAlign.
valueOrOne());
1578 if (!PAL.hasParamAttr(paramIndex, Attribute::ByVal)) {
1584 Align OptimalAlign = getOptimalAlignForParam(Ty);
1586 O <<
"\t.param .align " << OptimalAlign.
value() <<
" .b8 ";
1587 O << TLI->getParamName(F, paramIndex);
1588 O <<
"[" <<
DL.getTypeAllocSize(Ty) <<
"]";
1593 auto *PTy = dyn_cast<PointerType>(Ty);
1594 unsigned PTySizeInBits = 0;
1597 TLI->getPointerTy(
DL, PTy->getAddressSpace()).getSizeInBits();
1598 assert(PTySizeInBits &&
"Invalid pointer size");
1603 O <<
"\t.param .u" << PTySizeInBits <<
" .ptr";
1605 switch (PTy->getAddressSpace()) {
1622 O <<
" .align " <<
I->getParamAlign().valueOrOne().value();
1623 O <<
" " << TLI->getParamName(F, paramIndex);
1633 O << getPTXFundamentalTypeStr(Ty);
1635 O << TLI->getParamName(F, paramIndex);
1641 if (isa<IntegerType>(Ty)) {
1642 sz = cast<IntegerType>(Ty)->getBitWidth();
1645 assert(PTySizeInBits &&
"Invalid pointer size");
1650 O <<
"\t.param .b" << sz <<
" ";
1652 O <<
"\t.reg .b" << sz <<
" ";
1653 O << TLI->getParamName(F, paramIndex);
1658 Type *ETy = PAL.getParamByValType(paramIndex);
1659 assert(ETy &&
"Param should have byval type");
1661 if (isABI || isKernelFunc) {
1666 Align OptimalAlign =
1668 ? getOptimalAlignForParam(ETy)
1669 : TLI->getFunctionByValParamAlign(
1670 F, ETy, PAL.getParamAlignment(paramIndex).valueOrOne(),
DL);
1672 unsigned sz =
DL.getTypeAllocSize(ETy);
1673 O <<
"\t.param .align " << OptimalAlign.
value() <<
" .b8 ";
1674 O << TLI->getParamName(F, paramIndex);
1675 O <<
"[" << sz <<
"]";
1684 for (
unsigned i = 0, e = vtparts.
size(); i != e; ++i) {
1686 EVT elemtype = vtparts[i];
1688 elems = vtparts[i].getVectorNumElements();
1689 elemtype = vtparts[i].getVectorElementType();
1692 for (
unsigned j = 0, je = elems;
j != je; ++
j) {
1696 O <<
"\t.reg .b" << sz <<
" ";
1697 O << TLI->getParamName(F, paramIndex);
1710 if (
F->isVarArg()) {
1715 O << TLI->getParamName(F, -1) <<
"[]";
1721void NVPTXAsmPrinter::setAndEmitFunctionVirtualRegisters(
1738 O <<
"\t.reg .b64 \t%SP;\n";
1739 O <<
"\t.reg .b64 \t%SPL;\n";
1741 O <<
"\t.reg .b32 \t%SP;\n";
1742 O <<
"\t.reg .b32 \t%SPL;\n";
1751 for (
unsigned i = 0; i < numVRs; i++) {
1755 int n = regmap.
size();
1756 regmap.
insert(std::make_pair(vr, n + 1));
1771 for (
unsigned i=0; i<
TRI->getNumRegClasses(); i++) {
1776 int n = regmap.
size();
1780 O <<
"\t.reg " << rcname <<
" \t" << rcStr <<
"<" << (n+1)
1790void NVPTXAsmPrinter::encodeDebugInfoRegisterNumbers(
1800 for (
auto &classMap : VRegMapping) {
1801 for (
auto ®isterMapping : classMap.getSecond()) {
1802 auto reg = registerMapping.getFirst();
1811 unsigned int numHex;
1830 if (
const ConstantInt *CI = dyn_cast<ConstantInt>(CPV)) {
1834 if (
const ConstantFP *CFP = dyn_cast<ConstantFP>(CPV)) {
1835 printFPConstant(CFP, O);
1838 if (isa<ConstantPointerNull>(CPV)) {
1842 if (
const GlobalValue *GVar = dyn_cast<GlobalValue>(CPV)) {
1843 bool IsNonGenericPointer =
false;
1845 IsNonGenericPointer =
true;
1847 if (EmitGeneric && !isa<Function>(CPV) && !IsNonGenericPointer) {
1856 if (
const ConstantExpr *Cexpr = dyn_cast<ConstantExpr>(CPV)) {
1857 const MCExpr *E = lowerConstantForGV(cast<Constant>(Cexpr),
false);
1864void NVPTXAsmPrinter::bufferLEByte(
const Constant *CPV,
int Bytes,
1865 AggBuffer *AggBuffer) {
1867 int AllocSize =
DL.getTypeAllocSize(CPV->
getType());
1871 AggBuffer->addZeros(Bytes ? Bytes : AllocSize);
1876 auto AddIntToBuffer = [AggBuffer, Bytes](
const APInt &Val) {
1877 size_t NumBytes = (Val.getBitWidth() + 7) / 8;
1883 for (
unsigned I = 0;
I < NumBytes - 1; ++
I) {
1884 Buf[
I] = Val.extractBitsAsZExtValue(8,
I * 8);
1886 size_t LastBytePosition = (NumBytes - 1) * 8;
1887 size_t LastByteBits = Val.getBitWidth() - LastBytePosition;
1889 Val.extractBitsAsZExtValue(LastByteBits, LastBytePosition);
1890 AggBuffer->addBytes(Buf.data(), NumBytes, Bytes);
1895 if (
const auto CI = dyn_cast<ConstantInt>(CPV)) {
1899 if (
const auto *Cexpr = dyn_cast<ConstantExpr>(CPV)) {
1900 if (
const auto *CI =
1905 if (Cexpr->getOpcode() == Instruction::PtrToInt) {
1906 Value *
V = Cexpr->getOperand(0)->stripPointerCasts();
1907 AggBuffer->addSymbol(V, Cexpr->getOperand(0));
1908 AggBuffer->addZeros(AllocSize);
1919 AddIntToBuffer(cast<ConstantFP>(CPV)->getValueAPF().bitcastToAPInt());
1923 if (
const GlobalValue *GVar = dyn_cast<GlobalValue>(CPV)) {
1924 AggBuffer->addSymbol(GVar, GVar);
1925 }
else if (
const ConstantExpr *Cexpr = dyn_cast<ConstantExpr>(CPV)) {
1926 const Value *
v = Cexpr->stripPointerCasts();
1927 AggBuffer->addSymbol(v, Cexpr);
1929 AggBuffer->addZeros(AllocSize);
1936 if (isa<ConstantAggregate>(CPV) || isa<ConstantDataSequential>(CPV)) {
1937 bufferAggregateConstant(CPV, AggBuffer);
1938 if (Bytes > AllocSize)
1939 AggBuffer->addZeros(Bytes - AllocSize);
1940 }
else if (isa<ConstantAggregateZero>(CPV))
1941 AggBuffer->addZeros(Bytes);
1952void NVPTXAsmPrinter::bufferAggregateConstant(
const Constant *CPV,
1953 AggBuffer *aggBuffer) {
1958 if (
const ConstantInt *CI = dyn_cast<ConstantInt>(CPV)) {
1960 for (
unsigned I = 0, E =
DL.getTypeAllocSize(CPV->
getType());
I < E; ++
I) {
1962 aggBuffer->addBytes(&Byte, 1, 1);
1969 if (isa<ConstantArray>(CPV) || isa<ConstantVector>(CPV)) {
1972 bufferLEByte(cast<Constant>(CPV->
getOperand(i)), 0, aggBuffer);
1977 dyn_cast<ConstantDataSequential>(CPV)) {
1978 if (CDS->getNumElements())
1979 for (
unsigned i = 0; i < CDS->getNumElements(); ++i)
1980 bufferLEByte(cast<Constant>(CDS->getElementAsConstant(i)), 0,
1985 if (isa<ConstantStruct>(CPV)) {
1990 Bytes =
DL.getStructLayout(ST)->getElementOffset(0) +
1991 DL.getTypeAllocSize(ST) -
1992 DL.getStructLayout(ST)->getElementOffset(i);
1994 Bytes =
DL.getStructLayout(ST)->getElementOffset(i + 1) -
1995 DL.getStructLayout(ST)->getElementOffset(i);
1996 bufferLEByte(cast<Constant>(CPV->
getOperand(i)), Bytes, aggBuffer);
2009NVPTXAsmPrinter::lowerConstantForGV(
const Constant *CV,
bool ProcessingGeneric) {
2015 if (
const ConstantInt *CI = dyn_cast<ConstantInt>(CV))
2018 if (
const GlobalValue *GV = dyn_cast<GlobalValue>(CV)) {
2021 if (ProcessingGeneric) {
2033 switch (
CE->getOpcode()) {
2037 case Instruction::AddrSpaceCast: {
2040 if (DstTy->getAddressSpace() == 0)
2041 return lowerConstantForGV(cast<const Constant>(
CE->getOperand(0)),
true);
2046 case Instruction::GetElementPtr: {
2050 APInt OffsetAI(
DL.getPointerTypeSizeInBits(
CE->getType()), 0);
2051 cast<GEPOperator>(CE)->accumulateConstantOffset(
DL, OffsetAI);
2053 const MCExpr *
Base = lowerConstantForGV(
CE->getOperand(0),
2058 int64_t
Offset = OffsetAI.getSExtValue();
2063 case Instruction::Trunc:
2069 case Instruction::BitCast:
2070 return lowerConstantForGV(
CE->getOperand(0), ProcessingGeneric);
2072 case Instruction::IntToPtr: {
2081 return lowerConstantForGV(
Op, ProcessingGeneric);
2086 case Instruction::PtrToInt: {
2092 Type *Ty =
CE->getType();
2094 const MCExpr *OpExpr = lowerConstantForGV(
Op, ProcessingGeneric);
2098 if (
DL.getTypeAllocSize(Ty) ==
DL.getTypeAllocSize(
Op->getType()))
2104 unsigned InBits =
DL.getTypeAllocSizeInBits(
Op->getType());
2111 case Instruction::Add: {
2112 const MCExpr *
LHS = lowerConstantForGV(
CE->getOperand(0), ProcessingGeneric);
2113 const MCExpr *
RHS = lowerConstantForGV(
CE->getOperand(1), ProcessingGeneric);
2114 switch (
CE->getOpcode()) {
2126 return lowerConstantForGV(
C, ProcessingGeneric);
2131 OS <<
"Unsupported expression in static initializer: ";
2132 CE->printAsOperand(
OS,
false,
2141 return cast<MCTargetExpr>(&Expr)->printImpl(
OS,
MAI);
2143 OS << cast<MCConstantExpr>(Expr).getValue();
2169 if (isa<MCConstantExpr>(BE.
getLHS()) || isa<MCSymbolRefExpr>(BE.
getLHS()) ||
2170 isa<NVPTXGenericMCSymbolRefExpr>(BE.
getLHS())) {
2182 if (RHSC->getValue() < 0) {
2183 OS << RHSC->getValue();
2194 if (isa<MCConstantExpr>(BE.
getRHS()) || isa<MCSymbolRefExpr>(BE.
getRHS())) {
2210bool NVPTXAsmPrinter::PrintAsmOperand(
const MachineInstr *
MI,
unsigned OpNo,
2212 if (ExtraCode && ExtraCode[0]) {
2213 if (ExtraCode[1] != 0)
2216 switch (ExtraCode[0]) {
2225 printOperand(
MI, OpNo, O);
2230bool NVPTXAsmPrinter::PrintAsmMemoryOperand(
const MachineInstr *
MI,
2232 const char *ExtraCode,
2234 if (ExtraCode && ExtraCode[0])
2238 printMemOperand(
MI, OpNo, O);
2244void NVPTXAsmPrinter::printOperand(
const MachineInstr *
MI,
unsigned OpNum,
2250 if (MO.
getReg() == NVPTX::VRDepot)
2255 emitVirtualRegister(MO.
getReg(), O);
2280void NVPTXAsmPrinter::printMemOperand(
const MachineInstr *
MI,
unsigned OpNum,
2282 printOperand(
MI, OpNum, O);
2284 if (Modifier && strcmp(Modifier,
"add") == 0) {
2286 printOperand(
MI, OpNum + 1, O);
2288 if (
MI->getOperand(OpNum + 1).isImm() &&
2289 MI->getOperand(OpNum + 1).getImm() == 0)
2292 printOperand(
MI, OpNum + 1, O);
static cl::opt< bool > LowerCtorDtor("amdgpu-lower-global-ctor-dtor", cl::desc("Lower GPU ctor / dtors to globals on the device."), cl::init(true), cl::Hidden)
This file declares a class to represent arbitrary precision floating point values and provide a varie...
This file implements a class to represent arbitrary precision integral constant values and operations...
MachineBasicBlock MachineBasicBlock::iterator DebugLoc DL
This file contains the simple types necessary to represent the attributes associated with functions a...
static GCRegistry::Add< ErlangGC > A("erlang", "erlang-compatible garbage collector")
#define LLVM_EXTERNAL_VISIBILITY
This file contains the declarations for the subclasses of Constant, which represent the different fla...
Looks at all the uses of the given value Returns the Liveness deduced from the uses of this value Adds all uses that cause the result to be MaybeLive to MaybeLiveRetUses If the result is MaybeLiveUses might be modified but its content should be ignored(since it might not be complete). DeadArgumentEliminationPass
This file defines the DenseMap class.
This file defines the DenseSet and SmallDenseSet classes.
static GCMetadataPrinterRegistry::Add< ErlangGCPrinter > X("erlang", "erlang-compatible garbage collector")
Module.h This file contains the declarations for the Module class.
unsigned const TargetRegisterInfo * TRI
static bool isEmptyXXStructor(GlobalVariable *GV)
static bool usedInOneFunc(const User *U, Function const *&oneFunc)
static void VisitGlobalVariableForEmission(const GlobalVariable *GV, SmallVectorImpl< const GlobalVariable * > &Order, DenseSet< const GlobalVariable * > &Visited, DenseSet< const GlobalVariable * > &Visiting)
VisitGlobalVariableForEmission - Add GV to the list of GlobalVariable instances to be emitted,...
LLVM_EXTERNAL_VISIBILITY void LLVMInitializeNVPTXAsmPrinter()
static bool usedInGlobalVarDef(const Constant *C)
static bool useFuncSeen(const Constant *C, DenseMap< const Function *, bool > &seenMap)
static cl::opt< bool > LowerCtorDtor("nvptx-lower-global-ctor-dtor", cl::desc("Lower GPU ctor / dtors to globals on the device."), cl::init(false), cl::Hidden)
static bool ShouldPassAsArray(Type *Ty)
static void DiscoverDependentGlobals(const Value *V, DenseSet< const GlobalVariable * > &Globals)
DiscoverDependentGlobals - Return a set of GlobalVariables on which V depends.
static bool canDemoteGlobalVar(const GlobalVariable *gv, Function const *&f)
static GCMetadataPrinterRegistry::Add< OcamlGCMetadataPrinter > Y("ocaml", "ocaml 3.10-compatible collector")
assert(ImpDefSCC.getReg()==AMDGPU::SCC &&ImpDefSCC.isDef())
This file defines the SmallString class.
This file defines the SmallVector class.
opStatus convert(const fltSemantics &ToSemantics, roundingMode RM, bool *losesInfo)
APInt bitcastToAPInt() const
Class for arbitrary precision integers.
APInt getLoBits(unsigned numBits) const
Compute an APInt containing numBits lowbits from this APInt.
uint64_t getZExtValue() const
Get zero extended value.
void lshrInPlace(unsigned ShiftAmt)
Logical right-shift this APInt by ShiftAmt in place.
This class represents an incoming formal argument to a Function.
MCSymbol * getSymbol(const GlobalValue *GV) const
void EmitToStreamer(MCStreamer &S, const MCInst &Inst)
TargetMachine & TM
Target machine description.
virtual void PrintSymbolOperand(const MachineOperand &MO, raw_ostream &OS)
Print the MachineOperand as a symbol.
const MCAsmInfo * MAI
Target Asm Printer information.
MachineFunction * MF
The current machine function.
bool hasDebugInfo() const
Returns true if valid debug info is present.
bool doInitialization(Module &M) override
Set up the AsmPrinter when we are working on a new module.
unsigned getFunctionNumber() const
Return a unique ID for the current function.
MCSymbol * CurrentFnSym
The symbol for the current function.
MCContext & OutContext
This is the context for the output file that we are streaming.
bool doFinalization(Module &M) override
Shut down the asmprinter.
MCSymbol * GetExternalSymbolSymbol(Twine Sym) const
Return the MCSymbol for the specified ExternalSymbol.
virtual void emitBasicBlockStart(const MachineBasicBlock &MBB)
Targets can override this to emit stuff at the start of a basic block.
bool runOnMachineFunction(MachineFunction &MF) override
Emit the specified function out to the OutStreamer.
std::unique_ptr< MCStreamer > OutStreamer
This is the MCStreamer object for the file we are generating.
const DataLayout & getDataLayout() const
Return information about data layout.
void emitInitialRawDwarfLocDirective(const MachineFunction &MF)
Emits inital debug location directive.
const MCSubtargetInfo & getSubtargetInfo() const
Return information about subtarget.
virtual bool PrintAsmOperand(const MachineInstr *MI, unsigned OpNo, const char *ExtraCode, raw_ostream &OS)
Print the specified operand of MI, an INLINEASM instruction, using the specified assembler variant.
LLVM Basic Block Representation.
const Function * getParent() const
Return the enclosing method, or null if none.
ConstantArray - Constant Array Declarations.
ConstantDataSequential - A vector or array constant whose element type is a simple 1/2/4/8-byte integ...
A constant value that is initialized with an expression using other constant values.
ConstantFP - Floating Point Values [float, double].
const APFloat & getValueAPF() const
This is the shared class of boolean and integer constants.
uint64_t getZExtValue() const
Return the constant as a 64-bit unsigned integer value after it has been zero extended as appropriate...
const APInt & getValue() const
Return the constant as an APInt value reference.
This is an important base class in LLVM.
bool isNullValue() const
Return true if this is the value that would be returned by getNullValue.
This class represents an Operation in the Expression.
A parsed version of the target data layout string in and methods for querying it.
iterator find(const_arg_type_t< KeyT > Val)
bool contains(const_arg_type_t< KeyT > Val) const
Return true if the specified key is in the map, false otherwise.
std::pair< iterator, bool > insert(const std::pair< KeyT, ValueT > &KV)
Implements a dense probed hash-table based set.
DISubprogram * getSubprogram() const
Get the attached subprogram.
const GlobalObject * getAliaseeObject() const
StringRef getSection() const
Get the custom section of this global if it has one.
MaybeAlign getAlign() const
Returns the alignment of the given variable or function.
bool hasSection() const
Check if this global has a custom object file section.
bool hasLinkOnceLinkage() const
bool hasExternalLinkage() const
bool isDeclaration() const
Return true if the primary definition of this global value is outside of the current translation unit...
bool hasLocalLinkage() const
bool hasPrivateLinkage() const
unsigned getAddressSpace() const
Module * getParent()
Get the module that this global value is contained inside of...
PointerType * getType() const
Global values are always pointers.
bool hasWeakLinkage() const
bool hasCommonLinkage() const
bool hasAvailableExternallyLinkage() const
Type * getValueType() const
const Constant * getInitializer() const
getInitializer - Return the initializer for this global variable.
bool hasInitializer() const
Definitions have initializers, declarations don't.
bool isLoopHeader(const BlockT *BB) const
LoopT * getLoopFor(const BlockT *BB) const
Return the inner most loop that BB lives in.
unsigned getCodePointerSize() const
Get the code pointer size in bytes.
Binary assembler expressions.
const MCExpr * getLHS() const
Get the left-hand side expression of the binary operator.
const MCExpr * getRHS() const
Get the right-hand side expression of the binary operator.
static const MCBinaryExpr * createAnd(const MCExpr *LHS, const MCExpr *RHS, MCContext &Ctx)
static const MCBinaryExpr * createAdd(const MCExpr *LHS, const MCExpr *RHS, MCContext &Ctx)
Opcode getOpcode() const
Get the kind of this binary expression.
static const MCConstantExpr * create(int64_t Value, MCContext &Ctx, bool PrintInHex=false, unsigned SizeInBytes=0)
Context object for machine code objects.
MCSymbol * getOrCreateSymbol(const Twine &Name)
Lookup the symbol inside with the specified Name.
Base class for the full range of assembler expressions which are needed for parsing.
@ Unary
Unary expressions.
@ Constant
Constant expressions.
@ SymbolRef
References to labels and assigned expressions.
@ Target
Target specific expression.
@ Binary
Binary expressions.
Instances of this class represent a single low-level machine instruction.
void addOperand(const MCOperand Op)
void setOpcode(unsigned Op)
Describe properties that are true of each instruction in the target description file.
Instances of this class represent operands of the MCInst class.
static MCOperand createExpr(const MCExpr *Val)
static MCOperand createReg(MCRegister Reg)
static MCOperand createImm(int64_t Val)
Represent a reference to a symbol from inside an expression.
const MCSymbol & getSymbol() const
static const MCSymbolRefExpr * create(const MCSymbol *Symbol, MCContext &Ctx)
MCSymbol - Instances of this class represent a symbol name in the MC file, and MCSymbols are created ...
void print(raw_ostream &OS, const MCAsmInfo *MAI) const
print - Print the value to the stream OS.
Unary assembler expressions.
Opcode getOpcode() const
Get the kind of this unary expression.
const MCExpr * getSubExpr() const
Get the child of this unary expression.
MCSymbol * getSymbol() const
Return the MCSymbol for this basic block.
iterator_range< pred_iterator > predecessors()
The MachineFrameInfo class represents an abstract stack frame until prolog/epilog code is inserted.
uint64_t getStackSize() const
Return the number of bytes that must be allocated to hold all of the fixed size frame objects.
Align getMaxAlign() const
Return the alignment in bytes that this function must be aligned to, which is greater than the defaul...
const TargetSubtargetInfo & getSubtarget() const
getSubtarget - Return the subtarget for which this machine code is being compiled.
MachineFrameInfo & getFrameInfo()
getFrameInfo - Return the frame info object for the current function.
MachineRegisterInfo & getRegInfo()
getRegInfo - Return information about the registers currently in use.
Function & getFunction()
Return the LLVM function that this machine code represents.
Ty * getInfo()
getInfo - Keep track of various per-function pieces of information for backends that would like to do...
const TargetMachine & getTarget() const
getTarget - Return the target machine this machine code is compiled with
Representation of each machine instruction.
MachineOperand class - Representation of each machine instruction operand.
const GlobalValue * getGlobal() const
MachineBasicBlock * getMBB() const
bool isImm() const
isImm - Tests if this is a MO_Immediate operand.
MachineOperandType getType() const
getType - Returns the MachineOperandType for this operand.
const char * getSymbolName() const
Register getReg() const
getReg - Returns the register number.
const ConstantFP * getFPImm() const
@ MO_Immediate
Immediate operand.
@ MO_GlobalAddress
Address of a global value.
@ MO_MachineBasicBlock
MachineBasicBlock reference.
@ MO_Register
Register operand.
@ MO_ExternalSymbol
Name of external global symbol.
@ MO_FPImmediate
Floating-point immediate operand.
const TargetRegisterClass * getRegClass(Register Reg) const
Return the register class of the specified virtual register.
unsigned getNumVirtRegs() const
getNumVirtRegs - Return the number of virtual registers created.
A Module instance is used to store all the information related to an LLVM module.
bool doInitialization(Module &M) override
Set up the AsmPrinter when we are working on a new module.
bool runOnMachineFunction(MachineFunction &F) override
Emit the specified function out to the OutStreamer.
std::string getVirtualRegisterName(unsigned) const
bool doFinalization(Module &M) override
Shut down the asmprinter.
const MCSymbol * getFunctionFrameSymbol() const override
Return symbol for the function pseudo stack if the stack frame is not a register based.
static const NVPTXFloatMCExpr * createConstantBFPHalf(const APFloat &Flt, MCContext &Ctx)
static const NVPTXFloatMCExpr * createConstantFPHalf(const APFloat &Flt, MCContext &Ctx)
static const NVPTXFloatMCExpr * createConstantFPSingle(const APFloat &Flt, MCContext &Ctx)
static const NVPTXFloatMCExpr * createConstantFPDouble(const APFloat &Flt, MCContext &Ctx)
static const NVPTXGenericMCSymbolRefExpr * create(const MCSymbolRefExpr *SymExpr, MCContext &Ctx)
static const char * getRegisterName(MCRegister Reg)
bool checkImageHandleSymbol(StringRef Symbol) const
Check if the symbol has a mapping.
StringRef getImageHandleSymbol(unsigned Idx) const
Returns the symbol name at the given index.
void clearDebugRegisterMap() const
const char * getName(unsigned RegNo) const
std::string getTargetName() const
unsigned getMaxRequiredAlignment() const
bool hasMaskOperator() const
const NVPTXTargetLowering * getTargetLowering() const override
unsigned getPTXVersion() const
const NVPTXRegisterInfo * getRegisterInfo() const override
unsigned int getSmVersion() const
NVPTX::DrvInterface getDrvInterface() const
const NVPTXSubtarget * getSubtargetImpl(const Function &) const override
Virtual method implemented by subclasses that returns a reference to that target's TargetSubtargetInf...
UniqueStringSaver & getStrPool() const
Implments NVPTX-specific streamer.
void closeLastSection()
Close last section.
unsigned getAddressSpace() const
Return the address space of the Pointer type.
Wrapper class representing virtual and physical registers.
static Register index2VirtReg(unsigned Index)
Convert a 0-based index to a virtual register number.
constexpr bool isVirtual() const
Return true if the specified register number is in the virtual register namespace.
static constexpr bool isVirtualRegister(unsigned Reg)
Return true if the specified register number is in the virtual register namespace.
constexpr bool isPhysical() const
Return true if the specified register number is in the physical register namespace.
SmallString - A SmallString is just a SmallVector with methods and accessors that make it work better...
This class consists of common code factored out of the SmallVector class to reduce code duplication b...
void push_back(const T &Elt)
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small.
StringRef - Represent a constant reference to a string, i.e.
bool starts_with(StringRef Prefix) const
Check if this string starts with the given Prefix.
constexpr const char * data() const
data - Get a pointer to the start of the string (which may not be null terminated).
Class to represent struct types.
Primary interface to the complete machine description for the target machine.
const STC & getSubtarget(const Function &F) const
This method returns a pointer to the specified type of TargetSubtargetInfo.
unsigned getPointerSizeInBits(unsigned AS) const
TargetRegisterInfo base class - We assume that the target defines a static array of TargetRegisterDes...
virtual const TargetRegisterInfo * getRegisterInfo() const
getRegisterInfo - If register information is available, return it.
Twine - A lightweight data structure for efficiently representing the concatenation of temporary valu...
The instances of the Type class are immutable: once they are created, they are never changed.
bool isVectorTy() const
True if this is an instance of VectorType.
bool isPointerTy() const
True if this is an instance of PointerType.
bool isBFloatTy() const
Return true if this is 'bfloat', a 16-bit bfloat type.
unsigned getPointerAddressSpace() const
Get the address space of this pointer or pointer vector type.
@ HalfTyID
16-bit floating point type
@ VoidTyID
type with no size
@ FloatTyID
32-bit floating point type
@ IntegerTyID
Arbitrary bit width integers.
@ FixedVectorTyID
Fixed width SIMD vector type.
@ BFloatTyID
16-bit floating point type (7-bit significand)
@ DoubleTyID
64-bit floating point type
unsigned getScalarSizeInBits() const LLVM_READONLY
If this is a vector type, return the getPrimitiveSizeInBits value for the element type.
bool isAggregateType() const
Return true if the type is an aggregate type.
bool isHalfTy() const
Return true if this is 'half', a 16-bit IEEE fp type.
bool isFloatingPointTy() const
Return true if this is one of the floating-point types.
bool isIntOrPtrTy() const
Return true if this is an integer type or a pointer type.
bool isIntegerTy() const
True if this is an instance of IntegerType.
TypeID getTypeID() const
Return the type id for the type.
TypeSize getPrimitiveSizeInBits() const LLVM_READONLY
Return the basic size of this type if it is a primitive type.
StringRef save(const char *S)
Value * getOperand(unsigned i) const
unsigned getNumOperands() const
LLVM Value Representation.
Type * getType() const
All values are typed, get the type of this value.
StringRef getName() const
Return a constant reference to the value's name.
std::pair< iterator, bool > insert(const ValueT &V)
bool erase(const ValueT &V)
size_type count(const_arg_type_t< ValueT > V) const
Return 1 if the specified key is in the set, 0 otherwise.
This class implements an extremely fast bulk output stream that can only output to a stream.
A raw_ostream that writes to an std::string.
A raw_ostream that writes to an SmallVector or SmallString.
#define llvm_unreachable(msg)
Marks that the current location is not supposed to be reachable.
@ C
The default llvm calling convention, compatible with C.
LegalityPredicate isVector(unsigned TypeIdx)
True iff the specified type index is a vector.
@ CE
Windows NT (Windows on ARM)
Reg
All possible values of the reg field in the ModR/M byte.
initializer< Ty > init(const Ty &Val)
uint64_t read64le(const void *P)
uint32_t read32le(const void *P)
This is an optimization pass for GlobalISel generic memory operations.
bool isManaged(const Value &V)
bool shouldEmitPTXNoReturn(const Value *V, const TargetMachine &TM)
auto size(R &&Range, std::enable_if_t< std::is_base_of< std::random_access_iterator_tag, typename std::iterator_traits< decltype(Range.begin())>::iterator_category >::value, void > *=nullptr)
Get the size of a range.
std::optional< unsigned > getMaxNReg(const Function &F)
std::optional< unsigned > getMaxNTIDy(const Function &F)
StringRef getSamplerName(const Value &V)
bool isImageReadWrite(const Value &V)
std::string getNVPTXRegClassName(TargetRegisterClass const *RC)
std::optional< unsigned > getMaxNTIDz(const Function &F)
MaybeAlign getAlign(const Function &F, unsigned Index)
std::optional< unsigned > getMaxNTIDx(const Function &F)
std::optional< unsigned > getMinCTASm(const Function &F)
Constant * ConstantFoldConstant(const Constant *C, const DataLayout &DL, const TargetLibraryInfo *TLI=nullptr)
ConstantFoldConstant - Fold the constant using the specified DataLayout.
bool isImage(const Value &V)
bool isSampler(const Value &V)
unsigned promoteScalarArgumentSize(unsigned size)
void clearAnnotationCache(const Module *Mod)
void report_fatal_error(Error Err, bool gen_crash_diag=true)
Report a serious error, calling any installed error handler.
std::optional< unsigned > getReqNTIDy(const Function &F)
bool isSurface(const Value &V)
FormattedNumber format_hex_no_prefix(uint64_t N, unsigned Width, bool Upper=false)
format_hex_no_prefix - Output N as a fixed width hexadecimal.
std::optional< unsigned > getMaxClusterRank(const Function &F)
StringRef getTextureName(const Value &V)
std::optional< unsigned > getClusterDimx(const Function &F)
void write_hex(raw_ostream &S, uint64_t N, HexPrintStyle Style, std::optional< size_t > Width=std::nullopt)
void ComputeValueVTs(const TargetLowering &TLI, const DataLayout &DL, Type *Ty, SmallVectorImpl< EVT > &ValueVTs, SmallVectorImpl< EVT > *MemVTs, SmallVectorImpl< TypeSize > *Offsets=nullptr, TypeSize StartingOffset=TypeSize::getZero())
ComputeValueVTs - Given an LLVM IR type, compute a sequence of EVTs that represent all the individual...
std::string getNVPTXRegClassStr(TargetRegisterClass const *RC)
StringRef getSurfaceName(const Value &V)
std::optional< unsigned > getClusterDimy(const Function &F)
Target & getTheNVPTXTarget64()
bool isKernelFunction(const Function &F)
bool isTexture(const Value &V)
bool isImageWriteOnly(const Value &V)
std::optional< unsigned > getReqNTIDz(const Function &F)
std::optional< unsigned > getReqNTIDx(const Function &F)
Constant * ConstantFoldIntegerCast(Constant *C, Type *DestTy, bool IsSigned, const DataLayout &DL)
Constant fold a zext, sext or trunc, depending on IsSigned and whether the DestTy is wider or narrowe...
std::optional< unsigned > getClusterDimz(const Function &F)
MDNode * GetUnrollMetadata(MDNode *LoopID, StringRef Name)
Given an llvm.loop loop id metadata node, returns the loop hint metadata node with the given name (fo...
Target & getTheNVPTXTarget32()
static const fltSemantics & IEEEsingle() LLVM_READNONE
static constexpr roundingMode rmNearestTiesToEven
static const fltSemantics & IEEEdouble() LLVM_READNONE
This struct is a compact representation of a valid (non-zero power of two) alignment.
uint64_t value() const
This is a hole in the type system and should not be abused.
TypeSize getSizeInBits() const
Return the size of the specified value type in bits.
bool isInteger() const
Return true if this is an integer or a vector integer type.
This struct is a compact representation of a valid (power of two) or undefined (0) alignment.
Align valueOrOne() const
For convenience, returns a valid alignment or 1 if undefined.
RegisterAsmPrinter - Helper template for registering a target specific assembly printer,...