98 cl::desc(
"Lower GPU ctor / dtors to globals on the device."),
101#define DEPOTNAME "__local_depot"
111 if (
const User *U = dyn_cast<User>(V)) {
112 for (
unsigned i = 0, e = U->getNumOperands(); i != e; ++i) {
128 if (Visited.
count(GV))
132 if (!Visiting.
insert(GV).second)
150 NVPTX_MC::verifyInstructionPredicates(
MI->getOpcode(),
154 lowerToMCInst(
MI, Inst);
159bool NVPTXAsmPrinter::lowerImageHandleOperand(
const MachineInstr *
MI,
167 if (OpNo == 4 && MO.
isImm()) {
168 lowerImageHandleSymbol(MO.
getImm(), MCOp);
172 lowerImageHandleSymbol(MO.
getImm(), MCOp);
182 if (OpNo == VecSize && MO.
isImm()) {
183 lowerImageHandleSymbol(MO.
getImm(), MCOp);
190 if (OpNo == 0 && MO.
isImm()) {
191 lowerImageHandleSymbol(MO.
getImm(), MCOp);
198 if (OpNo == 1 && MO.
isImm()) {
199 lowerImageHandleSymbol(MO.
getImm(), MCOp);
209void NVPTXAsmPrinter::lowerImageHandleSymbol(
unsigned Index,
MCOperand &MCOp) {
222 if (
MI->getOpcode() == NVPTX::CALL_PROTOTYPE) {
230 for (
unsigned i = 0, e =
MI->getNumOperands(); i !=
e; ++i) {
235 if (lowerImageHandleOperand(
MI, i, MCOp)) {
241 if (lowerOperand(MO, MCOp))
295unsigned NVPTXAsmPrinter::encodeVirtualRegister(
unsigned Reg) {
300 unsigned RegNum = RegMap[
Reg];
305 if (RC == &NVPTX::Int1RegsRegClass) {
307 }
else if (RC == &NVPTX::Int16RegsRegClass) {
309 }
else if (RC == &NVPTX::Int32RegsRegClass) {
311 }
else if (RC == &NVPTX::Int64RegsRegClass) {
313 }
else if (RC == &NVPTX::Float32RegsRegClass) {
315 }
else if (RC == &NVPTX::Float64RegsRegClass) {
322 Ret |= (RegNum & 0x0FFFFFFF);
327 return Reg & 0x0FFFFFFF;
348 Type *Ty =
F->getReturnType();
360 if (
auto *ITy = dyn_cast<IntegerType>(Ty)) {
361 size = ITy->getBitWidth();
367 O <<
".param .b" <<
size <<
" func_retval0";
368 }
else if (isa<PointerType>(Ty)) {
369 O <<
".param .b" << TLI->getPointerTy(
DL).getSizeInBits()
372 unsigned totalsz =
DL.getTypeAllocSize(Ty);
373 unsigned retAlignment = 0;
375 retAlignment = TLI->getFunctionParamOptimizedAlign(F, Ty,
DL).value();
376 O <<
".param .align " << retAlignment <<
" .b8 func_retval0[" << totalsz
384 for (
unsigned i = 0, e = vtparts.
size(); i != e; ++i) {
386 EVT elemtype = vtparts[i];
388 elems = vtparts[i].getVectorNumElements();
389 elemtype = vtparts[i].getVectorElementType();
392 for (
unsigned j = 0, je = elems;
j != je; ++
j) {
396 O <<
".reg .b" << sz <<
" func_retval" << idx;
411 printReturnValStr(&F, O);
416bool NVPTXAsmPrinter::isLoopHeaderOfNoUnroll(
431 if (
const BasicBlock *PBB = PMBB->getBasicBlock()) {
433 PBB->getTerminator()->getMetadata(LLVMContext::MD_loop)) {
436 if (
MDNode *UnrollCountMD =
438 if (mdconst::extract<ConstantInt>(UnrollCountMD->getOperand(1))
450 if (isLoopHeaderOfNoUnroll(
MBB))
454void NVPTXAsmPrinter::emitFunctionEntryLabel() {
458 if (!GlobalsEmitted) {
460 GlobalsEmitted =
true;
466 emitLinkageDirective(F, O);
471 printReturnValStr(*
MF, O);
476 emitFunctionParamList(F, O);
480 emitKernelFunctionDirectives(*F, O);
490 setAndEmitFunctionVirtualRegisters(*
MF);
507void NVPTXAsmPrinter::emitFunctionBodyStart() {
514void NVPTXAsmPrinter::emitFunctionBodyEnd() {
524void NVPTXAsmPrinter::emitImplicitDef(
const MachineInstr *
MI)
const {
537void NVPTXAsmPrinter::emitKernelFunctionDirectives(
const Function &
F,
542 unsigned Reqntidx, Reqntidy, Reqntidz;
543 Reqntidx = Reqntidy = Reqntidz = 1;
544 bool ReqSpecified =
false;
550 O <<
".reqntid " << Reqntidx <<
", " << Reqntidy <<
", " << Reqntidz
556 unsigned Maxntidx, Maxntidy, Maxntidz;
557 Maxntidx = Maxntidy = Maxntidz = 1;
558 bool MaxSpecified =
false;
564 O <<
".maxntid " << Maxntidx <<
", " << Maxntidy <<
", " << Maxntidz
569 O <<
".minnctapersm " << Mincta <<
"\n";
571 unsigned Maxnreg = 0;
573 O <<
".maxnreg " << Maxnreg <<
"\n";
579 unsigned Maxclusterrank = 0;
581 O <<
".maxclusterrank " << Maxclusterrank <<
"\n";
591 assert(
I != VRegMapping.
end() &&
"Bad register class");
595 assert(VI != RegMap.
end() &&
"Bad virtual register");
596 unsigned MappedVR = VI->second;
604void NVPTXAsmPrinter::emitVirtualRegister(
unsigned int vr,
609void NVPTXAsmPrinter::emitAliasDeclaration(
const GlobalAlias *GA,
614 "NVPTX aliasee must be a non-kernel function definition");
620 emitDeclarationWithName(F,
getSymbol(GA), O);
624 emitDeclarationWithName(F,
getSymbol(F), O);
629 emitLinkageDirective(F, O);
634 printReturnValStr(F, O);
637 emitFunctionParamList(F, O);
649 return GV->getName() !=
"llvm.used";
652 for (
const User *U :
C->users())
653 if (
const Constant *
C = dyn_cast<Constant>(U))
661 if (
const GlobalVariable *othergv = dyn_cast<GlobalVariable>(U)) {
662 if (othergv->getName() ==
"llvm.used")
667 if (
instr->getParent() &&
instr->getParent()->getParent()) {
669 if (oneFunc && (curFunc != oneFunc))
677 for (
const User *UU : U->users())
711 for (
const User *U :
C->users()) {
712 if (
const Constant *cu = dyn_cast<Constant>(U)) {
715 }
else if (
const Instruction *
I = dyn_cast<Instruction>(U)) {
732 if (
F.getAttributes().hasFnAttr(
"nvptx-libcall-callee")) {
733 emitDeclaration(&F, O);
737 if (
F.isDeclaration()) {
740 if (
F.getIntrinsicID())
742 emitDeclaration(&F, O);
745 for (
const User *U :
F.users()) {
746 if (
const Constant *
C = dyn_cast<Constant>(U)) {
751 emitDeclaration(&F, O);
757 emitDeclaration(&F, O);
762 if (!isa<Instruction>(U))
776 emitDeclaration(&F, O);
783 emitAliasDeclaration(&GA, O);
787 if (!GV)
return true;
789 if (!InitList)
return true;
793void NVPTXAsmPrinter::emitStartOfAsmFile(
Module &M) {
803 emitHeader(M, OS1, *STI);
815 bool IsOpenMP = M.getModuleFlag(
"openmp") !=
nullptr;
820 "Module has a nontrivial global ctor, which NVPTX does not support.");
826 "Module has a nontrivial global dtor, which NVPTX does not support.");
833 GlobalsEmitted =
false;
838void NVPTXAsmPrinter::emitGlobals(
const Module &M) {
842 emitDeclarations(M, OS2);
857 assert(GVVisited.
size() == M.global_size() &&
"Missed a global variable");
858 assert(GVVisiting.
size() == 0 &&
"Did not fully process a global variable");
865 for (
unsigned i = 0, e = Globals.
size(); i != e; ++i)
866 printModuleLevelGV(Globals[i], OS2,
false, STI);
888 O <<
"// Generated by LLVM NVPTX Back-End\n";
893 O <<
".version " << (PTXVersion / 10) <<
"." << (PTXVersion % 10) <<
"\n";
900 O <<
", texmode_independent";
902 bool HasFullDebugInfo =
false;
904 switch(
CU->getEmissionKind()) {
910 HasFullDebugInfo =
true;
913 if (HasFullDebugInfo)
921 O <<
".address_size ";
936 if (!GlobalsEmitted) {
938 GlobalsEmitted =
true;
952 OutStreamer->emitRawText(
"\t.section\t.debug_loc\t{\t}");
956 TS->outputDwarfFileDirectives();
974void NVPTXAsmPrinter::emitLinkageDirective(
const GlobalValue *V,
977 if (V->hasExternalLinkage()) {
978 if (isa<GlobalVariable>(V)) {
986 }
else if (
V->isDeclaration())
990 }
else if (
V->hasAppendingLinkage()) {
992 msg.append(
"Error: ");
993 msg.append(
"Symbol ");
995 msg.append(std::string(
V->getName()));
996 msg.append(
"has unsupported appending linkage type");
998 }
else if (!
V->hasInternalLinkage() &&
999 !
V->hasPrivateLinkage()) {
1005void NVPTXAsmPrinter::printModuleLevelGV(
const GlobalVariable *GVar,
1050 emitPTXGlobalVariable(GVar, O, STI);
1058 const Constant *Initializer =
nullptr;
1063 CI = dyn_cast<ConstantInt>(Initializer);
1072 O <<
"addr_mode_" << i <<
" = ";
1078 O <<
"clamp_to_border";
1081 O <<
"clamp_to_edge";
1092 O <<
"filter_mode = ";
1107 O <<
", force_unnormalized_coords = 1";
1117 if (strncmp(GVar->
getName().
data(),
"unrollpragma", 12) == 0)
1121 if (strncmp(GVar->
getName().
data(),
"filename", 8) == 0)
1127 const Function *demotedFunc =
nullptr;
1129 O <<
"// " << GVar->
getName() <<
" has been demoted\n";
1130 if (localDecls.find(demotedFunc) != localDecls.end())
1131 localDecls[demotedFunc].push_back(GVar);
1133 std::vector<const GlobalVariable *> temp;
1134 temp.push_back(GVar);
1135 localDecls[demotedFunc] = temp;
1141 emitPTXAddressSpace(PTy->getAddressSpace(), O);
1146 ".attribute(.managed) requires PTX version >= 4.0 and sm_30");
1148 O <<
" .attribute(.managed)";
1152 O <<
" .align " <<
A->value();
1154 O <<
" .align " << (int)
DL.getPrefTypeAlign(ETy).value();
1163 O << getPTXFundamentalTypeStr(ETy,
false);
1174 if (!Initializer->
isNullValue() && !isa<UndefValue>(Initializer)) {
1176 printScalarConstant(Initializer, O);
1185 "' is not allowed in addrspace(" +
1186 Twine(PTy->getAddressSpace()) +
")");
1202 ElementSize =
DL.getTypeStoreSize(ETy);
1209 if (!isa<UndefValue>(Initializer) && !Initializer->
isNullValue()) {
1210 AggBuffer aggBuffer(ElementSize, *
this);
1211 bufferAggregateConstant(Initializer, &aggBuffer);
1212 if (aggBuffer.numSymbols()) {
1214 if (ElementSize % ptrSize ||
1215 !aggBuffer.allSymbolsAligned(ptrSize)) {
1219 "initialized packed aggregate with pointers '" +
1221 "' requires at least PTX ISA version 7.1");
1224 O <<
"[" << ElementSize <<
"] = {";
1225 aggBuffer.printBytes(O);
1228 O <<
" .u" << ptrSize * 8 <<
" ";
1230 O <<
"[" << ElementSize / ptrSize <<
"] = {";
1231 aggBuffer.printWords(O);
1237 O <<
"[" << ElementSize <<
"] = {";
1238 aggBuffer.printBytes(O);
1267void NVPTXAsmPrinter::AggBuffer::printSymbol(
unsigned nSym,
raw_ostream &os) {
1268 const Value *
v = Symbols[nSym];
1269 const Value *v0 = SymbolsBeforeStripping[nSym];
1270 if (
const GlobalValue *GVar = dyn_cast<GlobalValue>(v)) {
1274 bool isGenericPointer = PTy && PTy->getAddressSpace() == 0;
1275 if (EmitGeneric && isGenericPointer && !isa<Function>(v)) {
1277 Name->print(os, AP.MAI);
1280 Name->print(os, AP.MAI);
1282 }
else if (
const ConstantExpr *CExpr = dyn_cast<ConstantExpr>(v0)) {
1283 const MCExpr *Expr = AP.lowerConstantForGV(cast<Constant>(CExpr),
false);
1284 AP.printMCExpr(*Expr, os);
1289void NVPTXAsmPrinter::AggBuffer::printBytes(
raw_ostream &os) {
1290 unsigned int ptrSize = AP.MAI->getCodePointerSize();
1295 unsigned int InitializerCount =
size;
1298 if (numSymbols() == 0)
1299 while (InitializerCount >= 1 && !buffer[InitializerCount - 1])
1302 symbolPosInBuffer.push_back(InitializerCount);
1303 unsigned int nSym = 0;
1304 unsigned int nextSymbolPos = symbolPosInBuffer[nSym];
1305 for (
unsigned int pos = 0; pos < InitializerCount;) {
1308 if (pos != nextSymbolPos) {
1309 os << (
unsigned int)buffer[pos];
1316 std::string symText;
1318 printSymbol(nSym, oss);
1319 for (
unsigned i = 0; i < ptrSize; ++i) {
1323 os <<
"(" << symText <<
")";
1326 nextSymbolPos = symbolPosInBuffer[++nSym];
1327 assert(nextSymbolPos >= pos);
1331void NVPTXAsmPrinter::AggBuffer::printWords(
raw_ostream &os) {
1332 unsigned int ptrSize = AP.MAI->getCodePointerSize();
1333 symbolPosInBuffer.push_back(size);
1334 unsigned int nSym = 0;
1335 unsigned int nextSymbolPos = symbolPosInBuffer[nSym];
1336 assert(nextSymbolPos % ptrSize == 0);
1337 for (
unsigned int pos = 0; pos <
size; pos += ptrSize) {
1340 if (pos == nextSymbolPos) {
1341 printSymbol(nSym, os);
1342 nextSymbolPos = symbolPosInBuffer[++nSym];
1343 assert(nextSymbolPos % ptrSize == 0);
1344 assert(nextSymbolPos >= pos + ptrSize);
1345 }
else if (ptrSize == 4)
1353 if (localDecls.find(f) == localDecls.end())
1356 std::vector<const GlobalVariable *> &gvars = localDecls[
f];
1363 O <<
"\t// demoted variable\n\t";
1364 printModuleLevelGV(GV, O,
true, STI);
1368void NVPTXAsmPrinter::emitPTXAddressSpace(
unsigned int AddressSpace,
1391NVPTXAsmPrinter::getPTXFundamentalTypeStr(
Type *Ty,
bool useB4PTR)
const {
1394 unsigned NumBits = cast<IntegerType>(Ty)->getBitWidth();
1397 else if (NumBits <= 64) {
1398 std::string
name =
"u";
1399 return name + utostr(NumBits);
1417 assert((PtrSize == 64 || PtrSize == 32) &&
"Unexpected pointer size");
1435void NVPTXAsmPrinter::emitPTXGlobalVariable(
const GlobalVariable *GVar,
1448 ".attribute(.managed) requires PTX version >= 4.0 and sm_30");
1450 O <<
" .attribute(.managed)";
1453 O <<
" .align " <<
A->value();
1455 O <<
" .align " << (int)
DL.getPrefTypeAlign(ETy).value();
1467 O << getPTXFundamentalTypeStr(ETy);
1473 int64_t ElementSize = 0;
1483 ElementSize =
DL.getTypeStoreSize(ETy);
1504 unsigned paramIndex = 0;
1510 if (
F->arg_empty() && !
F->isVarArg()) {
1517 for (
I =
F->arg_begin(),
E =
F->arg_end();
I !=
E; ++
I, paramIndex++) {
1518 Type *Ty =
I->getType();
1530 if (hasImageHandles)
1531 O <<
"\t.param .u64 .ptr .surfref ";
1533 O <<
"\t.param .surfref ";
1534 O << TLI->getParamName(F, paramIndex);
1537 if (hasImageHandles)
1538 O <<
"\t.param .u64 .ptr .texref ";
1540 O <<
"\t.param .texref ";
1541 O << TLI->getParamName(F, paramIndex);
1544 if (hasImageHandles)
1545 O <<
"\t.param .u64 .ptr .samplerref ";
1547 O <<
"\t.param .samplerref ";
1548 O << TLI->getParamName(F, paramIndex);
1554 auto getOptimalAlignForParam = [TLI, &
DL, &PAL,
F,
1556 Align TypeAlign = TLI->getFunctionParamOptimizedAlign(F, Ty,
DL);
1557 MaybeAlign ParamAlign = PAL.getParamAlignment(paramIndex);
1558 return std::max(TypeAlign, ParamAlign.
valueOrOne());
1561 if (!PAL.hasParamAttr(paramIndex, Attribute::ByVal)) {
1567 Align OptimalAlign = getOptimalAlignForParam(Ty);
1569 O <<
"\t.param .align " << OptimalAlign.
value() <<
" .b8 ";
1570 O << TLI->getParamName(F, paramIndex);
1571 O <<
"[" <<
DL.getTypeAllocSize(Ty) <<
"]";
1576 auto *PTy = dyn_cast<PointerType>(Ty);
1577 unsigned PTySizeInBits = 0;
1580 TLI->getPointerTy(
DL, PTy->getAddressSpace()).getSizeInBits();
1581 assert(PTySizeInBits &&
"Invalid pointer size");
1587 O <<
"\t.param .u" << PTySizeInBits <<
" ";
1591 int addrSpace = PTy->getAddressSpace();
1592 switch (addrSpace) {
1597 O <<
".ptr .const ";
1600 O <<
".ptr .shared ";
1603 O <<
".ptr .global ";
1606 Align ParamAlign =
I->getParamAlign().valueOrOne();
1607 O <<
".align " << ParamAlign.
value() <<
" ";
1609 O << TLI->getParamName(F, paramIndex);
1619 O << getPTXFundamentalTypeStr(Ty);
1621 O << TLI->getParamName(F, paramIndex);
1627 if (isa<IntegerType>(Ty)) {
1628 sz = cast<IntegerType>(Ty)->getBitWidth();
1631 assert(PTySizeInBits &&
"Invalid pointer size");
1636 O <<
"\t.param .b" << sz <<
" ";
1638 O <<
"\t.reg .b" << sz <<
" ";
1639 O << TLI->getParamName(F, paramIndex);
1644 Type *ETy = PAL.getParamByValType(paramIndex);
1645 assert(ETy &&
"Param should have byval type");
1647 if (isABI || isKernelFunc) {
1652 Align OptimalAlign =
1654 ? getOptimalAlignForParam(ETy)
1655 : TLI->getFunctionByValParamAlign(
1656 F, ETy, PAL.getParamAlignment(paramIndex).valueOrOne(),
DL);
1658 unsigned sz =
DL.getTypeAllocSize(ETy);
1659 O <<
"\t.param .align " << OptimalAlign.
value() <<
" .b8 ";
1660 O << TLI->getParamName(F, paramIndex);
1661 O <<
"[" << sz <<
"]";
1670 for (
unsigned i = 0, e = vtparts.
size(); i != e; ++i) {
1672 EVT elemtype = vtparts[i];
1674 elems = vtparts[i].getVectorNumElements();
1675 elemtype = vtparts[i].getVectorElementType();
1678 for (
unsigned j = 0, je = elems;
j != je; ++
j) {
1682 O <<
"\t.reg .b" << sz <<
" ";
1683 O << TLI->getParamName(F, paramIndex);
1696 if (
F->isVarArg()) {
1701 O << TLI->getParamName(F, -1) <<
"[]";
1707void NVPTXAsmPrinter::setAndEmitFunctionVirtualRegisters(
1724 O <<
"\t.reg .b64 \t%SP;\n";
1725 O <<
"\t.reg .b64 \t%SPL;\n";
1727 O <<
"\t.reg .b32 \t%SP;\n";
1728 O <<
"\t.reg .b32 \t%SPL;\n";
1737 for (
unsigned i = 0; i < numVRs; i++) {
1741 int n = regmap.
size();
1742 regmap.
insert(std::make_pair(vr, n + 1));
1757 for (
unsigned i=0; i<
TRI->getNumRegClasses(); i++) {
1762 int n = regmap.
size();
1766 O <<
"\t.reg " << rcname <<
" \t" << rcStr <<
"<" << (n+1)
1777 unsigned int numHex;
1796 if (
const ConstantInt *CI = dyn_cast<ConstantInt>(CPV)) {
1800 if (
const ConstantFP *CFP = dyn_cast<ConstantFP>(CPV)) {
1801 printFPConstant(CFP, O);
1804 if (isa<ConstantPointerNull>(CPV)) {
1808 if (
const GlobalValue *GVar = dyn_cast<GlobalValue>(CPV)) {
1809 bool IsNonGenericPointer =
false;
1811 IsNonGenericPointer =
true;
1813 if (EmitGeneric && !isa<Function>(CPV) && !IsNonGenericPointer) {
1822 if (
const ConstantExpr *Cexpr = dyn_cast<ConstantExpr>(CPV)) {
1823 const MCExpr *
E = lowerConstantForGV(cast<Constant>(Cexpr),
false);
1830void NVPTXAsmPrinter::bufferLEByte(
const Constant *CPV,
int Bytes,
1831 AggBuffer *AggBuffer) {
1833 int AllocSize =
DL.getTypeAllocSize(CPV->
getType());
1837 AggBuffer->addZeros(Bytes ? Bytes : AllocSize);
1842 auto AddIntToBuffer = [AggBuffer, Bytes](
const APInt &Val) {
1843 size_t NumBytes = (Val.getBitWidth() + 7) / 8;
1845 for (
unsigned I = 0;
I < NumBytes; ++
I) {
1846 Buf[
I] = Val.extractBitsAsZExtValue(8,
I * 8);
1848 AggBuffer->addBytes(Buf.data(), NumBytes, Bytes);
1853 if (
const auto CI = dyn_cast<ConstantInt>(CPV)) {
1857 if (
const auto *Cexpr = dyn_cast<ConstantExpr>(CPV)) {
1858 if (
const auto *CI =
1863 if (Cexpr->getOpcode() == Instruction::PtrToInt) {
1864 Value *
V = Cexpr->getOperand(0)->stripPointerCasts();
1865 AggBuffer->addSymbol(V, Cexpr->getOperand(0));
1866 AggBuffer->addZeros(AllocSize);
1877 AddIntToBuffer(cast<ConstantFP>(CPV)->getValueAPF().bitcastToAPInt());
1881 if (
const GlobalValue *GVar = dyn_cast<GlobalValue>(CPV)) {
1882 AggBuffer->addSymbol(GVar, GVar);
1883 }
else if (
const ConstantExpr *Cexpr = dyn_cast<ConstantExpr>(CPV)) {
1884 const Value *
v = Cexpr->stripPointerCasts();
1885 AggBuffer->addSymbol(v, Cexpr);
1887 AggBuffer->addZeros(AllocSize);
1894 if (isa<ConstantAggregate>(CPV) || isa<ConstantDataSequential>(CPV)) {
1895 bufferAggregateConstant(CPV, AggBuffer);
1896 if (Bytes > AllocSize)
1897 AggBuffer->addZeros(Bytes - AllocSize);
1898 }
else if (isa<ConstantAggregateZero>(CPV))
1899 AggBuffer->addZeros(Bytes);
1910void NVPTXAsmPrinter::bufferAggregateConstant(
const Constant *CPV,
1911 AggBuffer *aggBuffer) {
1916 if (
const ConstantInt *CI = dyn_cast<ConstantInt>(CPV)) {
1918 for (
unsigned I = 0,
E =
DL.getTypeAllocSize(CPV->
getType());
I <
E; ++
I) {
1920 aggBuffer->addBytes(&Byte, 1, 1);
1927 if (isa<ConstantArray>(CPV) || isa<ConstantVector>(CPV)) {
1930 bufferLEByte(cast<Constant>(CPV->
getOperand(i)), 0, aggBuffer);
1935 dyn_cast<ConstantDataSequential>(CPV)) {
1936 if (CDS->getNumElements())
1937 for (
unsigned i = 0; i < CDS->getNumElements(); ++i)
1938 bufferLEByte(cast<Constant>(CDS->getElementAsConstant(i)), 0,
1943 if (isa<ConstantStruct>(CPV)) {
1948 Bytes =
DL.getStructLayout(ST)->getElementOffset(0) +
1949 DL.getTypeAllocSize(ST) -
1950 DL.getStructLayout(ST)->getElementOffset(i);
1952 Bytes =
DL.getStructLayout(ST)->getElementOffset(i + 1) -
1953 DL.getStructLayout(ST)->getElementOffset(i);
1954 bufferLEByte(cast<Constant>(CPV->
getOperand(i)), Bytes, aggBuffer);
1967NVPTXAsmPrinter::lowerConstantForGV(
const Constant *CV,
bool ProcessingGeneric) {
1973 if (
const ConstantInt *CI = dyn_cast<ConstantInt>(CV))
1976 if (
const GlobalValue *GV = dyn_cast<GlobalValue>(CV)) {
1979 if (ProcessingGeneric) {
1991 switch (
CE->getOpcode()) {
1995 case Instruction::AddrSpaceCast: {
1998 if (DstTy->getAddressSpace() == 0)
1999 return lowerConstantForGV(cast<const Constant>(
CE->getOperand(0)),
true);
2004 case Instruction::GetElementPtr: {
2008 APInt OffsetAI(
DL.getPointerTypeSizeInBits(
CE->getType()), 0);
2009 cast<GEPOperator>(CE)->accumulateConstantOffset(
DL, OffsetAI);
2011 const MCExpr *
Base = lowerConstantForGV(
CE->getOperand(0),
2016 int64_t
Offset = OffsetAI.getSExtValue();
2021 case Instruction::Trunc:
2027 case Instruction::BitCast:
2028 return lowerConstantForGV(
CE->getOperand(0), ProcessingGeneric);
2030 case Instruction::IntToPtr: {
2039 return lowerConstantForGV(
Op, ProcessingGeneric);
2044 case Instruction::PtrToInt: {
2050 Type *Ty =
CE->getType();
2052 const MCExpr *OpExpr = lowerConstantForGV(
Op, ProcessingGeneric);
2056 if (
DL.getTypeAllocSize(Ty) ==
DL.getTypeAllocSize(
Op->getType()))
2062 unsigned InBits =
DL.getTypeAllocSizeInBits(
Op->getType());
2069 case Instruction::Add: {
2070 const MCExpr *
LHS = lowerConstantForGV(
CE->getOperand(0), ProcessingGeneric);
2071 const MCExpr *
RHS = lowerConstantForGV(
CE->getOperand(1), ProcessingGeneric);
2072 switch (
CE->getOpcode()) {
2084 return lowerConstantForGV(
C, ProcessingGeneric);
2089 OS <<
"Unsupported expression in static initializer: ";
2090 CE->printAsOperand(
OS,
false,
2099 return cast<MCTargetExpr>(&Expr)->printImpl(
OS,
MAI);
2101 OS << cast<MCConstantExpr>(Expr).getValue();
2127 if (isa<MCConstantExpr>(BE.
getLHS()) || isa<MCSymbolRefExpr>(BE.
getLHS()) ||
2128 isa<NVPTXGenericMCSymbolRefExpr>(BE.
getLHS())) {
2140 if (RHSC->getValue() < 0) {
2141 OS << RHSC->getValue();
2152 if (isa<MCConstantExpr>(BE.
getRHS()) || isa<MCSymbolRefExpr>(BE.
getRHS())) {
2168bool NVPTXAsmPrinter::PrintAsmOperand(
const MachineInstr *
MI,
unsigned OpNo,
2170 if (ExtraCode && ExtraCode[0]) {
2171 if (ExtraCode[1] != 0)
2174 switch (ExtraCode[0]) {
2183 printOperand(
MI, OpNo, O);
2188bool NVPTXAsmPrinter::PrintAsmMemoryOperand(
const MachineInstr *
MI,
2190 const char *ExtraCode,
2192 if (ExtraCode && ExtraCode[0])
2196 printMemOperand(
MI, OpNo, O);
2202void NVPTXAsmPrinter::printOperand(
const MachineInstr *
MI,
unsigned OpNum,
2208 if (MO.
getReg() == NVPTX::VRDepot)
2213 emitVirtualRegister(MO.
getReg(), O);
2238void NVPTXAsmPrinter::printMemOperand(
const MachineInstr *
MI,
unsigned OpNum,
2240 printOperand(
MI, OpNum, O);
2242 if (Modifier && strcmp(Modifier,
"add") == 0) {
2244 printOperand(
MI, OpNum + 1, O);
2246 if (
MI->getOperand(OpNum + 1).isImm() &&
2247 MI->getOperand(OpNum + 1).getImm() == 0)
2250 printOperand(
MI, OpNum + 1, O);
MachineBasicBlock MachineBasicBlock::iterator DebugLoc DL
static cl::opt< bool > LowerCtorDtor("amdgpu-lower-global-ctor-dtor", cl::desc("Lower GPU ctor / dtors to globals on the device."), cl::init(true), cl::Hidden)
This file declares a class to represent arbitrary precision floating point values and provide a varie...
This file implements a class to represent arbitrary precision integral constant values and operations...
This file contains the simple types necessary to represent the attributes associated with functions a...
static GCRegistry::Add< ErlangGC > A("erlang", "erlang-compatible garbage collector")
static GCRegistry::Add< CoreCLRGC > E("coreclr", "CoreCLR-compatible GC")
#define LLVM_EXTERNAL_VISIBILITY
This file contains the declarations for the subclasses of Constant, which represent the different fla...
Looks at all the uses of the given value Returns the Liveness deduced from the uses of this value Adds all uses that cause the result to be MaybeLive to MaybeLiveRetUses If the result is MaybeLiveUses might be modified but its content should be ignored(since it might not be complete). DeadArgumentEliminationPass
This file defines the DenseMap class.
This file defines the DenseSet and SmallDenseSet classes.
static GCMetadataPrinterRegistry::Add< ErlangGCPrinter > X("erlang", "erlang-compatible garbage collector")
unsigned const TargetRegisterInfo * TRI
Module.h This file contains the declarations for the Module class.
static bool isEmptyXXStructor(GlobalVariable *GV)
static bool usedInOneFunc(const User *U, Function const *&oneFunc)
static void VisitGlobalVariableForEmission(const GlobalVariable *GV, SmallVectorImpl< const GlobalVariable * > &Order, DenseSet< const GlobalVariable * > &Visited, DenseSet< const GlobalVariable * > &Visiting)
VisitGlobalVariableForEmission - Add GV to the list of GlobalVariable instances to be emitted,...
LLVM_EXTERNAL_VISIBILITY void LLVMInitializeNVPTXAsmPrinter()
static bool usedInGlobalVarDef(const Constant *C)
static bool useFuncSeen(const Constant *C, DenseMap< const Function *, bool > &seenMap)
static cl::opt< bool > LowerCtorDtor("nvptx-lower-global-ctor-dtor", cl::desc("Lower GPU ctor / dtors to globals on the device."), cl::init(false), cl::Hidden)
static bool ShouldPassAsArray(Type *Ty)
static void DiscoverDependentGlobals(const Value *V, DenseSet< const GlobalVariable * > &Globals)
DiscoverDependentGlobals - Return a set of GlobalVariables on which V depends.
static bool canDemoteGlobalVar(const GlobalVariable *gv, Function const *&f)
static GCMetadataPrinterRegistry::Add< OcamlGCMetadataPrinter > Y("ocaml", "ocaml 3.10-compatible collector")
assert(ImpDefSCC.getReg()==AMDGPU::SCC &&ImpDefSCC.isDef())
This file defines the SmallString class.
This file defines the SmallVector class.
opStatus convert(const fltSemantics &ToSemantics, roundingMode RM, bool *losesInfo)
APInt bitcastToAPInt() const
Class for arbitrary precision integers.
APInt getLoBits(unsigned numBits) const
Compute an APInt containing numBits lowbits from this APInt.
uint64_t getZExtValue() const
Get zero extended value.
void lshrInPlace(unsigned ShiftAmt)
Logical right-shift this APInt by ShiftAmt in place.
This class represents an incoming formal argument to a Function.
MCSymbol * getSymbol(const GlobalValue *GV) const
void EmitToStreamer(MCStreamer &S, const MCInst &Inst)
TargetMachine & TM
Target machine description.
virtual void PrintSymbolOperand(const MachineOperand &MO, raw_ostream &OS)
Print the MachineOperand as a symbol.
const MCAsmInfo * MAI
Target Asm Printer information.
MachineFunction * MF
The current machine function.
bool doInitialization(Module &M) override
Set up the AsmPrinter when we are working on a new module.
unsigned getFunctionNumber() const
Return a unique ID for the current function.
MCSymbol * CurrentFnSym
The symbol for the current function.
MachineModuleInfo * MMI
This is a pointer to the current MachineModuleInfo.
MCContext & OutContext
This is the context for the output file that we are streaming.
bool doFinalization(Module &M) override
Shut down the asmprinter.
MCSymbol * GetExternalSymbolSymbol(Twine Sym) const
Return the MCSymbol for the specified ExternalSymbol.
virtual void emitBasicBlockStart(const MachineBasicBlock &MBB)
Targets can override this to emit stuff at the start of a basic block.
bool runOnMachineFunction(MachineFunction &MF) override
Emit the specified function out to the OutStreamer.
std::unique_ptr< MCStreamer > OutStreamer
This is the MCStreamer object for the file we are generating.
const DataLayout & getDataLayout() const
Return information about data layout.
void emitInitialRawDwarfLocDirective(const MachineFunction &MF)
Emits inital debug location directive.
const MCSubtargetInfo & getSubtargetInfo() const
Return information about subtarget.
virtual bool PrintAsmOperand(const MachineInstr *MI, unsigned OpNo, const char *ExtraCode, raw_ostream &OS)
Print the specified operand of MI, an INLINEASM instruction, using the specified assembler variant.
LLVM Basic Block Representation.
const Function * getParent() const
Return the enclosing method, or null if none.
ConstantArray - Constant Array Declarations.
ConstantDataSequential - A vector or array constant whose element type is a simple 1/2/4/8-byte integ...
A constant value that is initialized with an expression using other constant values.
ConstantFP - Floating Point Values [float, double].
const APFloat & getValueAPF() const
This is the shared class of boolean and integer constants.
uint64_t getZExtValue() const
Return the constant as a 64-bit unsigned integer value after it has been zero extended as appropriate...
const APInt & getValue() const
Return the constant as an APInt value reference.
This is an important base class in LLVM.
bool isNullValue() const
Return true if this is the value that would be returned by getNullValue.
This class represents an Operation in the Expression.
A parsed version of the target data layout string in and methods for querying it.
iterator find(const_arg_type_t< KeyT > Val)
bool contains(const_arg_type_t< KeyT > Val) const
Return true if the specified key is in the map, false otherwise.
std::pair< iterator, bool > insert(const std::pair< KeyT, ValueT > &KV)
Implements a dense probed hash-table based set.
const GlobalObject * getAliaseeObject() const
StringRef getSection() const
Get the custom section of this global if it has one.
MaybeAlign getAlign() const
Returns the alignment of the given variable or function.
bool hasSection() const
Check if this global has a custom object file section.
bool hasLinkOnceLinkage() const
bool hasExternalLinkage() const
bool isDeclaration() const
Return true if the primary definition of this global value is outside of the current translation unit...
bool hasLocalLinkage() const
bool hasPrivateLinkage() const
Module * getParent()
Get the module that this global value is contained inside of...
PointerType * getType() const
Global values are always pointers.
bool hasWeakLinkage() const
bool hasCommonLinkage() const
bool hasAvailableExternallyLinkage() const
Type * getValueType() const
const Constant * getInitializer() const
getInitializer - Return the initializer for this global variable.
bool hasInitializer() const
Definitions have initializers, declarations don't.
This class describes a target machine that is implemented with the LLVM target-independent code gener...
unsigned getCodePointerSize() const
Get the code pointer size in bytes.
Binary assembler expressions.
const MCExpr * getLHS() const
Get the left-hand side expression of the binary operator.
const MCExpr * getRHS() const
Get the right-hand side expression of the binary operator.
static const MCBinaryExpr * createAnd(const MCExpr *LHS, const MCExpr *RHS, MCContext &Ctx)
static const MCBinaryExpr * createAdd(const MCExpr *LHS, const MCExpr *RHS, MCContext &Ctx)
Opcode getOpcode() const
Get the kind of this binary expression.
static const MCConstantExpr * create(int64_t Value, MCContext &Ctx, bool PrintInHex=false, unsigned SizeInBytes=0)
Context object for machine code objects.
MCSymbol * getOrCreateSymbol(const Twine &Name)
Lookup the symbol inside with the specified Name.
Base class for the full range of assembler expressions which are needed for parsing.
@ Unary
Unary expressions.
@ Constant
Constant expressions.
@ SymbolRef
References to labels and assigned expressions.
@ Target
Target specific expression.
@ Binary
Binary expressions.
Instances of this class represent a single low-level machine instruction.
void addOperand(const MCOperand Op)
void setOpcode(unsigned Op)
Describe properties that are true of each instruction in the target description file.
Instances of this class represent operands of the MCInst class.
static MCOperand createReg(unsigned Reg)
static MCOperand createExpr(const MCExpr *Val)
static MCOperand createImm(int64_t Val)
Represent a reference to a symbol from inside an expression.
const MCSymbol & getSymbol() const
static const MCSymbolRefExpr * create(const MCSymbol *Symbol, MCContext &Ctx)
MCSymbol - Instances of this class represent a symbol name in the MC file, and MCSymbols are created ...
void print(raw_ostream &OS, const MCAsmInfo *MAI) const
print - Print the value to the stream OS.
Unary assembler expressions.
Opcode getOpcode() const
Get the kind of this unary expression.
const MCExpr * getSubExpr() const
Get the child of this unary expression.
MCSymbol * getSymbol() const
Return the MCSymbol for this basic block.
iterator_range< pred_iterator > predecessors()
The MachineFrameInfo class represents an abstract stack frame until prolog/epilog code is inserted.
uint64_t getStackSize() const
Return the number of bytes that must be allocated to hold all of the fixed size frame objects.
Align getMaxAlign() const
Return the alignment in bytes that this function must be aligned to, which is greater than the defaul...
const TargetSubtargetInfo & getSubtarget() const
getSubtarget - Return the subtarget for which this machine code is being compiled.
MachineFrameInfo & getFrameInfo()
getFrameInfo - Return the frame info object for the current function.
MachineRegisterInfo & getRegInfo()
getRegInfo - Return information about the registers currently in use.
Function & getFunction()
Return the LLVM function that this machine code represents.
const LLVMTargetMachine & getTarget() const
getTarget - Return the target machine this machine code is compiled with
Ty * getInfo()
getInfo - Keep track of various per-function pieces of information for backends that would like to do...
Representation of each machine instruction.
bool isLoopHeader(const MachineBasicBlock *BB) const
True if the block is a loop header node.
MachineLoop * getLoopFor(const MachineBasicBlock *BB) const
Return the innermost loop that BB lives in.
bool hasDebugInfo() const
Returns true if valid debug info is present.
MachineOperand class - Representation of each machine instruction operand.
const GlobalValue * getGlobal() const
MachineBasicBlock * getMBB() const
bool isImm() const
isImm - Tests if this is a MO_Immediate operand.
MachineOperandType getType() const
getType - Returns the MachineOperandType for this operand.
const char * getSymbolName() const
Register getReg() const
getReg - Returns the register number.
const ConstantFP * getFPImm() const
@ MO_Immediate
Immediate operand.
@ MO_GlobalAddress
Address of a global value.
@ MO_MachineBasicBlock
MachineBasicBlock reference.
@ MO_Register
Register operand.
@ MO_ExternalSymbol
Name of external global symbol.
@ MO_FPImmediate
Floating-point immediate operand.
const TargetRegisterClass * getRegClass(Register Reg) const
Return the register class of the specified virtual register.
unsigned getNumVirtRegs() const
getNumVirtRegs - Return the number of virtual registers created.
A Module instance is used to store all the information related to an LLVM module.
bool doInitialization(Module &M) override
Set up the AsmPrinter when we are working on a new module.
bool runOnMachineFunction(MachineFunction &F) override
Emit the specified function out to the OutStreamer.
std::string getVirtualRegisterName(unsigned) const
bool doFinalization(Module &M) override
Shut down the asmprinter.
const MCSymbol * getFunctionFrameSymbol() const override
Return symbol for the function pseudo stack if the stack frame is not a register based.
static const NVPTXFloatMCExpr * createConstantBFPHalf(const APFloat &Flt, MCContext &Ctx)
static const NVPTXFloatMCExpr * createConstantFPHalf(const APFloat &Flt, MCContext &Ctx)
static const NVPTXFloatMCExpr * createConstantFPSingle(const APFloat &Flt, MCContext &Ctx)
static const NVPTXFloatMCExpr * createConstantFPDouble(const APFloat &Flt, MCContext &Ctx)
static const NVPTXGenericMCSymbolRefExpr * create(const MCSymbolRefExpr *SymExpr, MCContext &Ctx)
static const char * getRegisterName(MCRegister Reg)
const char * getImageHandleSymbol(unsigned Idx) const
Returns the symbol name at the given index.
const char * getName(unsigned RegNo) const
std::string getTargetName() const
bool hasImageHandles() const
unsigned getMaxRequiredAlignment() const
bool hasMaskOperator() const
const NVPTXTargetLowering * getTargetLowering() const override
unsigned getPTXVersion() const
const NVPTXRegisterInfo * getRegisterInfo() const override
unsigned int getSmVersion() const
NVPTX::DrvInterface getDrvInterface() const
const NVPTXSubtarget * getSubtargetImpl(const Function &) const override
Virtual method implemented by subclasses that returns a reference to that target's TargetSubtargetInf...
UniqueStringSaver & getStrPool() const
Implments NVPTX-specific streamer.
void closeLastSection()
Close last section.
unsigned getAddressSpace() const
Return the address space of the Pointer type.
Wrapper class representing virtual and physical registers.
static Register index2VirtReg(unsigned Index)
Convert a 0-based index to a virtual register number.
constexpr bool isVirtual() const
Return true if the specified register number is in the virtual register namespace.
static constexpr bool isVirtualRegister(unsigned Reg)
Return true if the specified register number is in the virtual register namespace.
constexpr bool isPhysical() const
Return true if the specified register number is in the physical register namespace.
SmallString - A SmallString is just a SmallVector with methods and accessors that make it work better...
This class consists of common code factored out of the SmallVector class to reduce code duplication b...
void push_back(const T &Elt)
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small.
StringRef - Represent a constant reference to a string, i.e.
bool starts_with(StringRef Prefix) const
Check if this string starts with the given Prefix.
constexpr const char * data() const
data - Get a pointer to the start of the string (which may not be null terminated).
Class to represent struct types.
const STC & getSubtarget(const Function &F) const
This method returns a pointer to the specified type of TargetSubtargetInfo.
unsigned getPointerSizeInBits(unsigned AS) const
TargetRegisterInfo base class - We assume that the target defines a static array of TargetRegisterDes...
virtual const TargetRegisterInfo * getRegisterInfo() const
getRegisterInfo - If register information is available, return it.
Twine - A lightweight data structure for efficiently representing the concatenation of temporary valu...
The instances of the Type class are immutable: once they are created, they are never changed.
bool isVectorTy() const
True if this is an instance of VectorType.
bool isPointerTy() const
True if this is an instance of PointerType.
bool isBFloatTy() const
Return true if this is 'bfloat', a 16-bit bfloat type.
unsigned getPointerAddressSpace() const
Get the address space of this pointer or pointer vector type.
@ HalfTyID
16-bit floating point type
@ VoidTyID
type with no size
@ FloatTyID
32-bit floating point type
@ IntegerTyID
Arbitrary bit width integers.
@ FixedVectorTyID
Fixed width SIMD vector type.
@ BFloatTyID
16-bit floating point type (7-bit significand)
@ DoubleTyID
64-bit floating point type
unsigned getScalarSizeInBits() const LLVM_READONLY
If this is a vector type, return the getPrimitiveSizeInBits value for the element type.
bool isAggregateType() const
Return true if the type is an aggregate type.
bool isHalfTy() const
Return true if this is 'half', a 16-bit IEEE fp type.
bool isFloatingPointTy() const
Return true if this is one of the floating-point types.
bool isIntOrPtrTy() const
Return true if this is an integer type or a pointer type.
bool isIntegerTy() const
True if this is an instance of IntegerType.
TypeID getTypeID() const
Return the type id for the type.
TypeSize getPrimitiveSizeInBits() const LLVM_READONLY
Return the basic size of this type if it is a primitive type.
StringRef save(const char *S)
Value * getOperand(unsigned i) const
unsigned getNumOperands() const
LLVM Value Representation.
Type * getType() const
All values are typed, get the type of this value.
StringRef getName() const
Return a constant reference to the value's name.
std::pair< iterator, bool > insert(const ValueT &V)
bool erase(const ValueT &V)
size_type count(const_arg_type_t< ValueT > V) const
Return 1 if the specified key is in the set, 0 otherwise.
This class implements an extremely fast bulk output stream that can only output to a stream.
A raw_ostream that writes to an std::string.
A raw_ostream that writes to an SmallVector or SmallString.
#define llvm_unreachable(msg)
Marks that the current location is not supposed to be reachable.
@ C
The default llvm calling convention, compatible with C.
LegalityPredicate isVector(unsigned TypeIdx)
True iff the specified type index is a vector.
@ CE
Windows NT (Windows on ARM)
Reg
All possible values of the reg field in the ModR/M byte.
initializer< Ty > init(const Ty &Val)
uint64_t read64le(const void *P)
uint32_t read32le(const void *P)
This is an optimization pass for GlobalISel generic memory operations.
bool shouldEmitPTXNoReturn(const Value *V, const TargetMachine &TM)
auto size(R &&Range, std::enable_if_t< std::is_base_of< std::random_access_iterator_tag, typename std::iterator_traits< decltype(Range.begin())>::iterator_category >::value, void > *=nullptr)
Get the size of a range.
std::string getSamplerName(const Value &val)
bool getAlign(const Function &F, unsigned index, unsigned &align)
bool getMinCTASm(const Function &F, unsigned &x)
std::string getNVPTXRegClassName(TargetRegisterClass const *RC)
bool isImage(const Value &val)
bool getMaxNTIDz(const Function &F, unsigned &z)
Constant * ConstantFoldConstant(const Constant *C, const DataLayout &DL, const TargetLibraryInfo *TLI=nullptr)
ConstantFoldConstant - Fold the constant using the specified DataLayout.
bool isManaged(const Value &val)
unsigned promoteScalarArgumentSize(unsigned size)
bool isSurface(const Value &val)
void clearAnnotationCache(const Module *Mod)
void report_fatal_error(Error Err, bool gen_crash_diag=true)
Report a serious error, calling any installed error handler.
std::string getSurfaceName(const Value &val)
bool getReqNTIDx(const Function &F, unsigned &x)
bool getReqNTIDy(const Function &F, unsigned &y)
FormattedNumber format_hex_no_prefix(uint64_t N, unsigned Width, bool Upper=false)
format_hex_no_prefix - Output N as a fixed width hexadecimal.
bool getMaxNReg(const Function &F, unsigned &x)
bool isTexture(const Value &val)
bool isImageWriteOnly(const Value &val)
bool isImageReadWrite(const Value &val)
void write_hex(raw_ostream &S, uint64_t N, HexPrintStyle Style, std::optional< size_t > Width=std::nullopt)
std::string getTextureName(const Value &val)
void ComputeValueVTs(const TargetLowering &TLI, const DataLayout &DL, Type *Ty, SmallVectorImpl< EVT > &ValueVTs, SmallVectorImpl< EVT > *MemVTs, SmallVectorImpl< TypeSize > *Offsets=nullptr, TypeSize StartingOffset=TypeSize::getZero())
ComputeValueVTs - Given an LLVM IR type, compute a sequence of EVTs that represent all the individual...
std::string getNVPTXRegClassStr(TargetRegisterClass const *RC)
Target & getTheNVPTXTarget64()
bool isKernelFunction(const Function &F)
bool getReqNTIDz(const Function &F, unsigned &z)
bool getMaxNTIDx(const Function &F, unsigned &x)
bool getMaxNTIDy(const Function &F, unsigned &y)
bool isSampler(const Value &val)
Constant * ConstantFoldIntegerCast(Constant *C, Type *DestTy, bool IsSigned, const DataLayout &DL)
Constant fold a zext, sext or trunc, depending on IsSigned and whether the DestTy is wider or narrowe...
bool getMaxClusterRank(const Function &F, unsigned &x)
MDNode * GetUnrollMetadata(MDNode *LoopID, StringRef Name)
Given an llvm.loop loop id metadata node, returns the loop hint metadata node with the given name (fo...
Target & getTheNVPTXTarget32()
static const fltSemantics & IEEEsingle() LLVM_READNONE
static constexpr roundingMode rmNearestTiesToEven
static const fltSemantics & IEEEdouble() LLVM_READNONE
This struct is a compact representation of a valid (non-zero power of two) alignment.
uint64_t value() const
This is a hole in the type system and should not be abused.
TypeSize getSizeInBits() const
Return the size of the specified value type in bits.
bool isInteger() const
Return true if this is an integer or a vector integer type.
This struct is a compact representation of a valid (power of two) or undefined (0) alignment.
Align valueOrOne() const
For convenience, returns a valid alignment or 1 if undefined.
RegisterAsmPrinter - Helper template for registering a target specific assembly printer,...