LLVM 23.0.0git
IRTranslator.cpp
Go to the documentation of this file.
1//===- llvm/CodeGen/GlobalISel/IRTranslator.cpp - IRTranslator ---*- C++ -*-==//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7//===----------------------------------------------------------------------===//
8/// \file
9/// This file implements the IRTranslator class.
10//===----------------------------------------------------------------------===//
11
14#include "llvm/ADT/STLExtras.h"
15#include "llvm/ADT/ScopeExit.h"
20#include "llvm/Analysis/Loads.h"
50#include "llvm/IR/BasicBlock.h"
51#include "llvm/IR/CFG.h"
52#include "llvm/IR/Constant.h"
53#include "llvm/IR/Constants.h"
54#include "llvm/IR/DataLayout.h"
57#include "llvm/IR/Function.h"
59#include "llvm/IR/InlineAsm.h"
60#include "llvm/IR/InstrTypes.h"
63#include "llvm/IR/Intrinsics.h"
64#include "llvm/IR/IntrinsicsAMDGPU.h"
65#include "llvm/IR/LLVMContext.h"
66#include "llvm/IR/Metadata.h"
68#include "llvm/IR/Statepoint.h"
69#include "llvm/IR/Type.h"
70#include "llvm/IR/User.h"
71#include "llvm/IR/Value.h"
73#include "llvm/MC/MCContext.h"
74#include "llvm/Pass.h"
77#include "llvm/Support/Debug.h"
84#include <algorithm>
85#include <cassert>
86#include <cstdint>
87#include <iterator>
88#include <optional>
89#include <string>
90#include <utility>
91#include <vector>
92
93#define DEBUG_TYPE "irtranslator"
94
95using namespace llvm;
96
97static cl::opt<bool>
98 EnableCSEInIRTranslator("enable-cse-in-irtranslator",
99 cl::desc("Should enable CSE in irtranslator"),
100 cl::Optional, cl::init(false));
101char IRTranslator::ID = 0;
102
103INITIALIZE_PASS_BEGIN(IRTranslator, DEBUG_TYPE, "IRTranslator LLVM IR -> MI",
104 false, false)
110INITIALIZE_PASS_END(IRTranslator, DEBUG_TYPE, "IRTranslator LLVM IR -> MI",
112
116 MF.getProperties().setFailedISel();
117 bool IsGlobalISelAbortEnabled =
118 MF.getTarget().Options.GlobalISelAbort == GlobalISelAbortMode::Enable;
119
120 // Print the function name explicitly if we don't have a debug location (which
121 // makes the diagnostic less useful) or if we're going to emit a raw error.
122 if (!R.getLocation().isValid() || IsGlobalISelAbortEnabled)
123 R << (" (in function: " + MF.getName() + ")").str();
124
125 if (IsGlobalISelAbortEnabled)
126 report_fatal_error(Twine(R.getMsg()));
127 else
128 ORE.emit(R);
129}
130
132 : MachineFunctionPass(ID), OptLevel(optlevel) {}
133
134#ifndef NDEBUG
135namespace {
136/// Verify that every instruction created has the same DILocation as the
137/// instruction being translated.
138class DILocationVerifier : public GISelChangeObserver {
139 const Instruction *CurrInst = nullptr;
140
141public:
142 DILocationVerifier() = default;
143 ~DILocationVerifier() override = default;
144
145 const Instruction *getCurrentInst() const { return CurrInst; }
146 void setCurrentInst(const Instruction *Inst) { CurrInst = Inst; }
147
148 void erasingInstr(MachineInstr &MI) override {}
149 void changingInstr(MachineInstr &MI) override {}
150 void changedInstr(MachineInstr &MI) override {}
151
152 void createdInstr(MachineInstr &MI) override {
153 assert(getCurrentInst() && "Inserted instruction without a current MI");
154
155 // Only print the check message if we're actually checking it.
156#ifndef NDEBUG
157 LLVM_DEBUG(dbgs() << "Checking DILocation from " << *CurrInst
158 << " was copied to " << MI);
159#endif
160 // We allow insts in the entry block to have no debug loc because
161 // they could have originated from constants, and we don't want a jumpy
162 // debug experience.
163 assert((CurrInst->getDebugLoc() == MI.getDebugLoc() ||
164 (MI.getParent()->isEntryBlock() && !MI.getDebugLoc()) ||
165 (MI.isDebugInstr())) &&
166 "Line info was not transferred to all instructions");
167 }
168};
169} // namespace
170#endif // ifndef NDEBUG
171
172
189
190IRTranslator::ValueToVRegInfo::VRegListT &
191IRTranslator::allocateVRegs(const Value &Val) {
192 auto VRegsIt = VMap.findVRegs(Val);
193 if (VRegsIt != VMap.vregs_end())
194 return *VRegsIt->second;
195 auto *Regs = VMap.getVRegs(Val);
196 auto *Offsets = VMap.getOffsets(Val);
197 SmallVector<LLT, 4> SplitTys;
198 computeValueLLTs(*DL, *Val.getType(), SplitTys,
199 Offsets->empty() ? Offsets : nullptr);
200 for (unsigned i = 0; i < SplitTys.size(); ++i)
201 Regs->push_back(0);
202 return *Regs;
203}
204
205ArrayRef<Register> IRTranslator::getOrCreateVRegs(const Value &Val) {
206 auto VRegsIt = VMap.findVRegs(Val);
207 if (VRegsIt != VMap.vregs_end())
208 return *VRegsIt->second;
209
210 if (Val.getType()->isVoidTy())
211 return *VMap.getVRegs(Val);
212
213 // Create entry for this type.
214 auto *VRegs = VMap.getVRegs(Val);
215 auto *Offsets = VMap.getOffsets(Val);
216
217 if (!Val.getType()->isTokenTy())
218 assert(Val.getType()->isSized() &&
219 "Don't know how to create an empty vreg");
220
221 // Fast-path values that lower to a single vreg.
222 if (!Val.getType()->isAggregateType()) {
223 LLT Ty = getLLTForType(*Val.getType(), *DL);
224 if (Offsets->empty())
225 Offsets->push_back(0);
226 VRegs->push_back(MRI->createGenericVirtualRegister(Ty));
227 if (isa<Constant>(Val)) {
228 bool Success = translate(cast<Constant>(Val), VRegs->front());
229 if (!Success) {
230 OptimizationRemarkMissed R("gisel-irtranslator", "GISelFailure",
232 &MF->getFunction().getEntryBlock());
233 R << "unable to translate constant: " << ore::NV("Type", Val.getType());
234 reportTranslationError(*MF, *ORE, R);
235 }
236 }
237 return *VRegs;
238 }
239
240 SmallVector<LLT, 4> SplitTys;
241 computeValueLLTs(*DL, *Val.getType(), SplitTys,
242 Offsets->empty() ? Offsets : nullptr);
243
244 if (!isa<Constant>(Val)) {
245 for (auto Ty : SplitTys)
246 VRegs->push_back(MRI->createGenericVirtualRegister(Ty));
247 return *VRegs;
248 }
249
250 // UndefValue, ConstantAggregateZero
251 auto &C = cast<Constant>(Val);
252 unsigned Idx = 0;
253 while (auto Elt = C.getAggregateElement(Idx++)) {
254 auto EltRegs = getOrCreateVRegs(*Elt);
255 llvm::append_range(*VRegs, EltRegs);
256 }
257
258 return *VRegs;
259}
260
261int IRTranslator::getOrCreateFrameIndex(const AllocaInst &AI) {
262 auto [MapEntry, Inserted] = FrameIndices.try_emplace(&AI);
263 if (!Inserted)
264 return MapEntry->second;
265
266 TypeSize TySize = AI.getAllocationSize(*DL).value_or(TypeSize::getZero());
267 uint64_t Size = TySize.getKnownMinValue();
268
269 // Always allocate at least one byte.
270 Size = std::max<uint64_t>(Size, 1u);
271
272 int &FI = MapEntry->second;
273 FI = MF->getFrameInfo().CreateStackObject(Size, AI.getAlign(), false, &AI);
274
275 // Scalable vectors and structures that contain scalable vectors may
276 // need a special StackID to distinguish them from other (fixed size)
277 // stack objects.
278 if (TySize.isScalable()) {
279 auto StackID =
280 MF->getSubtarget().getFrameLowering()->getStackIDForScalableVectors();
281 MF->getFrameInfo().setStackID(FI, StackID);
282 }
283
284 return FI;
285}
286
287Align IRTranslator::getMemOpAlign(const Instruction &I) {
288 if (const StoreInst *SI = dyn_cast<StoreInst>(&I))
289 return SI->getAlign();
290 if (const LoadInst *LI = dyn_cast<LoadInst>(&I))
291 return LI->getAlign();
292 if (const AtomicCmpXchgInst *AI = dyn_cast<AtomicCmpXchgInst>(&I))
293 return AI->getAlign();
294 if (const AtomicRMWInst *AI = dyn_cast<AtomicRMWInst>(&I))
295 return AI->getAlign();
296
297 OptimizationRemarkMissed R("gisel-irtranslator", "", &I);
298 R << "unable to translate memop: " << ore::NV("Opcode", &I);
299 reportTranslationError(*MF, *ORE, R);
300 return Align(1);
301}
302
303MachineBasicBlock &IRTranslator::getMBB(const BasicBlock &BB) {
304 MachineBasicBlock *MBB = FuncInfo.getMBB(&BB);
305 assert(MBB && "BasicBlock was not encountered before");
306 return *MBB;
307}
308
309void IRTranslator::addMachineCFGPred(CFGEdge Edge, MachineBasicBlock *NewPred) {
310 assert(NewPred && "new predecessor must be a real MachineBasicBlock");
311 MachinePreds[Edge].push_back(NewPred);
312}
313
314bool IRTranslator::translateBinaryOp(unsigned Opcode, const User &U,
315 MachineIRBuilder &MIRBuilder) {
316 if (!mayTranslateUserTypes(U))
317 return false;
318
319 // Get or create a virtual register for each value.
320 // Unless the value is a Constant => loadimm cst?
321 // or inline constant each time?
322 // Creation of a virtual register needs to have a size.
323 Register Op0 = getOrCreateVReg(*U.getOperand(0));
324 Register Op1 = getOrCreateVReg(*U.getOperand(1));
325 Register Res = getOrCreateVReg(U);
326 uint32_t Flags = 0;
327 if (isa<Instruction>(U)) {
328 const Instruction &I = cast<Instruction>(U);
330 }
331
332 MIRBuilder.buildInstr(Opcode, {Res}, {Op0, Op1}, Flags);
333 return true;
334}
335
336bool IRTranslator::translateUnaryOp(unsigned Opcode, const User &U,
337 MachineIRBuilder &MIRBuilder) {
338 if (!mayTranslateUserTypes(U))
339 return false;
340
341 Register Op0 = getOrCreateVReg(*U.getOperand(0));
342 Register Res = getOrCreateVReg(U);
343 uint32_t Flags = 0;
344 if (isa<Instruction>(U)) {
345 const Instruction &I = cast<Instruction>(U);
347 }
348 MIRBuilder.buildInstr(Opcode, {Res}, {Op0}, Flags);
349 return true;
350}
351
352bool IRTranslator::translateFNeg(const User &U, MachineIRBuilder &MIRBuilder) {
353 return translateUnaryOp(TargetOpcode::G_FNEG, U, MIRBuilder);
354}
355
356bool IRTranslator::translateCompare(const User &U,
357 MachineIRBuilder &MIRBuilder) {
358 if (!mayTranslateUserTypes(U))
359 return false;
360
361 auto *CI = cast<CmpInst>(&U);
362 Register Op0 = getOrCreateVReg(*U.getOperand(0));
363 Register Op1 = getOrCreateVReg(*U.getOperand(1));
364 Register Res = getOrCreateVReg(U);
365 CmpInst::Predicate Pred = CI->getPredicate();
367 if (CmpInst::isIntPredicate(Pred))
368 MIRBuilder.buildICmp(Pred, Res, Op0, Op1, Flags);
369 else if (Pred == CmpInst::FCMP_FALSE)
370 MIRBuilder.buildCopy(
371 Res, getOrCreateVReg(*Constant::getNullValue(U.getType())));
372 else if (Pred == CmpInst::FCMP_TRUE)
373 MIRBuilder.buildCopy(
374 Res, getOrCreateVReg(*Constant::getAllOnesValue(U.getType())));
375 else
376 MIRBuilder.buildFCmp(Pred, Res, Op0, Op1, Flags);
377
378 return true;
379}
380
381bool IRTranslator::translateRet(const User &U, MachineIRBuilder &MIRBuilder) {
382 const ReturnInst &RI = cast<ReturnInst>(U);
383 const Value *Ret = RI.getReturnValue();
384 if (Ret && DL->getTypeStoreSize(Ret->getType()).isZero())
385 Ret = nullptr;
386
387 ArrayRef<Register> VRegs;
388 if (Ret)
389 VRegs = getOrCreateVRegs(*Ret);
390
391 Register SwiftErrorVReg = 0;
392 if (CLI->supportSwiftError() && SwiftError.getFunctionArg()) {
393 SwiftErrorVReg = SwiftError.getOrCreateVRegUseAt(
394 &RI, &MIRBuilder.getMBB(), SwiftError.getFunctionArg());
395 }
396
397 // The target may mess up with the insertion point, but
398 // this is not important as a return is the last instruction
399 // of the block anyway.
400 return CLI->lowerReturn(MIRBuilder, Ret, VRegs, FuncInfo, SwiftErrorVReg);
401}
402
403void IRTranslator::emitBranchForMergedCondition(
405 MachineBasicBlock *CurBB, MachineBasicBlock *SwitchBB,
406 BranchProbability TProb, BranchProbability FProb, bool InvertCond) {
407 // If the leaf of the tree is a comparison, merge the condition into
408 // the caseblock.
409 if (const CmpInst *BOp = dyn_cast<CmpInst>(Cond)) {
410 CmpInst::Predicate Condition;
411 if (const ICmpInst *IC = dyn_cast<ICmpInst>(Cond)) {
412 Condition = InvertCond ? IC->getInversePredicate() : IC->getPredicate();
413 } else {
414 const FCmpInst *FC = cast<FCmpInst>(Cond);
415 Condition = InvertCond ? FC->getInversePredicate() : FC->getPredicate();
416 }
417
418 SwitchCG::CaseBlock CB(Condition, false, BOp->getOperand(0),
419 BOp->getOperand(1), nullptr, TBB, FBB, CurBB,
420 CurBuilder->getDebugLoc(), TProb, FProb);
421 SL->SwitchCases.push_back(CB);
422 return;
423 }
424
425 // Create a CaseBlock record representing this branch.
427 SwitchCG::CaseBlock CB(
428 Pred, false, Cond, ConstantInt::getTrue(MF->getFunction().getContext()),
429 nullptr, TBB, FBB, CurBB, CurBuilder->getDebugLoc(), TProb, FProb);
430 SL->SwitchCases.push_back(CB);
431}
432
433static bool isValInBlock(const Value *V, const BasicBlock *BB) {
434 if (const Instruction *I = dyn_cast<Instruction>(V))
435 return I->getParent() == BB;
436 return true;
437}
438
439void IRTranslator::findMergedConditions(
441 MachineBasicBlock *CurBB, MachineBasicBlock *SwitchBB,
443 BranchProbability FProb, bool InvertCond) {
444 using namespace PatternMatch;
445 assert((Opc == Instruction::And || Opc == Instruction::Or) &&
446 "Expected Opc to be AND/OR");
447 // Skip over not part of the tree and remember to invert op and operands at
448 // next level.
449 Value *NotCond;
450 if (match(Cond, m_OneUse(m_Not(m_Value(NotCond)))) &&
451 isValInBlock(NotCond, CurBB->getBasicBlock())) {
452 findMergedConditions(NotCond, TBB, FBB, CurBB, SwitchBB, Opc, TProb, FProb,
453 !InvertCond);
454 return;
455 }
456
458 const Value *BOpOp0, *BOpOp1;
459 // Compute the effective opcode for Cond, taking into account whether it needs
460 // to be inverted, e.g.
461 // and (not (or A, B)), C
462 // gets lowered as
463 // and (and (not A, not B), C)
465 if (BOp) {
466 BOpc = match(BOp, m_LogicalAnd(m_Value(BOpOp0), m_Value(BOpOp1)))
467 ? Instruction::And
468 : (match(BOp, m_LogicalOr(m_Value(BOpOp0), m_Value(BOpOp1)))
469 ? Instruction::Or
471 if (InvertCond) {
472 if (BOpc == Instruction::And)
473 BOpc = Instruction::Or;
474 else if (BOpc == Instruction::Or)
475 BOpc = Instruction::And;
476 }
477 }
478
479 // If this node is not part of the or/and tree, emit it as a branch.
480 // Note that all nodes in the tree should have same opcode.
481 bool BOpIsInOrAndTree = BOpc && BOpc == Opc && BOp->hasOneUse();
482 if (!BOpIsInOrAndTree || BOp->getParent() != CurBB->getBasicBlock() ||
483 !isValInBlock(BOpOp0, CurBB->getBasicBlock()) ||
484 !isValInBlock(BOpOp1, CurBB->getBasicBlock())) {
485 emitBranchForMergedCondition(Cond, TBB, FBB, CurBB, SwitchBB, TProb, FProb,
486 InvertCond);
487 return;
488 }
489
490 // Create TmpBB after CurBB.
491 MachineFunction::iterator BBI(CurBB);
492 MachineBasicBlock *TmpBB =
493 MF->CreateMachineBasicBlock(CurBB->getBasicBlock());
494 CurBB->getParent()->insert(++BBI, TmpBB);
495
496 if (Opc == Instruction::Or) {
497 // Codegen X | Y as:
498 // BB1:
499 // jmp_if_X TBB
500 // jmp TmpBB
501 // TmpBB:
502 // jmp_if_Y TBB
503 // jmp FBB
504 //
505
506 // We have flexibility in setting Prob for BB1 and Prob for TmpBB.
507 // The requirement is that
508 // TrueProb for BB1 + (FalseProb for BB1 * TrueProb for TmpBB)
509 // = TrueProb for original BB.
510 // Assuming the original probabilities are A and B, one choice is to set
511 // BB1's probabilities to A/2 and A/2+B, and set TmpBB's probabilities to
512 // A/(1+B) and 2B/(1+B). This choice assumes that
513 // TrueProb for BB1 == FalseProb for BB1 * TrueProb for TmpBB.
514 // Another choice is to assume TrueProb for BB1 equals to TrueProb for
515 // TmpBB, but the math is more complicated.
516
517 auto NewTrueProb = TProb / 2;
518 auto NewFalseProb = TProb / 2 + FProb;
519 // Emit the LHS condition.
520 findMergedConditions(BOpOp0, TBB, TmpBB, CurBB, SwitchBB, Opc, NewTrueProb,
521 NewFalseProb, InvertCond);
522
523 // Normalize A/2 and B to get A/(1+B) and 2B/(1+B).
524 SmallVector<BranchProbability, 2> Probs{TProb / 2, FProb};
526 // Emit the RHS condition into TmpBB.
527 findMergedConditions(BOpOp1, TBB, FBB, TmpBB, SwitchBB, Opc, Probs[0],
528 Probs[1], InvertCond);
529 } else {
530 assert(Opc == Instruction::And && "Unknown merge op!");
531 // Codegen X & Y as:
532 // BB1:
533 // jmp_if_X TmpBB
534 // jmp FBB
535 // TmpBB:
536 // jmp_if_Y TBB
537 // jmp FBB
538 //
539 // This requires creation of TmpBB after CurBB.
540
541 // We have flexibility in setting Prob for BB1 and Prob for TmpBB.
542 // The requirement is that
543 // FalseProb for BB1 + (TrueProb for BB1 * FalseProb for TmpBB)
544 // = FalseProb for original BB.
545 // Assuming the original probabilities are A and B, one choice is to set
546 // BB1's probabilities to A+B/2 and B/2, and set TmpBB's probabilities to
547 // 2A/(1+A) and B/(1+A). This choice assumes that FalseProb for BB1 ==
548 // TrueProb for BB1 * FalseProb for TmpBB.
549
550 auto NewTrueProb = TProb + FProb / 2;
551 auto NewFalseProb = FProb / 2;
552 // Emit the LHS condition.
553 findMergedConditions(BOpOp0, TmpBB, FBB, CurBB, SwitchBB, Opc, NewTrueProb,
554 NewFalseProb, InvertCond);
555
556 // Normalize A and B/2 to get 2A/(1+A) and B/(1+A).
557 SmallVector<BranchProbability, 2> Probs{TProb, FProb / 2};
559 // Emit the RHS condition into TmpBB.
560 findMergedConditions(BOpOp1, TBB, FBB, TmpBB, SwitchBB, Opc, Probs[0],
561 Probs[1], InvertCond);
562 }
563}
564
565bool IRTranslator::shouldEmitAsBranches(
566 const std::vector<SwitchCG::CaseBlock> &Cases) {
567 // For multiple cases, it's better to emit as branches.
568 if (Cases.size() != 2)
569 return true;
570
571 // If this is two comparisons of the same values or'd or and'd together, they
572 // will get folded into a single comparison, so don't emit two blocks.
573 if ((Cases[0].CmpLHS == Cases[1].CmpLHS &&
574 Cases[0].CmpRHS == Cases[1].CmpRHS) ||
575 (Cases[0].CmpRHS == Cases[1].CmpLHS &&
576 Cases[0].CmpLHS == Cases[1].CmpRHS)) {
577 return false;
578 }
579
580 // Handle: (X != null) | (Y != null) --> (X|Y) != 0
581 // Handle: (X == null) & (Y == null) --> (X|Y) == 0
582 if (Cases[0].CmpRHS == Cases[1].CmpRHS &&
583 Cases[0].PredInfo.Pred == Cases[1].PredInfo.Pred &&
584 isa<Constant>(Cases[0].CmpRHS) &&
585 cast<Constant>(Cases[0].CmpRHS)->isNullValue()) {
586 if (Cases[0].PredInfo.Pred == CmpInst::ICMP_EQ &&
587 Cases[0].TrueBB == Cases[1].ThisBB)
588 return false;
589 if (Cases[0].PredInfo.Pred == CmpInst::ICMP_NE &&
590 Cases[0].FalseBB == Cases[1].ThisBB)
591 return false;
592 }
593
594 return true;
595}
596
597bool IRTranslator::translateUncondBr(const User &U,
598 MachineIRBuilder &MIRBuilder) {
599 const UncondBrInst &BrInst = cast<UncondBrInst>(U);
600 auto &CurMBB = MIRBuilder.getMBB();
601 auto *Succ0MBB = &getMBB(*BrInst.getSuccessor(0));
602
603 // If the unconditional target is the layout successor, fallthrough.
604 if (OptLevel == CodeGenOptLevel::None || !CurMBB.isLayoutSuccessor(Succ0MBB))
605 MIRBuilder.buildBr(*Succ0MBB);
606
607 // Link successors.
608 for (const BasicBlock *Succ : successors(&BrInst))
609 CurMBB.addSuccessor(&getMBB(*Succ));
610 return true;
611}
612
613bool IRTranslator::translateCondBr(const User &U,
614 MachineIRBuilder &MIRBuilder) {
615 const CondBrInst &BrInst = cast<CondBrInst>(U);
616 auto &CurMBB = MIRBuilder.getMBB();
617 auto *Succ0MBB = &getMBB(*BrInst.getSuccessor(0));
618
619 // If this condition is one of the special cases we handle, do special stuff
620 // now.
621 const Value *CondVal = BrInst.getCondition();
622 MachineBasicBlock *Succ1MBB = &getMBB(*BrInst.getSuccessor(1));
623
624 // If this is a series of conditions that are or'd or and'd together, emit
625 // this as a sequence of branches instead of setcc's with and/or operations.
626 // As long as jumps are not expensive (exceptions for multi-use logic ops,
627 // unpredictable branches, and vector extracts because those jumps are likely
628 // expensive for any target), this should improve performance.
629 // For example, instead of something like:
630 // cmp A, B
631 // C = seteq
632 // cmp D, E
633 // F = setle
634 // or C, F
635 // jnz foo
636 // Emit:
637 // cmp A, B
638 // je foo
639 // cmp D, E
640 // jle foo
641 using namespace PatternMatch;
642 const Instruction *CondI = dyn_cast<Instruction>(CondVal);
643 if (!TLI->isJumpExpensive() && CondI && CondI->hasOneUse() &&
644 !BrInst.hasMetadata(LLVMContext::MD_unpredictable)) {
646 Value *Vec;
647 const Value *BOp0, *BOp1;
648 if (match(CondI, m_LogicalAnd(m_Value(BOp0), m_Value(BOp1))))
649 Opcode = Instruction::And;
650 else if (match(CondI, m_LogicalOr(m_Value(BOp0), m_Value(BOp1))))
651 Opcode = Instruction::Or;
652
653 if (Opcode && !(match(BOp0, m_ExtractElt(m_Value(Vec), m_Value())) &&
654 match(BOp1, m_ExtractElt(m_Specific(Vec), m_Value())))) {
655 findMergedConditions(CondI, Succ0MBB, Succ1MBB, &CurMBB, &CurMBB, Opcode,
656 getEdgeProbability(&CurMBB, Succ0MBB),
657 getEdgeProbability(&CurMBB, Succ1MBB),
658 /*InvertCond=*/false);
659 assert(SL->SwitchCases[0].ThisBB == &CurMBB && "Unexpected lowering!");
660
661 // Allow some cases to be rejected.
662 if (shouldEmitAsBranches(SL->SwitchCases)) {
663 // Emit the branch for this block.
664 emitSwitchCase(SL->SwitchCases[0], &CurMBB, *CurBuilder);
665 SL->SwitchCases.erase(SL->SwitchCases.begin());
666 return true;
667 }
668
669 // Okay, we decided not to do this, remove any inserted MBB's and clear
670 // SwitchCases.
671 for (unsigned I = 1, E = SL->SwitchCases.size(); I != E; ++I)
672 MF->erase(SL->SwitchCases[I].ThisBB);
673
674 SL->SwitchCases.clear();
675 }
676 }
677
678 // Create a CaseBlock record representing this branch.
679 SwitchCG::CaseBlock CB(CmpInst::ICMP_EQ, false, CondVal,
680 ConstantInt::getTrue(MF->getFunction().getContext()),
681 nullptr, Succ0MBB, Succ1MBB, &CurMBB,
682 CurBuilder->getDebugLoc());
683
684 // Use emitSwitchCase to actually insert the fast branch sequence for this
685 // cond branch.
686 emitSwitchCase(CB, &CurMBB, *CurBuilder);
687 return true;
688}
689
690void IRTranslator::addSuccessorWithProb(MachineBasicBlock *Src,
692 BranchProbability Prob) {
693 if (!FuncInfo.BPI) {
694 Src->addSuccessorWithoutProb(Dst);
695 return;
696 }
697 if (Prob.isUnknown())
698 Prob = getEdgeProbability(Src, Dst);
699 Src->addSuccessor(Dst, Prob);
700}
701
703IRTranslator::getEdgeProbability(const MachineBasicBlock *Src,
704 const MachineBasicBlock *Dst) const {
705 const BasicBlock *SrcBB = Src->getBasicBlock();
706 const BasicBlock *DstBB = Dst->getBasicBlock();
707 if (!FuncInfo.BPI) {
708 // If BPI is not available, set the default probability as 1 / N, where N is
709 // the number of successors.
710 auto SuccSize = std::max<uint32_t>(succ_size(SrcBB), 1);
711 return BranchProbability(1, SuccSize);
712 }
713 return FuncInfo.BPI->getEdgeProbability(SrcBB, DstBB);
714}
715
716bool IRTranslator::translateSwitch(const User &U, MachineIRBuilder &MIB) {
717 using namespace SwitchCG;
718 // Extract cases from the switch.
719 const SwitchInst &SI = cast<SwitchInst>(U);
720 BranchProbabilityInfo *BPI = FuncInfo.BPI;
721 CaseClusterVector Clusters;
722 Clusters.reserve(SI.getNumCases());
723 for (const auto &I : SI.cases()) {
724 MachineBasicBlock *Succ = &getMBB(*I.getCaseSuccessor());
725 assert(Succ && "Could not find successor mbb in mapping");
726 const ConstantInt *CaseVal = I.getCaseValue();
727 BranchProbability Prob =
728 BPI ? BPI->getEdgeProbability(SI.getParent(), I.getSuccessorIndex())
729 : BranchProbability(1, SI.getNumCases() + 1);
730 Clusters.push_back(CaseCluster::range(CaseVal, CaseVal, Succ, Prob));
731 }
732
733 MachineBasicBlock *DefaultMBB = &getMBB(*SI.getDefaultDest());
734
735 // Cluster adjacent cases with the same destination. We do this at all
736 // optimization levels because it's cheap to do and will make codegen faster
737 // if there are many clusters.
738 sortAndRangeify(Clusters);
739
740 MachineBasicBlock *SwitchMBB = &getMBB(*SI.getParent());
741
742 // If there is only the default destination, jump there directly.
743 if (Clusters.empty()) {
744 SwitchMBB->addSuccessor(DefaultMBB);
745 if (DefaultMBB != SwitchMBB->getNextNode())
746 MIB.buildBr(*DefaultMBB);
747 return true;
748 }
749
750 SL->findJumpTables(Clusters, &SI, std::nullopt, DefaultMBB, nullptr, nullptr);
751 SL->findBitTestClusters(Clusters, &SI);
752
753 LLVM_DEBUG({
754 dbgs() << "Case clusters: ";
755 for (const CaseCluster &C : Clusters) {
756 if (C.Kind == CC_JumpTable)
757 dbgs() << "JT:";
758 if (C.Kind == CC_BitTests)
759 dbgs() << "BT:";
760
761 C.Low->getValue().print(dbgs(), true);
762 if (C.Low != C.High) {
763 dbgs() << '-';
764 C.High->getValue().print(dbgs(), true);
765 }
766 dbgs() << ' ';
767 }
768 dbgs() << '\n';
769 });
770
771 assert(!Clusters.empty());
772 SwitchWorkList WorkList;
773 CaseClusterIt First = Clusters.begin();
774 CaseClusterIt Last = Clusters.end() - 1;
775 auto DefaultProb = getEdgeProbability(SwitchMBB, DefaultMBB);
776 WorkList.push_back({SwitchMBB, First, Last, nullptr, nullptr, DefaultProb});
777
778 while (!WorkList.empty()) {
779 SwitchWorkListItem W = WorkList.pop_back_val();
780
781 unsigned NumClusters = W.LastCluster - W.FirstCluster + 1;
782 // For optimized builds, lower large range as a balanced binary tree.
783 if (NumClusters > 3 &&
784 MF->getTarget().getOptLevel() != CodeGenOptLevel::None &&
785 !DefaultMBB->getParent()->getFunction().hasMinSize()) {
786 splitWorkItem(WorkList, W, SI.getCondition(), SwitchMBB, MIB);
787 continue;
788 }
789
790 if (!lowerSwitchWorkItem(W, SI.getCondition(), SwitchMBB, DefaultMBB, MIB))
791 return false;
792 }
793 return true;
794}
795
796void IRTranslator::splitWorkItem(SwitchCG::SwitchWorkList &WorkList,
798 Value *Cond, MachineBasicBlock *SwitchMBB,
799 MachineIRBuilder &MIB) {
800 using namespace SwitchCG;
801 assert(W.FirstCluster->Low->getValue().slt(W.LastCluster->Low->getValue()) &&
802 "Clusters not sorted?");
803 assert(W.LastCluster - W.FirstCluster + 1 >= 2 && "Too small to split!");
804
805 auto [LastLeft, FirstRight, LeftProb, RightProb] =
806 SL->computeSplitWorkItemInfo(W);
807
808 // Use the first element on the right as pivot since we will make less-than
809 // comparisons against it.
810 CaseClusterIt PivotCluster = FirstRight;
811 assert(PivotCluster > W.FirstCluster);
812 assert(PivotCluster <= W.LastCluster);
813
814 CaseClusterIt FirstLeft = W.FirstCluster;
815 CaseClusterIt LastRight = W.LastCluster;
816
817 const ConstantInt *Pivot = PivotCluster->Low;
818
819 // New blocks will be inserted immediately after the current one.
821 ++BBI;
822
823 // We will branch to the LHS if Value < Pivot. If LHS is a single cluster,
824 // we can branch to its destination directly if it's squeezed exactly in
825 // between the known lower bound and Pivot - 1.
826 MachineBasicBlock *LeftMBB;
827 if (FirstLeft == LastLeft && FirstLeft->Kind == CC_Range &&
828 FirstLeft->Low == W.GE &&
829 (FirstLeft->High->getValue() + 1LL) == Pivot->getValue()) {
830 LeftMBB = FirstLeft->MBB;
831 } else {
832 LeftMBB = FuncInfo.MF->CreateMachineBasicBlock(W.MBB->getBasicBlock());
833 FuncInfo.MF->insert(BBI, LeftMBB);
834 WorkList.push_back(
835 {LeftMBB, FirstLeft, LastLeft, W.GE, Pivot, W.DefaultProb / 2});
836 }
837
838 // Similarly, we will branch to the RHS if Value >= Pivot. If RHS is a
839 // single cluster, RHS.Low == Pivot, and we can branch to its destination
840 // directly if RHS.High equals the current upper bound.
841 MachineBasicBlock *RightMBB;
842 if (FirstRight == LastRight && FirstRight->Kind == CC_Range && W.LT &&
843 (FirstRight->High->getValue() + 1ULL) == W.LT->getValue()) {
844 RightMBB = FirstRight->MBB;
845 } else {
846 RightMBB = FuncInfo.MF->CreateMachineBasicBlock(W.MBB->getBasicBlock());
847 FuncInfo.MF->insert(BBI, RightMBB);
848 WorkList.push_back(
849 {RightMBB, FirstRight, LastRight, Pivot, W.LT, W.DefaultProb / 2});
850 }
851
852 // Create the CaseBlock record that will be used to lower the branch.
853 CaseBlock CB(ICmpInst::Predicate::ICMP_SLT, false, Cond, Pivot, nullptr,
854 LeftMBB, RightMBB, W.MBB, MIB.getDebugLoc(), LeftProb,
855 RightProb);
856
857 if (W.MBB == SwitchMBB)
858 emitSwitchCase(CB, SwitchMBB, MIB);
859 else
860 SL->SwitchCases.push_back(CB);
861}
862
863void IRTranslator::emitJumpTable(SwitchCG::JumpTable &JT,
865 // Emit the code for the jump table
866 assert(JT.Reg && "Should lower JT Header first!");
867 MachineIRBuilder MIB(*MBB->getParent());
868 MIB.setMBB(*MBB);
869 MIB.setDebugLoc(CurBuilder->getDebugLoc());
870
871 Type *PtrIRTy = PointerType::getUnqual(MF->getFunction().getContext());
872 const LLT PtrTy = getLLTForType(*PtrIRTy, *DL);
873
874 auto Table = MIB.buildJumpTable(PtrTy, JT.JTI);
875 MIB.buildBrJT(Table.getReg(0), JT.JTI, JT.Reg);
876}
877
878bool IRTranslator::emitJumpTableHeader(SwitchCG::JumpTable &JT,
880 MachineBasicBlock *HeaderBB) {
881 MachineIRBuilder MIB(*HeaderBB->getParent());
882 MIB.setMBB(*HeaderBB);
883 MIB.setDebugLoc(CurBuilder->getDebugLoc());
884
885 const Value &SValue = *JTH.SValue;
886 // Subtract the lowest switch case value from the value being switched on.
887 const LLT SwitchTy = getLLTForType(*SValue.getType(), *DL);
888 Register SwitchOpReg = getOrCreateVReg(SValue);
889 auto FirstCst = MIB.buildConstant(SwitchTy, JTH.First);
890 auto Sub = MIB.buildSub({SwitchTy}, SwitchOpReg, FirstCst);
891
892 // This value may be smaller or larger than the target's pointer type, and
893 // therefore require extension or truncating.
894 auto *PtrIRTy = PointerType::getUnqual(SValue.getContext());
895 const LLT PtrScalarTy = LLT::integer(DL->getTypeSizeInBits(PtrIRTy));
896 Sub = MIB.buildZExtOrTrunc(PtrScalarTy, Sub);
897
898 JT.Reg = Sub.getReg(0);
899
900 if (JTH.FallthroughUnreachable) {
901 if (JT.MBB != HeaderBB->getNextNode())
902 MIB.buildBr(*JT.MBB);
903 return true;
904 }
905
906 // Emit the range check for the jump table, and branch to the default block
907 // for the switch statement if the value being switched on exceeds the
908 // largest case in the switch.
909 auto Cst = getOrCreateVReg(
910 *ConstantInt::get(SValue.getType(), JTH.Last - JTH.First));
911 Cst = MIB.buildZExtOrTrunc(PtrScalarTy, Cst).getReg(0);
912 auto Cmp = MIB.buildICmp(CmpInst::ICMP_UGT, LLT::integer(1), Sub, Cst);
913
914 auto BrCond = MIB.buildBrCond(Cmp.getReg(0), *JT.Default);
915
916 // Avoid emitting unnecessary branches to the next block.
917 if (JT.MBB != HeaderBB->getNextNode())
918 BrCond = MIB.buildBr(*JT.MBB);
919 return true;
920}
921
922void IRTranslator::emitSwitchCase(SwitchCG::CaseBlock &CB,
923 MachineBasicBlock *SwitchBB,
924 MachineIRBuilder &MIB) {
925 Register CondLHS = getOrCreateVReg(*CB.CmpLHS);
927 DebugLoc OldDbgLoc = MIB.getDebugLoc();
928 MIB.setDebugLoc(CB.DbgLoc);
929 MIB.setMBB(*CB.ThisBB);
930
931 if (CB.PredInfo.NoCmp) {
932 // Branch or fall through to TrueBB.
933 addSuccessorWithProb(CB.ThisBB, CB.TrueBB, CB.TrueProb);
934 addMachineCFGPred({SwitchBB->getBasicBlock(), CB.TrueBB->getBasicBlock()},
935 CB.ThisBB);
937 if (CB.TrueBB != CB.ThisBB->getNextNode())
938 MIB.buildBr(*CB.TrueBB);
939 MIB.setDebugLoc(OldDbgLoc);
940 return;
941 }
942
943 const LLT i1Ty = LLT::integer(1);
944 // Build the compare.
945 if (!CB.CmpMHS) {
946 const auto *CI = dyn_cast<ConstantInt>(CB.CmpRHS);
947 // For conditional branch lowering, we might try to do something silly like
948 // emit an G_ICMP to compare an existing G_ICMP i1 result with true. If so,
949 // just re-use the existing condition vreg.
950 if (MRI->getType(CondLHS).getSizeInBits() == 1 && CI && CI->isOne() &&
952 Cond = CondLHS;
953 } else {
954 Register CondRHS = getOrCreateVReg(*CB.CmpRHS);
956 Cond =
957 MIB.buildFCmp(CB.PredInfo.Pred, i1Ty, CondLHS, CondRHS).getReg(0);
958 else
959 Cond =
960 MIB.buildICmp(CB.PredInfo.Pred, i1Ty, CondLHS, CondRHS).getReg(0);
961 }
962 } else {
964 "Can only handle SLE ranges");
965
966 const APInt& Low = cast<ConstantInt>(CB.CmpLHS)->getValue();
967 const APInt& High = cast<ConstantInt>(CB.CmpRHS)->getValue();
968
969 Register CmpOpReg = getOrCreateVReg(*CB.CmpMHS);
970 if (cast<ConstantInt>(CB.CmpLHS)->isMinValue(true)) {
971 Register CondRHS = getOrCreateVReg(*CB.CmpRHS);
972 Cond =
973 MIB.buildICmp(CmpInst::ICMP_SLE, i1Ty, CmpOpReg, CondRHS).getReg(0);
974 } else {
975 const LLT CmpTy = MRI->getType(CmpOpReg);
976 auto Sub = MIB.buildSub({CmpTy}, CmpOpReg, CondLHS);
977 auto Diff = MIB.buildConstant(CmpTy, High - Low);
978 Cond = MIB.buildICmp(CmpInst::ICMP_ULE, i1Ty, Sub, Diff).getReg(0);
979 }
980 }
981
982 // Update successor info
983 addSuccessorWithProb(CB.ThisBB, CB.TrueBB, CB.TrueProb);
984
985 addMachineCFGPred({SwitchBB->getBasicBlock(), CB.TrueBB->getBasicBlock()},
986 CB.ThisBB);
987
988 // TrueBB and FalseBB are always different unless the incoming IR is
989 // degenerate. This only happens when running llc on weird IR.
990 if (CB.TrueBB != CB.FalseBB)
991 addSuccessorWithProb(CB.ThisBB, CB.FalseBB, CB.FalseProb);
993
994 addMachineCFGPred({SwitchBB->getBasicBlock(), CB.FalseBB->getBasicBlock()},
995 CB.ThisBB);
996
997 MIB.buildBrCond(Cond, *CB.TrueBB);
998 MIB.buildBr(*CB.FalseBB);
999 MIB.setDebugLoc(OldDbgLoc);
1000}
1001
1002bool IRTranslator::lowerJumpTableWorkItem(SwitchCG::SwitchWorkListItem W,
1003 MachineBasicBlock *SwitchMBB,
1004 MachineBasicBlock *CurMBB,
1005 MachineBasicBlock *DefaultMBB,
1006 MachineIRBuilder &MIB,
1008 BranchProbability UnhandledProbs,
1010 MachineBasicBlock *Fallthrough,
1011 bool FallthroughUnreachable) {
1012 using namespace SwitchCG;
1013 MachineFunction *CurMF = SwitchMBB->getParent();
1014 // FIXME: Optimize away range check based on pivot comparisons.
1015 JumpTableHeader *JTH = &SL->JTCases[I->JTCasesIndex].first;
1016 SwitchCG::JumpTable *JT = &SL->JTCases[I->JTCasesIndex].second;
1017 BranchProbability DefaultProb = W.DefaultProb;
1018
1019 // The jump block hasn't been inserted yet; insert it here.
1020 MachineBasicBlock *JumpMBB = JT->MBB;
1021 CurMF->insert(BBI, JumpMBB);
1022
1023 // Since the jump table block is separate from the switch block, we need
1024 // to keep track of it as a machine predecessor to the default block,
1025 // otherwise we lose the phi edges.
1026 addMachineCFGPred({SwitchMBB->getBasicBlock(), DefaultMBB->getBasicBlock()},
1027 CurMBB);
1028 addMachineCFGPred({SwitchMBB->getBasicBlock(), DefaultMBB->getBasicBlock()},
1029 JumpMBB);
1030
1031 auto JumpProb = I->Prob;
1032 auto FallthroughProb = UnhandledProbs;
1033
1034 // If the default statement is a target of the jump table, we evenly
1035 // distribute the default probability to successors of CurMBB. Also
1036 // update the probability on the edge from JumpMBB to Fallthrough.
1037 for (MachineBasicBlock::succ_iterator SI = JumpMBB->succ_begin(),
1038 SE = JumpMBB->succ_end();
1039 SI != SE; ++SI) {
1040 if (*SI == DefaultMBB) {
1041 JumpProb += DefaultProb / 2;
1042 FallthroughProb -= DefaultProb / 2;
1043 JumpMBB->setSuccProbability(SI, DefaultProb / 2);
1044 JumpMBB->normalizeSuccProbs();
1045 } else {
1046 // Also record edges from the jump table block to it's successors.
1047 addMachineCFGPred({SwitchMBB->getBasicBlock(), (*SI)->getBasicBlock()},
1048 JumpMBB);
1049 }
1050 }
1051
1052 if (FallthroughUnreachable)
1053 JTH->FallthroughUnreachable = true;
1054
1055 if (!JTH->FallthroughUnreachable)
1056 addSuccessorWithProb(CurMBB, Fallthrough, FallthroughProb);
1057 addSuccessorWithProb(CurMBB, JumpMBB, JumpProb);
1058 CurMBB->normalizeSuccProbs();
1059
1060 // The jump table header will be inserted in our current block, do the
1061 // range check, and fall through to our fallthrough block.
1062 JTH->HeaderBB = CurMBB;
1063 JT->Default = Fallthrough; // FIXME: Move Default to JumpTableHeader.
1064
1065 // If we're in the right place, emit the jump table header right now.
1066 if (CurMBB == SwitchMBB) {
1067 if (!emitJumpTableHeader(*JT, *JTH, CurMBB))
1068 return false;
1069 JTH->Emitted = true;
1070 }
1071 return true;
1072}
1073bool IRTranslator::lowerSwitchRangeWorkItem(SwitchCG::CaseClusterIt I,
1074 Value *Cond,
1075 MachineBasicBlock *Fallthrough,
1076 bool FallthroughUnreachable,
1077 BranchProbability UnhandledProbs,
1078 MachineBasicBlock *CurMBB,
1079 MachineIRBuilder &MIB,
1080 MachineBasicBlock *SwitchMBB) {
1081 using namespace SwitchCG;
1082 const Value *RHS, *LHS, *MHS;
1083 CmpInst::Predicate Pred;
1084 if (I->Low == I->High) {
1085 // Check Cond == I->Low.
1086 Pred = CmpInst::ICMP_EQ;
1087 LHS = Cond;
1088 RHS = I->Low;
1089 MHS = nullptr;
1090 } else {
1091 // Check I->Low <= Cond <= I->High.
1092 Pred = CmpInst::ICMP_SLE;
1093 LHS = I->Low;
1094 MHS = Cond;
1095 RHS = I->High;
1096 }
1097
1098 // If Fallthrough is unreachable, fold away the comparison.
1099 // The false probability is the sum of all unhandled cases.
1100 CaseBlock CB(Pred, FallthroughUnreachable, LHS, RHS, MHS, I->MBB, Fallthrough,
1101 CurMBB, MIB.getDebugLoc(), I->Prob, UnhandledProbs);
1102
1103 emitSwitchCase(CB, SwitchMBB, MIB);
1104 return true;
1105}
1106
1107void IRTranslator::emitBitTestHeader(SwitchCG::BitTestBlock &B,
1108 MachineBasicBlock *SwitchBB) {
1109 MachineIRBuilder &MIB = *CurBuilder;
1110 MIB.setMBB(*SwitchBB);
1111
1112 // Subtract the minimum value.
1113 Register SwitchOpReg = getOrCreateVReg(*B.SValue);
1114
1115 LLT SwitchOpTy = MRI->getType(SwitchOpReg);
1116 Register MinValReg = MIB.buildConstant(SwitchOpTy, B.First).getReg(0);
1117 auto RangeSub = MIB.buildSub(SwitchOpTy, SwitchOpReg, MinValReg);
1118
1119 Type *PtrIRTy = PointerType::getUnqual(MF->getFunction().getContext());
1120 const LLT PtrTy = getLLTForType(*PtrIRTy, *DL);
1121
1122 LLT MaskTy = SwitchOpTy;
1123 if (MaskTy.getSizeInBits() > PtrTy.getSizeInBits() ||
1125 MaskTy = LLT::integer(PtrTy.getSizeInBits());
1126 else {
1127 // Ensure that the type will fit the mask value.
1128 for (const SwitchCG::BitTestCase &Case : B.Cases) {
1129 if (!isUIntN(SwitchOpTy.getSizeInBits(), Case.Mask)) {
1130 // Switch table case range are encoded into series of masks.
1131 // Just use pointer type, it's guaranteed to fit.
1132 MaskTy = LLT::integer(PtrTy.getSizeInBits());
1133 break;
1134 }
1135 }
1136 }
1137 Register SubReg = RangeSub.getReg(0);
1138 if (SwitchOpTy != MaskTy)
1139 SubReg = MIB.buildZExtOrTrunc(MaskTy, SubReg).getReg(0);
1140
1141 B.RegVT = getMVTForLLT(MaskTy);
1142 B.Reg = SubReg;
1143
1144 MachineBasicBlock *MBB = B.Cases[0].ThisBB;
1145
1146 if (!B.FallthroughUnreachable)
1147 addSuccessorWithProb(SwitchBB, B.Default, B.DefaultProb);
1148 addSuccessorWithProb(SwitchBB, MBB, B.Prob);
1149
1150 SwitchBB->normalizeSuccProbs();
1151
1152 if (!B.FallthroughUnreachable) {
1153 // Conditional branch to the default block.
1154 auto RangeCst = MIB.buildConstant(SwitchOpTy, B.Range);
1155 auto RangeCmp = MIB.buildICmp(CmpInst::Predicate::ICMP_UGT, LLT::integer(1),
1156 RangeSub, RangeCst);
1157 MIB.buildBrCond(RangeCmp, *B.Default);
1158 }
1159
1160 // Avoid emitting unnecessary branches to the next block.
1161 if (MBB != SwitchBB->getNextNode())
1162 MIB.buildBr(*MBB);
1163}
1164
1165void IRTranslator::emitBitTestCase(SwitchCG::BitTestBlock &BB,
1166 MachineBasicBlock *NextMBB,
1167 BranchProbability BranchProbToNext,
1169 MachineBasicBlock *SwitchBB) {
1170 MachineIRBuilder &MIB = *CurBuilder;
1171 MIB.setMBB(*SwitchBB);
1172
1173 LLT SwitchTy = getLLTForMVT(BB.RegVT);
1174 Register Cmp;
1175 unsigned PopCount = llvm::popcount(B.Mask);
1176 if (PopCount == 1) {
1177 // Testing for a single bit; just compare the shift count with what it
1178 // would need to be to shift a 1 bit in that position.
1179 auto MaskTrailingZeros =
1180 MIB.buildConstant(SwitchTy, llvm::countr_zero(B.Mask));
1182 MaskTrailingZeros)
1183 .getReg(0);
1184 } else if (PopCount == BB.Range) {
1185 // There is only one zero bit in the range, test for it directly.
1186 auto MaskTrailingOnes =
1187 MIB.buildConstant(SwitchTy, llvm::countr_one(B.Mask));
1188 Cmp =
1189 MIB.buildICmp(CmpInst::ICMP_NE, LLT::integer(1), Reg, MaskTrailingOnes)
1190 .getReg(0);
1191 } else {
1192 // Make desired shift.
1193 auto CstOne = MIB.buildConstant(SwitchTy, 1);
1194 auto SwitchVal = MIB.buildShl(SwitchTy, CstOne, Reg);
1195
1196 // Emit bit tests and jumps.
1197 auto CstMask = MIB.buildConstant(SwitchTy, B.Mask);
1198 auto AndOp = MIB.buildAnd(SwitchTy, SwitchVal, CstMask);
1199 auto CstZero = MIB.buildConstant(SwitchTy, 0);
1200 Cmp = MIB.buildICmp(CmpInst::ICMP_NE, LLT::integer(1), AndOp, CstZero)
1201 .getReg(0);
1202 }
1203
1204 // The branch probability from SwitchBB to B.TargetBB is B.ExtraProb.
1205 addSuccessorWithProb(SwitchBB, B.TargetBB, B.ExtraProb);
1206 // The branch probability from SwitchBB to NextMBB is BranchProbToNext.
1207 addSuccessorWithProb(SwitchBB, NextMBB, BranchProbToNext);
1208 // It is not guaranteed that the sum of B.ExtraProb and BranchProbToNext is
1209 // one as they are relative probabilities (and thus work more like weights),
1210 // and hence we need to normalize them to let the sum of them become one.
1211 SwitchBB->normalizeSuccProbs();
1212
1213 // Record the fact that the IR edge from the header to the bit test target
1214 // will go through our new block. Neeeded for PHIs to have nodes added.
1215 addMachineCFGPred({BB.Parent->getBasicBlock(), B.TargetBB->getBasicBlock()},
1216 SwitchBB);
1217
1218 MIB.buildBrCond(Cmp, *B.TargetBB);
1219
1220 // Avoid emitting unnecessary branches to the next block.
1221 if (NextMBB != SwitchBB->getNextNode())
1222 MIB.buildBr(*NextMBB);
1223}
1224
1225bool IRTranslator::lowerBitTestWorkItem(
1227 MachineBasicBlock *CurMBB, MachineBasicBlock *DefaultMBB,
1229 BranchProbability DefaultProb, BranchProbability UnhandledProbs,
1231 bool FallthroughUnreachable) {
1232 using namespace SwitchCG;
1233 MachineFunction *CurMF = SwitchMBB->getParent();
1234 // FIXME: Optimize away range check based on pivot comparisons.
1235 BitTestBlock *BTB = &SL->BitTestCases[I->BTCasesIndex];
1236 // The bit test blocks haven't been inserted yet; insert them here.
1237 for (BitTestCase &BTC : BTB->Cases)
1238 CurMF->insert(BBI, BTC.ThisBB);
1239
1240 // Fill in fields of the BitTestBlock.
1241 BTB->Parent = CurMBB;
1242 BTB->Default = Fallthrough;
1243
1244 BTB->DefaultProb = UnhandledProbs;
1245 // If the cases in bit test don't form a contiguous range, we evenly
1246 // distribute the probability on the edge to Fallthrough to two
1247 // successors of CurMBB.
1248 if (!BTB->ContiguousRange) {
1249 BTB->Prob += DefaultProb / 2;
1250 BTB->DefaultProb -= DefaultProb / 2;
1251 }
1252
1253 if (FallthroughUnreachable)
1254 BTB->FallthroughUnreachable = true;
1255
1256 // If we're in the right place, emit the bit test header right now.
1257 if (CurMBB == SwitchMBB) {
1258 emitBitTestHeader(*BTB, SwitchMBB);
1259 BTB->Emitted = true;
1260 }
1261 return true;
1262}
1263
1264bool IRTranslator::lowerSwitchWorkItem(SwitchCG::SwitchWorkListItem W,
1265 Value *Cond,
1266 MachineBasicBlock *SwitchMBB,
1267 MachineBasicBlock *DefaultMBB,
1268 MachineIRBuilder &MIB) {
1269 using namespace SwitchCG;
1270 MachineFunction *CurMF = FuncInfo.MF;
1271 MachineBasicBlock *NextMBB = nullptr;
1273 if (++BBI != FuncInfo.MF->end())
1274 NextMBB = &*BBI;
1275
1276 if (EnableOpts) {
1277 // Here, we order cases by probability so the most likely case will be
1278 // checked first. However, two clusters can have the same probability in
1279 // which case their relative ordering is non-deterministic. So we use Low
1280 // as a tie-breaker as clusters are guaranteed to never overlap.
1281 llvm::sort(W.FirstCluster, W.LastCluster + 1,
1282 [](const CaseCluster &a, const CaseCluster &b) {
1283 return a.Prob != b.Prob
1284 ? a.Prob > b.Prob
1285 : a.Low->getValue().slt(b.Low->getValue());
1286 });
1287
1288 // Rearrange the case blocks so that the last one falls through if possible
1289 // without changing the order of probabilities.
1290 for (CaseClusterIt I = W.LastCluster; I > W.FirstCluster;) {
1291 --I;
1292 if (I->Prob > W.LastCluster->Prob)
1293 break;
1294 if (I->Kind == CC_Range && I->MBB == NextMBB) {
1295 std::swap(*I, *W.LastCluster);
1296 break;
1297 }
1298 }
1299 }
1300
1301 // Compute total probability.
1302 BranchProbability DefaultProb = W.DefaultProb;
1303 BranchProbability UnhandledProbs = DefaultProb;
1304 for (CaseClusterIt I = W.FirstCluster; I <= W.LastCluster; ++I)
1305 UnhandledProbs += I->Prob;
1306
1307 MachineBasicBlock *CurMBB = W.MBB;
1308 for (CaseClusterIt I = W.FirstCluster, E = W.LastCluster; I <= E; ++I) {
1309 bool FallthroughUnreachable = false;
1310 MachineBasicBlock *Fallthrough;
1311 if (I == W.LastCluster) {
1312 // For the last cluster, fall through to the default destination.
1313 Fallthrough = DefaultMBB;
1314 FallthroughUnreachable = isa<UnreachableInst>(
1315 DefaultMBB->getBasicBlock()->getFirstNonPHIOrDbg());
1316 } else {
1317 Fallthrough = CurMF->CreateMachineBasicBlock(CurMBB->getBasicBlock());
1318 CurMF->insert(BBI, Fallthrough);
1319 }
1320 UnhandledProbs -= I->Prob;
1321
1322 switch (I->Kind) {
1323 case CC_BitTests: {
1324 if (!lowerBitTestWorkItem(W, SwitchMBB, CurMBB, DefaultMBB, MIB, BBI,
1325 DefaultProb, UnhandledProbs, I, Fallthrough,
1326 FallthroughUnreachable)) {
1327 LLVM_DEBUG(dbgs() << "Failed to lower bit test for switch");
1328 return false;
1329 }
1330 break;
1331 }
1332
1333 case CC_JumpTable: {
1334 if (!lowerJumpTableWorkItem(W, SwitchMBB, CurMBB, DefaultMBB, MIB, BBI,
1335 UnhandledProbs, I, Fallthrough,
1336 FallthroughUnreachable)) {
1337 LLVM_DEBUG(dbgs() << "Failed to lower jump table");
1338 return false;
1339 }
1340 break;
1341 }
1342 case CC_Range: {
1343 if (!lowerSwitchRangeWorkItem(I, Cond, Fallthrough,
1344 FallthroughUnreachable, UnhandledProbs,
1345 CurMBB, MIB, SwitchMBB)) {
1346 LLVM_DEBUG(dbgs() << "Failed to lower switch range");
1347 return false;
1348 }
1349 break;
1350 }
1351 }
1352 CurMBB = Fallthrough;
1353 }
1354
1355 return true;
1356}
1357
1358bool IRTranslator::translateIndirectBr(const User &U,
1359 MachineIRBuilder &MIRBuilder) {
1360 const IndirectBrInst &BrInst = cast<IndirectBrInst>(U);
1361
1362 const Register Tgt = getOrCreateVReg(*BrInst.getAddress());
1363 MIRBuilder.buildBrIndirect(Tgt);
1364
1365 // Link successors.
1366 SmallPtrSet<const BasicBlock *, 32> AddedSuccessors;
1367 MachineBasicBlock &CurBB = MIRBuilder.getMBB();
1368 for (const BasicBlock *Succ : successors(&BrInst)) {
1369 // It's legal for indirectbr instructions to have duplicate blocks in the
1370 // destination list. We don't allow this in MIR. Skip anything that's
1371 // already a successor.
1372 if (!AddedSuccessors.insert(Succ).second)
1373 continue;
1374 CurBB.addSuccessor(&getMBB(*Succ));
1375 }
1376
1377 return true;
1378}
1379
1380static bool isSwiftError(const Value *V) {
1381 if (auto Arg = dyn_cast<Argument>(V))
1382 return Arg->hasSwiftErrorAttr();
1383 if (auto AI = dyn_cast<AllocaInst>(V))
1384 return AI->isSwiftError();
1385 return false;
1386}
1387
1388bool IRTranslator::translateLoad(const User &U, MachineIRBuilder &MIRBuilder) {
1389 const LoadInst &LI = cast<LoadInst>(U);
1390 TypeSize StoreSize = DL->getTypeStoreSize(LI.getType());
1391 if (StoreSize.isZero())
1392 return true;
1393
1394 ArrayRef<Register> Regs = getOrCreateVRegs(LI);
1395 Register Base = getOrCreateVReg(*LI.getPointerOperand());
1396 AAMDNodes AAInfo = LI.getAAMetadata();
1397
1398 const Value *Ptr = LI.getPointerOperand();
1399
1400 if (CLI->supportSwiftError() && isSwiftError(Ptr)) {
1401 assert(Regs.size() == 1 && "swifterror should be single pointer");
1402 Register VReg =
1403 SwiftError.getOrCreateVRegUseAt(&LI, &MIRBuilder.getMBB(), Ptr);
1404 MIRBuilder.buildCopy(Regs[0], VReg);
1405 return true;
1406 }
1407
1409 TLI->getLoadMemOperandFlags(LI, *DL, AC, LibInfo, OptLevel);
1410 if (AA && !(Flags & MachineMemOperand::MOInvariant)) {
1411 if (AA->pointsToConstantMemory(
1412 MemoryLocation(Ptr, LocationSize::precise(StoreSize), AAInfo))) {
1414 }
1415 }
1416
1417 // Fast-path the common single-register load.
1418 if (Regs.size() == 1) {
1419 auto *MMO = MF->getMachineMemOperand(
1420 MachinePointerInfo(LI.getPointerOperand()), Flags,
1421 MRI->getType(Regs[0]), getMemOpAlign(LI), AAInfo,
1422 LI.getMetadata(LLVMContext::MD_range), LI.getSyncScopeID(),
1423 LI.getOrdering());
1424 MIRBuilder.buildLoad(Regs[0], Base, *MMO);
1425 return true;
1426 }
1427
1428 ArrayRef<uint64_t> Offsets = *VMap.getOffsets(LI);
1429 Type *OffsetIRTy = DL->getIndexType(Ptr->getType());
1430 LLT OffsetTy = getLLTForType(*OffsetIRTy, *DL);
1431 for (unsigned i = 0; i < Regs.size(); ++i) {
1432 Register Addr;
1433 MIRBuilder.materializeObjectPtrOffset(Addr, Base, OffsetTy, Offsets[i]);
1434
1435 MachinePointerInfo Ptr(LI.getPointerOperand(), Offsets[i]);
1436 Align BaseAlign = getMemOpAlign(LI);
1437 auto *MMO = MF->getMachineMemOperand(Ptr, Flags, MRI->getType(Regs[i]),
1438 commonAlignment(BaseAlign, Offsets[i]),
1439 AAInfo, nullptr, LI.getSyncScopeID(),
1440 LI.getOrdering());
1441 MIRBuilder.buildLoad(Regs[i], Addr, *MMO);
1442 }
1443
1444 return true;
1445}
1446
1447bool IRTranslator::translateStore(const User &U, MachineIRBuilder &MIRBuilder) {
1448 const StoreInst &SI = cast<StoreInst>(U);
1449 if (DL->getTypeStoreSize(SI.getValueOperand()->getType()).isZero())
1450 return true;
1451
1452 ArrayRef<Register> Vals = getOrCreateVRegs(*SI.getValueOperand());
1453 Register Base = getOrCreateVReg(*SI.getPointerOperand());
1454
1455 if (CLI->supportSwiftError() && isSwiftError(SI.getPointerOperand())) {
1456 assert(Vals.size() == 1 && "swifterror should be single pointer");
1457
1458 Register VReg = SwiftError.getOrCreateVRegDefAt(&SI, &MIRBuilder.getMBB(),
1459 SI.getPointerOperand());
1460 MIRBuilder.buildCopy(VReg, Vals[0]);
1461 return true;
1462 }
1463
1464 MachineMemOperand::Flags Flags = TLI->getStoreMemOperandFlags(SI, *DL);
1465 // Fast-path the common single-register store.
1466 if (Vals.size() == 1) {
1467 auto *MMO = MF->getMachineMemOperand(
1468 MachinePointerInfo(SI.getPointerOperand()), Flags,
1469 MRI->getType(Vals[0]), getMemOpAlign(SI), SI.getAAMetadata(), nullptr,
1470 SI.getSyncScopeID(), SI.getOrdering());
1471 MIRBuilder.buildStore(Vals[0], Base, *MMO);
1472 return true;
1473 }
1474
1475 ArrayRef<uint64_t> Offsets = *VMap.getOffsets(*SI.getValueOperand());
1476 Type *OffsetIRTy = DL->getIndexType(SI.getPointerOperandType());
1477 LLT OffsetTy = getLLTForType(*OffsetIRTy, *DL);
1478 for (unsigned i = 0; i < Vals.size(); ++i) {
1479 Register Addr;
1480 MIRBuilder.materializeObjectPtrOffset(Addr, Base, OffsetTy, Offsets[i]);
1481
1482 MachinePointerInfo Ptr(SI.getPointerOperand(), Offsets[i]);
1483 Align BaseAlign = getMemOpAlign(SI);
1484 auto *MMO = MF->getMachineMemOperand(Ptr, Flags, MRI->getType(Vals[i]),
1485 commonAlignment(BaseAlign, Offsets[i]),
1486 SI.getAAMetadata(), nullptr,
1487 SI.getSyncScopeID(), SI.getOrdering());
1488 MIRBuilder.buildStore(Vals[i], Addr, *MMO);
1489 }
1490 return true;
1491}
1492
1494 const Value *Src = U.getOperand(0);
1495 Type *Int32Ty = Type::getInt32Ty(U.getContext());
1496
1497 // getIndexedOffsetInType is designed for GEPs, so the first index is the
1498 // usual array element rather than looking into the actual aggregate.
1500 Indices.push_back(ConstantInt::get(Int32Ty, 0));
1501
1502 if (const ExtractValueInst *EVI = dyn_cast<ExtractValueInst>(&U)) {
1503 for (auto Idx : EVI->indices())
1504 Indices.push_back(ConstantInt::get(Int32Ty, Idx));
1505 } else if (const InsertValueInst *IVI = dyn_cast<InsertValueInst>(&U)) {
1506 for (auto Idx : IVI->indices())
1507 Indices.push_back(ConstantInt::get(Int32Ty, Idx));
1508 } else {
1509 llvm::append_range(Indices, drop_begin(U.operands()));
1510 }
1511
1512 return static_cast<uint64_t>(
1513 DL.getIndexedOffsetInType(Src->getType(), Indices));
1514}
1515
1516bool IRTranslator::translateExtractValue(const User &U,
1517 MachineIRBuilder &MIRBuilder) {
1518 const Value *Src = U.getOperand(0);
1519 uint64_t Offset = getOffsetFromIndices(U, *DL);
1520 ArrayRef<Register> SrcRegs = getOrCreateVRegs(*Src);
1521 ArrayRef<uint64_t> Offsets = *VMap.getOffsets(*Src);
1522 unsigned Idx = llvm::lower_bound(Offsets, Offset) - Offsets.begin();
1523 auto &DstRegs = allocateVRegs(U);
1524
1525 for (unsigned i = 0; i < DstRegs.size(); ++i)
1526 DstRegs[i] = SrcRegs[Idx++];
1527
1528 return true;
1529}
1530
1531bool IRTranslator::translateInsertValue(const User &U,
1532 MachineIRBuilder &MIRBuilder) {
1533 const Value *Src = U.getOperand(0);
1534 uint64_t Offset = getOffsetFromIndices(U, *DL);
1535 auto &DstRegs = allocateVRegs(U);
1536 ArrayRef<uint64_t> DstOffsets = *VMap.getOffsets(U);
1537 ArrayRef<Register> SrcRegs = getOrCreateVRegs(*Src);
1538 ArrayRef<Register> InsertedRegs = getOrCreateVRegs(*U.getOperand(1));
1539 auto *InsertedIt = InsertedRegs.begin();
1540
1541 for (unsigned i = 0; i < DstRegs.size(); ++i) {
1542 if (DstOffsets[i] >= Offset && InsertedIt != InsertedRegs.end())
1543 DstRegs[i] = *InsertedIt++;
1544 else
1545 DstRegs[i] = SrcRegs[i];
1546 }
1547
1548 return true;
1549}
1550
1551bool IRTranslator::translateSelect(const User &U,
1552 MachineIRBuilder &MIRBuilder) {
1553 Register Tst = getOrCreateVReg(*U.getOperand(0));
1554 ArrayRef<Register> ResRegs = getOrCreateVRegs(U);
1555 ArrayRef<Register> Op0Regs = getOrCreateVRegs(*U.getOperand(1));
1556 ArrayRef<Register> Op1Regs = getOrCreateVRegs(*U.getOperand(2));
1557
1558 uint32_t Flags = 0;
1559 if (const SelectInst *SI = dyn_cast<SelectInst>(&U))
1561
1562 for (unsigned i = 0; i < ResRegs.size(); ++i) {
1563 MIRBuilder.buildSelect(ResRegs[i], Tst, Op0Regs[i], Op1Regs[i], Flags);
1564 }
1565
1566 return true;
1567}
1568
1569bool IRTranslator::translateCopy(const User &U, const Value &V,
1570 MachineIRBuilder &MIRBuilder) {
1571 Register Src = getOrCreateVReg(V);
1572 auto &Regs = *VMap.getVRegs(U);
1573 if (Regs.empty()) {
1574 Regs.push_back(Src);
1575 VMap.getOffsets(U)->push_back(0);
1576 } else {
1577 // If we already assigned a vreg for this instruction, we can't change that.
1578 // Emit a copy to satisfy the users we already emitted.
1579 MIRBuilder.buildCopy(Regs[0], Src);
1580 }
1581 return true;
1582}
1583
1584bool IRTranslator::translateBitCast(const User &U,
1585 MachineIRBuilder &MIRBuilder) {
1586 Type *SrcTy = U.getOperand(0)->getType();
1587 Type *DstTy = U.getType();
1588
1589 // If we're bitcasting to the source type, we can reuse the source vreg.
1590 if (getLLTForType(*SrcTy, *DL) == getLLTForType(*DstTy, *DL)) {
1591 // If the source is a ConstantInt then it was probably created by
1592 // ConstantHoisting and we should leave it alone.
1593 if (isa<ConstantInt>(U.getOperand(0)))
1594 return translateCast(TargetOpcode::G_CONSTANT_FOLD_BARRIER, U,
1595 MIRBuilder);
1596 return translateCopy(U, *U.getOperand(0), MIRBuilder);
1597 }
1598
1599 // Only the scalar byte<->ptr crossing is redirected to G_INTTOPTR/G_PTRTOINT,
1600 // which is the well-typed MIR shape for that boundary. Vector byte<->ptr
1601 // (e.g. <N x b32> -> ptr produced by mixed-type load coalescing) and other
1602 // legacy ptr/non-ptr IR bitcasts (AMDGPU iN<->p3 kernarg packing, etc.)
1603 // keep their historical G_BITCAST lowering — G_INTTOPTR has no vector-src
1604 // -> scalar-ptr form, and downstream passes already handle G_BITCAST.
1605 if (DstTy->isPointerTy() && SrcTy->isByteTy())
1606 return translateCast(TargetOpcode::G_INTTOPTR, U, MIRBuilder);
1607 if (SrcTy->isPointerTy() && DstTy->isByteTy())
1608 return translateCast(TargetOpcode::G_PTRTOINT, U, MIRBuilder);
1609
1610 return translateCast(TargetOpcode::G_BITCAST, U, MIRBuilder);
1611}
1612
1613bool IRTranslator::translateCast(unsigned Opcode, const User &U,
1614 MachineIRBuilder &MIRBuilder) {
1615 if (!mayTranslateUserTypes(U))
1616 return false;
1617
1618 uint32_t Flags = 0;
1619 if (const Instruction *I = dyn_cast<Instruction>(&U))
1621
1622 Register Op = getOrCreateVReg(*U.getOperand(0));
1623 Register Res = getOrCreateVReg(U);
1624 MIRBuilder.buildInstr(Opcode, {Res}, {Op}, Flags);
1625 return true;
1626}
1627
1628bool IRTranslator::translateGetElementPtr(const User &U,
1629 MachineIRBuilder &MIRBuilder) {
1630 Value &Op0 = *U.getOperand(0);
1631 Register BaseReg = getOrCreateVReg(Op0);
1632 Type *PtrIRTy = Op0.getType();
1633 LLT PtrTy = getLLTForType(*PtrIRTy, *DL);
1634 Type *OffsetIRTy = DL->getIndexType(PtrIRTy);
1635 LLT OffsetTy = getLLTForType(*OffsetIRTy, *DL);
1636
1637 uint32_t PtrAddFlags = 0;
1638 // Each PtrAdd generated to implement the GEP inherits its nuw, nusw, inbounds
1639 // flags.
1640 if (const Instruction *I = dyn_cast<Instruction>(&U))
1642
1643 auto PtrAddFlagsWithConst = [&](int64_t Offset) {
1644 // For nusw/inbounds GEP with an offset that is nonnegative when interpreted
1645 // as signed, assume there is no unsigned overflow.
1646 if (Offset >= 0 && (PtrAddFlags & MachineInstr::MIFlag::NoUSWrap))
1647 return PtrAddFlags | MachineInstr::MIFlag::NoUWrap;
1648 return PtrAddFlags;
1649 };
1650
1651 // Normalize Vector GEP - all scalar operands should be converted to the
1652 // splat vector.
1653 unsigned VectorWidth = 0;
1654
1655 // True if we should use a splat vector; using VectorWidth alone is not
1656 // sufficient.
1657 bool WantSplatVector = false;
1658 if (auto *VT = dyn_cast<VectorType>(U.getType())) {
1659 VectorWidth = cast<FixedVectorType>(VT)->getNumElements();
1660 // We don't produce 1 x N vectors; those are treated as scalars.
1661 WantSplatVector = VectorWidth > 1;
1662 }
1663
1664 if (cast<GEPOperator>(U).hasAllZeroIndices())
1665 return translateCopy(U, Op0, MIRBuilder);
1666
1667 // We might need to splat the base pointer into a vector if the offsets
1668 // are vectors.
1669 if (WantSplatVector && !PtrTy.isVector()) {
1670 BaseReg = MIRBuilder
1671 .buildSplatBuildVector(LLT::fixed_vector(VectorWidth, PtrTy),
1672 BaseReg)
1673 .getReg(0);
1674 PtrIRTy = FixedVectorType::get(PtrIRTy, VectorWidth);
1675 PtrTy = getLLTForType(*PtrIRTy, *DL);
1676 OffsetIRTy = DL->getIndexType(PtrIRTy);
1677 OffsetTy = getLLTForType(*OffsetIRTy, *DL);
1678 }
1679
1680 int64_t Offset = 0;
1681 for (gep_type_iterator GTI = gep_type_begin(&U), E = gep_type_end(&U);
1682 GTI != E; ++GTI) {
1683 const Value *Idx = GTI.getOperand();
1684 if (StructType *StTy = GTI.getStructTypeOrNull()) {
1685 unsigned Field = cast<Constant>(Idx)->getUniqueInteger().getZExtValue();
1686 Offset += DL->getStructLayout(StTy)->getElementOffset(Field);
1687 continue;
1688 } else {
1689 uint64_t ElementSize = GTI.getSequentialElementStride(*DL);
1690
1691 // If this is a scalar constant or a splat vector of constants,
1692 // handle it quickly.
1693 if (const auto *CI = dyn_cast<ConstantInt>(Idx)) {
1694 if (std::optional<int64_t> Val = CI->getValue().trySExtValue()) {
1695 Offset += ElementSize * *Val;
1696 continue;
1697 }
1698 }
1699
1700 if (Offset != 0) {
1701 auto OffsetMIB = MIRBuilder.buildConstant({OffsetTy}, Offset);
1702 BaseReg = MIRBuilder
1703 .buildPtrAdd(PtrTy, BaseReg, OffsetMIB.getReg(0),
1704 PtrAddFlagsWithConst(Offset))
1705 .getReg(0);
1706 Offset = 0;
1707 }
1708
1709 Register IdxReg = getOrCreateVReg(*Idx);
1710 LLT IdxTy = MRI->getType(IdxReg);
1711 if (IdxTy != OffsetTy) {
1712 if (!IdxTy.isVector() && WantSplatVector) {
1713 IdxReg = MIRBuilder
1715 IdxReg)
1716 .getReg(0);
1717 }
1718
1719 IdxReg = MIRBuilder.buildSExtOrTrunc(OffsetTy, IdxReg).getReg(0);
1720 }
1721
1722 // N = N + Idx * ElementSize;
1723 // Avoid doing it for ElementSize of 1.
1724 Register GepOffsetReg;
1725 if (ElementSize != 1) {
1726 auto ElementSizeMIB = MIRBuilder.buildConstant(
1727 getLLTForType(*OffsetIRTy, *DL), ElementSize);
1728
1729 // The multiplication is NUW if the GEP is NUW and NSW if the GEP is
1730 // NUSW.
1731 uint32_t ScaleFlags = PtrAddFlags & MachineInstr::MIFlag::NoUWrap;
1732 if (PtrAddFlags & MachineInstr::MIFlag::NoUSWrap)
1733 ScaleFlags |= MachineInstr::MIFlag::NoSWrap;
1734
1735 GepOffsetReg =
1736 MIRBuilder.buildMul(OffsetTy, IdxReg, ElementSizeMIB, ScaleFlags)
1737 .getReg(0);
1738 } else {
1739 GepOffsetReg = IdxReg;
1740 }
1741
1742 BaseReg =
1743 MIRBuilder.buildPtrAdd(PtrTy, BaseReg, GepOffsetReg, PtrAddFlags)
1744 .getReg(0);
1745 }
1746 }
1747
1748 if (Offset != 0) {
1749 auto OffsetMIB =
1750 MIRBuilder.buildConstant(OffsetTy, Offset);
1751
1752 MIRBuilder.buildPtrAdd(getOrCreateVReg(U), BaseReg, OffsetMIB.getReg(0),
1753 PtrAddFlagsWithConst(Offset));
1754 return true;
1755 }
1756
1757 MIRBuilder.buildCopy(getOrCreateVReg(U), BaseReg);
1758 return true;
1759}
1760
1761bool IRTranslator::translateMemFunc(const CallInst &CI,
1762 MachineIRBuilder &MIRBuilder,
1763 unsigned Opcode) {
1764 const Value *SrcPtr = CI.getArgOperand(1);
1765 // If the source is undef, then just emit a nop.
1766 if (isa<UndefValue>(SrcPtr))
1767 return true;
1768
1770
1771 unsigned MinPtrSize = UINT_MAX;
1772 for (auto AI = CI.arg_begin(), AE = CI.arg_end(); std::next(AI) != AE; ++AI) {
1773 Register SrcReg = getOrCreateVReg(**AI);
1774 LLT SrcTy = MRI->getType(SrcReg);
1775 if (SrcTy.isPointer())
1776 MinPtrSize = std::min<unsigned>(SrcTy.getSizeInBits(), MinPtrSize);
1777 SrcRegs.push_back(SrcReg);
1778 }
1779
1780 LLT SizeTy = LLT::integer(MinPtrSize);
1781
1782 // The size operand should be the minimum of the pointer sizes.
1783 Register &SizeOpReg = SrcRegs[SrcRegs.size() - 1];
1784 if (MRI->getType(SizeOpReg) != SizeTy)
1785 SizeOpReg = MIRBuilder.buildZExtOrTrunc(SizeTy, SizeOpReg).getReg(0);
1786
1787 auto ICall = MIRBuilder.buildInstr(Opcode);
1788 for (Register SrcReg : SrcRegs)
1789 ICall.addUse(SrcReg);
1790
1791 Align DstAlign;
1792 Align SrcAlign;
1793 unsigned IsVol =
1794 cast<ConstantInt>(CI.getArgOperand(CI.arg_size() - 1))->getZExtValue();
1795
1796 ConstantInt *CopySize = nullptr;
1797
1798 if (auto *MCI = dyn_cast<MemCpyInst>(&CI)) {
1799 DstAlign = MCI->getDestAlign().valueOrOne();
1800 SrcAlign = MCI->getSourceAlign().valueOrOne();
1801 CopySize = dyn_cast<ConstantInt>(MCI->getArgOperand(2));
1802 } else if (auto *MMI = dyn_cast<MemMoveInst>(&CI)) {
1803 DstAlign = MMI->getDestAlign().valueOrOne();
1804 SrcAlign = MMI->getSourceAlign().valueOrOne();
1805 CopySize = dyn_cast<ConstantInt>(MMI->getArgOperand(2));
1806 } else {
1807 auto *MSI = cast<MemSetInst>(&CI);
1808 DstAlign = MSI->getDestAlign().valueOrOne();
1809 }
1810
1811 if (Opcode != TargetOpcode::G_MEMCPY_INLINE) {
1812 // We need to propagate the tail call flag from the IR inst as an argument.
1813 // Otherwise, we have to pessimize and assume later that we cannot tail call
1814 // any memory intrinsics.
1815 ICall.addImm(CI.isTailCall() ? 1 : 0);
1816 }
1817
1818 // Create mem operands to store the alignment and volatile info.
1821 if (IsVol) {
1822 LoadFlags |= MachineMemOperand::MOVolatile;
1823 StoreFlags |= MachineMemOperand::MOVolatile;
1824 }
1825
1826 AAMDNodes AAInfo = CI.getAAMetadata();
1827 if (AA && CopySize &&
1828 AA->pointsToConstantMemory(MemoryLocation(
1829 SrcPtr, LocationSize::precise(CopySize->getZExtValue()), AAInfo))) {
1830 LoadFlags |= MachineMemOperand::MOInvariant;
1831
1832 // FIXME: pointsToConstantMemory probably does not imply dereferenceable,
1833 // but the previous usage implied it did. Probably should check
1834 // isDereferenceableAndAlignedPointer.
1836 }
1837
1838 ICall.addMemOperand(
1839 MF->getMachineMemOperand(MachinePointerInfo(CI.getArgOperand(0)),
1840 StoreFlags, 1, DstAlign, AAInfo));
1841 if (Opcode != TargetOpcode::G_MEMSET)
1842 ICall.addMemOperand(MF->getMachineMemOperand(
1843 MachinePointerInfo(SrcPtr), LoadFlags, 1, SrcAlign, AAInfo));
1844
1845 return true;
1846}
1847
1848bool IRTranslator::translateTrap(const CallInst &CI,
1849 MachineIRBuilder &MIRBuilder,
1850 unsigned Opcode) {
1851 StringRef TrapFuncName =
1852 CI.getAttributes().getFnAttr("trap-func-name").getValueAsString();
1853 if (TrapFuncName.empty()) {
1854 if (Opcode == TargetOpcode::G_UBSANTRAP) {
1855 uint64_t Code = cast<ConstantInt>(CI.getOperand(0))->getZExtValue();
1856 MIRBuilder.buildInstr(Opcode, {}, ArrayRef<llvm::SrcOp>{Code});
1857 } else {
1858 MIRBuilder.buildInstr(Opcode);
1859 }
1860 return true;
1861 }
1862
1863 CallLowering::CallLoweringInfo Info;
1864 if (Opcode == TargetOpcode::G_UBSANTRAP)
1865 Info.OrigArgs.push_back({getOrCreateVRegs(*CI.getArgOperand(0)),
1866 CI.getArgOperand(0)->getType(), 0});
1867
1868 Info.Callee = MachineOperand::CreateES(TrapFuncName.data());
1869 Info.CB = &CI;
1870 Info.OrigRet = {Register(), Type::getVoidTy(CI.getContext()), 0};
1871 return CLI->lowerCall(MIRBuilder, Info);
1872}
1873
1874bool IRTranslator::translateVectorInterleave2Intrinsic(
1875 const CallInst &CI, MachineIRBuilder &MIRBuilder) {
1876 assert(CI.getIntrinsicID() == Intrinsic::vector_interleave2 &&
1877 "This function can only be called on the interleave2 intrinsic!");
1878 // Canonicalize interleave2 to G_SHUFFLE_VECTOR (similar to SelectionDAG).
1879 Register Op0 = getOrCreateVReg(*CI.getOperand(0));
1880 Register Op1 = getOrCreateVReg(*CI.getOperand(1));
1881 Register Res = getOrCreateVReg(CI);
1882
1883 LLT OpTy = MRI->getType(Op0);
1884 MIRBuilder.buildShuffleVector(Res, Op0, Op1,
1886
1887 return true;
1888}
1889
1890bool IRTranslator::translateVectorDeinterleave2Intrinsic(
1891 const CallInst &CI, MachineIRBuilder &MIRBuilder) {
1892 assert(CI.getIntrinsicID() == Intrinsic::vector_deinterleave2 &&
1893 "This function can only be called on the deinterleave2 intrinsic!");
1894 // Canonicalize deinterleave2 to shuffles that extract sub-vectors (similar to
1895 // SelectionDAG).
1896 Register Op = getOrCreateVReg(*CI.getOperand(0));
1897 auto Undef = MIRBuilder.buildUndef(MRI->getType(Op));
1898 ArrayRef<Register> Res = getOrCreateVRegs(CI);
1899
1900 LLT ResTy = MRI->getType(Res[0]);
1901 MIRBuilder.buildShuffleVector(Res[0], Op, Undef,
1902 createStrideMask(0, 2, ResTy.getNumElements()));
1903 MIRBuilder.buildShuffleVector(Res[1], Op, Undef,
1904 createStrideMask(1, 2, ResTy.getNumElements()));
1905
1906 return true;
1907}
1908
1909void IRTranslator::getStackGuard(Register DstReg,
1910 MachineIRBuilder &MIRBuilder) {
1911 Value *Global =
1912 TLI->getSDagStackGuard(*MF->getFunction().getParent(), *Libcalls);
1913 if (!Global) {
1914 LLVMContext &Ctx = MIRBuilder.getContext();
1915 Ctx.diagnose(DiagnosticInfoGeneric("unable to lower stackguard"));
1916 MIRBuilder.buildUndef(DstReg);
1917 return;
1918 }
1919
1920 const TargetRegisterInfo *TRI = MF->getSubtarget().getRegisterInfo();
1921 MRI->setRegClass(DstReg, TRI->getPointerRegClass());
1922 auto MIB =
1923 MIRBuilder.buildInstr(TargetOpcode::LOAD_STACK_GUARD, {DstReg}, {});
1924
1925 unsigned AddrSpace = Global->getType()->getPointerAddressSpace();
1926 LLT PtrTy = LLT::pointer(AddrSpace, DL->getPointerSizeInBits(AddrSpace));
1927
1928 MachinePointerInfo MPInfo(Global);
1931 MachineMemOperand *MemRef = MF->getMachineMemOperand(
1932 MPInfo, Flags, PtrTy, DL->getPointerABIAlignment(AddrSpace));
1933 MIB.setMemRefs({MemRef});
1934}
1935
1936bool IRTranslator::translateOverflowIntrinsic(const CallInst &CI, unsigned Op,
1937 MachineIRBuilder &MIRBuilder) {
1938 ArrayRef<Register> ResRegs = getOrCreateVRegs(CI);
1939 MIRBuilder.buildInstr(
1940 Op, {ResRegs[0], ResRegs[1]},
1941 {getOrCreateVReg(*CI.getOperand(0)), getOrCreateVReg(*CI.getOperand(1))});
1942
1943 return true;
1944}
1945
1946bool IRTranslator::translateFixedPointIntrinsic(unsigned Op, const CallInst &CI,
1947 MachineIRBuilder &MIRBuilder) {
1948 Register Dst = getOrCreateVReg(CI);
1949 Register Src0 = getOrCreateVReg(*CI.getOperand(0));
1950 Register Src1 = getOrCreateVReg(*CI.getOperand(1));
1951 uint64_t Scale = cast<ConstantInt>(CI.getOperand(2))->getZExtValue();
1952 MIRBuilder.buildInstr(Op, {Dst}, { Src0, Src1, Scale });
1953 return true;
1954}
1955
1956unsigned IRTranslator::getSimpleIntrinsicOpcode(Intrinsic::ID ID) {
1957 switch (ID) {
1958 default:
1959 break;
1960 case Intrinsic::acos:
1961 return TargetOpcode::G_FACOS;
1962 case Intrinsic::asin:
1963 return TargetOpcode::G_FASIN;
1964 case Intrinsic::atan:
1965 return TargetOpcode::G_FATAN;
1966 case Intrinsic::atan2:
1967 return TargetOpcode::G_FATAN2;
1968 case Intrinsic::bswap:
1969 return TargetOpcode::G_BSWAP;
1970 case Intrinsic::bitreverse:
1971 return TargetOpcode::G_BITREVERSE;
1972 case Intrinsic::fshl:
1973 return TargetOpcode::G_FSHL;
1974 case Intrinsic::fshr:
1975 return TargetOpcode::G_FSHR;
1976 case Intrinsic::ceil:
1977 return TargetOpcode::G_FCEIL;
1978 case Intrinsic::cos:
1979 return TargetOpcode::G_FCOS;
1980 case Intrinsic::cosh:
1981 return TargetOpcode::G_FCOSH;
1982 case Intrinsic::ctpop:
1983 return TargetOpcode::G_CTPOP;
1984 case Intrinsic::exp:
1985 return TargetOpcode::G_FEXP;
1986 case Intrinsic::exp2:
1987 return TargetOpcode::G_FEXP2;
1988 case Intrinsic::exp10:
1989 return TargetOpcode::G_FEXP10;
1990 case Intrinsic::fabs:
1991 return TargetOpcode::G_FABS;
1992 case Intrinsic::copysign:
1993 return TargetOpcode::G_FCOPYSIGN;
1994 case Intrinsic::minnum:
1995 return TargetOpcode::G_FMINNUM;
1996 case Intrinsic::maxnum:
1997 return TargetOpcode::G_FMAXNUM;
1998 case Intrinsic::minimum:
1999 return TargetOpcode::G_FMINIMUM;
2000 case Intrinsic::maximum:
2001 return TargetOpcode::G_FMAXIMUM;
2002 case Intrinsic::minimumnum:
2003 return TargetOpcode::G_FMINIMUMNUM;
2004 case Intrinsic::maximumnum:
2005 return TargetOpcode::G_FMAXIMUMNUM;
2006 case Intrinsic::canonicalize:
2007 return TargetOpcode::G_FCANONICALIZE;
2008 case Intrinsic::floor:
2009 return TargetOpcode::G_FFLOOR;
2010 case Intrinsic::fma:
2011 return TargetOpcode::G_FMA;
2012 case Intrinsic::log:
2013 return TargetOpcode::G_FLOG;
2014 case Intrinsic::log2:
2015 return TargetOpcode::G_FLOG2;
2016 case Intrinsic::log10:
2017 return TargetOpcode::G_FLOG10;
2018 case Intrinsic::ldexp:
2019 return TargetOpcode::G_FLDEXP;
2020 case Intrinsic::nearbyint:
2021 return TargetOpcode::G_FNEARBYINT;
2022 case Intrinsic::pow:
2023 return TargetOpcode::G_FPOW;
2024 case Intrinsic::powi:
2025 return TargetOpcode::G_FPOWI;
2026 case Intrinsic::rint:
2027 return TargetOpcode::G_FRINT;
2028 case Intrinsic::round:
2029 return TargetOpcode::G_INTRINSIC_ROUND;
2030 case Intrinsic::roundeven:
2031 return TargetOpcode::G_INTRINSIC_ROUNDEVEN;
2032 case Intrinsic::sin:
2033 return TargetOpcode::G_FSIN;
2034 case Intrinsic::sinh:
2035 return TargetOpcode::G_FSINH;
2036 case Intrinsic::sqrt:
2037 return TargetOpcode::G_FSQRT;
2038 case Intrinsic::tan:
2039 return TargetOpcode::G_FTAN;
2040 case Intrinsic::tanh:
2041 return TargetOpcode::G_FTANH;
2042 case Intrinsic::trunc:
2043 return TargetOpcode::G_INTRINSIC_TRUNC;
2044 case Intrinsic::readcyclecounter:
2045 return TargetOpcode::G_READCYCLECOUNTER;
2046 case Intrinsic::readsteadycounter:
2047 return TargetOpcode::G_READSTEADYCOUNTER;
2048 case Intrinsic::ptrmask:
2049 return TargetOpcode::G_PTRMASK;
2050 case Intrinsic::lrint:
2051 return TargetOpcode::G_INTRINSIC_LRINT;
2052 case Intrinsic::llrint:
2053 return TargetOpcode::G_INTRINSIC_LLRINT;
2054 // FADD/FMUL require checking the FMF, so are handled elsewhere.
2055 case Intrinsic::vector_reduce_fmin:
2056 return TargetOpcode::G_VECREDUCE_FMIN;
2057 case Intrinsic::vector_reduce_fmax:
2058 return TargetOpcode::G_VECREDUCE_FMAX;
2059 case Intrinsic::vector_reduce_fminimum:
2060 return TargetOpcode::G_VECREDUCE_FMINIMUM;
2061 case Intrinsic::vector_reduce_fmaximum:
2062 return TargetOpcode::G_VECREDUCE_FMAXIMUM;
2063 case Intrinsic::vector_reduce_add:
2064 return TargetOpcode::G_VECREDUCE_ADD;
2065 case Intrinsic::vector_reduce_mul:
2066 return TargetOpcode::G_VECREDUCE_MUL;
2067 case Intrinsic::vector_reduce_and:
2068 return TargetOpcode::G_VECREDUCE_AND;
2069 case Intrinsic::vector_reduce_or:
2070 return TargetOpcode::G_VECREDUCE_OR;
2071 case Intrinsic::vector_reduce_xor:
2072 return TargetOpcode::G_VECREDUCE_XOR;
2073 case Intrinsic::vector_reduce_smax:
2074 return TargetOpcode::G_VECREDUCE_SMAX;
2075 case Intrinsic::vector_reduce_smin:
2076 return TargetOpcode::G_VECREDUCE_SMIN;
2077 case Intrinsic::vector_reduce_umax:
2078 return TargetOpcode::G_VECREDUCE_UMAX;
2079 case Intrinsic::vector_reduce_umin:
2080 return TargetOpcode::G_VECREDUCE_UMIN;
2081 case Intrinsic::experimental_vector_compress:
2082 return TargetOpcode::G_VECTOR_COMPRESS;
2083 case Intrinsic::lround:
2084 return TargetOpcode::G_LROUND;
2085 case Intrinsic::llround:
2086 return TargetOpcode::G_LLROUND;
2087 case Intrinsic::get_fpenv:
2088 return TargetOpcode::G_GET_FPENV;
2089 case Intrinsic::get_fpmode:
2090 return TargetOpcode::G_GET_FPMODE;
2091 }
2093}
2094
2095bool IRTranslator::translateSimpleIntrinsic(const CallInst &CI,
2097 MachineIRBuilder &MIRBuilder) {
2098
2099 unsigned Op = getSimpleIntrinsicOpcode(ID);
2100
2101 // Is this a simple intrinsic?
2103 return false;
2104
2105 // Yes. Let's translate it.
2107 for (const auto &Arg : CI.args())
2108 VRegs.push_back(getOrCreateVReg(*Arg));
2109
2110 MIRBuilder.buildInstr(Op, {getOrCreateVReg(CI)}, VRegs,
2112 return true;
2113}
2114
2115// TODO: Include ConstainedOps.def when all strict instructions are defined.
2117 switch (ID) {
2118 case Intrinsic::experimental_constrained_fadd:
2119 return TargetOpcode::G_STRICT_FADD;
2120 case Intrinsic::experimental_constrained_fsub:
2121 return TargetOpcode::G_STRICT_FSUB;
2122 case Intrinsic::experimental_constrained_fmul:
2123 return TargetOpcode::G_STRICT_FMUL;
2124 case Intrinsic::experimental_constrained_fdiv:
2125 return TargetOpcode::G_STRICT_FDIV;
2126 case Intrinsic::experimental_constrained_frem:
2127 return TargetOpcode::G_STRICT_FREM;
2128 case Intrinsic::experimental_constrained_fma:
2129 return TargetOpcode::G_STRICT_FMA;
2130 case Intrinsic::experimental_constrained_sqrt:
2131 return TargetOpcode::G_STRICT_FSQRT;
2132 case Intrinsic::experimental_constrained_ldexp:
2133 return TargetOpcode::G_STRICT_FLDEXP;
2134 case Intrinsic::experimental_constrained_fcmp:
2135 return TargetOpcode::G_STRICT_FCMP;
2136 case Intrinsic::experimental_constrained_fcmps:
2137 return TargetOpcode::G_STRICT_FCMPS;
2138 default:
2139 return 0;
2140 }
2141}
2142
2143bool IRTranslator::translateConstrainedFPIntrinsic(
2144 const ConstrainedFPIntrinsic &FPI, MachineIRBuilder &MIRBuilder) {
2146
2147 unsigned Opcode = getConstrainedOpcode(FPI.getIntrinsicID());
2148 if (!Opcode)
2149 return false;
2150
2154
2155 if (Opcode == TargetOpcode::G_STRICT_FCMP ||
2156 Opcode == TargetOpcode::G_STRICT_FCMPS) {
2157 auto *FPCmp = cast<ConstrainedFPCmpIntrinsic>(&FPI);
2158 Register Operand0 = getOrCreateVReg(*FPCmp->getArgOperand(0));
2159 Register Operand1 = getOrCreateVReg(*FPCmp->getArgOperand(1));
2160 Register Result = getOrCreateVReg(FPI);
2161 MIRBuilder.buildInstr(Opcode, {Result}, {}, Flags)
2162 .addPredicate(FPCmp->getPredicate())
2163 .addUse(Operand0)
2164 .addUse(Operand1);
2165 return true;
2166 }
2167
2169 for (unsigned I = 0, E = FPI.getNonMetadataArgCount(); I != E; ++I)
2170 VRegs.push_back(getOrCreateVReg(*FPI.getArgOperand(I)));
2171
2172 MIRBuilder.buildInstr(Opcode, {getOrCreateVReg(FPI)}, VRegs, Flags);
2173 return true;
2174}
2175
2176std::optional<MCRegister> IRTranslator::getArgPhysReg(Argument &Arg) {
2177 auto VRegs = getOrCreateVRegs(Arg);
2178 if (VRegs.size() != 1)
2179 return std::nullopt;
2180
2181 // Arguments are lowered as a copy of a livein physical register.
2182 auto *VRegDef = MF->getRegInfo().getVRegDef(VRegs[0]);
2183 if (!VRegDef || !VRegDef->isCopy())
2184 return std::nullopt;
2185 return VRegDef->getOperand(1).getReg().asMCReg();
2186}
2187
2188bool IRTranslator::translateIfEntryValueArgument(bool isDeclare, Value *Val,
2189 const DILocalVariable *Var,
2190 const DIExpression *Expr,
2191 const DebugLoc &DL,
2192 MachineIRBuilder &MIRBuilder) {
2193 auto *Arg = dyn_cast<Argument>(Val);
2194 if (!Arg)
2195 return false;
2196
2197 if (!Expr->isEntryValue())
2198 return false;
2199
2200 std::optional<MCRegister> PhysReg = getArgPhysReg(*Arg);
2201 if (!PhysReg) {
2202 LLVM_DEBUG(dbgs() << "Dropping dbg." << (isDeclare ? "declare" : "value")
2203 << ": expression is entry_value but "
2204 << "couldn't find a physical register\n");
2205 LLVM_DEBUG(dbgs() << *Var << "\n");
2206 return true;
2207 }
2208
2209 if (isDeclare) {
2210 // Append an op deref to account for the fact that this is a dbg_declare.
2211 Expr = DIExpression::append(Expr, dwarf::DW_OP_deref);
2212 MF->setVariableDbgInfo(Var, Expr, *PhysReg, DL);
2213 } else {
2214 MIRBuilder.buildDirectDbgValue(*PhysReg, Var, Expr);
2215 }
2216
2217 return true;
2218}
2219
2221 switch (ID) {
2222 default:
2223 llvm_unreachable("Unexpected intrinsic");
2224 case Intrinsic::experimental_convergence_anchor:
2225 return TargetOpcode::CONVERGENCECTRL_ANCHOR;
2226 case Intrinsic::experimental_convergence_entry:
2227 return TargetOpcode::CONVERGENCECTRL_ENTRY;
2228 case Intrinsic::experimental_convergence_loop:
2229 return TargetOpcode::CONVERGENCECTRL_LOOP;
2230 }
2231}
2232
2233bool IRTranslator::translateConvergenceControlIntrinsic(
2234 const CallInst &CI, Intrinsic::ID ID, MachineIRBuilder &MIRBuilder) {
2235 MachineInstrBuilder MIB = MIRBuilder.buildInstr(getConvOpcode(ID));
2236 Register OutputReg = getOrCreateConvergenceTokenVReg(CI);
2237 MIB.addDef(OutputReg);
2238
2239 if (ID == Intrinsic::experimental_convergence_loop) {
2241 assert(Bundle && "Expected a convergence control token.");
2242 Register InputReg =
2243 getOrCreateConvergenceTokenVReg(*Bundle->Inputs[0].get());
2244 MIB.addUse(InputReg);
2245 }
2246
2247 return true;
2248}
2249
2250bool IRTranslator::translateKnownIntrinsic(const CallInst &CI, Intrinsic::ID ID,
2251 MachineIRBuilder &MIRBuilder) {
2252 if (auto *MI = dyn_cast<AnyMemIntrinsic>(&CI)) {
2253 if (ORE->enabled()) {
2254 if (MemoryOpRemark::canHandle(MI, *LibInfo)) {
2255 MemoryOpRemark R(*ORE, "gisel-irtranslator-memsize", *DL, *LibInfo);
2256 R.visit(MI);
2257 }
2258 }
2259 }
2260
2261 // If this is a simple intrinsic (that is, we just need to add a def of
2262 // a vreg, and uses for each arg operand, then translate it.
2263 if (translateSimpleIntrinsic(CI, ID, MIRBuilder))
2264 return true;
2265
2266 switch (ID) {
2267 default:
2268 break;
2269 case Intrinsic::lifetime_start:
2270 case Intrinsic::lifetime_end: {
2271 // No stack colouring in O0, discard region information.
2272 if (MF->getTarget().getOptLevel() == CodeGenOptLevel::None ||
2273 MF->getFunction().hasOptNone())
2274 return true;
2275
2276 unsigned Op = ID == Intrinsic::lifetime_start ? TargetOpcode::LIFETIME_START
2277 : TargetOpcode::LIFETIME_END;
2278
2279 const AllocaInst *AI = dyn_cast<AllocaInst>(CI.getArgOperand(0));
2280 if (!AI || !AI->isStaticAlloca())
2281 return true;
2282
2283 MIRBuilder.buildInstr(Op).addFrameIndex(getOrCreateFrameIndex(*AI));
2284 return true;
2285 }
2286 case Intrinsic::fake_use: {
2288 for (const auto &Arg : CI.args())
2289 llvm::append_range(VRegs, getOrCreateVRegs(*Arg));
2290 MIRBuilder.buildInstr(TargetOpcode::FAKE_USE, {}, VRegs);
2291 MF->setHasFakeUses(true);
2292 return true;
2293 }
2294 case Intrinsic::dbg_declare: {
2295 const DbgDeclareInst &DI = cast<DbgDeclareInst>(CI);
2296 assert(DI.getVariable() && "Missing variable");
2297 translateDbgDeclareRecord(DI.getAddress(), DI.hasArgList(), DI.getVariable(),
2298 DI.getExpression(), DI.getDebugLoc(), MIRBuilder);
2299 return true;
2300 }
2301 case Intrinsic::dbg_label: {
2302 const DbgLabelInst &DI = cast<DbgLabelInst>(CI);
2303 assert(DI.getLabel() && "Missing label");
2304
2306 MIRBuilder.getDebugLoc()) &&
2307 "Expected inlined-at fields to agree");
2308
2309 MIRBuilder.buildDbgLabel(DI.getLabel());
2310 return true;
2311 }
2312 case Intrinsic::vaend:
2313 // No target I know of cares about va_end. Certainly no in-tree target
2314 // does. Simplest intrinsic ever!
2315 return true;
2316 case Intrinsic::vastart: {
2317 Value *Ptr = CI.getArgOperand(0);
2318 unsigned ListSize = TLI->getVaListSizeInBits(*DL) / 8;
2319 Align Alignment = getKnownAlignment(Ptr, *DL);
2320
2321 MIRBuilder.buildInstr(TargetOpcode::G_VASTART, {}, {getOrCreateVReg(*Ptr)})
2322 .addMemOperand(MF->getMachineMemOperand(MachinePointerInfo(Ptr),
2324 ListSize, Alignment));
2325 return true;
2326 }
2327 case Intrinsic::dbg_assign:
2328 // A dbg.assign is a dbg.value with more information about stack locations,
2329 // typically produced during optimisation of variables with leaked
2330 // addresses. We can treat it like a normal dbg_value intrinsic here; to
2331 // benefit from the full analysis of stack/SSA locations, GlobalISel would
2332 // need to register for and use the AssignmentTrackingAnalysis pass.
2333 [[fallthrough]];
2334 case Intrinsic::dbg_value: {
2335 // This form of DBG_VALUE is target-independent.
2336 const DbgValueInst &DI = cast<DbgValueInst>(CI);
2337 translateDbgValueRecord(DI.getValue(), DI.hasArgList(), DI.getVariable(),
2338 DI.getExpression(), DI.getDebugLoc(), MIRBuilder);
2339 return true;
2340 }
2341 case Intrinsic::uadd_with_overflow:
2342 return translateOverflowIntrinsic(CI, TargetOpcode::G_UADDO, MIRBuilder);
2343 case Intrinsic::sadd_with_overflow:
2344 return translateOverflowIntrinsic(CI, TargetOpcode::G_SADDO, MIRBuilder);
2345 case Intrinsic::usub_with_overflow:
2346 return translateOverflowIntrinsic(CI, TargetOpcode::G_USUBO, MIRBuilder);
2347 case Intrinsic::ssub_with_overflow:
2348 return translateOverflowIntrinsic(CI, TargetOpcode::G_SSUBO, MIRBuilder);
2349 case Intrinsic::umul_with_overflow:
2350 return translateOverflowIntrinsic(CI, TargetOpcode::G_UMULO, MIRBuilder);
2351 case Intrinsic::smul_with_overflow:
2352 return translateOverflowIntrinsic(CI, TargetOpcode::G_SMULO, MIRBuilder);
2353 case Intrinsic::uadd_sat:
2354 return translateBinaryOp(TargetOpcode::G_UADDSAT, CI, MIRBuilder);
2355 case Intrinsic::sadd_sat:
2356 return translateBinaryOp(TargetOpcode::G_SADDSAT, CI, MIRBuilder);
2357 case Intrinsic::usub_sat:
2358 return translateBinaryOp(TargetOpcode::G_USUBSAT, CI, MIRBuilder);
2359 case Intrinsic::ssub_sat:
2360 return translateBinaryOp(TargetOpcode::G_SSUBSAT, CI, MIRBuilder);
2361 case Intrinsic::ushl_sat:
2362 return translateBinaryOp(TargetOpcode::G_USHLSAT, CI, MIRBuilder);
2363 case Intrinsic::sshl_sat:
2364 return translateBinaryOp(TargetOpcode::G_SSHLSAT, CI, MIRBuilder);
2365 case Intrinsic::umin:
2366 return translateBinaryOp(TargetOpcode::G_UMIN, CI, MIRBuilder);
2367 case Intrinsic::umax:
2368 return translateBinaryOp(TargetOpcode::G_UMAX, CI, MIRBuilder);
2369 case Intrinsic::smin:
2370 return translateBinaryOp(TargetOpcode::G_SMIN, CI, MIRBuilder);
2371 case Intrinsic::smax:
2372 return translateBinaryOp(TargetOpcode::G_SMAX, CI, MIRBuilder);
2373 case Intrinsic::abs:
2374 // TODO: Preserve "int min is poison" arg in GMIR?
2375 return translateUnaryOp(TargetOpcode::G_ABS, CI, MIRBuilder);
2376 case Intrinsic::smul_fix:
2377 return translateFixedPointIntrinsic(TargetOpcode::G_SMULFIX, CI, MIRBuilder);
2378 case Intrinsic::umul_fix:
2379 return translateFixedPointIntrinsic(TargetOpcode::G_UMULFIX, CI, MIRBuilder);
2380 case Intrinsic::smul_fix_sat:
2381 return translateFixedPointIntrinsic(TargetOpcode::G_SMULFIXSAT, CI, MIRBuilder);
2382 case Intrinsic::umul_fix_sat:
2383 return translateFixedPointIntrinsic(TargetOpcode::G_UMULFIXSAT, CI, MIRBuilder);
2384 case Intrinsic::sdiv_fix:
2385 return translateFixedPointIntrinsic(TargetOpcode::G_SDIVFIX, CI, MIRBuilder);
2386 case Intrinsic::udiv_fix:
2387 return translateFixedPointIntrinsic(TargetOpcode::G_UDIVFIX, CI, MIRBuilder);
2388 case Intrinsic::sdiv_fix_sat:
2389 return translateFixedPointIntrinsic(TargetOpcode::G_SDIVFIXSAT, CI, MIRBuilder);
2390 case Intrinsic::udiv_fix_sat:
2391 return translateFixedPointIntrinsic(TargetOpcode::G_UDIVFIXSAT, CI, MIRBuilder);
2392 case Intrinsic::fmuladd: {
2393 const TargetMachine &TM = MF->getTarget();
2394 Register Dst = getOrCreateVReg(CI);
2395 Register Op0 = getOrCreateVReg(*CI.getArgOperand(0));
2396 Register Op1 = getOrCreateVReg(*CI.getArgOperand(1));
2397 Register Op2 = getOrCreateVReg(*CI.getArgOperand(2));
2399 TLI->isFMAFasterThanFMulAndFAdd(*MF,
2400 TLI->getValueType(*DL, CI.getType()))) {
2401 // TODO: Revisit this to see if we should move this part of the
2402 // lowering to the combiner.
2403 MIRBuilder.buildFMA(Dst, Op0, Op1, Op2,
2405 } else {
2406 LLT Ty = getLLTForType(*CI.getType(), *DL);
2407 auto FMul = MIRBuilder.buildFMul(
2408 Ty, Op0, Op1, MachineInstr::copyFlagsFromInstruction(CI));
2409 MIRBuilder.buildFAdd(Dst, FMul, Op2,
2411 }
2412 return true;
2413 }
2414 case Intrinsic::frexp: {
2415 ArrayRef<Register> VRegs = getOrCreateVRegs(CI);
2416 MIRBuilder.buildFFrexp(VRegs[0], VRegs[1],
2417 getOrCreateVReg(*CI.getArgOperand(0)),
2419 return true;
2420 }
2421 case Intrinsic::modf: {
2422 ArrayRef<Register> VRegs = getOrCreateVRegs(CI);
2423 MIRBuilder.buildModf(VRegs[0], VRegs[1],
2424 getOrCreateVReg(*CI.getArgOperand(0)),
2426 return true;
2427 }
2428 case Intrinsic::sincos: {
2429 ArrayRef<Register> VRegs = getOrCreateVRegs(CI);
2430 MIRBuilder.buildFSincos(VRegs[0], VRegs[1],
2431 getOrCreateVReg(*CI.getArgOperand(0)),
2433 return true;
2434 }
2435 case Intrinsic::fptosi_sat:
2436 MIRBuilder.buildFPTOSI_SAT(getOrCreateVReg(CI),
2437 getOrCreateVReg(*CI.getArgOperand(0)));
2438 return true;
2439 case Intrinsic::fptoui_sat:
2440 MIRBuilder.buildFPTOUI_SAT(getOrCreateVReg(CI),
2441 getOrCreateVReg(*CI.getArgOperand(0)));
2442 return true;
2443 case Intrinsic::memcpy_inline:
2444 return translateMemFunc(CI, MIRBuilder, TargetOpcode::G_MEMCPY_INLINE);
2445 case Intrinsic::memcpy:
2446 return translateMemFunc(CI, MIRBuilder, TargetOpcode::G_MEMCPY);
2447 case Intrinsic::memmove:
2448 return translateMemFunc(CI, MIRBuilder, TargetOpcode::G_MEMMOVE);
2449 case Intrinsic::memset:
2450 return translateMemFunc(CI, MIRBuilder, TargetOpcode::G_MEMSET);
2451 case Intrinsic::eh_typeid_for: {
2452 GlobalValue *GV = ExtractTypeInfo(CI.getArgOperand(0));
2453 Register Reg = getOrCreateVReg(CI);
2454 unsigned TypeID = MF->getTypeIDFor(GV);
2455 MIRBuilder.buildConstant(Reg, TypeID);
2456 return true;
2457 }
2458 case Intrinsic::objectsize:
2459 llvm_unreachable("llvm.objectsize.* should have been lowered already");
2460
2461 case Intrinsic::is_constant:
2462 llvm_unreachable("llvm.is.constant.* should have been lowered already");
2463
2464 case Intrinsic::stackguard:
2465 getStackGuard(getOrCreateVReg(CI), MIRBuilder);
2466 return true;
2467 case Intrinsic::stackprotector: {
2468 LLT PtrTy = getLLTForType(*CI.getArgOperand(0)->getType(), *DL);
2469 Register GuardVal;
2470 if (TLI->useLoadStackGuardNode(*CI.getModule())) {
2471 GuardVal = MRI->createGenericVirtualRegister(PtrTy);
2472 getStackGuard(GuardVal, MIRBuilder);
2473 } else
2474 GuardVal = getOrCreateVReg(*CI.getArgOperand(0)); // The guard's value.
2475
2476 AllocaInst *Slot = cast<AllocaInst>(CI.getArgOperand(1));
2477 int FI = getOrCreateFrameIndex(*Slot);
2478 MF->getFrameInfo().setStackProtectorIndex(FI);
2479
2480 MIRBuilder.buildStore(
2481 GuardVal, getOrCreateVReg(*Slot),
2482 *MF->getMachineMemOperand(MachinePointerInfo::getFixedStack(*MF, FI),
2485 PtrTy, Align(8)));
2486 return true;
2487 }
2488 case Intrinsic::stacksave: {
2489 MIRBuilder.buildInstr(TargetOpcode::G_STACKSAVE, {getOrCreateVReg(CI)}, {});
2490 return true;
2491 }
2492 case Intrinsic::stackrestore: {
2493 MIRBuilder.buildInstr(TargetOpcode::G_STACKRESTORE, {},
2494 {getOrCreateVReg(*CI.getArgOperand(0))});
2495 return true;
2496 }
2497 case Intrinsic::cttz:
2498 case Intrinsic::ctlz: {
2499 ConstantInt *Cst = cast<ConstantInt>(CI.getArgOperand(1));
2500 bool isTrailing = ID == Intrinsic::cttz;
2501 unsigned Opcode = isTrailing ? Cst->isZero()
2502 ? TargetOpcode::G_CTTZ
2503 : TargetOpcode::G_CTTZ_ZERO_POISON
2504 : Cst->isZero() ? TargetOpcode::G_CTLZ
2505 : TargetOpcode::G_CTLZ_ZERO_POISON;
2506 MIRBuilder.buildInstr(Opcode, {getOrCreateVReg(CI)},
2507 {getOrCreateVReg(*CI.getArgOperand(0))});
2508 return true;
2509 }
2510 case Intrinsic::invariant_start: {
2511 MIRBuilder.buildUndef(getOrCreateVReg(CI));
2512 return true;
2513 }
2514 case Intrinsic::invariant_end:
2515 return true;
2516 case Intrinsic::expect:
2517 case Intrinsic::expect_with_probability:
2518 case Intrinsic::annotation:
2519 case Intrinsic::ptr_annotation:
2520 case Intrinsic::launder_invariant_group:
2521 case Intrinsic::strip_invariant_group: {
2522 // Drop the intrinsic, but forward the value.
2523 MIRBuilder.buildCopy(getOrCreateVReg(CI),
2524 getOrCreateVReg(*CI.getArgOperand(0)));
2525 return true;
2526 }
2527 case Intrinsic::assume:
2528 case Intrinsic::experimental_noalias_scope_decl:
2529 case Intrinsic::var_annotation:
2530 case Intrinsic::sideeffect:
2531 // Discard annotate attributes, assumptions, and artificial side-effects.
2532 return true;
2533 case Intrinsic::read_volatile_register:
2534 case Intrinsic::read_register: {
2535 Value *Arg = CI.getArgOperand(0);
2536 MIRBuilder
2537 .buildInstr(TargetOpcode::G_READ_REGISTER, {getOrCreateVReg(CI)}, {})
2538 .addMetadata(cast<MDNode>(cast<MetadataAsValue>(Arg)->getMetadata()));
2539 return true;
2540 }
2541 case Intrinsic::write_register: {
2542 Value *Arg = CI.getArgOperand(0);
2543 MIRBuilder.buildInstr(TargetOpcode::G_WRITE_REGISTER)
2544 .addMetadata(cast<MDNode>(cast<MetadataAsValue>(Arg)->getMetadata()))
2545 .addUse(getOrCreateVReg(*CI.getArgOperand(1)));
2546 return true;
2547 }
2548 case Intrinsic::localescape: {
2549 MachineBasicBlock &EntryMBB = MF->front();
2550 StringRef EscapedName = GlobalValue::dropLLVMManglingEscape(MF->getName());
2551
2552 // Directly emit some LOCAL_ESCAPE machine instrs. Label assignment emission
2553 // is the same on all targets.
2554 for (unsigned Idx = 0, E = CI.arg_size(); Idx < E; ++Idx) {
2555 Value *Arg = CI.getArgOperand(Idx)->stripPointerCasts();
2556 if (isa<ConstantPointerNull>(Arg))
2557 continue; // Skip null pointers. They represent a hole in index space.
2558
2559 int FI = getOrCreateFrameIndex(*cast<AllocaInst>(Arg));
2560 MCSymbol *FrameAllocSym =
2561 MF->getContext().getOrCreateFrameAllocSymbol(EscapedName, Idx);
2562
2563 // This should be inserted at the start of the entry block.
2564 auto LocalEscape =
2565 MIRBuilder.buildInstrNoInsert(TargetOpcode::LOCAL_ESCAPE)
2566 .addSym(FrameAllocSym)
2567 .addFrameIndex(FI);
2568
2569 EntryMBB.insert(EntryMBB.begin(), LocalEscape);
2570 }
2571
2572 return true;
2573 }
2574 case Intrinsic::vector_reduce_fadd:
2575 case Intrinsic::vector_reduce_fmul: {
2576 // Need to check for the reassoc flag to decide whether we want a
2577 // sequential reduction opcode or not.
2578 Register Dst = getOrCreateVReg(CI);
2579 Register ScalarSrc = getOrCreateVReg(*CI.getArgOperand(0));
2580 Register VecSrc = getOrCreateVReg(*CI.getArgOperand(1));
2581 unsigned Opc = 0;
2582 if (!CI.hasAllowReassoc()) {
2583 // The sequential ordering case.
2584 Opc = ID == Intrinsic::vector_reduce_fadd
2585 ? TargetOpcode::G_VECREDUCE_SEQ_FADD
2586 : TargetOpcode::G_VECREDUCE_SEQ_FMUL;
2587 if (!MRI->getType(VecSrc).isVector())
2588 Opc = ID == Intrinsic::vector_reduce_fadd ? TargetOpcode::G_FADD
2589 : TargetOpcode::G_FMUL;
2590 MIRBuilder.buildInstr(Opc, {Dst}, {ScalarSrc, VecSrc},
2592 return true;
2593 }
2594 // We split the operation into a separate G_FADD/G_FMUL + the reduce,
2595 // since the associativity doesn't matter.
2596 unsigned ScalarOpc;
2597 if (ID == Intrinsic::vector_reduce_fadd) {
2598 Opc = TargetOpcode::G_VECREDUCE_FADD;
2599 ScalarOpc = TargetOpcode::G_FADD;
2600 } else {
2601 Opc = TargetOpcode::G_VECREDUCE_FMUL;
2602 ScalarOpc = TargetOpcode::G_FMUL;
2603 }
2604 LLT DstTy = MRI->getType(Dst);
2605 auto Rdx = MIRBuilder.buildInstr(
2606 Opc, {DstTy}, {VecSrc}, MachineInstr::copyFlagsFromInstruction(CI));
2607 MIRBuilder.buildInstr(ScalarOpc, {Dst}, {ScalarSrc, Rdx},
2609
2610 return true;
2611 }
2612 case Intrinsic::trap:
2613 return translateTrap(CI, MIRBuilder, TargetOpcode::G_TRAP);
2614 case Intrinsic::debugtrap:
2615 return translateTrap(CI, MIRBuilder, TargetOpcode::G_DEBUGTRAP);
2616 case Intrinsic::ubsantrap:
2617 return translateTrap(CI, MIRBuilder, TargetOpcode::G_UBSANTRAP);
2618 case Intrinsic::allow_runtime_check:
2619 case Intrinsic::allow_ubsan_check:
2620 MIRBuilder.buildCopy(getOrCreateVReg(CI),
2621 getOrCreateVReg(*ConstantInt::getTrue(CI.getType())));
2622 return true;
2623 case Intrinsic::amdgcn_cs_chain:
2624 case Intrinsic::amdgcn_call_whole_wave:
2625 return translateCallBase(CI, MIRBuilder);
2626 case Intrinsic::fptrunc_round: {
2628
2629 // Convert the metadata argument to a constant integer
2630 Metadata *MD = cast<MetadataAsValue>(CI.getArgOperand(1))->getMetadata();
2631 std::optional<RoundingMode> RoundMode =
2632 convertStrToRoundingMode(cast<MDString>(MD)->getString());
2633
2634 // Add the Rounding mode as an integer
2635 MIRBuilder
2636 .buildInstr(TargetOpcode::G_INTRINSIC_FPTRUNC_ROUND,
2637 {getOrCreateVReg(CI)},
2638 {getOrCreateVReg(*CI.getArgOperand(0))}, Flags)
2639 .addImm((int)*RoundMode);
2640
2641 return true;
2642 }
2643 case Intrinsic::is_fpclass: {
2644 Value *FpValue = CI.getOperand(0);
2645 ConstantInt *TestMaskValue = cast<ConstantInt>(CI.getOperand(1));
2646
2647 MIRBuilder
2648 .buildInstr(TargetOpcode::G_IS_FPCLASS, {getOrCreateVReg(CI)},
2649 {getOrCreateVReg(*FpValue)})
2650 .addImm(TestMaskValue->getZExtValue());
2651
2652 return true;
2653 }
2654 case Intrinsic::set_fpenv: {
2655 Value *FPEnv = CI.getOperand(0);
2656 MIRBuilder.buildSetFPEnv(getOrCreateVReg(*FPEnv));
2657 return true;
2658 }
2659 case Intrinsic::reset_fpenv:
2660 MIRBuilder.buildResetFPEnv();
2661 return true;
2662 case Intrinsic::set_fpmode: {
2663 Value *FPState = CI.getOperand(0);
2664 MIRBuilder.buildSetFPMode(getOrCreateVReg(*FPState));
2665 return true;
2666 }
2667 case Intrinsic::reset_fpmode:
2668 MIRBuilder.buildResetFPMode();
2669 return true;
2670 case Intrinsic::get_rounding:
2671 MIRBuilder.buildGetRounding(getOrCreateVReg(CI));
2672 return true;
2673 case Intrinsic::set_rounding:
2674 MIRBuilder.buildSetRounding(getOrCreateVReg(*CI.getOperand(0)));
2675 return true;
2676 case Intrinsic::vscale: {
2677 MIRBuilder.buildVScale(getOrCreateVReg(CI), 1);
2678 return true;
2679 }
2680 case Intrinsic::scmp:
2681 MIRBuilder.buildSCmp(getOrCreateVReg(CI),
2682 getOrCreateVReg(*CI.getOperand(0)),
2683 getOrCreateVReg(*CI.getOperand(1)));
2684 return true;
2685 case Intrinsic::ucmp:
2686 MIRBuilder.buildUCmp(getOrCreateVReg(CI),
2687 getOrCreateVReg(*CI.getOperand(0)),
2688 getOrCreateVReg(*CI.getOperand(1)));
2689 return true;
2690 case Intrinsic::vector_extract:
2691 return translateExtractVector(CI, MIRBuilder);
2692 case Intrinsic::vector_insert:
2693 return translateInsertVector(CI, MIRBuilder);
2694 case Intrinsic::stepvector: {
2695 MIRBuilder.buildStepVector(getOrCreateVReg(CI), 1);
2696 return true;
2697 }
2698 case Intrinsic::prefetch: {
2699 Value *Addr = CI.getOperand(0);
2700 unsigned RW = cast<ConstantInt>(CI.getOperand(1))->getZExtValue();
2701 unsigned Locality = cast<ConstantInt>(CI.getOperand(2))->getZExtValue();
2702 unsigned CacheType = cast<ConstantInt>(CI.getOperand(3))->getZExtValue();
2703
2705 auto &MMO = *MF->getMachineMemOperand(MachinePointerInfo(Addr), Flags,
2706 LLT(), Align());
2707
2708 MIRBuilder.buildPrefetch(getOrCreateVReg(*Addr), RW, Locality, CacheType,
2709 MMO);
2710
2711 return true;
2712 }
2713
2714 case Intrinsic::vector_interleave2:
2715 case Intrinsic::vector_deinterleave2: {
2716 // Both intrinsics have at least one operand.
2717 Value *Op0 = CI.getOperand(0);
2718 LLT ResTy = getLLTForType(*Op0->getType(), MIRBuilder.getDataLayout());
2719 if (!ResTy.isFixedVector())
2720 return false;
2721
2722 if (CI.getIntrinsicID() == Intrinsic::vector_interleave2)
2723 return translateVectorInterleave2Intrinsic(CI, MIRBuilder);
2724
2725 return translateVectorDeinterleave2Intrinsic(CI, MIRBuilder);
2726 }
2727
2728#define INSTRUCTION(NAME, NARG, ROUND_MODE, INTRINSIC) \
2729 case Intrinsic::INTRINSIC:
2730#include "llvm/IR/ConstrainedOps.def"
2731 return translateConstrainedFPIntrinsic(cast<ConstrainedFPIntrinsic>(CI),
2732 MIRBuilder);
2733 case Intrinsic::experimental_convergence_anchor:
2734 case Intrinsic::experimental_convergence_entry:
2735 case Intrinsic::experimental_convergence_loop:
2736 return translateConvergenceControlIntrinsic(CI, ID, MIRBuilder);
2737 case Intrinsic::reloc_none: {
2738 Metadata *MD = cast<MetadataAsValue>(CI.getArgOperand(0))->getMetadata();
2739 StringRef SymbolName = cast<MDString>(MD)->getString();
2740 MIRBuilder.buildInstr(TargetOpcode::RELOC_NONE)
2742 return true;
2743 }
2744 }
2745 return false;
2746}
2747
2748bool IRTranslator::translateInlineAsm(const CallBase &CB,
2749 MachineIRBuilder &MIRBuilder) {
2750 if (!mayTranslateUserTypes(CB))
2751 return false;
2752
2753 const InlineAsmLowering *ALI = MF->getSubtarget().getInlineAsmLowering();
2754
2755 if (!ALI) {
2756 LLVM_DEBUG(
2757 dbgs() << "Inline asm lowering is not supported for this target yet\n");
2758 return false;
2759 }
2760
2761 return ALI->lowerInlineAsm(
2762 MIRBuilder, CB, [&](const Value &Val) { return getOrCreateVRegs(Val); });
2763}
2764
2765bool IRTranslator::translateCallBase(const CallBase &CB,
2766 MachineIRBuilder &MIRBuilder) {
2767 ArrayRef<Register> Res = getOrCreateVRegs(CB);
2768
2770 Register SwiftInVReg = 0;
2771 Register SwiftErrorVReg = 0;
2772 for (const auto &Arg : CB.args()) {
2773 if (CLI->supportSwiftError() && isSwiftError(Arg)) {
2774 assert(SwiftInVReg == 0 && "Expected only one swift error argument");
2775 LLT Ty = getLLTForType(*Arg->getType(), *DL);
2776 SwiftInVReg = MRI->createGenericVirtualRegister(Ty);
2777 MIRBuilder.buildCopy(SwiftInVReg, SwiftError.getOrCreateVRegUseAt(
2778 &CB, &MIRBuilder.getMBB(), Arg));
2779 Args.emplace_back(ArrayRef(SwiftInVReg));
2780 SwiftErrorVReg =
2781 SwiftError.getOrCreateVRegDefAt(&CB, &MIRBuilder.getMBB(), Arg);
2782 continue;
2783 }
2784 Args.push_back(getOrCreateVRegs(*Arg));
2785 }
2786
2787 if (auto *CI = dyn_cast<CallInst>(&CB)) {
2788 if (ORE->enabled()) {
2789 if (MemoryOpRemark::canHandle(CI, *LibInfo)) {
2790 MemoryOpRemark R(*ORE, "gisel-irtranslator-memsize", *DL, *LibInfo);
2791 R.visit(CI);
2792 }
2793 }
2794 }
2795
2796 std::optional<CallLowering::PtrAuthInfo> PAI;
2797 if (auto Bundle = CB.getOperandBundle(LLVMContext::OB_ptrauth)) {
2798 // Functions should never be ptrauth-called directly.
2799 assert(!CB.getCalledFunction() && "invalid direct ptrauth call");
2800
2801 const Value *Key = Bundle->Inputs[0];
2802 const Value *Discriminator = Bundle->Inputs[1];
2803
2804 // Look through ptrauth constants to try to eliminate the matching bundle
2805 // and turn this into a direct call with no ptrauth.
2806 // CallLowering will use the raw pointer if it doesn't find the PAI.
2807 const auto *CalleeCPA = dyn_cast<ConstantPtrAuth>(CB.getCalledOperand());
2808 if (!CalleeCPA || !isa<Function>(CalleeCPA->getPointer()) ||
2809 !CalleeCPA->isKnownCompatibleWith(Key, Discriminator, *DL)) {
2810 // If we can't make it direct, package the bundle into PAI.
2811 Register DiscReg = getOrCreateVReg(*Discriminator);
2812 PAI = CallLowering::PtrAuthInfo{cast<ConstantInt>(Key)->getZExtValue(),
2813 DiscReg};
2814 }
2815 }
2816
2817 Register ConvergenceCtrlToken = 0;
2818 if (auto Bundle = CB.getOperandBundle(LLVMContext::OB_convergencectrl)) {
2819 const auto &Token = *Bundle->Inputs[0].get();
2820 ConvergenceCtrlToken = getOrCreateConvergenceTokenVReg(Token);
2821 }
2822
2823 // We don't set HasCalls on MFI here yet because call lowering may decide to
2824 // optimize into tail calls. Instead, we defer that to selection where a final
2825 // scan is done to check if any instructions are calls.
2826 bool Success = CLI->lowerCall(
2827 MIRBuilder, CB, Res, Args, SwiftErrorVReg, PAI, ConvergenceCtrlToken,
2828 [&]() { return getOrCreateVReg(*CB.getCalledOperand()); });
2829
2830 // Check if we just inserted a tail call.
2831 if (Success) {
2832 assert(!HasTailCall && "Can't tail call return twice from block?");
2833 const TargetInstrInfo *TII = MF->getSubtarget().getInstrInfo();
2834 HasTailCall = TII->isTailCall(*std::prev(MIRBuilder.getInsertPt()));
2835 }
2836
2837 return Success;
2838}
2839
2840bool IRTranslator::translateCall(const User &U, MachineIRBuilder &MIRBuilder) {
2841 if (!mayTranslateUserTypes(U))
2842 return false;
2843
2844 const CallInst &CI = cast<CallInst>(U);
2845 const Function *F = CI.getCalledFunction();
2846
2847 // FIXME: support Windows dllimport function calls and calls through
2848 // weak symbols.
2849 if (F && (F->hasDLLImportStorageClass() ||
2850 (MF->getTarget().getTargetTriple().isOSWindows() &&
2851 F->hasExternalWeakLinkage())))
2852 return false;
2853
2854 // FIXME: support control flow guard targets.
2856 return false;
2857
2858 // FIXME: support statepoints and related.
2860 return false;
2861
2862 if (CI.isInlineAsm())
2863 return translateInlineAsm(CI, MIRBuilder);
2864
2865 Intrinsic::ID ID = F ? F->getIntrinsicID() : Intrinsic::not_intrinsic;
2866 if (!F || ID == Intrinsic::not_intrinsic) {
2867 if (translateCallBase(CI, MIRBuilder)) {
2868 diagnoseDontCall(CI);
2869 return true;
2870 }
2871 return false;
2872 }
2873
2874 assert(ID != Intrinsic::not_intrinsic && "unknown intrinsic");
2875
2876 if (translateKnownIntrinsic(CI, ID, MIRBuilder))
2877 return true;
2878
2880 TLI->getTgtMemIntrinsic(Infos, CI, *MF, ID);
2881
2882 return translateIntrinsic(CI, ID, MIRBuilder, Infos);
2883}
2884
2885/// Translate a call or callbr to an intrinsic.
2886bool IRTranslator::translateIntrinsic(
2887 const CallBase &CB, Intrinsic::ID ID, MachineIRBuilder &MIRBuilder,
2888 ArrayRef<TargetLowering::IntrinsicInfo> TgtMemIntrinsicInfos) {
2889 ArrayRef<Register> ResultRegs;
2890 if (!CB.getType()->isVoidTy())
2891 ResultRegs = getOrCreateVRegs(CB);
2892
2893 // Ignore the callsite attributes. Backend code is most likely not expecting
2894 // an intrinsic to sometimes have side effects and sometimes not.
2895 MachineInstrBuilder MIB = MIRBuilder.buildIntrinsic(ID, ResultRegs);
2896 if (isa<FPMathOperator>(CB))
2897 MIB->copyIRFlags(CB);
2898
2899 for (const auto &Arg : enumerate(CB.args())) {
2900 // If this is required to be an immediate, don't materialize it in a
2901 // register.
2902 if (CB.paramHasAttr(Arg.index(), Attribute::ImmArg)) {
2903 if (ConstantInt *CI = dyn_cast<ConstantInt>(Arg.value())) {
2904 // imm arguments are more convenient than cimm (and realistically
2905 // probably sufficient), so use them.
2906 assert(CI->getBitWidth() <= 64 &&
2907 "large intrinsic immediates not handled");
2908 MIB.addImm(CI->getSExtValue());
2909 } else {
2910 MIB.addFPImm(cast<ConstantFP>(Arg.value()));
2911 }
2912 } else if (auto *MDVal = dyn_cast<MetadataAsValue>(Arg.value())) {
2913 auto *MD = MDVal->getMetadata();
2914 auto *MDN = dyn_cast<MDNode>(MD);
2915 if (!MDN) {
2916 if (auto *ConstMD = dyn_cast<ConstantAsMetadata>(MD))
2917 MDN = MDNode::get(MF->getFunction().getContext(), ConstMD);
2918 else // This was probably an MDString.
2919 return false;
2920 }
2921 MIB.addMetadata(MDN);
2922 } else {
2923 ArrayRef<Register> VRegs = getOrCreateVRegs(*Arg.value());
2924 if (VRegs.size() > 1)
2925 return false;
2926 MIB.addUse(VRegs[0]);
2927 }
2928 }
2929
2930 // Add MachineMemOperands for each memory access described by the target.
2931 for (const auto &Info : TgtMemIntrinsicInfos) {
2932 Align Alignment = Info.align.value_or(
2933 DL->getABITypeAlign(Info.memVT.getTypeForEVT(CB.getContext())));
2934 LLT MemTy = Info.memVT.isSimple()
2935 ? getLLTForMVT(Info.memVT.getSimpleVT())
2936 : LLT::scalar(Info.memVT.getStoreSizeInBits());
2937
2938 // TODO: We currently just fallback to address space 0 if
2939 // getTgtMemIntrinsic didn't yield anything useful.
2940 MachinePointerInfo MPI;
2941 if (Info.ptrVal) {
2942 MPI = MachinePointerInfo(Info.ptrVal, Info.offset);
2943 } else if (Info.fallbackAddressSpace) {
2944 MPI = MachinePointerInfo(*Info.fallbackAddressSpace);
2945 }
2946 MIB.addMemOperand(MF->getMachineMemOperand(
2947 MPI, Info.flags, MemTy, Alignment, CB.getAAMetadata(),
2948 /*Ranges=*/nullptr, Info.ssid, Info.order, Info.failureOrder));
2949 }
2950
2951 if (CB.isConvergent()) {
2952 if (auto Bundle = CB.getOperandBundle(LLVMContext::OB_convergencectrl)) {
2953 auto *Token = Bundle->Inputs[0].get();
2954 Register TokenReg = getOrCreateVReg(*Token);
2955 MIB.addUse(TokenReg, RegState::Implicit);
2956 }
2957 }
2958
2960 MIB->setDeactivationSymbol(*MF, Bundle->Inputs[0].get());
2961
2962 return true;
2963}
2964
2965bool IRTranslator::findUnwindDestinations(
2966 const BasicBlock *EHPadBB,
2967 BranchProbability Prob,
2968 SmallVectorImpl<std::pair<MachineBasicBlock *, BranchProbability>>
2969 &UnwindDests) {
2971 EHPadBB->getParent()->getFunction().getPersonalityFn());
2972 bool IsMSVCCXX = Personality == EHPersonality::MSVC_CXX;
2973 bool IsCoreCLR = Personality == EHPersonality::CoreCLR;
2974 bool IsWasmCXX = Personality == EHPersonality::Wasm_CXX;
2975 bool IsSEH = isAsynchronousEHPersonality(Personality);
2976
2977 if (IsWasmCXX) {
2978 // Ignore this for now.
2979 return false;
2980 }
2981
2982 while (EHPadBB) {
2984 BasicBlock *NewEHPadBB = nullptr;
2985 if (isa<LandingPadInst>(Pad)) {
2986 // Stop on landingpads. They are not funclets.
2987 UnwindDests.emplace_back(&getMBB(*EHPadBB), Prob);
2988 break;
2989 }
2990 if (isa<CleanupPadInst>(Pad)) {
2991 // Stop on cleanup pads. Cleanups are always funclet entries for all known
2992 // personalities.
2993 UnwindDests.emplace_back(&getMBB(*EHPadBB), Prob);
2994 UnwindDests.back().first->setIsEHScopeEntry();
2995 UnwindDests.back().first->setIsEHFuncletEntry();
2996 break;
2997 }
2998 if (auto *CatchSwitch = dyn_cast<CatchSwitchInst>(Pad)) {
2999 // Add the catchpad handlers to the possible destinations.
3000 for (const BasicBlock *CatchPadBB : CatchSwitch->handlers()) {
3001 UnwindDests.emplace_back(&getMBB(*CatchPadBB), Prob);
3002 // For MSVC++ and the CLR, catchblocks are funclets and need prologues.
3003 if (IsMSVCCXX || IsCoreCLR)
3004 UnwindDests.back().first->setIsEHFuncletEntry();
3005 if (!IsSEH)
3006 UnwindDests.back().first->setIsEHScopeEntry();
3007 }
3008 NewEHPadBB = CatchSwitch->getUnwindDest();
3009 } else {
3010 continue;
3011 }
3012
3013 BranchProbabilityInfo *BPI = FuncInfo.BPI;
3014 if (BPI && NewEHPadBB)
3015 Prob *= BPI->getEdgeProbability(EHPadBB, NewEHPadBB);
3016 EHPadBB = NewEHPadBB;
3017 }
3018 return true;
3019}
3020
3021bool IRTranslator::translateInvoke(const User &U,
3022 MachineIRBuilder &MIRBuilder) {
3023 const InvokeInst &I = cast<InvokeInst>(U);
3024 MCContext &Context = MF->getContext();
3025
3026 const BasicBlock *ReturnBB = I.getSuccessor(0);
3027 const BasicBlock *EHPadBB = I.getSuccessor(1);
3028
3029 const Function *Fn = I.getCalledFunction();
3030
3031 // FIXME: support invoking patchpoint and statepoint intrinsics.
3032 if (Fn && Fn->isIntrinsic())
3033 return false;
3034
3035 // FIXME: support whatever these are.
3036 if (I.hasDeoptState())
3037 return false;
3038
3039 // FIXME: support control flow guard targets.
3040 if (I.countOperandBundlesOfType(LLVMContext::OB_cfguardtarget))
3041 return false;
3042
3043 // FIXME: support Windows exception handling.
3044 if (!isa<LandingPadInst>(EHPadBB->getFirstNonPHIIt()))
3045 return false;
3046
3047 // FIXME: support Windows dllimport function calls and calls through
3048 // weak symbols.
3049 if (Fn && (Fn->hasDLLImportStorageClass() ||
3050 (MF->getTarget().getTargetTriple().isOSWindows() &&
3051 Fn->hasExternalWeakLinkage())))
3052 return false;
3053
3054 bool LowerInlineAsm = I.isInlineAsm();
3055 bool NeedEHLabel = true;
3056
3057 // Emit the actual call, bracketed by EH_LABELs so that the MF knows about
3058 // the region covered by the try.
3059 MCSymbol *BeginSymbol = nullptr;
3060 if (NeedEHLabel) {
3061 MIRBuilder.buildInstr(TargetOpcode::G_INVOKE_REGION_START);
3062 BeginSymbol = Context.createTempSymbol();
3063 MIRBuilder.buildInstr(TargetOpcode::EH_LABEL).addSym(BeginSymbol);
3064 }
3065
3066 if (LowerInlineAsm) {
3067 if (!translateInlineAsm(I, MIRBuilder))
3068 return false;
3069 } else if (!translateCallBase(I, MIRBuilder))
3070 return false;
3071
3072 MCSymbol *EndSymbol = nullptr;
3073 if (NeedEHLabel) {
3074 EndSymbol = Context.createTempSymbol();
3075 MIRBuilder.buildInstr(TargetOpcode::EH_LABEL).addSym(EndSymbol);
3076 }
3077
3079 BranchProbabilityInfo *BPI = FuncInfo.BPI;
3080 MachineBasicBlock *InvokeMBB = &MIRBuilder.getMBB();
3081 BranchProbability EHPadBBProb =
3082 BPI ? BPI->getEdgeProbability(InvokeMBB->getBasicBlock(), EHPadBB)
3084
3085 if (!findUnwindDestinations(EHPadBB, EHPadBBProb, UnwindDests))
3086 return false;
3087
3088 MachineBasicBlock &EHPadMBB = getMBB(*EHPadBB),
3089 &ReturnMBB = getMBB(*ReturnBB);
3090 // Update successor info.
3091 addSuccessorWithProb(InvokeMBB, &ReturnMBB);
3092 for (auto &UnwindDest : UnwindDests) {
3093 UnwindDest.first->setIsEHPad();
3094 addSuccessorWithProb(InvokeMBB, UnwindDest.first, UnwindDest.second);
3095 }
3096 InvokeMBB->normalizeSuccProbs();
3097
3098 if (NeedEHLabel) {
3099 assert(BeginSymbol && "Expected a begin symbol!");
3100 assert(EndSymbol && "Expected an end symbol!");
3101 MF->addInvoke(&EHPadMBB, BeginSymbol, EndSymbol);
3102 }
3103
3104 MIRBuilder.buildBr(ReturnMBB);
3105 return true;
3106}
3107
3108/// The intrinsics currently supported by callbr are implicit control flow
3109/// intrinsics such as amdgcn.kill.
3110bool IRTranslator::translateCallBr(const User &U,
3111 MachineIRBuilder &MIRBuilder) {
3112 if (!mayTranslateUserTypes(U))
3113 return false; // see translateCall
3114
3115 const CallBrInst &I = cast<CallBrInst>(U);
3116 MachineBasicBlock *CallBrMBB = &MIRBuilder.getMBB();
3117
3118 Intrinsic::ID IID = I.getIntrinsicID();
3119 if (I.isInlineAsm()) {
3120 // FIXME: inline asm is not yet supported for callbr in GlobalISel. As soon
3121 // as we add support, we need to handle the indirect asm targets, see
3122 // SelectionDAGBuilder::visitCallBr().
3123 return false;
3124 }
3125 if (!translateIntrinsic(I, IID, MIRBuilder))
3126 return false;
3127
3128 // Retrieve successors.
3129 SmallPtrSet<BasicBlock *, 8> Dests = {I.getDefaultDest()};
3130 MachineBasicBlock *Return = &getMBB(*I.getDefaultDest());
3131
3132 // Update successor info.
3133 addSuccessorWithProb(CallBrMBB, Return, BranchProbability::getOne());
3134
3135 // Add indirect targets as successors. For intrinsic callbr, these represent
3136 // implicit control flow (e.g., the "kill" path for amdgcn.kill). We mark them
3137 // with setIsInlineAsmBrIndirectTarget so the machine verifier accepts them as
3138 // valid successors, even though they're not from inline asm.
3139 for (BasicBlock *Dest : I.getIndirectDests()) {
3140 MachineBasicBlock &Target = getMBB(*Dest);
3141 Target.setIsInlineAsmBrIndirectTarget();
3142 Target.setLabelMustBeEmitted();
3143 // Don't add duplicate machine successors.
3144 if (Dests.insert(Dest).second)
3145 addSuccessorWithProb(CallBrMBB, &Target, BranchProbability::getZero());
3146 }
3147
3148 CallBrMBB->normalizeSuccProbs();
3149
3150 // Drop into default successor.
3151 MIRBuilder.buildBr(*Return);
3152
3153 return true;
3154}
3155
3156bool IRTranslator::translateLandingPad(const User &U,
3157 MachineIRBuilder &MIRBuilder) {
3158 const LandingPadInst &LP = cast<LandingPadInst>(U);
3159
3160 MachineBasicBlock &MBB = MIRBuilder.getMBB();
3161
3162 MBB.setIsEHPad();
3163
3164 // If there aren't registers to copy the values into (e.g., during SjLj
3165 // exceptions), then don't bother.
3166 const Constant *PersonalityFn = MF->getFunction().getPersonalityFn();
3167 if (TLI->getExceptionPointerRegister(PersonalityFn) == 0 &&
3168 TLI->getExceptionSelectorRegister(PersonalityFn) == 0)
3169 return true;
3170
3171 // If landingpad's return type is token type, we don't create DAG nodes
3172 // for its exception pointer and selector value. The extraction of exception
3173 // pointer or selector value from token type landingpads is not currently
3174 // supported.
3175 if (LP.getType()->isTokenTy())
3176 return true;
3177
3178 // Add a label to mark the beginning of the landing pad. Deletion of the
3179 // landing pad can thus be detected via the MachineModuleInfo.
3180 MIRBuilder.buildInstr(TargetOpcode::EH_LABEL)
3181 .addSym(MF->addLandingPad(&MBB));
3182
3183 // If the unwinder does not preserve all registers, ensure that the
3184 // function marks the clobbered registers as used.
3185 const TargetRegisterInfo &TRI = *MF->getSubtarget().getRegisterInfo();
3186 if (auto *RegMask = TRI.getCustomEHPadPreservedMask(*MF))
3187 MF->getRegInfo().addPhysRegsUsedFromRegMask(RegMask);
3188
3189 LLT Ty = getLLTForType(*LP.getType(), *DL);
3190 Register Undef = MRI->createGenericVirtualRegister(Ty);
3191 MIRBuilder.buildUndef(Undef);
3192
3194 for (Type *Ty : cast<StructType>(LP.getType())->elements())
3195 Tys.push_back(getLLTForType(*Ty, *DL));
3196 assert(Tys.size() == 2 && "Only two-valued landingpads are supported");
3197
3198 // Mark exception register as live in.
3199 Register ExceptionReg = TLI->getExceptionPointerRegister(PersonalityFn);
3200 if (!ExceptionReg)
3201 return false;
3202
3203 MBB.addLiveIn(ExceptionReg);
3204 ArrayRef<Register> ResRegs = getOrCreateVRegs(LP);
3205 MIRBuilder.buildCopy(ResRegs[0], ExceptionReg);
3206
3207 Register SelectorReg = TLI->getExceptionSelectorRegister(PersonalityFn);
3208 if (!SelectorReg)
3209 return false;
3210
3211 MBB.addLiveIn(SelectorReg);
3212 Register PtrVReg = MRI->createGenericVirtualRegister(Tys[0]);
3213 MIRBuilder.buildCopy(PtrVReg, SelectorReg);
3214 MIRBuilder.buildCast(ResRegs[1], PtrVReg);
3215
3216 return true;
3217}
3218
3219bool IRTranslator::translateAlloca(const User &U,
3220 MachineIRBuilder &MIRBuilder) {
3221 auto &AI = cast<AllocaInst>(U);
3222
3223 if (AI.isSwiftError())
3224 return true;
3225
3226 if (AI.isStaticAlloca()) {
3227 Register Res = getOrCreateVReg(AI);
3228 int FI = getOrCreateFrameIndex(AI);
3229 MIRBuilder.buildFrameIndex(Res, FI);
3230 return true;
3231 }
3232
3233 // FIXME: support stack probing for Windows.
3234 if (MF->getTarget().getTargetTriple().isOSWindows())
3235 return false;
3236
3237 // Now we're in the harder dynamic case.
3238 Register NumElts = getOrCreateVReg(*AI.getArraySize());
3239 Type *IntPtrIRTy = DL->getIntPtrType(AI.getType());
3240 LLT IntPtrTy = getLLTForType(*IntPtrIRTy, *DL);
3241 if (MRI->getType(NumElts) != IntPtrTy) {
3242 Register ExtElts = MRI->createGenericVirtualRegister(IntPtrTy);
3243 MIRBuilder.buildZExtOrTrunc(ExtElts, NumElts);
3244 NumElts = ExtElts;
3245 }
3246
3247 Type *Ty = AI.getAllocatedType();
3248 TypeSize TySize = DL->getTypeAllocSize(Ty);
3249
3250 Register AllocSize = MRI->createGenericVirtualRegister(IntPtrTy);
3251 Register TySizeReg;
3252 if (TySize.isScalable()) {
3253 // For scalable types, use vscale * min_value
3254 TySizeReg = MRI->createGenericVirtualRegister(IntPtrTy);
3255 MIRBuilder.buildVScale(TySizeReg, TySize.getKnownMinValue());
3256 } else {
3257 // For fixed types, use a constant
3258 TySizeReg =
3259 getOrCreateVReg(*ConstantInt::get(IntPtrIRTy, TySize.getFixedValue()));
3260 }
3261 MIRBuilder.buildMul(AllocSize, NumElts, TySizeReg);
3262
3263 // Round the size of the allocation up to the stack alignment size
3264 // by add SA-1 to the size. This doesn't overflow because we're computing
3265 // an address inside an alloca.
3266 Align StackAlign = MF->getSubtarget().getFrameLowering()->getStackAlign();
3267 auto SAMinusOne = MIRBuilder.buildConstant(IntPtrTy, StackAlign.value() - 1);
3268 auto AllocAdd = MIRBuilder.buildAdd(IntPtrTy, AllocSize, SAMinusOne,
3270 auto AlignCst =
3271 MIRBuilder.buildConstant(IntPtrTy, ~(uint64_t)(StackAlign.value() - 1));
3272 auto AlignedAlloc = MIRBuilder.buildAnd(IntPtrTy, AllocAdd, AlignCst);
3273
3274 Align Alignment = AI.getAlign();
3275 if (Alignment <= StackAlign)
3276 Alignment = Align(1);
3277 MIRBuilder.buildDynStackAlloc(getOrCreateVReg(AI), AlignedAlloc, Alignment);
3278
3279 MF->getFrameInfo().CreateVariableSizedObject(Alignment, &AI);
3280 assert(MF->getFrameInfo().hasVarSizedObjects());
3281 return true;
3282}
3283
3284bool IRTranslator::translateVAArg(const User &U, MachineIRBuilder &MIRBuilder) {
3285 // FIXME: We may need more info about the type. Because of how LLT works,
3286 // we're completely discarding the i64/double distinction here (amongst
3287 // others). Fortunately the ABIs I know of where that matters don't use va_arg
3288 // anyway but that's not guaranteed.
3289 MIRBuilder.buildInstr(TargetOpcode::G_VAARG, {getOrCreateVReg(U)},
3290 {getOrCreateVReg(*U.getOperand(0)),
3291 DL->getABITypeAlign(U.getType()).value()});
3292 return true;
3293}
3294
3295bool IRTranslator::translateUnreachable(const User &U,
3296 MachineIRBuilder &MIRBuilder) {
3297 auto &UI = cast<UnreachableInst>(U);
3298 if (!UI.shouldLowerToTrap(MF->getTarget().Options.TrapUnreachable,
3299 MF->getTarget().Options.NoTrapAfterNoreturn))
3300 return true;
3301
3302 MIRBuilder.buildTrap();
3303 return true;
3304}
3305
3306bool IRTranslator::translateInsertElement(const User &U,
3307 MachineIRBuilder &MIRBuilder) {
3308 // If it is a <1 x Ty> vector, use the scalar as it is
3309 // not a legal vector type in LLT.
3310 if (auto *FVT = dyn_cast<FixedVectorType>(U.getType());
3311 FVT && FVT->getNumElements() == 1)
3312 return translateCopy(U, *U.getOperand(1), MIRBuilder);
3313
3314 Register Res = getOrCreateVReg(U);
3315 Register Val = getOrCreateVReg(*U.getOperand(0));
3316 Register Elt = getOrCreateVReg(*U.getOperand(1));
3317 unsigned PreferredVecIdxWidth = TLI->getVectorIdxWidth(*DL);
3318 Register Idx;
3319 if (auto *CI = dyn_cast<ConstantInt>(U.getOperand(2))) {
3320 if (CI->getBitWidth() != PreferredVecIdxWidth) {
3321 APInt NewIdx = CI->getValue().zextOrTrunc(PreferredVecIdxWidth);
3322 auto *NewIdxCI = ConstantInt::get(CI->getContext(), NewIdx);
3323 Idx = getOrCreateVReg(*NewIdxCI);
3324 }
3325 }
3326 if (!Idx)
3327 Idx = getOrCreateVReg(*U.getOperand(2));
3328 if (MRI->getType(Idx).getSizeInBits() != PreferredVecIdxWidth) {
3329 const LLT VecIdxTy =
3330 MRI->getType(Idx).changeElementSize(PreferredVecIdxWidth);
3331 Idx = MIRBuilder.buildZExtOrTrunc(VecIdxTy, Idx).getReg(0);
3332 }
3333 MIRBuilder.buildInsertVectorElement(Res, Val, Elt, Idx);
3334 return true;
3335}
3336
3337bool IRTranslator::translateInsertVector(const User &U,
3338 MachineIRBuilder &MIRBuilder) {
3339 Register Dst = getOrCreateVReg(U);
3340 Register Vec = getOrCreateVReg(*U.getOperand(0));
3341 Register Elt = getOrCreateVReg(*U.getOperand(1));
3342
3343 ConstantInt *CI = cast<ConstantInt>(U.getOperand(2));
3344 unsigned PreferredVecIdxWidth = TLI->getVectorIdxWidth(*DL);
3345
3346 // Resize Index to preferred index width.
3347 if (CI->getBitWidth() != PreferredVecIdxWidth) {
3348 APInt NewIdx = CI->getValue().zextOrTrunc(PreferredVecIdxWidth);
3349 CI = ConstantInt::get(CI->getContext(), NewIdx);
3350 }
3351
3352 // If it is a <1 x Ty> vector, we have to use other means.
3353 if (auto *ResultType = dyn_cast<FixedVectorType>(U.getOperand(1)->getType());
3354 ResultType && ResultType->getNumElements() == 1) {
3355 if (auto *InputType = dyn_cast<FixedVectorType>(U.getOperand(0)->getType());
3356 InputType && InputType->getNumElements() == 1) {
3357 // We are inserting an illegal fixed vector into an illegal
3358 // fixed vector, use the scalar as it is not a legal vector type
3359 // in LLT.
3360 return translateCopy(U, *U.getOperand(0), MIRBuilder);
3361 }
3362 if (isa<FixedVectorType>(U.getOperand(0)->getType())) {
3363 // We are inserting an illegal fixed vector into a legal fixed
3364 // vector, use the scalar as it is not a legal vector type in
3365 // LLT.
3366 Register Idx = getOrCreateVReg(*CI);
3367 MIRBuilder.buildInsertVectorElement(Dst, Vec, Elt, Idx);
3368 return true;
3369 }
3370 if (isa<ScalableVectorType>(U.getOperand(0)->getType())) {
3371 // We are inserting an illegal fixed vector into a scalable
3372 // vector, use a scalar element insert.
3373 LLT VecIdxTy = LLT::scalar(PreferredVecIdxWidth);
3374 Register Idx = getOrCreateVReg(*CI);
3375 auto ScaledIndex = MIRBuilder.buildMul(
3376 VecIdxTy, MIRBuilder.buildVScale(VecIdxTy, 1), Idx);
3377 MIRBuilder.buildInsertVectorElement(Dst, Vec, Elt, ScaledIndex);
3378 return true;
3379 }
3380 }
3381
3382 MIRBuilder.buildInsertSubvector(
3383 getOrCreateVReg(U), getOrCreateVReg(*U.getOperand(0)),
3384 getOrCreateVReg(*U.getOperand(1)), CI->getZExtValue());
3385 return true;
3386}
3387
3388bool IRTranslator::translateExtractElement(const User &U,
3389 MachineIRBuilder &MIRBuilder) {
3390 // If it is a <1 x Ty> vector, use the scalar as it is
3391 // not a legal vector type in LLT.
3392 if (const FixedVectorType *FVT =
3393 dyn_cast<FixedVectorType>(U.getOperand(0)->getType()))
3394 if (FVT->getNumElements() == 1)
3395 return translateCopy(U, *U.getOperand(0), MIRBuilder);
3396
3397 Register Res = getOrCreateVReg(U);
3398 Register Val = getOrCreateVReg(*U.getOperand(0));
3399 unsigned PreferredVecIdxWidth = TLI->getVectorIdxWidth(*DL);
3400 Register Idx;
3401 if (auto *CI = dyn_cast<ConstantInt>(U.getOperand(1))) {
3402 if (CI->getBitWidth() != PreferredVecIdxWidth) {
3403 APInt NewIdx = CI->getValue().zextOrTrunc(PreferredVecIdxWidth);
3404 auto *NewIdxCI = ConstantInt::get(CI->getContext(), NewIdx);
3405 Idx = getOrCreateVReg(*NewIdxCI);
3406 }
3407 }
3408 if (!Idx)
3409 Idx = getOrCreateVReg(*U.getOperand(1));
3410 if (MRI->getType(Idx).getSizeInBits() != PreferredVecIdxWidth) {
3411 const LLT VecIdxTy =
3412 MRI->getType(Idx).changeElementSize(PreferredVecIdxWidth);
3413 Idx = MIRBuilder.buildZExtOrTrunc(VecIdxTy, Idx).getReg(0);
3414 }
3415 MIRBuilder.buildExtractVectorElement(Res, Val, Idx);
3416 return true;
3417}
3418
3419bool IRTranslator::translateExtractVector(const User &U,
3420 MachineIRBuilder &MIRBuilder) {
3421 Register Res = getOrCreateVReg(U);
3422 Register Vec = getOrCreateVReg(*U.getOperand(0));
3423 ConstantInt *CI = cast<ConstantInt>(U.getOperand(1));
3424 unsigned PreferredVecIdxWidth = TLI->getVectorIdxWidth(*DL);
3425
3426 // Resize Index to preferred index width.
3427 if (CI->getBitWidth() != PreferredVecIdxWidth) {
3428 APInt NewIdx = CI->getValue().zextOrTrunc(PreferredVecIdxWidth);
3429 CI = ConstantInt::get(CI->getContext(), NewIdx);
3430 }
3431
3432 // If it is a <1 x Ty> vector, we have to use other means.
3433 if (auto *ResultType = dyn_cast<FixedVectorType>(U.getType());
3434 ResultType && ResultType->getNumElements() == 1) {
3435 if (auto *InputType = dyn_cast<FixedVectorType>(U.getOperand(0)->getType());
3436 InputType && InputType->getNumElements() == 1) {
3437 // We are extracting an illegal fixed vector from an illegal fixed vector,
3438 // use the scalar as it is not a legal vector type in LLT.
3439 return translateCopy(U, *U.getOperand(0), MIRBuilder);
3440 }
3441 if (isa<FixedVectorType>(U.getOperand(0)->getType())) {
3442 // We are extracting an illegal fixed vector from a legal fixed
3443 // vector, use the scalar as it is not a legal vector type in
3444 // LLT.
3445 Register Idx = getOrCreateVReg(*CI);
3446 MIRBuilder.buildExtractVectorElement(Res, Vec, Idx);
3447 return true;
3448 }
3449 if (isa<ScalableVectorType>(U.getOperand(0)->getType())) {
3450 // We are extracting an illegal fixed vector from a scalable
3451 // vector, use a scalar element extract.
3452 LLT VecIdxTy = LLT::scalar(PreferredVecIdxWidth);
3453 Register Idx = getOrCreateVReg(*CI);
3454 auto ScaledIndex = MIRBuilder.buildMul(
3455 VecIdxTy, MIRBuilder.buildVScale(VecIdxTy, 1), Idx);
3456 MIRBuilder.buildExtractVectorElement(Res, Vec, ScaledIndex);
3457 return true;
3458 }
3459 }
3460
3461 MIRBuilder.buildExtractSubvector(getOrCreateVReg(U),
3462 getOrCreateVReg(*U.getOperand(0)),
3463 CI->getZExtValue());
3464 return true;
3465}
3466
3467bool IRTranslator::translateShuffleVector(const User &U,
3468 MachineIRBuilder &MIRBuilder) {
3469 // A ShuffleVector that operates on scalable vectors is a splat vector where
3470 // the value of the splat vector is the 0th element of the first operand,
3471 // since the index mask operand is the zeroinitializer (undef and
3472 // poison are treated as zeroinitializer here).
3473 if (U.getOperand(0)->getType()->isScalableTy()) {
3474 Register Val = getOrCreateVReg(*U.getOperand(0));
3475 auto SplatVal = MIRBuilder.buildExtractVectorElementConstant(
3476 MRI->getType(Val).getElementType(), Val, 0);
3477 MIRBuilder.buildSplatVector(getOrCreateVReg(U), SplatVal);
3478 return true;
3479 }
3480
3481 ArrayRef<int> Mask;
3482 if (auto *SVI = dyn_cast<ShuffleVectorInst>(&U))
3483 Mask = SVI->getShuffleMask();
3484 else
3485 Mask = cast<ConstantExpr>(U).getShuffleMask();
3486
3487 // As GISel does not represent <1 x > vectors as a separate type from scalars,
3488 // we transform shuffle_vector with a scalar output to an
3489 // ExtractVectorElement. If the input type is also scalar it becomes a Copy.
3490 unsigned DstElts = cast<FixedVectorType>(U.getType())->getNumElements();
3491 unsigned SrcElts =
3492 cast<FixedVectorType>(U.getOperand(0)->getType())->getNumElements();
3493 if (DstElts == 1) {
3494 unsigned M = Mask[0];
3495 if (SrcElts == 1) {
3496 if (M == 0 || M == 1)
3497 return translateCopy(U, *U.getOperand(M), MIRBuilder);
3498 MIRBuilder.buildUndef(getOrCreateVReg(U));
3499 } else {
3500 Register Dst = getOrCreateVReg(U);
3501 if (M < SrcElts) {
3503 Dst, getOrCreateVReg(*U.getOperand(0)), M);
3504 } else if (M < SrcElts * 2) {
3506 Dst, getOrCreateVReg(*U.getOperand(1)), M - SrcElts);
3507 } else {
3508 MIRBuilder.buildUndef(Dst);
3509 }
3510 }
3511 return true;
3512 }
3513
3514 // A single element src is transformed to a build_vector.
3515 if (SrcElts == 1) {
3518 for (int M : Mask) {
3519 LLT SrcTy = getLLTForType(*U.getOperand(0)->getType(), *DL);
3520 if (M == 0 || M == 1) {
3521 Ops.push_back(getOrCreateVReg(*U.getOperand(M)));
3522 } else {
3523 if (!Undef.isValid()) {
3524 Undef = MRI->createGenericVirtualRegister(SrcTy);
3525 MIRBuilder.buildUndef(Undef);
3526 }
3527 Ops.push_back(Undef);
3528 }
3529 }
3530 MIRBuilder.buildBuildVector(getOrCreateVReg(U), Ops);
3531 return true;
3532 }
3533
3534 ArrayRef<int> MaskAlloc = MF->allocateShuffleMask(Mask);
3535 MIRBuilder
3536 .buildInstr(TargetOpcode::G_SHUFFLE_VECTOR, {getOrCreateVReg(U)},
3537 {getOrCreateVReg(*U.getOperand(0)),
3538 getOrCreateVReg(*U.getOperand(1))})
3539 .addShuffleMask(MaskAlloc);
3540 return true;
3541}
3542
3543bool IRTranslator::translatePHI(const User &U, MachineIRBuilder &MIRBuilder) {
3544 const PHINode &PI = cast<PHINode>(U);
3545
3546 SmallVector<MachineInstr *, 4> Insts;
3547 for (auto Reg : getOrCreateVRegs(PI)) {
3548 auto MIB = MIRBuilder.buildInstr(TargetOpcode::G_PHI, {Reg}, {});
3549 Insts.push_back(MIB.getInstr());
3550 }
3551
3552 PendingPHIs.emplace_back(&PI, std::move(Insts));
3553 return true;
3554}
3555
3556bool IRTranslator::translateAtomicCmpXchg(const User &U,
3557 MachineIRBuilder &MIRBuilder) {
3558 const AtomicCmpXchgInst &I = cast<AtomicCmpXchgInst>(U);
3559
3560 auto Flags = TLI->getAtomicMemOperandFlags(I, *DL);
3561
3562 auto Res = getOrCreateVRegs(I);
3563 Register OldValRes = Res[0];
3564 Register SuccessRes = Res[1];
3565 Register Addr = getOrCreateVReg(*I.getPointerOperand());
3566 Register Cmp = getOrCreateVReg(*I.getCompareOperand());
3567 Register NewVal = getOrCreateVReg(*I.getNewValOperand());
3568
3570 OldValRes, SuccessRes, Addr, Cmp, NewVal,
3571 *MF->getMachineMemOperand(
3572 MachinePointerInfo(I.getPointerOperand()), Flags, MRI->getType(Cmp),
3573 getMemOpAlign(I), I.getAAMetadata(), nullptr, I.getSyncScopeID(),
3574 I.getSuccessOrdering(), I.getFailureOrdering()));
3575 return true;
3576}
3577
3578bool IRTranslator::translateAtomicRMW(const User &U,
3579 MachineIRBuilder &MIRBuilder) {
3580 if (!mayTranslateUserTypes(U))
3581 return false;
3582
3583 const AtomicRMWInst &I = cast<AtomicRMWInst>(U);
3584 auto Flags = TLI->getAtomicMemOperandFlags(I, *DL);
3585
3586 Register Res = getOrCreateVReg(I);
3587 Register Addr = getOrCreateVReg(*I.getPointerOperand());
3588 Register Val = getOrCreateVReg(*I.getValOperand());
3589
3590 unsigned Opcode = 0;
3591 switch (I.getOperation()) {
3592 default:
3593 return false;
3595 Opcode = TargetOpcode::G_ATOMICRMW_XCHG;
3596 break;
3597 case AtomicRMWInst::Add:
3598 Opcode = TargetOpcode::G_ATOMICRMW_ADD;
3599 break;
3600 case AtomicRMWInst::Sub:
3601 Opcode = TargetOpcode::G_ATOMICRMW_SUB;
3602 break;
3603 case AtomicRMWInst::And:
3604 Opcode = TargetOpcode::G_ATOMICRMW_AND;
3605 break;
3607 Opcode = TargetOpcode::G_ATOMICRMW_NAND;
3608 break;
3609 case AtomicRMWInst::Or:
3610 Opcode = TargetOpcode::G_ATOMICRMW_OR;
3611 break;
3612 case AtomicRMWInst::Xor:
3613 Opcode = TargetOpcode::G_ATOMICRMW_XOR;
3614 break;
3615 case AtomicRMWInst::Max:
3616 Opcode = TargetOpcode::G_ATOMICRMW_MAX;
3617 break;
3618 case AtomicRMWInst::Min:
3619 Opcode = TargetOpcode::G_ATOMICRMW_MIN;
3620 break;
3622 Opcode = TargetOpcode::G_ATOMICRMW_UMAX;
3623 break;
3625 Opcode = TargetOpcode::G_ATOMICRMW_UMIN;
3626 break;
3628 Opcode = TargetOpcode::G_ATOMICRMW_FADD;
3629 break;
3631 Opcode = TargetOpcode::G_ATOMICRMW_FSUB;
3632 break;
3634 Opcode = TargetOpcode::G_ATOMICRMW_FMAX;
3635 break;
3637 Opcode = TargetOpcode::G_ATOMICRMW_FMIN;
3638 break;
3640 Opcode = TargetOpcode::G_ATOMICRMW_FMAXIMUM;
3641 break;
3643 Opcode = TargetOpcode::G_ATOMICRMW_FMINIMUM;
3644 break;
3646 Opcode = TargetOpcode::G_ATOMICRMW_FMAXIMUMNUM;
3647 break;
3649 Opcode = TargetOpcode::G_ATOMICRMW_FMINIMUMNUM;
3650 break;
3652 Opcode = TargetOpcode::G_ATOMICRMW_UINC_WRAP;
3653 break;
3655 Opcode = TargetOpcode::G_ATOMICRMW_UDEC_WRAP;
3656 break;
3658 Opcode = TargetOpcode::G_ATOMICRMW_USUB_COND;
3659 break;
3661 Opcode = TargetOpcode::G_ATOMICRMW_USUB_SAT;
3662 break;
3663 }
3664
3665 MIRBuilder.buildAtomicRMW(
3666 Opcode, Res, Addr, Val,
3667 *MF->getMachineMemOperand(MachinePointerInfo(I.getPointerOperand()),
3668 Flags, MRI->getType(Val), getMemOpAlign(I),
3669 I.getAAMetadata(), nullptr, I.getSyncScopeID(),
3670 I.getOrdering()));
3671 return true;
3672}
3673
3674bool IRTranslator::translateFence(const User &U,
3675 MachineIRBuilder &MIRBuilder) {
3676 const FenceInst &Fence = cast<FenceInst>(U);
3677 MIRBuilder.buildFence(static_cast<unsigned>(Fence.getOrdering()),
3678 Fence.getSyncScopeID());
3679 return true;
3680}
3681
3682bool IRTranslator::translateFreeze(const User &U,
3683 MachineIRBuilder &MIRBuilder) {
3684 const ArrayRef<Register> DstRegs = getOrCreateVRegs(U);
3685 const ArrayRef<Register> SrcRegs = getOrCreateVRegs(*U.getOperand(0));
3686
3687 assert(DstRegs.size() == SrcRegs.size() &&
3688 "Freeze with different source and destination type?");
3689
3690 for (unsigned I = 0; I < DstRegs.size(); ++I) {
3691 MIRBuilder.buildFreeze(DstRegs[I], SrcRegs[I]);
3692 }
3693
3694 return true;
3695}
3696
3697void IRTranslator::finishPendingPhis() {
3698#ifndef NDEBUG
3699 DILocationVerifier Verifier;
3700 GISelObserverWrapper WrapperObserver(&Verifier);
3701 RAIIMFObsDelInstaller ObsInstall(*MF, WrapperObserver);
3702#endif // ifndef NDEBUG
3703 for (auto &Phi : PendingPHIs) {
3704 const PHINode *PI = Phi.first;
3705 if (PI->getType()->isEmptyTy())
3706 continue;
3707 ArrayRef<MachineInstr *> ComponentPHIs = Phi.second;
3708 MachineBasicBlock *PhiMBB = ComponentPHIs[0]->getParent();
3709 EntryBuilder->setDebugLoc(PI->getDebugLoc());
3710#ifndef NDEBUG
3711 Verifier.setCurrentInst(PI);
3712#endif // ifndef NDEBUG
3713
3714 SmallPtrSet<const MachineBasicBlock *, 16> SeenPreds;
3715 for (unsigned i = 0; i < PI->getNumIncomingValues(); ++i) {
3716 auto IRPred = PI->getIncomingBlock(i);
3717 ArrayRef<Register> ValRegs = getOrCreateVRegs(*PI->getIncomingValue(i));
3718 for (auto *Pred : getMachinePredBBs({IRPred, PI->getParent()})) {
3719 if (SeenPreds.count(Pred) || !PhiMBB->isPredecessor(Pred))
3720 continue;
3721 SeenPreds.insert(Pred);
3722 for (unsigned j = 0; j < ValRegs.size(); ++j) {
3723 MachineInstrBuilder MIB(*MF, ComponentPHIs[j]);
3724 MIB.addUse(ValRegs[j]);
3725 MIB.addMBB(Pred);
3726 }
3727 }
3728 }
3729 }
3730}
3731
3732void IRTranslator::translateDbgValueRecord(Value *V, bool HasArgList,
3733 const DILocalVariable *Variable,
3734 const DIExpression *Expression,
3735 const DebugLoc &DL,
3736 MachineIRBuilder &MIRBuilder) {
3737 assert(Variable->isValidLocationForIntrinsic(DL) &&
3738 "Expected inlined-at fields to agree");
3739 // Act as if we're handling a debug intrinsic.
3740 MIRBuilder.setDebugLoc(DL);
3741
3742 if (!V || HasArgList) {
3743 // DI cannot produce a valid DBG_VALUE, so produce an undef DBG_VALUE to
3744 // terminate any prior location.
3745 MIRBuilder.buildIndirectDbgValue(0, Variable, Expression);
3746 return;
3747 }
3748
3749 if (const auto *CI = dyn_cast<Constant>(V)) {
3750 MIRBuilder.buildConstDbgValue(*CI, Variable, Expression);
3751 return;
3752 }
3753
3754 if (auto *AI = dyn_cast<AllocaInst>(V);
3755 AI && AI->isStaticAlloca() && Expression->startsWithDeref()) {
3756 // If the value is an alloca and the expression starts with a
3757 // dereference, track a stack slot instead of a register, as registers
3758 // may be clobbered.
3759 auto ExprOperands = Expression->getElements();
3760 auto *ExprDerefRemoved =
3761 DIExpression::get(AI->getContext(), ExprOperands.drop_front());
3762 MIRBuilder.buildFIDbgValue(getOrCreateFrameIndex(*AI), Variable,
3763 ExprDerefRemoved);
3764 return;
3765 }
3766 if (translateIfEntryValueArgument(false, V, Variable, Expression, DL,
3767 MIRBuilder))
3768 return;
3769 for (Register Reg : getOrCreateVRegs(*V)) {
3770 // FIXME: This does not handle register-indirect values at offset 0. The
3771 // direct/indirect thing shouldn't really be handled by something as
3772 // implicit as reg+noreg vs reg+imm in the first place, but it seems
3773 // pretty baked in right now.
3774 MIRBuilder.buildDirectDbgValue(Reg, Variable, Expression);
3775 }
3776}
3777
3778void IRTranslator::translateDbgDeclareRecord(Value *Address, bool HasArgList,
3779 const DILocalVariable *Variable,
3780 const DIExpression *Expression,
3781 const DebugLoc &DL,
3782 MachineIRBuilder &MIRBuilder) {
3783 if (!Address || isa<UndefValue>(Address)) {
3784 LLVM_DEBUG(dbgs() << "Dropping debug info for " << *Variable << "\n");
3785 return;
3786 }
3787
3788 assert(Variable->isValidLocationForIntrinsic(DL) &&
3789 "Expected inlined-at fields to agree");
3790 auto AI = dyn_cast<AllocaInst>(Address);
3791 if (AI && AI->isStaticAlloca()) {
3792 // Static allocas are tracked at the MF level, no need for DBG_VALUE
3793 // instructions (in fact, they get ignored if they *do* exist).
3794 MF->setVariableDbgInfo(Variable, Expression,
3795 getOrCreateFrameIndex(*AI), DL);
3796 return;
3797 }
3798
3799 if (translateIfEntryValueArgument(true, Address, Variable,
3800 Expression, DL,
3801 MIRBuilder))
3802 return;
3803
3804 // A dbg.declare describes the address of a source variable, so lower it
3805 // into an indirect DBG_VALUE.
3806 MIRBuilder.setDebugLoc(DL);
3807 MIRBuilder.buildIndirectDbgValue(getOrCreateVReg(*Address), Variable,
3808 Expression);
3809}
3810
3811void IRTranslator::translateDbgInfo(const Instruction &Inst,
3812 MachineIRBuilder &MIRBuilder) {
3813 for (DbgRecord &DR : Inst.getDbgRecordRange()) {
3814 if (DbgLabelRecord *DLR = dyn_cast<DbgLabelRecord>(&DR)) {
3815 MIRBuilder.setDebugLoc(DLR->getDebugLoc());
3816 assert(DLR->getLabel() && "Missing label");
3817 assert(DLR->getLabel()->isValidLocationForIntrinsic(
3818 MIRBuilder.getDebugLoc()) &&
3819 "Expected inlined-at fields to agree");
3820 MIRBuilder.buildDbgLabel(DLR->getLabel());
3821 continue;
3822 }
3823 DbgVariableRecord &DVR = cast<DbgVariableRecord>(DR);
3824 const DILocalVariable *Variable = DVR.getVariable();
3825 const DIExpression *Expression = DVR.getExpression();
3826 Value *V = DVR.getVariableLocationOp(0);
3827 if (DVR.isDbgDeclare())
3828 translateDbgDeclareRecord(V, DVR.hasArgList(), Variable, Expression,
3829 DVR.getDebugLoc(), MIRBuilder);
3830 else
3831 translateDbgValueRecord(V, DVR.hasArgList(), Variable, Expression,
3832 DVR.getDebugLoc(), MIRBuilder);
3833 }
3834}
3835
3836bool IRTranslator::translate(const Instruction &Inst) {
3837 CurBuilder->setDebugLoc(Inst.getDebugLoc());
3838 CurBuilder->setPCSections(Inst.getMetadata(LLVMContext::MD_pcsections));
3839 CurBuilder->setMMRAMetadata(Inst.getMetadata(LLVMContext::MD_mmra));
3840
3841 if (TLI->fallBackToDAGISel(Inst))
3842 return false;
3843
3844 switch (Inst.getOpcode()) {
3845#define HANDLE_INST(NUM, OPCODE, CLASS) \
3846 case Instruction::OPCODE: \
3847 return translate##OPCODE(Inst, *CurBuilder.get());
3848#include "llvm/IR/Instruction.def"
3849 default:
3850 return false;
3851 }
3852}
3853
3854bool IRTranslator::translate(const Constant &C, Register Reg) {
3855 // We only emit constants into the entry block from here. To prevent jumpy
3856 // debug behaviour remove debug line.
3857 if (auto CurrInstDL = CurBuilder->getDL())
3858 EntryBuilder->setDebugLoc(DebugLoc());
3859
3860 if (auto CI = dyn_cast<ConstantInt>(&C)) {
3861 // buildConstant expects a to-be-splatted scalar ConstantInt.
3862 if (isa<VectorType>(CI->getType()))
3863 CI = ConstantInt::get(CI->getContext(), CI->getValue());
3864 EntryBuilder->buildConstant(Reg, *CI);
3865 } else if (auto CB = dyn_cast<ConstantByte>(&C)) {
3866 // Byte constants share G_CONSTANT with integers; the destination Reg's
3867 // LLT (an integer LLT, see getLLTForType) determines vector splatting.
3868 EntryBuilder->buildConstant(Reg, CB->getValue());
3869 } else if (auto CF = dyn_cast<ConstantFP>(&C)) {
3870 // buildFConstant expects a to-be-splatted scalar ConstantFP.
3871 if (isa<VectorType>(CF->getType()))
3872 CF = ConstantFP::get(CF->getContext(), CF->getValue());
3873 EntryBuilder->buildFConstant(Reg, *CF);
3874 } else if (isa<UndefValue>(C))
3875 EntryBuilder->buildUndef(Reg);
3876 else if (isa<ConstantPointerNull>(C))
3877 EntryBuilder->buildConstant(Reg, 0);
3878 else if (auto GV = dyn_cast<GlobalValue>(&C))
3879 EntryBuilder->buildGlobalValue(Reg, GV);
3880 else if (auto CPA = dyn_cast<ConstantPtrAuth>(&C)) {
3881 Register Addr = getOrCreateVReg(*CPA->getPointer());
3882 Register AddrDisc = getOrCreateVReg(*CPA->getAddrDiscriminator());
3883 EntryBuilder->buildConstantPtrAuth(Reg, CPA, Addr, AddrDisc);
3884 } else if (auto CAZ = dyn_cast<ConstantAggregateZero>(&C)) {
3885 Constant &Elt = *CAZ->getElementValue(0u);
3886 if (isa<ScalableVectorType>(CAZ->getType())) {
3887 EntryBuilder->buildSplatVector(Reg, getOrCreateVReg(Elt));
3888 return true;
3889 }
3890 // Return the scalar if it is a <1 x Ty> vector.
3891 unsigned NumElts = CAZ->getElementCount().getFixedValue();
3892 if (NumElts == 1)
3893 return translateCopy(C, Elt, *EntryBuilder);
3894 // All elements are zero so we can just use the first one.
3895 EntryBuilder->buildSplatBuildVector(Reg, getOrCreateVReg(Elt));
3896 } else if (auto CV = dyn_cast<ConstantDataVector>(&C)) {
3897 // Return the scalar if it is a <1 x Ty> vector.
3898 if (CV->getNumElements() == 1)
3899 return translateCopy(C, *CV->getElementAsConstant(0), *EntryBuilder);
3901 for (unsigned i = 0; i < CV->getNumElements(); ++i) {
3902 Constant &Elt = *CV->getElementAsConstant(i);
3903 Ops.push_back(getOrCreateVReg(Elt));
3904 }
3905 EntryBuilder->buildBuildVector(Reg, Ops);
3906 } else if (auto CE = dyn_cast<ConstantExpr>(&C)) {
3907 switch(CE->getOpcode()) {
3908#define HANDLE_INST(NUM, OPCODE, CLASS) \
3909 case Instruction::OPCODE: \
3910 return translate##OPCODE(*CE, *EntryBuilder.get());
3911#include "llvm/IR/Instruction.def"
3912 default:
3913 return false;
3914 }
3915 } else if (auto CV = dyn_cast<ConstantVector>(&C)) {
3916 if (CV->getNumOperands() == 1)
3917 return translateCopy(C, *CV->getOperand(0), *EntryBuilder);
3919 for (unsigned i = 0; i < CV->getNumOperands(); ++i) {
3920 Ops.push_back(getOrCreateVReg(*CV->getOperand(i)));
3921 }
3922 EntryBuilder->buildBuildVector(Reg, Ops);
3923 } else if (auto *BA = dyn_cast<BlockAddress>(&C)) {
3924 EntryBuilder->buildBlockAddress(Reg, BA);
3925 } else
3926 return false;
3927
3928 return true;
3929}
3930
3931bool IRTranslator::mayTranslateUserTypes(const User &U) const {
3932 const TargetMachine &TM = TLI->getTargetMachine();
3933 if (LLT::getUseExtended())
3934 return true;
3935
3936 // BF16 cannot currently be represented by default LLT. To avoid miscompiles
3937 // we prevent any instructions using them by default in all targets that do
3938 // not explicitly enable it via LLT::setUseExtended(true).
3939 // SPIRV target is exception.
3940 return TM.getTargetTriple().isSPIRV() ||
3941 (!U.getType()->getScalarType()->isBFloatTy() &&
3942 !any_of(U.operands(), [](Value *V) {
3943 return V->getType()->getScalarType()->isBFloatTy();
3944 }));
3945}
3946
3947bool IRTranslator::finalizeBasicBlock(const BasicBlock &BB,
3949 for (auto &BTB : SL->BitTestCases) {
3950 // Emit header first, if it wasn't already emitted.
3951 if (!BTB.Emitted)
3952 emitBitTestHeader(BTB, BTB.Parent);
3953
3954 BranchProbability UnhandledProb = BTB.Prob;
3955 for (unsigned j = 0, ej = BTB.Cases.size(); j != ej; ++j) {
3956 UnhandledProb -= BTB.Cases[j].ExtraProb;
3957 // Set the current basic block to the mbb we wish to insert the code into
3958 MachineBasicBlock *MBB = BTB.Cases[j].ThisBB;
3959 // If all cases cover a contiguous range, it is not necessary to jump to
3960 // the default block after the last bit test fails. This is because the
3961 // range check during bit test header creation has guaranteed that every
3962 // case here doesn't go outside the range. In this case, there is no need
3963 // to perform the last bit test, as it will always be true. Instead, make
3964 // the second-to-last bit-test fall through to the target of the last bit
3965 // test, and delete the last bit test.
3966
3967 MachineBasicBlock *NextMBB;
3968 if ((BTB.ContiguousRange || BTB.FallthroughUnreachable) && j + 2 == ej) {
3969 // Second-to-last bit-test with contiguous range: fall through to the
3970 // target of the final bit test.
3971 NextMBB = BTB.Cases[j + 1].TargetBB;
3972 } else if (j + 1 == ej) {
3973 // For the last bit test, fall through to Default.
3974 NextMBB = BTB.Default;
3975 } else {
3976 // Otherwise, fall through to the next bit test.
3977 NextMBB = BTB.Cases[j + 1].ThisBB;
3978 }
3979
3980 emitBitTestCase(BTB, NextMBB, UnhandledProb, BTB.Reg, BTB.Cases[j], MBB);
3981
3982 if ((BTB.ContiguousRange || BTB.FallthroughUnreachable) && j + 2 == ej) {
3983 // We need to record the replacement phi edge here that normally
3984 // happens in emitBitTestCase before we delete the case, otherwise the
3985 // phi edge will be lost.
3986 addMachineCFGPred({BTB.Parent->getBasicBlock(),
3987 BTB.Cases[ej - 1].TargetBB->getBasicBlock()},
3988 MBB);
3989 // Since we're not going to use the final bit test, remove it.
3990 BTB.Cases.pop_back();
3991 break;
3992 }
3993 }
3994 // This is "default" BB. We have two jumps to it. From "header" BB and from
3995 // last "case" BB, unless the latter was skipped.
3996 CFGEdge HeaderToDefaultEdge = {BTB.Parent->getBasicBlock(),
3997 BTB.Default->getBasicBlock()};
3998 addMachineCFGPred(HeaderToDefaultEdge, BTB.Parent);
3999 if (!BTB.ContiguousRange) {
4000 addMachineCFGPred(HeaderToDefaultEdge, BTB.Cases.back().ThisBB);
4001 }
4002 }
4003 SL->BitTestCases.clear();
4004
4005 for (auto &JTCase : SL->JTCases) {
4006 // Emit header first, if it wasn't already emitted.
4007 if (!JTCase.first.Emitted)
4008 emitJumpTableHeader(JTCase.second, JTCase.first, JTCase.first.HeaderBB);
4009
4010 emitJumpTable(JTCase.second, JTCase.second.MBB);
4011 }
4012 SL->JTCases.clear();
4013
4014 for (auto &SwCase : SL->SwitchCases)
4015 emitSwitchCase(SwCase, &CurBuilder->getMBB(), *CurBuilder);
4016 SL->SwitchCases.clear();
4017
4018 // Check if we need to generate stack-protector guard checks.
4019 StackProtector &SP = getAnalysis<StackProtector>();
4020 if (SP.shouldEmitSDCheck(BB)) {
4021 bool FunctionBasedInstrumentation =
4022 TLI->getSSPStackGuardCheck(*MF->getFunction().getParent(), *Libcalls);
4023 SPDescriptor.initialize(&BB, &MBB, FunctionBasedInstrumentation);
4024 }
4025 // Handle stack protector.
4026 if (SPDescriptor.shouldEmitFunctionBasedCheckStackProtector()) {
4027 LLVM_DEBUG(dbgs() << "Unimplemented stack protector case\n");
4028 return false;
4029 } else if (SPDescriptor.shouldEmitStackProtector()) {
4030 MachineBasicBlock *ParentMBB = SPDescriptor.getParentMBB();
4031 MachineBasicBlock *SuccessMBB = SPDescriptor.getSuccessMBB();
4032
4033 // Find the split point to split the parent mbb. At the same time copy all
4034 // physical registers used in the tail of parent mbb into virtual registers
4035 // before the split point and back into physical registers after the split
4036 // point. This prevents us needing to deal with Live-ins and many other
4037 // register allocation issues caused by us splitting the parent mbb. The
4038 // register allocator will clean up said virtual copies later on.
4040 ParentMBB, *MF->getSubtarget().getInstrInfo());
4041
4042 // Splice the terminator of ParentMBB into SuccessMBB.
4043 SuccessMBB->splice(SuccessMBB->end(), ParentMBB, SplitPoint,
4044 ParentMBB->end());
4045
4046 // Add compare/jump on neq/jump to the parent BB.
4047 if (!emitSPDescriptorParent(SPDescriptor, ParentMBB))
4048 return false;
4049
4050 // CodeGen Failure MBB if we have not codegened it yet.
4051 MachineBasicBlock *FailureMBB = SPDescriptor.getFailureMBB();
4052 if (FailureMBB->empty()) {
4053 if (!emitSPDescriptorFailure(SPDescriptor, FailureMBB))
4054 return false;
4055 }
4056
4057 // Clear the Per-BB State.
4058 SPDescriptor.resetPerBBState();
4059 }
4060 return true;
4061}
4062
4063bool IRTranslator::emitSPDescriptorParent(StackProtectorDescriptor &SPD,
4064 MachineBasicBlock *ParentBB) {
4065 CurBuilder->setInsertPt(*ParentBB, ParentBB->end());
4066 // First create the loads to the guard/stack slot for the comparison.
4067 Type *PtrIRTy = PointerType::getUnqual(MF->getFunction().getContext());
4068 const LLT PtrTy = getLLTForType(*PtrIRTy, *DL);
4069 LLT PtrMemTy = getLLTForMVT(TLI->getPointerMemTy(*DL));
4070
4071 MachineFrameInfo &MFI = ParentBB->getParent()->getFrameInfo();
4072 int FI = MFI.getStackProtectorIndex();
4073
4074 Register Guard;
4075 Register StackSlotPtr = CurBuilder->buildFrameIndex(PtrTy, FI).getReg(0);
4076 const Module &M = *ParentBB->getParent()->getFunction().getParent();
4077 Align Align = DL->getPrefTypeAlign(PointerType::getUnqual(M.getContext()));
4078
4079 // Generate code to load the content of the guard slot.
4080 Register GuardVal =
4081 CurBuilder
4082 ->buildLoad(PtrMemTy, StackSlotPtr,
4083 MachinePointerInfo::getFixedStack(*MF, FI), Align,
4085 .getReg(0);
4086
4087 if (TLI->useStackGuardXorFP()) {
4088 LLVM_DEBUG(dbgs() << "Stack protector xor'ing with FP not yet implemented");
4089 return false;
4090 }
4091
4092 // Retrieve guard check function, nullptr if instrumentation is inlined.
4093 if (const Function *GuardCheckFn = TLI->getSSPStackGuardCheck(M, *Libcalls)) {
4094 // This path is currently untestable on GlobalISel, since the only platform
4095 // that needs this seems to be Windows, and we fall back on that currently.
4096 // The code still lives here in case that changes.
4097 // Silence warning about unused variable until the code below that uses
4098 // 'GuardCheckFn' is enabled.
4099 (void)GuardCheckFn;
4100 return false;
4101#if 0
4102 // The target provides a guard check function to validate the guard value.
4103 // Generate a call to that function with the content of the guard slot as
4104 // argument.
4105 FunctionType *FnTy = GuardCheckFn->getFunctionType();
4106 assert(FnTy->getNumParams() == 1 && "Invalid function signature");
4107 ISD::ArgFlagsTy Flags;
4108 if (GuardCheckFn->hasAttribute(1, Attribute::AttrKind::InReg))
4109 Flags.setInReg();
4110 CallLowering::ArgInfo GuardArgInfo(
4111 {GuardVal, FnTy->getParamType(0), {Flags}});
4112
4113 CallLowering::CallLoweringInfo Info;
4114 Info.OrigArgs.push_back(GuardArgInfo);
4115 Info.CallConv = GuardCheckFn->getCallingConv();
4116 Info.Callee = MachineOperand::CreateGA(GuardCheckFn, 0);
4117 Info.OrigRet = {Register(), FnTy->getReturnType()};
4118 if (!CLI->lowerCall(MIRBuilder, Info)) {
4119 LLVM_DEBUG(dbgs() << "Failed to lower call to stack protector check\n");
4120 return false;
4121 }
4122 return true;
4123#endif
4124 }
4125
4126 // If useLoadStackGuardNode returns true, generate LOAD_STACK_GUARD.
4127 // Otherwise, emit a volatile load to retrieve the stack guard value.
4128 if (TLI->useLoadStackGuardNode(*ParentBB->getBasicBlock()->getModule())) {
4129 Guard =
4130 MRI->createGenericVirtualRegister(LLT::scalar(PtrTy.getSizeInBits()));
4131 getStackGuard(Guard, *CurBuilder);
4132 } else {
4133 // TODO: test using android subtarget when we support @llvm.thread.pointer.
4134 const Value *IRGuard = TLI->getSDagStackGuard(M, *Libcalls);
4135 Register GuardPtr = getOrCreateVReg(*IRGuard);
4136
4137 Guard = CurBuilder
4138 ->buildLoad(PtrMemTy, GuardPtr,
4139 MachinePointerInfo::getFixedStack(*MF, FI), Align,
4142 .getReg(0);
4143 }
4144
4145 // Perform the comparison.
4146 auto Cmp =
4147 CurBuilder->buildICmp(CmpInst::ICMP_NE, LLT::integer(1), Guard, GuardVal);
4148 // If the guard/stackslot do not equal, branch to failure MBB.
4149 CurBuilder->buildBrCond(Cmp, *SPD.getFailureMBB());
4150 // Otherwise branch to success MBB.
4151 CurBuilder->buildBr(*SPD.getSuccessMBB());
4152 return true;
4153}
4154
4155bool IRTranslator::emitSPDescriptorFailure(StackProtectorDescriptor &SPD,
4156 MachineBasicBlock *FailureBB) {
4157 const RTLIB::LibcallImpl LibcallImpl =
4158 Libcalls->getLibcallImpl(RTLIB::STACKPROTECTOR_CHECK_FAIL);
4159 if (LibcallImpl == RTLIB::Unsupported)
4160 return false;
4161
4162 CurBuilder->setInsertPt(*FailureBB, FailureBB->end());
4163
4164 CallLowering::CallLoweringInfo Info;
4165 Info.CallConv = Libcalls->getLibcallImplCallingConv(LibcallImpl);
4166
4167 StringRef LibcallName =
4169 Info.Callee = MachineOperand::CreateES(LibcallName.data());
4170 Info.OrigRet = {Register(), Type::getVoidTy(MF->getFunction().getContext()),
4171 0};
4172 if (!CLI->lowerCall(*CurBuilder, Info)) {
4173 LLVM_DEBUG(dbgs() << "Failed to lower call to stack protector fail\n");
4174 return false;
4175 }
4176
4177 // Emit a trap instruction if we are required to do so.
4178 const TargetOptions &TargetOpts = TLI->getTargetMachine().Options;
4179 if (TargetOpts.TrapUnreachable && !TargetOpts.NoTrapAfterNoreturn)
4180 CurBuilder->buildInstr(TargetOpcode::G_TRAP);
4181
4182 return true;
4183}
4184
4185void IRTranslator::finalizeFunction() {
4186 // Release the memory used by the different maps we
4187 // needed during the translation.
4188 PendingPHIs.clear();
4189 VMap.reset();
4190 FrameIndices.clear();
4191 MachinePreds.clear();
4192 // MachineIRBuilder::DebugLoc can outlive the DILocation it holds. Clear it
4193 // to avoid accessing free’d memory (in runOnMachineFunction) and to avoid
4194 // destroying it twice (in ~IRTranslator() and ~LLVMContext())
4195 EntryBuilder.reset();
4196 CurBuilder.reset();
4197 FuncInfo.clear();
4198 SPDescriptor.resetPerFunctionState();
4199}
4200
4201/// Returns true if a BasicBlock \p BB within a variadic function contains a
4202/// variadic musttail call.
4203static bool checkForMustTailInVarArgFn(bool IsVarArg, const BasicBlock &BB) {
4204 if (!IsVarArg)
4205 return false;
4206
4207 // Walk the block backwards, because tail calls usually only appear at the end
4208 // of a block.
4209 return llvm::any_of(llvm::reverse(BB), [](const Instruction &I) {
4210 const auto *CI = dyn_cast<CallInst>(&I);
4211 return CI && CI->isMustTailCall();
4212 });
4213}
4214
4216 MF = &CurMF;
4217 const Function &F = MF->getFunction();
4218 ORE = std::make_unique<OptimizationRemarkEmitter>(&F);
4219 CLI = MF->getSubtarget().getCallLowering();
4220
4221 if (CLI->fallBackToDAGISel(*MF)) {
4222 OptimizationRemarkMissed R("gisel-irtranslator", "GISelFailure",
4223 F.getSubprogram(), &F.getEntryBlock());
4224 R << "unable to lower function: "
4225 << ore::NV("Prototype", F.getFunctionType());
4226
4227 reportTranslationError(*MF, *ORE, R);
4228 return false;
4229 }
4230
4233 // Set the CSEConfig and run the analysis.
4234 GISelCSEInfo *CSEInfo = nullptr;
4236
4237 bool EnableCSE = EnableCSEInIRTranslator.getNumOccurrences()
4239 : TPC->isGISelCSEEnabled();
4240
4241 const TargetSubtargetInfo &Subtarget = MF->getSubtarget();
4242 TLI = Subtarget.getTargetLowering();
4243
4244 if (EnableCSE) {
4245 EntryBuilder = std::make_unique<CSEMIRBuilder>(CurMF);
4246 CSEInfo = &Wrapper.get(TPC->getCSEConfig());
4247 EntryBuilder->setCSEInfo(CSEInfo);
4248 CurBuilder = std::make_unique<CSEMIRBuilder>(CurMF);
4249 CurBuilder->setCSEInfo(CSEInfo);
4250 } else {
4251 EntryBuilder = std::make_unique<MachineIRBuilder>();
4252 CurBuilder = std::make_unique<MachineIRBuilder>();
4253 }
4254 CLI = Subtarget.getCallLowering();
4255 CurBuilder->setMF(*MF);
4256 EntryBuilder->setMF(*MF);
4257 MRI = &MF->getRegInfo();
4258 DL = &F.getDataLayout();
4259 const TargetMachine &TM = MF->getTarget();
4260 EnableOpts = OptLevel != CodeGenOptLevel::None && !skipFunction(F);
4261 FuncInfo.MF = MF;
4262 if (EnableOpts) {
4263 AA = &getAnalysis<AAResultsWrapperPass>().getAAResults();
4264 FuncInfo.BPI = &getAnalysis<BranchProbabilityInfoWrapperPass>().getBPI();
4265 AC = &getAnalysis<AssumptionCacheTracker>().getAssumptionCache(
4266 MF->getFunction());
4267 } else {
4268 AA = nullptr;
4269 FuncInfo.BPI = nullptr;
4270 AC = nullptr;
4271 }
4272 LibInfo = &getAnalysis<TargetLibraryInfoWrapperPass>().getTLI(F);
4273 Libcalls = &getAnalysis<LibcallLoweringInfoWrapper>().getLibcallLowering(
4274 *F.getParent(), Subtarget);
4275
4276 FuncInfo.CanLowerReturn = CLI->checkReturnTypeForCallConv(*MF);
4277
4278 SL = std::make_unique<GISelSwitchLowering>(this, FuncInfo);
4279 SL->init(*TLI, TM, *DL);
4280
4281 assert(PendingPHIs.empty() && "stale PHIs");
4282
4283 // Targets which want to use big endian can enable it using
4284 // enableBigEndian()
4285 if (!DL->isLittleEndian() && !CLI->enableBigEndian()) {
4286 // Currently we don't properly handle big endian code.
4287 OptimizationRemarkMissed R("gisel-irtranslator", "GISelFailure",
4288 F.getSubprogram(), &F.getEntryBlock());
4289 R << "unable to translate in big endian mode";
4290 reportTranslationError(*MF, *ORE, R);
4291 return false;
4292 }
4293
4294 // Release the per-function state when we return, whether we succeeded or not.
4295 llvm::scope_exit FinalizeOnReturn([this]() { finalizeFunction(); });
4296
4297 // Setup a separate basic-block for the arguments and constants
4298 MachineBasicBlock *EntryBB = MF->CreateMachineBasicBlock();
4299 MF->push_back(EntryBB);
4300 EntryBuilder->setMBB(*EntryBB);
4301
4302 DebugLoc DbgLoc = F.getEntryBlock().getFirstNonPHIIt()->getDebugLoc();
4303 SwiftError.setFunction(CurMF);
4304 SwiftError.createEntriesInEntryBlock(DbgLoc);
4305
4306 bool IsVarArg = F.isVarArg();
4307 bool HasMustTailInVarArgFn = false;
4308
4309 // Create all blocks, in IR order, to preserve the layout.
4310 FuncInfo.MBBMap.resize(F.getMaxBlockNumber());
4311 for (const BasicBlock &BB: F) {
4312 auto *&MBB = FuncInfo.MBBMap[BB.getNumber()];
4313
4314 MBB = MF->CreateMachineBasicBlock(&BB);
4315 MF->push_back(MBB);
4316
4317 // Only mark the block if the BlockAddress actually has users. The
4318 // hasAddressTaken flag may be stale if the BlockAddress was optimized away
4319 // but the constant still exists in the uniquing table.
4320 if (BB.hasAddressTaken()) {
4321 if (BlockAddress *BA = BlockAddress::lookup(&BB))
4322 if (!BA->hasZeroLiveUses())
4323 MBB->setAddressTakenIRBlock(const_cast<BasicBlock *>(&BB));
4324 }
4325
4326 if (!HasMustTailInVarArgFn)
4327 HasMustTailInVarArgFn = checkForMustTailInVarArgFn(IsVarArg, BB);
4328 }
4329
4330 MF->getFrameInfo().setHasMustTailInVarArgFunc(HasMustTailInVarArgFn);
4331
4332 // Make our arguments/constants entry block fallthrough to the IR entry block.
4333 EntryBB->addSuccessor(&getMBB(F.front()));
4334
4335 // Lower the actual args into this basic block.
4336 SmallVector<ArrayRef<Register>, 8> VRegArgs;
4337 for (const Argument &Arg: F.args()) {
4338 if (DL->getTypeStoreSize(Arg.getType()).isZero())
4339 continue; // Don't handle zero sized types.
4340 ArrayRef<Register> VRegs = getOrCreateVRegs(Arg);
4341 VRegArgs.push_back(VRegs);
4342
4343 if (CLI->supportSwiftError() && Arg.hasSwiftErrorAttr()) {
4344 assert(VRegs.size() == 1 && "Too many vregs for Swift error");
4345 SwiftError.setCurrentVReg(EntryBB, SwiftError.getFunctionArg(), VRegs[0]);
4346 }
4347 }
4348
4349 if (!CLI->lowerFormalArguments(*EntryBuilder, F, VRegArgs, FuncInfo)) {
4350 OptimizationRemarkMissed R("gisel-irtranslator", "GISelFailure",
4351 F.getSubprogram(), &F.getEntryBlock());
4352 R << "unable to lower arguments: "
4353 << ore::NV("Prototype", F.getFunctionType());
4354 reportTranslationError(*MF, *ORE, R);
4355 return false;
4356 }
4357
4358 // Need to visit defs before uses when translating instructions.
4359 GISelObserverWrapper WrapperObserver;
4360 if (EnableCSE && CSEInfo)
4361 WrapperObserver.addObserver(CSEInfo);
4362 {
4364#ifndef NDEBUG
4365 DILocationVerifier Verifier;
4366 WrapperObserver.addObserver(&Verifier);
4367#endif // ifndef NDEBUG
4368 RAIIMFObsDelInstaller ObsInstall(*MF, WrapperObserver);
4369 for (const BasicBlock *BB : RPOT) {
4370 MachineBasicBlock &MBB = getMBB(*BB);
4371 // Set the insertion point of all the following translations to
4372 // the end of this basic block.
4373 CurBuilder->setMBB(MBB);
4374 HasTailCall = false;
4375 for (const Instruction &Inst : *BB) {
4376 // If we translated a tail call in the last step, then we know
4377 // everything after the call is either a return, or something that is
4378 // handled by the call itself. (E.g. a lifetime marker or assume
4379 // intrinsic.) In this case, we should stop translating the block and
4380 // move on.
4381 if (HasTailCall)
4382 break;
4383#ifndef NDEBUG
4384 Verifier.setCurrentInst(&Inst);
4385#endif // ifndef NDEBUG
4386
4387 // Translate any debug-info attached to the instruction.
4388 translateDbgInfo(Inst, *CurBuilder);
4389
4390 if (translate(Inst))
4391 continue;
4392
4393 OptimizationRemarkMissed R("gisel-irtranslator", "GISelFailure",
4394 Inst.getDebugLoc(), BB);
4395 R << "unable to translate instruction: " << ore::NV("Opcode", &Inst);
4396
4397 if (ORE->allowExtraAnalysis("gisel-irtranslator")) {
4398 std::string InstStrStorage;
4399 raw_string_ostream InstStr(InstStrStorage);
4400 InstStr << Inst;
4401
4402 R << ": '" << InstStrStorage << "'";
4403 }
4404
4405 reportTranslationError(*MF, *ORE, R);
4406 return false;
4407 }
4408
4409 if (!finalizeBasicBlock(*BB, MBB)) {
4410 OptimizationRemarkMissed R("gisel-irtranslator", "GISelFailure",
4411 BB->getTerminator()->getDebugLoc(), BB);
4412 R << "unable to translate basic block";
4413 reportTranslationError(*MF, *ORE, R);
4414 return false;
4415 }
4416 }
4417#ifndef NDEBUG
4418 WrapperObserver.removeObserver(&Verifier);
4419#endif
4420 }
4421
4422 finishPendingPhis();
4423
4424 SwiftError.propagateVRegs();
4425
4426 // Merge the argument lowering and constants block with its single
4427 // successor, the LLVM-IR entry block. We want the basic block to
4428 // be maximal.
4429 assert(EntryBB->succ_size() == 1 &&
4430 "Custom BB used for lowering should have only one successor");
4431 // Get the successor of the current entry block.
4432 MachineBasicBlock &NewEntryBB = **EntryBB->succ_begin();
4433 assert(NewEntryBB.pred_size() == 1 &&
4434 "LLVM-IR entry block has a predecessor!?");
4435 // Move all the instruction from the current entry block to the
4436 // new entry block.
4437 NewEntryBB.splice(NewEntryBB.begin(), EntryBB, EntryBB->begin(),
4438 EntryBB->end());
4439
4440 // Update the live-in information for the new entry block.
4441 for (const MachineBasicBlock::RegisterMaskPair &LiveIn : EntryBB->liveins())
4442 NewEntryBB.addLiveIn(LiveIn);
4443 NewEntryBB.sortUniqueLiveIns();
4444
4445 // Get rid of the now empty basic block.
4446 EntryBB->removeSuccessor(&NewEntryBB);
4447 MF->remove(EntryBB);
4448 MF->deleteMachineBasicBlock(EntryBB);
4449
4450 assert(&MF->front() == &NewEntryBB &&
4451 "New entry wasn't next in the list of basic block!");
4452
4453 // Initialize stack protector information.
4455 SP.copyToMachineFrameInfo(MF->getFrameInfo());
4456
4457 return false;
4458}
#define Success
assert(UImm &&(UImm !=~static_cast< T >(0)) &&"Invalid immediate!")
amdgpu aa AMDGPU Address space based Alias Analysis Wrapper
MachineBasicBlock & MBB
MachineBasicBlock MachineBasicBlock::iterator DebugLoc DL
static GCRegistry::Add< CoreCLRGC > E("coreclr", "CoreCLR-compatible GC")
static GCRegistry::Add< OcamlGC > B("ocaml", "ocaml 3.10-compatible GC")
Provides analysis for continuously CSEing during GISel passes.
This file implements a version of MachineIRBuilder which CSEs insts within a MachineBasicBlock.
This file describes how to lower LLVM calls to machine code calls.
This file contains the declarations for the subclasses of Constant, which represent the different fla...
dxil translate DXIL Translate Metadata
This contains common code to allow clients to notify changes to machine instr.
#define DEBUG_TYPE
const HexagonInstrInfo * TII
static bool checkForMustTailInVarArgFn(bool IsVarArg, const BasicBlock &BB)
Returns true if a BasicBlock BB within a variadic function contains a variadic musttail call.
static unsigned getConvOpcode(Intrinsic::ID ID)
static uint64_t getOffsetFromIndices(const User &U, const DataLayout &DL)
static unsigned getConstrainedOpcode(Intrinsic::ID ID)
IRTranslator LLVM IR MI
IRTranslator LLVM IR static false void reportTranslationError(MachineFunction &MF, OptimizationRemarkEmitter &ORE, OptimizationRemarkMissed &R)
static cl::opt< bool > EnableCSEInIRTranslator("enable-cse-in-irtranslator", cl::desc("Should enable CSE in irtranslator"), cl::Optional, cl::init(false))
static bool isValInBlock(const Value *V, const BasicBlock *BB)
static bool isSwiftError(const Value *V)
This file declares the IRTranslator pass.
This file provides various utilities for inspecting and working with the control flow graph in LLVM I...
This file describes how to lower LLVM inline asm to machine code INLINEASM.
const AbstractManglingParser< Derived, Alloc >::OperatorInfo AbstractManglingParser< Derived, Alloc >::Ops[]
static LVOptions Options
Definition LVOptions.cpp:25
Implement a low-level type suitable for MachineInstr level instruction selection.
Implement a low-level type suitable for MachineInstr level instruction selection.
#define F(x, y, z)
Definition MD5.cpp:54
#define I(x, y, z)
Definition MD5.cpp:57
Machine Check Debug Module
This file declares the MachineIRBuilder class.
Register Reg
Register const TargetRegisterInfo * TRI
Promote Memory to Register
Definition Mem2Reg.cpp:110
This file contains the declarations for metadata subclasses.
Type::TypeID TypeID
uint64_t High
OptimizedStructLayoutField Field
if(PassOpts->AAPipeline)
#define INITIALIZE_PASS_DEPENDENCY(depName)
Definition PassSupport.h:42
#define INITIALIZE_PASS_END(passName, arg, name, cfg, analysis)
Definition PassSupport.h:44
#define INITIALIZE_PASS_BEGIN(passName, arg, name, cfg, analysis)
Definition PassSupport.h:39
This file builds on the ADT/GraphTraits.h file to build a generic graph post order iterator.
const SmallVectorImpl< MachineOperand > MachineBasicBlock * TBB
const SmallVectorImpl< MachineOperand > & Cond
std::pair< BasicBlock *, BasicBlock * > Edge
This file contains some templates that are useful if you are working with the STL at all.
verify safepoint Safepoint IR Verifier
This file defines the make_scope_exit function, which executes user-defined cleanup logic at scope ex...
This file defines the SmallVector class.
#define LLVM_DEBUG(...)
Definition Debug.h:119
This file describes how to lower LLVM code to machine code.
Target-Independent Code Generator Pass Configuration Options pass.
Value * RHS
Value * LHS
A wrapper pass to provide the legacy pass manager access to a suitably prepared AAResults object.
LLVM_ABI APInt zextOrTrunc(unsigned width) const
Zero extend or truncate to width.
Definition APInt.cpp:1076
an instruction to allocate memory on the stack
bool isSwiftError() const
Return true if this alloca is used as a swifterror argument to a call.
LLVM_ABI bool isStaticAlloca() const
Return true if this alloca is in the entry block of the function and is a constant size.
Align getAlign() const
Return the alignment of the memory that is being allocated by the instruction.
PointerType * getType() const
Overload to return most specific pointer type.
Type * getAllocatedType() const
Return the type that is being allocated by the instruction.
LLVM_ABI std::optional< TypeSize > getAllocationSize(const DataLayout &DL) const
Get allocation size in bytes.
const Value * getArraySize() const
Get the number of elements allocated.
Represent the analysis usage information of a pass.
AnalysisUsage & addRequired()
AnalysisUsage & addPreserved()
Add the specified Pass class to the set of analyses preserved by this pass.
This class represents an incoming formal argument to a Function.
Definition Argument.h:32
Represent a constant reference to an array (0 or more elements consecutively in memory),...
Definition ArrayRef.h:40
iterator end() const
Definition ArrayRef.h:130
size_t size() const
Get the array size.
Definition ArrayRef.h:141
iterator begin() const
Definition ArrayRef.h:129
bool empty() const
Check if the array is empty.
Definition ArrayRef.h:136
An immutable pass that tracks lazily created AssumptionCache objects.
@ Add
*p = old + v
@ FAdd
*p = old + v
@ USubCond
Subtract only if no unsigned overflow.
@ FMinimum
*p = minimum(old, v) minimum matches the behavior of llvm.minimum.
@ Min
*p = old <signed v ? old : v
@ Sub
*p = old - v
@ And
*p = old & v
@ Xor
*p = old ^ v
@ USubSat
*p = usub.sat(old, v) usub.sat matches the behavior of llvm.usub.sat.
@ FMaximum
*p = maximum(old, v) maximum matches the behavior of llvm.maximum.
@ FSub
*p = old - v
@ UIncWrap
Increment one up to a maximum value.
@ Max
*p = old >signed v ? old : v
@ UMin
*p = old <unsigned v ? old : v
@ FMin
*p = minnum(old, v) minnum matches the behavior of llvm.minnum.
@ UMax
*p = old >unsigned v ? old : v
@ FMaximumNum
*p = maximumnum(old, v) maximumnum matches the behavior of llvm.maximumnum.
@ FMax
*p = maxnum(old, v) maxnum matches the behavior of llvm.maxnum.
@ UDecWrap
Decrement one until a minimum value or zero.
@ FMinimumNum
*p = minimumnum(old, v) minimumnum matches the behavior of llvm.minimumnum.
@ Nand
*p = ~(old & v)
LLVM Basic Block Representation.
Definition BasicBlock.h:62
unsigned getNumber() const
Definition BasicBlock.h:95
const Function * getParent() const
Return the enclosing method, or null if none.
Definition BasicBlock.h:213
bool hasAddressTaken() const
Returns true if there are any uses of this basic block other than direct branches,...
Definition BasicBlock.h:687
LLVM_ABI InstListType::const_iterator getFirstNonPHIIt() const
Returns an iterator to the first instruction in this block that is not a PHINode instruction.
InstListType::const_iterator const_iterator
Definition BasicBlock.h:171
LLVM_ABI InstListType::const_iterator getFirstNonPHIOrDbg(bool SkipPseudoOp=true) const
Returns a pointer to the first instruction in this block that is not a PHINode or a debug intrinsic,...
LLVM_ABI const Module * getModule() const
Return the module owning the function this basic block belongs to, or nullptr if the function does no...
The address of a basic block.
Definition Constants.h:1082
static LLVM_ABI BlockAddress * lookup(const BasicBlock *BB)
Lookup an existing BlockAddress constant for the given BasicBlock.
Legacy analysis pass which computes BlockFrequencyInfo.
Legacy analysis pass which computes BranchProbabilityInfo.
LLVM_ABI BranchProbability getEdgeProbability(const BasicBlock *Src, unsigned IndexInSuccessors) const
Get an edge's probability, relative to other out-edges of the Src.
static BranchProbability getOne()
static BranchProbability getZero()
static void normalizeProbabilities(ProbabilityIter Begin, ProbabilityIter End)
Base class for all callable instructions (InvokeInst and CallInst) Holds everything related to callin...
bool isInlineAsm() const
Check if this call is an inline asm statement.
std::optional< OperandBundleUse > getOperandBundle(StringRef Name) const
Return an operand bundle by name, if present.
Function * getCalledFunction() const
Returns the function called, or null if this is an indirect function invocation or the function signa...
LLVM_ABI bool paramHasAttr(unsigned ArgNo, Attribute::AttrKind Kind) const
Determine whether the argument or parameter has the given attribute.
User::op_iterator arg_begin()
Return the iterator pointing to the beginning of the argument list.
unsigned countOperandBundlesOfType(StringRef Name) const
Return the number of operand bundles with the tag Name attached to this instruction.
Value * getCalledOperand() const
Value * getArgOperand(unsigned i) const
User::op_iterator arg_end()
Return the iterator pointing to the end of the argument list.
bool isConvergent() const
Determine if the invoke is convergent.
LLVM_ABI Intrinsic::ID getIntrinsicID() const
Returns the intrinsic ID of the intrinsic called or Intrinsic::not_intrinsic if the called function i...
iterator_range< User::op_iterator > args()
Iteration adapter for range-for loops.
unsigned arg_size() const
AttributeList getAttributes() const
Return the attributes for this call.
This class represents a function call, abstracting a target machine's calling convention.
bool isTailCall() const
Predicate
This enumeration lists the possible predicates for CmpInst subclasses.
Definition InstrTypes.h:740
@ FCMP_TRUE
1 1 1 1 Always true (always folded)
Definition InstrTypes.h:757
@ ICMP_SLT
signed less than
Definition InstrTypes.h:769
@ ICMP_SLE
signed less or equal
Definition InstrTypes.h:770
@ ICMP_UGT
unsigned greater than
Definition InstrTypes.h:763
@ ICMP_NE
not equal
Definition InstrTypes.h:762
@ ICMP_ULE
unsigned less or equal
Definition InstrTypes.h:766
@ FCMP_FALSE
0 0 0 0 Always false (always folded)
Definition InstrTypes.h:742
bool isFPPredicate() const
Definition InstrTypes.h:845
bool isIntPredicate() const
Definition InstrTypes.h:846
Value * getCondition() const
BasicBlock * getSuccessor(unsigned i) const
static LLVM_ABI ConstantInt * getTrue(LLVMContext &Context)
bool isZero() const
This is just a convenience method to make client code smaller for a common code.
Definition Constants.h:219
unsigned getBitWidth() const
getBitWidth - Return the scalar bitwidth of this constant.
Definition Constants.h:162
uint64_t getZExtValue() const
Return the constant as a 64-bit unsigned integer value after it has been zero extended as appropriate...
Definition Constants.h:168
const APInt & getValue() const
Return the constant as an APInt value reference.
Definition Constants.h:159
This is an important base class in LLVM.
Definition Constant.h:43
static LLVM_ABI Constant * getAllOnesValue(Type *Ty)
static LLVM_ABI Constant * getNullValue(Type *Ty)
Constructor to create a '0' constant of arbitrary type.
This is the common base class for constrained floating point intrinsics.
LLVM_ABI std::optional< fp::ExceptionBehavior > getExceptionBehavior() const
LLVM_ABI unsigned getNonMetadataArgCount() const
DWARF expression.
LLVM_ABI bool isEntryValue() const
Check if the expression consists of exactly one entry value operand.
static LLVM_ABI DIExpression * append(const DIExpression *Expr, ArrayRef< uint64_t > Ops)
Append the opcodes Ops to DIExpr.
LLVM_ABI bool startsWithDeref() const
Return whether the first element a DW_OP_deref.
ArrayRef< uint64_t > getElements() const
bool isValidLocationForIntrinsic(const DILocation *DL) const
Check that a location is valid for this label.
A parsed version of the target data layout string in and methods for querying it.
Definition DataLayout.h:64
Value * getAddress() const
DILabel * getLabel() const
DebugLoc getDebugLoc() const
Value * getValue(unsigned OpIdx=0) const
DILocalVariable * getVariable() const
DIExpression * getExpression() const
LLVM_ABI Value * getVariableLocationOp(unsigned OpIdx) const
DIExpression * getExpression() const
DILocalVariable * getVariable() const
A debug info location.
Definition DebugLoc.h:124
Class representing an expression and its matching format.
This instruction extracts a struct member or array element value from an aggregate value.
static LLVM_ABI FixedVectorType * get(Type *ElementType, unsigned NumElts)
Definition Type.cpp:869
bool skipFunction(const Function &F) const
Optional passes call this function to check whether the pass should be skipped.
Definition Pass.cpp:193
const BasicBlock & getEntryBlock() const
Definition Function.h:809
DISubprogram * getSubprogram() const
Get the attached subprogram.
bool hasMinSize() const
Optimize this function for minimum size (-Oz).
Definition Function.h:711
Constant * getPersonalityFn() const
Get the personality function associated with this function.
const Function & getFunction() const
Definition Function.h:166
bool isIntrinsic() const
isIntrinsic - Returns true if the function's name starts with "llvm.".
Definition Function.h:251
The actual analysis pass wrapper.
Definition CSEInfo.h:242
Simple wrapper that does the following.
Definition CSEInfo.h:212
The CSE Analysis object.
Definition CSEInfo.h:72
Abstract class that contains various methods for clients to notify about changes.
Simple wrapper observer that takes several observers, and calls each one for each event.
void removeObserver(GISelChangeObserver *O)
void addObserver(GISelChangeObserver *O)
static StringRef dropLLVMManglingEscape(StringRef Name)
If the given string begins with the GlobalValue name mangling escape character '\1',...
bool hasExternalWeakLinkage() const
bool hasDLLImportStorageClass() const
Module * getParent()
Get the module that this global value is contained inside of...
bool isTailCall(const MachineInstr &MI) const override
bool runOnMachineFunction(MachineFunction &MF) override
runOnMachineFunction - This method must be overloaded to perform the desired machine code transformat...
IRTranslator(CodeGenOptLevel OptLevel=CodeGenOptLevel::None)
void getAnalysisUsage(AnalysisUsage &AU) const override
getAnalysisUsage - This function should be overriden by passes that need analysis information to do t...
bool lowerInlineAsm(MachineIRBuilder &MIRBuilder, const CallBase &CB, std::function< ArrayRef< Register >(const Value &Val)> GetOrCreateVRegs) const
Lower the given inline asm call instruction GetOrCreateVRegs is a callback to materialize a register ...
This instruction inserts a struct field of array element value into an aggregate value.
iterator_range< simple_ilist< DbgRecord >::iterator > getDbgRecordRange() const
Return a range over the DbgRecords attached to this instruction.
const DebugLoc & getDebugLoc() const
Return the debug location for this node as a DebugLoc.
LLVM_ABI const Module * getModule() const
Return the module owning the function this instruction belongs to or nullptr it the function does not...
MDNode * getMetadata(unsigned KindID) const
Get the metadata of given kind attached to this Instruction.
LLVM_ABI AAMDNodes getAAMetadata() const
Returns the AA metadata for this instruction.
unsigned getOpcode() const
Returns a member of one of the enums like Instruction::Add.
LLVM_ABI bool hasAllowReassoc() const LLVM_READONLY
Determine whether the allow-reassociation flag is set.
Intrinsic::ID getIntrinsicID() const
Return the intrinsic ID of this intrinsic.
static bool getUseExtended()
constexpr LLT changeElementType(LLT NewEltTy) const
If this type is a vector, return a vector with the same number of elements but the new element type.
static constexpr LLT scalar(unsigned SizeInBits)
Get a low-level scalar or aggregate "bag of bits".
constexpr uint16_t getNumElements() const
Returns the number of elements in a vector LLT.
constexpr bool isVector() const
static constexpr LLT pointer(unsigned AddressSpace, unsigned SizeInBits)
Get a low-level pointer in the given address space.
constexpr TypeSize getSizeInBits() const
Returns the total size of the type. Must only be called on sized types.
constexpr bool isPointer() const
static constexpr LLT fixed_vector(unsigned NumElements, unsigned ScalarSizeInBits)
Get a low-level fixed-width vector of some number of elements and element width.
constexpr bool isFixedVector() const
Returns true if the LLT is a fixed vector.
static LLT integer(unsigned SizeInBits)
LLT changeElementSize(unsigned NewEltSize) const
If this type is a vector, return a vector with the same number of elements but the new element size.
LLVM_ABI void diagnose(const DiagnosticInfo &DI)
Report a message to the currently installed diagnostic handler.
Value * getPointerOperand()
AtomicOrdering getOrdering() const
Returns the ordering constraint of this load instruction.
SyncScope::ID getSyncScopeID() const
Returns the synchronization scope ID of this load instruction.
static LocationSize precise(uint64_t Value)
static MDTuple * get(LLVMContext &Context, ArrayRef< Metadata * > MDs)
Definition Metadata.h:1561
void normalizeSuccProbs()
Normalize probabilities of all successors so that the sum of them becomes one.
LLVM_ABI instr_iterator insert(instr_iterator I, MachineInstr *M)
Insert MI into the instruction list before I, possibly inside a bundle.
void push_back(MachineInstr *MI)
const BasicBlock * getBasicBlock() const
Return the LLVM basic block that this instance corresponded to originally.
LLVM_ABI void setSuccProbability(succ_iterator I, BranchProbability Prob)
Set successor probability of a given iterator.
LLVM_ABI void addSuccessor(MachineBasicBlock *Succ, BranchProbability Prob=BranchProbability::getUnknown())
Add Succ as a successor of this MachineBasicBlock.
SmallVectorImpl< MachineBasicBlock * >::iterator succ_iterator
LLVM_ABI void sortUniqueLiveIns()
Sorts and uniques the LiveIns vector.
LLVM_ABI bool isPredecessor(const MachineBasicBlock *MBB) const
Return true if the specified MBB is a predecessor of this block.
void addLiveIn(MCRegister PhysReg, LaneBitmask LaneMask=LaneBitmask::getAll())
Adds the specified register as a live in.
const MachineFunction * getParent() const
Return the MachineFunction containing this basic block.
void splice(iterator Where, MachineBasicBlock *Other, iterator From)
Take an instruction from MBB 'Other' at the position From, and insert it into this MBB right before '...
MachineInstrBundleIterator< MachineInstr > iterator
void setIsEHPad(bool V=true)
Indicates the block is a landing pad.
int getStackProtectorIndex() const
Return the index for the stack protector object.
void getAnalysisUsage(AnalysisUsage &AU) const override
getAnalysisUsage - Subclasses that override getAnalysisUsage must call this.
MachineFrameInfo & getFrameInfo()
getFrameInfo - Return the frame info object for the current function.
Function & getFunction()
Return the LLVM function that this machine code represents.
BasicBlockListType::iterator iterator
MachineBasicBlock * CreateMachineBasicBlock(const BasicBlock *BB=nullptr, std::optional< UniqueBBID > BBID=std::nullopt)
CreateMachineInstr - Allocate a new MachineInstr.
void insert(iterator MBBI, MachineBasicBlock *MBB)
Helper class to build MachineInstr.
MachineInstrBuilder buildFPTOUI_SAT(const DstOp &Dst, const SrcOp &Src0)
Build and insert Res = G_FPTOUI_SAT Src0.
MachineInstrBuilder buildFMul(const DstOp &Dst, const SrcOp &Src0, const SrcOp &Src1, std::optional< unsigned > Flags=std::nullopt)
MachineInstrBuilder buildFreeze(const DstOp &Dst, const SrcOp &Src)
Build and insert Dst = G_FREEZE Src.
MachineInstrBuilder buildBr(MachineBasicBlock &Dest)
Build and insert G_BR Dest.
MachineInstrBuilder buildModf(const DstOp &Fract, const DstOp &Int, const SrcOp &Src, std::optional< unsigned > Flags=std::nullopt)
Build and insert Fract, Int = G_FMODF Src.
LLVMContext & getContext() const
MachineInstrBuilder buildAdd(const DstOp &Dst, const SrcOp &Src0, const SrcOp &Src1, std::optional< unsigned > Flags=std::nullopt)
Build and insert Res = G_ADD Op0, Op1.
MachineInstrBuilder buildUndef(const DstOp &Res)
Build and insert Res = IMPLICIT_DEF.
MachineInstrBuilder buildResetFPMode()
Build and insert G_RESET_FPMODE.
MachineInstrBuilder buildFPTOSI_SAT(const DstOp &Dst, const SrcOp &Src0)
Build and insert Res = G_FPTOSI_SAT Src0.
MachineInstrBuilder buildUCmp(const DstOp &Res, const SrcOp &Op0, const SrcOp &Op1)
Build and insert a Res = G_UCMP Op0, Op1.
MachineInstrBuilder buildJumpTable(const LLT PtrTy, unsigned JTI)
Build and insert Res = G_JUMP_TABLE JTI.
MachineInstrBuilder buildGetRounding(const DstOp &Dst)
Build and insert Dst = G_GET_ROUNDING.
MachineInstrBuilder buildSCmp(const DstOp &Res, const SrcOp &Op0, const SrcOp &Op1)
Build and insert a Res = G_SCMP Op0, Op1.
MachineInstrBuilder buildFence(unsigned Ordering, unsigned Scope)
Build and insert G_FENCE Ordering, Scope.
MachineInstrBuilder buildSelect(const DstOp &Res, const SrcOp &Tst, const SrcOp &Op0, const SrcOp &Op1, std::optional< unsigned > Flags=std::nullopt)
Build and insert a Res = G_SELECT Tst, Op0, Op1.
MachineInstrBuilder buildFMA(const DstOp &Dst, const SrcOp &Src0, const SrcOp &Src1, const SrcOp &Src2, std::optional< unsigned > Flags=std::nullopt)
Build and insert Res = G_FMA Op0, Op1, Op2.
MachineInstrBuilder buildMul(const DstOp &Dst, const SrcOp &Src0, const SrcOp &Src1, std::optional< unsigned > Flags=std::nullopt)
Build and insert Res = G_MUL Op0, Op1.
MachineInstrBuilder buildInsertSubvector(const DstOp &Res, const SrcOp &Src0, const SrcOp &Src1, unsigned Index)
Build and insert Res = G_INSERT_SUBVECTOR Src0, Src1, Idx.
MachineInstrBuilder buildAnd(const DstOp &Dst, const SrcOp &Src0, const SrcOp &Src1)
Build and insert Res = G_AND Op0, Op1.
MachineInstrBuilder buildCast(const DstOp &Dst, const SrcOp &Src)
Build and insert an appropriate cast between two registers of equal size.
MachineInstrBuilder buildICmp(CmpInst::Predicate Pred, const DstOp &Res, const SrcOp &Op0, const SrcOp &Op1, std::optional< unsigned > Flags=std::nullopt)
Build and insert a Res = G_ICMP Pred, Op0, Op1.
MachineBasicBlock::iterator getInsertPt()
Current insertion point for new instructions.
MachineInstrBuilder buildSExtOrTrunc(const DstOp &Res, const SrcOp &Op)
Build and insert Res = G_SEXT Op, Res = G_TRUNC Op, or Res = COPY Op depending on the differing sizes...
MachineInstrBuilder buildAtomicRMW(unsigned Opcode, const DstOp &OldValRes, const SrcOp &Addr, const SrcOp &Val, MachineMemOperand &MMO)
Build and insert OldValRes<def> = G_ATOMICRMW_<Opcode> Addr, Val, MMO.
MachineInstrBuilder buildSub(const DstOp &Dst, const SrcOp &Src0, const SrcOp &Src1, std::optional< unsigned > Flags=std::nullopt)
Build and insert Res = G_SUB Op0, Op1.
MachineInstrBuilder buildIntrinsic(Intrinsic::ID ID, ArrayRef< Register > Res, bool HasSideEffects, bool isConvergent)
Build and insert a G_INTRINSIC instruction.
MachineInstrBuilder buildVScale(const DstOp &Res, unsigned MinElts)
Build and insert Res = G_VSCALE MinElts.
MachineInstrBuilder buildSplatBuildVector(const DstOp &Res, const SrcOp &Src)
Build and insert Res = G_BUILD_VECTOR with Src replicated to fill the number of elements.
MachineInstrBuilder buildSetFPMode(const SrcOp &Src)
Build and insert G_SET_FPMODE Src.
MachineInstrBuilder buildIndirectDbgValue(Register Reg, const MDNode *Variable, const MDNode *Expr)
Build and insert a DBG_VALUE instruction expressing the fact that the associated Variable lives in me...
MachineInstrBuilder buildBuildVector(const DstOp &Res, ArrayRef< Register > Ops)
Build and insert Res = G_BUILD_VECTOR Op0, ...
MachineInstrBuilder buildConstDbgValue(const Constant &C, const MDNode *Variable, const MDNode *Expr)
Build and insert a DBG_VALUE instructions specifying that Variable is given by C (suitably modified b...
MachineInstrBuilder buildBrCond(const SrcOp &Tst, MachineBasicBlock &Dest)
Build and insert G_BRCOND Tst, Dest.
std::optional< MachineInstrBuilder > materializeObjectPtrOffset(Register &Res, Register Op0, const LLT ValueTy, uint64_t Value)
Materialize and insert an instruction with appropriate flags for addressing some offset of an object,...
MachineInstrBuilder buildSetRounding(const SrcOp &Src)
Build and insert G_SET_ROUNDING.
MachineInstrBuilder buildExtractVectorElement(const DstOp &Res, const SrcOp &Val, const SrcOp &Idx)
Build and insert Res = G_EXTRACT_VECTOR_ELT Val, Idx.
MachineInstrBuilder buildLoad(const DstOp &Res, const SrcOp &Addr, MachineMemOperand &MMO)
Build and insert Res = G_LOAD Addr, MMO.
MachineInstrBuilder buildPtrAdd(const DstOp &Res, const SrcOp &Op0, const SrcOp &Op1, std::optional< unsigned > Flags=std::nullopt)
Build and insert Res = G_PTR_ADD Op0, Op1.
MachineInstrBuilder buildZExtOrTrunc(const DstOp &Res, const SrcOp &Op)
Build and insert Res = G_ZEXT Op, Res = G_TRUNC Op, or Res = COPY Op depending on the differing sizes...
MachineInstrBuilder buildExtractVectorElementConstant(const DstOp &Res, const SrcOp &Val, const int Idx)
Build and insert Res = G_EXTRACT_VECTOR_ELT Val, Idx.
MachineInstrBuilder buildShl(const DstOp &Dst, const SrcOp &Src0, const SrcOp &Src1, std::optional< unsigned > Flags=std::nullopt)
MachineInstrBuilder buildStore(const SrcOp &Val, const SrcOp &Addr, MachineMemOperand &MMO)
Build and insert G_STORE Val, Addr, MMO.
MachineInstrBuilder buildInstr(unsigned Opcode)
Build and insert <empty> = Opcode <empty>.
MachineInstrBuilder buildFrameIndex(const DstOp &Res, int Idx)
Build and insert Res = G_FRAME_INDEX Idx.
MachineInstrBuilder buildDirectDbgValue(Register Reg, const MDNode *Variable, const MDNode *Expr)
Build and insert a DBG_VALUE instruction expressing the fact that the associated Variable lives in Re...
MachineInstrBuilder buildDbgLabel(const MDNode *Label)
Build and insert a DBG_LABEL instructions specifying that Label is given.
MachineInstrBuilder buildBrJT(Register TablePtr, unsigned JTI, Register IndexReg)
Build and insert G_BRJT TablePtr, JTI, IndexReg.
MachineInstrBuilder buildDynStackAlloc(const DstOp &Res, const SrcOp &Size, Align Alignment)
Build and insert Res = G_DYN_STACKALLOC Size, Align.
MachineInstrBuilder buildFIDbgValue(int FI, const MDNode *Variable, const MDNode *Expr)
Build and insert a DBG_VALUE instruction expressing the fact that the associated Variable lives in th...
MachineInstrBuilder buildResetFPEnv()
Build and insert G_RESET_FPENV.
void setDebugLoc(const DebugLoc &DL)
Set the debug location to DL for all the next build instructions.
const MachineBasicBlock & getMBB() const
Getter for the basic block we currently build.
MachineInstrBuilder buildInsertVectorElement(const DstOp &Res, const SrcOp &Val, const SrcOp &Elt, const SrcOp &Idx)
Build and insert Res = G_INSERT_VECTOR_ELT Val, Elt, Idx.
MachineInstrBuilder buildAtomicCmpXchgWithSuccess(const DstOp &OldValRes, const DstOp &SuccessRes, const SrcOp &Addr, const SrcOp &CmpVal, const SrcOp &NewVal, MachineMemOperand &MMO)
Build and insert OldValRes<def>, SuccessRes<def> = / G_ATOMIC_CMPXCHG_WITH_SUCCESS Addr,...
void setMBB(MachineBasicBlock &MBB)
Set the insertion point to the end of MBB.
const DebugLoc & getDebugLoc()
Get the current instruction's debug location.
MachineInstrBuilder buildTrap(bool Debug=false)
Build and insert G_TRAP or G_DEBUGTRAP.
MachineInstrBuilder buildFFrexp(const DstOp &Fract, const DstOp &Exp, const SrcOp &Src, std::optional< unsigned > Flags=std::nullopt)
Build and insert Fract, Exp = G_FFREXP Src.
MachineInstrBuilder buildFSincos(const DstOp &Sin, const DstOp &Cos, const SrcOp &Src, std::optional< unsigned > Flags=std::nullopt)
Build and insert Sin, Cos = G_FSINCOS Src.
MachineInstrBuilder buildShuffleVector(const DstOp &Res, const SrcOp &Src1, const SrcOp &Src2, ArrayRef< int > Mask)
Build and insert Res = G_SHUFFLE_VECTOR Src1, Src2, Mask.
MachineInstrBuilder buildInstrNoInsert(unsigned Opcode)
Build but don't insert <empty> = Opcode <empty>.
MachineInstrBuilder buildCopy(const DstOp &Res, const SrcOp &Op)
Build and insert Res = COPY Op.
MachineInstrBuilder buildPrefetch(const SrcOp &Addr, unsigned RW, unsigned Locality, unsigned CacheType, MachineMemOperand &MMO)
Build and insert G_PREFETCH Addr, RW, Locality, CacheType.
MachineInstrBuilder buildExtractSubvector(const DstOp &Res, const SrcOp &Src, unsigned Index)
Build and insert Res = G_EXTRACT_SUBVECTOR Src, Idx0.
const DataLayout & getDataLayout() const
MachineInstrBuilder buildBrIndirect(Register Tgt)
Build and insert G_BRINDIRECT Tgt.
MachineInstrBuilder buildSplatVector(const DstOp &Res, const SrcOp &Val)
Build and insert Res = G_SPLAT_VECTOR Val.
MachineInstrBuilder buildStepVector(const DstOp &Res, unsigned Step)
Build and insert Res = G_STEP_VECTOR Step.
virtual MachineInstrBuilder buildConstant(const DstOp &Res, const ConstantInt &Val)
Build and insert Res = G_CONSTANT Val.
MachineInstrBuilder buildFCmp(CmpInst::Predicate Pred, const DstOp &Res, const SrcOp &Op0, const SrcOp &Op1, std::optional< unsigned > Flags=std::nullopt)
Build and insert a Res = G_FCMP PredOp0, Op1.
MachineInstrBuilder buildFAdd(const DstOp &Dst, const SrcOp &Src0, const SrcOp &Src1, std::optional< unsigned > Flags=std::nullopt)
Build and insert Res = G_FADD Op0, Op1.
MachineInstrBuilder buildSetFPEnv(const SrcOp &Src)
Build and insert G_SET_FPENV Src.
Register getReg(unsigned Idx) const
Get the register for the operand index.
const MachineInstrBuilder & addExternalSymbol(const char *FnName, unsigned TargetFlags=0) const
const MachineInstrBuilder & addUse(Register RegNo, RegState Flags={}, unsigned SubReg=0) const
Add a virtual register use operand.
const MachineInstrBuilder & addImm(int64_t Val) const
Add a new immediate operand.
const MachineInstrBuilder & addMetadata(const MDNode *MD) const
const MachineInstrBuilder & addSym(MCSymbol *Sym, unsigned char TargetFlags=0) const
const MachineInstrBuilder & addFrameIndex(int Idx) const
const MachineInstrBuilder & addFPImm(const ConstantFP *Val) const
const MachineInstrBuilder & addMBB(MachineBasicBlock *MBB, unsigned TargetFlags=0) const
const MachineInstrBuilder & addDef(Register RegNo, RegState Flags={}, unsigned SubReg=0) const
Add a virtual register definition operand.
const MachineInstrBuilder & addMemOperand(MachineMemOperand *MMO) const
MachineInstr * getInstr() const
If conversion operators fail, use this method to get the MachineInstr explicitly.
LLVM_ABI void copyIRFlags(const Instruction &I)
Copy all flags to MachineInst MIFlags.
static LLVM_ABI uint32_t copyFlagsFromInstruction(const Instruction &I)
LLVM_ABI void setDeactivationSymbol(MachineFunction &MF, Value *DS)
void setDebugLoc(DebugLoc DL)
Replace current source information with new such.
Flags
Flags values. These may be or'd together.
@ MOVolatile
The memory access is volatile.
@ MODereferenceable
The memory access is dereferenceable (i.e., doesn't trap).
@ MOLoad
The memory access reads data.
@ MOInvariant
The memory access always returns the same value (or traps).
@ MOStore
The memory access writes data.
static MachineOperand CreateES(const char *SymName, unsigned TargetFlags=0)
static MachineOperand CreateGA(const GlobalValue *GV, int64_t Offset, unsigned TargetFlags=0)
LLVM_ABI Register createGenericVirtualRegister(LLT Ty, StringRef Name="")
Create and return a new generic virtual register with low-level type Ty.
The optimization diagnostic interface.
Diagnostic information for missed-optimization remarks.
BasicBlock * getIncomingBlock(unsigned i) const
Return incoming basic block number i.
Value * getIncomingValue(unsigned i) const
Return incoming value number x.
unsigned getNumIncomingValues() const
Return the number of incoming edges.
AnalysisType & getAnalysis() const
getAnalysis<AnalysisType>() - This function is used by subclasses to get to the analysis information ...
static PointerType * getUnqual(Type *ElementType)
This constructs a pointer to an object of the specified type in the default address space (address sp...
Class to install both of the above.
Wrapper class representing virtual and physical registers.
Definition Register.h:20
Value * getReturnValue() const
Convenience accessor. Returns null if there is no return value.
size_type count(ConstPtrType Ptr) const
count - Return 1 if the specified pointer is in the set, 0 otherwise.
std::pair< iterator, bool > insert(PtrType Ptr)
Inserts Ptr if and only if there is no element in the container equal to Ptr.
This class consists of common code factored out of the SmallVector class to reduce code duplication b...
void push_back(const T &Elt)
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small.
Encapsulates all of the information needed to generate a stack protector check, and signals to isel w...
MachineBasicBlock * getSuccessMBB()
MachineBasicBlock * getFailureMBB()
constexpr bool empty() const
Check if the string is empty.
Definition StringRef.h:141
constexpr const char * data() const
Get a pointer to the start of the string (which may not be null terminated).
Definition StringRef.h:138
Primary interface to the complete machine description for the target machine.
const Triple & getTargetTriple() const
TargetOptions Options
const Target & getTarget() const
unsigned NoTrapAfterNoreturn
Do not emit a trap instruction for 'unreachable' IR instructions behind noreturn calls,...
unsigned TrapUnreachable
Emit target-specific trap instruction for 'unreachable' IR instructions.
FPOpFusion::FPOpFusionMode AllowFPOpFusion
AllowFPOpFusion - This flag is set by the -fp-contract=xxx option.
Target-Independent Code Generator Pass Configuration Options.
TargetSubtargetInfo - Generic base class for all target subtargets.
virtual const CallLowering * getCallLowering() const
virtual const TargetLowering * getTargetLowering() const
bool isSPIRV() const
Tests whether the target is SPIR-V (32/64-bit/Logical).
Definition Triple.h:891
Twine - A lightweight data structure for efficiently representing the concatenation of temporary valu...
Definition Twine.h:82
static constexpr TypeSize getZero()
Definition TypeSize.h:349
The instances of the Type class are immutable: once they are created, they are never changed.
Definition Type.h:46
LLVM_ABI bool isEmptyTy() const
Return true if this type is empty, that is, it has no elements or all of its elements are empty.
Definition Type.cpp:180
bool isByteTy() const
True if this is an instance of ByteType.
Definition Type.h:242
static LLVM_ABI IntegerType * getInt32Ty(LLVMContext &C)
Definition Type.cpp:309
bool isPointerTy() const
True if this is an instance of PointerType.
Definition Type.h:282
static LLVM_ABI Type * getVoidTy(LLVMContext &C)
Definition Type.cpp:282
bool isSized(SmallPtrSetImpl< Type * > *Visited=nullptr) const
Return true if it makes sense to take the size of this type.
Definition Type.h:326
bool isAggregateType() const
Return true if the type is an aggregate type.
Definition Type.h:319
bool isTokenTy() const
Return true if this is 'token'.
Definition Type.h:236
bool isVoidTy() const
Return true if this is 'void'.
Definition Type.h:141
BasicBlock * getSuccessor(unsigned i=0) const
Value * getOperand(unsigned i) const
Definition User.h:207
LLVM Value Representation.
Definition Value.h:75
Type * getType() const
All values are typed, get the type of this value.
Definition Value.h:255
bool hasOneUse() const
Return true if there is exactly one use of this value.
Definition Value.h:439
LLVMContext & getContext() const
All values hold a context through their type.
Definition Value.h:258
LLVM_ABI const Value * stripPointerCasts() const
Strip off pointer casts, all-zero GEPs and address space casts.
Definition Value.cpp:713
constexpr ScalarTy getFixedValue() const
Definition TypeSize.h:200
constexpr bool isScalable() const
Returns whether the quantity is scaled by a runtime quantity (vscale).
Definition TypeSize.h:168
constexpr ScalarTy getKnownMinValue() const
Returns the minimum value this quantity can represent.
Definition TypeSize.h:165
constexpr bool isZero() const
Definition TypeSize.h:153
const ParentTy * getParent() const
Definition ilist_node.h:34
NodeTy * getNextNode()
Get the next node, or nullptr for the list tail.
Definition ilist_node.h:348
A raw_ostream that writes to an std::string.
#define llvm_unreachable(msg)
Marks that the current location is not supposed to be reachable.
constexpr char Align[]
Key for Kernel::Arg::Metadata::mAlign.
constexpr char Args[]
Key for Kernel::Metadata::mArgs.
constexpr char SymbolName[]
Key for Kernel::Metadata::mSymbolName.
constexpr std::underlying_type_t< E > Mask()
Get a bitmask with 1s in all places up to the high-order bit of E's largest value.
unsigned ID
LLVM IR allows to use arbitrary numbers as calling convention identifiers.
Definition CallingConv.h:24
@ C
The default llvm calling convention, compatible with C.
Definition CallingConv.h:34
@ BasicBlock
Various leaf nodes.
Definition ISDOpcodes.h:81
BinaryOp_match< SrcTy, SpecificConstantMatch, TargetOpcode::G_XOR, true > m_Not(const SrcTy &&Src)
Matches a register not-ed by a G_XOR.
OneUse_match< SubPat > m_OneUse(const SubPat &SP)
bool match(Val *V, const Pattern &P)
specificval_ty m_Specific(const Value *V)
Match if we have a specific specified value.
TwoOps_match< Val_t, Idx_t, Instruction::ExtractElement > m_ExtractElt(const Val_t &Val, const Idx_t &Idx)
Matches ExtractElementInst.
auto m_Value()
Match an arbitrary value and ignore it.
auto m_LogicalOr()
Matches L || R where L and R are arbitrary values.
auto m_LogicalAnd()
Matches L && R where L and R are arbitrary values.
Offsets
Offsets in bytes from the start of the input buffer.
LLVM_ABI void sortAndRangeify(CaseClusterVector &Clusters)
Sort Clusters and merge adjacent cases.
std::vector< CaseCluster > CaseClusterVector
@ CC_Range
A cluster of adjacent case labels with the same destination, or just one case.
@ CC_JumpTable
A cluster of cases suitable for jump table lowering.
@ CC_BitTests
A cluster of cases suitable for bit test lowering.
SmallVector< SwitchWorkListItem, 4 > SwitchWorkList
CaseClusterVector::iterator CaseClusterIt
@ CE
Windows NT (Windows on ARM)
Definition MCAsmInfo.h:50
initializer< Ty > init(const Ty &Val)
ExceptionBehavior
Exception behavior used for floating point operations.
Definition FPEnv.h:39
@ ebIgnore
This corresponds to "fpexcept.ignore".
Definition FPEnv.h:40
DiagnosticInfoOptimizationBase::Argument NV
NodeAddr< PhiNode * > Phi
Definition RDFGraph.h:390
NodeAddr< CodeNode * > Code
Definition RDFGraph.h:388
friend class Instruction
Iterator for Instructions in a `BasicBlock.
Definition BasicBlock.h:73
BaseReg
Stack frame base register. Bit 0 of FREInfo.Info.
Definition SFrame.h:77
This is an optimization pass for GlobalISel generic memory operations.
auto drop_begin(T &&RangeOrContainer, size_t N=1)
Return a range covering RangeOrContainer with the first N elements excluded.
Definition STLExtras.h:315
@ Low
Lower the current thread's priority such that it does not affect foreground tasks significantly.
Definition Threading.h:280
@ Offset
Definition DWP.cpp:558
FunctionAddr VTableAddr Value
Definition InstrProf.h:137
@ Implicit
Not emitted register (e.g. carry, or temporary result).
@ Undef
Value of the register doesn't matter.
auto enumerate(FirstRange &&First, RestRanges &&...Rest)
Given two or more input ranges, returns a new range whose values are tuples (A, B,...
Definition STLExtras.h:2553
decltype(auto) dyn_cast(const From &Val)
dyn_cast<X> - Return the argument parameter cast to the specified type.
Definition Casting.h:643
int countr_one(T Value)
Count the number of ones from the least significant bit to the first zero bit.
Definition bit.h:315
FunctionAddr VTableAddr uintptr_t uintptr_t Int32Ty
Definition InstrProf.h:328
LLVM_ABI void diagnoseDontCall(const CallInst &CI)
auto successors(const MachineBasicBlock *BB)
LLVM_ABI MVT getMVTForLLT(LLT Ty)
Get a rough equivalent of an MVT for a given LLT.
void append_range(Container &C, Range &&R)
Wrapper function to append range R to container C.
Definition STLExtras.h:2207
constexpr bool isUIntN(unsigned N, uint64_t x)
Checks if an unsigned integer fits into the given (dynamic) bit width.
Definition MathExtras.h:243
gep_type_iterator gep_type_end(const User *GEP)
LLVM_ABI MachineBasicBlock::iterator findSplitPointForStackProtector(MachineBasicBlock *BB, const TargetInstrInfo &TII)
Find the split point at which to splice the end of BB into its success stack protector check machine ...
LLVM_ABI LLT getLLTForMVT(MVT Ty)
Get a rough equivalent of an LLT for a given MVT.
constexpr int popcount(T Value) noexcept
Count the number of set bits in a value.
Definition bit.h:156
int countr_zero(T Val)
Count number of 0's from the least significant bit to the most stopping at the first 1.
Definition bit.h:204
Align getKnownAlignment(Value *V, const DataLayout &DL, const Instruction *CxtI=nullptr, AssumptionCache *AC=nullptr, const DominatorTree *DT=nullptr)
Try to infer an alignment for the specified pointer.
Definition Local.h:252
constexpr bool has_single_bit(T Value) noexcept
Definition bit.h:149
bool any_of(R &&range, UnaryPredicate P)
Provide wrappers to std::any_of which take ranges instead of having to pass begin/end explicitly.
Definition STLExtras.h:1745
LLVM_ABI llvm::SmallVector< int, 16 > createStrideMask(unsigned Start, unsigned Stride, unsigned VF)
Create a stride shuffle mask.
auto reverse(ContainerTy &&C)
Definition STLExtras.h:407
void sort(IteratorTy Start, IteratorTy End)
Definition STLExtras.h:1635
LLVM_ABI raw_ostream & dbgs()
dbgs() - This returns a reference to a raw_ostream for debugging messages.
Definition Debug.cpp:209
LLVM_ABI void report_fatal_error(Error Err, bool gen_crash_diag=true)
Definition Error.cpp:163
generic_gep_type_iterator<> gep_type_iterator
auto succ_size(const MachineBasicBlock *BB)
LLVM_ABI EHPersonality classifyEHPersonality(const Value *Pers)
See if the given exception handling personality function is one that we understand.
CodeGenOptLevel
Code generation optimization level.
Definition CodeGen.h:82
class LLVM_GSL_OWNER SmallVector
Forward declaration of SmallVector so that calculateSmallVectorDefaultInlinedElements can reference s...
bool isa(const From &Val)
isa<X> - Return true if the parameter to the template is an instance of one of the template type argu...
Definition Casting.h:547
@ Success
The lock was released successfully.
LLVM_ATTRIBUTE_VISIBILITY_DEFAULT AnalysisKey InnerAnalysisManagerProxy< AnalysisManagerT, IRUnitT, ExtraArgTs... >::Key
@ Global
Append to llvm.global_dtors.
@ First
Helpers to iterate all locations in the MemoryEffectsBase class.
Definition ModRef.h:74
LLVM_ABI void getSelectionDAGFallbackAnalysisUsage(AnalysisUsage &AU)
Modify analysis usage so it preserves passes required for the SelectionDAG fallback.
Definition Utils.cpp:1150
auto lower_bound(R &&Range, T &&Value)
Provide wrappers to std::lower_bound which take ranges instead of having to pass begin/end explicitly...
Definition STLExtras.h:2051
LLVM_ABI llvm::SmallVector< int, 16 > createInterleaveMask(unsigned VF, unsigned NumVecs)
Create an interleave shuffle mask.
@ FMul
Product of floats.
@ Sub
Subtraction of integers.
DWARFExpression::Operation Op
ArrayRef(const T &OneElt) -> ArrayRef< T >
bool isAsynchronousEHPersonality(EHPersonality Pers)
Returns true if this personality function catches asynchronous exceptions.
decltype(auto) cast(const From &Val)
cast<X> - Return the argument parameter cast to the specified type.
Definition Casting.h:559
LLVM_ABI std::optional< RoundingMode > convertStrToRoundingMode(StringRef)
Returns a valid RoundingMode enumerator when given a string that is valid as input in constrained int...
Definition FPEnv.cpp:25
gep_type_iterator gep_type_begin(const User *GEP)
LLVM_ABI void computeValueLLTs(const DataLayout &DL, Type &Ty, SmallVectorImpl< LLT > &ValueLLTs, SmallVectorImpl< TypeSize > *Offsets=nullptr, TypeSize StartingOffset=TypeSize::getZero())
computeValueLLTs - Given an LLVM IR type, compute a sequence of LLTs that represent all the individua...
Definition Analysis.cpp:153
LLVM_ABI GlobalValue * ExtractTypeInfo(Value *V)
ExtractTypeInfo - Returns the type info, possibly bitcast, encoded in V.
Definition Analysis.cpp:181
Align commonAlignment(Align A, uint64_t Offset)
Returns the alignment that satisfies both alignments.
Definition Alignment.h:201
LLVM_ABI LLT getLLTForType(Type &Ty, const DataLayout &DL)
Construct a low-level type based on an LLVM type.
void swap(llvm::BitVector &LHS, llvm::BitVector &RHS)
Implement std::swap in terms of BitVector swap.
Definition BitVector.h:862
This struct is a compact representation of a valid (non-zero power of two) alignment.
Definition Alignment.h:39
constexpr uint64_t value() const
This is a hole in the type system and should not be abused.
Definition Alignment.h:77
Pair of physical register and lane mask.
static LLVM_ABI MachinePointerInfo getFixedStack(MachineFunction &MF, int FI, int64_t Offset=0)
Return a MachinePointerInfo record that refers to the specified FrameIndex.
static bool canHandle(const Instruction *I, const TargetLibraryInfo &TLI)
static StringRef getLibcallImplName(RTLIB::LibcallImpl CallImpl)
Get the libcall routine name for the specified libcall implementation.
This structure is used to communicate between SelectionDAGBuilder and SDISel for the code generation ...
Register Reg
The virtual register containing the index of the jump table entry to jump to.
MachineBasicBlock * Default
The MBB of the default bb, which is a successor of the range check MBB.
unsigned JTI
The JumpTableIndex for this jump table in the function.
MachineBasicBlock * MBB
The MBB into which to emit the code for the indirect jump.