LLVM 23.0.0git
AArch64CallLowering.cpp
Go to the documentation of this file.
1//===--- AArch64CallLowering.cpp - Call lowering --------------------------===//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7//===----------------------------------------------------------------------===//
8///
9/// \file
10/// This file implements the lowering of LLVM calls to machine code calls for
11/// GlobalISel.
12///
13//===----------------------------------------------------------------------===//
14
15#include "AArch64CallLowering.h"
17#include "AArch64ISelLowering.h"
19#include "AArch64RegisterInfo.h"
21#include "AArch64Subtarget.h"
23#include "llvm/ADT/ArrayRef.h"
45#include "llvm/IR/Argument.h"
46#include "llvm/IR/Attributes.h"
47#include "llvm/IR/Function.h"
48#include "llvm/IR/Type.h"
49#include "llvm/IR/Value.h"
50#include <algorithm>
51#include <cassert>
52#include <cstdint>
53
54#define DEBUG_TYPE "aarch64-call-lowering"
55
56using namespace llvm;
57using namespace AArch64GISelUtils;
58
60
63
64static void applyStackPassedSmallTypeDAGHack(EVT OrigVT, MVT &ValVT,
65 MVT &LocVT) {
66 // If ValVT is i1/i8/i16, we should set LocVT to i8/i8/i16. This is a legacy
67 // hack because the DAG calls the assignment function with pre-legalized
68 // register typed values, not the raw type.
69 //
70 // This hack is not applied to return values which are not passed on the
71 // stack.
72 if (OrigVT == MVT::i1 || OrigVT == MVT::i8)
73 ValVT = LocVT = MVT::i8;
74 else if (OrigVT == MVT::i16)
75 ValVT = LocVT = MVT::i16;
76}
77
78// Account for i1/i8/i16 stack passed value hack
80 const MVT ValVT = VA.getValVT();
81 return (ValVT == MVT::i8 || ValVT == MVT::i16) ? LLT(ValVT)
82 : LLT(VA.getLocVT());
83}
84
85namespace {
86
87struct AArch64IncomingValueAssigner
89 AArch64IncomingValueAssigner(CCAssignFn *AssignFn_,
90 CCAssignFn *AssignFnVarArg_)
91 : IncomingValueAssigner(AssignFn_, AssignFnVarArg_) {}
92
93 bool assignArg(unsigned ValNo, EVT OrigVT, MVT ValVT, MVT LocVT,
95 const CallLowering::ArgInfo &Info, ISD::ArgFlagsTy Flags,
96 CCState &State) override {
97 applyStackPassedSmallTypeDAGHack(OrigVT, ValVT, LocVT);
98 return IncomingValueAssigner::assignArg(ValNo, OrigVT, ValVT, LocVT,
99 LocInfo, Info, Flags, State);
100 }
101};
102
103struct AArch64OutgoingValueAssigner
105 const AArch64Subtarget &Subtarget;
106
107 /// Track if this is used for a return instead of function argument
108 /// passing. We apply a hack to i1/i8/i16 stack passed values, but do not use
109 /// stack passed returns for them and cannot apply the type adjustment.
110 bool IsReturn;
111
112 AArch64OutgoingValueAssigner(CCAssignFn *AssignFn_,
113 CCAssignFn *AssignFnVarArg_,
114 const AArch64Subtarget &Subtarget_,
115 bool IsReturn)
116 : OutgoingValueAssigner(AssignFn_, AssignFnVarArg_),
117 Subtarget(Subtarget_), IsReturn(IsReturn) {}
118
119 bool assignArg(unsigned ValNo, EVT OrigVT, MVT ValVT, MVT LocVT,
120 CCValAssign::LocInfo LocInfo,
121 const CallLowering::ArgInfo &Info, ISD::ArgFlagsTy Flags,
122 CCState &State) override {
123 const Function &F = State.getMachineFunction().getFunction();
124 bool IsCalleeWin =
125 Subtarget.isCallingConvWin64(State.getCallingConv(), F.isVarArg());
126 bool UseVarArgsCCForFixed = IsCalleeWin && State.isVarArg();
127
128 bool Res;
129 if (!Flags.isVarArg() && !UseVarArgsCCForFixed) {
130 if (!IsReturn)
131 applyStackPassedSmallTypeDAGHack(OrigVT, ValVT, LocVT);
132 Res = AssignFn(ValNo, ValVT, LocVT, LocInfo, Flags, Info.Ty, State);
133 } else
134 Res = AssignFnVarArg(ValNo, ValVT, LocVT, LocInfo, Flags, Info.Ty, State);
135
136 StackSize = State.getStackSize();
137 return Res;
138 }
139};
140
141struct IncomingArgHandler : public CallLowering::IncomingValueHandler {
142 IncomingArgHandler(MachineIRBuilder &MIRBuilder, MachineRegisterInfo &MRI)
143 : IncomingValueHandler(MIRBuilder, MRI) {}
144
145 Register getStackAddress(uint64_t Size, int64_t Offset,
146 MachinePointerInfo &MPO,
147 ISD::ArgFlagsTy Flags) override {
148 auto &MFI = MIRBuilder.getMF().getFrameInfo();
149
150 // Byval is assumed to be writable memory, but other stack passed arguments
151 // are not.
152 const bool IsImmutable = !Flags.isByVal();
153
154 int FI = MFI.CreateFixedObject(Size, Offset, IsImmutable);
155 MPO = MachinePointerInfo::getFixedStack(MIRBuilder.getMF(), FI);
156 auto AddrReg = MIRBuilder.buildFrameIndex(LLT::pointer(0, 64), FI);
157 return AddrReg.getReg(0);
158 }
159
160 LLT getStackValueStoreType(const DataLayout &DL, const CCValAssign &VA,
161 ISD::ArgFlagsTy Flags) const override {
162 // For pointers, we just need to fixup the integer types reported in the
163 // CCValAssign.
164 if (Flags.isPointer())
167 }
168
169 void assignValueToReg(Register ValVReg, Register PhysReg,
170 const CCValAssign &VA,
171 ISD::ArgFlagsTy Flags = {}) override {
172 markRegUsed(PhysReg);
173 IncomingValueHandler::assignValueToReg(ValVReg, PhysReg, VA);
174 }
175
176 void assignValueToAddress(Register ValVReg, Register Addr, LLT MemTy,
177 const MachinePointerInfo &MPO,
178 const CCValAssign &VA) override {
179 MachineFunction &MF = MIRBuilder.getMF();
180
181 LLT ValTy(VA.getValVT());
182 LLT LocTy(VA.getLocVT());
183
184 // Fixup the types for the DAG compatibility hack.
185 if (VA.getValVT() == MVT::i8 || VA.getValVT() == MVT::i16)
186 std::swap(ValTy, LocTy);
187 else {
188 // The calling code knows if this is a pointer or not, we're only touching
189 // the LocTy for the i8/i16 hack.
190 assert(LocTy.getSizeInBits() == MemTy.getSizeInBits());
191 LocTy = MemTy;
192 }
193
194 auto MMO = MF.getMachineMemOperand(
196 inferAlignFromPtrInfo(MF, MPO));
197
198 switch (VA.getLocInfo()) {
199 case CCValAssign::LocInfo::ZExt:
200 MIRBuilder.buildLoadInstr(TargetOpcode::G_ZEXTLOAD, ValVReg, Addr, *MMO);
201 return;
202 case CCValAssign::LocInfo::SExt:
203 MIRBuilder.buildLoadInstr(TargetOpcode::G_SEXTLOAD, ValVReg, Addr, *MMO);
204 return;
205 default:
206 MIRBuilder.buildLoad(ValVReg, Addr, *MMO);
207 return;
208 }
209 }
210
211 /// How the physical register gets marked varies between formal
212 /// parameters (it's a basic-block live-in), and a call instruction
213 /// (it's an implicit-def of the BL).
214 virtual void markRegUsed(Register Reg) = 0;
215};
216
217struct FormalArgHandler : public IncomingArgHandler {
218 FormalArgHandler(MachineIRBuilder &MIRBuilder, MachineRegisterInfo &MRI)
219 : IncomingArgHandler(MIRBuilder, MRI) {}
220
221 void markRegUsed(Register Reg) override {
222 MIRBuilder.getMRI()->addLiveIn(Reg.asMCReg());
223 MIRBuilder.getMBB().addLiveIn(Reg.asMCReg());
224 }
225};
226
227struct CallReturnHandler : public IncomingArgHandler {
228 CallReturnHandler(MachineIRBuilder &MIRBuilder, MachineRegisterInfo &MRI,
229 MachineInstrBuilder MIB)
230 : IncomingArgHandler(MIRBuilder, MRI), MIB(MIB) {}
231
232 void markRegUsed(Register Reg) override {
233 MIB.addDef(Reg, RegState::Implicit);
234 }
235
236 MachineInstrBuilder MIB;
237};
238
239/// A special return arg handler for "returned" attribute arg calls.
240struct ReturnedArgCallReturnHandler : public CallReturnHandler {
241 ReturnedArgCallReturnHandler(MachineIRBuilder &MIRBuilder,
242 MachineRegisterInfo &MRI,
243 MachineInstrBuilder MIB)
244 : CallReturnHandler(MIRBuilder, MRI, MIB) {}
245
246 void markRegUsed(Register Reg) override {}
247};
248
249struct OutgoingArgHandler : public CallLowering::OutgoingValueHandler {
250 OutgoingArgHandler(MachineIRBuilder &MIRBuilder, MachineRegisterInfo &MRI,
251 MachineInstrBuilder MIB, bool IsTailCall = false,
252 int FPDiff = 0)
253 : OutgoingValueHandler(MIRBuilder, MRI), MIB(MIB), IsTailCall(IsTailCall),
254 FPDiff(FPDiff),
255 Subtarget(MIRBuilder.getMF().getSubtarget<AArch64Subtarget>()) {}
256
257 Register getStackAddress(uint64_t Size, int64_t Offset,
258 MachinePointerInfo &MPO,
259 ISD::ArgFlagsTy Flags) override {
260 MachineFunction &MF = MIRBuilder.getMF();
261 LLT p0 = LLT::pointer(0, 64);
262 LLT s64 = LLT::integer(64);
263
264 if (IsTailCall) {
265 assert(!Flags.isByVal() && "byval unhandled with tail calls");
266
267 Offset += FPDiff;
268 int FI = MF.getFrameInfo().CreateFixedObject(Size, Offset, true);
269 auto FIReg = MIRBuilder.buildFrameIndex(p0, FI);
271 return FIReg.getReg(0);
272 }
273
274 if (!SPReg)
275 SPReg = MIRBuilder.buildCopy(p0, Register(AArch64::SP)).getReg(0);
276
277 auto OffsetReg = MIRBuilder.buildConstant(s64, Offset);
278
279 auto AddrReg = MIRBuilder.buildPtrAdd(p0, SPReg, OffsetReg);
280
282 return AddrReg.getReg(0);
283 }
284
285 /// We need to fixup the reported store size for certain value types because
286 /// we invert the interpretation of ValVT and LocVT in certain cases. This is
287 /// for compatibility with the DAG call lowering implementation, which we're
288 /// currently building on top of.
289 LLT getStackValueStoreType(const DataLayout &DL, const CCValAssign &VA,
290 ISD::ArgFlagsTy Flags) const override {
291 if (Flags.isPointer())
294 }
295
296 void assignValueToReg(Register ValVReg, Register PhysReg,
297 const CCValAssign &VA, ISD::ArgFlagsTy Flags) override {
298 MIB.addUse(PhysReg, RegState::Implicit);
299 Register ExtReg = extendRegister(ValVReg, VA);
300 MIRBuilder.buildCopy(PhysReg, ExtReg);
301 }
302
303 /// Check whether a stack argument requires lowering in a tail call.
304 static bool shouldLowerTailCallStackArg(const MachineFunction &MF,
305 const CCValAssign &VA,
306 Register ValVReg,
307 Register StoreAddr) {
308 const MachineRegisterInfo &MRI = MF.getRegInfo();
309 // Print the defining instruction for the value.
310 auto *DefMI = MRI.getVRegDef(ValVReg);
311 assert(DefMI && "No defining instruction");
312 for (;;) {
313 // Look through nodes that don't alter the bits of the incoming value.
314 unsigned Op = DefMI->getOpcode();
315 if (Op == TargetOpcode::G_ZEXT || Op == TargetOpcode::G_ANYEXT ||
316 Op == TargetOpcode::G_BITCAST || isAssertMI(*DefMI)) {
318 continue;
319 }
320 break;
321 }
322
323 auto *Load = dyn_cast<GLoad>(DefMI);
324 if (!Load)
325 return true;
326 Register LoadReg = Load->getPointerReg();
327 auto *LoadAddrDef = MRI.getVRegDef(LoadReg);
328 if (LoadAddrDef->getOpcode() != TargetOpcode::G_FRAME_INDEX)
329 return true;
330 const MachineFrameInfo &MFI = MF.getFrameInfo();
331 int LoadFI = LoadAddrDef->getOperand(1).getIndex();
332
333 auto *StoreAddrDef = MRI.getVRegDef(StoreAddr);
334 if (StoreAddrDef->getOpcode() != TargetOpcode::G_FRAME_INDEX)
335 return true;
336 int StoreFI = StoreAddrDef->getOperand(1).getIndex();
337
338 if (!MFI.isImmutableObjectIndex(LoadFI))
339 return true;
340 if (MFI.getObjectOffset(LoadFI) != MFI.getObjectOffset(StoreFI))
341 return true;
342 if (Load->getMemSize() != MFI.getObjectSize(StoreFI))
343 return true;
344
345 return false;
346 }
347
348 void assignValueToAddress(Register ValVReg, Register Addr, LLT MemTy,
349 const MachinePointerInfo &MPO,
350 const CCValAssign &VA) override {
351 MachineFunction &MF = MIRBuilder.getMF();
352 if (!FPDiff && !shouldLowerTailCallStackArg(MF, VA, ValVReg, Addr))
353 return;
354 auto MMO = MF.getMachineMemOperand(MPO, MachineMemOperand::MOStore, MemTy,
355 inferAlignFromPtrInfo(MF, MPO));
356 MIRBuilder.buildStore(ValVReg, Addr, *MMO);
357 }
358
359 void assignValueToAddress(const CallLowering::ArgInfo &Arg, unsigned RegIndex,
360 Register Addr, LLT MemTy,
361 const MachinePointerInfo &MPO,
362 const CCValAssign &VA) override {
363 unsigned MaxSize = MemTy.getSizeInBytes() * 8;
364 // For varargs, we always want to extend them to 8 bytes, in which case
365 // we disable setting a max.
366 if (Arg.Flags[0].isVarArg())
367 MaxSize = 0;
368
369 Register ValVReg = Arg.Regs[RegIndex];
370 if (VA.getLocInfo() != CCValAssign::LocInfo::FPExt) {
371 MVT LocVT = VA.getLocVT();
372 MVT ValVT = VA.getValVT();
373
374 if (VA.getValVT() == MVT::i8 || VA.getValVT() == MVT::i16) {
375 std::swap(ValVT, LocVT);
376 MemTy = LLT(VA.getValVT());
377 }
378
379 ValVReg = extendRegister(ValVReg, VA, MaxSize);
380 } else {
381 // The store does not cover the full allocated stack slot.
382 MemTy = LLT(VA.getValVT());
383 }
384
385 assignValueToAddress(ValVReg, Addr, MemTy, MPO, VA);
386 }
387
388 MachineInstrBuilder MIB;
389
390 bool IsTailCall;
391
392 /// For tail calls, the byte offset of the call's argument area from the
393 /// callee's. Unused elsewhere.
394 int FPDiff;
395
396 // Cache the SP register vreg if we need it more than once in this call site.
398
399 const AArch64Subtarget &Subtarget;
400};
401} // namespace
402
403static bool doesCalleeRestoreStack(CallingConv::ID CallConv, bool TailCallOpt) {
404 return (CallConv == CallingConv::Fast && TailCallOpt) ||
405 CallConv == CallingConv::Tail || CallConv == CallingConv::SwiftTail;
406}
407
409 const Value *Val,
410 ArrayRef<Register> VRegs,
412 Register SwiftErrorVReg) const {
413 auto MIB = MIRBuilder.buildInstrNoInsert(AArch64::RET_ReallyLR);
414 assert(((Val && !VRegs.empty()) || (!Val && VRegs.empty())) &&
415 "Return value without a vreg");
416
417 bool Success = true;
418 if (!FLI.CanLowerReturn) {
419 insertSRetStores(MIRBuilder, Val->getType(), VRegs, FLI.DemoteRegister);
420 } else if (!VRegs.empty()) {
421 MachineFunction &MF = MIRBuilder.getMF();
422 const Function &F = MF.getFunction();
423 const AArch64Subtarget &Subtarget = MF.getSubtarget<AArch64Subtarget>();
424
427 CCAssignFn *AssignFn = TLI.CCAssignFnForReturn(F.getCallingConv());
428 auto &DL = F.getDataLayout();
429 LLVMContext &Ctx = Val->getType()->getContext();
430
431 SmallVector<EVT, 4> SplitEVTs;
432 ComputeValueVTs(TLI, DL, Val->getType(), SplitEVTs);
433 assert(VRegs.size() == SplitEVTs.size() &&
434 "For each split Type there should be exactly one VReg.");
435
436 SmallVector<ArgInfo, 8> SplitArgs;
437 CallingConv::ID CC = F.getCallingConv();
438
439 for (unsigned i = 0; i < SplitEVTs.size(); ++i) {
440 Register CurVReg = VRegs[i];
441 ArgInfo CurArgInfo = ArgInfo{CurVReg, SplitEVTs[i].getTypeForEVT(Ctx), 0};
442 setArgFlags(CurArgInfo, AttributeList::ReturnIndex, DL, F);
443
444 // i1 is a special case because SDAG i1 true is naturally zero extended
445 // when widened using ANYEXT. We need to do it explicitly here.
446 auto &Flags = CurArgInfo.Flags[0];
447 if (MRI.getType(CurVReg).getSizeInBits() == TypeSize::getFixed(1) &&
448 !Flags.isSExt() && !Flags.isZExt()) {
449 CurVReg = MIRBuilder.buildZExt(LLT::integer(8), CurVReg).getReg(0);
450 } else if (TLI.getNumRegistersForCallingConv(Ctx, CC, SplitEVTs[i]) ==
451 1) {
452 // Some types will need extending as specified by the CC.
453 MVT NewVT = TLI.getRegisterTypeForCallingConv(Ctx, CC, SplitEVTs[i]);
454 if (EVT(NewVT) != SplitEVTs[i]) {
455 unsigned ExtendOp = TargetOpcode::G_ANYEXT;
456 if (F.getAttributes().hasRetAttr(Attribute::SExt))
457 ExtendOp = TargetOpcode::G_SEXT;
458 else if (F.getAttributes().hasRetAttr(Attribute::ZExt))
459 ExtendOp = TargetOpcode::G_ZEXT;
460
461 LLT NewLLT(NewVT);
462 LLT OldLLT = getLLTForType(*CurArgInfo.Ty, DL);
463 CurArgInfo.Ty = EVT(NewVT).getTypeForEVT(Ctx);
464 // Instead of an extend, we might have a vector type which needs
465 // padding with more elements, e.g. <2 x half> -> <4 x half>.
466 if (NewVT.isVector()) {
467 if (OldLLT.isVector()) {
468 if (NewLLT.getNumElements() > OldLLT.getNumElements()) {
469 CurVReg =
470 MIRBuilder.buildPadVectorWithUndefElements(NewLLT, CurVReg)
471 .getReg(0);
472 } else {
473 // Just do a vector extend.
474 CurVReg = MIRBuilder.buildInstr(ExtendOp, {NewLLT}, {CurVReg})
475 .getReg(0);
476 }
477 } else if (NewLLT.getNumElements() >= 2 &&
478 NewLLT.getNumElements() <= 8) {
479 // We need to pad a <1 x S> type to <2/4/8 x S>. Since we don't
480 // have <1 x S> vector types in GISel we use a build_vector
481 // instead of a vector merge/concat.
482 CurVReg =
483 MIRBuilder.buildPadVectorWithUndefElements(NewLLT, CurVReg)
484 .getReg(0);
485 } else {
486 LLVM_DEBUG(dbgs() << "Could not handle ret ty\n");
487 return false;
488 }
489 } else {
490 // If the split EVT was a <1 x T> vector, and NewVT is T, then we
491 // don't have to do anything since we don't distinguish between the
492 // two.
493 if (NewLLT.getScalarSizeInBits() !=
494 MRI.getType(CurVReg).getScalarSizeInBits()) {
495 // A scalar extend.
496 CurVReg = MIRBuilder.buildInstr(ExtendOp, {NewLLT}, {CurVReg})
497 .getReg(0);
498 }
499 }
500 }
501 }
502 if (CurVReg != CurArgInfo.Regs[0]) {
503 CurArgInfo.Regs[0] = CurVReg;
504 // Reset the arg flags after modifying CurVReg.
505 setArgFlags(CurArgInfo, AttributeList::ReturnIndex, DL, F);
506 }
507 splitToValueTypes(CurArgInfo, SplitArgs, DL, CC);
508 }
509
510 AArch64OutgoingValueAssigner Assigner(AssignFn, AssignFn, Subtarget,
511 /*IsReturn*/ true);
512 OutgoingArgHandler Handler(MIRBuilder, MRI, MIB);
513 Success = determineAndHandleAssignments(Handler, Assigner, SplitArgs,
514 MIRBuilder, CC, F.isVarArg());
515 }
516
517 if (SwiftErrorVReg) {
518 MIB.addUse(AArch64::X21, RegState::Implicit);
519 MIRBuilder.buildCopy(AArch64::X21, SwiftErrorVReg);
520 }
521
522 MIRBuilder.insertInstr(MIB);
523 return Success;
524}
525
527 CallingConv::ID CallConv,
529 bool IsVarArg) const {
531 const auto &TLI = *getTLI<AArch64TargetLowering>();
532 CCState CCInfo(CallConv, IsVarArg, MF, ArgLocs,
533 MF.getFunction().getContext());
534
535 return checkReturn(CCInfo, Outs, TLI.CCAssignFnForReturn(CallConv));
536}
537
538/// Helper function to compute forwarded registers for musttail calls. Computes
539/// the forwarded registers, sets MBB liveness, and emits COPY instructions that
540/// can be used to save + restore registers later.
542 CCAssignFn *AssignFn) {
543 MachineBasicBlock &MBB = MIRBuilder.getMBB();
544 MachineFunction &MF = MIRBuilder.getMF();
545 MachineFrameInfo &MFI = MF.getFrameInfo();
546
547 if (!MFI.hasMustTailInVarArgFunc())
548 return;
549
551 const Function &F = MF.getFunction();
552 assert(F.isVarArg() && "Expected F to be vararg?");
553
554 // Compute the set of forwarded registers. The rest are scratch.
556 CCState CCInfo(F.getCallingConv(), /*IsVarArg=*/true, MF, ArgLocs,
557 F.getContext());
558 SmallVector<MVT, 2> RegParmTypes;
559 RegParmTypes.push_back(MVT::i64);
560 RegParmTypes.push_back(MVT::f128);
561
562 // Later on, we can use this vector to restore the registers if necessary.
565 CCInfo.analyzeMustTailForwardedRegisters(Forwards, RegParmTypes, AssignFn);
566
567 // Conservatively forward X8, since it might be used for an aggregate
568 // return.
569 if (!CCInfo.isAllocated(AArch64::X8)) {
570 Register X8VReg = MF.addLiveIn(AArch64::X8, &AArch64::GPR64RegClass);
571 Forwards.push_back(ForwardedRegister(X8VReg, AArch64::X8, MVT::i64));
572 }
573
574 // Add the forwards to the MachineBasicBlock and MachineFunction.
575 for (const auto &F : Forwards) {
576 MBB.addLiveIn(F.PReg);
577 MIRBuilder.buildCopy(Register(F.VReg), Register(F.PReg));
578 }
579}
580
582 auto &F = MF.getFunction();
583 const auto &TM = static_cast<const AArch64TargetMachine &>(MF.getTarget());
584
585 if (!EnableSVEGISel && (F.getReturnType()->isScalableTy() ||
586 llvm::any_of(F.args(), [](const Argument &A) {
587 return A.getType()->isScalableTy();
588 })))
589 return true;
590 const auto &ST = MF.getSubtarget<AArch64Subtarget>();
591 if (!ST.hasNEON() || !ST.hasFPARMv8()) {
592 LLVM_DEBUG(dbgs() << "Falling back to SDAG because we don't support no-NEON\n");
593 return true;
594 }
595
596 SMEAttrs Attrs = MF.getInfo<AArch64FunctionInfo>()->getSMEFnAttrs();
597 if (Attrs.hasZAState() || Attrs.hasZT0State() ||
598 Attrs.hasStreamingInterfaceOrBody() ||
599 Attrs.hasStreamingCompatibleInterface())
600 return true;
601
602 auto OptLevel = MF.getTarget().getOptLevel();
603 bool IsGlobalISelPreferred =
606 static_cast<unsigned>(OptLevel) <= TM.getEnableGlobalISelAtO() ||
607 F.hasOptNone();
608 return !IsGlobalISelPreferred;
609}
610
611void AArch64CallLowering::saveVarArgRegisters(
613 CCState &CCInfo) const {
616
617 MachineFunction &MF = MIRBuilder.getMF();
619 MachineFrameInfo &MFI = MF.getFrameInfo();
621 auto &Subtarget = MF.getSubtarget<AArch64Subtarget>();
622 bool IsWin64CC = Subtarget.isCallingConvWin64(CCInfo.getCallingConv(),
623 MF.getFunction().isVarArg());
624 const LLT p0 = LLT::pointer(0, 64);
625 const LLT s64 = LLT::integer(64);
626
627 unsigned FirstVariadicGPR = CCInfo.getFirstUnallocated(GPRArgRegs);
628 unsigned NumVariadicGPRArgRegs = GPRArgRegs.size() - FirstVariadicGPR + 1;
629
630 unsigned GPRSaveSize = 8 * (GPRArgRegs.size() - FirstVariadicGPR);
631 int GPRIdx = 0;
632 if (GPRSaveSize != 0) {
633 if (IsWin64CC) {
634 GPRIdx = MFI.CreateFixedObject(GPRSaveSize,
635 -static_cast<int>(GPRSaveSize), false);
636 if (GPRSaveSize & 15)
637 // The extra size here, if triggered, will always be 8.
638 MFI.CreateFixedObject(16 - (GPRSaveSize & 15),
639 -static_cast<int>(alignTo(GPRSaveSize, 16)),
640 false);
641 } else
642 GPRIdx = MFI.CreateStackObject(GPRSaveSize, Align(8), false);
643
644 auto FIN = MIRBuilder.buildFrameIndex(p0, GPRIdx);
645 auto Offset =
646 MIRBuilder.buildConstant(MRI.createGenericVirtualRegister(s64), 8);
647
648 for (unsigned i = FirstVariadicGPR; i < GPRArgRegs.size(); ++i) {
650 Handler.assignValueToReg(
651 Val, GPRArgRegs[i],
653 GPRArgRegs[i], MVT::i64, CCValAssign::Full));
654 auto MPO = IsWin64CC ? MachinePointerInfo::getFixedStack(
655 MF, GPRIdx, (i - FirstVariadicGPR) * 8)
656 : MachinePointerInfo::getStack(MF, i * 8);
657 MIRBuilder.buildStore(Val, FIN, MPO, inferAlignFromPtrInfo(MF, MPO));
658
659 FIN = MIRBuilder.buildPtrAdd(MRI.createGenericVirtualRegister(p0),
660 FIN.getReg(0), Offset);
661 }
662 }
663 FuncInfo->setVarArgsGPRIndex(GPRIdx);
664 FuncInfo->setVarArgsGPRSize(GPRSaveSize);
665
666 if (Subtarget.hasFPARMv8() && !IsWin64CC) {
667 unsigned FirstVariadicFPR = CCInfo.getFirstUnallocated(FPRArgRegs);
668
669 unsigned FPRSaveSize = 16 * (FPRArgRegs.size() - FirstVariadicFPR);
670 int FPRIdx = 0;
671 if (FPRSaveSize != 0) {
672 FPRIdx = MFI.CreateStackObject(FPRSaveSize, Align(16), false);
673
674 auto FIN = MIRBuilder.buildFrameIndex(p0, FPRIdx);
675 auto Offset =
676 MIRBuilder.buildConstant(MRI.createGenericVirtualRegister(s64), 16);
677
678 for (unsigned i = FirstVariadicFPR; i < FPRArgRegs.size(); ++i) {
680 Handler.assignValueToReg(
681 Val, FPRArgRegs[i],
683 i + MF.getFunction().getNumOperands() + NumVariadicGPRArgRegs,
684 MVT::f128, FPRArgRegs[i], MVT::f128, CCValAssign::Full));
685
686 auto MPO = MachinePointerInfo::getStack(MF, i * 16);
687 MIRBuilder.buildStore(Val, FIN, MPO, inferAlignFromPtrInfo(MF, MPO));
688
689 FIN = MIRBuilder.buildPtrAdd(MRI.createGenericVirtualRegister(p0),
690 FIN.getReg(0), Offset);
691 }
692 }
693 FuncInfo->setVarArgsFPRIndex(FPRIdx);
694 FuncInfo->setVarArgsFPRSize(FPRSaveSize);
695 }
696}
697
699 MachineIRBuilder &MIRBuilder, const Function &F,
701 MachineFunction &MF = MIRBuilder.getMF();
702 MachineBasicBlock &MBB = MIRBuilder.getMBB();
704 auto &DL = F.getDataLayout();
705 auto &Subtarget = MF.getSubtarget<AArch64Subtarget>();
706
707 // Arm64EC has extra requirements for varargs calls which are only implemented
708 // in SelectionDAG; bail out for now.
709 if (F.isVarArg() && Subtarget.isWindowsArm64EC())
710 return false;
711
712 // Arm64EC thunks have a special calling convention which is only implemented
713 // in SelectionDAG; bail out for now.
714 if (F.getCallingConv() == CallingConv::ARM64EC_Thunk_Native ||
715 F.getCallingConv() == CallingConv::ARM64EC_Thunk_X64)
716 return false;
717
718 bool IsWin64 =
719 Subtarget.isCallingConvWin64(F.getCallingConv(), F.isVarArg()) &&
720 !Subtarget.isWindowsArm64EC();
721
722 SmallVector<ArgInfo, 8> SplitArgs;
724
725 // Insert the hidden sret parameter if the return value won't fit in the
726 // return registers.
727 if (!FLI.CanLowerReturn)
728 insertSRetIncomingArgument(F, SplitArgs, FLI.DemoteRegister, MRI, DL);
729
730 unsigned i = 0;
731 for (auto &Arg : F.args()) {
732 if (DL.getTypeStoreSize(Arg.getType()).isZero())
733 continue;
734
735 ArgInfo OrigArg{VRegs[i], Arg, i};
736 setArgFlags(OrigArg, i + AttributeList::FirstArgIndex, DL, F);
737
738 // i1 arguments are zero-extended to i8 by the caller. Emit a
739 // hint to reflect this.
740 if (OrigArg.Ty->isIntegerTy(1)) {
741 assert(OrigArg.Regs.size() == 1 &&
742 MRI.getType(OrigArg.Regs[0]).getSizeInBits() == 1 &&
743 "Unexpected registers used for i1 arg");
744
745 auto &Flags = OrigArg.Flags[0];
746 if (!Flags.isZExt() && !Flags.isSExt()) {
747 // Lower i1 argument as i8, and insert AssertZExt + Trunc later.
748 Register OrigReg = OrigArg.Regs[0];
750 OrigArg.Regs[0] = WideReg;
751 BoolArgs.push_back({OrigReg, WideReg});
752 }
753 }
754
755 if (Arg.hasAttribute(Attribute::SwiftAsync))
756 MF.getInfo<AArch64FunctionInfo>()->setHasSwiftAsyncContext(true);
757
758 splitToValueTypes(OrigArg, SplitArgs, DL, F.getCallingConv());
759 ++i;
760 }
761
762 if (!MBB.empty())
763 MIRBuilder.setInstr(*MBB.begin());
764
766 CCAssignFn *AssignFn = TLI.CCAssignFnForCall(F.getCallingConv(), IsWin64 && F.isVarArg());
767
768 AArch64IncomingValueAssigner Assigner(AssignFn, AssignFn);
769 FormalArgHandler Handler(MIRBuilder, MRI);
771 CCState CCInfo(F.getCallingConv(), F.isVarArg(), MF, ArgLocs, F.getContext());
772 if (!determineAssignments(Assigner, SplitArgs, CCInfo) ||
773 !handleAssignments(Handler, SplitArgs, CCInfo, ArgLocs, MIRBuilder))
774 return false;
775
776 if (!BoolArgs.empty()) {
777 for (auto &KV : BoolArgs) {
778 Register OrigReg = KV.first;
779 Register WideReg = KV.second;
780 LLT WideTy = MRI.getType(WideReg);
781 assert(MRI.getType(OrigReg).getScalarSizeInBits() == 1 &&
782 "Unexpected bit size of a bool arg");
783 MIRBuilder.buildTrunc(
784 OrigReg, MIRBuilder.buildAssertZExt(WideTy, WideReg, 1).getReg(0));
785 }
786 }
787
789 uint64_t StackSize = Assigner.StackSize;
790 if (F.isVarArg()) {
791 if ((!Subtarget.isTargetDarwin() && !Subtarget.isWindowsArm64EC()) || IsWin64) {
792 // The AAPCS variadic function ABI is identical to the non-variadic
793 // one. As a result there may be more arguments in registers and we should
794 // save them for future reference.
795 // Win64 variadic functions also pass arguments in registers, but all
796 // float arguments are passed in integer registers.
797 saveVarArgRegisters(MIRBuilder, Handler, CCInfo);
798 } else if (Subtarget.isWindowsArm64EC()) {
799 return false;
800 }
801
802 // We currently pass all varargs at 8-byte alignment, or 4 in ILP32.
803 StackSize = alignTo(Assigner.StackSize, Subtarget.isTargetILP32() ? 4 : 8);
804
805 auto &MFI = MIRBuilder.getMF().getFrameInfo();
806 FuncInfo->setVarArgsStackIndex(MFI.CreateFixedObject(4, StackSize, true));
807 }
808
809 if (doesCalleeRestoreStack(F.getCallingConv(),
811 // We have a non-standard ABI, so why not make full use of the stack that
812 // we're going to pop? It must be aligned to 16 B in any case.
813 StackSize = alignTo(StackSize, 16);
814
815 // If we're expected to restore the stack (e.g. fastcc), then we'll be
816 // adding a multiple of 16.
817 FuncInfo->setArgumentStackToRestore(StackSize);
818
819 // Our own callers will guarantee that the space is free by giving an
820 // aligned value to CALLSEQ_START.
821 }
822
823 // When we tail call, we need to check if the callee's arguments
824 // will fit on the caller's stack. So, whenever we lower formal arguments,
825 // we should keep track of this information, since we might lower a tail call
826 // in this function later.
827 FuncInfo->setBytesInStackArgArea(StackSize);
828
829 if (Subtarget.hasCustomCallingConv())
830 Subtarget.getRegisterInfo()->UpdateCustomCalleeSavedRegs(MF);
831
832 handleMustTailForwardedRegisters(MIRBuilder, AssignFn);
833
834 // Move back to the end of the basic block.
835 MIRBuilder.setMBB(MBB);
836
837 return true;
838}
839
840/// Return true if the calling convention is one that we can guarantee TCO for.
841static bool canGuaranteeTCO(CallingConv::ID CC, bool GuaranteeTailCalls) {
842 return (CC == CallingConv::Fast && GuaranteeTailCalls) ||
844}
845
846/// Return true if we might ever do TCO for calls with this calling convention.
848 switch (CC) {
849 case CallingConv::C:
857 return true;
858 default:
859 return false;
860 }
861}
862
863/// Returns a pair containing the fixed CCAssignFn and the vararg CCAssignFn for
864/// CC.
865static std::pair<CCAssignFn *, CCAssignFn *>
867 return {TLI.CCAssignFnForCall(CC, false), TLI.CCAssignFnForCall(CC, true)};
868}
869
870bool AArch64CallLowering::doCallerAndCalleePassArgsTheSameWay(
871 CallLoweringInfo &Info, MachineFunction &MF,
872 SmallVectorImpl<ArgInfo> &InArgs) const {
873 const Function &CallerF = MF.getFunction();
874 CallingConv::ID CalleeCC = Info.CallConv;
875 CallingConv::ID CallerCC = CallerF.getCallingConv();
876
877 // If the calling conventions match, then everything must be the same.
878 if (CalleeCC == CallerCC)
879 return true;
880
881 // Check if the caller and callee will handle arguments in the same way.
882 const AArch64TargetLowering &TLI = *getTLI<AArch64TargetLowering>();
883 CCAssignFn *CalleeAssignFnFixed;
884 CCAssignFn *CalleeAssignFnVarArg;
885 std::tie(CalleeAssignFnFixed, CalleeAssignFnVarArg) =
886 getAssignFnsForCC(CalleeCC, TLI);
887
888 CCAssignFn *CallerAssignFnFixed;
889 CCAssignFn *CallerAssignFnVarArg;
890 std::tie(CallerAssignFnFixed, CallerAssignFnVarArg) =
891 getAssignFnsForCC(CallerCC, TLI);
892
893 AArch64IncomingValueAssigner CalleeAssigner(CalleeAssignFnFixed,
894 CalleeAssignFnVarArg);
895 AArch64IncomingValueAssigner CallerAssigner(CallerAssignFnFixed,
896 CallerAssignFnVarArg);
897
898 if (!resultsCompatible(Info, MF, InArgs, CalleeAssigner, CallerAssigner))
899 return false;
900
901 // Make sure that the caller and callee preserve all of the same registers.
902 auto TRI = MF.getSubtarget<AArch64Subtarget>().getRegisterInfo();
903 const uint32_t *CallerPreserved = TRI->getCallPreservedMask(MF, CallerCC);
904 const uint32_t *CalleePreserved = TRI->getCallPreservedMask(MF, CalleeCC);
905 if (MF.getSubtarget<AArch64Subtarget>().hasCustomCallingConv()) {
906 TRI->UpdateCustomCallPreservedMask(MF, &CallerPreserved);
907 TRI->UpdateCustomCallPreservedMask(MF, &CalleePreserved);
908 }
909
910 return TRI->regmaskSubsetEqual(CallerPreserved, CalleePreserved);
911}
912
913bool AArch64CallLowering::areCalleeOutgoingArgsTailCallable(
914 CallLoweringInfo &Info, MachineFunction &MF,
915 SmallVectorImpl<ArgInfo> &OrigOutArgs) const {
916 // If there are no outgoing arguments, then we are done.
917 if (OrigOutArgs.empty())
918 return true;
919
920 const Function &CallerF = MF.getFunction();
921 LLVMContext &Ctx = CallerF.getContext();
922 CallingConv::ID CalleeCC = Info.CallConv;
923 CallingConv::ID CallerCC = CallerF.getCallingConv();
924 const AArch64TargetLowering &TLI = *getTLI<AArch64TargetLowering>();
925 const AArch64Subtarget &Subtarget = MF.getSubtarget<AArch64Subtarget>();
926
927 CCAssignFn *AssignFnFixed;
928 CCAssignFn *AssignFnVarArg;
929 std::tie(AssignFnFixed, AssignFnVarArg) = getAssignFnsForCC(CalleeCC, TLI);
930
931 // We have outgoing arguments. Make sure that we can tail call with them.
933 CCState OutInfo(CalleeCC, false, MF, OutLocs, Ctx);
934
935 AArch64OutgoingValueAssigner CalleeAssigner(AssignFnFixed, AssignFnVarArg,
936 Subtarget, /*IsReturn*/ false);
937 // determineAssignments() may modify argument flags, so make a copy.
939 append_range(OutArgs, OrigOutArgs);
940 if (!determineAssignments(CalleeAssigner, OutArgs, OutInfo)) {
941 LLVM_DEBUG(dbgs() << "... Could not analyze call operands.\n");
942 return false;
943 }
944
945 // Make sure that they can fit on the caller's stack.
946 const AArch64FunctionInfo *FuncInfo = MF.getInfo<AArch64FunctionInfo>();
947 if (OutInfo.getStackSize() > FuncInfo->getBytesInStackArgArea()) {
948 LLVM_DEBUG(dbgs() << "... Cannot fit call operands on caller's stack.\n");
949 return false;
950 }
951
952 // Verify that the parameters in callee-saved registers match.
953 // TODO: Port this over to CallLowering as general code once swiftself is
954 // supported.
955 auto TRI = MF.getSubtarget<AArch64Subtarget>().getRegisterInfo();
956 const uint32_t *CallerPreservedMask = TRI->getCallPreservedMask(MF, CallerCC);
957 MachineRegisterInfo &MRI = MF.getRegInfo();
958
959 if (Info.IsVarArg) {
960 // Be conservative and disallow variadic memory operands to match SDAG's
961 // behaviour.
962 // FIXME: If the caller's calling convention is C, then we can
963 // potentially use its argument area. However, for cases like fastcc,
964 // we can't do anything.
965 for (unsigned i = 0; i < OutLocs.size(); ++i) {
966 auto &ArgLoc = OutLocs[i];
967 if (ArgLoc.isRegLoc())
968 continue;
969
971 dbgs()
972 << "... Cannot tail call vararg function with stack arguments\n");
973 return false;
974 }
975 }
976
977 return parametersInCSRMatch(MRI, CallerPreservedMask, OutLocs, OutArgs);
978}
979
981 MachineIRBuilder &MIRBuilder, CallLoweringInfo &Info,
983 SmallVectorImpl<ArgInfo> &OutArgs) const {
984
985 // Must pass all target-independent checks in order to tail call optimize.
986 if (!Info.IsTailCall)
987 return false;
988
989 CallingConv::ID CalleeCC = Info.CallConv;
990 MachineFunction &MF = MIRBuilder.getMF();
991 const Function &CallerF = MF.getFunction();
992
993 LLVM_DEBUG(dbgs() << "Attempting to lower call as tail call\n");
994
995 if (Info.SwiftErrorVReg) {
996 // TODO: We should handle this.
997 // Note that this is also handled by the check for no outgoing arguments.
998 // Proactively disabling this though, because the swifterror handling in
999 // lowerCall inserts a COPY *after* the location of the call.
1000 LLVM_DEBUG(dbgs() << "... Cannot handle tail calls with swifterror yet.\n");
1001 return false;
1002 }
1003
1004 if (!mayTailCallThisCC(CalleeCC)) {
1005 LLVM_DEBUG(dbgs() << "... Calling convention cannot be tail called.\n");
1006 return false;
1007 }
1008
1009 // Byval parameters hand the function a pointer directly into the stack area
1010 // we want to reuse during a tail call. Working around this *is* possible (see
1011 // X86).
1012 //
1013 // FIXME: In AArch64ISelLowering, this isn't worked around. Can/should we try
1014 // it?
1015 //
1016 // On Windows, "inreg" attributes signify non-aggregate indirect returns.
1017 // In this case, it is necessary to save/restore X0 in the callee. Tail
1018 // call opt interferes with this. So we disable tail call opt when the
1019 // caller has an argument with "inreg" attribute.
1020 //
1021 // FIXME: Check whether the callee also has an "inreg" argument.
1022 //
1023 // When the caller has a swifterror argument, we don't want to tail call
1024 // because would have to move into the swifterror register before the
1025 // tail call.
1026 if (any_of(CallerF.args(), [](const Argument &A) {
1027 return A.hasByValAttr() || A.hasInRegAttr() || A.hasSwiftErrorAttr();
1028 })) {
1029 LLVM_DEBUG(dbgs() << "... Cannot tail call from callers with byval, "
1030 "inreg, or swifterror arguments\n");
1031 return false;
1032 }
1033
1034 // Externally-defined functions with weak linkage should not be
1035 // tail-called on AArch64 when the OS does not support dynamic
1036 // pre-emption of symbols, as the AAELF spec requires normal calls
1037 // to undefined weak functions to be replaced with a NOP or jump to the
1038 // next instruction. The behaviour of branch instructions in this
1039 // situation (as used for tail calls) is implementation-defined, so we
1040 // cannot rely on the linker replacing the tail call with a return.
1041 if (Info.Callee.isGlobal()) {
1042 const GlobalValue *GV = Info.Callee.getGlobal();
1043 const Triple &TT = MF.getTarget().getTargetTriple();
1044 if (GV->hasExternalWeakLinkage() &&
1045 (!TT.isOSWindows() || TT.isOSBinFormatELF() ||
1046 TT.isOSBinFormatMachO())) {
1047 LLVM_DEBUG(dbgs() << "... Cannot tail call externally-defined function "
1048 "with weak linkage for this OS.\n");
1049 return false;
1050 }
1051 }
1052
1053 // If we have -tailcallopt, then we're done.
1055 return CalleeCC == CallerF.getCallingConv();
1056
1057 // We don't have -tailcallopt, so we're allowed to change the ABI (sibcall).
1058 // Try to find cases where we can do that.
1059
1060 // I want anyone implementing a new calling convention to think long and hard
1061 // about this assert.
1062 assert((!Info.IsVarArg || CalleeCC == CallingConv::C) &&
1063 "Unexpected variadic calling convention");
1064
1065 // Verify that the incoming and outgoing arguments from the callee are
1066 // safe to tail call.
1067 if (!doCallerAndCalleePassArgsTheSameWay(Info, MF, InArgs)) {
1068 LLVM_DEBUG(
1069 dbgs()
1070 << "... Caller and callee have incompatible calling conventions.\n");
1071 return false;
1072 }
1073
1074 if (!areCalleeOutgoingArgsTailCallable(Info, MF, OutArgs))
1075 return false;
1076
1077 LLVM_DEBUG(
1078 dbgs() << "... Call is eligible for tail call optimization.\n");
1079 return true;
1080}
1081
1082static unsigned getCallOpcode(const MachineFunction &CallerF, bool IsIndirect,
1083 bool IsTailCall,
1084 std::optional<CallLowering::PtrAuthInfo> &PAI,
1085 MachineRegisterInfo &MRI) {
1086 const AArch64FunctionInfo *FuncInfo = CallerF.getInfo<AArch64FunctionInfo>();
1087
1088 if (!IsTailCall) {
1089 if (!PAI)
1090 return IsIndirect ? getBLRCallOpcode(CallerF) : (unsigned)AArch64::BL;
1091
1092 assert(IsIndirect && "Direct call should not be authenticated");
1093 assert((PAI->Key == AArch64PACKey::IA || PAI->Key == AArch64PACKey::IB) &&
1094 "Invalid auth call key");
1095 return AArch64::BLRA;
1096 }
1097
1098 if (!IsIndirect)
1099 return AArch64::TCRETURNdi;
1100
1101 // When BTI or PAuthLR are enabled, there are restrictions on using x16 and
1102 // x17 to hold the function pointer.
1103 if (FuncInfo->branchTargetEnforcement()) {
1104 if (FuncInfo->branchProtectionPAuthLR()) {
1105 assert(!PAI && "ptrauth tail-calls not yet supported with PAuthLR");
1106 return AArch64::TCRETURNrix17;
1107 }
1108 if (PAI)
1109 return AArch64::AUTH_TCRETURN_BTI;
1110 return AArch64::TCRETURNrix16x17;
1111 }
1112
1113 if (FuncInfo->branchProtectionPAuthLR()) {
1114 assert(!PAI && "ptrauth tail-calls not yet supported with PAuthLR");
1115 return AArch64::TCRETURNrinotx16;
1116 }
1117
1118 if (PAI)
1119 return AArch64::AUTH_TCRETURN;
1120 return AArch64::TCRETURNri;
1121}
1122
1123static const uint32_t *
1127 const uint32_t *Mask;
1128 if (!OutArgs.empty() && OutArgs[0].Flags[0].isReturned()) {
1129 // For 'this' returns, use the X0-preserving mask if applicable
1130 Mask = TRI.getThisReturnPreservedMask(MF, Info.CallConv);
1131 if (!Mask) {
1132 OutArgs[0].Flags[0].setReturned(false);
1133 Mask = TRI.getCallPreservedMask(MF, Info.CallConv);
1134 }
1135 } else {
1136 Mask = TRI.getCallPreservedMask(MF, Info.CallConv);
1137 }
1138 return Mask;
1139}
1140
1141bool AArch64CallLowering::lowerTailCall(
1142 MachineIRBuilder &MIRBuilder, CallLoweringInfo &Info,
1143 SmallVectorImpl<ArgInfo> &OutArgs) const {
1144 MachineFunction &MF = MIRBuilder.getMF();
1145 const Function &F = MF.getFunction();
1146 MachineRegisterInfo &MRI = MF.getRegInfo();
1147 const AArch64TargetLowering &TLI = *getTLI<AArch64TargetLowering>();
1148 AArch64FunctionInfo *FuncInfo = MF.getInfo<AArch64FunctionInfo>();
1149
1150 // True when we're tail calling, but without -tailcallopt.
1151 bool IsSibCall = !MF.getTarget().Options.GuaranteedTailCallOpt &&
1152 Info.CallConv != CallingConv::Tail &&
1153 Info.CallConv != CallingConv::SwiftTail;
1154
1155 // Find out which ABI gets to decide where things go.
1156 CallingConv::ID CalleeCC = Info.CallConv;
1157 CCAssignFn *AssignFnFixed;
1158 CCAssignFn *AssignFnVarArg;
1159 std::tie(AssignFnFixed, AssignFnVarArg) = getAssignFnsForCC(CalleeCC, TLI);
1160
1161 MachineInstrBuilder CallSeqStart;
1162 if (!IsSibCall)
1163 CallSeqStart = MIRBuilder.buildInstr(AArch64::ADJCALLSTACKDOWN);
1164
1165 unsigned Opc = getCallOpcode(MF, Info.Callee.isReg(), true, Info.PAI, MRI);
1166 auto MIB = MIRBuilder.buildInstrNoInsert(Opc);
1167 MIB.add(Info.Callee);
1168
1169 // Tell the call which registers are clobbered.
1170 const AArch64Subtarget &Subtarget = MF.getSubtarget<AArch64Subtarget>();
1171 auto TRI = Subtarget.getRegisterInfo();
1172
1173 // Byte offset for the tail call. When we are sibcalling, this will always
1174 // be 0.
1175 MIB.addImm(0);
1176
1177 // Authenticated tail calls always take key/discriminator arguments.
1178 if (Opc == AArch64::AUTH_TCRETURN || Opc == AArch64::AUTH_TCRETURN_BTI) {
1179 assert((Info.PAI->Key == AArch64PACKey::IA ||
1180 Info.PAI->Key == AArch64PACKey::IB) &&
1181 "Invalid auth call key");
1182 MIB.addImm(Info.PAI->Key);
1183
1184 Register AddrDisc = 0;
1185 uint16_t IntDisc = 0;
1186 std::tie(IntDisc, AddrDisc) =
1187 extractPtrauthBlendDiscriminators(Info.PAI->Discriminator, MRI);
1188
1189 MIB.addImm(IntDisc);
1190 MIB.addUse(AddrDisc);
1191 if (AddrDisc != AArch64::NoRegister) {
1192 MIB->getOperand(4).setReg(constrainOperandRegClass(
1193 MF, *TRI, MRI, *MF.getSubtarget().getInstrInfo(),
1194 *MF.getSubtarget().getRegBankInfo(), *MIB, MIB->getDesc(),
1195 MIB->getOperand(4), 4));
1196 }
1197 }
1198
1199 // Tell the call which registers are clobbered.
1200 const uint32_t *Mask = TRI->getCallPreservedMask(MF, CalleeCC);
1201 if (Subtarget.hasCustomCallingConv())
1202 TRI->UpdateCustomCallPreservedMask(MF, &Mask);
1203 MIB.addRegMask(Mask);
1204
1205 if (Info.CFIType)
1206 MIB->setCFIType(MF, Info.CFIType->getZExtValue());
1207
1208 if (TRI->isAnyArgRegReserved(MF))
1209 TRI->emitReservedArgRegCallError(MF);
1210
1211 // FPDiff is the byte offset of the call's argument area from the callee's.
1212 // Stores to callee stack arguments will be placed in FixedStackSlots offset
1213 // by this amount for a tail call. In a sibling call it must be 0 because the
1214 // caller will deallocate the entire stack and the callee still expects its
1215 // arguments to begin at SP+0.
1216 int FPDiff = 0;
1217
1218 // This will be 0 for sibcalls, potentially nonzero for tail calls produced
1219 // by -tailcallopt. For sibcalls, the memory operands for the call are
1220 // already available in the caller's incoming argument space.
1221 unsigned NumBytes = 0;
1222 if (!IsSibCall) {
1223 // We aren't sibcalling, so we need to compute FPDiff. We need to do this
1224 // before handling assignments, because FPDiff must be known for memory
1225 // arguments.
1226 unsigned NumReusableBytes = FuncInfo->getBytesInStackArgArea();
1228 CCState OutInfo(CalleeCC, false, MF, OutLocs, F.getContext());
1229
1230 AArch64OutgoingValueAssigner CalleeAssigner(AssignFnFixed, AssignFnVarArg,
1231 Subtarget, /*IsReturn*/ false);
1232 if (!determineAssignments(CalleeAssigner, OutArgs, OutInfo))
1233 return false;
1234
1235 // The callee will pop the argument stack as a tail call. Thus, we must
1236 // keep it 16-byte aligned.
1237 NumBytes = alignTo(OutInfo.getStackSize(), 16);
1238
1239 // FPDiff will be negative if this tail call requires more space than we
1240 // would automatically have in our incoming argument space. Positive if we
1241 // actually shrink the stack.
1242 FPDiff = NumReusableBytes - NumBytes;
1243
1244 // Update the required reserved area if this is the tail call requiring the
1245 // most argument stack space.
1246 if (FPDiff < 0 && FuncInfo->getTailCallReservedStack() < (unsigned)-FPDiff)
1247 FuncInfo->setTailCallReservedStack(-FPDiff);
1248
1249 // The stack pointer must be 16-byte aligned at all times it's used for a
1250 // memory operation, which in practice means at *all* times and in
1251 // particular across call boundaries. Therefore our own arguments started at
1252 // a 16-byte aligned SP and the delta applied for the tail call should
1253 // satisfy the same constraint.
1254 assert(FPDiff % 16 == 0 && "unaligned stack on tail call");
1255 }
1256
1257 const auto &Forwards = FuncInfo->getForwardedMustTailRegParms();
1258
1259 AArch64OutgoingValueAssigner Assigner(AssignFnFixed, AssignFnVarArg,
1260 Subtarget, /*IsReturn*/ false);
1261
1262 // Do the actual argument marshalling.
1263 OutgoingArgHandler Handler(MIRBuilder, MRI, MIB,
1264 /*IsTailCall*/ true, FPDiff);
1265 if (!determineAndHandleAssignments(Handler, Assigner, OutArgs, MIRBuilder,
1266 CalleeCC, Info.IsVarArg))
1267 return false;
1268
1269 Mask = getMaskForArgs(OutArgs, Info, *TRI, MF);
1270
1271 if (Info.IsVarArg && Info.IsMustTailCall) {
1272 // Now we know what's being passed to the function. Add uses to the call for
1273 // the forwarded registers that we *aren't* passing as parameters. This will
1274 // preserve the copies we build earlier.
1275 for (const auto &F : Forwards) {
1276 Register ForwardedReg = F.PReg;
1277 // If the register is already passed, or aliases a register which is
1278 // already being passed, then skip it.
1279 if (any_of(MIB->uses(), [&ForwardedReg, &TRI](const MachineOperand &Use) {
1280 if (!Use.isReg())
1281 return false;
1282 return TRI->regsOverlap(Use.getReg(), ForwardedReg);
1283 }))
1284 continue;
1285
1286 // We aren't passing it already, so we should add it to the call.
1287 MIRBuilder.buildCopy(ForwardedReg, Register(F.VReg));
1288 MIB.addReg(ForwardedReg, RegState::Implicit);
1289 }
1290 }
1291
1292 // If we have -tailcallopt, we need to adjust the stack. We'll do the call
1293 // sequence start and end here.
1294 if (!IsSibCall) {
1295 MIB->getOperand(1).setImm(FPDiff);
1296 CallSeqStart.addImm(0).addImm(0);
1297 // End the call sequence *before* emitting the call. Normally, we would
1298 // tidy the frame up after the call. However, here, we've laid out the
1299 // parameters so that when SP is reset, they will be in the correct
1300 // location.
1301 MIRBuilder.buildInstr(AArch64::ADJCALLSTACKUP).addImm(0).addImm(0);
1302 }
1303
1304 // Now we can add the actual call instruction to the correct basic block.
1305 MIRBuilder.insertInstr(MIB);
1306
1307 // If Callee is a reg, since it is used by a target specific instruction,
1308 // it must have a register class matching the constraint of that instruction.
1309 if (MIB->getOperand(0).isReg())
1311 *MF.getSubtarget().getRegBankInfo(), *MIB,
1312 MIB->getDesc(), MIB->getOperand(0), 0);
1313
1315 Info.LoweredTailCall = true;
1316 return true;
1317}
1318
1320 CallLoweringInfo &Info) const {
1321 MachineFunction &MF = MIRBuilder.getMF();
1322 const Function &F = MF.getFunction();
1323 MachineRegisterInfo &MRI = MF.getRegInfo();
1324 auto &DL = F.getDataLayout();
1326 const AArch64Subtarget &Subtarget = MF.getSubtarget<AArch64Subtarget>();
1327
1328 // Arm64EC has extra requirements for varargs calls; bail out for now.
1329 //
1330 // Arm64EC has special mangling rules for calls; bail out on all calls for
1331 // now.
1332 if (Subtarget.isWindowsArm64EC())
1333 return false;
1334
1335 // Arm64EC thunks have a special calling convention which is only implemented
1336 // in SelectionDAG; bail out for now.
1337 if (Info.CallConv == CallingConv::ARM64EC_Thunk_Native ||
1338 Info.CallConv == CallingConv::ARM64EC_Thunk_X64)
1339 return false;
1340
1342 for (auto &OrigArg : Info.OrigArgs) {
1343 splitToValueTypes(OrigArg, OutArgs, DL, Info.CallConv);
1344 // AAPCS requires that we zero-extend i1 to 8 bits by the caller.
1345 auto &Flags = OrigArg.Flags[0];
1346 if (OrigArg.Ty->isIntegerTy(1) && !Flags.isSExt() && !Flags.isZExt()) {
1347 ArgInfo &OutArg = OutArgs.back();
1348 assert(OutArg.Regs.size() == 1 &&
1349 MRI.getType(OutArg.Regs[0]).getSizeInBits() == 1 &&
1350 "Unexpected registers used for i1 arg");
1351
1352 // We cannot use a ZExt ArgInfo flag here, because it will
1353 // zero-extend the argument to i32 instead of just i8.
1354 OutArg.Regs[0] =
1355 MIRBuilder.buildZExt(LLT::integer(8), OutArg.Regs[0]).getReg(0);
1356 LLVMContext &Ctx = MF.getFunction().getContext();
1357 OutArg.Ty = Type::getInt8Ty(Ctx);
1358 }
1359 }
1360
1362 if (!Info.OrigRet.Ty->isVoidTy())
1363 splitToValueTypes(Info.OrigRet, InArgs, DL, Info.CallConv);
1364
1365 // If we can lower as a tail call, do that instead.
1366 bool CanTailCallOpt =
1367 isEligibleForTailCallOptimization(MIRBuilder, Info, InArgs, OutArgs);
1368
1369 // We must emit a tail call if we have musttail.
1370 if (Info.IsMustTailCall && !CanTailCallOpt) {
1371 // There are types of incoming/outgoing arguments we can't handle yet, so
1372 // it doesn't make sense to actually die here like in ISelLowering. Instead,
1373 // fall back to SelectionDAG and let it try to handle this.
1374 LLVM_DEBUG(dbgs() << "Failed to lower musttail call as tail call\n");
1375 return false;
1376 }
1377
1378 Info.IsTailCall = CanTailCallOpt;
1379 if (CanTailCallOpt)
1380 return lowerTailCall(MIRBuilder, Info, OutArgs);
1381
1382 // Find out which ABI gets to decide where things go.
1383 CCAssignFn *AssignFnFixed;
1384 CCAssignFn *AssignFnVarArg;
1385 std::tie(AssignFnFixed, AssignFnVarArg) =
1386 getAssignFnsForCC(Info.CallConv, TLI);
1387
1388 MachineInstrBuilder CallSeqStart;
1389 CallSeqStart = MIRBuilder.buildInstr(AArch64::ADJCALLSTACKDOWN);
1390
1391 // Create a temporarily-floating call instruction so we can add the implicit
1392 // uses of arg registers.
1393
1394 unsigned Opc = 0;
1395 // Calls with operand bundle "clang.arc.attachedcall" are special. They should
1396 // be expanded to the call, directly followed by a special marker sequence and
1397 // a call to an ObjC library function.
1398 if (Info.CB && objcarc::hasAttachedCallOpBundle(Info.CB))
1399 Opc = Info.PAI ? AArch64::BLRA_RVMARKER : AArch64::BLR_RVMARKER;
1400 // A call to a returns twice function like setjmp must be followed by a bti
1401 // instruction.
1402 else if (Info.CB && Info.CB->hasFnAttr(Attribute::ReturnsTwice) &&
1403 !Subtarget.noBTIAtReturnTwice() &&
1405 Opc = AArch64::BLR_BTI;
1406 else {
1407 // For an intrinsic call (e.g. memset), use GOT if "RtLibUseGOT" (-fno-plt)
1408 // is set.
1409 if (Info.Callee.isSymbol() && F.getParent()->getRtLibUseGOT()) {
1410 auto MIB = MIRBuilder.buildInstr(TargetOpcode::G_GLOBAL_VALUE);
1411 DstOp(getLLTForType(*F.getType(), DL)).addDefToMIB(MRI, MIB);
1412 MIB.addExternalSymbol(Info.Callee.getSymbolName(), AArch64II::MO_GOT);
1413 Info.Callee = MachineOperand::CreateReg(MIB.getReg(0), false);
1414 }
1415 Opc = getCallOpcode(MF, Info.Callee.isReg(), false, Info.PAI, MRI);
1416 }
1417
1418 auto MIB = MIRBuilder.buildInstrNoInsert(Opc);
1419 unsigned CalleeOpNo = 0;
1420
1421 if (Opc == AArch64::BLR_RVMARKER || Opc == AArch64::BLRA_RVMARKER) {
1422 // Add a target global address for the retainRV/claimRV runtime function
1423 // just before the call target.
1424 Function *ARCFn = *objcarc::getAttachedARCFunction(Info.CB);
1425 MIB.addGlobalAddress(ARCFn);
1426 ++CalleeOpNo;
1427
1428 // We may or may not need to emit both the marker and the retain/claim call.
1429 // Tell the pseudo expansion using an additional boolean op.
1430 MIB.addImm(objcarc::attachedCallOpBundleNeedsMarker(Info.CB));
1431 ++CalleeOpNo;
1432 } else if (Info.CFIType) {
1433 MIB->setCFIType(MF, Info.CFIType->getZExtValue());
1434 }
1435 MIB->setDeactivationSymbol(MF, Info.DeactivationSymbol);
1436
1437 MIB.add(Info.Callee);
1438
1439 // Tell the call which registers are clobbered.
1440 const uint32_t *Mask;
1441 const auto *TRI = Subtarget.getRegisterInfo();
1442
1443 AArch64OutgoingValueAssigner Assigner(AssignFnFixed, AssignFnVarArg,
1444 Subtarget, /*IsReturn*/ false);
1445 // Do the actual argument marshalling.
1446 OutgoingArgHandler Handler(MIRBuilder, MRI, MIB, /*IsReturn*/ false);
1447 if (!determineAndHandleAssignments(Handler, Assigner, OutArgs, MIRBuilder,
1448 Info.CallConv, Info.IsVarArg))
1449 return false;
1450
1451 Mask = getMaskForArgs(OutArgs, Info, *TRI, MF);
1452
1453 if (Opc == AArch64::BLRA || Opc == AArch64::BLRA_RVMARKER) {
1454 assert((Info.PAI->Key == AArch64PACKey::IA ||
1455 Info.PAI->Key == AArch64PACKey::IB) &&
1456 "Invalid auth call key");
1457 MIB.addImm(Info.PAI->Key);
1458
1459 Register AddrDisc = 0;
1460 uint16_t IntDisc = 0;
1461 std::tie(IntDisc, AddrDisc) =
1462 extractPtrauthBlendDiscriminators(Info.PAI->Discriminator, MRI);
1463
1464 MIB.addImm(IntDisc);
1465 MIB.addUse(AddrDisc);
1466 if (AddrDisc != AArch64::NoRegister) {
1468 *MF.getSubtarget().getRegBankInfo(), *MIB,
1469 MIB->getDesc(), MIB->getOperand(CalleeOpNo + 3),
1470 CalleeOpNo + 3);
1471 }
1472 }
1473
1474 // Tell the call which registers are clobbered.
1476 TRI->UpdateCustomCallPreservedMask(MF, &Mask);
1477 MIB.addRegMask(Mask);
1478
1479 if (TRI->isAnyArgRegReserved(MF))
1480 TRI->emitReservedArgRegCallError(MF);
1481
1482 // Now we can add the actual call instruction to the correct basic block.
1483 MIRBuilder.insertInstr(MIB);
1484
1485 uint64_t CalleePopBytes =
1486 doesCalleeRestoreStack(Info.CallConv,
1488 ? alignTo(Assigner.StackSize, 16)
1489 : 0;
1490
1491 CallSeqStart.addImm(Assigner.StackSize).addImm(0);
1492 MIRBuilder.buildInstr(AArch64::ADJCALLSTACKUP)
1493 .addImm(Assigner.StackSize)
1494 .addImm(CalleePopBytes);
1495
1496 // If Callee is a reg, since it is used by a target specific
1497 // instruction, it must have a register class matching the
1498 // constraint of that instruction.
1499 if (MIB->getOperand(CalleeOpNo).isReg())
1500 constrainOperandRegClass(MF, *TRI, MRI, *Subtarget.getInstrInfo(),
1501 *Subtarget.getRegBankInfo(), *MIB, MIB->getDesc(),
1502 MIB->getOperand(CalleeOpNo), CalleeOpNo);
1503
1504 // Finally we can copy the returned value back into its virtual-register. In
1505 // symmetry with the arguments, the physical register must be an
1506 // implicit-define of the call instruction.
1507 if (Info.CanLowerReturn && !Info.OrigRet.Ty->isVoidTy()) {
1508 CCAssignFn *RetAssignFn = TLI.CCAssignFnForReturn(Info.CallConv);
1509 CallReturnHandler Handler(MIRBuilder, MRI, MIB);
1510 bool UsingReturnedArg =
1511 !OutArgs.empty() && OutArgs[0].Flags[0].isReturned();
1512
1513 AArch64OutgoingValueAssigner Assigner(RetAssignFn, RetAssignFn, Subtarget,
1514 /*IsReturn*/ false);
1515 ReturnedArgCallReturnHandler ReturnedArgHandler(MIRBuilder, MRI, MIB);
1517 UsingReturnedArg ? ReturnedArgHandler : Handler, Assigner, InArgs,
1518 MIRBuilder, Info.CallConv, Info.IsVarArg,
1519 UsingReturnedArg ? ArrayRef(OutArgs[0].Regs)
1520 : ArrayRef<Register>()))
1521 return false;
1522 }
1523
1524 if (Info.SwiftErrorVReg) {
1525 MIB.addDef(AArch64::X21, RegState::Implicit);
1526 MIRBuilder.buildCopy(Info.SwiftErrorVReg, Register(AArch64::X21));
1527 }
1528
1529 if (!Info.CanLowerReturn) {
1530 insertSRetLoads(MIRBuilder, Info.OrigRet.Ty, Info.OrigRet.Regs,
1531 Info.DemoteRegister, Info.DemoteStackIndex);
1532 }
1533 return true;
1534}
1535
1537 return Ty.getSizeInBits() == 64;
1538}
static void handleMustTailForwardedRegisters(MachineIRBuilder &MIRBuilder, CCAssignFn *AssignFn)
Helper function to compute forwarded registers for musttail calls.
static unsigned getCallOpcode(const MachineFunction &CallerF, bool IsIndirect, bool IsTailCall, std::optional< CallLowering::PtrAuthInfo > &PAI, MachineRegisterInfo &MRI)
static LLT getStackValueStoreTypeHack(const CCValAssign &VA)
static const uint32_t * getMaskForArgs(SmallVectorImpl< AArch64CallLowering::ArgInfo > &OutArgs, AArch64CallLowering::CallLoweringInfo &Info, const AArch64RegisterInfo &TRI, MachineFunction &MF)
static void applyStackPassedSmallTypeDAGHack(EVT OrigVT, MVT &ValVT, MVT &LocVT)
static std::pair< CCAssignFn *, CCAssignFn * > getAssignFnsForCC(CallingConv::ID CC, const AArch64TargetLowering &TLI)
Returns a pair containing the fixed CCAssignFn and the vararg CCAssignFn for CC.
static bool doesCalleeRestoreStack(CallingConv::ID CallConv, bool TailCallOpt)
This file describes how to lower LLVM calls to machine code calls.
MachineInstrBuilder MachineInstrBuilder & DefMI
static std::tuple< SDValue, SDValue > extractPtrauthBlendDiscriminators(SDValue Disc, SelectionDAG *DAG)
static bool shouldLowerTailCallStackArg(const MachineFunction &MF, const CCValAssign &VA, SDValue Arg, ISD::ArgFlagsTy Flags, int CallOffset)
Check whether a stack argument requires lowering in a tail call.
static const MCPhysReg GPRArgRegs[]
static const MCPhysReg FPRArgRegs[]
cl::opt< bool > EnableSVEGISel("aarch64-enable-gisel-sve", cl::Hidden, cl::desc("Enable / disable SVE scalable vectors in Global ISel"), cl::init(false))
static bool canGuaranteeTCO(CallingConv::ID CC, bool GuaranteeTailCalls)
Return true if the calling convention is one that we can guarantee TCO for.
static bool mayTailCallThisCC(CallingConv::ID CC)
Return true if we might ever do TCO for calls with this calling convention.
assert(UImm &&(UImm !=~static_cast< T >(0)) &&"Invalid immediate!")
MachineBasicBlock & MBB
MachineBasicBlock MachineBasicBlock::iterator DebugLoc DL
This file contains the simple types necessary to represent the attributes associated with functions a...
static GCRegistry::Add< ErlangGC > A("erlang", "erlang-compatible garbage collector")
Declares convenience wrapper classes for interpreting MachineInstr instances as specific generic oper...
Implement a low-level type suitable for MachineInstr level instruction selection.
#define F(x, y, z)
Definition MD5.cpp:54
This file declares the MachineIRBuilder class.
Register Reg
Register const TargetRegisterInfo * TRI
Promote Memory to Register
Definition Mem2Reg.cpp:110
static MCRegister getReg(const MCDisassembler *D, unsigned RC, unsigned RegNo)
This file defines ARC utility functions which are used by various parts of the compiler.
static constexpr MCPhysReg SPReg
This file defines the SmallVector class.
#define LLVM_DEBUG(...)
Definition Debug.h:119
bool lowerReturn(MachineIRBuilder &MIRBuilder, const Value *Val, ArrayRef< Register > VRegs, FunctionLoweringInfo &FLI, Register SwiftErrorVReg) const override
This hook must be implemented to lower outgoing return values, described by Val, into the specified v...
bool canLowerReturn(MachineFunction &MF, CallingConv::ID CallConv, SmallVectorImpl< BaseArgInfo > &Outs, bool IsVarArg) const override
This hook must be implemented to check whether the return values described by Outs can fit into the r...
bool fallBackToDAGISel(const MachineFunction &MF) const override
bool isTypeIsValidForThisReturn(EVT Ty) const override
For targets which support the "returned" parameter attribute, returns true if the given type is a val...
bool isEligibleForTailCallOptimization(MachineIRBuilder &MIRBuilder, CallLoweringInfo &Info, SmallVectorImpl< ArgInfo > &InArgs, SmallVectorImpl< ArgInfo > &OutArgs) const
Returns true if the call can be lowered as a tail call.
AArch64CallLowering(const AArch64TargetLowering &TLI)
bool lowerCall(MachineIRBuilder &MIRBuilder, CallLoweringInfo &Info) const override
This hook must be implemented to lower the given call instruction, including argument and return valu...
bool lowerFormalArguments(MachineIRBuilder &MIRBuilder, const Function &F, ArrayRef< ArrayRef< Register > > VRegs, FunctionLoweringInfo &FLI) const override
This hook must be implemented to lower the incoming (formal) arguments, described by VRegs,...
AArch64FunctionInfo - This class is derived from MachineFunctionInfo and contains private AArch64-spe...
void setTailCallReservedStack(unsigned bytes)
SmallVectorImpl< ForwardedRegister > & getForwardedMustTailRegParms()
void setBytesInStackArgArea(unsigned bytes)
void setArgumentStackToRestore(unsigned bytes)
const AArch64RegisterInfo * getRegisterInfo() const override
const AArch64InstrInfo * getInstrInfo() const override
bool isCallingConvWin64(CallingConv::ID CC, bool IsVarArg) const
const RegisterBankInfo * getRegBankInfo() const override
bool hasCustomCallingConv() const
CCAssignFn * CCAssignFnForCall(CallingConv::ID CC, bool IsVarArg) const
Selects the correct CCAssignFn for a given CallingConvention value.
This class represents an incoming formal argument to a Function.
Definition Argument.h:32
Represent a constant reference to an array (0 or more elements consecutively in memory),...
Definition ArrayRef.h:40
size_t size() const
Get the array size.
Definition ArrayRef.h:141
bool empty() const
Check if the array is empty.
Definition ArrayRef.h:136
CCState - This class holds information needed while lowering arguments and return values.
MachineFunction & getMachineFunction() const
unsigned getFirstUnallocated(ArrayRef< MCPhysReg > Regs) const
getFirstUnallocated - Return the index of the first unallocated register in the set,...
LLVM_ABI void analyzeMustTailForwardedRegisters(SmallVectorImpl< ForwardedRegister > &Forwards, ArrayRef< MVT > RegParmTypes, CCAssignFn Fn)
Compute the set of registers that need to be preserved and forwarded to any musttail calls.
CallingConv::ID getCallingConv() const
uint64_t getStackSize() const
Returns the size of the currently allocated portion of the stack.
bool isVarArg() const
bool isAllocated(MCRegister Reg) const
isAllocated - Return true if the specified register (or an alias) is allocated.
CCValAssign - Represent assignment of one arg/retval to a location.
LocInfo getLocInfo() const
static CCValAssign getReg(unsigned ValNo, MVT ValVT, MCRegister Reg, MVT LocVT, LocInfo HTP, bool IsCustom=false)
void insertSRetLoads(MachineIRBuilder &MIRBuilder, Type *RetTy, ArrayRef< Register > VRegs, Register DemoteReg, int FI) const
Load the returned value from the stack into virtual registers in VRegs.
bool handleAssignments(ValueHandler &Handler, SmallVectorImpl< ArgInfo > &Args, CCState &CCState, SmallVectorImpl< CCValAssign > &ArgLocs, MachineIRBuilder &MIRBuilder, ArrayRef< Register > ThisReturnRegs={}) const
Use Handler to insert code to handle the argument/return values represented by Args.
bool resultsCompatible(CallLoweringInfo &Info, MachineFunction &MF, SmallVectorImpl< ArgInfo > &InArgs, ValueAssigner &CalleeAssigner, ValueAssigner &CallerAssigner) const
void insertSRetIncomingArgument(const Function &F, SmallVectorImpl< ArgInfo > &SplitArgs, Register &DemoteReg, MachineRegisterInfo &MRI, const DataLayout &DL) const
Insert the hidden sret ArgInfo to the beginning of SplitArgs.
void splitToValueTypes(const ArgInfo &OrigArgInfo, SmallVectorImpl< ArgInfo > &SplitArgs, const DataLayout &DL, CallingConv::ID CallConv, SmallVectorImpl< TypeSize > *Offsets=nullptr) const
Break OrigArgInfo into one or more pieces the calling convention can process, returned in SplitArgs.
bool determineAndHandleAssignments(ValueHandler &Handler, ValueAssigner &Assigner, SmallVectorImpl< ArgInfo > &Args, MachineIRBuilder &MIRBuilder, CallingConv::ID CallConv, bool IsVarArg, ArrayRef< Register > ThisReturnRegs={}) const
Invoke ValueAssigner::assignArg on each of the given Args and then use Handler to move them to the as...
void insertSRetStores(MachineIRBuilder &MIRBuilder, Type *RetTy, ArrayRef< Register > VRegs, Register DemoteReg) const
Store the return value given by VRegs into stack starting at the offset specified in DemoteReg.
bool parametersInCSRMatch(const MachineRegisterInfo &MRI, const uint32_t *CallerPreservedMask, const SmallVectorImpl< CCValAssign > &ArgLocs, const SmallVectorImpl< ArgInfo > &OutVals) const
Check whether parameters to a call that are passed in callee saved registers are the same as from the...
bool determineAssignments(ValueAssigner &Assigner, SmallVectorImpl< ArgInfo > &Args, CCState &CCInfo) const
Analyze the argument list in Args, using Assigner to populate CCInfo.
bool checkReturn(CCState &CCInfo, SmallVectorImpl< BaseArgInfo > &Outs, CCAssignFn *Fn) const
CallLowering(const TargetLowering *TLI)
const TargetLowering * getTLI() const
Getter for generic TargetLowering class.
void setArgFlags(ArgInfo &Arg, unsigned OpIdx, const DataLayout &DL, const FuncInfoTy &FuncInfo) const
void addDefToMIB(MachineRegisterInfo &MRI, MachineInstrBuilder &MIB) const
FormalArgHandler(MachineIRBuilder &MIRBuilder, MachineRegisterInfo &MRI)
FunctionLoweringInfo - This contains information that is global to a function that is used when lower...
Register DemoteRegister
DemoteRegister - if CanLowerReturn is false, DemoteRegister is a vreg allocated to hold a pointer to ...
bool CanLowerReturn
CanLowerReturn - true iff the function's return value can be lowered to registers.
iterator_range< arg_iterator > args()
Definition Function.h:892
CallingConv::ID getCallingConv() const
getCallingConv()/setCallingConv(CC) - These method get and set the calling convention of this functio...
Definition Function.h:272
LLVMContext & getContext() const
getContext - Return a reference to the LLVMContext associated with this function.
Definition Function.cpp:354
bool isVarArg() const
isVarArg - Return true if this function takes a variable number of arguments.
Definition Function.h:229
bool hasExternalWeakLinkage() const
constexpr unsigned getScalarSizeInBits() const
static constexpr LLT scalar(unsigned SizeInBits)
Get a low-level scalar or aggregate "bag of bits".
constexpr uint16_t getNumElements() const
Returns the number of elements in a vector LLT.
constexpr bool isVector() const
static constexpr LLT pointer(unsigned AddressSpace, unsigned SizeInBits)
Get a low-level pointer in the given address space.
constexpr TypeSize getSizeInBits() const
Returns the total size of the type. Must only be called on sized types.
static LLT integer(unsigned SizeInBits)
constexpr TypeSize getSizeInBytes() const
Returns the total size of the type in bytes, i.e.
This is an important class for using LLVM in a threaded context.
Definition LLVMContext.h:68
Machine Value Type.
bool isVector() const
Return true if this is a vector value type.
The MachineFrameInfo class represents an abstract stack frame until prolog/epilog code is inserted.
LLVM_ABI int CreateFixedObject(uint64_t Size, int64_t SPOffset, bool IsImmutable, bool isAliased=false)
Create a new object at a fixed location on the stack.
LLVM_ABI int CreateStackObject(uint64_t Size, Align Alignment, bool isSpillSlot, const AllocaInst *Alloca=nullptr, uint8_t ID=0)
Create a new statically sized stack object, returning a nonnegative identifier to represent it.
bool isImmutableObjectIndex(int ObjectIdx) const
Returns true if the specified index corresponds to an immutable object.
void setHasTailCall(bool V=true)
bool hasMustTailInVarArgFunc() const
Returns true if the function is variadic and contains a musttail call.
int64_t getObjectSize(int ObjectIdx) const
Return the size of the specified object.
int64_t getObjectOffset(int ObjectIdx) const
Return the assigned stack offset of the specified object from the incoming stack pointer.
const TargetSubtargetInfo & getSubtarget() const
getSubtarget - Return the subtarget for which this machine code is being compiled.
MachineMemOperand * getMachineMemOperand(MachinePointerInfo PtrInfo, MachineMemOperand::Flags f, LLT MemTy, Align base_alignment, const AAMDNodes &AAInfo=AAMDNodes(), const MDNode *Ranges=nullptr, SyncScope::ID SSID=SyncScope::System, AtomicOrdering Ordering=AtomicOrdering::NotAtomic, AtomicOrdering FailureOrdering=AtomicOrdering::NotAtomic)
getMachineMemOperand - Allocate a new MachineMemOperand.
MachineFrameInfo & getFrameInfo()
getFrameInfo - Return the frame info object for the current function.
MachineRegisterInfo & getRegInfo()
getRegInfo - Return information about the registers currently in use.
Function & getFunction()
Return the LLVM function that this machine code represents.
Ty * getInfo()
getInfo - Keep track of various per-function pieces of information for backends that would like to do...
Register addLiveIn(MCRegister PReg, const TargetRegisterClass *RC)
addLiveIn - Add the specified physical register as a live-in value and create a corresponding virtual...
const TargetMachine & getTarget() const
getTarget - Return the target machine this machine code is compiled with
Helper class to build MachineInstr.
MachineInstrBuilder insertInstr(MachineInstrBuilder MIB)
Insert an existing instruction at the insertion point.
MachineInstrBuilder buildZExt(const DstOp &Res, const SrcOp &Op, std::optional< unsigned > Flags=std::nullopt)
Build and insert Res = G_ZEXT Op.
void setInstr(MachineInstr &MI)
Set the insertion point to before MI.
MachineInstrBuilder buildAssertZExt(const DstOp &Res, const SrcOp &Op, unsigned Size)
Build and insert Res = G_ASSERT_ZEXT Op, Size.
MachineInstrBuilder buildPtrAdd(const DstOp &Res, const SrcOp &Op0, const SrcOp &Op1, std::optional< unsigned > Flags=std::nullopt)
Build and insert Res = G_PTR_ADD Op0, Op1.
MachineInstrBuilder buildStore(const SrcOp &Val, const SrcOp &Addr, MachineMemOperand &MMO)
Build and insert G_STORE Val, Addr, MMO.
MachineInstrBuilder buildInstr(unsigned Opcode)
Build and insert <empty> = Opcode <empty>.
MachineInstrBuilder buildPadVectorWithUndefElements(const DstOp &Res, const SrcOp &Op0)
Build and insert a, b, ..., x = G_UNMERGE_VALUES Op0 Res = G_BUILD_VECTOR a, b, .....
MachineInstrBuilder buildFrameIndex(const DstOp &Res, int Idx)
Build and insert Res = G_FRAME_INDEX Idx.
MachineFunction & getMF()
Getter for the function we currently build.
MachineInstrBuilder buildTrunc(const DstOp &Res, const SrcOp &Op, std::optional< unsigned > Flags=std::nullopt)
Build and insert Res = G_TRUNC Op.
const MachineBasicBlock & getMBB() const
Getter for the basic block we currently build.
void setMBB(MachineBasicBlock &MBB)
Set the insertion point to the end of MBB.
MachineInstrBuilder buildInstrNoInsert(unsigned Opcode)
Build but don't insert <empty> = Opcode <empty>.
MachineInstrBuilder buildCopy(const DstOp &Res, const SrcOp &Op)
Build and insert Res = COPY Op.
virtual MachineInstrBuilder buildConstant(const DstOp &Res, const ConstantInt &Val)
Build and insert Res = G_CONSTANT Val.
Register getReg(unsigned Idx) const
Get the register for the operand index.
const MachineInstrBuilder & addReg(Register RegNo, RegState Flags={}, unsigned SubReg=0) const
Add a new virtual register operand.
const MachineInstrBuilder & addImm(int64_t Val) const
Add a new immediate operand.
const MachineInstrBuilder & add(const MachineOperand &MO) const
const MachineInstrBuilder & addDef(Register RegNo, RegState Flags={}, unsigned SubReg=0) const
Add a virtual register definition operand.
unsigned getOpcode() const
Returns the opcode of this MachineInstr.
const MachineOperand & getOperand(unsigned i) const
LLVM_ABI void setDeactivationSymbol(MachineFunction &MF, Value *DS)
@ MOLoad
The memory access reads data.
@ MOInvariant
The memory access always returns the same value (or traps).
@ MOStore
The memory access writes data.
Register getReg() const
getReg - Returns the register number.
static MachineOperand CreateReg(Register Reg, bool isDef, bool isImp=false, bool isKill=false, bool isDead=false, bool isUndef=false, bool isEarlyClobber=false, unsigned SubReg=0, bool isDebug=false, bool isInternalRead=false, bool isRenamable=false)
MachineRegisterInfo - Keep track of information for virtual and physical registers,...
LLVM_ABI MachineInstr * getVRegDef(Register Reg) const
getVRegDef - Return the machine instr that defines the specified virtual register or null if none is ...
LLT getType(Register Reg) const
Get the low-level type of Reg or LLT{} if Reg is not a generic (target independent) virtual register.
LLVM_ABI Register createGenericVirtualRegister(LLT Ty, StringRef Name="")
Create and return a new generic virtual register with low-level type Ty.
Wrapper class representing virtual and physical registers.
Definition Register.h:20
MCRegister asMCReg() const
Utility to check-convert this value to a MCRegister.
Definition Register.h:107
SMEAttrs is a utility class to parse the SME ACLE attributes on functions.
This class consists of common code factored out of the SmallVector class to reduce code duplication b...
void push_back(const T &Elt)
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small.
CodeGenOptLevel getOptLevel() const
Returns the optimization level: None, Less, Default, or Aggressive.
const Triple & getTargetTriple() const
TargetOptions Options
unsigned GuaranteedTailCallOpt
GuaranteedTailCallOpt - This flag is enabled when -tailcallopt is specified on the commandline.
virtual const RegisterBankInfo * getRegBankInfo() const
If the information for the register banks is available, return it.
virtual const TargetInstrInfo * getInstrInfo() const
Triple - Helper class for working with autoconf configuration names.
Definition Triple.h:47
static constexpr TypeSize getFixed(ScalarTy ExactSize)
Definition TypeSize.h:343
static LLVM_ABI IntegerType * getInt8Ty(LLVMContext &C)
Definition Type.cpp:307
LLVMContext & getContext() const
Return the LLVMContext in which this type was uniqued.
Definition Type.h:130
bool isIntegerTy() const
True if this is an instance of IntegerType.
Definition Type.h:257
unsigned getNumOperands() const
Definition User.h:229
LLVM Value Representation.
Definition Value.h:75
Type * getType() const
All values are typed, get the type of this value.
Definition Value.h:255
@ MO_GOT
MO_GOT - This flag indicates that a symbol operand represents the address of the GOT entry for the sy...
ArrayRef< MCPhysReg > getFPRArgRegs()
ArrayRef< MCPhysReg > getGPRArgRegs()
constexpr char Align[]
Key for Kernel::Arg::Metadata::mAlign.
constexpr std::underlying_type_t< E > Mask()
Get a bitmask with 1s in all places up to the high-order bit of E's largest value.
unsigned ID
LLVM IR allows to use arbitrary numbers as calling convention identifiers.
Definition CallingConv.h:24
@ ARM64EC_Thunk_Native
Calling convention used in the ARM64EC ABI to implement calls between ARM64 code and thunks.
@ Swift
Calling convention for Swift.
Definition CallingConv.h:69
@ PreserveMost
Used for runtime calls that preserves most registers.
Definition CallingConv.h:63
@ PreserveAll
Used for runtime calls that preserves (almost) all registers.
Definition CallingConv.h:66
@ Fast
Attempts to make calls as fast as possible (e.g.
Definition CallingConv.h:41
@ PreserveNone
Used for runtime calls that preserves none general registers.
Definition CallingConv.h:90
@ Tail
Attemps to make calls as fast as possible while guaranteeing that tail call optimization can always b...
Definition CallingConv.h:76
@ SwiftTail
This follows the Swift calling convention in how arguments are passed but guarantees tail calls will ...
Definition CallingConv.h:87
@ ARM64EC_Thunk_X64
Calling convention used in the ARM64EC ABI to implement calls between x64 code and thunks.
@ C
The default llvm calling convention, compatible with C.
Definition CallingConv.h:34
std::optional< Function * > getAttachedARCFunction(const CallBase *CB)
This function returns operand bundle clang_arc_attachedcall's argument, which is the address of the A...
Definition ObjCARCUtil.h:43
bool attachedCallOpBundleNeedsMarker(const CallBase *CB)
This function determines whether the clang_arc_attachedcall should be emitted with or without the mar...
Definition ObjCARCUtil.h:58
bool hasAttachedCallOpBundle(const CallBase *CB)
Definition ObjCARCUtil.h:29
This is an optimization pass for GlobalISel generic memory operations.
@ Offset
Definition DWP.cpp:558
LLVM_ABI Register constrainOperandRegClass(const MachineFunction &MF, const TargetRegisterInfo &TRI, MachineRegisterInfo &MRI, const TargetInstrInfo &TII, const RegisterBankInfo &RBI, MachineInstr &InsertPt, const TargetRegisterClass &RegClass, MachineOperand &RegMO)
Constrain the Register operand OpIdx, so that it is now constrained to the TargetRegisterClass passed...
Definition Utils.cpp:60
@ Implicit
Not emitted register (e.g. carry, or temporary result).
LLVM_ABI void ComputeValueVTs(const TargetLowering &TLI, const DataLayout &DL, Type *Ty, SmallVectorImpl< EVT > &ValueVTs, SmallVectorImpl< EVT > *MemVTs=nullptr, SmallVectorImpl< TypeSize > *Offsets=nullptr, TypeSize StartingOffset=TypeSize::getZero())
ComputeValueVTs - Given an LLVM IR type, compute a sequence of EVTs that represent all the individual...
Definition Analysis.cpp:119
decltype(auto) dyn_cast(const From &Val)
dyn_cast<X> - Return the argument parameter cast to the specified type.
Definition Casting.h:643
bool CCAssignFn(unsigned ValNo, MVT ValVT, MVT LocVT, CCValAssign::LocInfo LocInfo, ISD::ArgFlagsTy ArgFlags, Type *OrigTy, CCState &State)
CCAssignFn - This function assigns a location for Val, updating State to reflect the change.
void append_range(Container &C, Range &&R)
Wrapper function to append range R to container C.
Definition STLExtras.h:2207
unsigned getBLRCallOpcode(const MachineFunction &MF)
Return opcode to be used for indirect calls.
bool any_of(R &&range, UnaryPredicate P)
Provide wrappers to std::any_of which take ranges instead of having to pass begin/end explicitly.
Definition STLExtras.h:1745
LLVM_ABI raw_ostream & dbgs()
dbgs() - This returns a reference to a raw_ostream for debugging messages.
Definition Debug.cpp:209
constexpr uint64_t alignTo(uint64_t Size, Align A)
Returns a multiple of A needed to store Size bytes.
Definition Alignment.h:144
class LLVM_GSL_OWNER SmallVector
Forward declaration of SmallVector so that calculateSmallVectorDefaultInlinedElements can reference s...
@ Success
The lock was released successfully.
DWARFExpression::Operation Op
LLVM_ABI bool isAssertMI(const MachineInstr &MI)
Returns true if the instruction MI is one of the assert instructions.
Definition Utils.cpp:1994
LLVM_ABI LLT getLLTForType(Type &Ty, const DataLayout &DL)
Construct a low-level type based on an LLVM type.
LLVM_ABI CGPassBuilderOption getCGPassBuilderOption()
LLVM_ABI Align inferAlignFromPtrInfo(MachineFunction &MF, const MachinePointerInfo &MPO)
Definition Utils.cpp:844
void swap(llvm::BitVector &LHS, llvm::BitVector &RHS)
Implement std::swap in terms of BitVector swap.
Definition BitVector.h:862
This struct is a compact representation of a valid (non-zero power of two) alignment.
Definition Alignment.h:39
cl::boolOrDefault EnableGlobalISelOption
SmallVector< Register, 4 > Regs
SmallVector< ISD::ArgFlagsTy, 4 > Flags
Base class for ValueHandlers used for arguments coming into the current function, or for return value...
void assignValueToReg(Register ValVReg, Register PhysReg, const CCValAssign &VA, ISD::ArgFlagsTy Flags={}) override
Provides a default implementation for argument handling.
Base class for ValueHandlers used for arguments passed to a function call, or for return values.
virtual LLT getStackValueStoreType(const DataLayout &DL, const CCValAssign &VA, ISD::ArgFlagsTy Flags) const
Return the in-memory size to write for the argument at VA.
Extended Value Type.
Definition ValueTypes.h:35
LLVM_ABI Type * getTypeForEVT(LLVMContext &Context) const
This method returns an LLVM type corresponding to the specified EVT.
Describes a register that needs to be forwarded from the prologue to a musttail call.
This class contains a discriminated union of information about pointers in memory operands,...
static LLVM_ABI MachinePointerInfo getStack(MachineFunction &MF, int64_t Offset, uint8_t ID=0)
Stack pointer relative access.
static LLVM_ABI MachinePointerInfo getFixedStack(MachineFunction &MF, int FI, int64_t Offset=0)
Return a MachinePointerInfo record that refers to the specified FrameIndex.