LLVM 23.0.0git
RISCVInstrInfo.cpp
Go to the documentation of this file.
1//===-- RISCVInstrInfo.cpp - RISC-V Instruction Information -----*- C++ -*-===//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7//===----------------------------------------------------------------------===//
8//
9// This file contains the RISC-V implementation of the TargetInstrInfo class.
10//
11//===----------------------------------------------------------------------===//
12
13#include "RISCVInstrInfo.h"
16#include "RISCV.h"
18#include "RISCVSubtarget.h"
19#include "llvm/ADT/STLExtras.h"
21#include "llvm/ADT/Statistic.h"
33#include "llvm/IR/Module.h"
34#include "llvm/MC/MCDwarf.h"
38
39using namespace llvm;
40
41#define GEN_CHECK_COMPRESS_INSTR
42#include "RISCVGenCompressInstEmitter.inc"
43
44#define GET_INSTRINFO_CTOR_DTOR
45#include "RISCVGenInstrInfo.inc"
46
47#define DEBUG_TYPE "riscv-instr-info"
48STATISTIC(NumVRegSpilled,
49 "Number of registers within vector register groups spilled");
50STATISTIC(NumVRegReloaded,
51 "Number of registers within vector register groups reloaded");
52
54 "riscv-prefer-whole-register-move", cl::init(false), cl::Hidden,
55 cl::desc("Prefer whole register move for vector registers."));
56
58 "riscv-force-machine-combiner-strategy", cl::Hidden,
59 cl::desc("Force machine combiner to use a specific strategy for machine "
60 "trace metrics evaluation."),
63 "Local strategy."),
65 "MinInstrCount strategy.")));
66
68 "riscv-outliner-regsave", cl::init(true), cl::Hidden,
69 cl::desc("Enable RegSave strategy in machine outliner (save X5 to a "
70 "temporary register when X5 is live across outlined calls)."));
71
73
74using namespace RISCV;
75
76#define GET_RISCVVPseudosTable_IMPL
77#include "RISCVGenSearchableTables.inc"
78
79} // namespace llvm::RISCVVPseudosTable
80
81namespace llvm::RISCV {
82
83#define GET_RISCVMaskedPseudosTable_IMPL
84#include "RISCVGenSearchableTables.inc"
85
86} // end namespace llvm::RISCV
87
89 : RISCVGenInstrInfo(STI, RegInfo, RISCV::ADJCALLSTACKDOWN,
90 RISCV::ADJCALLSTACKUP),
91 RegInfo(STI.getHwMode()), STI(STI) {}
92
93#define GET_INSTRINFO_HELPERS
94#include "RISCVGenInstrInfo.inc"
95
97 if (STI.hasStdExtZca())
98 return MCInstBuilder(RISCV::C_NOP);
99 return MCInstBuilder(RISCV::ADDI)
100 .addReg(RISCV::X0)
101 .addReg(RISCV::X0)
102 .addImm(0);
103}
104
106 int &FrameIndex) const {
107 TypeSize Dummy = TypeSize::getZero();
108 return isLoadFromStackSlot(MI, FrameIndex, Dummy);
109}
110
111static std::optional<unsigned> getLMULForRVVWholeLoadStore(unsigned Opcode) {
112 switch (Opcode) {
113 default:
114 return std::nullopt;
115 case RISCV::VS1R_V:
116 case RISCV::VL1RE8_V:
117 case RISCV::VL1RE16_V:
118 case RISCV::VL1RE32_V:
119 case RISCV::VL1RE64_V:
120 return 1;
121 case RISCV::VS2R_V:
122 case RISCV::VL2RE8_V:
123 case RISCV::VL2RE16_V:
124 case RISCV::VL2RE32_V:
125 case RISCV::VL2RE64_V:
126 return 2;
127 case RISCV::VS4R_V:
128 case RISCV::VL4RE8_V:
129 case RISCV::VL4RE16_V:
130 case RISCV::VL4RE32_V:
131 case RISCV::VL4RE64_V:
132 return 4;
133 case RISCV::VS8R_V:
134 case RISCV::VL8RE8_V:
135 case RISCV::VL8RE16_V:
136 case RISCV::VL8RE32_V:
137 case RISCV::VL8RE64_V:
138 return 8;
139 }
140}
141
143 int &FrameIndex,
144 TypeSize &MemBytes) const {
145 switch (MI.getOpcode()) {
146 default:
147 return 0;
148 case RISCV::LB:
149 case RISCV::LBU:
150 MemBytes = TypeSize::getFixed(1);
151 break;
152 case RISCV::LH:
153 case RISCV::LH_INX:
154 case RISCV::LHU:
155 case RISCV::FLH:
156 MemBytes = TypeSize::getFixed(2);
157 break;
158 case RISCV::LW:
159 case RISCV::LW_INX:
160 case RISCV::FLW:
161 case RISCV::LWU:
162 MemBytes = TypeSize::getFixed(4);
163 break;
164 case RISCV::LD:
165 case RISCV::LD_RV32:
166 case RISCV::FLD:
167 MemBytes = TypeSize::getFixed(8);
168 break;
169 case RISCV::VL1RE8_V:
170 case RISCV::VL2RE8_V:
171 case RISCV::VL4RE8_V:
172 case RISCV::VL8RE8_V:
173 if (!MI.getOperand(1).isFI())
174 return Register();
175 FrameIndex = MI.getOperand(1).getIndex();
176 unsigned LMUL = *getLMULForRVVWholeLoadStore(MI.getOpcode());
178 return MI.getOperand(0).getReg();
179 }
180
181 if (MI.getOperand(1).isFI() && MI.getOperand(2).isImm() &&
182 MI.getOperand(2).getImm() == 0) {
183 FrameIndex = MI.getOperand(1).getIndex();
184 return MI.getOperand(0).getReg();
185 }
186
187 return 0;
188}
189
191 int &FrameIndex) const {
192 TypeSize Dummy = TypeSize::getZero();
193 return isStoreToStackSlot(MI, FrameIndex, Dummy);
194}
195
197 int &FrameIndex,
198 TypeSize &MemBytes) const {
199 switch (MI.getOpcode()) {
200 default:
201 return 0;
202 case RISCV::SB:
203 MemBytes = TypeSize::getFixed(1);
204 break;
205 case RISCV::SH:
206 case RISCV::SH_INX:
207 case RISCV::FSH:
208 MemBytes = TypeSize::getFixed(2);
209 break;
210 case RISCV::SW:
211 case RISCV::SW_INX:
212 case RISCV::FSW:
213 MemBytes = TypeSize::getFixed(4);
214 break;
215 case RISCV::SD:
216 case RISCV::SD_RV32:
217 case RISCV::FSD:
218 MemBytes = TypeSize::getFixed(8);
219 break;
220 case RISCV::VS1R_V:
221 case RISCV::VS2R_V:
222 case RISCV::VS4R_V:
223 case RISCV::VS8R_V:
224 if (!MI.getOperand(1).isFI())
225 return Register();
226 FrameIndex = MI.getOperand(1).getIndex();
227 unsigned LMUL = *getLMULForRVVWholeLoadStore(MI.getOpcode());
229 return MI.getOperand(0).getReg();
230 }
231
232 if (MI.getOperand(1).isFI() && MI.getOperand(2).isImm() &&
233 MI.getOperand(2).getImm() == 0) {
234 FrameIndex = MI.getOperand(1).getIndex();
235 return MI.getOperand(0).getReg();
236 }
237
238 return 0;
239}
240
242 const MachineInstr &MI) const {
243 switch (RISCV::getRVVMCOpcode(MI.getOpcode())) {
244 case RISCV::VMV_V_X:
245 case RISCV::VFMV_V_F:
246 case RISCV::VMV_V_I:
247 case RISCV::VMV_S_X:
248 case RISCV::VFMV_S_F:
249 case RISCV::VID_V:
250 return MI.getOperand(1).isUndef();
251 default:
253 }
254}
255
256static bool forwardCopyWillClobberTuple(unsigned DstReg, unsigned SrcReg,
257 unsigned NumRegs) {
258 return DstReg > SrcReg && (DstReg - SrcReg) < NumRegs;
259}
260
262 const MachineBasicBlock &MBB,
265 RISCVVType::VLMUL LMul) {
267 return false;
268
269 assert(MBBI->getOpcode() == TargetOpcode::COPY &&
270 "Unexpected COPY instruction.");
271 Register SrcReg = MBBI->getOperand(1).getReg();
273
274 bool FoundDef = false;
275 bool FirstVSetVLI = false;
276 unsigned FirstSEW = 0;
277 while (MBBI != MBB.begin()) {
278 --MBBI;
279 if (MBBI->isMetaInstruction())
280 continue;
281
282 if (RISCVInstrInfo::isVectorConfigInstr(*MBBI)) {
283 // There is a vsetvli between COPY and source define instruction.
284 // vy = def_vop ... (producing instruction)
285 // ...
286 // vsetvli
287 // ...
288 // vx = COPY vy
289 if (!FoundDef) {
290 if (!FirstVSetVLI) {
291 FirstVSetVLI = true;
292 unsigned FirstVType = MBBI->getOperand(2).getImm();
293 RISCVVType::VLMUL FirstLMul = RISCVVType::getVLMUL(FirstVType);
294 FirstSEW = RISCVVType::getSEW(FirstVType);
295 // The first encountered vsetvli must have the same lmul as the
296 // register class of COPY.
297 if (FirstLMul != LMul)
298 return false;
299 }
300 // Only permit `vsetvli x0, x0, vtype` between COPY and the source
301 // define instruction.
302 if (!RISCVInstrInfo::isVLPreservingConfig(*MBBI))
303 return false;
304 continue;
305 }
306
307 // MBBI is the first vsetvli before the producing instruction.
308 unsigned VType = MBBI->getOperand(2).getImm();
309 // If there is a vsetvli between COPY and the producing instruction.
310 if (FirstVSetVLI) {
311 // If SEW is different, return false.
312 if (RISCVVType::getSEW(VType) != FirstSEW)
313 return false;
314 }
315
316 // If the vsetvli is tail undisturbed, keep the whole register move.
317 if (!RISCVVType::isTailAgnostic(VType))
318 return false;
319
320 // The checking is conservative. We only have register classes for
321 // LMUL = 1/2/4/8. We should be able to convert vmv1r.v to vmv.v.v
322 // for fractional LMUL operations. However, we could not use the vsetvli
323 // lmul for widening operations. The result of widening operation is
324 // 2 x LMUL.
325 return LMul == RISCVVType::getVLMUL(VType);
326 } else if (MBBI->isInlineAsm() || MBBI->isCall()) {
327 return false;
328 } else if (MBBI->getNumDefs()) {
329 // Check all the instructions which will change VL.
330 // For example, vleff has implicit def VL.
331 if (MBBI->modifiesRegister(RISCV::VL, /*TRI=*/nullptr))
332 return false;
333
334 // Only converting whole register copies to vmv.v.v when the defining
335 // value appears in the explicit operands.
336 for (const MachineOperand &MO : MBBI->explicit_operands()) {
337 if (!MO.isReg() || !MO.isDef())
338 continue;
339 if (!FoundDef && TRI->regsOverlap(MO.getReg(), SrcReg)) {
340 // We only permit the source of COPY has the same LMUL as the defined
341 // operand.
342 // There are cases we need to keep the whole register copy if the LMUL
343 // is different.
344 // For example,
345 // $x0 = PseudoVSETIVLI 4, 73 // vsetivli zero, 4, e16,m2,ta,m
346 // $v28m4 = PseudoVWADD_VV_M2 $v26m2, $v8m2
347 // # The COPY may be created by vlmul_trunc intrinsic.
348 // $v26m2 = COPY renamable $v28m2, implicit killed $v28m4
349 //
350 // After widening, the valid value will be 4 x e32 elements. If we
351 // convert the COPY to vmv.v.v, it will only copy 4 x e16 elements.
352 // FIXME: The COPY of subregister of Zvlsseg register will not be able
353 // to convert to vmv.v.[v|i] under the constraint.
354 if (MO.getReg() != SrcReg)
355 return false;
356
357 // In widening reduction instructions with LMUL_1 input vector case,
358 // only checking the LMUL is insufficient due to reduction result is
359 // always LMUL_1.
360 // For example,
361 // $x11 = PseudoVSETIVLI 1, 64 // vsetivli a1, 1, e8, m1, ta, mu
362 // $v8m1 = PseudoVWREDSUM_VS_M1 $v26, $v27
363 // $v26 = COPY killed renamable $v8
364 // After widening, The valid value will be 1 x e16 elements. If we
365 // convert the COPY to vmv.v.v, it will only copy 1 x e8 elements.
366 uint64_t TSFlags = MBBI->getDesc().TSFlags;
368 return false;
369
370 // If the producing instruction does not depend on vsetvli, do not
371 // convert COPY to vmv.v.v. For example, VL1R_V or PseudoVRELOAD.
372 if (!RISCVII::hasSEWOp(TSFlags) || !RISCVII::hasVLOp(TSFlags))
373 return false;
374
375 // Found the definition.
376 FoundDef = true;
377 DefMBBI = MBBI;
378 break;
379 }
380 }
381 }
382 }
383
384 return false;
385}
386
389 const DebugLoc &DL, MCRegister DstReg, MCRegister SrcReg, bool KillSrc,
390 const TargetRegisterClass *RegClass) const {
391 const RISCVRegisterInfo *TRI = STI.getRegisterInfo();
393 unsigned NF = RISCVRI::getNF(RegClass->TSFlags);
394
395 uint16_t SrcEncoding = TRI->getEncodingValue(SrcReg);
396 uint16_t DstEncoding = TRI->getEncodingValue(DstReg);
397 auto [LMulVal, Fractional] = RISCVVType::decodeVLMUL(LMul);
398 assert(!Fractional && "It is impossible be fractional lmul here.");
399 unsigned NumRegs = NF * LMulVal;
400 bool ReversedCopy =
401 forwardCopyWillClobberTuple(DstEncoding, SrcEncoding, NumRegs);
402 if (ReversedCopy) {
403 // If the src and dest overlap when copying a tuple, we need to copy the
404 // registers in reverse.
405 SrcEncoding += NumRegs - 1;
406 DstEncoding += NumRegs - 1;
407 }
408
409 unsigned I = 0;
410 auto GetCopyInfo = [&](uint16_t SrcEncoding, uint16_t DstEncoding)
411 -> std::tuple<RISCVVType::VLMUL, const TargetRegisterClass &, unsigned,
412 unsigned, unsigned> {
413 if (ReversedCopy) {
414 // For reversed copying, if there are enough aligned registers(8/4/2), we
415 // can do a larger copy(LMUL8/4/2).
416 // Besides, we have already known that DstEncoding is larger than
417 // SrcEncoding in forwardCopyWillClobberTuple, so the difference between
418 // DstEncoding and SrcEncoding should be >= LMUL value we try to use to
419 // avoid clobbering.
420 uint16_t Diff = DstEncoding - SrcEncoding;
421 if (I + 8 <= NumRegs && Diff >= 8 && SrcEncoding % 8 == 7 &&
422 DstEncoding % 8 == 7)
423 return {RISCVVType::LMUL_8, RISCV::VRM8RegClass, RISCV::VMV8R_V,
424 RISCV::PseudoVMV_V_V_M8, RISCV::PseudoVMV_V_I_M8};
425 if (I + 4 <= NumRegs && Diff >= 4 && SrcEncoding % 4 == 3 &&
426 DstEncoding % 4 == 3)
427 return {RISCVVType::LMUL_4, RISCV::VRM4RegClass, RISCV::VMV4R_V,
428 RISCV::PseudoVMV_V_V_M4, RISCV::PseudoVMV_V_I_M4};
429 if (I + 2 <= NumRegs && Diff >= 2 && SrcEncoding % 2 == 1 &&
430 DstEncoding % 2 == 1)
431 return {RISCVVType::LMUL_2, RISCV::VRM2RegClass, RISCV::VMV2R_V,
432 RISCV::PseudoVMV_V_V_M2, RISCV::PseudoVMV_V_I_M2};
433 // Or we should do LMUL1 copying.
434 return {RISCVVType::LMUL_1, RISCV::VRRegClass, RISCV::VMV1R_V,
435 RISCV::PseudoVMV_V_V_M1, RISCV::PseudoVMV_V_I_M1};
436 }
437
438 // For forward copying, if source register encoding and destination register
439 // encoding are aligned to 8/4/2, we can do a LMUL8/4/2 copying.
440 if (I + 8 <= NumRegs && SrcEncoding % 8 == 0 && DstEncoding % 8 == 0)
441 return {RISCVVType::LMUL_8, RISCV::VRM8RegClass, RISCV::VMV8R_V,
442 RISCV::PseudoVMV_V_V_M8, RISCV::PseudoVMV_V_I_M8};
443 if (I + 4 <= NumRegs && SrcEncoding % 4 == 0 && DstEncoding % 4 == 0)
444 return {RISCVVType::LMUL_4, RISCV::VRM4RegClass, RISCV::VMV4R_V,
445 RISCV::PseudoVMV_V_V_M4, RISCV::PseudoVMV_V_I_M4};
446 if (I + 2 <= NumRegs && SrcEncoding % 2 == 0 && DstEncoding % 2 == 0)
447 return {RISCVVType::LMUL_2, RISCV::VRM2RegClass, RISCV::VMV2R_V,
448 RISCV::PseudoVMV_V_V_M2, RISCV::PseudoVMV_V_I_M2};
449 // Or we should do LMUL1 copying.
450 return {RISCVVType::LMUL_1, RISCV::VRRegClass, RISCV::VMV1R_V,
451 RISCV::PseudoVMV_V_V_M1, RISCV::PseudoVMV_V_I_M1};
452 };
453
454 while (I != NumRegs) {
455 // For non-segment copying, we only do this once as the registers are always
456 // aligned.
457 // For segment copying, we may do this several times. If the registers are
458 // aligned to larger LMUL, we can eliminate some copyings.
459 auto [LMulCopied, RegClass, Opc, VVOpc, VIOpc] =
460 GetCopyInfo(SrcEncoding, DstEncoding);
461 auto [NumCopied, _] = RISCVVType::decodeVLMUL(LMulCopied);
462
464 if (LMul == LMulCopied &&
465 isConvertibleToVMV_V_V(STI, MBB, MBBI, DefMBBI, LMul)) {
466 Opc = VVOpc;
467 if (DefMBBI->getOpcode() == VIOpc)
468 Opc = VIOpc;
469 }
470
471 // Emit actual copying.
472 // For reversed copying, the encoding should be decreased.
473 MCRegister ActualSrcReg = TRI->findVRegWithEncoding(
474 RegClass, ReversedCopy ? (SrcEncoding - NumCopied + 1) : SrcEncoding);
475 MCRegister ActualDstReg = TRI->findVRegWithEncoding(
476 RegClass, ReversedCopy ? (DstEncoding - NumCopied + 1) : DstEncoding);
477
478 auto MIB = BuildMI(MBB, MBBI, DL, get(Opc), ActualDstReg);
479 bool UseVMV_V_I = RISCV::getRVVMCOpcode(Opc) == RISCV::VMV_V_I;
480 bool UseVMV = UseVMV_V_I || RISCV::getRVVMCOpcode(Opc) == RISCV::VMV_V_V;
481 if (UseVMV)
482 MIB.addReg(ActualDstReg, RegState::Undef);
483 if (UseVMV_V_I)
484 MIB = MIB.add(DefMBBI->getOperand(2));
485 else
486 MIB = MIB.addReg(ActualSrcReg, getKillRegState(KillSrc));
487 if (UseVMV) {
488 const MCInstrDesc &Desc = DefMBBI->getDesc();
489 MIB.add(DefMBBI->getOperand(RISCVII::getVLOpNum(Desc))); // AVL
490 unsigned Log2SEW =
491 DefMBBI->getOperand(RISCVII::getSEWOpNum(Desc)).getImm();
492 MIB.addImm(Log2SEW ? Log2SEW : 3); // SEW
493 MIB.addImm(0); // tu, mu
494 MIB.addReg(RISCV::VL, RegState::Implicit);
495 MIB.addReg(RISCV::VTYPE, RegState::Implicit);
496 }
497 // Add an implicit read of the original source to silence the verifier
498 // in the cases where some of the smaller VRs we're copying from might be
499 // undef, caused by the fact that the original, larger source VR might not
500 // be fully initialized at the time this COPY happens.
501 MIB.addReg(SrcReg, RegState::Implicit);
502
503 // If we are copying reversely, we should decrease the encoding.
504 SrcEncoding += (ReversedCopy ? -NumCopied : NumCopied);
505 DstEncoding += (ReversedCopy ? -NumCopied : NumCopied);
506 I += NumCopied;
507 }
508}
509
512 const DebugLoc &DL, Register DstReg,
513 Register SrcReg, bool KillSrc,
514 bool RenamableDest, bool RenamableSrc) const {
515 const TargetRegisterInfo *TRI = STI.getRegisterInfo();
516 RegState KillFlag = getKillRegState(KillSrc);
517
518 if (RISCV::GPRRegClass.contains(DstReg, SrcReg)) {
519 BuildMI(MBB, MBBI, DL, get(RISCV::ADDI), DstReg)
520 .addReg(SrcReg, KillFlag | getRenamableRegState(RenamableSrc))
521 .addImm(0);
522 return;
523 }
524
525 if (RISCV::GPRF16RegClass.contains(DstReg, SrcReg)) {
526 BuildMI(MBB, MBBI, DL, get(RISCV::PseudoMV_FPR16INX), DstReg)
527 .addReg(SrcReg, KillFlag | getRenamableRegState(RenamableSrc));
528 return;
529 }
530
531 if (RISCV::GPRF32RegClass.contains(DstReg, SrcReg)) {
532 BuildMI(MBB, MBBI, DL, get(RISCV::PseudoMV_FPR32INX), DstReg)
533 .addReg(SrcReg, KillFlag | getRenamableRegState(RenamableSrc));
534 return;
535 }
536
537 if (RISCV::GPRPairRegClass.contains(DstReg, SrcReg)) {
538 if (STI.isRV32()) {
539 if (STI.hasStdExtZdinx()) {
540 // On RV32_Zdinx, FMV.D will move a pair of registers to another pair of
541 // registers, in one instruction.
542 BuildMI(MBB, MBBI, DL, get(RISCV::FSGNJ_D_IN32X), DstReg)
543 .addReg(SrcReg, getRenamableRegState(RenamableSrc))
544 .addReg(SrcReg, KillFlag | getRenamableRegState(RenamableSrc));
545 return;
546 }
547
548 if (STI.hasStdExtP()) {
549 // On RV32P, `padd.dw` is a GPR Pair Add
550 BuildMI(MBB, MBBI, DL, get(RISCV::PADD_DW), DstReg)
551 .addReg(SrcReg, KillFlag | getRenamableRegState(RenamableSrc))
552 .addReg(RISCV::X0_Pair);
553 return;
554 }
555 }
556
557 MCRegister EvenReg = TRI->getSubReg(SrcReg, RISCV::sub_gpr_even);
558 MCRegister OddReg = TRI->getSubReg(SrcReg, RISCV::sub_gpr_odd);
559 // We need to correct the odd register of X0_Pair.
560 if (OddReg == RISCV::DUMMY_REG_PAIR_WITH_X0)
561 OddReg = RISCV::X0;
562 assert(DstReg != RISCV::X0_Pair && "Cannot write to X0_Pair");
563
564 // Emit an ADDI for both parts of GPRPair.
565 BuildMI(MBB, MBBI, DL, get(RISCV::ADDI),
566 TRI->getSubReg(DstReg, RISCV::sub_gpr_even))
567 .addReg(EvenReg, KillFlag)
568 .addImm(0);
569 BuildMI(MBB, MBBI, DL, get(RISCV::ADDI),
570 TRI->getSubReg(DstReg, RISCV::sub_gpr_odd))
571 .addReg(OddReg, KillFlag)
572 .addImm(0);
573 return;
574 }
575
576 // Handle copy from csr
577 if (RISCV::VCSRRegClass.contains(SrcReg) &&
578 RISCV::GPRRegClass.contains(DstReg)) {
579 BuildMI(MBB, MBBI, DL, get(RISCV::CSRRS), DstReg)
580 .addImm(RISCVSysReg::lookupSysRegByName(TRI->getName(SrcReg))->Encoding)
581 .addReg(RISCV::X0);
582 return;
583 }
584
585 if (RISCV::FPR16RegClass.contains(DstReg, SrcReg)) {
586 unsigned Opc;
587 if (STI.hasStdExtZfh()) {
588 Opc = RISCV::FSGNJ_H;
589 } else {
590 assert(STI.hasStdExtF() &&
591 (STI.hasStdExtZfhmin() || STI.hasStdExtZfbfmin()) &&
592 "Unexpected extensions");
593 // Zfhmin/Zfbfmin doesn't have FSGNJ_H, replace FSGNJ_H with FSGNJ_S.
594 DstReg = TRI->getMatchingSuperReg(DstReg, RISCV::sub_16,
595 &RISCV::FPR32RegClass);
596 SrcReg = TRI->getMatchingSuperReg(SrcReg, RISCV::sub_16,
597 &RISCV::FPR32RegClass);
598 Opc = RISCV::FSGNJ_S;
599 }
600 BuildMI(MBB, MBBI, DL, get(Opc), DstReg)
601 .addReg(SrcReg, KillFlag)
602 .addReg(SrcReg, KillFlag);
603 return;
604 }
605
606 if (RISCV::FPR32RegClass.contains(DstReg, SrcReg)) {
607 BuildMI(MBB, MBBI, DL, get(RISCV::FSGNJ_S), DstReg)
608 .addReg(SrcReg, KillFlag)
609 .addReg(SrcReg, KillFlag);
610 return;
611 }
612
613 if (RISCV::FPR64RegClass.contains(DstReg, SrcReg)) {
614 BuildMI(MBB, MBBI, DL, get(RISCV::FSGNJ_D), DstReg)
615 .addReg(SrcReg, KillFlag)
616 .addReg(SrcReg, KillFlag);
617 return;
618 }
619
620 if (RISCV::FPR32RegClass.contains(DstReg) &&
621 RISCV::GPRRegClass.contains(SrcReg)) {
622 BuildMI(MBB, MBBI, DL, get(RISCV::FMV_W_X), DstReg)
623 .addReg(SrcReg, KillFlag);
624 return;
625 }
626
627 if (RISCV::GPRRegClass.contains(DstReg) &&
628 RISCV::FPR32RegClass.contains(SrcReg)) {
629 BuildMI(MBB, MBBI, DL, get(RISCV::FMV_X_W), DstReg)
630 .addReg(SrcReg, KillFlag);
631 return;
632 }
633
634 if (RISCV::FPR64RegClass.contains(DstReg) &&
635 RISCV::GPRRegClass.contains(SrcReg)) {
636 assert(STI.getXLen() == 64 && "Unexpected GPR size");
637 BuildMI(MBB, MBBI, DL, get(RISCV::FMV_D_X), DstReg)
638 .addReg(SrcReg, KillFlag);
639 return;
640 }
641
642 if (RISCV::GPRRegClass.contains(DstReg) &&
643 RISCV::FPR64RegClass.contains(SrcReg)) {
644 assert(STI.getXLen() == 64 && "Unexpected GPR size");
645 BuildMI(MBB, MBBI, DL, get(RISCV::FMV_X_D), DstReg)
646 .addReg(SrcReg, KillFlag);
647 return;
648 }
649
650 // VR->VR copies.
651 const TargetRegisterClass *RegClass =
652 TRI->getCommonMinimalPhysRegClass(SrcReg, DstReg);
653 if (RISCVRegisterInfo::isRVVRegClass(RegClass)) {
654 copyPhysRegVector(MBB, MBBI, DL, DstReg, SrcReg, KillSrc, RegClass);
655 return;
656 }
657
658 llvm_unreachable("Impossible reg-to-reg copy");
659}
660
663 Register SrcReg, bool IsKill, int FI,
664 const TargetRegisterClass *RC,
665 Register VReg,
666 MachineInstr::MIFlag Flags) const {
667 MachineFunction *MF = MBB.getParent();
668 MachineFrameInfo &MFI = MF->getFrameInfo();
669 Align Alignment = MFI.getObjectAlign(FI);
670
671 unsigned Opcode;
672 if (RISCV::GPRRegClass.hasSubClassEq(RC)) {
673 Opcode = RegInfo.getRegSizeInBits(RISCV::GPRRegClass) == 32 ? RISCV::SW
674 : RISCV::SD;
675 } else if (RISCV::GPRF16RegClass.hasSubClassEq(RC)) {
676 Opcode = RISCV::SH_INX;
677 } else if (RISCV::GPRF32RegClass.hasSubClassEq(RC)) {
678 Opcode = RISCV::SW_INX;
679 } else if (RISCV::GPRPairRegClass.hasSubClassEq(RC)) {
680 if (!STI.is64Bit() && STI.hasStdExtZilsd() &&
681 Alignment >= STI.getZilsdAlign()) {
682 Opcode = RISCV::SD_RV32;
683 } else {
684 Opcode = RISCV::PseudoRV32ZdinxSD;
685 }
686 } else if (RISCV::FPR16RegClass.hasSubClassEq(RC)) {
687 Opcode = RISCV::FSH;
688 } else if (RISCV::FPR32RegClass.hasSubClassEq(RC)) {
689 Opcode = RISCV::FSW;
690 } else if (RISCV::FPR64RegClass.hasSubClassEq(RC)) {
691 Opcode = RISCV::FSD;
692 } else if (RISCV::VRRegClass.hasSubClassEq(RC)) {
693 Opcode = RISCV::VS1R_V;
694 } else if (RISCV::VRM2RegClass.hasSubClassEq(RC)) {
695 Opcode = RISCV::VS2R_V;
696 } else if (RISCV::VRM4RegClass.hasSubClassEq(RC)) {
697 Opcode = RISCV::VS4R_V;
698 } else if (RISCV::VRM8RegClass.hasSubClassEq(RC)) {
699 Opcode = RISCV::VS8R_V;
700 } else if (RISCV::VRN2M1RegClass.hasSubClassEq(RC))
701 Opcode = RISCV::PseudoVSPILL2_M1;
702 else if (RISCV::VRN2M2RegClass.hasSubClassEq(RC))
703 Opcode = RISCV::PseudoVSPILL2_M2;
704 else if (RISCV::VRN2M4RegClass.hasSubClassEq(RC))
705 Opcode = RISCV::PseudoVSPILL2_M4;
706 else if (RISCV::VRN3M1RegClass.hasSubClassEq(RC))
707 Opcode = RISCV::PseudoVSPILL3_M1;
708 else if (RISCV::VRN3M2RegClass.hasSubClassEq(RC))
709 Opcode = RISCV::PseudoVSPILL3_M2;
710 else if (RISCV::VRN4M1RegClass.hasSubClassEq(RC))
711 Opcode = RISCV::PseudoVSPILL4_M1;
712 else if (RISCV::VRN4M2RegClass.hasSubClassEq(RC))
713 Opcode = RISCV::PseudoVSPILL4_M2;
714 else if (RISCV::VRN5M1RegClass.hasSubClassEq(RC))
715 Opcode = RISCV::PseudoVSPILL5_M1;
716 else if (RISCV::VRN6M1RegClass.hasSubClassEq(RC))
717 Opcode = RISCV::PseudoVSPILL6_M1;
718 else if (RISCV::VRN7M1RegClass.hasSubClassEq(RC))
719 Opcode = RISCV::PseudoVSPILL7_M1;
720 else if (RISCV::VRN8M1RegClass.hasSubClassEq(RC))
721 Opcode = RISCV::PseudoVSPILL8_M1;
722 else
723 llvm_unreachable("Can't store this register to stack slot");
724
728 TypeSize::getScalable(MFI.getObjectSize(FI)), Alignment);
729
731 BuildMI(MBB, I, DebugLoc(), get(Opcode))
732 .addReg(SrcReg, getKillRegState(IsKill))
733 .addFrameIndex(FI)
734 .addMemOperand(MMO)
735 .setMIFlag(Flags);
736 NumVRegSpilled += RegInfo.getRegSizeInBits(*RC) / RISCV::RVVBitsPerBlock;
737 } else {
740 MFI.getObjectSize(FI), Alignment);
741
742 BuildMI(MBB, I, DebugLoc(), get(Opcode))
743 .addReg(SrcReg, getKillRegState(IsKill))
744 .addFrameIndex(FI)
745 .addImm(0)
746 .addMemOperand(MMO)
747 .setMIFlag(Flags);
748 }
749}
750
753 Register DstReg, int FI,
754 const TargetRegisterClass *RC,
755 Register VReg, unsigned SubReg,
756 MachineInstr::MIFlag Flags) const {
757 MachineFunction *MF = MBB.getParent();
758 MachineFrameInfo &MFI = MF->getFrameInfo();
759 Align Alignment = MFI.getObjectAlign(FI);
760 DebugLoc DL =
761 Flags & MachineInstr::FrameDestroy ? MBB.findDebugLoc(I) : DebugLoc();
762
763 unsigned Opcode;
764 if (RISCV::GPRRegClass.hasSubClassEq(RC)) {
765 Opcode = RegInfo.getRegSizeInBits(RISCV::GPRRegClass) == 32 ? RISCV::LW
766 : RISCV::LD;
767 } else if (RISCV::GPRF16RegClass.hasSubClassEq(RC)) {
768 Opcode = RISCV::LH_INX;
769 } else if (RISCV::GPRF32RegClass.hasSubClassEq(RC)) {
770 Opcode = RISCV::LW_INX;
771 } else if (RISCV::GPRPairRegClass.hasSubClassEq(RC)) {
772 if (!STI.is64Bit() && STI.hasStdExtZilsd() &&
773 Alignment >= STI.getZilsdAlign()) {
774 Opcode = RISCV::LD_RV32;
775 } else {
776 Opcode = RISCV::PseudoRV32ZdinxLD;
777 }
778 } else if (RISCV::FPR16RegClass.hasSubClassEq(RC)) {
779 Opcode = RISCV::FLH;
780 } else if (RISCV::FPR32RegClass.hasSubClassEq(RC)) {
781 Opcode = RISCV::FLW;
782 } else if (RISCV::FPR64RegClass.hasSubClassEq(RC)) {
783 Opcode = RISCV::FLD;
784 } else if (RISCV::VRRegClass.hasSubClassEq(RC)) {
785 Opcode = RISCV::VL1RE8_V;
786 } else if (RISCV::VRM2RegClass.hasSubClassEq(RC)) {
787 Opcode = RISCV::VL2RE8_V;
788 } else if (RISCV::VRM4RegClass.hasSubClassEq(RC)) {
789 Opcode = RISCV::VL4RE8_V;
790 } else if (RISCV::VRM8RegClass.hasSubClassEq(RC)) {
791 Opcode = RISCV::VL8RE8_V;
792 } else if (RISCV::VRN2M1RegClass.hasSubClassEq(RC))
793 Opcode = RISCV::PseudoVRELOAD2_M1;
794 else if (RISCV::VRN2M2RegClass.hasSubClassEq(RC))
795 Opcode = RISCV::PseudoVRELOAD2_M2;
796 else if (RISCV::VRN2M4RegClass.hasSubClassEq(RC))
797 Opcode = RISCV::PseudoVRELOAD2_M4;
798 else if (RISCV::VRN3M1RegClass.hasSubClassEq(RC))
799 Opcode = RISCV::PseudoVRELOAD3_M1;
800 else if (RISCV::VRN3M2RegClass.hasSubClassEq(RC))
801 Opcode = RISCV::PseudoVRELOAD3_M2;
802 else if (RISCV::VRN4M1RegClass.hasSubClassEq(RC))
803 Opcode = RISCV::PseudoVRELOAD4_M1;
804 else if (RISCV::VRN4M2RegClass.hasSubClassEq(RC))
805 Opcode = RISCV::PseudoVRELOAD4_M2;
806 else if (RISCV::VRN5M1RegClass.hasSubClassEq(RC))
807 Opcode = RISCV::PseudoVRELOAD5_M1;
808 else if (RISCV::VRN6M1RegClass.hasSubClassEq(RC))
809 Opcode = RISCV::PseudoVRELOAD6_M1;
810 else if (RISCV::VRN7M1RegClass.hasSubClassEq(RC))
811 Opcode = RISCV::PseudoVRELOAD7_M1;
812 else if (RISCV::VRN8M1RegClass.hasSubClassEq(RC))
813 Opcode = RISCV::PseudoVRELOAD8_M1;
814 else
815 llvm_unreachable("Can't load this register from stack slot");
816
820 TypeSize::getScalable(MFI.getObjectSize(FI)), Alignment);
821
823 BuildMI(MBB, I, DL, get(Opcode), DstReg)
824 .addFrameIndex(FI)
825 .addMemOperand(MMO)
826 .setMIFlag(Flags);
827 NumVRegReloaded += RegInfo.getRegSizeInBits(*RC) / RISCV::RVVBitsPerBlock;
828 } else {
831 MFI.getObjectSize(FI), Alignment);
832
833 BuildMI(MBB, I, DL, get(Opcode), DstReg)
834 .addFrameIndex(FI)
835 .addImm(0)
836 .addMemOperand(MMO)
837 .setMIFlag(Flags);
838 }
839}
840std::optional<unsigned> getFoldedOpcode(MachineFunction &MF, MachineInstr &MI,
842 const RISCVSubtarget &ST) {
843
844 // The below optimizations narrow the load so they are only valid for little
845 // endian.
846 // TODO: Support big endian by adding an offset into the frame object?
847 if (MF.getDataLayout().isBigEndian())
848 return std::nullopt;
849
850 // Fold load from stack followed by sext.b/sext.h/sext.w/zext.b/zext.h/zext.w.
851 if (Ops.size() != 1 || Ops[0] != 1)
852 return std::nullopt;
853
854 switch (MI.getOpcode()) {
855 default:
856 if (RISCVInstrInfo::isSEXT_W(MI))
857 return RISCV::LW;
858 if (RISCVInstrInfo::isZEXT_W(MI))
859 return RISCV::LWU;
860 if (RISCVInstrInfo::isZEXT_B(MI))
861 return RISCV::LBU;
862 break;
863 case RISCV::SEXT_H:
864 return RISCV::LH;
865 case RISCV::SEXT_B:
866 return RISCV::LB;
867 case RISCV::ZEXT_H_RV32:
868 case RISCV::ZEXT_H_RV64:
869 return RISCV::LHU;
870 }
871
872 switch (RISCV::getRVVMCOpcode(MI.getOpcode())) {
873 default:
874 return std::nullopt;
875 case RISCV::VMV_X_S: {
876 unsigned Log2SEW =
877 MI.getOperand(RISCVII::getSEWOpNum(MI.getDesc())).getImm();
878 if (ST.getXLen() < (1U << Log2SEW))
879 return std::nullopt;
880 switch (Log2SEW) {
881 case 3:
882 return RISCV::LB;
883 case 4:
884 return RISCV::LH;
885 case 5:
886 return RISCV::LW;
887 case 6:
888 return RISCV::LD;
889 default:
890 llvm_unreachable("Unexpected SEW");
891 }
892 }
893 case RISCV::VFMV_F_S: {
894 unsigned Log2SEW =
895 MI.getOperand(RISCVII::getSEWOpNum(MI.getDesc())).getImm();
896 switch (Log2SEW) {
897 case 4:
898 return RISCV::FLH;
899 case 5:
900 return RISCV::FLW;
901 case 6:
902 return RISCV::FLD;
903 default:
904 llvm_unreachable("Unexpected SEW");
905 }
906 }
907 }
908}
909
910// This is the version used during InlineSpiller::spillAroundUses
913 ArrayRef<unsigned> Ops, int FrameIndex,
914 MachineInstr *&CopyMI, LiveIntervals *LIS,
915 VirtRegMap *VRM) const {
917 std::optional<unsigned> LoadOpc = getFoldedOpcode(MF, MI, Ops, STI);
918 if (!LoadOpc)
919 return nullptr;
920 Register DstReg = MI.getOperand(0).getReg();
921 return BuildMI(*MI.getParent(), InsertPt, MI.getDebugLoc(), get(*LoadOpc),
922 DstReg)
923 .addFrameIndex(FrameIndex)
924 .addImm(0);
925}
926
927static unsigned getLoadPredicatedOpcode(unsigned Opcode) {
928 switch (Opcode) {
929 case RISCV::LB:
930 return RISCV::PseudoCCLB;
931 case RISCV::LBU:
932 return RISCV::PseudoCCLBU;
933 case RISCV::LH:
934 return RISCV::PseudoCCLH;
935 case RISCV::LHU:
936 return RISCV::PseudoCCLHU;
937 case RISCV::LW:
938 return RISCV::PseudoCCLW;
939 case RISCV::LWU:
940 return RISCV::PseudoCCLWU;
941 case RISCV::LD:
942 return RISCV::PseudoCCLD;
943 case RISCV::QC_E_LB:
944 return RISCV::PseudoCCQC_E_LB;
945 case RISCV::QC_E_LBU:
946 return RISCV::PseudoCCQC_E_LBU;
947 case RISCV::QC_E_LH:
948 return RISCV::PseudoCCQC_E_LH;
949 case RISCV::QC_E_LHU:
950 return RISCV::PseudoCCQC_E_LHU;
951 case RISCV::QC_E_LW:
952 return RISCV::PseudoCCQC_E_LW;
953 default:
954 return 0;
955 }
956}
957
960 MachineInstr &LoadMI, MachineInstr *&CopyMI, LiveIntervals *LIS,
961 VirtRegMap *VRM) const {
963 // For now, only handle RISCV::PseudoCCMOVGPR.
964 if (MI.getOpcode() != RISCV::PseudoCCMOVGPR)
965 return nullptr;
966
967 unsigned PredOpc = getLoadPredicatedOpcode(LoadMI.getOpcode());
968
969 if (!STI.hasShortForwardBranchILoad() || !PredOpc)
970 return nullptr;
971
973 if (Ops.size() != 1 || (Ops[0] != 1 && Ops[0] != 2))
974 return nullptr;
975
976 bool Invert = Ops[0] == 2;
977 const MachineOperand &FalseReg = MI.getOperand(!Invert ? 2 : 1);
978 Register DestReg = MI.getOperand(0).getReg();
979 const TargetRegisterClass *PreviousClass = MRI.getRegClass(FalseReg.getReg());
980 if (!MRI.constrainRegClass(DestReg, PreviousClass))
981 return nullptr;
982
983 // Create a new predicated version of DefMI.
984 MachineInstrBuilder NewMI = BuildMI(*MI.getParent(), InsertPt,
985 MI.getDebugLoc(), get(PredOpc), DestReg);
986
987 // Copy the false register.
988 NewMI.add(FalseReg);
989
990 // Copy all the DefMI operands.
991 const MCInstrDesc &DefDesc = LoadMI.getDesc();
992 for (unsigned i = 1, e = DefDesc.getNumOperands(); i != e; ++i)
993 NewMI.add(LoadMI.getOperand(i));
994
995 // Add branch opcode, inverting if necessary.
996 unsigned BCC = MI.getOperand(MI.getNumExplicitOperands() - 3).getImm();
997 if (!Invert)
999 NewMI.addImm(BCC);
1000
1001 // Copy condition portion
1002 NewMI.add({MI.getOperand(MI.getNumExplicitOperands() - 2),
1003 MI.getOperand(MI.getNumExplicitOperands() - 1)});
1004 NewMI.cloneMemRefs(LoadMI);
1005 return NewMI;
1006}
1007
1010 const DebugLoc &DL, Register DstReg, uint64_t Val,
1011 MachineInstr::MIFlag Flag, bool DstRenamable,
1012 bool DstIsDead) const {
1013 Register SrcReg = RISCV::X0;
1014
1015 // For RV32, allow a sign or unsigned 32 bit value.
1016 if (!STI.is64Bit() && !isInt<32>(Val)) {
1017 // If have a uimm32 it will still fit in a register so we can allow it.
1018 if (!isUInt<32>(Val))
1019 report_fatal_error("Should only materialize 32-bit constants for RV32");
1020
1021 // Sign extend for generateInstSeq.
1022 Val = SignExtend64<32>(Val);
1023 }
1024
1026 assert(!Seq.empty());
1027
1028 bool SrcRenamable = false;
1029 unsigned Num = 0;
1030
1031 for (const RISCVMatInt::Inst &Inst : Seq) {
1032 bool LastItem = ++Num == Seq.size();
1033 RegState DstRegState = getDeadRegState(DstIsDead && LastItem) |
1034 getRenamableRegState(DstRenamable);
1035 RegState SrcRegState = getKillRegState(SrcReg != RISCV::X0) |
1036 getRenamableRegState(SrcRenamable);
1037 switch (Inst.getOpndKind()) {
1038 case RISCVMatInt::Imm:
1039 BuildMI(MBB, MBBI, DL, get(Inst.getOpcode()))
1040 .addReg(DstReg, RegState::Define | DstRegState)
1041 .addImm(Inst.getImm())
1042 .setMIFlag(Flag);
1043 break;
1044 case RISCVMatInt::RegX0:
1045 BuildMI(MBB, MBBI, DL, get(Inst.getOpcode()))
1046 .addReg(DstReg, RegState::Define | DstRegState)
1047 .addReg(SrcReg, SrcRegState)
1048 .addReg(RISCV::X0)
1049 .setMIFlag(Flag);
1050 break;
1052 BuildMI(MBB, MBBI, DL, get(Inst.getOpcode()))
1053 .addReg(DstReg, RegState::Define | DstRegState)
1054 .addReg(SrcReg, SrcRegState)
1055 .addReg(SrcReg, SrcRegState)
1056 .setMIFlag(Flag);
1057 break;
1059 BuildMI(MBB, MBBI, DL, get(Inst.getOpcode()))
1060 .addReg(DstReg, RegState::Define | DstRegState)
1061 .addReg(SrcReg, SrcRegState)
1062 .addImm(Inst.getImm())
1063 .setMIFlag(Flag);
1064 break;
1065 }
1066
1067 // Only the first instruction has X0 as its source.
1068 SrcReg = DstReg;
1069 SrcRenamable = DstRenamable;
1070 }
1071}
1072
1074 switch (Opc) {
1075 default:
1076 return RISCVCC::COND_INVALID;
1077 case RISCV::BEQ:
1078 case RISCV::BEQI:
1079 case RISCV::CV_BEQIMM:
1080 case RISCV::QC_BEQI:
1081 case RISCV::QC_E_BEQI:
1082 case RISCV::NDS_BBC:
1083 case RISCV::NDS_BEQC:
1084 return RISCVCC::COND_EQ;
1085 case RISCV::BNE:
1086 case RISCV::BNEI:
1087 case RISCV::QC_BNEI:
1088 case RISCV::QC_E_BNEI:
1089 case RISCV::CV_BNEIMM:
1090 case RISCV::NDS_BBS:
1091 case RISCV::NDS_BNEC:
1092 return RISCVCC::COND_NE;
1093 case RISCV::BLT:
1094 case RISCV::QC_BLTI:
1095 case RISCV::QC_E_BLTI:
1096 return RISCVCC::COND_LT;
1097 case RISCV::BGE:
1098 case RISCV::QC_BGEI:
1099 case RISCV::QC_E_BGEI:
1100 return RISCVCC::COND_GE;
1101 case RISCV::BLTU:
1102 case RISCV::QC_BLTUI:
1103 case RISCV::QC_E_BLTUI:
1104 return RISCVCC::COND_LTU;
1105 case RISCV::BGEU:
1106 case RISCV::QC_BGEUI:
1107 case RISCV::QC_E_BGEUI:
1108 return RISCVCC::COND_GEU;
1109 }
1110}
1111
1113 int64_t C1) {
1114 switch (CC) {
1115 default:
1116 llvm_unreachable("Unexpected CC");
1117 case RISCVCC::COND_EQ:
1118 return C0 == C1;
1119 case RISCVCC::COND_NE:
1120 return C0 != C1;
1121 case RISCVCC::COND_LT:
1122 return C0 < C1;
1123 case RISCVCC::COND_GE:
1124 return C0 >= C1;
1125 case RISCVCC::COND_LTU:
1126 return (uint64_t)C0 < (uint64_t)C1;
1127 case RISCVCC::COND_GEU:
1128 return (uint64_t)C0 >= (uint64_t)C1;
1129 }
1130}
1131
1132// The contents of values added to Cond are not examined outside of
1133// RISCVInstrInfo, giving us flexibility in what to push to it. For RISCV, we
1134// push BranchOpcode, Reg1, Reg2.
1137 // Block ends with fall-through condbranch.
1138 assert(LastInst.getDesc().isConditionalBranch() &&
1139 "Unknown conditional branch");
1140 Target = LastInst.getOperand(2).getMBB();
1141 Cond.push_back(MachineOperand::CreateImm(LastInst.getOpcode()));
1142 Cond.push_back(LastInst.getOperand(0));
1143 Cond.push_back(LastInst.getOperand(1));
1144}
1145
1146static unsigned getInverseXqcicmOpcode(unsigned Opcode) {
1147 switch (Opcode) {
1148 default:
1149 llvm_unreachable("Unexpected Opcode");
1150 case RISCV::QC_MVEQ:
1151 return RISCV::QC_MVNE;
1152 case RISCV::QC_MVNE:
1153 return RISCV::QC_MVEQ;
1154 case RISCV::QC_MVLT:
1155 return RISCV::QC_MVGE;
1156 case RISCV::QC_MVGE:
1157 return RISCV::QC_MVLT;
1158 case RISCV::QC_MVLTU:
1159 return RISCV::QC_MVGEU;
1160 case RISCV::QC_MVGEU:
1161 return RISCV::QC_MVLTU;
1162 case RISCV::QC_MVEQI:
1163 return RISCV::QC_MVNEI;
1164 case RISCV::QC_MVNEI:
1165 return RISCV::QC_MVEQI;
1166 case RISCV::QC_MVLTI:
1167 return RISCV::QC_MVGEI;
1168 case RISCV::QC_MVGEI:
1169 return RISCV::QC_MVLTI;
1170 case RISCV::QC_MVLTUI:
1171 return RISCV::QC_MVGEUI;
1172 case RISCV::QC_MVGEUI:
1173 return RISCV::QC_MVLTUI;
1174 }
1175}
1176
1177unsigned RISCVCC::getBrCond(RISCVCC::CondCode CC, unsigned SelectOpc) {
1178 switch (SelectOpc) {
1179 default:
1180 switch (CC) {
1181 default:
1182 llvm_unreachable("Unexpected condition code!");
1183 case RISCVCC::COND_EQ:
1184 return RISCV::BEQ;
1185 case RISCVCC::COND_NE:
1186 return RISCV::BNE;
1187 case RISCVCC::COND_LT:
1188 return RISCV::BLT;
1189 case RISCVCC::COND_GE:
1190 return RISCV::BGE;
1191 case RISCVCC::COND_LTU:
1192 return RISCV::BLTU;
1193 case RISCVCC::COND_GEU:
1194 return RISCV::BGEU;
1195 }
1196 break;
1197 case RISCV::Select_GPR_Using_CC_Imm5_Zibi:
1198 switch (CC) {
1199 default:
1200 llvm_unreachable("Unexpected condition code!");
1201 case RISCVCC::COND_EQ:
1202 return RISCV::BEQI;
1203 case RISCVCC::COND_NE:
1204 return RISCV::BNEI;
1205 }
1206 break;
1207 case RISCV::Select_GPR_Using_CC_SImm5_CV:
1208 switch (CC) {
1209 default:
1210 llvm_unreachable("Unexpected condition code!");
1211 case RISCVCC::COND_EQ:
1212 return RISCV::CV_BEQIMM;
1213 case RISCVCC::COND_NE:
1214 return RISCV::CV_BNEIMM;
1215 }
1216 break;
1217 case RISCV::Select_GPRNoX0_Using_CC_SImm5NonZero_QC:
1218 switch (CC) {
1219 default:
1220 llvm_unreachable("Unexpected condition code!");
1221 case RISCVCC::COND_EQ:
1222 return RISCV::QC_BEQI;
1223 case RISCVCC::COND_NE:
1224 return RISCV::QC_BNEI;
1225 case RISCVCC::COND_LT:
1226 return RISCV::QC_BLTI;
1227 case RISCVCC::COND_GE:
1228 return RISCV::QC_BGEI;
1229 }
1230 break;
1231 case RISCV::Select_GPRNoX0_Using_CC_UImm5NonZero_QC:
1232 switch (CC) {
1233 default:
1234 llvm_unreachable("Unexpected condition code!");
1235 case RISCVCC::COND_LTU:
1236 return RISCV::QC_BLTUI;
1237 case RISCVCC::COND_GEU:
1238 return RISCV::QC_BGEUI;
1239 }
1240 break;
1241 case RISCV::Select_GPRNoX0_Using_CC_SImm16NonZero_QC:
1242 switch (CC) {
1243 default:
1244 llvm_unreachable("Unexpected condition code!");
1245 case RISCVCC::COND_EQ:
1246 return RISCV::QC_E_BEQI;
1247 case RISCVCC::COND_NE:
1248 return RISCV::QC_E_BNEI;
1249 case RISCVCC::COND_LT:
1250 return RISCV::QC_E_BLTI;
1251 case RISCVCC::COND_GE:
1252 return RISCV::QC_E_BGEI;
1253 }
1254 break;
1255 case RISCV::Select_GPRNoX0_Using_CC_UImm16NonZero_QC:
1256 switch (CC) {
1257 default:
1258 llvm_unreachable("Unexpected condition code!");
1259 case RISCVCC::COND_LTU:
1260 return RISCV::QC_E_BLTUI;
1261 case RISCVCC::COND_GEU:
1262 return RISCV::QC_E_BGEUI;
1263 }
1264 break;
1265 case RISCV::Select_GPR_Using_CC_UImmLog2XLen_NDS:
1266 switch (CC) {
1267 default:
1268 llvm_unreachable("Unexpected condition code!");
1269 case RISCVCC::COND_EQ:
1270 return RISCV::NDS_BBC;
1271 case RISCVCC::COND_NE:
1272 return RISCV::NDS_BBS;
1273 }
1274 break;
1275 case RISCV::Select_GPR_Using_CC_UImm7_NDS:
1276 switch (CC) {
1277 default:
1278 llvm_unreachable("Unexpected condition code!");
1279 case RISCVCC::COND_EQ:
1280 return RISCV::NDS_BEQC;
1281 case RISCVCC::COND_NE:
1282 return RISCV::NDS_BNEC;
1283 }
1284 break;
1285 }
1286}
1287
1289 switch (CC) {
1290 default:
1291 llvm_unreachable("Unrecognized conditional branch");
1292 case RISCVCC::COND_EQ:
1293 return RISCVCC::COND_NE;
1294 case RISCVCC::COND_NE:
1295 return RISCVCC::COND_EQ;
1296 case RISCVCC::COND_LT:
1297 return RISCVCC::COND_GE;
1298 case RISCVCC::COND_GE:
1299 return RISCVCC::COND_LT;
1300 case RISCVCC::COND_LTU:
1301 return RISCVCC::COND_GEU;
1302 case RISCVCC::COND_GEU:
1303 return RISCVCC::COND_LTU;
1304 }
1305}
1306
1307// Return inverse branch
1308unsigned RISCVCC::getInverseBranchOpcode(unsigned BCC) {
1309 switch (BCC) {
1310 default:
1311 llvm_unreachable("Unexpected branch opcode!");
1312 case RISCV::BEQ:
1313 return RISCV::BNE;
1314 case RISCV::BEQI:
1315 return RISCV::BNEI;
1316 case RISCV::BNE:
1317 return RISCV::BEQ;
1318 case RISCV::BNEI:
1319 return RISCV::BEQI;
1320 case RISCV::BLT:
1321 return RISCV::BGE;
1322 case RISCV::BGE:
1323 return RISCV::BLT;
1324 case RISCV::BLTU:
1325 return RISCV::BGEU;
1326 case RISCV::BGEU:
1327 return RISCV::BLTU;
1328 case RISCV::CV_BEQIMM:
1329 return RISCV::CV_BNEIMM;
1330 case RISCV::CV_BNEIMM:
1331 return RISCV::CV_BEQIMM;
1332 case RISCV::QC_BEQI:
1333 return RISCV::QC_BNEI;
1334 case RISCV::QC_BNEI:
1335 return RISCV::QC_BEQI;
1336 case RISCV::QC_BLTI:
1337 return RISCV::QC_BGEI;
1338 case RISCV::QC_BGEI:
1339 return RISCV::QC_BLTI;
1340 case RISCV::QC_BLTUI:
1341 return RISCV::QC_BGEUI;
1342 case RISCV::QC_BGEUI:
1343 return RISCV::QC_BLTUI;
1344 case RISCV::QC_E_BEQI:
1345 return RISCV::QC_E_BNEI;
1346 case RISCV::QC_E_BNEI:
1347 return RISCV::QC_E_BEQI;
1348 case RISCV::QC_E_BLTI:
1349 return RISCV::QC_E_BGEI;
1350 case RISCV::QC_E_BGEI:
1351 return RISCV::QC_E_BLTI;
1352 case RISCV::QC_E_BLTUI:
1353 return RISCV::QC_E_BGEUI;
1354 case RISCV::QC_E_BGEUI:
1355 return RISCV::QC_E_BLTUI;
1356 case RISCV::NDS_BBC:
1357 return RISCV::NDS_BBS;
1358 case RISCV::NDS_BBS:
1359 return RISCV::NDS_BBC;
1360 case RISCV::NDS_BEQC:
1361 return RISCV::NDS_BNEC;
1362 case RISCV::NDS_BNEC:
1363 return RISCV::NDS_BEQC;
1364 }
1365}
1366
1369 MachineBasicBlock *&FBB,
1371 bool AllowModify) const {
1372 TBB = FBB = nullptr;
1373 Cond.clear();
1374
1375 // If the block has no terminators, it just falls into the block after it.
1376 MachineBasicBlock::iterator I = MBB.getLastNonDebugInstr();
1377 if (I == MBB.end() || !isUnpredicatedTerminator(*I))
1378 return false;
1379
1380 // Count the number of terminators and find the first unconditional or
1381 // indirect branch.
1382 MachineBasicBlock::iterator FirstUncondOrIndirectBr = MBB.end();
1383 int NumTerminators = 0;
1384 for (auto J = I.getReverse(); J != MBB.rend() && isUnpredicatedTerminator(*J);
1385 J++) {
1386 NumTerminators++;
1387 if (J->getDesc().isUnconditionalBranch() ||
1388 J->getDesc().isIndirectBranch()) {
1389 FirstUncondOrIndirectBr = J.getReverse();
1390 }
1391 }
1392
1393 // If AllowModify is true, we can erase any terminators after
1394 // FirstUncondOrIndirectBR.
1395 if (AllowModify && FirstUncondOrIndirectBr != MBB.end()) {
1396 while (std::next(FirstUncondOrIndirectBr) != MBB.end()) {
1397 std::next(FirstUncondOrIndirectBr)->eraseFromParent();
1398 NumTerminators--;
1399 }
1400 I = FirstUncondOrIndirectBr;
1401 }
1402
1403 // We can't handle blocks that end in an indirect branch.
1404 if (I->getDesc().isIndirectBranch())
1405 return true;
1406
1407 // We can't handle Generic branch opcodes from Global ISel.
1408 if (I->isPreISelOpcode())
1409 return true;
1410
1411 // We can't handle blocks with more than 2 terminators.
1412 if (NumTerminators > 2)
1413 return true;
1414
1415 // Handle a single unconditional branch.
1416 if (NumTerminators == 1 && I->getDesc().isUnconditionalBranch()) {
1418 return false;
1419 }
1420
1421 // Handle a single conditional branch.
1422 if (NumTerminators == 1 && I->getDesc().isConditionalBranch()) {
1424 return false;
1425 }
1426
1427 // Handle a conditional branch followed by an unconditional branch.
1428 if (NumTerminators == 2 && std::prev(I)->getDesc().isConditionalBranch() &&
1429 I->getDesc().isUnconditionalBranch()) {
1430 parseCondBranch(*std::prev(I), TBB, Cond);
1431 FBB = getBranchDestBlock(*I);
1432 return false;
1433 }
1434
1435 // Otherwise, we can't handle this.
1436 return true;
1437}
1438
1440 int *BytesRemoved) const {
1441 if (BytesRemoved)
1442 *BytesRemoved = 0;
1443 MachineBasicBlock::iterator I = MBB.getLastNonDebugInstr();
1444 if (I == MBB.end())
1445 return 0;
1446
1447 if (!I->getDesc().isUnconditionalBranch() &&
1448 !I->getDesc().isConditionalBranch())
1449 return 0;
1450
1451 // Remove the branch.
1452 if (BytesRemoved)
1453 *BytesRemoved += getInstSizeInBytes(*I);
1454 I->eraseFromParent();
1455
1456 I = MBB.end();
1457
1458 if (I == MBB.begin())
1459 return 1;
1460 --I;
1461 if (!I->getDesc().isConditionalBranch())
1462 return 1;
1463
1464 // Remove the branch.
1465 if (BytesRemoved)
1466 *BytesRemoved += getInstSizeInBytes(*I);
1467 I->eraseFromParent();
1468 return 2;
1469}
1470
1471// Inserts a branch into the end of the specific MachineBasicBlock, returning
1472// the number of instructions inserted.
1475 ArrayRef<MachineOperand> Cond, const DebugLoc &DL, int *BytesAdded) const {
1476 if (BytesAdded)
1477 *BytesAdded = 0;
1478
1479 // Shouldn't be a fall through.
1480 assert(TBB && "insertBranch must not be told to insert a fallthrough");
1481 assert((Cond.size() == 3 || Cond.size() == 0) &&
1482 "RISC-V branch conditions have two components!");
1483
1484 // Unconditional branch.
1485 if (Cond.empty()) {
1486 MachineInstr &MI = *BuildMI(&MBB, DL, get(RISCV::PseudoBR)).addMBB(TBB);
1487 if (BytesAdded)
1488 *BytesAdded += getInstSizeInBytes(MI);
1489 return 1;
1490 }
1491
1492 // Either a one or two-way conditional branch.
1493 MachineInstr &CondMI = *BuildMI(&MBB, DL, get(Cond[0].getImm()))
1494 .add(Cond[1])
1495 .add(Cond[2])
1496 .addMBB(TBB);
1497 if (BytesAdded)
1498 *BytesAdded += getInstSizeInBytes(CondMI);
1499
1500 // One-way conditional branch.
1501 if (!FBB)
1502 return 1;
1503
1504 // Two-way conditional branch.
1505 MachineInstr &MI = *BuildMI(&MBB, DL, get(RISCV::PseudoBR)).addMBB(FBB);
1506 if (BytesAdded)
1507 *BytesAdded += getInstSizeInBytes(MI);
1508 return 2;
1509}
1510
1512 MachineBasicBlock &DestBB,
1513 MachineBasicBlock &RestoreBB,
1514 const DebugLoc &DL, int64_t BrOffset,
1515 RegScavenger *RS) const {
1516 assert(RS && "RegScavenger required for long branching");
1517 assert(MBB.empty() &&
1518 "new block should be inserted for expanding unconditional branch");
1519 assert(MBB.pred_size() == 1);
1520 assert(RestoreBB.empty() &&
1521 "restore block should be inserted for restoring clobbered registers");
1522
1523 MachineFunction *MF = MBB.getParent();
1524 MachineRegisterInfo &MRI = MF->getRegInfo();
1527
1528 if (!isInt<32>(BrOffset))
1530 "Branch offsets outside of the signed 32-bit range not supported");
1531
1532 // FIXME: A virtual register must be used initially, as the register
1533 // scavenger won't work with empty blocks (SIInstrInfo::insertIndirectBranch
1534 // uses the same workaround).
1535 Register ScratchReg = MRI.createVirtualRegister(&RISCV::GPRJALRRegClass);
1536 auto II = MBB.end();
1537 // We may also update the jump target to RestoreBB later.
1538 MachineInstr &MI = *BuildMI(MBB, II, DL, get(RISCV::PseudoJump))
1539 .addReg(ScratchReg, RegState::Define | RegState::Dead)
1540 .addMBB(&DestBB, RISCVII::MO_CALL);
1541
1542 RS->enterBasicBlockEnd(MBB);
1543 // When cf-protection-branch is enabled, we must use t2 (x7) for software
1544 // guarded branches to hold the landing pad label.
1545 bool HasCFBranch =
1546 MF->getInfo<RISCVMachineFunctionInfo>()->hasCFProtectionBranch();
1547 const TargetRegisterClass *RC = &RISCV::GPRRegClass;
1548 if (HasCFBranch)
1549 RC = &RISCV::GPRX7RegClass;
1550 Register TmpGPR =
1551 RS->scavengeRegisterBackwards(*RC, MI.getIterator(),
1552 /*RestoreAfter=*/false, /*SpAdj=*/0,
1553 /*AllowSpill=*/false);
1554 if (TmpGPR.isValid())
1555 RS->setRegUsed(TmpGPR);
1556 else {
1557 // The case when there is no scavenged register needs special handling.
1558
1559 // Pick s11(or s1 for rve) because it doesn't make a difference.
1560 TmpGPR = STI.hasStdExtE() ? RISCV::X9 : RISCV::X27;
1561 // Force t2 if cf-protection-branch is enabled
1562 if (HasCFBranch)
1563 TmpGPR = RISCV::X7;
1564
1565 int FrameIndex = RVFI->getBranchRelaxationScratchFrameIndex();
1566 if (FrameIndex == -1)
1567 report_fatal_error("underestimated function size");
1568
1569 storeRegToStackSlot(MBB, MI, TmpGPR, /*IsKill=*/true, FrameIndex,
1570 &RISCV::GPRRegClass, Register());
1571 TRI->eliminateFrameIndex(std::prev(MI.getIterator()),
1572 /*SpAdj=*/0, /*FIOperandNum=*/1);
1573
1574 MI.getOperand(1).setMBB(&RestoreBB);
1575
1576 loadRegFromStackSlot(RestoreBB, RestoreBB.end(), TmpGPR, FrameIndex,
1577 &RISCV::GPRRegClass, Register());
1578 TRI->eliminateFrameIndex(RestoreBB.back(),
1579 /*SpAdj=*/0, /*FIOperandNum=*/1);
1580 }
1581
1582 MRI.replaceRegWith(ScratchReg, TmpGPR);
1583 MRI.clearVirtRegs();
1584}
1585
1588 assert((Cond.size() == 3) && "Invalid branch condition!");
1589
1591
1592 return false;
1593}
1594
1595// Return true if the instruction is a load immediate instruction (i.e.
1596// (ADDI x0, imm) or (BSETI x0, imm)).
1597static bool isLoadImm(const MachineInstr *MI, int64_t &Imm) {
1598 if (MI->getOpcode() == RISCV::ADDI && MI->getOperand(1).isReg() &&
1599 MI->getOperand(1).getReg() == RISCV::X0) {
1600 Imm = MI->getOperand(2).getImm();
1601 return true;
1602 }
1603 // BSETI can be used to create power of 2 constants. Only 2048 is currently
1604 // interesting because it is 1 more than the maximum ADDI constant.
1605 if (MI->getOpcode() == RISCV::BSETI && MI->getOperand(1).isReg() &&
1606 MI->getOperand(1).getReg() == RISCV::X0 &&
1607 MI->getOperand(2).getImm() == 11) {
1608 Imm = 2048;
1609 return true;
1610 }
1611 return false;
1612}
1613
1615 const MachineOperand &Op, int64_t &Imm) {
1616 // Either a load from immediate instruction or X0.
1617 if (!Op.isReg())
1618 return false;
1619
1620 Register Reg = Op.getReg();
1621 if (Reg == RISCV::X0) {
1622 Imm = 0;
1623 return true;
1624 }
1625 return Reg.isVirtual() && isLoadImm(MRI.getVRegDef(Reg), Imm);
1626}
1627
1629 bool IsSigned = false;
1630 bool IsEquality = false;
1631 switch (MI.getOpcode()) {
1632 default:
1633 return false;
1634 case RISCV::BEQ:
1635 case RISCV::BNE:
1636 IsEquality = true;
1637 break;
1638 case RISCV::BGE:
1639 case RISCV::BLT:
1640 IsSigned = true;
1641 break;
1642 case RISCV::BGEU:
1643 case RISCV::BLTU:
1644 break;
1645 }
1646
1647 MachineBasicBlock *MBB = MI.getParent();
1648 MachineRegisterInfo &MRI = MBB->getParent()->getRegInfo();
1649
1650 const MachineOperand &LHS = MI.getOperand(0);
1651 const MachineOperand &RHS = MI.getOperand(1);
1652 MachineBasicBlock *TBB = MI.getOperand(2).getMBB();
1653
1654 RISCVCC::CondCode CC = getCondFromBranchOpc(MI.getOpcode());
1656
1657 // Canonicalize conditional branches which can be constant folded into
1658 // beqz or bnez. We can't modify the CFG here.
1659 int64_t C0, C1;
1660 if (isFromLoadImm(MRI, LHS, C0) && isFromLoadImm(MRI, RHS, C1)) {
1661 unsigned NewOpc = evaluateCondBranch(CC, C0, C1) ? RISCV::BEQ : RISCV::BNE;
1662 // Build the new branch and remove the old one.
1663 BuildMI(*MBB, MI, MI.getDebugLoc(), get(NewOpc))
1664 .addReg(RISCV::X0)
1665 .addReg(RISCV::X0)
1666 .addMBB(TBB);
1667 MI.eraseFromParent();
1668 return true;
1669 }
1670
1671 if (IsEquality)
1672 return false;
1673
1674 // For two constants C0 and C1 from
1675 // ```
1676 // li Y, C0
1677 // li Z, C1
1678 // ```
1679 // 1. if C1 = C0 + 1
1680 // we can turn:
1681 // (a) blt Y, X -> bge X, Z
1682 // (b) bge Y, X -> blt X, Z
1683 //
1684 // 2. if C1 = C0 - 1
1685 // we can turn:
1686 // (a) blt X, Y -> bge Z, X
1687 // (b) bge X, Y -> blt Z, X
1688 //
1689 // To make sure this optimization is really beneficial, we only
1690 // optimize for cases where Y had only one use (i.e. only used by the branch).
1691 // Try to find the register for constant Z; return
1692 // invalid register otherwise.
1693 auto searchConst = [&](int64_t C1) -> Register {
1695 auto DefC1 = std::find_if(++II, E, [&](const MachineInstr &I) -> bool {
1696 int64_t Imm;
1697 return isLoadImm(&I, Imm) && Imm == C1 &&
1698 I.getOperand(0).getReg().isVirtual();
1699 });
1700 if (DefC1 != E)
1701 return DefC1->getOperand(0).getReg();
1702
1703 return Register();
1704 };
1705
1706 unsigned NewOpc = RISCVCC::getBrCond(getInverseBranchCondition(CC));
1707
1708 // Might be case 1.
1709 // Don't change 0 to 1 since we can use x0.
1710 // For unsigned cases changing -1U to 0 would be incorrect.
1711 // The incorrect case for signed would be INT_MAX, but isFromLoadImm can't
1712 // return that.
1713 if (isFromLoadImm(MRI, LHS, C0) && C0 != 0 && LHS.getReg().isVirtual() &&
1714 MRI.hasOneUse(LHS.getReg()) && (IsSigned || C0 != -1)) {
1715 assert((isInt<12>(C0) || C0 == 2048) && "Unexpected immediate");
1716 if (Register RegZ = searchConst(C0 + 1)) {
1717 BuildMI(*MBB, MI, MI.getDebugLoc(), get(NewOpc))
1718 .add(RHS)
1719 .addReg(RegZ)
1720 .addMBB(TBB);
1721 // We might extend the live range of Z, clear its kill flag to
1722 // account for this.
1723 MRI.clearKillFlags(RegZ);
1724 MI.eraseFromParent();
1725 return true;
1726 }
1727 }
1728
1729 // Might be case 2.
1730 // For signed cases we don't want to change 0 since we can use x0.
1731 // For unsigned cases changing 0 to -1U would be incorrect.
1732 // The incorrect case for signed would be INT_MIN, but isFromLoadImm can't
1733 // return that.
1734 if (isFromLoadImm(MRI, RHS, C0) && C0 != 0 && RHS.getReg().isVirtual() &&
1735 MRI.hasOneUse(RHS.getReg())) {
1736 assert((isInt<12>(C0) || C0 == 2048) && "Unexpected immediate");
1737 if (Register RegZ = searchConst(C0 - 1)) {
1738 BuildMI(*MBB, MI, MI.getDebugLoc(), get(NewOpc))
1739 .addReg(RegZ)
1740 .add(LHS)
1741 .addMBB(TBB);
1742 // We might extend the live range of Z, clear its kill flag to
1743 // account for this.
1744 MRI.clearKillFlags(RegZ);
1745 MI.eraseFromParent();
1746 return true;
1747 }
1748 }
1749
1750 return false;
1751}
1752
1755 assert(MI.getDesc().isBranch() && "Unexpected opcode!");
1756 // The branch target is always the last operand.
1757 int NumOp = MI.getNumExplicitOperands();
1758 return MI.getOperand(NumOp - 1).getMBB();
1759}
1760
1762 int64_t BrOffset) const {
1763 unsigned XLen = STI.getXLen();
1764 // Ideally we could determine the supported branch offset from the
1765 // RISCVII::FormMask, but this can't be used for Pseudo instructions like
1766 // PseudoBR.
1767 switch (BranchOp) {
1768 default:
1769 llvm_unreachable("Unexpected opcode!");
1770 case RISCV::NDS_BBC:
1771 case RISCV::NDS_BBS:
1772 case RISCV::NDS_BEQC:
1773 case RISCV::NDS_BNEC:
1774 return isInt<11>(BrOffset);
1775 case RISCV::BEQ:
1776 case RISCV::BNE:
1777 case RISCV::BLT:
1778 case RISCV::BGE:
1779 case RISCV::BLTU:
1780 case RISCV::BGEU:
1781 case RISCV::BEQI:
1782 case RISCV::BNEI:
1783 case RISCV::CV_BEQIMM:
1784 case RISCV::CV_BNEIMM:
1785 case RISCV::QC_BEQI:
1786 case RISCV::QC_BNEI:
1787 case RISCV::QC_BGEI:
1788 case RISCV::QC_BLTI:
1789 case RISCV::QC_BLTUI:
1790 case RISCV::QC_BGEUI:
1791 case RISCV::QC_E_BEQI:
1792 case RISCV::QC_E_BNEI:
1793 case RISCV::QC_E_BGEI:
1794 case RISCV::QC_E_BLTI:
1795 case RISCV::QC_E_BLTUI:
1796 case RISCV::QC_E_BGEUI:
1797 return isInt<13>(BrOffset);
1798 case RISCV::JAL:
1799 case RISCV::PseudoBR:
1800 return isInt<21>(BrOffset);
1801 case RISCV::PseudoJump:
1802 return isInt<32>(SignExtend64(BrOffset + 0x800, XLen));
1803 }
1804}
1805
1806// If the operation has a predicated pseudo instruction, return the pseudo
1807// instruction opcode. Otherwise, return RISCV::INSTRUCTION_LIST_END.
1808// TODO: Support more operations.
1809unsigned getPredicatedOpcode(unsigned Opcode) {
1810 // clang-format off
1811 switch (Opcode) {
1812 case RISCV::ADD: return RISCV::PseudoCCADD;
1813 case RISCV::SUB: return RISCV::PseudoCCSUB;
1814 case RISCV::SLL: return RISCV::PseudoCCSLL;
1815 case RISCV::SRL: return RISCV::PseudoCCSRL;
1816 case RISCV::SRA: return RISCV::PseudoCCSRA;
1817 case RISCV::AND: return RISCV::PseudoCCAND;
1818 case RISCV::OR: return RISCV::PseudoCCOR;
1819 case RISCV::XOR: return RISCV::PseudoCCXOR;
1820 case RISCV::MAX: return RISCV::PseudoCCMAX;
1821 case RISCV::MAXU: return RISCV::PseudoCCMAXU;
1822 case RISCV::MIN: return RISCV::PseudoCCMIN;
1823 case RISCV::MINU: return RISCV::PseudoCCMINU;
1824 case RISCV::MUL: return RISCV::PseudoCCMUL;
1825 case RISCV::LUI: return RISCV::PseudoCCLUI;
1826 case RISCV::QC_LI: return RISCV::PseudoCCQC_LI;
1827 case RISCV::QC_E_LI: return RISCV::PseudoCCQC_E_LI;
1828
1829 case RISCV::ADDI: return RISCV::PseudoCCADDI;
1830 case RISCV::SLLI: return RISCV::PseudoCCSLLI;
1831 case RISCV::SRLI: return RISCV::PseudoCCSRLI;
1832 case RISCV::SRAI: return RISCV::PseudoCCSRAI;
1833 case RISCV::ANDI: return RISCV::PseudoCCANDI;
1834 case RISCV::ORI: return RISCV::PseudoCCORI;
1835 case RISCV::XORI: return RISCV::PseudoCCXORI;
1836
1837 case RISCV::ADDW: return RISCV::PseudoCCADDW;
1838 case RISCV::SUBW: return RISCV::PseudoCCSUBW;
1839 case RISCV::SLLW: return RISCV::PseudoCCSLLW;
1840 case RISCV::SRLW: return RISCV::PseudoCCSRLW;
1841 case RISCV::SRAW: return RISCV::PseudoCCSRAW;
1842
1843 case RISCV::ADDIW: return RISCV::PseudoCCADDIW;
1844 case RISCV::SLLIW: return RISCV::PseudoCCSLLIW;
1845 case RISCV::SRLIW: return RISCV::PseudoCCSRLIW;
1846 case RISCV::SRAIW: return RISCV::PseudoCCSRAIW;
1847
1848 case RISCV::ANDN: return RISCV::PseudoCCANDN;
1849 case RISCV::ORN: return RISCV::PseudoCCORN;
1850 case RISCV::XNOR: return RISCV::PseudoCCXNOR;
1851
1852 case RISCV::NDS_BFOS: return RISCV::PseudoCCNDS_BFOS;
1853 case RISCV::NDS_BFOZ: return RISCV::PseudoCCNDS_BFOZ;
1854 }
1855 // clang-format on
1856
1857 return RISCV::INSTRUCTION_LIST_END;
1858}
1859
1860/// Identify instructions that can be folded into a CCMOV instruction, and
1861/// return the defining instruction.
1863 const MachineRegisterInfo &MRI,
1864 const TargetInstrInfo *TII,
1865 const RISCVSubtarget &STI) {
1866 if (!Reg.isVirtual())
1867 return nullptr;
1868 if (!MRI.hasOneNonDBGUse(Reg))
1869 return nullptr;
1870 MachineInstr *MI = MRI.getVRegDef(Reg);
1871 if (!MI)
1872 return nullptr;
1873
1874 if (!STI.hasShortForwardBranchIMinMax() &&
1875 (MI->getOpcode() == RISCV::MAX || MI->getOpcode() == RISCV::MIN ||
1876 MI->getOpcode() == RISCV::MINU || MI->getOpcode() == RISCV::MAXU))
1877 return nullptr;
1878
1879 if (!STI.hasShortForwardBranchIMul() && MI->getOpcode() == RISCV::MUL)
1880 return nullptr;
1881
1882 // Check if MI can be predicated and folded into the CCMOV.
1883 if (getPredicatedOpcode(MI->getOpcode()) == RISCV::INSTRUCTION_LIST_END)
1884 return nullptr;
1885 // Don't predicate li idiom.
1886 if (MI->getOpcode() == RISCV::ADDI && MI->getOperand(1).isReg() &&
1887 MI->getOperand(1).getReg() == RISCV::X0)
1888 return nullptr;
1889 // Check if MI has any other defs or physreg uses.
1890 for (const MachineOperand &MO : llvm::drop_begin(MI->operands())) {
1891 // Reject frame index operands, PEI can't handle the predicated pseudos.
1892 if (MO.isFI() || MO.isCPI() || MO.isJTI())
1893 return nullptr;
1894 if (!MO.isReg())
1895 continue;
1896 // MI can't have any tied operands, that would conflict with predication.
1897 if (MO.isTied())
1898 return nullptr;
1899 if (MO.isDef())
1900 return nullptr;
1901 // Allow constant physregs.
1902 if (MO.getReg().isPhysical() && !MRI.isConstantPhysReg(MO.getReg()))
1903 return nullptr;
1904 }
1905 bool DontMoveAcrossStores = true;
1906 if (!MI->isSafeToMove(DontMoveAcrossStores))
1907 return nullptr;
1908 return MI;
1909}
1910
1914 bool PreferFalse) const {
1915 assert(MI.getOpcode() == RISCV::PseudoCCMOVGPR &&
1916 "Unknown select instruction");
1917 if (!STI.hasShortForwardBranchIALU())
1918 return nullptr;
1919
1920 MachineRegisterInfo &MRI = MI.getParent()->getParent()->getRegInfo();
1922 canFoldAsPredicatedOp(MI.getOperand(2).getReg(), MRI, this, STI);
1923 bool Invert = !DefMI;
1924 if (!DefMI)
1925 DefMI = canFoldAsPredicatedOp(MI.getOperand(1).getReg(), MRI, this, STI);
1926 if (!DefMI)
1927 return nullptr;
1928
1929 // Find new register class to use.
1930 MachineOperand FalseReg = MI.getOperand(Invert ? 2 : 1);
1931 Register DestReg = MI.getOperand(0).getReg();
1932 const TargetRegisterClass *PreviousClass = MRI.getRegClass(FalseReg.getReg());
1933 if (!MRI.constrainRegClass(DestReg, PreviousClass))
1934 return nullptr;
1935
1936 unsigned PredOpc = getPredicatedOpcode(DefMI->getOpcode());
1937 assert(PredOpc != RISCV::INSTRUCTION_LIST_END && "Unexpected opcode!");
1938
1939 // Create a new predicated version of DefMI.
1940 MachineInstrBuilder NewMI =
1941 BuildMI(*MI.getParent(), MI, MI.getDebugLoc(), get(PredOpc), DestReg);
1942
1943 // Copy the false register.
1944 NewMI.add(FalseReg);
1945
1946 // Copy all the DefMI operands.
1947 const MCInstrDesc &DefDesc = DefMI->getDesc();
1948 for (unsigned i = 1, e = DefDesc.getNumOperands(); i != e; ++i)
1949 NewMI.add(DefMI->getOperand(i));
1950
1951 // Add branch opcode, inverting if necessary.
1952 unsigned BCCOpcode = MI.getOperand(MI.getNumExplicitOperands() - 3).getImm();
1953 if (Invert)
1954 BCCOpcode = RISCVCC::getInverseBranchOpcode(BCCOpcode);
1955 NewMI.addImm(BCCOpcode);
1956
1957 // Copy the condition portion.
1958 NewMI.add(MI.getOperand(MI.getNumExplicitOperands() - 2));
1959 NewMI.add(MI.getOperand(MI.getNumExplicitOperands() - 1));
1960
1961 // Update SeenMIs set: register newly created MI and erase removed DefMI.
1962 SeenMIs.insert(NewMI);
1963 SeenMIs.erase(DefMI);
1964
1965 // If MI is inside a loop, and DefMI is outside the loop, then kill flags on
1966 // DefMI would be invalid when transferred inside the loop. Checking for a
1967 // loop is expensive, but at least remove kill flags if they are in different
1968 // BBs.
1969 if (DefMI->getParent() != MI.getParent())
1970 NewMI->clearKillInfo();
1971
1972 // The caller will erase MI, but not DefMI.
1973 DefMI->eraseFromParent();
1974 return NewMI;
1975}
1976
1978 if (MI.isMetaInstruction())
1979 return 0;
1980
1981 unsigned Opcode = MI.getOpcode();
1982
1983 if (Opcode == TargetOpcode::INLINEASM ||
1984 Opcode == TargetOpcode::INLINEASM_BR) {
1985 const MachineFunction &MF = *MI.getParent()->getParent();
1986 return getInlineAsmLength(MI.getOperand(0).getSymbolName(),
1987 MF.getTarget().getMCAsmInfo());
1988 }
1989
1990 if (requiresNTLHint(MI)) {
1991 if (STI.hasStdExtZca()) {
1992 if (isCompressibleInst(MI, STI))
1993 return 4; // c.ntl.all + c.load/c.store
1994 return 6; // c.ntl.all + load/store
1995 }
1996 return 8; // ntl.all + load/store
1997 }
1998
1999 if (Opcode == TargetOpcode::BUNDLE)
2000 return getInstBundleSize(MI);
2001
2002 if (MI.getParent() && MI.getParent()->getParent()) {
2003 if (isCompressibleInst(MI, STI))
2004 return 2;
2005 }
2006
2007 switch (Opcode) {
2008 case RISCV::PseudoMV_FPR16INX:
2009 case RISCV::PseudoMV_FPR32INX:
2010 case RISCV::PseudoClearGPR:
2011 // MV is always compressible to either c.mv or c.li rd, 0.
2012 return STI.hasStdExtZca() ? 2 : 4;
2013 // Below cases are for short forward branch pseudos
2014 case RISCV::PseudoCCMOVGPRNoX0:
2015 return get(MI.getOperand(MI.getNumExplicitOperands() - 3).getImm())
2016 .getSize() +
2017 2;
2018 case RISCV::PseudoCCMOVGPR:
2019 case RISCV::PseudoCCADD:
2020 case RISCV::PseudoCCSUB:
2021 case RISCV::PseudoCCSLL:
2022 case RISCV::PseudoCCSRL:
2023 case RISCV::PseudoCCSRA:
2024 case RISCV::PseudoCCAND:
2025 case RISCV::PseudoCCOR:
2026 case RISCV::PseudoCCXOR:
2027 case RISCV::PseudoCCADDI:
2028 case RISCV::PseudoCCANDI:
2029 case RISCV::PseudoCCORI:
2030 case RISCV::PseudoCCXORI:
2031 case RISCV::PseudoCCLUI:
2032 case RISCV::PseudoCCSLLI:
2033 case RISCV::PseudoCCSRLI:
2034 case RISCV::PseudoCCSRAI:
2035 case RISCV::PseudoCCADDW:
2036 case RISCV::PseudoCCSUBW:
2037 case RISCV::PseudoCCSLLW:
2038 case RISCV::PseudoCCSRLW:
2039 case RISCV::PseudoCCSRAW:
2040 case RISCV::PseudoCCADDIW:
2041 case RISCV::PseudoCCSLLIW:
2042 case RISCV::PseudoCCSRLIW:
2043 case RISCV::PseudoCCSRAIW:
2044 case RISCV::PseudoCCANDN:
2045 case RISCV::PseudoCCORN:
2046 case RISCV::PseudoCCXNOR:
2047 case RISCV::PseudoCCMAX:
2048 case RISCV::PseudoCCMIN:
2049 case RISCV::PseudoCCMAXU:
2050 case RISCV::PseudoCCMINU:
2051 case RISCV::PseudoCCMUL:
2052 case RISCV::PseudoCCLB:
2053 case RISCV::PseudoCCLH:
2054 case RISCV::PseudoCCLW:
2055 case RISCV::PseudoCCLHU:
2056 case RISCV::PseudoCCLBU:
2057 case RISCV::PseudoCCLWU:
2058 case RISCV::PseudoCCLD:
2059 case RISCV::PseudoCCQC_LI:
2060 return get(MI.getOperand(MI.getNumExplicitOperands() - 3).getImm())
2061 .getSize() +
2062 4;
2063 case RISCV::PseudoCCQC_E_LI:
2064 case RISCV::PseudoCCQC_E_LB:
2065 case RISCV::PseudoCCQC_E_LH:
2066 case RISCV::PseudoCCQC_E_LW:
2067 case RISCV::PseudoCCQC_E_LHU:
2068 case RISCV::PseudoCCQC_E_LBU:
2069 return get(MI.getOperand(MI.getNumExplicitOperands() - 3).getImm())
2070 .getSize() +
2071 6;
2072 case TargetOpcode::STACKMAP:
2073 // The upper bound for a stackmap intrinsic is the full length of its shadow
2075 case TargetOpcode::PATCHPOINT:
2076 // The size of the patchpoint intrinsic is the number of bytes requested
2078 case TargetOpcode::STATEPOINT: {
2079 // The size of the statepoint intrinsic is the number of bytes requested
2080 unsigned NumBytes = StatepointOpers(&MI).getNumPatchBytes();
2081 // No patch bytes means at most a PseudoCall is emitted
2082 return std::max(NumBytes, 8U);
2083 }
2084 case TargetOpcode::PATCHABLE_FUNCTION_ENTER:
2085 case TargetOpcode::PATCHABLE_FUNCTION_EXIT:
2086 case TargetOpcode::PATCHABLE_TAIL_CALL: {
2087 const MachineFunction &MF = *MI.getParent()->getParent();
2088 const Function &F = MF.getFunction();
2089 if (Opcode == TargetOpcode::PATCHABLE_FUNCTION_ENTER &&
2090 F.hasFnAttribute("patchable-function-entry")) {
2091 unsigned Num =
2092 F.getFnAttributeAsParsedInteger("patchable-function-entry");
2093 // Number of C.NOP or NOP
2094 return (STI.hasStdExtZca() ? 2 : 4) * Num;
2095 }
2096 // XRay uses C.JAL + 21 or 33 C.NOP for each sled in RV32 and RV64,
2097 // respectively.
2098 return STI.is64Bit() ? 68 : 44;
2099 }
2100 default:
2101 return get(Opcode).getSize();
2102 }
2103}
2104
2106 const unsigned Opcode = MI.getOpcode();
2107 switch (Opcode) {
2108 default:
2109 break;
2110 case RISCV::FSGNJ_D:
2111 case RISCV::FSGNJ_S:
2112 case RISCV::FSGNJ_H:
2113 case RISCV::FSGNJ_D_INX:
2114 case RISCV::FSGNJ_D_IN32X:
2115 case RISCV::FSGNJ_S_INX:
2116 case RISCV::FSGNJ_H_INX:
2117 // The canonical floating-point move is fsgnj rd, rs, rs.
2118 return MI.getOperand(1).isReg() && MI.getOperand(2).isReg() &&
2119 MI.getOperand(1).getReg() == MI.getOperand(2).getReg();
2120 case RISCV::ADDI:
2121 case RISCV::ORI:
2122 case RISCV::XORI:
2123 return (MI.getOperand(1).isReg() &&
2124 MI.getOperand(1).getReg() == RISCV::X0) ||
2125 (MI.getOperand(2).isImm() && MI.getOperand(2).getImm() == 0);
2126 }
2127 return MI.isAsCheapAsAMove();
2128}
2129
2130std::optional<DestSourcePair>
2132 if (MI.isMoveReg())
2133 return DestSourcePair{MI.getOperand(0), MI.getOperand(1)};
2134 switch (MI.getOpcode()) {
2135 default:
2136 break;
2137 case RISCV::ADD:
2138 case RISCV::OR:
2139 case RISCV::XOR:
2140 if (MI.getOperand(1).isReg() && MI.getOperand(1).getReg() == RISCV::X0 &&
2141 MI.getOperand(2).isReg())
2142 return DestSourcePair{MI.getOperand(0), MI.getOperand(2)};
2143 if (MI.getOperand(2).isReg() && MI.getOperand(2).getReg() == RISCV::X0 &&
2144 MI.getOperand(1).isReg())
2145 return DestSourcePair{MI.getOperand(0), MI.getOperand(1)};
2146 break;
2147 case RISCV::ADDI:
2148 // Operand 1 can be a frameindex but callers expect registers
2149 if (MI.getOperand(1).isReg() && MI.getOperand(2).isImm() &&
2150 MI.getOperand(2).getImm() == 0)
2151 return DestSourcePair{MI.getOperand(0), MI.getOperand(1)};
2152 break;
2153 case RISCV::SUB:
2154 if (MI.getOperand(2).isReg() && MI.getOperand(2).getReg() == RISCV::X0 &&
2155 MI.getOperand(1).isReg())
2156 return DestSourcePair{MI.getOperand(0), MI.getOperand(1)};
2157 break;
2158 case RISCV::SH1ADD:
2159 case RISCV::SH1ADD_UW:
2160 case RISCV::SH2ADD:
2161 case RISCV::SH2ADD_UW:
2162 case RISCV::SH3ADD:
2163 case RISCV::SH3ADD_UW:
2164 if (MI.getOperand(1).isReg() && MI.getOperand(1).getReg() == RISCV::X0 &&
2165 MI.getOperand(2).isReg())
2166 return DestSourcePair{MI.getOperand(0), MI.getOperand(2)};
2167 break;
2168 case RISCV::FSGNJ_D:
2169 case RISCV::FSGNJ_S:
2170 case RISCV::FSGNJ_H:
2171 case RISCV::FSGNJ_D_INX:
2172 case RISCV::FSGNJ_D_IN32X:
2173 case RISCV::FSGNJ_S_INX:
2174 case RISCV::FSGNJ_H_INX:
2175 // The canonical floating-point move is fsgnj rd, rs, rs.
2176 if (MI.getOperand(1).isReg() && MI.getOperand(2).isReg() &&
2177 MI.getOperand(1).getReg() == MI.getOperand(2).getReg())
2178 return DestSourcePair{MI.getOperand(0), MI.getOperand(1)};
2179 break;
2180 }
2181 return std::nullopt;
2182}
2183
2185 if (ForceMachineCombinerStrategy.getNumOccurrences() == 0) {
2186 // The option is unused. Choose Local strategy only for in-order cores. When
2187 // scheduling model is unspecified, use MinInstrCount strategy as more
2188 // generic one.
2189 const auto &SchedModel = STI.getSchedModel();
2190 return (!SchedModel.hasInstrSchedModel() || SchedModel.isOutOfOrder())
2193 }
2194 // The strategy was forced by the option.
2196}
2197
2199 MachineInstr &Root, unsigned &Pattern,
2200 SmallVectorImpl<MachineInstr *> &InsInstrs) const {
2201 int16_t FrmOpIdx =
2202 RISCV::getNamedOperandIdx(Root.getOpcode(), RISCV::OpName::frm);
2203 if (FrmOpIdx < 0) {
2204 assert(all_of(InsInstrs,
2205 [](MachineInstr *MI) {
2206 return RISCV::getNamedOperandIdx(MI->getOpcode(),
2207 RISCV::OpName::frm) < 0;
2208 }) &&
2209 "New instructions require FRM whereas the old one does not have it");
2210 return;
2211 }
2212
2213 const MachineOperand &FRM = Root.getOperand(FrmOpIdx);
2214 MachineFunction &MF = *Root.getMF();
2215
2216 for (auto *NewMI : InsInstrs) {
2217 // We'd already added the FRM operand.
2218 if (static_cast<unsigned>(RISCV::getNamedOperandIdx(
2219 NewMI->getOpcode(), RISCV::OpName::frm)) != NewMI->getNumOperands())
2220 continue;
2221 MachineInstrBuilder MIB(MF, NewMI);
2222 MIB.add(FRM);
2223 if (FRM.getImm() == RISCVFPRndMode::DYN)
2224 MIB.addUse(RISCV::FRM, RegState::Implicit);
2225 }
2226}
2227
2228static bool isFADD(unsigned Opc) {
2229 switch (Opc) {
2230 default:
2231 return false;
2232 case RISCV::FADD_H:
2233 case RISCV::FADD_S:
2234 case RISCV::FADD_D:
2235 return true;
2236 }
2237}
2238
2239static bool isFSUB(unsigned Opc) {
2240 switch (Opc) {
2241 default:
2242 return false;
2243 case RISCV::FSUB_H:
2244 case RISCV::FSUB_S:
2245 case RISCV::FSUB_D:
2246 return true;
2247 }
2248}
2249
2250static bool isFMUL(unsigned Opc) {
2251 switch (Opc) {
2252 default:
2253 return false;
2254 case RISCV::FMUL_H:
2255 case RISCV::FMUL_S:
2256 case RISCV::FMUL_D:
2257 return true;
2258 }
2259}
2260
2261bool RISCVInstrInfo::isVectorAssociativeAndCommutative(const MachineInstr &Inst,
2262 bool Invert) const {
2263#define OPCODE_LMUL_CASE(OPC) \
2264 case RISCV::OPC##_M1: \
2265 case RISCV::OPC##_M2: \
2266 case RISCV::OPC##_M4: \
2267 case RISCV::OPC##_M8: \
2268 case RISCV::OPC##_MF2: \
2269 case RISCV::OPC##_MF4: \
2270 case RISCV::OPC##_MF8
2271
2272#define OPCODE_LMUL_MASK_CASE(OPC) \
2273 case RISCV::OPC##_M1_MASK: \
2274 case RISCV::OPC##_M2_MASK: \
2275 case RISCV::OPC##_M4_MASK: \
2276 case RISCV::OPC##_M8_MASK: \
2277 case RISCV::OPC##_MF2_MASK: \
2278 case RISCV::OPC##_MF4_MASK: \
2279 case RISCV::OPC##_MF8_MASK
2280
2281 unsigned Opcode = Inst.getOpcode();
2282 if (Invert) {
2283 if (auto InvOpcode = getInverseOpcode(Opcode))
2284 Opcode = *InvOpcode;
2285 else
2286 return false;
2287 }
2288
2289 // clang-format off
2290 switch (Opcode) {
2291 default:
2292 return false;
2293 OPCODE_LMUL_CASE(PseudoVADD_VV):
2294 OPCODE_LMUL_MASK_CASE(PseudoVADD_VV):
2295 OPCODE_LMUL_CASE(PseudoVMUL_VV):
2296 OPCODE_LMUL_MASK_CASE(PseudoVMUL_VV):
2297 return true;
2298 }
2299 // clang-format on
2300
2301#undef OPCODE_LMUL_MASK_CASE
2302#undef OPCODE_LMUL_CASE
2303}
2304
2305bool RISCVInstrInfo::areRVVInstsReassociable(const MachineInstr &Root,
2306 const MachineInstr &Prev) const {
2307 if (!areOpcodesEqualOrInverse(Root.getOpcode(), Prev.getOpcode()))
2308 return false;
2309
2310 assert(Root.getMF() == Prev.getMF());
2311 const MachineRegisterInfo *MRI = &Root.getMF()->getRegInfo();
2312 const TargetRegisterInfo *TRI = MRI->getTargetRegisterInfo();
2313
2314 // Make sure vtype operands are also the same.
2315 const MCInstrDesc &Desc = get(Root.getOpcode());
2316 const uint64_t TSFlags = Desc.TSFlags;
2317
2318 auto checkImmOperand = [&](unsigned OpIdx) {
2319 return Root.getOperand(OpIdx).getImm() == Prev.getOperand(OpIdx).getImm();
2320 };
2321
2322 auto checkRegOperand = [&](unsigned OpIdx) {
2323 return Root.getOperand(OpIdx).getReg() == Prev.getOperand(OpIdx).getReg();
2324 };
2325
2326 // PassThru
2327 // TODO: Potentially we can loosen the condition to consider Root to be
2328 // associable with Prev if Root has NoReg as passthru. In which case we
2329 // also need to loosen the condition on vector policies between these.
2330 if (!checkRegOperand(1))
2331 return false;
2332
2333 // SEW
2334 if (RISCVII::hasSEWOp(TSFlags) &&
2335 !checkImmOperand(RISCVII::getSEWOpNum(Desc)))
2336 return false;
2337
2338 // Mask
2339 if (RISCVII::usesMaskPolicy(TSFlags)) {
2340 const MachineBasicBlock *MBB = Root.getParent();
2343 Register MI1VReg;
2344
2345 bool SeenMI2 = false;
2346 for (auto End = MBB->rend(), It = It1; It != End; ++It) {
2347 if (It == It2) {
2348 SeenMI2 = true;
2349 if (!MI1VReg.isValid())
2350 // There is no V0 def between Root and Prev; they're sharing the
2351 // same V0.
2352 break;
2353 }
2354
2355 if (It->modifiesRegister(RISCV::V0, TRI)) {
2356 Register SrcReg = It->getOperand(1).getReg();
2357 // If it's not VReg it'll be more difficult to track its defs, so
2358 // bailing out here just to be safe.
2359 if (!SrcReg.isVirtual())
2360 return false;
2361
2362 if (!MI1VReg.isValid()) {
2363 // This is the V0 def for Root.
2364 MI1VReg = SrcReg;
2365 continue;
2366 }
2367
2368 // Some random mask updates.
2369 if (!SeenMI2)
2370 continue;
2371
2372 // This is the V0 def for Prev; check if it's the same as that of
2373 // Root.
2374 if (MI1VReg != SrcReg)
2375 return false;
2376 else
2377 break;
2378 }
2379 }
2380
2381 // If we haven't encountered Prev, it's likely that this function was
2382 // called in a wrong way (e.g. Root is before Prev).
2383 assert(SeenMI2 && "Prev is expected to appear before Root");
2384 }
2385
2386 // Tail / Mask policies
2387 if (RISCVII::hasVecPolicyOp(TSFlags) &&
2388 !checkImmOperand(RISCVII::getVecPolicyOpNum(Desc)))
2389 return false;
2390
2391 // VL
2392 if (RISCVII::hasVLOp(TSFlags)) {
2393 unsigned OpIdx = RISCVII::getVLOpNum(Desc);
2394 const MachineOperand &Op1 = Root.getOperand(OpIdx);
2395 const MachineOperand &Op2 = Prev.getOperand(OpIdx);
2396 if (Op1.getType() != Op2.getType())
2397 return false;
2398 switch (Op1.getType()) {
2400 if (Op1.getReg() != Op2.getReg())
2401 return false;
2402 break;
2404 if (Op1.getImm() != Op2.getImm())
2405 return false;
2406 break;
2407 default:
2408 llvm_unreachable("Unrecognized VL operand type");
2409 }
2410 }
2411
2412 // Rounding modes
2413 if (int Idx = RISCVII::getFRMOpNum(Desc); Idx >= 0 && !checkImmOperand(Idx))
2414 return false;
2415 if (int Idx = RISCVII::getVXRMOpNum(Desc); Idx >= 0 && !checkImmOperand(Idx))
2416 return false;
2417
2418 return true;
2419}
2420
2421// Most of our RVV pseudos have passthru operand, so the real operands
2422// start from index = 2.
2423bool RISCVInstrInfo::hasReassociableVectorSibling(const MachineInstr &Inst,
2424 bool &Commuted) const {
2425 const MachineBasicBlock *MBB = Inst.getParent();
2426 const MachineRegisterInfo &MRI = MBB->getParent()->getRegInfo();
2428 "Expect the present of passthrough operand.");
2429 MachineInstr *MI1 = MRI.getUniqueVRegDef(Inst.getOperand(2).getReg());
2430 MachineInstr *MI2 = MRI.getUniqueVRegDef(Inst.getOperand(3).getReg());
2431
2432 // If only one operand has the same or inverse opcode and it's the second
2433 // source operand, the operands must be commuted.
2434 Commuted = !areRVVInstsReassociable(Inst, *MI1) &&
2435 areRVVInstsReassociable(Inst, *MI2);
2436 if (Commuted)
2437 std::swap(MI1, MI2);
2438
2439 return areRVVInstsReassociable(Inst, *MI1) &&
2440 (isVectorAssociativeAndCommutative(*MI1) ||
2441 isVectorAssociativeAndCommutative(*MI1, /* Invert */ true)) &&
2443 MRI.hasOneNonDBGUse(MI1->getOperand(0).getReg());
2444}
2445
2447 const MachineInstr &Inst, const MachineBasicBlock *MBB) const {
2448 if (!isVectorAssociativeAndCommutative(Inst) &&
2449 !isVectorAssociativeAndCommutative(Inst, /*Invert=*/true))
2451
2452 const MachineOperand &Op1 = Inst.getOperand(2);
2453 const MachineOperand &Op2 = Inst.getOperand(3);
2454 const MachineRegisterInfo &MRI = MBB->getParent()->getRegInfo();
2455
2456 // We need virtual register definitions for the operands that we will
2457 // reassociate.
2458 MachineInstr *MI1 = nullptr;
2459 MachineInstr *MI2 = nullptr;
2460 if (Op1.isReg() && Op1.getReg().isVirtual())
2461 MI1 = MRI.getUniqueVRegDef(Op1.getReg());
2462 if (Op2.isReg() && Op2.getReg().isVirtual())
2463 MI2 = MRI.getUniqueVRegDef(Op2.getReg());
2464
2465 // And at least one operand must be defined in MBB.
2466 return MI1 && MI2 && (MI1->getParent() == MBB || MI2->getParent() == MBB);
2467}
2468
2470 const MachineInstr &Root, unsigned Pattern,
2471 std::array<unsigned, 5> &OperandIndices) const {
2473 if (RISCV::getRVVMCOpcode(Root.getOpcode())) {
2474 // Skip the passthrough operand, so increment all indices by one.
2475 for (unsigned I = 0; I < 5; ++I)
2476 ++OperandIndices[I];
2477 }
2478}
2479
2481 bool &Commuted) const {
2482 if (isVectorAssociativeAndCommutative(Inst) ||
2483 isVectorAssociativeAndCommutative(Inst, /*Invert=*/true))
2484 return hasReassociableVectorSibling(Inst, Commuted);
2485
2486 if (!TargetInstrInfo::hasReassociableSibling(Inst, Commuted))
2487 return false;
2488
2489 const MachineRegisterInfo &MRI = Inst.getMF()->getRegInfo();
2490 unsigned OperandIdx = Commuted ? 2 : 1;
2491 const MachineInstr &Sibling =
2492 *MRI.getVRegDef(Inst.getOperand(OperandIdx).getReg());
2493
2494 int16_t InstFrmOpIdx =
2495 RISCV::getNamedOperandIdx(Inst.getOpcode(), RISCV::OpName::frm);
2496 int16_t SiblingFrmOpIdx =
2497 RISCV::getNamedOperandIdx(Sibling.getOpcode(), RISCV::OpName::frm);
2498
2499 return (InstFrmOpIdx < 0 && SiblingFrmOpIdx < 0) ||
2500 RISCV::hasEqualFRM(Inst, Sibling);
2501}
2502
2504 bool Invert) const {
2505 if (isVectorAssociativeAndCommutative(Inst, Invert))
2506 return true;
2507
2508 unsigned Opc = Inst.getOpcode();
2509 if (Invert) {
2510 auto InverseOpcode = getInverseOpcode(Opc);
2511 if (!InverseOpcode)
2512 return false;
2513 Opc = *InverseOpcode;
2514 }
2515
2516 if (isFADD(Opc) || isFMUL(Opc))
2519
2520 switch (Opc) {
2521 default:
2522 return false;
2523 case RISCV::ADD:
2524 case RISCV::ADDW:
2525 case RISCV::AND:
2526 case RISCV::OR:
2527 case RISCV::XOR:
2528 // From RISC-V ISA spec, if both the high and low bits of the same product
2529 // are required, then the recommended code sequence is:
2530 //
2531 // MULH[[S]U] rdh, rs1, rs2
2532 // MUL rdl, rs1, rs2
2533 // (source register specifiers must be in same order and rdh cannot be the
2534 // same as rs1 or rs2)
2535 //
2536 // Microarchitectures can then fuse these into a single multiply operation
2537 // instead of performing two separate multiplies.
2538 // MachineCombiner may reassociate MUL operands and lose the fusion
2539 // opportunity.
2540 case RISCV::MUL:
2541 case RISCV::MULW:
2542 case RISCV::MIN:
2543 case RISCV::MINU:
2544 case RISCV::MAX:
2545 case RISCV::MAXU:
2546 case RISCV::FMIN_H:
2547 case RISCV::FMIN_S:
2548 case RISCV::FMIN_D:
2549 case RISCV::FMAX_H:
2550 case RISCV::FMAX_S:
2551 case RISCV::FMAX_D:
2552 return true;
2553 }
2554
2555 return false;
2556}
2557
2558std::optional<unsigned>
2559RISCVInstrInfo::getInverseOpcode(unsigned Opcode) const {
2560#define RVV_OPC_LMUL_CASE(OPC, INV) \
2561 case RISCV::OPC##_M1: \
2562 return RISCV::INV##_M1; \
2563 case RISCV::OPC##_M2: \
2564 return RISCV::INV##_M2; \
2565 case RISCV::OPC##_M4: \
2566 return RISCV::INV##_M4; \
2567 case RISCV::OPC##_M8: \
2568 return RISCV::INV##_M8; \
2569 case RISCV::OPC##_MF2: \
2570 return RISCV::INV##_MF2; \
2571 case RISCV::OPC##_MF4: \
2572 return RISCV::INV##_MF4; \
2573 case RISCV::OPC##_MF8: \
2574 return RISCV::INV##_MF8
2575
2576#define RVV_OPC_LMUL_MASK_CASE(OPC, INV) \
2577 case RISCV::OPC##_M1_MASK: \
2578 return RISCV::INV##_M1_MASK; \
2579 case RISCV::OPC##_M2_MASK: \
2580 return RISCV::INV##_M2_MASK; \
2581 case RISCV::OPC##_M4_MASK: \
2582 return RISCV::INV##_M4_MASK; \
2583 case RISCV::OPC##_M8_MASK: \
2584 return RISCV::INV##_M8_MASK; \
2585 case RISCV::OPC##_MF2_MASK: \
2586 return RISCV::INV##_MF2_MASK; \
2587 case RISCV::OPC##_MF4_MASK: \
2588 return RISCV::INV##_MF4_MASK; \
2589 case RISCV::OPC##_MF8_MASK: \
2590 return RISCV::INV##_MF8_MASK
2591
2592 switch (Opcode) {
2593 default:
2594 return std::nullopt;
2595 case RISCV::FADD_H:
2596 return RISCV::FSUB_H;
2597 case RISCV::FADD_S:
2598 return RISCV::FSUB_S;
2599 case RISCV::FADD_D:
2600 return RISCV::FSUB_D;
2601 case RISCV::FSUB_H:
2602 return RISCV::FADD_H;
2603 case RISCV::FSUB_S:
2604 return RISCV::FADD_S;
2605 case RISCV::FSUB_D:
2606 return RISCV::FADD_D;
2607 case RISCV::ADD:
2608 return RISCV::SUB;
2609 case RISCV::SUB:
2610 return RISCV::ADD;
2611 case RISCV::ADDW:
2612 return RISCV::SUBW;
2613 case RISCV::SUBW:
2614 return RISCV::ADDW;
2615 // clang-format off
2616 RVV_OPC_LMUL_CASE(PseudoVADD_VV, PseudoVSUB_VV);
2617 RVV_OPC_LMUL_MASK_CASE(PseudoVADD_VV, PseudoVSUB_VV);
2618 RVV_OPC_LMUL_CASE(PseudoVSUB_VV, PseudoVADD_VV);
2619 RVV_OPC_LMUL_MASK_CASE(PseudoVSUB_VV, PseudoVADD_VV);
2620 // clang-format on
2621 }
2622
2623#undef RVV_OPC_LMUL_MASK_CASE
2624#undef RVV_OPC_LMUL_CASE
2625}
2626
2628 const MachineOperand &MO,
2629 bool DoRegPressureReduce) {
2630 if (!MO.isReg() || !MO.getReg().isVirtual())
2631 return false;
2632 const MachineRegisterInfo &MRI = Root.getMF()->getRegInfo();
2633 MachineInstr *MI = MRI.getVRegDef(MO.getReg());
2634 if (!MI || !isFMUL(MI->getOpcode()))
2635 return false;
2636
2639 return false;
2640
2641 // Try combining even if fmul has more than one use as it eliminates
2642 // dependency between fadd(fsub) and fmul. However, it can extend liveranges
2643 // for fmul operands, so reject the transformation in register pressure
2644 // reduction mode.
2645 if (DoRegPressureReduce && !MRI.hasOneNonDBGUse(MI->getOperand(0).getReg()))
2646 return false;
2647
2648 // Do not combine instructions from different basic blocks.
2649 if (Root.getParent() != MI->getParent())
2650 return false;
2651 return RISCV::hasEqualFRM(Root, *MI);
2652}
2653
2655 SmallVectorImpl<unsigned> &Patterns,
2656 bool DoRegPressureReduce) {
2657 unsigned Opc = Root.getOpcode();
2658 bool IsFAdd = isFADD(Opc);
2659 if (!IsFAdd && !isFSUB(Opc))
2660 return false;
2661 bool Added = false;
2662 if (canCombineFPFusedMultiply(Root, Root.getOperand(1),
2663 DoRegPressureReduce)) {
2666 Added = true;
2667 }
2668 if (canCombineFPFusedMultiply(Root, Root.getOperand(2),
2669 DoRegPressureReduce)) {
2672 Added = true;
2673 }
2674 return Added;
2675}
2676
2677static bool getFPPatterns(MachineInstr &Root,
2678 SmallVectorImpl<unsigned> &Patterns,
2679 bool DoRegPressureReduce) {
2680 return getFPFusedMultiplyPatterns(Root, Patterns, DoRegPressureReduce);
2681}
2682
2683/// Utility routine that checks if \param MO is defined by an
2684/// \param CombineOpc instruction in the basic block \param MBB
2686 const MachineOperand &MO,
2687 unsigned CombineOpc) {
2688 const MachineRegisterInfo &MRI = MBB.getParent()->getRegInfo();
2689 const MachineInstr *MI = nullptr;
2690
2691 if (MO.isReg() && MO.getReg().isVirtual())
2692 MI = MRI.getUniqueVRegDef(MO.getReg());
2693 // And it needs to be in the trace (otherwise, it won't have a depth).
2694 if (!MI || MI->getParent() != &MBB || MI->getOpcode() != CombineOpc)
2695 return nullptr;
2696 // Must only used by the user we combine with.
2697 if (!MRI.hasOneNonDBGUse(MI->getOperand(0).getReg()))
2698 return nullptr;
2699
2700 return MI;
2701}
2702
2703/// Utility routine that checks if \param MO is defined by a SLLI in \param
2704/// MBB that can be combined by splitting across 2 SHXADD instructions. The
2705/// first SHXADD shift amount is given by \param OuterShiftAmt.
2707 const MachineOperand &MO,
2708 unsigned OuterShiftAmt) {
2709 const MachineInstr *ShiftMI = canCombine(MBB, MO, RISCV::SLLI);
2710 if (!ShiftMI)
2711 return false;
2712
2713 unsigned InnerShiftAmt = ShiftMI->getOperand(2).getImm();
2714 if (InnerShiftAmt < OuterShiftAmt || (InnerShiftAmt - OuterShiftAmt) > 3)
2715 return false;
2716
2717 return true;
2718}
2719
2720// Returns the shift amount from a SHXADD instruction. Returns 0 if the
2721// instruction is not a SHXADD.
2722static unsigned getSHXADDShiftAmount(unsigned Opc) {
2723 switch (Opc) {
2724 default:
2725 return 0;
2726 case RISCV::SH1ADD:
2727 return 1;
2728 case RISCV::SH2ADD:
2729 return 2;
2730 case RISCV::SH3ADD:
2731 return 3;
2732 }
2733}
2734
2735// Returns the shift amount from a SHXADD.UW instruction. Returns 0 if the
2736// instruction is not a SHXADD.UW.
2737static unsigned getSHXADDUWShiftAmount(unsigned Opc) {
2738 switch (Opc) {
2739 default:
2740 return 0;
2741 case RISCV::SH1ADD_UW:
2742 return 1;
2743 case RISCV::SH2ADD_UW:
2744 return 2;
2745 case RISCV::SH3ADD_UW:
2746 return 3;
2747 }
2748}
2749
2750// Look for opportunities to combine (sh3add Z, (add X, (slli Y, 5))) into
2751// (sh3add (sh2add Y, Z), X).
2752static bool getSHXADDPatterns(const MachineInstr &Root,
2753 SmallVectorImpl<unsigned> &Patterns) {
2754 unsigned ShiftAmt = getSHXADDShiftAmount(Root.getOpcode());
2755 if (!ShiftAmt)
2756 return false;
2757
2758 const MachineBasicBlock &MBB = *Root.getParent();
2759
2760 const MachineInstr *AddMI = canCombine(MBB, Root.getOperand(2), RISCV::ADD);
2761 if (!AddMI)
2762 return false;
2763
2764 bool Found = false;
2765 if (canCombineShiftIntoShXAdd(MBB, AddMI->getOperand(1), ShiftAmt)) {
2767 Found = true;
2768 }
2769 if (canCombineShiftIntoShXAdd(MBB, AddMI->getOperand(2), ShiftAmt)) {
2771 Found = true;
2772 }
2773
2774 return Found;
2775}
2776
2788
2790 MachineInstr &Root, SmallVectorImpl<unsigned> &Patterns,
2791 bool DoRegPressureReduce) const {
2792
2793 if (getFPPatterns(Root, Patterns, DoRegPressureReduce))
2794 return true;
2795
2796 if (getSHXADDPatterns(Root, Patterns))
2797 return true;
2798
2799 return TargetInstrInfo::getMachineCombinerPatterns(Root, Patterns,
2800 DoRegPressureReduce);
2801}
2802
2803static unsigned getFPFusedMultiplyOpcode(unsigned RootOpc, unsigned Pattern) {
2804 switch (RootOpc) {
2805 default:
2806 llvm_unreachable("Unexpected opcode");
2807 case RISCV::FADD_H:
2808 return RISCV::FMADD_H;
2809 case RISCV::FADD_S:
2810 return RISCV::FMADD_S;
2811 case RISCV::FADD_D:
2812 return RISCV::FMADD_D;
2813 case RISCV::FSUB_H:
2814 return Pattern == RISCVMachineCombinerPattern::FMSUB ? RISCV::FMSUB_H
2815 : RISCV::FNMSUB_H;
2816 case RISCV::FSUB_S:
2817 return Pattern == RISCVMachineCombinerPattern::FMSUB ? RISCV::FMSUB_S
2818 : RISCV::FNMSUB_S;
2819 case RISCV::FSUB_D:
2820 return Pattern == RISCVMachineCombinerPattern::FMSUB ? RISCV::FMSUB_D
2821 : RISCV::FNMSUB_D;
2822 }
2823}
2824
2825static unsigned getAddendOperandIdx(unsigned Pattern) {
2826 switch (Pattern) {
2827 default:
2828 llvm_unreachable("Unexpected pattern");
2831 return 2;
2834 return 1;
2835 }
2836}
2837
2839 unsigned Pattern,
2842 MachineFunction *MF = Root.getMF();
2843 MachineRegisterInfo &MRI = MF->getRegInfo();
2845
2846 MachineOperand &Mul1 = Prev.getOperand(1);
2847 MachineOperand &Mul2 = Prev.getOperand(2);
2848 MachineOperand &Dst = Root.getOperand(0);
2850
2851 Register DstReg = Dst.getReg();
2852 unsigned FusedOpc = getFPFusedMultiplyOpcode(Root.getOpcode(), Pattern);
2853 uint32_t IntersectedFlags = Root.getFlags() & Prev.getFlags();
2854 DebugLoc MergedLoc =
2856
2857 bool Mul1IsKill = Mul1.isKill();
2858 bool Mul2IsKill = Mul2.isKill();
2859 bool AddendIsKill = Addend.isKill();
2860
2861 // We need to clear kill flags since we may be extending the live range past
2862 // a kill. If the mul had kill flags, we can preserve those since we know
2863 // where the previous range stopped.
2864 MRI.clearKillFlags(Mul1.getReg());
2865 MRI.clearKillFlags(Mul2.getReg());
2866
2868 BuildMI(*MF, MergedLoc, TII->get(FusedOpc), DstReg)
2869 .addReg(Mul1.getReg(), getKillRegState(Mul1IsKill))
2870 .addReg(Mul2.getReg(), getKillRegState(Mul2IsKill))
2871 .addReg(Addend.getReg(), getKillRegState(AddendIsKill))
2872 .setMIFlags(IntersectedFlags);
2873
2874 InsInstrs.push_back(MIB);
2875 if (MRI.hasOneNonDBGUse(Prev.getOperand(0).getReg()))
2876 DelInstrs.push_back(&Prev);
2877 DelInstrs.push_back(&Root);
2878}
2879
2880// Combine patterns like (sh3add Z, (add X, (slli Y, 5))) to
2881// (sh3add (sh2add Y, Z), X) if the shift amount can be split across two
2882// shXadd instructions. The outer shXadd keeps its original opcode.
2883static void
2884genShXAddAddShift(MachineInstr &Root, unsigned AddOpIdx,
2887 DenseMap<Register, unsigned> &InstrIdxForVirtReg) {
2888 MachineFunction *MF = Root.getMF();
2889 MachineRegisterInfo &MRI = MF->getRegInfo();
2891
2892 unsigned OuterShiftAmt = getSHXADDShiftAmount(Root.getOpcode());
2893 assert(OuterShiftAmt != 0 && "Unexpected opcode");
2894
2895 MachineInstr *AddMI = MRI.getUniqueVRegDef(Root.getOperand(2).getReg());
2896 MachineInstr *ShiftMI =
2897 MRI.getUniqueVRegDef(AddMI->getOperand(AddOpIdx).getReg());
2898
2899 unsigned InnerShiftAmt = ShiftMI->getOperand(2).getImm();
2900 assert(InnerShiftAmt >= OuterShiftAmt && "Unexpected shift amount");
2901
2902 unsigned InnerOpc;
2903 switch (InnerShiftAmt - OuterShiftAmt) {
2904 default:
2905 llvm_unreachable("Unexpected shift amount");
2906 case 0:
2907 InnerOpc = RISCV::ADD;
2908 break;
2909 case 1:
2910 InnerOpc = RISCV::SH1ADD;
2911 break;
2912 case 2:
2913 InnerOpc = RISCV::SH2ADD;
2914 break;
2915 case 3:
2916 InnerOpc = RISCV::SH3ADD;
2917 break;
2918 }
2919
2920 const MachineOperand &X = AddMI->getOperand(3 - AddOpIdx);
2921 const MachineOperand &Y = ShiftMI->getOperand(1);
2922 const MachineOperand &Z = Root.getOperand(1);
2923
2924 Register NewVR = MRI.createVirtualRegister(&RISCV::GPRRegClass);
2925
2926 auto MIB1 = BuildMI(*MF, MIMetadata(Root), TII->get(InnerOpc), NewVR)
2927 .addReg(Y.getReg(), getKillRegState(Y.isKill()))
2928 .addReg(Z.getReg(), getKillRegState(Z.isKill()));
2929 auto MIB2 = BuildMI(*MF, MIMetadata(Root), TII->get(Root.getOpcode()),
2930 Root.getOperand(0).getReg())
2931 .addReg(NewVR, RegState::Kill)
2932 .addReg(X.getReg(), getKillRegState(X.isKill()));
2933
2934 InstrIdxForVirtReg.insert(std::make_pair(NewVR, 0));
2935 InsInstrs.push_back(MIB1);
2936 InsInstrs.push_back(MIB2);
2937 DelInstrs.push_back(ShiftMI);
2938 DelInstrs.push_back(AddMI);
2939 DelInstrs.push_back(&Root);
2940}
2941
2943 MachineInstr &Root, unsigned Pattern,
2946 DenseMap<Register, unsigned> &InstrIdxForVirtReg) const {
2947 MachineRegisterInfo &MRI = Root.getMF()->getRegInfo();
2948 switch (Pattern) {
2949 default:
2951 DelInstrs, InstrIdxForVirtReg);
2952 return;
2955 MachineInstr &Prev = *MRI.getVRegDef(Root.getOperand(1).getReg());
2956 combineFPFusedMultiply(Root, Prev, Pattern, InsInstrs, DelInstrs);
2957 return;
2958 }
2961 MachineInstr &Prev = *MRI.getVRegDef(Root.getOperand(2).getReg());
2962 combineFPFusedMultiply(Root, Prev, Pattern, InsInstrs, DelInstrs);
2963 return;
2964 }
2966 genShXAddAddShift(Root, 1, InsInstrs, DelInstrs, InstrIdxForVirtReg);
2967 return;
2969 genShXAddAddShift(Root, 2, InsInstrs, DelInstrs, InstrIdxForVirtReg);
2970 return;
2971 }
2972}
2973
2975 StringRef &ErrInfo) const {
2976 MCInstrDesc const &Desc = MI.getDesc();
2977
2978 for (const auto &[Index, Operand] : enumerate(Desc.operands())) {
2979 const MachineOperand &MO = MI.getOperand(Index);
2980 unsigned OpType = Operand.OperandType;
2981 switch (OpType) {
2982 default:
2983 if (OpType >= RISCVOp::OPERAND_FIRST_RISCV_IMM &&
2985 if (!MO.isImm()) {
2986 ErrInfo = "Expected an immediate operand.";
2987 return false;
2988 }
2989 int64_t Imm = MO.getImm();
2990 bool Ok;
2991 switch (OpType) {
2992 default:
2993 llvm_unreachable("Unexpected operand type");
2994
2995#define CASE_OPERAND_UIMM(NUM) \
2996 case RISCVOp::OPERAND_UIMM##NUM: \
2997 Ok = isUInt<NUM>(Imm); \
2998 break;
2999#define CASE_OPERAND_UIMM_LSB_ZEROS(BITS, SUFFIX) \
3000 case RISCVOp::OPERAND_UIMM##BITS##_LSB##SUFFIX: { \
3001 constexpr size_t NumZeros = sizeof(#SUFFIX) - 1; \
3002 Ok = isShiftedUInt<BITS - NumZeros, NumZeros>(Imm); \
3003 break; \
3004 }
3005#define CASE_OPERAND_SIMM(NUM) \
3006 case RISCVOp::OPERAND_SIMM##NUM: \
3007 Ok = isInt<NUM>(Imm); \
3008 break;
3009 // clang-format off
3033 // clang-format on
3035 Ok = isUInt<5>(Imm) && (Imm != 0);
3036 break;
3038 Ok = isUInt<5>(Imm) && (Imm > 3);
3039 break;
3041 Ok = Imm >= 1 && Imm <= 32;
3042 break;
3044 Ok = Imm >= 1 && Imm <= 64;
3045 break;
3047 Ok = Imm == STI.getXLen();
3048 break;
3050 Ok = isUInt<8>(Imm) && Imm >= 32;
3051 break;
3053 Ok = RISCV::isValidYBNDSWImm(Imm);
3054 break;
3056 Ok = isShiftedInt<6, 4>(Imm) && (Imm != 0);
3057 break;
3059 Ok = isShiftedUInt<8, 2>(Imm) && (Imm != 0);
3060 break;
3062 Ok = isUInt<16>(Imm) && (Imm != 0);
3063 break;
3065 Ok = Imm == 3;
3066 break;
3068 Ok = Imm == 4;
3069 break;
3071 Ok = (isUInt<5>(Imm) && Imm != 0) || Imm == -1;
3072 break;
3073 // clang-format off
3081 // clang-format on
3083 Ok = Imm >= -15 && Imm <= 16;
3084 break;
3086 Ok = isInt<5>(Imm) && (Imm != 0);
3087 break;
3089 Ok = Imm != 0 && isInt<6>(Imm);
3090 break;
3092 Ok = isUInt<10>(Imm) && RISCVVType::isValidVType(Imm);
3093 break;
3095 Ok = isUInt<11>(Imm) && RISCVVType::isValidVType(Imm);
3096 break;
3098 Ok = isShiftedInt<7, 5>(Imm);
3099 break;
3101 Ok = isInt<16>(Imm) && (Imm != 0);
3102 break;
3104 Ok = isInt<20>(Imm);
3105 break;
3107 Ok = STI.is64Bit() ? isUInt<6>(Imm) : isUInt<5>(Imm);
3108 break;
3110 Ok = STI.is64Bit() ? isUInt<6>(Imm) : isUInt<5>(Imm);
3111 Ok = Ok && Imm != 0;
3112 break;
3114 Ok = (isUInt<5>(Imm) && Imm != 0) || (Imm >= 0xfffe0 && Imm <= 0xfffff);
3115 break;
3117 Ok = Imm >= 0 && Imm <= 10;
3118 break;
3120 Ok = Imm >= 0 && Imm <= 7;
3121 break;
3123 Ok = Imm >= 1 && Imm <= 10;
3124 break;
3126 Ok = Imm >= 2 && Imm <= 14;
3127 break;
3129 Ok = Imm >= RISCVZC::RA && Imm <= RISCVZC::RA_S0_S11;
3130 break;
3132 Ok = Imm >= RISCVZC::RA_S0 && Imm <= RISCVZC::RA_S0_S11;
3133 break;
3135 Ok = Imm >= 0 && Imm <= 48 && Imm % 16 == 0;
3136 break;
3139 break;
3141 Ok = Imm == RISCVFPRndMode::RTZ;
3142 break;
3144 Ok = Imm >= 0 && Imm < RISCVCC::COND_INVALID;
3145 break;
3147 Ok = isValidAtomicOrdering(Imm);
3148 break;
3151 Imm;
3152 break;
3154 Ok = (isUInt<5>(Imm) && RISCVVType::isValidSEW(1 << Imm));
3155 break;
3157 Ok = Imm == 0;
3158 break;
3161 if (RISCVII::usesVXRM(Desc.TSFlags))
3162 Ok = isUInt<2>(Imm);
3163 else
3165 break;
3168 break;
3170 Ok = Imm == 1 || Imm == 2 || Imm == 4;
3171 break;
3172 }
3173 if (!Ok) {
3174 ErrInfo = "Invalid immediate";
3175 return false;
3176 }
3177 }
3178 break;
3180 // TODO: We could be stricter about what non-register operands are
3181 // allowed.
3182 if (MO.isReg()) {
3183 ErrInfo = "Expected a non-register operand.";
3184 return false;
3185 }
3186 if (MO.isImm() && !isInt<12>(MO.getImm())) {
3187 ErrInfo = "Invalid immediate";
3188 return false;
3189 }
3190 break;
3193 // TODO: We could be stricter about what non-register operands are
3194 // allowed.
3195 if (MO.isReg()) {
3196 ErrInfo = "Expected a non-register operand.";
3197 return false;
3198 }
3199 if (MO.isImm() && !isUInt<20>(MO.getImm())) {
3200 ErrInfo = "Invalid immediate";
3201 return false;
3202 }
3203 break;
3205 // TODO: We could be stricter about what non-register operands are
3206 // allowed.
3207 if (MO.isReg()) {
3208 ErrInfo = "Expected a non-register operand.";
3209 return false;
3210 }
3211 if (MO.isImm() && !isInt<32>(MO.getImm())) {
3212 ErrInfo = "Invalid immediate";
3213 return false;
3214 }
3215 break;
3217 if (MO.isImm()) {
3218 int64_t Imm = MO.getImm();
3219 // VLMAX is represented as -1.
3220 if (!isUInt<5>(Imm) && Imm != -1) {
3221 ErrInfo = "Invalid immediate";
3222 return false;
3223 }
3224 } else if (!MO.isReg()) {
3225 ErrInfo = "Expected a register or immediate operand.";
3226 return false;
3227 }
3228 break;
3230 if (!MO.isReg() && !MO.isImm()) {
3231 ErrInfo = "Expected a register or immediate operand.";
3232 return false;
3233 }
3234 break;
3235 }
3236 }
3237
3238 const uint64_t TSFlags = Desc.TSFlags;
3239 if (RISCVII::hasVLOp(TSFlags)) {
3240 const MachineOperand &Op = MI.getOperand(RISCVII::getVLOpNum(Desc));
3241 if (!Op.isImm() && !Op.isReg()) {
3242 ErrInfo = "Invalid operand type for VL operand";
3243 return false;
3244 }
3245 if (Op.isReg() && Op.getReg().isValid()) {
3246 const MachineRegisterInfo &MRI = MI.getParent()->getParent()->getRegInfo();
3247 auto *RC = MRI.getRegClass(Op.getReg());
3248 if (!RISCV::GPRNoX0RegClass.hasSubClassEq(RC)) {
3249 ErrInfo = "Invalid register class for VL operand";
3250 return false;
3251 }
3252 }
3253 if (!RISCVII::hasSEWOp(TSFlags)) {
3254 ErrInfo = "VL operand w/o SEW operand?";
3255 return false;
3256 }
3257 }
3258 if (RISCVII::hasSEWOp(TSFlags)) {
3259 unsigned OpIdx = RISCVII::getSEWOpNum(Desc);
3260 if (!MI.getOperand(OpIdx).isImm()) {
3261 ErrInfo = "SEW value expected to be an immediate";
3262 return false;
3263 }
3264 uint64_t Log2SEW = MI.getOperand(OpIdx).getImm();
3265 if (Log2SEW > 31) {
3266 ErrInfo = "Unexpected SEW value";
3267 return false;
3268 }
3269 unsigned SEW = Log2SEW ? 1 << Log2SEW : 8;
3270 if (!RISCVVType::isValidSEW(SEW)) {
3271 ErrInfo = "Unexpected SEW value";
3272 return false;
3273 }
3274 }
3275 if (RISCVII::hasVecPolicyOp(TSFlags)) {
3277 if (!MI.getOperand(OpIdx).isImm()) {
3278 ErrInfo = "Policy operand expected to be an immediate";
3279 return false;
3280 }
3281 uint64_t Policy = MI.getOperand(OpIdx).getImm();
3283 ErrInfo = "Invalid Policy Value";
3284 return false;
3285 }
3286 if (!RISCVII::hasVLOp(TSFlags)) {
3287 ErrInfo = "policy operand w/o VL operand?";
3288 return false;
3289 }
3290
3291 // VecPolicy operands can only exist on instructions with passthru/merge
3292 // arguments. Note that not all arguments with passthru have vec policy
3293 // operands- some instructions have implicit policies.
3294 unsigned UseOpIdx;
3295 if (!MI.isRegTiedToUseOperand(0, &UseOpIdx)) {
3296 ErrInfo = "policy operand w/o tied operand?";
3297 return false;
3298 }
3299 }
3300
3301 if (int Idx = RISCVII::getFRMOpNum(Desc);
3302 Idx >= 0 && MI.getOperand(Idx).getImm() == RISCVFPRndMode::DYN &&
3303 !MI.readsRegister(RISCV::FRM, /*TRI=*/nullptr)) {
3304 ErrInfo = "dynamic rounding mode should read FRM";
3305 return false;
3306 }
3307
3308 return true;
3309}
3310
3312 const MachineInstr &AddrI,
3313 ExtAddrMode &AM) const {
3314 switch (MemI.getOpcode()) {
3315 default:
3316 return false;
3317 case RISCV::LB:
3318 case RISCV::LBU:
3319 case RISCV::LH:
3320 case RISCV::LH_INX:
3321 case RISCV::LHU:
3322 case RISCV::LW:
3323 case RISCV::LW_INX:
3324 case RISCV::LWU:
3325 case RISCV::LD:
3326 case RISCV::LD_RV32:
3327 case RISCV::FLH:
3328 case RISCV::FLW:
3329 case RISCV::FLD:
3330 case RISCV::SB:
3331 case RISCV::SH:
3332 case RISCV::SH_INX:
3333 case RISCV::SW:
3334 case RISCV::SW_INX:
3335 case RISCV::SD:
3336 case RISCV::SD_RV32:
3337 case RISCV::FSH:
3338 case RISCV::FSW:
3339 case RISCV::FSD:
3340 break;
3341 }
3342
3343 if (MemI.getOperand(0).getReg() == Reg)
3344 return false;
3345
3346 if (AddrI.getOpcode() != RISCV::ADDI || !AddrI.getOperand(1).isReg() ||
3347 !AddrI.getOperand(2).isImm())
3348 return false;
3349
3350 int64_t OldOffset = MemI.getOperand(2).getImm();
3351 int64_t Disp = AddrI.getOperand(2).getImm();
3352 int64_t NewOffset = OldOffset + Disp;
3353 if (!STI.is64Bit())
3354 NewOffset = SignExtend64<32>(NewOffset);
3355
3356 if (!isInt<12>(NewOffset))
3357 return false;
3358
3359 AM.BaseReg = AddrI.getOperand(1).getReg();
3360 AM.ScaledReg = 0;
3361 AM.Scale = 0;
3362 AM.Displacement = NewOffset;
3364 return true;
3365}
3366
3368 const ExtAddrMode &AM) const {
3369
3370 const DebugLoc &DL = MemI.getDebugLoc();
3371 MachineBasicBlock &MBB = *MemI.getParent();
3372
3373 assert(AM.ScaledReg == 0 && AM.Scale == 0 &&
3374 "Addressing mode not supported for folding");
3375
3376 return BuildMI(MBB, MemI, DL, get(MemI.getOpcode()))
3377 .addReg(MemI.getOperand(0).getReg(), getDefRegState(MemI.mayLoad()))
3378 .addReg(AM.BaseReg)
3379 .addImm(AM.Displacement)
3380 .setMemRefs(MemI.memoperands())
3381 .setMIFlags(MemI.getFlags());
3382}
3383
3384// TODO: At the moment, MIPS introduced paring of instructions operating with
3385// word or double word. This should be extended with more instructions when more
3386// vendors support load/store pairing.
3388 switch (Opc) {
3389 default:
3390 return false;
3391 case RISCV::SW:
3392 case RISCV::SD:
3393 case RISCV::LD:
3394 case RISCV::LW:
3395 return true;
3396 }
3397}
3398
3400 const TargetRegisterInfo *TRI) {
3401 // If this is a volatile load/store, don't mess with it.
3402 if (LdSt.hasOrderedMemoryRef() || LdSt.getNumExplicitOperands() != 3)
3403 return false;
3404
3405 if (LdSt.getOperand(1).isFI())
3406 return true;
3407
3408 assert(LdSt.getOperand(1).isReg() && "Expected a reg operand.");
3409 // Can't cluster if the instruction modifies the base register
3410 // or it is update form. e.g. ld x5,8(x5)
3411 if (LdSt.modifiesRegister(LdSt.getOperand(1).getReg(), TRI))
3412 return false;
3413
3414 if (!LdSt.getOperand(2).isImm())
3415 return false;
3416
3417 return true;
3418}
3419
3422 int64_t &Offset, bool &OffsetIsScalable, LocationSize &Width,
3423 const TargetRegisterInfo *TRI) const {
3424 if (!LdSt.mayLoadOrStore())
3425 return false;
3426
3427 // Conservatively, only handle scalar loads/stores for now.
3428 switch (LdSt.getOpcode()) {
3429 case RISCV::LB:
3430 case RISCV::LBU:
3431 case RISCV::SB:
3432 case RISCV::LH:
3433 case RISCV::LH_INX:
3434 case RISCV::LHU:
3435 case RISCV::FLH:
3436 case RISCV::SH:
3437 case RISCV::SH_INX:
3438 case RISCV::FSH:
3439 case RISCV::LW:
3440 case RISCV::LW_INX:
3441 case RISCV::LWU:
3442 case RISCV::FLW:
3443 case RISCV::SW:
3444 case RISCV::SW_INX:
3445 case RISCV::FSW:
3446 case RISCV::LD:
3447 case RISCV::LD_RV32:
3448 case RISCV::FLD:
3449 case RISCV::SD:
3450 case RISCV::SD_RV32:
3451 case RISCV::FSD:
3452 break;
3453 default:
3454 return false;
3455 }
3456 const MachineOperand *BaseOp;
3457 OffsetIsScalable = false;
3458 if (!getMemOperandWithOffsetWidth(LdSt, BaseOp, Offset, Width, TRI))
3459 return false;
3460 BaseOps.push_back(BaseOp);
3461 return true;
3462}
3463
3464// TODO: This was copied from SIInstrInfo. Could it be lifted to a common
3465// helper?
3468 const MachineInstr &MI2,
3470 // Only examine the first "base" operand of each instruction, on the
3471 // assumption that it represents the real base address of the memory access.
3472 // Other operands are typically offsets or indices from this base address.
3473 if (BaseOps1.front()->isIdenticalTo(*BaseOps2.front()))
3474 return true;
3475
3476 if (!MI1.hasOneMemOperand() || !MI2.hasOneMemOperand())
3477 return false;
3478
3479 auto MO1 = *MI1.memoperands_begin();
3480 auto MO2 = *MI2.memoperands_begin();
3481 if (MO1->getAddrSpace() != MO2->getAddrSpace())
3482 return false;
3483
3484 auto Base1 = MO1->getValue();
3485 auto Base2 = MO2->getValue();
3486 if (!Base1 || !Base2)
3487 return false;
3488 Base1 = getUnderlyingObject(Base1);
3489 Base2 = getUnderlyingObject(Base2);
3490
3491 if (isa<UndefValue>(Base1) || isa<UndefValue>(Base2))
3492 return false;
3493
3494 return Base1 == Base2;
3495}
3496
3498 ArrayRef<const MachineOperand *> BaseOps1, int64_t Offset1,
3499 bool OffsetIsScalable1, ArrayRef<const MachineOperand *> BaseOps2,
3500 int64_t Offset2, bool OffsetIsScalable2, unsigned ClusterSize,
3501 unsigned NumBytes) const {
3502 // If the mem ops (to be clustered) do not have the same base ptr, then they
3503 // should not be clustered
3504 if (!BaseOps1.empty() && !BaseOps2.empty()) {
3505 const MachineInstr &FirstLdSt = *BaseOps1.front()->getParent();
3506 const MachineInstr &SecondLdSt = *BaseOps2.front()->getParent();
3507 if (!memOpsHaveSameBasePtr(FirstLdSt, BaseOps1, SecondLdSt, BaseOps2))
3508 return false;
3509 } else if (!BaseOps1.empty() || !BaseOps2.empty()) {
3510 // If only one base op is empty, they do not have the same base ptr
3511 return false;
3512 }
3513
3514 unsigned CacheLineSize =
3515 BaseOps1.front()->getParent()->getMF()->getSubtarget().getCacheLineSize();
3516 // Assume a cache line size of 64 bytes if no size is set in RISCVSubtarget.
3518 // Cluster if the memory operations are on the same or a neighbouring cache
3519 // line, but limit the maximum ClusterSize to avoid creating too much
3520 // additional register pressure.
3521 return ClusterSize <= 4 && std::abs(Offset1 - Offset2) < CacheLineSize;
3522}
3523
3524// Set BaseReg (the base register operand), Offset (the byte offset being
3525// accessed) and the access Width of the passed instruction that reads/writes
3526// memory. Returns false if the instruction does not read/write memory or the
3527// BaseReg/Offset/Width can't be determined. Is not guaranteed to always
3528// recognise base operands and offsets in all cases.
3529// TODO: Add an IsScalable bool ref argument (like the equivalent AArch64
3530// function) and set it as appropriate.
3532 const MachineInstr &LdSt, const MachineOperand *&BaseReg, int64_t &Offset,
3533 LocationSize &Width, const TargetRegisterInfo *TRI) const {
3534 if (!LdSt.mayLoadOrStore())
3535 return false;
3536
3537 // Here we assume the standard RISC-V ISA, which uses a base+offset
3538 // addressing mode. You'll need to relax these conditions to support custom
3539 // load/store instructions.
3540 if (LdSt.getNumExplicitOperands() != 3)
3541 return false;
3542 if ((!LdSt.getOperand(1).isReg() && !LdSt.getOperand(1).isFI()) ||
3543 !LdSt.getOperand(2).isImm())
3544 return false;
3545
3546 if (!LdSt.hasOneMemOperand())
3547 return false;
3548
3549 Width = (*LdSt.memoperands_begin())->getSize();
3550 BaseReg = &LdSt.getOperand(1);
3551 Offset = LdSt.getOperand(2).getImm();
3552 return true;
3553}
3554
3556 const MachineInstr &MIa, const MachineInstr &MIb) const {
3557 assert(MIa.mayLoadOrStore() && "MIa must be a load or store.");
3558 assert(MIb.mayLoadOrStore() && "MIb must be a load or store.");
3559
3562 return false;
3563
3564 // Retrieve the base register, offset from the base register and width. Width
3565 // is the size of memory that is being loaded/stored (e.g. 1, 2, 4). If
3566 // base registers are identical, and the offset of a lower memory access +
3567 // the width doesn't overlap the offset of a higher memory access,
3568 // then the memory accesses are different.
3569 const TargetRegisterInfo *TRI = STI.getRegisterInfo();
3570 const MachineOperand *BaseOpA = nullptr, *BaseOpB = nullptr;
3571 int64_t OffsetA = 0, OffsetB = 0;
3573 WidthB = LocationSize::precise(0);
3574 if (getMemOperandWithOffsetWidth(MIa, BaseOpA, OffsetA, WidthA, TRI) &&
3575 getMemOperandWithOffsetWidth(MIb, BaseOpB, OffsetB, WidthB, TRI)) {
3576 if (BaseOpA->isIdenticalTo(*BaseOpB)) {
3577 int LowOffset = std::min(OffsetA, OffsetB);
3578 int HighOffset = std::max(OffsetA, OffsetB);
3579 LocationSize LowWidth = (LowOffset == OffsetA) ? WidthA : WidthB;
3580 if (LowWidth.hasValue() &&
3581 LowOffset + (int)LowWidth.getValue() <= HighOffset)
3582 return true;
3583 }
3584 }
3585 return false;
3586}
3587
3588std::pair<unsigned, unsigned>
3590 const unsigned Mask = RISCVII::MO_DIRECT_FLAG_MASK;
3591 return std::make_pair(TF & Mask, TF & ~Mask);
3592}
3593
3596 using namespace RISCVII;
3597 static const std::pair<unsigned, const char *> TargetFlags[] = {
3598 {MO_CALL, "riscv-call"},
3599 {MO_LO, "riscv-lo"},
3600 {MO_HI, "riscv-hi"},
3601 {MO_PCREL_LO, "riscv-pcrel-lo"},
3602 {MO_PCREL_HI, "riscv-pcrel-hi"},
3603 {MO_GOT_HI, "riscv-got-hi"},
3604 {MO_TPREL_LO, "riscv-tprel-lo"},
3605 {MO_TPREL_HI, "riscv-tprel-hi"},
3606 {MO_TPREL_ADD, "riscv-tprel-add"},
3607 {MO_TLS_GOT_HI, "riscv-tls-got-hi"},
3608 {MO_TLS_GD_HI, "riscv-tls-gd-hi"},
3609 {MO_TLSDESC_HI, "riscv-tlsdesc-hi"},
3610 {MO_TLSDESC_LOAD_LO, "riscv-tlsdesc-load-lo"},
3611 {MO_TLSDESC_ADD_LO, "riscv-tlsdesc-add-lo"},
3612 {MO_TLSDESC_CALL, "riscv-tlsdesc-call"}};
3613 return ArrayRef(TargetFlags);
3614}
3616 MachineFunction &MF, bool OutlineFromLinkOnceODRs) const {
3617 const Function &F = MF.getFunction();
3618
3619 // Can F be deduplicated by the linker? If it can, don't outline from it.
3620 if (!OutlineFromLinkOnceODRs && F.hasLinkOnceODRLinkage())
3621 return false;
3622
3623 // Don't outline from functions with section markings; the program could
3624 // expect that all the code is in the named section.
3625 if (F.hasSection())
3626 return false;
3627
3628 // It's safe to outline from MF.
3629 return true;
3630}
3631
3633 unsigned &Flags) const {
3634 // More accurate safety checking is done in getOutliningCandidateInfo.
3636}
3637
3638// Enum values indicating how an outlined call should be constructed.
3644
3649
3651 const MachineFunction *MF = MBB.getParent();
3652 const Function &F = MF->getFunction();
3653 return F.getFnAttribute("fentry-call").getValueAsBool() ||
3654 F.hasFnAttribute("patchable-function-entry");
3655}
3656
3658 MCRegister RegNo) {
3659 return MI.readsRegister(RegNo, TRI) ||
3660 MI.getDesc().hasImplicitUseOfPhysReg(RegNo);
3661}
3662
3664 const TargetRegisterInfo *TRI, MCRegister RegNo) {
3665 return MI.modifiesRegister(RegNo, TRI) ||
3666 MI.getDesc().hasImplicitDefOfPhysReg(RegNo);
3667}
3668
3670 if (!MBB.back().isReturn())
3671 return true;
3673 return true;
3674
3675 // If the candidate reads the pre-set register
3676 // that can be used for expanding PseudoTAIL instruction,
3677 // then we cannot insert tail call.
3678 const TargetSubtargetInfo &STI = MBB.getParent()->getSubtarget();
3679 MCRegister TailExpandUseRegNo =
3681 for (const MachineInstr &MI : MBB) {
3682 if (isMIReadsReg(MI, STI.getRegisterInfo(), TailExpandUseRegNo))
3683 return true;
3684 if (isMIModifiesReg(MI, STI.getRegisterInfo(), TailExpandUseRegNo))
3685 break;
3686 }
3687 return false;
3688}
3689
3691 const TargetRegisterInfo &TRI) {
3692 // Candidate registers for saving X5: t1-t6
3693 static const MCPhysReg TempRegs[] = {
3694 RISCV::X6, // t1
3695 RISCV::X7, // t2
3696 RISCV::X28, // t3
3697 RISCV::X29, // t4
3698 RISCV::X30, // t5
3699 RISCV::X31 // t6
3700 };
3701
3702 const MachineFunction *MF = C.getMF();
3703 const MachineRegisterInfo &MRI = MF->getRegInfo();
3704
3705 for (MCPhysReg Reg : TempRegs) {
3706 if (MRI.isReserved(Reg))
3707 continue;
3708
3709 if (C.isAvailableAcrossAndOutOfSeq(Reg, TRI) &&
3710 C.isAvailableInsideSeq(Reg, TRI)) {
3711 return Reg;
3712 }
3713 }
3714
3715 return Register();
3716}
3717
3719 // If the expansion register for tail calls is live across the candidate
3720 // outlined call site, we cannot outline that candidate as the expansion
3721 // would clobber the register.
3722 MCRegister TailExpandUseReg =
3723 RISCVII::getTailExpandUseRegNo(STI.getFeatureBits());
3724 if (C.back().isReturn() &&
3725 !C.isAvailableAcrossAndOutOfSeq(TailExpandUseReg, RegInfo)) {
3726 LLVM_DEBUG(dbgs() << "MBB:\n" << *C.getMBB());
3727 LLVM_DEBUG(dbgs() << "Cannot be outlined between: " << C.front() << "and "
3728 << C.back());
3729 LLVM_DEBUG(dbgs() << "Because the tail-call register is live across "
3730 "the proposed outlined function call\n");
3731 return true;
3732 }
3733
3734 // If last instruction is return then we can rely on
3735 // the verification already performed in the getOutliningTypeImpl.
3736 if (C.back().isReturn()) {
3737 assert(!cannotInsertTailCall(*C.getMBB()) &&
3738 "The candidate who uses return instruction must be outlined "
3739 "using tail call");
3740 return false;
3741 }
3742
3743 // Filter out candidates where the X5 register (t0) can't be used to setup
3744 // the function call.
3745 if (!C.isAvailableInsideSeq(RISCV::X5, RegInfo))
3746 return true;
3747
3748 // If X5 is available in the region, use X5 directly (MachineOutlinerDefault).
3749 if (C.isAvailableAcrossAndOutOfSeq(RISCV::X5, RegInfo))
3750 return false;
3751
3752 // Otherwise, try to save X5 into t1-t6 (MachineOutlinerRegSave).
3754 return false;
3755
3756 return true;
3757}
3758
3759std::optional<std::unique_ptr<outliner::OutlinedFunction>>
3761 const MachineModuleInfo &MMI,
3762 std::vector<outliner::Candidate> &RepeatedSequenceLocs,
3763 unsigned MinRepeats) const {
3764
3765 // Analyze each candidate and erase the ones that are not viable.
3766 llvm::erase_if(RepeatedSequenceLocs, [this](auto Candidate) {
3767 return analyzeCandidate(Candidate);
3768 });
3769
3770 // If the sequence doesn't have enough candidates left, then we're done.
3771 if (RepeatedSequenceLocs.size() < MinRepeats)
3772 return std::nullopt;
3773
3774 // Each RepeatedSequenceLoc is identical.
3775 outliner::Candidate &Candidate = RepeatedSequenceLocs[0];
3776 unsigned InstrSizeCExt =
3777 Candidate.getMF()->getSubtarget<RISCVSubtarget>().hasStdExtZca() ? 2 : 4;
3778 unsigned CallOverhead = 0, FrameOverhead = 0;
3779
3780 // Count the number of CFI instructions in the candidate, if present.
3781 unsigned CFICount = 0;
3782 for (auto &I : Candidate) {
3783 if (I.isCFIInstruction())
3784 CFICount++;
3785 }
3786
3787 // Ensure CFI coverage matches: comparing the number of CFIs in the candidate
3788 // with the total number of CFIs in the parent function for each candidate.
3789 // Outlining only a subset of a function’s CFIs would split the unwind state
3790 // across two code regions and lead to incorrect address offsets between the
3791 // outlined body and the remaining code. To preserve correct unwind info, we
3792 // only outline when all CFIs in the function can be outlined together.
3793 for (outliner::Candidate &C : RepeatedSequenceLocs) {
3794 std::vector<MCCFIInstruction> CFIInstructions =
3795 C.getMF()->getFrameInstructions();
3796
3797 if (CFICount > 0 && CFICount != CFIInstructions.size())
3798 return std::nullopt;
3799 }
3800
3802 if (Candidate.back().isReturn()) {
3804 // tail call = auipc + jalr in the worst case without linker relaxation.
3805 // FIXME: This code suggests the JALR can be compressed - how?
3806 CallOverhead = 4 + InstrSizeCExt;
3807 // Using tail call we move ret instruction from caller to callee.
3808 FrameOverhead = 0;
3809 } else {
3810 // call t0, function = 8 bytes.
3811 CallOverhead = 8;
3812 // jr t0 = 4 bytes, 2 bytes if compressed instructions are enabled.
3813 FrameOverhead = InstrSizeCExt;
3814 }
3815
3816 // If we have CFI instructions, we can only outline if the outlined section
3817 // can be a tail call.
3818 if (MOCI != MachineOutlinerTailCall && CFICount > 0)
3819 return std::nullopt;
3820
3822 // Set per-candidate overhead based on X5 availability
3823 for (auto &C : RepeatedSequenceLocs) {
3824
3825 if (C.isAvailableAcrossAndOutOfSeq(RISCV::X5, RegInfo)) {
3826 // X5 is available, just need the call
3827 unsigned CandCallOverhead = 8;
3828 C.setCallInfo(MachineOutlinerDefault, CandCallOverhead);
3829 } else {
3830 // X5 unavailable, need save + call + restore
3831 // Save (2-4) + Call (8) + Restore (2-4)
3832 unsigned CandCallOverhead = InstrSizeCExt + 8 + InstrSizeCExt;
3833 C.setCallInfo(MachineOutlinerRegSave, CandCallOverhead);
3834 }
3835 }
3836 } else {
3837 for (auto &C : RepeatedSequenceLocs)
3838 C.setCallInfo(MOCI, CallOverhead);
3839 }
3840
3841 unsigned SequenceSize = 0;
3842 for (auto &MI : Candidate)
3843 SequenceSize += getInstSizeInBytes(MI);
3844
3845 return std::make_unique<outliner::OutlinedFunction>(
3846 RepeatedSequenceLocs, SequenceSize, FrameOverhead, MOCI);
3847}
3848
3852 unsigned Flags) const {
3853 MachineInstr &MI = *MBBI;
3854 MachineBasicBlock *MBB = MI.getParent();
3855 const TargetRegisterInfo *TRI =
3856 MBB->getParent()->getSubtarget().getRegisterInfo();
3857 const auto &F = MI.getMF()->getFunction();
3858
3859 // We can only outline CFI instructions if we will tail call the outlined
3860 // function, or fix up the CFI offsets. Currently, CFI instructions are
3861 // outlined only if in a tail call.
3862 if (MI.isCFIInstruction())
3864
3865 if (cannotInsertTailCall(*MBB) &&
3866 (MI.isReturn() || isMIModifiesReg(MI, TRI, RISCV::X5)))
3868
3869 // Make sure the operands don't reference something unsafe.
3870 for (const auto &MO : MI.operands()) {
3871
3872 // pcrel-hi and pcrel-lo can't put in separate sections, filter that out
3873 // if any possible.
3874 if (MO.getTargetFlags() == RISCVII::MO_PCREL_LO &&
3875 (MI.getMF()->getTarget().getFunctionSections() || F.hasComdat() ||
3876 F.hasSection() || F.getSectionPrefix()))
3878 }
3879
3880 if (isLPAD(MI))
3882
3884}
3885
3888 const outliner::OutlinedFunction &OF) const {
3889
3890 if (OF.FrameConstructionID == MachineOutlinerTailCall)
3891 return;
3892
3893 MBB.addLiveIn(RISCV::X5);
3894
3895 // Add in a return instruction to the end of the outlined frame.
3896 MBB.insert(MBB.end(), BuildMI(MF, DebugLoc(), get(RISCV::JALR))
3897 .addReg(RISCV::X0, RegState::Define)
3898 .addReg(RISCV::X5)
3899 .addImm(0));
3900}
3901
3905
3906 if (C.CallConstructionID == MachineOutlinerTailCall) {
3907 It = MBB.insert(It, BuildMI(MF, DebugLoc(), get(RISCV::PseudoTAIL))
3908 .addGlobalAddress(M.getNamedValue(MF.getName()),
3909 /*Offset=*/0, RISCVII::MO_CALL));
3910 return It;
3911 }
3912
3913 if (C.CallConstructionID == MachineOutlinerRegSave) {
3914 Register SaveReg = findRegisterToSaveX5To(C, RegInfo);
3915 assert(SaveReg && "Cannot find an available register to save/restore X5.");
3916
3917 // Save: ADDI SaveReg, X5, 0 (equivalent to MV SaveReg, X5)
3918 It = MBB.insert(It, BuildMI(MF, DebugLoc(), get(RISCV::ADDI), SaveReg)
3919 .addReg(RISCV::X5)
3920 .addImm(0));
3921 It++;
3922
3923 // Call: PseudoCALLReg X5
3924 It = MBB.insert(
3925 It, BuildMI(MF, DebugLoc(), get(RISCV::PseudoCALLReg), RISCV::X5)
3926 .addGlobalAddress(M.getNamedValue(MF.getName()), 0,
3928 MachineBasicBlock::iterator CallPt = It;
3929 It++;
3930
3931 // Restore: ADDI X5, SaveReg, 0 (equivalent to MV X5, SaveReg)
3932 It = MBB.insert(It, BuildMI(MF, DebugLoc(), get(RISCV::ADDI), RISCV::X5)
3933 .addReg(SaveReg)
3934 .addImm(0));
3935
3936 return CallPt;
3937 }
3938
3939 // Add in a call instruction to the outlined function at the given location.
3940 It = MBB.insert(It,
3941 BuildMI(MF, DebugLoc(), get(RISCV::PseudoCALLReg), RISCV::X5)
3942 .addGlobalAddress(M.getNamedValue(MF.getName()), 0,
3944 return It;
3945}
3946
3949 DebugLoc &DL,
3950 bool AllowSideEffects) const {
3951
3952 const MachineFunction &MF = *MBB.getParent();
3953 const RISCVRegisterInfo &TRI = *STI.getRegisterInfo();
3954
3955 if (TRI.isGeneralPurposeRegister(MF, Reg)) {
3956 BuildMI(MBB, Iter, DL, get(RISCV::PseudoClearGPR), Reg);
3957 } else {
3959 "buildClearRegister is not implemented for non-GPR registers");
3960 }
3961}
3962
3963std::optional<RegImmPair> RISCVInstrInfo::isAddImmediate(const MachineInstr &MI,
3964 Register Reg) const {
3965 // TODO: Handle cases where Reg is a super- or sub-register of the
3966 // destination register.
3967 const MachineOperand &Op0 = MI.getOperand(0);
3968 if (!Op0.isReg() || Reg != Op0.getReg())
3969 return std::nullopt;
3970
3971 // Don't consider ADDIW as a candidate because the caller may not be aware
3972 // of its sign extension behaviour.
3973 if (MI.getOpcode() == RISCV::ADDI && MI.getOperand(1).isReg() &&
3974 MI.getOperand(2).isImm())
3975 return RegImmPair{MI.getOperand(1).getReg(), MI.getOperand(2).getImm()};
3976
3977 return std::nullopt;
3978}
3979
3980// MIR printer helper function to annotate Operands with a comment.
3982 const MachineInstr &MI, const MachineOperand &Op, unsigned OpIdx,
3983 const TargetRegisterInfo *TRI) const {
3984 // Print a generic comment for this operand if there is one.
3985 std::string GenericComment =
3987 if (!GenericComment.empty())
3988 return GenericComment;
3989
3990 const MCInstrDesc &Desc = MI.getDesc();
3991 if (OpIdx >= Desc.getNumOperands())
3992 return std::string();
3993
3994 std::string Comment;
3995 raw_string_ostream OS(Comment);
3996
3997 const MCOperandInfo &OpInfo = Desc.operands()[OpIdx];
3998
3999 // Print the full VType operand of vsetvli/vsetivli instructions, and the SEW
4000 // operand of vector codegen pseudos.
4001 switch (OpInfo.OperandType) {
4004 unsigned Imm = Op.getImm();
4005 RISCVVType::printVType(Imm, OS);
4006 break;
4007 }
4009 unsigned Imm = Op.getImm();
4011 break;
4012 }
4014 unsigned Imm = Op.getImm();
4015 OS << "w" << Imm;
4016 break;
4017 }
4020 unsigned Log2SEW = Op.getImm();
4021 unsigned SEW = Log2SEW ? 1 << Log2SEW : 8;
4022 assert(RISCVVType::isValidSEW(SEW) && "Unexpected SEW");
4023 OS << "e" << SEW;
4024 break;
4025 }
4027 unsigned Policy = Op.getImm();
4029 "Invalid Policy Value");
4030 OS << (Policy & RISCVVType::TAIL_AGNOSTIC ? "ta" : "tu") << ", "
4031 << (Policy & RISCVVType::MASK_AGNOSTIC ? "ma" : "mu");
4032 break;
4033 }
4035 if (Op.isImm() && Op.getImm() == -1)
4036 OS << "vl=VLMAX";
4037 else
4038 OS << "vl";
4039 break;
4041 if (RISCVII::usesVXRM(Desc.TSFlags)) {
4043 auto VXRM = static_cast<RISCVVXRndMode::RoundingMode>(Op.getImm());
4044 OS << "vxrm=" << RISCVVXRndMode::roundingModeToString(VXRM);
4045 } else {
4047 auto FRM = static_cast<RISCVFPRndMode::RoundingMode>(Op.getImm());
4048 OS << "frm=" << RISCVFPRndMode::roundingModeToString(FRM);
4049 }
4050 break;
4051 }
4052
4053 return Comment;
4054}
4055
4056// clang-format off
4057#define CASE_RVV_OPCODE_UNMASK_LMUL(OP, LMUL) \
4058 RISCV::Pseudo##OP##_##LMUL
4059
4060#define CASE_RVV_OPCODE_MASK_LMUL(OP, LMUL) \
4061 RISCV::Pseudo##OP##_##LMUL##_MASK
4062
4063#define CASE_RVV_OPCODE_LMUL(OP, LMUL) \
4064 CASE_RVV_OPCODE_UNMASK_LMUL(OP, LMUL): \
4065 case CASE_RVV_OPCODE_MASK_LMUL(OP, LMUL)
4066
4067#define CASE_RVV_OPCODE_UNMASK_WIDEN(OP) \
4068 CASE_RVV_OPCODE_UNMASK_LMUL(OP, MF8): \
4069 case CASE_RVV_OPCODE_UNMASK_LMUL(OP, MF4): \
4070 case CASE_RVV_OPCODE_UNMASK_LMUL(OP, MF2): \
4071 case CASE_RVV_OPCODE_UNMASK_LMUL(OP, M1): \
4072 case CASE_RVV_OPCODE_UNMASK_LMUL(OP, M2): \
4073 case CASE_RVV_OPCODE_UNMASK_LMUL(OP, M4)
4074
4075#define CASE_RVV_OPCODE_UNMASK(OP) \
4076 CASE_RVV_OPCODE_UNMASK_WIDEN(OP): \
4077 case CASE_RVV_OPCODE_UNMASK_LMUL(OP, M8)
4078
4079#define CASE_RVV_OPCODE_MASK_WIDEN(OP) \
4080 CASE_RVV_OPCODE_MASK_LMUL(OP, MF8): \
4081 case CASE_RVV_OPCODE_MASK_LMUL(OP, MF4): \
4082 case CASE_RVV_OPCODE_MASK_LMUL(OP, MF2): \
4083 case CASE_RVV_OPCODE_MASK_LMUL(OP, M1): \
4084 case CASE_RVV_OPCODE_MASK_LMUL(OP, M2): \
4085 case CASE_RVV_OPCODE_MASK_LMUL(OP, M4)
4086
4087#define CASE_RVV_OPCODE_MASK(OP) \
4088 CASE_RVV_OPCODE_MASK_WIDEN(OP): \
4089 case CASE_RVV_OPCODE_MASK_LMUL(OP, M8)
4090
4091#define CASE_RVV_OPCODE_WIDEN(OP) \
4092 CASE_RVV_OPCODE_UNMASK_WIDEN(OP): \
4093 case CASE_RVV_OPCODE_MASK_WIDEN(OP)
4094
4095#define CASE_RVV_OPCODE(OP) \
4096 CASE_RVV_OPCODE_UNMASK(OP): \
4097 case CASE_RVV_OPCODE_MASK(OP)
4098// clang-format on
4099
4100// clang-format off
4101#define CASE_VMA_OPCODE_COMMON(OP, TYPE, LMUL) \
4102 RISCV::PseudoV##OP##_##TYPE##_##LMUL
4103
4104#define CASE_VMA_OPCODE_LMULS(OP, TYPE) \
4105 CASE_VMA_OPCODE_COMMON(OP, TYPE, MF8): \
4106 case CASE_VMA_OPCODE_COMMON(OP, TYPE, MF4): \
4107 case CASE_VMA_OPCODE_COMMON(OP, TYPE, MF2): \
4108 case CASE_VMA_OPCODE_COMMON(OP, TYPE, M1): \
4109 case CASE_VMA_OPCODE_COMMON(OP, TYPE, M2): \
4110 case CASE_VMA_OPCODE_COMMON(OP, TYPE, M4): \
4111 case CASE_VMA_OPCODE_COMMON(OP, TYPE, M8)
4112
4113// VFMA instructions are SEW specific.
4114#define CASE_VFMA_OPCODE_COMMON(OP, TYPE, LMUL, SEW) \
4115 RISCV::PseudoV##OP##_##TYPE##_##LMUL##_##SEW
4116
4117#define CASE_VFMA_OPCODE_LMULS_M1(OP, TYPE, SEW) \
4118 CASE_VFMA_OPCODE_COMMON(OP, TYPE, M1, SEW): \
4119 case CASE_VFMA_OPCODE_COMMON(OP, TYPE, M2, SEW): \
4120 case CASE_VFMA_OPCODE_COMMON(OP, TYPE, M4, SEW): \
4121 case CASE_VFMA_OPCODE_COMMON(OP, TYPE, M8, SEW)
4122
4123#define CASE_VFMA_OPCODE_LMULS_MF2(OP, TYPE, SEW) \
4124 CASE_VFMA_OPCODE_COMMON(OP, TYPE, MF2, SEW): \
4125 case CASE_VFMA_OPCODE_LMULS_M1(OP, TYPE, SEW)
4126
4127#define CASE_VFMA_OPCODE_LMULS_MF4(OP, TYPE, SEW) \
4128 CASE_VFMA_OPCODE_COMMON(OP, TYPE, MF4, SEW): \
4129 case CASE_VFMA_OPCODE_LMULS_MF2(OP, TYPE, SEW)
4130
4131#define CASE_VFMA_OPCODE_VV(OP) \
4132 CASE_VFMA_OPCODE_LMULS_MF4(OP, VV, E16): \
4133 case CASE_VFMA_OPCODE_LMULS_MF4(OP##_ALT, VV, E16): \
4134 case CASE_VFMA_OPCODE_LMULS_MF2(OP, VV, E32): \
4135 case CASE_VFMA_OPCODE_LMULS_M1(OP, VV, E64)
4136
4137#define CASE_VFMA_SPLATS(OP) \
4138 CASE_VFMA_OPCODE_LMULS_MF4(OP, VFPR16, E16): \
4139 case CASE_VFMA_OPCODE_LMULS_MF4(OP##_ALT, VFPR16, E16): \
4140 case CASE_VFMA_OPCODE_LMULS_MF2(OP, VFPR32, E32): \
4141 case CASE_VFMA_OPCODE_LMULS_M1(OP, VFPR64, E64)
4142// clang-format on
4143
4145 unsigned &SrcOpIdx1,
4146 unsigned &SrcOpIdx2) const {
4147 const MCInstrDesc &Desc = MI.getDesc();
4148 if (!Desc.isCommutable())
4149 return false;
4150
4151 switch (MI.getOpcode()) {
4152 case RISCV::TH_MVEQZ:
4153 case RISCV::TH_MVNEZ:
4154 // We can't commute operands if operand 2 (i.e., rs1 in
4155 // mveqz/mvnez rd,rs1,rs2) is the zero-register (as it is
4156 // not valid as the in/out-operand 1).
4157 if (MI.getOperand(2).getReg() == RISCV::X0)
4158 return false;
4159 // Operands 1 and 2 are commutable, if we switch the opcode.
4160 return fixCommutedOpIndices(SrcOpIdx1, SrcOpIdx2, 1, 2);
4161 case RISCV::QC_SELECTIEQ:
4162 case RISCV::QC_SELECTINE:
4163 case RISCV::QC_SELECTIIEQ:
4164 case RISCV::QC_SELECTIINE:
4165 return fixCommutedOpIndices(SrcOpIdx1, SrcOpIdx2, 1, 2);
4166 case RISCV::QC_MVEQ:
4167 case RISCV::QC_MVNE:
4168 case RISCV::QC_MVLT:
4169 case RISCV::QC_MVGE:
4170 case RISCV::QC_MVLTU:
4171 case RISCV::QC_MVGEU:
4172 case RISCV::QC_MVEQI:
4173 case RISCV::QC_MVNEI:
4174 case RISCV::QC_MVLTI:
4175 case RISCV::QC_MVGEI:
4176 case RISCV::QC_MVLTUI:
4177 case RISCV::QC_MVGEUI:
4178 return fixCommutedOpIndices(SrcOpIdx1, SrcOpIdx2, 1, 4);
4179 case RISCV::TH_MULA:
4180 case RISCV::TH_MULAW:
4181 case RISCV::TH_MULAH:
4182 case RISCV::TH_MULS:
4183 case RISCV::TH_MULSW:
4184 case RISCV::TH_MULSH:
4185 // Operands 2 and 3 are commutable.
4186 return fixCommutedOpIndices(SrcOpIdx1, SrcOpIdx2, 2, 3);
4187 case RISCV::PseudoCCMOVGPRNoX0:
4188 case RISCV::PseudoCCMOVGPR:
4189 // Operands 1 and 2 are commutable.
4190 return fixCommutedOpIndices(SrcOpIdx1, SrcOpIdx2, 1, 2);
4191 case CASE_RVV_OPCODE(VADD_VV):
4192 case CASE_RVV_OPCODE(VAND_VV):
4193 case CASE_RVV_OPCODE(VOR_VV):
4194 case CASE_RVV_OPCODE(VXOR_VV):
4195 case CASE_RVV_OPCODE_MASK(VMSEQ_VV):
4196 case CASE_RVV_OPCODE_MASK(VMSNE_VV):
4197 case CASE_RVV_OPCODE(VMIN_VV):
4198 case CASE_RVV_OPCODE(VMINU_VV):
4199 case CASE_RVV_OPCODE(VMAX_VV):
4200 case CASE_RVV_OPCODE(VMAXU_VV):
4201 case CASE_RVV_OPCODE(VMUL_VV):
4202 case CASE_RVV_OPCODE(VMULH_VV):
4203 case CASE_RVV_OPCODE(VMULHU_VV):
4204 case CASE_RVV_OPCODE_WIDEN(VWADD_VV):
4205 case CASE_RVV_OPCODE_WIDEN(VWADDU_VV):
4206 case CASE_RVV_OPCODE_WIDEN(VWMUL_VV):
4207 case CASE_RVV_OPCODE_WIDEN(VWMULU_VV):
4208 case CASE_RVV_OPCODE_WIDEN(VWMACC_VV):
4209 case CASE_RVV_OPCODE_WIDEN(VWMACCU_VV):
4210 case CASE_RVV_OPCODE(VABD_VV):
4211 case CASE_RVV_OPCODE(VABDU_VV):
4212 case CASE_RVV_OPCODE_WIDEN(VWABDA_VV):
4213 case CASE_RVV_OPCODE_WIDEN(VWABDAU_VV):
4214 case CASE_RVV_OPCODE_UNMASK(VADC_VVM):
4215 case CASE_RVV_OPCODE(VSADD_VV):
4216 case CASE_RVV_OPCODE(VSADDU_VV):
4217 case CASE_RVV_OPCODE(VAADD_VV):
4218 case CASE_RVV_OPCODE(VAADDU_VV):
4219 case CASE_RVV_OPCODE(VSMUL_VV):
4220 case CASE_RVV_OPCODE_LMUL(VDOT4A_VV, MF2):
4221 case CASE_RVV_OPCODE_LMUL(VDOT4A_VV, M1):
4222 case CASE_RVV_OPCODE_LMUL(VDOT4A_VV, M2):
4223 case CASE_RVV_OPCODE_LMUL(VDOT4A_VV, M4):
4224 case CASE_RVV_OPCODE_LMUL(VDOT4A_VV, M8):
4225 case CASE_RVV_OPCODE_LMUL(VDOT4AU_VV, MF2):
4226 case CASE_RVV_OPCODE_LMUL(VDOT4AU_VV, M1):
4227 case CASE_RVV_OPCODE_LMUL(VDOT4AU_VV, M2):
4228 case CASE_RVV_OPCODE_LMUL(VDOT4AU_VV, M4):
4229 case CASE_RVV_OPCODE_LMUL(VDOT4AU_VV, M8):
4230 // Operands 2 and 3 are commutable.
4231 return fixCommutedOpIndices(SrcOpIdx1, SrcOpIdx2, 2, 3);
4232 case CASE_VFMA_SPLATS(FMADD):
4233 case CASE_VFMA_SPLATS(FMSUB):
4234 case CASE_VFMA_SPLATS(FMACC):
4235 case CASE_VFMA_SPLATS(FMSAC):
4238 case CASE_VFMA_SPLATS(FNMACC):
4239 case CASE_VFMA_SPLATS(FNMSAC):
4240 case CASE_VFMA_OPCODE_VV(FMACC):
4241 case CASE_VFMA_OPCODE_VV(FMSAC):
4242 case CASE_VFMA_OPCODE_VV(FNMACC):
4243 case CASE_VFMA_OPCODE_VV(FNMSAC):
4244 case CASE_VMA_OPCODE_LMULS(MADD, VX):
4245 case CASE_VMA_OPCODE_LMULS(NMSUB, VX):
4246 case CASE_VMA_OPCODE_LMULS(MACC, VX):
4247 case CASE_VMA_OPCODE_LMULS(NMSAC, VX):
4248 case CASE_VMA_OPCODE_LMULS(MACC, VV):
4249 case CASE_VMA_OPCODE_LMULS(NMSAC, VV): {
4250 // If the tail policy is undisturbed we can't commute.
4251 assert(RISCVII::hasVecPolicyOp(MI.getDesc().TSFlags));
4252 if ((MI.getOperand(RISCVII::getVecPolicyOpNum(MI.getDesc())).getImm() &
4253 1) == 0)
4254 return false;
4255
4256 // For these instructions we can only swap operand 1 and operand 3 by
4257 // changing the opcode.
4258 unsigned CommutableOpIdx1 = 1;
4259 unsigned CommutableOpIdx2 = 3;
4260 if (!fixCommutedOpIndices(SrcOpIdx1, SrcOpIdx2, CommutableOpIdx1,
4261 CommutableOpIdx2))
4262 return false;
4263 return true;
4264 }
4265 case CASE_VFMA_OPCODE_VV(FMADD):
4269 case CASE_VMA_OPCODE_LMULS(MADD, VV):
4270 case CASE_VMA_OPCODE_LMULS(NMSUB, VV): {
4271 // If the tail policy is undisturbed we can't commute.
4272 assert(RISCVII::hasVecPolicyOp(MI.getDesc().TSFlags));
4273 if ((MI.getOperand(RISCVII::getVecPolicyOpNum(MI.getDesc())).getImm() &
4274 1) == 0)
4275 return false;
4276
4277 // For these instructions we have more freedom. We can commute with the
4278 // other multiplicand or with the addend/subtrahend/minuend.
4279
4280 // Any fixed operand must be from source 1, 2 or 3.
4281 if (SrcOpIdx1 != CommuteAnyOperandIndex && SrcOpIdx1 > 3)
4282 return false;
4283 if (SrcOpIdx2 != CommuteAnyOperandIndex && SrcOpIdx2 > 3)
4284 return false;
4285
4286 // It both ops are fixed one must be the tied source.
4287 if (SrcOpIdx1 != CommuteAnyOperandIndex &&
4288 SrcOpIdx2 != CommuteAnyOperandIndex && SrcOpIdx1 != 1 && SrcOpIdx2 != 1)
4289 return false;
4290
4291 // Look for two different register operands assumed to be commutable
4292 // regardless of the FMA opcode. The FMA opcode is adjusted later if
4293 // needed.
4294 if (SrcOpIdx1 == CommuteAnyOperandIndex ||
4295 SrcOpIdx2 == CommuteAnyOperandIndex) {
4296 // At least one of operands to be commuted is not specified and
4297 // this method is free to choose appropriate commutable operands.
4298 unsigned CommutableOpIdx1 = SrcOpIdx1;
4299 if (SrcOpIdx1 == SrcOpIdx2) {
4300 // Both of operands are not fixed. Set one of commutable
4301 // operands to the tied source.
4302 CommutableOpIdx1 = 1;
4303 } else if (SrcOpIdx1 == CommuteAnyOperandIndex) {
4304 // Only one of the operands is not fixed.
4305 CommutableOpIdx1 = SrcOpIdx2;
4306 }
4307
4308 // CommutableOpIdx1 is well defined now. Let's choose another commutable
4309 // operand and assign its index to CommutableOpIdx2.
4310 unsigned CommutableOpIdx2;
4311 if (CommutableOpIdx1 != 1) {
4312 // If we haven't already used the tied source, we must use it now.
4313 CommutableOpIdx2 = 1;
4314 } else {
4315 Register Op1Reg = MI.getOperand(CommutableOpIdx1).getReg();
4316
4317 // The commuted operands should have different registers.
4318 // Otherwise, the commute transformation does not change anything and
4319 // is useless. We use this as a hint to make our decision.
4320 if (Op1Reg != MI.getOperand(2).getReg())
4321 CommutableOpIdx2 = 2;
4322 else
4323 CommutableOpIdx2 = 3;
4324 }
4325
4326 // Assign the found pair of commutable indices to SrcOpIdx1 and
4327 // SrcOpIdx2 to return those values.
4328 if (!fixCommutedOpIndices(SrcOpIdx1, SrcOpIdx2, CommutableOpIdx1,
4329 CommutableOpIdx2))
4330 return false;
4331 }
4332
4333 return true;
4334 }
4335 }
4336
4337 return TargetInstrInfo::findCommutedOpIndices(MI, SrcOpIdx1, SrcOpIdx2);
4338}
4339
4340// clang-format off
4341#define CASE_VMA_CHANGE_OPCODE_COMMON(OLDOP, NEWOP, TYPE, LMUL) \
4342 case RISCV::PseudoV##OLDOP##_##TYPE##_##LMUL: \
4343 Opc = RISCV::PseudoV##NEWOP##_##TYPE##_##LMUL; \
4344 break;
4345
4346#define CASE_VMA_CHANGE_OPCODE_LMULS(OLDOP, NEWOP, TYPE) \
4347 CASE_VMA_CHANGE_OPCODE_COMMON(OLDOP, NEWOP, TYPE, MF8) \
4348 CASE_VMA_CHANGE_OPCODE_COMMON(OLDOP, NEWOP, TYPE, MF4) \
4349 CASE_VMA_CHANGE_OPCODE_COMMON(OLDOP, NEWOP, TYPE, MF2) \
4350 CASE_VMA_CHANGE_OPCODE_COMMON(OLDOP, NEWOP, TYPE, M1) \
4351 CASE_VMA_CHANGE_OPCODE_COMMON(OLDOP, NEWOP, TYPE, M2) \
4352 CASE_VMA_CHANGE_OPCODE_COMMON(OLDOP, NEWOP, TYPE, M4) \
4353 CASE_VMA_CHANGE_OPCODE_COMMON(OLDOP, NEWOP, TYPE, M8)
4354
4355// VFMA depends on SEW.
4356#define CASE_VFMA_CHANGE_OPCODE_COMMON(OLDOP, NEWOP, TYPE, LMUL, SEW) \
4357 case RISCV::PseudoV##OLDOP##_##TYPE##_##LMUL##_##SEW: \
4358 Opc = RISCV::PseudoV##NEWOP##_##TYPE##_##LMUL##_##SEW; \
4359 break;
4360
4361#define CASE_VFMA_CHANGE_OPCODE_LMULS_M1(OLDOP, NEWOP, TYPE, SEW) \
4362 CASE_VFMA_CHANGE_OPCODE_COMMON(OLDOP, NEWOP, TYPE, M1, SEW) \
4363 CASE_VFMA_CHANGE_OPCODE_COMMON(OLDOP, NEWOP, TYPE, M2, SEW) \
4364 CASE_VFMA_CHANGE_OPCODE_COMMON(OLDOP, NEWOP, TYPE, M4, SEW) \
4365 CASE_VFMA_CHANGE_OPCODE_COMMON(OLDOP, NEWOP, TYPE, M8, SEW)
4366
4367#define CASE_VFMA_CHANGE_OPCODE_LMULS_MF2(OLDOP, NEWOP, TYPE, SEW) \
4368 CASE_VFMA_CHANGE_OPCODE_COMMON(OLDOP, NEWOP, TYPE, MF2, SEW) \
4369 CASE_VFMA_CHANGE_OPCODE_LMULS_M1(OLDOP, NEWOP, TYPE, SEW)
4370
4371#define CASE_VFMA_CHANGE_OPCODE_LMULS_MF4(OLDOP, NEWOP, TYPE, SEW) \
4372 CASE_VFMA_CHANGE_OPCODE_COMMON(OLDOP, NEWOP, TYPE, MF4, SEW) \
4373 CASE_VFMA_CHANGE_OPCODE_LMULS_MF2(OLDOP, NEWOP, TYPE, SEW)
4374
4375#define CASE_VFMA_CHANGE_OPCODE_VV(OLDOP, NEWOP) \
4376 CASE_VFMA_CHANGE_OPCODE_LMULS_MF4(OLDOP, NEWOP, VV, E16) \
4377 CASE_VFMA_CHANGE_OPCODE_LMULS_MF4(OLDOP##_ALT, NEWOP##_ALT, VV, E16) \
4378 CASE_VFMA_CHANGE_OPCODE_LMULS_MF2(OLDOP, NEWOP, VV, E32) \
4379 CASE_VFMA_CHANGE_OPCODE_LMULS_M1(OLDOP, NEWOP, VV, E64)
4380
4381#define CASE_VFMA_CHANGE_OPCODE_SPLATS(OLDOP, NEWOP) \
4382 CASE_VFMA_CHANGE_OPCODE_LMULS_MF4(OLDOP, NEWOP, VFPR16, E16) \
4383 CASE_VFMA_CHANGE_OPCODE_LMULS_MF4(OLDOP##_ALT, NEWOP##_ALT, VFPR16, E16) \
4384 CASE_VFMA_CHANGE_OPCODE_LMULS_MF2(OLDOP, NEWOP, VFPR32, E32) \
4385 CASE_VFMA_CHANGE_OPCODE_LMULS_M1(OLDOP, NEWOP, VFPR64, E64)
4386// clang-format on
4387
4389 bool NewMI,
4390 unsigned OpIdx1,
4391 unsigned OpIdx2) const {
4392 auto cloneIfNew = [NewMI](MachineInstr &MI) -> MachineInstr & {
4393 if (NewMI)
4394 return *MI.getParent()->getParent()->CloneMachineInstr(&MI);
4395 return MI;
4396 };
4397
4398 switch (MI.getOpcode()) {
4399 case RISCV::TH_MVEQZ:
4400 case RISCV::TH_MVNEZ: {
4401 auto &WorkingMI = cloneIfNew(MI);
4402 WorkingMI.setDesc(get(MI.getOpcode() == RISCV::TH_MVEQZ ? RISCV::TH_MVNEZ
4403 : RISCV::TH_MVEQZ));
4404 return TargetInstrInfo::commuteInstructionImpl(WorkingMI, false, OpIdx1,
4405 OpIdx2);
4406 }
4407 case RISCV::QC_SELECTIEQ:
4408 case RISCV::QC_SELECTINE:
4409 case RISCV::QC_SELECTIIEQ:
4410 case RISCV::QC_SELECTIINE:
4411 return TargetInstrInfo::commuteInstructionImpl(MI, NewMI, OpIdx1, OpIdx2);
4412 case RISCV::QC_MVEQ:
4413 case RISCV::QC_MVNE:
4414 case RISCV::QC_MVLT:
4415 case RISCV::QC_MVGE:
4416 case RISCV::QC_MVLTU:
4417 case RISCV::QC_MVGEU:
4418 case RISCV::QC_MVEQI:
4419 case RISCV::QC_MVNEI:
4420 case RISCV::QC_MVLTI:
4421 case RISCV::QC_MVGEI:
4422 case RISCV::QC_MVLTUI:
4423 case RISCV::QC_MVGEUI: {
4424 auto &WorkingMI = cloneIfNew(MI);
4425 WorkingMI.setDesc(get(getInverseXqcicmOpcode(MI.getOpcode())));
4426 return TargetInstrInfo::commuteInstructionImpl(WorkingMI, false, OpIdx1,
4427 OpIdx2);
4428 }
4429 case RISCV::PseudoCCMOVGPRNoX0:
4430 case RISCV::PseudoCCMOVGPR: {
4431 // CCMOV can be commuted by inverting the condition.
4432 unsigned BCC = MI.getOperand(MI.getNumExplicitOperands() - 3).getImm();
4434 auto &WorkingMI = cloneIfNew(MI);
4435 WorkingMI.getOperand(MI.getNumExplicitOperands() - 3).setImm(BCC);
4436 return TargetInstrInfo::commuteInstructionImpl(WorkingMI, /*NewMI*/ false,
4437 OpIdx1, OpIdx2);
4438 }
4439 case CASE_VFMA_SPLATS(FMACC):
4440 case CASE_VFMA_SPLATS(FMADD):
4441 case CASE_VFMA_SPLATS(FMSAC):
4442 case CASE_VFMA_SPLATS(FMSUB):
4443 case CASE_VFMA_SPLATS(FNMACC):
4445 case CASE_VFMA_SPLATS(FNMSAC):
4447 case CASE_VFMA_OPCODE_VV(FMACC):
4448 case CASE_VFMA_OPCODE_VV(FMSAC):
4449 case CASE_VFMA_OPCODE_VV(FNMACC):
4450 case CASE_VFMA_OPCODE_VV(FNMSAC):
4451 case CASE_VMA_OPCODE_LMULS(MADD, VX):
4452 case CASE_VMA_OPCODE_LMULS(NMSUB, VX):
4453 case CASE_VMA_OPCODE_LMULS(MACC, VX):
4454 case CASE_VMA_OPCODE_LMULS(NMSAC, VX):
4455 case CASE_VMA_OPCODE_LMULS(MACC, VV):
4456 case CASE_VMA_OPCODE_LMULS(NMSAC, VV): {
4457 // It only make sense to toggle these between clobbering the
4458 // addend/subtrahend/minuend one of the multiplicands.
4459 assert((OpIdx1 == 1 || OpIdx2 == 1) && "Unexpected opcode index");
4460 assert((OpIdx1 == 3 || OpIdx2 == 3) && "Unexpected opcode index");
4461 unsigned Opc;
4462 switch (MI.getOpcode()) {
4463 default:
4464 llvm_unreachable("Unexpected opcode");
4465 CASE_VFMA_CHANGE_OPCODE_SPLATS(FMACC, FMADD)
4466 CASE_VFMA_CHANGE_OPCODE_SPLATS(FMADD, FMACC)
4473 CASE_VFMA_CHANGE_OPCODE_VV(FMACC, FMADD)
4477 CASE_VMA_CHANGE_OPCODE_LMULS(MACC, MADD, VX)
4478 CASE_VMA_CHANGE_OPCODE_LMULS(MADD, MACC, VX)
4479 CASE_VMA_CHANGE_OPCODE_LMULS(NMSAC, NMSUB, VX)
4480 CASE_VMA_CHANGE_OPCODE_LMULS(NMSUB, NMSAC, VX)
4481 CASE_VMA_CHANGE_OPCODE_LMULS(MACC, MADD, VV)
4482 CASE_VMA_CHANGE_OPCODE_LMULS(NMSAC, NMSUB, VV)
4483 }
4484
4485 auto &WorkingMI = cloneIfNew(MI);
4486 WorkingMI.setDesc(get(Opc));
4487 return TargetInstrInfo::commuteInstructionImpl(WorkingMI, /*NewMI=*/false,
4488 OpIdx1, OpIdx2);
4489 }
4490 case CASE_VFMA_OPCODE_VV(FMADD):
4494 case CASE_VMA_OPCODE_LMULS(MADD, VV):
4495 case CASE_VMA_OPCODE_LMULS(NMSUB, VV): {
4496 assert((OpIdx1 == 1 || OpIdx2 == 1) && "Unexpected opcode index");
4497 // If one of the operands, is the addend we need to change opcode.
4498 // Otherwise we're just swapping 2 of the multiplicands.
4499 if (OpIdx1 == 3 || OpIdx2 == 3) {
4500 unsigned Opc;
4501 switch (MI.getOpcode()) {
4502 default:
4503 llvm_unreachable("Unexpected opcode");
4504 CASE_VFMA_CHANGE_OPCODE_VV(FMADD, FMACC)
4508 CASE_VMA_CHANGE_OPCODE_LMULS(MADD, MACC, VV)
4509 CASE_VMA_CHANGE_OPCODE_LMULS(NMSUB, NMSAC, VV)
4510 }
4511
4512 auto &WorkingMI = cloneIfNew(MI);
4513 WorkingMI.setDesc(get(Opc));
4514 return TargetInstrInfo::commuteInstructionImpl(WorkingMI, /*NewMI=*/false,
4515 OpIdx1, OpIdx2);
4516 }
4517 // Let the default code handle it.
4518 break;
4519 }
4520 }
4521
4522 return TargetInstrInfo::commuteInstructionImpl(MI, NewMI, OpIdx1, OpIdx2);
4523}
4524
4525#undef CASE_VMA_CHANGE_OPCODE_COMMON
4526#undef CASE_VMA_CHANGE_OPCODE_LMULS
4527#undef CASE_VFMA_CHANGE_OPCODE_COMMON
4528#undef CASE_VFMA_CHANGE_OPCODE_LMULS_M1
4529#undef CASE_VFMA_CHANGE_OPCODE_LMULS_MF2
4530#undef CASE_VFMA_CHANGE_OPCODE_LMULS_MF4
4531#undef CASE_VFMA_CHANGE_OPCODE_VV
4532#undef CASE_VFMA_CHANGE_OPCODE_SPLATS
4533
4534#undef CASE_RVV_OPCODE_UNMASK_LMUL
4535#undef CASE_RVV_OPCODE_MASK_LMUL
4536#undef CASE_RVV_OPCODE_LMUL
4537#undef CASE_RVV_OPCODE_UNMASK_WIDEN
4538#undef CASE_RVV_OPCODE_UNMASK
4539#undef CASE_RVV_OPCODE_MASK_WIDEN
4540#undef CASE_RVV_OPCODE_MASK
4541#undef CASE_RVV_OPCODE_WIDEN
4542#undef CASE_RVV_OPCODE
4543
4544#undef CASE_VMA_OPCODE_COMMON
4545#undef CASE_VMA_OPCODE_LMULS
4546#undef CASE_VFMA_OPCODE_COMMON
4547#undef CASE_VFMA_OPCODE_LMULS_M1
4548#undef CASE_VFMA_OPCODE_LMULS_MF2
4549#undef CASE_VFMA_OPCODE_LMULS_MF4
4550#undef CASE_VFMA_OPCODE_VV
4551#undef CASE_VFMA_SPLATS
4552
4554 switch (MI.getOpcode()) {
4555 default:
4556 break;
4557 case RISCV::ADD:
4558 case RISCV::OR:
4559 case RISCV::XOR:
4560 // Normalize (so we hit the next if clause).
4561 // add/[x]or rd, zero, rs => add/[x]or rd, rs, zero
4562 if (MI.getOperand(1).getReg() == RISCV::X0)
4563 commuteInstruction(MI);
4564 // add/[x]or rd, rs, zero => addi rd, rs, 0
4565 if (MI.getOperand(2).getReg() == RISCV::X0) {
4566 MI.getOperand(2).ChangeToImmediate(0);
4567 MI.setDesc(get(RISCV::ADDI));
4568 return true;
4569 }
4570 // xor rd, rs, rs => addi rd, zero, 0
4571 if (MI.getOpcode() == RISCV::XOR &&
4572 MI.getOperand(1).getReg() == MI.getOperand(2).getReg()) {
4573 MI.getOperand(1).setReg(RISCV::X0);
4574 MI.getOperand(2).ChangeToImmediate(0);
4575 MI.setDesc(get(RISCV::ADDI));
4576 return true;
4577 }
4578 break;
4579 case RISCV::ORI:
4580 case RISCV::XORI:
4581 // [x]ori rd, zero, N => addi rd, zero, N
4582 if (MI.getOperand(1).getReg() == RISCV::X0) {
4583 MI.setDesc(get(RISCV::ADDI));
4584 return true;
4585 }
4586 break;
4587 case RISCV::SUB:
4588 // sub rd, rs, zero => addi rd, rs, 0
4589 if (MI.getOperand(2).getReg() == RISCV::X0) {
4590 MI.getOperand(2).ChangeToImmediate(0);
4591 MI.setDesc(get(RISCV::ADDI));
4592 return true;
4593 }
4594 break;
4595 case RISCV::SUBW:
4596 // subw rd, rs, zero => addiw rd, rs, 0
4597 if (MI.getOperand(2).getReg() == RISCV::X0) {
4598 MI.getOperand(2).ChangeToImmediate(0);
4599 MI.setDesc(get(RISCV::ADDIW));
4600 return true;
4601 }
4602 break;
4603 case RISCV::ADDW:
4604 // Normalize (so we hit the next if clause).
4605 // addw rd, zero, rs => addw rd, rs, zero
4606 if (MI.getOperand(1).getReg() == RISCV::X0)
4607 commuteInstruction(MI);
4608 // addw rd, rs, zero => addiw rd, rs, 0
4609 if (MI.getOperand(2).getReg() == RISCV::X0) {
4610 MI.getOperand(2).ChangeToImmediate(0);
4611 MI.setDesc(get(RISCV::ADDIW));
4612 return true;
4613 }
4614 break;
4615 case RISCV::SH1ADD:
4616 case RISCV::SH1ADD_UW:
4617 case RISCV::SH2ADD:
4618 case RISCV::SH2ADD_UW:
4619 case RISCV::SH3ADD:
4620 case RISCV::SH3ADD_UW:
4621 // shNadd[.uw] rd, zero, rs => addi rd, rs, 0
4622 if (MI.getOperand(1).getReg() == RISCV::X0) {
4623 MI.removeOperand(1);
4624 MI.addOperand(MachineOperand::CreateImm(0));
4625 MI.setDesc(get(RISCV::ADDI));
4626 return true;
4627 }
4628 // shNadd[.uw] rd, rs, zero => slli[.uw] rd, rs, N
4629 if (MI.getOperand(2).getReg() == RISCV::X0) {
4630 MI.removeOperand(2);
4631 unsigned Opc = MI.getOpcode();
4632 if (Opc == RISCV::SH1ADD_UW || Opc == RISCV::SH2ADD_UW ||
4633 Opc == RISCV::SH3ADD_UW) {
4635 MI.setDesc(get(RISCV::SLLI_UW));
4636 return true;
4637 }
4639 MI.setDesc(get(RISCV::SLLI));
4640 return true;
4641 }
4642 break;
4643 case RISCV::AND:
4644 case RISCV::MUL:
4645 case RISCV::MULH:
4646 case RISCV::MULHSU:
4647 case RISCV::MULHU:
4648 case RISCV::MULW:
4649 // and rd, zero, rs => addi rd, zero, 0
4650 // mul* rd, zero, rs => addi rd, zero, 0
4651 // and rd, rs, zero => addi rd, zero, 0
4652 // mul* rd, rs, zero => addi rd, zero, 0
4653 if (MI.getOperand(1).getReg() == RISCV::X0 ||
4654 MI.getOperand(2).getReg() == RISCV::X0) {
4655 MI.getOperand(1).setReg(RISCV::X0);
4656 MI.getOperand(2).ChangeToImmediate(0);
4657 MI.setDesc(get(RISCV::ADDI));
4658 return true;
4659 }
4660 break;
4661 case RISCV::ANDI:
4662 // andi rd, zero, C => addi rd, zero, 0
4663 if (MI.getOperand(1).getReg() == RISCV::X0) {
4664 MI.getOperand(2).setImm(0);
4665 MI.setDesc(get(RISCV::ADDI));
4666 return true;
4667 }
4668 break;
4669 case RISCV::SLL:
4670 case RISCV::SRL:
4671 case RISCV::SRA:
4672 // shift rd, zero, rs => addi rd, zero, 0
4673 if (MI.getOperand(1).getReg() == RISCV::X0) {
4674 MI.getOperand(2).ChangeToImmediate(0);
4675 MI.setDesc(get(RISCV::ADDI));
4676 return true;
4677 }
4678 // shift rd, rs, zero => addi rd, rs, 0
4679 if (MI.getOperand(2).getReg() == RISCV::X0) {
4680 MI.getOperand(2).ChangeToImmediate(0);
4681 MI.setDesc(get(RISCV::ADDI));
4682 return true;
4683 }
4684 break;
4685 case RISCV::SLLW:
4686 case RISCV::SRLW:
4687 case RISCV::SRAW:
4688 // shiftw rd, zero, rs => addi rd, zero, 0
4689 if (MI.getOperand(1).getReg() == RISCV::X0) {
4690 MI.getOperand(2).ChangeToImmediate(0);
4691 MI.setDesc(get(RISCV::ADDI));
4692 return true;
4693 }
4694 break;
4695 case RISCV::SLLI:
4696 case RISCV::SRLI:
4697 case RISCV::SRAI:
4698 case RISCV::SLLIW:
4699 case RISCV::SRLIW:
4700 case RISCV::SRAIW:
4701 case RISCV::SLLI_UW:
4702 // shiftimm rd, zero, N => addi rd, zero, 0
4703 if (MI.getOperand(1).getReg() == RISCV::X0) {
4704 MI.getOperand(2).setImm(0);
4705 MI.setDesc(get(RISCV::ADDI));
4706 return true;
4707 }
4708 break;
4709 case RISCV::SLTU:
4710 case RISCV::ADD_UW:
4711 // sltu rd, zero, zero => addi rd, zero, 0
4712 // add.uw rd, zero, zero => addi rd, zero, 0
4713 if (MI.getOperand(1).getReg() == RISCV::X0 &&
4714 MI.getOperand(2).getReg() == RISCV::X0) {
4715 MI.getOperand(2).ChangeToImmediate(0);
4716 MI.setDesc(get(RISCV::ADDI));
4717 return true;
4718 }
4719 // add.uw rd, zero, rs => addi rd, rs, 0
4720 if (MI.getOpcode() == RISCV::ADD_UW &&
4721 MI.getOperand(1).getReg() == RISCV::X0) {
4722 MI.removeOperand(1);
4723 MI.addOperand(MachineOperand::CreateImm(0));
4724 MI.setDesc(get(RISCV::ADDI));
4725 }
4726 break;
4727 case RISCV::SLTIU:
4728 // sltiu rd, zero, NZC => addi rd, zero, 1
4729 // sltiu rd, zero, 0 => addi rd, zero, 0
4730 if (MI.getOperand(1).getReg() == RISCV::X0) {
4731 MI.getOperand(2).setImm(MI.getOperand(2).getImm() != 0);
4732 MI.setDesc(get(RISCV::ADDI));
4733 return true;
4734 }
4735 break;
4736 case RISCV::SEXT_H:
4737 case RISCV::SEXT_B:
4738 case RISCV::ZEXT_H_RV32:
4739 case RISCV::ZEXT_H_RV64:
4740 // sext.[hb] rd, zero => addi rd, zero, 0
4741 // zext.h rd, zero => addi rd, zero, 0
4742 if (MI.getOperand(1).getReg() == RISCV::X0) {
4743 MI.addOperand(MachineOperand::CreateImm(0));
4744 MI.setDesc(get(RISCV::ADDI));
4745 return true;
4746 }
4747 break;
4748 case RISCV::MIN:
4749 case RISCV::MINU:
4750 case RISCV::MAX:
4751 case RISCV::MAXU:
4752 // min|max rd, rs, rs => addi rd, rs, 0
4753 if (MI.getOperand(1).getReg() == MI.getOperand(2).getReg()) {
4754 MI.getOperand(2).ChangeToImmediate(0);
4755 MI.setDesc(get(RISCV::ADDI));
4756 return true;
4757 }
4758 break;
4759 case RISCV::BEQ:
4760 case RISCV::BNE:
4761 // b{eq,ne} zero, rs, imm => b{eq,ne} rs, zero, imm
4762 if (MI.getOperand(0).getReg() == RISCV::X0) {
4763 MachineOperand MO0 = MI.getOperand(0);
4764 MI.removeOperand(0);
4765 MI.insert(MI.operands_begin() + 1, {MO0});
4766 }
4767 break;
4768 case RISCV::BLTU:
4769 // bltu zero, rs, imm => bne rs, zero, imm
4770 if (MI.getOperand(0).getReg() == RISCV::X0) {
4771 MachineOperand MO0 = MI.getOperand(0);
4772 MI.removeOperand(0);
4773 MI.insert(MI.operands_begin() + 1, {MO0});
4774 MI.setDesc(get(RISCV::BNE));
4775 }
4776 break;
4777 case RISCV::BGEU:
4778 // bgeu zero, rs, imm => beq rs, zero, imm
4779 if (MI.getOperand(0).getReg() == RISCV::X0) {
4780 MachineOperand MO0 = MI.getOperand(0);
4781 MI.removeOperand(0);
4782 MI.insert(MI.operands_begin() + 1, {MO0});
4783 MI.setDesc(get(RISCV::BEQ));
4784 }
4785 break;
4786 }
4787 return false;
4788}
4789
4790// clang-format off
4791#define CASE_WIDEOP_OPCODE_COMMON(OP, LMUL) \
4792 RISCV::PseudoV##OP##_##LMUL##_TIED
4793
4794#define CASE_WIDEOP_OPCODE_LMULS(OP) \
4795 CASE_WIDEOP_OPCODE_COMMON(OP, MF8): \
4796 case CASE_WIDEOP_OPCODE_COMMON(OP, MF4): \
4797 case CASE_WIDEOP_OPCODE_COMMON(OP, MF2): \
4798 case CASE_WIDEOP_OPCODE_COMMON(OP, M1): \
4799 case CASE_WIDEOP_OPCODE_COMMON(OP, M2): \
4800 case CASE_WIDEOP_OPCODE_COMMON(OP, M4)
4801
4802#define CASE_WIDEOP_CHANGE_OPCODE_COMMON(OP, LMUL) \
4803 case RISCV::PseudoV##OP##_##LMUL##_TIED: \
4804 NewOpc = RISCV::PseudoV##OP##_##LMUL; \
4805 break;
4806
4807#define CASE_WIDEOP_CHANGE_OPCODE_LMULS(OP) \
4808 CASE_WIDEOP_CHANGE_OPCODE_COMMON(OP, MF8) \
4809 CASE_WIDEOP_CHANGE_OPCODE_COMMON(OP, MF4) \
4810 CASE_WIDEOP_CHANGE_OPCODE_COMMON(OP, MF2) \
4811 CASE_WIDEOP_CHANGE_OPCODE_COMMON(OP, M1) \
4812 CASE_WIDEOP_CHANGE_OPCODE_COMMON(OP, M2) \
4813 CASE_WIDEOP_CHANGE_OPCODE_COMMON(OP, M4)
4814
4815// FP Widening Ops may by SEW aware. Create SEW aware cases for these cases.
4816#define CASE_FP_WIDEOP_OPCODE_COMMON(OP, LMUL, SEW) \
4817 RISCV::PseudoV##OP##_##LMUL##_##SEW##_TIED
4818
4819#define CASE_FP_WIDEOP_OPCODE_LMULS(OP) \
4820 CASE_FP_WIDEOP_OPCODE_COMMON(OP, MF4, E16): \
4821 case CASE_FP_WIDEOP_OPCODE_COMMON(OP, MF2, E16): \
4822 case CASE_FP_WIDEOP_OPCODE_COMMON(OP, MF2, E32): \
4823 case CASE_FP_WIDEOP_OPCODE_COMMON(OP, M1, E16): \
4824 case CASE_FP_WIDEOP_OPCODE_COMMON(OP, M1, E32): \
4825 case CASE_FP_WIDEOP_OPCODE_COMMON(OP, M2, E16): \
4826 case CASE_FP_WIDEOP_OPCODE_COMMON(OP, M2, E32): \
4827 case CASE_FP_WIDEOP_OPCODE_COMMON(OP, M4, E16): \
4828 case CASE_FP_WIDEOP_OPCODE_COMMON(OP, M4, E32) \
4829
4830#define CASE_FP_WIDEOP_CHANGE_OPCODE_COMMON(OP, LMUL, SEW) \
4831 case RISCV::PseudoV##OP##_##LMUL##_##SEW##_TIED: \
4832 NewOpc = RISCV::PseudoV##OP##_##LMUL##_##SEW; \
4833 break;
4834
4835#define CASE_FP_WIDEOP_CHANGE_OPCODE_LMULS(OP) \
4836 CASE_FP_WIDEOP_CHANGE_OPCODE_COMMON(OP, MF4, E16) \
4837 CASE_FP_WIDEOP_CHANGE_OPCODE_COMMON(OP, MF2, E16) \
4838 CASE_FP_WIDEOP_CHANGE_OPCODE_COMMON(OP, MF2, E32) \
4839 CASE_FP_WIDEOP_CHANGE_OPCODE_COMMON(OP, M1, E16) \
4840 CASE_FP_WIDEOP_CHANGE_OPCODE_COMMON(OP, M1, E32) \
4841 CASE_FP_WIDEOP_CHANGE_OPCODE_COMMON(OP, M2, E16) \
4842 CASE_FP_WIDEOP_CHANGE_OPCODE_COMMON(OP, M2, E32) \
4843 CASE_FP_WIDEOP_CHANGE_OPCODE_COMMON(OP, M4, E16) \
4844 CASE_FP_WIDEOP_CHANGE_OPCODE_COMMON(OP, M4, E32) \
4845
4846#define CASE_FP_WIDEOP_OPCODE_LMULS_ALT(OP) \
4847 CASE_FP_WIDEOP_OPCODE_COMMON(OP, MF4, E16): \
4848 case CASE_FP_WIDEOP_OPCODE_COMMON(OP, MF2, E16): \
4849 case CASE_FP_WIDEOP_OPCODE_COMMON(OP, M1, E16): \
4850 case CASE_FP_WIDEOP_OPCODE_COMMON(OP, M2, E16): \
4851 case CASE_FP_WIDEOP_OPCODE_COMMON(OP, M4, E16)
4852
4853#define CASE_FP_WIDEOP_CHANGE_OPCODE_LMULS_ALT(OP) \
4854 CASE_FP_WIDEOP_CHANGE_OPCODE_COMMON(OP, MF4, E16) \
4855 CASE_FP_WIDEOP_CHANGE_OPCODE_COMMON(OP, MF2, E16) \
4856 CASE_FP_WIDEOP_CHANGE_OPCODE_COMMON(OP, M1, E16) \
4857 CASE_FP_WIDEOP_CHANGE_OPCODE_COMMON(OP, M2, E16) \
4858 CASE_FP_WIDEOP_CHANGE_OPCODE_COMMON(OP, M4, E16)
4859// clang-format on
4860
4862 LiveVariables *LV,
4863 LiveIntervals *LIS) const {
4865 switch (MI.getOpcode()) {
4866 default:
4867 return nullptr;
4868 case CASE_FP_WIDEOP_OPCODE_LMULS_ALT(FWADD_ALT_WV):
4869 case CASE_FP_WIDEOP_OPCODE_LMULS_ALT(FWSUB_ALT_WV):
4870 case CASE_FP_WIDEOP_OPCODE_LMULS(FWADD_WV):
4871 case CASE_FP_WIDEOP_OPCODE_LMULS(FWSUB_WV): {
4872 assert(RISCVII::hasVecPolicyOp(MI.getDesc().TSFlags) &&
4873 MI.getNumExplicitOperands() == 7 &&
4874 "Expect 7 explicit operands rd, rs2, rs1, rm, vl, sew, policy");
4875 // If the tail policy is undisturbed we can't convert.
4876 if ((MI.getOperand(RISCVII::getVecPolicyOpNum(MI.getDesc())).getImm() &
4877 1) == 0)
4878 return nullptr;
4879 // clang-format off
4880 unsigned NewOpc;
4881 switch (MI.getOpcode()) {
4882 default:
4883 llvm_unreachable("Unexpected opcode");
4888 }
4889 // clang-format on
4890
4891 MachineBasicBlock &MBB = *MI.getParent();
4892 MIB = BuildMI(MBB, MI, MI.getDebugLoc(), get(NewOpc))
4893 .add(MI.getOperand(0))
4894 .addReg(MI.getOperand(0).getReg(), RegState::Undef)
4895 .add(MI.getOperand(1))
4896 .add(MI.getOperand(2))
4897 .add(MI.getOperand(3))
4898 .add(MI.getOperand(4))
4899 .add(MI.getOperand(5))
4900 .add(MI.getOperand(6));
4901 break;
4902 }
4903 case CASE_WIDEOP_OPCODE_LMULS(WADD_WV):
4904 case CASE_WIDEOP_OPCODE_LMULS(WADDU_WV):
4905 case CASE_WIDEOP_OPCODE_LMULS(WSUB_WV):
4906 case CASE_WIDEOP_OPCODE_LMULS(WSUBU_WV): {
4907 // If the tail policy is undisturbed we can't convert.
4908 assert(RISCVII::hasVecPolicyOp(MI.getDesc().TSFlags) &&
4909 MI.getNumExplicitOperands() == 6);
4910 if ((MI.getOperand(RISCVII::getVecPolicyOpNum(MI.getDesc())).getImm() &
4911 1) == 0)
4912 return nullptr;
4913
4914 // clang-format off
4915 unsigned NewOpc;
4916 switch (MI.getOpcode()) {
4917 default:
4918 llvm_unreachable("Unexpected opcode");
4923 }
4924 // clang-format on
4925
4926 MachineBasicBlock &MBB = *MI.getParent();
4927 MIB = BuildMI(MBB, MI, MI.getDebugLoc(), get(NewOpc))
4928 .add(MI.getOperand(0))
4929 .addReg(MI.getOperand(0).getReg(), RegState::Undef)
4930 .add(MI.getOperand(1))
4931 .add(MI.getOperand(2))
4932 .add(MI.getOperand(3))
4933 .add(MI.getOperand(4))
4934 .add(MI.getOperand(5));
4935 break;
4936 }
4937 }
4938 MIB.copyImplicitOps(MI);
4939
4940 if (LV) {
4941 unsigned NumOps = MI.getNumOperands();
4942 for (unsigned I = 1; I < NumOps; ++I) {
4943 MachineOperand &Op = MI.getOperand(I);
4944 if (Op.isReg() && Op.isKill())
4945 LV->replaceKillInstruction(Op.getReg(), MI, *MIB);
4946 }
4947 }
4948
4949 if (LIS) {
4950 SlotIndex Idx = LIS->ReplaceMachineInstrInMaps(MI, *MIB);
4951
4952 if (MI.getOperand(0).isEarlyClobber()) {
4953 // Use operand 1 was tied to early-clobber def operand 0, so its live
4954 // interval could have ended at an early-clobber slot. Now they are not
4955 // tied we need to update it to the normal register slot.
4956 LiveInterval &LI = LIS->getInterval(MI.getOperand(1).getReg());
4958 if (S->end == Idx.getRegSlot(true))
4959 S->end = Idx.getRegSlot();
4960 }
4961 }
4962
4963 return MIB;
4964}
4965
4966#undef CASE_WIDEOP_OPCODE_COMMON
4967#undef CASE_WIDEOP_OPCODE_LMULS
4968#undef CASE_WIDEOP_CHANGE_OPCODE_COMMON
4969#undef CASE_WIDEOP_CHANGE_OPCODE_LMULS
4970#undef CASE_FP_WIDEOP_OPCODE_COMMON
4971#undef CASE_FP_WIDEOP_OPCODE_LMULS
4972#undef CASE_FP_WIDEOP_CHANGE_OPCODE_COMMON
4973#undef CASE_FP_WIDEOP_CHANGE_OPCODE_LMULS
4974
4977 Register DestReg, uint32_t Amount,
4978 MachineInstr::MIFlag Flag) const {
4979 MachineRegisterInfo &MRI = MF.getRegInfo();
4980 if (llvm::has_single_bit(Amount)) {
4981 uint32_t ShiftAmount = Log2_32(Amount);
4982 if (ShiftAmount == 0)
4983 return;
4984 BuildMI(MBB, II, DL, get(RISCV::SLLI), DestReg)
4985 .addReg(DestReg, RegState::Kill)
4986 .addImm(ShiftAmount)
4987 .setMIFlag(Flag);
4988 } else if (int ShXAmount, ShiftAmount;
4989 STI.hasShlAdd(3) &&
4990 (ShXAmount = isShifted359(Amount, ShiftAmount)) != 0) {
4991 // We can use Zba SHXADD+SLLI instructions for multiply in some cases.
4992 unsigned Opc;
4993 switch (ShXAmount) {
4994 case 1:
4995 Opc = RISCV::SH1ADD;
4996 break;
4997 case 2:
4998 Opc = RISCV::SH2ADD;
4999 break;
5000 case 3:
5001 Opc = RISCV::SH3ADD;
5002 break;
5003 default:
5004 llvm_unreachable("unexpected result of isShifted359");
5005 }
5006 if (ShiftAmount)
5007 BuildMI(MBB, II, DL, get(RISCV::SLLI), DestReg)
5008 .addReg(DestReg, RegState::Kill)
5009 .addImm(ShiftAmount)
5010 .setMIFlag(Flag);
5011 BuildMI(MBB, II, DL, get(Opc), DestReg)
5012 .addReg(DestReg, RegState::Kill)
5013 .addReg(DestReg)
5014 .setMIFlag(Flag);
5015 } else if (llvm::has_single_bit(Amount - 1)) {
5016 Register ScaledRegister = MRI.createVirtualRegister(&RISCV::GPRRegClass);
5017 uint32_t ShiftAmount = Log2_32(Amount - 1);
5018 BuildMI(MBB, II, DL, get(RISCV::SLLI), ScaledRegister)
5019 .addReg(DestReg)
5020 .addImm(ShiftAmount)
5021 .setMIFlag(Flag);
5022 BuildMI(MBB, II, DL, get(RISCV::ADD), DestReg)
5023 .addReg(ScaledRegister, RegState::Kill)
5024 .addReg(DestReg, RegState::Kill)
5025 .setMIFlag(Flag);
5026 } else if (llvm::has_single_bit(Amount + 1)) {
5027 Register ScaledRegister = MRI.createVirtualRegister(&RISCV::GPRRegClass);
5028 uint32_t ShiftAmount = Log2_32(Amount + 1);
5029 BuildMI(MBB, II, DL, get(RISCV::SLLI), ScaledRegister)
5030 .addReg(DestReg)
5031 .addImm(ShiftAmount)
5032 .setMIFlag(Flag);
5033 BuildMI(MBB, II, DL, get(RISCV::SUB), DestReg)
5034 .addReg(ScaledRegister, RegState::Kill)
5035 .addReg(DestReg, RegState::Kill)
5036 .setMIFlag(Flag);
5037 } else if (STI.hasStdExtZmmul()) {
5038 Register N = MRI.createVirtualRegister(&RISCV::GPRRegClass);
5039 movImm(MBB, II, DL, N, Amount, Flag);
5040 BuildMI(MBB, II, DL, get(RISCV::MUL), DestReg)
5041 .addReg(DestReg, RegState::Kill)
5043 .setMIFlag(Flag);
5044 } else {
5045 Register Acc;
5046 uint32_t PrevShiftAmount = 0;
5047 for (uint32_t ShiftAmount = 0; Amount >> ShiftAmount; ShiftAmount++) {
5048 if (Amount & (1U << ShiftAmount)) {
5049 if (ShiftAmount)
5050 BuildMI(MBB, II, DL, get(RISCV::SLLI), DestReg)
5051 .addReg(DestReg, RegState::Kill)
5052 .addImm(ShiftAmount - PrevShiftAmount)
5053 .setMIFlag(Flag);
5054 if (Amount >> (ShiftAmount + 1)) {
5055 // If we don't have an accmulator yet, create it and copy DestReg.
5056 if (!Acc) {
5057 Acc = MRI.createVirtualRegister(&RISCV::GPRRegClass);
5058 BuildMI(MBB, II, DL, get(TargetOpcode::COPY), Acc)
5059 .addReg(DestReg)
5060 .setMIFlag(Flag);
5061 } else {
5062 BuildMI(MBB, II, DL, get(RISCV::ADD), Acc)
5063 .addReg(Acc, RegState::Kill)
5064 .addReg(DestReg)
5065 .setMIFlag(Flag);
5066 }
5067 }
5068 PrevShiftAmount = ShiftAmount;
5069 }
5070 }
5071 assert(Acc && "Expected valid accumulator");
5072 BuildMI(MBB, II, DL, get(RISCV::ADD), DestReg)
5073 .addReg(DestReg, RegState::Kill)
5074 .addReg(Acc, RegState::Kill)
5075 .setMIFlag(Flag);
5076 }
5077}
5078
5081 static const std::pair<MachineMemOperand::Flags, const char *> TargetFlags[] =
5082 {{MONontemporalBit0, "riscv-nontemporal-domain-bit-0"},
5083 {MONontemporalBit1, "riscv-nontemporal-domain-bit-1"}};
5084 return ArrayRef(TargetFlags);
5085}
5086
5088 return OptLevel >= CodeGenOptLevel::Aggressive
5089 ? STI.getTailDupAggressiveThreshold()
5090 : 2;
5091}
5092
5094 // RVV lacks any support for immediate addressing for stack addresses, so be
5095 // conservative.
5096 unsigned Opcode = MI.getOpcode();
5097 if (!RISCVVPseudosTable::getPseudoInfo(Opcode) &&
5099 return false;
5100 return true;
5101}
5102
5103/// Return true if \p MI is a copy that will be lowered to one or more vmvNr.vs.
5105 const MachineInstr &MI) {
5106 return MI.isCopy() && MI.getOperand(0).getReg().isPhysical() &&
5108 TRI->getMinimalPhysRegClass(MI.getOperand(0).getReg()));
5109}
5110
5111std::optional<std::pair<unsigned, unsigned>>
5113 switch (Opcode) {
5114 default:
5115 return std::nullopt;
5116 case RISCV::PseudoVSPILL2_M1:
5117 case RISCV::PseudoVRELOAD2_M1:
5118 return std::make_pair(2u, 1u);
5119 case RISCV::PseudoVSPILL2_M2:
5120 case RISCV::PseudoVRELOAD2_M2:
5121 return std::make_pair(2u, 2u);
5122 case RISCV::PseudoVSPILL2_M4:
5123 case RISCV::PseudoVRELOAD2_M4:
5124 return std::make_pair(2u, 4u);
5125 case RISCV::PseudoVSPILL3_M1:
5126 case RISCV::PseudoVRELOAD3_M1:
5127 return std::make_pair(3u, 1u);
5128 case RISCV::PseudoVSPILL3_M2:
5129 case RISCV::PseudoVRELOAD3_M2:
5130 return std::make_pair(3u, 2u);
5131 case RISCV::PseudoVSPILL4_M1:
5132 case RISCV::PseudoVRELOAD4_M1:
5133 return std::make_pair(4u, 1u);
5134 case RISCV::PseudoVSPILL4_M2:
5135 case RISCV::PseudoVRELOAD4_M2:
5136 return std::make_pair(4u, 2u);
5137 case RISCV::PseudoVSPILL5_M1:
5138 case RISCV::PseudoVRELOAD5_M1:
5139 return std::make_pair(5u, 1u);
5140 case RISCV::PseudoVSPILL6_M1:
5141 case RISCV::PseudoVRELOAD6_M1:
5142 return std::make_pair(6u, 1u);
5143 case RISCV::PseudoVSPILL7_M1:
5144 case RISCV::PseudoVRELOAD7_M1:
5145 return std::make_pair(7u, 1u);
5146 case RISCV::PseudoVSPILL8_M1:
5147 case RISCV::PseudoVRELOAD8_M1:
5148 return std::make_pair(8u, 1u);
5149 }
5150}
5151
5152bool RISCV::hasEqualFRM(const MachineInstr &MI1, const MachineInstr &MI2) {
5153 int16_t MI1FrmOpIdx =
5154 RISCV::getNamedOperandIdx(MI1.getOpcode(), RISCV::OpName::frm);
5155 int16_t MI2FrmOpIdx =
5156 RISCV::getNamedOperandIdx(MI2.getOpcode(), RISCV::OpName::frm);
5157 if (MI1FrmOpIdx < 0 || MI2FrmOpIdx < 0)
5158 return false;
5159 MachineOperand FrmOp1 = MI1.getOperand(MI1FrmOpIdx);
5160 MachineOperand FrmOp2 = MI2.getOperand(MI2FrmOpIdx);
5161 return FrmOp1.getImm() == FrmOp2.getImm();
5162}
5163
5164std::optional<unsigned>
5165RISCV::getVectorLowDemandedScalarBits(unsigned Opcode, unsigned Log2SEW) {
5166 switch (Opcode) {
5167 default:
5168 return std::nullopt;
5169
5170 // 11.6. Vector Single-Width Shift Instructions
5171 case RISCV::VSLL_VX:
5172 case RISCV::VSRL_VX:
5173 case RISCV::VSRA_VX:
5174 // 12.4. Vector Single-Width Scaling Shift Instructions
5175 case RISCV::VSSRL_VX:
5176 case RISCV::VSSRA_VX:
5177 // Zvbb
5178 case RISCV::VROL_VX:
5179 case RISCV::VROR_VX:
5180 // Only the low lg2(SEW) bits of the shift-amount value are used.
5181 return Log2SEW;
5182
5183 // 11.7 Vector Narrowing Integer Right Shift Instructions
5184 case RISCV::VNSRL_WX:
5185 case RISCV::VNSRA_WX:
5186 // 12.5. Vector Narrowing Fixed-Point Clip Instructions
5187 case RISCV::VNCLIPU_WX:
5188 case RISCV::VNCLIP_WX:
5189 // Zvbb
5190 case RISCV::VWSLL_VX:
5191 // Only the low lg2(2*SEW) bits of the shift-amount value are used.
5192 return Log2SEW + 1;
5193
5194 // 11.1. Vector Single-Width Integer Add and Subtract
5195 case RISCV::VADD_VX:
5196 case RISCV::VSUB_VX:
5197 case RISCV::VRSUB_VX:
5198 // 11.2. Vector Widening Integer Add/Subtract
5199 case RISCV::VWADDU_VX:
5200 case RISCV::VWSUBU_VX:
5201 case RISCV::VWADD_VX:
5202 case RISCV::VWSUB_VX:
5203 case RISCV::VWADDU_WX:
5204 case RISCV::VWSUBU_WX:
5205 case RISCV::VWADD_WX:
5206 case RISCV::VWSUB_WX:
5207 // 11.4. Vector Integer Add-with-Carry / Subtract-with-Borrow Instructions
5208 case RISCV::VADC_VXM:
5209 case RISCV::VADC_VIM:
5210 case RISCV::VMADC_VXM:
5211 case RISCV::VMADC_VIM:
5212 case RISCV::VMADC_VX:
5213 case RISCV::VSBC_VXM:
5214 case RISCV::VMSBC_VXM:
5215 case RISCV::VMSBC_VX:
5216 // 11.5 Vector Bitwise Logical Instructions
5217 case RISCV::VAND_VX:
5218 case RISCV::VOR_VX:
5219 case RISCV::VXOR_VX:
5220 // 11.8. Vector Integer Compare Instructions
5221 case RISCV::VMSEQ_VX:
5222 case RISCV::VMSNE_VX:
5223 case RISCV::VMSLTU_VX:
5224 case RISCV::VMSLT_VX:
5225 case RISCV::VMSLEU_VX:
5226 case RISCV::VMSLE_VX:
5227 case RISCV::VMSGTU_VX:
5228 case RISCV::VMSGT_VX:
5229 // 11.9. Vector Integer Min/Max Instructions
5230 case RISCV::VMINU_VX:
5231 case RISCV::VMIN_VX:
5232 case RISCV::VMAXU_VX:
5233 case RISCV::VMAX_VX:
5234 // 11.10. Vector Single-Width Integer Multiply Instructions
5235 case RISCV::VMUL_VX:
5236 case RISCV::VMULH_VX:
5237 case RISCV::VMULHU_VX:
5238 case RISCV::VMULHSU_VX:
5239 // 11.11. Vector Integer Divide Instructions
5240 case RISCV::VDIVU_VX:
5241 case RISCV::VDIV_VX:
5242 case RISCV::VREMU_VX:
5243 case RISCV::VREM_VX:
5244 // 11.12. Vector Widening Integer Multiply Instructions
5245 case RISCV::VWMUL_VX:
5246 case RISCV::VWMULU_VX:
5247 case RISCV::VWMULSU_VX:
5248 // 11.13. Vector Single-Width Integer Multiply-Add Instructions
5249 case RISCV::VMACC_VX:
5250 case RISCV::VNMSAC_VX:
5251 case RISCV::VMADD_VX:
5252 case RISCV::VNMSUB_VX:
5253 // 11.14. Vector Widening Integer Multiply-Add Instructions
5254 case RISCV::VWMACCU_VX:
5255 case RISCV::VWMACC_VX:
5256 case RISCV::VWMACCSU_VX:
5257 case RISCV::VWMACCUS_VX:
5258 // 11.15. Vector Integer Merge Instructions
5259 case RISCV::VMERGE_VXM:
5260 // 11.16. Vector Integer Move Instructions
5261 case RISCV::VMV_V_X:
5262 // 12.1. Vector Single-Width Saturating Add and Subtract
5263 case RISCV::VSADDU_VX:
5264 case RISCV::VSADD_VX:
5265 case RISCV::VSSUBU_VX:
5266 case RISCV::VSSUB_VX:
5267 // 12.2. Vector Single-Width Averaging Add and Subtract
5268 case RISCV::VAADDU_VX:
5269 case RISCV::VAADD_VX:
5270 case RISCV::VASUBU_VX:
5271 case RISCV::VASUB_VX:
5272 // 12.3. Vector Single-Width Fractional Multiply with Rounding and Saturation
5273 case RISCV::VSMUL_VX:
5274 // 16.1. Integer Scalar Move Instructions
5275 case RISCV::VMV_S_X:
5276 // Zvbb
5277 case RISCV::VANDN_VX:
5278 return 1U << Log2SEW;
5279 }
5280}
5281
5282unsigned RISCV::getRVVMCOpcode(unsigned RVVPseudoOpcode) {
5284 RISCVVPseudosTable::getPseudoInfo(RVVPseudoOpcode);
5285 if (!RVV)
5286 return 0;
5287 return RVV->BaseInstr;
5288}
5289
5290unsigned RISCV::getDestLog2EEW(const MCInstrDesc &Desc, unsigned Log2SEW) {
5291 unsigned DestEEW =
5293 // EEW = 1
5294 if (DestEEW == 0)
5295 return 0;
5296 // EEW = SEW * n
5297 unsigned Scaled = Log2SEW + (DestEEW - 1);
5298 assert(Scaled >= 3 && Scaled <= 6);
5299 return Scaled;
5300}
5301
5302static std::optional<int64_t> getEffectiveImm(const MachineOperand &MO) {
5303 assert(MO.isImm() || MO.getReg().isVirtual());
5304 if (MO.isImm())
5305 return MO.getImm();
5306 const MachineInstr *Def =
5307 MO.getParent()->getMF()->getRegInfo().getVRegDef(MO.getReg());
5308 int64_t Imm;
5309 if (isLoadImm(Def, Imm))
5310 return Imm;
5311 return std::nullopt;
5312}
5313
5314/// Given two VL operands, do we know that LHS <= RHS? Must be used in SSA form.
5316 assert((LHS.isImm() || LHS.getParent()->getMF()->getRegInfo().isSSA()) &&
5317 (RHS.isImm() || RHS.getParent()->getMF()->getRegInfo().isSSA()));
5318 if (LHS.isReg() && RHS.isReg() && LHS.getReg().isVirtual() &&
5319 LHS.getReg() == RHS.getReg())
5320 return true;
5321 if (RHS.isImm() && RHS.getImm() == RISCV::VLMaxSentinel)
5322 return true;
5323 if (LHS.isImm() && LHS.getImm() == 0)
5324 return true;
5325 if (LHS.isImm() && LHS.getImm() == RISCV::VLMaxSentinel)
5326 return false;
5327 std::optional<int64_t> LHSImm = getEffectiveImm(LHS),
5328 RHSImm = getEffectiveImm(RHS);
5329 if (!LHSImm || !RHSImm)
5330 return false;
5331 return LHSImm <= RHSImm;
5332}
5333
5334namespace {
5335class RISCVPipelinerLoopInfo : public TargetInstrInfo::PipelinerLoopInfo {
5336 const MachineInstr *LHS;
5337 const MachineInstr *RHS;
5339
5340public:
5341 RISCVPipelinerLoopInfo(const MachineInstr *LHS, const MachineInstr *RHS,
5343 : LHS(LHS), RHS(RHS), Cond(Cond.begin(), Cond.end()) {}
5344
5345 bool shouldIgnoreForPipelining(const MachineInstr *MI) const override {
5346 // Make the instructions for loop control be placed in stage 0.
5347 // The predecessors of LHS/RHS are considered by the caller.
5348 if (LHS && MI == LHS)
5349 return true;
5350 if (RHS && MI == RHS)
5351 return true;
5352 return false;
5353 }
5354
5355 std::optional<bool> createTripCountGreaterCondition(
5356 int TC, MachineBasicBlock &MBB,
5357 SmallVectorImpl<MachineOperand> &CondParam) override {
5358 // A branch instruction will be inserted as "if (Cond) goto epilogue".
5359 // Cond is normalized for such use.
5360 // The predecessors of the branch are assumed to have already been inserted.
5361 CondParam = Cond;
5362 return {};
5363 }
5364
5365 void setPreheader(MachineBasicBlock *NewPreheader) override {}
5366
5367 void adjustTripCount(int TripCountAdjust) override {}
5368};
5369} // namespace
5370
5371std::unique_ptr<TargetInstrInfo::PipelinerLoopInfo>
5373 MachineBasicBlock *TBB = nullptr, *FBB = nullptr;
5375 if (analyzeBranch(*LoopBB, TBB, FBB, Cond, /*AllowModify=*/false))
5376 return nullptr;
5377
5378 // Infinite loops are not supported
5379 if (TBB == LoopBB && FBB == LoopBB)
5380 return nullptr;
5381
5382 // Must be conditional branch
5383 if (FBB == nullptr)
5384 return nullptr;
5385
5386 assert((TBB == LoopBB || FBB == LoopBB) &&
5387 "The Loop must be a single-basic-block loop");
5388
5389 // Normalization for createTripCountGreaterCondition()
5390 if (TBB == LoopBB)
5392
5393 const MachineRegisterInfo &MRI = LoopBB->getParent()->getRegInfo();
5394 auto FindRegDef = [&MRI](MachineOperand &Op) -> const MachineInstr * {
5395 if (!Op.isReg())
5396 return nullptr;
5397 Register Reg = Op.getReg();
5398 if (!Reg.isVirtual())
5399 return nullptr;
5400 return MRI.getVRegDef(Reg);
5401 };
5402
5403 const MachineInstr *LHS = FindRegDef(Cond[1]);
5404 const MachineInstr *RHS = FindRegDef(Cond[2]);
5405 if (LHS && LHS->isPHI())
5406 return nullptr;
5407 if (RHS && RHS->isPHI())
5408 return nullptr;
5409
5410 return std::make_unique<RISCVPipelinerLoopInfo>(LHS, RHS, Cond);
5411}
5412
5413// FIXME: We should remove this if we have a default generic scheduling model.
5415 unsigned RVVMCOpcode = RISCV::getRVVMCOpcode(Opc);
5416 Opc = RVVMCOpcode ? RVVMCOpcode : Opc;
5417 switch (Opc) {
5418 default:
5419 return false;
5420 // Integer div/rem.
5421 case RISCV::DIV:
5422 case RISCV::DIVW:
5423 case RISCV::DIVU:
5424 case RISCV::DIVUW:
5425 case RISCV::REM:
5426 case RISCV::REMW:
5427 case RISCV::REMU:
5428 case RISCV::REMUW:
5429 // Floating-point div/sqrt.
5430 case RISCV::FDIV_H:
5431 case RISCV::FDIV_S:
5432 case RISCV::FDIV_D:
5433 case RISCV::FDIV_H_INX:
5434 case RISCV::FDIV_S_INX:
5435 case RISCV::FDIV_D_INX:
5436 case RISCV::FDIV_D_IN32X:
5437 case RISCV::FSQRT_H:
5438 case RISCV::FSQRT_S:
5439 case RISCV::FSQRT_D:
5440 case RISCV::FSQRT_H_INX:
5441 case RISCV::FSQRT_S_INX:
5442 case RISCV::FSQRT_D_INX:
5443 case RISCV::FSQRT_D_IN32X:
5444 // Vector integer div/rem
5445 case RISCV::VDIV_VV:
5446 case RISCV::VDIV_VX:
5447 case RISCV::VDIVU_VV:
5448 case RISCV::VDIVU_VX:
5449 case RISCV::VREM_VV:
5450 case RISCV::VREM_VX:
5451 case RISCV::VREMU_VV:
5452 case RISCV::VREMU_VX:
5453 // Vector floating-point div/sqrt.
5454 case RISCV::VFDIV_VV:
5455 case RISCV::VFDIV_VF:
5456 case RISCV::VFRDIV_VF:
5457 case RISCV::VFSQRT_V:
5458 case RISCV::VFRSQRT7_V:
5459 return true;
5460 }
5461}
5462
5463bool RISCVInstrInfo::isVRegCopy(const MachineInstr *MI, unsigned LMul) const {
5464 if (MI->getOpcode() != TargetOpcode::COPY)
5465 return false;
5466 const MachineRegisterInfo &MRI = MI->getMF()->getRegInfo();
5468
5469 Register DstReg = MI->getOperand(0).getReg();
5470 const TargetRegisterClass *RC = DstReg.isVirtual()
5471 ? MRI.getRegClass(DstReg)
5472 : TRI->getMinimalPhysRegClass(DstReg);
5473
5475 return false;
5476
5477 if (!LMul)
5478 return true;
5479
5480 // TODO: Perhaps we could distinguish segment register classes (e.g. VRN3M2)
5481 // in the future.
5482 auto [RCLMul, RCFractional] =
5484 return (!RCFractional && LMul == RCLMul) || (RCFractional && LMul == 1);
5485}
5486
5488 if (MI.memoperands_empty())
5489 return false;
5490
5491 MachineMemOperand *MMO = *(MI.memoperands_begin());
5492 if (!MMO->isNonTemporal())
5493 return false;
5494
5495 return true;
5496}
5497
5499 const MachineBasicBlock::iterator &To) {
5500 assert(To == From.getParent()->end() || From.getParent() == To->getParent());
5501 SmallVector<Register> PhysUses, PhysDefs;
5502 for (const MachineOperand &MO : From.all_uses())
5503 if (MO.getReg().isPhysical())
5504 PhysUses.push_back(MO.getReg());
5505 for (const MachineOperand &MO : From.all_defs())
5506 if (MO.getReg().isPhysical())
5507 PhysDefs.push_back(MO.getReg());
5508 bool SawStore = false;
5509 for (auto II = std::next(From.getIterator()); II != To; II++) {
5510 for (Register PhysReg : PhysUses)
5511 if (II->definesRegister(PhysReg, nullptr))
5512 return false;
5513 for (Register PhysReg : PhysDefs)
5514 if (II->definesRegister(PhysReg, nullptr) ||
5515 II->readsRegister(PhysReg, nullptr))
5516 return false;
5517 if (II->mayStore()) {
5518 SawStore = true;
5519 break;
5520 }
5521 }
5522 return From.isSafeToMove(SawStore);
5523}
MachineInstrBuilder MachineInstrBuilder & DefMI
static bool forwardCopyWillClobberTuple(unsigned DestReg, unsigned SrcReg, unsigned NumRegs)
static void parseCondBranch(MachineInstr *LastInst, MachineBasicBlock *&Target, SmallVectorImpl< MachineOperand > &Cond)
@ MachineOutlinerTailCall
Emit a save, restore, call, and return.
@ MachineOutlinerRegSave
Emit a call and tail-call.
@ MachineOutlinerDefault
assert(UImm &&(UImm !=~static_cast< T >(0)) &&"Invalid immediate!")
SmallVector< int16_t, MAX_SRC_OPERANDS_NUM > OperandIndices
@ Scaled
MachineBasicBlock & MBB
MachineBasicBlock MachineBasicBlock::iterator DebugLoc DL
MachineBasicBlock MachineBasicBlock::iterator MBBI
basic Basic Alias true
#define X(NUM, ENUM, NAME)
Definition ELF.h:853
#define clEnumValN(ENUMVAL, FLAGNAME, DESC)
const HexagonInstrInfo * TII
#define _
IRTranslator LLVM IR MI
Module.h This file contains the declarations for the Module class.
const size_t AbstractManglingParser< Derived, Alloc >::NumOps
const AbstractManglingParser< Derived, Alloc >::OperatorInfo AbstractManglingParser< Derived, Alloc >::Ops[]
#define F(x, y, z)
Definition MD5.cpp:54
#define I(x, y, z)
Definition MD5.cpp:57
Register Reg
Register const TargetRegisterInfo * TRI
Promote Memory to Register
Definition Mem2Reg.cpp:110
This file provides utility analysis objects describing memory locations.
MachineInstr unsigned OpIdx
uint64_t IntrinsicInst * II
static bool cannotInsertTailCall(const MachineBasicBlock &MBB)
#define CASE_VFMA_CHANGE_OPCODE_SPLATS(OLDOP, NEWOP)
#define CASE_FP_WIDEOP_CHANGE_OPCODE_LMULS_ALT(OP)
#define CASE_FP_WIDEOP_OPCODE_LMULS(OP)
#define CASE_OPERAND_SIMM(NUM)
static std::optional< unsigned > getLMULForRVVWholeLoadStore(unsigned Opcode)
#define CASE_VFMA_CHANGE_OPCODE_VV(OLDOP, NEWOP)
static unsigned getFPFusedMultiplyOpcode(unsigned RootOpc, unsigned Pattern)
std::optional< unsigned > getFoldedOpcode(MachineFunction &MF, MachineInstr &MI, ArrayRef< unsigned > Ops, const RISCVSubtarget &ST)
#define RVV_OPC_LMUL_CASE(OPC, INV)
#define CASE_FP_WIDEOP_CHANGE_OPCODE_LMULS(OP)
static void combineFPFusedMultiply(MachineInstr &Root, MachineInstr &Prev, unsigned Pattern, SmallVectorImpl< MachineInstr * > &InsInstrs, SmallVectorImpl< MachineInstr * > &DelInstrs)
static unsigned getAddendOperandIdx(unsigned Pattern)
#define CASE_RVV_OPCODE_UNMASK(OP)
#define CASE_WIDEOP_CHANGE_OPCODE_LMULS(OP)
static cl::opt< bool > PreferWholeRegisterMove("riscv-prefer-whole-register-move", cl::init(false), cl::Hidden, cl::desc("Prefer whole register move for vector registers."))
#define CASE_VFMA_SPLATS(OP)
unsigned getPredicatedOpcode(unsigned Opcode)
#define CASE_FP_WIDEOP_OPCODE_LMULS_ALT(OP)
#define CASE_WIDEOP_OPCODE_LMULS(OP)
static bool isMIReadsReg(const MachineInstr &MI, const TargetRegisterInfo *TRI, MCRegister RegNo)
#define OPCODE_LMUL_MASK_CASE(OPC)
#define CASE_OPERAND_UIMM_LSB_ZEROS(BITS, SUFFIX)
static bool isFSUB(unsigned Opc)
#define CASE_VMA_CHANGE_OPCODE_LMULS(OLDOP, NEWOP, TYPE)
#define CASE_RVV_OPCODE(OP)
static std::optional< int64_t > getEffectiveImm(const MachineOperand &MO)
#define CASE_VFMA_OPCODE_VV(OP)
static cl::opt< bool > OutlinerEnableRegSave("riscv-outliner-regsave", cl::init(true), cl::Hidden, cl::desc("Enable RegSave strategy in machine outliner (save X5 to a " "temporary register when X5 is live across outlined calls)."))
MachineOutlinerConstructionID
#define CASE_RVV_OPCODE_WIDEN(OP)
static unsigned getLoadPredicatedOpcode(unsigned Opcode)
static unsigned getSHXADDUWShiftAmount(unsigned Opc)
#define CASE_VMA_OPCODE_LMULS(OP, TYPE)
static bool isConvertibleToVMV_V_V(const RISCVSubtarget &STI, const MachineBasicBlock &MBB, MachineBasicBlock::const_iterator MBBI, MachineBasicBlock::const_iterator &DefMBBI, RISCVVType::VLMUL LMul)
static bool isFMUL(unsigned Opc)
static unsigned getInverseXqcicmOpcode(unsigned Opcode)
static bool getFPPatterns(MachineInstr &Root, SmallVectorImpl< unsigned > &Patterns, bool DoRegPressureReduce)
#define OPCODE_LMUL_CASE(OPC)
#define CASE_OPERAND_UIMM(NUM)
static Register findRegisterToSaveX5To(outliner::Candidate &C, const TargetRegisterInfo &TRI)
static bool canCombineShiftIntoShXAdd(const MachineBasicBlock &MBB, const MachineOperand &MO, unsigned OuterShiftAmt)
Utility routine that checks if.
static bool isCandidatePatchable(const MachineBasicBlock &MBB)
static bool isFADD(unsigned Opc)
static void genShXAddAddShift(MachineInstr &Root, unsigned AddOpIdx, SmallVectorImpl< MachineInstr * > &InsInstrs, SmallVectorImpl< MachineInstr * > &DelInstrs, DenseMap< Register, unsigned > &InstrIdxForVirtReg)
static bool isLoadImm(const MachineInstr *MI, int64_t &Imm)
static bool isMIModifiesReg(const MachineInstr &MI, const TargetRegisterInfo *TRI, MCRegister RegNo)
#define CASE_RVV_OPCODE_LMUL(OP, LMUL)
static bool canCombineFPFusedMultiply(const MachineInstr &Root, const MachineOperand &MO, bool DoRegPressureReduce)
static bool getSHXADDPatterns(const MachineInstr &Root, SmallVectorImpl< unsigned > &Patterns)
static bool getFPFusedMultiplyPatterns(MachineInstr &Root, SmallVectorImpl< unsigned > &Patterns, bool DoRegPressureReduce)
static cl::opt< MachineTraceStrategy > ForceMachineCombinerStrategy("riscv-force-machine-combiner-strategy", cl::Hidden, cl::desc("Force machine combiner to use a specific strategy for machine " "trace metrics evaluation."), cl::init(MachineTraceStrategy::TS_NumStrategies), cl::values(clEnumValN(MachineTraceStrategy::TS_Local, "local", "Local strategy."), clEnumValN(MachineTraceStrategy::TS_MinInstrCount, "min-instr", "MinInstrCount strategy.")))
static unsigned getSHXADDShiftAmount(unsigned Opc)
#define CASE_RVV_OPCODE_MASK(OP)
#define RVV_OPC_LMUL_MASK_CASE(OPC, INV)
static MachineInstr * canFoldAsPredicatedOp(Register Reg, const MachineRegisterInfo &MRI, const TargetInstrInfo *TII, const RISCVSubtarget &STI)
Identify instructions that can be folded into a CCMOV instruction, and return the defining instructio...
const SmallVectorImpl< MachineOperand > MachineBasicBlock * TBB
const SmallVectorImpl< MachineOperand > & Cond
This file declares the machine register scavenger class.
static bool memOpsHaveSameBasePtr(const MachineInstr &MI1, ArrayRef< const MachineOperand * > BaseOps1, const MachineInstr &MI2, ArrayRef< const MachineOperand * > BaseOps2)
This file contains some templates that are useful if you are working with the STL at all.
static bool contains(SmallPtrSetImpl< ConstantExpr * > &Cache, ConstantExpr *Expr, Constant *C)
Definition Value.cpp:484
This file defines the SmallVector class.
This file defines the 'Statistic' class, which is designed to be an easy way to expose various metric...
#define STATISTIC(VARNAME, DESC)
Definition Statistic.h:171
#define LLVM_DEBUG(...)
Definition Debug.h:119
static TableGen::Emitter::Opt Y("gen-skeleton-entry", EmitSkeleton, "Generate example skeleton entry")
static bool canCombine(MachineBasicBlock &MBB, MachineOperand &MO, unsigned CombineOpc=0)
static cl::opt< unsigned > CacheLineSize("cache-line-size", cl::init(0), cl::Hidden, cl::desc("Use this to override the target cache line size when " "specified by the user."))
Value * RHS
Value * LHS
Represent a constant reference to an array (0 or more elements consecutively in memory),...
Definition ArrayRef.h:40
const T & front() const
Get the first element.
Definition ArrayRef.h:144
bool empty() const
Check if the array is empty.
Definition ArrayRef.h:136
static LLVM_ABI DILocation * getMergedLocation(DILocation *LocA, DILocation *LocB)
Attempts to merge LocA and LocB into a single location; see DebugLoc::getMergedLocation for more deta...
bool isBigEndian() const
Definition DataLayout.h:218
A debug info location.
Definition DebugLoc.h:124
std::pair< iterator, bool > insert(const std::pair< KeyT, ValueT > &KV)
Definition DenseMap.h:286
bool hasMinSize() const
Optimize this function for minimum size (-Oz).
Definition Function.h:711
LiveInterval - This class represents the liveness of a register, or stack slot.
LiveInterval & getInterval(Register Reg)
SlotIndex ReplaceMachineInstrInMaps(MachineInstr &MI, MachineInstr &NewMI)
const Segment * getSegmentContaining(SlotIndex Idx) const
Return the segment that contains the specified index, or null if there is none.
LLVM_ABI void replaceKillInstruction(Register Reg, MachineInstr &OldMI, MachineInstr &NewMI)
replaceKillInstruction - Update register kill info by replacing a kill instruction with a new one.
bool hasValue() const
static LocationSize precise(uint64_t Value)
TypeSize getValue() const
MCInstBuilder & addReg(MCRegister Reg)
Add a new register operand.
MCInstBuilder & addImm(int64_t Val)
Add a new integer immediate operand.
Instances of this class represent a single low-level machine instruction.
Definition MCInst.h:188
Describe properties that are true of each instruction in the target description file.
unsigned getNumOperands() const
Return the number of declared MachineOperands for this MachineInstruction.
bool isConditionalBranch() const
Return true if this is a branch which may fall through to the next instruction or may transfer contro...
This holds information about one operand of a machine instruction, indicating the register class for ...
Definition MCInstrDesc.h:86
Wrapper class representing physical registers. Should be passed by value.
Definition MCRegister.h:41
const FeatureBitset & getFeatureBits() const
Set of metadata that should be preserved when using BuildMI().
MachineInstrBundleIterator< const MachineInstr > const_iterator
MachineInstrBundleIterator< MachineInstr, true > reverse_iterator
const MachineFunction * getParent() const
Return the MachineFunction containing this basic block.
MachineInstrBundleIterator< MachineInstr > iterator
MachineInstrBundleIterator< const MachineInstr, true > const_reverse_iterator
The MachineFrameInfo class represents an abstract stack frame until prolog/epilog code is inserted.
void setStackID(int ObjectIdx, uint8_t ID)
Align getObjectAlign(int ObjectIdx) const
Return the alignment of the specified stack object.
int64_t getObjectSize(int ObjectIdx) const
Return the size of the specified object.
const TargetSubtargetInfo & getSubtarget() const
getSubtarget - Return the subtarget for which this machine code is being compiled.
StringRef getName() const
getName - Return the name of the corresponding LLVM function.
MachineMemOperand * getMachineMemOperand(MachinePointerInfo PtrInfo, MachineMemOperand::Flags f, LLT MemTy, Align base_alignment, const AAMDNodes &AAInfo=AAMDNodes(), const MDNode *Ranges=nullptr, SyncScope::ID SSID=SyncScope::System, AtomicOrdering Ordering=AtomicOrdering::NotAtomic, AtomicOrdering FailureOrdering=AtomicOrdering::NotAtomic)
getMachineMemOperand - Allocate a new MachineMemOperand.
MachineFrameInfo & getFrameInfo()
getFrameInfo - Return the frame info object for the current function.
MachineRegisterInfo & getRegInfo()
getRegInfo - Return information about the registers currently in use.
const DataLayout & getDataLayout() const
Return the DataLayout attached to the Module associated to this MF.
Function & getFunction()
Return the LLVM function that this machine code represents.
Ty * getInfo()
getInfo - Keep track of various per-function pieces of information for backends that would like to do...
const TargetMachine & getTarget() const
getTarget - Return the target machine this machine code is compiled with
const MachineInstrBuilder & setMemRefs(ArrayRef< MachineMemOperand * > MMOs) const
const MachineInstrBuilder & addUse(Register RegNo, RegState Flags={}, unsigned SubReg=0) const
Add a virtual register use operand.
const MachineInstrBuilder & addReg(Register RegNo, RegState Flags={}, unsigned SubReg=0) const
Add a new virtual register operand.
const MachineInstrBuilder & setMIFlag(MachineInstr::MIFlag Flag) const
const MachineInstrBuilder & addImm(int64_t Val) const
Add a new immediate operand.
const MachineInstrBuilder & add(const MachineOperand &MO) const
const MachineInstrBuilder & addFrameIndex(int Idx) const
const MachineInstrBuilder & addMBB(MachineBasicBlock *MBB, unsigned TargetFlags=0) const
const MachineInstrBuilder & cloneMemRefs(const MachineInstr &OtherMI) const
const MachineInstrBuilder & setMIFlags(unsigned Flags) const
const MachineInstrBuilder & copyImplicitOps(const MachineInstr &OtherMI) const
Copy all the implicit operands from OtherMI onto this one.
const MachineInstrBuilder & addMemOperand(MachineMemOperand *MMO) const
reverse_iterator getReverse() const
Get a reverse iterator to the same node.
Representation of each machine instruction.
unsigned getOpcode() const
Returns the opcode of this MachineInstr.
bool isReturn(QueryType Type=AnyInBundle) const
bool mayLoadOrStore(QueryType Type=AnyInBundle) const
Return true if this instruction could possibly read or modify memory.
const MachineBasicBlock * getParent() const
filtered_mop_range all_defs()
Returns an iterator range over all operands that are (explicit or implicit) register defs.
bool getFlag(MIFlag Flag) const
Return whether an MI flag is set.
LLVM_ABI bool isSafeToMove(bool &SawStore) const
Return true if it is safe to move this instruction.
LLVM_ABI unsigned getNumExplicitOperands() const
Returns the number of non-implicit operands.
bool modifiesRegister(Register Reg, const TargetRegisterInfo *TRI) const
Return true if the MachineInstr modifies (fully define or partially define) the specified register.
bool mayLoad(QueryType Type=AnyInBundle) const
Return true if this instruction could possibly read memory.
const MCInstrDesc & getDesc() const
Returns the target instruction descriptor of this MachineInstr.
LLVM_ABI bool hasUnmodeledSideEffects() const
Return true if this instruction has side effects that are not modeled by mayLoad / mayStore,...
bool hasOneMemOperand() const
Return true if this instruction has exactly one MachineMemOperand.
mmo_iterator memoperands_begin() const
Access to memory operands of the instruction.
LLVM_ABI bool hasOrderedMemoryRef() const
Return true if this instruction may have an ordered or volatile memory reference, or if the informati...
LLVM_ABI const MachineFunction * getMF() const
Return the function that contains the basic block that this instruction belongs to.
ArrayRef< MachineMemOperand * > memoperands() const
Access to memory operands of the instruction.
const DebugLoc & getDebugLoc() const
Returns the debug location id of this MachineInstr.
filtered_mop_range all_uses()
Returns an iterator range over all operands that are (explicit or implicit) register uses.
const MachineOperand & getOperand(unsigned i) const
uint32_t getFlags() const
Return the MI flags bitvector.
LLVM_ABI void clearKillInfo()
Clears kill flags on all operands.
A description of a memory reference used in the backend.
@ MOLoad
The memory access reads data.
@ MOStore
The memory access writes data.
This class contains meta information specific to a module.
MachineOperand class - Representation of each machine instruction operand.
int64_t getImm() const
bool isReg() const
isReg - Tests if this is a MO_Register operand.
MachineBasicBlock * getMBB() const
bool isImm() const
isImm - Tests if this is a MO_Immediate operand.
MachineInstr * getParent()
getParent - Return the instruction that this operand belongs to.
static MachineOperand CreateImm(int64_t Val)
MachineOperandType getType() const
getType - Returns the MachineOperandType for this operand.
Register getReg() const
getReg - Returns the register number.
bool isFI() const
isFI - Tests if this is a MO_FrameIndex operand.
LLVM_ABI bool isIdenticalTo(const MachineOperand &Other) const
Returns true if this operand is identical to the specified operand except for liveness related flags ...
@ MO_Immediate
Immediate operand.
@ MO_Register
Register operand.
MachineRegisterInfo - Keep track of information for virtual and physical registers,...
LLVM_ABI bool hasOneNonDBGUse(Register RegNo) const
hasOneNonDBGUse - Return true if there is exactly one non-Debug use of the specified register.
const TargetRegisterClass * getRegClass(Register Reg) const
Return the register class of the specified virtual register.
LLVM_ABI void clearKillFlags(Register Reg) const
clearKillFlags - Iterate over all the uses of the given register and clear the kill flag from the Mac...
LLVM_ABI MachineInstr * getVRegDef(Register Reg) const
getVRegDef - Return the machine instr that defines the specified virtual register or null if none is ...
bool isReserved(MCRegister PhysReg) const
isReserved - Returns true when PhysReg is a reserved register.
LLVM_ABI Register createVirtualRegister(const TargetRegisterClass *RegClass, StringRef Name="")
createVirtualRegister - Create and return a new virtual register in the function with the specified r...
bool hasOneUse(Register RegNo) const
hasOneUse - Return true if there is exactly one instruction using the specified register.
LLVM_ABI void clearVirtRegs()
clearVirtRegs - Remove all virtual registers (after physreg assignment).
const TargetRegisterInfo * getTargetRegisterInfo() const
LLVM_ABI bool isConstantPhysReg(MCRegister PhysReg) const
Returns true if PhysReg is unallocatable and constant throughout the function.
LLVM_ABI const TargetRegisterClass * constrainRegClass(Register Reg, const TargetRegisterClass *RC, unsigned MinNumRegs=0)
constrainRegClass - Constrain the register class of the specified virtual register to be a common sub...
LLVM_ABI void replaceRegWith(Register FromReg, Register ToReg)
replaceRegWith - Replace all instances of FromReg with ToReg in the machine function.
LLVM_ABI MachineInstr * getUniqueVRegDef(Register Reg) const
getUniqueVRegDef - Return the unique machine instr that defines the specified virtual register or nul...
A Module instance is used to store all the information related to an LLVM module.
Definition Module.h:67
MI-level patchpoint operands.
Definition StackMaps.h:77
uint32_t getNumPatchBytes() const
Return the number of patchable bytes the given patchpoint should emit.
Definition StackMaps.h:105
void storeRegToStackSlot(MachineBasicBlock &MBB, MachineBasicBlock::iterator MBBI, Register SrcReg, bool IsKill, int FrameIndex, const TargetRegisterClass *RC, Register VReg, MachineInstr::MIFlag Flags=MachineInstr::NoFlags) const override
static bool isSafeToMove(const MachineInstr &From, const MachineBasicBlock::iterator &To)
Return true if moving From down to To won't cause any physical register reads or writes to be clobber...
MachineInstr * convertToThreeAddress(MachineInstr &MI, LiveVariables *LV, LiveIntervals *LIS) const override
Register isLoadFromStackSlot(const MachineInstr &MI, int &FrameIndex) const override
std::optional< std::unique_ptr< outliner::OutlinedFunction > > getOutliningCandidateInfo(const MachineModuleInfo &MMI, std::vector< outliner::Candidate > &RepeatedSequenceLocs, unsigned MinRepeats) const override
unsigned removeBranch(MachineBasicBlock &MBB, int *BytesRemoved=nullptr) const override
void genAlternativeCodeSequence(MachineInstr &Root, unsigned Pattern, SmallVectorImpl< MachineInstr * > &InsInstrs, SmallVectorImpl< MachineInstr * > &DelInstrs, DenseMap< Register, unsigned > &InstrIdxForVirtReg) const override
void movImm(MachineBasicBlock &MBB, MachineBasicBlock::iterator MBBI, const DebugLoc &DL, Register DstReg, uint64_t Val, MachineInstr::MIFlag Flag=MachineInstr::NoFlags, bool DstRenamable=false, bool DstIsDead=false) const
MachineInstr * emitLdStWithAddr(MachineInstr &MemI, const ExtAddrMode &AM) const override
void mulImm(MachineFunction &MF, MachineBasicBlock &MBB, MachineBasicBlock::iterator II, const DebugLoc &DL, Register DestReg, uint32_t Amt, MachineInstr::MIFlag Flag) const
Generate code to multiply the value in DestReg by Amt - handles all the common optimizations for this...
static bool isPairableLdStInstOpc(unsigned Opc)
Return true if pairing the given load or store may be paired with another.
RISCVInstrInfo(const RISCVSubtarget &STI)
void loadRegFromStackSlot(MachineBasicBlock &MBB, MachineBasicBlock::iterator MBBI, Register DstReg, int FrameIndex, const TargetRegisterClass *RC, Register VReg, unsigned SubReg=0, MachineInstr::MIFlag Flags=MachineInstr::NoFlags) const override
bool isFunctionSafeToOutlineFrom(MachineFunction &MF, bool OutlineFromLinkOnceODRs) const override
std::unique_ptr< TargetInstrInfo::PipelinerLoopInfo > analyzeLoopForPipelining(MachineBasicBlock *LoopBB) const override
unsigned insertBranch(MachineBasicBlock &MBB, MachineBasicBlock *TBB, MachineBasicBlock *FBB, ArrayRef< MachineOperand > Cond, const DebugLoc &dl, int *BytesAdded=nullptr) const override
bool hasReassociableSibling(const MachineInstr &Inst, bool &Commuted) const override
static bool isLdStSafeToPair(const MachineInstr &LdSt, const TargetRegisterInfo *TRI)
void copyPhysRegVector(MachineBasicBlock &MBB, MachineBasicBlock::iterator MBBI, const DebugLoc &DL, MCRegister DstReg, MCRegister SrcReg, bool KillSrc, const TargetRegisterClass *RegClass) const
bool isReMaterializableImpl(const MachineInstr &MI) const override
MachineInstr * optimizeSelect(MachineInstr &MI, SmallPtrSetImpl< MachineInstr * > &SeenMIs, bool) const override
bool isVRegCopy(const MachineInstr *MI, unsigned LMul=0) const
Return true if MI is a COPY to a vector register of a specific LMul, or any kind of vector registers ...
bool canFoldIntoAddrMode(const MachineInstr &MemI, Register Reg, const MachineInstr &AddrI, ExtAddrMode &AM) const override
void insertIndirectBranch(MachineBasicBlock &MBB, MachineBasicBlock &NewDestBB, MachineBasicBlock &RestoreBB, const DebugLoc &DL, int64_t BrOffset, RegScavenger *RS) const override
bool isAsCheapAsAMove(const MachineInstr &MI) const override
bool verifyInstruction(const MachineInstr &MI, StringRef &ErrInfo) const override
bool getMemOperandWithOffsetWidth(const MachineInstr &LdSt, const MachineOperand *&BaseOp, int64_t &Offset, LocationSize &Width, const TargetRegisterInfo *TRI) const
unsigned getTailDuplicateSize(CodeGenOptLevel OptLevel) const override
void getReassociateOperandIndices(const MachineInstr &Root, unsigned Pattern, std::array< unsigned, 5 > &OperandIndices) const override
const RISCVSubtarget & STI
Register isStoreToStackSlot(const MachineInstr &MI, int &FrameIndex) const override
std::optional< unsigned > getInverseOpcode(unsigned Opcode) const override
bool simplifyInstruction(MachineInstr &MI) const override
ArrayRef< std::pair< unsigned, const char * > > getSerializableDirectMachineOperandTargetFlags() const override
outliner::InstrType getOutliningTypeImpl(const MachineModuleInfo &MMI, MachineBasicBlock::iterator &MBBI, unsigned Flags) const override
MachineTraceStrategy getMachineCombinerTraceStrategy() const override
unsigned getInstSizeInBytes(const MachineInstr &MI) const override
std::optional< RegImmPair > isAddImmediate(const MachineInstr &MI, Register Reg) const override
bool reverseBranchCondition(SmallVectorImpl< MachineOperand > &Cond) const override
ArrayRef< std::pair< MachineMemOperand::Flags, const char * > > getSerializableMachineMemOperandTargetFlags() const override
MCInst getNop() const override
bool analyzeCandidate(outliner::Candidate &C) const
bool isMBBSafeToOutlineFrom(MachineBasicBlock &MBB, unsigned &Flags) const override
bool getMemOperandsWithOffsetWidth(const MachineInstr &MI, SmallVectorImpl< const MachineOperand * > &BaseOps, int64_t &Offset, bool &OffsetIsScalable, LocationSize &Width, const TargetRegisterInfo *TRI) const override
void buildOutlinedFrame(MachineBasicBlock &MBB, MachineFunction &MF, const outliner::OutlinedFunction &OF) const override
bool requiresNTLHint(const MachineInstr &MI) const
Return true if the instruction requires an NTL hint to be emitted.
void finalizeInsInstrs(MachineInstr &Root, unsigned &Pattern, SmallVectorImpl< MachineInstr * > &InsInstrs) const override
std::pair< unsigned, unsigned > decomposeMachineOperandsTargetFlags(unsigned TF) const override
MachineInstr * commuteInstructionImpl(MachineInstr &MI, bool NewMI, unsigned OpIdx1, unsigned OpIdx2) const override
bool hasReassociableOperands(const MachineInstr &Inst, const MachineBasicBlock *MBB) const override
MachineBasicBlock * getBranchDestBlock(const MachineInstr &MI) const override
std::string createMIROperandComment(const MachineInstr &MI, const MachineOperand &Op, unsigned OpIdx, const TargetRegisterInfo *TRI) const override
bool shouldOutlineFromFunctionByDefault(MachineFunction &MF) const override
void copyPhysReg(MachineBasicBlock &MBB, MachineBasicBlock::iterator MBBI, const DebugLoc &DL, Register DstReg, Register SrcReg, bool KillSrc, bool RenamableDest=false, bool RenamableSrc=false) const override
bool findCommutedOpIndices(const MachineInstr &MI, unsigned &SrcOpIdx1, unsigned &SrcOpIdx2) const override
bool analyzeBranch(MachineBasicBlock &MBB, MachineBasicBlock *&TBB, MachineBasicBlock *&FBB, SmallVectorImpl< MachineOperand > &Cond, bool AllowModify) const override
MachineBasicBlock::iterator insertOutlinedCall(Module &M, MachineBasicBlock &MBB, MachineBasicBlock::iterator &It, MachineFunction &MF, outliner::Candidate &C) const override
MachineInstr * foldMemoryOperandImpl(MachineFunction &MF, MachineInstr &MI, ArrayRef< unsigned > Ops, int FrameIndex, MachineInstr *&CopyMI, LiveIntervals *LIS=nullptr, VirtRegMap *VRM=nullptr) const override
bool isBranchOffsetInRange(unsigned BranchOpc, int64_t BrOffset) const override
static RISCVCC::CondCode getCondFromBranchOpc(unsigned Opc)
void buildClearRegister(Register Reg, MachineBasicBlock &MBB, MachineBasicBlock::iterator Iter, DebugLoc &DL, bool AllowSideEffects=true) const override
bool isAssociativeAndCommutative(const MachineInstr &Inst, bool Invert) const override
CombinerObjective getCombinerObjective(unsigned Pattern) const override
bool isHighLatencyDef(int Opc) const override
static bool evaluateCondBranch(RISCVCC::CondCode CC, int64_t C0, int64_t C1)
Return the result of the evaluation of C0 CC C1, where CC is a RISCVCC::CondCode.
bool getMachineCombinerPatterns(MachineInstr &Root, SmallVectorImpl< unsigned > &Patterns, bool DoRegPressureReduce) const override
bool optimizeCondBranch(MachineInstr &MI) const override
std::optional< DestSourcePair > isCopyInstrImpl(const MachineInstr &MI) const override
static bool isFromLoadImm(const MachineRegisterInfo &MRI, const MachineOperand &Op, int64_t &Imm)
Return true if the operand is a load immediate instruction and sets Imm to the immediate value.
bool shouldClusterMemOps(ArrayRef< const MachineOperand * > BaseOps1, int64_t Offset1, bool OffsetIsScalable1, ArrayRef< const MachineOperand * > BaseOps2, int64_t Offset2, bool OffsetIsScalable2, unsigned ClusterSize, unsigned NumBytes) const override
bool areMemAccessesTriviallyDisjoint(const MachineInstr &MIa, const MachineInstr &MIb) const override
RISCVMachineFunctionInfo - This class is derived from MachineFunctionInfo and contains private RISCV-...
const RISCVRegisterInfo * getRegisterInfo() const override
Wrapper class representing virtual and physical registers.
Definition Register.h:20
constexpr bool isValid() const
Definition Register.h:112
constexpr bool isVirtual() const
Return true if the specified register number is in the virtual register namespace.
Definition Register.h:79
SlotIndex - An opaque wrapper around machine indexes.
Definition SlotIndexes.h:66
SlotIndex getRegSlot(bool EC=false) const
Returns the register use/def slot in the current instruction for a normal or early-clobber def.
A templated base class for SmallPtrSet which provides the typesafe interface that is common across al...
bool erase(PtrType Ptr)
Remove pointer from the set.
std::pair< iterator, bool > insert(PtrType Ptr)
Inserts Ptr if and only if there is no element in the container equal to Ptr.
This class consists of common code factored out of the SmallVector class to reduce code duplication b...
void push_back(const T &Elt)
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small.
MI-level stackmap operands.
Definition StackMaps.h:36
uint32_t getNumPatchBytes() const
Return the number of patchable bytes the given stackmap should emit.
Definition StackMaps.h:51
MI-level Statepoint operands.
Definition StackMaps.h:159
uint32_t getNumPatchBytes() const
Return the number of patchable bytes the given statepoint should emit.
Definition StackMaps.h:208
Represent a constant reference to a string, i.e.
Definition StringRef.h:56
Object returned by analyzeLoopForPipelining.
TargetInstrInfo - Interface to description of machine instruction set.
virtual bool findCommutedOpIndices(const MachineInstr &MI, unsigned &SrcOpIdx1, unsigned &SrcOpIdx2) const
Returns true iff the routine could find two commutable operands in the given machine instruction.
virtual bool hasReassociableOperands(const MachineInstr &Inst, const MachineBasicBlock *MBB) const
Return true when \P Inst has reassociable operands in the same \P MBB.
virtual void genAlternativeCodeSequence(MachineInstr &Root, unsigned Pattern, SmallVectorImpl< MachineInstr * > &InsInstrs, SmallVectorImpl< MachineInstr * > &DelInstrs, DenseMap< Register, unsigned > &InstIdxForVirtReg) const
When getMachineCombinerPatterns() finds patterns, this function generates the instructions that could...
virtual bool getMachineCombinerPatterns(MachineInstr &Root, SmallVectorImpl< unsigned > &Patterns, bool DoRegPressureReduce) const
Return true when there is potentially a faster code sequence for an instruction chain ending in Root.
virtual bool isReMaterializableImpl(const MachineInstr &MI) const
For instructions with opcodes for which the M_REMATERIALIZABLE flag is set, this hook lets the target...
virtual bool isMBBSafeToOutlineFrom(MachineBasicBlock &MBB, unsigned &Flags) const
Optional target hook that returns true if MBB is safe to outline from, and returns any target-specifi...
virtual void getReassociateOperandIndices(const MachineInstr &Root, unsigned Pattern, std::array< unsigned, 5 > &OperandIndices) const
The returned array encodes the operand index for each parameter because the operands may be commuted;...
virtual CombinerObjective getCombinerObjective(unsigned Pattern) const
Return the objective of a combiner pattern.
virtual MachineInstr * commuteInstructionImpl(MachineInstr &MI, bool NewMI, unsigned OpIdx1, unsigned OpIdx2) const
This method commutes the operands of the given machine instruction MI.
virtual bool hasReassociableSibling(const MachineInstr &Inst, bool &Commuted) const
Return true when \P Inst has reassociable sibling.
virtual std::string createMIROperandComment(const MachineInstr &MI, const MachineOperand &Op, unsigned OpIdx, const TargetRegisterInfo *TRI) const
const MCAsmInfo & getMCAsmInfo() const
Return target specific asm information.
const uint8_t TSFlags
Configurable target specific flags.
TargetRegisterInfo base class - We assume that the target defines a static array of TargetRegisterDes...
TargetSubtargetInfo - Generic base class for all target subtargets.
virtual const TargetInstrInfo * getInstrInfo() const
virtual const TargetRegisterInfo * getRegisterInfo() const =0
Return the target's register information.
Target - Wrapper for Target specific information.
static constexpr TypeSize getFixed(ScalarTy ExactSize)
Definition TypeSize.h:343
static constexpr TypeSize getZero()
Definition TypeSize.h:349
static constexpr TypeSize getScalable(ScalarTy MinimumSize)
Definition TypeSize.h:346
self_iterator getIterator()
Definition ilist_node.h:123
A raw_ostream that writes to an std::string.
#define llvm_unreachable(msg)
Marks that the current location is not supposed to be reachable.
@ C
The default llvm calling convention, compatible with C.
Definition CallingConv.h:34
CondCode getInverseBranchCondition(CondCode)
unsigned getInverseBranchOpcode(unsigned BCC)
unsigned getBrCond(CondCode CC, unsigned SelectOpc=0)
static bool isValidRoundingMode(unsigned Mode)
static StringRef roundingModeToString(RoundingMode RndMode)
static unsigned getVecPolicyOpNum(const MCInstrDesc &Desc)
static bool usesMaskPolicy(uint64_t TSFlags)
static bool hasRoundModeOp(uint64_t TSFlags)
static unsigned getVLOpNum(const MCInstrDesc &Desc)
static bool hasVLOp(uint64_t TSFlags)
static MCRegister getTailExpandUseRegNo(const FeatureBitset &FeatureBits)
static int getFRMOpNum(const MCInstrDesc &Desc)
static int getVXRMOpNum(const MCInstrDesc &Desc)
static bool hasVecPolicyOp(uint64_t TSFlags)
static bool usesVXRM(uint64_t TSFlags)
static bool isRVVWideningReduction(uint64_t TSFlags)
static unsigned getSEWOpNum(const MCInstrDesc &Desc)
static bool hasSEWOp(uint64_t TSFlags)
static bool isFirstDefTiedToFirstUse(const MCInstrDesc &Desc)
InstSeq generateInstSeq(int64_t Val, const MCSubtargetInfo &STI)
SmallVector< Inst, 8 > InstSeq
Definition RISCVMatInt.h:43
@ OPERAND_UIMMLOG2XLEN_NONZERO
@ OPERAND_UIMM10_LSB00_NONZERO
@ OPERAND_SIMM10_LSB0000_NONZERO
static unsigned getNF(uint8_t TSFlags)
static RISCVVType::VLMUL getLMul(uint8_t TSFlags)
static bool isTailAgnostic(unsigned VType)
LLVM_ABI void printXSfmmVType(unsigned VType, raw_ostream &OS)
LLVM_ABI std::pair< unsigned, bool > decodeVLMUL(VLMUL VLMul)
static bool isValidSEW(unsigned SEW)
static bool isValidVType(unsigned VType)
LLVM_ABI void printVType(unsigned VType, raw_ostream &OS)
static bool isValidXSfmmVType(unsigned VTypeI)
static unsigned getSEW(unsigned VType)
static VLMUL getVLMUL(unsigned VType)
static bool isValidRoundingMode(unsigned Mode)
static StringRef roundingModeToString(RoundingMode RndMode)
bool hasEqualFRM(const MachineInstr &MI1, const MachineInstr &MI2)
bool isVLKnownLE(const MachineOperand &LHS, const MachineOperand &RHS)
Given two VL operands, do we know that LHS <= RHS?
bool isValidYBNDSWImm(int64_t Imm)
unsigned getRVVMCOpcode(unsigned RVVPseudoOpcode)
unsigned getDestLog2EEW(const MCInstrDesc &Desc, unsigned Log2SEW)
std::optional< unsigned > getVectorLowDemandedScalarBits(unsigned Opcode, unsigned Log2SEW)
std::optional< std::pair< unsigned, unsigned > > isRVVSpillForZvlsseg(unsigned Opcode)
static constexpr unsigned RVVBitsPerBlock
bool isRVVSpill(const MachineInstr &MI)
static constexpr unsigned RVVBytesPerBlock
static constexpr int64_t VLMaxSentinel
bool isVectorCopy(const TargetRegisterInfo *TRI, const MachineInstr &MI)
Return true if MI is a copy that will be lowered to one or more vmvNr.vs.
ValuesClass values(OptsTy... Options)
Helper to build a ValuesClass by forwarding a variable number of arguments as an initializer list to ...
initializer< Ty > init(const Ty &Val)
InstrType
Represents how an instruction should be mapped by the outliner.
This is an optimization pass for GlobalISel generic memory operations.
auto drop_begin(T &&RangeOrContainer, size_t N=1)
Return a range covering RangeOrContainer with the first N elements excluded.
Definition STLExtras.h:315
@ Offset
Definition DWP.cpp:558
@ SHXADD_ADD_SLLI_OP2
@ SHXADD_ADD_SLLI_OP1
MachineTraceStrategy
Strategies for selecting traces.
@ TS_MinInstrCount
Select the trace through a block that has the fewest instructions.
@ TS_Local
Select the trace that contains only the current basic block.
bool all_of(R &&range, UnaryPredicate P)
Provide wrappers to std::all_of which take ranges instead of having to pass begin/end explicitly.
Definition STLExtras.h:1738
static const MachineMemOperand::Flags MONontemporalBit1
MachineInstrBuilder BuildMI(MachineFunction &MF, const MIMetadata &MIMD, const MCInstrDesc &MCID)
Builder interface. Specify how to create the initial instruction itself.
constexpr bool isInt(int64_t x)
Checks if an integer fits into the given bit width.
Definition MathExtras.h:165
RegState
Flags to represent properties of register accesses.
@ Implicit
Not emitted register (e.g. carry, or temporary result).
@ Dead
Unused definition.
@ Kill
The last use of a register.
@ Undef
Value of the register doesn't matter.
@ Define
Register definition.
auto enumerate(FirstRange &&First, RestRanges &&...Rest)
Given two or more input ranges, returns a new range whose values are tuples (A, B,...
Definition STLExtras.h:2553
bool isValidAtomicOrdering(Int I)
constexpr RegState getKillRegState(bool B)
static const MachineMemOperand::Flags MONontemporalBit0
constexpr RegState getDeadRegState(bool B)
LLVM_ABI void reportFatalInternalError(Error Err)
Report a fatal error that indicates a bug in LLVM.
Definition Error.cpp:173
Op::Description Desc
unsigned M1(unsigned Val)
Definition VE.h:377
constexpr bool has_single_bit(T Value) noexcept
Definition bit.h:149
unsigned Log2_32(uint32_t Value)
Return the floor log base 2 of the specified value, -1 if the value is zero.
Definition MathExtras.h:331
MachineInstr * getImm(const MachineOperand &MO, const MachineRegisterInfo *MRI)
constexpr RegState getRenamableRegState(bool B)
decltype(auto) get(const PointerIntPair< PointerTy, IntBits, IntType, PtrTraits, Info > &Pair)
LLVM_ABI raw_ostream & dbgs()
dbgs() - This returns a reference to a raw_ostream for debugging messages.
Definition Debug.cpp:209
LLVM_ABI void report_fatal_error(Error Err, bool gen_crash_diag=true)
Definition Error.cpp:163
constexpr RegState getDefRegState(bool B)
CombinerObjective
The combiner's goal may differ based on which pattern it is attempting to optimize.
constexpr bool isUInt(uint64_t x)
Checks if an unsigned integer fits into the given bit width.
Definition MathExtras.h:189
CodeGenOptLevel
Code generation optimization level.
Definition CodeGen.h:82
int isShifted359(T Value, int &Shift)
bool isa(const From &Val)
isa<X> - Return true if the parameter to the template is an instance of one of the template type argu...
Definition Casting.h:547
uint16_t MCPhysReg
An unsigned integer type large enough to represent all physical registers, but not necessarily virtua...
Definition MCRegister.h:21
DWARFExpression::Operation Op
ArrayRef(const T &OneElt) -> ArrayRef< T >
constexpr bool isShiftedInt(int64_t x)
Checks if a signed integer is an N bit number shifted left by S.
Definition MathExtras.h:182
void erase_if(Container &C, UnaryPredicate P)
Provide a container algorithm similar to C++ Library Fundamentals v2's erase_if which is equivalent t...
Definition STLExtras.h:2191
constexpr int64_t SignExtend64(uint64_t x)
Sign-extend the number in the bottom B bits of X to a 64-bit integer.
Definition MathExtras.h:572
LLVM_ABI const Value * getUnderlyingObject(const Value *V, unsigned MaxLookup=MaxLookupSearchDepth)
This method strips off any GEP address adjustments, pointer casts or llvm.threadlocal....
constexpr bool isShiftedUInt(uint64_t x)
Checks if a unsigned integer is an N bit number shifted left by S.
Definition MathExtras.h:198
void swap(llvm::BitVector &LHS, llvm::BitVector &RHS)
Implement std::swap in terms of BitVector swap.
Definition BitVector.h:862
#define N
This struct is a compact representation of a valid (non-zero power of two) alignment.
Definition Alignment.h:39
Used to describe addressing mode similar to ExtAddrMode in CodeGenPrepare.
This represents a simple continuous liveness interval for a value.
static LLVM_ABI MachinePointerInfo getFixedStack(MachineFunction &MF, int FI, int64_t Offset=0)
Return a MachinePointerInfo record that refers to the specified FrameIndex.
static bool isRVVRegClass(const TargetRegisterClass *RC)
Used to describe a register and immediate addition.
An individual sequence of instructions to be replaced with a call to an outlined function.
MachineFunction * getMF() const
The information necessary to create an outlined function for some class of candidate.