LLVM 23.0.0git
RISCVInstrInfo.cpp
Go to the documentation of this file.
1//===-- RISCVInstrInfo.cpp - RISC-V Instruction Information -----*- C++ -*-===//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7//===----------------------------------------------------------------------===//
8//
9// This file contains the RISC-V implementation of the TargetInstrInfo class.
10//
11//===----------------------------------------------------------------------===//
12
13#include "RISCVInstrInfo.h"
16#include "RISCV.h"
18#include "RISCVSubtarget.h"
19#include "llvm/ADT/STLExtras.h"
21#include "llvm/ADT/Statistic.h"
33#include "llvm/IR/Module.h"
34#include "llvm/MC/MCDwarf.h"
38
39using namespace llvm;
40
41#define GEN_CHECK_COMPRESS_INSTR
42#include "RISCVGenCompressInstEmitter.inc"
43
44#define GET_INSTRINFO_CTOR_DTOR
45#include "RISCVGenInstrInfo.inc"
46
47#define DEBUG_TYPE "riscv-instr-info"
48STATISTIC(NumVRegSpilled,
49 "Number of registers within vector register groups spilled");
50STATISTIC(NumVRegReloaded,
51 "Number of registers within vector register groups reloaded");
52
54 "riscv-prefer-whole-register-move", cl::init(false), cl::Hidden,
55 cl::desc("Prefer whole register move for vector registers."));
56
58 "riscv-force-machine-combiner-strategy", cl::Hidden,
59 cl::desc("Force machine combiner to use a specific strategy for machine "
60 "trace metrics evaluation."),
63 "Local strategy."),
65 "MinInstrCount strategy.")));
66
68 "riscv-outliner-regsave", cl::init(true), cl::Hidden,
69 cl::desc("Enable RegSave strategy in machine outliner (save X5 to a "
70 "temporary register when X5 is live across outlined calls)."));
71
73
74using namespace RISCV;
75
76#define GET_RISCVVPseudosTable_IMPL
77#include "RISCVGenSearchableTables.inc"
78
79} // namespace llvm::RISCVVPseudosTable
80
81namespace llvm::RISCV {
82
83#define GET_RISCVMaskedPseudosTable_IMPL
84#include "RISCVGenSearchableTables.inc"
85
86} // end namespace llvm::RISCV
87
89 : RISCVGenInstrInfo(STI, RegInfo, RISCV::ADJCALLSTACKDOWN,
90 RISCV::ADJCALLSTACKUP),
91 RegInfo(STI.getHwMode()), STI(STI) {}
92
93#define GET_INSTRINFO_HELPERS
94#include "RISCVGenInstrInfo.inc"
95
97 if (STI.hasStdExtZca())
98 return MCInstBuilder(RISCV::C_NOP);
99 return MCInstBuilder(RISCV::ADDI)
100 .addReg(RISCV::X0)
101 .addReg(RISCV::X0)
102 .addImm(0);
103}
104
106 int &FrameIndex) const {
107 TypeSize Dummy = TypeSize::getZero();
108 return isLoadFromStackSlot(MI, FrameIndex, Dummy);
109}
110
111static std::optional<unsigned> getLMULForRVVWholeLoadStore(unsigned Opcode) {
112 switch (Opcode) {
113 default:
114 return std::nullopt;
115 case RISCV::VS1R_V:
116 case RISCV::VL1RE8_V:
117 case RISCV::VL1RE16_V:
118 case RISCV::VL1RE32_V:
119 case RISCV::VL1RE64_V:
120 return 1;
121 case RISCV::VS2R_V:
122 case RISCV::VL2RE8_V:
123 case RISCV::VL2RE16_V:
124 case RISCV::VL2RE32_V:
125 case RISCV::VL2RE64_V:
126 return 2;
127 case RISCV::VS4R_V:
128 case RISCV::VL4RE8_V:
129 case RISCV::VL4RE16_V:
130 case RISCV::VL4RE32_V:
131 case RISCV::VL4RE64_V:
132 return 4;
133 case RISCV::VS8R_V:
134 case RISCV::VL8RE8_V:
135 case RISCV::VL8RE16_V:
136 case RISCV::VL8RE32_V:
137 case RISCV::VL8RE64_V:
138 return 8;
139 }
140}
141
143 int &FrameIndex,
144 TypeSize &MemBytes) const {
145 switch (MI.getOpcode()) {
146 default:
147 return 0;
148 case RISCV::LB:
149 case RISCV::LBU:
150 MemBytes = TypeSize::getFixed(1);
151 break;
152 case RISCV::LH:
153 case RISCV::LH_INX:
154 case RISCV::LHU:
155 case RISCV::FLH:
156 MemBytes = TypeSize::getFixed(2);
157 break;
158 case RISCV::LW:
159 case RISCV::LW_INX:
160 case RISCV::FLW:
161 case RISCV::LWU:
162 MemBytes = TypeSize::getFixed(4);
163 break;
164 case RISCV::LD:
165 case RISCV::LD_RV32:
166 case RISCV::FLD:
167 MemBytes = TypeSize::getFixed(8);
168 break;
169 case RISCV::VL1RE8_V:
170 case RISCV::VL2RE8_V:
171 case RISCV::VL4RE8_V:
172 case RISCV::VL8RE8_V:
173 if (!MI.getOperand(1).isFI())
174 return Register();
175 FrameIndex = MI.getOperand(1).getIndex();
176 unsigned LMUL = *getLMULForRVVWholeLoadStore(MI.getOpcode());
178 return MI.getOperand(0).getReg();
179 }
180
181 if (MI.getOperand(1).isFI() && MI.getOperand(2).isImm() &&
182 MI.getOperand(2).getImm() == 0) {
183 FrameIndex = MI.getOperand(1).getIndex();
184 return MI.getOperand(0).getReg();
185 }
186
187 return 0;
188}
189
191 int &FrameIndex) const {
192 TypeSize Dummy = TypeSize::getZero();
193 return isStoreToStackSlot(MI, FrameIndex, Dummy);
194}
195
197 int &FrameIndex,
198 TypeSize &MemBytes) const {
199 switch (MI.getOpcode()) {
200 default:
201 return 0;
202 case RISCV::SB:
203 MemBytes = TypeSize::getFixed(1);
204 break;
205 case RISCV::SH:
206 case RISCV::SH_INX:
207 case RISCV::FSH:
208 MemBytes = TypeSize::getFixed(2);
209 break;
210 case RISCV::SW:
211 case RISCV::SW_INX:
212 case RISCV::FSW:
213 MemBytes = TypeSize::getFixed(4);
214 break;
215 case RISCV::SD:
216 case RISCV::SD_RV32:
217 case RISCV::FSD:
218 MemBytes = TypeSize::getFixed(8);
219 break;
220 case RISCV::VS1R_V:
221 case RISCV::VS2R_V:
222 case RISCV::VS4R_V:
223 case RISCV::VS8R_V:
224 if (!MI.getOperand(1).isFI())
225 return Register();
226 FrameIndex = MI.getOperand(1).getIndex();
227 unsigned LMUL = *getLMULForRVVWholeLoadStore(MI.getOpcode());
229 return MI.getOperand(0).getReg();
230 }
231
232 if (MI.getOperand(1).isFI() && MI.getOperand(2).isImm() &&
233 MI.getOperand(2).getImm() == 0) {
234 FrameIndex = MI.getOperand(1).getIndex();
235 return MI.getOperand(0).getReg();
236 }
237
238 return 0;
239}
240
242 const MachineInstr &MI) const {
243 switch (RISCV::getRVVMCOpcode(MI.getOpcode())) {
244 case RISCV::VMV_V_X:
245 case RISCV::VFMV_V_F:
246 case RISCV::VMV_V_I:
247 case RISCV::VMV_S_X:
248 case RISCV::VFMV_S_F:
249 case RISCV::VID_V:
250 return MI.getOperand(1).isUndef();
251 default:
253 }
254}
255
256static bool forwardCopyWillClobberTuple(unsigned DstReg, unsigned SrcReg,
257 unsigned NumRegs) {
258 return DstReg > SrcReg && (DstReg - SrcReg) < NumRegs;
259}
260
262 const MachineBasicBlock &MBB,
265 RISCVVType::VLMUL LMul) {
267 return false;
268
269 assert(MBBI->getOpcode() == TargetOpcode::COPY &&
270 "Unexpected COPY instruction.");
271 Register SrcReg = MBBI->getOperand(1).getReg();
273
274 bool FoundDef = false;
275 bool FirstVSetVLI = false;
276 unsigned FirstSEW = 0;
277 while (MBBI != MBB.begin()) {
278 --MBBI;
279 if (MBBI->isMetaInstruction())
280 continue;
281
282 if (RISCVInstrInfo::isVectorConfigInstr(*MBBI)) {
283 // There is a vsetvli between COPY and source define instruction.
284 // vy = def_vop ... (producing instruction)
285 // ...
286 // vsetvli
287 // ...
288 // vx = COPY vy
289 if (!FoundDef) {
290 if (!FirstVSetVLI) {
291 FirstVSetVLI = true;
292 unsigned FirstVType = MBBI->getOperand(2).getImm();
293 RISCVVType::VLMUL FirstLMul = RISCVVType::getVLMUL(FirstVType);
294 FirstSEW = RISCVVType::getSEW(FirstVType);
295 // The first encountered vsetvli must have the same lmul as the
296 // register class of COPY.
297 if (FirstLMul != LMul)
298 return false;
299 }
300 // Only permit `vsetvli x0, x0, vtype` between COPY and the source
301 // define instruction.
302 if (!RISCVInstrInfo::isVLPreservingConfig(*MBBI))
303 return false;
304 continue;
305 }
306
307 // MBBI is the first vsetvli before the producing instruction.
308 unsigned VType = MBBI->getOperand(2).getImm();
309 // If there is a vsetvli between COPY and the producing instruction.
310 if (FirstVSetVLI) {
311 // If SEW is different, return false.
312 if (RISCVVType::getSEW(VType) != FirstSEW)
313 return false;
314 }
315
316 // If the vsetvli is tail undisturbed, keep the whole register move.
317 if (!RISCVVType::isTailAgnostic(VType))
318 return false;
319
320 // The checking is conservative. We only have register classes for
321 // LMUL = 1/2/4/8. We should be able to convert vmv1r.v to vmv.v.v
322 // for fractional LMUL operations. However, we could not use the vsetvli
323 // lmul for widening operations. The result of widening operation is
324 // 2 x LMUL.
325 return LMul == RISCVVType::getVLMUL(VType);
326 } else if (MBBI->isInlineAsm() || MBBI->isCall()) {
327 return false;
328 } else if (MBBI->getNumDefs()) {
329 // Check all the instructions which will change VL.
330 // For example, vleff has implicit def VL.
331 if (MBBI->modifiesRegister(RISCV::VL, /*TRI=*/nullptr))
332 return false;
333
334 // Only converting whole register copies to vmv.v.v when the defining
335 // value appears in the explicit operands.
336 for (const MachineOperand &MO : MBBI->explicit_operands()) {
337 if (!MO.isReg() || !MO.isDef())
338 continue;
339 if (!FoundDef && TRI->regsOverlap(MO.getReg(), SrcReg)) {
340 // We only permit the source of COPY has the same LMUL as the defined
341 // operand.
342 // There are cases we need to keep the whole register copy if the LMUL
343 // is different.
344 // For example,
345 // $x0 = PseudoVSETIVLI 4, 73 // vsetivli zero, 4, e16,m2,ta,m
346 // $v28m4 = PseudoVWADD_VV_M2 $v26m2, $v8m2
347 // # The COPY may be created by vlmul_trunc intrinsic.
348 // $v26m2 = COPY renamable $v28m2, implicit killed $v28m4
349 //
350 // After widening, the valid value will be 4 x e32 elements. If we
351 // convert the COPY to vmv.v.v, it will only copy 4 x e16 elements.
352 // FIXME: The COPY of subregister of Zvlsseg register will not be able
353 // to convert to vmv.v.[v|i] under the constraint.
354 if (MO.getReg() != SrcReg)
355 return false;
356
357 // In widening reduction instructions with LMUL_1 input vector case,
358 // only checking the LMUL is insufficient due to reduction result is
359 // always LMUL_1.
360 // For example,
361 // $x11 = PseudoVSETIVLI 1, 64 // vsetivli a1, 1, e8, m1, ta, mu
362 // $v8m1 = PseudoVWREDSUM_VS_M1 $v26, $v27
363 // $v26 = COPY killed renamable $v8
364 // After widening, The valid value will be 1 x e16 elements. If we
365 // convert the COPY to vmv.v.v, it will only copy 1 x e8 elements.
366 uint64_t TSFlags = MBBI->getDesc().TSFlags;
368 return false;
369
370 // If the producing instruction does not depend on vsetvli, do not
371 // convert COPY to vmv.v.v. For example, VL1R_V or PseudoVRELOAD.
372 if (!RISCVII::hasSEWOp(TSFlags) || !RISCVII::hasVLOp(TSFlags))
373 return false;
374
375 // Found the definition.
376 FoundDef = true;
377 DefMBBI = MBBI;
378 break;
379 }
380 }
381 }
382 }
383
384 return false;
385}
386
389 const DebugLoc &DL, MCRegister DstReg, MCRegister SrcReg, bool KillSrc,
390 const TargetRegisterClass *RegClass) const {
391 const RISCVRegisterInfo *TRI = STI.getRegisterInfo();
393 unsigned NF = RISCVRI::getNF(RegClass->TSFlags);
394
395 uint16_t SrcEncoding = TRI->getEncodingValue(SrcReg);
396 uint16_t DstEncoding = TRI->getEncodingValue(DstReg);
397 auto [LMulVal, Fractional] = RISCVVType::decodeVLMUL(LMul);
398 assert(!Fractional && "It is impossible be fractional lmul here.");
399 unsigned NumRegs = NF * LMulVal;
400 bool ReversedCopy =
401 forwardCopyWillClobberTuple(DstEncoding, SrcEncoding, NumRegs);
402 if (ReversedCopy) {
403 // If the src and dest overlap when copying a tuple, we need to copy the
404 // registers in reverse.
405 SrcEncoding += NumRegs - 1;
406 DstEncoding += NumRegs - 1;
407 }
408
409 unsigned I = 0;
410 auto GetCopyInfo = [&](uint16_t SrcEncoding, uint16_t DstEncoding)
411 -> std::tuple<RISCVVType::VLMUL, const TargetRegisterClass &, unsigned,
412 unsigned, unsigned> {
413 if (ReversedCopy) {
414 // For reversed copying, if there are enough aligned registers(8/4/2), we
415 // can do a larger copy(LMUL8/4/2).
416 // Besides, we have already known that DstEncoding is larger than
417 // SrcEncoding in forwardCopyWillClobberTuple, so the difference between
418 // DstEncoding and SrcEncoding should be >= LMUL value we try to use to
419 // avoid clobbering.
420 uint16_t Diff = DstEncoding - SrcEncoding;
421 if (I + 8 <= NumRegs && Diff >= 8 && SrcEncoding % 8 == 7 &&
422 DstEncoding % 8 == 7)
423 return {RISCVVType::LMUL_8, RISCV::VRM8RegClass, RISCV::VMV8R_V,
424 RISCV::PseudoVMV_V_V_M8, RISCV::PseudoVMV_V_I_M8};
425 if (I + 4 <= NumRegs && Diff >= 4 && SrcEncoding % 4 == 3 &&
426 DstEncoding % 4 == 3)
427 return {RISCVVType::LMUL_4, RISCV::VRM4RegClass, RISCV::VMV4R_V,
428 RISCV::PseudoVMV_V_V_M4, RISCV::PseudoVMV_V_I_M4};
429 if (I + 2 <= NumRegs && Diff >= 2 && SrcEncoding % 2 == 1 &&
430 DstEncoding % 2 == 1)
431 return {RISCVVType::LMUL_2, RISCV::VRM2RegClass, RISCV::VMV2R_V,
432 RISCV::PseudoVMV_V_V_M2, RISCV::PseudoVMV_V_I_M2};
433 // Or we should do LMUL1 copying.
434 return {RISCVVType::LMUL_1, RISCV::VRRegClass, RISCV::VMV1R_V,
435 RISCV::PseudoVMV_V_V_M1, RISCV::PseudoVMV_V_I_M1};
436 }
437
438 // For forward copying, if source register encoding and destination register
439 // encoding are aligned to 8/4/2, we can do a LMUL8/4/2 copying.
440 if (I + 8 <= NumRegs && SrcEncoding % 8 == 0 && DstEncoding % 8 == 0)
441 return {RISCVVType::LMUL_8, RISCV::VRM8RegClass, RISCV::VMV8R_V,
442 RISCV::PseudoVMV_V_V_M8, RISCV::PseudoVMV_V_I_M8};
443 if (I + 4 <= NumRegs && SrcEncoding % 4 == 0 && DstEncoding % 4 == 0)
444 return {RISCVVType::LMUL_4, RISCV::VRM4RegClass, RISCV::VMV4R_V,
445 RISCV::PseudoVMV_V_V_M4, RISCV::PseudoVMV_V_I_M4};
446 if (I + 2 <= NumRegs && SrcEncoding % 2 == 0 && DstEncoding % 2 == 0)
447 return {RISCVVType::LMUL_2, RISCV::VRM2RegClass, RISCV::VMV2R_V,
448 RISCV::PseudoVMV_V_V_M2, RISCV::PseudoVMV_V_I_M2};
449 // Or we should do LMUL1 copying.
450 return {RISCVVType::LMUL_1, RISCV::VRRegClass, RISCV::VMV1R_V,
451 RISCV::PseudoVMV_V_V_M1, RISCV::PseudoVMV_V_I_M1};
452 };
453
454 while (I != NumRegs) {
455 // For non-segment copying, we only do this once as the registers are always
456 // aligned.
457 // For segment copying, we may do this several times. If the registers are
458 // aligned to larger LMUL, we can eliminate some copyings.
459 auto [LMulCopied, RegClass, Opc, VVOpc, VIOpc] =
460 GetCopyInfo(SrcEncoding, DstEncoding);
461 auto [NumCopied, _] = RISCVVType::decodeVLMUL(LMulCopied);
462
464 if (LMul == LMulCopied &&
465 isConvertibleToVMV_V_V(STI, MBB, MBBI, DefMBBI, LMul)) {
466 Opc = VVOpc;
467 if (DefMBBI->getOpcode() == VIOpc)
468 Opc = VIOpc;
469 }
470
471 // Emit actual copying.
472 // For reversed copying, the encoding should be decreased.
473 MCRegister ActualSrcReg = TRI->findVRegWithEncoding(
474 RegClass, ReversedCopy ? (SrcEncoding - NumCopied + 1) : SrcEncoding);
475 MCRegister ActualDstReg = TRI->findVRegWithEncoding(
476 RegClass, ReversedCopy ? (DstEncoding - NumCopied + 1) : DstEncoding);
477
478 auto MIB = BuildMI(MBB, MBBI, DL, get(Opc), ActualDstReg);
479 bool UseVMV_V_I = RISCV::getRVVMCOpcode(Opc) == RISCV::VMV_V_I;
480 bool UseVMV = UseVMV_V_I || RISCV::getRVVMCOpcode(Opc) == RISCV::VMV_V_V;
481 if (UseVMV)
482 MIB.addReg(ActualDstReg, RegState::Undef);
483 if (UseVMV_V_I)
484 MIB = MIB.add(DefMBBI->getOperand(2));
485 else
486 MIB = MIB.addReg(ActualSrcReg, getKillRegState(KillSrc));
487 if (UseVMV) {
488 const MCInstrDesc &Desc = DefMBBI->getDesc();
489 MIB.add(DefMBBI->getOperand(RISCVII::getVLOpNum(Desc))); // AVL
490 unsigned Log2SEW =
491 DefMBBI->getOperand(RISCVII::getSEWOpNum(Desc)).getImm();
492 MIB.addImm(Log2SEW ? Log2SEW : 3); // SEW
493 MIB.addImm(0); // tu, mu
494 MIB.addReg(RISCV::VL, RegState::Implicit);
495 MIB.addReg(RISCV::VTYPE, RegState::Implicit);
496 }
497 // Add an implicit read of the original source to silence the verifier
498 // in the cases where some of the smaller VRs we're copying from might be
499 // undef, caused by the fact that the original, larger source VR might not
500 // be fully initialized at the time this COPY happens.
501 MIB.addReg(SrcReg, RegState::Implicit);
502
503 // If we are copying reversely, we should decrease the encoding.
504 SrcEncoding += (ReversedCopy ? -NumCopied : NumCopied);
505 DstEncoding += (ReversedCopy ? -NumCopied : NumCopied);
506 I += NumCopied;
507 }
508}
509
512 const DebugLoc &DL, Register DstReg,
513 Register SrcReg, bool KillSrc,
514 bool RenamableDest, bool RenamableSrc) const {
515 const TargetRegisterInfo *TRI = STI.getRegisterInfo();
516 RegState KillFlag = getKillRegState(KillSrc);
517
518 if (RISCV::GPRRegClass.contains(DstReg, SrcReg)) {
519 BuildMI(MBB, MBBI, DL, get(RISCV::ADDI), DstReg)
520 .addReg(SrcReg, KillFlag | getRenamableRegState(RenamableSrc))
521 .addImm(0);
522 return;
523 }
524
525 if (RISCV::GPRF16RegClass.contains(DstReg, SrcReg)) {
526 BuildMI(MBB, MBBI, DL, get(RISCV::PseudoMV_FPR16INX), DstReg)
527 .addReg(SrcReg, KillFlag | getRenamableRegState(RenamableSrc));
528 return;
529 }
530
531 if (RISCV::GPRF32RegClass.contains(DstReg, SrcReg)) {
532 BuildMI(MBB, MBBI, DL, get(RISCV::PseudoMV_FPR32INX), DstReg)
533 .addReg(SrcReg, KillFlag | getRenamableRegState(RenamableSrc));
534 return;
535 }
536
537 if (RISCV::GPRPairRegClass.contains(DstReg, SrcReg)) {
538 if (STI.isRV32()) {
539 if (STI.hasStdExtZdinx()) {
540 // On RV32_Zdinx, FMV.D will move a pair of registers to another pair of
541 // registers, in one instruction.
542 BuildMI(MBB, MBBI, DL, get(RISCV::FSGNJ_D_IN32X), DstReg)
543 .addReg(SrcReg, getRenamableRegState(RenamableSrc))
544 .addReg(SrcReg, KillFlag | getRenamableRegState(RenamableSrc));
545 return;
546 }
547
548 if (STI.hasStdExtP()) {
549 // On RV32P, `padd.dw` is a GPR Pair Add
550 BuildMI(MBB, MBBI, DL, get(RISCV::PADD_DW), DstReg)
551 .addReg(SrcReg, KillFlag | getRenamableRegState(RenamableSrc))
552 .addReg(RISCV::X0_Pair);
553 return;
554 }
555 }
556
557 MCRegister EvenReg = TRI->getSubReg(SrcReg, RISCV::sub_gpr_even);
558 MCRegister OddReg = TRI->getSubReg(SrcReg, RISCV::sub_gpr_odd);
559 // We need to correct the odd register of X0_Pair.
560 if (OddReg == RISCV::DUMMY_REG_PAIR_WITH_X0)
561 OddReg = RISCV::X0;
562 assert(DstReg != RISCV::X0_Pair && "Cannot write to X0_Pair");
563
564 // Emit an ADDI for both parts of GPRPair.
565 BuildMI(MBB, MBBI, DL, get(RISCV::ADDI),
566 TRI->getSubReg(DstReg, RISCV::sub_gpr_even))
567 .addReg(EvenReg, KillFlag)
568 .addImm(0);
569 BuildMI(MBB, MBBI, DL, get(RISCV::ADDI),
570 TRI->getSubReg(DstReg, RISCV::sub_gpr_odd))
571 .addReg(OddReg, KillFlag)
572 .addImm(0);
573 return;
574 }
575
576 // Handle copy from csr
577 if (RISCV::VCSRRegClass.contains(SrcReg) &&
578 RISCV::GPRRegClass.contains(DstReg)) {
579 BuildMI(MBB, MBBI, DL, get(RISCV::CSRRS), DstReg)
580 .addImm(RISCVSysReg::lookupSysRegByName(TRI->getName(SrcReg))->Encoding)
581 .addReg(RISCV::X0);
582 return;
583 }
584
585 if (RISCV::FPR16RegClass.contains(DstReg, SrcReg)) {
586 unsigned Opc;
587 if (STI.hasStdExtZfh()) {
588 Opc = RISCV::FSGNJ_H;
589 } else {
590 assert(STI.hasStdExtF() &&
591 (STI.hasStdExtZfhmin() || STI.hasStdExtZfbfmin()) &&
592 "Unexpected extensions");
593 // Zfhmin/Zfbfmin doesn't have FSGNJ_H, replace FSGNJ_H with FSGNJ_S.
594 DstReg = TRI->getMatchingSuperReg(DstReg, RISCV::sub_16,
595 &RISCV::FPR32RegClass);
596 SrcReg = TRI->getMatchingSuperReg(SrcReg, RISCV::sub_16,
597 &RISCV::FPR32RegClass);
598 Opc = RISCV::FSGNJ_S;
599 }
600 BuildMI(MBB, MBBI, DL, get(Opc), DstReg)
601 .addReg(SrcReg, KillFlag)
602 .addReg(SrcReg, KillFlag);
603 return;
604 }
605
606 if (RISCV::FPR32RegClass.contains(DstReg, SrcReg)) {
607 BuildMI(MBB, MBBI, DL, get(RISCV::FSGNJ_S), DstReg)
608 .addReg(SrcReg, KillFlag)
609 .addReg(SrcReg, KillFlag);
610 return;
611 }
612
613 if (RISCV::FPR64RegClass.contains(DstReg, SrcReg)) {
614 BuildMI(MBB, MBBI, DL, get(RISCV::FSGNJ_D), DstReg)
615 .addReg(SrcReg, KillFlag)
616 .addReg(SrcReg, KillFlag);
617 return;
618 }
619
620 if (RISCV::FPR32RegClass.contains(DstReg) &&
621 RISCV::GPRRegClass.contains(SrcReg)) {
622 BuildMI(MBB, MBBI, DL, get(RISCV::FMV_W_X), DstReg)
623 .addReg(SrcReg, KillFlag);
624 return;
625 }
626
627 if (RISCV::GPRRegClass.contains(DstReg) &&
628 RISCV::FPR32RegClass.contains(SrcReg)) {
629 BuildMI(MBB, MBBI, DL, get(RISCV::FMV_X_W), DstReg)
630 .addReg(SrcReg, KillFlag);
631 return;
632 }
633
634 if (RISCV::FPR64RegClass.contains(DstReg) &&
635 RISCV::GPRRegClass.contains(SrcReg)) {
636 assert(STI.getXLen() == 64 && "Unexpected GPR size");
637 BuildMI(MBB, MBBI, DL, get(RISCV::FMV_D_X), DstReg)
638 .addReg(SrcReg, KillFlag);
639 return;
640 }
641
642 if (RISCV::GPRRegClass.contains(DstReg) &&
643 RISCV::FPR64RegClass.contains(SrcReg)) {
644 assert(STI.getXLen() == 64 && "Unexpected GPR size");
645 BuildMI(MBB, MBBI, DL, get(RISCV::FMV_X_D), DstReg)
646 .addReg(SrcReg, KillFlag);
647 return;
648 }
649
650 // VR->VR copies.
651 const TargetRegisterClass *RegClass =
652 TRI->getCommonMinimalPhysRegClass(SrcReg, DstReg);
653 if (RISCVRegisterInfo::isRVVRegClass(RegClass)) {
654 copyPhysRegVector(MBB, MBBI, DL, DstReg, SrcReg, KillSrc, RegClass);
655 return;
656 }
657
658 llvm_unreachable("Impossible reg-to-reg copy");
659}
660
663 Register SrcReg, bool IsKill, int FI,
664 const TargetRegisterClass *RC,
665 Register VReg,
666 MachineInstr::MIFlag Flags) const {
667 MachineFunction *MF = MBB.getParent();
668 MachineFrameInfo &MFI = MF->getFrameInfo();
669 Align Alignment = MFI.getObjectAlign(FI);
670
671 unsigned Opcode;
672 if (RISCV::GPRRegClass.hasSubClassEq(RC)) {
673 Opcode = RegInfo.getRegSizeInBits(RISCV::GPRRegClass) == 32 ? RISCV::SW
674 : RISCV::SD;
675 } else if (RISCV::GPRF16RegClass.hasSubClassEq(RC)) {
676 Opcode = RISCV::SH_INX;
677 } else if (RISCV::GPRF32RegClass.hasSubClassEq(RC)) {
678 Opcode = RISCV::SW_INX;
679 } else if (RISCV::GPRPairRegClass.hasSubClassEq(RC)) {
680 if (!STI.is64Bit() && STI.hasStdExtZilsd() &&
681 Alignment >= STI.getZilsdAlign()) {
682 Opcode = RISCV::SD_RV32;
683 } else {
684 Opcode = RISCV::PseudoRV32ZdinxSD;
685 }
686 } else if (RISCV::FPR16RegClass.hasSubClassEq(RC)) {
687 Opcode = RISCV::FSH;
688 } else if (RISCV::FPR32RegClass.hasSubClassEq(RC)) {
689 Opcode = RISCV::FSW;
690 } else if (RISCV::FPR64RegClass.hasSubClassEq(RC)) {
691 Opcode = RISCV::FSD;
692 } else if (RISCV::VRRegClass.hasSubClassEq(RC)) {
693 Opcode = RISCV::VS1R_V;
694 } else if (RISCV::VRM2RegClass.hasSubClassEq(RC)) {
695 Opcode = RISCV::VS2R_V;
696 } else if (RISCV::VRM4RegClass.hasSubClassEq(RC)) {
697 Opcode = RISCV::VS4R_V;
698 } else if (RISCV::VRM8RegClass.hasSubClassEq(RC)) {
699 Opcode = RISCV::VS8R_V;
700 } else if (RISCV::VRN2M1RegClass.hasSubClassEq(RC))
701 Opcode = RISCV::PseudoVSPILL2_M1;
702 else if (RISCV::VRN2M2RegClass.hasSubClassEq(RC))
703 Opcode = RISCV::PseudoVSPILL2_M2;
704 else if (RISCV::VRN2M4RegClass.hasSubClassEq(RC))
705 Opcode = RISCV::PseudoVSPILL2_M4;
706 else if (RISCV::VRN3M1RegClass.hasSubClassEq(RC))
707 Opcode = RISCV::PseudoVSPILL3_M1;
708 else if (RISCV::VRN3M2RegClass.hasSubClassEq(RC))
709 Opcode = RISCV::PseudoVSPILL3_M2;
710 else if (RISCV::VRN4M1RegClass.hasSubClassEq(RC))
711 Opcode = RISCV::PseudoVSPILL4_M1;
712 else if (RISCV::VRN4M2RegClass.hasSubClassEq(RC))
713 Opcode = RISCV::PseudoVSPILL4_M2;
714 else if (RISCV::VRN5M1RegClass.hasSubClassEq(RC))
715 Opcode = RISCV::PseudoVSPILL5_M1;
716 else if (RISCV::VRN6M1RegClass.hasSubClassEq(RC))
717 Opcode = RISCV::PseudoVSPILL6_M1;
718 else if (RISCV::VRN7M1RegClass.hasSubClassEq(RC))
719 Opcode = RISCV::PseudoVSPILL7_M1;
720 else if (RISCV::VRN8M1RegClass.hasSubClassEq(RC))
721 Opcode = RISCV::PseudoVSPILL8_M1;
722 else
723 llvm_unreachable("Can't store this register to stack slot");
724
728 TypeSize::getScalable(MFI.getObjectSize(FI)), Alignment);
729
731 BuildMI(MBB, I, DebugLoc(), get(Opcode))
732 .addReg(SrcReg, getKillRegState(IsKill))
733 .addFrameIndex(FI)
734 .addMemOperand(MMO)
735 .setMIFlag(Flags);
736 NumVRegSpilled += RegInfo.getRegSizeInBits(*RC) / RISCV::RVVBitsPerBlock;
737 } else {
740 MFI.getObjectSize(FI), Alignment);
741
742 BuildMI(MBB, I, DebugLoc(), get(Opcode))
743 .addReg(SrcReg, getKillRegState(IsKill))
744 .addFrameIndex(FI)
745 .addImm(0)
746 .addMemOperand(MMO)
747 .setMIFlag(Flags);
748 }
749}
750
753 Register DstReg, int FI,
754 const TargetRegisterClass *RC,
755 Register VReg, unsigned SubReg,
756 MachineInstr::MIFlag Flags) const {
757 MachineFunction *MF = MBB.getParent();
758 MachineFrameInfo &MFI = MF->getFrameInfo();
759 Align Alignment = MFI.getObjectAlign(FI);
760 DebugLoc DL =
761 Flags & MachineInstr::FrameDestroy ? MBB.findDebugLoc(I) : DebugLoc();
762
763 unsigned Opcode;
764 if (RISCV::GPRRegClass.hasSubClassEq(RC)) {
765 Opcode = RegInfo.getRegSizeInBits(RISCV::GPRRegClass) == 32 ? RISCV::LW
766 : RISCV::LD;
767 } else if (RISCV::GPRF16RegClass.hasSubClassEq(RC)) {
768 Opcode = RISCV::LH_INX;
769 } else if (RISCV::GPRF32RegClass.hasSubClassEq(RC)) {
770 Opcode = RISCV::LW_INX;
771 } else if (RISCV::GPRPairRegClass.hasSubClassEq(RC)) {
772 if (!STI.is64Bit() && STI.hasStdExtZilsd() &&
773 Alignment >= STI.getZilsdAlign()) {
774 Opcode = RISCV::LD_RV32;
775 } else {
776 Opcode = RISCV::PseudoRV32ZdinxLD;
777 }
778 } else if (RISCV::FPR16RegClass.hasSubClassEq(RC)) {
779 Opcode = RISCV::FLH;
780 } else if (RISCV::FPR32RegClass.hasSubClassEq(RC)) {
781 Opcode = RISCV::FLW;
782 } else if (RISCV::FPR64RegClass.hasSubClassEq(RC)) {
783 Opcode = RISCV::FLD;
784 } else if (RISCV::VRRegClass.hasSubClassEq(RC)) {
785 Opcode = RISCV::VL1RE8_V;
786 } else if (RISCV::VRM2RegClass.hasSubClassEq(RC)) {
787 Opcode = RISCV::VL2RE8_V;
788 } else if (RISCV::VRM4RegClass.hasSubClassEq(RC)) {
789 Opcode = RISCV::VL4RE8_V;
790 } else if (RISCV::VRM8RegClass.hasSubClassEq(RC)) {
791 Opcode = RISCV::VL8RE8_V;
792 } else if (RISCV::VRN2M1RegClass.hasSubClassEq(RC))
793 Opcode = RISCV::PseudoVRELOAD2_M1;
794 else if (RISCV::VRN2M2RegClass.hasSubClassEq(RC))
795 Opcode = RISCV::PseudoVRELOAD2_M2;
796 else if (RISCV::VRN2M4RegClass.hasSubClassEq(RC))
797 Opcode = RISCV::PseudoVRELOAD2_M4;
798 else if (RISCV::VRN3M1RegClass.hasSubClassEq(RC))
799 Opcode = RISCV::PseudoVRELOAD3_M1;
800 else if (RISCV::VRN3M2RegClass.hasSubClassEq(RC))
801 Opcode = RISCV::PseudoVRELOAD3_M2;
802 else if (RISCV::VRN4M1RegClass.hasSubClassEq(RC))
803 Opcode = RISCV::PseudoVRELOAD4_M1;
804 else if (RISCV::VRN4M2RegClass.hasSubClassEq(RC))
805 Opcode = RISCV::PseudoVRELOAD4_M2;
806 else if (RISCV::VRN5M1RegClass.hasSubClassEq(RC))
807 Opcode = RISCV::PseudoVRELOAD5_M1;
808 else if (RISCV::VRN6M1RegClass.hasSubClassEq(RC))
809 Opcode = RISCV::PseudoVRELOAD6_M1;
810 else if (RISCV::VRN7M1RegClass.hasSubClassEq(RC))
811 Opcode = RISCV::PseudoVRELOAD7_M1;
812 else if (RISCV::VRN8M1RegClass.hasSubClassEq(RC))
813 Opcode = RISCV::PseudoVRELOAD8_M1;
814 else
815 llvm_unreachable("Can't load this register from stack slot");
816
820 TypeSize::getScalable(MFI.getObjectSize(FI)), Alignment);
821
823 BuildMI(MBB, I, DL, get(Opcode), DstReg)
824 .addFrameIndex(FI)
825 .addMemOperand(MMO)
826 .setMIFlag(Flags);
827 NumVRegReloaded += RegInfo.getRegSizeInBits(*RC) / RISCV::RVVBitsPerBlock;
828 } else {
831 MFI.getObjectSize(FI), Alignment);
832
833 BuildMI(MBB, I, DL, get(Opcode), DstReg)
834 .addFrameIndex(FI)
835 .addImm(0)
836 .addMemOperand(MMO)
837 .setMIFlag(Flags);
838 }
839}
840std::optional<unsigned> getFoldedOpcode(MachineFunction &MF, MachineInstr &MI,
842 const RISCVSubtarget &ST) {
843
844 // The below optimizations narrow the load so they are only valid for little
845 // endian.
846 // TODO: Support big endian by adding an offset into the frame object?
847 if (MF.getDataLayout().isBigEndian())
848 return std::nullopt;
849
850 // Fold load from stack followed by sext.b/sext.h/sext.w/zext.b/zext.h/zext.w.
851 if (Ops.size() != 1 || Ops[0] != 1)
852 return std::nullopt;
853
854 switch (MI.getOpcode()) {
855 default:
856 if (RISCVInstrInfo::isSEXT_W(MI))
857 return RISCV::LW;
858 if (RISCVInstrInfo::isZEXT_W(MI))
859 return RISCV::LWU;
860 if (RISCVInstrInfo::isZEXT_B(MI))
861 return RISCV::LBU;
862 break;
863 case RISCV::SEXT_H:
864 return RISCV::LH;
865 case RISCV::SEXT_B:
866 return RISCV::LB;
867 case RISCV::ZEXT_H_RV32:
868 case RISCV::ZEXT_H_RV64:
869 return RISCV::LHU;
870 }
871
872 switch (RISCV::getRVVMCOpcode(MI.getOpcode())) {
873 default:
874 return std::nullopt;
875 case RISCV::VMV_X_S: {
876 unsigned Log2SEW =
877 MI.getOperand(RISCVII::getSEWOpNum(MI.getDesc())).getImm();
878 if (ST.getXLen() < (1U << Log2SEW))
879 return std::nullopt;
880 switch (Log2SEW) {
881 case 3:
882 return RISCV::LB;
883 case 4:
884 return RISCV::LH;
885 case 5:
886 return RISCV::LW;
887 case 6:
888 return RISCV::LD;
889 default:
890 llvm_unreachable("Unexpected SEW");
891 }
892 }
893 case RISCV::VFMV_F_S: {
894 unsigned Log2SEW =
895 MI.getOperand(RISCVII::getSEWOpNum(MI.getDesc())).getImm();
896 switch (Log2SEW) {
897 case 4:
898 return RISCV::FLH;
899 case 5:
900 return RISCV::FLW;
901 case 6:
902 return RISCV::FLD;
903 default:
904 llvm_unreachable("Unexpected SEW");
905 }
906 }
907 }
908}
909
910// This is the version used during InlineSpiller::spillAroundUses
913 ArrayRef<unsigned> Ops, int FrameIndex,
914 MachineInstr *&CopyMI, LiveIntervals *LIS,
915 VirtRegMap *VRM) const {
917 std::optional<unsigned> LoadOpc = getFoldedOpcode(MF, MI, Ops, STI);
918 if (!LoadOpc)
919 return nullptr;
920 Register DstReg = MI.getOperand(0).getReg();
921 return BuildMI(*MI.getParent(), InsertPt, MI.getDebugLoc(), get(*LoadOpc),
922 DstReg)
923 .addFrameIndex(FrameIndex)
924 .addImm(0);
925}
926
927static unsigned getLoadPredicatedOpcode(unsigned Opcode) {
928 switch (Opcode) {
929 case RISCV::LB:
930 return RISCV::PseudoCCLB;
931 case RISCV::LBU:
932 return RISCV::PseudoCCLBU;
933 case RISCV::LH:
934 return RISCV::PseudoCCLH;
935 case RISCV::LHU:
936 return RISCV::PseudoCCLHU;
937 case RISCV::LW:
938 return RISCV::PseudoCCLW;
939 case RISCV::LWU:
940 return RISCV::PseudoCCLWU;
941 case RISCV::LD:
942 return RISCV::PseudoCCLD;
943 case RISCV::QC_E_LB:
944 return RISCV::PseudoCCQC_E_LB;
945 case RISCV::QC_E_LBU:
946 return RISCV::PseudoCCQC_E_LBU;
947 case RISCV::QC_E_LH:
948 return RISCV::PseudoCCQC_E_LH;
949 case RISCV::QC_E_LHU:
950 return RISCV::PseudoCCQC_E_LHU;
951 case RISCV::QC_E_LW:
952 return RISCV::PseudoCCQC_E_LW;
953 default:
954 return 0;
955 }
956}
957
960 MachineInstr &LoadMI, MachineInstr *&CopyMI, LiveIntervals *LIS,
961 VirtRegMap *VRM) const {
963 // For now, only handle RISCV::PseudoCCMOVGPR.
964 if (MI.getOpcode() != RISCV::PseudoCCMOVGPR)
965 return nullptr;
966
967 unsigned PredOpc = getLoadPredicatedOpcode(LoadMI.getOpcode());
968
969 if (!STI.hasShortForwardBranchILoad() || !PredOpc)
970 return nullptr;
971
973 if (Ops.size() != 1 || (Ops[0] != 1 && Ops[0] != 2))
974 return nullptr;
975
976 bool Invert = Ops[0] == 2;
977 const MachineOperand &FalseReg = MI.getOperand(!Invert ? 2 : 1);
978 Register DestReg = MI.getOperand(0).getReg();
979 const TargetRegisterClass *PreviousClass = MRI.getRegClass(FalseReg.getReg());
980 if (!MRI.constrainRegClass(DestReg, PreviousClass))
981 return nullptr;
982
983 // Create a new predicated version of DefMI.
984 MachineInstrBuilder NewMI = BuildMI(*MI.getParent(), InsertPt,
985 MI.getDebugLoc(), get(PredOpc), DestReg);
986
987 // Copy the false register.
988 NewMI.add(FalseReg);
989
990 // Copy all the DefMI operands.
991 const MCInstrDesc &DefDesc = LoadMI.getDesc();
992 for (unsigned i = 1, e = DefDesc.getNumOperands(); i != e; ++i)
993 NewMI.add(LoadMI.getOperand(i));
994
995 // Add branch opcode, inverting if necessary.
996 unsigned BCC = MI.getOperand(MI.getNumExplicitOperands() - 3).getImm();
997 if (!Invert)
999 NewMI.addImm(BCC);
1000
1001 // Copy condition portion
1002 NewMI.add({MI.getOperand(MI.getNumExplicitOperands() - 2),
1003 MI.getOperand(MI.getNumExplicitOperands() - 1)});
1004 NewMI.cloneMemRefs(LoadMI);
1005 return NewMI;
1006}
1007
1010 const DebugLoc &DL, Register DstReg, uint64_t Val,
1011 MachineInstr::MIFlag Flag, bool DstRenamable,
1012 bool DstIsDead) const {
1013 Register SrcReg = RISCV::X0;
1014
1015 // For RV32, allow a sign or unsigned 32 bit value.
1016 if (!STI.is64Bit() && !isInt<32>(Val)) {
1017 // If have a uimm32 it will still fit in a register so we can allow it.
1018 if (!isUInt<32>(Val))
1019 report_fatal_error("Should only materialize 32-bit constants for RV32");
1020
1021 // Sign extend for generateInstSeq.
1022 Val = SignExtend64<32>(Val);
1023 }
1024
1026 assert(!Seq.empty());
1027
1028 bool SrcRenamable = false;
1029 unsigned Num = 0;
1030
1031 for (const RISCVMatInt::Inst &Inst : Seq) {
1032 bool LastItem = ++Num == Seq.size();
1033 RegState DstRegState = getDeadRegState(DstIsDead && LastItem) |
1034 getRenamableRegState(DstRenamable);
1035 RegState SrcRegState = getKillRegState(SrcReg != RISCV::X0) |
1036 getRenamableRegState(SrcRenamable);
1037 switch (Inst.getOpndKind()) {
1038 case RISCVMatInt::Imm:
1039 BuildMI(MBB, MBBI, DL, get(Inst.getOpcode()))
1040 .addReg(DstReg, RegState::Define | DstRegState)
1041 .addImm(Inst.getImm())
1042 .setMIFlag(Flag);
1043 break;
1044 case RISCVMatInt::RegX0:
1045 BuildMI(MBB, MBBI, DL, get(Inst.getOpcode()))
1046 .addReg(DstReg, RegState::Define | DstRegState)
1047 .addReg(SrcReg, SrcRegState)
1048 .addReg(RISCV::X0)
1049 .setMIFlag(Flag);
1050 break;
1052 BuildMI(MBB, MBBI, DL, get(Inst.getOpcode()))
1053 .addReg(DstReg, RegState::Define | DstRegState)
1054 .addReg(SrcReg, SrcRegState)
1055 .addReg(SrcReg, SrcRegState)
1056 .setMIFlag(Flag);
1057 break;
1059 BuildMI(MBB, MBBI, DL, get(Inst.getOpcode()))
1060 .addReg(DstReg, RegState::Define | DstRegState)
1061 .addReg(SrcReg, SrcRegState)
1062 .addImm(Inst.getImm())
1063 .setMIFlag(Flag);
1064 break;
1065 }
1066
1067 // Only the first instruction has X0 as its source.
1068 SrcReg = DstReg;
1069 SrcRenamable = DstRenamable;
1070 }
1071}
1072
1074 switch (Opc) {
1075 default:
1076 return RISCVCC::COND_INVALID;
1077 case RISCV::BEQ:
1078 case RISCV::BEQI:
1079 case RISCV::CV_BEQIMM:
1080 case RISCV::QC_BEQI:
1081 case RISCV::QC_E_BEQI:
1082 case RISCV::NDS_BBC:
1083 case RISCV::NDS_BEQC:
1084 return RISCVCC::COND_EQ;
1085 case RISCV::BNE:
1086 case RISCV::BNEI:
1087 case RISCV::QC_BNEI:
1088 case RISCV::QC_E_BNEI:
1089 case RISCV::CV_BNEIMM:
1090 case RISCV::NDS_BBS:
1091 case RISCV::NDS_BNEC:
1092 return RISCVCC::COND_NE;
1093 case RISCV::BLT:
1094 case RISCV::QC_BLTI:
1095 case RISCV::QC_E_BLTI:
1096 return RISCVCC::COND_LT;
1097 case RISCV::BGE:
1098 case RISCV::QC_BGEI:
1099 case RISCV::QC_E_BGEI:
1100 return RISCVCC::COND_GE;
1101 case RISCV::BLTU:
1102 case RISCV::QC_BLTUI:
1103 case RISCV::QC_E_BLTUI:
1104 return RISCVCC::COND_LTU;
1105 case RISCV::BGEU:
1106 case RISCV::QC_BGEUI:
1107 case RISCV::QC_E_BGEUI:
1108 return RISCVCC::COND_GEU;
1109 }
1110}
1111
1113 int64_t C1) {
1114 switch (CC) {
1115 default:
1116 llvm_unreachable("Unexpected CC");
1117 case RISCVCC::COND_EQ:
1118 return C0 == C1;
1119 case RISCVCC::COND_NE:
1120 return C0 != C1;
1121 case RISCVCC::COND_LT:
1122 return C0 < C1;
1123 case RISCVCC::COND_GE:
1124 return C0 >= C1;
1125 case RISCVCC::COND_LTU:
1126 return (uint64_t)C0 < (uint64_t)C1;
1127 case RISCVCC::COND_GEU:
1128 return (uint64_t)C0 >= (uint64_t)C1;
1129 }
1130}
1131
1132// The contents of values added to Cond are not examined outside of
1133// RISCVInstrInfo, giving us flexibility in what to push to it. For RISCV, we
1134// push BranchOpcode, Reg1, Reg2.
1137 // Block ends with fall-through condbranch.
1138 assert(LastInst.getDesc().isConditionalBranch() &&
1139 "Unknown conditional branch");
1140 Target = LastInst.getOperand(2).getMBB();
1141 Cond.push_back(MachineOperand::CreateImm(LastInst.getOpcode()));
1142 Cond.push_back(LastInst.getOperand(0));
1143 Cond.push_back(LastInst.getOperand(1));
1144}
1145
1146static unsigned getInverseXqcicmOpcode(unsigned Opcode) {
1147 switch (Opcode) {
1148 default:
1149 llvm_unreachable("Unexpected Opcode");
1150 case RISCV::QC_MVEQ:
1151 return RISCV::QC_MVNE;
1152 case RISCV::QC_MVNE:
1153 return RISCV::QC_MVEQ;
1154 case RISCV::QC_MVLT:
1155 return RISCV::QC_MVGE;
1156 case RISCV::QC_MVGE:
1157 return RISCV::QC_MVLT;
1158 case RISCV::QC_MVLTU:
1159 return RISCV::QC_MVGEU;
1160 case RISCV::QC_MVGEU:
1161 return RISCV::QC_MVLTU;
1162 case RISCV::QC_MVEQI:
1163 return RISCV::QC_MVNEI;
1164 case RISCV::QC_MVNEI:
1165 return RISCV::QC_MVEQI;
1166 case RISCV::QC_MVLTI:
1167 return RISCV::QC_MVGEI;
1168 case RISCV::QC_MVGEI:
1169 return RISCV::QC_MVLTI;
1170 case RISCV::QC_MVLTUI:
1171 return RISCV::QC_MVGEUI;
1172 case RISCV::QC_MVGEUI:
1173 return RISCV::QC_MVLTUI;
1174 }
1175}
1176
1177unsigned RISCVCC::getBrCond(RISCVCC::CondCode CC, unsigned SelectOpc) {
1178 switch (SelectOpc) {
1179 default:
1180 switch (CC) {
1181 default:
1182 llvm_unreachable("Unexpected condition code!");
1183 case RISCVCC::COND_EQ:
1184 return RISCV::BEQ;
1185 case RISCVCC::COND_NE:
1186 return RISCV::BNE;
1187 case RISCVCC::COND_LT:
1188 return RISCV::BLT;
1189 case RISCVCC::COND_GE:
1190 return RISCV::BGE;
1191 case RISCVCC::COND_LTU:
1192 return RISCV::BLTU;
1193 case RISCVCC::COND_GEU:
1194 return RISCV::BGEU;
1195 }
1196 break;
1197 case RISCV::Select_GPR_Using_CC_Imm5_Zibi:
1198 switch (CC) {
1199 default:
1200 llvm_unreachable("Unexpected condition code!");
1201 case RISCVCC::COND_EQ:
1202 return RISCV::BEQI;
1203 case RISCVCC::COND_NE:
1204 return RISCV::BNEI;
1205 }
1206 break;
1207 case RISCV::Select_GPR_Using_CC_SImm5_CV:
1208 switch (CC) {
1209 default:
1210 llvm_unreachable("Unexpected condition code!");
1211 case RISCVCC::COND_EQ:
1212 return RISCV::CV_BEQIMM;
1213 case RISCVCC::COND_NE:
1214 return RISCV::CV_BNEIMM;
1215 }
1216 break;
1217 case RISCV::Select_GPRNoX0_Using_CC_SImm5NonZero_QC:
1218 switch (CC) {
1219 default:
1220 llvm_unreachable("Unexpected condition code!");
1221 case RISCVCC::COND_EQ:
1222 return RISCV::QC_BEQI;
1223 case RISCVCC::COND_NE:
1224 return RISCV::QC_BNEI;
1225 case RISCVCC::COND_LT:
1226 return RISCV::QC_BLTI;
1227 case RISCVCC::COND_GE:
1228 return RISCV::QC_BGEI;
1229 }
1230 break;
1231 case RISCV::Select_GPRNoX0_Using_CC_UImm5NonZero_QC:
1232 switch (CC) {
1233 default:
1234 llvm_unreachable("Unexpected condition code!");
1235 case RISCVCC::COND_LTU:
1236 return RISCV::QC_BLTUI;
1237 case RISCVCC::COND_GEU:
1238 return RISCV::QC_BGEUI;
1239 }
1240 break;
1241 case RISCV::Select_GPRNoX0_Using_CC_SImm16NonZero_QC:
1242 switch (CC) {
1243 default:
1244 llvm_unreachable("Unexpected condition code!");
1245 case RISCVCC::COND_EQ:
1246 return RISCV::QC_E_BEQI;
1247 case RISCVCC::COND_NE:
1248 return RISCV::QC_E_BNEI;
1249 case RISCVCC::COND_LT:
1250 return RISCV::QC_E_BLTI;
1251 case RISCVCC::COND_GE:
1252 return RISCV::QC_E_BGEI;
1253 }
1254 break;
1255 case RISCV::Select_GPRNoX0_Using_CC_UImm16NonZero_QC:
1256 switch (CC) {
1257 default:
1258 llvm_unreachable("Unexpected condition code!");
1259 case RISCVCC::COND_LTU:
1260 return RISCV::QC_E_BLTUI;
1261 case RISCVCC::COND_GEU:
1262 return RISCV::QC_E_BGEUI;
1263 }
1264 break;
1265 case RISCV::Select_GPR_Using_CC_UImmLog2XLen_NDS:
1266 switch (CC) {
1267 default:
1268 llvm_unreachable("Unexpected condition code!");
1269 case RISCVCC::COND_EQ:
1270 return RISCV::NDS_BBC;
1271 case RISCVCC::COND_NE:
1272 return RISCV::NDS_BBS;
1273 }
1274 break;
1275 case RISCV::Select_GPR_Using_CC_UImm7_NDS:
1276 switch (CC) {
1277 default:
1278 llvm_unreachable("Unexpected condition code!");
1279 case RISCVCC::COND_EQ:
1280 return RISCV::NDS_BEQC;
1281 case RISCVCC::COND_NE:
1282 return RISCV::NDS_BNEC;
1283 }
1284 break;
1285 }
1286}
1287
1289 switch (CC) {
1290 default:
1291 llvm_unreachable("Unrecognized conditional branch");
1292 case RISCVCC::COND_EQ:
1293 return RISCVCC::COND_NE;
1294 case RISCVCC::COND_NE:
1295 return RISCVCC::COND_EQ;
1296 case RISCVCC::COND_LT:
1297 return RISCVCC::COND_GE;
1298 case RISCVCC::COND_GE:
1299 return RISCVCC::COND_LT;
1300 case RISCVCC::COND_LTU:
1301 return RISCVCC::COND_GEU;
1302 case RISCVCC::COND_GEU:
1303 return RISCVCC::COND_LTU;
1304 }
1305}
1306
1307// Return inverse branch
1308unsigned RISCVCC::getInverseBranchOpcode(unsigned BCC) {
1309 switch (BCC) {
1310 default:
1311 llvm_unreachable("Unexpected branch opcode!");
1312 case RISCV::BEQ:
1313 return RISCV::BNE;
1314 case RISCV::BEQI:
1315 return RISCV::BNEI;
1316 case RISCV::BNE:
1317 return RISCV::BEQ;
1318 case RISCV::BNEI:
1319 return RISCV::BEQI;
1320 case RISCV::BLT:
1321 return RISCV::BGE;
1322 case RISCV::BGE:
1323 return RISCV::BLT;
1324 case RISCV::BLTU:
1325 return RISCV::BGEU;
1326 case RISCV::BGEU:
1327 return RISCV::BLTU;
1328 case RISCV::CV_BEQIMM:
1329 return RISCV::CV_BNEIMM;
1330 case RISCV::CV_BNEIMM:
1331 return RISCV::CV_BEQIMM;
1332 case RISCV::QC_BEQI:
1333 return RISCV::QC_BNEI;
1334 case RISCV::QC_BNEI:
1335 return RISCV::QC_BEQI;
1336 case RISCV::QC_BLTI:
1337 return RISCV::QC_BGEI;
1338 case RISCV::QC_BGEI:
1339 return RISCV::QC_BLTI;
1340 case RISCV::QC_BLTUI:
1341 return RISCV::QC_BGEUI;
1342 case RISCV::QC_BGEUI:
1343 return RISCV::QC_BLTUI;
1344 case RISCV::QC_E_BEQI:
1345 return RISCV::QC_E_BNEI;
1346 case RISCV::QC_E_BNEI:
1347 return RISCV::QC_E_BEQI;
1348 case RISCV::QC_E_BLTI:
1349 return RISCV::QC_E_BGEI;
1350 case RISCV::QC_E_BGEI:
1351 return RISCV::QC_E_BLTI;
1352 case RISCV::QC_E_BLTUI:
1353 return RISCV::QC_E_BGEUI;
1354 case RISCV::QC_E_BGEUI:
1355 return RISCV::QC_E_BLTUI;
1356 case RISCV::NDS_BBC:
1357 return RISCV::NDS_BBS;
1358 case RISCV::NDS_BBS:
1359 return RISCV::NDS_BBC;
1360 case RISCV::NDS_BEQC:
1361 return RISCV::NDS_BNEC;
1362 case RISCV::NDS_BNEC:
1363 return RISCV::NDS_BEQC;
1364 }
1365}
1366
1369 MachineBasicBlock *&FBB,
1371 bool AllowModify) const {
1372 TBB = FBB = nullptr;
1373 Cond.clear();
1374
1375 // If the block has no terminators, it just falls into the block after it.
1376 MachineBasicBlock::iterator I = MBB.getLastNonDebugInstr();
1377 if (I == MBB.end() || !isUnpredicatedTerminator(*I))
1378 return false;
1379
1380 // Count the number of terminators and find the first unconditional or
1381 // indirect branch.
1382 MachineBasicBlock::iterator FirstUncondOrIndirectBr = MBB.end();
1383 int NumTerminators = 0;
1384 for (auto J = I.getReverse(); J != MBB.rend() && isUnpredicatedTerminator(*J);
1385 J++) {
1386 NumTerminators++;
1387 if (J->getDesc().isUnconditionalBranch() ||
1388 J->getDesc().isIndirectBranch()) {
1389 FirstUncondOrIndirectBr = J.getReverse();
1390 }
1391 }
1392
1393 // If AllowModify is true, we can erase any terminators after
1394 // FirstUncondOrIndirectBR.
1395 if (AllowModify && FirstUncondOrIndirectBr != MBB.end()) {
1396 while (std::next(FirstUncondOrIndirectBr) != MBB.end()) {
1397 std::next(FirstUncondOrIndirectBr)->eraseFromParent();
1398 NumTerminators--;
1399 }
1400 I = FirstUncondOrIndirectBr;
1401 }
1402
1403 // We can't handle blocks that end in an indirect branch.
1404 if (I->getDesc().isIndirectBranch())
1405 return true;
1406
1407 // We can't handle Generic branch opcodes from Global ISel.
1408 if (I->isPreISelOpcode())
1409 return true;
1410
1411 // We can't handle blocks with more than 2 terminators.
1412 if (NumTerminators > 2)
1413 return true;
1414
1415 // Handle a single unconditional branch.
1416 if (NumTerminators == 1 && I->getDesc().isUnconditionalBranch()) {
1418 return false;
1419 }
1420
1421 // Handle a single conditional branch.
1422 if (NumTerminators == 1 && I->getDesc().isConditionalBranch()) {
1424 return false;
1425 }
1426
1427 // Handle a conditional branch followed by an unconditional branch.
1428 if (NumTerminators == 2 && std::prev(I)->getDesc().isConditionalBranch() &&
1429 I->getDesc().isUnconditionalBranch()) {
1430 parseCondBranch(*std::prev(I), TBB, Cond);
1431 FBB = getBranchDestBlock(*I);
1432 return false;
1433 }
1434
1435 // Otherwise, we can't handle this.
1436 return true;
1437}
1438
1440 int *BytesRemoved) const {
1441 if (BytesRemoved)
1442 *BytesRemoved = 0;
1443 MachineBasicBlock::iterator I = MBB.getLastNonDebugInstr();
1444 if (I == MBB.end())
1445 return 0;
1446
1447 if (!I->getDesc().isUnconditionalBranch() &&
1448 !I->getDesc().isConditionalBranch())
1449 return 0;
1450
1451 // Remove the branch.
1452 if (BytesRemoved)
1453 *BytesRemoved += getInstSizeInBytes(*I);
1454 I->eraseFromParent();
1455
1456 I = MBB.end();
1457
1458 if (I == MBB.begin())
1459 return 1;
1460 --I;
1461 if (!I->getDesc().isConditionalBranch())
1462 return 1;
1463
1464 // Remove the branch.
1465 if (BytesRemoved)
1466 *BytesRemoved += getInstSizeInBytes(*I);
1467 I->eraseFromParent();
1468 return 2;
1469}
1470
1471// Inserts a branch into the end of the specific MachineBasicBlock, returning
1472// the number of instructions inserted.
1475 ArrayRef<MachineOperand> Cond, const DebugLoc &DL, int *BytesAdded) const {
1476 if (BytesAdded)
1477 *BytesAdded = 0;
1478
1479 // Shouldn't be a fall through.
1480 assert(TBB && "insertBranch must not be told to insert a fallthrough");
1481 assert((Cond.size() == 3 || Cond.size() == 0) &&
1482 "RISC-V branch conditions have two components!");
1483
1484 // Unconditional branch.
1485 if (Cond.empty()) {
1486 MachineInstr &MI = *BuildMI(&MBB, DL, get(RISCV::PseudoBR)).addMBB(TBB);
1487 if (BytesAdded)
1488 *BytesAdded += getInstSizeInBytes(MI);
1489 return 1;
1490 }
1491
1492 // Either a one or two-way conditional branch.
1493 MachineInstr &CondMI = *BuildMI(&MBB, DL, get(Cond[0].getImm()))
1494 .add(Cond[1])
1495 .add(Cond[2])
1496 .addMBB(TBB);
1497 if (BytesAdded)
1498 *BytesAdded += getInstSizeInBytes(CondMI);
1499
1500 // One-way conditional branch.
1501 if (!FBB)
1502 return 1;
1503
1504 // Two-way conditional branch.
1505 MachineInstr &MI = *BuildMI(&MBB, DL, get(RISCV::PseudoBR)).addMBB(FBB);
1506 if (BytesAdded)
1507 *BytesAdded += getInstSizeInBytes(MI);
1508 return 2;
1509}
1510
1512 MachineBasicBlock &DestBB,
1513 MachineBasicBlock &RestoreBB,
1514 const DebugLoc &DL, int64_t BrOffset,
1515 RegScavenger *RS) const {
1516 assert(RS && "RegScavenger required for long branching");
1517 assert(MBB.empty() &&
1518 "new block should be inserted for expanding unconditional branch");
1519 assert(MBB.pred_size() == 1);
1520 assert(RestoreBB.empty() &&
1521 "restore block should be inserted for restoring clobbered registers");
1522
1523 MachineFunction *MF = MBB.getParent();
1524 MachineRegisterInfo &MRI = MF->getRegInfo();
1527
1528 if (!isInt<32>(BrOffset))
1530 "Branch offsets outside of the signed 32-bit range not supported");
1531
1532 // FIXME: A virtual register must be used initially, as the register
1533 // scavenger won't work with empty blocks (SIInstrInfo::insertIndirectBranch
1534 // uses the same workaround).
1535 Register ScratchReg = MRI.createVirtualRegister(&RISCV::GPRJALRRegClass);
1536 auto II = MBB.end();
1537 // We may also update the jump target to RestoreBB later.
1538 MachineInstr &MI = *BuildMI(MBB, II, DL, get(RISCV::PseudoJump))
1539 .addReg(ScratchReg, RegState::Define | RegState::Dead)
1540 .addMBB(&DestBB, RISCVII::MO_CALL);
1541
1542 RS->enterBasicBlockEnd(MBB);
1543 // When cf-protection-branch is enabled, we must use t2 (x7) for software
1544 // guarded branches to hold the landing pad label.
1545 bool HasCFBranch =
1546 MF->getInfo<RISCVMachineFunctionInfo>()->hasCFProtectionBranch();
1547 const TargetRegisterClass *RC = &RISCV::GPRRegClass;
1548 if (HasCFBranch)
1549 RC = &RISCV::GPRX7RegClass;
1550 Register TmpGPR =
1551 RS->scavengeRegisterBackwards(*RC, MI.getIterator(),
1552 /*RestoreAfter=*/false, /*SpAdj=*/0,
1553 /*AllowSpill=*/false);
1554 if (TmpGPR.isValid())
1555 RS->setRegUsed(TmpGPR);
1556 else {
1557 // The case when there is no scavenged register needs special handling.
1558
1559 // Pick s11(or s1 for rve) because it doesn't make a difference.
1560 TmpGPR = STI.hasStdExtE() ? RISCV::X9 : RISCV::X27;
1561 // Force t2 if cf-protection-branch is enabled
1562 if (HasCFBranch)
1563 TmpGPR = RISCV::X7;
1564
1565 int FrameIndex = RVFI->getBranchRelaxationScratchFrameIndex();
1566 if (FrameIndex == -1)
1567 report_fatal_error("underestimated function size");
1568
1569 storeRegToStackSlot(MBB, MI, TmpGPR, /*IsKill=*/true, FrameIndex,
1570 &RISCV::GPRRegClass, Register());
1571 TRI->eliminateFrameIndex(std::prev(MI.getIterator()),
1572 /*SpAdj=*/0, /*FIOperandNum=*/1);
1573
1574 MI.getOperand(1).setMBB(&RestoreBB);
1575
1576 loadRegFromStackSlot(RestoreBB, RestoreBB.end(), TmpGPR, FrameIndex,
1577 &RISCV::GPRRegClass, Register());
1578 TRI->eliminateFrameIndex(RestoreBB.back(),
1579 /*SpAdj=*/0, /*FIOperandNum=*/1);
1580 }
1581
1582 MRI.replaceRegWith(ScratchReg, TmpGPR);
1583 MRI.clearVirtRegs();
1584}
1585
1588 assert((Cond.size() == 3) && "Invalid branch condition!");
1589
1591
1592 return false;
1593}
1594
1595// Return true if the instruction is a load immediate instruction (i.e.
1596// (ADDI x0, imm) or (BSETI x0, imm)).
1597static bool isLoadImm(const MachineInstr *MI, int64_t &Imm) {
1598 if (MI->getOpcode() == RISCV::ADDI && MI->getOperand(1).isReg() &&
1599 MI->getOperand(1).getReg() == RISCV::X0) {
1600 Imm = MI->getOperand(2).getImm();
1601 return true;
1602 }
1603 // BSETI can be used to create power of 2 constants. Only 2048 is currently
1604 // interesting because it is 1 more than the maximum ADDI constant.
1605 if (MI->getOpcode() == RISCV::BSETI && MI->getOperand(1).isReg() &&
1606 MI->getOperand(1).getReg() == RISCV::X0 &&
1607 MI->getOperand(2).getImm() == 11) {
1608 Imm = 2048;
1609 return true;
1610 }
1611 return false;
1612}
1613
1615 const MachineOperand &Op, int64_t &Imm) {
1616 // Either a load from immediate instruction or X0.
1617 if (!Op.isReg())
1618 return false;
1619
1620 Register Reg = Op.getReg();
1621 if (Reg == RISCV::X0) {
1622 Imm = 0;
1623 return true;
1624 }
1625 return Reg.isVirtual() && isLoadImm(MRI.getVRegDef(Reg), Imm);
1626}
1627
1629 bool IsSigned = false;
1630 bool IsEquality = false;
1631 switch (MI.getOpcode()) {
1632 default:
1633 return false;
1634 case RISCV::BEQ:
1635 case RISCV::BNE:
1636 IsEquality = true;
1637 break;
1638 case RISCV::BGE:
1639 case RISCV::BLT:
1640 IsSigned = true;
1641 break;
1642 case RISCV::BGEU:
1643 case RISCV::BLTU:
1644 break;
1645 }
1646
1647 MachineBasicBlock *MBB = MI.getParent();
1648 MachineRegisterInfo &MRI = MBB->getParent()->getRegInfo();
1649
1650 const MachineOperand &LHS = MI.getOperand(0);
1651 const MachineOperand &RHS = MI.getOperand(1);
1652 MachineBasicBlock *TBB = MI.getOperand(2).getMBB();
1653
1654 RISCVCC::CondCode CC = getCondFromBranchOpc(MI.getOpcode());
1656
1657 // Canonicalize conditional branches which can be constant folded into
1658 // beqz or bnez. We can't modify the CFG here.
1659 int64_t C0, C1;
1660 if (isFromLoadImm(MRI, LHS, C0) && isFromLoadImm(MRI, RHS, C1)) {
1661 unsigned NewOpc = evaluateCondBranch(CC, C0, C1) ? RISCV::BEQ : RISCV::BNE;
1662 // Build the new branch and remove the old one.
1663 BuildMI(*MBB, MI, MI.getDebugLoc(), get(NewOpc))
1664 .addReg(RISCV::X0)
1665 .addReg(RISCV::X0)
1666 .addMBB(TBB);
1667 MI.eraseFromParent();
1668 return true;
1669 }
1670
1671 if (IsEquality)
1672 return false;
1673
1674 // For two constants C0 and C1 from
1675 // ```
1676 // li Y, C0
1677 // li Z, C1
1678 // ```
1679 // 1. if C1 = C0 + 1
1680 // we can turn:
1681 // (a) blt Y, X -> bge X, Z
1682 // (b) bge Y, X -> blt X, Z
1683 //
1684 // 2. if C1 = C0 - 1
1685 // we can turn:
1686 // (a) blt X, Y -> bge Z, X
1687 // (b) bge X, Y -> blt Z, X
1688 //
1689 // To make sure this optimization is really beneficial, we only
1690 // optimize for cases where Y had only one use (i.e. only used by the branch).
1691 // Try to find the register for constant Z; return
1692 // invalid register otherwise.
1693 auto searchConst = [&](int64_t C1) -> Register {
1695 auto DefC1 = std::find_if(++II, E, [&](const MachineInstr &I) -> bool {
1696 int64_t Imm;
1697 return isLoadImm(&I, Imm) && Imm == C1 &&
1698 I.getOperand(0).getReg().isVirtual();
1699 });
1700 if (DefC1 != E)
1701 return DefC1->getOperand(0).getReg();
1702
1703 return Register();
1704 };
1705
1706 unsigned NewOpc = RISCVCC::getBrCond(getInverseBranchCondition(CC));
1707
1708 // Might be case 1.
1709 // Don't change 0 to 1 since we can use x0.
1710 // For unsigned cases changing -1U to 0 would be incorrect.
1711 // The incorrect case for signed would be INT_MAX, but isFromLoadImm can't
1712 // return that.
1713 if (isFromLoadImm(MRI, LHS, C0) && C0 != 0 && LHS.getReg().isVirtual() &&
1714 MRI.hasOneUse(LHS.getReg()) && (IsSigned || C0 != -1)) {
1715 assert((isInt<12>(C0) || C0 == 2048) && "Unexpected immediate");
1716 if (Register RegZ = searchConst(C0 + 1)) {
1717 BuildMI(*MBB, MI, MI.getDebugLoc(), get(NewOpc))
1718 .add(RHS)
1719 .addReg(RegZ)
1720 .addMBB(TBB);
1721 // We might extend the live range of Z, clear its kill flag to
1722 // account for this.
1723 MRI.clearKillFlags(RegZ);
1724 MI.eraseFromParent();
1725 return true;
1726 }
1727 }
1728
1729 // Might be case 2.
1730 // For signed cases we don't want to change 0 since we can use x0.
1731 // For unsigned cases changing 0 to -1U would be incorrect.
1732 // The incorrect case for signed would be INT_MIN, but isFromLoadImm can't
1733 // return that.
1734 if (isFromLoadImm(MRI, RHS, C0) && C0 != 0 && RHS.getReg().isVirtual() &&
1735 MRI.hasOneUse(RHS.getReg())) {
1736 assert((isInt<12>(C0) || C0 == 2048) && "Unexpected immediate");
1737 if (Register RegZ = searchConst(C0 - 1)) {
1738 BuildMI(*MBB, MI, MI.getDebugLoc(), get(NewOpc))
1739 .addReg(RegZ)
1740 .add(LHS)
1741 .addMBB(TBB);
1742 // We might extend the live range of Z, clear its kill flag to
1743 // account for this.
1744 MRI.clearKillFlags(RegZ);
1745 MI.eraseFromParent();
1746 return true;
1747 }
1748 }
1749
1750 return false;
1751}
1752
1755 assert(MI.getDesc().isBranch() && "Unexpected opcode!");
1756 // The branch target is always the last operand.
1757 int NumOp = MI.getNumExplicitOperands();
1758 return MI.getOperand(NumOp - 1).getMBB();
1759}
1760
1762 int64_t BrOffset) const {
1763 unsigned XLen = STI.getXLen();
1764 // Ideally we could determine the supported branch offset from the
1765 // RISCVII::FormMask, but this can't be used for Pseudo instructions like
1766 // PseudoBR.
1767 switch (BranchOp) {
1768 default:
1769 llvm_unreachable("Unexpected opcode!");
1770 case RISCV::NDS_BBC:
1771 case RISCV::NDS_BBS:
1772 case RISCV::NDS_BEQC:
1773 case RISCV::NDS_BNEC:
1774 return isInt<11>(BrOffset);
1775 case RISCV::BEQ:
1776 case RISCV::BNE:
1777 case RISCV::BLT:
1778 case RISCV::BGE:
1779 case RISCV::BLTU:
1780 case RISCV::BGEU:
1781 case RISCV::BEQI:
1782 case RISCV::BNEI:
1783 case RISCV::CV_BEQIMM:
1784 case RISCV::CV_BNEIMM:
1785 case RISCV::QC_BEQI:
1786 case RISCV::QC_BNEI:
1787 case RISCV::QC_BGEI:
1788 case RISCV::QC_BLTI:
1789 case RISCV::QC_BLTUI:
1790 case RISCV::QC_BGEUI:
1791 case RISCV::QC_E_BEQI:
1792 case RISCV::QC_E_BNEI:
1793 case RISCV::QC_E_BGEI:
1794 case RISCV::QC_E_BLTI:
1795 case RISCV::QC_E_BLTUI:
1796 case RISCV::QC_E_BGEUI:
1797 return isInt<13>(BrOffset);
1798 case RISCV::JAL:
1799 case RISCV::PseudoBR:
1800 return isInt<21>(BrOffset);
1801 case RISCV::PseudoJump:
1802 return isInt<32>(SignExtend64(BrOffset + 0x800, XLen));
1803 }
1804}
1805
1806// If the operation has a predicated pseudo instruction, return the pseudo
1807// instruction opcode. Otherwise, return RISCV::INSTRUCTION_LIST_END.
1808// TODO: Support more operations.
1809unsigned getPredicatedOpcode(unsigned Opcode) {
1810 // clang-format off
1811 switch (Opcode) {
1812 case RISCV::ADD: return RISCV::PseudoCCADD;
1813 case RISCV::SUB: return RISCV::PseudoCCSUB;
1814 case RISCV::SLL: return RISCV::PseudoCCSLL;
1815 case RISCV::SRL: return RISCV::PseudoCCSRL;
1816 case RISCV::SRA: return RISCV::PseudoCCSRA;
1817 case RISCV::AND: return RISCV::PseudoCCAND;
1818 case RISCV::OR: return RISCV::PseudoCCOR;
1819 case RISCV::XOR: return RISCV::PseudoCCXOR;
1820 case RISCV::MAX: return RISCV::PseudoCCMAX;
1821 case RISCV::MAXU: return RISCV::PseudoCCMAXU;
1822 case RISCV::MIN: return RISCV::PseudoCCMIN;
1823 case RISCV::MINU: return RISCV::PseudoCCMINU;
1824 case RISCV::MUL: return RISCV::PseudoCCMUL;
1825 case RISCV::LUI: return RISCV::PseudoCCLUI;
1826 case RISCV::QC_LI: return RISCV::PseudoCCQC_LI;
1827 case RISCV::QC_E_LI: return RISCV::PseudoCCQC_E_LI;
1828
1829 case RISCV::ADDI: return RISCV::PseudoCCADDI;
1830 case RISCV::SLLI: return RISCV::PseudoCCSLLI;
1831 case RISCV::SRLI: return RISCV::PseudoCCSRLI;
1832 case RISCV::SRAI: return RISCV::PseudoCCSRAI;
1833 case RISCV::ANDI: return RISCV::PseudoCCANDI;
1834 case RISCV::ORI: return RISCV::PseudoCCORI;
1835 case RISCV::XORI: return RISCV::PseudoCCXORI;
1836
1837 case RISCV::ADDW: return RISCV::PseudoCCADDW;
1838 case RISCV::SUBW: return RISCV::PseudoCCSUBW;
1839 case RISCV::SLLW: return RISCV::PseudoCCSLLW;
1840 case RISCV::SRLW: return RISCV::PseudoCCSRLW;
1841 case RISCV::SRAW: return RISCV::PseudoCCSRAW;
1842
1843 case RISCV::ADDIW: return RISCV::PseudoCCADDIW;
1844 case RISCV::SLLIW: return RISCV::PseudoCCSLLIW;
1845 case RISCV::SRLIW: return RISCV::PseudoCCSRLIW;
1846 case RISCV::SRAIW: return RISCV::PseudoCCSRAIW;
1847
1848 case RISCV::ANDN: return RISCV::PseudoCCANDN;
1849 case RISCV::ORN: return RISCV::PseudoCCORN;
1850 case RISCV::XNOR: return RISCV::PseudoCCXNOR;
1851
1852 case RISCV::NDS_BFOS: return RISCV::PseudoCCNDS_BFOS;
1853 case RISCV::NDS_BFOZ: return RISCV::PseudoCCNDS_BFOZ;
1854 }
1855 // clang-format on
1856
1857 return RISCV::INSTRUCTION_LIST_END;
1858}
1859
1860/// Identify instructions that can be folded into a CCMOV instruction, and
1861/// return the defining instruction.
1863 const MachineRegisterInfo &MRI,
1864 const TargetInstrInfo *TII,
1865 const RISCVSubtarget &STI) {
1866 if (!Reg.isVirtual())
1867 return nullptr;
1868 if (!MRI.hasOneNonDBGUse(Reg))
1869 return nullptr;
1870 MachineInstr *MI = MRI.getVRegDef(Reg);
1871 if (!MI)
1872 return nullptr;
1873
1874 if (!STI.hasShortForwardBranchIMinMax() &&
1875 (MI->getOpcode() == RISCV::MAX || MI->getOpcode() == RISCV::MIN ||
1876 MI->getOpcode() == RISCV::MINU || MI->getOpcode() == RISCV::MAXU))
1877 return nullptr;
1878
1879 if (!STI.hasShortForwardBranchIMul() && MI->getOpcode() == RISCV::MUL)
1880 return nullptr;
1881
1882 // Check if MI can be predicated and folded into the CCMOV.
1883 if (getPredicatedOpcode(MI->getOpcode()) == RISCV::INSTRUCTION_LIST_END)
1884 return nullptr;
1885 // Don't predicate li idiom.
1886 if (MI->getOpcode() == RISCV::ADDI && MI->getOperand(1).isReg() &&
1887 MI->getOperand(1).getReg() == RISCV::X0)
1888 return nullptr;
1889 // Check if MI has any other defs or physreg uses.
1890 for (const MachineOperand &MO : llvm::drop_begin(MI->operands())) {
1891 // Reject frame index operands, PEI can't handle the predicated pseudos.
1892 if (MO.isFI() || MO.isCPI() || MO.isJTI())
1893 return nullptr;
1894 if (!MO.isReg())
1895 continue;
1896 // MI can't have any tied operands, that would conflict with predication.
1897 if (MO.isTied())
1898 return nullptr;
1899 if (MO.isDef())
1900 return nullptr;
1901 // Allow constant physregs.
1902 if (MO.getReg().isPhysical() && !MRI.isConstantPhysReg(MO.getReg()))
1903 return nullptr;
1904 }
1905 bool DontMoveAcrossStores = true;
1906 if (!MI->isSafeToMove(DontMoveAcrossStores))
1907 return nullptr;
1908 return MI;
1909}
1910
1914 bool PreferFalse) const {
1915 assert(MI.getOpcode() == RISCV::PseudoCCMOVGPR &&
1916 "Unknown select instruction");
1917 if (!STI.hasShortForwardBranchIALU())
1918 return nullptr;
1919
1920 MachineRegisterInfo &MRI = MI.getParent()->getParent()->getRegInfo();
1922 canFoldAsPredicatedOp(MI.getOperand(2).getReg(), MRI, this, STI);
1923 bool Invert = !DefMI;
1924 if (!DefMI)
1925 DefMI = canFoldAsPredicatedOp(MI.getOperand(1).getReg(), MRI, this, STI);
1926 if (!DefMI)
1927 return nullptr;
1928
1929 // Find new register class to use.
1930 MachineOperand FalseReg = MI.getOperand(Invert ? 2 : 1);
1931 Register DestReg = MI.getOperand(0).getReg();
1932 const TargetRegisterClass *PreviousClass = MRI.getRegClass(FalseReg.getReg());
1933 if (!MRI.constrainRegClass(DestReg, PreviousClass))
1934 return nullptr;
1935
1936 unsigned PredOpc = getPredicatedOpcode(DefMI->getOpcode());
1937 assert(PredOpc != RISCV::INSTRUCTION_LIST_END && "Unexpected opcode!");
1938
1939 // Create a new predicated version of DefMI.
1940 MachineInstrBuilder NewMI =
1941 BuildMI(*MI.getParent(), MI, MI.getDebugLoc(), get(PredOpc), DestReg);
1942
1943 // Copy the false register.
1944 NewMI.add(FalseReg);
1945
1946 // Copy all the DefMI operands.
1947 const MCInstrDesc &DefDesc = DefMI->getDesc();
1948 for (unsigned i = 1, e = DefDesc.getNumOperands(); i != e; ++i)
1949 NewMI.add(DefMI->getOperand(i));
1950
1951 // Add branch opcode, inverting if necessary.
1952 unsigned BCCOpcode = MI.getOperand(MI.getNumExplicitOperands() - 3).getImm();
1953 if (Invert)
1954 BCCOpcode = RISCVCC::getInverseBranchOpcode(BCCOpcode);
1955 NewMI.addImm(BCCOpcode);
1956
1957 // Copy the condition portion.
1958 NewMI.add(MI.getOperand(MI.getNumExplicitOperands() - 2));
1959 NewMI.add(MI.getOperand(MI.getNumExplicitOperands() - 1));
1960
1961 // Update SeenMIs set: register newly created MI and erase removed DefMI.
1962 SeenMIs.insert(NewMI);
1963 SeenMIs.erase(DefMI);
1964
1965 // If MI is inside a loop, and DefMI is outside the loop, then kill flags on
1966 // DefMI would be invalid when transferred inside the loop. Checking for a
1967 // loop is expensive, but at least remove kill flags if they are in different
1968 // BBs.
1969 if (DefMI->getParent() != MI.getParent())
1970 NewMI->clearKillInfo();
1971
1972 // The caller will erase MI, but not DefMI.
1973 DefMI->eraseFromParent();
1974 return NewMI;
1975}
1976
1978 if (MI.isMetaInstruction())
1979 return 0;
1980
1981 unsigned Opcode = MI.getOpcode();
1982
1983 if (Opcode == TargetOpcode::INLINEASM ||
1984 Opcode == TargetOpcode::INLINEASM_BR) {
1985 const MachineFunction &MF = *MI.getParent()->getParent();
1986 return getInlineAsmLength(MI.getOperand(0).getSymbolName(),
1987 MF.getTarget().getMCAsmInfo());
1988 }
1989
1990 if (requiresNTLHint(MI)) {
1991 if (STI.hasStdExtZca()) {
1992 if (isCompressibleInst(MI, STI))
1993 return 4; // c.ntl.all + c.load/c.store
1994 return 6; // c.ntl.all + load/store
1995 }
1996 return 8; // ntl.all + load/store
1997 }
1998
1999 if (Opcode == TargetOpcode::BUNDLE)
2000 return getInstBundleSize(MI);
2001
2002 if (MI.getParent() && MI.getParent()->getParent()) {
2003 if (isCompressibleInst(MI, STI))
2004 return 2;
2005 }
2006
2007 switch (Opcode) {
2008 case RISCV::PseudoMV_FPR16INX:
2009 case RISCV::PseudoMV_FPR32INX:
2010 // MV is always compressible to either c.mv or c.li rd, 0.
2011 return STI.hasStdExtZca() ? 2 : 4;
2012 // Below cases are for short forward branch pseudos
2013 case RISCV::PseudoCCMOVGPRNoX0:
2014 return get(MI.getOperand(MI.getNumExplicitOperands() - 3).getImm())
2015 .getSize() +
2016 2;
2017 case RISCV::PseudoCCMOVGPR:
2018 case RISCV::PseudoCCADD:
2019 case RISCV::PseudoCCSUB:
2020 case RISCV::PseudoCCSLL:
2021 case RISCV::PseudoCCSRL:
2022 case RISCV::PseudoCCSRA:
2023 case RISCV::PseudoCCAND:
2024 case RISCV::PseudoCCOR:
2025 case RISCV::PseudoCCXOR:
2026 case RISCV::PseudoCCADDI:
2027 case RISCV::PseudoCCANDI:
2028 case RISCV::PseudoCCORI:
2029 case RISCV::PseudoCCXORI:
2030 case RISCV::PseudoCCLUI:
2031 case RISCV::PseudoCCSLLI:
2032 case RISCV::PseudoCCSRLI:
2033 case RISCV::PseudoCCSRAI:
2034 case RISCV::PseudoCCADDW:
2035 case RISCV::PseudoCCSUBW:
2036 case RISCV::PseudoCCSLLW:
2037 case RISCV::PseudoCCSRLW:
2038 case RISCV::PseudoCCSRAW:
2039 case RISCV::PseudoCCADDIW:
2040 case RISCV::PseudoCCSLLIW:
2041 case RISCV::PseudoCCSRLIW:
2042 case RISCV::PseudoCCSRAIW:
2043 case RISCV::PseudoCCANDN:
2044 case RISCV::PseudoCCORN:
2045 case RISCV::PseudoCCXNOR:
2046 case RISCV::PseudoCCMAX:
2047 case RISCV::PseudoCCMIN:
2048 case RISCV::PseudoCCMAXU:
2049 case RISCV::PseudoCCMINU:
2050 case RISCV::PseudoCCMUL:
2051 case RISCV::PseudoCCLB:
2052 case RISCV::PseudoCCLH:
2053 case RISCV::PseudoCCLW:
2054 case RISCV::PseudoCCLHU:
2055 case RISCV::PseudoCCLBU:
2056 case RISCV::PseudoCCLWU:
2057 case RISCV::PseudoCCLD:
2058 case RISCV::PseudoCCQC_LI:
2059 return get(MI.getOperand(MI.getNumExplicitOperands() - 3).getImm())
2060 .getSize() +
2061 4;
2062 case RISCV::PseudoCCQC_E_LI:
2063 case RISCV::PseudoCCQC_E_LB:
2064 case RISCV::PseudoCCQC_E_LH:
2065 case RISCV::PseudoCCQC_E_LW:
2066 case RISCV::PseudoCCQC_E_LHU:
2067 case RISCV::PseudoCCQC_E_LBU:
2068 return get(MI.getOperand(MI.getNumExplicitOperands() - 3).getImm())
2069 .getSize() +
2070 6;
2071 case TargetOpcode::STACKMAP:
2072 // The upper bound for a stackmap intrinsic is the full length of its shadow
2074 case TargetOpcode::PATCHPOINT:
2075 // The size of the patchpoint intrinsic is the number of bytes requested
2077 case TargetOpcode::STATEPOINT: {
2078 // The size of the statepoint intrinsic is the number of bytes requested
2079 unsigned NumBytes = StatepointOpers(&MI).getNumPatchBytes();
2080 // No patch bytes means at most a PseudoCall is emitted
2081 return std::max(NumBytes, 8U);
2082 }
2083 case TargetOpcode::PATCHABLE_FUNCTION_ENTER:
2084 case TargetOpcode::PATCHABLE_FUNCTION_EXIT:
2085 case TargetOpcode::PATCHABLE_TAIL_CALL: {
2086 const MachineFunction &MF = *MI.getParent()->getParent();
2087 const Function &F = MF.getFunction();
2088 if (Opcode == TargetOpcode::PATCHABLE_FUNCTION_ENTER &&
2089 F.hasFnAttribute("patchable-function-entry")) {
2090 unsigned Num =
2091 F.getFnAttributeAsParsedInteger("patchable-function-entry");
2092 // Number of C.NOP or NOP
2093 return (STI.hasStdExtZca() ? 2 : 4) * Num;
2094 }
2095 // XRay uses C.JAL + 21 or 33 C.NOP for each sled in RV32 and RV64,
2096 // respectively.
2097 return STI.is64Bit() ? 68 : 44;
2098 }
2099 default:
2100 return get(Opcode).getSize();
2101 }
2102}
2103
2105 const unsigned Opcode = MI.getOpcode();
2106 switch (Opcode) {
2107 default:
2108 break;
2109 case RISCV::FSGNJ_D:
2110 case RISCV::FSGNJ_S:
2111 case RISCV::FSGNJ_H:
2112 case RISCV::FSGNJ_D_INX:
2113 case RISCV::FSGNJ_D_IN32X:
2114 case RISCV::FSGNJ_S_INX:
2115 case RISCV::FSGNJ_H_INX:
2116 // The canonical floating-point move is fsgnj rd, rs, rs.
2117 return MI.getOperand(1).isReg() && MI.getOperand(2).isReg() &&
2118 MI.getOperand(1).getReg() == MI.getOperand(2).getReg();
2119 case RISCV::ADDI:
2120 case RISCV::ORI:
2121 case RISCV::XORI:
2122 return (MI.getOperand(1).isReg() &&
2123 MI.getOperand(1).getReg() == RISCV::X0) ||
2124 (MI.getOperand(2).isImm() && MI.getOperand(2).getImm() == 0);
2125 }
2126 return MI.isAsCheapAsAMove();
2127}
2128
2129std::optional<DestSourcePair>
2131 if (MI.isMoveReg())
2132 return DestSourcePair{MI.getOperand(0), MI.getOperand(1)};
2133 switch (MI.getOpcode()) {
2134 default:
2135 break;
2136 case RISCV::ADD:
2137 case RISCV::OR:
2138 case RISCV::XOR:
2139 if (MI.getOperand(1).isReg() && MI.getOperand(1).getReg() == RISCV::X0 &&
2140 MI.getOperand(2).isReg())
2141 return DestSourcePair{MI.getOperand(0), MI.getOperand(2)};
2142 if (MI.getOperand(2).isReg() && MI.getOperand(2).getReg() == RISCV::X0 &&
2143 MI.getOperand(1).isReg())
2144 return DestSourcePair{MI.getOperand(0), MI.getOperand(1)};
2145 break;
2146 case RISCV::ADDI:
2147 // Operand 1 can be a frameindex but callers expect registers
2148 if (MI.getOperand(1).isReg() && MI.getOperand(2).isImm() &&
2149 MI.getOperand(2).getImm() == 0)
2150 return DestSourcePair{MI.getOperand(0), MI.getOperand(1)};
2151 break;
2152 case RISCV::SUB:
2153 if (MI.getOperand(2).isReg() && MI.getOperand(2).getReg() == RISCV::X0 &&
2154 MI.getOperand(1).isReg())
2155 return DestSourcePair{MI.getOperand(0), MI.getOperand(1)};
2156 break;
2157 case RISCV::SH1ADD:
2158 case RISCV::SH1ADD_UW:
2159 case RISCV::SH2ADD:
2160 case RISCV::SH2ADD_UW:
2161 case RISCV::SH3ADD:
2162 case RISCV::SH3ADD_UW:
2163 if (MI.getOperand(1).isReg() && MI.getOperand(1).getReg() == RISCV::X0 &&
2164 MI.getOperand(2).isReg())
2165 return DestSourcePair{MI.getOperand(0), MI.getOperand(2)};
2166 break;
2167 case RISCV::FSGNJ_D:
2168 case RISCV::FSGNJ_S:
2169 case RISCV::FSGNJ_H:
2170 case RISCV::FSGNJ_D_INX:
2171 case RISCV::FSGNJ_D_IN32X:
2172 case RISCV::FSGNJ_S_INX:
2173 case RISCV::FSGNJ_H_INX:
2174 // The canonical floating-point move is fsgnj rd, rs, rs.
2175 if (MI.getOperand(1).isReg() && MI.getOperand(2).isReg() &&
2176 MI.getOperand(1).getReg() == MI.getOperand(2).getReg())
2177 return DestSourcePair{MI.getOperand(0), MI.getOperand(1)};
2178 break;
2179 }
2180 return std::nullopt;
2181}
2182
2184 if (ForceMachineCombinerStrategy.getNumOccurrences() == 0) {
2185 // The option is unused. Choose Local strategy only for in-order cores. When
2186 // scheduling model is unspecified, use MinInstrCount strategy as more
2187 // generic one.
2188 const auto &SchedModel = STI.getSchedModel();
2189 return (!SchedModel.hasInstrSchedModel() || SchedModel.isOutOfOrder())
2192 }
2193 // The strategy was forced by the option.
2195}
2196
2198 MachineInstr &Root, unsigned &Pattern,
2199 SmallVectorImpl<MachineInstr *> &InsInstrs) const {
2200 int16_t FrmOpIdx =
2201 RISCV::getNamedOperandIdx(Root.getOpcode(), RISCV::OpName::frm);
2202 if (FrmOpIdx < 0) {
2203 assert(all_of(InsInstrs,
2204 [](MachineInstr *MI) {
2205 return RISCV::getNamedOperandIdx(MI->getOpcode(),
2206 RISCV::OpName::frm) < 0;
2207 }) &&
2208 "New instructions require FRM whereas the old one does not have it");
2209 return;
2210 }
2211
2212 const MachineOperand &FRM = Root.getOperand(FrmOpIdx);
2213 MachineFunction &MF = *Root.getMF();
2214
2215 for (auto *NewMI : InsInstrs) {
2216 // We'd already added the FRM operand.
2217 if (static_cast<unsigned>(RISCV::getNamedOperandIdx(
2218 NewMI->getOpcode(), RISCV::OpName::frm)) != NewMI->getNumOperands())
2219 continue;
2220 MachineInstrBuilder MIB(MF, NewMI);
2221 MIB.add(FRM);
2222 if (FRM.getImm() == RISCVFPRndMode::DYN)
2223 MIB.addUse(RISCV::FRM, RegState::Implicit);
2224 }
2225}
2226
2227static bool isFADD(unsigned Opc) {
2228 switch (Opc) {
2229 default:
2230 return false;
2231 case RISCV::FADD_H:
2232 case RISCV::FADD_S:
2233 case RISCV::FADD_D:
2234 return true;
2235 }
2236}
2237
2238static bool isFSUB(unsigned Opc) {
2239 switch (Opc) {
2240 default:
2241 return false;
2242 case RISCV::FSUB_H:
2243 case RISCV::FSUB_S:
2244 case RISCV::FSUB_D:
2245 return true;
2246 }
2247}
2248
2249static bool isFMUL(unsigned Opc) {
2250 switch (Opc) {
2251 default:
2252 return false;
2253 case RISCV::FMUL_H:
2254 case RISCV::FMUL_S:
2255 case RISCV::FMUL_D:
2256 return true;
2257 }
2258}
2259
2260bool RISCVInstrInfo::isVectorAssociativeAndCommutative(const MachineInstr &Inst,
2261 bool Invert) const {
2262#define OPCODE_LMUL_CASE(OPC) \
2263 case RISCV::OPC##_M1: \
2264 case RISCV::OPC##_M2: \
2265 case RISCV::OPC##_M4: \
2266 case RISCV::OPC##_M8: \
2267 case RISCV::OPC##_MF2: \
2268 case RISCV::OPC##_MF4: \
2269 case RISCV::OPC##_MF8
2270
2271#define OPCODE_LMUL_MASK_CASE(OPC) \
2272 case RISCV::OPC##_M1_MASK: \
2273 case RISCV::OPC##_M2_MASK: \
2274 case RISCV::OPC##_M4_MASK: \
2275 case RISCV::OPC##_M8_MASK: \
2276 case RISCV::OPC##_MF2_MASK: \
2277 case RISCV::OPC##_MF4_MASK: \
2278 case RISCV::OPC##_MF8_MASK
2279
2280 unsigned Opcode = Inst.getOpcode();
2281 if (Invert) {
2282 if (auto InvOpcode = getInverseOpcode(Opcode))
2283 Opcode = *InvOpcode;
2284 else
2285 return false;
2286 }
2287
2288 // clang-format off
2289 switch (Opcode) {
2290 default:
2291 return false;
2292 OPCODE_LMUL_CASE(PseudoVADD_VV):
2293 OPCODE_LMUL_MASK_CASE(PseudoVADD_VV):
2294 OPCODE_LMUL_CASE(PseudoVMUL_VV):
2295 OPCODE_LMUL_MASK_CASE(PseudoVMUL_VV):
2296 return true;
2297 }
2298 // clang-format on
2299
2300#undef OPCODE_LMUL_MASK_CASE
2301#undef OPCODE_LMUL_CASE
2302}
2303
2304bool RISCVInstrInfo::areRVVInstsReassociable(const MachineInstr &Root,
2305 const MachineInstr &Prev) const {
2306 if (!areOpcodesEqualOrInverse(Root.getOpcode(), Prev.getOpcode()))
2307 return false;
2308
2309 assert(Root.getMF() == Prev.getMF());
2310 const MachineRegisterInfo *MRI = &Root.getMF()->getRegInfo();
2311 const TargetRegisterInfo *TRI = MRI->getTargetRegisterInfo();
2312
2313 // Make sure vtype operands are also the same.
2314 const MCInstrDesc &Desc = get(Root.getOpcode());
2315 const uint64_t TSFlags = Desc.TSFlags;
2316
2317 auto checkImmOperand = [&](unsigned OpIdx) {
2318 return Root.getOperand(OpIdx).getImm() == Prev.getOperand(OpIdx).getImm();
2319 };
2320
2321 auto checkRegOperand = [&](unsigned OpIdx) {
2322 return Root.getOperand(OpIdx).getReg() == Prev.getOperand(OpIdx).getReg();
2323 };
2324
2325 // PassThru
2326 // TODO: Potentially we can loosen the condition to consider Root to be
2327 // associable with Prev if Root has NoReg as passthru. In which case we
2328 // also need to loosen the condition on vector policies between these.
2329 if (!checkRegOperand(1))
2330 return false;
2331
2332 // SEW
2333 if (RISCVII::hasSEWOp(TSFlags) &&
2334 !checkImmOperand(RISCVII::getSEWOpNum(Desc)))
2335 return false;
2336
2337 // Mask
2338 if (RISCVII::usesMaskPolicy(TSFlags)) {
2339 const MachineBasicBlock *MBB = Root.getParent();
2342 Register MI1VReg;
2343
2344 bool SeenMI2 = false;
2345 for (auto End = MBB->rend(), It = It1; It != End; ++It) {
2346 if (It == It2) {
2347 SeenMI2 = true;
2348 if (!MI1VReg.isValid())
2349 // There is no V0 def between Root and Prev; they're sharing the
2350 // same V0.
2351 break;
2352 }
2353
2354 if (It->modifiesRegister(RISCV::V0, TRI)) {
2355 Register SrcReg = It->getOperand(1).getReg();
2356 // If it's not VReg it'll be more difficult to track its defs, so
2357 // bailing out here just to be safe.
2358 if (!SrcReg.isVirtual())
2359 return false;
2360
2361 if (!MI1VReg.isValid()) {
2362 // This is the V0 def for Root.
2363 MI1VReg = SrcReg;
2364 continue;
2365 }
2366
2367 // Some random mask updates.
2368 if (!SeenMI2)
2369 continue;
2370
2371 // This is the V0 def for Prev; check if it's the same as that of
2372 // Root.
2373 if (MI1VReg != SrcReg)
2374 return false;
2375 else
2376 break;
2377 }
2378 }
2379
2380 // If we haven't encountered Prev, it's likely that this function was
2381 // called in a wrong way (e.g. Root is before Prev).
2382 assert(SeenMI2 && "Prev is expected to appear before Root");
2383 }
2384
2385 // Tail / Mask policies
2386 if (RISCVII::hasVecPolicyOp(TSFlags) &&
2387 !checkImmOperand(RISCVII::getVecPolicyOpNum(Desc)))
2388 return false;
2389
2390 // VL
2391 if (RISCVII::hasVLOp(TSFlags)) {
2392 unsigned OpIdx = RISCVII::getVLOpNum(Desc);
2393 const MachineOperand &Op1 = Root.getOperand(OpIdx);
2394 const MachineOperand &Op2 = Prev.getOperand(OpIdx);
2395 if (Op1.getType() != Op2.getType())
2396 return false;
2397 switch (Op1.getType()) {
2399 if (Op1.getReg() != Op2.getReg())
2400 return false;
2401 break;
2403 if (Op1.getImm() != Op2.getImm())
2404 return false;
2405 break;
2406 default:
2407 llvm_unreachable("Unrecognized VL operand type");
2408 }
2409 }
2410
2411 // Rounding modes
2412 if (int Idx = RISCVII::getFRMOpNum(Desc); Idx >= 0 && !checkImmOperand(Idx))
2413 return false;
2414 if (int Idx = RISCVII::getVXRMOpNum(Desc); Idx >= 0 && !checkImmOperand(Idx))
2415 return false;
2416
2417 return true;
2418}
2419
2420// Most of our RVV pseudos have passthru operand, so the real operands
2421// start from index = 2.
2422bool RISCVInstrInfo::hasReassociableVectorSibling(const MachineInstr &Inst,
2423 bool &Commuted) const {
2424 const MachineBasicBlock *MBB = Inst.getParent();
2425 const MachineRegisterInfo &MRI = MBB->getParent()->getRegInfo();
2427 "Expect the present of passthrough operand.");
2428 MachineInstr *MI1 = MRI.getUniqueVRegDef(Inst.getOperand(2).getReg());
2429 MachineInstr *MI2 = MRI.getUniqueVRegDef(Inst.getOperand(3).getReg());
2430
2431 // If only one operand has the same or inverse opcode and it's the second
2432 // source operand, the operands must be commuted.
2433 Commuted = !areRVVInstsReassociable(Inst, *MI1) &&
2434 areRVVInstsReassociable(Inst, *MI2);
2435 if (Commuted)
2436 std::swap(MI1, MI2);
2437
2438 return areRVVInstsReassociable(Inst, *MI1) &&
2439 (isVectorAssociativeAndCommutative(*MI1) ||
2440 isVectorAssociativeAndCommutative(*MI1, /* Invert */ true)) &&
2442 MRI.hasOneNonDBGUse(MI1->getOperand(0).getReg());
2443}
2444
2446 const MachineInstr &Inst, const MachineBasicBlock *MBB) const {
2447 if (!isVectorAssociativeAndCommutative(Inst) &&
2448 !isVectorAssociativeAndCommutative(Inst, /*Invert=*/true))
2450
2451 const MachineOperand &Op1 = Inst.getOperand(2);
2452 const MachineOperand &Op2 = Inst.getOperand(3);
2453 const MachineRegisterInfo &MRI = MBB->getParent()->getRegInfo();
2454
2455 // We need virtual register definitions for the operands that we will
2456 // reassociate.
2457 MachineInstr *MI1 = nullptr;
2458 MachineInstr *MI2 = nullptr;
2459 if (Op1.isReg() && Op1.getReg().isVirtual())
2460 MI1 = MRI.getUniqueVRegDef(Op1.getReg());
2461 if (Op2.isReg() && Op2.getReg().isVirtual())
2462 MI2 = MRI.getUniqueVRegDef(Op2.getReg());
2463
2464 // And at least one operand must be defined in MBB.
2465 return MI1 && MI2 && (MI1->getParent() == MBB || MI2->getParent() == MBB);
2466}
2467
2469 const MachineInstr &Root, unsigned Pattern,
2470 std::array<unsigned, 5> &OperandIndices) const {
2472 if (RISCV::getRVVMCOpcode(Root.getOpcode())) {
2473 // Skip the passthrough operand, so increment all indices by one.
2474 for (unsigned I = 0; I < 5; ++I)
2475 ++OperandIndices[I];
2476 }
2477}
2478
2480 bool &Commuted) const {
2481 if (isVectorAssociativeAndCommutative(Inst) ||
2482 isVectorAssociativeAndCommutative(Inst, /*Invert=*/true))
2483 return hasReassociableVectorSibling(Inst, Commuted);
2484
2485 if (!TargetInstrInfo::hasReassociableSibling(Inst, Commuted))
2486 return false;
2487
2488 const MachineRegisterInfo &MRI = Inst.getMF()->getRegInfo();
2489 unsigned OperandIdx = Commuted ? 2 : 1;
2490 const MachineInstr &Sibling =
2491 *MRI.getVRegDef(Inst.getOperand(OperandIdx).getReg());
2492
2493 int16_t InstFrmOpIdx =
2494 RISCV::getNamedOperandIdx(Inst.getOpcode(), RISCV::OpName::frm);
2495 int16_t SiblingFrmOpIdx =
2496 RISCV::getNamedOperandIdx(Sibling.getOpcode(), RISCV::OpName::frm);
2497
2498 return (InstFrmOpIdx < 0 && SiblingFrmOpIdx < 0) ||
2499 RISCV::hasEqualFRM(Inst, Sibling);
2500}
2501
2503 bool Invert) const {
2504 if (isVectorAssociativeAndCommutative(Inst, Invert))
2505 return true;
2506
2507 unsigned Opc = Inst.getOpcode();
2508 if (Invert) {
2509 auto InverseOpcode = getInverseOpcode(Opc);
2510 if (!InverseOpcode)
2511 return false;
2512 Opc = *InverseOpcode;
2513 }
2514
2515 if (isFADD(Opc) || isFMUL(Opc))
2518
2519 switch (Opc) {
2520 default:
2521 return false;
2522 case RISCV::ADD:
2523 case RISCV::ADDW:
2524 case RISCV::AND:
2525 case RISCV::OR:
2526 case RISCV::XOR:
2527 // From RISC-V ISA spec, if both the high and low bits of the same product
2528 // are required, then the recommended code sequence is:
2529 //
2530 // MULH[[S]U] rdh, rs1, rs2
2531 // MUL rdl, rs1, rs2
2532 // (source register specifiers must be in same order and rdh cannot be the
2533 // same as rs1 or rs2)
2534 //
2535 // Microarchitectures can then fuse these into a single multiply operation
2536 // instead of performing two separate multiplies.
2537 // MachineCombiner may reassociate MUL operands and lose the fusion
2538 // opportunity.
2539 case RISCV::MUL:
2540 case RISCV::MULW:
2541 case RISCV::MIN:
2542 case RISCV::MINU:
2543 case RISCV::MAX:
2544 case RISCV::MAXU:
2545 case RISCV::FMIN_H:
2546 case RISCV::FMIN_S:
2547 case RISCV::FMIN_D:
2548 case RISCV::FMAX_H:
2549 case RISCV::FMAX_S:
2550 case RISCV::FMAX_D:
2551 return true;
2552 }
2553
2554 return false;
2555}
2556
2557std::optional<unsigned>
2558RISCVInstrInfo::getInverseOpcode(unsigned Opcode) const {
2559#define RVV_OPC_LMUL_CASE(OPC, INV) \
2560 case RISCV::OPC##_M1: \
2561 return RISCV::INV##_M1; \
2562 case RISCV::OPC##_M2: \
2563 return RISCV::INV##_M2; \
2564 case RISCV::OPC##_M4: \
2565 return RISCV::INV##_M4; \
2566 case RISCV::OPC##_M8: \
2567 return RISCV::INV##_M8; \
2568 case RISCV::OPC##_MF2: \
2569 return RISCV::INV##_MF2; \
2570 case RISCV::OPC##_MF4: \
2571 return RISCV::INV##_MF4; \
2572 case RISCV::OPC##_MF8: \
2573 return RISCV::INV##_MF8
2574
2575#define RVV_OPC_LMUL_MASK_CASE(OPC, INV) \
2576 case RISCV::OPC##_M1_MASK: \
2577 return RISCV::INV##_M1_MASK; \
2578 case RISCV::OPC##_M2_MASK: \
2579 return RISCV::INV##_M2_MASK; \
2580 case RISCV::OPC##_M4_MASK: \
2581 return RISCV::INV##_M4_MASK; \
2582 case RISCV::OPC##_M8_MASK: \
2583 return RISCV::INV##_M8_MASK; \
2584 case RISCV::OPC##_MF2_MASK: \
2585 return RISCV::INV##_MF2_MASK; \
2586 case RISCV::OPC##_MF4_MASK: \
2587 return RISCV::INV##_MF4_MASK; \
2588 case RISCV::OPC##_MF8_MASK: \
2589 return RISCV::INV##_MF8_MASK
2590
2591 switch (Opcode) {
2592 default:
2593 return std::nullopt;
2594 case RISCV::FADD_H:
2595 return RISCV::FSUB_H;
2596 case RISCV::FADD_S:
2597 return RISCV::FSUB_S;
2598 case RISCV::FADD_D:
2599 return RISCV::FSUB_D;
2600 case RISCV::FSUB_H:
2601 return RISCV::FADD_H;
2602 case RISCV::FSUB_S:
2603 return RISCV::FADD_S;
2604 case RISCV::FSUB_D:
2605 return RISCV::FADD_D;
2606 case RISCV::ADD:
2607 return RISCV::SUB;
2608 case RISCV::SUB:
2609 return RISCV::ADD;
2610 case RISCV::ADDW:
2611 return RISCV::SUBW;
2612 case RISCV::SUBW:
2613 return RISCV::ADDW;
2614 // clang-format off
2615 RVV_OPC_LMUL_CASE(PseudoVADD_VV, PseudoVSUB_VV);
2616 RVV_OPC_LMUL_MASK_CASE(PseudoVADD_VV, PseudoVSUB_VV);
2617 RVV_OPC_LMUL_CASE(PseudoVSUB_VV, PseudoVADD_VV);
2618 RVV_OPC_LMUL_MASK_CASE(PseudoVSUB_VV, PseudoVADD_VV);
2619 // clang-format on
2620 }
2621
2622#undef RVV_OPC_LMUL_MASK_CASE
2623#undef RVV_OPC_LMUL_CASE
2624}
2625
2627 const MachineOperand &MO,
2628 bool DoRegPressureReduce) {
2629 if (!MO.isReg() || !MO.getReg().isVirtual())
2630 return false;
2631 const MachineRegisterInfo &MRI = Root.getMF()->getRegInfo();
2632 MachineInstr *MI = MRI.getVRegDef(MO.getReg());
2633 if (!MI || !isFMUL(MI->getOpcode()))
2634 return false;
2635
2638 return false;
2639
2640 // Try combining even if fmul has more than one use as it eliminates
2641 // dependency between fadd(fsub) and fmul. However, it can extend liveranges
2642 // for fmul operands, so reject the transformation in register pressure
2643 // reduction mode.
2644 if (DoRegPressureReduce && !MRI.hasOneNonDBGUse(MI->getOperand(0).getReg()))
2645 return false;
2646
2647 // Do not combine instructions from different basic blocks.
2648 if (Root.getParent() != MI->getParent())
2649 return false;
2650 return RISCV::hasEqualFRM(Root, *MI);
2651}
2652
2654 SmallVectorImpl<unsigned> &Patterns,
2655 bool DoRegPressureReduce) {
2656 unsigned Opc = Root.getOpcode();
2657 bool IsFAdd = isFADD(Opc);
2658 if (!IsFAdd && !isFSUB(Opc))
2659 return false;
2660 bool Added = false;
2661 if (canCombineFPFusedMultiply(Root, Root.getOperand(1),
2662 DoRegPressureReduce)) {
2665 Added = true;
2666 }
2667 if (canCombineFPFusedMultiply(Root, Root.getOperand(2),
2668 DoRegPressureReduce)) {
2671 Added = true;
2672 }
2673 return Added;
2674}
2675
2676static bool getFPPatterns(MachineInstr &Root,
2677 SmallVectorImpl<unsigned> &Patterns,
2678 bool DoRegPressureReduce) {
2679 return getFPFusedMultiplyPatterns(Root, Patterns, DoRegPressureReduce);
2680}
2681
2682/// Utility routine that checks if \param MO is defined by an
2683/// \param CombineOpc instruction in the basic block \param MBB
2685 const MachineOperand &MO,
2686 unsigned CombineOpc) {
2687 const MachineRegisterInfo &MRI = MBB.getParent()->getRegInfo();
2688 const MachineInstr *MI = nullptr;
2689
2690 if (MO.isReg() && MO.getReg().isVirtual())
2691 MI = MRI.getUniqueVRegDef(MO.getReg());
2692 // And it needs to be in the trace (otherwise, it won't have a depth).
2693 if (!MI || MI->getParent() != &MBB || MI->getOpcode() != CombineOpc)
2694 return nullptr;
2695 // Must only used by the user we combine with.
2696 if (!MRI.hasOneNonDBGUse(MI->getOperand(0).getReg()))
2697 return nullptr;
2698
2699 return MI;
2700}
2701
2702/// Utility routine that checks if \param MO is defined by a SLLI in \param
2703/// MBB that can be combined by splitting across 2 SHXADD instructions. The
2704/// first SHXADD shift amount is given by \param OuterShiftAmt.
2706 const MachineOperand &MO,
2707 unsigned OuterShiftAmt) {
2708 const MachineInstr *ShiftMI = canCombine(MBB, MO, RISCV::SLLI);
2709 if (!ShiftMI)
2710 return false;
2711
2712 unsigned InnerShiftAmt = ShiftMI->getOperand(2).getImm();
2713 if (InnerShiftAmt < OuterShiftAmt || (InnerShiftAmt - OuterShiftAmt) > 3)
2714 return false;
2715
2716 return true;
2717}
2718
2719// Returns the shift amount from a SHXADD instruction. Returns 0 if the
2720// instruction is not a SHXADD.
2721static unsigned getSHXADDShiftAmount(unsigned Opc) {
2722 switch (Opc) {
2723 default:
2724 return 0;
2725 case RISCV::SH1ADD:
2726 return 1;
2727 case RISCV::SH2ADD:
2728 return 2;
2729 case RISCV::SH3ADD:
2730 return 3;
2731 }
2732}
2733
2734// Returns the shift amount from a SHXADD.UW instruction. Returns 0 if the
2735// instruction is not a SHXADD.UW.
2736static unsigned getSHXADDUWShiftAmount(unsigned Opc) {
2737 switch (Opc) {
2738 default:
2739 return 0;
2740 case RISCV::SH1ADD_UW:
2741 return 1;
2742 case RISCV::SH2ADD_UW:
2743 return 2;
2744 case RISCV::SH3ADD_UW:
2745 return 3;
2746 }
2747}
2748
2749// Look for opportunities to combine (sh3add Z, (add X, (slli Y, 5))) into
2750// (sh3add (sh2add Y, Z), X).
2751static bool getSHXADDPatterns(const MachineInstr &Root,
2752 SmallVectorImpl<unsigned> &Patterns) {
2753 unsigned ShiftAmt = getSHXADDShiftAmount(Root.getOpcode());
2754 if (!ShiftAmt)
2755 return false;
2756
2757 const MachineBasicBlock &MBB = *Root.getParent();
2758
2759 const MachineInstr *AddMI = canCombine(MBB, Root.getOperand(2), RISCV::ADD);
2760 if (!AddMI)
2761 return false;
2762
2763 bool Found = false;
2764 if (canCombineShiftIntoShXAdd(MBB, AddMI->getOperand(1), ShiftAmt)) {
2766 Found = true;
2767 }
2768 if (canCombineShiftIntoShXAdd(MBB, AddMI->getOperand(2), ShiftAmt)) {
2770 Found = true;
2771 }
2772
2773 return Found;
2774}
2775
2787
2789 MachineInstr &Root, SmallVectorImpl<unsigned> &Patterns,
2790 bool DoRegPressureReduce) const {
2791
2792 if (getFPPatterns(Root, Patterns, DoRegPressureReduce))
2793 return true;
2794
2795 if (getSHXADDPatterns(Root, Patterns))
2796 return true;
2797
2798 return TargetInstrInfo::getMachineCombinerPatterns(Root, Patterns,
2799 DoRegPressureReduce);
2800}
2801
2802static unsigned getFPFusedMultiplyOpcode(unsigned RootOpc, unsigned Pattern) {
2803 switch (RootOpc) {
2804 default:
2805 llvm_unreachable("Unexpected opcode");
2806 case RISCV::FADD_H:
2807 return RISCV::FMADD_H;
2808 case RISCV::FADD_S:
2809 return RISCV::FMADD_S;
2810 case RISCV::FADD_D:
2811 return RISCV::FMADD_D;
2812 case RISCV::FSUB_H:
2813 return Pattern == RISCVMachineCombinerPattern::FMSUB ? RISCV::FMSUB_H
2814 : RISCV::FNMSUB_H;
2815 case RISCV::FSUB_S:
2816 return Pattern == RISCVMachineCombinerPattern::FMSUB ? RISCV::FMSUB_S
2817 : RISCV::FNMSUB_S;
2818 case RISCV::FSUB_D:
2819 return Pattern == RISCVMachineCombinerPattern::FMSUB ? RISCV::FMSUB_D
2820 : RISCV::FNMSUB_D;
2821 }
2822}
2823
2824static unsigned getAddendOperandIdx(unsigned Pattern) {
2825 switch (Pattern) {
2826 default:
2827 llvm_unreachable("Unexpected pattern");
2830 return 2;
2833 return 1;
2834 }
2835}
2836
2838 unsigned Pattern,
2841 MachineFunction *MF = Root.getMF();
2842 MachineRegisterInfo &MRI = MF->getRegInfo();
2844
2845 MachineOperand &Mul1 = Prev.getOperand(1);
2846 MachineOperand &Mul2 = Prev.getOperand(2);
2847 MachineOperand &Dst = Root.getOperand(0);
2849
2850 Register DstReg = Dst.getReg();
2851 unsigned FusedOpc = getFPFusedMultiplyOpcode(Root.getOpcode(), Pattern);
2852 uint32_t IntersectedFlags = Root.getFlags() & Prev.getFlags();
2853 DebugLoc MergedLoc =
2855
2856 bool Mul1IsKill = Mul1.isKill();
2857 bool Mul2IsKill = Mul2.isKill();
2858 bool AddendIsKill = Addend.isKill();
2859
2860 // We need to clear kill flags since we may be extending the live range past
2861 // a kill. If the mul had kill flags, we can preserve those since we know
2862 // where the previous range stopped.
2863 MRI.clearKillFlags(Mul1.getReg());
2864 MRI.clearKillFlags(Mul2.getReg());
2865
2867 BuildMI(*MF, MergedLoc, TII->get(FusedOpc), DstReg)
2868 .addReg(Mul1.getReg(), getKillRegState(Mul1IsKill))
2869 .addReg(Mul2.getReg(), getKillRegState(Mul2IsKill))
2870 .addReg(Addend.getReg(), getKillRegState(AddendIsKill))
2871 .setMIFlags(IntersectedFlags);
2872
2873 InsInstrs.push_back(MIB);
2874 if (MRI.hasOneNonDBGUse(Prev.getOperand(0).getReg()))
2875 DelInstrs.push_back(&Prev);
2876 DelInstrs.push_back(&Root);
2877}
2878
2879// Combine patterns like (sh3add Z, (add X, (slli Y, 5))) to
2880// (sh3add (sh2add Y, Z), X) if the shift amount can be split across two
2881// shXadd instructions. The outer shXadd keeps its original opcode.
2882static void
2883genShXAddAddShift(MachineInstr &Root, unsigned AddOpIdx,
2886 DenseMap<Register, unsigned> &InstrIdxForVirtReg) {
2887 MachineFunction *MF = Root.getMF();
2888 MachineRegisterInfo &MRI = MF->getRegInfo();
2890
2891 unsigned OuterShiftAmt = getSHXADDShiftAmount(Root.getOpcode());
2892 assert(OuterShiftAmt != 0 && "Unexpected opcode");
2893
2894 MachineInstr *AddMI = MRI.getUniqueVRegDef(Root.getOperand(2).getReg());
2895 MachineInstr *ShiftMI =
2896 MRI.getUniqueVRegDef(AddMI->getOperand(AddOpIdx).getReg());
2897
2898 unsigned InnerShiftAmt = ShiftMI->getOperand(2).getImm();
2899 assert(InnerShiftAmt >= OuterShiftAmt && "Unexpected shift amount");
2900
2901 unsigned InnerOpc;
2902 switch (InnerShiftAmt - OuterShiftAmt) {
2903 default:
2904 llvm_unreachable("Unexpected shift amount");
2905 case 0:
2906 InnerOpc = RISCV::ADD;
2907 break;
2908 case 1:
2909 InnerOpc = RISCV::SH1ADD;
2910 break;
2911 case 2:
2912 InnerOpc = RISCV::SH2ADD;
2913 break;
2914 case 3:
2915 InnerOpc = RISCV::SH3ADD;
2916 break;
2917 }
2918
2919 const MachineOperand &X = AddMI->getOperand(3 - AddOpIdx);
2920 const MachineOperand &Y = ShiftMI->getOperand(1);
2921 const MachineOperand &Z = Root.getOperand(1);
2922
2923 Register NewVR = MRI.createVirtualRegister(&RISCV::GPRRegClass);
2924
2925 auto MIB1 = BuildMI(*MF, MIMetadata(Root), TII->get(InnerOpc), NewVR)
2926 .addReg(Y.getReg(), getKillRegState(Y.isKill()))
2927 .addReg(Z.getReg(), getKillRegState(Z.isKill()));
2928 auto MIB2 = BuildMI(*MF, MIMetadata(Root), TII->get(Root.getOpcode()),
2929 Root.getOperand(0).getReg())
2930 .addReg(NewVR, RegState::Kill)
2931 .addReg(X.getReg(), getKillRegState(X.isKill()));
2932
2933 InstrIdxForVirtReg.insert(std::make_pair(NewVR, 0));
2934 InsInstrs.push_back(MIB1);
2935 InsInstrs.push_back(MIB2);
2936 DelInstrs.push_back(ShiftMI);
2937 DelInstrs.push_back(AddMI);
2938 DelInstrs.push_back(&Root);
2939}
2940
2942 MachineInstr &Root, unsigned Pattern,
2945 DenseMap<Register, unsigned> &InstrIdxForVirtReg) const {
2946 MachineRegisterInfo &MRI = Root.getMF()->getRegInfo();
2947 switch (Pattern) {
2948 default:
2950 DelInstrs, InstrIdxForVirtReg);
2951 return;
2954 MachineInstr &Prev = *MRI.getVRegDef(Root.getOperand(1).getReg());
2955 combineFPFusedMultiply(Root, Prev, Pattern, InsInstrs, DelInstrs);
2956 return;
2957 }
2960 MachineInstr &Prev = *MRI.getVRegDef(Root.getOperand(2).getReg());
2961 combineFPFusedMultiply(Root, Prev, Pattern, InsInstrs, DelInstrs);
2962 return;
2963 }
2965 genShXAddAddShift(Root, 1, InsInstrs, DelInstrs, InstrIdxForVirtReg);
2966 return;
2968 genShXAddAddShift(Root, 2, InsInstrs, DelInstrs, InstrIdxForVirtReg);
2969 return;
2970 }
2971}
2972
2974 StringRef &ErrInfo) const {
2975 MCInstrDesc const &Desc = MI.getDesc();
2976
2977 for (const auto &[Index, Operand] : enumerate(Desc.operands())) {
2978 const MachineOperand &MO = MI.getOperand(Index);
2979 unsigned OpType = Operand.OperandType;
2980 switch (OpType) {
2981 default:
2982 if (OpType >= RISCVOp::OPERAND_FIRST_RISCV_IMM &&
2984 if (!MO.isImm()) {
2985 ErrInfo = "Expected an immediate operand.";
2986 return false;
2987 }
2988 int64_t Imm = MO.getImm();
2989 bool Ok;
2990 switch (OpType) {
2991 default:
2992 llvm_unreachable("Unexpected operand type");
2993
2994#define CASE_OPERAND_UIMM(NUM) \
2995 case RISCVOp::OPERAND_UIMM##NUM: \
2996 Ok = isUInt<NUM>(Imm); \
2997 break;
2998#define CASE_OPERAND_UIMM_LSB_ZEROS(BITS, SUFFIX) \
2999 case RISCVOp::OPERAND_UIMM##BITS##_LSB##SUFFIX: { \
3000 constexpr size_t NumZeros = sizeof(#SUFFIX) - 1; \
3001 Ok = isShiftedUInt<BITS - NumZeros, NumZeros>(Imm); \
3002 break; \
3003 }
3004#define CASE_OPERAND_SIMM(NUM) \
3005 case RISCVOp::OPERAND_SIMM##NUM: \
3006 Ok = isInt<NUM>(Imm); \
3007 break;
3008 // clang-format off
3032 // clang-format on
3034 Ok = isUInt<5>(Imm) && (Imm != 0);
3035 break;
3037 Ok = isUInt<5>(Imm) && (Imm > 3);
3038 break;
3040 Ok = Imm >= 1 && Imm <= 32;
3041 break;
3043 Ok = Imm >= 1 && Imm <= 64;
3044 break;
3046 Ok = Imm == STI.getXLen();
3047 break;
3049 Ok = isUInt<8>(Imm) && Imm >= 32;
3050 break;
3052 Ok = RISCV::isValidYBNDSWImm(Imm);
3053 break;
3055 Ok = isShiftedInt<6, 4>(Imm) && (Imm != 0);
3056 break;
3058 Ok = isShiftedUInt<8, 2>(Imm) && (Imm != 0);
3059 break;
3061 Ok = isUInt<16>(Imm) && (Imm != 0);
3062 break;
3064 Ok = Imm == 3;
3065 break;
3067 Ok = Imm == 4;
3068 break;
3070 Ok = (isUInt<5>(Imm) && Imm != 0) || Imm == -1;
3071 break;
3072 // clang-format off
3080 // clang-format on
3082 Ok = Imm >= -15 && Imm <= 16;
3083 break;
3085 Ok = isInt<5>(Imm) && (Imm != 0);
3086 break;
3088 Ok = Imm != 0 && isInt<6>(Imm);
3089 break;
3091 Ok = isUInt<10>(Imm) && RISCVVType::isValidVType(Imm);
3092 break;
3094 Ok = isUInt<11>(Imm) && RISCVVType::isValidVType(Imm);
3095 break;
3097 Ok = isShiftedInt<7, 5>(Imm);
3098 break;
3100 Ok = isInt<16>(Imm) && (Imm != 0);
3101 break;
3103 Ok = isInt<20>(Imm);
3104 break;
3106 Ok = STI.is64Bit() ? isUInt<6>(Imm) : isUInt<5>(Imm);
3107 break;
3109 Ok = STI.is64Bit() ? isUInt<6>(Imm) : isUInt<5>(Imm);
3110 Ok = Ok && Imm != 0;
3111 break;
3113 Ok = (isUInt<5>(Imm) && Imm != 0) || (Imm >= 0xfffe0 && Imm <= 0xfffff);
3114 break;
3116 Ok = Imm >= 0 && Imm <= 10;
3117 break;
3119 Ok = Imm >= 0 && Imm <= 7;
3120 break;
3122 Ok = Imm >= 1 && Imm <= 10;
3123 break;
3125 Ok = Imm >= 2 && Imm <= 14;
3126 break;
3128 Ok = Imm >= RISCVZC::RA && Imm <= RISCVZC::RA_S0_S11;
3129 break;
3131 Ok = Imm >= RISCVZC::RA_S0 && Imm <= RISCVZC::RA_S0_S11;
3132 break;
3134 Ok = Imm >= 0 && Imm <= 48 && Imm % 16 == 0;
3135 break;
3138 break;
3140 Ok = Imm == RISCVFPRndMode::RTZ;
3141 break;
3143 Ok = Imm >= 0 && Imm < RISCVCC::COND_INVALID;
3144 break;
3146 Ok = isValidAtomicOrdering(Imm);
3147 break;
3150 Imm;
3151 break;
3153 Ok = (isUInt<5>(Imm) && RISCVVType::isValidSEW(1 << Imm));
3154 break;
3156 Ok = Imm == 0;
3157 break;
3160 if (RISCVII::usesVXRM(Desc.TSFlags))
3161 Ok = isUInt<2>(Imm);
3162 else
3164 break;
3167 break;
3169 Ok = Imm == 1 || Imm == 2 || Imm == 4;
3170 break;
3171 }
3172 if (!Ok) {
3173 ErrInfo = "Invalid immediate";
3174 return false;
3175 }
3176 }
3177 break;
3179 // TODO: We could be stricter about what non-register operands are
3180 // allowed.
3181 if (MO.isReg()) {
3182 ErrInfo = "Expected a non-register operand.";
3183 return false;
3184 }
3185 if (MO.isImm() && !isInt<12>(MO.getImm())) {
3186 ErrInfo = "Invalid immediate";
3187 return false;
3188 }
3189 break;
3192 // TODO: We could be stricter about what non-register operands are
3193 // allowed.
3194 if (MO.isReg()) {
3195 ErrInfo = "Expected a non-register operand.";
3196 return false;
3197 }
3198 if (MO.isImm() && !isUInt<20>(MO.getImm())) {
3199 ErrInfo = "Invalid immediate";
3200 return false;
3201 }
3202 break;
3204 // TODO: We could be stricter about what non-register operands are
3205 // allowed.
3206 if (MO.isReg()) {
3207 ErrInfo = "Expected a non-register operand.";
3208 return false;
3209 }
3210 if (MO.isImm() && !isInt<32>(MO.getImm())) {
3211 ErrInfo = "Invalid immediate";
3212 return false;
3213 }
3214 break;
3216 if (MO.isImm()) {
3217 int64_t Imm = MO.getImm();
3218 // VLMAX is represented as -1.
3219 if (!isUInt<5>(Imm) && Imm != -1) {
3220 ErrInfo = "Invalid immediate";
3221 return false;
3222 }
3223 } else if (!MO.isReg()) {
3224 ErrInfo = "Expected a register or immediate operand.";
3225 return false;
3226 }
3227 break;
3229 if (!MO.isReg() && !MO.isImm()) {
3230 ErrInfo = "Expected a register or immediate operand.";
3231 return false;
3232 }
3233 break;
3234 }
3235 }
3236
3237 const uint64_t TSFlags = Desc.TSFlags;
3238 if (RISCVII::hasVLOp(TSFlags)) {
3239 const MachineOperand &Op = MI.getOperand(RISCVII::getVLOpNum(Desc));
3240 if (!Op.isImm() && !Op.isReg()) {
3241 ErrInfo = "Invalid operand type for VL operand";
3242 return false;
3243 }
3244 if (Op.isReg() && Op.getReg().isValid()) {
3245 const MachineRegisterInfo &MRI = MI.getParent()->getParent()->getRegInfo();
3246 auto *RC = MRI.getRegClass(Op.getReg());
3247 if (!RISCV::GPRNoX0RegClass.hasSubClassEq(RC)) {
3248 ErrInfo = "Invalid register class for VL operand";
3249 return false;
3250 }
3251 }
3252 if (!RISCVII::hasSEWOp(TSFlags)) {
3253 ErrInfo = "VL operand w/o SEW operand?";
3254 return false;
3255 }
3256 }
3257 if (RISCVII::hasSEWOp(TSFlags)) {
3258 unsigned OpIdx = RISCVII::getSEWOpNum(Desc);
3259 if (!MI.getOperand(OpIdx).isImm()) {
3260 ErrInfo = "SEW value expected to be an immediate";
3261 return false;
3262 }
3263 uint64_t Log2SEW = MI.getOperand(OpIdx).getImm();
3264 if (Log2SEW > 31) {
3265 ErrInfo = "Unexpected SEW value";
3266 return false;
3267 }
3268 unsigned SEW = Log2SEW ? 1 << Log2SEW : 8;
3269 if (!RISCVVType::isValidSEW(SEW)) {
3270 ErrInfo = "Unexpected SEW value";
3271 return false;
3272 }
3273 }
3274 if (RISCVII::hasVecPolicyOp(TSFlags)) {
3276 if (!MI.getOperand(OpIdx).isImm()) {
3277 ErrInfo = "Policy operand expected to be an immediate";
3278 return false;
3279 }
3280 uint64_t Policy = MI.getOperand(OpIdx).getImm();
3282 ErrInfo = "Invalid Policy Value";
3283 return false;
3284 }
3285 if (!RISCVII::hasVLOp(TSFlags)) {
3286 ErrInfo = "policy operand w/o VL operand?";
3287 return false;
3288 }
3289
3290 // VecPolicy operands can only exist on instructions with passthru/merge
3291 // arguments. Note that not all arguments with passthru have vec policy
3292 // operands- some instructions have implicit policies.
3293 unsigned UseOpIdx;
3294 if (!MI.isRegTiedToUseOperand(0, &UseOpIdx)) {
3295 ErrInfo = "policy operand w/o tied operand?";
3296 return false;
3297 }
3298 }
3299
3300 if (int Idx = RISCVII::getFRMOpNum(Desc);
3301 Idx >= 0 && MI.getOperand(Idx).getImm() == RISCVFPRndMode::DYN &&
3302 !MI.readsRegister(RISCV::FRM, /*TRI=*/nullptr)) {
3303 ErrInfo = "dynamic rounding mode should read FRM";
3304 return false;
3305 }
3306
3307 return true;
3308}
3309
3311 const MachineInstr &AddrI,
3312 ExtAddrMode &AM) const {
3313 switch (MemI.getOpcode()) {
3314 default:
3315 return false;
3316 case RISCV::LB:
3317 case RISCV::LBU:
3318 case RISCV::LH:
3319 case RISCV::LH_INX:
3320 case RISCV::LHU:
3321 case RISCV::LW:
3322 case RISCV::LW_INX:
3323 case RISCV::LWU:
3324 case RISCV::LD:
3325 case RISCV::LD_RV32:
3326 case RISCV::FLH:
3327 case RISCV::FLW:
3328 case RISCV::FLD:
3329 case RISCV::SB:
3330 case RISCV::SH:
3331 case RISCV::SH_INX:
3332 case RISCV::SW:
3333 case RISCV::SW_INX:
3334 case RISCV::SD:
3335 case RISCV::SD_RV32:
3336 case RISCV::FSH:
3337 case RISCV::FSW:
3338 case RISCV::FSD:
3339 break;
3340 }
3341
3342 if (MemI.getOperand(0).getReg() == Reg)
3343 return false;
3344
3345 if (AddrI.getOpcode() != RISCV::ADDI || !AddrI.getOperand(1).isReg() ||
3346 !AddrI.getOperand(2).isImm())
3347 return false;
3348
3349 int64_t OldOffset = MemI.getOperand(2).getImm();
3350 int64_t Disp = AddrI.getOperand(2).getImm();
3351 int64_t NewOffset = OldOffset + Disp;
3352 if (!STI.is64Bit())
3353 NewOffset = SignExtend64<32>(NewOffset);
3354
3355 if (!isInt<12>(NewOffset))
3356 return false;
3357
3358 AM.BaseReg = AddrI.getOperand(1).getReg();
3359 AM.ScaledReg = 0;
3360 AM.Scale = 0;
3361 AM.Displacement = NewOffset;
3363 return true;
3364}
3365
3367 const ExtAddrMode &AM) const {
3368
3369 const DebugLoc &DL = MemI.getDebugLoc();
3370 MachineBasicBlock &MBB = *MemI.getParent();
3371
3372 assert(AM.ScaledReg == 0 && AM.Scale == 0 &&
3373 "Addressing mode not supported for folding");
3374
3375 return BuildMI(MBB, MemI, DL, get(MemI.getOpcode()))
3376 .addReg(MemI.getOperand(0).getReg(), getDefRegState(MemI.mayLoad()))
3377 .addReg(AM.BaseReg)
3378 .addImm(AM.Displacement)
3379 .setMemRefs(MemI.memoperands())
3380 .setMIFlags(MemI.getFlags());
3381}
3382
3383// TODO: At the moment, MIPS introduced paring of instructions operating with
3384// word or double word. This should be extended with more instructions when more
3385// vendors support load/store pairing.
3387 switch (Opc) {
3388 default:
3389 return false;
3390 case RISCV::SW:
3391 case RISCV::SD:
3392 case RISCV::LD:
3393 case RISCV::LW:
3394 return true;
3395 }
3396}
3397
3399 const TargetRegisterInfo *TRI) {
3400 // If this is a volatile load/store, don't mess with it.
3401 if (LdSt.hasOrderedMemoryRef() || LdSt.getNumExplicitOperands() != 3)
3402 return false;
3403
3404 if (LdSt.getOperand(1).isFI())
3405 return true;
3406
3407 assert(LdSt.getOperand(1).isReg() && "Expected a reg operand.");
3408 // Can't cluster if the instruction modifies the base register
3409 // or it is update form. e.g. ld x5,8(x5)
3410 if (LdSt.modifiesRegister(LdSt.getOperand(1).getReg(), TRI))
3411 return false;
3412
3413 if (!LdSt.getOperand(2).isImm())
3414 return false;
3415
3416 return true;
3417}
3418
3421 int64_t &Offset, bool &OffsetIsScalable, LocationSize &Width,
3422 const TargetRegisterInfo *TRI) const {
3423 if (!LdSt.mayLoadOrStore())
3424 return false;
3425
3426 // Conservatively, only handle scalar loads/stores for now.
3427 switch (LdSt.getOpcode()) {
3428 case RISCV::LB:
3429 case RISCV::LBU:
3430 case RISCV::SB:
3431 case RISCV::LH:
3432 case RISCV::LH_INX:
3433 case RISCV::LHU:
3434 case RISCV::FLH:
3435 case RISCV::SH:
3436 case RISCV::SH_INX:
3437 case RISCV::FSH:
3438 case RISCV::LW:
3439 case RISCV::LW_INX:
3440 case RISCV::LWU:
3441 case RISCV::FLW:
3442 case RISCV::SW:
3443 case RISCV::SW_INX:
3444 case RISCV::FSW:
3445 case RISCV::LD:
3446 case RISCV::LD_RV32:
3447 case RISCV::FLD:
3448 case RISCV::SD:
3449 case RISCV::SD_RV32:
3450 case RISCV::FSD:
3451 break;
3452 default:
3453 return false;
3454 }
3455 const MachineOperand *BaseOp;
3456 OffsetIsScalable = false;
3457 if (!getMemOperandWithOffsetWidth(LdSt, BaseOp, Offset, Width, TRI))
3458 return false;
3459 BaseOps.push_back(BaseOp);
3460 return true;
3461}
3462
3463// TODO: This was copied from SIInstrInfo. Could it be lifted to a common
3464// helper?
3467 const MachineInstr &MI2,
3469 // Only examine the first "base" operand of each instruction, on the
3470 // assumption that it represents the real base address of the memory access.
3471 // Other operands are typically offsets or indices from this base address.
3472 if (BaseOps1.front()->isIdenticalTo(*BaseOps2.front()))
3473 return true;
3474
3475 if (!MI1.hasOneMemOperand() || !MI2.hasOneMemOperand())
3476 return false;
3477
3478 auto MO1 = *MI1.memoperands_begin();
3479 auto MO2 = *MI2.memoperands_begin();
3480 if (MO1->getAddrSpace() != MO2->getAddrSpace())
3481 return false;
3482
3483 auto Base1 = MO1->getValue();
3484 auto Base2 = MO2->getValue();
3485 if (!Base1 || !Base2)
3486 return false;
3487 Base1 = getUnderlyingObject(Base1);
3488 Base2 = getUnderlyingObject(Base2);
3489
3490 if (isa<UndefValue>(Base1) || isa<UndefValue>(Base2))
3491 return false;
3492
3493 return Base1 == Base2;
3494}
3495
3497 ArrayRef<const MachineOperand *> BaseOps1, int64_t Offset1,
3498 bool OffsetIsScalable1, ArrayRef<const MachineOperand *> BaseOps2,
3499 int64_t Offset2, bool OffsetIsScalable2, unsigned ClusterSize,
3500 unsigned NumBytes) const {
3501 // If the mem ops (to be clustered) do not have the same base ptr, then they
3502 // should not be clustered
3503 if (!BaseOps1.empty() && !BaseOps2.empty()) {
3504 const MachineInstr &FirstLdSt = *BaseOps1.front()->getParent();
3505 const MachineInstr &SecondLdSt = *BaseOps2.front()->getParent();
3506 if (!memOpsHaveSameBasePtr(FirstLdSt, BaseOps1, SecondLdSt, BaseOps2))
3507 return false;
3508 } else if (!BaseOps1.empty() || !BaseOps2.empty()) {
3509 // If only one base op is empty, they do not have the same base ptr
3510 return false;
3511 }
3512
3513 unsigned CacheLineSize =
3514 BaseOps1.front()->getParent()->getMF()->getSubtarget().getCacheLineSize();
3515 // Assume a cache line size of 64 bytes if no size is set in RISCVSubtarget.
3517 // Cluster if the memory operations are on the same or a neighbouring cache
3518 // line, but limit the maximum ClusterSize to avoid creating too much
3519 // additional register pressure.
3520 return ClusterSize <= 4 && std::abs(Offset1 - Offset2) < CacheLineSize;
3521}
3522
3523// Set BaseReg (the base register operand), Offset (the byte offset being
3524// accessed) and the access Width of the passed instruction that reads/writes
3525// memory. Returns false if the instruction does not read/write memory or the
3526// BaseReg/Offset/Width can't be determined. Is not guaranteed to always
3527// recognise base operands and offsets in all cases.
3528// TODO: Add an IsScalable bool ref argument (like the equivalent AArch64
3529// function) and set it as appropriate.
3531 const MachineInstr &LdSt, const MachineOperand *&BaseReg, int64_t &Offset,
3532 LocationSize &Width, const TargetRegisterInfo *TRI) const {
3533 if (!LdSt.mayLoadOrStore())
3534 return false;
3535
3536 // Here we assume the standard RISC-V ISA, which uses a base+offset
3537 // addressing mode. You'll need to relax these conditions to support custom
3538 // load/store instructions.
3539 if (LdSt.getNumExplicitOperands() != 3)
3540 return false;
3541 if ((!LdSt.getOperand(1).isReg() && !LdSt.getOperand(1).isFI()) ||
3542 !LdSt.getOperand(2).isImm())
3543 return false;
3544
3545 if (!LdSt.hasOneMemOperand())
3546 return false;
3547
3548 Width = (*LdSt.memoperands_begin())->getSize();
3549 BaseReg = &LdSt.getOperand(1);
3550 Offset = LdSt.getOperand(2).getImm();
3551 return true;
3552}
3553
3555 const MachineInstr &MIa, const MachineInstr &MIb) const {
3556 assert(MIa.mayLoadOrStore() && "MIa must be a load or store.");
3557 assert(MIb.mayLoadOrStore() && "MIb must be a load or store.");
3558
3561 return false;
3562
3563 // Retrieve the base register, offset from the base register and width. Width
3564 // is the size of memory that is being loaded/stored (e.g. 1, 2, 4). If
3565 // base registers are identical, and the offset of a lower memory access +
3566 // the width doesn't overlap the offset of a higher memory access,
3567 // then the memory accesses are different.
3568 const TargetRegisterInfo *TRI = STI.getRegisterInfo();
3569 const MachineOperand *BaseOpA = nullptr, *BaseOpB = nullptr;
3570 int64_t OffsetA = 0, OffsetB = 0;
3572 WidthB = LocationSize::precise(0);
3573 if (getMemOperandWithOffsetWidth(MIa, BaseOpA, OffsetA, WidthA, TRI) &&
3574 getMemOperandWithOffsetWidth(MIb, BaseOpB, OffsetB, WidthB, TRI)) {
3575 if (BaseOpA->isIdenticalTo(*BaseOpB)) {
3576 int LowOffset = std::min(OffsetA, OffsetB);
3577 int HighOffset = std::max(OffsetA, OffsetB);
3578 LocationSize LowWidth = (LowOffset == OffsetA) ? WidthA : WidthB;
3579 if (LowWidth.hasValue() &&
3580 LowOffset + (int)LowWidth.getValue() <= HighOffset)
3581 return true;
3582 }
3583 }
3584 return false;
3585}
3586
3587std::pair<unsigned, unsigned>
3589 const unsigned Mask = RISCVII::MO_DIRECT_FLAG_MASK;
3590 return std::make_pair(TF & Mask, TF & ~Mask);
3591}
3592
3595 using namespace RISCVII;
3596 static const std::pair<unsigned, const char *> TargetFlags[] = {
3597 {MO_CALL, "riscv-call"},
3598 {MO_LO, "riscv-lo"},
3599 {MO_HI, "riscv-hi"},
3600 {MO_PCREL_LO, "riscv-pcrel-lo"},
3601 {MO_PCREL_HI, "riscv-pcrel-hi"},
3602 {MO_GOT_HI, "riscv-got-hi"},
3603 {MO_TPREL_LO, "riscv-tprel-lo"},
3604 {MO_TPREL_HI, "riscv-tprel-hi"},
3605 {MO_TPREL_ADD, "riscv-tprel-add"},
3606 {MO_TLS_GOT_HI, "riscv-tls-got-hi"},
3607 {MO_TLS_GD_HI, "riscv-tls-gd-hi"},
3608 {MO_TLSDESC_HI, "riscv-tlsdesc-hi"},
3609 {MO_TLSDESC_LOAD_LO, "riscv-tlsdesc-load-lo"},
3610 {MO_TLSDESC_ADD_LO, "riscv-tlsdesc-add-lo"},
3611 {MO_TLSDESC_CALL, "riscv-tlsdesc-call"}};
3612 return ArrayRef(TargetFlags);
3613}
3615 MachineFunction &MF, bool OutlineFromLinkOnceODRs) const {
3616 const Function &F = MF.getFunction();
3617
3618 // Can F be deduplicated by the linker? If it can, don't outline from it.
3619 if (!OutlineFromLinkOnceODRs && F.hasLinkOnceODRLinkage())
3620 return false;
3621
3622 // Don't outline from functions with section markings; the program could
3623 // expect that all the code is in the named section.
3624 if (F.hasSection())
3625 return false;
3626
3627 // It's safe to outline from MF.
3628 return true;
3629}
3630
3632 unsigned &Flags) const {
3633 // More accurate safety checking is done in getOutliningCandidateInfo.
3635}
3636
3637// Enum values indicating how an outlined call should be constructed.
3643
3648
3650 const MachineFunction *MF = MBB.getParent();
3651 const Function &F = MF->getFunction();
3652 return F.getFnAttribute("fentry-call").getValueAsBool() ||
3653 F.hasFnAttribute("patchable-function-entry");
3654}
3655
3657 MCRegister RegNo) {
3658 return MI.readsRegister(RegNo, TRI) ||
3659 MI.getDesc().hasImplicitUseOfPhysReg(RegNo);
3660}
3661
3663 const TargetRegisterInfo *TRI, MCRegister RegNo) {
3664 return MI.modifiesRegister(RegNo, TRI) ||
3665 MI.getDesc().hasImplicitDefOfPhysReg(RegNo);
3666}
3667
3669 if (!MBB.back().isReturn())
3670 return true;
3672 return true;
3673
3674 // If the candidate reads the pre-set register
3675 // that can be used for expanding PseudoTAIL instruction,
3676 // then we cannot insert tail call.
3677 const TargetSubtargetInfo &STI = MBB.getParent()->getSubtarget();
3678 MCRegister TailExpandUseRegNo =
3680 for (const MachineInstr &MI : MBB) {
3681 if (isMIReadsReg(MI, STI.getRegisterInfo(), TailExpandUseRegNo))
3682 return true;
3683 if (isMIModifiesReg(MI, STI.getRegisterInfo(), TailExpandUseRegNo))
3684 break;
3685 }
3686 return false;
3687}
3688
3690 const TargetRegisterInfo &TRI) {
3691 // Candidate registers for saving X5: t1-t6
3692 static const MCPhysReg TempRegs[] = {
3693 RISCV::X6, // t1
3694 RISCV::X7, // t2
3695 RISCV::X28, // t3
3696 RISCV::X29, // t4
3697 RISCV::X30, // t5
3698 RISCV::X31 // t6
3699 };
3700
3701 const MachineFunction *MF = C.getMF();
3702 const MachineRegisterInfo &MRI = MF->getRegInfo();
3703
3704 for (MCPhysReg Reg : TempRegs) {
3705 if (MRI.isReserved(Reg))
3706 continue;
3707
3708 if (C.isAvailableAcrossAndOutOfSeq(Reg, TRI) &&
3709 C.isAvailableInsideSeq(Reg, TRI)) {
3710 return Reg;
3711 }
3712 }
3713
3714 return Register();
3715}
3716
3718 // If the expansion register for tail calls is live across the candidate
3719 // outlined call site, we cannot outline that candidate as the expansion
3720 // would clobber the register.
3721 MCRegister TailExpandUseReg =
3722 RISCVII::getTailExpandUseRegNo(STI.getFeatureBits());
3723 if (C.back().isReturn() &&
3724 !C.isAvailableAcrossAndOutOfSeq(TailExpandUseReg, RegInfo)) {
3725 LLVM_DEBUG(dbgs() << "MBB:\n" << *C.getMBB());
3726 LLVM_DEBUG(dbgs() << "Cannot be outlined between: " << C.front() << "and "
3727 << C.back());
3728 LLVM_DEBUG(dbgs() << "Because the tail-call register is live across "
3729 "the proposed outlined function call\n");
3730 return true;
3731 }
3732
3733 // If last instruction is return then we can rely on
3734 // the verification already performed in the getOutliningTypeImpl.
3735 if (C.back().isReturn()) {
3736 assert(!cannotInsertTailCall(*C.getMBB()) &&
3737 "The candidate who uses return instruction must be outlined "
3738 "using tail call");
3739 return false;
3740 }
3741
3742 // Filter out candidates where the X5 register (t0) can't be used to setup
3743 // the function call.
3744 if (!C.isAvailableInsideSeq(RISCV::X5, RegInfo))
3745 return true;
3746
3747 // If X5 is available in the region, use X5 directly (MachineOutlinerDefault).
3748 if (C.isAvailableAcrossAndOutOfSeq(RISCV::X5, RegInfo))
3749 return false;
3750
3751 // Otherwise, try to save X5 into t1-t6 (MachineOutlinerRegSave).
3753 return false;
3754
3755 return true;
3756}
3757
3758std::optional<std::unique_ptr<outliner::OutlinedFunction>>
3760 const MachineModuleInfo &MMI,
3761 std::vector<outliner::Candidate> &RepeatedSequenceLocs,
3762 unsigned MinRepeats) const {
3763
3764 // Analyze each candidate and erase the ones that are not viable.
3765 llvm::erase_if(RepeatedSequenceLocs, [this](auto Candidate) {
3766 return analyzeCandidate(Candidate);
3767 });
3768
3769 // If the sequence doesn't have enough candidates left, then we're done.
3770 if (RepeatedSequenceLocs.size() < MinRepeats)
3771 return std::nullopt;
3772
3773 // Each RepeatedSequenceLoc is identical.
3774 outliner::Candidate &Candidate = RepeatedSequenceLocs[0];
3775 unsigned InstrSizeCExt =
3776 Candidate.getMF()->getSubtarget<RISCVSubtarget>().hasStdExtZca() ? 2 : 4;
3777 unsigned CallOverhead = 0, FrameOverhead = 0;
3778
3779 // Count the number of CFI instructions in the candidate, if present.
3780 unsigned CFICount = 0;
3781 for (auto &I : Candidate) {
3782 if (I.isCFIInstruction())
3783 CFICount++;
3784 }
3785
3786 // Ensure CFI coverage matches: comparing the number of CFIs in the candidate
3787 // with the total number of CFIs in the parent function for each candidate.
3788 // Outlining only a subset of a function’s CFIs would split the unwind state
3789 // across two code regions and lead to incorrect address offsets between the
3790 // outlined body and the remaining code. To preserve correct unwind info, we
3791 // only outline when all CFIs in the function can be outlined together.
3792 for (outliner::Candidate &C : RepeatedSequenceLocs) {
3793 std::vector<MCCFIInstruction> CFIInstructions =
3794 C.getMF()->getFrameInstructions();
3795
3796 if (CFICount > 0 && CFICount != CFIInstructions.size())
3797 return std::nullopt;
3798 }
3799
3801 if (Candidate.back().isReturn()) {
3803 // tail call = auipc + jalr in the worst case without linker relaxation.
3804 // FIXME: This code suggests the JALR can be compressed - how?
3805 CallOverhead = 4 + InstrSizeCExt;
3806 // Using tail call we move ret instruction from caller to callee.
3807 FrameOverhead = 0;
3808 } else {
3809 // call t0, function = 8 bytes.
3810 CallOverhead = 8;
3811 // jr t0 = 4 bytes, 2 bytes if compressed instructions are enabled.
3812 FrameOverhead = InstrSizeCExt;
3813 }
3814
3815 // If we have CFI instructions, we can only outline if the outlined section
3816 // can be a tail call.
3817 if (MOCI != MachineOutlinerTailCall && CFICount > 0)
3818 return std::nullopt;
3819
3821 // Set per-candidate overhead based on X5 availability
3822 for (auto &C : RepeatedSequenceLocs) {
3823
3824 if (C.isAvailableAcrossAndOutOfSeq(RISCV::X5, RegInfo)) {
3825 // X5 is available, just need the call
3826 unsigned CandCallOverhead = 8;
3827 C.setCallInfo(MachineOutlinerDefault, CandCallOverhead);
3828 } else {
3829 // X5 unavailable, need save + call + restore
3830 // Save (2-4) + Call (8) + Restore (2-4)
3831 unsigned CandCallOverhead = InstrSizeCExt + 8 + InstrSizeCExt;
3832 C.setCallInfo(MachineOutlinerRegSave, CandCallOverhead);
3833 }
3834 }
3835 } else {
3836 for (auto &C : RepeatedSequenceLocs)
3837 C.setCallInfo(MOCI, CallOverhead);
3838 }
3839
3840 unsigned SequenceSize = 0;
3841 for (auto &MI : Candidate)
3842 SequenceSize += getInstSizeInBytes(MI);
3843
3844 return std::make_unique<outliner::OutlinedFunction>(
3845 RepeatedSequenceLocs, SequenceSize, FrameOverhead, MOCI);
3846}
3847
3851 unsigned Flags) const {
3852 MachineInstr &MI = *MBBI;
3853 MachineBasicBlock *MBB = MI.getParent();
3854 const TargetRegisterInfo *TRI =
3855 MBB->getParent()->getSubtarget().getRegisterInfo();
3856 const auto &F = MI.getMF()->getFunction();
3857
3858 // We can only outline CFI instructions if we will tail call the outlined
3859 // function, or fix up the CFI offsets. Currently, CFI instructions are
3860 // outlined only if in a tail call.
3861 if (MI.isCFIInstruction())
3863
3864 if (cannotInsertTailCall(*MBB) &&
3865 (MI.isReturn() || isMIModifiesReg(MI, TRI, RISCV::X5)))
3867
3868 // Make sure the operands don't reference something unsafe.
3869 for (const auto &MO : MI.operands()) {
3870
3871 // pcrel-hi and pcrel-lo can't put in separate sections, filter that out
3872 // if any possible.
3873 if (MO.getTargetFlags() == RISCVII::MO_PCREL_LO &&
3874 (MI.getMF()->getTarget().getFunctionSections() || F.hasComdat() ||
3875 F.hasSection() || F.getSectionPrefix()))
3877 }
3878
3879 if (isLPAD(MI))
3881
3883}
3884
3887 const outliner::OutlinedFunction &OF) const {
3888
3889 if (OF.FrameConstructionID == MachineOutlinerTailCall)
3890 return;
3891
3892 MBB.addLiveIn(RISCV::X5);
3893
3894 // Add in a return instruction to the end of the outlined frame.
3895 MBB.insert(MBB.end(), BuildMI(MF, DebugLoc(), get(RISCV::JALR))
3896 .addReg(RISCV::X0, RegState::Define)
3897 .addReg(RISCV::X5)
3898 .addImm(0));
3899}
3900
3904
3905 if (C.CallConstructionID == MachineOutlinerTailCall) {
3906 It = MBB.insert(It, BuildMI(MF, DebugLoc(), get(RISCV::PseudoTAIL))
3907 .addGlobalAddress(M.getNamedValue(MF.getName()),
3908 /*Offset=*/0, RISCVII::MO_CALL));
3909 return It;
3910 }
3911
3912 if (C.CallConstructionID == MachineOutlinerRegSave) {
3913 Register SaveReg = findRegisterToSaveX5To(C, RegInfo);
3914 assert(SaveReg && "Cannot find an available register to save/restore X5.");
3915
3916 // Save: ADDI SaveReg, X5, 0 (equivalent to MV SaveReg, X5)
3917 It = MBB.insert(It, BuildMI(MF, DebugLoc(), get(RISCV::ADDI), SaveReg)
3918 .addReg(RISCV::X5)
3919 .addImm(0));
3920 It++;
3921
3922 // Call: PseudoCALLReg X5
3923 It = MBB.insert(
3924 It, BuildMI(MF, DebugLoc(), get(RISCV::PseudoCALLReg), RISCV::X5)
3925 .addGlobalAddress(M.getNamedValue(MF.getName()), 0,
3927 MachineBasicBlock::iterator CallPt = It;
3928 It++;
3929
3930 // Restore: ADDI X5, SaveReg, 0 (equivalent to MV X5, SaveReg)
3931 It = MBB.insert(It, BuildMI(MF, DebugLoc(), get(RISCV::ADDI), RISCV::X5)
3932 .addReg(SaveReg)
3933 .addImm(0));
3934
3935 return CallPt;
3936 }
3937
3938 // Add in a call instruction to the outlined function at the given location.
3939 It = MBB.insert(It,
3940 BuildMI(MF, DebugLoc(), get(RISCV::PseudoCALLReg), RISCV::X5)
3941 .addGlobalAddress(M.getNamedValue(MF.getName()), 0,
3943 return It;
3944}
3945
3946std::optional<RegImmPair> RISCVInstrInfo::isAddImmediate(const MachineInstr &MI,
3947 Register Reg) const {
3948 // TODO: Handle cases where Reg is a super- or sub-register of the
3949 // destination register.
3950 const MachineOperand &Op0 = MI.getOperand(0);
3951 if (!Op0.isReg() || Reg != Op0.getReg())
3952 return std::nullopt;
3953
3954 // Don't consider ADDIW as a candidate because the caller may not be aware
3955 // of its sign extension behaviour.
3956 if (MI.getOpcode() == RISCV::ADDI && MI.getOperand(1).isReg() &&
3957 MI.getOperand(2).isImm())
3958 return RegImmPair{MI.getOperand(1).getReg(), MI.getOperand(2).getImm()};
3959
3960 return std::nullopt;
3961}
3962
3963// MIR printer helper function to annotate Operands with a comment.
3965 const MachineInstr &MI, const MachineOperand &Op, unsigned OpIdx,
3966 const TargetRegisterInfo *TRI) const {
3967 // Print a generic comment for this operand if there is one.
3968 std::string GenericComment =
3970 if (!GenericComment.empty())
3971 return GenericComment;
3972
3973 const MCInstrDesc &Desc = MI.getDesc();
3974 if (OpIdx >= Desc.getNumOperands())
3975 return std::string();
3976
3977 std::string Comment;
3978 raw_string_ostream OS(Comment);
3979
3980 const MCOperandInfo &OpInfo = Desc.operands()[OpIdx];
3981
3982 // Print the full VType operand of vsetvli/vsetivli instructions, and the SEW
3983 // operand of vector codegen pseudos.
3984 switch (OpInfo.OperandType) {
3987 unsigned Imm = Op.getImm();
3988 RISCVVType::printVType(Imm, OS);
3989 break;
3990 }
3992 unsigned Imm = Op.getImm();
3994 break;
3995 }
3997 unsigned Imm = Op.getImm();
3998 OS << "w" << Imm;
3999 break;
4000 }
4003 unsigned Log2SEW = Op.getImm();
4004 unsigned SEW = Log2SEW ? 1 << Log2SEW : 8;
4005 assert(RISCVVType::isValidSEW(SEW) && "Unexpected SEW");
4006 OS << "e" << SEW;
4007 break;
4008 }
4010 unsigned Policy = Op.getImm();
4012 "Invalid Policy Value");
4013 OS << (Policy & RISCVVType::TAIL_AGNOSTIC ? "ta" : "tu") << ", "
4014 << (Policy & RISCVVType::MASK_AGNOSTIC ? "ma" : "mu");
4015 break;
4016 }
4018 if (Op.isImm() && Op.getImm() == -1)
4019 OS << "vl=VLMAX";
4020 else
4021 OS << "vl";
4022 break;
4024 if (RISCVII::usesVXRM(Desc.TSFlags)) {
4026 auto VXRM = static_cast<RISCVVXRndMode::RoundingMode>(Op.getImm());
4027 OS << "vxrm=" << RISCVVXRndMode::roundingModeToString(VXRM);
4028 } else {
4030 auto FRM = static_cast<RISCVFPRndMode::RoundingMode>(Op.getImm());
4031 OS << "frm=" << RISCVFPRndMode::roundingModeToString(FRM);
4032 }
4033 break;
4034 }
4035
4036 return Comment;
4037}
4038
4039// clang-format off
4040#define CASE_RVV_OPCODE_UNMASK_LMUL(OP, LMUL) \
4041 RISCV::Pseudo##OP##_##LMUL
4042
4043#define CASE_RVV_OPCODE_MASK_LMUL(OP, LMUL) \
4044 RISCV::Pseudo##OP##_##LMUL##_MASK
4045
4046#define CASE_RVV_OPCODE_LMUL(OP, LMUL) \
4047 CASE_RVV_OPCODE_UNMASK_LMUL(OP, LMUL): \
4048 case CASE_RVV_OPCODE_MASK_LMUL(OP, LMUL)
4049
4050#define CASE_RVV_OPCODE_UNMASK_WIDEN(OP) \
4051 CASE_RVV_OPCODE_UNMASK_LMUL(OP, MF8): \
4052 case CASE_RVV_OPCODE_UNMASK_LMUL(OP, MF4): \
4053 case CASE_RVV_OPCODE_UNMASK_LMUL(OP, MF2): \
4054 case CASE_RVV_OPCODE_UNMASK_LMUL(OP, M1): \
4055 case CASE_RVV_OPCODE_UNMASK_LMUL(OP, M2): \
4056 case CASE_RVV_OPCODE_UNMASK_LMUL(OP, M4)
4057
4058#define CASE_RVV_OPCODE_UNMASK(OP) \
4059 CASE_RVV_OPCODE_UNMASK_WIDEN(OP): \
4060 case CASE_RVV_OPCODE_UNMASK_LMUL(OP, M8)
4061
4062#define CASE_RVV_OPCODE_MASK_WIDEN(OP) \
4063 CASE_RVV_OPCODE_MASK_LMUL(OP, MF8): \
4064 case CASE_RVV_OPCODE_MASK_LMUL(OP, MF4): \
4065 case CASE_RVV_OPCODE_MASK_LMUL(OP, MF2): \
4066 case CASE_RVV_OPCODE_MASK_LMUL(OP, M1): \
4067 case CASE_RVV_OPCODE_MASK_LMUL(OP, M2): \
4068 case CASE_RVV_OPCODE_MASK_LMUL(OP, M4)
4069
4070#define CASE_RVV_OPCODE_MASK(OP) \
4071 CASE_RVV_OPCODE_MASK_WIDEN(OP): \
4072 case CASE_RVV_OPCODE_MASK_LMUL(OP, M8)
4073
4074#define CASE_RVV_OPCODE_WIDEN(OP) \
4075 CASE_RVV_OPCODE_UNMASK_WIDEN(OP): \
4076 case CASE_RVV_OPCODE_MASK_WIDEN(OP)
4077
4078#define CASE_RVV_OPCODE(OP) \
4079 CASE_RVV_OPCODE_UNMASK(OP): \
4080 case CASE_RVV_OPCODE_MASK(OP)
4081// clang-format on
4082
4083// clang-format off
4084#define CASE_VMA_OPCODE_COMMON(OP, TYPE, LMUL) \
4085 RISCV::PseudoV##OP##_##TYPE##_##LMUL
4086
4087#define CASE_VMA_OPCODE_LMULS(OP, TYPE) \
4088 CASE_VMA_OPCODE_COMMON(OP, TYPE, MF8): \
4089 case CASE_VMA_OPCODE_COMMON(OP, TYPE, MF4): \
4090 case CASE_VMA_OPCODE_COMMON(OP, TYPE, MF2): \
4091 case CASE_VMA_OPCODE_COMMON(OP, TYPE, M1): \
4092 case CASE_VMA_OPCODE_COMMON(OP, TYPE, M2): \
4093 case CASE_VMA_OPCODE_COMMON(OP, TYPE, M4): \
4094 case CASE_VMA_OPCODE_COMMON(OP, TYPE, M8)
4095
4096// VFMA instructions are SEW specific.
4097#define CASE_VFMA_OPCODE_COMMON(OP, TYPE, LMUL, SEW) \
4098 RISCV::PseudoV##OP##_##TYPE##_##LMUL##_##SEW
4099
4100#define CASE_VFMA_OPCODE_LMULS_M1(OP, TYPE, SEW) \
4101 CASE_VFMA_OPCODE_COMMON(OP, TYPE, M1, SEW): \
4102 case CASE_VFMA_OPCODE_COMMON(OP, TYPE, M2, SEW): \
4103 case CASE_VFMA_OPCODE_COMMON(OP, TYPE, M4, SEW): \
4104 case CASE_VFMA_OPCODE_COMMON(OP, TYPE, M8, SEW)
4105
4106#define CASE_VFMA_OPCODE_LMULS_MF2(OP, TYPE, SEW) \
4107 CASE_VFMA_OPCODE_COMMON(OP, TYPE, MF2, SEW): \
4108 case CASE_VFMA_OPCODE_LMULS_M1(OP, TYPE, SEW)
4109
4110#define CASE_VFMA_OPCODE_LMULS_MF4(OP, TYPE, SEW) \
4111 CASE_VFMA_OPCODE_COMMON(OP, TYPE, MF4, SEW): \
4112 case CASE_VFMA_OPCODE_LMULS_MF2(OP, TYPE, SEW)
4113
4114#define CASE_VFMA_OPCODE_VV(OP) \
4115 CASE_VFMA_OPCODE_LMULS_MF4(OP, VV, E16): \
4116 case CASE_VFMA_OPCODE_LMULS_MF4(OP##_ALT, VV, E16): \
4117 case CASE_VFMA_OPCODE_LMULS_MF2(OP, VV, E32): \
4118 case CASE_VFMA_OPCODE_LMULS_M1(OP, VV, E64)
4119
4120#define CASE_VFMA_SPLATS(OP) \
4121 CASE_VFMA_OPCODE_LMULS_MF4(OP, VFPR16, E16): \
4122 case CASE_VFMA_OPCODE_LMULS_MF4(OP##_ALT, VFPR16, E16): \
4123 case CASE_VFMA_OPCODE_LMULS_MF2(OP, VFPR32, E32): \
4124 case CASE_VFMA_OPCODE_LMULS_M1(OP, VFPR64, E64)
4125// clang-format on
4126
4128 unsigned &SrcOpIdx1,
4129 unsigned &SrcOpIdx2) const {
4130 const MCInstrDesc &Desc = MI.getDesc();
4131 if (!Desc.isCommutable())
4132 return false;
4133
4134 switch (MI.getOpcode()) {
4135 case RISCV::TH_MVEQZ:
4136 case RISCV::TH_MVNEZ:
4137 // We can't commute operands if operand 2 (i.e., rs1 in
4138 // mveqz/mvnez rd,rs1,rs2) is the zero-register (as it is
4139 // not valid as the in/out-operand 1).
4140 if (MI.getOperand(2).getReg() == RISCV::X0)
4141 return false;
4142 // Operands 1 and 2 are commutable, if we switch the opcode.
4143 return fixCommutedOpIndices(SrcOpIdx1, SrcOpIdx2, 1, 2);
4144 case RISCV::QC_SELECTIEQ:
4145 case RISCV::QC_SELECTINE:
4146 case RISCV::QC_SELECTIIEQ:
4147 case RISCV::QC_SELECTIINE:
4148 return fixCommutedOpIndices(SrcOpIdx1, SrcOpIdx2, 1, 2);
4149 case RISCV::QC_MVEQ:
4150 case RISCV::QC_MVNE:
4151 case RISCV::QC_MVLT:
4152 case RISCV::QC_MVGE:
4153 case RISCV::QC_MVLTU:
4154 case RISCV::QC_MVGEU:
4155 case RISCV::QC_MVEQI:
4156 case RISCV::QC_MVNEI:
4157 case RISCV::QC_MVLTI:
4158 case RISCV::QC_MVGEI:
4159 case RISCV::QC_MVLTUI:
4160 case RISCV::QC_MVGEUI:
4161 return fixCommutedOpIndices(SrcOpIdx1, SrcOpIdx2, 1, 4);
4162 case RISCV::TH_MULA:
4163 case RISCV::TH_MULAW:
4164 case RISCV::TH_MULAH:
4165 case RISCV::TH_MULS:
4166 case RISCV::TH_MULSW:
4167 case RISCV::TH_MULSH:
4168 // Operands 2 and 3 are commutable.
4169 return fixCommutedOpIndices(SrcOpIdx1, SrcOpIdx2, 2, 3);
4170 case RISCV::PseudoCCMOVGPRNoX0:
4171 case RISCV::PseudoCCMOVGPR:
4172 // Operands 1 and 2 are commutable.
4173 return fixCommutedOpIndices(SrcOpIdx1, SrcOpIdx2, 1, 2);
4174 case CASE_RVV_OPCODE(VADD_VV):
4175 case CASE_RVV_OPCODE(VAND_VV):
4176 case CASE_RVV_OPCODE(VOR_VV):
4177 case CASE_RVV_OPCODE(VXOR_VV):
4178 case CASE_RVV_OPCODE_MASK(VMSEQ_VV):
4179 case CASE_RVV_OPCODE_MASK(VMSNE_VV):
4180 case CASE_RVV_OPCODE(VMIN_VV):
4181 case CASE_RVV_OPCODE(VMINU_VV):
4182 case CASE_RVV_OPCODE(VMAX_VV):
4183 case CASE_RVV_OPCODE(VMAXU_VV):
4184 case CASE_RVV_OPCODE(VMUL_VV):
4185 case CASE_RVV_OPCODE(VMULH_VV):
4186 case CASE_RVV_OPCODE(VMULHU_VV):
4187 case CASE_RVV_OPCODE_WIDEN(VWADD_VV):
4188 case CASE_RVV_OPCODE_WIDEN(VWADDU_VV):
4189 case CASE_RVV_OPCODE_WIDEN(VWMUL_VV):
4190 case CASE_RVV_OPCODE_WIDEN(VWMULU_VV):
4191 case CASE_RVV_OPCODE_WIDEN(VWMACC_VV):
4192 case CASE_RVV_OPCODE_WIDEN(VWMACCU_VV):
4193 case CASE_RVV_OPCODE(VABD_VV):
4194 case CASE_RVV_OPCODE(VABDU_VV):
4195 case CASE_RVV_OPCODE_WIDEN(VWABDA_VV):
4196 case CASE_RVV_OPCODE_WIDEN(VWABDAU_VV):
4197 case CASE_RVV_OPCODE_UNMASK(VADC_VVM):
4198 case CASE_RVV_OPCODE(VSADD_VV):
4199 case CASE_RVV_OPCODE(VSADDU_VV):
4200 case CASE_RVV_OPCODE(VAADD_VV):
4201 case CASE_RVV_OPCODE(VAADDU_VV):
4202 case CASE_RVV_OPCODE(VSMUL_VV):
4203 case CASE_RVV_OPCODE_LMUL(VDOT4A_VV, MF2):
4204 case CASE_RVV_OPCODE_LMUL(VDOT4A_VV, M1):
4205 case CASE_RVV_OPCODE_LMUL(VDOT4A_VV, M2):
4206 case CASE_RVV_OPCODE_LMUL(VDOT4A_VV, M4):
4207 case CASE_RVV_OPCODE_LMUL(VDOT4A_VV, M8):
4208 case CASE_RVV_OPCODE_LMUL(VDOT4AU_VV, MF2):
4209 case CASE_RVV_OPCODE_LMUL(VDOT4AU_VV, M1):
4210 case CASE_RVV_OPCODE_LMUL(VDOT4AU_VV, M2):
4211 case CASE_RVV_OPCODE_LMUL(VDOT4AU_VV, M4):
4212 case CASE_RVV_OPCODE_LMUL(VDOT4AU_VV, M8):
4213 // Operands 2 and 3 are commutable.
4214 return fixCommutedOpIndices(SrcOpIdx1, SrcOpIdx2, 2, 3);
4215 case CASE_VFMA_SPLATS(FMADD):
4216 case CASE_VFMA_SPLATS(FMSUB):
4217 case CASE_VFMA_SPLATS(FMACC):
4218 case CASE_VFMA_SPLATS(FMSAC):
4221 case CASE_VFMA_SPLATS(FNMACC):
4222 case CASE_VFMA_SPLATS(FNMSAC):
4223 case CASE_VFMA_OPCODE_VV(FMACC):
4224 case CASE_VFMA_OPCODE_VV(FMSAC):
4225 case CASE_VFMA_OPCODE_VV(FNMACC):
4226 case CASE_VFMA_OPCODE_VV(FNMSAC):
4227 case CASE_VMA_OPCODE_LMULS(MADD, VX):
4228 case CASE_VMA_OPCODE_LMULS(NMSUB, VX):
4229 case CASE_VMA_OPCODE_LMULS(MACC, VX):
4230 case CASE_VMA_OPCODE_LMULS(NMSAC, VX):
4231 case CASE_VMA_OPCODE_LMULS(MACC, VV):
4232 case CASE_VMA_OPCODE_LMULS(NMSAC, VV): {
4233 // If the tail policy is undisturbed we can't commute.
4234 assert(RISCVII::hasVecPolicyOp(MI.getDesc().TSFlags));
4235 if ((MI.getOperand(RISCVII::getVecPolicyOpNum(MI.getDesc())).getImm() &
4236 1) == 0)
4237 return false;
4238
4239 // For these instructions we can only swap operand 1 and operand 3 by
4240 // changing the opcode.
4241 unsigned CommutableOpIdx1 = 1;
4242 unsigned CommutableOpIdx2 = 3;
4243 if (!fixCommutedOpIndices(SrcOpIdx1, SrcOpIdx2, CommutableOpIdx1,
4244 CommutableOpIdx2))
4245 return false;
4246 return true;
4247 }
4248 case CASE_VFMA_OPCODE_VV(FMADD):
4252 case CASE_VMA_OPCODE_LMULS(MADD, VV):
4253 case CASE_VMA_OPCODE_LMULS(NMSUB, VV): {
4254 // If the tail policy is undisturbed we can't commute.
4255 assert(RISCVII::hasVecPolicyOp(MI.getDesc().TSFlags));
4256 if ((MI.getOperand(RISCVII::getVecPolicyOpNum(MI.getDesc())).getImm() &
4257 1) == 0)
4258 return false;
4259
4260 // For these instructions we have more freedom. We can commute with the
4261 // other multiplicand or with the addend/subtrahend/minuend.
4262
4263 // Any fixed operand must be from source 1, 2 or 3.
4264 if (SrcOpIdx1 != CommuteAnyOperandIndex && SrcOpIdx1 > 3)
4265 return false;
4266 if (SrcOpIdx2 != CommuteAnyOperandIndex && SrcOpIdx2 > 3)
4267 return false;
4268
4269 // It both ops are fixed one must be the tied source.
4270 if (SrcOpIdx1 != CommuteAnyOperandIndex &&
4271 SrcOpIdx2 != CommuteAnyOperandIndex && SrcOpIdx1 != 1 && SrcOpIdx2 != 1)
4272 return false;
4273
4274 // Look for two different register operands assumed to be commutable
4275 // regardless of the FMA opcode. The FMA opcode is adjusted later if
4276 // needed.
4277 if (SrcOpIdx1 == CommuteAnyOperandIndex ||
4278 SrcOpIdx2 == CommuteAnyOperandIndex) {
4279 // At least one of operands to be commuted is not specified and
4280 // this method is free to choose appropriate commutable operands.
4281 unsigned CommutableOpIdx1 = SrcOpIdx1;
4282 if (SrcOpIdx1 == SrcOpIdx2) {
4283 // Both of operands are not fixed. Set one of commutable
4284 // operands to the tied source.
4285 CommutableOpIdx1 = 1;
4286 } else if (SrcOpIdx1 == CommuteAnyOperandIndex) {
4287 // Only one of the operands is not fixed.
4288 CommutableOpIdx1 = SrcOpIdx2;
4289 }
4290
4291 // CommutableOpIdx1 is well defined now. Let's choose another commutable
4292 // operand and assign its index to CommutableOpIdx2.
4293 unsigned CommutableOpIdx2;
4294 if (CommutableOpIdx1 != 1) {
4295 // If we haven't already used the tied source, we must use it now.
4296 CommutableOpIdx2 = 1;
4297 } else {
4298 Register Op1Reg = MI.getOperand(CommutableOpIdx1).getReg();
4299
4300 // The commuted operands should have different registers.
4301 // Otherwise, the commute transformation does not change anything and
4302 // is useless. We use this as a hint to make our decision.
4303 if (Op1Reg != MI.getOperand(2).getReg())
4304 CommutableOpIdx2 = 2;
4305 else
4306 CommutableOpIdx2 = 3;
4307 }
4308
4309 // Assign the found pair of commutable indices to SrcOpIdx1 and
4310 // SrcOpIdx2 to return those values.
4311 if (!fixCommutedOpIndices(SrcOpIdx1, SrcOpIdx2, CommutableOpIdx1,
4312 CommutableOpIdx2))
4313 return false;
4314 }
4315
4316 return true;
4317 }
4318 }
4319
4320 return TargetInstrInfo::findCommutedOpIndices(MI, SrcOpIdx1, SrcOpIdx2);
4321}
4322
4323// clang-format off
4324#define CASE_VMA_CHANGE_OPCODE_COMMON(OLDOP, NEWOP, TYPE, LMUL) \
4325 case RISCV::PseudoV##OLDOP##_##TYPE##_##LMUL: \
4326 Opc = RISCV::PseudoV##NEWOP##_##TYPE##_##LMUL; \
4327 break;
4328
4329#define CASE_VMA_CHANGE_OPCODE_LMULS(OLDOP, NEWOP, TYPE) \
4330 CASE_VMA_CHANGE_OPCODE_COMMON(OLDOP, NEWOP, TYPE, MF8) \
4331 CASE_VMA_CHANGE_OPCODE_COMMON(OLDOP, NEWOP, TYPE, MF4) \
4332 CASE_VMA_CHANGE_OPCODE_COMMON(OLDOP, NEWOP, TYPE, MF2) \
4333 CASE_VMA_CHANGE_OPCODE_COMMON(OLDOP, NEWOP, TYPE, M1) \
4334 CASE_VMA_CHANGE_OPCODE_COMMON(OLDOP, NEWOP, TYPE, M2) \
4335 CASE_VMA_CHANGE_OPCODE_COMMON(OLDOP, NEWOP, TYPE, M4) \
4336 CASE_VMA_CHANGE_OPCODE_COMMON(OLDOP, NEWOP, TYPE, M8)
4337
4338// VFMA depends on SEW.
4339#define CASE_VFMA_CHANGE_OPCODE_COMMON(OLDOP, NEWOP, TYPE, LMUL, SEW) \
4340 case RISCV::PseudoV##OLDOP##_##TYPE##_##LMUL##_##SEW: \
4341 Opc = RISCV::PseudoV##NEWOP##_##TYPE##_##LMUL##_##SEW; \
4342 break;
4343
4344#define CASE_VFMA_CHANGE_OPCODE_LMULS_M1(OLDOP, NEWOP, TYPE, SEW) \
4345 CASE_VFMA_CHANGE_OPCODE_COMMON(OLDOP, NEWOP, TYPE, M1, SEW) \
4346 CASE_VFMA_CHANGE_OPCODE_COMMON(OLDOP, NEWOP, TYPE, M2, SEW) \
4347 CASE_VFMA_CHANGE_OPCODE_COMMON(OLDOP, NEWOP, TYPE, M4, SEW) \
4348 CASE_VFMA_CHANGE_OPCODE_COMMON(OLDOP, NEWOP, TYPE, M8, SEW)
4349
4350#define CASE_VFMA_CHANGE_OPCODE_LMULS_MF2(OLDOP, NEWOP, TYPE, SEW) \
4351 CASE_VFMA_CHANGE_OPCODE_COMMON(OLDOP, NEWOP, TYPE, MF2, SEW) \
4352 CASE_VFMA_CHANGE_OPCODE_LMULS_M1(OLDOP, NEWOP, TYPE, SEW)
4353
4354#define CASE_VFMA_CHANGE_OPCODE_LMULS_MF4(OLDOP, NEWOP, TYPE, SEW) \
4355 CASE_VFMA_CHANGE_OPCODE_COMMON(OLDOP, NEWOP, TYPE, MF4, SEW) \
4356 CASE_VFMA_CHANGE_OPCODE_LMULS_MF2(OLDOP, NEWOP, TYPE, SEW)
4357
4358#define CASE_VFMA_CHANGE_OPCODE_VV(OLDOP, NEWOP) \
4359 CASE_VFMA_CHANGE_OPCODE_LMULS_MF4(OLDOP, NEWOP, VV, E16) \
4360 CASE_VFMA_CHANGE_OPCODE_LMULS_MF4(OLDOP##_ALT, NEWOP##_ALT, VV, E16) \
4361 CASE_VFMA_CHANGE_OPCODE_LMULS_MF2(OLDOP, NEWOP, VV, E32) \
4362 CASE_VFMA_CHANGE_OPCODE_LMULS_M1(OLDOP, NEWOP, VV, E64)
4363
4364#define CASE_VFMA_CHANGE_OPCODE_SPLATS(OLDOP, NEWOP) \
4365 CASE_VFMA_CHANGE_OPCODE_LMULS_MF4(OLDOP, NEWOP, VFPR16, E16) \
4366 CASE_VFMA_CHANGE_OPCODE_LMULS_MF4(OLDOP##_ALT, NEWOP##_ALT, VFPR16, E16) \
4367 CASE_VFMA_CHANGE_OPCODE_LMULS_MF2(OLDOP, NEWOP, VFPR32, E32) \
4368 CASE_VFMA_CHANGE_OPCODE_LMULS_M1(OLDOP, NEWOP, VFPR64, E64)
4369// clang-format on
4370
4372 bool NewMI,
4373 unsigned OpIdx1,
4374 unsigned OpIdx2) const {
4375 auto cloneIfNew = [NewMI](MachineInstr &MI) -> MachineInstr & {
4376 if (NewMI)
4377 return *MI.getParent()->getParent()->CloneMachineInstr(&MI);
4378 return MI;
4379 };
4380
4381 switch (MI.getOpcode()) {
4382 case RISCV::TH_MVEQZ:
4383 case RISCV::TH_MVNEZ: {
4384 auto &WorkingMI = cloneIfNew(MI);
4385 WorkingMI.setDesc(get(MI.getOpcode() == RISCV::TH_MVEQZ ? RISCV::TH_MVNEZ
4386 : RISCV::TH_MVEQZ));
4387 return TargetInstrInfo::commuteInstructionImpl(WorkingMI, false, OpIdx1,
4388 OpIdx2);
4389 }
4390 case RISCV::QC_SELECTIEQ:
4391 case RISCV::QC_SELECTINE:
4392 case RISCV::QC_SELECTIIEQ:
4393 case RISCV::QC_SELECTIINE:
4394 return TargetInstrInfo::commuteInstructionImpl(MI, NewMI, OpIdx1, OpIdx2);
4395 case RISCV::QC_MVEQ:
4396 case RISCV::QC_MVNE:
4397 case RISCV::QC_MVLT:
4398 case RISCV::QC_MVGE:
4399 case RISCV::QC_MVLTU:
4400 case RISCV::QC_MVGEU:
4401 case RISCV::QC_MVEQI:
4402 case RISCV::QC_MVNEI:
4403 case RISCV::QC_MVLTI:
4404 case RISCV::QC_MVGEI:
4405 case RISCV::QC_MVLTUI:
4406 case RISCV::QC_MVGEUI: {
4407 auto &WorkingMI = cloneIfNew(MI);
4408 WorkingMI.setDesc(get(getInverseXqcicmOpcode(MI.getOpcode())));
4409 return TargetInstrInfo::commuteInstructionImpl(WorkingMI, false, OpIdx1,
4410 OpIdx2);
4411 }
4412 case RISCV::PseudoCCMOVGPRNoX0:
4413 case RISCV::PseudoCCMOVGPR: {
4414 // CCMOV can be commuted by inverting the condition.
4415 unsigned BCC = MI.getOperand(MI.getNumExplicitOperands() - 3).getImm();
4417 auto &WorkingMI = cloneIfNew(MI);
4418 WorkingMI.getOperand(MI.getNumExplicitOperands() - 3).setImm(BCC);
4419 return TargetInstrInfo::commuteInstructionImpl(WorkingMI, /*NewMI*/ false,
4420 OpIdx1, OpIdx2);
4421 }
4422 case CASE_VFMA_SPLATS(FMACC):
4423 case CASE_VFMA_SPLATS(FMADD):
4424 case CASE_VFMA_SPLATS(FMSAC):
4425 case CASE_VFMA_SPLATS(FMSUB):
4426 case CASE_VFMA_SPLATS(FNMACC):
4428 case CASE_VFMA_SPLATS(FNMSAC):
4430 case CASE_VFMA_OPCODE_VV(FMACC):
4431 case CASE_VFMA_OPCODE_VV(FMSAC):
4432 case CASE_VFMA_OPCODE_VV(FNMACC):
4433 case CASE_VFMA_OPCODE_VV(FNMSAC):
4434 case CASE_VMA_OPCODE_LMULS(MADD, VX):
4435 case CASE_VMA_OPCODE_LMULS(NMSUB, VX):
4436 case CASE_VMA_OPCODE_LMULS(MACC, VX):
4437 case CASE_VMA_OPCODE_LMULS(NMSAC, VX):
4438 case CASE_VMA_OPCODE_LMULS(MACC, VV):
4439 case CASE_VMA_OPCODE_LMULS(NMSAC, VV): {
4440 // It only make sense to toggle these between clobbering the
4441 // addend/subtrahend/minuend one of the multiplicands.
4442 assert((OpIdx1 == 1 || OpIdx2 == 1) && "Unexpected opcode index");
4443 assert((OpIdx1 == 3 || OpIdx2 == 3) && "Unexpected opcode index");
4444 unsigned Opc;
4445 switch (MI.getOpcode()) {
4446 default:
4447 llvm_unreachable("Unexpected opcode");
4448 CASE_VFMA_CHANGE_OPCODE_SPLATS(FMACC, FMADD)
4449 CASE_VFMA_CHANGE_OPCODE_SPLATS(FMADD, FMACC)
4456 CASE_VFMA_CHANGE_OPCODE_VV(FMACC, FMADD)
4460 CASE_VMA_CHANGE_OPCODE_LMULS(MACC, MADD, VX)
4461 CASE_VMA_CHANGE_OPCODE_LMULS(MADD, MACC, VX)
4462 CASE_VMA_CHANGE_OPCODE_LMULS(NMSAC, NMSUB, VX)
4463 CASE_VMA_CHANGE_OPCODE_LMULS(NMSUB, NMSAC, VX)
4464 CASE_VMA_CHANGE_OPCODE_LMULS(MACC, MADD, VV)
4465 CASE_VMA_CHANGE_OPCODE_LMULS(NMSAC, NMSUB, VV)
4466 }
4467
4468 auto &WorkingMI = cloneIfNew(MI);
4469 WorkingMI.setDesc(get(Opc));
4470 return TargetInstrInfo::commuteInstructionImpl(WorkingMI, /*NewMI=*/false,
4471 OpIdx1, OpIdx2);
4472 }
4473 case CASE_VFMA_OPCODE_VV(FMADD):
4477 case CASE_VMA_OPCODE_LMULS(MADD, VV):
4478 case CASE_VMA_OPCODE_LMULS(NMSUB, VV): {
4479 assert((OpIdx1 == 1 || OpIdx2 == 1) && "Unexpected opcode index");
4480 // If one of the operands, is the addend we need to change opcode.
4481 // Otherwise we're just swapping 2 of the multiplicands.
4482 if (OpIdx1 == 3 || OpIdx2 == 3) {
4483 unsigned Opc;
4484 switch (MI.getOpcode()) {
4485 default:
4486 llvm_unreachable("Unexpected opcode");
4487 CASE_VFMA_CHANGE_OPCODE_VV(FMADD, FMACC)
4491 CASE_VMA_CHANGE_OPCODE_LMULS(MADD, MACC, VV)
4492 CASE_VMA_CHANGE_OPCODE_LMULS(NMSUB, NMSAC, VV)
4493 }
4494
4495 auto &WorkingMI = cloneIfNew(MI);
4496 WorkingMI.setDesc(get(Opc));
4497 return TargetInstrInfo::commuteInstructionImpl(WorkingMI, /*NewMI=*/false,
4498 OpIdx1, OpIdx2);
4499 }
4500 // Let the default code handle it.
4501 break;
4502 }
4503 }
4504
4505 return TargetInstrInfo::commuteInstructionImpl(MI, NewMI, OpIdx1, OpIdx2);
4506}
4507
4508#undef CASE_VMA_CHANGE_OPCODE_COMMON
4509#undef CASE_VMA_CHANGE_OPCODE_LMULS
4510#undef CASE_VFMA_CHANGE_OPCODE_COMMON
4511#undef CASE_VFMA_CHANGE_OPCODE_LMULS_M1
4512#undef CASE_VFMA_CHANGE_OPCODE_LMULS_MF2
4513#undef CASE_VFMA_CHANGE_OPCODE_LMULS_MF4
4514#undef CASE_VFMA_CHANGE_OPCODE_VV
4515#undef CASE_VFMA_CHANGE_OPCODE_SPLATS
4516
4517#undef CASE_RVV_OPCODE_UNMASK_LMUL
4518#undef CASE_RVV_OPCODE_MASK_LMUL
4519#undef CASE_RVV_OPCODE_LMUL
4520#undef CASE_RVV_OPCODE_UNMASK_WIDEN
4521#undef CASE_RVV_OPCODE_UNMASK
4522#undef CASE_RVV_OPCODE_MASK_WIDEN
4523#undef CASE_RVV_OPCODE_MASK
4524#undef CASE_RVV_OPCODE_WIDEN
4525#undef CASE_RVV_OPCODE
4526
4527#undef CASE_VMA_OPCODE_COMMON
4528#undef CASE_VMA_OPCODE_LMULS
4529#undef CASE_VFMA_OPCODE_COMMON
4530#undef CASE_VFMA_OPCODE_LMULS_M1
4531#undef CASE_VFMA_OPCODE_LMULS_MF2
4532#undef CASE_VFMA_OPCODE_LMULS_MF4
4533#undef CASE_VFMA_OPCODE_VV
4534#undef CASE_VFMA_SPLATS
4535
4537 switch (MI.getOpcode()) {
4538 default:
4539 break;
4540 case RISCV::ADD:
4541 case RISCV::OR:
4542 case RISCV::XOR:
4543 // Normalize (so we hit the next if clause).
4544 // add/[x]or rd, zero, rs => add/[x]or rd, rs, zero
4545 if (MI.getOperand(1).getReg() == RISCV::X0)
4546 commuteInstruction(MI);
4547 // add/[x]or rd, rs, zero => addi rd, rs, 0
4548 if (MI.getOperand(2).getReg() == RISCV::X0) {
4549 MI.getOperand(2).ChangeToImmediate(0);
4550 MI.setDesc(get(RISCV::ADDI));
4551 return true;
4552 }
4553 // xor rd, rs, rs => addi rd, zero, 0
4554 if (MI.getOpcode() == RISCV::XOR &&
4555 MI.getOperand(1).getReg() == MI.getOperand(2).getReg()) {
4556 MI.getOperand(1).setReg(RISCV::X0);
4557 MI.getOperand(2).ChangeToImmediate(0);
4558 MI.setDesc(get(RISCV::ADDI));
4559 return true;
4560 }
4561 break;
4562 case RISCV::ORI:
4563 case RISCV::XORI:
4564 // [x]ori rd, zero, N => addi rd, zero, N
4565 if (MI.getOperand(1).getReg() == RISCV::X0) {
4566 MI.setDesc(get(RISCV::ADDI));
4567 return true;
4568 }
4569 break;
4570 case RISCV::SUB:
4571 // sub rd, rs, zero => addi rd, rs, 0
4572 if (MI.getOperand(2).getReg() == RISCV::X0) {
4573 MI.getOperand(2).ChangeToImmediate(0);
4574 MI.setDesc(get(RISCV::ADDI));
4575 return true;
4576 }
4577 break;
4578 case RISCV::SUBW:
4579 // subw rd, rs, zero => addiw rd, rs, 0
4580 if (MI.getOperand(2).getReg() == RISCV::X0) {
4581 MI.getOperand(2).ChangeToImmediate(0);
4582 MI.setDesc(get(RISCV::ADDIW));
4583 return true;
4584 }
4585 break;
4586 case RISCV::ADDW:
4587 // Normalize (so we hit the next if clause).
4588 // addw rd, zero, rs => addw rd, rs, zero
4589 if (MI.getOperand(1).getReg() == RISCV::X0)
4590 commuteInstruction(MI);
4591 // addw rd, rs, zero => addiw rd, rs, 0
4592 if (MI.getOperand(2).getReg() == RISCV::X0) {
4593 MI.getOperand(2).ChangeToImmediate(0);
4594 MI.setDesc(get(RISCV::ADDIW));
4595 return true;
4596 }
4597 break;
4598 case RISCV::SH1ADD:
4599 case RISCV::SH1ADD_UW:
4600 case RISCV::SH2ADD:
4601 case RISCV::SH2ADD_UW:
4602 case RISCV::SH3ADD:
4603 case RISCV::SH3ADD_UW:
4604 // shNadd[.uw] rd, zero, rs => addi rd, rs, 0
4605 if (MI.getOperand(1).getReg() == RISCV::X0) {
4606 MI.removeOperand(1);
4607 MI.addOperand(MachineOperand::CreateImm(0));
4608 MI.setDesc(get(RISCV::ADDI));
4609 return true;
4610 }
4611 // shNadd[.uw] rd, rs, zero => slli[.uw] rd, rs, N
4612 if (MI.getOperand(2).getReg() == RISCV::X0) {
4613 MI.removeOperand(2);
4614 unsigned Opc = MI.getOpcode();
4615 if (Opc == RISCV::SH1ADD_UW || Opc == RISCV::SH2ADD_UW ||
4616 Opc == RISCV::SH3ADD_UW) {
4618 MI.setDesc(get(RISCV::SLLI_UW));
4619 return true;
4620 }
4622 MI.setDesc(get(RISCV::SLLI));
4623 return true;
4624 }
4625 break;
4626 case RISCV::AND:
4627 case RISCV::MUL:
4628 case RISCV::MULH:
4629 case RISCV::MULHSU:
4630 case RISCV::MULHU:
4631 case RISCV::MULW:
4632 // and rd, zero, rs => addi rd, zero, 0
4633 // mul* rd, zero, rs => addi rd, zero, 0
4634 // and rd, rs, zero => addi rd, zero, 0
4635 // mul* rd, rs, zero => addi rd, zero, 0
4636 if (MI.getOperand(1).getReg() == RISCV::X0 ||
4637 MI.getOperand(2).getReg() == RISCV::X0) {
4638 MI.getOperand(1).setReg(RISCV::X0);
4639 MI.getOperand(2).ChangeToImmediate(0);
4640 MI.setDesc(get(RISCV::ADDI));
4641 return true;
4642 }
4643 break;
4644 case RISCV::ANDI:
4645 // andi rd, zero, C => addi rd, zero, 0
4646 if (MI.getOperand(1).getReg() == RISCV::X0) {
4647 MI.getOperand(2).setImm(0);
4648 MI.setDesc(get(RISCV::ADDI));
4649 return true;
4650 }
4651 break;
4652 case RISCV::SLL:
4653 case RISCV::SRL:
4654 case RISCV::SRA:
4655 // shift rd, zero, rs => addi rd, zero, 0
4656 if (MI.getOperand(1).getReg() == RISCV::X0) {
4657 MI.getOperand(2).ChangeToImmediate(0);
4658 MI.setDesc(get(RISCV::ADDI));
4659 return true;
4660 }
4661 // shift rd, rs, zero => addi rd, rs, 0
4662 if (MI.getOperand(2).getReg() == RISCV::X0) {
4663 MI.getOperand(2).ChangeToImmediate(0);
4664 MI.setDesc(get(RISCV::ADDI));
4665 return true;
4666 }
4667 break;
4668 case RISCV::SLLW:
4669 case RISCV::SRLW:
4670 case RISCV::SRAW:
4671 // shiftw rd, zero, rs => addi rd, zero, 0
4672 if (MI.getOperand(1).getReg() == RISCV::X0) {
4673 MI.getOperand(2).ChangeToImmediate(0);
4674 MI.setDesc(get(RISCV::ADDI));
4675 return true;
4676 }
4677 break;
4678 case RISCV::SLLI:
4679 case RISCV::SRLI:
4680 case RISCV::SRAI:
4681 case RISCV::SLLIW:
4682 case RISCV::SRLIW:
4683 case RISCV::SRAIW:
4684 case RISCV::SLLI_UW:
4685 // shiftimm rd, zero, N => addi rd, zero, 0
4686 if (MI.getOperand(1).getReg() == RISCV::X0) {
4687 MI.getOperand(2).setImm(0);
4688 MI.setDesc(get(RISCV::ADDI));
4689 return true;
4690 }
4691 break;
4692 case RISCV::SLTU:
4693 case RISCV::ADD_UW:
4694 // sltu rd, zero, zero => addi rd, zero, 0
4695 // add.uw rd, zero, zero => addi rd, zero, 0
4696 if (MI.getOperand(1).getReg() == RISCV::X0 &&
4697 MI.getOperand(2).getReg() == RISCV::X0) {
4698 MI.getOperand(2).ChangeToImmediate(0);
4699 MI.setDesc(get(RISCV::ADDI));
4700 return true;
4701 }
4702 // add.uw rd, zero, rs => addi rd, rs, 0
4703 if (MI.getOpcode() == RISCV::ADD_UW &&
4704 MI.getOperand(1).getReg() == RISCV::X0) {
4705 MI.removeOperand(1);
4706 MI.addOperand(MachineOperand::CreateImm(0));
4707 MI.setDesc(get(RISCV::ADDI));
4708 }
4709 break;
4710 case RISCV::SLTIU:
4711 // sltiu rd, zero, NZC => addi rd, zero, 1
4712 // sltiu rd, zero, 0 => addi rd, zero, 0
4713 if (MI.getOperand(1).getReg() == RISCV::X0) {
4714 MI.getOperand(2).setImm(MI.getOperand(2).getImm() != 0);
4715 MI.setDesc(get(RISCV::ADDI));
4716 return true;
4717 }
4718 break;
4719 case RISCV::SEXT_H:
4720 case RISCV::SEXT_B:
4721 case RISCV::ZEXT_H_RV32:
4722 case RISCV::ZEXT_H_RV64:
4723 // sext.[hb] rd, zero => addi rd, zero, 0
4724 // zext.h rd, zero => addi rd, zero, 0
4725 if (MI.getOperand(1).getReg() == RISCV::X0) {
4726 MI.addOperand(MachineOperand::CreateImm(0));
4727 MI.setDesc(get(RISCV::ADDI));
4728 return true;
4729 }
4730 break;
4731 case RISCV::MIN:
4732 case RISCV::MINU:
4733 case RISCV::MAX:
4734 case RISCV::MAXU:
4735 // min|max rd, rs, rs => addi rd, rs, 0
4736 if (MI.getOperand(1).getReg() == MI.getOperand(2).getReg()) {
4737 MI.getOperand(2).ChangeToImmediate(0);
4738 MI.setDesc(get(RISCV::ADDI));
4739 return true;
4740 }
4741 break;
4742 case RISCV::BEQ:
4743 case RISCV::BNE:
4744 // b{eq,ne} zero, rs, imm => b{eq,ne} rs, zero, imm
4745 if (MI.getOperand(0).getReg() == RISCV::X0) {
4746 MachineOperand MO0 = MI.getOperand(0);
4747 MI.removeOperand(0);
4748 MI.insert(MI.operands_begin() + 1, {MO0});
4749 }
4750 break;
4751 case RISCV::BLTU:
4752 // bltu zero, rs, imm => bne rs, zero, imm
4753 if (MI.getOperand(0).getReg() == RISCV::X0) {
4754 MachineOperand MO0 = MI.getOperand(0);
4755 MI.removeOperand(0);
4756 MI.insert(MI.operands_begin() + 1, {MO0});
4757 MI.setDesc(get(RISCV::BNE));
4758 }
4759 break;
4760 case RISCV::BGEU:
4761 // bgeu zero, rs, imm => beq rs, zero, imm
4762 if (MI.getOperand(0).getReg() == RISCV::X0) {
4763 MachineOperand MO0 = MI.getOperand(0);
4764 MI.removeOperand(0);
4765 MI.insert(MI.operands_begin() + 1, {MO0});
4766 MI.setDesc(get(RISCV::BEQ));
4767 }
4768 break;
4769 }
4770 return false;
4771}
4772
4773// clang-format off
4774#define CASE_WIDEOP_OPCODE_COMMON(OP, LMUL) \
4775 RISCV::PseudoV##OP##_##LMUL##_TIED
4776
4777#define CASE_WIDEOP_OPCODE_LMULS(OP) \
4778 CASE_WIDEOP_OPCODE_COMMON(OP, MF8): \
4779 case CASE_WIDEOP_OPCODE_COMMON(OP, MF4): \
4780 case CASE_WIDEOP_OPCODE_COMMON(OP, MF2): \
4781 case CASE_WIDEOP_OPCODE_COMMON(OP, M1): \
4782 case CASE_WIDEOP_OPCODE_COMMON(OP, M2): \
4783 case CASE_WIDEOP_OPCODE_COMMON(OP, M4)
4784
4785#define CASE_WIDEOP_CHANGE_OPCODE_COMMON(OP, LMUL) \
4786 case RISCV::PseudoV##OP##_##LMUL##_TIED: \
4787 NewOpc = RISCV::PseudoV##OP##_##LMUL; \
4788 break;
4789
4790#define CASE_WIDEOP_CHANGE_OPCODE_LMULS(OP) \
4791 CASE_WIDEOP_CHANGE_OPCODE_COMMON(OP, MF8) \
4792 CASE_WIDEOP_CHANGE_OPCODE_COMMON(OP, MF4) \
4793 CASE_WIDEOP_CHANGE_OPCODE_COMMON(OP, MF2) \
4794 CASE_WIDEOP_CHANGE_OPCODE_COMMON(OP, M1) \
4795 CASE_WIDEOP_CHANGE_OPCODE_COMMON(OP, M2) \
4796 CASE_WIDEOP_CHANGE_OPCODE_COMMON(OP, M4)
4797
4798// FP Widening Ops may by SEW aware. Create SEW aware cases for these cases.
4799#define CASE_FP_WIDEOP_OPCODE_COMMON(OP, LMUL, SEW) \
4800 RISCV::PseudoV##OP##_##LMUL##_##SEW##_TIED
4801
4802#define CASE_FP_WIDEOP_OPCODE_LMULS(OP) \
4803 CASE_FP_WIDEOP_OPCODE_COMMON(OP, MF4, E16): \
4804 case CASE_FP_WIDEOP_OPCODE_COMMON(OP, MF2, E16): \
4805 case CASE_FP_WIDEOP_OPCODE_COMMON(OP, MF2, E32): \
4806 case CASE_FP_WIDEOP_OPCODE_COMMON(OP, M1, E16): \
4807 case CASE_FP_WIDEOP_OPCODE_COMMON(OP, M1, E32): \
4808 case CASE_FP_WIDEOP_OPCODE_COMMON(OP, M2, E16): \
4809 case CASE_FP_WIDEOP_OPCODE_COMMON(OP, M2, E32): \
4810 case CASE_FP_WIDEOP_OPCODE_COMMON(OP, M4, E16): \
4811 case CASE_FP_WIDEOP_OPCODE_COMMON(OP, M4, E32) \
4812
4813#define CASE_FP_WIDEOP_CHANGE_OPCODE_COMMON(OP, LMUL, SEW) \
4814 case RISCV::PseudoV##OP##_##LMUL##_##SEW##_TIED: \
4815 NewOpc = RISCV::PseudoV##OP##_##LMUL##_##SEW; \
4816 break;
4817
4818#define CASE_FP_WIDEOP_CHANGE_OPCODE_LMULS(OP) \
4819 CASE_FP_WIDEOP_CHANGE_OPCODE_COMMON(OP, MF4, E16) \
4820 CASE_FP_WIDEOP_CHANGE_OPCODE_COMMON(OP, MF2, E16) \
4821 CASE_FP_WIDEOP_CHANGE_OPCODE_COMMON(OP, MF2, E32) \
4822 CASE_FP_WIDEOP_CHANGE_OPCODE_COMMON(OP, M1, E16) \
4823 CASE_FP_WIDEOP_CHANGE_OPCODE_COMMON(OP, M1, E32) \
4824 CASE_FP_WIDEOP_CHANGE_OPCODE_COMMON(OP, M2, E16) \
4825 CASE_FP_WIDEOP_CHANGE_OPCODE_COMMON(OP, M2, E32) \
4826 CASE_FP_WIDEOP_CHANGE_OPCODE_COMMON(OP, M4, E16) \
4827 CASE_FP_WIDEOP_CHANGE_OPCODE_COMMON(OP, M4, E32) \
4828
4829#define CASE_FP_WIDEOP_OPCODE_LMULS_ALT(OP) \
4830 CASE_FP_WIDEOP_OPCODE_COMMON(OP, MF4, E16): \
4831 case CASE_FP_WIDEOP_OPCODE_COMMON(OP, MF2, E16): \
4832 case CASE_FP_WIDEOP_OPCODE_COMMON(OP, M1, E16): \
4833 case CASE_FP_WIDEOP_OPCODE_COMMON(OP, M2, E16): \
4834 case CASE_FP_WIDEOP_OPCODE_COMMON(OP, M4, E16)
4835
4836#define CASE_FP_WIDEOP_CHANGE_OPCODE_LMULS_ALT(OP) \
4837 CASE_FP_WIDEOP_CHANGE_OPCODE_COMMON(OP, MF4, E16) \
4838 CASE_FP_WIDEOP_CHANGE_OPCODE_COMMON(OP, MF2, E16) \
4839 CASE_FP_WIDEOP_CHANGE_OPCODE_COMMON(OP, M1, E16) \
4840 CASE_FP_WIDEOP_CHANGE_OPCODE_COMMON(OP, M2, E16) \
4841 CASE_FP_WIDEOP_CHANGE_OPCODE_COMMON(OP, M4, E16)
4842// clang-format on
4843
4845 LiveVariables *LV,
4846 LiveIntervals *LIS) const {
4848 switch (MI.getOpcode()) {
4849 default:
4850 return nullptr;
4851 case CASE_FP_WIDEOP_OPCODE_LMULS_ALT(FWADD_ALT_WV):
4852 case CASE_FP_WIDEOP_OPCODE_LMULS_ALT(FWSUB_ALT_WV):
4853 case CASE_FP_WIDEOP_OPCODE_LMULS(FWADD_WV):
4854 case CASE_FP_WIDEOP_OPCODE_LMULS(FWSUB_WV): {
4855 assert(RISCVII::hasVecPolicyOp(MI.getDesc().TSFlags) &&
4856 MI.getNumExplicitOperands() == 7 &&
4857 "Expect 7 explicit operands rd, rs2, rs1, rm, vl, sew, policy");
4858 // If the tail policy is undisturbed we can't convert.
4859 if ((MI.getOperand(RISCVII::getVecPolicyOpNum(MI.getDesc())).getImm() &
4860 1) == 0)
4861 return nullptr;
4862 // clang-format off
4863 unsigned NewOpc;
4864 switch (MI.getOpcode()) {
4865 default:
4866 llvm_unreachable("Unexpected opcode");
4871 }
4872 // clang-format on
4873
4874 MachineBasicBlock &MBB = *MI.getParent();
4875 MIB = BuildMI(MBB, MI, MI.getDebugLoc(), get(NewOpc))
4876 .add(MI.getOperand(0))
4877 .addReg(MI.getOperand(0).getReg(), RegState::Undef)
4878 .add(MI.getOperand(1))
4879 .add(MI.getOperand(2))
4880 .add(MI.getOperand(3))
4881 .add(MI.getOperand(4))
4882 .add(MI.getOperand(5))
4883 .add(MI.getOperand(6));
4884 break;
4885 }
4886 case CASE_WIDEOP_OPCODE_LMULS(WADD_WV):
4887 case CASE_WIDEOP_OPCODE_LMULS(WADDU_WV):
4888 case CASE_WIDEOP_OPCODE_LMULS(WSUB_WV):
4889 case CASE_WIDEOP_OPCODE_LMULS(WSUBU_WV): {
4890 // If the tail policy is undisturbed we can't convert.
4891 assert(RISCVII::hasVecPolicyOp(MI.getDesc().TSFlags) &&
4892 MI.getNumExplicitOperands() == 6);
4893 if ((MI.getOperand(RISCVII::getVecPolicyOpNum(MI.getDesc())).getImm() &
4894 1) == 0)
4895 return nullptr;
4896
4897 // clang-format off
4898 unsigned NewOpc;
4899 switch (MI.getOpcode()) {
4900 default:
4901 llvm_unreachable("Unexpected opcode");
4906 }
4907 // clang-format on
4908
4909 MachineBasicBlock &MBB = *MI.getParent();
4910 MIB = BuildMI(MBB, MI, MI.getDebugLoc(), get(NewOpc))
4911 .add(MI.getOperand(0))
4912 .addReg(MI.getOperand(0).getReg(), RegState::Undef)
4913 .add(MI.getOperand(1))
4914 .add(MI.getOperand(2))
4915 .add(MI.getOperand(3))
4916 .add(MI.getOperand(4))
4917 .add(MI.getOperand(5));
4918 break;
4919 }
4920 }
4921 MIB.copyImplicitOps(MI);
4922
4923 if (LV) {
4924 unsigned NumOps = MI.getNumOperands();
4925 for (unsigned I = 1; I < NumOps; ++I) {
4926 MachineOperand &Op = MI.getOperand(I);
4927 if (Op.isReg() && Op.isKill())
4928 LV->replaceKillInstruction(Op.getReg(), MI, *MIB);
4929 }
4930 }
4931
4932 if (LIS) {
4933 SlotIndex Idx = LIS->ReplaceMachineInstrInMaps(MI, *MIB);
4934
4935 if (MI.getOperand(0).isEarlyClobber()) {
4936 // Use operand 1 was tied to early-clobber def operand 0, so its live
4937 // interval could have ended at an early-clobber slot. Now they are not
4938 // tied we need to update it to the normal register slot.
4939 LiveInterval &LI = LIS->getInterval(MI.getOperand(1).getReg());
4941 if (S->end == Idx.getRegSlot(true))
4942 S->end = Idx.getRegSlot();
4943 }
4944 }
4945
4946 return MIB;
4947}
4948
4949#undef CASE_WIDEOP_OPCODE_COMMON
4950#undef CASE_WIDEOP_OPCODE_LMULS
4951#undef CASE_WIDEOP_CHANGE_OPCODE_COMMON
4952#undef CASE_WIDEOP_CHANGE_OPCODE_LMULS
4953#undef CASE_FP_WIDEOP_OPCODE_COMMON
4954#undef CASE_FP_WIDEOP_OPCODE_LMULS
4955#undef CASE_FP_WIDEOP_CHANGE_OPCODE_COMMON
4956#undef CASE_FP_WIDEOP_CHANGE_OPCODE_LMULS
4957
4960 Register DestReg, uint32_t Amount,
4961 MachineInstr::MIFlag Flag) const {
4962 MachineRegisterInfo &MRI = MF.getRegInfo();
4963 if (llvm::has_single_bit(Amount)) {
4964 uint32_t ShiftAmount = Log2_32(Amount);
4965 if (ShiftAmount == 0)
4966 return;
4967 BuildMI(MBB, II, DL, get(RISCV::SLLI), DestReg)
4968 .addReg(DestReg, RegState::Kill)
4969 .addImm(ShiftAmount)
4970 .setMIFlag(Flag);
4971 } else if (int ShXAmount, ShiftAmount;
4972 STI.hasShlAdd(3) &&
4973 (ShXAmount = isShifted359(Amount, ShiftAmount)) != 0) {
4974 // We can use Zba SHXADD+SLLI instructions for multiply in some cases.
4975 unsigned Opc;
4976 switch (ShXAmount) {
4977 case 1:
4978 Opc = RISCV::SH1ADD;
4979 break;
4980 case 2:
4981 Opc = RISCV::SH2ADD;
4982 break;
4983 case 3:
4984 Opc = RISCV::SH3ADD;
4985 break;
4986 default:
4987 llvm_unreachable("unexpected result of isShifted359");
4988 }
4989 if (ShiftAmount)
4990 BuildMI(MBB, II, DL, get(RISCV::SLLI), DestReg)
4991 .addReg(DestReg, RegState::Kill)
4992 .addImm(ShiftAmount)
4993 .setMIFlag(Flag);
4994 BuildMI(MBB, II, DL, get(Opc), DestReg)
4995 .addReg(DestReg, RegState::Kill)
4996 .addReg(DestReg)
4997 .setMIFlag(Flag);
4998 } else if (llvm::has_single_bit(Amount - 1)) {
4999 Register ScaledRegister = MRI.createVirtualRegister(&RISCV::GPRRegClass);
5000 uint32_t ShiftAmount = Log2_32(Amount - 1);
5001 BuildMI(MBB, II, DL, get(RISCV::SLLI), ScaledRegister)
5002 .addReg(DestReg)
5003 .addImm(ShiftAmount)
5004 .setMIFlag(Flag);
5005 BuildMI(MBB, II, DL, get(RISCV::ADD), DestReg)
5006 .addReg(ScaledRegister, RegState::Kill)
5007 .addReg(DestReg, RegState::Kill)
5008 .setMIFlag(Flag);
5009 } else if (llvm::has_single_bit(Amount + 1)) {
5010 Register ScaledRegister = MRI.createVirtualRegister(&RISCV::GPRRegClass);
5011 uint32_t ShiftAmount = Log2_32(Amount + 1);
5012 BuildMI(MBB, II, DL, get(RISCV::SLLI), ScaledRegister)
5013 .addReg(DestReg)
5014 .addImm(ShiftAmount)
5015 .setMIFlag(Flag);
5016 BuildMI(MBB, II, DL, get(RISCV::SUB), DestReg)
5017 .addReg(ScaledRegister, RegState::Kill)
5018 .addReg(DestReg, RegState::Kill)
5019 .setMIFlag(Flag);
5020 } else if (STI.hasStdExtZmmul()) {
5021 Register N = MRI.createVirtualRegister(&RISCV::GPRRegClass);
5022 movImm(MBB, II, DL, N, Amount, Flag);
5023 BuildMI(MBB, II, DL, get(RISCV::MUL), DestReg)
5024 .addReg(DestReg, RegState::Kill)
5026 .setMIFlag(Flag);
5027 } else {
5028 Register Acc;
5029 uint32_t PrevShiftAmount = 0;
5030 for (uint32_t ShiftAmount = 0; Amount >> ShiftAmount; ShiftAmount++) {
5031 if (Amount & (1U << ShiftAmount)) {
5032 if (ShiftAmount)
5033 BuildMI(MBB, II, DL, get(RISCV::SLLI), DestReg)
5034 .addReg(DestReg, RegState::Kill)
5035 .addImm(ShiftAmount - PrevShiftAmount)
5036 .setMIFlag(Flag);
5037 if (Amount >> (ShiftAmount + 1)) {
5038 // If we don't have an accmulator yet, create it and copy DestReg.
5039 if (!Acc) {
5040 Acc = MRI.createVirtualRegister(&RISCV::GPRRegClass);
5041 BuildMI(MBB, II, DL, get(TargetOpcode::COPY), Acc)
5042 .addReg(DestReg)
5043 .setMIFlag(Flag);
5044 } else {
5045 BuildMI(MBB, II, DL, get(RISCV::ADD), Acc)
5046 .addReg(Acc, RegState::Kill)
5047 .addReg(DestReg)
5048 .setMIFlag(Flag);
5049 }
5050 }
5051 PrevShiftAmount = ShiftAmount;
5052 }
5053 }
5054 assert(Acc && "Expected valid accumulator");
5055 BuildMI(MBB, II, DL, get(RISCV::ADD), DestReg)
5056 .addReg(DestReg, RegState::Kill)
5057 .addReg(Acc, RegState::Kill)
5058 .setMIFlag(Flag);
5059 }
5060}
5061
5064 static const std::pair<MachineMemOperand::Flags, const char *> TargetFlags[] =
5065 {{MONontemporalBit0, "riscv-nontemporal-domain-bit-0"},
5066 {MONontemporalBit1, "riscv-nontemporal-domain-bit-1"}};
5067 return ArrayRef(TargetFlags);
5068}
5069
5071 return OptLevel >= CodeGenOptLevel::Aggressive
5072 ? STI.getTailDupAggressiveThreshold()
5073 : 2;
5074}
5075
5077 // RVV lacks any support for immediate addressing for stack addresses, so be
5078 // conservative.
5079 unsigned Opcode = MI.getOpcode();
5080 if (!RISCVVPseudosTable::getPseudoInfo(Opcode) &&
5082 return false;
5083 return true;
5084}
5085
5086/// Return true if \p MI is a copy that will be lowered to one or more vmvNr.vs.
5088 const MachineInstr &MI) {
5089 return MI.isCopy() && MI.getOperand(0).getReg().isPhysical() &&
5091 TRI->getMinimalPhysRegClass(MI.getOperand(0).getReg()));
5092}
5093
5094std::optional<std::pair<unsigned, unsigned>>
5096 switch (Opcode) {
5097 default:
5098 return std::nullopt;
5099 case RISCV::PseudoVSPILL2_M1:
5100 case RISCV::PseudoVRELOAD2_M1:
5101 return std::make_pair(2u, 1u);
5102 case RISCV::PseudoVSPILL2_M2:
5103 case RISCV::PseudoVRELOAD2_M2:
5104 return std::make_pair(2u, 2u);
5105 case RISCV::PseudoVSPILL2_M4:
5106 case RISCV::PseudoVRELOAD2_M4:
5107 return std::make_pair(2u, 4u);
5108 case RISCV::PseudoVSPILL3_M1:
5109 case RISCV::PseudoVRELOAD3_M1:
5110 return std::make_pair(3u, 1u);
5111 case RISCV::PseudoVSPILL3_M2:
5112 case RISCV::PseudoVRELOAD3_M2:
5113 return std::make_pair(3u, 2u);
5114 case RISCV::PseudoVSPILL4_M1:
5115 case RISCV::PseudoVRELOAD4_M1:
5116 return std::make_pair(4u, 1u);
5117 case RISCV::PseudoVSPILL4_M2:
5118 case RISCV::PseudoVRELOAD4_M2:
5119 return std::make_pair(4u, 2u);
5120 case RISCV::PseudoVSPILL5_M1:
5121 case RISCV::PseudoVRELOAD5_M1:
5122 return std::make_pair(5u, 1u);
5123 case RISCV::PseudoVSPILL6_M1:
5124 case RISCV::PseudoVRELOAD6_M1:
5125 return std::make_pair(6u, 1u);
5126 case RISCV::PseudoVSPILL7_M1:
5127 case RISCV::PseudoVRELOAD7_M1:
5128 return std::make_pair(7u, 1u);
5129 case RISCV::PseudoVSPILL8_M1:
5130 case RISCV::PseudoVRELOAD8_M1:
5131 return std::make_pair(8u, 1u);
5132 }
5133}
5134
5135bool RISCV::hasEqualFRM(const MachineInstr &MI1, const MachineInstr &MI2) {
5136 int16_t MI1FrmOpIdx =
5137 RISCV::getNamedOperandIdx(MI1.getOpcode(), RISCV::OpName::frm);
5138 int16_t MI2FrmOpIdx =
5139 RISCV::getNamedOperandIdx(MI2.getOpcode(), RISCV::OpName::frm);
5140 if (MI1FrmOpIdx < 0 || MI2FrmOpIdx < 0)
5141 return false;
5142 MachineOperand FrmOp1 = MI1.getOperand(MI1FrmOpIdx);
5143 MachineOperand FrmOp2 = MI2.getOperand(MI2FrmOpIdx);
5144 return FrmOp1.getImm() == FrmOp2.getImm();
5145}
5146
5147std::optional<unsigned>
5148RISCV::getVectorLowDemandedScalarBits(unsigned Opcode, unsigned Log2SEW) {
5149 switch (Opcode) {
5150 default:
5151 return std::nullopt;
5152
5153 // 11.6. Vector Single-Width Shift Instructions
5154 case RISCV::VSLL_VX:
5155 case RISCV::VSRL_VX:
5156 case RISCV::VSRA_VX:
5157 // 12.4. Vector Single-Width Scaling Shift Instructions
5158 case RISCV::VSSRL_VX:
5159 case RISCV::VSSRA_VX:
5160 // Zvbb
5161 case RISCV::VROL_VX:
5162 case RISCV::VROR_VX:
5163 // Only the low lg2(SEW) bits of the shift-amount value are used.
5164 return Log2SEW;
5165
5166 // 11.7 Vector Narrowing Integer Right Shift Instructions
5167 case RISCV::VNSRL_WX:
5168 case RISCV::VNSRA_WX:
5169 // 12.5. Vector Narrowing Fixed-Point Clip Instructions
5170 case RISCV::VNCLIPU_WX:
5171 case RISCV::VNCLIP_WX:
5172 // Zvbb
5173 case RISCV::VWSLL_VX:
5174 // Only the low lg2(2*SEW) bits of the shift-amount value are used.
5175 return Log2SEW + 1;
5176
5177 // 11.1. Vector Single-Width Integer Add and Subtract
5178 case RISCV::VADD_VX:
5179 case RISCV::VSUB_VX:
5180 case RISCV::VRSUB_VX:
5181 // 11.2. Vector Widening Integer Add/Subtract
5182 case RISCV::VWADDU_VX:
5183 case RISCV::VWSUBU_VX:
5184 case RISCV::VWADD_VX:
5185 case RISCV::VWSUB_VX:
5186 case RISCV::VWADDU_WX:
5187 case RISCV::VWSUBU_WX:
5188 case RISCV::VWADD_WX:
5189 case RISCV::VWSUB_WX:
5190 // 11.4. Vector Integer Add-with-Carry / Subtract-with-Borrow Instructions
5191 case RISCV::VADC_VXM:
5192 case RISCV::VADC_VIM:
5193 case RISCV::VMADC_VXM:
5194 case RISCV::VMADC_VIM:
5195 case RISCV::VMADC_VX:
5196 case RISCV::VSBC_VXM:
5197 case RISCV::VMSBC_VXM:
5198 case RISCV::VMSBC_VX:
5199 // 11.5 Vector Bitwise Logical Instructions
5200 case RISCV::VAND_VX:
5201 case RISCV::VOR_VX:
5202 case RISCV::VXOR_VX:
5203 // 11.8. Vector Integer Compare Instructions
5204 case RISCV::VMSEQ_VX:
5205 case RISCV::VMSNE_VX:
5206 case RISCV::VMSLTU_VX:
5207 case RISCV::VMSLT_VX:
5208 case RISCV::VMSLEU_VX:
5209 case RISCV::VMSLE_VX:
5210 case RISCV::VMSGTU_VX:
5211 case RISCV::VMSGT_VX:
5212 // 11.9. Vector Integer Min/Max Instructions
5213 case RISCV::VMINU_VX:
5214 case RISCV::VMIN_VX:
5215 case RISCV::VMAXU_VX:
5216 case RISCV::VMAX_VX:
5217 // 11.10. Vector Single-Width Integer Multiply Instructions
5218 case RISCV::VMUL_VX:
5219 case RISCV::VMULH_VX:
5220 case RISCV::VMULHU_VX:
5221 case RISCV::VMULHSU_VX:
5222 // 11.11. Vector Integer Divide Instructions
5223 case RISCV::VDIVU_VX:
5224 case RISCV::VDIV_VX:
5225 case RISCV::VREMU_VX:
5226 case RISCV::VREM_VX:
5227 // 11.12. Vector Widening Integer Multiply Instructions
5228 case RISCV::VWMUL_VX:
5229 case RISCV::VWMULU_VX:
5230 case RISCV::VWMULSU_VX:
5231 // 11.13. Vector Single-Width Integer Multiply-Add Instructions
5232 case RISCV::VMACC_VX:
5233 case RISCV::VNMSAC_VX:
5234 case RISCV::VMADD_VX:
5235 case RISCV::VNMSUB_VX:
5236 // 11.14. Vector Widening Integer Multiply-Add Instructions
5237 case RISCV::VWMACCU_VX:
5238 case RISCV::VWMACC_VX:
5239 case RISCV::VWMACCSU_VX:
5240 case RISCV::VWMACCUS_VX:
5241 // 11.15. Vector Integer Merge Instructions
5242 case RISCV::VMERGE_VXM:
5243 // 11.16. Vector Integer Move Instructions
5244 case RISCV::VMV_V_X:
5245 // 12.1. Vector Single-Width Saturating Add and Subtract
5246 case RISCV::VSADDU_VX:
5247 case RISCV::VSADD_VX:
5248 case RISCV::VSSUBU_VX:
5249 case RISCV::VSSUB_VX:
5250 // 12.2. Vector Single-Width Averaging Add and Subtract
5251 case RISCV::VAADDU_VX:
5252 case RISCV::VAADD_VX:
5253 case RISCV::VASUBU_VX:
5254 case RISCV::VASUB_VX:
5255 // 12.3. Vector Single-Width Fractional Multiply with Rounding and Saturation
5256 case RISCV::VSMUL_VX:
5257 // 16.1. Integer Scalar Move Instructions
5258 case RISCV::VMV_S_X:
5259 // Zvbb
5260 case RISCV::VANDN_VX:
5261 return 1U << Log2SEW;
5262 }
5263}
5264
5265unsigned RISCV::getRVVMCOpcode(unsigned RVVPseudoOpcode) {
5267 RISCVVPseudosTable::getPseudoInfo(RVVPseudoOpcode);
5268 if (!RVV)
5269 return 0;
5270 return RVV->BaseInstr;
5271}
5272
5273unsigned RISCV::getDestLog2EEW(const MCInstrDesc &Desc, unsigned Log2SEW) {
5274 unsigned DestEEW =
5276 // EEW = 1
5277 if (DestEEW == 0)
5278 return 0;
5279 // EEW = SEW * n
5280 unsigned Scaled = Log2SEW + (DestEEW - 1);
5281 assert(Scaled >= 3 && Scaled <= 6);
5282 return Scaled;
5283}
5284
5285static std::optional<int64_t> getEffectiveImm(const MachineOperand &MO) {
5286 assert(MO.isImm() || MO.getReg().isVirtual());
5287 if (MO.isImm())
5288 return MO.getImm();
5289 const MachineInstr *Def =
5290 MO.getParent()->getMF()->getRegInfo().getVRegDef(MO.getReg());
5291 int64_t Imm;
5292 if (isLoadImm(Def, Imm))
5293 return Imm;
5294 return std::nullopt;
5295}
5296
5297/// Given two VL operands, do we know that LHS <= RHS? Must be used in SSA form.
5299 assert((LHS.isImm() || LHS.getParent()->getMF()->getRegInfo().isSSA()) &&
5300 (RHS.isImm() || RHS.getParent()->getMF()->getRegInfo().isSSA()));
5301 if (LHS.isReg() && RHS.isReg() && LHS.getReg().isVirtual() &&
5302 LHS.getReg() == RHS.getReg())
5303 return true;
5304 if (RHS.isImm() && RHS.getImm() == RISCV::VLMaxSentinel)
5305 return true;
5306 if (LHS.isImm() && LHS.getImm() == 0)
5307 return true;
5308 if (LHS.isImm() && LHS.getImm() == RISCV::VLMaxSentinel)
5309 return false;
5310 std::optional<int64_t> LHSImm = getEffectiveImm(LHS),
5311 RHSImm = getEffectiveImm(RHS);
5312 if (!LHSImm || !RHSImm)
5313 return false;
5314 return LHSImm <= RHSImm;
5315}
5316
5317namespace {
5318class RISCVPipelinerLoopInfo : public TargetInstrInfo::PipelinerLoopInfo {
5319 const MachineInstr *LHS;
5320 const MachineInstr *RHS;
5322
5323public:
5324 RISCVPipelinerLoopInfo(const MachineInstr *LHS, const MachineInstr *RHS,
5326 : LHS(LHS), RHS(RHS), Cond(Cond.begin(), Cond.end()) {}
5327
5328 bool shouldIgnoreForPipelining(const MachineInstr *MI) const override {
5329 // Make the instructions for loop control be placed in stage 0.
5330 // The predecessors of LHS/RHS are considered by the caller.
5331 if (LHS && MI == LHS)
5332 return true;
5333 if (RHS && MI == RHS)
5334 return true;
5335 return false;
5336 }
5337
5338 std::optional<bool> createTripCountGreaterCondition(
5339 int TC, MachineBasicBlock &MBB,
5340 SmallVectorImpl<MachineOperand> &CondParam) override {
5341 // A branch instruction will be inserted as "if (Cond) goto epilogue".
5342 // Cond is normalized for such use.
5343 // The predecessors of the branch are assumed to have already been inserted.
5344 CondParam = Cond;
5345 return {};
5346 }
5347
5348 void setPreheader(MachineBasicBlock *NewPreheader) override {}
5349
5350 void adjustTripCount(int TripCountAdjust) override {}
5351};
5352} // namespace
5353
5354std::unique_ptr<TargetInstrInfo::PipelinerLoopInfo>
5356 MachineBasicBlock *TBB = nullptr, *FBB = nullptr;
5358 if (analyzeBranch(*LoopBB, TBB, FBB, Cond, /*AllowModify=*/false))
5359 return nullptr;
5360
5361 // Infinite loops are not supported
5362 if (TBB == LoopBB && FBB == LoopBB)
5363 return nullptr;
5364
5365 // Must be conditional branch
5366 if (FBB == nullptr)
5367 return nullptr;
5368
5369 assert((TBB == LoopBB || FBB == LoopBB) &&
5370 "The Loop must be a single-basic-block loop");
5371
5372 // Normalization for createTripCountGreaterCondition()
5373 if (TBB == LoopBB)
5375
5376 const MachineRegisterInfo &MRI = LoopBB->getParent()->getRegInfo();
5377 auto FindRegDef = [&MRI](MachineOperand &Op) -> const MachineInstr * {
5378 if (!Op.isReg())
5379 return nullptr;
5380 Register Reg = Op.getReg();
5381 if (!Reg.isVirtual())
5382 return nullptr;
5383 return MRI.getVRegDef(Reg);
5384 };
5385
5386 const MachineInstr *LHS = FindRegDef(Cond[1]);
5387 const MachineInstr *RHS = FindRegDef(Cond[2]);
5388 if (LHS && LHS->isPHI())
5389 return nullptr;
5390 if (RHS && RHS->isPHI())
5391 return nullptr;
5392
5393 return std::make_unique<RISCVPipelinerLoopInfo>(LHS, RHS, Cond);
5394}
5395
5396// FIXME: We should remove this if we have a default generic scheduling model.
5398 unsigned RVVMCOpcode = RISCV::getRVVMCOpcode(Opc);
5399 Opc = RVVMCOpcode ? RVVMCOpcode : Opc;
5400 switch (Opc) {
5401 default:
5402 return false;
5403 // Integer div/rem.
5404 case RISCV::DIV:
5405 case RISCV::DIVW:
5406 case RISCV::DIVU:
5407 case RISCV::DIVUW:
5408 case RISCV::REM:
5409 case RISCV::REMW:
5410 case RISCV::REMU:
5411 case RISCV::REMUW:
5412 // Floating-point div/sqrt.
5413 case RISCV::FDIV_H:
5414 case RISCV::FDIV_S:
5415 case RISCV::FDIV_D:
5416 case RISCV::FDIV_H_INX:
5417 case RISCV::FDIV_S_INX:
5418 case RISCV::FDIV_D_INX:
5419 case RISCV::FDIV_D_IN32X:
5420 case RISCV::FSQRT_H:
5421 case RISCV::FSQRT_S:
5422 case RISCV::FSQRT_D:
5423 case RISCV::FSQRT_H_INX:
5424 case RISCV::FSQRT_S_INX:
5425 case RISCV::FSQRT_D_INX:
5426 case RISCV::FSQRT_D_IN32X:
5427 // Vector integer div/rem
5428 case RISCV::VDIV_VV:
5429 case RISCV::VDIV_VX:
5430 case RISCV::VDIVU_VV:
5431 case RISCV::VDIVU_VX:
5432 case RISCV::VREM_VV:
5433 case RISCV::VREM_VX:
5434 case RISCV::VREMU_VV:
5435 case RISCV::VREMU_VX:
5436 // Vector floating-point div/sqrt.
5437 case RISCV::VFDIV_VV:
5438 case RISCV::VFDIV_VF:
5439 case RISCV::VFRDIV_VF:
5440 case RISCV::VFSQRT_V:
5441 case RISCV::VFRSQRT7_V:
5442 return true;
5443 }
5444}
5445
5446bool RISCVInstrInfo::isVRegCopy(const MachineInstr *MI, unsigned LMul) const {
5447 if (MI->getOpcode() != TargetOpcode::COPY)
5448 return false;
5449 const MachineRegisterInfo &MRI = MI->getMF()->getRegInfo();
5451
5452 Register DstReg = MI->getOperand(0).getReg();
5453 const TargetRegisterClass *RC = DstReg.isVirtual()
5454 ? MRI.getRegClass(DstReg)
5455 : TRI->getMinimalPhysRegClass(DstReg);
5456
5458 return false;
5459
5460 if (!LMul)
5461 return true;
5462
5463 // TODO: Perhaps we could distinguish segment register classes (e.g. VRN3M2)
5464 // in the future.
5465 auto [RCLMul, RCFractional] =
5467 return (!RCFractional && LMul == RCLMul) || (RCFractional && LMul == 1);
5468}
5469
5471 if (MI.memoperands_empty())
5472 return false;
5473
5474 MachineMemOperand *MMO = *(MI.memoperands_begin());
5475 if (!MMO->isNonTemporal())
5476 return false;
5477
5478 return true;
5479}
5480
5482 const MachineBasicBlock::iterator &To) {
5483 assert(To == From.getParent()->end() || From.getParent() == To->getParent());
5484 SmallVector<Register> PhysUses, PhysDefs;
5485 for (const MachineOperand &MO : From.all_uses())
5486 if (MO.getReg().isPhysical())
5487 PhysUses.push_back(MO.getReg());
5488 for (const MachineOperand &MO : From.all_defs())
5489 if (MO.getReg().isPhysical())
5490 PhysDefs.push_back(MO.getReg());
5491 bool SawStore = false;
5492 for (auto II = std::next(From.getIterator()); II != To; II++) {
5493 for (Register PhysReg : PhysUses)
5494 if (II->definesRegister(PhysReg, nullptr))
5495 return false;
5496 for (Register PhysReg : PhysDefs)
5497 if (II->definesRegister(PhysReg, nullptr) ||
5498 II->readsRegister(PhysReg, nullptr))
5499 return false;
5500 if (II->mayStore()) {
5501 SawStore = true;
5502 break;
5503 }
5504 }
5505 return From.isSafeToMove(SawStore);
5506}
MachineInstrBuilder MachineInstrBuilder & DefMI
static bool forwardCopyWillClobberTuple(unsigned DestReg, unsigned SrcReg, unsigned NumRegs)
static void parseCondBranch(MachineInstr *LastInst, MachineBasicBlock *&Target, SmallVectorImpl< MachineOperand > &Cond)
@ MachineOutlinerTailCall
Emit a save, restore, call, and return.
@ MachineOutlinerRegSave
Emit a call and tail-call.
@ MachineOutlinerDefault
assert(UImm &&(UImm !=~static_cast< T >(0)) &&"Invalid immediate!")
SmallVector< int16_t, MAX_SRC_OPERANDS_NUM > OperandIndices
@ Scaled
MachineBasicBlock & MBB
MachineBasicBlock MachineBasicBlock::iterator DebugLoc DL
MachineBasicBlock MachineBasicBlock::iterator MBBI
basic Basic Alias true
#define X(NUM, ENUM, NAME)
Definition ELF.h:853
#define clEnumValN(ENUMVAL, FLAGNAME, DESC)
const HexagonInstrInfo * TII
#define _
IRTranslator LLVM IR MI
Module.h This file contains the declarations for the Module class.
const size_t AbstractManglingParser< Derived, Alloc >::NumOps
const AbstractManglingParser< Derived, Alloc >::OperatorInfo AbstractManglingParser< Derived, Alloc >::Ops[]
#define F(x, y, z)
Definition MD5.cpp:54
#define I(x, y, z)
Definition MD5.cpp:57
Register Reg
Register const TargetRegisterInfo * TRI
Promote Memory to Register
Definition Mem2Reg.cpp:110
This file provides utility analysis objects describing memory locations.
MachineInstr unsigned OpIdx
uint64_t IntrinsicInst * II
static bool cannotInsertTailCall(const MachineBasicBlock &MBB)
#define CASE_VFMA_CHANGE_OPCODE_SPLATS(OLDOP, NEWOP)
#define CASE_FP_WIDEOP_CHANGE_OPCODE_LMULS_ALT(OP)
#define CASE_FP_WIDEOP_OPCODE_LMULS(OP)
#define CASE_OPERAND_SIMM(NUM)
static std::optional< unsigned > getLMULForRVVWholeLoadStore(unsigned Opcode)
#define CASE_VFMA_CHANGE_OPCODE_VV(OLDOP, NEWOP)
static unsigned getFPFusedMultiplyOpcode(unsigned RootOpc, unsigned Pattern)
std::optional< unsigned > getFoldedOpcode(MachineFunction &MF, MachineInstr &MI, ArrayRef< unsigned > Ops, const RISCVSubtarget &ST)
#define RVV_OPC_LMUL_CASE(OPC, INV)
#define CASE_FP_WIDEOP_CHANGE_OPCODE_LMULS(OP)
static void combineFPFusedMultiply(MachineInstr &Root, MachineInstr &Prev, unsigned Pattern, SmallVectorImpl< MachineInstr * > &InsInstrs, SmallVectorImpl< MachineInstr * > &DelInstrs)
static unsigned getAddendOperandIdx(unsigned Pattern)
#define CASE_RVV_OPCODE_UNMASK(OP)
#define CASE_WIDEOP_CHANGE_OPCODE_LMULS(OP)
static cl::opt< bool > PreferWholeRegisterMove("riscv-prefer-whole-register-move", cl::init(false), cl::Hidden, cl::desc("Prefer whole register move for vector registers."))
#define CASE_VFMA_SPLATS(OP)
unsigned getPredicatedOpcode(unsigned Opcode)
#define CASE_FP_WIDEOP_OPCODE_LMULS_ALT(OP)
#define CASE_WIDEOP_OPCODE_LMULS(OP)
static bool isMIReadsReg(const MachineInstr &MI, const TargetRegisterInfo *TRI, MCRegister RegNo)
#define OPCODE_LMUL_MASK_CASE(OPC)
#define CASE_OPERAND_UIMM_LSB_ZEROS(BITS, SUFFIX)
static bool isFSUB(unsigned Opc)
#define CASE_VMA_CHANGE_OPCODE_LMULS(OLDOP, NEWOP, TYPE)
#define CASE_RVV_OPCODE(OP)
static std::optional< int64_t > getEffectiveImm(const MachineOperand &MO)
#define CASE_VFMA_OPCODE_VV(OP)
static cl::opt< bool > OutlinerEnableRegSave("riscv-outliner-regsave", cl::init(true), cl::Hidden, cl::desc("Enable RegSave strategy in machine outliner (save X5 to a " "temporary register when X5 is live across outlined calls)."))
MachineOutlinerConstructionID
#define CASE_RVV_OPCODE_WIDEN(OP)
static unsigned getLoadPredicatedOpcode(unsigned Opcode)
static unsigned getSHXADDUWShiftAmount(unsigned Opc)
#define CASE_VMA_OPCODE_LMULS(OP, TYPE)
static bool isConvertibleToVMV_V_V(const RISCVSubtarget &STI, const MachineBasicBlock &MBB, MachineBasicBlock::const_iterator MBBI, MachineBasicBlock::const_iterator &DefMBBI, RISCVVType::VLMUL LMul)
static bool isFMUL(unsigned Opc)
static unsigned getInverseXqcicmOpcode(unsigned Opcode)
static bool getFPPatterns(MachineInstr &Root, SmallVectorImpl< unsigned > &Patterns, bool DoRegPressureReduce)
#define OPCODE_LMUL_CASE(OPC)
#define CASE_OPERAND_UIMM(NUM)
static Register findRegisterToSaveX5To(outliner::Candidate &C, const TargetRegisterInfo &TRI)
static bool canCombineShiftIntoShXAdd(const MachineBasicBlock &MBB, const MachineOperand &MO, unsigned OuterShiftAmt)
Utility routine that checks if.
static bool isCandidatePatchable(const MachineBasicBlock &MBB)
static bool isFADD(unsigned Opc)
static void genShXAddAddShift(MachineInstr &Root, unsigned AddOpIdx, SmallVectorImpl< MachineInstr * > &InsInstrs, SmallVectorImpl< MachineInstr * > &DelInstrs, DenseMap< Register, unsigned > &InstrIdxForVirtReg)
static bool isLoadImm(const MachineInstr *MI, int64_t &Imm)
static bool isMIModifiesReg(const MachineInstr &MI, const TargetRegisterInfo *TRI, MCRegister RegNo)
#define CASE_RVV_OPCODE_LMUL(OP, LMUL)
static bool canCombineFPFusedMultiply(const MachineInstr &Root, const MachineOperand &MO, bool DoRegPressureReduce)
static bool getSHXADDPatterns(const MachineInstr &Root, SmallVectorImpl< unsigned > &Patterns)
static bool getFPFusedMultiplyPatterns(MachineInstr &Root, SmallVectorImpl< unsigned > &Patterns, bool DoRegPressureReduce)
static cl::opt< MachineTraceStrategy > ForceMachineCombinerStrategy("riscv-force-machine-combiner-strategy", cl::Hidden, cl::desc("Force machine combiner to use a specific strategy for machine " "trace metrics evaluation."), cl::init(MachineTraceStrategy::TS_NumStrategies), cl::values(clEnumValN(MachineTraceStrategy::TS_Local, "local", "Local strategy."), clEnumValN(MachineTraceStrategy::TS_MinInstrCount, "min-instr", "MinInstrCount strategy.")))
static unsigned getSHXADDShiftAmount(unsigned Opc)
#define CASE_RVV_OPCODE_MASK(OP)
#define RVV_OPC_LMUL_MASK_CASE(OPC, INV)
static MachineInstr * canFoldAsPredicatedOp(Register Reg, const MachineRegisterInfo &MRI, const TargetInstrInfo *TII, const RISCVSubtarget &STI)
Identify instructions that can be folded into a CCMOV instruction, and return the defining instructio...
const SmallVectorImpl< MachineOperand > MachineBasicBlock * TBB
const SmallVectorImpl< MachineOperand > & Cond
This file declares the machine register scavenger class.
static bool memOpsHaveSameBasePtr(const MachineInstr &MI1, ArrayRef< const MachineOperand * > BaseOps1, const MachineInstr &MI2, ArrayRef< const MachineOperand * > BaseOps2)
This file contains some templates that are useful if you are working with the STL at all.
static bool contains(SmallPtrSetImpl< ConstantExpr * > &Cache, ConstantExpr *Expr, Constant *C)
Definition Value.cpp:483
This file defines the SmallVector class.
This file defines the 'Statistic' class, which is designed to be an easy way to expose various metric...
#define STATISTIC(VARNAME, DESC)
Definition Statistic.h:171
#define LLVM_DEBUG(...)
Definition Debug.h:119
static TableGen::Emitter::Opt Y("gen-skeleton-entry", EmitSkeleton, "Generate example skeleton entry")
static bool canCombine(MachineBasicBlock &MBB, MachineOperand &MO, unsigned CombineOpc=0)
static cl::opt< unsigned > CacheLineSize("cache-line-size", cl::init(0), cl::Hidden, cl::desc("Use this to override the target cache line size when " "specified by the user."))
Value * RHS
Value * LHS
Represent a constant reference to an array (0 or more elements consecutively in memory),...
Definition ArrayRef.h:40
const T & front() const
Get the first element.
Definition ArrayRef.h:144
bool empty() const
Check if the array is empty.
Definition ArrayRef.h:136
static LLVM_ABI DILocation * getMergedLocation(DILocation *LocA, DILocation *LocB)
Attempts to merge LocA and LocB into a single location; see DebugLoc::getMergedLocation for more deta...
bool isBigEndian() const
Definition DataLayout.h:218
A debug info location.
Definition DebugLoc.h:124
std::pair< iterator, bool > insert(const std::pair< KeyT, ValueT > &KV)
Definition DenseMap.h:286
bool hasMinSize() const
Optimize this function for minimum size (-Oz).
Definition Function.h:711
LiveInterval - This class represents the liveness of a register, or stack slot.
LiveInterval & getInterval(Register Reg)
SlotIndex ReplaceMachineInstrInMaps(MachineInstr &MI, MachineInstr &NewMI)
const Segment * getSegmentContaining(SlotIndex Idx) const
Return the segment that contains the specified index, or null if there is none.
LLVM_ABI void replaceKillInstruction(Register Reg, MachineInstr &OldMI, MachineInstr &NewMI)
replaceKillInstruction - Update register kill info by replacing a kill instruction with a new one.
bool hasValue() const
static LocationSize precise(uint64_t Value)
TypeSize getValue() const
MCInstBuilder & addReg(MCRegister Reg)
Add a new register operand.
MCInstBuilder & addImm(int64_t Val)
Add a new integer immediate operand.
Instances of this class represent a single low-level machine instruction.
Definition MCInst.h:188
Describe properties that are true of each instruction in the target description file.
unsigned getNumOperands() const
Return the number of declared MachineOperands for this MachineInstruction.
bool isConditionalBranch() const
Return true if this is a branch which may fall through to the next instruction or may transfer contro...
This holds information about one operand of a machine instruction, indicating the register class for ...
Definition MCInstrDesc.h:86
Wrapper class representing physical registers. Should be passed by value.
Definition MCRegister.h:41
const FeatureBitset & getFeatureBits() const
Set of metadata that should be preserved when using BuildMI().
MachineInstrBundleIterator< const MachineInstr > const_iterator
MachineInstrBundleIterator< MachineInstr, true > reverse_iterator
const MachineFunction * getParent() const
Return the MachineFunction containing this basic block.
MachineInstrBundleIterator< MachineInstr > iterator
MachineInstrBundleIterator< const MachineInstr, true > const_reverse_iterator
The MachineFrameInfo class represents an abstract stack frame until prolog/epilog code is inserted.
void setStackID(int ObjectIdx, uint8_t ID)
Align getObjectAlign(int ObjectIdx) const
Return the alignment of the specified stack object.
int64_t getObjectSize(int ObjectIdx) const
Return the size of the specified object.
const TargetSubtargetInfo & getSubtarget() const
getSubtarget - Return the subtarget for which this machine code is being compiled.
StringRef getName() const
getName - Return the name of the corresponding LLVM function.
MachineMemOperand * getMachineMemOperand(MachinePointerInfo PtrInfo, MachineMemOperand::Flags f, LLT MemTy, Align base_alignment, const AAMDNodes &AAInfo=AAMDNodes(), const MDNode *Ranges=nullptr, SyncScope::ID SSID=SyncScope::System, AtomicOrdering Ordering=AtomicOrdering::NotAtomic, AtomicOrdering FailureOrdering=AtomicOrdering::NotAtomic)
getMachineMemOperand - Allocate a new MachineMemOperand.
MachineFrameInfo & getFrameInfo()
getFrameInfo - Return the frame info object for the current function.
MachineRegisterInfo & getRegInfo()
getRegInfo - Return information about the registers currently in use.
const DataLayout & getDataLayout() const
Return the DataLayout attached to the Module associated to this MF.
Function & getFunction()
Return the LLVM function that this machine code represents.
Ty * getInfo()
getInfo - Keep track of various per-function pieces of information for backends that would like to do...
const TargetMachine & getTarget() const
getTarget - Return the target machine this machine code is compiled with
const MachineInstrBuilder & setMemRefs(ArrayRef< MachineMemOperand * > MMOs) const
const MachineInstrBuilder & addUse(Register RegNo, RegState Flags={}, unsigned SubReg=0) const
Add a virtual register use operand.
const MachineInstrBuilder & addReg(Register RegNo, RegState Flags={}, unsigned SubReg=0) const
Add a new virtual register operand.
const MachineInstrBuilder & setMIFlag(MachineInstr::MIFlag Flag) const
const MachineInstrBuilder & addImm(int64_t Val) const
Add a new immediate operand.
const MachineInstrBuilder & add(const MachineOperand &MO) const
const MachineInstrBuilder & addFrameIndex(int Idx) const
const MachineInstrBuilder & addMBB(MachineBasicBlock *MBB, unsigned TargetFlags=0) const
const MachineInstrBuilder & cloneMemRefs(const MachineInstr &OtherMI) const
const MachineInstrBuilder & setMIFlags(unsigned Flags) const
const MachineInstrBuilder & copyImplicitOps(const MachineInstr &OtherMI) const
Copy all the implicit operands from OtherMI onto this one.
const MachineInstrBuilder & addMemOperand(MachineMemOperand *MMO) const
reverse_iterator getReverse() const
Get a reverse iterator to the same node.
Representation of each machine instruction.
unsigned getOpcode() const
Returns the opcode of this MachineInstr.
bool isReturn(QueryType Type=AnyInBundle) const
bool mayLoadOrStore(QueryType Type=AnyInBundle) const
Return true if this instruction could possibly read or modify memory.
const MachineBasicBlock * getParent() const
filtered_mop_range all_defs()
Returns an iterator range over all operands that are (explicit or implicit) register defs.
bool getFlag(MIFlag Flag) const
Return whether an MI flag is set.
LLVM_ABI bool isSafeToMove(bool &SawStore) const
Return true if it is safe to move this instruction.
LLVM_ABI unsigned getNumExplicitOperands() const
Returns the number of non-implicit operands.
bool modifiesRegister(Register Reg, const TargetRegisterInfo *TRI) const
Return true if the MachineInstr modifies (fully define or partially define) the specified register.
bool mayLoad(QueryType Type=AnyInBundle) const
Return true if this instruction could possibly read memory.
const MCInstrDesc & getDesc() const
Returns the target instruction descriptor of this MachineInstr.
LLVM_ABI bool hasUnmodeledSideEffects() const
Return true if this instruction has side effects that are not modeled by mayLoad / mayStore,...
bool hasOneMemOperand() const
Return true if this instruction has exactly one MachineMemOperand.
mmo_iterator memoperands_begin() const
Access to memory operands of the instruction.
LLVM_ABI bool hasOrderedMemoryRef() const
Return true if this instruction may have an ordered or volatile memory reference, or if the informati...
LLVM_ABI const MachineFunction * getMF() const
Return the function that contains the basic block that this instruction belongs to.
ArrayRef< MachineMemOperand * > memoperands() const
Access to memory operands of the instruction.
const DebugLoc & getDebugLoc() const
Returns the debug location id of this MachineInstr.
filtered_mop_range all_uses()
Returns an iterator range over all operands that are (explicit or implicit) register uses.
const MachineOperand & getOperand(unsigned i) const
uint32_t getFlags() const
Return the MI flags bitvector.
LLVM_ABI void clearKillInfo()
Clears kill flags on all operands.
A description of a memory reference used in the backend.
@ MOLoad
The memory access reads data.
@ MOStore
The memory access writes data.
This class contains meta information specific to a module.
MachineOperand class - Representation of each machine instruction operand.
int64_t getImm() const
bool isReg() const
isReg - Tests if this is a MO_Register operand.
MachineBasicBlock * getMBB() const
bool isImm() const
isImm - Tests if this is a MO_Immediate operand.
MachineInstr * getParent()
getParent - Return the instruction that this operand belongs to.
static MachineOperand CreateImm(int64_t Val)
MachineOperandType getType() const
getType - Returns the MachineOperandType for this operand.
Register getReg() const
getReg - Returns the register number.
bool isFI() const
isFI - Tests if this is a MO_FrameIndex operand.
LLVM_ABI bool isIdenticalTo(const MachineOperand &Other) const
Returns true if this operand is identical to the specified operand except for liveness related flags ...
@ MO_Immediate
Immediate operand.
@ MO_Register
Register operand.
MachineRegisterInfo - Keep track of information for virtual and physical registers,...
LLVM_ABI bool hasOneNonDBGUse(Register RegNo) const
hasOneNonDBGUse - Return true if there is exactly one non-Debug use of the specified register.
const TargetRegisterClass * getRegClass(Register Reg) const
Return the register class of the specified virtual register.
LLVM_ABI void clearKillFlags(Register Reg) const
clearKillFlags - Iterate over all the uses of the given register and clear the kill flag from the Mac...
LLVM_ABI MachineInstr * getVRegDef(Register Reg) const
getVRegDef - Return the machine instr that defines the specified virtual register or null if none is ...
bool isReserved(MCRegister PhysReg) const
isReserved - Returns true when PhysReg is a reserved register.
LLVM_ABI Register createVirtualRegister(const TargetRegisterClass *RegClass, StringRef Name="")
createVirtualRegister - Create and return a new virtual register in the function with the specified r...
bool hasOneUse(Register RegNo) const
hasOneUse - Return true if there is exactly one instruction using the specified register.
LLVM_ABI void clearVirtRegs()
clearVirtRegs - Remove all virtual registers (after physreg assignment).
const TargetRegisterInfo * getTargetRegisterInfo() const
LLVM_ABI bool isConstantPhysReg(MCRegister PhysReg) const
Returns true if PhysReg is unallocatable and constant throughout the function.
LLVM_ABI const TargetRegisterClass * constrainRegClass(Register Reg, const TargetRegisterClass *RC, unsigned MinNumRegs=0)
constrainRegClass - Constrain the register class of the specified virtual register to be a common sub...
LLVM_ABI void replaceRegWith(Register FromReg, Register ToReg)
replaceRegWith - Replace all instances of FromReg with ToReg in the machine function.
LLVM_ABI MachineInstr * getUniqueVRegDef(Register Reg) const
getUniqueVRegDef - Return the unique machine instr that defines the specified virtual register or nul...
A Module instance is used to store all the information related to an LLVM module.
Definition Module.h:67
MI-level patchpoint operands.
Definition StackMaps.h:77
uint32_t getNumPatchBytes() const
Return the number of patchable bytes the given patchpoint should emit.
Definition StackMaps.h:105
void storeRegToStackSlot(MachineBasicBlock &MBB, MachineBasicBlock::iterator MBBI, Register SrcReg, bool IsKill, int FrameIndex, const TargetRegisterClass *RC, Register VReg, MachineInstr::MIFlag Flags=MachineInstr::NoFlags) const override
static bool isSafeToMove(const MachineInstr &From, const MachineBasicBlock::iterator &To)
Return true if moving From down to To won't cause any physical register reads or writes to be clobber...
MachineInstr * convertToThreeAddress(MachineInstr &MI, LiveVariables *LV, LiveIntervals *LIS) const override
Register isLoadFromStackSlot(const MachineInstr &MI, int &FrameIndex) const override
std::optional< std::unique_ptr< outliner::OutlinedFunction > > getOutliningCandidateInfo(const MachineModuleInfo &MMI, std::vector< outliner::Candidate > &RepeatedSequenceLocs, unsigned MinRepeats) const override
unsigned removeBranch(MachineBasicBlock &MBB, int *BytesRemoved=nullptr) const override
void genAlternativeCodeSequence(MachineInstr &Root, unsigned Pattern, SmallVectorImpl< MachineInstr * > &InsInstrs, SmallVectorImpl< MachineInstr * > &DelInstrs, DenseMap< Register, unsigned > &InstrIdxForVirtReg) const override
void movImm(MachineBasicBlock &MBB, MachineBasicBlock::iterator MBBI, const DebugLoc &DL, Register DstReg, uint64_t Val, MachineInstr::MIFlag Flag=MachineInstr::NoFlags, bool DstRenamable=false, bool DstIsDead=false) const
MachineInstr * emitLdStWithAddr(MachineInstr &MemI, const ExtAddrMode &AM) const override
void mulImm(MachineFunction &MF, MachineBasicBlock &MBB, MachineBasicBlock::iterator II, const DebugLoc &DL, Register DestReg, uint32_t Amt, MachineInstr::MIFlag Flag) const
Generate code to multiply the value in DestReg by Amt - handles all the common optimizations for this...
static bool isPairableLdStInstOpc(unsigned Opc)
Return true if pairing the given load or store may be paired with another.
RISCVInstrInfo(const RISCVSubtarget &STI)
void loadRegFromStackSlot(MachineBasicBlock &MBB, MachineBasicBlock::iterator MBBI, Register DstReg, int FrameIndex, const TargetRegisterClass *RC, Register VReg, unsigned SubReg=0, MachineInstr::MIFlag Flags=MachineInstr::NoFlags) const override
bool isFunctionSafeToOutlineFrom(MachineFunction &MF, bool OutlineFromLinkOnceODRs) const override
std::unique_ptr< TargetInstrInfo::PipelinerLoopInfo > analyzeLoopForPipelining(MachineBasicBlock *LoopBB) const override
unsigned insertBranch(MachineBasicBlock &MBB, MachineBasicBlock *TBB, MachineBasicBlock *FBB, ArrayRef< MachineOperand > Cond, const DebugLoc &dl, int *BytesAdded=nullptr) const override
bool hasReassociableSibling(const MachineInstr &Inst, bool &Commuted) const override
static bool isLdStSafeToPair(const MachineInstr &LdSt, const TargetRegisterInfo *TRI)
void copyPhysRegVector(MachineBasicBlock &MBB, MachineBasicBlock::iterator MBBI, const DebugLoc &DL, MCRegister DstReg, MCRegister SrcReg, bool KillSrc, const TargetRegisterClass *RegClass) const
bool isReMaterializableImpl(const MachineInstr &MI) const override
MachineInstr * optimizeSelect(MachineInstr &MI, SmallPtrSetImpl< MachineInstr * > &SeenMIs, bool) const override
bool isVRegCopy(const MachineInstr *MI, unsigned LMul=0) const
Return true if MI is a COPY to a vector register of a specific LMul, or any kind of vector registers ...
bool canFoldIntoAddrMode(const MachineInstr &MemI, Register Reg, const MachineInstr &AddrI, ExtAddrMode &AM) const override
void insertIndirectBranch(MachineBasicBlock &MBB, MachineBasicBlock &NewDestBB, MachineBasicBlock &RestoreBB, const DebugLoc &DL, int64_t BrOffset, RegScavenger *RS) const override
bool isAsCheapAsAMove(const MachineInstr &MI) const override
bool verifyInstruction(const MachineInstr &MI, StringRef &ErrInfo) const override
bool getMemOperandWithOffsetWidth(const MachineInstr &LdSt, const MachineOperand *&BaseOp, int64_t &Offset, LocationSize &Width, const TargetRegisterInfo *TRI) const
unsigned getTailDuplicateSize(CodeGenOptLevel OptLevel) const override
void getReassociateOperandIndices(const MachineInstr &Root, unsigned Pattern, std::array< unsigned, 5 > &OperandIndices) const override
const RISCVSubtarget & STI
Register isStoreToStackSlot(const MachineInstr &MI, int &FrameIndex) const override
std::optional< unsigned > getInverseOpcode(unsigned Opcode) const override
bool simplifyInstruction(MachineInstr &MI) const override
ArrayRef< std::pair< unsigned, const char * > > getSerializableDirectMachineOperandTargetFlags() const override
outliner::InstrType getOutliningTypeImpl(const MachineModuleInfo &MMI, MachineBasicBlock::iterator &MBBI, unsigned Flags) const override
MachineTraceStrategy getMachineCombinerTraceStrategy() const override
unsigned getInstSizeInBytes(const MachineInstr &MI) const override
std::optional< RegImmPair > isAddImmediate(const MachineInstr &MI, Register Reg) const override
bool reverseBranchCondition(SmallVectorImpl< MachineOperand > &Cond) const override
ArrayRef< std::pair< MachineMemOperand::Flags, const char * > > getSerializableMachineMemOperandTargetFlags() const override
MCInst getNop() const override
bool analyzeCandidate(outliner::Candidate &C) const
bool isMBBSafeToOutlineFrom(MachineBasicBlock &MBB, unsigned &Flags) const override
bool getMemOperandsWithOffsetWidth(const MachineInstr &MI, SmallVectorImpl< const MachineOperand * > &BaseOps, int64_t &Offset, bool &OffsetIsScalable, LocationSize &Width, const TargetRegisterInfo *TRI) const override
void buildOutlinedFrame(MachineBasicBlock &MBB, MachineFunction &MF, const outliner::OutlinedFunction &OF) const override
bool requiresNTLHint(const MachineInstr &MI) const
Return true if the instruction requires an NTL hint to be emitted.
void finalizeInsInstrs(MachineInstr &Root, unsigned &Pattern, SmallVectorImpl< MachineInstr * > &InsInstrs) const override
std::pair< unsigned, unsigned > decomposeMachineOperandsTargetFlags(unsigned TF) const override
MachineInstr * commuteInstructionImpl(MachineInstr &MI, bool NewMI, unsigned OpIdx1, unsigned OpIdx2) const override
bool hasReassociableOperands(const MachineInstr &Inst, const MachineBasicBlock *MBB) const override
MachineBasicBlock * getBranchDestBlock(const MachineInstr &MI) const override
std::string createMIROperandComment(const MachineInstr &MI, const MachineOperand &Op, unsigned OpIdx, const TargetRegisterInfo *TRI) const override
bool shouldOutlineFromFunctionByDefault(MachineFunction &MF) const override
void copyPhysReg(MachineBasicBlock &MBB, MachineBasicBlock::iterator MBBI, const DebugLoc &DL, Register DstReg, Register SrcReg, bool KillSrc, bool RenamableDest=false, bool RenamableSrc=false) const override
bool findCommutedOpIndices(const MachineInstr &MI, unsigned &SrcOpIdx1, unsigned &SrcOpIdx2) const override
bool analyzeBranch(MachineBasicBlock &MBB, MachineBasicBlock *&TBB, MachineBasicBlock *&FBB, SmallVectorImpl< MachineOperand > &Cond, bool AllowModify) const override
MachineBasicBlock::iterator insertOutlinedCall(Module &M, MachineBasicBlock &MBB, MachineBasicBlock::iterator &It, MachineFunction &MF, outliner::Candidate &C) const override
MachineInstr * foldMemoryOperandImpl(MachineFunction &MF, MachineInstr &MI, ArrayRef< unsigned > Ops, int FrameIndex, MachineInstr *&CopyMI, LiveIntervals *LIS=nullptr, VirtRegMap *VRM=nullptr) const override
bool isBranchOffsetInRange(unsigned BranchOpc, int64_t BrOffset) const override
static RISCVCC::CondCode getCondFromBranchOpc(unsigned Opc)
bool isAssociativeAndCommutative(const MachineInstr &Inst, bool Invert) const override
CombinerObjective getCombinerObjective(unsigned Pattern) const override
bool isHighLatencyDef(int Opc) const override
static bool evaluateCondBranch(RISCVCC::CondCode CC, int64_t C0, int64_t C1)
Return the result of the evaluation of C0 CC C1, where CC is a RISCVCC::CondCode.
bool getMachineCombinerPatterns(MachineInstr &Root, SmallVectorImpl< unsigned > &Patterns, bool DoRegPressureReduce) const override
bool optimizeCondBranch(MachineInstr &MI) const override
std::optional< DestSourcePair > isCopyInstrImpl(const MachineInstr &MI) const override
static bool isFromLoadImm(const MachineRegisterInfo &MRI, const MachineOperand &Op, int64_t &Imm)
Return true if the operand is a load immediate instruction and sets Imm to the immediate value.
bool shouldClusterMemOps(ArrayRef< const MachineOperand * > BaseOps1, int64_t Offset1, bool OffsetIsScalable1, ArrayRef< const MachineOperand * > BaseOps2, int64_t Offset2, bool OffsetIsScalable2, unsigned ClusterSize, unsigned NumBytes) const override
bool areMemAccessesTriviallyDisjoint(const MachineInstr &MIa, const MachineInstr &MIb) const override
RISCVMachineFunctionInfo - This class is derived from MachineFunctionInfo and contains private RISCV-...
const RISCVRegisterInfo * getRegisterInfo() const override
Wrapper class representing virtual and physical registers.
Definition Register.h:20
constexpr bool isValid() const
Definition Register.h:112
constexpr bool isVirtual() const
Return true if the specified register number is in the virtual register namespace.
Definition Register.h:79
SlotIndex - An opaque wrapper around machine indexes.
Definition SlotIndexes.h:66
SlotIndex getRegSlot(bool EC=false) const
Returns the register use/def slot in the current instruction for a normal or early-clobber def.
A templated base class for SmallPtrSet which provides the typesafe interface that is common across al...
bool erase(PtrType Ptr)
Remove pointer from the set.
std::pair< iterator, bool > insert(PtrType Ptr)
Inserts Ptr if and only if there is no element in the container equal to Ptr.
This class consists of common code factored out of the SmallVector class to reduce code duplication b...
void push_back(const T &Elt)
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small.
MI-level stackmap operands.
Definition StackMaps.h:36
uint32_t getNumPatchBytes() const
Return the number of patchable bytes the given stackmap should emit.
Definition StackMaps.h:51
MI-level Statepoint operands.
Definition StackMaps.h:159
uint32_t getNumPatchBytes() const
Return the number of patchable bytes the given statepoint should emit.
Definition StackMaps.h:208
Represent a constant reference to a string, i.e.
Definition StringRef.h:56
Object returned by analyzeLoopForPipelining.
TargetInstrInfo - Interface to description of machine instruction set.
virtual bool findCommutedOpIndices(const MachineInstr &MI, unsigned &SrcOpIdx1, unsigned &SrcOpIdx2) const
Returns true iff the routine could find two commutable operands in the given machine instruction.
virtual bool hasReassociableOperands(const MachineInstr &Inst, const MachineBasicBlock *MBB) const
Return true when \P Inst has reassociable operands in the same \P MBB.
virtual void genAlternativeCodeSequence(MachineInstr &Root, unsigned Pattern, SmallVectorImpl< MachineInstr * > &InsInstrs, SmallVectorImpl< MachineInstr * > &DelInstrs, DenseMap< Register, unsigned > &InstIdxForVirtReg) const
When getMachineCombinerPatterns() finds patterns, this function generates the instructions that could...
virtual bool getMachineCombinerPatterns(MachineInstr &Root, SmallVectorImpl< unsigned > &Patterns, bool DoRegPressureReduce) const
Return true when there is potentially a faster code sequence for an instruction chain ending in Root.
virtual bool isReMaterializableImpl(const MachineInstr &MI) const
For instructions with opcodes for which the M_REMATERIALIZABLE flag is set, this hook lets the target...
virtual bool isMBBSafeToOutlineFrom(MachineBasicBlock &MBB, unsigned &Flags) const
Optional target hook that returns true if MBB is safe to outline from, and returns any target-specifi...
virtual void getReassociateOperandIndices(const MachineInstr &Root, unsigned Pattern, std::array< unsigned, 5 > &OperandIndices) const
The returned array encodes the operand index for each parameter because the operands may be commuted;...
virtual CombinerObjective getCombinerObjective(unsigned Pattern) const
Return the objective of a combiner pattern.
virtual MachineInstr * commuteInstructionImpl(MachineInstr &MI, bool NewMI, unsigned OpIdx1, unsigned OpIdx2) const
This method commutes the operands of the given machine instruction MI.
virtual bool hasReassociableSibling(const MachineInstr &Inst, bool &Commuted) const
Return true when \P Inst has reassociable sibling.
virtual std::string createMIROperandComment(const MachineInstr &MI, const MachineOperand &Op, unsigned OpIdx, const TargetRegisterInfo *TRI) const
const MCAsmInfo & getMCAsmInfo() const
Return target specific asm information.
const uint8_t TSFlags
Configurable target specific flags.
TargetRegisterInfo base class - We assume that the target defines a static array of TargetRegisterDes...
TargetSubtargetInfo - Generic base class for all target subtargets.
virtual const TargetInstrInfo * getInstrInfo() const
virtual const TargetRegisterInfo * getRegisterInfo() const =0
Return the target's register information.
Target - Wrapper for Target specific information.
static constexpr TypeSize getFixed(ScalarTy ExactSize)
Definition TypeSize.h:343
static constexpr TypeSize getZero()
Definition TypeSize.h:349
static constexpr TypeSize getScalable(ScalarTy MinimumSize)
Definition TypeSize.h:346
self_iterator getIterator()
Definition ilist_node.h:123
A raw_ostream that writes to an std::string.
#define llvm_unreachable(msg)
Marks that the current location is not supposed to be reachable.
@ C
The default llvm calling convention, compatible with C.
Definition CallingConv.h:34
CondCode getInverseBranchCondition(CondCode)
unsigned getInverseBranchOpcode(unsigned BCC)
unsigned getBrCond(CondCode CC, unsigned SelectOpc=0)
static bool isValidRoundingMode(unsigned Mode)
static StringRef roundingModeToString(RoundingMode RndMode)
static unsigned getVecPolicyOpNum(const MCInstrDesc &Desc)
static bool usesMaskPolicy(uint64_t TSFlags)
static bool hasRoundModeOp(uint64_t TSFlags)
static unsigned getVLOpNum(const MCInstrDesc &Desc)
static bool hasVLOp(uint64_t TSFlags)
static MCRegister getTailExpandUseRegNo(const FeatureBitset &FeatureBits)
static int getFRMOpNum(const MCInstrDesc &Desc)
static int getVXRMOpNum(const MCInstrDesc &Desc)
static bool hasVecPolicyOp(uint64_t TSFlags)
static bool usesVXRM(uint64_t TSFlags)
static bool isRVVWideningReduction(uint64_t TSFlags)
static unsigned getSEWOpNum(const MCInstrDesc &Desc)
static bool hasSEWOp(uint64_t TSFlags)
static bool isFirstDefTiedToFirstUse(const MCInstrDesc &Desc)
InstSeq generateInstSeq(int64_t Val, const MCSubtargetInfo &STI)
SmallVector< Inst, 8 > InstSeq
Definition RISCVMatInt.h:43
@ OPERAND_UIMMLOG2XLEN_NONZERO
@ OPERAND_UIMM10_LSB00_NONZERO
@ OPERAND_SIMM10_LSB0000_NONZERO
static unsigned getNF(uint8_t TSFlags)
static RISCVVType::VLMUL getLMul(uint8_t TSFlags)
static bool isTailAgnostic(unsigned VType)
LLVM_ABI void printXSfmmVType(unsigned VType, raw_ostream &OS)
LLVM_ABI std::pair< unsigned, bool > decodeVLMUL(VLMUL VLMul)
static bool isValidSEW(unsigned SEW)
static bool isValidVType(unsigned VType)
LLVM_ABI void printVType(unsigned VType, raw_ostream &OS)
static bool isValidXSfmmVType(unsigned VTypeI)
static unsigned getSEW(unsigned VType)
static VLMUL getVLMUL(unsigned VType)
static bool isValidRoundingMode(unsigned Mode)
static StringRef roundingModeToString(RoundingMode RndMode)
bool hasEqualFRM(const MachineInstr &MI1, const MachineInstr &MI2)
bool isVLKnownLE(const MachineOperand &LHS, const MachineOperand &RHS)
Given two VL operands, do we know that LHS <= RHS?
bool isValidYBNDSWImm(int64_t Imm)
unsigned getRVVMCOpcode(unsigned RVVPseudoOpcode)
unsigned getDestLog2EEW(const MCInstrDesc &Desc, unsigned Log2SEW)
std::optional< unsigned > getVectorLowDemandedScalarBits(unsigned Opcode, unsigned Log2SEW)
std::optional< std::pair< unsigned, unsigned > > isRVVSpillForZvlsseg(unsigned Opcode)
static constexpr unsigned RVVBitsPerBlock
bool isRVVSpill(const MachineInstr &MI)
static constexpr unsigned RVVBytesPerBlock
static constexpr int64_t VLMaxSentinel
bool isVectorCopy(const TargetRegisterInfo *TRI, const MachineInstr &MI)
Return true if MI is a copy that will be lowered to one or more vmvNr.vs.
ValuesClass values(OptsTy... Options)
Helper to build a ValuesClass by forwarding a variable number of arguments as an initializer list to ...
initializer< Ty > init(const Ty &Val)
InstrType
Represents how an instruction should be mapped by the outliner.
This is an optimization pass for GlobalISel generic memory operations.
auto drop_begin(T &&RangeOrContainer, size_t N=1)
Return a range covering RangeOrContainer with the first N elements excluded.
Definition STLExtras.h:315
@ Offset
Definition DWP.cpp:558
@ SHXADD_ADD_SLLI_OP2
@ SHXADD_ADD_SLLI_OP1
MachineTraceStrategy
Strategies for selecting traces.
@ TS_MinInstrCount
Select the trace through a block that has the fewest instructions.
@ TS_Local
Select the trace that contains only the current basic block.
bool all_of(R &&range, UnaryPredicate P)
Provide wrappers to std::all_of which take ranges instead of having to pass begin/end explicitly.
Definition STLExtras.h:1738
static const MachineMemOperand::Flags MONontemporalBit1
MachineInstrBuilder BuildMI(MachineFunction &MF, const MIMetadata &MIMD, const MCInstrDesc &MCID)
Builder interface. Specify how to create the initial instruction itself.
constexpr bool isInt(int64_t x)
Checks if an integer fits into the given bit width.
Definition MathExtras.h:165
RegState
Flags to represent properties of register accesses.
@ Implicit
Not emitted register (e.g. carry, or temporary result).
@ Dead
Unused definition.
@ Kill
The last use of a register.
@ Undef
Value of the register doesn't matter.
@ Define
Register definition.
auto enumerate(FirstRange &&First, RestRanges &&...Rest)
Given two or more input ranges, returns a new range whose values are tuples (A, B,...
Definition STLExtras.h:2553
bool isValidAtomicOrdering(Int I)
constexpr RegState getKillRegState(bool B)
static const MachineMemOperand::Flags MONontemporalBit0
constexpr RegState getDeadRegState(bool B)
Op::Description Desc
unsigned M1(unsigned Val)
Definition VE.h:377
constexpr bool has_single_bit(T Value) noexcept
Definition bit.h:149
unsigned Log2_32(uint32_t Value)
Return the floor log base 2 of the specified value, -1 if the value is zero.
Definition MathExtras.h:331
MachineInstr * getImm(const MachineOperand &MO, const MachineRegisterInfo *MRI)
constexpr RegState getRenamableRegState(bool B)
decltype(auto) get(const PointerIntPair< PointerTy, IntBits, IntType, PtrTraits, Info > &Pair)
LLVM_ABI raw_ostream & dbgs()
dbgs() - This returns a reference to a raw_ostream for debugging messages.
Definition Debug.cpp:209
LLVM_ABI void report_fatal_error(Error Err, bool gen_crash_diag=true)
Definition Error.cpp:163
constexpr RegState getDefRegState(bool B)
CombinerObjective
The combiner's goal may differ based on which pattern it is attempting to optimize.
constexpr bool isUInt(uint64_t x)
Checks if an unsigned integer fits into the given bit width.
Definition MathExtras.h:189
CodeGenOptLevel
Code generation optimization level.
Definition CodeGen.h:82
int isShifted359(T Value, int &Shift)
bool isa(const From &Val)
isa<X> - Return true if the parameter to the template is an instance of one of the template type argu...
Definition Casting.h:547
uint16_t MCPhysReg
An unsigned integer type large enough to represent all physical registers, but not necessarily virtua...
Definition MCRegister.h:21
DWARFExpression::Operation Op
ArrayRef(const T &OneElt) -> ArrayRef< T >
constexpr bool isShiftedInt(int64_t x)
Checks if a signed integer is an N bit number shifted left by S.
Definition MathExtras.h:182
void erase_if(Container &C, UnaryPredicate P)
Provide a container algorithm similar to C++ Library Fundamentals v2's erase_if which is equivalent t...
Definition STLExtras.h:2191
constexpr int64_t SignExtend64(uint64_t x)
Sign-extend the number in the bottom B bits of X to a 64-bit integer.
Definition MathExtras.h:572
LLVM_ABI const Value * getUnderlyingObject(const Value *V, unsigned MaxLookup=MaxLookupSearchDepth)
This method strips off any GEP address adjustments, pointer casts or llvm.threadlocal....
constexpr bool isShiftedUInt(uint64_t x)
Checks if a unsigned integer is an N bit number shifted left by S.
Definition MathExtras.h:198
void swap(llvm::BitVector &LHS, llvm::BitVector &RHS)
Implement std::swap in terms of BitVector swap.
Definition BitVector.h:863
#define N
This struct is a compact representation of a valid (non-zero power of two) alignment.
Definition Alignment.h:39
Used to describe addressing mode similar to ExtAddrMode in CodeGenPrepare.
This represents a simple continuous liveness interval for a value.
static LLVM_ABI MachinePointerInfo getFixedStack(MachineFunction &MF, int FI, int64_t Offset=0)
Return a MachinePointerInfo record that refers to the specified FrameIndex.
static bool isRVVRegClass(const TargetRegisterClass *RC)
Used to describe a register and immediate addition.
An individual sequence of instructions to be replaced with a call to an outlined function.
MachineFunction * getMF() const
The information necessary to create an outlined function for some class of candidate.