66#define GET_INSTRINFO_CTOR_DTOR
67#include "AArch64GenInstrInfo.inc"
69#define DEBUG_TYPE "AArch64InstrInfo"
71STATISTIC(NumCopyInstrs,
"Number of COPY instructions expanded");
72STATISTIC(NumZCRegMoveInstrsGPR,
"Number of zero-cycle GPR register move "
73 "instructions expanded from canonical COPY");
74STATISTIC(NumZCRegMoveInstrsFPR,
"Number of zero-cycle FPR register move "
75 "instructions expanded from canonical COPY");
76STATISTIC(NumZCZeroingInstrsGPR,
"Number of zero-cycle GPR zeroing "
77 "instructions expanded from canonical COPY");
82 cl::desc(
"Restrict range of CB instructions (DEBUG)"));
86 cl::desc(
"Restrict range of TB[N]Z instructions (DEBUG)"));
90 cl::desc(
"Restrict range of CB[N]Z instructions (DEBUG)"));
94 cl::desc(
"Restrict range of Bcc instructions (DEBUG)"));
98 cl::desc(
"Restrict range of B instructions (DEBUG)"));
102 cl::desc(
"Restrict range of instructions to search for the "
103 "machine-combiner gather pattern optimization"));
108 RI(STI.getTargetTriple(), STI.getHwMode()), Subtarget(STI) {}
118 switch (
MI.getOpcode()) {
129 if (
MI.getOperand(0).getReg() != AArch64::LR)
138 if (MO.isReg() && MO.isDef() && MO.getReg() == AArch64::LR)
156 auto Op =
MI.getOpcode();
157 if (
Op == AArch64::INLINEASM ||
Op == AArch64::INLINEASM_BR)
158 return getInlineAsmLength(
MI.getOperand(0).getSymbolName(), MAI);
162 if (
MI.isMetaInstruction())
167 unsigned NumBytes = 0;
177 NumBytes =
Desc.getSize() ?
Desc.getSize() : 4;
180 if (!MFI->shouldSignReturnAddress(*MF))
183 auto Method = STI.getAuthenticatedLRCheckMethod(*MF);
191 switch (
Desc.getOpcode()) {
194 return Desc.getSize();
201 case TargetOpcode::STACKMAP:
204 assert(NumBytes % 4 == 0 &&
"Invalid number of NOP bytes requested!");
206 case TargetOpcode::PATCHPOINT:
209 assert(NumBytes % 4 == 0 &&
"Invalid number of NOP bytes requested!");
211 case TargetOpcode::STATEPOINT:
213 assert(NumBytes % 4 == 0 &&
"Invalid number of NOP bytes requested!");
218 case TargetOpcode::PATCHABLE_FUNCTION_ENTER:
223 F.getFnAttributeAsParsedInteger(
"patchable-function-entry", 9) * 4;
225 case TargetOpcode::PATCHABLE_FUNCTION_EXIT:
226 case TargetOpcode::PATCHABLE_TAIL_CALL:
227 case TargetOpcode::PATCHABLE_TYPED_EVENT_CALL:
231 case TargetOpcode::PATCHABLE_EVENT_CALL:
237 NumBytes =
MI.getOperand(1).getImm();
239 case AArch64::MOVaddr:
240 case AArch64::MOVaddrJT:
241 case AArch64::MOVaddrCP:
242 case AArch64::MOVaddrBA:
243 case AArch64::MOVaddrTLS:
244 case AArch64::MOVaddrEXT: {
248 MI.getOperand(1).getTargetFlags(),
249 Subtarget.isTargetMachO(), Insn);
250 NumBytes = Insn.
size() * 4;
254 case AArch64::MOVi32imm:
255 case AArch64::MOVi64imm: {
257 unsigned BitSize =
Desc.getOpcode() == AArch64::MOVi32imm ? 32 : 64;
260 NumBytes = Insn.
size() * 4;
264 case TargetOpcode::BUNDLE:
265 NumBytes = getInstBundleSize(
MI);
301 case AArch64::CBWPri:
302 case AArch64::CBXPri:
303 case AArch64::CBWPrr:
304 case AArch64::CBXPrr:
312 case AArch64::CBBAssertExt:
313 case AArch64::CBHAssertExt:
344 case AArch64::CBWPri:
345 case AArch64::CBXPri:
346 case AArch64::CBBAssertExt:
347 case AArch64::CBHAssertExt:
348 case AArch64::CBWPrr:
349 case AArch64::CBXPrr:
355 int64_t BrOffset)
const {
357 assert(Bits >= 3 &&
"max branch displacement must be enough to jump"
358 "over conditional branch expansion");
359 return isIntN(Bits, BrOffset / 4);
364 switch (
MI.getOpcode()) {
368 return MI.getOperand(0).getMBB();
373 return MI.getOperand(2).getMBB();
379 return MI.getOperand(1).getMBB();
380 case AArch64::CBWPri:
381 case AArch64::CBXPri:
382 case AArch64::CBBAssertExt:
383 case AArch64::CBHAssertExt:
384 case AArch64::CBWPrr:
385 case AArch64::CBXPrr:
386 return MI.getOperand(3).getMBB();
396 assert(RS &&
"RegScavenger required for long branching");
398 "new block should be inserted for expanding unconditional branch");
401 "restore block should be inserted for restoring clobbered registers");
408 "Branch offsets outside of the signed 33-bit range not supported");
419 RS->enterBasicBlockEnd(
MBB);
422 constexpr Register Reg = AArch64::X16;
423 if (!RS->isRegUsed(Reg)) {
424 insertUnconditionalBranch(
MBB, &NewDestBB,
DL);
435 Register Scavenged = RS->FindUnusedReg(&AArch64::GPR64RegClass);
436 if (Scavenged != AArch64::NoRegister) {
437 buildIndirectBranch(Scavenged, NewDestBB);
438 RS->setRegUsed(Scavenged);
447 "Unable to insert indirect branch inside function that has red zone");
470 bool AllowModify)
const {
477 if (
I->getOpcode() == AArch64::SpeculationBarrierISBDSBEndBB ||
478 I->getOpcode() == AArch64::SpeculationBarrierSBEndBB) {
482 if (!isUnpredicatedTerminator(*
I))
489 unsigned LastOpc = LastInst->
getOpcode();
490 if (
I ==
MBB.begin() || !isUnpredicatedTerminator(*--
I)) {
505 unsigned SecondLastOpc = SecondLastInst->
getOpcode();
512 LastInst = SecondLastInst;
514 if (
I ==
MBB.begin() || !isUnpredicatedTerminator(*--
I)) {
519 SecondLastInst = &*
I;
520 SecondLastOpc = SecondLastInst->
getOpcode();
531 LastInst = SecondLastInst;
533 if (
I ==
MBB.begin() || !isUnpredicatedTerminator(*--
I)) {
535 "unreachable unconditional branches removed above");
544 SecondLastInst = &*
I;
545 SecondLastOpc = SecondLastInst->
getOpcode();
549 if (SecondLastInst &&
I !=
MBB.begin() && isUnpredicatedTerminator(*--
I))
565 I->eraseFromParent();
574 I->eraseFromParent();
583 MachineBranchPredicate &MBP,
584 bool AllowModify)
const {
596 assert(MBP.TrueDest &&
"expected!");
597 MBP.FalseDest = FBB ? FBB :
MBB.getNextNode();
599 MBP.ConditionDef =
nullptr;
600 MBP.SingleUseCondition =
false;
610 if (
I ==
MBB.begin())
626 if (
MI.modifiesRegister(AArch64::NZCV,
nullptr)) {
627 MBP.ConditionDef = &
MI;
636 case AArch64::CBNZX: {
640 MBP.Predicate = (
Opc == AArch64::CBNZX ||
Opc == AArch64::CBNZW)
641 ? MachineBranchPredicate::PRED_NE
642 : MachineBranchPredicate::PRED_EQ;
643 Register CondReg = MBP.LHS.getReg();
652 case AArch64::TBNZX: {
673 Cond[1].setImm(AArch64::CBNZW);
676 Cond[1].setImm(AArch64::CBZW);
679 Cond[1].setImm(AArch64::CBNZX);
682 Cond[1].setImm(AArch64::CBZX);
685 Cond[1].setImm(AArch64::TBNZW);
688 Cond[1].setImm(AArch64::TBZW);
691 Cond[1].setImm(AArch64::TBNZX);
694 Cond[1].setImm(AArch64::TBZX);
698 case AArch64::CBWPri:
699 case AArch64::CBXPri:
700 case AArch64::CBBAssertExt:
701 case AArch64::CBHAssertExt:
702 case AArch64::CBWPrr:
703 case AArch64::CBXPrr: {
716 int *BytesRemoved)
const {
726 I->eraseFromParent();
730 if (
I ==
MBB.begin()) {
743 I->eraseFromParent();
750void AArch64InstrInfo::instantiateCondBranch(
775 if (
Cond.size() > 5) {
786 assert(
TBB &&
"insertBranch must not be told to insert a fallthrough");
813 unsigned Opc =
MI.getOpcode();
820 if (
MI.getOperand(0).getReg() == AArch64::WZR ||
821 MI.getOperand(0).getReg() == AArch64::XZR) {
823 dbgs() <<
"Removing always taken branch: " <<
MI);
826 for (
auto *S : Succs)
828 MBB->removeSuccessor(S);
830 while (
MBB->rbegin() != &
MI)
831 MBB->rbegin()->eraseFromParent();
832 MI.eraseFromParent();
842 if (
MI.getOperand(0).getReg() == AArch64::WZR ||
843 MI.getOperand(0).getReg() == AArch64::XZR) {
845 dbgs() <<
"Removing never taken branch: " <<
MI);
847 MI.getParent()->removeSuccessor(
Target);
848 MI.eraseFromParent();
861 if (!
DefMI->isFullCopy())
863 VReg =
DefMI->getOperand(1).getReg();
872 unsigned *NewReg =
nullptr) {
877 bool Is64Bit = AArch64::GPR64allRegClass.hasSubClassEq(MRI.
getRegClass(VReg));
881 switch (
DefMI->getOpcode()) {
882 case AArch64::SUBREG_TO_REG:
886 if (!
DefMI->getOperand(1).isReg())
888 if (!
DefMI->getOperand(2).isImm() ||
889 DefMI->getOperand(2).getImm() != AArch64::sub_32)
892 if (
DefMI->getOpcode() != AArch64::MOVi32imm)
894 if (!
DefMI->getOperand(1).isImm() ||
DefMI->getOperand(1).getImm() != 1)
897 SrcReg = AArch64::XZR;
898 Opc = AArch64::CSINCXr;
901 case AArch64::MOVi32imm:
902 case AArch64::MOVi64imm:
903 if (!
DefMI->getOperand(1).isImm() ||
DefMI->getOperand(1).getImm() != 1)
905 SrcReg = Is64Bit ? AArch64::XZR : AArch64::WZR;
906 Opc = Is64Bit ? AArch64::CSINCXr : AArch64::CSINCWr;
909 case AArch64::ADDSXri:
910 case AArch64::ADDSWri:
912 if (
DefMI->findRegisterDefOperandIdx(AArch64::NZCV,
nullptr,
917 case AArch64::ADDXri:
918 case AArch64::ADDWri:
920 if (!
DefMI->getOperand(2).isImm() ||
DefMI->getOperand(2).getImm() != 1 ||
921 DefMI->getOperand(3).getImm() != 0)
923 SrcReg =
DefMI->getOperand(1).getReg();
924 Opc = Is64Bit ? AArch64::CSINCXr : AArch64::CSINCWr;
927 case AArch64::ORNXrr:
928 case AArch64::ORNWrr: {
931 if (ZReg != AArch64::XZR && ZReg != AArch64::WZR)
933 SrcReg =
DefMI->getOperand(2).getReg();
934 Opc = Is64Bit ? AArch64::CSINVXr : AArch64::CSINVWr;
938 case AArch64::SUBSXrr:
939 case AArch64::SUBSWrr:
941 if (
DefMI->findRegisterDefOperandIdx(AArch64::NZCV,
nullptr,
946 case AArch64::SUBXrr:
947 case AArch64::SUBWrr: {
950 if (ZReg != AArch64::XZR && ZReg != AArch64::WZR)
952 SrcReg =
DefMI->getOperand(2).getReg();
953 Opc = Is64Bit ? AArch64::CSNEGXr : AArch64::CSNEGWr;
959 assert(
Opc && SrcReg &&
"Missing parameters");
971 int &FalseCycles)
const {
982 if (!RI.getCommonSubClass(RC, MRI.
getRegClass(DstReg)))
986 unsigned ExtraCondLat =
Cond.size() != 1;
990 if (AArch64::GPR64allRegClass.hasSubClassEq(RC) ||
991 AArch64::GPR32allRegClass.hasSubClassEq(RC)) {
993 CondCycles = 1 + ExtraCondLat;
994 TrueCycles = FalseCycles = 1;
1004 if (AArch64::FPR64RegClass.hasSubClassEq(RC) ||
1005 AArch64::FPR32RegClass.hasSubClassEq(RC)) {
1006 CondCycles = 5 + ExtraCondLat;
1007 TrueCycles = FalseCycles = 2;
1024 switch (
Cond.size()) {
1044 case AArch64::CBNZW:
1048 case AArch64::CBNZX:
1079 case AArch64::TBNZW:
1080 case AArch64::TBNZX:
1102 unsigned SubsOpc, SubsDestReg;
1108 case AArch64::CBWPri:
1109 SubsOpc = AArch64::SUBSWri;
1110 SubsDestReg = AArch64::WZR;
1113 case AArch64::CBXPri:
1114 SubsOpc = AArch64::SUBSXri;
1115 SubsDestReg = AArch64::XZR;
1118 case AArch64::CBWPrr:
1119 SubsOpc = AArch64::SUBSWrr;
1120 SubsDestReg = AArch64::WZR;
1123 case AArch64::CBXPrr:
1124 SubsOpc = AArch64::SUBSXrr;
1125 SubsDestReg = AArch64::XZR;
1154 switch (ExtendType) {
1160 "Unexpected compare-and-branch instruction for SXTB shift-extend");
1161 ExtOpc = AArch64::SBFMWri;
1167 "Unexpected compare-and-branch instruction for SXTH shift-extend");
1168 ExtOpc = AArch64::SBFMWri;
1174 "Unexpected compare-and-branch instruction for UXTB shift-extend");
1175 ExtOpc = AArch64::ANDWri;
1181 "Unexpected compare-and-branch instruction for UXTH shift-extend");
1182 ExtOpc = AArch64::ANDWri;
1191 if (ExtOpc != AArch64::ANDWri)
1193 MBBI.addImm(ExtBits);
1221 bool TryFold =
false;
1223 RC = &AArch64::GPR64RegClass;
1224 Opc = AArch64::CSELXr;
1227 RC = &AArch64::GPR32RegClass;
1228 Opc = AArch64::CSELWr;
1231 RC = &AArch64::FPR64RegClass;
1232 Opc = AArch64::FCSELDrrr;
1234 RC = &AArch64::FPR32RegClass;
1235 Opc = AArch64::FCSELSrrr;
1237 assert(RC &&
"Unsupported regclass");
1241 unsigned NewReg = 0;
1264 (FalseReg.
isVirtual() || FalseReg == AArch64::WZR ||
1265 FalseReg == AArch64::XZR) &&
1266 "FalseReg was folded into a non-virtual register other than WZR or XZR");
1283 assert(BitSize == 64 &&
"Only bit sizes of 32 or 64 allowed");
1288 return Is.
size() <= 2;
1293 assert(
MI.isCopy() &&
"Expected COPY instruction");
1299 if (
Reg.isVirtual())
1301 if (
Reg.isPhysical())
1302 return RI.getMinimalPhysRegClass(
Reg);
1307 if (DstRC && SrcRC && !RI.getCommonSubClass(DstRC, SrcRC))
1310 return MI.isAsCheapAsAMove();
1316 if (Subtarget.hasExynosCheapAsMoveHandling()) {
1317 if (isExynosCheapAsMove(
MI))
1319 return MI.isAsCheapAsAMove();
1322 switch (
MI.getOpcode()) {
1324 return MI.isAsCheapAsAMove();
1326 case TargetOpcode::COPY:
1329 case AArch64::ADDWrs:
1330 case AArch64::ADDXrs:
1331 case AArch64::SUBWrs:
1332 case AArch64::SUBXrs:
1333 return Subtarget.hasALULSLFast() &&
MI.getOperand(3).getImm() <= 4;
1338 case AArch64::MOVi32imm:
1340 case AArch64::MOVi64imm:
1345bool AArch64InstrInfo::isFalkorShiftExtFast(
const MachineInstr &
MI) {
1346 switch (
MI.getOpcode()) {
1350 case AArch64::ADDWrs:
1351 case AArch64::ADDXrs:
1352 case AArch64::ADDSWrs:
1353 case AArch64::ADDSXrs: {
1354 unsigned Imm =
MI.getOperand(3).getImm();
1361 case AArch64::ADDWrx:
1362 case AArch64::ADDXrx:
1363 case AArch64::ADDXrx64:
1364 case AArch64::ADDSWrx:
1365 case AArch64::ADDSXrx:
1366 case AArch64::ADDSXrx64: {
1367 unsigned Imm =
MI.getOperand(3).getImm();
1379 case AArch64::SUBWrs:
1380 case AArch64::SUBSWrs: {
1381 unsigned Imm =
MI.getOperand(3).getImm();
1383 return ShiftVal == 0 ||
1387 case AArch64::SUBXrs:
1388 case AArch64::SUBSXrs: {
1389 unsigned Imm =
MI.getOperand(3).getImm();
1391 return ShiftVal == 0 ||
1395 case AArch64::SUBWrx:
1396 case AArch64::SUBXrx:
1397 case AArch64::SUBXrx64:
1398 case AArch64::SUBSWrx:
1399 case AArch64::SUBSXrx:
1400 case AArch64::SUBSXrx64: {
1401 unsigned Imm =
MI.getOperand(3).getImm();
1413 case AArch64::LDRBBroW:
1414 case AArch64::LDRBBroX:
1415 case AArch64::LDRBroW:
1416 case AArch64::LDRBroX:
1417 case AArch64::LDRDroW:
1418 case AArch64::LDRDroX:
1419 case AArch64::LDRHHroW:
1420 case AArch64::LDRHHroX:
1421 case AArch64::LDRHroW:
1422 case AArch64::LDRHroX:
1423 case AArch64::LDRQroW:
1424 case AArch64::LDRQroX:
1425 case AArch64::LDRSBWroW:
1426 case AArch64::LDRSBWroX:
1427 case AArch64::LDRSBXroW:
1428 case AArch64::LDRSBXroX:
1429 case AArch64::LDRSHWroW:
1430 case AArch64::LDRSHWroX:
1431 case AArch64::LDRSHXroW:
1432 case AArch64::LDRSHXroX:
1433 case AArch64::LDRSWroW:
1434 case AArch64::LDRSWroX:
1435 case AArch64::LDRSroW:
1436 case AArch64::LDRSroX:
1437 case AArch64::LDRWroW:
1438 case AArch64::LDRWroX:
1439 case AArch64::LDRXroW:
1440 case AArch64::LDRXroX:
1441 case AArch64::PRFMroW:
1442 case AArch64::PRFMroX:
1443 case AArch64::STRBBroW:
1444 case AArch64::STRBBroX:
1445 case AArch64::STRBroW:
1446 case AArch64::STRBroX:
1447 case AArch64::STRDroW:
1448 case AArch64::STRDroX:
1449 case AArch64::STRHHroW:
1450 case AArch64::STRHHroX:
1451 case AArch64::STRHroW:
1452 case AArch64::STRHroX:
1453 case AArch64::STRQroW:
1454 case AArch64::STRQroX:
1455 case AArch64::STRSroW:
1456 case AArch64::STRSroX:
1457 case AArch64::STRWroW:
1458 case AArch64::STRWroX:
1459 case AArch64::STRXroW:
1460 case AArch64::STRXroX: {
1461 unsigned IsSigned =
MI.getOperand(3).getImm();
1468 unsigned Opc =
MI.getOpcode();
1472 case AArch64::SEH_StackAlloc:
1473 case AArch64::SEH_SaveFPLR:
1474 case AArch64::SEH_SaveFPLR_X:
1475 case AArch64::SEH_SaveReg:
1476 case AArch64::SEH_SaveReg_X:
1477 case AArch64::SEH_SaveRegP:
1478 case AArch64::SEH_SaveRegP_X:
1479 case AArch64::SEH_SaveFReg:
1480 case AArch64::SEH_SaveFReg_X:
1481 case AArch64::SEH_SaveFRegP:
1482 case AArch64::SEH_SaveFRegP_X:
1483 case AArch64::SEH_SetFP:
1484 case AArch64::SEH_AddFP:
1485 case AArch64::SEH_Nop:
1486 case AArch64::SEH_PrologEnd:
1487 case AArch64::SEH_EpilogStart:
1488 case AArch64::SEH_EpilogEnd:
1489 case AArch64::SEH_PACSignLR:
1490 case AArch64::SEH_SaveAnyRegI:
1491 case AArch64::SEH_SaveAnyRegIP:
1492 case AArch64::SEH_SaveAnyRegQP:
1493 case AArch64::SEH_SaveAnyRegQPX:
1494 case AArch64::SEH_AllocZ:
1495 case AArch64::SEH_SaveZReg:
1496 case AArch64::SEH_SavePReg:
1503 unsigned &SubIdx)
const {
1504 switch (
MI.getOpcode()) {
1507 case AArch64::SBFMXri:
1508 case AArch64::UBFMXri:
1511 if (
MI.getOperand(2).getImm() != 0 ||
MI.getOperand(3).getImm() != 31)
1514 SrcReg =
MI.getOperand(1).getReg();
1515 DstReg =
MI.getOperand(0).getReg();
1516 SubIdx = AArch64::sub_32;
1525 int64_t OffsetA = 0, OffsetB = 0;
1526 TypeSize WidthA(0,
false), WidthB(0,
false);
1527 bool OffsetAIsScalable =
false, OffsetBIsScalable =
false;
1548 OffsetAIsScalable == OffsetBIsScalable) {
1549 int LowOffset = OffsetA < OffsetB ? OffsetA : OffsetB;
1550 int HighOffset = OffsetA < OffsetB ? OffsetB : OffsetA;
1551 TypeSize LowWidth = (LowOffset == OffsetA) ? WidthA : WidthB;
1552 if (LowWidth.
isScalable() == OffsetAIsScalable &&
1570 switch (
MI.getOpcode()) {
1573 if (
MI.getOperand(0).getImm() == 0x14)
1580 case AArch64::MSRpstatesvcrImm1:
1587 auto Next = std::next(
MI.getIterator());
1588 return Next !=
MBB->end() &&
Next->isCFIInstruction();
1595 Register &SrcReg2, int64_t &CmpMask,
1596 int64_t &CmpValue)
const {
1600 assert(
MI.getNumOperands() >= 2 &&
"All AArch64 cmps should have 2 operands");
1601 if (!
MI.getOperand(1).isReg() ||
MI.getOperand(1).getSubReg())
1604 switch (
MI.getOpcode()) {
1607 case AArch64::PTEST_PP:
1608 case AArch64::PTEST_PP_ANY:
1609 case AArch64::PTEST_PP_FIRST:
1610 SrcReg =
MI.getOperand(0).getReg();
1611 SrcReg2 =
MI.getOperand(1).getReg();
1612 if (
MI.getOperand(2).getSubReg())
1619 case AArch64::SUBSWrr:
1620 case AArch64::SUBSWrs:
1621 case AArch64::SUBSWrx:
1622 case AArch64::SUBSXrr:
1623 case AArch64::SUBSXrs:
1624 case AArch64::SUBSXrx:
1625 case AArch64::ADDSWrr:
1626 case AArch64::ADDSWrs:
1627 case AArch64::ADDSWrx:
1628 case AArch64::ADDSXrr:
1629 case AArch64::ADDSXrs:
1630 case AArch64::ADDSXrx:
1632 SrcReg =
MI.getOperand(1).getReg();
1633 SrcReg2 =
MI.getOperand(2).getReg();
1636 if (
MI.getOperand(2).getSubReg())
1642 case AArch64::SUBSWri:
1643 case AArch64::ADDSWri:
1644 case AArch64::SUBSXri:
1645 case AArch64::ADDSXri:
1646 SrcReg =
MI.getOperand(1).getReg();
1649 CmpValue =
MI.getOperand(2).getImm();
1651 case AArch64::ANDSWri:
1652 case AArch64::ANDSXri:
1655 SrcReg =
MI.getOperand(1).getReg();
1659 MI.getOperand(2).getImm(),
1660 MI.getOpcode() == AArch64::ANDSWri ? 32 : 64);
1669 assert(
MBB &&
"Can't get MachineBasicBlock here");
1671 assert(MF &&
"Can't get MachineFunction here");
1676 for (
unsigned OpIdx = 0, EndIdx = Instr.getNumOperands();
OpIdx < EndIdx;
1683 if (!OpRegCstraints)
1691 "Operand has register constraints without being a register!");
1694 if (
Reg.isPhysical()) {
1711 bool MIDefinesZeroReg =
false;
1712 if (
MI.definesRegister(AArch64::WZR,
nullptr) ||
1713 MI.definesRegister(AArch64::XZR,
nullptr))
1714 MIDefinesZeroReg =
true;
1716 switch (
MI.getOpcode()) {
1718 return MI.getOpcode();
1719 case AArch64::ADDSWrr:
1720 return AArch64::ADDWrr;
1721 case AArch64::ADDSWri:
1722 return MIDefinesZeroReg ? AArch64::ADDSWri : AArch64::ADDWri;
1723 case AArch64::ADDSWrs:
1724 return MIDefinesZeroReg ? AArch64::ADDSWrs : AArch64::ADDWrs;
1725 case AArch64::ADDSWrx:
1726 return AArch64::ADDWrx;
1727 case AArch64::ADDSXrr:
1728 return AArch64::ADDXrr;
1729 case AArch64::ADDSXri:
1730 return MIDefinesZeroReg ? AArch64::ADDSXri : AArch64::ADDXri;
1731 case AArch64::ADDSXrs:
1732 return MIDefinesZeroReg ? AArch64::ADDSXrs : AArch64::ADDXrs;
1733 case AArch64::ADDSXrx:
1734 return AArch64::ADDXrx;
1735 case AArch64::SUBSWrr:
1736 return AArch64::SUBWrr;
1737 case AArch64::SUBSWri:
1738 return MIDefinesZeroReg ? AArch64::SUBSWri : AArch64::SUBWri;
1739 case AArch64::SUBSWrs:
1740 return MIDefinesZeroReg ? AArch64::SUBSWrs : AArch64::SUBWrs;
1741 case AArch64::SUBSWrx:
1742 return AArch64::SUBWrx;
1743 case AArch64::SUBSXrr:
1744 return AArch64::SUBXrr;
1745 case AArch64::SUBSXri:
1746 return MIDefinesZeroReg ? AArch64::SUBSXri : AArch64::SUBXri;
1747 case AArch64::SUBSXrs:
1748 return MIDefinesZeroReg ? AArch64::SUBSXrs : AArch64::SUBXrs;
1749 case AArch64::SUBSXrx:
1750 return AArch64::SUBXrx;
1765 if (To == To->getParent()->begin())
1770 if (To->getParent() != From->getParent())
1782 Instr.modifiesRegister(AArch64::NZCV,
TRI)) ||
1783 ((AccessToCheck &
AK_Read) && Instr.readsRegister(AArch64::NZCV,
TRI)))
1789std::optional<unsigned>
1793 unsigned MaskOpcode =
Mask->getOpcode();
1794 unsigned PredOpcode = Pred->
getOpcode();
1795 bool PredIsPTestLike = isPTestLikeOpcode(PredOpcode);
1796 bool PredIsWhileLike = isWhileOpcode(PredOpcode);
1798 if (PredIsWhileLike) {
1802 if ((Mask == Pred) && PTest->
getOpcode() == AArch64::PTEST_PP_ANY)
1809 getElementSizeForOpcode(MaskOpcode) ==
1810 getElementSizeForOpcode(PredOpcode))
1816 if (PTest->
getOpcode() == AArch64::PTEST_PP_FIRST &&
1823 if (PredIsPTestLike) {
1828 if ((Mask == Pred) && PTest->
getOpcode() == AArch64::PTEST_PP_ANY)
1836 if (Mask != PTestLikeMask && PTestLikeMask->isFullCopy() &&
1837 PTestLikeMask->getOperand(1).getReg().isVirtual())
1845 getElementSizeForOpcode(MaskOpcode) ==
1846 getElementSizeForOpcode(PredOpcode)) {
1847 if (Mask == PTestLikeMask || PTest->
getOpcode() == AArch64::PTEST_PP_ANY)
1873 uint64_t PredElementSize = getElementSizeForOpcode(PredOpcode);
1875 PTest->
getOpcode() == AArch64::PTEST_PP_ANY))
1883 switch (PredOpcode) {
1884 case AArch64::AND_PPzPP:
1885 case AArch64::BIC_PPzPP:
1886 case AArch64::EOR_PPzPP:
1887 case AArch64::NAND_PPzPP:
1888 case AArch64::NOR_PPzPP:
1889 case AArch64::ORN_PPzPP:
1890 case AArch64::ORR_PPzPP:
1891 case AArch64::BRKA_PPzP:
1892 case AArch64::BRKPA_PPzPP:
1893 case AArch64::BRKB_PPzP:
1894 case AArch64::BRKPB_PPzPP:
1895 case AArch64::RDFFR_PPz: {
1899 if (Mask != PredMask)
1903 case AArch64::BRKN_PPzP: {
1907 if ((MaskOpcode != AArch64::PTRUE_B) ||
1908 (
Mask->getOperand(1).getImm() != 31))
1912 case AArch64::PTRUE_B:
1925bool AArch64InstrInfo::optimizePTestInstr(
1926 MachineInstr *PTest,
unsigned MaskReg,
unsigned PredReg,
1931 if (Pred->
isCopy() && PTest->
getOpcode() == AArch64::PTEST_PP_FIRST) {
1935 if (
Op.isReg() &&
Op.getReg().isVirtual() &&
1936 Op.getSubReg() == AArch64::psub0)
1940 unsigned PredOpcode = Pred->
getOpcode();
1941 auto NewOp = canRemovePTestInstr(PTest, Mask, Pred, MRI);
1957 if (*NewOp != PredOpcode) {
1968 for (; i !=
e; ++i) {
1999 if (DeadNZCVIdx != -1) {
2018 if (CmpInstr.
getOpcode() == AArch64::PTEST_PP ||
2019 CmpInstr.
getOpcode() == AArch64::PTEST_PP_ANY ||
2020 CmpInstr.
getOpcode() == AArch64::PTEST_PP_FIRST)
2021 return optimizePTestInstr(&CmpInstr, SrcReg, SrcReg2, MRI);
2030 if (CmpValue == 0 && substituteCmpToZero(CmpInstr, SrcReg, *MRI))
2032 return (CmpValue == 0 || CmpValue == 1) &&
2033 removeCmpToZeroOrOne(CmpInstr, SrcReg, CmpValue, *MRI);
2041 switch (Instr.getOpcode()) {
2043 return AArch64::INSTRUCTION_LIST_END;
2045 case AArch64::ADDSWrr:
2046 case AArch64::ADDSWri:
2047 case AArch64::ADDSXrr:
2048 case AArch64::ADDSXri:
2049 case AArch64::ADDSWrx:
2050 case AArch64::ADDSXrx:
2051 case AArch64::SUBSWrr:
2052 case AArch64::SUBSWri:
2053 case AArch64::SUBSWrx:
2054 case AArch64::SUBSXrr:
2055 case AArch64::SUBSXri:
2056 case AArch64::SUBSXrx:
2057 case AArch64::ANDSWri:
2058 case AArch64::ANDSWrr:
2059 case AArch64::ANDSWrs:
2060 case AArch64::ANDSXri:
2061 case AArch64::ANDSXrr:
2062 case AArch64::ANDSXrs:
2063 case AArch64::BICSWrr:
2064 case AArch64::BICSXrr:
2065 case AArch64::BICSWrs:
2066 case AArch64::BICSXrs:
2067 return Instr.getOpcode();
2069 case AArch64::ADDWrr:
2070 return AArch64::ADDSWrr;
2071 case AArch64::ADDWri:
2072 return AArch64::ADDSWri;
2073 case AArch64::ADDXrr:
2074 return AArch64::ADDSXrr;
2075 case AArch64::ADDXri:
2076 return AArch64::ADDSXri;
2077 case AArch64::ADDWrx:
2078 return AArch64::ADDSWrx;
2079 case AArch64::ADDXrx:
2080 return AArch64::ADDSXrx;
2081 case AArch64::ADCWr:
2082 return AArch64::ADCSWr;
2083 case AArch64::ADCXr:
2084 return AArch64::ADCSXr;
2085 case AArch64::SUBWrr:
2086 return AArch64::SUBSWrr;
2087 case AArch64::SUBWri:
2088 return AArch64::SUBSWri;
2089 case AArch64::SUBXrr:
2090 return AArch64::SUBSXrr;
2091 case AArch64::SUBXri:
2092 return AArch64::SUBSXri;
2093 case AArch64::SUBWrx:
2094 return AArch64::SUBSWrx;
2095 case AArch64::SUBXrx:
2096 return AArch64::SUBSXrx;
2097 case AArch64::SBCWr:
2098 return AArch64::SBCSWr;
2099 case AArch64::SBCXr:
2100 return AArch64::SBCSXr;
2101 case AArch64::ANDWri:
2102 return AArch64::ANDSWri;
2103 case AArch64::ANDXri:
2104 return AArch64::ANDSXri;
2105 case AArch64::ANDWrr:
2106 return AArch64::ANDSWrr;
2107 case AArch64::ANDWrs:
2108 return AArch64::ANDSWrs;
2109 case AArch64::ANDXrr:
2110 return AArch64::ANDSXrr;
2111 case AArch64::ANDXrs:
2112 return AArch64::ANDSXrs;
2113 case AArch64::BICWrr:
2114 return AArch64::BICSWrr;
2115 case AArch64::BICXrr:
2116 return AArch64::BICSXrr;
2117 case AArch64::BICWrs:
2118 return AArch64::BICSWrs;
2119 case AArch64::BICXrs:
2120 return AArch64::BICSXrs;
2126 for (
auto *BB :
MBB->successors())
2127 if (BB->isLiveIn(AArch64::NZCV))
2134int AArch64InstrInfo::findCondCodeUseOperandIdxForBranchOrSelect(
2136 switch (
Instr.getOpcode()) {
2140 case AArch64::Bcc: {
2141 int Idx =
Instr.findRegisterUseOperandIdx(AArch64::NZCV,
nullptr);
2146 case AArch64::CSINVWr:
2147 case AArch64::CSINVXr:
2148 case AArch64::CSINCWr:
2149 case AArch64::CSINCXr:
2150 case AArch64::CSELWr:
2151 case AArch64::CSELXr:
2152 case AArch64::CSNEGWr:
2153 case AArch64::CSNEGXr:
2154 case AArch64::FCSELSrrr:
2155 case AArch64::FCSELDrrr: {
2156 int Idx =
Instr.findRegisterUseOperandIdx(AArch64::NZCV,
nullptr);
2168 AArch64InstrInfo::findCondCodeUseOperandIdxForBranchOrSelect(Instr);
2170 Instr.getOperand(CCIdx).
getImm())
2223std::optional<UsedNZCV>
2228 if (
MI.getParent() != CmpParent)
2229 return std::nullopt;
2232 return std::nullopt;
2237 if (Instr.readsRegister(AArch64::NZCV, &
TRI)) {
2240 return std::nullopt;
2245 if (Instr.modifiesRegister(AArch64::NZCV, &
TRI))
2248 return NZCVUsedAfterCmp;
2252 return Opcode == AArch64::ADDSWri || Opcode == AArch64::ADDSXri;
2256 return Opcode == AArch64::SUBSWri || Opcode == AArch64::SUBSXri;
2262 case AArch64::ANDSWri:
2263 case AArch64::ANDSWrr:
2264 case AArch64::ANDSWrs:
2265 case AArch64::ANDSXri:
2266 case AArch64::ANDSXrr:
2267 case AArch64::ANDSXrs:
2268 case AArch64::BICSWrr:
2269 case AArch64::BICSXrr:
2270 case AArch64::BICSWrs:
2271 case AArch64::BICSXrs:
2297 const unsigned CmpOpcode = CmpInstr.
getOpcode();
2303 "Caller guarantees that CmpInstr compares with constant 0");
2306 if (!NZVCUsed || NZVCUsed->C)
2329bool AArch64InstrInfo::substituteCmpToZero(
2340 if (NewOpc == AArch64::INSTRUCTION_LIST_END)
2347 MI->setDesc(
get(NewOpc));
2352 MI->addRegisterDefined(AArch64::NZCV, &
TRI);
2364 assert((CmpValue == 0 || CmpValue == 1) &&
2365 "Only comparisons to 0 or 1 considered for removal!");
2368 unsigned MIOpc =
MI.getOpcode();
2369 if (MIOpc == AArch64::CSINCWr) {
2370 if (
MI.getOperand(1).getReg() != AArch64::WZR ||
2371 MI.getOperand(2).getReg() != AArch64::WZR)
2373 }
else if (MIOpc == AArch64::CSINCXr) {
2374 if (
MI.getOperand(1).getReg() != AArch64::XZR ||
2375 MI.getOperand(2).getReg() != AArch64::XZR)
2385 if (
MI.findRegisterDefOperandIdx(AArch64::NZCV,
nullptr,
true) != -1)
2389 const unsigned CmpOpcode = CmpInstr.
getOpcode();
2391 if (CmpValue && !IsSubsRegImm)
2393 if (!CmpValue && !IsSubsRegImm && !
isADDSRegImm(CmpOpcode))
2398 if (MIUsedNZCV.
C || MIUsedNZCV.
V)
2401 std::optional<UsedNZCV> NZCVUsedAfterCmp =
2405 if (!NZCVUsedAfterCmp || NZCVUsedAfterCmp->C || NZCVUsedAfterCmp->V)
2408 if ((MIUsedNZCV.
Z && NZCVUsedAfterCmp->N) ||
2409 (MIUsedNZCV.
N && NZCVUsedAfterCmp->Z))
2412 if (MIUsedNZCV.
N && !CmpValue)
2454bool AArch64InstrInfo::removeCmpToZeroOrOne(
2461 SmallVector<MachineInstr *, 4> CCUseInstrs;
2462 bool IsInvertCC =
false;
2470 for (MachineInstr *CCUseInstr : CCUseInstrs) {
2471 int Idx = findCondCodeUseOperandIdxForBranchOrSelect(*CCUseInstr);
2472 assert(Idx >= 0 &&
"Unexpected instruction using CC.");
2473 MachineOperand &CCOperand = CCUseInstr->getOperand(Idx);
2482bool AArch64InstrInfo::expandPostRAPseudo(
MachineInstr &
MI)
const {
2483 if (
MI.getOpcode() != TargetOpcode::LOAD_STACK_GUARD &&
2484 MI.getOpcode() != AArch64::CATCHRET)
2487 MachineBasicBlock &
MBB = *
MI.getParent();
2489 auto TRI = Subtarget.getRegisterInfo();
2492 if (
MI.getOpcode() == AArch64::CATCHRET) {
2494 const TargetInstrInfo *
TII =
2496 MachineBasicBlock *TargetMBB =
MI.getOperand(0).getMBB();
2501 FirstEpilogSEH = std::prev(FirstEpilogSEH);
2503 FirstEpilogSEH = std::next(FirstEpilogSEH);
2518 if (
M.getStackProtectorGuard() ==
"sysreg") {
2519 const AArch64SysReg::SysReg *SrcReg =
2520 AArch64SysReg::lookupSysRegByName(
M.getStackProtectorGuardReg());
2528 int Offset =
M.getStackProtectorGuardOffset();
2579 const GlobalValue *GV =
2582 unsigned OpFlags = Subtarget.ClassifyGlobalReference(GV, TM);
2585 unsigned GuardWidth =
M.getStackProtectorGuardValueWidth().value_or(
2586 Subtarget.isTargetILP32() ? 4 : 8);
2587 if (GuardWidth != 4 && GuardWidth != 8)
2592 if (GuardWidth == 4) {
2593 unsigned Reg32 =
TRI->getSubReg(
Reg, AArch64::sub_32);
2607 if (GuardWidth == 4)
2641 if (GuardWidth == 4) {
2642 unsigned Reg32 =
TRI->getSubReg(
Reg, AArch64::sub_32);
2665 switch (
MI.getOpcode()) {
2668 case AArch64::MOVZWi:
2669 case AArch64::MOVZXi:
2670 if (
MI.getOperand(1).isImm() &&
MI.getOperand(1).getImm() == 0) {
2671 assert(
MI.getDesc().getNumOperands() == 3 &&
2672 MI.getOperand(2).getImm() == 0 &&
"invalid MOVZi operands");
2676 case AArch64::ANDWri:
2677 return MI.getOperand(1).getReg() == AArch64::WZR;
2678 case AArch64::ANDXri:
2679 return MI.getOperand(1).getReg() == AArch64::XZR;
2680 case TargetOpcode::COPY:
2681 return MI.getOperand(1).getReg() == AArch64::WZR;
2689 switch (
MI.getOpcode()) {
2692 case TargetOpcode::COPY: {
2695 return (AArch64::GPR32RegClass.
contains(DstReg) ||
2696 AArch64::GPR64RegClass.
contains(DstReg));
2698 case AArch64::ORRXrs:
2699 if (
MI.getOperand(1).getReg() == AArch64::XZR) {
2700 assert(
MI.getDesc().getNumOperands() == 4 &&
2701 MI.getOperand(3).getImm() == 0 &&
"invalid ORRrs operands");
2705 case AArch64::ADDXri:
2706 if (
MI.getOperand(2).getImm() == 0) {
2707 assert(
MI.getDesc().getNumOperands() == 4 &&
2708 MI.getOperand(3).getImm() == 0 &&
"invalid ADDXri operands");
2719 switch (
MI.getOpcode()) {
2722 case TargetOpcode::COPY: {
2724 return AArch64::FPR128RegClass.contains(DstReg);
2726 case AArch64::ORRv16i8:
2727 if (
MI.getOperand(1).getReg() ==
MI.getOperand(2).getReg()) {
2728 assert(
MI.getDesc().getNumOperands() == 3 &&
MI.getOperand(0).isReg() &&
2729 "invalid ORRv16i8 operands");
2741 case AArch64::LDRWui:
2742 case AArch64::LDRXui:
2743 case AArch64::LDRBui:
2744 case AArch64::LDRHui:
2745 case AArch64::LDRSui:
2746 case AArch64::LDRDui:
2747 case AArch64::LDRQui:
2748 case AArch64::LDR_PXI:
2754 int &FrameIndex)
const {
2758 if (
MI.getOperand(0).getSubReg() == 0 &&
MI.getOperand(1).isFI() &&
2759 MI.getOperand(2).isImm() &&
MI.getOperand(2).getImm() == 0) {
2760 FrameIndex =
MI.getOperand(1).getIndex();
2761 return MI.getOperand(0).getReg();
2770 case AArch64::STRWui:
2771 case AArch64::STRXui:
2772 case AArch64::STRBui:
2773 case AArch64::STRHui:
2774 case AArch64::STRSui:
2775 case AArch64::STRDui:
2776 case AArch64::STRQui:
2777 case AArch64::STR_PXI:
2783 int &FrameIndex)
const {
2787 if (
MI.getOperand(0).getSubReg() == 0 &&
MI.getOperand(1).isFI() &&
2788 MI.getOperand(2).isImm() &&
MI.getOperand(2).getImm() == 0) {
2789 FrameIndex =
MI.getOperand(1).getIndex();
2790 return MI.getOperand(0).getReg();
2796 int &FrameIndex)
const {
2811 return MI.getOperand(0).getReg();
2817 int &FrameIndex)
const {
2832 return MI.getOperand(0).getReg();
2840 return MMO->getFlags() & MOSuppressPair;
2846 if (
MI.memoperands_empty())
2854 return MMO->getFlags() & MOStridedAccess;
2862 case AArch64::STURSi:
2863 case AArch64::STRSpre:
2864 case AArch64::STURDi:
2865 case AArch64::STRDpre:
2866 case AArch64::STURQi:
2867 case AArch64::STRQpre:
2868 case AArch64::STURBBi:
2869 case AArch64::STURHHi:
2870 case AArch64::STURWi:
2871 case AArch64::STRWpre:
2872 case AArch64::STURXi:
2873 case AArch64::STRXpre:
2874 case AArch64::LDURSi:
2875 case AArch64::LDRSpre:
2876 case AArch64::LDURDi:
2877 case AArch64::LDRDpre:
2878 case AArch64::LDURQi:
2879 case AArch64::LDRQpre:
2880 case AArch64::LDURWi:
2881 case AArch64::LDRWpre:
2882 case AArch64::LDURXi:
2883 case AArch64::LDRXpre:
2884 case AArch64::LDRSWpre:
2885 case AArch64::LDURSWi:
2886 case AArch64::LDURHHi:
2887 case AArch64::LDURBBi:
2888 case AArch64::LDURSBWi:
2889 case AArch64::LDURSHWi:
2897 case AArch64::PRFMui:
return AArch64::PRFUMi;
2898 case AArch64::LDRXui:
return AArch64::LDURXi;
2899 case AArch64::LDRWui:
return AArch64::LDURWi;
2900 case AArch64::LDRBui:
return AArch64::LDURBi;
2901 case AArch64::LDRHui:
return AArch64::LDURHi;
2902 case AArch64::LDRSui:
return AArch64::LDURSi;
2903 case AArch64::LDRDui:
return AArch64::LDURDi;
2904 case AArch64::LDRQui:
return AArch64::LDURQi;
2905 case AArch64::LDRBBui:
return AArch64::LDURBBi;
2906 case AArch64::LDRHHui:
return AArch64::LDURHHi;
2907 case AArch64::LDRSBXui:
return AArch64::LDURSBXi;
2908 case AArch64::LDRSBWui:
return AArch64::LDURSBWi;
2909 case AArch64::LDRSHXui:
return AArch64::LDURSHXi;
2910 case AArch64::LDRSHWui:
return AArch64::LDURSHWi;
2911 case AArch64::LDRSWui:
return AArch64::LDURSWi;
2912 case AArch64::STRXui:
return AArch64::STURXi;
2913 case AArch64::STRWui:
return AArch64::STURWi;
2914 case AArch64::STRBui:
return AArch64::STURBi;
2915 case AArch64::STRHui:
return AArch64::STURHi;
2916 case AArch64::STRSui:
return AArch64::STURSi;
2917 case AArch64::STRDui:
return AArch64::STURDi;
2918 case AArch64::STRQui:
return AArch64::STURQi;
2919 case AArch64::STRBBui:
return AArch64::STURBBi;
2920 case AArch64::STRHHui:
return AArch64::STURHHi;
2929 case AArch64::LDAPURBi:
2930 case AArch64::LDAPURHi:
2931 case AArch64::LDAPURi:
2932 case AArch64::LDAPURSBWi:
2933 case AArch64::LDAPURSBXi:
2934 case AArch64::LDAPURSHWi:
2935 case AArch64::LDAPURSHXi:
2936 case AArch64::LDAPURSWi:
2937 case AArch64::LDAPURXi:
2938 case AArch64::LDR_PPXI:
2939 case AArch64::LDR_PXI:
2940 case AArch64::LDR_ZXI:
2941 case AArch64::LDR_ZZXI:
2942 case AArch64::LDR_ZZXI_STRIDED_CONTIGUOUS:
2943 case AArch64::LDR_ZZZXI:
2944 case AArch64::LDR_ZZZZXI:
2945 case AArch64::LDR_ZZZZXI_STRIDED_CONTIGUOUS:
2946 case AArch64::LDRBBui:
2947 case AArch64::LDRBui:
2948 case AArch64::LDRDui:
2949 case AArch64::LDRHHui:
2950 case AArch64::LDRHui:
2951 case AArch64::LDRQui:
2952 case AArch64::LDRSBWui:
2953 case AArch64::LDRSBXui:
2954 case AArch64::LDRSHWui:
2955 case AArch64::LDRSHXui:
2956 case AArch64::LDRSui:
2957 case AArch64::LDRSWui:
2958 case AArch64::LDRWui:
2959 case AArch64::LDRXui:
2960 case AArch64::LDURBBi:
2961 case AArch64::LDURBi:
2962 case AArch64::LDURDi:
2963 case AArch64::LDURHHi:
2964 case AArch64::LDURHi:
2965 case AArch64::LDURQi:
2966 case AArch64::LDURSBWi:
2967 case AArch64::LDURSBXi:
2968 case AArch64::LDURSHWi:
2969 case AArch64::LDURSHXi:
2970 case AArch64::LDURSi:
2971 case AArch64::LDURSWi:
2972 case AArch64::LDURWi:
2973 case AArch64::LDURXi:
2974 case AArch64::PRFMui:
2975 case AArch64::PRFUMi:
2976 case AArch64::ST2Gi:
2978 case AArch64::STLURBi:
2979 case AArch64::STLURHi:
2980 case AArch64::STLURWi:
2981 case AArch64::STLURXi:
2982 case AArch64::StoreSwiftAsyncContext:
2983 case AArch64::STR_PPXI:
2984 case AArch64::STR_PXI:
2985 case AArch64::STR_ZXI:
2986 case AArch64::STR_ZZXI:
2987 case AArch64::STR_ZZXI_STRIDED_CONTIGUOUS:
2988 case AArch64::STR_ZZZXI:
2989 case AArch64::STR_ZZZZXI:
2990 case AArch64::STR_ZZZZXI_STRIDED_CONTIGUOUS:
2991 case AArch64::STRBBui:
2992 case AArch64::STRBui:
2993 case AArch64::STRDui:
2994 case AArch64::STRHHui:
2995 case AArch64::STRHui:
2996 case AArch64::STRQui:
2997 case AArch64::STRSui:
2998 case AArch64::STRWui:
2999 case AArch64::STRXui:
3000 case AArch64::STURBBi:
3001 case AArch64::STURBi:
3002 case AArch64::STURDi:
3003 case AArch64::STURHHi:
3004 case AArch64::STURHi:
3005 case AArch64::STURQi:
3006 case AArch64::STURSi:
3007 case AArch64::STURWi:
3008 case AArch64::STURXi:
3009 case AArch64::STZ2Gi:
3010 case AArch64::STZGi:
3011 case AArch64::TAGPstack:
3013 case AArch64::LD1B_D_IMM:
3014 case AArch64::LD1B_H_IMM:
3015 case AArch64::LD1B_IMM:
3016 case AArch64::LD1B_S_IMM:
3017 case AArch64::LD1D_IMM:
3018 case AArch64::LD1H_D_IMM:
3019 case AArch64::LD1H_IMM:
3020 case AArch64::LD1H_S_IMM:
3021 case AArch64::LD1RB_D_IMM:
3022 case AArch64::LD1RB_H_IMM:
3023 case AArch64::LD1RB_IMM:
3024 case AArch64::LD1RB_S_IMM:
3025 case AArch64::LD1RD_IMM:
3026 case AArch64::LD1RH_D_IMM:
3027 case AArch64::LD1RH_IMM:
3028 case AArch64::LD1RH_S_IMM:
3029 case AArch64::LD1RSB_D_IMM:
3030 case AArch64::LD1RSB_H_IMM:
3031 case AArch64::LD1RSB_S_IMM:
3032 case AArch64::LD1RSH_D_IMM:
3033 case AArch64::LD1RSH_S_IMM:
3034 case AArch64::LD1RSW_IMM:
3035 case AArch64::LD1RW_D_IMM:
3036 case AArch64::LD1RW_IMM:
3037 case AArch64::LD1SB_D_IMM:
3038 case AArch64::LD1SB_H_IMM:
3039 case AArch64::LD1SB_S_IMM:
3040 case AArch64::LD1SH_D_IMM:
3041 case AArch64::LD1SH_S_IMM:
3042 case AArch64::LD1SW_D_IMM:
3043 case AArch64::LD1W_D_IMM:
3044 case AArch64::LD1W_IMM:
3045 case AArch64::LD2B_IMM:
3046 case AArch64::LD2D_IMM:
3047 case AArch64::LD2H_IMM:
3048 case AArch64::LD2W_IMM:
3049 case AArch64::LD3B_IMM:
3050 case AArch64::LD3D_IMM:
3051 case AArch64::LD3H_IMM:
3052 case AArch64::LD3W_IMM:
3053 case AArch64::LD4B_IMM:
3054 case AArch64::LD4D_IMM:
3055 case AArch64::LD4H_IMM:
3056 case AArch64::LD4W_IMM:
3058 case AArch64::LDNF1B_D_IMM:
3059 case AArch64::LDNF1B_H_IMM:
3060 case AArch64::LDNF1B_IMM:
3061 case AArch64::LDNF1B_S_IMM:
3062 case AArch64::LDNF1D_IMM:
3063 case AArch64::LDNF1H_D_IMM:
3064 case AArch64::LDNF1H_IMM:
3065 case AArch64::LDNF1H_S_IMM:
3066 case AArch64::LDNF1SB_D_IMM:
3067 case AArch64::LDNF1SB_H_IMM:
3068 case AArch64::LDNF1SB_S_IMM:
3069 case AArch64::LDNF1SH_D_IMM:
3070 case AArch64::LDNF1SH_S_IMM:
3071 case AArch64::LDNF1SW_D_IMM:
3072 case AArch64::LDNF1W_D_IMM:
3073 case AArch64::LDNF1W_IMM:
3074 case AArch64::LDNPDi:
3075 case AArch64::LDNPQi:
3076 case AArch64::LDNPSi:
3077 case AArch64::LDNPWi:
3078 case AArch64::LDNPXi:
3079 case AArch64::LDNT1B_ZRI:
3080 case AArch64::LDNT1D_ZRI:
3081 case AArch64::LDNT1H_ZRI:
3082 case AArch64::LDNT1W_ZRI:
3083 case AArch64::LDPDi:
3084 case AArch64::LDPQi:
3085 case AArch64::LDPSi:
3086 case AArch64::LDPWi:
3087 case AArch64::LDPXi:
3088 case AArch64::LDRBBpost:
3089 case AArch64::LDRBBpre:
3090 case AArch64::LDRBpost:
3091 case AArch64::LDRBpre:
3092 case AArch64::LDRDpost:
3093 case AArch64::LDRDpre:
3094 case AArch64::LDRHHpost:
3095 case AArch64::LDRHHpre:
3096 case AArch64::LDRHpost:
3097 case AArch64::LDRHpre:
3098 case AArch64::LDRQpost:
3099 case AArch64::LDRQpre:
3100 case AArch64::LDRSpost:
3101 case AArch64::LDRSpre:
3102 case AArch64::LDRWpost:
3103 case AArch64::LDRWpre:
3104 case AArch64::LDRXpost:
3105 case AArch64::LDRXpre:
3106 case AArch64::ST1B_D_IMM:
3107 case AArch64::ST1B_H_IMM:
3108 case AArch64::ST1B_IMM:
3109 case AArch64::ST1B_S_IMM:
3110 case AArch64::ST1D_IMM:
3111 case AArch64::ST1H_D_IMM:
3112 case AArch64::ST1H_IMM:
3113 case AArch64::ST1H_S_IMM:
3114 case AArch64::ST1W_D_IMM:
3115 case AArch64::ST1W_IMM:
3116 case AArch64::ST2B_IMM:
3117 case AArch64::ST2D_IMM:
3118 case AArch64::ST2H_IMM:
3119 case AArch64::ST2W_IMM:
3120 case AArch64::ST3B_IMM:
3121 case AArch64::ST3D_IMM:
3122 case AArch64::ST3H_IMM:
3123 case AArch64::ST3W_IMM:
3124 case AArch64::ST4B_IMM:
3125 case AArch64::ST4D_IMM:
3126 case AArch64::ST4H_IMM:
3127 case AArch64::ST4W_IMM:
3128 case AArch64::STGPi:
3129 case AArch64::STGPreIndex:
3130 case AArch64::STZGPreIndex:
3131 case AArch64::ST2GPreIndex:
3132 case AArch64::STZ2GPreIndex:
3133 case AArch64::STGPostIndex:
3134 case AArch64::STZGPostIndex:
3135 case AArch64::ST2GPostIndex:
3136 case AArch64::STZ2GPostIndex:
3137 case AArch64::STNPDi:
3138 case AArch64::STNPQi:
3139 case AArch64::STNPSi:
3140 case AArch64::STNPWi:
3141 case AArch64::STNPXi:
3142 case AArch64::STNT1B_ZRI:
3143 case AArch64::STNT1D_ZRI:
3144 case AArch64::STNT1H_ZRI:
3145 case AArch64::STNT1W_ZRI:
3146 case AArch64::STPDi:
3147 case AArch64::STPQi:
3148 case AArch64::STPSi:
3149 case AArch64::STPWi:
3150 case AArch64::STPXi:
3151 case AArch64::STRBBpost:
3152 case AArch64::STRBBpre:
3153 case AArch64::STRBpost:
3154 case AArch64::STRBpre:
3155 case AArch64::STRDpost:
3156 case AArch64::STRDpre:
3157 case AArch64::STRHHpost:
3158 case AArch64::STRHHpre:
3159 case AArch64::STRHpost:
3160 case AArch64::STRHpre:
3161 case AArch64::STRQpost:
3162 case AArch64::STRQpre:
3163 case AArch64::STRSpost:
3164 case AArch64::STRSpre:
3165 case AArch64::STRWpost:
3166 case AArch64::STRWpre:
3167 case AArch64::STRXpost:
3168 case AArch64::STRXpre:
3169 case AArch64::LD1B_2Z_IMM:
3170 case AArch64::LD1B_2Z_STRIDED_IMM:
3171 case AArch64::LD1H_2Z_IMM:
3172 case AArch64::LD1H_2Z_STRIDED_IMM:
3173 case AArch64::LD1W_2Z_IMM:
3174 case AArch64::LD1W_2Z_STRIDED_IMM:
3175 case AArch64::LD1D_2Z_IMM:
3176 case AArch64::LD1D_2Z_STRIDED_IMM:
3177 case AArch64::LD1B_4Z_IMM:
3178 case AArch64::LD1B_4Z_STRIDED_IMM:
3179 case AArch64::LD1H_4Z_IMM:
3180 case AArch64::LD1H_4Z_STRIDED_IMM:
3181 case AArch64::LD1W_4Z_IMM:
3182 case AArch64::LD1W_4Z_STRIDED_IMM:
3183 case AArch64::LD1D_4Z_IMM:
3184 case AArch64::LD1D_4Z_STRIDED_IMM:
3185 case AArch64::LD1B_2Z_IMM_PSEUDO:
3186 case AArch64::LD1H_2Z_IMM_PSEUDO:
3187 case AArch64::LD1W_2Z_IMM_PSEUDO:
3188 case AArch64::LD1D_2Z_IMM_PSEUDO:
3189 case AArch64::LD1B_4Z_IMM_PSEUDO:
3190 case AArch64::LD1H_4Z_IMM_PSEUDO:
3191 case AArch64::LD1W_4Z_IMM_PSEUDO:
3192 case AArch64::LD1D_4Z_IMM_PSEUDO:
3193 case AArch64::ST1B_2Z_IMM:
3194 case AArch64::ST1B_2Z_STRIDED_IMM:
3195 case AArch64::ST1H_2Z_IMM:
3196 case AArch64::ST1H_2Z_STRIDED_IMM:
3197 case AArch64::ST1W_2Z_IMM:
3198 case AArch64::ST1W_2Z_STRIDED_IMM:
3199 case AArch64::ST1D_2Z_IMM:
3200 case AArch64::ST1D_2Z_STRIDED_IMM:
3201 case AArch64::LDNT1B_2Z_IMM_PSEUDO:
3202 case AArch64::LDNT1B_2Z_IMM:
3203 case AArch64::LDNT1B_2Z_STRIDED_IMM:
3204 case AArch64::LDNT1H_2Z_IMM_PSEUDO:
3205 case AArch64::LDNT1H_2Z_IMM:
3206 case AArch64::LDNT1H_2Z_STRIDED_IMM:
3207 case AArch64::LDNT1W_2Z_IMM_PSEUDO:
3208 case AArch64::LDNT1W_2Z_IMM:
3209 case AArch64::LDNT1W_2Z_STRIDED_IMM:
3210 case AArch64::LDNT1D_2Z_IMM_PSEUDO:
3211 case AArch64::LDNT1D_2Z_IMM:
3212 case AArch64::LDNT1D_2Z_STRIDED_IMM:
3213 case AArch64::STNT1B_2Z_IMM:
3214 case AArch64::STNT1B_2Z_STRIDED_IMM:
3215 case AArch64::STNT1H_2Z_IMM:
3216 case AArch64::STNT1H_2Z_STRIDED_IMM:
3217 case AArch64::STNT1W_2Z_IMM:
3218 case AArch64::STNT1W_2Z_STRIDED_IMM:
3219 case AArch64::STNT1D_2Z_IMM:
3220 case AArch64::STNT1D_2Z_STRIDED_IMM:
3221 case AArch64::ST1B_4Z_IMM:
3222 case AArch64::ST1B_4Z_STRIDED_IMM:
3223 case AArch64::ST1H_4Z_IMM:
3224 case AArch64::ST1H_4Z_STRIDED_IMM:
3225 case AArch64::ST1W_4Z_IMM:
3226 case AArch64::ST1W_4Z_STRIDED_IMM:
3227 case AArch64::ST1D_4Z_IMM:
3228 case AArch64::ST1D_4Z_STRIDED_IMM:
3229 case AArch64::LDNT1B_4Z_IMM_PSEUDO:
3230 case AArch64::LDNT1B_4Z_IMM:
3231 case AArch64::LDNT1B_4Z_STRIDED_IMM:
3232 case AArch64::LDNT1H_4Z_IMM_PSEUDO:
3233 case AArch64::LDNT1H_4Z_IMM:
3234 case AArch64::LDNT1H_4Z_STRIDED_IMM:
3235 case AArch64::LDNT1W_4Z_IMM_PSEUDO:
3236 case AArch64::LDNT1W_4Z_IMM:
3237 case AArch64::LDNT1W_4Z_STRIDED_IMM:
3238 case AArch64::LDNT1D_4Z_IMM_PSEUDO:
3239 case AArch64::LDNT1D_4Z_IMM:
3240 case AArch64::LDNT1D_4Z_STRIDED_IMM:
3241 case AArch64::STNT1B_4Z_IMM:
3242 case AArch64::STNT1B_4Z_STRIDED_IMM:
3243 case AArch64::STNT1H_4Z_IMM:
3244 case AArch64::STNT1H_4Z_STRIDED_IMM:
3245 case AArch64::STNT1W_4Z_IMM:
3246 case AArch64::STNT1W_4Z_STRIDED_IMM:
3247 case AArch64::STNT1D_4Z_IMM:
3248 case AArch64::STNT1D_4Z_STRIDED_IMM:
3250 case AArch64::LDPDpost:
3251 case AArch64::LDPDpre:
3252 case AArch64::LDPQpost:
3253 case AArch64::LDPQpre:
3254 case AArch64::LDPSpost:
3255 case AArch64::LDPSpre:
3256 case AArch64::LDPWpost:
3257 case AArch64::LDPWpre:
3258 case AArch64::LDPXpost:
3259 case AArch64::LDPXpre:
3260 case AArch64::STGPpre:
3261 case AArch64::STGPpost:
3262 case AArch64::STPDpost:
3263 case AArch64::STPDpre:
3264 case AArch64::STPQpost:
3265 case AArch64::STPQpre:
3266 case AArch64::STPSpost:
3267 case AArch64::STPSpre:
3268 case AArch64::STPWpost:
3269 case AArch64::STPWpre:
3270 case AArch64::STPXpost:
3271 case AArch64::STPXpre:
3277 switch (
MI.getOpcode()) {
3281 case AArch64::STRSui:
3282 case AArch64::STRDui:
3283 case AArch64::STRQui:
3284 case AArch64::STRXui:
3285 case AArch64::STRWui:
3286 case AArch64::LDRSui:
3287 case AArch64::LDRDui:
3288 case AArch64::LDRQui:
3289 case AArch64::LDRXui:
3290 case AArch64::LDRWui:
3291 case AArch64::LDRSWui:
3293 case AArch64::STURSi:
3294 case AArch64::STRSpre:
3295 case AArch64::STURDi:
3296 case AArch64::STRDpre:
3297 case AArch64::STURQi:
3298 case AArch64::STRQpre:
3299 case AArch64::STURWi:
3300 case AArch64::STRWpre:
3301 case AArch64::STURXi:
3302 case AArch64::STRXpre:
3303 case AArch64::LDURSi:
3304 case AArch64::LDRSpre:
3305 case AArch64::LDURDi:
3306 case AArch64::LDRDpre:
3307 case AArch64::LDURQi:
3308 case AArch64::LDRQpre:
3309 case AArch64::LDURWi:
3310 case AArch64::LDRWpre:
3311 case AArch64::LDURXi:
3312 case AArch64::LDRXpre:
3313 case AArch64::LDURSWi:
3314 case AArch64::LDRSWpre:
3316 case AArch64::LDR_ZXI:
3317 case AArch64::STR_ZXI:
3323 switch (
MI.getOpcode()) {
3326 "Unexpected instruction - was a new tail call opcode introduced?");
3328 case AArch64::TCRETURNdi:
3329 case AArch64::TCRETURNri:
3330 case AArch64::TCRETURNrix16x17:
3331 case AArch64::TCRETURNrix17:
3332 case AArch64::TCRETURNrinotx16:
3333 case AArch64::TCRETURNriALL:
3334 case AArch64::AUTH_TCRETURN:
3335 case AArch64::AUTH_TCRETURN_BTI:
3345 case AArch64::ADDWri:
3346 return AArch64::ADDSWri;
3347 case AArch64::ADDWrr:
3348 return AArch64::ADDSWrr;
3349 case AArch64::ADDWrs:
3350 return AArch64::ADDSWrs;
3351 case AArch64::ADDWrx:
3352 return AArch64::ADDSWrx;
3353 case AArch64::ANDWri:
3354 return AArch64::ANDSWri;
3355 case AArch64::ANDWrr:
3356 return AArch64::ANDSWrr;
3357 case AArch64::ANDWrs:
3358 return AArch64::ANDSWrs;
3359 case AArch64::BICWrr:
3360 return AArch64::BICSWrr;
3361 case AArch64::BICWrs:
3362 return AArch64::BICSWrs;
3363 case AArch64::SUBWri:
3364 return AArch64::SUBSWri;
3365 case AArch64::SUBWrr:
3366 return AArch64::SUBSWrr;
3367 case AArch64::SUBWrs:
3368 return AArch64::SUBSWrs;
3369 case AArch64::SUBWrx:
3370 return AArch64::SUBSWrx;
3372 case AArch64::ADDXri:
3373 return AArch64::ADDSXri;
3374 case AArch64::ADDXrr:
3375 return AArch64::ADDSXrr;
3376 case AArch64::ADDXrs:
3377 return AArch64::ADDSXrs;
3378 case AArch64::ADDXrx:
3379 return AArch64::ADDSXrx;
3380 case AArch64::ANDXri:
3381 return AArch64::ANDSXri;
3382 case AArch64::ANDXrr:
3383 return AArch64::ANDSXrr;
3384 case AArch64::ANDXrs:
3385 return AArch64::ANDSXrs;
3386 case AArch64::BICXrr:
3387 return AArch64::BICSXrr;
3388 case AArch64::BICXrs:
3389 return AArch64::BICSXrs;
3390 case AArch64::SUBXri:
3391 return AArch64::SUBSXri;
3392 case AArch64::SUBXrr:
3393 return AArch64::SUBSXrr;
3394 case AArch64::SUBXrs:
3395 return AArch64::SUBSXrs;
3396 case AArch64::SUBXrx:
3397 return AArch64::SUBSXrx;
3399 case AArch64::AND_PPzPP:
3400 return AArch64::ANDS_PPzPP;
3401 case AArch64::BIC_PPzPP:
3402 return AArch64::BICS_PPzPP;
3403 case AArch64::EOR_PPzPP:
3404 return AArch64::EORS_PPzPP;
3405 case AArch64::NAND_PPzPP:
3406 return AArch64::NANDS_PPzPP;
3407 case AArch64::NOR_PPzPP:
3408 return AArch64::NORS_PPzPP;
3409 case AArch64::ORN_PPzPP:
3410 return AArch64::ORNS_PPzPP;
3411 case AArch64::ORR_PPzPP:
3412 return AArch64::ORRS_PPzPP;
3413 case AArch64::BRKA_PPzP:
3414 return AArch64::BRKAS_PPzP;
3415 case AArch64::BRKPA_PPzPP:
3416 return AArch64::BRKPAS_PPzPP;
3417 case AArch64::BRKB_PPzP:
3418 return AArch64::BRKBS_PPzP;
3419 case AArch64::BRKPB_PPzPP:
3420 return AArch64::BRKPBS_PPzPP;
3421 case AArch64::BRKN_PPzP:
3422 return AArch64::BRKNS_PPzP;
3423 case AArch64::RDFFR_PPz:
3424 return AArch64::RDFFRS_PPz;
3425 case AArch64::PTRUE_B:
3426 return AArch64::PTRUES_B;
3437 if (
MI.hasOrderedMemoryRef())
3442 assert((
MI.getOperand(IsPreLdSt ? 2 : 1).isReg() ||
3443 MI.getOperand(IsPreLdSt ? 2 : 1).isFI()) &&
3444 "Expected a reg or frame index operand.");
3448 bool IsImmPreLdSt = IsPreLdSt &&
MI.getOperand(3).isImm();
3450 if (!
MI.getOperand(2).isImm() && !IsImmPreLdSt)
3463 if (
MI.getOperand(1).isReg() && !IsPreLdSt) {
3464 Register BaseReg =
MI.getOperand(1).getReg();
3466 if (
MI.modifiesRegister(BaseReg,
TRI))
3472 switch (
MI.getOpcode()) {
3475 case AArch64::LDR_ZXI:
3476 case AArch64::STR_ZXI:
3477 if (!Subtarget.isLittleEndian() ||
3478 Subtarget.getSVEVectorSizeInBits() != 128)
3491 const MCAsmInfo &MAI =
MI.getMF()->getTarget().getMCAsmInfo();
3499 if (Subtarget.isPaired128Slow()) {
3500 switch (
MI.getOpcode()) {
3503 case AArch64::LDURQi:
3504 case AArch64::STURQi:
3505 case AArch64::LDRQui:
3506 case AArch64::STRQui:
3533std::optional<ExtAddrMode>
3538 bool OffsetIsScalable;
3539 if (!getMemOperandWithOffset(MemI,
Base,
Offset, OffsetIsScalable,
TRI))
3540 return std::nullopt;
3543 return std::nullopt;
3558 int64_t OffsetScale = 1;
3563 case AArch64::LDURQi:
3564 case AArch64::STURQi:
3568 case AArch64::LDURDi:
3569 case AArch64::STURDi:
3570 case AArch64::LDURXi:
3571 case AArch64::STURXi:
3575 case AArch64::LDURWi:
3576 case AArch64::LDURSWi:
3577 case AArch64::STURWi:
3581 case AArch64::LDURHi:
3582 case AArch64::STURHi:
3583 case AArch64::LDURHHi:
3584 case AArch64::STURHHi:
3585 case AArch64::LDURSHXi:
3586 case AArch64::LDURSHWi:
3590 case AArch64::LDRBroX:
3591 case AArch64::LDRBBroX:
3592 case AArch64::LDRSBXroX:
3593 case AArch64::LDRSBWroX:
3594 case AArch64::STRBroX:
3595 case AArch64::STRBBroX:
3596 case AArch64::LDURBi:
3597 case AArch64::LDURBBi:
3598 case AArch64::LDURSBXi:
3599 case AArch64::LDURSBWi:
3600 case AArch64::STURBi:
3601 case AArch64::STURBBi:
3602 case AArch64::LDRBui:
3603 case AArch64::LDRBBui:
3604 case AArch64::LDRSBXui:
3605 case AArch64::LDRSBWui:
3606 case AArch64::STRBui:
3607 case AArch64::STRBBui:
3611 case AArch64::LDRQroX:
3612 case AArch64::STRQroX:
3613 case AArch64::LDRQui:
3614 case AArch64::STRQui:
3619 case AArch64::LDRDroX:
3620 case AArch64::STRDroX:
3621 case AArch64::LDRXroX:
3622 case AArch64::STRXroX:
3623 case AArch64::LDRDui:
3624 case AArch64::STRDui:
3625 case AArch64::LDRXui:
3626 case AArch64::STRXui:
3631 case AArch64::LDRWroX:
3632 case AArch64::LDRSWroX:
3633 case AArch64::STRWroX:
3634 case AArch64::LDRWui:
3635 case AArch64::LDRSWui:
3636 case AArch64::STRWui:
3641 case AArch64::LDRHroX:
3642 case AArch64::STRHroX:
3643 case AArch64::LDRHHroX:
3644 case AArch64::STRHHroX:
3645 case AArch64::LDRSHXroX:
3646 case AArch64::LDRSHWroX:
3647 case AArch64::LDRHui:
3648 case AArch64::STRHui:
3649 case AArch64::LDRHHui:
3650 case AArch64::STRHHui:
3651 case AArch64::LDRSHXui:
3652 case AArch64::LDRSHWui:
3660 if (BaseRegOp.
isReg() && BaseRegOp.
getReg() == Reg)
3684 case AArch64::SBFMXri:
3697 AM.
Scale = OffsetScale;
3702 case TargetOpcode::SUBREG_TO_REG: {
3718 if (
DefMI.getOpcode() != AArch64::ORRWrs ||
3719 DefMI.getOperand(1).getReg() != AArch64::WZR ||
3720 DefMI.getOperand(3).getImm() != 0)
3727 AM.
Scale = OffsetScale;
3738 auto validateOffsetForLDP = [](
unsigned NumBytes, int64_t OldOffset,
3739 int64_t NewOffset) ->
bool {
3740 int64_t MinOffset, MaxOffset;
3757 return OldOffset < MinOffset || OldOffset > MaxOffset ||
3758 (NewOffset >= MinOffset && NewOffset <= MaxOffset);
3760 auto canFoldAddSubImmIntoAddrMode = [&](int64_t Disp) ->
bool {
3762 int64_t NewOffset = OldOffset + Disp;
3763 if (!isLegalAddressingMode(NumBytes, NewOffset, 0))
3767 if (!validateOffsetForLDP(NumBytes, OldOffset, NewOffset))
3777 auto canFoldAddRegIntoAddrMode =
3782 if ((
unsigned)Scale != Scale)
3784 if (!isLegalAddressingMode(NumBytes, 0, Scale))
3796 return (Opcode == AArch64::STURQi || Opcode == AArch64::STRQui) &&
3797 Subtarget.isSTRQroSlow();
3806 case AArch64::ADDXri:
3812 return canFoldAddSubImmIntoAddrMode(Disp);
3814 case AArch64::SUBXri:
3820 return canFoldAddSubImmIntoAddrMode(-Disp);
3822 case AArch64::ADDXrs: {
3835 if (Shift != 2 && Shift != 3 && Subtarget.hasAddrLSLSlow14())
3837 if (avoidSlowSTRQ(MemI))
3840 return canFoldAddRegIntoAddrMode(1ULL << Shift);
3843 case AArch64::ADDXrr:
3851 if (!OptSize && avoidSlowSTRQ(MemI))
3853 return canFoldAddRegIntoAddrMode(1);
3855 case AArch64::ADDXrx:
3863 if (!OptSize && avoidSlowSTRQ(MemI))
3872 return canFoldAddRegIntoAddrMode(
3887 case AArch64::LDURQi:
3888 case AArch64::LDRQui:
3889 return AArch64::LDRQroX;
3890 case AArch64::STURQi:
3891 case AArch64::STRQui:
3892 return AArch64::STRQroX;
3893 case AArch64::LDURDi:
3894 case AArch64::LDRDui:
3895 return AArch64::LDRDroX;
3896 case AArch64::STURDi:
3897 case AArch64::STRDui:
3898 return AArch64::STRDroX;
3899 case AArch64::LDURXi:
3900 case AArch64::LDRXui:
3901 return AArch64::LDRXroX;
3902 case AArch64::STURXi:
3903 case AArch64::STRXui:
3904 return AArch64::STRXroX;
3905 case AArch64::LDURWi:
3906 case AArch64::LDRWui:
3907 return AArch64::LDRWroX;
3908 case AArch64::LDURSWi:
3909 case AArch64::LDRSWui:
3910 return AArch64::LDRSWroX;
3911 case AArch64::STURWi:
3912 case AArch64::STRWui:
3913 return AArch64::STRWroX;
3914 case AArch64::LDURHi:
3915 case AArch64::LDRHui:
3916 return AArch64::LDRHroX;
3917 case AArch64::STURHi:
3918 case AArch64::STRHui:
3919 return AArch64::STRHroX;
3920 case AArch64::LDURHHi:
3921 case AArch64::LDRHHui:
3922 return AArch64::LDRHHroX;
3923 case AArch64::STURHHi:
3924 case AArch64::STRHHui:
3925 return AArch64::STRHHroX;
3926 case AArch64::LDURSHXi:
3927 case AArch64::LDRSHXui:
3928 return AArch64::LDRSHXroX;
3929 case AArch64::LDURSHWi:
3930 case AArch64::LDRSHWui:
3931 return AArch64::LDRSHWroX;
3932 case AArch64::LDURBi:
3933 case AArch64::LDRBui:
3934 return AArch64::LDRBroX;
3935 case AArch64::LDURBBi:
3936 case AArch64::LDRBBui:
3937 return AArch64::LDRBBroX;
3938 case AArch64::LDURSBXi:
3939 case AArch64::LDRSBXui:
3940 return AArch64::LDRSBXroX;
3941 case AArch64::LDURSBWi:
3942 case AArch64::LDRSBWui:
3943 return AArch64::LDRSBWroX;
3944 case AArch64::STURBi:
3945 case AArch64::STRBui:
3946 return AArch64::STRBroX;
3947 case AArch64::STURBBi:
3948 case AArch64::STRBBui:
3949 return AArch64::STRBBroX;
3961 case AArch64::LDURQi:
3963 return AArch64::LDRQui;
3964 case AArch64::STURQi:
3966 return AArch64::STRQui;
3967 case AArch64::LDURDi:
3969 return AArch64::LDRDui;
3970 case AArch64::STURDi:
3972 return AArch64::STRDui;
3973 case AArch64::LDURXi:
3975 return AArch64::LDRXui;
3976 case AArch64::STURXi:
3978 return AArch64::STRXui;
3979 case AArch64::LDURWi:
3981 return AArch64::LDRWui;
3982 case AArch64::LDURSWi:
3984 return AArch64::LDRSWui;
3985 case AArch64::STURWi:
3987 return AArch64::STRWui;
3988 case AArch64::LDURHi:
3990 return AArch64::LDRHui;
3991 case AArch64::STURHi:
3993 return AArch64::STRHui;
3994 case AArch64::LDURHHi:
3996 return AArch64::LDRHHui;
3997 case AArch64::STURHHi:
3999 return AArch64::STRHHui;
4000 case AArch64::LDURSHXi:
4002 return AArch64::LDRSHXui;
4003 case AArch64::LDURSHWi:
4005 return AArch64::LDRSHWui;
4006 case AArch64::LDURBi:
4008 return AArch64::LDRBui;
4009 case AArch64::LDURBBi:
4011 return AArch64::LDRBBui;
4012 case AArch64::LDURSBXi:
4014 return AArch64::LDRSBXui;
4015 case AArch64::LDURSBWi:
4017 return AArch64::LDRSBWui;
4018 case AArch64::STURBi:
4020 return AArch64::STRBui;
4021 case AArch64::STURBBi:
4023 return AArch64::STRBBui;
4024 case AArch64::LDRQui:
4025 case AArch64::STRQui:
4028 case AArch64::LDRDui:
4029 case AArch64::STRDui:
4030 case AArch64::LDRXui:
4031 case AArch64::STRXui:
4034 case AArch64::LDRWui:
4035 case AArch64::LDRSWui:
4036 case AArch64::STRWui:
4039 case AArch64::LDRHui:
4040 case AArch64::STRHui:
4041 case AArch64::LDRHHui:
4042 case AArch64::STRHHui:
4043 case AArch64::LDRSHXui:
4044 case AArch64::LDRSHWui:
4047 case AArch64::LDRBui:
4048 case AArch64::LDRBBui:
4049 case AArch64::LDRSBXui:
4050 case AArch64::LDRSBWui:
4051 case AArch64::STRBui:
4052 case AArch64::STRBBui:
4066 case AArch64::LDURQi:
4067 case AArch64::STURQi:
4068 case AArch64::LDURDi:
4069 case AArch64::STURDi:
4070 case AArch64::LDURXi:
4071 case AArch64::STURXi:
4072 case AArch64::LDURWi:
4073 case AArch64::LDURSWi:
4074 case AArch64::STURWi:
4075 case AArch64::LDURHi:
4076 case AArch64::STURHi:
4077 case AArch64::LDURHHi:
4078 case AArch64::STURHHi:
4079 case AArch64::LDURSHXi:
4080 case AArch64::LDURSHWi:
4081 case AArch64::LDURBi:
4082 case AArch64::STURBi:
4083 case AArch64::LDURBBi:
4084 case AArch64::STURBBi:
4085 case AArch64::LDURSBWi:
4086 case AArch64::LDURSBXi:
4088 case AArch64::LDRQui:
4089 return AArch64::LDURQi;
4090 case AArch64::STRQui:
4091 return AArch64::STURQi;
4092 case AArch64::LDRDui:
4093 return AArch64::LDURDi;
4094 case AArch64::STRDui:
4095 return AArch64::STURDi;
4096 case AArch64::LDRXui:
4097 return AArch64::LDURXi;
4098 case AArch64::STRXui:
4099 return AArch64::STURXi;
4100 case AArch64::LDRWui:
4101 return AArch64::LDURWi;
4102 case AArch64::LDRSWui:
4103 return AArch64::LDURSWi;
4104 case AArch64::STRWui:
4105 return AArch64::STURWi;
4106 case AArch64::LDRHui:
4107 return AArch64::LDURHi;
4108 case AArch64::STRHui:
4109 return AArch64::STURHi;
4110 case AArch64::LDRHHui:
4111 return AArch64::LDURHHi;
4112 case AArch64::STRHHui:
4113 return AArch64::STURHHi;
4114 case AArch64::LDRSHXui:
4115 return AArch64::LDURSHXi;
4116 case AArch64::LDRSHWui:
4117 return AArch64::LDURSHWi;
4118 case AArch64::LDRBBui:
4119 return AArch64::LDURBBi;
4120 case AArch64::LDRBui:
4121 return AArch64::LDURBi;
4122 case AArch64::STRBBui:
4123 return AArch64::STURBBi;
4124 case AArch64::STRBui:
4125 return AArch64::STURBi;
4126 case AArch64::LDRSBWui:
4127 return AArch64::LDURSBWi;
4128 case AArch64::LDRSBXui:
4129 return AArch64::LDURSBXi;
4142 case AArch64::LDRQroX:
4143 case AArch64::LDURQi:
4144 case AArch64::LDRQui:
4145 return AArch64::LDRQroW;
4146 case AArch64::STRQroX:
4147 case AArch64::STURQi:
4148 case AArch64::STRQui:
4149 return AArch64::STRQroW;
4150 case AArch64::LDRDroX:
4151 case AArch64::LDURDi:
4152 case AArch64::LDRDui:
4153 return AArch64::LDRDroW;
4154 case AArch64::STRDroX:
4155 case AArch64::STURDi:
4156 case AArch64::STRDui:
4157 return AArch64::STRDroW;
4158 case AArch64::LDRXroX:
4159 case AArch64::LDURXi:
4160 case AArch64::LDRXui:
4161 return AArch64::LDRXroW;
4162 case AArch64::STRXroX:
4163 case AArch64::STURXi:
4164 case AArch64::STRXui:
4165 return AArch64::STRXroW;
4166 case AArch64::LDRWroX:
4167 case AArch64::LDURWi:
4168 case AArch64::LDRWui:
4169 return AArch64::LDRWroW;
4170 case AArch64::LDRSWroX:
4171 case AArch64::LDURSWi:
4172 case AArch64::LDRSWui:
4173 return AArch64::LDRSWroW;
4174 case AArch64::STRWroX:
4175 case AArch64::STURWi:
4176 case AArch64::STRWui:
4177 return AArch64::STRWroW;
4178 case AArch64::LDRHroX:
4179 case AArch64::LDURHi:
4180 case AArch64::LDRHui:
4181 return AArch64::LDRHroW;
4182 case AArch64::STRHroX:
4183 case AArch64::STURHi:
4184 case AArch64::STRHui:
4185 return AArch64::STRHroW;
4186 case AArch64::LDRHHroX:
4187 case AArch64::LDURHHi:
4188 case AArch64::LDRHHui:
4189 return AArch64::LDRHHroW;
4190 case AArch64::STRHHroX:
4191 case AArch64::STURHHi:
4192 case AArch64::STRHHui:
4193 return AArch64::STRHHroW;
4194 case AArch64::LDRSHXroX:
4195 case AArch64::LDURSHXi:
4196 case AArch64::LDRSHXui:
4197 return AArch64::LDRSHXroW;
4198 case AArch64::LDRSHWroX:
4199 case AArch64::LDURSHWi:
4200 case AArch64::LDRSHWui:
4201 return AArch64::LDRSHWroW;
4202 case AArch64::LDRBroX:
4203 case AArch64::LDURBi:
4204 case AArch64::LDRBui:
4205 return AArch64::LDRBroW;
4206 case AArch64::LDRBBroX:
4207 case AArch64::LDURBBi:
4208 case AArch64::LDRBBui:
4209 return AArch64::LDRBBroW;
4210 case AArch64::LDRSBXroX:
4211 case AArch64::LDURSBXi:
4212 case AArch64::LDRSBXui:
4213 return AArch64::LDRSBXroW;
4214 case AArch64::LDRSBWroX:
4215 case AArch64::LDURSBWi:
4216 case AArch64::LDRSBWui:
4217 return AArch64::LDRSBWroW;
4218 case AArch64::STRBroX:
4219 case AArch64::STURBi:
4220 case AArch64::STRBui:
4221 return AArch64::STRBroW;
4222 case AArch64::STRBBroX:
4223 case AArch64::STURBBi:
4224 case AArch64::STRBBui:
4225 return AArch64::STRBBroW;
4250 return B.getInstr();
4254 "Addressing mode not supported for folding");
4271 return B.getInstr();
4278 "Address offset can be a register or an immediate, but not both");
4299 return B.getInstr();
4303 "Function must not be called with an addressing mode it can't handle");
4312 case AArch64::LD1Fourv16b_POST:
4313 case AArch64::LD1Fourv1d_POST:
4314 case AArch64::LD1Fourv2d_POST:
4315 case AArch64::LD1Fourv2s_POST:
4316 case AArch64::LD1Fourv4h_POST:
4317 case AArch64::LD1Fourv4s_POST:
4318 case AArch64::LD1Fourv8b_POST:
4319 case AArch64::LD1Fourv8h_POST:
4320 case AArch64::LD1Onev16b_POST:
4321 case AArch64::LD1Onev1d_POST:
4322 case AArch64::LD1Onev2d_POST:
4323 case AArch64::LD1Onev2s_POST:
4324 case AArch64::LD1Onev4h_POST:
4325 case AArch64::LD1Onev4s_POST:
4326 case AArch64::LD1Onev8b_POST:
4327 case AArch64::LD1Onev8h_POST:
4328 case AArch64::LD1Rv16b_POST:
4329 case AArch64::LD1Rv1d_POST:
4330 case AArch64::LD1Rv2d_POST:
4331 case AArch64::LD1Rv2s_POST:
4332 case AArch64::LD1Rv4h_POST:
4333 case AArch64::LD1Rv4s_POST:
4334 case AArch64::LD1Rv8b_POST:
4335 case AArch64::LD1Rv8h_POST:
4336 case AArch64::LD1Threev16b_POST:
4337 case AArch64::LD1Threev1d_POST:
4338 case AArch64::LD1Threev2d_POST:
4339 case AArch64::LD1Threev2s_POST:
4340 case AArch64::LD1Threev4h_POST:
4341 case AArch64::LD1Threev4s_POST:
4342 case AArch64::LD1Threev8b_POST:
4343 case AArch64::LD1Threev8h_POST:
4344 case AArch64::LD1Twov16b_POST:
4345 case AArch64::LD1Twov1d_POST:
4346 case AArch64::LD1Twov2d_POST:
4347 case AArch64::LD1Twov2s_POST:
4348 case AArch64::LD1Twov4h_POST:
4349 case AArch64::LD1Twov4s_POST:
4350 case AArch64::LD1Twov8b_POST:
4351 case AArch64::LD1Twov8h_POST:
4352 case AArch64::LD1i16_POST:
4353 case AArch64::LD1i32_POST:
4354 case AArch64::LD1i64_POST:
4355 case AArch64::LD1i8_POST:
4356 case AArch64::LD2Rv16b_POST:
4357 case AArch64::LD2Rv1d_POST:
4358 case AArch64::LD2Rv2d_POST:
4359 case AArch64::LD2Rv2s_POST:
4360 case AArch64::LD2Rv4h_POST:
4361 case AArch64::LD2Rv4s_POST:
4362 case AArch64::LD2Rv8b_POST:
4363 case AArch64::LD2Rv8h_POST:
4364 case AArch64::LD2Twov16b_POST:
4365 case AArch64::LD2Twov2d_POST:
4366 case AArch64::LD2Twov2s_POST:
4367 case AArch64::LD2Twov4h_POST:
4368 case AArch64::LD2Twov4s_POST:
4369 case AArch64::LD2Twov8b_POST:
4370 case AArch64::LD2Twov8h_POST:
4371 case AArch64::LD2i16_POST:
4372 case AArch64::LD2i32_POST:
4373 case AArch64::LD2i64_POST:
4374 case AArch64::LD2i8_POST:
4375 case AArch64::LD3Rv16b_POST:
4376 case AArch64::LD3Rv1d_POST:
4377 case AArch64::LD3Rv2d_POST:
4378 case AArch64::LD3Rv2s_POST:
4379 case AArch64::LD3Rv4h_POST:
4380 case AArch64::LD3Rv4s_POST:
4381 case AArch64::LD3Rv8b_POST:
4382 case AArch64::LD3Rv8h_POST:
4383 case AArch64::LD3Threev16b_POST:
4384 case AArch64::LD3Threev2d_POST:
4385 case AArch64::LD3Threev2s_POST:
4386 case AArch64::LD3Threev4h_POST:
4387 case AArch64::LD3Threev4s_POST:
4388 case AArch64::LD3Threev8b_POST:
4389 case AArch64::LD3Threev8h_POST:
4390 case AArch64::LD3i16_POST:
4391 case AArch64::LD3i32_POST:
4392 case AArch64::LD3i64_POST:
4393 case AArch64::LD3i8_POST:
4394 case AArch64::LD4Fourv16b_POST:
4395 case AArch64::LD4Fourv2d_POST:
4396 case AArch64::LD4Fourv2s_POST:
4397 case AArch64::LD4Fourv4h_POST:
4398 case AArch64::LD4Fourv4s_POST:
4399 case AArch64::LD4Fourv8b_POST:
4400 case AArch64::LD4Fourv8h_POST:
4401 case AArch64::LD4Rv16b_POST:
4402 case AArch64::LD4Rv1d_POST:
4403 case AArch64::LD4Rv2d_POST:
4404 case AArch64::LD4Rv2s_POST:
4405 case AArch64::LD4Rv4h_POST:
4406 case AArch64::LD4Rv4s_POST:
4407 case AArch64::LD4Rv8b_POST:
4408 case AArch64::LD4Rv8h_POST:
4409 case AArch64::LD4i16_POST:
4410 case AArch64::LD4i32_POST:
4411 case AArch64::LD4i64_POST:
4412 case AArch64::LD4i8_POST:
4413 case AArch64::LDAPRWpost:
4414 case AArch64::LDAPRXpost:
4415 case AArch64::LDIAPPWpost:
4416 case AArch64::LDIAPPXpost:
4417 case AArch64::LDPDpost:
4418 case AArch64::LDPQpost:
4419 case AArch64::LDPSWpost:
4420 case AArch64::LDPSpost:
4421 case AArch64::LDPWpost:
4422 case AArch64::LDPXpost:
4423 case AArch64::LDRBBpost:
4424 case AArch64::LDRBpost:
4425 case AArch64::LDRDpost:
4426 case AArch64::LDRHHpost:
4427 case AArch64::LDRHpost:
4428 case AArch64::LDRQpost:
4429 case AArch64::LDRSBWpost:
4430 case AArch64::LDRSBXpost:
4431 case AArch64::LDRSHWpost:
4432 case AArch64::LDRSHXpost:
4433 case AArch64::LDRSWpost:
4434 case AArch64::LDRSpost:
4435 case AArch64::LDRWpost:
4436 case AArch64::LDRXpost:
4437 case AArch64::ST1Fourv16b_POST:
4438 case AArch64::ST1Fourv1d_POST:
4439 case AArch64::ST1Fourv2d_POST:
4440 case AArch64::ST1Fourv2s_POST:
4441 case AArch64::ST1Fourv4h_POST:
4442 case AArch64::ST1Fourv4s_POST:
4443 case AArch64::ST1Fourv8b_POST:
4444 case AArch64::ST1Fourv8h_POST:
4445 case AArch64::ST1Onev16b_POST:
4446 case AArch64::ST1Onev1d_POST:
4447 case AArch64::ST1Onev2d_POST:
4448 case AArch64::ST1Onev2s_POST:
4449 case AArch64::ST1Onev4h_POST:
4450 case AArch64::ST1Onev4s_POST:
4451 case AArch64::ST1Onev8b_POST:
4452 case AArch64::ST1Onev8h_POST:
4453 case AArch64::ST1Threev16b_POST:
4454 case AArch64::ST1Threev1d_POST:
4455 case AArch64::ST1Threev2d_POST:
4456 case AArch64::ST1Threev2s_POST:
4457 case AArch64::ST1Threev4h_POST:
4458 case AArch64::ST1Threev4s_POST:
4459 case AArch64::ST1Threev8b_POST:
4460 case AArch64::ST1Threev8h_POST:
4461 case AArch64::ST1Twov16b_POST:
4462 case AArch64::ST1Twov1d_POST:
4463 case AArch64::ST1Twov2d_POST:
4464 case AArch64::ST1Twov2s_POST:
4465 case AArch64::ST1Twov4h_POST:
4466 case AArch64::ST1Twov4s_POST:
4467 case AArch64::ST1Twov8b_POST:
4468 case AArch64::ST1Twov8h_POST:
4469 case AArch64::ST1i16_POST:
4470 case AArch64::ST1i32_POST:
4471 case AArch64::ST1i64_POST:
4472 case AArch64::ST1i8_POST:
4473 case AArch64::ST2GPostIndex:
4474 case AArch64::ST2Twov16b_POST:
4475 case AArch64::ST2Twov2d_POST:
4476 case AArch64::ST2Twov2s_POST:
4477 case AArch64::ST2Twov4h_POST:
4478 case AArch64::ST2Twov4s_POST:
4479 case AArch64::ST2Twov8b_POST:
4480 case AArch64::ST2Twov8h_POST:
4481 case AArch64::ST2i16_POST:
4482 case AArch64::ST2i32_POST:
4483 case AArch64::ST2i64_POST:
4484 case AArch64::ST2i8_POST:
4485 case AArch64::ST3Threev16b_POST:
4486 case AArch64::ST3Threev2d_POST:
4487 case AArch64::ST3Threev2s_POST:
4488 case AArch64::ST3Threev4h_POST:
4489 case AArch64::ST3Threev4s_POST:
4490 case AArch64::ST3Threev8b_POST:
4491 case AArch64::ST3Threev8h_POST:
4492 case AArch64::ST3i16_POST:
4493 case AArch64::ST3i32_POST:
4494 case AArch64::ST3i64_POST:
4495 case AArch64::ST3i8_POST:
4496 case AArch64::ST4Fourv16b_POST:
4497 case AArch64::ST4Fourv2d_POST:
4498 case AArch64::ST4Fourv2s_POST:
4499 case AArch64::ST4Fourv4h_POST:
4500 case AArch64::ST4Fourv4s_POST:
4501 case AArch64::ST4Fourv8b_POST:
4502 case AArch64::ST4Fourv8h_POST:
4503 case AArch64::ST4i16_POST:
4504 case AArch64::ST4i32_POST:
4505 case AArch64::ST4i64_POST:
4506 case AArch64::ST4i8_POST:
4507 case AArch64::STGPostIndex:
4508 case AArch64::STGPpost:
4509 case AArch64::STPDpost:
4510 case AArch64::STPQpost:
4511 case AArch64::STPSpost:
4512 case AArch64::STPWpost:
4513 case AArch64::STPXpost:
4514 case AArch64::STRBBpost:
4515 case AArch64::STRBpost:
4516 case AArch64::STRDpost:
4517 case AArch64::STRHHpost:
4518 case AArch64::STRHpost:
4519 case AArch64::STRQpost:
4520 case AArch64::STRSpost:
4521 case AArch64::STRWpost:
4522 case AArch64::STRXpost:
4523 case AArch64::STZ2GPostIndex:
4524 case AArch64::STZGPostIndex:
4531 bool &OffsetIsScalable,
TypeSize &Width,
4552 int64_t Dummy1, Dummy2;
4574 return BaseOp->
isReg() || BaseOp->
isFI();
4581 assert(OfsOp.
isImm() &&
"Offset operand wasn't immediate.");
4586 TypeSize &Width, int64_t &MinOffset,
4587 int64_t &MaxOffset) {
4592 MinOffset = MaxOffset = 0;
4595 case AArch64::LDRQui:
4596 case AArch64::STRQui:
4601 case AArch64::LDRXui:
4602 case AArch64::LDRDui:
4603 case AArch64::STRXui:
4604 case AArch64::STRDui:
4605 case AArch64::PRFMui:
4610 case AArch64::LDRWui:
4611 case AArch64::LDRSui:
4612 case AArch64::LDRSWui:
4613 case AArch64::STRWui:
4614 case AArch64::STRSui:
4619 case AArch64::LDRHui:
4620 case AArch64::LDRHHui:
4621 case AArch64::LDRSHWui:
4622 case AArch64::LDRSHXui:
4623 case AArch64::STRHui:
4624 case AArch64::STRHHui:
4629 case AArch64::LDRBui:
4630 case AArch64::LDRBBui:
4631 case AArch64::LDRSBWui:
4632 case AArch64::LDRSBXui:
4633 case AArch64::STRBui:
4634 case AArch64::STRBBui:
4640 case AArch64::STRQpre:
4641 case AArch64::LDRQpost:
4647 case AArch64::LDRDpost:
4648 case AArch64::LDRDpre:
4649 case AArch64::LDRXpost:
4650 case AArch64::LDRXpre:
4651 case AArch64::STRDpost:
4652 case AArch64::STRDpre:
4653 case AArch64::STRXpost:
4654 case AArch64::STRXpre:
4660 case AArch64::STRWpost:
4661 case AArch64::STRWpre:
4662 case AArch64::LDRWpost:
4663 case AArch64::LDRWpre:
4664 case AArch64::STRSpost:
4665 case AArch64::STRSpre:
4666 case AArch64::LDRSpost:
4667 case AArch64::LDRSpre:
4673 case AArch64::LDRHpost:
4674 case AArch64::LDRHpre:
4675 case AArch64::STRHpost:
4676 case AArch64::STRHpre:
4677 case AArch64::LDRHHpost:
4678 case AArch64::LDRHHpre:
4679 case AArch64::STRHHpost:
4680 case AArch64::STRHHpre:
4686 case AArch64::LDRBpost:
4687 case AArch64::LDRBpre:
4688 case AArch64::STRBpost:
4689 case AArch64::STRBpre:
4690 case AArch64::LDRBBpost:
4691 case AArch64::LDRBBpre:
4692 case AArch64::STRBBpost:
4693 case AArch64::STRBBpre:
4699 case AArch64::LDURQi:
4700 case AArch64::STURQi:
4706 case AArch64::LDURXi:
4707 case AArch64::LDURDi:
4708 case AArch64::LDAPURXi:
4709 case AArch64::STURXi:
4710 case AArch64::STURDi:
4711 case AArch64::STLURXi:
4712 case AArch64::PRFUMi:
4718 case AArch64::LDURWi:
4719 case AArch64::LDURSi:
4720 case AArch64::LDURSWi:
4721 case AArch64::LDAPURi:
4722 case AArch64::LDAPURSWi:
4723 case AArch64::STURWi:
4724 case AArch64::STURSi:
4725 case AArch64::STLURWi:
4731 case AArch64::LDURHi:
4732 case AArch64::LDURHHi:
4733 case AArch64::LDURSHXi:
4734 case AArch64::LDURSHWi:
4735 case AArch64::LDAPURHi:
4736 case AArch64::LDAPURSHWi:
4737 case AArch64::LDAPURSHXi:
4738 case AArch64::STURHi:
4739 case AArch64::STURHHi:
4740 case AArch64::STLURHi:
4746 case AArch64::LDURBi:
4747 case AArch64::LDURBBi:
4748 case AArch64::LDURSBXi:
4749 case AArch64::LDURSBWi:
4750 case AArch64::LDAPURBi:
4751 case AArch64::LDAPURSBWi:
4752 case AArch64::LDAPURSBXi:
4753 case AArch64::STURBi:
4754 case AArch64::STURBBi:
4755 case AArch64::STLURBi:
4761 case AArch64::LDPQi:
4762 case AArch64::LDNPQi:
4763 case AArch64::STPQi:
4764 case AArch64::STNPQi:
4765 case AArch64::LDPQpost:
4766 case AArch64::LDPQpre:
4767 case AArch64::STPQpost:
4768 case AArch64::STPQpre:
4774 case AArch64::LDPXi:
4775 case AArch64::LDPDi:
4776 case AArch64::LDNPXi:
4777 case AArch64::LDNPDi:
4778 case AArch64::STPXi:
4779 case AArch64::STPDi:
4780 case AArch64::STNPXi:
4781 case AArch64::STNPDi:
4782 case AArch64::LDPDpost:
4783 case AArch64::LDPDpre:
4784 case AArch64::LDPXpost:
4785 case AArch64::LDPXpre:
4786 case AArch64::STPDpost:
4787 case AArch64::STPDpre:
4788 case AArch64::STPXpost:
4789 case AArch64::STPXpre:
4795 case AArch64::LDPWi:
4796 case AArch64::LDPSi:
4797 case AArch64::LDNPWi:
4798 case AArch64::LDNPSi:
4799 case AArch64::STPWi:
4800 case AArch64::STPSi:
4801 case AArch64::STNPWi:
4802 case AArch64::STNPSi:
4803 case AArch64::LDPSpost:
4804 case AArch64::LDPSpre:
4805 case AArch64::LDPWpost:
4806 case AArch64::LDPWpre:
4807 case AArch64::STPSpost:
4808 case AArch64::STPSpre:
4809 case AArch64::STPWpost:
4810 case AArch64::STPWpre:
4816 case AArch64::StoreSwiftAsyncContext:
4829 case AArch64::TAGPstack:
4839 case AArch64::STGPreIndex:
4840 case AArch64::STGPostIndex:
4841 case AArch64::STZGi:
4842 case AArch64::STZGPreIndex:
4843 case AArch64::STZGPostIndex:
4849 case AArch64::STR_ZZZZXI:
4850 case AArch64::STR_ZZZZXI_STRIDED_CONTIGUOUS:
4851 case AArch64::LDR_ZZZZXI:
4852 case AArch64::LDR_ZZZZXI_STRIDED_CONTIGUOUS:
4858 case AArch64::STR_ZZZXI:
4859 case AArch64::LDR_ZZZXI:
4865 case AArch64::STR_ZZXI:
4866 case AArch64::STR_ZZXI_STRIDED_CONTIGUOUS:
4867 case AArch64::LDR_ZZXI:
4868 case AArch64::LDR_ZZXI_STRIDED_CONTIGUOUS:
4874 case AArch64::LDR_PXI:
4875 case AArch64::STR_PXI:
4880 case AArch64::LDR_PPXI:
4881 case AArch64::STR_PPXI:
4887 case AArch64::LDR_ZXI:
4888 case AArch64::STR_ZXI:
4893 case AArch64::LD1B_IMM:
4894 case AArch64::LD1H_IMM:
4895 case AArch64::LD1W_IMM:
4896 case AArch64::LD1D_IMM:
4897 case AArch64::LDNT1B_ZRI:
4898 case AArch64::LDNT1H_ZRI:
4899 case AArch64::LDNT1W_ZRI:
4900 case AArch64::LDNT1D_ZRI:
4901 case AArch64::ST1B_IMM:
4902 case AArch64::ST1H_IMM:
4903 case AArch64::ST1W_IMM:
4904 case AArch64::ST1D_IMM:
4905 case AArch64::STNT1B_ZRI:
4906 case AArch64::STNT1H_ZRI:
4907 case AArch64::STNT1W_ZRI:
4908 case AArch64::STNT1D_ZRI:
4909 case AArch64::LDNF1B_IMM:
4910 case AArch64::LDNF1H_IMM:
4911 case AArch64::LDNF1W_IMM:
4912 case AArch64::LDNF1D_IMM:
4919 case AArch64::LD2B_IMM:
4920 case AArch64::LD2H_IMM:
4921 case AArch64::LD2W_IMM:
4922 case AArch64::LD2D_IMM:
4923 case AArch64::ST2B_IMM:
4924 case AArch64::ST2H_IMM:
4925 case AArch64::ST2W_IMM:
4926 case AArch64::ST2D_IMM:
4927 case AArch64::LD1B_2Z_IMM:
4928 case AArch64::LD1B_2Z_STRIDED_IMM:
4929 case AArch64::LD1H_2Z_IMM:
4930 case AArch64::LD1H_2Z_STRIDED_IMM:
4931 case AArch64::LD1W_2Z_IMM:
4932 case AArch64::LD1W_2Z_STRIDED_IMM:
4933 case AArch64::LD1D_2Z_IMM:
4934 case AArch64::LD1D_2Z_STRIDED_IMM:
4935 case AArch64::LD1B_2Z_IMM_PSEUDO:
4936 case AArch64::LD1H_2Z_IMM_PSEUDO:
4937 case AArch64::LD1W_2Z_IMM_PSEUDO:
4938 case AArch64::LD1D_2Z_IMM_PSEUDO:
4939 case AArch64::ST1B_2Z_IMM:
4940 case AArch64::ST1B_2Z_STRIDED_IMM:
4941 case AArch64::ST1H_2Z_IMM:
4942 case AArch64::ST1H_2Z_STRIDED_IMM:
4943 case AArch64::ST1W_2Z_IMM:
4944 case AArch64::ST1W_2Z_STRIDED_IMM:
4945 case AArch64::ST1D_2Z_IMM:
4946 case AArch64::ST1D_2Z_STRIDED_IMM:
4947 case AArch64::LDNT1B_2Z_IMM_PSEUDO:
4948 case AArch64::LDNT1B_2Z_IMM:
4949 case AArch64::LDNT1B_2Z_STRIDED_IMM:
4950 case AArch64::LDNT1H_2Z_IMM_PSEUDO:
4951 case AArch64::LDNT1H_2Z_IMM:
4952 case AArch64::LDNT1H_2Z_STRIDED_IMM:
4953 case AArch64::LDNT1W_2Z_IMM_PSEUDO:
4954 case AArch64::LDNT1W_2Z_IMM:
4955 case AArch64::LDNT1W_2Z_STRIDED_IMM:
4956 case AArch64::LDNT1D_2Z_IMM_PSEUDO:
4957 case AArch64::LDNT1D_2Z_IMM:
4958 case AArch64::LDNT1D_2Z_STRIDED_IMM:
4959 case AArch64::STNT1B_2Z_IMM:
4960 case AArch64::STNT1B_2Z_STRIDED_IMM:
4961 case AArch64::STNT1H_2Z_IMM:
4962 case AArch64::STNT1H_2Z_STRIDED_IMM:
4963 case AArch64::STNT1W_2Z_IMM:
4964 case AArch64::STNT1W_2Z_STRIDED_IMM:
4965 case AArch64::STNT1D_2Z_IMM:
4966 case AArch64::STNT1D_2Z_STRIDED_IMM:
4971 case AArch64::LD3B_IMM:
4972 case AArch64::LD3H_IMM:
4973 case AArch64::LD3W_IMM:
4974 case AArch64::LD3D_IMM:
4975 case AArch64::ST3B_IMM:
4976 case AArch64::ST3H_IMM:
4977 case AArch64::ST3W_IMM:
4978 case AArch64::ST3D_IMM:
4983 case AArch64::LD4B_IMM:
4984 case AArch64::LD4H_IMM:
4985 case AArch64::LD4W_IMM:
4986 case AArch64::LD4D_IMM:
4987 case AArch64::ST4B_IMM:
4988 case AArch64::ST4H_IMM:
4989 case AArch64::ST4W_IMM:
4990 case AArch64::ST4D_IMM:
4991 case AArch64::LD1B_4Z_IMM:
4992 case AArch64::LD1B_4Z_STRIDED_IMM:
4993 case AArch64::LD1H_4Z_IMM:
4994 case AArch64::LD1H_4Z_STRIDED_IMM:
4995 case AArch64::LD1W_4Z_IMM:
4996 case AArch64::LD1W_4Z_STRIDED_IMM:
4997 case AArch64::LD1D_4Z_IMM:
4998 case AArch64::LD1D_4Z_STRIDED_IMM:
4999 case AArch64::LD1B_4Z_IMM_PSEUDO:
5000 case AArch64::LD1H_4Z_IMM_PSEUDO:
5001 case AArch64::LD1W_4Z_IMM_PSEUDO:
5002 case AArch64::LD1D_4Z_IMM_PSEUDO:
5003 case AArch64::ST1B_4Z_IMM:
5004 case AArch64::ST1B_4Z_STRIDED_IMM:
5005 case AArch64::ST1H_4Z_IMM:
5006 case AArch64::ST1H_4Z_STRIDED_IMM:
5007 case AArch64::ST1W_4Z_IMM:
5008 case AArch64::ST1W_4Z_STRIDED_IMM:
5009 case AArch64::ST1D_4Z_IMM:
5010 case AArch64::ST1D_4Z_STRIDED_IMM:
5011 case AArch64::LDNT1B_4Z_IMM_PSEUDO:
5012 case AArch64::LDNT1B_4Z_IMM:
5013 case AArch64::LDNT1B_4Z_STRIDED_IMM:
5014 case AArch64::LDNT1H_4Z_IMM_PSEUDO:
5015 case AArch64::LDNT1H_4Z_IMM:
5016 case AArch64::LDNT1H_4Z_STRIDED_IMM:
5017 case AArch64::LDNT1W_4Z_IMM_PSEUDO:
5018 case AArch64::LDNT1W_4Z_IMM:
5019 case AArch64::LDNT1W_4Z_STRIDED_IMM:
5020 case AArch64::LDNT1D_4Z_IMM_PSEUDO:
5021 case AArch64::LDNT1D_4Z_IMM:
5022 case AArch64::LDNT1D_4Z_STRIDED_IMM:
5023 case AArch64::STNT1B_4Z_IMM:
5024 case AArch64::STNT1B_4Z_STRIDED_IMM:
5025 case AArch64::STNT1H_4Z_IMM:
5026 case AArch64::STNT1H_4Z_STRIDED_IMM:
5027 case AArch64::STNT1W_4Z_IMM:
5028 case AArch64::STNT1W_4Z_STRIDED_IMM:
5029 case AArch64::STNT1D_4Z_IMM:
5030 case AArch64::STNT1D_4Z_STRIDED_IMM:
5035 case AArch64::LD1B_H_IMM:
5036 case AArch64::LD1SB_H_IMM:
5037 case AArch64::LD1H_S_IMM:
5038 case AArch64::LD1SH_S_IMM:
5039 case AArch64::LD1W_D_IMM:
5040 case AArch64::LD1SW_D_IMM:
5041 case AArch64::ST1B_H_IMM:
5042 case AArch64::ST1H_S_IMM:
5043 case AArch64::ST1W_D_IMM:
5044 case AArch64::LDNF1B_H_IMM:
5045 case AArch64::LDNF1SB_H_IMM:
5046 case AArch64::LDNF1H_S_IMM:
5047 case AArch64::LDNF1SH_S_IMM:
5048 case AArch64::LDNF1W_D_IMM:
5049 case AArch64::LDNF1SW_D_IMM:
5056 case AArch64::LD1B_S_IMM:
5057 case AArch64::LD1SB_S_IMM:
5058 case AArch64::LD1H_D_IMM:
5059 case AArch64::LD1SH_D_IMM:
5060 case AArch64::ST1B_S_IMM:
5061 case AArch64::ST1H_D_IMM:
5062 case AArch64::LDNF1B_S_IMM:
5063 case AArch64::LDNF1SB_S_IMM:
5064 case AArch64::LDNF1H_D_IMM:
5065 case AArch64::LDNF1SH_D_IMM:
5072 case AArch64::LD1B_D_IMM:
5073 case AArch64::LD1SB_D_IMM:
5074 case AArch64::ST1B_D_IMM:
5075 case AArch64::LDNF1B_D_IMM:
5076 case AArch64::LDNF1SB_D_IMM:
5083 case AArch64::ST2Gi:
5084 case AArch64::ST2GPreIndex:
5085 case AArch64::ST2GPostIndex:
5086 case AArch64::STZ2Gi:
5087 case AArch64::STZ2GPreIndex:
5088 case AArch64::STZ2GPostIndex:
5094 case AArch64::STGPi:
5095 case AArch64::STGPpost:
5096 case AArch64::STGPpre:
5101 case AArch64::LD1RB_IMM:
5102 case AArch64::LD1RB_H_IMM:
5103 case AArch64::LD1RB_S_IMM:
5104 case AArch64::LD1RB_D_IMM:
5105 case AArch64::LD1RSB_H_IMM:
5106 case AArch64::LD1RSB_S_IMM:
5107 case AArch64::LD1RSB_D_IMM:
5112 case AArch64::LD1RH_IMM:
5113 case AArch64::LD1RH_S_IMM:
5114 case AArch64::LD1RH_D_IMM:
5115 case AArch64::LD1RSH_S_IMM:
5116 case AArch64::LD1RSH_D_IMM:
5121 case AArch64::LD1RW_IMM:
5122 case AArch64::LD1RW_D_IMM:
5123 case AArch64::LD1RSW_IMM:
5128 case AArch64::LD1RD_IMM:
5143 case AArch64::LDRBui:
5144 case AArch64::LDRBBui:
5145 case AArch64::LDURBBi:
5146 case AArch64::LDRSBWui:
5147 case AArch64::LDURSBWi:
5148 case AArch64::STRBui:
5149 case AArch64::STRBBui:
5150 case AArch64::STURBBi:
5152 case AArch64::LDRHui:
5153 case AArch64::LDRHHui:
5154 case AArch64::LDURHHi:
5155 case AArch64::LDRSHWui:
5156 case AArch64::LDURSHWi:
5157 case AArch64::STRHui:
5158 case AArch64::STRHHui:
5159 case AArch64::STURHHi:
5161 case AArch64::LDRSui:
5162 case AArch64::LDURSi:
5163 case AArch64::LDRSpre:
5164 case AArch64::LDRSWui:
5165 case AArch64::LDURSWi:
5166 case AArch64::LDRSWpre:
5167 case AArch64::LDRWpre:
5168 case AArch64::LDRWui:
5169 case AArch64::LDURWi:
5170 case AArch64::STRSui:
5171 case AArch64::STURSi:
5172 case AArch64::STRSpre:
5173 case AArch64::STRWui:
5174 case AArch64::STURWi:
5175 case AArch64::STRWpre:
5176 case AArch64::LDPSi:
5177 case AArch64::LDPSWi:
5178 case AArch64::LDPWi:
5179 case AArch64::STPSi:
5180 case AArch64::STPWi:
5182 case AArch64::LDRDui:
5183 case AArch64::LDURDi:
5184 case AArch64::LDRDpre:
5185 case AArch64::LDRXui:
5186 case AArch64::LDURXi:
5187 case AArch64::LDRXpre:
5188 case AArch64::STRDui:
5189 case AArch64::STURDi:
5190 case AArch64::STRDpre:
5191 case AArch64::STRXui:
5192 case AArch64::STURXi:
5193 case AArch64::STRXpre:
5194 case AArch64::LDPDi:
5195 case AArch64::LDPXi:
5196 case AArch64::STPDi:
5197 case AArch64::STPXi:
5199 case AArch64::LDRQui:
5200 case AArch64::LDURQi:
5201 case AArch64::STRQui:
5202 case AArch64::STURQi:
5203 case AArch64::STRQpre:
5204 case AArch64::LDPQi:
5205 case AArch64::LDRQpre:
5206 case AArch64::STPQi:
5208 case AArch64::STZGi:
5209 case AArch64::ST2Gi:
5210 case AArch64::STZ2Gi:
5211 case AArch64::STGPi:
5217 switch (
MI.getOpcode()) {
5220 case AArch64::LDRWpre:
5221 case AArch64::LDRXpre:
5222 case AArch64::LDRSWpre:
5223 case AArch64::LDRSpre:
5224 case AArch64::LDRDpre:
5225 case AArch64::LDRQpre:
5231 switch (
MI.getOpcode()) {
5234 case AArch64::STRWpre:
5235 case AArch64::STRXpre:
5236 case AArch64::STRSpre:
5237 case AArch64::STRDpre:
5238 case AArch64::STRQpre:
5248 switch (
MI.getOpcode()) {
5251 case AArch64::LDURBBi:
5252 case AArch64::LDURHHi:
5253 case AArch64::LDURWi:
5254 case AArch64::LDRBBui:
5255 case AArch64::LDRHHui:
5256 case AArch64::LDRWui:
5257 case AArch64::LDRBBroX:
5258 case AArch64::LDRHHroX:
5259 case AArch64::LDRWroX:
5260 case AArch64::LDRBBroW:
5261 case AArch64::LDRHHroW:
5262 case AArch64::LDRWroW:
5268 switch (
MI.getOpcode()) {
5271 case AArch64::LDURSBWi:
5272 case AArch64::LDURSHWi:
5273 case AArch64::LDURSBXi:
5274 case AArch64::LDURSHXi:
5275 case AArch64::LDURSWi:
5276 case AArch64::LDRSBWui:
5277 case AArch64::LDRSHWui:
5278 case AArch64::LDRSBXui:
5279 case AArch64::LDRSHXui:
5280 case AArch64::LDRSWui:
5281 case AArch64::LDRSBWroX:
5282 case AArch64::LDRSHWroX:
5283 case AArch64::LDRSBXroX:
5284 case AArch64::LDRSHXroX:
5285 case AArch64::LDRSWroX:
5286 case AArch64::LDRSBWroW:
5287 case AArch64::LDRSHWroW:
5288 case AArch64::LDRSBXroW:
5289 case AArch64::LDRSHXroW:
5290 case AArch64::LDRSWroW:
5296 switch (
MI.getOpcode()) {
5299 case AArch64::LDPSi:
5300 case AArch64::LDPSWi:
5301 case AArch64::LDPDi:
5302 case AArch64::LDPQi:
5303 case AArch64::LDPWi:
5304 case AArch64::LDPXi:
5305 case AArch64::STPSi:
5306 case AArch64::STPDi:
5307 case AArch64::STPQi:
5308 case AArch64::STPWi:
5309 case AArch64::STPXi:
5310 case AArch64::STGPi:
5316 assert(
MI.mayLoadOrStore() &&
"Load or store instruction expected");
5320 return MI.getOperand(Idx);
5325 assert(
MI.mayLoadOrStore() &&
"Load or store instruction expected");
5329 return MI.getOperand(Idx);
5334 switch (
MI.getOpcode()) {
5337 case AArch64::LDRBroX:
5338 case AArch64::LDRBBroX:
5339 case AArch64::LDRSBXroX:
5340 case AArch64::LDRSBWroX:
5341 case AArch64::LDRHroX:
5342 case AArch64::LDRHHroX:
5343 case AArch64::LDRSHXroX:
5344 case AArch64::LDRSHWroX:
5345 case AArch64::LDRWroX:
5346 case AArch64::LDRSroX:
5347 case AArch64::LDRSWroX:
5348 case AArch64::LDRDroX:
5349 case AArch64::LDRXroX:
5350 case AArch64::LDRQroX:
5351 return MI.getOperand(4);
5357 if (
MI.getParent() ==
nullptr)
5367 auto Reg =
Op.getReg();
5368 if (Reg.isPhysical())
5369 return AArch64::FPR16RegClass.contains(Reg);
5371 return TRC == &AArch64::FPR16RegClass ||
5372 TRC == &AArch64::FPR16_loRegClass;
5381 auto Reg =
Op.getReg();
5382 if (Reg.isPhysical())
5383 return AArch64::FPR128RegClass.contains(Reg);
5385 return TRC == &AArch64::FPR128RegClass ||
5386 TRC == &AArch64::FPR128_loRegClass;
5392 switch (
MI.getOpcode()) {
5395 case AArch64::PACIASP:
5396 case AArch64::PACIBSP:
5399 case AArch64::PAUTH_PROLOGUE:
5402 case AArch64::HINT: {
5403 unsigned Imm =
MI.getOperand(0).getImm();
5405 if (Imm == 32 || Imm == 34 || Imm == 36 || Imm == 38)
5408 if (Imm == 25 || Imm == 27)
5420 assert(Reg.isPhysical() &&
"Expected physical register in isFpOrNEON");
5421 return AArch64::FPR128RegClass.contains(Reg) ||
5422 AArch64::FPR64RegClass.contains(Reg) ||
5423 AArch64::FPR32RegClass.contains(Reg) ||
5424 AArch64::FPR16RegClass.contains(Reg) ||
5425 AArch64::FPR8RegClass.contains(Reg);
5432 auto Reg =
Op.getReg();
5433 if (Reg.isPhysical())
5437 return TRC == &AArch64::FPR128RegClass ||
5438 TRC == &AArch64::FPR128_loRegClass ||
5439 TRC == &AArch64::FPR64RegClass ||
5440 TRC == &AArch64::FPR64_loRegClass ||
5441 TRC == &AArch64::FPR32RegClass || TRC == &AArch64::FPR16RegClass ||
5442 TRC == &AArch64::FPR8RegClass;
5464 if (FirstOpc == SecondOpc)
5470 case AArch64::STRSui:
5471 case AArch64::STURSi:
5472 return SecondOpc == AArch64::STRSui || SecondOpc == AArch64::STURSi;
5473 case AArch64::STRDui:
5474 case AArch64::STURDi:
5475 return SecondOpc == AArch64::STRDui || SecondOpc == AArch64::STURDi;
5476 case AArch64::STRQui:
5477 case AArch64::STURQi:
5478 return SecondOpc == AArch64::STRQui || SecondOpc == AArch64::STURQi;
5479 case AArch64::STRWui:
5480 case AArch64::STURWi:
5481 return SecondOpc == AArch64::STRWui || SecondOpc == AArch64::STURWi;
5482 case AArch64::STRXui:
5483 case AArch64::STURXi:
5484 return SecondOpc == AArch64::STRXui || SecondOpc == AArch64::STURXi;
5485 case AArch64::LDRSui:
5486 case AArch64::LDURSi:
5487 return SecondOpc == AArch64::LDRSui || SecondOpc == AArch64::LDURSi;
5488 case AArch64::LDRDui:
5489 case AArch64::LDURDi:
5490 return SecondOpc == AArch64::LDRDui || SecondOpc == AArch64::LDURDi;
5491 case AArch64::LDRQui:
5492 case AArch64::LDURQi:
5493 return SecondOpc == AArch64::LDRQui || SecondOpc == AArch64::LDURQi;
5494 case AArch64::LDRWui:
5495 case AArch64::LDURWi:
5496 return SecondOpc == AArch64::LDRSWui || SecondOpc == AArch64::LDURSWi;
5497 case AArch64::LDRSWui:
5498 case AArch64::LDURSWi:
5499 return SecondOpc == AArch64::LDRWui || SecondOpc == AArch64::LDURWi;
5500 case AArch64::LDRXui:
5501 case AArch64::LDURXi:
5502 return SecondOpc == AArch64::LDRXui || SecondOpc == AArch64::LDURXi;
5509 int64_t Offset1,
unsigned Opcode1,
int FI2,
5510 int64_t Offset2,
unsigned Opcode2) {
5516 assert(ObjectOffset1 <= ObjectOffset2 &&
"Object offsets are not ordered.");
5519 if (ObjectOffset1 % Scale1 != 0)
5521 ObjectOffset1 /= Scale1;
5523 if (ObjectOffset2 % Scale2 != 0)
5525 ObjectOffset2 /= Scale2;
5526 ObjectOffset1 += Offset1;
5527 ObjectOffset2 += Offset2;
5528 return ObjectOffset1 + 1 == ObjectOffset2;
5540 int64_t OpOffset2,
bool OffsetIsScalable2,
unsigned ClusterSize,
5541 unsigned NumBytes)
const {
5551 "Only base registers and frame indices are supported.");
5558 if (ClusterSize > 2)
5565 unsigned FirstOpc = FirstLdSt.
getOpcode();
5566 unsigned SecondOpc = SecondLdSt.
getOpcode();
5586 if (Offset1 > 63 || Offset1 < -64)
5591 if (BaseOp1.
isFI()) {
5593 "Caller should have ordered offsets.");
5598 BaseOp2.
getIndex(), Offset2, SecondOpc);
5601 assert(Offset1 <= Offset2 &&
"Caller should have ordered offsets.");
5603 return Offset1 + 1 == Offset2;
5613 if (
Reg.isPhysical())
5622 return ((DestReg - SrcReg) & 0x1f) < NumRegs;
5631 assert(Subtarget.hasNEON() &&
"Unexpected register copy without NEON");
5633 uint16_t DestEncoding =
TRI->getEncodingValue(DestReg);
5634 uint16_t SrcEncoding =
TRI->getEncodingValue(SrcReg);
5635 unsigned NumRegs = Indices.
size();
5637 int SubReg = 0, End = NumRegs, Incr = 1;
5639 SubReg = NumRegs - 1;
5644 for (; SubReg != End; SubReg += Incr) {
5656 unsigned Opcode,
unsigned ZeroReg,
5659 unsigned NumRegs = Indices.
size();
5662 uint16_t DestEncoding =
TRI->getEncodingValue(DestReg);
5663 uint16_t SrcEncoding =
TRI->getEncodingValue(SrcReg);
5664 assert(DestEncoding % NumRegs == 0 && SrcEncoding % NumRegs == 0 &&
5665 "GPR reg sequences should not be able to overlap");
5668 for (
unsigned SubReg = 0; SubReg != NumRegs; ++SubReg) {
5689 unsigned Opc =
MI.getOpcode();
5690 if (
Opc == AArch64::MSRpstatesvcrImm1 ||
Opc == AArch64::MSRpstatePseudo) {
5692 int64_t PState =
MI.getOperand(0).getImm();
5693 if (PState == AArch64SVCR::SVCRSM || PState == AArch64SVCR::SVCRSMZA) {
5695 return MI.getOperand(1).getImm() == 1;
5714 bool RenamableSrc)
const {
5716 if (AArch64::GPR32spRegClass.
contains(DestReg) &&
5717 AArch64::GPR32spRegClass.
contains(SrcReg)) {
5718 if (DestReg == AArch64::WSP || SrcReg == AArch64::WSP) {
5720 if (Subtarget.hasZeroCycleRegMoveGPR64() &&
5721 !Subtarget.hasZeroCycleRegMoveGPR32()) {
5723 MCRegister DestRegX = RI.getMatchingSuperReg(DestReg, AArch64::sub_32,
5724 &AArch64::GPR64spRegClass);
5725 MCRegister SrcRegX = RI.getMatchingSuperReg(SrcReg, AArch64::sub_32,
5726 &AArch64::GPR64spRegClass);
5736 ++NumZCRegMoveInstrsGPR;
5742 if (Subtarget.hasZeroCycleRegMoveGPR32())
5743 ++NumZCRegMoveInstrsGPR;
5745 }
else if (Subtarget.hasZeroCycleRegMoveGPR64() &&
5746 !Subtarget.hasZeroCycleRegMoveGPR32()) {
5748 MCRegister DestRegX = RI.getMatchingSuperReg(DestReg, AArch64::sub_32,
5749 &AArch64::GPR64spRegClass);
5750 assert(DestRegX.
isValid() &&
"Destination super-reg not valid");
5751 MCRegister SrcRegX = RI.getMatchingSuperReg(SrcReg, AArch64::sub_32,
5752 &AArch64::GPR64spRegClass);
5762 ++NumZCRegMoveInstrsGPR;
5768 if (Subtarget.hasZeroCycleRegMoveGPR32())
5769 ++NumZCRegMoveInstrsGPR;
5775 if (AArch64::GPR32spRegClass.
contains(DestReg) && SrcReg == AArch64::WZR) {
5776 if (Subtarget.hasZeroCycleZeroingGPR64() &&
5777 !Subtarget.hasZeroCycleZeroingGPR32()) {
5778 MCRegister DestRegX = RI.getMatchingSuperReg(DestReg, AArch64::sub_32,
5779 &AArch64::GPR64spRegClass);
5780 assert(DestRegX.
isValid() &&
"Destination super-reg not valid");
5784 ++NumZCZeroingInstrsGPR;
5785 }
else if (Subtarget.hasZeroCycleZeroingGPR32()) {
5789 ++NumZCZeroingInstrsGPR;
5798 if (AArch64::GPR64spRegClass.
contains(DestReg) &&
5799 AArch64::GPR64spRegClass.
contains(SrcReg)) {
5800 if (DestReg == AArch64::SP || SrcReg == AArch64::SP) {
5806 if (Subtarget.hasZeroCycleRegMoveGPR64())
5807 ++NumZCRegMoveInstrsGPR;
5813 if (Subtarget.hasZeroCycleRegMoveGPR64())
5814 ++NumZCRegMoveInstrsGPR;
5820 if (AArch64::GPR64spRegClass.
contains(DestReg) && SrcReg == AArch64::XZR) {
5821 if (Subtarget.hasZeroCycleZeroingGPR64()) {
5825 ++NumZCZeroingInstrsGPR;
5835 if (AArch64::PPRRegClass.
contains(DestReg) &&
5836 AArch64::PPRRegClass.
contains(SrcReg)) {
5837 assert(Subtarget.isSVEorStreamingSVEAvailable() &&
5838 "Unexpected SVE register.");
5848 bool DestIsPNR = AArch64::PNRRegClass.contains(DestReg);
5849 bool SrcIsPNR = AArch64::PNRRegClass.contains(SrcReg);
5850 if (DestIsPNR || SrcIsPNR) {
5852 return (R - AArch64::PN0) + AArch64::P0;
5857 if (PPRSrcReg != PPRDestReg) {
5869 if (AArch64::ZPRRegClass.
contains(DestReg) &&
5870 AArch64::ZPRRegClass.
contains(SrcReg)) {
5871 assert(Subtarget.isSVEorStreamingSVEAvailable() &&
5872 "Unexpected SVE register.");
5880 if ((AArch64::ZPR2RegClass.
contains(DestReg) ||
5881 AArch64::ZPR2StridedOrContiguousRegClass.
contains(DestReg)) &&
5882 (AArch64::ZPR2RegClass.
contains(SrcReg) ||
5883 AArch64::ZPR2StridedOrContiguousRegClass.
contains(SrcReg))) {
5884 assert(Subtarget.isSVEorStreamingSVEAvailable() &&
5885 "Unexpected SVE register.");
5886 static const unsigned Indices[] = {AArch64::zsub0, AArch64::zsub1};
5893 if (AArch64::ZPR3RegClass.
contains(DestReg) &&
5894 AArch64::ZPR3RegClass.
contains(SrcReg)) {
5895 assert(Subtarget.isSVEorStreamingSVEAvailable() &&
5896 "Unexpected SVE register.");
5897 static const unsigned Indices[] = {AArch64::zsub0, AArch64::zsub1,
5905 if ((AArch64::ZPR4RegClass.
contains(DestReg) ||
5906 AArch64::ZPR4StridedOrContiguousRegClass.
contains(DestReg)) &&
5907 (AArch64::ZPR4RegClass.
contains(SrcReg) ||
5908 AArch64::ZPR4StridedOrContiguousRegClass.
contains(SrcReg))) {
5909 assert(Subtarget.isSVEorStreamingSVEAvailable() &&
5910 "Unexpected SVE register.");
5911 static const unsigned Indices[] = {AArch64::zsub0, AArch64::zsub1,
5912 AArch64::zsub2, AArch64::zsub3};
5919 if (AArch64::DDDDRegClass.
contains(DestReg) &&
5920 AArch64::DDDDRegClass.
contains(SrcReg)) {
5921 static const unsigned Indices[] = {AArch64::dsub0, AArch64::dsub1,
5922 AArch64::dsub2, AArch64::dsub3};
5929 if (AArch64::DDDRegClass.
contains(DestReg) &&
5930 AArch64::DDDRegClass.
contains(SrcReg)) {
5931 static const unsigned Indices[] = {AArch64::dsub0, AArch64::dsub1,
5939 if (AArch64::DDRegClass.
contains(DestReg) &&
5940 AArch64::DDRegClass.
contains(SrcReg)) {
5941 static const unsigned Indices[] = {AArch64::dsub0, AArch64::dsub1};
5948 if (AArch64::QQQQRegClass.
contains(DestReg) &&
5949 AArch64::QQQQRegClass.
contains(SrcReg)) {
5950 static const unsigned Indices[] = {AArch64::qsub0, AArch64::qsub1,
5951 AArch64::qsub2, AArch64::qsub3};
5958 if (AArch64::QQQRegClass.
contains(DestReg) &&
5959 AArch64::QQQRegClass.
contains(SrcReg)) {
5960 static const unsigned Indices[] = {AArch64::qsub0, AArch64::qsub1,
5968 if (AArch64::QQRegClass.
contains(DestReg) &&
5969 AArch64::QQRegClass.
contains(SrcReg)) {
5970 static const unsigned Indices[] = {AArch64::qsub0, AArch64::qsub1};
5976 if (AArch64::XSeqPairsClassRegClass.
contains(DestReg) &&
5977 AArch64::XSeqPairsClassRegClass.
contains(SrcReg)) {
5978 static const unsigned Indices[] = {AArch64::sube64, AArch64::subo64};
5980 AArch64::XZR, Indices);
5984 if (AArch64::WSeqPairsClassRegClass.
contains(DestReg) &&
5985 AArch64::WSeqPairsClassRegClass.
contains(SrcReg)) {
5986 static const unsigned Indices[] = {AArch64::sube32, AArch64::subo32};
5988 AArch64::WZR, Indices);
5992 if (AArch64::FPR128RegClass.
contains(DestReg) &&
5993 AArch64::FPR128RegClass.
contains(SrcReg)) {
5997 if ((Subtarget.isSVEorStreamingSVEAvailable() &&
5998 !Subtarget.isNeonAvailable()) ||
6002 .
addReg(AArch64::Z0 + (SrcReg - AArch64::Q0))
6003 .
addReg(AArch64::Z0 + (SrcReg - AArch64::Q0));
6004 }
else if (Subtarget.isNeonAvailable()) {
6008 if (Subtarget.hasZeroCycleRegMoveFPR128())
6009 ++NumZCRegMoveInstrsFPR;
6025 if (AArch64::FPR64RegClass.
contains(DestReg) &&
6026 AArch64::FPR64RegClass.
contains(SrcReg)) {
6027 if (Subtarget.hasZeroCycleRegMoveFPR128() &&
6028 !Subtarget.hasZeroCycleRegMoveFPR64() &&
6029 !Subtarget.hasZeroCycleRegMoveFPR32() && Subtarget.isNeonAvailable() &&
6031 MCRegister DestRegQ = RI.getMatchingSuperReg(DestReg, AArch64::dsub,
6032 &AArch64::FPR128RegClass);
6033 MCRegister SrcRegQ = RI.getMatchingSuperReg(SrcReg, AArch64::dsub,
6034 &AArch64::FPR128RegClass);
6043 ++NumZCRegMoveInstrsFPR;
6047 if (Subtarget.hasZeroCycleRegMoveFPR64())
6048 ++NumZCRegMoveInstrsFPR;
6053 if (AArch64::FPR32RegClass.
contains(DestReg) &&
6054 AArch64::FPR32RegClass.
contains(SrcReg)) {
6055 if (Subtarget.hasZeroCycleRegMoveFPR128() &&
6056 !Subtarget.hasZeroCycleRegMoveFPR64() &&
6057 !Subtarget.hasZeroCycleRegMoveFPR32() && Subtarget.isNeonAvailable() &&
6059 MCRegister DestRegQ = RI.getMatchingSuperReg(DestReg, AArch64::ssub,
6060 &AArch64::FPR128RegClass);
6061 MCRegister SrcRegQ = RI.getMatchingSuperReg(SrcReg, AArch64::ssub,
6062 &AArch64::FPR128RegClass);
6071 ++NumZCRegMoveInstrsFPR;
6072 }
else if (Subtarget.hasZeroCycleRegMoveFPR64() &&
6073 !Subtarget.hasZeroCycleRegMoveFPR32()) {
6074 MCRegister DestRegD = RI.getMatchingSuperReg(DestReg, AArch64::ssub,
6075 &AArch64::FPR64RegClass);
6076 MCRegister SrcRegD = RI.getMatchingSuperReg(SrcReg, AArch64::ssub,
6077 &AArch64::FPR64RegClass);
6085 ++NumZCRegMoveInstrsFPR;
6089 if (Subtarget.hasZeroCycleRegMoveFPR32())
6090 ++NumZCRegMoveInstrsFPR;
6095 if (AArch64::FPR16RegClass.
contains(DestReg) &&
6096 AArch64::FPR16RegClass.
contains(SrcReg)) {
6097 if (Subtarget.hasZeroCycleRegMoveFPR128() &&
6098 !Subtarget.hasZeroCycleRegMoveFPR64() &&
6099 !Subtarget.hasZeroCycleRegMoveFPR32() && Subtarget.isNeonAvailable() &&
6101 MCRegister DestRegQ = RI.getMatchingSuperReg(DestReg, AArch64::hsub,
6102 &AArch64::FPR128RegClass);
6103 MCRegister SrcRegQ = RI.getMatchingSuperReg(SrcReg, AArch64::hsub,
6104 &AArch64::FPR128RegClass);
6113 }
else if (Subtarget.hasZeroCycleRegMoveFPR64() &&
6114 !Subtarget.hasZeroCycleRegMoveFPR32()) {
6115 MCRegister DestRegD = RI.getMatchingSuperReg(DestReg, AArch64::hsub,
6116 &AArch64::FPR64RegClass);
6117 MCRegister SrcRegD = RI.getMatchingSuperReg(SrcReg, AArch64::hsub,
6118 &AArch64::FPR64RegClass);
6127 DestReg = RI.getMatchingSuperReg(DestReg, AArch64::hsub,
6128 &AArch64::FPR32RegClass);
6129 SrcReg = RI.getMatchingSuperReg(SrcReg, AArch64::hsub,
6130 &AArch64::FPR32RegClass);
6137 if (AArch64::FPR8RegClass.
contains(DestReg) &&
6138 AArch64::FPR8RegClass.
contains(SrcReg)) {
6139 if (Subtarget.hasZeroCycleRegMoveFPR128() &&
6140 !Subtarget.hasZeroCycleRegMoveFPR64() &&
6141 !Subtarget.hasZeroCycleRegMoveFPR32() && Subtarget.isNeonAvailable() &&
6143 MCRegister DestRegQ = RI.getMatchingSuperReg(DestReg, AArch64::bsub,
6144 &AArch64::FPR128RegClass);
6145 MCRegister SrcRegQ = RI.getMatchingSuperReg(SrcReg, AArch64::bsub,
6146 &AArch64::FPR128RegClass);
6155 }
else if (Subtarget.hasZeroCycleRegMoveFPR64() &&
6156 !Subtarget.hasZeroCycleRegMoveFPR32()) {
6157 MCRegister DestRegD = RI.getMatchingSuperReg(DestReg, AArch64::bsub,
6158 &AArch64::FPR64RegClass);
6159 MCRegister SrcRegD = RI.getMatchingSuperReg(SrcReg, AArch64::bsub,
6160 &AArch64::FPR64RegClass);
6169 DestReg = RI.getMatchingSuperReg(DestReg, AArch64::bsub,
6170 &AArch64::FPR32RegClass);
6171 SrcReg = RI.getMatchingSuperReg(SrcReg, AArch64::bsub,
6172 &AArch64::FPR32RegClass);
6180 if (AArch64::FPR64RegClass.
contains(DestReg) &&
6181 AArch64::GPR64RegClass.
contains(SrcReg)) {
6182 if (AArch64::XZR == SrcReg) {
6190 if (AArch64::GPR64RegClass.
contains(DestReg) &&
6191 AArch64::FPR64RegClass.
contains(SrcReg)) {
6197 if (AArch64::FPR32RegClass.
contains(DestReg) &&
6198 AArch64::GPR32RegClass.
contains(SrcReg)) {
6199 if (AArch64::WZR == SrcReg) {
6207 if (AArch64::GPR32RegClass.
contains(DestReg) &&
6208 AArch64::FPR32RegClass.
contains(SrcReg)) {
6214 if (DestReg == AArch64::NZCV) {
6215 assert(AArch64::GPR64RegClass.
contains(SrcReg) &&
"Invalid NZCV copy");
6217 .
addImm(AArch64SysReg::NZCV)
6223 if (SrcReg == AArch64::NZCV) {
6224 assert(AArch64::GPR64RegClass.
contains(DestReg) &&
"Invalid NZCV copy");
6226 .
addImm(AArch64SysReg::NZCV)
6232 errs() << RI.getRegAsmName(DestReg) <<
" = COPY " << RI.getRegAsmName(SrcReg)
6243 unsigned SubIdx0,
unsigned SubIdx1,
int FI,
6248 SrcReg0 =
TRI.getSubReg(SrcReg, SubIdx0);
6250 SrcReg1 =
TRI.getSubReg(SrcReg, SubIdx1);
6263 Register SrcReg,
bool isKill,
int FI,
6278 switch (RI.getSpillSize(*RC)) {
6280 if (AArch64::FPR8RegClass.hasSubClassEq(RC))
6281 Opc = AArch64::STRBui;
6284 if (AArch64::FPR16RegClass.hasSubClassEq(RC))
6285 Opc = AArch64::STRHui;
6286 else if (AArch64::PNRRegClass.hasSubClassEq(RC) ||
6287 AArch64::PPRRegClass.hasSubClassEq(RC)) {
6288 assert(Subtarget.isSVEorStreamingSVEAvailable() &&
6289 "Unexpected register store without SVE store instructions");
6290 Opc = AArch64::STR_PXI;
6296 if (AArch64::GPR32allRegClass.hasSubClassEq(RC)) {
6297 Opc = AArch64::STRWui;
6301 assert(SrcReg != AArch64::WSP);
6302 }
else if (AArch64::FPR32RegClass.hasSubClassEq(RC))
6303 Opc = AArch64::STRSui;
6304 else if (AArch64::PPR2RegClass.hasSubClassEq(RC)) {
6305 Opc = AArch64::STR_PPXI;
6310 if (AArch64::GPR64allRegClass.hasSubClassEq(RC)) {
6311 Opc = AArch64::STRXui;
6315 assert(SrcReg != AArch64::SP);
6316 }
else if (AArch64::FPR64RegClass.hasSubClassEq(RC)) {
6317 Opc = AArch64::STRDui;
6318 }
else if (AArch64::WSeqPairsClassRegClass.hasSubClassEq(RC)) {
6320 get(AArch64::STPWi), SrcReg, isKill,
6321 AArch64::sube32, AArch64::subo32, FI, MMO);
6326 if (AArch64::FPR128RegClass.hasSubClassEq(RC))
6327 Opc = AArch64::STRQui;
6328 else if (AArch64::DDRegClass.hasSubClassEq(RC)) {
6329 assert(Subtarget.hasNEON() &&
"Unexpected register store without NEON");
6330 Opc = AArch64::ST1Twov1d;
6332 }
else if (AArch64::XSeqPairsClassRegClass.hasSubClassEq(RC)) {
6334 get(AArch64::STPXi), SrcReg, isKill,
6335 AArch64::sube64, AArch64::subo64, FI, MMO);
6337 }
else if (AArch64::ZPRRegClass.hasSubClassEq(RC)) {
6338 assert(Subtarget.isSVEorStreamingSVEAvailable() &&
6339 "Unexpected register store without SVE store instructions");
6340 Opc = AArch64::STR_ZXI;
6345 if (AArch64::DDDRegClass.hasSubClassEq(RC)) {
6346 assert(Subtarget.hasNEON() &&
"Unexpected register store without NEON");
6347 Opc = AArch64::ST1Threev1d;
6352 if (AArch64::DDDDRegClass.hasSubClassEq(RC)) {
6353 assert(Subtarget.hasNEON() &&
"Unexpected register store without NEON");
6354 Opc = AArch64::ST1Fourv1d;
6356 }
else if (AArch64::QQRegClass.hasSubClassEq(RC)) {
6357 assert(Subtarget.hasNEON() &&
"Unexpected register store without NEON");
6358 Opc = AArch64::ST1Twov2d;
6360 }
else if (AArch64::ZPR2StridedOrContiguousRegClass.hasSubClassEq(RC)) {
6361 assert(Subtarget.isSVEorStreamingSVEAvailable() &&
6362 "Unexpected register store without SVE store instructions");
6363 Opc = AArch64::STR_ZZXI_STRIDED_CONTIGUOUS;
6365 }
else if (AArch64::ZPR2RegClass.hasSubClassEq(RC)) {
6366 assert(Subtarget.isSVEorStreamingSVEAvailable() &&
6367 "Unexpected register store without SVE store instructions");
6368 Opc = AArch64::STR_ZZXI;
6373 if (AArch64::QQQRegClass.hasSubClassEq(RC)) {
6374 assert(Subtarget.hasNEON() &&
"Unexpected register store without NEON");
6375 Opc = AArch64::ST1Threev2d;
6377 }
else if (AArch64::ZPR3RegClass.hasSubClassEq(RC)) {
6378 assert(Subtarget.isSVEorStreamingSVEAvailable() &&
6379 "Unexpected register store without SVE store instructions");
6380 Opc = AArch64::STR_ZZZXI;
6385 if (AArch64::QQQQRegClass.hasSubClassEq(RC)) {
6386 assert(Subtarget.hasNEON() &&
"Unexpected register store without NEON");
6387 Opc = AArch64::ST1Fourv2d;
6389 }
else if (AArch64::ZPR4StridedOrContiguousRegClass.hasSubClassEq(RC)) {
6390 assert(Subtarget.isSVEorStreamingSVEAvailable() &&
6391 "Unexpected register store without SVE store instructions");
6392 Opc = AArch64::STR_ZZZZXI_STRIDED_CONTIGUOUS;
6394 }
else if (AArch64::ZPR4RegClass.hasSubClassEq(RC)) {
6395 assert(Subtarget.isSVEorStreamingSVEAvailable() &&
6396 "Unexpected register store without SVE store instructions");
6397 Opc = AArch64::STR_ZZZZXI;
6402 assert(
Opc &&
"Unknown register class");
6413 MI.addMemOperand(MMO);
6420 Register DestReg,
unsigned SubIdx0,
6421 unsigned SubIdx1,
int FI,
6425 bool IsUndef =
true;
6427 DestReg0 =
TRI.getSubReg(DestReg, SubIdx0);
6429 DestReg1 =
TRI.getSubReg(DestReg, SubIdx1);
6458 switch (
TRI.getSpillSize(*RC)) {
6460 if (AArch64::FPR8RegClass.hasSubClassEq(RC))
6461 Opc = AArch64::LDRBui;
6464 bool IsPNR = AArch64::PNRRegClass.hasSubClassEq(RC);
6465 if (AArch64::FPR16RegClass.hasSubClassEq(RC))
6466 Opc = AArch64::LDRHui;
6467 else if (IsPNR || AArch64::PPRRegClass.hasSubClassEq(RC)) {
6468 assert(Subtarget.isSVEorStreamingSVEAvailable() &&
6469 "Unexpected register load without SVE load instructions");
6472 Opc = AArch64::LDR_PXI;
6478 if (AArch64::GPR32allRegClass.hasSubClassEq(RC)) {
6479 Opc = AArch64::LDRWui;
6483 assert(DestReg != AArch64::WSP);
6484 }
else if (AArch64::FPR32RegClass.hasSubClassEq(RC))
6485 Opc = AArch64::LDRSui;
6486 else if (AArch64::PPR2RegClass.hasSubClassEq(RC)) {
6487 Opc = AArch64::LDR_PPXI;
6492 if (AArch64::GPR64allRegClass.hasSubClassEq(RC)) {
6493 Opc = AArch64::LDRXui;
6497 assert(DestReg != AArch64::SP);
6498 }
else if (AArch64::FPR64RegClass.hasSubClassEq(RC)) {
6499 Opc = AArch64::LDRDui;
6500 }
else if (AArch64::WSeqPairsClassRegClass.hasSubClassEq(RC)) {
6502 get(AArch64::LDPWi), DestReg, AArch64::sube32,
6503 AArch64::subo32, FI, MMO);
6508 if (AArch64::FPR128RegClass.hasSubClassEq(RC))
6509 Opc = AArch64::LDRQui;
6510 else if (AArch64::DDRegClass.hasSubClassEq(RC)) {
6511 assert(Subtarget.hasNEON() &&
"Unexpected register load without NEON");
6512 Opc = AArch64::LD1Twov1d;
6514 }
else if (AArch64::XSeqPairsClassRegClass.hasSubClassEq(RC)) {
6516 get(AArch64::LDPXi), DestReg, AArch64::sube64,
6517 AArch64::subo64, FI, MMO);
6519 }
else if (AArch64::ZPRRegClass.hasSubClassEq(RC)) {
6520 assert(Subtarget.isSVEorStreamingSVEAvailable() &&
6521 "Unexpected register load without SVE load instructions");
6522 Opc = AArch64::LDR_ZXI;
6527 if (AArch64::DDDRegClass.hasSubClassEq(RC)) {
6528 assert(Subtarget.hasNEON() &&
"Unexpected register load without NEON");
6529 Opc = AArch64::LD1Threev1d;
6534 if (AArch64::DDDDRegClass.hasSubClassEq(RC)) {
6535 assert(Subtarget.hasNEON() &&
"Unexpected register load without NEON");
6536 Opc = AArch64::LD1Fourv1d;
6538 }
else if (AArch64::QQRegClass.hasSubClassEq(RC)) {
6539 assert(Subtarget.hasNEON() &&
"Unexpected register load without NEON");
6540 Opc = AArch64::LD1Twov2d;
6542 }
else if (AArch64::ZPR2StridedOrContiguousRegClass.hasSubClassEq(RC)) {
6543 assert(Subtarget.isSVEorStreamingSVEAvailable() &&
6544 "Unexpected register load without SVE load instructions");
6545 Opc = AArch64::LDR_ZZXI_STRIDED_CONTIGUOUS;
6547 }
else if (AArch64::ZPR2RegClass.hasSubClassEq(RC)) {
6548 assert(Subtarget.isSVEorStreamingSVEAvailable() &&
6549 "Unexpected register load without SVE load instructions");
6550 Opc = AArch64::LDR_ZZXI;
6555 if (AArch64::QQQRegClass.hasSubClassEq(RC)) {
6556 assert(Subtarget.hasNEON() &&
"Unexpected register load without NEON");
6557 Opc = AArch64::LD1Threev2d;
6559 }
else if (AArch64::ZPR3RegClass.hasSubClassEq(RC)) {
6560 assert(Subtarget.isSVEorStreamingSVEAvailable() &&
6561 "Unexpected register load without SVE load instructions");
6562 Opc = AArch64::LDR_ZZZXI;
6567 if (AArch64::QQQQRegClass.hasSubClassEq(RC)) {
6568 assert(Subtarget.hasNEON() &&
"Unexpected register load without NEON");
6569 Opc = AArch64::LD1Fourv2d;
6571 }
else if (AArch64::ZPR4StridedOrContiguousRegClass.hasSubClassEq(RC)) {
6572 assert(Subtarget.isSVEorStreamingSVEAvailable() &&
6573 "Unexpected register load without SVE load instructions");
6574 Opc = AArch64::LDR_ZZZZXI_STRIDED_CONTIGUOUS;
6576 }
else if (AArch64::ZPR4RegClass.hasSubClassEq(RC)) {
6577 assert(Subtarget.isSVEorStreamingSVEAvailable() &&
6578 "Unexpected register load without SVE load instructions");
6579 Opc = AArch64::LDR_ZZZZXI;
6585 assert(
Opc &&
"Unknown register class");
6595 MI.addMemOperand(MMO);
6602 UseMI.getIterator()),
6604 return I.modifiesRegister(AArch64::NZCV, TRI) ||
6605 I.readsRegister(AArch64::NZCV, TRI);
6609void AArch64InstrInfo::decomposeStackOffsetForDwarfOffsets(
6614 assert(
Offset.getScalable() % 2 == 0 &&
"Invalid frame offset");
6621 ByteSized =
Offset.getFixed();
6622 VGSized =
Offset.getScalable() / 2;
6628void AArch64InstrInfo::decomposeStackOffsetForFrameOffsets(
6630 int64_t &NumDataVectors) {
6634 assert(
Offset.getScalable() % 2 == 0 &&
"Invalid frame offset");
6636 NumBytes =
Offset.getFixed();
6638 NumPredicateVectors =
Offset.getScalable() / 2;
6643 if (NumPredicateVectors % 8 == 0 || NumPredicateVectors < -64 ||
6644 NumPredicateVectors > 62) {
6645 NumDataVectors = NumPredicateVectors / 8;
6646 NumPredicateVectors -= NumDataVectors * 8;
6672 Expr.
push_back((
char)dwarf::DW_OP_bregx);
6680 int64_t OffsetFromDefCFA) {
6694 Comment << (NumBytes < 0 ?
" - " :
" + ") << std::abs(NumBytes);
6695 if (!RegScale.empty())
6705 int64_t NumBytes, NumVGScaledBytes;
6706 AArch64InstrInfo::decomposeStackOffsetForDwarfOffsets(
Offset, NumBytes,
6708 std::string CommentBuffer;
6711 if (
Reg == AArch64::SP)
6713 else if (
Reg == AArch64::FP)
6720 unsigned DwarfReg =
TRI.getDwarfRegNum(
Reg,
true);
6721 assert(DwarfReg <= 31 &&
"DwarfReg out of bounds (0..31)");
6723 Expr.
push_back(dwarf::DW_OP_breg0 + DwarfReg);
6726 if (NumVGScaledBytes) {
6736 DefCfaExpr.
push_back(dwarf::DW_CFA_def_cfa_expression);
6744 unsigned FrameReg,
unsigned Reg,
6746 bool LastAdjustmentWasScalable) {
6747 if (
Offset.getScalable())
6750 if (FrameReg == Reg && !LastAdjustmentWasScalable)
6753 unsigned DwarfReg =
TRI.getDwarfRegNum(Reg,
true);
6760 std::optional<int64_t> IncomingVGOffsetFromDefCFA) {
6761 int64_t NumBytes, NumVGScaledBytes;
6762 AArch64InstrInfo::decomposeStackOffsetForDwarfOffsets(
6763 OffsetFromDefCFA, NumBytes, NumVGScaledBytes);
6765 unsigned DwarfReg =
TRI.getDwarfRegNum(Reg,
true);
6768 if (!NumVGScaledBytes)
6771 std::string CommentBuffer;
6776 assert(NumVGScaledBytes &&
"Expected scalable offset");
6780 if (IncomingVGOffsetFromDefCFA) {
6782 VGRegScale =
"* IncomingVG";
6785 VGRegScale =
"* VG";
6789 OffsetExpr.
push_back(dwarf::DW_OP_plus);
6798 CfaExpr.
push_back(dwarf::DW_CFA_expression);
6813 unsigned SrcReg, int64_t
Offset,
unsigned Opc,
6816 bool *HasWinCFI,
bool EmitCFAOffset,
6819 unsigned MaxEncoding, ShiftSize;
6821 case AArch64::ADDXri:
6822 case AArch64::ADDSXri:
6823 case AArch64::SUBXri:
6824 case AArch64::SUBSXri:
6825 MaxEncoding = 0xfff;
6828 case AArch64::ADDVL_XXI:
6829 case AArch64::ADDPL_XXI:
6830 case AArch64::ADDSVL_XXI:
6831 case AArch64::ADDSPL_XXI:
6846 if (
Opc == AArch64::ADDVL_XXI ||
Opc == AArch64::ADDSVL_XXI)
6848 else if (
Opc == AArch64::ADDPL_XXI ||
Opc == AArch64::ADDSPL_XXI)
6862 const unsigned MaxEncodableValue = MaxEncoding << ShiftSize;
6864 if (TmpReg == AArch64::XZR)
6865 TmpReg =
MBB.getParent()->getRegInfo().createVirtualRegister(
6866 &AArch64::GPR64RegClass);
6868 uint64_t ThisVal = std::min<uint64_t>(
Offset, MaxEncodableValue);
6869 unsigned LocalShiftSize = 0;
6870 if (ThisVal > MaxEncoding) {
6871 ThisVal = ThisVal >> ShiftSize;
6872 LocalShiftSize = ShiftSize;
6874 assert((ThisVal >> ShiftSize) <= MaxEncoding &&
6875 "Encoding cannot handle value that big");
6877 Offset -= ThisVal << LocalShiftSize;
6882 .
addImm(Sign * (
int)ThisVal);
6892 if (Sign == -1 ||
Opc == AArch64::SUBXri ||
Opc == AArch64::SUBSXri)
6893 CFAOffset += Change;
6895 CFAOffset -= Change;
6896 if (EmitCFAOffset && DestReg == TmpReg) {
6909 int Imm = (int)(ThisVal << LocalShiftSize);
6910 if (VScale != 1 && DestReg == AArch64::SP) {
6916 }
else if ((DestReg == AArch64::FP && SrcReg == AArch64::SP) ||
6917 (SrcReg == AArch64::FP && DestReg == AArch64::SP)) {
6918 assert(VScale == 1 &&
"Expected non-scalable operation");
6927 assert(
Offset == 0 &&
"Expected remaining offset to be zero to "
6928 "emit a single SEH directive");
6929 }
else if (DestReg == AArch64::SP) {
6930 assert(VScale == 1 &&
"Expected non-scalable operation");
6933 assert(SrcReg == AArch64::SP &&
"Unexpected SrcReg for SEH_StackAlloc");
6946 unsigned DestReg,
unsigned SrcReg,
6949 bool NeedsWinCFI,
bool *HasWinCFI,
6951 unsigned FrameReg) {
6958 bool UseSVL =
F.hasFnAttribute(
"aarch64_pstate_sm_body");
6960 int64_t Bytes, NumPredicateVectors, NumDataVectors;
6961 AArch64InstrInfo::decomposeStackOffsetForFrameOffsets(
6962 Offset, Bytes, NumPredicateVectors, NumDataVectors);
6965 bool NeedsFinalDefNZCV = SetNZCV && (NumPredicateVectors || NumDataVectors);
6966 if (NeedsFinalDefNZCV)
6970 if (Bytes || (!
Offset && SrcReg != DestReg)) {
6971 assert((DestReg != AArch64::SP || Bytes % 8 == 0) &&
6972 "SP increment/decrement not 8-byte aligned");
6973 unsigned Opc = SetNZCV ? AArch64::ADDSXri : AArch64::ADDXri;
6976 Opc = SetNZCV ? AArch64::SUBSXri : AArch64::SUBXri;
6979 NeedsWinCFI, HasWinCFI, EmitCFAOffset, CFAOffset,
6981 CFAOffset += (
Opc == AArch64::ADDXri ||
Opc == AArch64::ADDSXri)
6988 assert(!(NeedsWinCFI && NumPredicateVectors) &&
6989 "WinCFI can't allocate fractions of an SVE data vector");
6991 if (NumDataVectors) {
6993 UseSVL ? AArch64::ADDSVL_XXI : AArch64::ADDVL_XXI,
TII,
6994 Flag, NeedsWinCFI, HasWinCFI, EmitCFAOffset, CFAOffset,
7000 if (NumPredicateVectors) {
7001 assert(DestReg != AArch64::SP &&
"Unaligned access to SP");
7003 UseSVL ? AArch64::ADDSPL_XXI : AArch64::ADDPL_XXI,
TII,
7004 Flag, NeedsWinCFI, HasWinCFI, EmitCFAOffset, CFAOffset,
7008 if (NeedsFinalDefNZCV)
7030 if (
MI.isFullCopy()) {
7033 if (SrcReg == AArch64::SP && DstReg.
isVirtual()) {
7037 if (DstReg == AArch64::SP && SrcReg.
isVirtual()) {
7042 if (SrcReg == AArch64::NZCV || DstReg == AArch64::NZCV)
7070 if (
MI.isCopy() &&
Ops.size() == 1 &&
7072 (
Ops[0] == 0 ||
Ops[0] == 1)) {
7073 bool IsSpill =
Ops[0] == 0;
7074 bool IsFill = !IsSpill;
7086 :
TRI.getMinimalPhysRegClass(Reg);
7092 "Mismatched register size in non subreg COPY");
7099 return &*--InsertPt;
7111 if (IsSpill && DstMO.
isUndef() && SrcReg == AArch64::WZR &&
7114 "Unexpected subreg on physical register");
7116 FrameIndex, &AArch64::GPR64RegClass,
Register());
7117 return &*--InsertPt;
7134 case AArch64::sub_32:
7135 if (AArch64::GPR64RegClass.hasSubClassEq(
getRegClass(DstReg)))
7136 FillRC = &AArch64::GPR32RegClass;
7139 FillRC = &AArch64::FPR32RegClass;
7142 FillRC = &AArch64::FPR64RegClass;
7148 TRI.getRegSizeInBits(*FillRC) &&
7149 "Mismatched regclass size on folded subreg COPY");
7168 bool *OutUseUnscaledOp,
7169 unsigned *OutUnscaledOp,
7170 int64_t *EmittableOffset) {
7172 if (EmittableOffset)
7173 *EmittableOffset = 0;
7174 if (OutUseUnscaledOp)
7175 *OutUseUnscaledOp =
false;
7181 switch (
MI.getOpcode()) {
7184 case AArch64::LD1Rv1d:
7185 case AArch64::LD1Rv2s:
7186 case AArch64::LD1Rv2d:
7187 case AArch64::LD1Rv4h:
7188 case AArch64::LD1Rv4s:
7189 case AArch64::LD1Rv8b:
7190 case AArch64::LD1Rv8h:
7191 case AArch64::LD1Rv16b:
7192 case AArch64::LD1Twov2d:
7193 case AArch64::LD1Threev2d:
7194 case AArch64::LD1Fourv2d:
7195 case AArch64::LD1Twov1d:
7196 case AArch64::LD1Threev1d:
7197 case AArch64::LD1Fourv1d:
7198 case AArch64::ST1Twov2d:
7199 case AArch64::ST1Threev2d:
7200 case AArch64::ST1Fourv2d:
7201 case AArch64::ST1Twov1d:
7202 case AArch64::ST1Threev1d:
7203 case AArch64::ST1Fourv1d:
7204 case AArch64::ST1i8:
7205 case AArch64::ST1i16:
7206 case AArch64::ST1i32:
7207 case AArch64::ST1i64:
7209 case AArch64::IRGstack:
7210 case AArch64::STGloop:
7211 case AArch64::STZGloop:
7216 TypeSize ScaleValue(0U,
false), Width(0U,
false);
7217 int64_t MinOff, MaxOff;
7223 bool IsMulVL = ScaleValue.isScalable();
7224 unsigned Scale = ScaleValue.getKnownMinValue();
7234 std::optional<unsigned> UnscaledOp =
7236 bool useUnscaledOp = UnscaledOp && (
Offset % Scale ||
Offset < 0);
7237 if (useUnscaledOp &&
7242 Scale = ScaleValue.getKnownMinValue();
7243 assert(IsMulVL == ScaleValue.isScalable() &&
7244 "Unscaled opcode has different value for scalable");
7246 int64_t Remainder =
Offset % Scale;
7247 assert(!(Remainder && useUnscaledOp) &&
7248 "Cannot have remainder when using unscaled op");
7250 assert(MinOff < MaxOff &&
"Unexpected Min/Max offsets");
7251 int64_t NewOffset =
Offset / Scale;
7252 if (MinOff <= NewOffset && NewOffset <= MaxOff)
7255 NewOffset = NewOffset < 0 ? MinOff : MaxOff;
7259 if (EmittableOffset)
7260 *EmittableOffset = NewOffset;
7261 if (OutUseUnscaledOp)
7262 *OutUseUnscaledOp = useUnscaledOp;
7263 if (OutUnscaledOp && UnscaledOp)
7264 *OutUnscaledOp = *UnscaledOp;
7277 unsigned Opcode =
MI.getOpcode();
7278 unsigned ImmIdx = FrameRegIdx + 1;
7280 if (Opcode == AArch64::ADDSXri || Opcode == AArch64::ADDXri) {
7285 MI.eraseFromParent();
7291 unsigned UnscaledOp;
7294 &UnscaledOp, &NewOffset);
7298 MI.getOperand(FrameRegIdx).ChangeToRegister(FrameReg,
false);
7300 MI.setDesc(
TII->get(UnscaledOp));
7302 MI.getOperand(ImmIdx).ChangeToImmediate(NewOffset);
7318bool AArch64InstrInfo::useMachineCombiner()
const {
return true; }
7323 case AArch64::ADDSWrr:
7324 case AArch64::ADDSWri:
7325 case AArch64::ADDSXrr:
7326 case AArch64::ADDSXri:
7327 case AArch64::SUBSWrr:
7328 case AArch64::SUBSXrr:
7330 case AArch64::SUBSWri:
7331 case AArch64::SUBSXri:
7342 case AArch64::ADDWrr:
7343 case AArch64::ADDWri:
7344 case AArch64::SUBWrr:
7345 case AArch64::ADDSWrr:
7346 case AArch64::ADDSWri:
7347 case AArch64::SUBSWrr:
7349 case AArch64::SUBWri:
7350 case AArch64::SUBSWri:
7361 case AArch64::ADDXrr:
7362 case AArch64::ADDXri:
7363 case AArch64::SUBXrr:
7364 case AArch64::ADDSXrr:
7365 case AArch64::ADDSXri:
7366 case AArch64::SUBSXrr:
7368 case AArch64::SUBXri:
7369 case AArch64::SUBSXri:
7370 case AArch64::ADDv8i8:
7371 case AArch64::ADDv16i8:
7372 case AArch64::ADDv4i16:
7373 case AArch64::ADDv8i16:
7374 case AArch64::ADDv2i32:
7375 case AArch64::ADDv4i32:
7376 case AArch64::SUBv8i8:
7377 case AArch64::SUBv16i8:
7378 case AArch64::SUBv4i16:
7379 case AArch64::SUBv8i16:
7380 case AArch64::SUBv2i32:
7381 case AArch64::SUBv4i32:
7394 case AArch64::FADDHrr:
7395 case AArch64::FADDSrr:
7396 case AArch64::FADDDrr:
7397 case AArch64::FADDv4f16:
7398 case AArch64::FADDv8f16:
7399 case AArch64::FADDv2f32:
7400 case AArch64::FADDv2f64:
7401 case AArch64::FADDv4f32:
7402 case AArch64::FSUBHrr:
7403 case AArch64::FSUBSrr:
7404 case AArch64::FSUBDrr:
7405 case AArch64::FSUBv4f16:
7406 case AArch64::FSUBv8f16:
7407 case AArch64::FSUBv2f32:
7408 case AArch64::FSUBv2f64:
7409 case AArch64::FSUBv4f32:
7428 unsigned CombineOpc,
unsigned ZeroReg = 0,
7429 bool CheckZeroReg =
false) {
7436 if (!
MI ||
MI->getParent() != &
MBB ||
MI->getOpcode() != CombineOpc)
7443 assert(
MI->getNumOperands() >= 4 &&
MI->getOperand(0).isReg() &&
7444 MI->getOperand(1).isReg() &&
MI->getOperand(2).isReg() &&
7445 MI->getOperand(3).isReg() &&
"MAdd/MSub must have a least 4 regs");
7447 if (
MI->getOperand(3).getReg() != ZeroReg)
7452 MI->findRegisterDefOperandIdx(AArch64::NZCV,
nullptr,
true) == -1)
7461 unsigned MulOpc,
unsigned ZeroReg) {
7476bool AArch64InstrInfo::isAssociativeAndCommutative(
const MachineInstr &Inst,
7477 bool Invert)
const {
7483 case AArch64::FADDHrr:
7484 case AArch64::FADDSrr:
7485 case AArch64::FADDDrr:
7486 case AArch64::FMULHrr:
7487 case AArch64::FMULSrr:
7488 case AArch64::FMULDrr:
7489 case AArch64::FMULX16:
7490 case AArch64::FMULX32:
7491 case AArch64::FMULX64:
7493 case AArch64::FADDv4f16:
7494 case AArch64::FADDv8f16:
7495 case AArch64::FADDv2f32:
7496 case AArch64::FADDv4f32:
7497 case AArch64::FADDv2f64:
7498 case AArch64::FMULv4f16:
7499 case AArch64::FMULv8f16:
7500 case AArch64::FMULv2f32:
7501 case AArch64::FMULv4f32:
7502 case AArch64::FMULv2f64:
7503 case AArch64::FMULXv4f16:
7504 case AArch64::FMULXv8f16:
7505 case AArch64::FMULXv2f32:
7506 case AArch64::FMULXv4f32:
7507 case AArch64::FMULXv2f64:
7511 case AArch64::FADD_ZZZ_H:
7512 case AArch64::FADD_ZZZ_S:
7513 case AArch64::FADD_ZZZ_D:
7514 case AArch64::FMUL_ZZZ_H:
7515 case AArch64::FMUL_ZZZ_S:
7516 case AArch64::FMUL_ZZZ_D:
7527 case AArch64::ADDWrr:
7528 case AArch64::ADDXrr:
7529 case AArch64::ANDWrr:
7530 case AArch64::ANDXrr:
7531 case AArch64::ORRWrr:
7532 case AArch64::ORRXrr:
7533 case AArch64::EORWrr:
7534 case AArch64::EORXrr:
7535 case AArch64::EONWrr:
7536 case AArch64::EONXrr:
7540 case AArch64::ADDv8i8:
7541 case AArch64::ADDv16i8:
7542 case AArch64::ADDv4i16:
7543 case AArch64::ADDv8i16:
7544 case AArch64::ADDv2i32:
7545 case AArch64::ADDv4i32:
7546 case AArch64::ADDv1i64:
7547 case AArch64::ADDv2i64:
7548 case AArch64::MULv8i8:
7549 case AArch64::MULv16i8:
7550 case AArch64::MULv4i16:
7551 case AArch64::MULv8i16:
7552 case AArch64::MULv2i32:
7553 case AArch64::MULv4i32:
7554 case AArch64::ANDv8i8:
7555 case AArch64::ANDv16i8:
7556 case AArch64::ORRv8i8:
7557 case AArch64::ORRv16i8:
7558 case AArch64::EORv8i8:
7559 case AArch64::EORv16i8:
7561 case AArch64::ADD_ZZZ_B:
7562 case AArch64::ADD_ZZZ_H:
7563 case AArch64::ADD_ZZZ_S:
7564 case AArch64::ADD_ZZZ_D:
7565 case AArch64::MUL_ZZZ_B:
7566 case AArch64::MUL_ZZZ_H:
7567 case AArch64::MUL_ZZZ_S:
7568 case AArch64::MUL_ZZZ_D:
7569 case AArch64::AND_ZZZ:
7570 case AArch64::ORR_ZZZ:
7571 case AArch64::EOR_ZZZ:
7602 auto setFound = [&](
int Opcode,
int Operand,
unsigned ZeroReg,
7610 auto setVFound = [&](
int Opcode,
int Operand,
unsigned Pattern) {
7622 case AArch64::ADDWrr:
7624 "ADDWrr does not have register operands");
7625 setFound(AArch64::MADDWrrr, 1, AArch64::WZR, MCP::MULADDW_OP1);
7626 setFound(AArch64::MADDWrrr, 2, AArch64::WZR, MCP::MULADDW_OP2);
7628 case AArch64::ADDXrr:
7629 setFound(AArch64::MADDXrrr, 1, AArch64::XZR, MCP::MULADDX_OP1);
7630 setFound(AArch64::MADDXrrr, 2, AArch64::XZR, MCP::MULADDX_OP2);
7632 case AArch64::SUBWrr:
7633 setFound(AArch64::MADDWrrr, 2, AArch64::WZR, MCP::MULSUBW_OP2);
7634 setFound(AArch64::MADDWrrr, 1, AArch64::WZR, MCP::MULSUBW_OP1);
7636 case AArch64::SUBXrr:
7637 setFound(AArch64::MADDXrrr, 2, AArch64::XZR, MCP::MULSUBX_OP2);
7638 setFound(AArch64::MADDXrrr, 1, AArch64::XZR, MCP::MULSUBX_OP1);
7640 case AArch64::ADDWri:
7641 setFound(AArch64::MADDWrrr, 1, AArch64::WZR, MCP::MULADDWI_OP1);
7643 case AArch64::ADDXri:
7644 setFound(AArch64::MADDXrrr, 1, AArch64::XZR, MCP::MULADDXI_OP1);
7646 case AArch64::SUBWri:
7647 setFound(AArch64::MADDWrrr, 1, AArch64::WZR, MCP::MULSUBWI_OP1);
7649 case AArch64::SUBXri:
7650 setFound(AArch64::MADDXrrr, 1, AArch64::XZR, MCP::MULSUBXI_OP1);
7652 case AArch64::ADDv8i8:
7653 setVFound(AArch64::MULv8i8, 1, MCP::MULADDv8i8_OP1);
7654 setVFound(AArch64::MULv8i8, 2, MCP::MULADDv8i8_OP2);
7656 case AArch64::ADDv16i8:
7657 setVFound(AArch64::MULv16i8, 1, MCP::MULADDv16i8_OP1);
7658 setVFound(AArch64::MULv16i8, 2, MCP::MULADDv16i8_OP2);
7660 case AArch64::ADDv4i16:
7661 setVFound(AArch64::MULv4i16, 1, MCP::MULADDv4i16_OP1);
7662 setVFound(AArch64::MULv4i16, 2, MCP::MULADDv4i16_OP2);
7663 setVFound(AArch64::MULv4i16_indexed, 1, MCP::MULADDv4i16_indexed_OP1);
7664 setVFound(AArch64::MULv4i16_indexed, 2, MCP::MULADDv4i16_indexed_OP2);
7666 case AArch64::ADDv8i16:
7667 setVFound(AArch64::MULv8i16, 1, MCP::MULADDv8i16_OP1);
7668 setVFound(AArch64::MULv8i16, 2, MCP::MULADDv8i16_OP2);
7669 setVFound(AArch64::MULv8i16_indexed, 1, MCP::MULADDv8i16_indexed_OP1);
7670 setVFound(AArch64::MULv8i16_indexed, 2, MCP::MULADDv8i16_indexed_OP2);
7672 case AArch64::ADDv2i32:
7673 setVFound(AArch64::MULv2i32, 1, MCP::MULADDv2i32_OP1);
7674 setVFound(AArch64::MULv2i32, 2, MCP::MULADDv2i32_OP2);
7675 setVFound(AArch64::MULv2i32_indexed, 1, MCP::MULADDv2i32_indexed_OP1);
7676 setVFound(AArch64::MULv2i32_indexed, 2, MCP::MULADDv2i32_indexed_OP2);
7678 case AArch64::ADDv4i32:
7679 setVFound(AArch64::MULv4i32, 1, MCP::MULADDv4i32_OP1);
7680 setVFound(AArch64::MULv4i32, 2, MCP::MULADDv4i32_OP2);
7681 setVFound(AArch64::MULv4i32_indexed, 1, MCP::MULADDv4i32_indexed_OP1);
7682 setVFound(AArch64::MULv4i32_indexed, 2, MCP::MULADDv4i32_indexed_OP2);
7684 case AArch64::SUBv8i8:
7685 setVFound(AArch64::MULv8i8, 1, MCP::MULSUBv8i8_OP1);
7686 setVFound(AArch64::MULv8i8, 2, MCP::MULSUBv8i8_OP2);
7688 case AArch64::SUBv16i8:
7689 setVFound(AArch64::MULv16i8, 1, MCP::MULSUBv16i8_OP1);
7690 setVFound(AArch64::MULv16i8, 2, MCP::MULSUBv16i8_OP2);
7692 case AArch64::SUBv4i16:
7693 setVFound(AArch64::MULv4i16, 1, MCP::MULSUBv4i16_OP1);
7694 setVFound(AArch64::MULv4i16, 2, MCP::MULSUBv4i16_OP2);
7695 setVFound(AArch64::MULv4i16_indexed, 1, MCP::MULSUBv4i16_indexed_OP1);
7696 setVFound(AArch64::MULv4i16_indexed, 2, MCP::MULSUBv4i16_indexed_OP2);
7698 case AArch64::SUBv8i16:
7699 setVFound(AArch64::MULv8i16, 1, MCP::MULSUBv8i16_OP1);
7700 setVFound(AArch64::MULv8i16, 2, MCP::MULSUBv8i16_OP2);
7701 setVFound(AArch64::MULv8i16_indexed, 1, MCP::MULSUBv8i16_indexed_OP1);
7702 setVFound(AArch64::MULv8i16_indexed, 2, MCP::MULSUBv8i16_indexed_OP2);
7704 case AArch64::SUBv2i32:
7705 setVFound(AArch64::MULv2i32, 1, MCP::MULSUBv2i32_OP1);
7706 setVFound(AArch64::MULv2i32, 2, MCP::MULSUBv2i32_OP2);
7707 setVFound(AArch64::MULv2i32_indexed, 1, MCP::MULSUBv2i32_indexed_OP1);
7708 setVFound(AArch64::MULv2i32_indexed, 2, MCP::MULSUBv2i32_indexed_OP2);
7710 case AArch64::SUBv4i32:
7711 setVFound(AArch64::MULv4i32, 1, MCP::MULSUBv4i32_OP1);
7712 setVFound(AArch64::MULv4i32, 2, MCP::MULSUBv4i32_OP2);
7713 setVFound(AArch64::MULv4i32_indexed, 1, MCP::MULSUBv4i32_indexed_OP1);
7714 setVFound(AArch64::MULv4i32_indexed, 2, MCP::MULSUBv4i32_indexed_OP2);
7720bool AArch64InstrInfo::isAccumulationOpcode(
unsigned Opcode)
const {
7724 case AArch64::UABALB_ZZZ_D:
7725 case AArch64::UABALB_ZZZ_H:
7726 case AArch64::UABALB_ZZZ_S:
7727 case AArch64::UABALT_ZZZ_D:
7728 case AArch64::UABALT_ZZZ_H:
7729 case AArch64::UABALT_ZZZ_S:
7730 case AArch64::SABALB_ZZZ_D:
7731 case AArch64::SABALB_ZZZ_S:
7732 case AArch64::SABALB_ZZZ_H:
7733 case AArch64::SABALT_ZZZ_D:
7734 case AArch64::SABALT_ZZZ_S:
7735 case AArch64::SABALT_ZZZ_H:
7736 case AArch64::UABALv16i8_v8i16:
7737 case AArch64::UABALv2i32_v2i64:
7738 case AArch64::UABALv4i16_v4i32:
7739 case AArch64::UABALv4i32_v2i64:
7740 case AArch64::UABALv8i16_v4i32:
7741 case AArch64::UABALv8i8_v8i16:
7742 case AArch64::UABAv16i8:
7743 case AArch64::UABAv2i32:
7744 case AArch64::UABAv4i16:
7745 case AArch64::UABAv4i32:
7746 case AArch64::UABAv8i16:
7747 case AArch64::UABAv8i8:
7748 case AArch64::SABALv16i8_v8i16:
7749 case AArch64::SABALv2i32_v2i64:
7750 case AArch64::SABALv4i16_v4i32:
7751 case AArch64::SABALv4i32_v2i64:
7752 case AArch64::SABALv8i16_v4i32:
7753 case AArch64::SABALv8i8_v8i16:
7754 case AArch64::SABAv16i8:
7755 case AArch64::SABAv2i32:
7756 case AArch64::SABAv4i16:
7757 case AArch64::SABAv4i32:
7758 case AArch64::SABAv8i16:
7759 case AArch64::SABAv8i8:
7766unsigned AArch64InstrInfo::getAccumulationStartOpcode(
7767 unsigned AccumulationOpcode)
const {
7768 switch (AccumulationOpcode) {
7771 case AArch64::UABALB_ZZZ_D:
7772 return AArch64::UABDLB_ZZZ_D;
7773 case AArch64::UABALB_ZZZ_H:
7774 return AArch64::UABDLB_ZZZ_H;
7775 case AArch64::UABALB_ZZZ_S:
7776 return AArch64::UABDLB_ZZZ_S;
7777 case AArch64::UABALT_ZZZ_D:
7778 return AArch64::UABDLT_ZZZ_D;
7779 case AArch64::UABALT_ZZZ_H:
7780 return AArch64::UABDLT_ZZZ_H;
7781 case AArch64::UABALT_ZZZ_S:
7782 return AArch64::UABDLT_ZZZ_S;
7783 case AArch64::UABALv16i8_v8i16:
7784 return AArch64::UABDLv16i8_v8i16;
7785 case AArch64::UABALv2i32_v2i64:
7786 return AArch64::UABDLv2i32_v2i64;
7787 case AArch64::UABALv4i16_v4i32:
7788 return AArch64::UABDLv4i16_v4i32;
7789 case AArch64::UABALv4i32_v2i64:
7790 return AArch64::UABDLv4i32_v2i64;
7791 case AArch64::UABALv8i16_v4i32:
7792 return AArch64::UABDLv8i16_v4i32;
7793 case AArch64::UABALv8i8_v8i16:
7794 return AArch64::UABDLv8i8_v8i16;
7795 case AArch64::UABAv16i8:
7796 return AArch64::UABDv16i8;
7797 case AArch64::UABAv2i32:
7798 return AArch64::UABDv2i32;
7799 case AArch64::UABAv4i16:
7800 return AArch64::UABDv4i16;
7801 case AArch64::UABAv4i32:
7802 return AArch64::UABDv4i32;
7803 case AArch64::UABAv8i16:
7804 return AArch64::UABDv8i16;
7805 case AArch64::UABAv8i8:
7806 return AArch64::UABDv8i8;
7807 case AArch64::SABALB_ZZZ_D:
7808 return AArch64::SABDLB_ZZZ_D;
7809 case AArch64::SABALB_ZZZ_S:
7810 return AArch64::SABDLB_ZZZ_S;
7811 case AArch64::SABALB_ZZZ_H:
7812 return AArch64::SABDLB_ZZZ_H;
7813 case AArch64::SABALT_ZZZ_D:
7814 return AArch64::SABDLT_ZZZ_D;
7815 case AArch64::SABALT_ZZZ_S:
7816 return AArch64::SABDLT_ZZZ_S;
7817 case AArch64::SABALT_ZZZ_H:
7818 return AArch64::SABDLT_ZZZ_H;
7819 case AArch64::SABALv16i8_v8i16:
7820 return AArch64::SABDLv16i8_v8i16;
7821 case AArch64::SABALv2i32_v2i64:
7822 return AArch64::SABDLv2i32_v2i64;
7823 case AArch64::SABALv4i16_v4i32:
7824 return AArch64::SABDLv4i16_v4i32;
7825 case AArch64::SABALv4i32_v2i64:
7826 return AArch64::SABDLv4i32_v2i64;
7827 case AArch64::SABALv8i16_v4i32:
7828 return AArch64::SABDLv8i16_v4i32;
7829 case AArch64::SABALv8i8_v8i16:
7830 return AArch64::SABDLv8i8_v8i16;
7831 case AArch64::SABAv16i8:
7832 return AArch64::SABDv16i8;
7833 case AArch64::SABAv2i32:
7834 return AArch64::SABAv2i32;
7835 case AArch64::SABAv4i16:
7836 return AArch64::SABDv4i16;
7837 case AArch64::SABAv4i32:
7838 return AArch64::SABDv4i32;
7839 case AArch64::SABAv8i16:
7840 return AArch64::SABDv8i16;
7841 case AArch64::SABAv8i8:
7842 return AArch64::SABDv8i8;
7858 auto Match = [&](
int Opcode,
int Operand,
unsigned Pattern) ->
bool {
7870 assert(
false &&
"Unsupported FP instruction in combiner\n");
7872 case AArch64::FADDHrr:
7874 "FADDHrr does not have register operands");
7876 Found = Match(AArch64::FMULHrr, 1, MCP::FMULADDH_OP1);
7877 Found |= Match(AArch64::FMULHrr, 2, MCP::FMULADDH_OP2);
7879 case AArch64::FADDSrr:
7881 "FADDSrr does not have register operands");
7883 Found |= Match(AArch64::FMULSrr, 1, MCP::FMULADDS_OP1) ||
7884 Match(AArch64::FMULv1i32_indexed, 1, MCP::FMLAv1i32_indexed_OP1);
7886 Found |= Match(AArch64::FMULSrr, 2, MCP::FMULADDS_OP2) ||
7887 Match(AArch64::FMULv1i32_indexed, 2, MCP::FMLAv1i32_indexed_OP2);
7889 case AArch64::FADDDrr:
7890 Found |= Match(AArch64::FMULDrr, 1, MCP::FMULADDD_OP1) ||
7891 Match(AArch64::FMULv1i64_indexed, 1, MCP::FMLAv1i64_indexed_OP1);
7893 Found |= Match(AArch64::FMULDrr, 2, MCP::FMULADDD_OP2) ||
7894 Match(AArch64::FMULv1i64_indexed, 2, MCP::FMLAv1i64_indexed_OP2);
7896 case AArch64::FADDv4f16:
7897 Found |= Match(AArch64::FMULv4i16_indexed, 1, MCP::FMLAv4i16_indexed_OP1) ||
7898 Match(AArch64::FMULv4f16, 1, MCP::FMLAv4f16_OP1);
7900 Found |= Match(AArch64::FMULv4i16_indexed, 2, MCP::FMLAv4i16_indexed_OP2) ||
7901 Match(AArch64::FMULv4f16, 2, MCP::FMLAv4f16_OP2);
7903 case AArch64::FADDv8f16:
7904 Found |= Match(AArch64::FMULv8i16_indexed, 1, MCP::FMLAv8i16_indexed_OP1) ||
7905 Match(AArch64::FMULv8f16, 1, MCP::FMLAv8f16_OP1);
7907 Found |= Match(AArch64::FMULv8i16_indexed, 2, MCP::FMLAv8i16_indexed_OP2) ||
7908 Match(AArch64::FMULv8f16, 2, MCP::FMLAv8f16_OP2);
7910 case AArch64::FADDv2f32:
7911 Found |= Match(AArch64::FMULv2i32_indexed, 1, MCP::FMLAv2i32_indexed_OP1) ||
7912 Match(AArch64::FMULv2f32, 1, MCP::FMLAv2f32_OP1);
7914 Found |= Match(AArch64::FMULv2i32_indexed, 2, MCP::FMLAv2i32_indexed_OP2) ||
7915 Match(AArch64::FMULv2f32, 2, MCP::FMLAv2f32_OP2);
7917 case AArch64::FADDv2f64:
7918 Found |= Match(AArch64::FMULv2i64_indexed, 1, MCP::FMLAv2i64_indexed_OP1) ||
7919 Match(AArch64::FMULv2f64, 1, MCP::FMLAv2f64_OP1);
7921 Found |= Match(AArch64::FMULv2i64_indexed, 2, MCP::FMLAv2i64_indexed_OP2) ||
7922 Match(AArch64::FMULv2f64, 2, MCP::FMLAv2f64_OP2);
7924 case AArch64::FADDv4f32:
7925 Found |= Match(AArch64::FMULv4i32_indexed, 1, MCP::FMLAv4i32_indexed_OP1) ||
7926 Match(AArch64::FMULv4f32, 1, MCP::FMLAv4f32_OP1);
7928 Found |= Match(AArch64::FMULv4i32_indexed, 2, MCP::FMLAv4i32_indexed_OP2) ||
7929 Match(AArch64::FMULv4f32, 2, MCP::FMLAv4f32_OP2);
7931 case AArch64::FSUBHrr:
7932 Found = Match(AArch64::FMULHrr, 1, MCP::FMULSUBH_OP1);
7933 Found |= Match(AArch64::FMULHrr, 2, MCP::FMULSUBH_OP2);
7934 Found |= Match(AArch64::FNMULHrr, 1, MCP::FNMULSUBH_OP1);
7936 case AArch64::FSUBSrr:
7937 Found = Match(AArch64::FMULSrr, 1, MCP::FMULSUBS_OP1);
7939 Found |= Match(AArch64::FMULSrr, 2, MCP::FMULSUBS_OP2) ||
7940 Match(AArch64::FMULv1i32_indexed, 2, MCP::FMLSv1i32_indexed_OP2);
7942 Found |= Match(AArch64::FNMULSrr, 1, MCP::FNMULSUBS_OP1);
7944 case AArch64::FSUBDrr:
7945 Found = Match(AArch64::FMULDrr, 1, MCP::FMULSUBD_OP1);
7947 Found |= Match(AArch64::FMULDrr, 2, MCP::FMULSUBD_OP2) ||
7948 Match(AArch64::FMULv1i64_indexed, 2, MCP::FMLSv1i64_indexed_OP2);
7950 Found |= Match(AArch64::FNMULDrr, 1, MCP::FNMULSUBD_OP1);
7952 case AArch64::FSUBv4f16:
7953 Found |= Match(AArch64::FMULv4i16_indexed, 2, MCP::FMLSv4i16_indexed_OP2) ||
7954 Match(AArch64::FMULv4f16, 2, MCP::FMLSv4f16_OP2);
7956 Found |= Match(AArch64::FMULv4i16_indexed, 1, MCP::FMLSv4i16_indexed_OP1) ||
7957 Match(AArch64::FMULv4f16, 1, MCP::FMLSv4f16_OP1);
7959 case AArch64::FSUBv8f16:
7960 Found |= Match(AArch64::FMULv8i16_indexed, 2, MCP::FMLSv8i16_indexed_OP2) ||
7961 Match(AArch64::FMULv8f16, 2, MCP::FMLSv8f16_OP2);
7963 Found |= Match(AArch64::FMULv8i16_indexed, 1, MCP::FMLSv8i16_indexed_OP1) ||
7964 Match(AArch64::FMULv8f16, 1, MCP::FMLSv8f16_OP1);
7966 case AArch64::FSUBv2f32:
7967 Found |= Match(AArch64::FMULv2i32_indexed, 2, MCP::FMLSv2i32_indexed_OP2) ||
7968 Match(AArch64::FMULv2f32, 2, MCP::FMLSv2f32_OP2);
7970 Found |= Match(AArch64::FMULv2i32_indexed, 1, MCP::FMLSv2i32_indexed_OP1) ||
7971 Match(AArch64::FMULv2f32, 1, MCP::FMLSv2f32_OP1);
7973 case AArch64::FSUBv2f64:
7974 Found |= Match(AArch64::FMULv2i64_indexed, 2, MCP::FMLSv2i64_indexed_OP2) ||
7975 Match(AArch64::FMULv2f64, 2, MCP::FMLSv2f64_OP2);
7977 Found |= Match(AArch64::FMULv2i64_indexed, 1, MCP::FMLSv2i64_indexed_OP1) ||
7978 Match(AArch64::FMULv2f64, 1, MCP::FMLSv2f64_OP1);
7980 case AArch64::FSUBv4f32:
7981 Found |= Match(AArch64::FMULv4i32_indexed, 2, MCP::FMLSv4i32_indexed_OP2) ||
7982 Match(AArch64::FMULv4f32, 2, MCP::FMLSv4f32_OP2);
7984 Found |= Match(AArch64::FMULv4i32_indexed, 1, MCP::FMLSv4i32_indexed_OP1) ||
7985 Match(AArch64::FMULv4f32, 1, MCP::FMLSv4f32_OP1);
7996 auto Match = [&](
unsigned Opcode,
int Operand,
unsigned Pattern) ->
bool {
8003 if (
MI &&
MI->getOpcode() == TargetOpcode::COPY &&
8004 MI->getOperand(1).getReg().isVirtual())
8006 if (
MI &&
MI->getOpcode() == Opcode) {
8018 case AArch64::FMULv2f32:
8019 Found = Match(AArch64::DUPv2i32lane, 1, MCP::FMULv2i32_indexed_OP1);
8020 Found |= Match(AArch64::DUPv2i32lane, 2, MCP::FMULv2i32_indexed_OP2);
8022 case AArch64::FMULv2f64:
8023 Found = Match(AArch64::DUPv2i64lane, 1, MCP::FMULv2i64_indexed_OP1);
8024 Found |= Match(AArch64::DUPv2i64lane, 2, MCP::FMULv2i64_indexed_OP2);
8026 case AArch64::FMULv4f16:
8027 Found = Match(AArch64::DUPv4i16lane, 1, MCP::FMULv4i16_indexed_OP1);
8028 Found |= Match(AArch64::DUPv4i16lane, 2, MCP::FMULv4i16_indexed_OP2);
8030 case AArch64::FMULv4f32:
8031 Found = Match(AArch64::DUPv4i32lane, 1, MCP::FMULv4i32_indexed_OP1);
8032 Found |= Match(AArch64::DUPv4i32lane, 2, MCP::FMULv4i32_indexed_OP2);
8034 case AArch64::FMULv8f16:
8035 Found = Match(AArch64::DUPv8i16lane, 1, MCP::FMULv8i16_indexed_OP1);
8036 Found |= Match(AArch64::DUPv8i16lane, 2, MCP::FMULv8i16_indexed_OP2);
8049 auto Match = [&](
unsigned Opcode,
unsigned Pattern) ->
bool {
8052 if (
MI !=
nullptr && (
MI->getOpcode() == Opcode) &&
8067 case AArch64::FNEGDr:
8069 case AArch64::FNEGSr:
8201 case AArch64::SUBWrr:
8202 case AArch64::SUBSWrr:
8203 case AArch64::SUBXrr:
8204 case AArch64::SUBSXrr:
8249 unsigned LoadLaneOpCode,
unsigned NumLanes) {
8272 while (!RemainingLanes.
empty() && CurrInstr &&
8273 CurrInstr->getOpcode() == LoadLaneOpCode &&
8275 CurrInstr->getNumOperands() == 4) {
8276 RemainingLanes.
erase(CurrInstr->getOperand(2).getImm());
8282 if (!RemainingLanes.
empty())
8286 if (CurrInstr->getOpcode() != TargetOpcode::SUBREG_TO_REG)
8290 auto Lane0LoadReg = CurrInstr->getOperand(1).getReg();
8291 unsigned SingleLaneSizeInBits = 128 / NumLanes;
8292 if (
TRI->getRegSizeInBits(Lane0LoadReg, MRI) != SingleLaneSizeInBits)
8308 RemainingLoadInstrs.
insert(LoadInstrs.
begin(), LoadInstrs.
end());
8311 for (; MBBItr !=
MBB->begin() && RemainingSteps > 0 &&
8312 !RemainingLoadInstrs.
empty();
8313 --MBBItr, --RemainingSteps) {
8317 RemainingLoadInstrs.
erase(&CurrInstr);
8327 if (RemainingSteps == 0 && !RemainingLoadInstrs.
empty())
8353 case AArch64::LD1i32:
8355 case AArch64::LD1i16:
8357 case AArch64::LD1i8:
8373 unsigned Pattern,
unsigned NumLanes) {
8381 for (
unsigned i = 0; i < NumLanes - 1; ++i) {
8389 return A->getOperand(2).getImm() >
B->getOperand(2).getImm();
8395 auto LoadToLaneInstrsAscending =
llvm::reverse(LoadToLaneInstrs);
8401 auto CreateLD1Instruction = [&](
MachineInstr *OriginalInstr,
8402 Register SrcRegister,
unsigned Lane,
8404 bool OffsetRegisterKillState) {
8413 InstrIdxForVirtReg.
insert(std::make_pair(NewRegister, InsInstrs.
size()));
8414 InsInstrs.
push_back(LoadIndexIntoRegister);
8420 auto CreateLDRInstruction =
8426 Opcode = AArch64::LDRSui;
8429 Opcode = AArch64::LDRHui;
8432 Opcode = AArch64::LDRBui;
8436 "Got unsupported number of lanes in machine-combiner gather pattern");
8446 auto LanesToLoadToReg0 =
8448 LoadToLaneInstrsAscending.begin() + NumLanes / 2);
8449 Register PrevReg = SubregToReg->getOperand(0).getReg();
8451 const MachineOperand &OffsetRegOperand = LoadInstr->getOperand(3);
8452 PrevReg = CreateLD1Instruction(LoadInstr, PrevReg, Index + 1,
8453 OffsetRegOperand.
getReg(),
8454 OffsetRegOperand.
isKill());
8461 MachineInstr *Lane0Load = *LoadToLaneInstrsAscending.begin();
8463 *std::next(LoadToLaneInstrsAscending.begin(), NumLanes / 2);
8470 CreateLDRInstruction(NumLanes, DestRegForMiddleIndex,
8471 OriginalSplitToLoadOffsetOperand.
getReg(),
8474 InstrIdxForVirtReg.
insert(
8475 std::make_pair(DestRegForMiddleIndex, InsInstrs.
size()));
8476 InsInstrs.
push_back(MiddleIndexLoadInstr);
8481 unsigned SubregType;
8484 SubregType = AArch64::ssub;
8487 SubregType = AArch64::hsub;
8490 SubregType = AArch64::bsub;
8494 "Got invalid NumLanes for machine-combiner gather pattern");
8497 auto SubRegToRegInstr =
8499 DestRegForSubregToReg)
8502 InstrIdxForVirtReg.
insert(
8503 std::make_pair(DestRegForSubregToReg, InsInstrs.
size()));
8507 auto LanesToLoadToReg1 =
8509 LoadToLaneInstrsAscending.end());
8510 PrevReg = SubRegToRegInstr->getOperand(0).getReg();
8512 const MachineOperand &OffsetRegOperand = LoadInstr->getOperand(3);
8513 PrevReg = CreateLD1Instruction(LoadInstr, PrevReg, Index + 1,
8514 OffsetRegOperand.
getReg(),
8515 OffsetRegOperand.
isKill());
8518 if (Index == NumLanes / 2 - 2) {
8553bool AArch64InstrInfo::getMachineCombinerPatterns(
8555 bool DoRegPressureReduce)
const {
8576 DoRegPressureReduce);
8605 const Register *ReplacedAddend =
nullptr) {
8606 assert(IdxMulOpd == 1 || IdxMulOpd == 2);
8608 unsigned IdxOtherOpd = IdxMulOpd == 1 ? 2 : 1;
8611 Register SrcReg0 = MUL->getOperand(1).getReg();
8612 bool Src0IsKill = MUL->getOperand(1).isKill();
8613 Register SrcReg1 = MUL->getOperand(2).getReg();
8614 bool Src1IsKill = MUL->getOperand(2).isKill();
8618 if (ReplacedAddend) {
8620 SrcReg2 = *ReplacedAddend;
8647 .
addImm(MUL->getOperand(3).getImm());
8654 assert(
false &&
"Invalid FMA instruction kind \n");
8668 if (AArch64::FPR32RegClass.hasSubClassEq(RC))
8669 Opc = AArch64::FNMADDSrrr;
8670 else if (AArch64::FPR64RegClass.hasSubClassEq(RC))
8671 Opc = AArch64::FNMADDDrrr;
8705 unsigned IdxDupOp,
unsigned MulOpc,
8707 assert(((IdxDupOp == 1) || (IdxDupOp == 2)) &&
8708 "Invalid index of FMUL operand");
8716 if (Dup->
getOpcode() == TargetOpcode::COPY)
8725 unsigned IdxMulOp = IdxDupOp == 1 ? 2 : 1;
8766 InstrIdxForVirtReg.
insert(std::make_pair(NewVR, 0));
8781 genNeg(MF, MRI,
TII, Root, InsInstrs, InstrIdxForVirtReg, MnegOpc, RC);
8808 genNeg(MF, MRI,
TII, Root, InsInstrs, InstrIdxForVirtReg, MnegOpc, RC);
8836 unsigned IdxMulOpd,
unsigned MaddOpc,
unsigned VR,
8838 assert(IdxMulOpd == 1 || IdxMulOpd == 2);
8842 Register SrcReg0 = MUL->getOperand(1).getReg();
8843 bool Src0IsKill = MUL->getOperand(1).isKill();
8844 Register SrcReg1 = MUL->getOperand(2).getReg();
8845 bool Src1IsKill = MUL->getOperand(2).isKill();
8875 assert(IdxOpd1 == 1 || IdxOpd1 == 2);
8876 unsigned IdxOtherOpd = IdxOpd1 == 1 ? 2 : 1;
8890 if (Opcode == AArch64::SUBSWrr)
8891 Opcode = AArch64::SUBWrr;
8892 else if (Opcode == AArch64::SUBSXrr)
8893 Opcode = AArch64::SUBXrr;
8895 assert((Opcode == AArch64::SUBWrr || Opcode == AArch64::SUBXrr) &&
8896 "Unexpected instruction opcode.");
8913 InstrIdxForVirtReg.
insert(std::make_pair(NewVR, 0));
8920unsigned AArch64InstrInfo::getReduceOpcodeForAccumulator(
8921 unsigned int AccumulatorOpCode)
const {
8922 switch (AccumulatorOpCode) {
8923 case AArch64::UABALB_ZZZ_D:
8924 case AArch64::SABALB_ZZZ_D:
8925 case AArch64::UABALT_ZZZ_D:
8926 case AArch64::SABALT_ZZZ_D:
8927 return AArch64::ADD_ZZZ_D;
8928 case AArch64::UABALB_ZZZ_H:
8929 case AArch64::SABALB_ZZZ_H:
8930 case AArch64::UABALT_ZZZ_H:
8931 case AArch64::SABALT_ZZZ_H:
8932 return AArch64::ADD_ZZZ_H;
8933 case AArch64::UABALB_ZZZ_S:
8934 case AArch64::SABALB_ZZZ_S:
8935 case AArch64::UABALT_ZZZ_S:
8936 case AArch64::SABALT_ZZZ_S:
8937 return AArch64::ADD_ZZZ_S;
8938 case AArch64::UABALv16i8_v8i16:
8939 case AArch64::SABALv8i8_v8i16:
8940 case AArch64::SABAv8i16:
8941 case AArch64::UABAv8i16:
8942 return AArch64::ADDv8i16;
8943 case AArch64::SABALv2i32_v2i64:
8944 case AArch64::UABALv2i32_v2i64:
8945 case AArch64::SABALv4i32_v2i64:
8946 return AArch64::ADDv2i64;
8947 case AArch64::UABALv4i16_v4i32:
8948 case AArch64::SABALv4i16_v4i32:
8949 case AArch64::SABALv8i16_v4i32:
8950 case AArch64::SABAv4i32:
8951 case AArch64::UABAv4i32:
8952 return AArch64::ADDv4i32;
8953 case AArch64::UABALv4i32_v2i64:
8954 return AArch64::ADDv2i64;
8955 case AArch64::UABALv8i16_v4i32:
8956 return AArch64::ADDv4i32;
8957 case AArch64::UABALv8i8_v8i16:
8958 case AArch64::SABALv16i8_v8i16:
8959 return AArch64::ADDv8i16;
8960 case AArch64::UABAv16i8:
8961 case AArch64::SABAv16i8:
8962 return AArch64::ADDv16i8;
8963 case AArch64::UABAv4i16:
8964 case AArch64::SABAv4i16:
8965 return AArch64::ADDv4i16;
8966 case AArch64::UABAv2i32:
8967 case AArch64::SABAv2i32:
8968 return AArch64::ADDv2i32;
8969 case AArch64::UABAv8i8:
8970 case AArch64::SABAv8i8:
8971 return AArch64::ADDv8i8;
8980void AArch64InstrInfo::genAlternativeCodeSequence(
8990 MachineInstr *
MUL =
nullptr;
8991 const TargetRegisterClass *RC;
8997 DelInstrs, InstrIdxForVirtReg);
9003 InstrIdxForVirtReg);
9009 InstrIdxForVirtReg);
9018 Opc = AArch64::MADDWrrr;
9019 RC = &AArch64::GPR32RegClass;
9021 Opc = AArch64::MADDXrrr;
9022 RC = &AArch64::GPR64RegClass;
9033 Opc = AArch64::MADDWrrr;
9034 RC = &AArch64::GPR32RegClass;
9036 Opc = AArch64::MADDXrrr;
9037 RC = &AArch64::GPR64RegClass;
9050 const TargetRegisterClass *RC;
9051 unsigned BitSize, MovImm;
9054 MovImm = AArch64::MOVi32imm;
9055 RC = &AArch64::GPR32spRegClass;
9057 Opc = AArch64::MADDWrrr;
9058 RC = &AArch64::GPR32RegClass;
9060 MovImm = AArch64::MOVi64imm;
9061 RC = &AArch64::GPR64spRegClass;
9063 Opc = AArch64::MADDXrrr;
9064 RC = &AArch64::GPR64RegClass;
9075 uint64_t UImm =
SignExtend64(IsSub ? -Imm : Imm, BitSize);
9079 if (Insn.
size() != 1)
9081 MachineInstrBuilder MIB1 =
9082 BuildMI(MF, MIMetadata(Root),
TII->get(MovImm), NewVR)
9083 .
addImm(IsSub ? -Imm : Imm);
9085 InstrIdxForVirtReg.
insert(std::make_pair(NewVR, 0));
9096 const TargetRegisterClass *SubRC;
9097 unsigned SubOpc, ZeroReg;
9099 SubOpc = AArch64::SUBWrr;
9100 SubRC = &AArch64::GPR32spRegClass;
9101 ZeroReg = AArch64::WZR;
9102 Opc = AArch64::MADDWrrr;
9103 RC = &AArch64::GPR32RegClass;
9105 SubOpc = AArch64::SUBXrr;
9106 SubRC = &AArch64::GPR64spRegClass;
9107 ZeroReg = AArch64::XZR;
9108 Opc = AArch64::MADDXrrr;
9109 RC = &AArch64::GPR64RegClass;
9113 MachineInstrBuilder MIB1 =
9114 BuildMI(MF, MIMetadata(Root),
TII->get(SubOpc), NewVR)
9118 InstrIdxForVirtReg.
insert(std::make_pair(NewVR, 0));
9129 Opc = AArch64::MSUBWrrr;
9130 RC = &AArch64::GPR32RegClass;
9132 Opc = AArch64::MSUBXrrr;
9133 RC = &AArch64::GPR64RegClass;
9138 Opc = AArch64::MLAv8i8;
9139 RC = &AArch64::FPR64RegClass;
9143 Opc = AArch64::MLAv8i8;
9144 RC = &AArch64::FPR64RegClass;
9148 Opc = AArch64::MLAv16i8;
9149 RC = &AArch64::FPR128RegClass;
9153 Opc = AArch64::MLAv16i8;
9154 RC = &AArch64::FPR128RegClass;
9158 Opc = AArch64::MLAv4i16;
9159 RC = &AArch64::FPR64RegClass;
9163 Opc = AArch64::MLAv4i16;
9164 RC = &AArch64::FPR64RegClass;
9168 Opc = AArch64::MLAv8i16;
9169 RC = &AArch64::FPR128RegClass;
9173 Opc = AArch64::MLAv8i16;
9174 RC = &AArch64::FPR128RegClass;
9178 Opc = AArch64::MLAv2i32;
9179 RC = &AArch64::FPR64RegClass;
9183 Opc = AArch64::MLAv2i32;
9184 RC = &AArch64::FPR64RegClass;
9188 Opc = AArch64::MLAv4i32;
9189 RC = &AArch64::FPR128RegClass;
9193 Opc = AArch64::MLAv4i32;
9194 RC = &AArch64::FPR128RegClass;
9199 Opc = AArch64::MLAv8i8;
9200 RC = &AArch64::FPR64RegClass;
9202 InstrIdxForVirtReg, 1,
Opc, AArch64::NEGv8i8,
9206 Opc = AArch64::MLSv8i8;
9207 RC = &AArch64::FPR64RegClass;
9211 Opc = AArch64::MLAv16i8;
9212 RC = &AArch64::FPR128RegClass;
9214 InstrIdxForVirtReg, 1,
Opc, AArch64::NEGv16i8,
9218 Opc = AArch64::MLSv16i8;
9219 RC = &AArch64::FPR128RegClass;
9223 Opc = AArch64::MLAv4i16;
9224 RC = &AArch64::FPR64RegClass;
9226 InstrIdxForVirtReg, 1,
Opc, AArch64::NEGv4i16,
9230 Opc = AArch64::MLSv4i16;
9231 RC = &AArch64::FPR64RegClass;
9235 Opc = AArch64::MLAv8i16;
9236 RC = &AArch64::FPR128RegClass;
9238 InstrIdxForVirtReg, 1,
Opc, AArch64::NEGv8i16,
9242 Opc = AArch64::MLSv8i16;
9243 RC = &AArch64::FPR128RegClass;
9247 Opc = AArch64::MLAv2i32;
9248 RC = &AArch64::FPR64RegClass;
9250 InstrIdxForVirtReg, 1,
Opc, AArch64::NEGv2i32,
9254 Opc = AArch64::MLSv2i32;
9255 RC = &AArch64::FPR64RegClass;
9259 Opc = AArch64::MLAv4i32;
9260 RC = &AArch64::FPR128RegClass;
9262 InstrIdxForVirtReg, 1,
Opc, AArch64::NEGv4i32,
9266 Opc = AArch64::MLSv4i32;
9267 RC = &AArch64::FPR128RegClass;
9272 Opc = AArch64::MLAv4i16_indexed;
9273 RC = &AArch64::FPR64RegClass;
9277 Opc = AArch64::MLAv4i16_indexed;
9278 RC = &AArch64::FPR64RegClass;
9282 Opc = AArch64::MLAv8i16_indexed;
9283 RC = &AArch64::FPR128RegClass;
9287 Opc = AArch64::MLAv8i16_indexed;
9288 RC = &AArch64::FPR128RegClass;
9292 Opc = AArch64::MLAv2i32_indexed;
9293 RC = &AArch64::FPR64RegClass;
9297 Opc = AArch64::MLAv2i32_indexed;
9298 RC = &AArch64::FPR64RegClass;
9302 Opc = AArch64::MLAv4i32_indexed;
9303 RC = &AArch64::FPR128RegClass;
9307 Opc = AArch64::MLAv4i32_indexed;
9308 RC = &AArch64::FPR128RegClass;
9313 Opc = AArch64::MLAv4i16_indexed;
9314 RC = &AArch64::FPR64RegClass;
9316 InstrIdxForVirtReg, 1,
Opc, AArch64::NEGv4i16,
9320 Opc = AArch64::MLSv4i16_indexed;
9321 RC = &AArch64::FPR64RegClass;
9325 Opc = AArch64::MLAv8i16_indexed;
9326 RC = &AArch64::FPR128RegClass;
9328 InstrIdxForVirtReg, 1,
Opc, AArch64::NEGv8i16,
9332 Opc = AArch64::MLSv8i16_indexed;
9333 RC = &AArch64::FPR128RegClass;
9337 Opc = AArch64::MLAv2i32_indexed;
9338 RC = &AArch64::FPR64RegClass;
9340 InstrIdxForVirtReg, 1,
Opc, AArch64::NEGv2i32,
9344 Opc = AArch64::MLSv2i32_indexed;
9345 RC = &AArch64::FPR64RegClass;
9349 Opc = AArch64::MLAv4i32_indexed;
9350 RC = &AArch64::FPR128RegClass;
9352 InstrIdxForVirtReg, 1,
Opc, AArch64::NEGv4i32,
9356 Opc = AArch64::MLSv4i32_indexed;
9357 RC = &AArch64::FPR128RegClass;
9363 Opc = AArch64::FMADDHrrr;
9364 RC = &AArch64::FPR16RegClass;
9368 Opc = AArch64::FMADDSrrr;
9369 RC = &AArch64::FPR32RegClass;
9373 Opc = AArch64::FMADDDrrr;
9374 RC = &AArch64::FPR64RegClass;
9379 Opc = AArch64::FMADDHrrr;
9380 RC = &AArch64::FPR16RegClass;
9384 Opc = AArch64::FMADDSrrr;
9385 RC = &AArch64::FPR32RegClass;
9389 Opc = AArch64::FMADDDrrr;
9390 RC = &AArch64::FPR64RegClass;
9395 Opc = AArch64::FMLAv1i32_indexed;
9396 RC = &AArch64::FPR32RegClass;
9401 Opc = AArch64::FMLAv1i32_indexed;
9402 RC = &AArch64::FPR32RegClass;
9408 Opc = AArch64::FMLAv1i64_indexed;
9409 RC = &AArch64::FPR64RegClass;
9414 Opc = AArch64::FMLAv1i64_indexed;
9415 RC = &AArch64::FPR64RegClass;
9421 RC = &AArch64::FPR64RegClass;
9422 Opc = AArch64::FMLAv4i16_indexed;
9427 RC = &AArch64::FPR64RegClass;
9428 Opc = AArch64::FMLAv4f16;
9433 RC = &AArch64::FPR64RegClass;
9434 Opc = AArch64::FMLAv4i16_indexed;
9439 RC = &AArch64::FPR64RegClass;
9440 Opc = AArch64::FMLAv4f16;
9447 RC = &AArch64::FPR64RegClass;
9449 Opc = AArch64::FMLAv2i32_indexed;
9453 Opc = AArch64::FMLAv2f32;
9460 RC = &AArch64::FPR64RegClass;
9462 Opc = AArch64::FMLAv2i32_indexed;
9466 Opc = AArch64::FMLAv2f32;
9473 RC = &AArch64::FPR128RegClass;
9474 Opc = AArch64::FMLAv8i16_indexed;
9479 RC = &AArch64::FPR128RegClass;
9480 Opc = AArch64::FMLAv8f16;
9485 RC = &AArch64::FPR128RegClass;
9486 Opc = AArch64::FMLAv8i16_indexed;
9491 RC = &AArch64::FPR128RegClass;
9492 Opc = AArch64::FMLAv8f16;
9499 RC = &AArch64::FPR128RegClass;
9501 Opc = AArch64::FMLAv2i64_indexed;
9505 Opc = AArch64::FMLAv2f64;
9512 RC = &AArch64::FPR128RegClass;
9514 Opc = AArch64::FMLAv2i64_indexed;
9518 Opc = AArch64::FMLAv2f64;
9526 RC = &AArch64::FPR128RegClass;
9528 Opc = AArch64::FMLAv4i32_indexed;
9532 Opc = AArch64::FMLAv4f32;
9540 RC = &AArch64::FPR128RegClass;
9542 Opc = AArch64::FMLAv4i32_indexed;
9546 Opc = AArch64::FMLAv4f32;
9553 Opc = AArch64::FNMSUBHrrr;
9554 RC = &AArch64::FPR16RegClass;
9558 Opc = AArch64::FNMSUBSrrr;
9559 RC = &AArch64::FPR32RegClass;
9563 Opc = AArch64::FNMSUBDrrr;
9564 RC = &AArch64::FPR64RegClass;
9569 Opc = AArch64::FNMADDHrrr;
9570 RC = &AArch64::FPR16RegClass;
9574 Opc = AArch64::FNMADDSrrr;
9575 RC = &AArch64::FPR32RegClass;
9579 Opc = AArch64::FNMADDDrrr;
9580 RC = &AArch64::FPR64RegClass;
9585 Opc = AArch64::FMSUBHrrr;
9586 RC = &AArch64::FPR16RegClass;
9590 Opc = AArch64::FMSUBSrrr;
9591 RC = &AArch64::FPR32RegClass;
9595 Opc = AArch64::FMSUBDrrr;
9596 RC = &AArch64::FPR64RegClass;
9601 Opc = AArch64::FMLSv1i32_indexed;
9602 RC = &AArch64::FPR32RegClass;
9608 Opc = AArch64::FMLSv1i64_indexed;
9609 RC = &AArch64::FPR64RegClass;
9616 RC = &AArch64::FPR64RegClass;
9618 MachineInstrBuilder MIB1 =
9619 BuildMI(MF, MIMetadata(Root),
TII->get(AArch64::FNEGv4f16), NewVR)
9622 InstrIdxForVirtReg.
insert(std::make_pair(NewVR, 0));
9624 Opc = AArch64::FMLAv4f16;
9628 Opc = AArch64::FMLAv4i16_indexed;
9635 RC = &AArch64::FPR64RegClass;
9636 Opc = AArch64::FMLSv4f16;
9641 RC = &AArch64::FPR64RegClass;
9642 Opc = AArch64::FMLSv4i16_indexed;
9649 RC = &AArch64::FPR64RegClass;
9651 Opc = AArch64::FMLSv2i32_indexed;
9655 Opc = AArch64::FMLSv2f32;
9663 RC = &AArch64::FPR128RegClass;
9665 MachineInstrBuilder MIB1 =
9666 BuildMI(MF, MIMetadata(Root),
TII->get(AArch64::FNEGv8f16), NewVR)
9669 InstrIdxForVirtReg.
insert(std::make_pair(NewVR, 0));
9671 Opc = AArch64::FMLAv8f16;
9675 Opc = AArch64::FMLAv8i16_indexed;
9682 RC = &AArch64::FPR128RegClass;
9683 Opc = AArch64::FMLSv8f16;
9688 RC = &AArch64::FPR128RegClass;
9689 Opc = AArch64::FMLSv8i16_indexed;
9696 RC = &AArch64::FPR128RegClass;
9698 Opc = AArch64::FMLSv2i64_indexed;
9702 Opc = AArch64::FMLSv2f64;
9710 RC = &AArch64::FPR128RegClass;
9712 Opc = AArch64::FMLSv4i32_indexed;
9716 Opc = AArch64::FMLSv4f32;
9723 RC = &AArch64::FPR64RegClass;
9725 MachineInstrBuilder MIB1 =
9726 BuildMI(MF, MIMetadata(Root),
TII->get(AArch64::FNEGv2f32), NewVR)
9729 InstrIdxForVirtReg.
insert(std::make_pair(NewVR, 0));
9731 Opc = AArch64::FMLAv2i32_indexed;
9735 Opc = AArch64::FMLAv2f32;
9743 RC = &AArch64::FPR128RegClass;
9745 MachineInstrBuilder MIB1 =
9746 BuildMI(MF, MIMetadata(Root),
TII->get(AArch64::FNEGv4f32), NewVR)
9749 InstrIdxForVirtReg.
insert(std::make_pair(NewVR, 0));
9751 Opc = AArch64::FMLAv4i32_indexed;
9755 Opc = AArch64::FMLAv4f32;
9763 RC = &AArch64::FPR128RegClass;
9765 MachineInstrBuilder MIB1 =
9766 BuildMI(MF, MIMetadata(Root),
TII->get(AArch64::FNEGv2f64), NewVR)
9769 InstrIdxForVirtReg.
insert(std::make_pair(NewVR, 0));
9771 Opc = AArch64::FMLAv2i64_indexed;
9775 Opc = AArch64::FMLAv2f64;
9787 &AArch64::FPR128RegClass, MRI);
9796 &AArch64::FPR128RegClass, MRI);
9805 &AArch64::FPR128_loRegClass, MRI);
9814 &AArch64::FPR128RegClass, MRI);
9823 &AArch64::FPR128_loRegClass, MRI);
9857 for (
auto *
MI : InsInstrs)
9858 MI->setFlags(Flags);
9899 bool IsNegativeBranch =
false;
9900 bool IsTestAndBranch =
false;
9901 unsigned TargetBBInMI = 0;
9902 switch (
MI.getOpcode()) {
9906 case AArch64::CBWPri:
9907 case AArch64::CBXPri:
9908 case AArch64::CBBAssertExt:
9909 case AArch64::CBHAssertExt:
9910 case AArch64::CBWPrr:
9911 case AArch64::CBXPrr:
9917 case AArch64::CBNZW:
9918 case AArch64::CBNZX:
9920 IsNegativeBranch =
true;
9925 IsTestAndBranch =
true;
9927 case AArch64::TBNZW:
9928 case AArch64::TBNZX:
9930 IsNegativeBranch =
true;
9931 IsTestAndBranch =
true;
9937 if (IsTestAndBranch &&
MI.getOperand(1).getImm())
9941 assert(
MI.getParent() &&
"Incomplete machine instruction\n");
9952 while (
DefMI->isCopy()) {
9961 switch (
DefMI->getOpcode()) {
9965 case AArch64::ANDWri:
9966 case AArch64::ANDXri: {
9967 if (IsTestAndBranch)
9974 bool Is32Bit = (
DefMI->getOpcode() == AArch64::ANDWri);
9976 DefMI->getOperand(2).getImm(), Is32Bit ? 32 : 64);
9991 unsigned Opc = (Imm < 32)
9992 ? (IsNegativeBranch ? AArch64::TBNZW : AArch64::TBZW)
9993 : (IsNegativeBranch ? AArch64::TBNZX : AArch64::TBZX);
10006 if (!Is32Bit && Imm < 32)
10008 MI.eraseFromParent();
10012 case AArch64::CSINCWr:
10013 case AArch64::CSINCXr: {
10014 if (!(
DefMI->getOperand(1).getReg() == AArch64::WZR &&
10015 DefMI->getOperand(2).getReg() == AArch64::WZR) &&
10016 !(
DefMI->getOperand(1).getReg() == AArch64::XZR &&
10017 DefMI->getOperand(2).getReg() == AArch64::XZR))
10020 if (
DefMI->findRegisterDefOperandIdx(AArch64::NZCV,
nullptr,
10033 if (IsNegativeBranch)
10036 MI.eraseFromParent();
10042std::pair<unsigned, unsigned>
10043AArch64InstrInfo::decomposeMachineOperandsTargetFlags(
unsigned TF)
const {
10045 return std::make_pair(TF & Mask, TF & ~Mask);
10049AArch64InstrInfo::getSerializableDirectMachineOperandTargetFlags()
const {
10052 static const std::pair<unsigned, const char *> TargetFlags[] = {
10053 {MO_PAGE,
"aarch64-page"}, {
MO_PAGEOFF,
"aarch64-pageoff"},
10054 {
MO_G3,
"aarch64-g3"}, {
MO_G2,
"aarch64-g2"},
10055 {
MO_G1,
"aarch64-g1"}, {
MO_G0,
"aarch64-g0"},
10061AArch64InstrInfo::getSerializableBitmaskMachineOperandTargetFlags()
const {
10062 using namespace AArch64II;
10064 static const std::pair<unsigned, const char *> TargetFlags[] = {
10066 {
MO_GOT,
"aarch64-got"},
10067 {
MO_NC,
"aarch64-nc"},
10068 {
MO_S,
"aarch64-s"},
10069 {
MO_TLS,
"aarch64-tls"},
10079AArch64InstrInfo::getSerializableMachineMemOperandTargetFlags()
const {
10080 static const std::pair<MachineMemOperand::Flags, const char *> TargetFlags[] =
10182 MachineFunction *MF =
C.getMF();
10184 const AArch64RegisterInfo *ARI =
10185 static_cast<const AArch64RegisterInfo *
>(&
TRI);
10188 for (
unsigned Reg : AArch64::GPR64RegClass) {
10190 Reg != AArch64::LR &&
10191 Reg != AArch64::X16 &&
10192 Reg != AArch64::X17 &&
10193 C.isAvailableAcrossAndOutOfSeq(
Reg,
TRI) &&
10194 C.isAvailableInsideSeq(
Reg,
TRI))
10225 return SubtargetA.hasV8_3aOps() == SubtargetB.hasV8_3aOps();
10228std::optional<std::unique_ptr<outliner::OutlinedFunction>>
10229AArch64InstrInfo::getOutliningCandidateInfo(
10231 std::vector<outliner::Candidate> &RepeatedSequenceLocs,
10232 unsigned MinRepeats)
const {
10233 unsigned SequenceSize = 0;
10234 for (
auto &
MI : RepeatedSequenceLocs[0])
10237 unsigned NumBytesToCreateFrame = 0;
10243 MachineInstr &LastMI = RepeatedSequenceLocs[0].back();
10244 MachineInstr &FirstMI = RepeatedSequenceLocs[0].front();
10245 if (LastMI.
getOpcode() == AArch64::ADRP &&
10248 return std::nullopt;
10253 if ((FirstMI.
getOpcode() == AArch64::ADDXri ||
10254 FirstMI.
getOpcode() == AArch64::LDRXui) &&
10257 return std::nullopt;
10268 if (std::adjacent_find(
10269 RepeatedSequenceLocs.begin(), RepeatedSequenceLocs.end(),
10270 [](
const outliner::Candidate &a,
const outliner::Candidate &b) {
10273 if (outliningCandidatesSigningScopeConsensus(a, b) &&
10274 outliningCandidatesSigningKeyConsensus(a, b) &&
10275 outliningCandidatesV8_3OpsConsensus(a, b)) {
10279 }) != RepeatedSequenceLocs.end()) {
10280 return std::nullopt;
10297 unsigned NumBytesToCheckLRInTCEpilogue = 0;
10298 const auto RASignCondition = RepeatedSequenceLocs[0]
10301 ->getSignReturnAddressCondition();
10304 NumBytesToCreateFrame += 8;
10307 auto LRCheckMethod = Subtarget.getAuthenticatedLRCheckMethod(
10308 *RepeatedSequenceLocs[0].getMF());
10309 NumBytesToCheckLRInTCEpilogue =
10313 if (isTailCallReturnInst(RepeatedSequenceLocs[0].
back()))
10314 SequenceSize += NumBytesToCheckLRInTCEpilogue;
10322 for (
auto &
MI :
C) {
10323 if (
MI.modifiesRegister(AArch64::SP, &
TRI)) {
10324 switch (
MI.getOpcode()) {
10325 case AArch64::ADDXri:
10326 case AArch64::ADDWri:
10327 assert(
MI.getNumOperands() == 4 &&
"Wrong number of operands");
10328 assert(
MI.getOperand(2).isImm() &&
10329 "Expected operand to be immediate");
10330 assert(
MI.getOperand(1).isReg() &&
10331 "Expected operand to be a register");
10335 if (
MI.getOperand(1).getReg() == AArch64::SP)
10336 SPValue +=
MI.getOperand(2).getImm();
10340 case AArch64::SUBXri:
10341 case AArch64::SUBWri:
10342 assert(
MI.getNumOperands() == 4 &&
"Wrong number of operands");
10343 assert(
MI.getOperand(2).isImm() &&
10344 "Expected operand to be immediate");
10345 assert(
MI.getOperand(1).isReg() &&
10346 "Expected operand to be a register");
10350 if (
MI.getOperand(1).getReg() == AArch64::SP)
10351 SPValue -=
MI.getOperand(2).getImm();
10368 if (RepeatedSequenceLocs.size() < MinRepeats)
10369 return std::nullopt;
10373 unsigned FlagsSetInAll = 0xF;
10377 FlagsSetInAll &=
C.Flags;
10379 unsigned LastInstrOpcode = RepeatedSequenceLocs[0].back().getOpcode();
10382 auto SetCandidateCallInfo =
10383 [&RepeatedSequenceLocs](
unsigned CallID,
unsigned NumBytesForCall) {
10385 C.setCallInfo(CallID, NumBytesForCall);
10389 NumBytesToCreateFrame += 4;
10397 unsigned CFICount = 0;
10398 for (
auto &
I : RepeatedSequenceLocs[0]) {
10399 if (
I.isCFIInstruction())
10409 std::vector<MCCFIInstruction> CFIInstructions =
10410 C.getMF()->getFrameInstructions();
10412 if (CFICount > 0 && CFICount != CFIInstructions.size())
10413 return std::nullopt;
10421 if (!
MI.modifiesRegister(AArch64::SP, &
TRI) &&
10422 !
MI.readsRegister(AArch64::SP, &
TRI))
10428 if (
MI.modifiesRegister(AArch64::SP, &
TRI))
10433 if (
MI.mayLoadOrStore()) {
10436 bool OffsetIsScalable;
10440 if (!getMemOperandWithOffset(
MI,
Base,
Offset, OffsetIsScalable, &
TRI) ||
10441 !
Base->isReg() ||
Base->getReg() != AArch64::SP)
10445 if (OffsetIsScalable)
10453 TypeSize Scale(0U,
false), DummyWidth(0U,
false);
10454 getMemOpInfo(
MI.getOpcode(), Scale, DummyWidth, MinOffset, MaxOffset);
10457 if (
Offset < MinOffset * (int64_t)Scale.getFixedValue() ||
10458 Offset > MaxOffset * (int64_t)Scale.getFixedValue())
10473 bool AllStackInstrsSafe =
10478 if (RepeatedSequenceLocs[0].
back().isTerminator()) {
10480 NumBytesToCreateFrame = 0;
10481 unsigned NumBytesForCall = 4 + NumBytesToCheckLRInTCEpilogue;
10485 else if (LastInstrOpcode == AArch64::BL ||
10486 ((LastInstrOpcode == AArch64::BLR ||
10487 LastInstrOpcode == AArch64::BLRNoIP) &&
10491 NumBytesToCreateFrame = NumBytesToCheckLRInTCEpilogue;
10499 unsigned NumBytesNoStackCalls = 0;
10500 std::vector<outliner::Candidate> CandidatesWithoutStackFixups;
10506 ?
C.isAvailableAcrossAndOutOfSeq(AArch64::LR,
TRI)
10515 C.getMF()->getFunction().hasFnAttribute(Attribute::NoReturn);
10518 if (LRAvailable && !IsNoReturn) {
10519 NumBytesNoStackCalls += 4;
10521 CandidatesWithoutStackFixups.push_back(
C);
10526 else if (findRegisterToSaveLRTo(
C)) {
10527 NumBytesNoStackCalls += 12;
10529 CandidatesWithoutStackFixups.push_back(
C);
10534 else if (
C.isAvailableInsideSeq(AArch64::SP,
TRI)) {
10535 NumBytesNoStackCalls += 12;
10537 CandidatesWithoutStackFixups.push_back(
C);
10543 NumBytesNoStackCalls += SequenceSize;
10550 if (!AllStackInstrsSafe ||
10551 NumBytesNoStackCalls <= RepeatedSequenceLocs.size() * 12) {
10552 RepeatedSequenceLocs = CandidatesWithoutStackFixups;
10554 if (RepeatedSequenceLocs.size() < MinRepeats)
10555 return std::nullopt;
10608 (!
C.isAvailableAcrossAndOutOfSeq(AArch64::LR,
TRI) ||
10609 !findRegisterToSaveLRTo(
C));
10615 if (RepeatedSequenceLocs.size() < MinRepeats)
10616 return std::nullopt;
10625 bool ModStackToSaveLR =
false;
10628 ModStackToSaveLR =
true;
10637 ModStackToSaveLR =
true;
10639 if (ModStackToSaveLR) {
10641 if (!AllStackInstrsSafe)
10642 return std::nullopt;
10645 NumBytesToCreateFrame += 8;
10652 return std::nullopt;
10654 return std::make_unique<outliner::OutlinedFunction>(
10655 RepeatedSequenceLocs, SequenceSize, NumBytesToCreateFrame, FrameID);
10658void AArch64InstrInfo::mergeOutliningCandidateAttributes(
10659 Function &
F, std::vector<outliner::Candidate> &Candidates)
const {
10663 const auto &CFn = Candidates.front().getMF()->getFunction();
10665 if (CFn.hasFnAttribute(
"ptrauth-returns"))
10666 F.addFnAttr(CFn.getFnAttribute(
"ptrauth-returns"));
10667 if (CFn.hasFnAttribute(
"ptrauth-auth-traps"))
10668 F.addFnAttr(CFn.getFnAttribute(
"ptrauth-auth-traps"));
10671 if (CFn.hasFnAttribute(
"sign-return-address"))
10672 F.addFnAttr(CFn.getFnAttribute(
"sign-return-address"));
10673 if (CFn.hasFnAttribute(
"sign-return-address-key"))
10674 F.addFnAttr(CFn.getFnAttribute(
"sign-return-address-key"));
10676 AArch64GenInstrInfo::mergeOutliningCandidateAttributes(
F, Candidates);
10679bool AArch64InstrInfo::isFunctionSafeToOutlineFrom(
10684 if (!OutlineFromLinkOnceODRs &&
F.hasLinkOnceODRLinkage())
10691 if (
F.hasSection())
10697 AArch64FunctionInfo *AFI = MF.
getInfo<AArch64FunctionInfo>();
10698 if (!AFI || AFI->
hasRedZone().value_or(
true))
10718 unsigned &Flags)
const {
10720 "Must track liveness!");
10722 std::pair<MachineBasicBlock::iterator, MachineBasicBlock::iterator>>
10737 auto AreAllUnsafeRegsDead = [&LRU]() {
10738 return LRU.available(AArch64::W16) && LRU.available(AArch64::W17) &&
10739 LRU.available(AArch64::NZCV);
10754 bool LRAvailableEverywhere =
true;
10756 LRU.addLiveOuts(
MBB);
10758 auto UpdateWholeMBBFlags = [&
Flags](
const MachineInstr &
MI) {
10759 if (
MI.isCall() && !
MI.isTerminator())
10765 auto CreateNewRangeStartingAt =
10766 [&RangeBegin, &RangeEnd,
10768 RangeBegin = NewBegin;
10769 RangeEnd = std::next(RangeBegin);
10772 auto SaveRangeIfNonEmpty = [&RangeLen, &
Ranges, &RangeBegin, &RangeEnd]() {
10778 if (!RangeBegin.isEnd() && RangeBegin->isBundledWithPred())
10780 if (!RangeEnd.isEnd() && RangeEnd->isBundledWithPred())
10782 Ranges.emplace_back(RangeBegin, RangeEnd);
10790 for (; FirstPossibleEndPt !=
MBB.
instr_rend(); ++FirstPossibleEndPt) {
10791 if (!FirstPossibleEndPt->isDebugInstr())
10792 LRU.stepBackward(*FirstPossibleEndPt);
10795 UpdateWholeMBBFlags(*FirstPossibleEndPt);
10796 if (AreAllUnsafeRegsDead())
10803 CreateNewRangeStartingAt(FirstPossibleEndPt->getIterator());
10808 if (!
MI.isDebugInstr())
10809 LRU.stepBackward(
MI);
10810 UpdateWholeMBBFlags(
MI);
10811 if (!AreAllUnsafeRegsDead()) {
10812 SaveRangeIfNonEmpty();
10813 CreateNewRangeStartingAt(
MI.getIterator());
10816 LRAvailableEverywhere &= LRU.available(AArch64::LR);
10817 RangeBegin =
MI.getIterator();
10822 if (AreAllUnsafeRegsDead())
10823 SaveRangeIfNonEmpty();
10831 if (!LRAvailableEverywhere)
10839 unsigned Flags)
const {
10840 MachineInstr &
MI = *MIT;
10844 switch (
MI.getOpcode()) {
10845 case AArch64::PACM:
10846 case AArch64::PACIASP:
10847 case AArch64::PACIBSP:
10848 case AArch64::PACIASPPC:
10849 case AArch64::PACIBSPPC:
10850 case AArch64::AUTIASP:
10851 case AArch64::AUTIBSP:
10852 case AArch64::AUTIASPPCi:
10853 case AArch64::AUTIASPPCr:
10854 case AArch64::AUTIBSPPCi:
10855 case AArch64::AUTIBSPPCr:
10856 case AArch64::RETAA:
10857 case AArch64::RETAB:
10858 case AArch64::RETAASPPCi:
10859 case AArch64::RETAASPPCr:
10860 case AArch64::RETABSPPCi:
10861 case AArch64::RETABSPPCr:
10862 case AArch64::EMITBKEY:
10863 case AArch64::PAUTH_PROLOGUE:
10864 case AArch64::PAUTH_EPILOGUE:
10874 if (
MI.isCFIInstruction())
10878 if (
MI.isTerminator())
10884 for (
const MachineOperand &MOP :
MI.operands()) {
10887 assert(!MOP.isCFIIndex());
10890 if (MOP.isReg() && !MOP.isImplicit() &&
10891 (MOP.getReg() == AArch64::LR || MOP.getReg() == AArch64::W30))
10898 if (
MI.getOpcode() == AArch64::ADRP)
10918 for (
const MachineOperand &MOP :
MI.operands()) {
10919 if (MOP.isGlobal()) {
10927 if (Callee &&
Callee->getName() ==
"\01_mcount")
10935 if (
MI.getOpcode() == AArch64::BLR ||
10936 MI.getOpcode() == AArch64::BLRNoIP ||
MI.getOpcode() == AArch64::BL)
10940 return UnknownCallOutlineType;
10948 return UnknownCallOutlineType;
10956 return UnknownCallOutlineType;
10977 for (MachineInstr &
MI :
MBB) {
10978 const MachineOperand *
Base;
10979 TypeSize Width(0,
false);
10981 bool OffsetIsScalable;
10984 if (!
MI.mayLoadOrStore() ||
10987 (
Base->isReg() &&
Base->getReg() != AArch64::SP))
10991 TypeSize Scale(0U,
false);
10992 int64_t Dummy1, Dummy2;
10995 assert(StackOffsetOperand.
isImm() &&
"Stack offset wasn't immediate!");
10997 assert(Scale != 0 &&
"Unexpected opcode!");
10998 assert(!OffsetIsScalable &&
"Expected offset to be a byte offset");
11003 int64_t NewImm = (
Offset + 16) / (int64_t)Scale.getFixedValue();
11004 StackOffsetOperand.
setImm(NewImm);
11010 bool ShouldSignReturnAddr) {
11011 if (!ShouldSignReturnAddr)
11019void AArch64InstrInfo::buildOutlinedFrame(
11023 AArch64FunctionInfo *FI = MF.
getInfo<AArch64FunctionInfo>();
11031 unsigned TailOpcode;
11033 TailOpcode = AArch64::TCRETURNdi;
11037 TailOpcode = AArch64::TCRETURNriALL;
11048 bool IsLeafFunction =
true;
11051 auto IsNonTailCall = [](
const MachineInstr &
MI) {
11052 return MI.isCall() && !
MI.isReturn();
11062 "Can only fix up stack references once");
11063 fixupPostOutline(
MBB);
11065 IsLeafFunction =
false;
11076 Et = std::prev(
MBB.
end());
11086 if (MF.
getInfo<AArch64FunctionInfo>()->needsDwarfUnwindInfo(MF)) {
11090 CFIBuilder.buildDefCFAOffset(16);
11094 CFIBuilder.buildOffset(AArch64::LR, -16);
11108 RASignCondition, !IsLeafFunction);
11137 fixupPostOutline(
MBB);
11148 .addGlobalAddress(
M.getNamedValue(MF.
getName()))
11158 .addGlobalAddress(
M.getNamedValue(MF.
getName())));
11167 MachineInstr *Save;
11168 MachineInstr *Restore;
11174 assert(
Reg &&
"No callee-saved register available?");
11208 .addGlobalAddress(
M.getNamedValue(MF.
getName())));
11216bool AArch64InstrInfo::shouldOutlineFromFunctionByDefault(
11224 bool AllowSideEffects)
const {
11226 const AArch64Subtarget &STI = MF.
getSubtarget<AArch64Subtarget>();
11229 if (
TRI.isGeneralPurposeRegister(MF,
Reg)) {
11242 assert(STI.hasNEON() &&
"Expected to have NEON.");
11248std::optional<DestSourcePair>
11253 if (((
MI.getOpcode() == AArch64::ORRWrs &&
11254 MI.getOperand(1).getReg() == AArch64::WZR &&
11255 MI.getOperand(3).getImm() == 0x0) ||
11256 (
MI.getOpcode() == AArch64::ORRWrr &&
11257 MI.getOperand(1).getReg() == AArch64::WZR)) &&
11259 (!
MI.getOperand(0).getReg().isVirtual() ||
11260 MI.getOperand(0).getSubReg() == 0) &&
11261 (!
MI.getOperand(0).getReg().isPhysical() ||
11266 if (
MI.getOpcode() == AArch64::ORRXrs &&
11267 MI.getOperand(1).getReg() == AArch64::XZR &&
11268 MI.getOperand(3).getImm() == 0x0)
11271 return std::nullopt;
11274std::optional<DestSourcePair>
11276 if ((
MI.getOpcode() == AArch64::ORRWrs &&
11277 MI.getOperand(1).getReg() == AArch64::WZR &&
11278 MI.getOperand(3).getImm() == 0x0) ||
11279 (
MI.getOpcode() == AArch64::ORRWrr &&
11280 MI.getOperand(1).getReg() == AArch64::WZR))
11282 return std::nullopt;
11285std::optional<RegImmPair>
11294 return std::nullopt;
11296 switch (
MI.getOpcode()) {
11298 return std::nullopt;
11299 case AArch64::SUBWri:
11300 case AArch64::SUBXri:
11301 case AArch64::SUBSWri:
11302 case AArch64::SUBSXri:
11305 case AArch64::ADDSWri:
11306 case AArch64::ADDSXri:
11307 case AArch64::ADDWri:
11308 case AArch64::ADDXri: {
11310 if (!
MI.getOperand(0).isReg() || !
MI.getOperand(1).isReg() ||
11311 !
MI.getOperand(2).isImm())
11312 return std::nullopt;
11313 int Shift =
MI.getOperand(3).getImm();
11314 assert((Shift == 0 || Shift == 12) &&
"Shift can be either 0 or 12");
11318 return RegImmPair{
MI.getOperand(1).getReg(),
Offset};
11324static std::optional<ParamLoadedValue>
11328 auto DestSrc =
TII->isCopyLikeInstr(
MI);
11330 return std::nullopt;
11332 Register DestReg = DestSrc->Destination->getReg();
11333 Register SrcReg = DestSrc->Source->getReg();
11336 return std::nullopt;
11341 if (DestReg == DescribedReg)
11345 if (
MI.getOpcode() == AArch64::ORRWrs &&
11346 TRI->isSuperRegister(DestReg, DescribedReg))
11350 if (
MI.getOpcode() == AArch64::ORRXrs &&
11351 TRI->isSubRegister(DestReg, DescribedReg)) {
11352 Register SrcSubReg =
TRI->getSubReg(SrcReg, AArch64::sub_32);
11356 assert(!
TRI->isSuperOrSubRegisterEq(DestReg, DescribedReg) &&
11357 "Unhandled ORR[XW]rs copy case");
11359 return std::nullopt;
11362bool AArch64InstrInfo::isFunctionSafeToSplit(
const MachineFunction &MF)
const {
11367 if (MF.
getInfo<AArch64FunctionInfo>()->hasRedZone().value_or(
true))
11373bool AArch64InstrInfo::isMBBSafeToSplitToCold(
11377 auto isAsmGoto = [](
const MachineInstr &
MI) {
11378 return MI.getOpcode() == AArch64::INLINEASM_BR;
11388 auto containsMBB = [&
MBB](
const MachineJumpTableEntry &JTE) {
11395 for (
const MachineInstr &
MI :
MBB) {
11396 switch (
MI.getOpcode()) {
11397 case TargetOpcode::G_BRJT:
11398 case AArch64::JumpTableDest32:
11399 case AArch64::JumpTableDest16:
11400 case AArch64::JumpTableDest8:
11411std::optional<ParamLoadedValue>
11414 const MachineFunction *MF =
MI.getMF();
11416 switch (
MI.getOpcode()) {
11417 case AArch64::MOVZWi:
11418 case AArch64::MOVZXi: {
11421 if (!
TRI->isSuperRegisterEq(
MI.getOperand(0).getReg(),
Reg))
11422 return std::nullopt;
11424 if (!
MI.getOperand(1).isImm())
11425 return std::nullopt;
11426 int64_t Immediate =
MI.getOperand(1).getImm();
11427 int Shift =
MI.getOperand(2).getImm();
11431 case AArch64::ORRWrs:
11432 case AArch64::ORRXrs:
11439bool AArch64InstrInfo::isExtendLikelyToBeFolded(
11442 ExtMI.
getOpcode() == TargetOpcode::G_ZEXT ||
11443 ExtMI.
getOpcode() == TargetOpcode::G_ANYEXT);
11446 if (ExtMI.
getOpcode() == TargetOpcode::G_ANYEXT)
11456 return UserMI->
getOpcode() == TargetOpcode::G_PTR_ADD;
11459uint64_t AArch64InstrInfo::getElementSizeForOpcode(
unsigned Opc)
const {
11463bool AArch64InstrInfo::isPTestLikeOpcode(
unsigned Opc)
const {
11467bool AArch64InstrInfo::isWhileOpcode(
unsigned Opc)
const {
11472AArch64InstrInfo::getTailDuplicateSize(
CodeGenOptLevel OptLevel)
const {
11476bool AArch64InstrInfo::isLegalAddressingMode(
unsigned NumBytes, int64_t
Offset,
11477 unsigned Scale)
const {
11488 unsigned Shift =
Log2_64(NumBytes);
11489 if (NumBytes &&
Offset > 0 && (
Offset / NumBytes) <= (1LL << 12) - 1 &&
11497 return Scale == 1 || (Scale > 0 && Scale == NumBytes);
11502 return AArch64::BLRNoIP;
11504 return AArch64::BLR;
11510 auto Builder =
BuildMI(
MBB, InsertPt,
DL,
get(AArch64::PAUTH_EPILOGUE))
11520 if (Subtarget.hasPAuthLR())
11531 Register TargetReg,
bool FrameSetup)
const {
11532 assert(TargetReg != AArch64::SP &&
"New top of stack cannot already be in SP");
11544 MF.
insert(MBBInsertPoint, LoopTestMBB);
11547 MF.
insert(MBBInsertPoint, LoopBodyMBB);
11549 MF.
insert(MBBInsertPoint, ExitMBB);
11559 BuildMI(*LoopTestMBB, LoopTestMBB->
end(),
DL,
TII->get(AArch64::SUBSXrx64),
11567 BuildMI(*LoopTestMBB, LoopTestMBB->
end(),
DL,
TII->get(AArch64::Bcc))
11573 BuildMI(*LoopBodyMBB, LoopBodyMBB->
end(),
DL,
TII->get(AArch64::LDRXui))
11590 BuildMI(*ExitMBB, ExitMBB->
end(),
DL,
TII->get(AArch64::ADDXri), AArch64::SP)
11609 MBB.addSuccessor(LoopTestMBB);
11615 return ExitMBB->
begin();
11620 MachineFunction *MF;
11621 const TargetInstrInfo *
TII;
11622 const TargetRegisterInfo *
TRI;
11623 MachineRegisterInfo &MRI;
11626 MachineBasicBlock *LoopBB;
11628 MachineInstr *CondBranch;
11630 MachineInstr *Comp;
11632 unsigned CompCounterOprNum;
11634 MachineInstr *Update;
11636 unsigned UpdateCounterOprNum;
11640 bool IsUpdatePriorComp;
11646 AArch64PipelinerLoopInfo(MachineBasicBlock *LoopBB, MachineInstr *CondBranch,
11647 MachineInstr *Comp,
unsigned CompCounterOprNum,
11648 MachineInstr *Update,
unsigned UpdateCounterOprNum,
11649 Register Init,
bool IsUpdatePriorComp,
11650 const SmallVectorImpl<MachineOperand> &
Cond)
11652 TII(MF->getSubtarget().getInstrInfo()),
11653 TRI(MF->getSubtarget().getRegisterInfo()), MRI(MF->getRegInfo()),
11654 LoopBB(LoopBB), CondBranch(CondBranch), Comp(Comp),
11655 CompCounterOprNum(CompCounterOprNum), Update(Update),
11656 UpdateCounterOprNum(UpdateCounterOprNum), Init(Init),
11659 bool shouldIgnoreForPipelining(
const MachineInstr *
MI)
const override {
11665 std::optional<bool> createTripCountGreaterCondition(
11666 int TC, MachineBasicBlock &
MBB,
11667 SmallVectorImpl<MachineOperand> &CondParam)
override {
11675 void createRemainingIterationsGreaterCondition(
11676 int TC, MachineBasicBlock &
MBB, SmallVectorImpl<MachineOperand> &
Cond,
11677 DenseMap<MachineInstr *, MachineInstr *> &LastStage0Insts)
override;
11679 void setPreheader(MachineBasicBlock *NewPreheader)
override {}
11681 void adjustTripCount(
int TripCountAdjust)
override {}
11683 bool isMVEExpanderSupported()
override {
return true; }
11702 }
else if (
I == ReplaceOprNum) {
11707 MBB.insert(InsertTo, NewMI);
11711void AArch64PipelinerLoopInfo::createRemainingIterationsGreaterCondition(
11727 assert(CondBranch->getOpcode() == AArch64::Bcc);
11731 if (CondBranch->getOperand(1).getMBB() == LoopBB)
11738 auto AccumulateCond = [&](
Register CurCond,
11749 if (!LastStage0Insts.
empty() && LastStage0Insts[Comp]->getParent() == &
MBB) {
11753 for (
int I = 0;
I <= TC; ++
I) {
11759 AccCond = AccumulateCond(AccCond, CC);
11763 if (Update != Comp && IsUpdatePriorComp) {
11765 LastStage0Insts[Comp]->getOperand(CompCounterOprNum).getReg();
11766 NextCounter =
cloneInstr(Update, UpdateCounterOprNum, Counter,
MBB,
11770 NextCounter = LastStage0Insts[Update]->getOperand(0).getReg();
11772 }
else if (Update != Comp) {
11777 Counter = NextCounter;
11781 if (LastStage0Insts.
empty()) {
11785 if (IsUpdatePriorComp)
11790 Counter = LastStage0Insts[Comp]->getOperand(CompCounterOprNum).getReg();
11793 for (
int I = 0;
I <= TC; ++
I) {
11797 AccCond = AccumulateCond(AccCond, CC);
11798 if (
I != TC && Update != Comp)
11801 Counter = NextCounter;
11817 assert(Phi.getNumOperands() == 5);
11818 if (Phi.getOperand(2).getMBB() ==
MBB) {
11819 RegMBB = Phi.getOperand(1).getReg();
11820 RegOther = Phi.getOperand(3).getReg();
11822 assert(Phi.getOperand(4).getMBB() ==
MBB);
11823 RegMBB = Phi.getOperand(3).getReg();
11824 RegOther = Phi.getOperand(1).getReg();
11829 if (!
Reg.isVirtual())
11838 unsigned &UpdateCounterOprNum,
Register &InitReg,
11839 bool &IsUpdatePriorComp) {
11853 if (!
Reg.isVirtual())
11856 UpdateInst =
nullptr;
11857 UpdateCounterOprNum = 0;
11859 IsUpdatePriorComp =
true;
11863 if (Def->getParent() != LoopBB)
11865 if (Def->isCopy()) {
11867 if (Def->getOperand(0).getSubReg() || Def->getOperand(1).getSubReg())
11869 CurReg = Def->getOperand(1).getReg();
11870 }
else if (Def->isPHI()) {
11874 IsUpdatePriorComp =
false;
11879 switch (Def->getOpcode()) {
11880 case AArch64::ADDSXri:
11881 case AArch64::ADDSWri:
11882 case AArch64::SUBSXri:
11883 case AArch64::SUBSWri:
11884 case AArch64::ADDXri:
11885 case AArch64::ADDWri:
11886 case AArch64::SUBXri:
11887 case AArch64::SUBWri:
11889 UpdateCounterOprNum = 1;
11891 case AArch64::ADDSXrr:
11892 case AArch64::ADDSWrr:
11893 case AArch64::SUBSXrr:
11894 case AArch64::SUBSWrr:
11895 case AArch64::ADDXrr:
11896 case AArch64::ADDWrr:
11897 case AArch64::SUBXrr:
11898 case AArch64::SUBWrr:
11901 UpdateCounterOprNum = 1;
11903 UpdateCounterOprNum = 2;
11910 CurReg = Def->getOperand(UpdateCounterOprNum).getReg();
11925std::unique_ptr<TargetInstrInfo::PipelinerLoopInfo>
11936 if (
MI.isCall() ||
MI.hasUnmodeledSideEffects())
11947 if (
TBB == LoopBB && FBB == LoopBB)
11951 if (
TBB != LoopBB && FBB ==
nullptr)
11954 assert((
TBB == LoopBB || FBB == LoopBB) &&
11955 "The Loop must be a single-basic-block loop");
11960 if (CondBranch->
getOpcode() != AArch64::Bcc)
11968 unsigned CompCounterOprNum = 0;
11970 if (
MI.modifiesRegister(AArch64::NZCV, &
TRI)) {
11974 switch (
MI.getOpcode()) {
11975 case AArch64::SUBSXri:
11976 case AArch64::SUBSWri:
11977 case AArch64::ADDSXri:
11978 case AArch64::ADDSWri:
11980 CompCounterOprNum = 1;
11982 case AArch64::ADDSWrr:
11983 case AArch64::ADDSXrr:
11984 case AArch64::SUBSWrr:
11985 case AArch64::SUBSXrr:
11989 if (isWhileOpcode(
MI.getOpcode())) {
11996 if (CompCounterOprNum == 0) {
11998 CompCounterOprNum = 2;
12000 CompCounterOprNum = 1;
12012 bool IsUpdatePriorComp;
12013 unsigned UpdateCounterOprNum;
12015 Update, UpdateCounterOprNum,
Init, IsUpdatePriorComp))
12018 return std::make_unique<AArch64PipelinerLoopInfo>(
12019 LoopBB, CondBranch, Comp, CompCounterOprNum, Update, UpdateCounterOprNum,
12029 TypeSize Scale(0U,
false), Width(0U,
false);
12030 int64_t MinOffset, MaxOffset;
12031 if (
getMemOpInfo(
MI.getOpcode(), Scale, Width, MinOffset, MaxOffset)) {
12033 if (
MI.getOperand(ImmIdx).isImm() && !
MI.getOperand(ImmIdx - 1).isFI()) {
12034 int64_t Imm =
MI.getOperand(ImmIdx).getImm();
12035 if (Imm < MinOffset || Imm > MaxOffset) {
12036 ErrInfo =
"Unexpected immediate on load/store instruction";
12042 const MCInstrDesc &MCID =
MI.getDesc();
12044 const MachineOperand &MO =
MI.getOperand(
Op);
12048 ErrInfo =
"OPERAND_IMPLICIT_IMM_0 should be 0";
12057 ErrInfo =
"OPERAND_SHIFT_MSL should be msl shift of 8 or 16";
12068#define GET_INSTRINFO_HELPERS
12069#define GET_INSTRMAP_INFO
12070#include "AArch64GenInstrInfo.inc"
MachineInstrBuilder & UseMI
MachineInstrBuilder MachineInstrBuilder & DefMI
static bool forwardCopyWillClobberTuple(unsigned DestReg, unsigned SrcReg, unsigned NumRegs)
static cl::opt< unsigned > BCCDisplacementBits("aarch64-bcc-offset-bits", cl::Hidden, cl::init(19), cl::desc("Restrict range of Bcc instructions (DEBUG)"))
static Register genNeg(MachineFunction &MF, MachineRegisterInfo &MRI, const TargetInstrInfo *TII, MachineInstr &Root, SmallVectorImpl< MachineInstr * > &InsInstrs, DenseMap< Register, unsigned > &InstrIdxForVirtReg, unsigned MnegOpc, const TargetRegisterClass *RC)
genNeg - Helper to generate an intermediate negation of the second operand of Root
static bool isFrameStoreOpcode(int Opcode)
static cl::opt< unsigned > GatherOptSearchLimit("aarch64-search-limit", cl::Hidden, cl::init(2048), cl::desc("Restrict range of instructions to search for the " "machine-combiner gather pattern optimization"))
static bool getMaddPatterns(MachineInstr &Root, SmallVectorImpl< unsigned > &Patterns)
Find instructions that can be turned into madd.
static AArch64CC::CondCode findCondCodeUsedByInstr(const MachineInstr &Instr)
Find a condition code used by the instruction.
static MachineInstr * genFusedMultiplyAcc(MachineFunction &MF, MachineRegisterInfo &MRI, const TargetInstrInfo *TII, MachineInstr &Root, SmallVectorImpl< MachineInstr * > &InsInstrs, unsigned IdxMulOpd, unsigned MaddOpc, const TargetRegisterClass *RC)
genFusedMultiplyAcc - Helper to generate fused multiply accumulate instructions.
static MachineInstr * genFusedMultiplyAccNeg(MachineFunction &MF, MachineRegisterInfo &MRI, const TargetInstrInfo *TII, MachineInstr &Root, SmallVectorImpl< MachineInstr * > &InsInstrs, DenseMap< Register, unsigned > &InstrIdxForVirtReg, unsigned IdxMulOpd, unsigned MaddOpc, unsigned MnegOpc, const TargetRegisterClass *RC)
genFusedMultiplyAccNeg - Helper to generate fused multiply accumulate instructions with an additional...
static bool isCombineInstrCandidate64(unsigned Opc)
static bool isFrameLoadOpcode(int Opcode)
static unsigned removeCopies(const MachineRegisterInfo &MRI, unsigned VReg)
static bool areCFlagsAccessedBetweenInstrs(MachineBasicBlock::iterator From, MachineBasicBlock::iterator To, const TargetRegisterInfo *TRI, const AccessKind AccessToCheck=AK_All)
True when condition flags are accessed (either by writing or reading) on the instruction trace starti...
static bool getFMAPatterns(MachineInstr &Root, SmallVectorImpl< unsigned > &Patterns)
Floating-Point Support.
static bool isADDSRegImm(unsigned Opcode)
static bool isCheapCopy(const MachineInstr &MI, const AArch64RegisterInfo &RI)
static bool isANDOpcode(MachineInstr &MI)
static void appendOffsetComment(int NumBytes, llvm::raw_string_ostream &Comment, StringRef RegScale={})
static unsigned sForm(MachineInstr &Instr)
Get opcode of S version of Instr.
static bool isCombineInstrSettingFlag(unsigned Opc)
static bool getFNEGPatterns(MachineInstr &Root, SmallVectorImpl< unsigned > &Patterns)
static bool getIndVarInfo(Register Reg, const MachineBasicBlock *LoopBB, MachineInstr *&UpdateInst, unsigned &UpdateCounterOprNum, Register &InitReg, bool &IsUpdatePriorComp)
If Reg is an induction variable, return true and set some parameters.
static bool canPairLdStOpc(unsigned FirstOpc, unsigned SecondOpc)
static bool mustAvoidNeonAtMBBI(const AArch64Subtarget &Subtarget, MachineBasicBlock &MBB, MachineBasicBlock::iterator I)
Returns true if in a streaming call site region without SME-FA64.
static bool isPostIndexLdStOpcode(unsigned Opcode)
Return true if the opcode is a post-index ld/st instruction, which really loads from base+0.
static std::optional< unsigned > getLFIInstSizeInBytes(const MachineInstr &MI)
Return the maximum number of bytes of code the specified instruction may be after LFI rewriting.
static unsigned getBranchDisplacementBits(unsigned Opc)
static cl::opt< unsigned > CBDisplacementBits("aarch64-cb-offset-bits", cl::Hidden, cl::init(9), cl::desc("Restrict range of CB instructions (DEBUG)"))
static std::optional< ParamLoadedValue > describeORRLoadedValue(const MachineInstr &MI, Register DescribedReg, const TargetInstrInfo *TII, const TargetRegisterInfo *TRI)
If the given ORR instruction is a copy, and DescribedReg overlaps with the destination register then,...
static bool getFMULPatterns(MachineInstr &Root, SmallVectorImpl< unsigned > &Patterns)
static void appendReadRegExpr(SmallVectorImpl< char > &Expr, unsigned RegNum)
static MachineInstr * genMaddR(MachineFunction &MF, MachineRegisterInfo &MRI, const TargetInstrInfo *TII, MachineInstr &Root, SmallVectorImpl< MachineInstr * > &InsInstrs, unsigned IdxMulOpd, unsigned MaddOpc, unsigned VR, const TargetRegisterClass *RC)
genMaddR - Generate madd instruction and combine mul and add using an extra virtual register Example ...
static Register cloneInstr(const MachineInstr *MI, unsigned ReplaceOprNum, Register ReplaceReg, MachineBasicBlock &MBB, MachineBasicBlock::iterator InsertTo)
Clone an instruction from MI.
static bool scaleOffset(unsigned Opc, int64_t &Offset)
static bool canCombineWithFMUL(MachineBasicBlock &MBB, MachineOperand &MO, unsigned MulOpc)
unsigned scaledOffsetOpcode(unsigned Opcode, unsigned &Scale)
static MachineInstr * genFusedMultiplyIdx(MachineFunction &MF, MachineRegisterInfo &MRI, const TargetInstrInfo *TII, MachineInstr &Root, SmallVectorImpl< MachineInstr * > &InsInstrs, unsigned IdxMulOpd, unsigned MaddOpc, const TargetRegisterClass *RC)
genFusedMultiplyIdx - Helper to generate fused multiply accumulate instructions.
static MachineInstr * genIndexedMultiply(MachineInstr &Root, SmallVectorImpl< MachineInstr * > &InsInstrs, unsigned IdxDupOp, unsigned MulOpc, const TargetRegisterClass *RC, MachineRegisterInfo &MRI)
Fold (FMUL x (DUP y lane)) into (FMUL_indexed x y lane)
static bool isSUBSRegImm(unsigned Opcode)
static bool UpdateOperandRegClass(MachineInstr &Instr)
static const TargetRegisterClass * getRegClass(const MachineInstr &MI, Register Reg)
static bool isInStreamingCallSiteRegion(MachineBasicBlock &MBB, MachineBasicBlock::iterator I)
Returns true if the instruction at I is in a streaming call site region, within a single basic block.
static bool canCmpInstrBeRemoved(MachineInstr &MI, MachineInstr &CmpInstr, int CmpValue, const TargetRegisterInfo &TRI, SmallVectorImpl< MachineInstr * > &CCUseInstrs, bool &IsInvertCC)
unsigned unscaledOffsetOpcode(unsigned Opcode)
static bool getLoadPatterns(MachineInstr &Root, SmallVectorImpl< unsigned > &Patterns)
Search for patterns of LD instructions we can optimize.
static bool canInstrSubstituteCmpInstr(MachineInstr &MI, MachineInstr &CmpInstr, const TargetRegisterInfo &TRI)
Check if CmpInstr can be substituted by MI.
static UsedNZCV getUsedNZCV(AArch64CC::CondCode CC)
static bool isCombineInstrCandidateFP(const MachineInstr &Inst)
static void appendLoadRegExpr(SmallVectorImpl< char > &Expr, int64_t OffsetFromDefCFA)
static void appendConstantExpr(SmallVectorImpl< char > &Expr, int64_t Constant, dwarf::LocationAtom Operation)
static unsigned convertToNonFlagSettingOpc(const MachineInstr &MI)
Return the opcode that does not set flags when possible - otherwise return the original opcode.
static bool outliningCandidatesV8_3OpsConsensus(const outliner::Candidate &a, const outliner::Candidate &b)
static bool isCombineInstrCandidate32(unsigned Opc)
static void parseCondBranch(MachineInstr *LastInst, MachineBasicBlock *&Target, SmallVectorImpl< MachineOperand > &Cond)
static unsigned offsetExtendOpcode(unsigned Opcode)
static void loadRegPairFromStackSlot(const TargetRegisterInfo &TRI, MachineBasicBlock &MBB, MachineBasicBlock::iterator InsertBefore, const MCInstrDesc &MCID, Register DestReg, unsigned SubIdx0, unsigned SubIdx1, int FI, MachineMemOperand *MMO)
static void generateGatherLanePattern(MachineInstr &Root, SmallVectorImpl< MachineInstr * > &InsInstrs, SmallVectorImpl< MachineInstr * > &DelInstrs, DenseMap< Register, unsigned > &InstrIdxForVirtReg, unsigned Pattern, unsigned NumLanes)
Generate optimized instruction sequence for gather load patterns to improve Memory-Level Parallelism ...
static bool getMiscPatterns(MachineInstr &Root, SmallVectorImpl< unsigned > &Patterns)
Find other MI combine patterns.
static bool outliningCandidatesSigningKeyConsensus(const outliner::Candidate &a, const outliner::Candidate &b)
static const MachineInstrBuilder & AddSubReg(const MachineInstrBuilder &MIB, MCRegister Reg, unsigned SubIdx, RegState State, const TargetRegisterInfo *TRI)
static bool outliningCandidatesSigningScopeConsensus(const outliner::Candidate &a, const outliner::Candidate &b)
static bool shouldClusterFI(const MachineFrameInfo &MFI, int FI1, int64_t Offset1, unsigned Opcode1, int FI2, int64_t Offset2, unsigned Opcode2)
static cl::opt< unsigned > TBZDisplacementBits("aarch64-tbz-offset-bits", cl::Hidden, cl::init(14), cl::desc("Restrict range of TB[N]Z instructions (DEBUG)"))
static void extractPhiReg(const MachineInstr &Phi, const MachineBasicBlock *MBB, Register &RegMBB, Register &RegOther)
static MCCFIInstruction createDefCFAExpression(const TargetRegisterInfo &TRI, unsigned Reg, const StackOffset &Offset)
static bool isDefinedOutside(Register Reg, const MachineBasicBlock *BB)
static MachineInstr * genFusedMultiply(MachineFunction &MF, MachineRegisterInfo &MRI, const TargetInstrInfo *TII, MachineInstr &Root, SmallVectorImpl< MachineInstr * > &InsInstrs, unsigned IdxMulOpd, unsigned MaddOpc, const TargetRegisterClass *RC, FMAInstKind kind=FMAInstKind::Default, const Register *ReplacedAddend=nullptr)
genFusedMultiply - Generate fused multiply instructions.
static bool getGatherLanePattern(MachineInstr &Root, SmallVectorImpl< unsigned > &Patterns, unsigned LoadLaneOpCode, unsigned NumLanes)
Check if the given instruction forms a gather load pattern that can be optimized for better Memory-Le...
static MachineInstr * genFusedMultiplyIdxNeg(MachineFunction &MF, MachineRegisterInfo &MRI, const TargetInstrInfo *TII, MachineInstr &Root, SmallVectorImpl< MachineInstr * > &InsInstrs, DenseMap< Register, unsigned > &InstrIdxForVirtReg, unsigned IdxMulOpd, unsigned MaddOpc, unsigned MnegOpc, const TargetRegisterClass *RC)
genFusedMultiplyAccNeg - Helper to generate fused multiply accumulate instructions with an additional...
static bool isCombineInstrCandidate(unsigned Opc)
static unsigned regOffsetOpcode(unsigned Opcode)
MachineOutlinerClass
Constants defining how certain sequences should be outlined.
@ MachineOutlinerTailCall
Emit a save, restore, call, and return.
@ MachineOutlinerRegSave
Emit a call and tail-call.
@ MachineOutlinerNoLRSave
Only emit a branch.
@ MachineOutlinerThunk
Emit a call and return.
static cl::opt< unsigned > BDisplacementBits("aarch64-b-offset-bits", cl::Hidden, cl::init(26), cl::desc("Restrict range of B instructions (DEBUG)"))
static bool areCFlagsAliveInSuccessors(const MachineBasicBlock *MBB)
Check if AArch64::NZCV should be alive in successors of MBB.
static void emitFrameOffsetAdj(MachineBasicBlock &MBB, MachineBasicBlock::iterator MBBI, const DebugLoc &DL, unsigned DestReg, unsigned SrcReg, int64_t Offset, unsigned Opc, const TargetInstrInfo *TII, MachineInstr::MIFlag Flag, bool NeedsWinCFI, bool *HasWinCFI, bool EmitCFAOffset, StackOffset CFAOffset, unsigned FrameReg)
static bool isCheapImmediate(const MachineInstr &MI, unsigned BitSize)
static cl::opt< unsigned > CBZDisplacementBits("aarch64-cbz-offset-bits", cl::Hidden, cl::init(19), cl::desc("Restrict range of CB[N]Z instructions (DEBUG)"))
static void genSubAdd2SubSub(MachineFunction &MF, MachineRegisterInfo &MRI, const TargetInstrInfo *TII, MachineInstr &Root, SmallVectorImpl< MachineInstr * > &InsInstrs, SmallVectorImpl< MachineInstr * > &DelInstrs, unsigned IdxOpd1, DenseMap< Register, unsigned > &InstrIdxForVirtReg)
Do the following transformation A - (B + C) ==> (A - B) - C A - (B + C) ==> (A - C) - B.
static unsigned canFoldIntoCSel(const MachineRegisterInfo &MRI, unsigned VReg, unsigned *NewReg=nullptr)
static void signOutlinedFunction(MachineFunction &MF, MachineBasicBlock &MBB, const AArch64InstrInfo *TII, bool ShouldSignReturnAddr)
static MachineInstr * genFNegatedMAD(MachineFunction &MF, MachineRegisterInfo &MRI, const TargetInstrInfo *TII, MachineInstr &Root, SmallVectorImpl< MachineInstr * > &InsInstrs)
static bool canCombineWithMUL(MachineBasicBlock &MBB, MachineOperand &MO, unsigned MulOpc, unsigned ZeroReg)
static void storeRegPairToStackSlot(const TargetRegisterInfo &TRI, MachineBasicBlock &MBB, MachineBasicBlock::iterator InsertBefore, const MCInstrDesc &MCID, Register SrcReg, bool IsKill, unsigned SubIdx0, unsigned SubIdx1, int FI, MachineMemOperand *MMO)
assert(UImm &&(UImm !=~static_cast< T >(0)) &&"Invalid immediate!")
MachineBasicBlock MachineBasicBlock::iterator DebugLoc DL
MachineBasicBlock MachineBasicBlock::iterator MBBI
static const Function * getParent(const Value *V)
static GCRegistry::Add< ErlangGC > A("erlang", "erlang-compatible garbage collector")
static GCRegistry::Add< OcamlGC > B("ocaml", "ocaml 3.10-compatible GC")
DXIL Forward Handle Accesses
const HexagonInstrInfo * TII
Module.h This file contains the declarations for the Module class.
const AbstractManglingParser< Derived, Alloc >::OperatorInfo AbstractManglingParser< Derived, Alloc >::Ops[]
This file implements the LivePhysRegs utility for tracking liveness of physical registers.
Machine Check Debug Module
Register const TargetRegisterInfo * TRI
Promote Memory to Register
static MCRegister getReg(const MCDisassembler *D, unsigned RC, unsigned RegNo)
MachineInstr unsigned OpIdx
ConstantRange Range(APInt(BitWidth, Low), APInt(BitWidth, High))
PowerPC Reduce CR logical Operation
const SmallVectorImpl< MachineOperand > MachineBasicBlock * TBB
const SmallVectorImpl< MachineOperand > & Cond
This file declares the machine register scavenger class.
static bool contains(SmallPtrSetImpl< ConstantExpr * > &Cache, ConstantExpr *Expr, Constant *C)
This file defines the SmallSet class.
This file defines the SmallVector class.
This file defines the 'Statistic' class, which is designed to be an easy way to expose various metric...
#define STATISTIC(VARNAME, DESC)
#define DEBUG_WITH_TYPE(TYPE,...)
DEBUG_WITH_TYPE macro - This macro should be used by passes to emit debug information.
static bool canCombine(MachineBasicBlock &MBB, MachineOperand &MO, unsigned CombineOpc=0)
AArch64FunctionInfo - This class is derived from MachineFunctionInfo and contains private AArch64-spe...
bool branchTargetEnforcement() const
unsigned getArgumentStackToRestore() const
SignReturnAddress getSignReturnAddressCondition() const
bool hasStreamingModeChanges() const
void setOutliningStyle(const std::string &Style)
bool branchProtectionPAuthLR() const
std::optional< bool > hasRedZone() const
static bool shouldSignReturnAddress(SignReturnAddress Condition, bool IsLRSpilled)
bool shouldSignWithBKey() const
static bool isHForm(const MachineInstr &MI)
Returns whether the instruction is in H form (16 bit operands)
void insertSelect(MachineBasicBlock &MBB, MachineBasicBlock::iterator MI, const DebugLoc &DL, Register DstReg, ArrayRef< MachineOperand > Cond, Register TrueReg, Register FalseReg) const override
static bool hasBTISemantics(const MachineInstr &MI)
Returns whether the instruction can be compatible with non-zero BTYPE.
static bool isQForm(const MachineInstr &MI)
Returns whether the instruction is in Q form (128 bit operands)
static bool getMemOpInfo(unsigned Opcode, TypeSize &Scale, TypeSize &Width, int64_t &MinOffset, int64_t &MaxOffset)
Returns true if opcode Opc is a memory operation.
static bool isTailCallReturnInst(const MachineInstr &MI)
Returns true if MI is one of the TCRETURN* instructions.
static bool isFPRCopy(const MachineInstr &MI)
Does this instruction rename an FPR without modifying bits?
MachineInstr * emitLdStWithAddr(MachineInstr &MemI, const ExtAddrMode &AM) const override
std::optional< DestSourcePair > isCopyInstrImpl(const MachineInstr &MI) const override
If the specific machine instruction is an instruction that moves/copies value from one register to an...
MachineBasicBlock * getBranchDestBlock(const MachineInstr &MI) const override
unsigned getInstSizeInBytes(const MachineInstr &MI) const override
GetInstSize - Return the number of bytes of code the specified instruction may be.
static bool isZExtLoad(const MachineInstr &MI)
Returns whether the instruction is a zero-extending load.
bool areMemAccessesTriviallyDisjoint(const MachineInstr &MIa, const MachineInstr &MIb) const override
void copyPhysReg(MachineBasicBlock &MBB, MachineBasicBlock::iterator I, const DebugLoc &DL, Register DestReg, Register SrcReg, bool KillSrc, bool RenamableDest=false, bool RenamableSrc=false) const override
static bool isGPRCopy(const MachineInstr &MI)
Does this instruction rename a GPR without modifying bits?
static unsigned convertToFlagSettingOpc(unsigned Opc)
Return the opcode that set flags when possible.
void createPauthEpilogueInstr(MachineBasicBlock &MBB, DebugLoc DL) const
Return true when there is potentially a faster code sequence for an instruction chain ending in Root.
bool isBranchOffsetInRange(unsigned BranchOpc, int64_t BrOffset) const override
bool canInsertSelect(const MachineBasicBlock &, ArrayRef< MachineOperand > Cond, Register, Register, Register, int &, int &, int &) const override
Register isLoadFromStackSlotPostFE(const MachineInstr &MI, int &FrameIndex) const override
Check for post-frame ptr elimination stack locations as well.
static const MachineOperand & getLdStOffsetOp(const MachineInstr &MI)
Returns the immediate offset operator of a load/store.
bool isCoalescableExtInstr(const MachineInstr &MI, Register &SrcReg, Register &DstReg, unsigned &SubIdx) const override
static std::optional< unsigned > getUnscaledLdSt(unsigned Opc)
Returns the unscaled load/store for the scaled load/store opcode, if there is a corresponding unscale...
static bool hasUnscaledLdStOffset(unsigned Opc)
Return true if it has an unscaled load/store offset.
static const MachineOperand & getLdStAmountOp(const MachineInstr &MI)
Returns the shift amount operator of a load/store.
static bool isPreLdSt(const MachineInstr &MI)
Returns whether the instruction is a pre-indexed load/store.
std::optional< ExtAddrMode > getAddrModeFromMemoryOp(const MachineInstr &MemI, const TargetRegisterInfo *TRI) const override
bool getMemOperandsWithOffsetWidth(const MachineInstr &MI, SmallVectorImpl< const MachineOperand * > &BaseOps, int64_t &Offset, bool &OffsetIsScalable, LocationSize &Width, const TargetRegisterInfo *TRI) const override
bool analyzeBranchPredicate(MachineBasicBlock &MBB, MachineBranchPredicate &MBP, bool AllowModify) const override
void insertIndirectBranch(MachineBasicBlock &MBB, MachineBasicBlock &NewDestBB, MachineBasicBlock &RestoreBB, const DebugLoc &DL, int64_t BrOffset, RegScavenger *RS) const override
void loadRegFromStackSlot(MachineBasicBlock &MBB, MachineBasicBlock::iterator MBBI, Register DestReg, int FrameIndex, const TargetRegisterClass *RC, Register VReg, unsigned SubReg=0, MachineInstr::MIFlag Flags=MachineInstr::NoFlags) const override
static bool isPairableLdStInst(const MachineInstr &MI)
Return true if pairing the given load or store may be paired with another.
void storeRegToStackSlot(MachineBasicBlock &MBB, MachineBasicBlock::iterator MBBI, Register SrcReg, bool isKill, int FrameIndex, const TargetRegisterClass *RC, Register VReg, MachineInstr::MIFlag Flags=MachineInstr::NoFlags) const override
static bool isSExtLoad(const MachineInstr &MI)
Returns whether the instruction is a sign-extending load.
const AArch64RegisterInfo & getRegisterInfo() const
getRegisterInfo - TargetInstrInfo is a superset of MRegister info.
static bool isPreSt(const MachineInstr &MI)
Returns whether the instruction is a pre-indexed store.
void insertNoop(MachineBasicBlock &MBB, MachineBasicBlock::iterator MI) const override
AArch64InstrInfo(const AArch64Subtarget &STI)
static bool isPairedLdSt(const MachineInstr &MI)
Returns whether the instruction is a paired load/store.
MachineInstr * foldMemoryOperandImpl(MachineFunction &MF, MachineInstr &MI, ArrayRef< unsigned > Ops, int FrameIndex, MachineInstr *&CopyMI, LiveIntervals *LIS=nullptr, VirtRegMap *VRM=nullptr) const override
bool getMemOperandWithOffsetWidth(const MachineInstr &MI, const MachineOperand *&BaseOp, int64_t &Offset, bool &OffsetIsScalable, TypeSize &Width, const TargetRegisterInfo *TRI) const
If OffsetIsScalable is set to 'true', the offset is scaled by vscale.
Register isLoadFromStackSlot(const MachineInstr &MI, int &FrameIndex) const override
bool reverseBranchCondition(SmallVectorImpl< MachineOperand > &Cond) const override
static bool isStridedAccess(const MachineInstr &MI)
Return true if the given load or store is a strided memory access.
bool shouldClusterMemOps(ArrayRef< const MachineOperand * > BaseOps1, int64_t Offset1, bool OffsetIsScalable1, ArrayRef< const MachineOperand * > BaseOps2, int64_t Offset2, bool OffsetIsScalable2, unsigned ClusterSize, unsigned NumBytes) const override
Detect opportunities for ldp/stp formation.
unsigned removeBranch(MachineBasicBlock &MBB, int *BytesRemoved=nullptr) const override
bool isThroughputPattern(unsigned Pattern) const override
Return true when a code sequence can improve throughput.
MachineOperand & getMemOpBaseRegImmOfsOffsetOperand(MachineInstr &LdSt) const
Return the immediate offset of the base register in a load/store LdSt.
bool analyzeBranch(MachineBasicBlock &MBB, MachineBasicBlock *&TBB, MachineBasicBlock *&FBB, SmallVectorImpl< MachineOperand > &Cond, bool AllowModify=false) const override
bool canFoldIntoAddrMode(const MachineInstr &MemI, Register Reg, const MachineInstr &AddrI, ExtAddrMode &AM) const override
static bool isLdStPairSuppressed(const MachineInstr &MI)
Return true if pairing the given load or store is hinted to be unprofitable.
Register isStoreToStackSlotPostFE(const MachineInstr &MI, int &FrameIndex) const override
Check for post-frame ptr elimination stack locations as well.
std::unique_ptr< TargetInstrInfo::PipelinerLoopInfo > analyzeLoopForPipelining(MachineBasicBlock *LoopBB) const override
bool isSchedulingBoundary(const MachineInstr &MI, const MachineBasicBlock *MBB, const MachineFunction &MF) const override
unsigned insertBranch(MachineBasicBlock &MBB, MachineBasicBlock *TBB, MachineBasicBlock *FBB, ArrayRef< MachineOperand > Cond, const DebugLoc &DL, int *BytesAdded=nullptr) const override
bool optimizeCompareInstr(MachineInstr &CmpInstr, Register SrcReg, Register SrcReg2, int64_t CmpMask, int64_t CmpValue, const MachineRegisterInfo *MRI) const override
optimizeCompareInstr - Convert the instruction supplying the argument to the comparison into one that...
static unsigned getLoadStoreImmIdx(unsigned Opc)
Returns the index for the immediate for a given instruction.
static bool isGPRZero(const MachineInstr &MI)
Does this instruction set its full destination register to zero?
void copyGPRRegTuple(MachineBasicBlock &MBB, MachineBasicBlock::iterator I, const DebugLoc &DL, MCRegister DestReg, MCRegister SrcReg, bool KillSrc, unsigned Opcode, unsigned ZeroReg, llvm::ArrayRef< unsigned > Indices) const
bool analyzeCompare(const MachineInstr &MI, Register &SrcReg, Register &SrcReg2, int64_t &CmpMask, int64_t &CmpValue) const override
analyzeCompare - For a comparison instruction, return the source registers in SrcReg and SrcReg2,...
CombinerObjective getCombinerObjective(unsigned Pattern) const override
static bool isFpOrNEON(Register Reg)
Returns whether the physical register is FP or NEON.
bool isAsCheapAsAMove(const MachineInstr &MI) const override
std::optional< DestSourcePair > isCopyLikeInstrImpl(const MachineInstr &MI) const override
static void suppressLdStPair(MachineInstr &MI)
Hint that pairing the given load or store is unprofitable.
Register isStoreToStackSlot(const MachineInstr &MI, int &FrameIndex) const override
static bool isPreLd(const MachineInstr &MI)
Returns whether the instruction is a pre-indexed load.
void copyPhysRegTuple(MachineBasicBlock &MBB, MachineBasicBlock::iterator I, const DebugLoc &DL, MCRegister DestReg, MCRegister SrcReg, bool KillSrc, unsigned Opcode, llvm::ArrayRef< unsigned > Indices) const
bool optimizeCondBranch(MachineInstr &MI) const override
Replace csincr-branch sequence by simple conditional branch.
static int getMemScale(unsigned Opc)
Scaling factor for (scaled or unscaled) load or store.
bool isCandidateToMergeOrPair(const MachineInstr &MI) const
Return true if this is a load/store that can be potentially paired/merged.
MCInst getNop() const override
static const MachineOperand & getLdStBaseOp(const MachineInstr &MI)
Returns the base register operator of a load/store.
bool isReservedReg(const MachineFunction &MF, MCRegister Reg) const
const AArch64RegisterInfo * getRegisterInfo() const override
bool isNeonAvailable() const
Returns true if the target has NEON and the function at runtime is known to have NEON enabled (e....
bool isSVEorStreamingSVEAvailable() const
Returns true if the target has access to either the full range of SVE instructions,...
Represent a constant reference to an array (0 or more elements consecutively in memory),...
const T & front() const
Get the first element.
size_t size() const
Get the array size.
This is an important base class in LLVM.
std::pair< iterator, bool > insert(const std::pair< KeyT, ValueT > &KV)
bool hasOptSize() const
Optimize this function for size (-Os) or minimum size (-Oz).
bool hasMinSize() const
Optimize this function for minimum size (-Oz).
Module * getParent()
Get the module that this global value is contained inside of...
LLVM_ABI InstListType::iterator eraseFromParent()
This method unlinks 'this' from the containing basic block and deletes it.
unsigned getOpcode() const
Returns a member of one of the enums like Instruction::Add.
static LocationSize precise(uint64_t Value)
This class is intended to be used as a base class for asm properties and features specific to the tar...
bool usesWindowsCFI() const
static MCCFIInstruction cfiDefCfa(MCSymbol *L, unsigned Register, int64_t Offset, SMLoc Loc={})
.cfi_def_cfa defines a rule for computing CFA as: take address from Register and add Offset to it.
static MCCFIInstruction createOffset(MCSymbol *L, unsigned Register, int64_t Offset, SMLoc Loc={})
.cfi_offset Previous value of Register is saved at offset Offset from CFA.
static MCCFIInstruction cfiDefCfaOffset(MCSymbol *L, int64_t Offset, SMLoc Loc={})
.cfi_def_cfa_offset modifies a rule for computing CFA.
static MCCFIInstruction createEscape(MCSymbol *L, StringRef Vals, SMLoc Loc={}, StringRef Comment="")
.cfi_escape Allows the user to add arbitrary bytes to the unwind info.
Instances of this class represent a single low-level machine instruction.
Describe properties that are true of each instruction in the target description file.
unsigned getNumOperands() const
Return the number of declared MachineOperands for this MachineInstruction.
ArrayRef< MCOperandInfo > operands() const
Wrapper class representing physical registers. Should be passed by value.
constexpr bool isValid() const
static constexpr unsigned NoRegister
static MDTuple * get(LLVMContext &Context, ArrayRef< Metadata * > MDs)
bool isInlineAsmBrIndirectTarget() const
Returns true if this is the indirect dest of an INLINEASM_BR.
unsigned pred_size() const
LLVM_ABI void transferSuccessorsAndUpdatePHIs(MachineBasicBlock *FromMBB)
Transfers all the successors, as in transferSuccessors, and update PHI operands in the successor bloc...
LLVM_ABI instr_iterator insert(instr_iterator I, MachineInstr *M)
Insert MI into the instruction list before I, possibly inside a bundle.
reverse_instr_iterator instr_rbegin()
LLVM_ABI iterator getFirstTerminator()
Returns an iterator to the first terminator instruction of this basic block.
LLVM_ABI void addSuccessor(MachineBasicBlock *Succ, BranchProbability Prob=BranchProbability::getUnknown())
Add Succ as a successor of this MachineBasicBlock.
reverse_instr_iterator instr_rend()
Instructions::iterator instr_iterator
instr_iterator instr_end()
void addLiveIn(MCRegister PhysReg, LaneBitmask LaneMask=LaneBitmask::getAll())
Adds the specified register as a live in.
const MachineFunction * getParent() const
Return the MachineFunction containing this basic block.
LLVM_ABI instr_iterator erase(instr_iterator I)
Remove an instruction from the instruction list and delete it.
void splice(iterator Where, MachineBasicBlock *Other, iterator From)
Take an instruction from MBB 'Other' at the position From, and insert it into this MBB right before '...
MachineInstrBundleIterator< MachineInstr > iterator
void setMachineBlockAddressTaken()
Set this block to indicate that its address is used as something other than the target of a terminato...
LLVM_ABI bool isLiveIn(MCRegister Reg, LaneBitmask LaneMask=LaneBitmask::getAll()) const
Return true if the specified register is in the live in set.
The MachineFrameInfo class represents an abstract stack frame until prolog/epilog code is inserted.
uint64_t getStackSize() const
Return the number of bytes that must be allocated to hold all of the fixed size frame objects.
void setStackID(int ObjectIdx, uint8_t ID)
bool isCalleeSavedInfoValid() const
Has the callee saved info been calculated yet?
Align getObjectAlign(int ObjectIdx) const
Return the alignment of the specified stack object.
int64_t getObjectSize(int ObjectIdx) const
Return the size of the specified object.
unsigned getNumObjects() const
Return the number of objects.
int64_t getObjectOffset(int ObjectIdx) const
Return the assigned stack offset of the specified object from the incoming stack pointer.
bool isFixedObjectIndex(int ObjectIdx) const
Returns true if the specified index corresponds to a fixed stack object.
unsigned addFrameInst(const MCCFIInstruction &Inst)
const TargetSubtargetInfo & getSubtarget() const
getSubtarget - Return the subtarget for which this machine code is being compiled.
StringRef getName() const
getName - Return the name of the corresponding LLVM function.
MachineMemOperand * getMachineMemOperand(MachinePointerInfo PtrInfo, MachineMemOperand::Flags f, LLT MemTy, Align base_alignment, const AAMDNodes &AAInfo=AAMDNodes(), const MDNode *Ranges=nullptr, SyncScope::ID SSID=SyncScope::System, AtomicOrdering Ordering=AtomicOrdering::NotAtomic, AtomicOrdering FailureOrdering=AtomicOrdering::NotAtomic)
getMachineMemOperand - Allocate a new MachineMemOperand.
MachineFrameInfo & getFrameInfo()
getFrameInfo - Return the frame info object for the current function.
MachineRegisterInfo & getRegInfo()
getRegInfo - Return information about the registers currently in use.
Function & getFunction()
Return the LLVM function that this machine code represents.
BasicBlockListType::iterator iterator
Ty * getInfo()
getInfo - Keep track of various per-function pieces of information for backends that would like to do...
const MachineJumpTableInfo * getJumpTableInfo() const
getJumpTableInfo - Return the jump table info object for the current function.
MachineBasicBlock * CreateMachineBasicBlock(const BasicBlock *BB=nullptr, std::optional< UniqueBBID > BBID=std::nullopt)
CreateMachineInstr - Allocate a new MachineInstr.
void insert(iterator MBBI, MachineBasicBlock *MBB)
const TargetMachine & getTarget() const
getTarget - Return the target machine this machine code is compiled with
const MachineInstrBuilder & setMemRefs(ArrayRef< MachineMemOperand * > MMOs) const
const MachineInstrBuilder & addCFIIndex(unsigned CFIIndex) const
const MachineInstrBuilder & addUse(Register RegNo, RegState Flags={}, unsigned SubReg=0) const
Add a virtual register use operand.
const MachineInstrBuilder & addReg(Register RegNo, RegState Flags={}, unsigned SubReg=0) const
Add a new virtual register operand.
const MachineInstrBuilder & setMIFlag(MachineInstr::MIFlag Flag) const
const MachineInstrBuilder & addImm(int64_t Val) const
Add a new immediate operand.
const MachineInstrBuilder & add(const MachineOperand &MO) const
const MachineInstrBuilder & addSym(MCSymbol *Sym, unsigned char TargetFlags=0) const
const MachineInstrBuilder & addFrameIndex(int Idx) const
const MachineInstrBuilder & addGlobalAddress(const GlobalValue *GV, int64_t Offset=0, unsigned TargetFlags=0) const
const MachineInstrBuilder & addMBB(MachineBasicBlock *MBB, unsigned TargetFlags=0) const
const MachineInstrBuilder & addDef(Register RegNo, RegState Flags={}, unsigned SubReg=0) const
Add a virtual register definition operand.
const MachineInstrBuilder & setMIFlags(unsigned Flags) const
const MachineInstrBuilder & addMemOperand(MachineMemOperand *MMO) const
reverse_iterator getReverse() const
Get a reverse iterator to the same node.
Representation of each machine instruction.
unsigned getOpcode() const
Returns the opcode of this MachineInstr.
bool mayLoadOrStore(QueryType Type=AnyInBundle) const
Return true if this instruction could possibly read or modify memory.
const MachineBasicBlock * getParent() const
bool isCall(QueryType Type=AnyInBundle) const
bool getFlag(MIFlag Flag) const
Return whether an MI flag is set.
LLVM_ABI uint32_t mergeFlagsWith(const MachineInstr &Other) const
Return the MIFlags which represent both MachineInstrs.
unsigned getNumOperands() const
Retuns the total number of operands.
LLVM_ABI unsigned getNumExplicitOperands() const
Returns the number of non-implicit operands.
bool mayLoad(QueryType Type=AnyInBundle) const
Return true if this instruction could possibly read memory.
const MCInstrDesc & getDesc() const
Returns the target instruction descriptor of this MachineInstr.
LLVM_ABI bool hasUnmodeledSideEffects() const
Return true if this instruction has side effects that are not modeled by mayLoad / mayStore,...
bool registerDefIsDead(Register Reg, const TargetRegisterInfo *TRI) const
Returns true if the register is dead in this machine instruction.
bool definesRegister(Register Reg, const TargetRegisterInfo *TRI) const
Return true if the MachineInstr fully defines the specified register.
LLVM_ABI void setDesc(const MCInstrDesc &TID)
Replace the instruction descriptor (thus opcode) of the current instruction with a new one.
LLVM_ABI bool hasOrderedMemoryRef() const
Return true if this instruction may have an ordered or volatile memory reference, or if the informati...
LLVM_ABI const MachineFunction * getMF() const
Return the function that contains the basic block that this instruction belongs to.
ArrayRef< MachineMemOperand * > memoperands() const
Access to memory operands of the instruction.
LLVM_ABI bool isLoadFoldBarrier() const
Returns true if it is illegal to fold a load across this instruction.
const DebugLoc & getDebugLoc() const
Returns the debug location id of this MachineInstr.
LLVM_ABI void removeOperand(unsigned OpNo)
Erase an operand from an instruction, leaving it with one fewer operand than it started with.
LLVM_ABI void addRegisterDefined(Register Reg, const TargetRegisterInfo *RegInfo=nullptr)
We have determined MI defines a register.
const MachineOperand & getOperand(unsigned i) const
uint32_t getFlags() const
Return the MI flags bitvector.
LLVM_ABI int findRegisterDefOperandIdx(Register Reg, const TargetRegisterInfo *TRI, bool isDead=false, bool Overlap=false) const
Returns the operand index that is a def of the specified register or -1 if it is not found.
LLVM_ABI MachineInstrBundleIterator< MachineInstr > eraseFromParent()
Unlink 'this' from the containing basic block and delete it.
const std::vector< MachineJumpTableEntry > & getJumpTables() const
A description of a memory reference used in the backend.
@ MOVolatile
The memory access is volatile.
@ MOLoad
The memory access reads data.
@ MOStore
The memory access writes data.
This class contains meta information specific to a module.
LLVM_ABI MachineFunction * getMachineFunction(const Function &F) const
Returns the MachineFunction associated to IR function F if there is one, otherwise nullptr.
MachineOperand class - Representation of each machine instruction operand.
void setSubReg(unsigned subReg)
unsigned getSubReg() const
void setImm(int64_t immVal)
bool isReg() const
isReg - Tests if this is a MO_Register operand.
MachineBasicBlock * getMBB() const
void setIsDead(bool Val=true)
LLVM_ABI void setReg(Register Reg)
Change the register this operand corresponds to.
bool isImm() const
isImm - Tests if this is a MO_Immediate operand.
void setIsKill(bool Val=true)
MachineInstr * getParent()
getParent - Return the instruction that this operand belongs to.
unsigned getTargetFlags() const
static MachineOperand CreateImm(int64_t Val)
MachineOperandType getType() const
getType - Returns the MachineOperandType for this operand.
void setIsUndef(bool Val=true)
Register getReg() const
getReg - Returns the register number.
bool isFI() const
isFI - Tests if this is a MO_FrameIndex operand.
LLVM_ABI bool isIdenticalTo(const MachineOperand &Other) const
Returns true if this operand is identical to the specified operand except for liveness related flags ...
static MachineOperand CreateReg(Register Reg, bool isDef, bool isImp=false, bool isKill=false, bool isDead=false, bool isUndef=false, bool isEarlyClobber=false, unsigned SubReg=0, bool isDebug=false, bool isInternalRead=false, bool isRenamable=false)
MachineRegisterInfo - Keep track of information for virtual and physical registers,...
LLVM_ABI bool hasOneNonDBGUse(Register RegNo) const
hasOneNonDBGUse - Return true if there is exactly one non-Debug use of the specified register.
bool tracksLiveness() const
tracksLiveness - Returns true when tracking register liveness accurately.
const TargetRegisterClass * getRegClass(Register Reg) const
Return the register class of the specified virtual register.
LLVM_ABI void clearKillFlags(Register Reg) const
clearKillFlags - Iterate over all the uses of the given register and clear the kill flag from the Mac...
LLVM_ABI MachineInstr * getVRegDef(Register Reg) const
getVRegDef - Return the machine instr that defines the specified virtual register or null if none is ...
bool use_nodbg_empty(Register RegNo) const
use_nodbg_empty - Return true if there are no non-Debug instructions using the specified register.
LLVM_ABI Register createVirtualRegister(const TargetRegisterClass *RegClass, StringRef Name="")
createVirtualRegister - Create and return a new virtual register in the function with the specified r...
bool reservedRegsFrozen() const
reservedRegsFrozen - Returns true after freezeReservedRegs() was called to ensure the set of reserved...
bool def_empty(Register RegNo) const
def_empty - Return true if there are no instructions defining the specified register (it may be live-...
use_instr_nodbg_iterator use_instr_nodbg_begin(Register RegNo) const
bool hasOneDef(Register RegNo) const
Return true if there is exactly one operand defining the specified register.
const TargetRegisterClass * getRegClassOrNull(Register Reg) const
Return the register class of Reg, or null if Reg has not been assigned a register class yet.
LLVM_ABI const TargetRegisterClass * constrainRegClass(Register Reg, const TargetRegisterClass *RC, unsigned MinNumRegs=0)
constrainRegClass - Constrain the register class of the specified virtual register to be a common sub...
LLVM_ABI MachineInstr * getUniqueVRegDef(Register Reg) const
getUniqueVRegDef - Return the unique machine instr that defines the specified virtual register or nul...
A Module instance is used to store all the information related to an LLVM module.
MI-level patchpoint operands.
uint32_t getNumPatchBytes() const
Return the number of patchable bytes the given patchpoint should emit.
Wrapper class representing virtual and physical registers.
MCRegister asMCReg() const
Utility to check-convert this value to a MCRegister.
constexpr bool isValid() const
constexpr bool isVirtual() const
Return true if the specified register number is in the virtual register namespace.
static constexpr bool isVirtualRegister(unsigned Reg)
Return true if the specified register number is in the virtual register namespace.
constexpr bool isPhysical() const
Return true if the specified register number is in the physical register namespace.
Represents a location in source code.
bool erase(PtrType Ptr)
Remove pointer from the set.
std::pair< iterator, bool > insert(PtrType Ptr)
Inserts Ptr if and only if there is no element in the container equal to Ptr.
SmallPtrSet - This class implements a set which is optimized for holding SmallSize or less elements.
SmallSet - This maintains a set of unique values, optimizing for the case when the set is small (less...
SmallString - A SmallString is just a SmallVector with methods and accessors that make it work better...
void append(StringRef RHS)
Append from a StringRef.
StringRef str() const
Explicit conversion to StringRef.
This class consists of common code factored out of the SmallVector class to reduce code duplication b...
void push_back(const T &Elt)
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small.
MI-level stackmap operands.
uint32_t getNumPatchBytes() const
Return the number of patchable bytes the given stackmap should emit.
StackOffset holds a fixed and a scalable offset in bytes.
int64_t getFixed() const
Returns the fixed component of the stack.
int64_t getScalable() const
Returns the scalable component of the stack.
static StackOffset get(int64_t Fixed, int64_t Scalable)
static StackOffset getScalable(int64_t Scalable)
static StackOffset getFixed(int64_t Fixed)
MI-level Statepoint operands.
uint32_t getNumPatchBytes() const
Return the number of patchable bytes the given statepoint should emit.
Represent a constant reference to a string, i.e.
Object returned by analyzeLoopForPipelining.
TargetInstrInfo - Interface to description of machine instruction set.
virtual void genAlternativeCodeSequence(MachineInstr &Root, unsigned Pattern, SmallVectorImpl< MachineInstr * > &InsInstrs, SmallVectorImpl< MachineInstr * > &DelInstrs, DenseMap< Register, unsigned > &InstIdxForVirtReg) const
When getMachineCombinerPatterns() finds patterns, this function generates the instructions that could...
virtual std::optional< ParamLoadedValue > describeLoadedValue(const MachineInstr &MI, Register Reg) const
Produce the expression describing the MI loading a value into the physical register Reg.
virtual bool getMachineCombinerPatterns(MachineInstr &Root, SmallVectorImpl< unsigned > &Patterns, bool DoRegPressureReduce) const
Return true when there is potentially a faster code sequence for an instruction chain ending in Root.
virtual bool isSchedulingBoundary(const MachineInstr &MI, const MachineBasicBlock *MBB, const MachineFunction &MF) const
Test if the given instruction should be considered a scheduling boundary.
virtual CombinerObjective getCombinerObjective(unsigned Pattern) const
Return the objective of a combiner pattern.
virtual bool isFunctionSafeToSplit(const MachineFunction &MF) const
Return true if the function is a viable candidate for machine function splitting.
const MCAsmInfo & getMCAsmInfo() const
Return target specific asm information.
CodeModel::Model getCodeModel() const
Returns the code model.
bool contains(Register Reg) const
Return true if the specified register is included in this register class.
bool hasSubClassEq(const TargetRegisterClass *RC) const
Returns true if RC is a sub-class of or equal to this class.
bool hasSuperClassEq(const TargetRegisterClass *RC) const
Returns true if RC is a super-class of or equal to this class.
TargetRegisterInfo base class - We assume that the target defines a static array of TargetRegisterDes...
TargetSubtargetInfo - Generic base class for all target subtargets.
virtual const TargetInstrInfo * getInstrInfo() const
virtual const TargetRegisterInfo * getRegisterInfo() const =0
Return the target's register information.
Target - Wrapper for Target specific information.
static constexpr TypeSize getFixed(ScalarTy ExactSize)
static constexpr TypeSize getScalable(ScalarTy MinimumSize)
Value * getOperand(unsigned i) const
constexpr bool isScalable() const
Returns whether the quantity is scaled by a runtime quantity (vscale).
constexpr ScalarTy getKnownMinValue() const
Returns the minimum value this quantity can represent.
self_iterator getIterator()
A raw_ostream that writes to an std::string.
#define llvm_unreachable(msg)
Marks that the current location is not supposed to be reachable.
static CondCode getInvertedCondCode(CondCode Code)
@ MO_DLLIMPORT
MO_DLLIMPORT - On a symbol operand, this represents that the reference to the symbol is for an import...
@ MO_NC
MO_NC - Indicates whether the linker is expected to check the symbol reference for overflow.
@ MO_G1
MO_G1 - A symbol operand with this flag (granule 1) represents the bits 16-31 of a 64-bit address,...
@ MO_S
MO_S - Indicates that the bits of the symbol operand represented by MO_G0 etc are signed.
@ MO_PAGEOFF
MO_PAGEOFF - A symbol operand with this flag represents the offset of that symbol within a 4K page.
@ MO_GOT
MO_GOT - This flag indicates that a symbol operand represents the address of the GOT entry for the sy...
@ MO_PREL
MO_PREL - Indicates that the bits of the symbol operand represented by MO_G0 etc are PC relative.
@ MO_G0
MO_G0 - A symbol operand with this flag (granule 0) represents the bits 0-15 of a 64-bit address,...
@ MO_ARM64EC_CALLMANGLE
MO_ARM64EC_CALLMANGLE - Operand refers to the Arm64EC-mangled version of a symbol,...
@ MO_PAGE
MO_PAGE - A symbol operand with this flag represents the pc-relative offset of the 4K page containing...
@ MO_HI12
MO_HI12 - This flag indicates that a symbol operand represents the bits 13-24 of a 64-bit address,...
@ MO_TLS
MO_TLS - Indicates that the operand being accessed is some kind of thread-local symbol.
@ MO_G2
MO_G2 - A symbol operand with this flag (granule 2) represents the bits 32-47 of a 64-bit address,...
@ MO_TAGGED
MO_TAGGED - With MO_PAGE, indicates that the page includes a memory tag in bits 56-63.
@ MO_G3
MO_G3 - A symbol operand with this flag (granule 3) represents the high 16-bits of a 64-bit address,...
@ MO_COFFSTUB
MO_COFFSTUB - On a symbol operand "FOO", this indicates that the reference is actually to the "....
unsigned getCheckerSizeInBytes(AuthCheckMethod Method)
Returns the number of bytes added by checkAuthenticatedRegister.
static uint64_t decodeLogicalImmediate(uint64_t val, unsigned regSize)
decodeLogicalImmediate - Decode a logical immediate value in the form "N:immr:imms" (where the immr a...
static unsigned getShiftValue(unsigned Imm)
getShiftValue - Extract the shift value.
static unsigned getArithExtendImm(AArch64_AM::ShiftExtendType ET, unsigned Imm)
getArithExtendImm - Encode the extend type and shift amount for an arithmetic instruction: imm: 3-bit...
static unsigned getArithShiftValue(unsigned Imm)
getArithShiftValue - get the arithmetic shift value.
static uint64_t encodeLogicalImmediate(uint64_t imm, unsigned regSize)
encodeLogicalImmediate - Return the encoded immediate value for a logical immediate instruction of th...
static AArch64_AM::ShiftExtendType getExtendType(unsigned Imm)
getExtendType - Extract the extend type for operands of arithmetic ops.
static AArch64_AM::ShiftExtendType getArithExtendType(unsigned Imm)
static AArch64_AM::ShiftExtendType getShiftType(unsigned Imm)
getShiftType - Extract the shift type.
static unsigned getShifterImm(AArch64_AM::ShiftExtendType ST, unsigned Imm)
getShifterImm - Encode the shift type and amount: imm: 6-bit shift amount shifter: 000 ==> lsl 001 ==...
void expandMOVAddr(unsigned Opcode, unsigned TargetFlags, bool IsTargetMachO, SmallVectorImpl< AddrInsnModel > &Insn)
void expandMOVImm(uint64_t Imm, unsigned BitSize, SmallVectorImpl< ImmInsnModel > &Insn)
Expand a MOVi32imm or MOVi64imm pseudo instruction to one or more real move-immediate instructions to...
static const uint64_t InstrFlagIsWhile
static const uint64_t InstrFlagIsPTestLike
constexpr std::underlying_type_t< E > Mask()
Get a bitmask with 1s in all places up to the high-order bit of E's largest value.
@ C
The default llvm calling convention, compatible with C.
@ ScalablePredicateVector
initializer< Ty > init(const Ty &Val)
InstrType
Represents how an instruction should be mapped by the outliner.
NodeAddr< InstrNode * > Instr
LLVM_ABI Instruction & back() const
LLVM_ABI iterator begin() const
This is an optimization pass for GlobalISel generic memory operations.
auto drop_begin(T &&RangeOrContainer, size_t N=1)
Return a range covering RangeOrContainer with the first N elements excluded.
bool all_of(R &&range, UnaryPredicate P)
Provide wrappers to std::all_of which take ranges instead of having to pass begin/end explicitly.
static bool isCondBranchOpcode(int Opc)
MCCFIInstruction createDefCFA(const TargetRegisterInfo &TRI, unsigned FrameReg, unsigned Reg, const StackOffset &Offset, bool LastAdjustmentWasScalable=true)
static bool isPTrueOpcode(unsigned Opc)
MachineInstrBuilder BuildMI(MachineFunction &MF, const MIMetadata &MIMD, const MCInstrDesc &MCID)
Builder interface. Specify how to create the initial instruction itself.
bool succeeded(LogicalResult Result)
Utility function that returns true if the provided LogicalResult corresponds to a success value.
int isAArch64FrameOffsetLegal(const MachineInstr &MI, StackOffset &Offset, bool *OutUseUnscaledOp=nullptr, unsigned *OutUnscaledOp=nullptr, int64_t *EmittableOffset=nullptr)
Check if the Offset is a valid frame offset for MI.
constexpr bool isInt(int64_t x)
Checks if an integer fits into the given bit width.
RegState
Flags to represent properties of register accesses.
@ Implicit
Not emitted register (e.g. carry, or temporary result).
@ Kill
The last use of a register.
@ Undef
Value of the register doesn't matter.
@ Define
Register definition.
@ Renamable
Register that may be renamed.
auto enumerate(FirstRange &&First, RestRanges &&...Rest)
Given two or more input ranges, returns a new range whose values are tuples (A, B,...
constexpr RegState getKillRegState(bool B)
decltype(auto) dyn_cast(const From &Val)
dyn_cast<X> - Return the argument parameter cast to the specified type.
static bool isIndirectBranchOpcode(int Opc)
iterator_range< T > make_range(T x, T y)
Convenience function for iterating over sub-ranges.
unsigned getBLRCallOpcode(const MachineFunction &MF)
Return opcode to be used for indirect calls.
@ AArch64FrameOffsetIsLegal
Offset is legal.
@ AArch64FrameOffsetCanUpdate
Offset can apply, at least partly.
@ AArch64FrameOffsetCannotUpdate
Offset cannot apply.
constexpr bool isPowerOf2_64(uint64_t Value)
Return true if the argument is a power of two > 0 (64 bit edition.)
unsigned Log2_64(uint64_t Value)
Return the floor log base 2 of the specified value, -1 if the value is zero.
static bool isSEHInstruction(const MachineInstr &MI)
bool any_of(R &&range, UnaryPredicate P)
Provide wrappers to std::any_of which take ranges instead of having to pass begin/end explicitly.
auto reverse(ContainerTy &&C)
MachineInstr * getImm(const MachineOperand &MO, const MachineRegisterInfo *MRI)
decltype(auto) get(const PointerIntPair< PointerTy, IntBits, IntType, PtrTraits, Info > &Pair)
void sort(IteratorTy Start, IteratorTy End)
AArch64MachineCombinerPattern
@ MULSUBv2i32_indexed_OP1
@ MULADDv4i16_indexed_OP2
@ MULSUBv8i16_indexed_OP2
@ MULSUBv4i16_indexed_OP2
@ MULSUBv4i32_indexed_OP2
@ MULADDv2i32_indexed_OP1
@ MULADDv4i32_indexed_OP1
@ MULADDv2i32_indexed_OP2
@ MULSUBv4i16_indexed_OP1
@ MULADDv4i32_indexed_OP2
@ MULSUBv8i16_indexed_OP1
@ MULSUBv2i32_indexed_OP2
@ MULADDv8i16_indexed_OP1
@ MULSUBv4i32_indexed_OP1
@ MULADDv8i16_indexed_OP2
@ MULADDv4i16_indexed_OP1
LLVM_ABI raw_ostream & dbgs()
dbgs() - This returns a reference to a raw_ostream for debugging messages.
void emitFrameOffset(MachineBasicBlock &MBB, MachineBasicBlock::iterator MBBI, const DebugLoc &DL, unsigned DestReg, unsigned SrcReg, StackOffset Offset, const TargetInstrInfo *TII, MachineInstr::MIFlag=MachineInstr::NoFlags, bool SetNZCV=false, bool NeedsWinCFI=false, bool *HasWinCFI=nullptr, bool EmitCFAOffset=false, StackOffset InitialOffset={}, unsigned FrameReg=AArch64::SP)
emitFrameOffset - Emit instructions as needed to set DestReg to SrcReg plus Offset.
LLVM_ABI void report_fatal_error(Error Err, bool gen_crash_diag=true)
constexpr RegState getDefRegState(bool B)
CombinerObjective
The combiner's goal may differ based on which pattern it is attempting to optimize.
std::optional< UsedNZCV > examineCFlagsUse(MachineInstr &MI, MachineInstr &CmpInstr, const TargetRegisterInfo &TRI, SmallVectorImpl< MachineInstr * > *CCUseInstrs=nullptr)
CodeGenOptLevel
Code generation optimization level.
class LLVM_GSL_OWNER SmallVector
Forward declaration of SmallVector so that calculateSmallVectorDefaultInlinedElements can reference s...
auto instructionsWithoutDebug(IterT It, IterT End, bool SkipPseudoOp=true)
Construct a range iterator which begins at It and moves forwards until End is reached,...
LLVM_ABI raw_fd_ostream & errs()
This returns a reference to a raw_ostream for standard error.
auto drop_end(T &&RangeOrContainer, size_t N=1)
Return a range covering RangeOrContainer with the last N elements excluded.
static MCRegister getXRegFromWReg(MCRegister Reg)
MCCFIInstruction createCFAOffset(const TargetRegisterInfo &MRI, unsigned Reg, const StackOffset &OffsetFromDefCFA, std::optional< int64_t > IncomingVGOffsetFromDefCFA)
FunctionAddr VTableAddr Next
DWARFExpression::Operation Op
ArrayRef(const T &OneElt) -> ArrayRef< T >
static bool isUncondBranchOpcode(int Opc)
decltype(auto) cast(const From &Val)
cast<X> - Return the argument parameter cast to the specified type.
void erase_if(Container &C, UnaryPredicate P)
Provide a container algorithm similar to C++ Library Fundamentals v2's erase_if which is equivalent t...
constexpr bool isIntN(unsigned N, int64_t x)
Checks if an signed integer fits into the given (dynamic) bit width.
bool rewriteAArch64FrameIndex(MachineInstr &MI, unsigned FrameRegIdx, unsigned FrameReg, StackOffset &Offset, const AArch64InstrInfo *TII)
rewriteAArch64FrameIndex - Rewrite MI to access 'Offset' bytes from the FP.
bool is_contained(R &&Range, const E &Element)
Returns true if Element is found in Range.
static const MachineMemOperand::Flags MOSuppressPair
constexpr int64_t SignExtend64(uint64_t x)
Sign-extend the number in the bottom B bits of X to a 64-bit integer.
void appendLEB128(SmallVectorImpl< U > &Buffer, T Value)
bool optimizeTerminators(MachineBasicBlock *MBB, const TargetInstrInfo &TII)
std::pair< MachineOperand, DIExpression * > ParamLoadedValue
bool isNZCVTouchedInInstructionRange(const MachineInstr &DefMI, const MachineInstr &UseMI, const TargetRegisterInfo *TRI)
Return true if there is an instruction /after/ DefMI and before UseMI which either reads or clobbers ...
auto seq(T Begin, T End)
Iterate over an integral type from Begin up to - but not including - End.
static const MachineMemOperand::Flags MOStridedAccess
constexpr RegState getUndefRegState(bool B)
void fullyRecomputeLiveIns(ArrayRef< MachineBasicBlock * > MBBs)
Convenience function for recomputing live-in's for a set of MBBs until the computation converges.
LLVM_ABI Printable printReg(Register Reg, const TargetRegisterInfo *TRI=nullptr, unsigned SubIdx=0, const MachineRegisterInfo *MRI=nullptr)
Prints virtual and physical registers with or without a TRI instance.
This struct is a compact representation of a valid (non-zero power of two) alignment.
Used to describe addressing mode similar to ExtAddrMode in CodeGenPrepare.
LLVM_ABI static const MBBSectionID ColdSectionID
This class contains a discriminated union of information about pointers in memory operands,...
static LLVM_ABI MachinePointerInfo getUnknownStack(MachineFunction &MF)
Stack memory without other information.
static LLVM_ABI MachinePointerInfo getFixedStack(MachineFunction &MF, int FI, int64_t Offset=0)
Return a MachinePointerInfo record that refers to the specified FrameIndex.
An individual sequence of instructions to be replaced with a call to an outlined function.
MachineFunction * getMF() const
The information necessary to create an outlined function for some class of candidate.