67#define GET_INSTRINFO_CTOR_DTOR
68#include "AArch64GenInstrInfo.inc"
70#define DEBUG_TYPE "AArch64InstrInfo"
72STATISTIC(NumCopyInstrs,
"Number of COPY instructions expanded");
73STATISTIC(NumZCRegMoveInstrsGPR,
"Number of zero-cycle GPR register move "
74 "instructions expanded from canonical COPY");
75STATISTIC(NumZCRegMoveInstrsFPR,
"Number of zero-cycle FPR register move "
76 "instructions expanded from canonical COPY");
77STATISTIC(NumZCZeroingInstrsGPR,
"Number of zero-cycle GPR zeroing "
78 "instructions expanded from canonical COPY");
83 cl::desc(
"Restrict range of CB instructions (DEBUG)"));
87 cl::desc(
"Restrict range of TB[N]Z instructions (DEBUG)"));
91 cl::desc(
"Restrict range of CB[N]Z instructions (DEBUG)"));
95 cl::desc(
"Restrict range of Bcc instructions (DEBUG)"));
99 cl::desc(
"Restrict range of B instructions (DEBUG)"));
103 cl::desc(
"Restrict range of instructions to search for the "
104 "machine-combiner gather pattern optimization"));
109 RI(STI.getTargetTriple(), STI.getHwMode()), Subtarget(STI) {}
119 switch (
MI.getOpcode()) {
130 if (
MI.getOperand(0).getReg() != AArch64::LR)
135 if (
MI.getOperand(0).getImm() == 3 &&
MI.getOperand(1).getImm() == 7 &&
136 MI.getOperand(3).getImm() == 1)
144 bool ModifiesLR =
false;
145 bool ModifiesSP =
false;
149 if (MO.getReg() == AArch64::LR)
151 else if (MO.getReg() == AArch64::SP)
160 if (
MI.mayLoadOrStore()) {
168 if (ModifiesSP || ModifiesLR)
186 auto Op =
MI.getOpcode();
187 if (
Op == AArch64::INLINEASM ||
Op == AArch64::INLINEASM_BR)
188 return getInlineAsmLength(
MI.getOperand(0).getSymbolName(), MAI);
192 if (
MI.isMetaInstruction())
197 unsigned NumBytes = 0;
207 NumBytes =
Desc.getSize() ?
Desc.getSize() : 4;
210 if (!MFI->shouldSignReturnAddress(*MF))
213 auto Method = STI.getAuthenticatedLRCheckMethod(*MF);
221 switch (
Desc.getOpcode()) {
224 return Desc.getSize();
231 case TargetOpcode::STACKMAP:
234 assert(NumBytes % 4 == 0 &&
"Invalid number of NOP bytes requested!");
236 case TargetOpcode::PATCHPOINT:
239 assert(NumBytes % 4 == 0 &&
"Invalid number of NOP bytes requested!");
241 case TargetOpcode::STATEPOINT:
243 assert(NumBytes % 4 == 0 &&
"Invalid number of NOP bytes requested!");
248 case TargetOpcode::PATCHABLE_FUNCTION_ENTER:
253 F.getFnAttributeAsParsedInteger(
"patchable-function-entry", 9) * 4;
255 case TargetOpcode::PATCHABLE_FUNCTION_EXIT:
256 case TargetOpcode::PATCHABLE_TAIL_CALL:
257 case TargetOpcode::PATCHABLE_TYPED_EVENT_CALL:
261 case TargetOpcode::PATCHABLE_EVENT_CALL:
267 NumBytes =
MI.getOperand(1).getImm();
269 case AArch64::MOVaddr:
270 case AArch64::MOVaddrJT:
271 case AArch64::MOVaddrCP:
272 case AArch64::MOVaddrBA:
273 case AArch64::MOVaddrTLS:
274 case AArch64::MOVaddrEXT: {
278 MI.getOperand(1).getTargetFlags(),
279 Subtarget.isTargetMachO(), Insn);
280 NumBytes = Insn.
size() * 4;
284 case AArch64::MOVi32imm:
285 case AArch64::MOVi64imm: {
287 unsigned BitSize =
Desc.getOpcode() == AArch64::MOVi32imm ? 32 : 64;
290 NumBytes = Insn.
size() * 4;
294 case TargetOpcode::BUNDLE:
295 NumBytes = getInstBundleSize(
MI);
331 case AArch64::CBWPri:
332 case AArch64::CBXPri:
333 case AArch64::CBWPrr:
334 case AArch64::CBXPrr:
342 case AArch64::CBBAssertExt:
343 case AArch64::CBHAssertExt:
374 case AArch64::CBWPri:
375 case AArch64::CBXPri:
376 case AArch64::CBBAssertExt:
377 case AArch64::CBHAssertExt:
378 case AArch64::CBWPrr:
379 case AArch64::CBXPrr:
385 int64_t BrOffset)
const {
387 assert(Bits >= 3 &&
"max branch displacement must be enough to jump"
388 "over conditional branch expansion");
389 return isIntN(Bits, BrOffset / 4);
394 switch (
MI.getOpcode()) {
398 return MI.getOperand(0).getMBB();
403 return MI.getOperand(2).getMBB();
409 return MI.getOperand(1).getMBB();
410 case AArch64::CBWPri:
411 case AArch64::CBXPri:
412 case AArch64::CBBAssertExt:
413 case AArch64::CBHAssertExt:
414 case AArch64::CBWPrr:
415 case AArch64::CBXPrr:
416 return MI.getOperand(3).getMBB();
426 assert(RS &&
"RegScavenger required for long branching");
428 "new block should be inserted for expanding unconditional branch");
431 "restore block should be inserted for restoring clobbered registers");
438 "Branch offsets outside of the signed 33-bit range not supported");
449 RS->enterBasicBlockEnd(
MBB);
452 constexpr Register Reg = AArch64::X16;
453 if (!RS->isRegUsed(Reg)) {
454 insertUnconditionalBranch(
MBB, &NewDestBB,
DL);
465 Register Scavenged = RS->FindUnusedReg(&AArch64::GPR64RegClass);
466 if (Scavenged != AArch64::NoRegister) {
467 buildIndirectBranch(Scavenged, NewDestBB);
468 RS->setRegUsed(Scavenged);
477 "Unable to insert indirect branch inside function that has red zone");
500 bool AllowModify)
const {
507 if (
I->getOpcode() == AArch64::SpeculationBarrierISBDSBEndBB ||
508 I->getOpcode() == AArch64::SpeculationBarrierSBEndBB) {
512 if (!isUnpredicatedTerminator(*
I))
519 unsigned LastOpc = LastInst->
getOpcode();
520 if (
I ==
MBB.begin() || !isUnpredicatedTerminator(*--
I)) {
535 unsigned SecondLastOpc = SecondLastInst->
getOpcode();
542 LastInst = SecondLastInst;
544 if (
I ==
MBB.begin() || !isUnpredicatedTerminator(*--
I)) {
549 SecondLastInst = &*
I;
550 SecondLastOpc = SecondLastInst->
getOpcode();
561 LastInst = SecondLastInst;
563 if (
I ==
MBB.begin() || !isUnpredicatedTerminator(*--
I)) {
565 "unreachable unconditional branches removed above");
574 SecondLastInst = &*
I;
575 SecondLastOpc = SecondLastInst->
getOpcode();
579 if (SecondLastInst &&
I !=
MBB.begin() && isUnpredicatedTerminator(*--
I))
595 I->eraseFromParent();
604 I->eraseFromParent();
613 MachineBranchPredicate &MBP,
614 bool AllowModify)
const {
626 assert(MBP.TrueDest &&
"expected!");
627 MBP.FalseDest = FBB ? FBB :
MBB.getNextNode();
629 MBP.ConditionDef =
nullptr;
630 MBP.SingleUseCondition =
false;
640 if (
I ==
MBB.begin())
656 if (
MI.modifiesRegister(AArch64::NZCV,
nullptr)) {
657 MBP.ConditionDef = &
MI;
666 case AArch64::CBNZX: {
670 MBP.Predicate = (
Opc == AArch64::CBNZX ||
Opc == AArch64::CBNZW)
671 ? MachineBranchPredicate::PRED_NE
672 : MachineBranchPredicate::PRED_EQ;
673 Register CondReg = MBP.LHS.getReg();
682 case AArch64::TBNZX: {
703 Cond[1].setImm(AArch64::CBNZW);
706 Cond[1].setImm(AArch64::CBZW);
709 Cond[1].setImm(AArch64::CBNZX);
712 Cond[1].setImm(AArch64::CBZX);
715 Cond[1].setImm(AArch64::TBNZW);
718 Cond[1].setImm(AArch64::TBZW);
721 Cond[1].setImm(AArch64::TBNZX);
724 Cond[1].setImm(AArch64::TBZX);
728 case AArch64::CBWPri:
729 case AArch64::CBXPri:
730 case AArch64::CBBAssertExt:
731 case AArch64::CBHAssertExt:
732 case AArch64::CBWPrr:
733 case AArch64::CBXPrr: {
746 int *BytesRemoved)
const {
756 I->eraseFromParent();
760 if (
I ==
MBB.begin()) {
773 I->eraseFromParent();
780void AArch64InstrInfo::instantiateCondBranch(
805 if (
Cond.size() > 5) {
816 assert(
TBB &&
"insertBranch must not be told to insert a fallthrough");
843 unsigned Opc =
MI.getOpcode();
850 if (
MI.getOperand(0).getReg() == AArch64::WZR ||
851 MI.getOperand(0).getReg() == AArch64::XZR) {
853 dbgs() <<
"Removing always taken branch: " <<
MI);
856 for (
auto *S : Succs)
858 MBB->removeSuccessor(S);
860 while (
MBB->rbegin() != &
MI)
861 MBB->rbegin()->eraseFromParent();
862 MI.eraseFromParent();
872 if (
MI.getOperand(0).getReg() == AArch64::WZR ||
873 MI.getOperand(0).getReg() == AArch64::XZR) {
875 dbgs() <<
"Removing never taken branch: " <<
MI);
877 MI.getParent()->removeSuccessor(
Target);
878 MI.eraseFromParent();
891 if (!
DefMI->isFullCopy())
893 VReg =
DefMI->getOperand(1).getReg();
902 unsigned *NewReg =
nullptr) {
907 bool Is64Bit = AArch64::GPR64allRegClass.hasSubClassEq(MRI.
getRegClass(VReg));
911 switch (
DefMI->getOpcode()) {
912 case AArch64::SUBREG_TO_REG:
916 if (!
DefMI->getOperand(1).isReg())
918 if (!
DefMI->getOperand(2).isImm() ||
919 DefMI->getOperand(2).getImm() != AArch64::sub_32)
922 if (
DefMI->getOpcode() != AArch64::MOVi32imm)
924 if (!
DefMI->getOperand(1).isImm() ||
DefMI->getOperand(1).getImm() != 1)
927 SrcReg = AArch64::XZR;
928 Opc = AArch64::CSINCXr;
931 case AArch64::MOVi32imm:
932 case AArch64::MOVi64imm:
933 if (!
DefMI->getOperand(1).isImm() ||
DefMI->getOperand(1).getImm() != 1)
935 SrcReg = Is64Bit ? AArch64::XZR : AArch64::WZR;
936 Opc = Is64Bit ? AArch64::CSINCXr : AArch64::CSINCWr;
939 case AArch64::ADDSXri:
940 case AArch64::ADDSWri:
942 if (
DefMI->findRegisterDefOperandIdx(AArch64::NZCV,
nullptr,
947 case AArch64::ADDXri:
948 case AArch64::ADDWri:
950 if (!
DefMI->getOperand(2).isImm() ||
DefMI->getOperand(2).getImm() != 1 ||
951 DefMI->getOperand(3).getImm() != 0)
953 SrcReg =
DefMI->getOperand(1).getReg();
954 Opc = Is64Bit ? AArch64::CSINCXr : AArch64::CSINCWr;
957 case AArch64::ORNXrr:
958 case AArch64::ORNWrr: {
961 if (ZReg != AArch64::XZR && ZReg != AArch64::WZR)
963 SrcReg =
DefMI->getOperand(2).getReg();
964 Opc = Is64Bit ? AArch64::CSINVXr : AArch64::CSINVWr;
968 case AArch64::SUBSXrr:
969 case AArch64::SUBSWrr:
971 if (
DefMI->findRegisterDefOperandIdx(AArch64::NZCV,
nullptr,
976 case AArch64::SUBXrr:
977 case AArch64::SUBWrr: {
980 if (ZReg != AArch64::XZR && ZReg != AArch64::WZR)
982 SrcReg =
DefMI->getOperand(2).getReg();
983 Opc = Is64Bit ? AArch64::CSNEGXr : AArch64::CSNEGWr;
989 assert(
Opc && SrcReg &&
"Missing parameters");
1001 int &FalseCycles)
const {
1012 if (!RI.getCommonSubClass(RC, MRI.
getRegClass(DstReg)))
1016 unsigned ExtraCondLat =
Cond.size() != 1;
1020 if (AArch64::GPR64allRegClass.hasSubClassEq(RC) ||
1021 AArch64::GPR32allRegClass.hasSubClassEq(RC)) {
1023 CondCycles = 1 + ExtraCondLat;
1024 TrueCycles = FalseCycles = 1;
1034 if (AArch64::FPR64RegClass.hasSubClassEq(RC) ||
1035 AArch64::FPR32RegClass.hasSubClassEq(RC)) {
1036 CondCycles = 5 + ExtraCondLat;
1037 TrueCycles = FalseCycles = 2;
1054 switch (
Cond.size()) {
1074 case AArch64::CBNZW:
1078 case AArch64::CBNZX:
1109 case AArch64::TBNZW:
1110 case AArch64::TBNZX:
1132 unsigned SubsOpc, SubsDestReg;
1138 case AArch64::CBWPri:
1139 SubsOpc = AArch64::SUBSWri;
1140 SubsDestReg = AArch64::WZR;
1143 case AArch64::CBXPri:
1144 SubsOpc = AArch64::SUBSXri;
1145 SubsDestReg = AArch64::XZR;
1148 case AArch64::CBWPrr:
1149 SubsOpc = AArch64::SUBSWrr;
1150 SubsDestReg = AArch64::WZR;
1153 case AArch64::CBXPrr:
1154 SubsOpc = AArch64::SUBSXrr;
1155 SubsDestReg = AArch64::XZR;
1184 switch (ExtendType) {
1190 "Unexpected compare-and-branch instruction for SXTB shift-extend");
1191 ExtOpc = AArch64::SBFMWri;
1197 "Unexpected compare-and-branch instruction for SXTH shift-extend");
1198 ExtOpc = AArch64::SBFMWri;
1204 "Unexpected compare-and-branch instruction for UXTB shift-extend");
1205 ExtOpc = AArch64::ANDWri;
1211 "Unexpected compare-and-branch instruction for UXTH shift-extend");
1212 ExtOpc = AArch64::ANDWri;
1221 if (ExtOpc != AArch64::ANDWri)
1223 MBBI.addImm(ExtBits);
1251 bool TryFold =
false;
1253 RC = &AArch64::GPR64RegClass;
1254 Opc = AArch64::CSELXr;
1257 RC = &AArch64::GPR32RegClass;
1258 Opc = AArch64::CSELWr;
1261 RC = &AArch64::FPR64RegClass;
1262 Opc = AArch64::FCSELDrrr;
1264 RC = &AArch64::FPR32RegClass;
1265 Opc = AArch64::FCSELSrrr;
1267 assert(RC &&
"Unsupported regclass");
1271 unsigned NewReg = 0;
1294 (FalseReg.
isVirtual() || FalseReg == AArch64::WZR ||
1295 FalseReg == AArch64::XZR) &&
1296 "FalseReg was folded into a non-virtual register other than WZR or XZR");
1313 assert(BitSize == 64 &&
"Only bit sizes of 32 or 64 allowed");
1318 return Is.
size() <= 2;
1323 assert(
MI.isCopy() &&
"Expected COPY instruction");
1329 if (
Reg.isVirtual())
1331 if (
Reg.isPhysical())
1332 return RI.getMinimalPhysRegClass(
Reg);
1337 if (DstRC && SrcRC && !RI.getCommonSubClass(DstRC, SrcRC))
1340 return MI.isAsCheapAsAMove();
1346 if (Subtarget.hasExynosCheapAsMoveHandling()) {
1347 if (isExynosCheapAsMove(
MI))
1349 return MI.isAsCheapAsAMove();
1352 switch (
MI.getOpcode()) {
1354 return MI.isAsCheapAsAMove();
1356 case TargetOpcode::COPY:
1359 case AArch64::ADDWrs:
1360 case AArch64::ADDXrs:
1361 case AArch64::SUBWrs:
1362 case AArch64::SUBXrs:
1363 return Subtarget.hasALULSLFast() &&
MI.getOperand(3).getImm() <= 4;
1368 case AArch64::MOVi32imm:
1370 case AArch64::MOVi64imm:
1375bool AArch64InstrInfo::isFalkorShiftExtFast(
const MachineInstr &
MI) {
1376 switch (
MI.getOpcode()) {
1380 case AArch64::ADDWrs:
1381 case AArch64::ADDXrs:
1382 case AArch64::ADDSWrs:
1383 case AArch64::ADDSXrs: {
1384 unsigned Imm =
MI.getOperand(3).getImm();
1391 case AArch64::ADDWrx:
1392 case AArch64::ADDXrx:
1393 case AArch64::ADDXrx64:
1394 case AArch64::ADDSWrx:
1395 case AArch64::ADDSXrx:
1396 case AArch64::ADDSXrx64: {
1397 unsigned Imm =
MI.getOperand(3).getImm();
1409 case AArch64::SUBWrs:
1410 case AArch64::SUBSWrs: {
1411 unsigned Imm =
MI.getOperand(3).getImm();
1413 return ShiftVal == 0 ||
1417 case AArch64::SUBXrs:
1418 case AArch64::SUBSXrs: {
1419 unsigned Imm =
MI.getOperand(3).getImm();
1421 return ShiftVal == 0 ||
1425 case AArch64::SUBWrx:
1426 case AArch64::SUBXrx:
1427 case AArch64::SUBXrx64:
1428 case AArch64::SUBSWrx:
1429 case AArch64::SUBSXrx:
1430 case AArch64::SUBSXrx64: {
1431 unsigned Imm =
MI.getOperand(3).getImm();
1443 case AArch64::LDRBBroW:
1444 case AArch64::LDRBBroX:
1445 case AArch64::LDRBroW:
1446 case AArch64::LDRBroX:
1447 case AArch64::LDRDroW:
1448 case AArch64::LDRDroX:
1449 case AArch64::LDRHHroW:
1450 case AArch64::LDRHHroX:
1451 case AArch64::LDRHroW:
1452 case AArch64::LDRHroX:
1453 case AArch64::LDRQroW:
1454 case AArch64::LDRQroX:
1455 case AArch64::LDRSBWroW:
1456 case AArch64::LDRSBWroX:
1457 case AArch64::LDRSBXroW:
1458 case AArch64::LDRSBXroX:
1459 case AArch64::LDRSHWroW:
1460 case AArch64::LDRSHWroX:
1461 case AArch64::LDRSHXroW:
1462 case AArch64::LDRSHXroX:
1463 case AArch64::LDRSWroW:
1464 case AArch64::LDRSWroX:
1465 case AArch64::LDRSroW:
1466 case AArch64::LDRSroX:
1467 case AArch64::LDRWroW:
1468 case AArch64::LDRWroX:
1469 case AArch64::LDRXroW:
1470 case AArch64::LDRXroX:
1471 case AArch64::PRFMroW:
1472 case AArch64::PRFMroX:
1473 case AArch64::STRBBroW:
1474 case AArch64::STRBBroX:
1475 case AArch64::STRBroW:
1476 case AArch64::STRBroX:
1477 case AArch64::STRDroW:
1478 case AArch64::STRDroX:
1479 case AArch64::STRHHroW:
1480 case AArch64::STRHHroX:
1481 case AArch64::STRHroW:
1482 case AArch64::STRHroX:
1483 case AArch64::STRQroW:
1484 case AArch64::STRQroX:
1485 case AArch64::STRSroW:
1486 case AArch64::STRSroX:
1487 case AArch64::STRWroW:
1488 case AArch64::STRWroX:
1489 case AArch64::STRXroW:
1490 case AArch64::STRXroX: {
1491 unsigned IsSigned =
MI.getOperand(3).getImm();
1498 unsigned Opc =
MI.getOpcode();
1502 case AArch64::SEH_StackAlloc:
1503 case AArch64::SEH_SaveFPLR:
1504 case AArch64::SEH_SaveFPLR_X:
1505 case AArch64::SEH_SaveReg:
1506 case AArch64::SEH_SaveReg_X:
1507 case AArch64::SEH_SaveRegP:
1508 case AArch64::SEH_SaveRegP_X:
1509 case AArch64::SEH_SaveFReg:
1510 case AArch64::SEH_SaveFReg_X:
1511 case AArch64::SEH_SaveFRegP:
1512 case AArch64::SEH_SaveFRegP_X:
1513 case AArch64::SEH_SetFP:
1514 case AArch64::SEH_AddFP:
1515 case AArch64::SEH_Nop:
1516 case AArch64::SEH_PrologEnd:
1517 case AArch64::SEH_EpilogStart:
1518 case AArch64::SEH_EpilogEnd:
1519 case AArch64::SEH_PACSignLR:
1520 case AArch64::SEH_SaveAnyRegI:
1521 case AArch64::SEH_SaveAnyRegIP:
1522 case AArch64::SEH_SaveAnyRegQP:
1523 case AArch64::SEH_SaveAnyRegQPX:
1524 case AArch64::SEH_AllocZ:
1525 case AArch64::SEH_SaveZReg:
1526 case AArch64::SEH_SavePReg:
1533 unsigned &SubIdx)
const {
1534 switch (
MI.getOpcode()) {
1537 case AArch64::SBFMXri:
1538 case AArch64::UBFMXri:
1541 if (
MI.getOperand(2).getImm() != 0 ||
MI.getOperand(3).getImm() != 31)
1544 SrcReg =
MI.getOperand(1).getReg();
1545 DstReg =
MI.getOperand(0).getReg();
1546 SubIdx = AArch64::sub_32;
1555 int64_t OffsetA = 0, OffsetB = 0;
1556 TypeSize WidthA(0,
false), WidthB(0,
false);
1557 bool OffsetAIsScalable =
false, OffsetBIsScalable =
false;
1578 OffsetAIsScalable == OffsetBIsScalable) {
1579 int LowOffset = OffsetA < OffsetB ? OffsetA : OffsetB;
1580 int HighOffset = OffsetA < OffsetB ? OffsetB : OffsetA;
1581 TypeSize LowWidth = (LowOffset == OffsetA) ? WidthA : WidthB;
1582 if (LowWidth.
isScalable() == OffsetAIsScalable &&
1600 switch (
MI.getOpcode()) {
1603 if (
MI.getOperand(0).getImm() == 0x14)
1610 case AArch64::MSRpstatesvcrImm1:
1617 auto Next = std::next(
MI.getIterator());
1618 return Next !=
MBB->end() &&
Next->isCFIInstruction();
1625 Register &SrcReg2, int64_t &CmpMask,
1626 int64_t &CmpValue)
const {
1630 assert(
MI.getNumOperands() >= 2 &&
"All AArch64 cmps should have 2 operands");
1631 if (!
MI.getOperand(1).isReg() ||
MI.getOperand(1).getSubReg())
1634 switch (
MI.getOpcode()) {
1637 case AArch64::PTEST_PP:
1638 case AArch64::PTEST_PP_ANY:
1639 case AArch64::PTEST_PP_FIRST:
1640 SrcReg =
MI.getOperand(0).getReg();
1641 SrcReg2 =
MI.getOperand(1).getReg();
1642 if (
MI.getOperand(2).getSubReg())
1649 case AArch64::SUBSWrr:
1650 case AArch64::SUBSWrs:
1651 case AArch64::SUBSWrx:
1652 case AArch64::SUBSXrr:
1653 case AArch64::SUBSXrs:
1654 case AArch64::SUBSXrx:
1655 case AArch64::ADDSWrr:
1656 case AArch64::ADDSWrs:
1657 case AArch64::ADDSWrx:
1658 case AArch64::ADDSXrr:
1659 case AArch64::ADDSXrs:
1660 case AArch64::ADDSXrx:
1662 SrcReg =
MI.getOperand(1).getReg();
1663 SrcReg2 =
MI.getOperand(2).getReg();
1666 if (
MI.getOperand(2).getSubReg())
1672 case AArch64::SUBSWri:
1673 case AArch64::ADDSWri:
1674 case AArch64::SUBSXri:
1675 case AArch64::ADDSXri:
1676 SrcReg =
MI.getOperand(1).getReg();
1679 CmpValue =
MI.getOperand(2).getImm();
1681 case AArch64::ANDSWri:
1682 case AArch64::ANDSXri:
1685 SrcReg =
MI.getOperand(1).getReg();
1689 MI.getOperand(2).getImm(),
1690 MI.getOpcode() == AArch64::ANDSWri ? 32 : 64);
1699 assert(
MBB &&
"Can't get MachineBasicBlock here");
1701 assert(MF &&
"Can't get MachineFunction here");
1706 for (
unsigned OpIdx = 0, EndIdx = Instr.getNumOperands();
OpIdx < EndIdx;
1713 if (!OpRegCstraints)
1721 "Operand has register constraints without being a register!");
1724 if (
Reg.isPhysical()) {
1741 bool MIDefinesZeroReg =
false;
1742 if (
MI.definesRegister(AArch64::WZR,
nullptr) ||
1743 MI.definesRegister(AArch64::XZR,
nullptr))
1744 MIDefinesZeroReg =
true;
1746 switch (
MI.getOpcode()) {
1748 return MI.getOpcode();
1749 case AArch64::ADDSWrr:
1750 return AArch64::ADDWrr;
1751 case AArch64::ADDSWri:
1752 return MIDefinesZeroReg ? AArch64::ADDSWri : AArch64::ADDWri;
1753 case AArch64::ADDSWrs:
1754 return MIDefinesZeroReg ? AArch64::ADDSWrs : AArch64::ADDWrs;
1755 case AArch64::ADDSWrx:
1756 return AArch64::ADDWrx;
1757 case AArch64::ADDSXrr:
1758 return AArch64::ADDXrr;
1759 case AArch64::ADDSXri:
1760 return MIDefinesZeroReg ? AArch64::ADDSXri : AArch64::ADDXri;
1761 case AArch64::ADDSXrs:
1762 return MIDefinesZeroReg ? AArch64::ADDSXrs : AArch64::ADDXrs;
1763 case AArch64::ADDSXrx:
1764 return AArch64::ADDXrx;
1765 case AArch64::SUBSWrr:
1766 return AArch64::SUBWrr;
1767 case AArch64::SUBSWri:
1768 return MIDefinesZeroReg ? AArch64::SUBSWri : AArch64::SUBWri;
1769 case AArch64::SUBSWrs:
1770 return MIDefinesZeroReg ? AArch64::SUBSWrs : AArch64::SUBWrs;
1771 case AArch64::SUBSWrx:
1772 return AArch64::SUBWrx;
1773 case AArch64::SUBSXrr:
1774 return AArch64::SUBXrr;
1775 case AArch64::SUBSXri:
1776 return MIDefinesZeroReg ? AArch64::SUBSXri : AArch64::SUBXri;
1777 case AArch64::SUBSXrs:
1778 return MIDefinesZeroReg ? AArch64::SUBSXrs : AArch64::SUBXrs;
1779 case AArch64::SUBSXrx:
1780 return AArch64::SUBXrx;
1795 if (To == To->getParent()->begin())
1800 if (To->getParent() != From->getParent())
1812 Instr.modifiesRegister(AArch64::NZCV,
TRI)) ||
1813 ((AccessToCheck &
AK_Read) && Instr.readsRegister(AArch64::NZCV,
TRI)))
1819std::optional<unsigned>
1823 unsigned MaskOpcode =
Mask->getOpcode();
1824 unsigned PredOpcode = Pred->
getOpcode();
1825 bool PredIsPTestLike = isPTestLikeOpcode(PredOpcode);
1826 bool PredIsWhileLike = isWhileOpcode(PredOpcode);
1828 if (PredIsWhileLike) {
1832 if ((Mask == Pred) && PTest->
getOpcode() == AArch64::PTEST_PP_ANY)
1839 getElementSizeForOpcode(MaskOpcode) ==
1840 getElementSizeForOpcode(PredOpcode))
1846 if (PTest->
getOpcode() == AArch64::PTEST_PP_FIRST &&
1853 if (PredIsPTestLike) {
1858 if ((Mask == Pred) && PTest->
getOpcode() == AArch64::PTEST_PP_ANY)
1866 if (Mask != PTestLikeMask && PTestLikeMask->isFullCopy() &&
1867 PTestLikeMask->getOperand(1).getReg().isVirtual())
1875 getElementSizeForOpcode(MaskOpcode) ==
1876 getElementSizeForOpcode(PredOpcode)) {
1877 if (Mask == PTestLikeMask || PTest->
getOpcode() == AArch64::PTEST_PP_ANY)
1903 uint64_t PredElementSize = getElementSizeForOpcode(PredOpcode);
1905 PTest->
getOpcode() == AArch64::PTEST_PP_ANY))
1913 switch (PredOpcode) {
1914 case AArch64::AND_PPzPP:
1915 case AArch64::BIC_PPzPP:
1916 case AArch64::EOR_PPzPP:
1917 case AArch64::NAND_PPzPP:
1918 case AArch64::NOR_PPzPP:
1919 case AArch64::ORN_PPzPP:
1920 case AArch64::ORR_PPzPP:
1921 case AArch64::BRKA_PPzP:
1922 case AArch64::BRKPA_PPzPP:
1923 case AArch64::BRKB_PPzP:
1924 case AArch64::BRKPB_PPzPP:
1925 case AArch64::RDFFR_PPz: {
1929 if (Mask != PredMask)
1933 case AArch64::BRKN_PPzP: {
1937 if ((MaskOpcode != AArch64::PTRUE_B) ||
1938 (
Mask->getOperand(1).getImm() != 31))
1942 case AArch64::PTRUE_B:
1955bool AArch64InstrInfo::optimizePTestInstr(
1956 MachineInstr *PTest,
unsigned MaskReg,
unsigned PredReg,
1961 if (Pred->
isCopy() && PTest->
getOpcode() == AArch64::PTEST_PP_FIRST) {
1965 if (
Op.isReg() &&
Op.getReg().isVirtual() &&
1966 Op.getSubReg() == AArch64::psub0)
1970 unsigned PredOpcode = Pred->
getOpcode();
1971 auto NewOp = canRemovePTestInstr(PTest, Mask, Pred, MRI);
1987 if (*NewOp != PredOpcode) {
1998 for (; i !=
e; ++i) {
2029 if (DeadNZCVIdx != -1) {
2048 if (CmpInstr.
getOpcode() == AArch64::PTEST_PP ||
2049 CmpInstr.
getOpcode() == AArch64::PTEST_PP_ANY ||
2050 CmpInstr.
getOpcode() == AArch64::PTEST_PP_FIRST)
2051 return optimizePTestInstr(&CmpInstr, SrcReg, SrcReg2, MRI);
2060 if (CmpValue == 0 && substituteCmpToZero(CmpInstr, SrcReg, *MRI))
2062 return (CmpValue == 0 || CmpValue == 1) &&
2063 removeCmpToZeroOrOne(CmpInstr, SrcReg, CmpValue, *MRI);
2071 switch (Instr.getOpcode()) {
2073 return AArch64::INSTRUCTION_LIST_END;
2075 case AArch64::ADDSWrr:
2076 case AArch64::ADDSWri:
2077 case AArch64::ADDSXrr:
2078 case AArch64::ADDSXri:
2079 case AArch64::ADDSWrx:
2080 case AArch64::ADDSXrx:
2081 case AArch64::ADDSWrs:
2082 case AArch64::ADDSXrs:
2083 case AArch64::SUBSWrr:
2084 case AArch64::SUBSWri:
2085 case AArch64::SUBSWrx:
2086 case AArch64::SUBSWrs:
2087 case AArch64::SUBSXrr:
2088 case AArch64::SUBSXri:
2089 case AArch64::SUBSXrx:
2090 case AArch64::SUBSXrs:
2091 case AArch64::ANDSWri:
2092 case AArch64::ANDSWrr:
2093 case AArch64::ANDSWrs:
2094 case AArch64::ANDSXri:
2095 case AArch64::ANDSXrr:
2096 case AArch64::ANDSXrs:
2097 case AArch64::BICSWrr:
2098 case AArch64::BICSXrr:
2099 case AArch64::BICSWrs:
2100 case AArch64::BICSXrs:
2101 case AArch64::ADCSWr:
2102 case AArch64::ADCSXr:
2103 case AArch64::SBCSWr:
2104 case AArch64::SBCSXr:
2105 return Instr.getOpcode();
2107 case AArch64::ADDWrr:
2108 return AArch64::ADDSWrr;
2109 case AArch64::ADDWri:
2110 return AArch64::ADDSWri;
2111 case AArch64::ADDXrr:
2112 return AArch64::ADDSXrr;
2113 case AArch64::ADDXri:
2114 return AArch64::ADDSXri;
2115 case AArch64::ADDWrx:
2116 return AArch64::ADDSWrx;
2117 case AArch64::ADDXrx:
2118 return AArch64::ADDSXrx;
2119 case AArch64::ADDWrs:
2120 return AArch64::ADDSWrs;
2121 case AArch64::ADDXrs:
2122 return AArch64::ADDSXrs;
2123 case AArch64::ADCWr:
2124 return AArch64::ADCSWr;
2125 case AArch64::ADCXr:
2126 return AArch64::ADCSXr;
2127 case AArch64::SUBWrr:
2128 return AArch64::SUBSWrr;
2129 case AArch64::SUBWri:
2130 return AArch64::SUBSWri;
2131 case AArch64::SUBXrr:
2132 return AArch64::SUBSXrr;
2133 case AArch64::SUBXri:
2134 return AArch64::SUBSXri;
2135 case AArch64::SUBWrx:
2136 return AArch64::SUBSWrx;
2137 case AArch64::SUBXrx:
2138 return AArch64::SUBSXrx;
2139 case AArch64::SUBWrs:
2140 return AArch64::SUBSWrs;
2141 case AArch64::SUBXrs:
2142 return AArch64::SUBSXrs;
2143 case AArch64::SBCWr:
2144 return AArch64::SBCSWr;
2145 case AArch64::SBCXr:
2146 return AArch64::SBCSXr;
2147 case AArch64::ANDWri:
2148 return AArch64::ANDSWri;
2149 case AArch64::ANDXri:
2150 return AArch64::ANDSXri;
2151 case AArch64::ANDWrr:
2152 return AArch64::ANDSWrr;
2153 case AArch64::ANDWrs:
2154 return AArch64::ANDSWrs;
2155 case AArch64::ANDXrr:
2156 return AArch64::ANDSXrr;
2157 case AArch64::ANDXrs:
2158 return AArch64::ANDSXrs;
2159 case AArch64::BICWrr:
2160 return AArch64::BICSWrr;
2161 case AArch64::BICXrr:
2162 return AArch64::BICSXrr;
2163 case AArch64::BICWrs:
2164 return AArch64::BICSWrs;
2165 case AArch64::BICXrs:
2166 return AArch64::BICSXrs;
2172 for (
auto *BB :
MBB->successors())
2173 if (BB->isLiveIn(AArch64::NZCV))
2180int AArch64InstrInfo::findCondCodeUseOperandIdxForBranchOrSelect(
2182 switch (
Instr.getOpcode()) {
2186 case AArch64::Bcc: {
2187 int Idx =
Instr.findRegisterUseOperandIdx(AArch64::NZCV,
nullptr);
2192 case AArch64::CSINVWr:
2193 case AArch64::CSINVXr:
2194 case AArch64::CSINCWr:
2195 case AArch64::CSINCXr:
2196 case AArch64::CSELWr:
2197 case AArch64::CSELXr:
2198 case AArch64::CSNEGWr:
2199 case AArch64::CSNEGXr:
2200 case AArch64::FCSELSrrr:
2201 case AArch64::FCSELDrrr: {
2202 int Idx =
Instr.findRegisterUseOperandIdx(AArch64::NZCV,
nullptr);
2214 AArch64InstrInfo::findCondCodeUseOperandIdxForBranchOrSelect(Instr);
2216 Instr.getOperand(CCIdx).
getImm())
2269std::optional<UsedNZCV>
2274 if (
MI.getParent() != CmpParent)
2275 return std::nullopt;
2278 return std::nullopt;
2283 if (Instr.readsRegister(AArch64::NZCV, &
TRI)) {
2286 return std::nullopt;
2291 if (Instr.modifiesRegister(AArch64::NZCV, &
TRI))
2294 return NZCVUsedAfterCmp;
2298 return Opcode == AArch64::ADDSWri || Opcode == AArch64::ADDSXri;
2302 return Opcode == AArch64::SUBSWri || Opcode == AArch64::SUBSXri;
2308 case AArch64::ANDSWri:
2309 case AArch64::ANDSWrr:
2310 case AArch64::ANDSWrs:
2311 case AArch64::ANDSXri:
2312 case AArch64::ANDSXrr:
2313 case AArch64::ANDSXrs:
2314 case AArch64::BICSWrr:
2315 case AArch64::BICSXrr:
2316 case AArch64::BICSWrs:
2317 case AArch64::BICSXrs:
2343 const unsigned CmpOpcode = CmpInstr.
getOpcode();
2349 "Caller guarantees that CmpInstr compares with constant 0");
2352 if (!NZVCUsed || NZVCUsed->C)
2373bool AArch64InstrInfo::substituteCmpToZero(
2384 if (NewOpc == AArch64::INSTRUCTION_LIST_END)
2391 MI->setDesc(
get(NewOpc));
2396 MI->addRegisterDefined(AArch64::NZCV, &
TRI);
2408 assert((CmpValue == 0 || CmpValue == 1) &&
2409 "Only comparisons to 0 or 1 considered for removal!");
2412 unsigned MIOpc =
MI.getOpcode();
2413 if (MIOpc == AArch64::CSINCWr) {
2414 if (
MI.getOperand(1).getReg() != AArch64::WZR ||
2415 MI.getOperand(2).getReg() != AArch64::WZR)
2417 }
else if (MIOpc == AArch64::CSINCXr) {
2418 if (
MI.getOperand(1).getReg() != AArch64::XZR ||
2419 MI.getOperand(2).getReg() != AArch64::XZR)
2429 if (
MI.findRegisterDefOperandIdx(AArch64::NZCV,
nullptr,
true) != -1)
2433 const unsigned CmpOpcode = CmpInstr.
getOpcode();
2435 if (CmpValue && !IsSubsRegImm)
2437 if (!CmpValue && !IsSubsRegImm && !
isADDSRegImm(CmpOpcode))
2442 if (MIUsedNZCV.
C || MIUsedNZCV.
V)
2445 std::optional<UsedNZCV> NZCVUsedAfterCmp =
2449 if (!NZCVUsedAfterCmp || NZCVUsedAfterCmp->C || NZCVUsedAfterCmp->V)
2452 if ((MIUsedNZCV.
Z && NZCVUsedAfterCmp->N) ||
2453 (MIUsedNZCV.
N && NZCVUsedAfterCmp->Z))
2456 if (MIUsedNZCV.
N && !CmpValue)
2498bool AArch64InstrInfo::removeCmpToZeroOrOne(
2505 SmallVector<MachineInstr *, 4> CCUseInstrs;
2506 bool IsInvertCC =
false;
2514 for (MachineInstr *CCUseInstr : CCUseInstrs) {
2515 int Idx = findCondCodeUseOperandIdxForBranchOrSelect(*CCUseInstr);
2516 assert(Idx >= 0 &&
"Unexpected instruction using CC.");
2517 MachineOperand &CCOperand = CCUseInstr->getOperand(Idx);
2526bool AArch64InstrInfo::expandPostRAPseudo(
MachineInstr &
MI)
const {
2527 if (
MI.getOpcode() != TargetOpcode::LOAD_STACK_GUARD &&
2528 MI.getOpcode() != AArch64::CATCHRET &&
2529 MI.getOpcode() != AArch64::STACK_GUARD_UNMIX)
2532 MachineBasicBlock &
MBB = *
MI.getParent();
2534 auto TRI = Subtarget.getRegisterInfo();
2537 if (
MI.getOpcode() == AArch64::STACK_GUARD_UNMIX) {
2551 if (
MI.getOpcode() == AArch64::CATCHRET) {
2553 const TargetInstrInfo *
TII =
2555 MachineBasicBlock *TargetMBB =
MI.getOperand(0).getMBB();
2560 FirstEpilogSEH = std::prev(FirstEpilogSEH);
2562 FirstEpilogSEH = std::next(FirstEpilogSEH);
2577 if (
M.getStackProtectorGuard() ==
"sysreg") {
2578 const AArch64SysReg::SysReg *SrcReg =
2579 AArch64SysReg::lookupSysRegByName(
M.getStackProtectorGuardReg());
2587 int Offset =
M.getStackProtectorGuardOffset();
2638 const GlobalValue *GV =
2641 unsigned OpFlags = Subtarget.ClassifyGlobalReference(GV, TM);
2644 unsigned GuardWidth =
M.getStackProtectorGuardValueWidth().value_or(
2645 Subtarget.isTargetILP32() ? 4 : 8);
2646 if (GuardWidth != 4 && GuardWidth != 8)
2651 if (GuardWidth == 4) {
2652 unsigned Reg32 =
TRI->getSubReg(
Reg, AArch64::sub_32);
2666 if (GuardWidth == 4)
2692 if (GuardWidth == 4) {
2693 unsigned Reg32 =
TRI->getSubReg(
Reg, AArch64::sub_32);
2711 if (Subtarget.getTargetTriple().isOSMSVCRT())
2724 switch (
MI.getOpcode()) {
2727 case AArch64::MOVZWi:
2728 case AArch64::MOVZXi:
2729 if (
MI.getOperand(1).isImm() &&
MI.getOperand(1).getImm() == 0) {
2730 assert(
MI.getDesc().getNumOperands() == 3 &&
2731 MI.getOperand(2).getImm() == 0 &&
"invalid MOVZi operands");
2735 case AArch64::ANDWri:
2736 return MI.getOperand(1).getReg() == AArch64::WZR;
2737 case AArch64::ANDXri:
2738 return MI.getOperand(1).getReg() == AArch64::XZR;
2739 case TargetOpcode::COPY:
2740 return MI.getOperand(1).getReg() == AArch64::WZR;
2748 switch (
MI.getOpcode()) {
2751 case TargetOpcode::COPY: {
2754 return (AArch64::GPR32RegClass.
contains(DstReg) ||
2755 AArch64::GPR64RegClass.
contains(DstReg));
2757 case AArch64::ORRXrs:
2758 if (
MI.getOperand(1).getReg() == AArch64::XZR) {
2759 assert(
MI.getDesc().getNumOperands() == 4 &&
2760 MI.getOperand(3).getImm() == 0 &&
"invalid ORRrs operands");
2764 case AArch64::ADDXri:
2765 if (
MI.getOperand(2).getImm() == 0) {
2766 assert(
MI.getDesc().getNumOperands() == 4 &&
2767 MI.getOperand(3).getImm() == 0 &&
"invalid ADDXri operands");
2778 switch (
MI.getOpcode()) {
2781 case TargetOpcode::COPY: {
2783 return AArch64::FPR128RegClass.contains(DstReg);
2785 case AArch64::ORRv16i8:
2786 if (
MI.getOperand(1).getReg() ==
MI.getOperand(2).getReg()) {
2787 assert(
MI.getDesc().getNumOperands() == 3 &&
MI.getOperand(0).isReg() &&
2788 "invalid ORRv16i8 operands");
2800 case AArch64::LDRWui:
2801 case AArch64::LDRXui:
2802 case AArch64::LDRBui:
2803 case AArch64::LDRHui:
2804 case AArch64::LDRSui:
2805 case AArch64::LDRDui:
2806 case AArch64::LDRQui:
2807 case AArch64::LDR_PXI:
2813 int &FrameIndex)
const {
2817 if (
MI.getOperand(0).getSubReg() == 0 &&
MI.getOperand(1).isFI() &&
2818 MI.getOperand(2).isImm() &&
MI.getOperand(2).getImm() == 0) {
2819 FrameIndex =
MI.getOperand(1).getIndex();
2820 return MI.getOperand(0).getReg();
2829 case AArch64::STRWui:
2830 case AArch64::STRXui:
2831 case AArch64::STRBui:
2832 case AArch64::STRHui:
2833 case AArch64::STRSui:
2834 case AArch64::STRDui:
2835 case AArch64::STRQui:
2836 case AArch64::STR_PXI:
2842 int &FrameIndex)
const {
2846 if (
MI.getOperand(0).getSubReg() == 0 &&
MI.getOperand(1).isFI() &&
2847 MI.getOperand(2).isImm() &&
MI.getOperand(2).getImm() == 0) {
2848 FrameIndex =
MI.getOperand(1).getIndex();
2849 return MI.getOperand(0).getReg();
2855 int &FrameIndex)
const {
2870 return MI.getOperand(0).getReg();
2876 int &FrameIndex)
const {
2891 return MI.getOperand(0).getReg();
2899 return MMO->getFlags() & MOSuppressPair;
2905 if (
MI.memoperands_empty())
2913 return MMO->getFlags() & MOStridedAccess;
2921 case AArch64::STURSi:
2922 case AArch64::STRSpre:
2923 case AArch64::STURDi:
2924 case AArch64::STRDpre:
2925 case AArch64::STURQi:
2926 case AArch64::STRQpre:
2927 case AArch64::STURBBi:
2928 case AArch64::STURHHi:
2929 case AArch64::STURWi:
2930 case AArch64::STRWpre:
2931 case AArch64::STURXi:
2932 case AArch64::STRXpre:
2933 case AArch64::LDURSi:
2934 case AArch64::LDRSpre:
2935 case AArch64::LDURDi:
2936 case AArch64::LDRDpre:
2937 case AArch64::LDURQi:
2938 case AArch64::LDRQpre:
2939 case AArch64::LDURWi:
2940 case AArch64::LDRWpre:
2941 case AArch64::LDURXi:
2942 case AArch64::LDRXpre:
2943 case AArch64::LDRSWpre:
2944 case AArch64::LDURSWi:
2945 case AArch64::LDURHHi:
2946 case AArch64::LDURBBi:
2947 case AArch64::LDURSBWi:
2948 case AArch64::LDURSHWi:
2956 case AArch64::PRFMui:
return AArch64::PRFUMi;
2957 case AArch64::LDRXui:
return AArch64::LDURXi;
2958 case AArch64::LDRWui:
return AArch64::LDURWi;
2959 case AArch64::LDRBui:
return AArch64::LDURBi;
2960 case AArch64::LDRHui:
return AArch64::LDURHi;
2961 case AArch64::LDRSui:
return AArch64::LDURSi;
2962 case AArch64::LDRDui:
return AArch64::LDURDi;
2963 case AArch64::LDRQui:
return AArch64::LDURQi;
2964 case AArch64::LDRBBui:
return AArch64::LDURBBi;
2965 case AArch64::LDRHHui:
return AArch64::LDURHHi;
2966 case AArch64::LDRSBXui:
return AArch64::LDURSBXi;
2967 case AArch64::LDRSBWui:
return AArch64::LDURSBWi;
2968 case AArch64::LDRSHXui:
return AArch64::LDURSHXi;
2969 case AArch64::LDRSHWui:
return AArch64::LDURSHWi;
2970 case AArch64::LDRSWui:
return AArch64::LDURSWi;
2971 case AArch64::STRXui:
return AArch64::STURXi;
2972 case AArch64::STRWui:
return AArch64::STURWi;
2973 case AArch64::STRBui:
return AArch64::STURBi;
2974 case AArch64::STRHui:
return AArch64::STURHi;
2975 case AArch64::STRSui:
return AArch64::STURSi;
2976 case AArch64::STRDui:
return AArch64::STURDi;
2977 case AArch64::STRQui:
return AArch64::STURQi;
2978 case AArch64::STRBBui:
return AArch64::STURBBi;
2979 case AArch64::STRHHui:
return AArch64::STURHHi;
2988 case AArch64::LDAPURBi:
2989 case AArch64::LDAPURHi:
2990 case AArch64::LDAPURi:
2991 case AArch64::LDAPURSBWi:
2992 case AArch64::LDAPURSBXi:
2993 case AArch64::LDAPURSHWi:
2994 case AArch64::LDAPURSHXi:
2995 case AArch64::LDAPURSWi:
2996 case AArch64::LDAPURXi:
2997 case AArch64::LDR_PPXI:
2998 case AArch64::LDR_PXI:
2999 case AArch64::LDR_ZXI:
3000 case AArch64::LDR_ZZXI:
3001 case AArch64::LDR_ZZXI_STRIDED_CONTIGUOUS:
3002 case AArch64::LDR_ZZZXI:
3003 case AArch64::LDR_ZZZZXI:
3004 case AArch64::LDR_ZZZZXI_STRIDED_CONTIGUOUS:
3005 case AArch64::LDRBBui:
3006 case AArch64::LDRBui:
3007 case AArch64::LDRDui:
3008 case AArch64::LDRHHui:
3009 case AArch64::LDRHui:
3010 case AArch64::LDRQui:
3011 case AArch64::LDRSBWui:
3012 case AArch64::LDRSBXui:
3013 case AArch64::LDRSHWui:
3014 case AArch64::LDRSHXui:
3015 case AArch64::LDRSui:
3016 case AArch64::LDRSWui:
3017 case AArch64::LDRWui:
3018 case AArch64::LDRXui:
3019 case AArch64::LDURBBi:
3020 case AArch64::LDURBi:
3021 case AArch64::LDURDi:
3022 case AArch64::LDURHHi:
3023 case AArch64::LDURHi:
3024 case AArch64::LDURQi:
3025 case AArch64::LDURSBWi:
3026 case AArch64::LDURSBXi:
3027 case AArch64::LDURSHWi:
3028 case AArch64::LDURSHXi:
3029 case AArch64::LDURSi:
3030 case AArch64::LDURSWi:
3031 case AArch64::LDURWi:
3032 case AArch64::LDURXi:
3033 case AArch64::PRFMui:
3034 case AArch64::PRFUMi:
3035 case AArch64::ST2Gi:
3037 case AArch64::STLURBi:
3038 case AArch64::STLURHi:
3039 case AArch64::STLURWi:
3040 case AArch64::STLURXi:
3041 case AArch64::StoreSwiftAsyncContext:
3042 case AArch64::STR_PPXI:
3043 case AArch64::STR_PXI:
3044 case AArch64::STR_ZXI:
3045 case AArch64::STR_ZZXI:
3046 case AArch64::STR_ZZXI_STRIDED_CONTIGUOUS:
3047 case AArch64::STR_ZZZXI:
3048 case AArch64::STR_ZZZZXI:
3049 case AArch64::STR_ZZZZXI_STRIDED_CONTIGUOUS:
3050 case AArch64::STRBBui:
3051 case AArch64::STRBui:
3052 case AArch64::STRDui:
3053 case AArch64::STRHHui:
3054 case AArch64::STRHui:
3055 case AArch64::STRQui:
3056 case AArch64::STRSui:
3057 case AArch64::STRWui:
3058 case AArch64::STRXui:
3059 case AArch64::STURBBi:
3060 case AArch64::STURBi:
3061 case AArch64::STURDi:
3062 case AArch64::STURHHi:
3063 case AArch64::STURHi:
3064 case AArch64::STURQi:
3065 case AArch64::STURSi:
3066 case AArch64::STURWi:
3067 case AArch64::STURXi:
3068 case AArch64::STZ2Gi:
3069 case AArch64::STZGi:
3070 case AArch64::TAGPstack:
3072 case AArch64::LD1B_D_IMM:
3073 case AArch64::LD1B_H_IMM:
3074 case AArch64::LD1B_IMM:
3075 case AArch64::LD1B_S_IMM:
3076 case AArch64::LD1D_IMM:
3077 case AArch64::LD1H_D_IMM:
3078 case AArch64::LD1H_IMM:
3079 case AArch64::LD1H_S_IMM:
3080 case AArch64::LD1RB_D_IMM:
3081 case AArch64::LD1RB_H_IMM:
3082 case AArch64::LD1RB_IMM:
3083 case AArch64::LD1RB_S_IMM:
3084 case AArch64::LD1RD_IMM:
3085 case AArch64::LD1RH_D_IMM:
3086 case AArch64::LD1RH_IMM:
3087 case AArch64::LD1RH_S_IMM:
3088 case AArch64::LD1RSB_D_IMM:
3089 case AArch64::LD1RSB_H_IMM:
3090 case AArch64::LD1RSB_S_IMM:
3091 case AArch64::LD1RSH_D_IMM:
3092 case AArch64::LD1RSH_S_IMM:
3093 case AArch64::LD1RSW_IMM:
3094 case AArch64::LD1RW_D_IMM:
3095 case AArch64::LD1RW_IMM:
3096 case AArch64::LD1SB_D_IMM:
3097 case AArch64::LD1SB_H_IMM:
3098 case AArch64::LD1SB_S_IMM:
3099 case AArch64::LD1SH_D_IMM:
3100 case AArch64::LD1SH_S_IMM:
3101 case AArch64::LD1SW_D_IMM:
3102 case AArch64::LD1W_D_IMM:
3103 case AArch64::LD1W_IMM:
3104 case AArch64::LD2B_IMM:
3105 case AArch64::LD2D_IMM:
3106 case AArch64::LD2H_IMM:
3107 case AArch64::LD2W_IMM:
3108 case AArch64::LD3B_IMM:
3109 case AArch64::LD3D_IMM:
3110 case AArch64::LD3H_IMM:
3111 case AArch64::LD3W_IMM:
3112 case AArch64::LD4B_IMM:
3113 case AArch64::LD4D_IMM:
3114 case AArch64::LD4H_IMM:
3115 case AArch64::LD4W_IMM:
3117 case AArch64::LDNF1B_D_IMM:
3118 case AArch64::LDNF1B_H_IMM:
3119 case AArch64::LDNF1B_IMM:
3120 case AArch64::LDNF1B_S_IMM:
3121 case AArch64::LDNF1D_IMM:
3122 case AArch64::LDNF1H_D_IMM:
3123 case AArch64::LDNF1H_IMM:
3124 case AArch64::LDNF1H_S_IMM:
3125 case AArch64::LDNF1SB_D_IMM:
3126 case AArch64::LDNF1SB_H_IMM:
3127 case AArch64::LDNF1SB_S_IMM:
3128 case AArch64::LDNF1SH_D_IMM:
3129 case AArch64::LDNF1SH_S_IMM:
3130 case AArch64::LDNF1SW_D_IMM:
3131 case AArch64::LDNF1W_D_IMM:
3132 case AArch64::LDNF1W_IMM:
3133 case AArch64::LDNPDi:
3134 case AArch64::LDNPQi:
3135 case AArch64::LDNPSi:
3136 case AArch64::LDNPWi:
3137 case AArch64::LDNPXi:
3138 case AArch64::LDNT1B_ZRI:
3139 case AArch64::LDNT1D_ZRI:
3140 case AArch64::LDNT1H_ZRI:
3141 case AArch64::LDNT1W_ZRI:
3142 case AArch64::LDPDi:
3143 case AArch64::LDPQi:
3144 case AArch64::LDPSi:
3145 case AArch64::LDPWi:
3146 case AArch64::LDPXi:
3147 case AArch64::LDRBBpost:
3148 case AArch64::LDRBBpre:
3149 case AArch64::LDRBpost:
3150 case AArch64::LDRBpre:
3151 case AArch64::LDRDpost:
3152 case AArch64::LDRDpre:
3153 case AArch64::LDRHHpost:
3154 case AArch64::LDRHHpre:
3155 case AArch64::LDRHpost:
3156 case AArch64::LDRHpre:
3157 case AArch64::LDRQpost:
3158 case AArch64::LDRQpre:
3159 case AArch64::LDRSpost:
3160 case AArch64::LDRSpre:
3161 case AArch64::LDRWpost:
3162 case AArch64::LDRWpre:
3163 case AArch64::LDRXpost:
3164 case AArch64::LDRXpre:
3165 case AArch64::ST1B_D_IMM:
3166 case AArch64::ST1B_H_IMM:
3167 case AArch64::ST1B_IMM:
3168 case AArch64::ST1B_S_IMM:
3169 case AArch64::ST1D_IMM:
3170 case AArch64::ST1H_D_IMM:
3171 case AArch64::ST1H_IMM:
3172 case AArch64::ST1H_S_IMM:
3173 case AArch64::ST1W_D_IMM:
3174 case AArch64::ST1W_IMM:
3175 case AArch64::ST2B_IMM:
3176 case AArch64::ST2D_IMM:
3177 case AArch64::ST2H_IMM:
3178 case AArch64::ST2W_IMM:
3179 case AArch64::ST3B_IMM:
3180 case AArch64::ST3D_IMM:
3181 case AArch64::ST3H_IMM:
3182 case AArch64::ST3W_IMM:
3183 case AArch64::ST4B_IMM:
3184 case AArch64::ST4D_IMM:
3185 case AArch64::ST4H_IMM:
3186 case AArch64::ST4W_IMM:
3187 case AArch64::STGPi:
3188 case AArch64::STGPreIndex:
3189 case AArch64::STZGPreIndex:
3190 case AArch64::ST2GPreIndex:
3191 case AArch64::STZ2GPreIndex:
3192 case AArch64::STGPostIndex:
3193 case AArch64::STZGPostIndex:
3194 case AArch64::ST2GPostIndex:
3195 case AArch64::STZ2GPostIndex:
3196 case AArch64::STNPDi:
3197 case AArch64::STNPQi:
3198 case AArch64::STNPSi:
3199 case AArch64::STNPWi:
3200 case AArch64::STNPXi:
3201 case AArch64::STNT1B_ZRI:
3202 case AArch64::STNT1D_ZRI:
3203 case AArch64::STNT1H_ZRI:
3204 case AArch64::STNT1W_ZRI:
3205 case AArch64::STPDi:
3206 case AArch64::STPQi:
3207 case AArch64::STPSi:
3208 case AArch64::STPWi:
3209 case AArch64::STPXi:
3210 case AArch64::STRBBpost:
3211 case AArch64::STRBBpre:
3212 case AArch64::STRBpost:
3213 case AArch64::STRBpre:
3214 case AArch64::STRDpost:
3215 case AArch64::STRDpre:
3216 case AArch64::STRHHpost:
3217 case AArch64::STRHHpre:
3218 case AArch64::STRHpost:
3219 case AArch64::STRHpre:
3220 case AArch64::STRQpost:
3221 case AArch64::STRQpre:
3222 case AArch64::STRSpost:
3223 case AArch64::STRSpre:
3224 case AArch64::STRWpost:
3225 case AArch64::STRWpre:
3226 case AArch64::STRXpost:
3227 case AArch64::STRXpre:
3228 case AArch64::LD1B_2Z_IMM:
3229 case AArch64::LD1B_2Z_STRIDED_IMM:
3230 case AArch64::LD1H_2Z_IMM:
3231 case AArch64::LD1H_2Z_STRIDED_IMM:
3232 case AArch64::LD1W_2Z_IMM:
3233 case AArch64::LD1W_2Z_STRIDED_IMM:
3234 case AArch64::LD1D_2Z_IMM:
3235 case AArch64::LD1D_2Z_STRIDED_IMM:
3236 case AArch64::LD1B_4Z_IMM:
3237 case AArch64::LD1B_4Z_STRIDED_IMM:
3238 case AArch64::LD1H_4Z_IMM:
3239 case AArch64::LD1H_4Z_STRIDED_IMM:
3240 case AArch64::LD1W_4Z_IMM:
3241 case AArch64::LD1W_4Z_STRIDED_IMM:
3242 case AArch64::LD1D_4Z_IMM:
3243 case AArch64::LD1D_4Z_STRIDED_IMM:
3244 case AArch64::LD1B_2Z_IMM_PSEUDO:
3245 case AArch64::LD1H_2Z_IMM_PSEUDO:
3246 case AArch64::LD1W_2Z_IMM_PSEUDO:
3247 case AArch64::LD1D_2Z_IMM_PSEUDO:
3248 case AArch64::LD1B_4Z_IMM_PSEUDO:
3249 case AArch64::LD1H_4Z_IMM_PSEUDO:
3250 case AArch64::LD1W_4Z_IMM_PSEUDO:
3251 case AArch64::LD1D_4Z_IMM_PSEUDO:
3252 case AArch64::ST1B_2Z_IMM:
3253 case AArch64::ST1B_2Z_STRIDED_IMM:
3254 case AArch64::ST1H_2Z_IMM:
3255 case AArch64::ST1H_2Z_STRIDED_IMM:
3256 case AArch64::ST1W_2Z_IMM:
3257 case AArch64::ST1W_2Z_STRIDED_IMM:
3258 case AArch64::ST1D_2Z_IMM:
3259 case AArch64::ST1D_2Z_STRIDED_IMM:
3260 case AArch64::LDNT1B_2Z_IMM_PSEUDO:
3261 case AArch64::LDNT1B_2Z_IMM:
3262 case AArch64::LDNT1B_2Z_STRIDED_IMM:
3263 case AArch64::LDNT1H_2Z_IMM_PSEUDO:
3264 case AArch64::LDNT1H_2Z_IMM:
3265 case AArch64::LDNT1H_2Z_STRIDED_IMM:
3266 case AArch64::LDNT1W_2Z_IMM_PSEUDO:
3267 case AArch64::LDNT1W_2Z_IMM:
3268 case AArch64::LDNT1W_2Z_STRIDED_IMM:
3269 case AArch64::LDNT1D_2Z_IMM_PSEUDO:
3270 case AArch64::LDNT1D_2Z_IMM:
3271 case AArch64::LDNT1D_2Z_STRIDED_IMM:
3272 case AArch64::STNT1B_2Z_IMM:
3273 case AArch64::STNT1B_2Z_STRIDED_IMM:
3274 case AArch64::STNT1H_2Z_IMM:
3275 case AArch64::STNT1H_2Z_STRIDED_IMM:
3276 case AArch64::STNT1W_2Z_IMM:
3277 case AArch64::STNT1W_2Z_STRIDED_IMM:
3278 case AArch64::STNT1D_2Z_IMM:
3279 case AArch64::STNT1D_2Z_STRIDED_IMM:
3280 case AArch64::ST1B_4Z_IMM:
3281 case AArch64::ST1B_4Z_STRIDED_IMM:
3282 case AArch64::ST1H_4Z_IMM:
3283 case AArch64::ST1H_4Z_STRIDED_IMM:
3284 case AArch64::ST1W_4Z_IMM:
3285 case AArch64::ST1W_4Z_STRIDED_IMM:
3286 case AArch64::ST1D_4Z_IMM:
3287 case AArch64::ST1D_4Z_STRIDED_IMM:
3288 case AArch64::LDNT1B_4Z_IMM_PSEUDO:
3289 case AArch64::LDNT1B_4Z_IMM:
3290 case AArch64::LDNT1B_4Z_STRIDED_IMM:
3291 case AArch64::LDNT1H_4Z_IMM_PSEUDO:
3292 case AArch64::LDNT1H_4Z_IMM:
3293 case AArch64::LDNT1H_4Z_STRIDED_IMM:
3294 case AArch64::LDNT1W_4Z_IMM_PSEUDO:
3295 case AArch64::LDNT1W_4Z_IMM:
3296 case AArch64::LDNT1W_4Z_STRIDED_IMM:
3297 case AArch64::LDNT1D_4Z_IMM_PSEUDO:
3298 case AArch64::LDNT1D_4Z_IMM:
3299 case AArch64::LDNT1D_4Z_STRIDED_IMM:
3300 case AArch64::STNT1B_4Z_IMM:
3301 case AArch64::STNT1B_4Z_STRIDED_IMM:
3302 case AArch64::STNT1H_4Z_IMM:
3303 case AArch64::STNT1H_4Z_STRIDED_IMM:
3304 case AArch64::STNT1W_4Z_IMM:
3305 case AArch64::STNT1W_4Z_STRIDED_IMM:
3306 case AArch64::STNT1D_4Z_IMM:
3307 case AArch64::STNT1D_4Z_STRIDED_IMM:
3309 case AArch64::LDPDpost:
3310 case AArch64::LDPDpre:
3311 case AArch64::LDPQpost:
3312 case AArch64::LDPQpre:
3313 case AArch64::LDPSpost:
3314 case AArch64::LDPSpre:
3315 case AArch64::LDPWpost:
3316 case AArch64::LDPWpre:
3317 case AArch64::LDPXpost:
3318 case AArch64::LDPXpre:
3319 case AArch64::STGPpre:
3320 case AArch64::STGPpost:
3321 case AArch64::STPDpost:
3322 case AArch64::STPDpre:
3323 case AArch64::STPQpost:
3324 case AArch64::STPQpre:
3325 case AArch64::STPSpost:
3326 case AArch64::STPSpre:
3327 case AArch64::STPWpost:
3328 case AArch64::STPWpre:
3329 case AArch64::STPXpost:
3330 case AArch64::STPXpre:
3336 switch (
MI.getOpcode()) {
3340 case AArch64::STRSui:
3341 case AArch64::STRDui:
3342 case AArch64::STRQui:
3343 case AArch64::STRXui:
3344 case AArch64::STRWui:
3345 case AArch64::LDRSui:
3346 case AArch64::LDRDui:
3347 case AArch64::LDRQui:
3348 case AArch64::LDRXui:
3349 case AArch64::LDRWui:
3350 case AArch64::LDRSWui:
3352 case AArch64::STURSi:
3353 case AArch64::STRSpre:
3354 case AArch64::STURDi:
3355 case AArch64::STRDpre:
3356 case AArch64::STURQi:
3357 case AArch64::STRQpre:
3358 case AArch64::STURWi:
3359 case AArch64::STRWpre:
3360 case AArch64::STURXi:
3361 case AArch64::STRXpre:
3362 case AArch64::LDURSi:
3363 case AArch64::LDRSpre:
3364 case AArch64::LDURDi:
3365 case AArch64::LDRDpre:
3366 case AArch64::LDURQi:
3367 case AArch64::LDRQpre:
3368 case AArch64::LDURWi:
3369 case AArch64::LDRWpre:
3370 case AArch64::LDURXi:
3371 case AArch64::LDRXpre:
3372 case AArch64::LDURSWi:
3373 case AArch64::LDRSWpre:
3375 case AArch64::LDR_ZXI:
3376 case AArch64::STR_ZXI:
3382 switch (
MI.getOpcode()) {
3385 "Unexpected instruction - was a new tail call opcode introduced?");
3387 case AArch64::TCRETURNdi:
3388 case AArch64::TCRETURNri:
3389 case AArch64::TCRETURNrix16x17:
3390 case AArch64::TCRETURNrix17:
3391 case AArch64::TCRETURNrinotx16:
3392 case AArch64::TCRETURNriALL:
3393 case AArch64::AUTH_TCRETURN:
3394 case AArch64::AUTH_TCRETURN_BTI:
3404 case AArch64::ADDWri:
3405 return AArch64::ADDSWri;
3406 case AArch64::ADDWrr:
3407 return AArch64::ADDSWrr;
3408 case AArch64::ADDWrs:
3409 return AArch64::ADDSWrs;
3410 case AArch64::ADDWrx:
3411 return AArch64::ADDSWrx;
3412 case AArch64::ANDWri:
3413 return AArch64::ANDSWri;
3414 case AArch64::ANDWrr:
3415 return AArch64::ANDSWrr;
3416 case AArch64::ANDWrs:
3417 return AArch64::ANDSWrs;
3418 case AArch64::BICWrr:
3419 return AArch64::BICSWrr;
3420 case AArch64::BICWrs:
3421 return AArch64::BICSWrs;
3422 case AArch64::SUBWri:
3423 return AArch64::SUBSWri;
3424 case AArch64::SUBWrr:
3425 return AArch64::SUBSWrr;
3426 case AArch64::SUBWrs:
3427 return AArch64::SUBSWrs;
3428 case AArch64::SUBWrx:
3429 return AArch64::SUBSWrx;
3431 case AArch64::ADDXri:
3432 return AArch64::ADDSXri;
3433 case AArch64::ADDXrr:
3434 return AArch64::ADDSXrr;
3435 case AArch64::ADDXrs:
3436 return AArch64::ADDSXrs;
3437 case AArch64::ADDXrx:
3438 return AArch64::ADDSXrx;
3439 case AArch64::ANDXri:
3440 return AArch64::ANDSXri;
3441 case AArch64::ANDXrr:
3442 return AArch64::ANDSXrr;
3443 case AArch64::ANDXrs:
3444 return AArch64::ANDSXrs;
3445 case AArch64::BICXrr:
3446 return AArch64::BICSXrr;
3447 case AArch64::BICXrs:
3448 return AArch64::BICSXrs;
3449 case AArch64::SUBXri:
3450 return AArch64::SUBSXri;
3451 case AArch64::SUBXrr:
3452 return AArch64::SUBSXrr;
3453 case AArch64::SUBXrs:
3454 return AArch64::SUBSXrs;
3455 case AArch64::SUBXrx:
3456 return AArch64::SUBSXrx;
3458 case AArch64::AND_PPzPP:
3459 return AArch64::ANDS_PPzPP;
3460 case AArch64::BIC_PPzPP:
3461 return AArch64::BICS_PPzPP;
3462 case AArch64::EOR_PPzPP:
3463 return AArch64::EORS_PPzPP;
3464 case AArch64::NAND_PPzPP:
3465 return AArch64::NANDS_PPzPP;
3466 case AArch64::NOR_PPzPP:
3467 return AArch64::NORS_PPzPP;
3468 case AArch64::ORN_PPzPP:
3469 return AArch64::ORNS_PPzPP;
3470 case AArch64::ORR_PPzPP:
3471 return AArch64::ORRS_PPzPP;
3472 case AArch64::BRKA_PPzP:
3473 return AArch64::BRKAS_PPzP;
3474 case AArch64::BRKPA_PPzPP:
3475 return AArch64::BRKPAS_PPzPP;
3476 case AArch64::BRKB_PPzP:
3477 return AArch64::BRKBS_PPzP;
3478 case AArch64::BRKPB_PPzPP:
3479 return AArch64::BRKPBS_PPzPP;
3480 case AArch64::BRKN_PPzP:
3481 return AArch64::BRKNS_PPzP;
3482 case AArch64::RDFFR_PPz:
3483 return AArch64::RDFFRS_PPz;
3484 case AArch64::PTRUE_B:
3485 return AArch64::PTRUES_B;
3496 if (
MI.hasOrderedMemoryRef())
3501 assert((
MI.getOperand(IsPreLdSt ? 2 : 1).isReg() ||
3502 MI.getOperand(IsPreLdSt ? 2 : 1).isFI()) &&
3503 "Expected a reg or frame index operand.");
3507 bool IsImmPreLdSt = IsPreLdSt &&
MI.getOperand(3).isImm();
3509 if (!
MI.getOperand(2).isImm() && !IsImmPreLdSt)
3522 if (
MI.getOperand(1).isReg() && !IsPreLdSt) {
3523 Register BaseReg =
MI.getOperand(1).getReg();
3525 if (
MI.modifiesRegister(BaseReg,
TRI))
3531 switch (
MI.getOpcode()) {
3534 case AArch64::LDR_ZXI:
3535 case AArch64::STR_ZXI:
3536 if (!Subtarget.isLittleEndian() ||
3537 Subtarget.getSVEVectorSizeInBits() != 128)
3550 const MCAsmInfo &MAI =
MI.getMF()->getTarget().getMCAsmInfo();
3558 if (Subtarget.isPaired128Slow()) {
3559 switch (
MI.getOpcode()) {
3562 case AArch64::LDURQi:
3563 case AArch64::STURQi:
3564 case AArch64::LDRQui:
3565 case AArch64::STRQui:
3592std::optional<ExtAddrMode>
3597 bool OffsetIsScalable;
3598 if (!getMemOperandWithOffset(MemI,
Base,
Offset, OffsetIsScalable,
TRI))
3599 return std::nullopt;
3602 return std::nullopt;
3617 int64_t OffsetScale = 1;
3622 case AArch64::LDURQi:
3623 case AArch64::STURQi:
3627 case AArch64::LDURDi:
3628 case AArch64::STURDi:
3629 case AArch64::LDURXi:
3630 case AArch64::STURXi:
3634 case AArch64::LDURWi:
3635 case AArch64::LDURSWi:
3636 case AArch64::STURWi:
3640 case AArch64::LDURHi:
3641 case AArch64::STURHi:
3642 case AArch64::LDURHHi:
3643 case AArch64::STURHHi:
3644 case AArch64::LDURSHXi:
3645 case AArch64::LDURSHWi:
3649 case AArch64::LDRBroX:
3650 case AArch64::LDRBBroX:
3651 case AArch64::LDRSBXroX:
3652 case AArch64::LDRSBWroX:
3653 case AArch64::STRBroX:
3654 case AArch64::STRBBroX:
3655 case AArch64::LDURBi:
3656 case AArch64::LDURBBi:
3657 case AArch64::LDURSBXi:
3658 case AArch64::LDURSBWi:
3659 case AArch64::STURBi:
3660 case AArch64::STURBBi:
3661 case AArch64::LDRBui:
3662 case AArch64::LDRBBui:
3663 case AArch64::LDRSBXui:
3664 case AArch64::LDRSBWui:
3665 case AArch64::STRBui:
3666 case AArch64::STRBBui:
3670 case AArch64::LDRQroX:
3671 case AArch64::STRQroX:
3672 case AArch64::LDRQui:
3673 case AArch64::STRQui:
3678 case AArch64::LDRDroX:
3679 case AArch64::STRDroX:
3680 case AArch64::LDRXroX:
3681 case AArch64::STRXroX:
3682 case AArch64::LDRDui:
3683 case AArch64::STRDui:
3684 case AArch64::LDRXui:
3685 case AArch64::STRXui:
3690 case AArch64::LDRWroX:
3691 case AArch64::LDRSWroX:
3692 case AArch64::STRWroX:
3693 case AArch64::LDRWui:
3694 case AArch64::LDRSWui:
3695 case AArch64::STRWui:
3700 case AArch64::LDRHroX:
3701 case AArch64::STRHroX:
3702 case AArch64::LDRHHroX:
3703 case AArch64::STRHHroX:
3704 case AArch64::LDRSHXroX:
3705 case AArch64::LDRSHWroX:
3706 case AArch64::LDRHui:
3707 case AArch64::STRHui:
3708 case AArch64::LDRHHui:
3709 case AArch64::STRHHui:
3710 case AArch64::LDRSHXui:
3711 case AArch64::LDRSHWui:
3719 if (BaseRegOp.
isReg() && BaseRegOp.
getReg() == Reg)
3743 case AArch64::SBFMXri:
3756 AM.
Scale = OffsetScale;
3761 case TargetOpcode::SUBREG_TO_REG: {
3777 if (
DefMI.getOpcode() != AArch64::ORRWrs ||
3778 DefMI.getOperand(1).getReg() != AArch64::WZR ||
3779 DefMI.getOperand(3).getImm() != 0)
3786 AM.
Scale = OffsetScale;
3797 auto validateOffsetForLDP = [](
unsigned NumBytes, int64_t OldOffset,
3798 int64_t NewOffset) ->
bool {
3799 int64_t MinOffset, MaxOffset;
3816 return OldOffset < MinOffset || OldOffset > MaxOffset ||
3817 (NewOffset >= MinOffset && NewOffset <= MaxOffset);
3819 auto canFoldAddSubImmIntoAddrMode = [&](int64_t Disp) ->
bool {
3821 int64_t NewOffset = OldOffset + Disp;
3822 if (!isLegalAddressingMode(NumBytes, NewOffset, 0))
3826 if (!validateOffsetForLDP(NumBytes, OldOffset, NewOffset))
3836 auto canFoldAddRegIntoAddrMode =
3841 if ((
unsigned)Scale != Scale)
3843 if (!isLegalAddressingMode(NumBytes, 0, Scale))
3855 return (Opcode == AArch64::STURQi || Opcode == AArch64::STRQui) &&
3856 Subtarget.isSTRQroSlow();
3865 case AArch64::ADDXri:
3871 return canFoldAddSubImmIntoAddrMode(Disp);
3873 case AArch64::SUBXri:
3879 return canFoldAddSubImmIntoAddrMode(-Disp);
3881 case AArch64::ADDXrs: {
3894 if (Shift != 2 && Shift != 3 && Subtarget.hasAddrLSLSlow14())
3896 if (avoidSlowSTRQ(MemI))
3899 return canFoldAddRegIntoAddrMode(1ULL << Shift);
3902 case AArch64::ADDXrr:
3910 if (!OptSize && avoidSlowSTRQ(MemI))
3912 return canFoldAddRegIntoAddrMode(1);
3914 case AArch64::ADDXrx:
3922 if (!OptSize && avoidSlowSTRQ(MemI))
3931 return canFoldAddRegIntoAddrMode(
3946 case AArch64::LDURQi:
3947 case AArch64::LDRQui:
3948 return AArch64::LDRQroX;
3949 case AArch64::STURQi:
3950 case AArch64::STRQui:
3951 return AArch64::STRQroX;
3952 case AArch64::LDURDi:
3953 case AArch64::LDRDui:
3954 return AArch64::LDRDroX;
3955 case AArch64::STURDi:
3956 case AArch64::STRDui:
3957 return AArch64::STRDroX;
3958 case AArch64::LDURXi:
3959 case AArch64::LDRXui:
3960 return AArch64::LDRXroX;
3961 case AArch64::STURXi:
3962 case AArch64::STRXui:
3963 return AArch64::STRXroX;
3964 case AArch64::LDURWi:
3965 case AArch64::LDRWui:
3966 return AArch64::LDRWroX;
3967 case AArch64::LDURSWi:
3968 case AArch64::LDRSWui:
3969 return AArch64::LDRSWroX;
3970 case AArch64::STURWi:
3971 case AArch64::STRWui:
3972 return AArch64::STRWroX;
3973 case AArch64::LDURHi:
3974 case AArch64::LDRHui:
3975 return AArch64::LDRHroX;
3976 case AArch64::STURHi:
3977 case AArch64::STRHui:
3978 return AArch64::STRHroX;
3979 case AArch64::LDURHHi:
3980 case AArch64::LDRHHui:
3981 return AArch64::LDRHHroX;
3982 case AArch64::STURHHi:
3983 case AArch64::STRHHui:
3984 return AArch64::STRHHroX;
3985 case AArch64::LDURSHXi:
3986 case AArch64::LDRSHXui:
3987 return AArch64::LDRSHXroX;
3988 case AArch64::LDURSHWi:
3989 case AArch64::LDRSHWui:
3990 return AArch64::LDRSHWroX;
3991 case AArch64::LDURBi:
3992 case AArch64::LDRBui:
3993 return AArch64::LDRBroX;
3994 case AArch64::LDURBBi:
3995 case AArch64::LDRBBui:
3996 return AArch64::LDRBBroX;
3997 case AArch64::LDURSBXi:
3998 case AArch64::LDRSBXui:
3999 return AArch64::LDRSBXroX;
4000 case AArch64::LDURSBWi:
4001 case AArch64::LDRSBWui:
4002 return AArch64::LDRSBWroX;
4003 case AArch64::STURBi:
4004 case AArch64::STRBui:
4005 return AArch64::STRBroX;
4006 case AArch64::STURBBi:
4007 case AArch64::STRBBui:
4008 return AArch64::STRBBroX;
4020 case AArch64::LDURQi:
4022 return AArch64::LDRQui;
4023 case AArch64::STURQi:
4025 return AArch64::STRQui;
4026 case AArch64::LDURDi:
4028 return AArch64::LDRDui;
4029 case AArch64::STURDi:
4031 return AArch64::STRDui;
4032 case AArch64::LDURXi:
4034 return AArch64::LDRXui;
4035 case AArch64::STURXi:
4037 return AArch64::STRXui;
4038 case AArch64::LDURWi:
4040 return AArch64::LDRWui;
4041 case AArch64::LDURSWi:
4043 return AArch64::LDRSWui;
4044 case AArch64::STURWi:
4046 return AArch64::STRWui;
4047 case AArch64::LDURHi:
4049 return AArch64::LDRHui;
4050 case AArch64::STURHi:
4052 return AArch64::STRHui;
4053 case AArch64::LDURHHi:
4055 return AArch64::LDRHHui;
4056 case AArch64::STURHHi:
4058 return AArch64::STRHHui;
4059 case AArch64::LDURSHXi:
4061 return AArch64::LDRSHXui;
4062 case AArch64::LDURSHWi:
4064 return AArch64::LDRSHWui;
4065 case AArch64::LDURBi:
4067 return AArch64::LDRBui;
4068 case AArch64::LDURBBi:
4070 return AArch64::LDRBBui;
4071 case AArch64::LDURSBXi:
4073 return AArch64::LDRSBXui;
4074 case AArch64::LDURSBWi:
4076 return AArch64::LDRSBWui;
4077 case AArch64::STURBi:
4079 return AArch64::STRBui;
4080 case AArch64::STURBBi:
4082 return AArch64::STRBBui;
4083 case AArch64::LDRQui:
4084 case AArch64::STRQui:
4087 case AArch64::LDRDui:
4088 case AArch64::STRDui:
4089 case AArch64::LDRXui:
4090 case AArch64::STRXui:
4093 case AArch64::LDRWui:
4094 case AArch64::LDRSWui:
4095 case AArch64::STRWui:
4098 case AArch64::LDRHui:
4099 case AArch64::STRHui:
4100 case AArch64::LDRHHui:
4101 case AArch64::STRHHui:
4102 case AArch64::LDRSHXui:
4103 case AArch64::LDRSHWui:
4106 case AArch64::LDRBui:
4107 case AArch64::LDRBBui:
4108 case AArch64::LDRSBXui:
4109 case AArch64::LDRSBWui:
4110 case AArch64::STRBui:
4111 case AArch64::STRBBui:
4125 case AArch64::LDURQi:
4126 case AArch64::STURQi:
4127 case AArch64::LDURDi:
4128 case AArch64::STURDi:
4129 case AArch64::LDURXi:
4130 case AArch64::STURXi:
4131 case AArch64::LDURWi:
4132 case AArch64::LDURSWi:
4133 case AArch64::STURWi:
4134 case AArch64::LDURHi:
4135 case AArch64::STURHi:
4136 case AArch64::LDURHHi:
4137 case AArch64::STURHHi:
4138 case AArch64::LDURSHXi:
4139 case AArch64::LDURSHWi:
4140 case AArch64::LDURBi:
4141 case AArch64::STURBi:
4142 case AArch64::LDURBBi:
4143 case AArch64::STURBBi:
4144 case AArch64::LDURSBWi:
4145 case AArch64::LDURSBXi:
4147 case AArch64::LDRQui:
4148 return AArch64::LDURQi;
4149 case AArch64::STRQui:
4150 return AArch64::STURQi;
4151 case AArch64::LDRDui:
4152 return AArch64::LDURDi;
4153 case AArch64::STRDui:
4154 return AArch64::STURDi;
4155 case AArch64::LDRXui:
4156 return AArch64::LDURXi;
4157 case AArch64::STRXui:
4158 return AArch64::STURXi;
4159 case AArch64::LDRWui:
4160 return AArch64::LDURWi;
4161 case AArch64::LDRSWui:
4162 return AArch64::LDURSWi;
4163 case AArch64::STRWui:
4164 return AArch64::STURWi;
4165 case AArch64::LDRHui:
4166 return AArch64::LDURHi;
4167 case AArch64::STRHui:
4168 return AArch64::STURHi;
4169 case AArch64::LDRHHui:
4170 return AArch64::LDURHHi;
4171 case AArch64::STRHHui:
4172 return AArch64::STURHHi;
4173 case AArch64::LDRSHXui:
4174 return AArch64::LDURSHXi;
4175 case AArch64::LDRSHWui:
4176 return AArch64::LDURSHWi;
4177 case AArch64::LDRBBui:
4178 return AArch64::LDURBBi;
4179 case AArch64::LDRBui:
4180 return AArch64::LDURBi;
4181 case AArch64::STRBBui:
4182 return AArch64::STURBBi;
4183 case AArch64::STRBui:
4184 return AArch64::STURBi;
4185 case AArch64::LDRSBWui:
4186 return AArch64::LDURSBWi;
4187 case AArch64::LDRSBXui:
4188 return AArch64::LDURSBXi;
4201 case AArch64::LDRQroX:
4202 case AArch64::LDURQi:
4203 case AArch64::LDRQui:
4204 return AArch64::LDRQroW;
4205 case AArch64::STRQroX:
4206 case AArch64::STURQi:
4207 case AArch64::STRQui:
4208 return AArch64::STRQroW;
4209 case AArch64::LDRDroX:
4210 case AArch64::LDURDi:
4211 case AArch64::LDRDui:
4212 return AArch64::LDRDroW;
4213 case AArch64::STRDroX:
4214 case AArch64::STURDi:
4215 case AArch64::STRDui:
4216 return AArch64::STRDroW;
4217 case AArch64::LDRXroX:
4218 case AArch64::LDURXi:
4219 case AArch64::LDRXui:
4220 return AArch64::LDRXroW;
4221 case AArch64::STRXroX:
4222 case AArch64::STURXi:
4223 case AArch64::STRXui:
4224 return AArch64::STRXroW;
4225 case AArch64::LDRWroX:
4226 case AArch64::LDURWi:
4227 case AArch64::LDRWui:
4228 return AArch64::LDRWroW;
4229 case AArch64::LDRSWroX:
4230 case AArch64::LDURSWi:
4231 case AArch64::LDRSWui:
4232 return AArch64::LDRSWroW;
4233 case AArch64::STRWroX:
4234 case AArch64::STURWi:
4235 case AArch64::STRWui:
4236 return AArch64::STRWroW;
4237 case AArch64::LDRHroX:
4238 case AArch64::LDURHi:
4239 case AArch64::LDRHui:
4240 return AArch64::LDRHroW;
4241 case AArch64::STRHroX:
4242 case AArch64::STURHi:
4243 case AArch64::STRHui:
4244 return AArch64::STRHroW;
4245 case AArch64::LDRHHroX:
4246 case AArch64::LDURHHi:
4247 case AArch64::LDRHHui:
4248 return AArch64::LDRHHroW;
4249 case AArch64::STRHHroX:
4250 case AArch64::STURHHi:
4251 case AArch64::STRHHui:
4252 return AArch64::STRHHroW;
4253 case AArch64::LDRSHXroX:
4254 case AArch64::LDURSHXi:
4255 case AArch64::LDRSHXui:
4256 return AArch64::LDRSHXroW;
4257 case AArch64::LDRSHWroX:
4258 case AArch64::LDURSHWi:
4259 case AArch64::LDRSHWui:
4260 return AArch64::LDRSHWroW;
4261 case AArch64::LDRBroX:
4262 case AArch64::LDURBi:
4263 case AArch64::LDRBui:
4264 return AArch64::LDRBroW;
4265 case AArch64::LDRBBroX:
4266 case AArch64::LDURBBi:
4267 case AArch64::LDRBBui:
4268 return AArch64::LDRBBroW;
4269 case AArch64::LDRSBXroX:
4270 case AArch64::LDURSBXi:
4271 case AArch64::LDRSBXui:
4272 return AArch64::LDRSBXroW;
4273 case AArch64::LDRSBWroX:
4274 case AArch64::LDURSBWi:
4275 case AArch64::LDRSBWui:
4276 return AArch64::LDRSBWroW;
4277 case AArch64::STRBroX:
4278 case AArch64::STURBi:
4279 case AArch64::STRBui:
4280 return AArch64::STRBroW;
4281 case AArch64::STRBBroX:
4282 case AArch64::STURBBi:
4283 case AArch64::STRBBui:
4284 return AArch64::STRBBroW;
4309 return B.getInstr();
4313 "Addressing mode not supported for folding");
4330 return B.getInstr();
4337 "Address offset can be a register or an immediate, but not both");
4358 return B.getInstr();
4362 "Function must not be called with an addressing mode it can't handle");
4371 case AArch64::LD1Fourv16b_POST:
4372 case AArch64::LD1Fourv1d_POST:
4373 case AArch64::LD1Fourv2d_POST:
4374 case AArch64::LD1Fourv2s_POST:
4375 case AArch64::LD1Fourv4h_POST:
4376 case AArch64::LD1Fourv4s_POST:
4377 case AArch64::LD1Fourv8b_POST:
4378 case AArch64::LD1Fourv8h_POST:
4379 case AArch64::LD1Onev16b_POST:
4380 case AArch64::LD1Onev1d_POST:
4381 case AArch64::LD1Onev2d_POST:
4382 case AArch64::LD1Onev2s_POST:
4383 case AArch64::LD1Onev4h_POST:
4384 case AArch64::LD1Onev4s_POST:
4385 case AArch64::LD1Onev8b_POST:
4386 case AArch64::LD1Onev8h_POST:
4387 case AArch64::LD1Rv16b_POST:
4388 case AArch64::LD1Rv1d_POST:
4389 case AArch64::LD1Rv2d_POST:
4390 case AArch64::LD1Rv2s_POST:
4391 case AArch64::LD1Rv4h_POST:
4392 case AArch64::LD1Rv4s_POST:
4393 case AArch64::LD1Rv8b_POST:
4394 case AArch64::LD1Rv8h_POST:
4395 case AArch64::LD1Threev16b_POST:
4396 case AArch64::LD1Threev1d_POST:
4397 case AArch64::LD1Threev2d_POST:
4398 case AArch64::LD1Threev2s_POST:
4399 case AArch64::LD1Threev4h_POST:
4400 case AArch64::LD1Threev4s_POST:
4401 case AArch64::LD1Threev8b_POST:
4402 case AArch64::LD1Threev8h_POST:
4403 case AArch64::LD1Twov16b_POST:
4404 case AArch64::LD1Twov1d_POST:
4405 case AArch64::LD1Twov2d_POST:
4406 case AArch64::LD1Twov2s_POST:
4407 case AArch64::LD1Twov4h_POST:
4408 case AArch64::LD1Twov4s_POST:
4409 case AArch64::LD1Twov8b_POST:
4410 case AArch64::LD1Twov8h_POST:
4411 case AArch64::LD1i16_POST:
4412 case AArch64::LD1i32_POST:
4413 case AArch64::LD1i64_POST:
4414 case AArch64::LD1i8_POST:
4415 case AArch64::LD2Rv16b_POST:
4416 case AArch64::LD2Rv1d_POST:
4417 case AArch64::LD2Rv2d_POST:
4418 case AArch64::LD2Rv2s_POST:
4419 case AArch64::LD2Rv4h_POST:
4420 case AArch64::LD2Rv4s_POST:
4421 case AArch64::LD2Rv8b_POST:
4422 case AArch64::LD2Rv8h_POST:
4423 case AArch64::LD2Twov16b_POST:
4424 case AArch64::LD2Twov2d_POST:
4425 case AArch64::LD2Twov2s_POST:
4426 case AArch64::LD2Twov4h_POST:
4427 case AArch64::LD2Twov4s_POST:
4428 case AArch64::LD2Twov8b_POST:
4429 case AArch64::LD2Twov8h_POST:
4430 case AArch64::LD2i16_POST:
4431 case AArch64::LD2i32_POST:
4432 case AArch64::LD2i64_POST:
4433 case AArch64::LD2i8_POST:
4434 case AArch64::LD3Rv16b_POST:
4435 case AArch64::LD3Rv1d_POST:
4436 case AArch64::LD3Rv2d_POST:
4437 case AArch64::LD3Rv2s_POST:
4438 case AArch64::LD3Rv4h_POST:
4439 case AArch64::LD3Rv4s_POST:
4440 case AArch64::LD3Rv8b_POST:
4441 case AArch64::LD3Rv8h_POST:
4442 case AArch64::LD3Threev16b_POST:
4443 case AArch64::LD3Threev2d_POST:
4444 case AArch64::LD3Threev2s_POST:
4445 case AArch64::LD3Threev4h_POST:
4446 case AArch64::LD3Threev4s_POST:
4447 case AArch64::LD3Threev8b_POST:
4448 case AArch64::LD3Threev8h_POST:
4449 case AArch64::LD3i16_POST:
4450 case AArch64::LD3i32_POST:
4451 case AArch64::LD3i64_POST:
4452 case AArch64::LD3i8_POST:
4453 case AArch64::LD4Fourv16b_POST:
4454 case AArch64::LD4Fourv2d_POST:
4455 case AArch64::LD4Fourv2s_POST:
4456 case AArch64::LD4Fourv4h_POST:
4457 case AArch64::LD4Fourv4s_POST:
4458 case AArch64::LD4Fourv8b_POST:
4459 case AArch64::LD4Fourv8h_POST:
4460 case AArch64::LD4Rv16b_POST:
4461 case AArch64::LD4Rv1d_POST:
4462 case AArch64::LD4Rv2d_POST:
4463 case AArch64::LD4Rv2s_POST:
4464 case AArch64::LD4Rv4h_POST:
4465 case AArch64::LD4Rv4s_POST:
4466 case AArch64::LD4Rv8b_POST:
4467 case AArch64::LD4Rv8h_POST:
4468 case AArch64::LD4i16_POST:
4469 case AArch64::LD4i32_POST:
4470 case AArch64::LD4i64_POST:
4471 case AArch64::LD4i8_POST:
4472 case AArch64::LDAPRWpost:
4473 case AArch64::LDAPRXpost:
4474 case AArch64::LDIAPPWpost:
4475 case AArch64::LDIAPPXpost:
4476 case AArch64::LDPDpost:
4477 case AArch64::LDPQpost:
4478 case AArch64::LDPSWpost:
4479 case AArch64::LDPSpost:
4480 case AArch64::LDPWpost:
4481 case AArch64::LDPXpost:
4482 case AArch64::LDRBBpost:
4483 case AArch64::LDRBpost:
4484 case AArch64::LDRDpost:
4485 case AArch64::LDRHHpost:
4486 case AArch64::LDRHpost:
4487 case AArch64::LDRQpost:
4488 case AArch64::LDRSBWpost:
4489 case AArch64::LDRSBXpost:
4490 case AArch64::LDRSHWpost:
4491 case AArch64::LDRSHXpost:
4492 case AArch64::LDRSWpost:
4493 case AArch64::LDRSpost:
4494 case AArch64::LDRWpost:
4495 case AArch64::LDRXpost:
4496 case AArch64::ST1Fourv16b_POST:
4497 case AArch64::ST1Fourv1d_POST:
4498 case AArch64::ST1Fourv2d_POST:
4499 case AArch64::ST1Fourv2s_POST:
4500 case AArch64::ST1Fourv4h_POST:
4501 case AArch64::ST1Fourv4s_POST:
4502 case AArch64::ST1Fourv8b_POST:
4503 case AArch64::ST1Fourv8h_POST:
4504 case AArch64::ST1Onev16b_POST:
4505 case AArch64::ST1Onev1d_POST:
4506 case AArch64::ST1Onev2d_POST:
4507 case AArch64::ST1Onev2s_POST:
4508 case AArch64::ST1Onev4h_POST:
4509 case AArch64::ST1Onev4s_POST:
4510 case AArch64::ST1Onev8b_POST:
4511 case AArch64::ST1Onev8h_POST:
4512 case AArch64::ST1Threev16b_POST:
4513 case AArch64::ST1Threev1d_POST:
4514 case AArch64::ST1Threev2d_POST:
4515 case AArch64::ST1Threev2s_POST:
4516 case AArch64::ST1Threev4h_POST:
4517 case AArch64::ST1Threev4s_POST:
4518 case AArch64::ST1Threev8b_POST:
4519 case AArch64::ST1Threev8h_POST:
4520 case AArch64::ST1Twov16b_POST:
4521 case AArch64::ST1Twov1d_POST:
4522 case AArch64::ST1Twov2d_POST:
4523 case AArch64::ST1Twov2s_POST:
4524 case AArch64::ST1Twov4h_POST:
4525 case AArch64::ST1Twov4s_POST:
4526 case AArch64::ST1Twov8b_POST:
4527 case AArch64::ST1Twov8h_POST:
4528 case AArch64::ST1i16_POST:
4529 case AArch64::ST1i32_POST:
4530 case AArch64::ST1i64_POST:
4531 case AArch64::ST1i8_POST:
4532 case AArch64::ST2GPostIndex:
4533 case AArch64::ST2Twov16b_POST:
4534 case AArch64::ST2Twov2d_POST:
4535 case AArch64::ST2Twov2s_POST:
4536 case AArch64::ST2Twov4h_POST:
4537 case AArch64::ST2Twov4s_POST:
4538 case AArch64::ST2Twov8b_POST:
4539 case AArch64::ST2Twov8h_POST:
4540 case AArch64::ST2i16_POST:
4541 case AArch64::ST2i32_POST:
4542 case AArch64::ST2i64_POST:
4543 case AArch64::ST2i8_POST:
4544 case AArch64::ST3Threev16b_POST:
4545 case AArch64::ST3Threev2d_POST:
4546 case AArch64::ST3Threev2s_POST:
4547 case AArch64::ST3Threev4h_POST:
4548 case AArch64::ST3Threev4s_POST:
4549 case AArch64::ST3Threev8b_POST:
4550 case AArch64::ST3Threev8h_POST:
4551 case AArch64::ST3i16_POST:
4552 case AArch64::ST3i32_POST:
4553 case AArch64::ST3i64_POST:
4554 case AArch64::ST3i8_POST:
4555 case AArch64::ST4Fourv16b_POST:
4556 case AArch64::ST4Fourv2d_POST:
4557 case AArch64::ST4Fourv2s_POST:
4558 case AArch64::ST4Fourv4h_POST:
4559 case AArch64::ST4Fourv4s_POST:
4560 case AArch64::ST4Fourv8b_POST:
4561 case AArch64::ST4Fourv8h_POST:
4562 case AArch64::ST4i16_POST:
4563 case AArch64::ST4i32_POST:
4564 case AArch64::ST4i64_POST:
4565 case AArch64::ST4i8_POST:
4566 case AArch64::STGPostIndex:
4567 case AArch64::STGPpost:
4568 case AArch64::STPDpost:
4569 case AArch64::STPQpost:
4570 case AArch64::STPSpost:
4571 case AArch64::STPWpost:
4572 case AArch64::STPXpost:
4573 case AArch64::STRBBpost:
4574 case AArch64::STRBpost:
4575 case AArch64::STRDpost:
4576 case AArch64::STRHHpost:
4577 case AArch64::STRHpost:
4578 case AArch64::STRQpost:
4579 case AArch64::STRSpost:
4580 case AArch64::STRWpost:
4581 case AArch64::STRXpost:
4582 case AArch64::STZ2GPostIndex:
4583 case AArch64::STZGPostIndex:
4590 bool &OffsetIsScalable,
TypeSize &Width,
4611 int64_t Dummy1, Dummy2;
4633 return BaseOp->
isReg() || BaseOp->
isFI();
4640 assert(OfsOp.
isImm() &&
"Offset operand wasn't immediate.");
4645 TypeSize &Width, int64_t &MinOffset,
4646 int64_t &MaxOffset) {
4651 MinOffset = MaxOffset = 0;
4654 case AArch64::LDRQui:
4655 case AArch64::STRQui:
4660 case AArch64::LDRXui:
4661 case AArch64::LDRDui:
4662 case AArch64::STRXui:
4663 case AArch64::STRDui:
4664 case AArch64::PRFMui:
4669 case AArch64::LDRWui:
4670 case AArch64::LDRSui:
4671 case AArch64::LDRSWui:
4672 case AArch64::STRWui:
4673 case AArch64::STRSui:
4678 case AArch64::LDRHui:
4679 case AArch64::LDRHHui:
4680 case AArch64::LDRSHWui:
4681 case AArch64::LDRSHXui:
4682 case AArch64::STRHui:
4683 case AArch64::STRHHui:
4688 case AArch64::LDRBui:
4689 case AArch64::LDRBBui:
4690 case AArch64::LDRSBWui:
4691 case AArch64::LDRSBXui:
4692 case AArch64::STRBui:
4693 case AArch64::STRBBui:
4699 case AArch64::STRQpre:
4700 case AArch64::LDRQpost:
4706 case AArch64::LDRDpost:
4707 case AArch64::LDRDpre:
4708 case AArch64::LDRXpost:
4709 case AArch64::LDRXpre:
4710 case AArch64::STRDpost:
4711 case AArch64::STRDpre:
4712 case AArch64::STRXpost:
4713 case AArch64::STRXpre:
4719 case AArch64::STRWpost:
4720 case AArch64::STRWpre:
4721 case AArch64::LDRWpost:
4722 case AArch64::LDRWpre:
4723 case AArch64::STRSpost:
4724 case AArch64::STRSpre:
4725 case AArch64::LDRSpost:
4726 case AArch64::LDRSpre:
4732 case AArch64::LDRHpost:
4733 case AArch64::LDRHpre:
4734 case AArch64::STRHpost:
4735 case AArch64::STRHpre:
4736 case AArch64::LDRHHpost:
4737 case AArch64::LDRHHpre:
4738 case AArch64::STRHHpost:
4739 case AArch64::STRHHpre:
4745 case AArch64::LDRBpost:
4746 case AArch64::LDRBpre:
4747 case AArch64::STRBpost:
4748 case AArch64::STRBpre:
4749 case AArch64::LDRBBpost:
4750 case AArch64::LDRBBpre:
4751 case AArch64::STRBBpost:
4752 case AArch64::STRBBpre:
4758 case AArch64::LDURQi:
4759 case AArch64::STURQi:
4765 case AArch64::LDURXi:
4766 case AArch64::LDURDi:
4767 case AArch64::LDAPURXi:
4768 case AArch64::STURXi:
4769 case AArch64::STURDi:
4770 case AArch64::STLURXi:
4771 case AArch64::PRFUMi:
4777 case AArch64::LDURWi:
4778 case AArch64::LDURSi:
4779 case AArch64::LDURSWi:
4780 case AArch64::LDAPURi:
4781 case AArch64::LDAPURSWi:
4782 case AArch64::STURWi:
4783 case AArch64::STURSi:
4784 case AArch64::STLURWi:
4790 case AArch64::LDURHi:
4791 case AArch64::LDURHHi:
4792 case AArch64::LDURSHXi:
4793 case AArch64::LDURSHWi:
4794 case AArch64::LDAPURHi:
4795 case AArch64::LDAPURSHWi:
4796 case AArch64::LDAPURSHXi:
4797 case AArch64::STURHi:
4798 case AArch64::STURHHi:
4799 case AArch64::STLURHi:
4805 case AArch64::LDURBi:
4806 case AArch64::LDURBBi:
4807 case AArch64::LDURSBXi:
4808 case AArch64::LDURSBWi:
4809 case AArch64::LDAPURBi:
4810 case AArch64::LDAPURSBWi:
4811 case AArch64::LDAPURSBXi:
4812 case AArch64::STURBi:
4813 case AArch64::STURBBi:
4814 case AArch64::STLURBi:
4820 case AArch64::LDPQi:
4821 case AArch64::LDNPQi:
4822 case AArch64::STPQi:
4823 case AArch64::STNPQi:
4824 case AArch64::LDPQpost:
4825 case AArch64::LDPQpre:
4826 case AArch64::STPQpost:
4827 case AArch64::STPQpre:
4833 case AArch64::LDPXi:
4834 case AArch64::LDPDi:
4835 case AArch64::LDNPXi:
4836 case AArch64::LDNPDi:
4837 case AArch64::STPXi:
4838 case AArch64::STPDi:
4839 case AArch64::STNPXi:
4840 case AArch64::STNPDi:
4841 case AArch64::LDPDpost:
4842 case AArch64::LDPDpre:
4843 case AArch64::LDPXpost:
4844 case AArch64::LDPXpre:
4845 case AArch64::STPDpost:
4846 case AArch64::STPDpre:
4847 case AArch64::STPXpost:
4848 case AArch64::STPXpre:
4854 case AArch64::LDPWi:
4855 case AArch64::LDPSi:
4856 case AArch64::LDNPWi:
4857 case AArch64::LDNPSi:
4858 case AArch64::STPWi:
4859 case AArch64::STPSi:
4860 case AArch64::STNPWi:
4861 case AArch64::STNPSi:
4862 case AArch64::LDPSpost:
4863 case AArch64::LDPSpre:
4864 case AArch64::LDPWpost:
4865 case AArch64::LDPWpre:
4866 case AArch64::STPSpost:
4867 case AArch64::STPSpre:
4868 case AArch64::STPWpost:
4869 case AArch64::STPWpre:
4875 case AArch64::StoreSwiftAsyncContext:
4888 case AArch64::TAGPstack:
4898 case AArch64::STGPreIndex:
4899 case AArch64::STGPostIndex:
4900 case AArch64::STZGi:
4901 case AArch64::STZGPreIndex:
4902 case AArch64::STZGPostIndex:
4908 case AArch64::STR_ZZZZXI:
4909 case AArch64::STR_ZZZZXI_STRIDED_CONTIGUOUS:
4910 case AArch64::LDR_ZZZZXI:
4911 case AArch64::LDR_ZZZZXI_STRIDED_CONTIGUOUS:
4917 case AArch64::STR_ZZZXI:
4918 case AArch64::LDR_ZZZXI:
4924 case AArch64::STR_ZZXI:
4925 case AArch64::STR_ZZXI_STRIDED_CONTIGUOUS:
4926 case AArch64::LDR_ZZXI:
4927 case AArch64::LDR_ZZXI_STRIDED_CONTIGUOUS:
4933 case AArch64::LDR_PXI:
4934 case AArch64::STR_PXI:
4939 case AArch64::LDR_PPXI:
4940 case AArch64::STR_PPXI:
4946 case AArch64::LDR_ZXI:
4947 case AArch64::STR_ZXI:
4952 case AArch64::LD1B_IMM:
4953 case AArch64::LD1H_IMM:
4954 case AArch64::LD1W_IMM:
4955 case AArch64::LD1D_IMM:
4956 case AArch64::LDNT1B_ZRI:
4957 case AArch64::LDNT1H_ZRI:
4958 case AArch64::LDNT1W_ZRI:
4959 case AArch64::LDNT1D_ZRI:
4960 case AArch64::ST1B_IMM:
4961 case AArch64::ST1H_IMM:
4962 case AArch64::ST1W_IMM:
4963 case AArch64::ST1D_IMM:
4964 case AArch64::STNT1B_ZRI:
4965 case AArch64::STNT1H_ZRI:
4966 case AArch64::STNT1W_ZRI:
4967 case AArch64::STNT1D_ZRI:
4968 case AArch64::LDNF1B_IMM:
4969 case AArch64::LDNF1H_IMM:
4970 case AArch64::LDNF1W_IMM:
4971 case AArch64::LDNF1D_IMM:
4978 case AArch64::LD2B_IMM:
4979 case AArch64::LD2H_IMM:
4980 case AArch64::LD2W_IMM:
4981 case AArch64::LD2D_IMM:
4982 case AArch64::ST2B_IMM:
4983 case AArch64::ST2H_IMM:
4984 case AArch64::ST2W_IMM:
4985 case AArch64::ST2D_IMM:
4986 case AArch64::LD1B_2Z_IMM:
4987 case AArch64::LD1B_2Z_STRIDED_IMM:
4988 case AArch64::LD1H_2Z_IMM:
4989 case AArch64::LD1H_2Z_STRIDED_IMM:
4990 case AArch64::LD1W_2Z_IMM:
4991 case AArch64::LD1W_2Z_STRIDED_IMM:
4992 case AArch64::LD1D_2Z_IMM:
4993 case AArch64::LD1D_2Z_STRIDED_IMM:
4994 case AArch64::LD1B_2Z_IMM_PSEUDO:
4995 case AArch64::LD1H_2Z_IMM_PSEUDO:
4996 case AArch64::LD1W_2Z_IMM_PSEUDO:
4997 case AArch64::LD1D_2Z_IMM_PSEUDO:
4998 case AArch64::ST1B_2Z_IMM:
4999 case AArch64::ST1B_2Z_STRIDED_IMM:
5000 case AArch64::ST1H_2Z_IMM:
5001 case AArch64::ST1H_2Z_STRIDED_IMM:
5002 case AArch64::ST1W_2Z_IMM:
5003 case AArch64::ST1W_2Z_STRIDED_IMM:
5004 case AArch64::ST1D_2Z_IMM:
5005 case AArch64::ST1D_2Z_STRIDED_IMM:
5006 case AArch64::LDNT1B_2Z_IMM_PSEUDO:
5007 case AArch64::LDNT1B_2Z_IMM:
5008 case AArch64::LDNT1B_2Z_STRIDED_IMM:
5009 case AArch64::LDNT1H_2Z_IMM_PSEUDO:
5010 case AArch64::LDNT1H_2Z_IMM:
5011 case AArch64::LDNT1H_2Z_STRIDED_IMM:
5012 case AArch64::LDNT1W_2Z_IMM_PSEUDO:
5013 case AArch64::LDNT1W_2Z_IMM:
5014 case AArch64::LDNT1W_2Z_STRIDED_IMM:
5015 case AArch64::LDNT1D_2Z_IMM_PSEUDO:
5016 case AArch64::LDNT1D_2Z_IMM:
5017 case AArch64::LDNT1D_2Z_STRIDED_IMM:
5018 case AArch64::STNT1B_2Z_IMM:
5019 case AArch64::STNT1B_2Z_STRIDED_IMM:
5020 case AArch64::STNT1H_2Z_IMM:
5021 case AArch64::STNT1H_2Z_STRIDED_IMM:
5022 case AArch64::STNT1W_2Z_IMM:
5023 case AArch64::STNT1W_2Z_STRIDED_IMM:
5024 case AArch64::STNT1D_2Z_IMM:
5025 case AArch64::STNT1D_2Z_STRIDED_IMM:
5030 case AArch64::LD3B_IMM:
5031 case AArch64::LD3H_IMM:
5032 case AArch64::LD3W_IMM:
5033 case AArch64::LD3D_IMM:
5034 case AArch64::ST3B_IMM:
5035 case AArch64::ST3H_IMM:
5036 case AArch64::ST3W_IMM:
5037 case AArch64::ST3D_IMM:
5042 case AArch64::LD4B_IMM:
5043 case AArch64::LD4H_IMM:
5044 case AArch64::LD4W_IMM:
5045 case AArch64::LD4D_IMM:
5046 case AArch64::ST4B_IMM:
5047 case AArch64::ST4H_IMM:
5048 case AArch64::ST4W_IMM:
5049 case AArch64::ST4D_IMM:
5050 case AArch64::LD1B_4Z_IMM:
5051 case AArch64::LD1B_4Z_STRIDED_IMM:
5052 case AArch64::LD1H_4Z_IMM:
5053 case AArch64::LD1H_4Z_STRIDED_IMM:
5054 case AArch64::LD1W_4Z_IMM:
5055 case AArch64::LD1W_4Z_STRIDED_IMM:
5056 case AArch64::LD1D_4Z_IMM:
5057 case AArch64::LD1D_4Z_STRIDED_IMM:
5058 case AArch64::LD1B_4Z_IMM_PSEUDO:
5059 case AArch64::LD1H_4Z_IMM_PSEUDO:
5060 case AArch64::LD1W_4Z_IMM_PSEUDO:
5061 case AArch64::LD1D_4Z_IMM_PSEUDO:
5062 case AArch64::ST1B_4Z_IMM:
5063 case AArch64::ST1B_4Z_STRIDED_IMM:
5064 case AArch64::ST1H_4Z_IMM:
5065 case AArch64::ST1H_4Z_STRIDED_IMM:
5066 case AArch64::ST1W_4Z_IMM:
5067 case AArch64::ST1W_4Z_STRIDED_IMM:
5068 case AArch64::ST1D_4Z_IMM:
5069 case AArch64::ST1D_4Z_STRIDED_IMM:
5070 case AArch64::LDNT1B_4Z_IMM_PSEUDO:
5071 case AArch64::LDNT1B_4Z_IMM:
5072 case AArch64::LDNT1B_4Z_STRIDED_IMM:
5073 case AArch64::LDNT1H_4Z_IMM_PSEUDO:
5074 case AArch64::LDNT1H_4Z_IMM:
5075 case AArch64::LDNT1H_4Z_STRIDED_IMM:
5076 case AArch64::LDNT1W_4Z_IMM_PSEUDO:
5077 case AArch64::LDNT1W_4Z_IMM:
5078 case AArch64::LDNT1W_4Z_STRIDED_IMM:
5079 case AArch64::LDNT1D_4Z_IMM_PSEUDO:
5080 case AArch64::LDNT1D_4Z_IMM:
5081 case AArch64::LDNT1D_4Z_STRIDED_IMM:
5082 case AArch64::STNT1B_4Z_IMM:
5083 case AArch64::STNT1B_4Z_STRIDED_IMM:
5084 case AArch64::STNT1H_4Z_IMM:
5085 case AArch64::STNT1H_4Z_STRIDED_IMM:
5086 case AArch64::STNT1W_4Z_IMM:
5087 case AArch64::STNT1W_4Z_STRIDED_IMM:
5088 case AArch64::STNT1D_4Z_IMM:
5089 case AArch64::STNT1D_4Z_STRIDED_IMM:
5094 case AArch64::LD1B_H_IMM:
5095 case AArch64::LD1SB_H_IMM:
5096 case AArch64::LD1H_S_IMM:
5097 case AArch64::LD1SH_S_IMM:
5098 case AArch64::LD1W_D_IMM:
5099 case AArch64::LD1SW_D_IMM:
5100 case AArch64::ST1B_H_IMM:
5101 case AArch64::ST1H_S_IMM:
5102 case AArch64::ST1W_D_IMM:
5103 case AArch64::LDNF1B_H_IMM:
5104 case AArch64::LDNF1SB_H_IMM:
5105 case AArch64::LDNF1H_S_IMM:
5106 case AArch64::LDNF1SH_S_IMM:
5107 case AArch64::LDNF1W_D_IMM:
5108 case AArch64::LDNF1SW_D_IMM:
5115 case AArch64::LD1B_S_IMM:
5116 case AArch64::LD1SB_S_IMM:
5117 case AArch64::LD1H_D_IMM:
5118 case AArch64::LD1SH_D_IMM:
5119 case AArch64::ST1B_S_IMM:
5120 case AArch64::ST1H_D_IMM:
5121 case AArch64::LDNF1B_S_IMM:
5122 case AArch64::LDNF1SB_S_IMM:
5123 case AArch64::LDNF1H_D_IMM:
5124 case AArch64::LDNF1SH_D_IMM:
5131 case AArch64::LD1B_D_IMM:
5132 case AArch64::LD1SB_D_IMM:
5133 case AArch64::ST1B_D_IMM:
5134 case AArch64::LDNF1B_D_IMM:
5135 case AArch64::LDNF1SB_D_IMM:
5142 case AArch64::ST2Gi:
5143 case AArch64::ST2GPreIndex:
5144 case AArch64::ST2GPostIndex:
5145 case AArch64::STZ2Gi:
5146 case AArch64::STZ2GPreIndex:
5147 case AArch64::STZ2GPostIndex:
5153 case AArch64::STGPi:
5154 case AArch64::STGPpost:
5155 case AArch64::STGPpre:
5160 case AArch64::LD1RB_IMM:
5161 case AArch64::LD1RB_H_IMM:
5162 case AArch64::LD1RB_S_IMM:
5163 case AArch64::LD1RB_D_IMM:
5164 case AArch64::LD1RSB_H_IMM:
5165 case AArch64::LD1RSB_S_IMM:
5166 case AArch64::LD1RSB_D_IMM:
5171 case AArch64::LD1RH_IMM:
5172 case AArch64::LD1RH_S_IMM:
5173 case AArch64::LD1RH_D_IMM:
5174 case AArch64::LD1RSH_S_IMM:
5175 case AArch64::LD1RSH_D_IMM:
5180 case AArch64::LD1RW_IMM:
5181 case AArch64::LD1RW_D_IMM:
5182 case AArch64::LD1RSW_IMM:
5187 case AArch64::LD1RD_IMM:
5202 case AArch64::LDRBui:
5203 case AArch64::LDRBBui:
5204 case AArch64::LDURBBi:
5205 case AArch64::LDRSBWui:
5206 case AArch64::LDURSBWi:
5207 case AArch64::STRBui:
5208 case AArch64::STRBBui:
5209 case AArch64::STURBBi:
5211 case AArch64::LDRHui:
5212 case AArch64::LDRHHui:
5213 case AArch64::LDURHHi:
5214 case AArch64::LDRSHWui:
5215 case AArch64::LDURSHWi:
5216 case AArch64::STRHui:
5217 case AArch64::STRHHui:
5218 case AArch64::STURHHi:
5220 case AArch64::LDRSui:
5221 case AArch64::LDURSi:
5222 case AArch64::LDRSpre:
5223 case AArch64::LDRSWui:
5224 case AArch64::LDURSWi:
5225 case AArch64::LDRSWpre:
5226 case AArch64::LDRWpre:
5227 case AArch64::LDRWui:
5228 case AArch64::LDURWi:
5229 case AArch64::STRSui:
5230 case AArch64::STURSi:
5231 case AArch64::STRSpre:
5232 case AArch64::STRWui:
5233 case AArch64::STURWi:
5234 case AArch64::STRWpre:
5235 case AArch64::LDPSi:
5236 case AArch64::LDPSWi:
5237 case AArch64::LDPWi:
5238 case AArch64::STPSi:
5239 case AArch64::STPWi:
5241 case AArch64::LDRDui:
5242 case AArch64::LDURDi:
5243 case AArch64::LDRDpre:
5244 case AArch64::LDRXui:
5245 case AArch64::LDURXi:
5246 case AArch64::LDRXpre:
5247 case AArch64::STRDui:
5248 case AArch64::STURDi:
5249 case AArch64::STRDpre:
5250 case AArch64::STRXui:
5251 case AArch64::STURXi:
5252 case AArch64::STRXpre:
5253 case AArch64::LDPDi:
5254 case AArch64::LDPXi:
5255 case AArch64::STPDi:
5256 case AArch64::STPXi:
5258 case AArch64::LDRQui:
5259 case AArch64::LDURQi:
5260 case AArch64::STRQui:
5261 case AArch64::STURQi:
5262 case AArch64::STRQpre:
5263 case AArch64::LDPQi:
5264 case AArch64::LDRQpre:
5265 case AArch64::STPQi:
5267 case AArch64::STZGi:
5268 case AArch64::ST2Gi:
5269 case AArch64::STZ2Gi:
5270 case AArch64::STGPi:
5276 switch (
MI.getOpcode()) {
5279 case AArch64::LDRWpre:
5280 case AArch64::LDRXpre:
5281 case AArch64::LDRSWpre:
5282 case AArch64::LDRSpre:
5283 case AArch64::LDRDpre:
5284 case AArch64::LDRQpre:
5290 switch (
MI.getOpcode()) {
5293 case AArch64::STRWpre:
5294 case AArch64::STRXpre:
5295 case AArch64::STRSpre:
5296 case AArch64::STRDpre:
5297 case AArch64::STRQpre:
5307 switch (
MI.getOpcode()) {
5310 case AArch64::LDURBBi:
5311 case AArch64::LDURHHi:
5312 case AArch64::LDURWi:
5313 case AArch64::LDRBBui:
5314 case AArch64::LDRHHui:
5315 case AArch64::LDRWui:
5316 case AArch64::LDRBBroX:
5317 case AArch64::LDRHHroX:
5318 case AArch64::LDRWroX:
5319 case AArch64::LDRBBroW:
5320 case AArch64::LDRHHroW:
5321 case AArch64::LDRWroW:
5327 switch (
MI.getOpcode()) {
5330 case AArch64::LDURSBWi:
5331 case AArch64::LDURSHWi:
5332 case AArch64::LDURSBXi:
5333 case AArch64::LDURSHXi:
5334 case AArch64::LDURSWi:
5335 case AArch64::LDRSBWui:
5336 case AArch64::LDRSHWui:
5337 case AArch64::LDRSBXui:
5338 case AArch64::LDRSHXui:
5339 case AArch64::LDRSWui:
5340 case AArch64::LDRSBWroX:
5341 case AArch64::LDRSHWroX:
5342 case AArch64::LDRSBXroX:
5343 case AArch64::LDRSHXroX:
5344 case AArch64::LDRSWroX:
5345 case AArch64::LDRSBWroW:
5346 case AArch64::LDRSHWroW:
5347 case AArch64::LDRSBXroW:
5348 case AArch64::LDRSHXroW:
5349 case AArch64::LDRSWroW:
5355 switch (
MI.getOpcode()) {
5358 case AArch64::LDPSi:
5359 case AArch64::LDPSWi:
5360 case AArch64::LDPDi:
5361 case AArch64::LDPQi:
5362 case AArch64::LDPWi:
5363 case AArch64::LDPXi:
5364 case AArch64::STPSi:
5365 case AArch64::STPDi:
5366 case AArch64::STPQi:
5367 case AArch64::STPWi:
5368 case AArch64::STPXi:
5369 case AArch64::STGPi:
5375 assert(
MI.mayLoadOrStore() &&
"Load or store instruction expected");
5379 return MI.getOperand(Idx);
5384 assert(
MI.mayLoadOrStore() &&
"Load or store instruction expected");
5388 return MI.getOperand(Idx);
5393 switch (
MI.getOpcode()) {
5396 case AArch64::LDRBroX:
5397 case AArch64::LDRBBroX:
5398 case AArch64::LDRSBXroX:
5399 case AArch64::LDRSBWroX:
5400 case AArch64::LDRHroX:
5401 case AArch64::LDRHHroX:
5402 case AArch64::LDRSHXroX:
5403 case AArch64::LDRSHWroX:
5404 case AArch64::LDRWroX:
5405 case AArch64::LDRSroX:
5406 case AArch64::LDRSWroX:
5407 case AArch64::LDRDroX:
5408 case AArch64::LDRXroX:
5409 case AArch64::LDRQroX:
5410 return MI.getOperand(4);
5416 if (
MI.getParent() ==
nullptr)
5426 auto Reg =
Op.getReg();
5427 if (Reg.isPhysical())
5428 return AArch64::FPR16RegClass.contains(Reg);
5430 return TRC == &AArch64::FPR16RegClass ||
5431 TRC == &AArch64::FPR16_loRegClass;
5440 auto Reg =
Op.getReg();
5441 if (Reg.isPhysical())
5442 return AArch64::FPR128RegClass.contains(Reg);
5444 return TRC == &AArch64::FPR128RegClass ||
5445 TRC == &AArch64::FPR128_loRegClass;
5451 switch (
MI.getOpcode()) {
5454 case AArch64::PACIASP:
5455 case AArch64::PACIBSP:
5458 case AArch64::PAUTH_PROLOGUE:
5461 case AArch64::HINT: {
5462 unsigned Imm =
MI.getOperand(0).getImm();
5464 if (Imm == 32 || Imm == 34 || Imm == 36 || Imm == 38)
5467 if (Imm == 25 || Imm == 27)
5479 assert(Reg.isPhysical() &&
"Expected physical register in isFpOrNEON");
5480 return AArch64::FPR128RegClass.contains(Reg) ||
5481 AArch64::FPR64RegClass.contains(Reg) ||
5482 AArch64::FPR32RegClass.contains(Reg) ||
5483 AArch64::FPR16RegClass.contains(Reg) ||
5484 AArch64::FPR8RegClass.contains(Reg);
5491 auto Reg =
Op.getReg();
5492 if (Reg.isPhysical())
5496 return TRC == &AArch64::FPR128RegClass ||
5497 TRC == &AArch64::FPR128_loRegClass ||
5498 TRC == &AArch64::FPR64RegClass ||
5499 TRC == &AArch64::FPR64_loRegClass ||
5500 TRC == &AArch64::FPR32RegClass || TRC == &AArch64::FPR16RegClass ||
5501 TRC == &AArch64::FPR8RegClass;
5523 if (FirstOpc == SecondOpc)
5529 case AArch64::STRSui:
5530 case AArch64::STURSi:
5531 return SecondOpc == AArch64::STRSui || SecondOpc == AArch64::STURSi;
5532 case AArch64::STRDui:
5533 case AArch64::STURDi:
5534 return SecondOpc == AArch64::STRDui || SecondOpc == AArch64::STURDi;
5535 case AArch64::STRQui:
5536 case AArch64::STURQi:
5537 return SecondOpc == AArch64::STRQui || SecondOpc == AArch64::STURQi;
5538 case AArch64::STRWui:
5539 case AArch64::STURWi:
5540 return SecondOpc == AArch64::STRWui || SecondOpc == AArch64::STURWi;
5541 case AArch64::STRXui:
5542 case AArch64::STURXi:
5543 return SecondOpc == AArch64::STRXui || SecondOpc == AArch64::STURXi;
5544 case AArch64::LDRSui:
5545 case AArch64::LDURSi:
5546 return SecondOpc == AArch64::LDRSui || SecondOpc == AArch64::LDURSi;
5547 case AArch64::LDRDui:
5548 case AArch64::LDURDi:
5549 return SecondOpc == AArch64::LDRDui || SecondOpc == AArch64::LDURDi;
5550 case AArch64::LDRQui:
5551 case AArch64::LDURQi:
5552 return SecondOpc == AArch64::LDRQui || SecondOpc == AArch64::LDURQi;
5553 case AArch64::LDRWui:
5554 case AArch64::LDURWi:
5555 return SecondOpc == AArch64::LDRSWui || SecondOpc == AArch64::LDURSWi;
5556 case AArch64::LDRSWui:
5557 case AArch64::LDURSWi:
5558 return SecondOpc == AArch64::LDRWui || SecondOpc == AArch64::LDURWi;
5559 case AArch64::LDRXui:
5560 case AArch64::LDURXi:
5561 return SecondOpc == AArch64::LDRXui || SecondOpc == AArch64::LDURXi;
5568 int64_t Offset1,
unsigned Opcode1,
int FI2,
5569 int64_t Offset2,
unsigned Opcode2) {
5575 assert(ObjectOffset1 <= ObjectOffset2 &&
"Object offsets are not ordered.");
5578 if (ObjectOffset1 % Scale1 != 0)
5580 ObjectOffset1 /= Scale1;
5582 if (ObjectOffset2 % Scale2 != 0)
5584 ObjectOffset2 /= Scale2;
5585 ObjectOffset1 += Offset1;
5586 ObjectOffset2 += Offset2;
5587 return ObjectOffset1 + 1 == ObjectOffset2;
5599 int64_t OpOffset2,
bool OffsetIsScalable2,
unsigned ClusterSize,
5600 unsigned NumBytes)
const {
5610 "Only base registers and frame indices are supported.");
5617 if (ClusterSize > 2)
5624 unsigned FirstOpc = FirstLdSt.
getOpcode();
5625 unsigned SecondOpc = SecondLdSt.
getOpcode();
5645 if (Offset1 > 63 || Offset1 < -64)
5650 if (BaseOp1.
isFI()) {
5652 "Caller should have ordered offsets.");
5657 BaseOp2.
getIndex(), Offset2, SecondOpc);
5660 assert(Offset1 <= Offset2 &&
"Caller should have ordered offsets.");
5662 return Offset1 + 1 == Offset2;
5672 if (
Reg.isPhysical())
5681 return ((DestReg - SrcReg) & 0x1f) < NumRegs;
5690 assert(Subtarget.hasNEON() &&
"Unexpected register copy without NEON");
5692 uint16_t DestEncoding =
TRI->getEncodingValue(DestReg);
5693 uint16_t SrcEncoding =
TRI->getEncodingValue(SrcReg);
5694 unsigned NumRegs = Indices.
size();
5696 int SubReg = 0, End = NumRegs, Incr = 1;
5698 SubReg = NumRegs - 1;
5703 for (; SubReg != End; SubReg += Incr) {
5715 unsigned Opcode,
unsigned ZeroReg,
5718 unsigned NumRegs = Indices.
size();
5721 uint16_t DestEncoding =
TRI->getEncodingValue(DestReg);
5722 uint16_t SrcEncoding =
TRI->getEncodingValue(SrcReg);
5723 assert(DestEncoding % NumRegs == 0 && SrcEncoding % NumRegs == 0 &&
5724 "GPR reg sequences should not be able to overlap");
5727 for (
unsigned SubReg = 0; SubReg != NumRegs; ++SubReg) {
5748 unsigned Opc =
MI.getOpcode();
5749 if (
Opc == AArch64::MSRpstatesvcrImm1 ||
Opc == AArch64::MSRpstatePseudo) {
5751 int64_t PState =
MI.getOperand(0).getImm();
5752 if (PState == AArch64SVCR::SVCRSM || PState == AArch64SVCR::SVCRSMZA) {
5754 return MI.getOperand(1).getImm() == 1;
5773 bool RenamableSrc)
const {
5775 if (AArch64::GPR32spRegClass.
contains(DestReg) &&
5776 AArch64::GPR32spRegClass.
contains(SrcReg)) {
5777 if (DestReg == AArch64::WSP || SrcReg == AArch64::WSP) {
5779 if (Subtarget.hasZeroCycleRegMoveGPR64() &&
5780 !Subtarget.hasZeroCycleRegMoveGPR32()) {
5782 MCRegister DestRegX = RI.getMatchingSuperReg(DestReg, AArch64::sub_32,
5783 &AArch64::GPR64spRegClass);
5784 MCRegister SrcRegX = RI.getMatchingSuperReg(SrcReg, AArch64::sub_32,
5785 &AArch64::GPR64spRegClass);
5795 ++NumZCRegMoveInstrsGPR;
5801 if (Subtarget.hasZeroCycleRegMoveGPR32())
5802 ++NumZCRegMoveInstrsGPR;
5804 }
else if (Subtarget.hasZeroCycleRegMoveGPR64() &&
5805 !Subtarget.hasZeroCycleRegMoveGPR32()) {
5807 MCRegister DestRegX = RI.getMatchingSuperReg(DestReg, AArch64::sub_32,
5808 &AArch64::GPR64spRegClass);
5809 assert(DestRegX.
isValid() &&
"Destination super-reg not valid");
5810 MCRegister SrcRegX = RI.getMatchingSuperReg(SrcReg, AArch64::sub_32,
5811 &AArch64::GPR64spRegClass);
5821 ++NumZCRegMoveInstrsGPR;
5827 if (Subtarget.hasZeroCycleRegMoveGPR32())
5828 ++NumZCRegMoveInstrsGPR;
5834 if (AArch64::GPR32spRegClass.
contains(DestReg) && SrcReg == AArch64::WZR) {
5835 if (Subtarget.hasZeroCycleZeroingGPR64() &&
5836 !Subtarget.hasZeroCycleZeroingGPR32()) {
5837 MCRegister DestRegX = RI.getMatchingSuperReg(DestReg, AArch64::sub_32,
5838 &AArch64::GPR64spRegClass);
5839 assert(DestRegX.
isValid() &&
"Destination super-reg not valid");
5843 ++NumZCZeroingInstrsGPR;
5844 }
else if (Subtarget.hasZeroCycleZeroingGPR32()) {
5848 ++NumZCZeroingInstrsGPR;
5857 if (AArch64::GPR64spRegClass.
contains(DestReg) &&
5858 AArch64::GPR64spRegClass.
contains(SrcReg)) {
5859 if (DestReg == AArch64::SP || SrcReg == AArch64::SP) {
5865 if (Subtarget.hasZeroCycleRegMoveGPR64())
5866 ++NumZCRegMoveInstrsGPR;
5872 if (Subtarget.hasZeroCycleRegMoveGPR64())
5873 ++NumZCRegMoveInstrsGPR;
5879 if (AArch64::GPR64spRegClass.
contains(DestReg) && SrcReg == AArch64::XZR) {
5880 if (Subtarget.hasZeroCycleZeroingGPR64()) {
5884 ++NumZCZeroingInstrsGPR;
5894 if (AArch64::PPRRegClass.
contains(DestReg) &&
5895 AArch64::PPRRegClass.
contains(SrcReg)) {
5896 assert(Subtarget.isSVEorStreamingSVEAvailable() &&
5897 "Unexpected SVE register.");
5907 bool DestIsPNR = AArch64::PNRRegClass.contains(DestReg);
5908 bool SrcIsPNR = AArch64::PNRRegClass.contains(SrcReg);
5909 if (DestIsPNR || SrcIsPNR) {
5911 return (R - AArch64::PN0) + AArch64::P0;
5916 if (PPRSrcReg != PPRDestReg) {
5928 if (AArch64::ZPRRegClass.
contains(DestReg) &&
5929 AArch64::ZPRRegClass.
contains(SrcReg)) {
5930 assert(Subtarget.isSVEorStreamingSVEAvailable() &&
5931 "Unexpected SVE register.");
5939 if ((AArch64::ZPR2RegClass.
contains(DestReg) ||
5940 AArch64::ZPR2StridedOrContiguousRegClass.
contains(DestReg)) &&
5941 (AArch64::ZPR2RegClass.
contains(SrcReg) ||
5942 AArch64::ZPR2StridedOrContiguousRegClass.
contains(SrcReg))) {
5943 assert(Subtarget.isSVEorStreamingSVEAvailable() &&
5944 "Unexpected SVE register.");
5945 static const unsigned Indices[] = {AArch64::zsub0, AArch64::zsub1};
5952 if (AArch64::ZPR3RegClass.
contains(DestReg) &&
5953 AArch64::ZPR3RegClass.
contains(SrcReg)) {
5954 assert(Subtarget.isSVEorStreamingSVEAvailable() &&
5955 "Unexpected SVE register.");
5956 static const unsigned Indices[] = {AArch64::zsub0, AArch64::zsub1,
5964 if ((AArch64::ZPR4RegClass.
contains(DestReg) ||
5965 AArch64::ZPR4StridedOrContiguousRegClass.
contains(DestReg)) &&
5966 (AArch64::ZPR4RegClass.
contains(SrcReg) ||
5967 AArch64::ZPR4StridedOrContiguousRegClass.
contains(SrcReg))) {
5968 assert(Subtarget.isSVEorStreamingSVEAvailable() &&
5969 "Unexpected SVE register.");
5970 static const unsigned Indices[] = {AArch64::zsub0, AArch64::zsub1,
5971 AArch64::zsub2, AArch64::zsub3};
5978 if (AArch64::DDDDRegClass.
contains(DestReg) &&
5979 AArch64::DDDDRegClass.
contains(SrcReg)) {
5980 static const unsigned Indices[] = {AArch64::dsub0, AArch64::dsub1,
5981 AArch64::dsub2, AArch64::dsub3};
5988 if (AArch64::DDDRegClass.
contains(DestReg) &&
5989 AArch64::DDDRegClass.
contains(SrcReg)) {
5990 static const unsigned Indices[] = {AArch64::dsub0, AArch64::dsub1,
5998 if (AArch64::DDRegClass.
contains(DestReg) &&
5999 AArch64::DDRegClass.
contains(SrcReg)) {
6000 static const unsigned Indices[] = {AArch64::dsub0, AArch64::dsub1};
6007 if (AArch64::QQQQRegClass.
contains(DestReg) &&
6008 AArch64::QQQQRegClass.
contains(SrcReg)) {
6009 static const unsigned Indices[] = {AArch64::qsub0, AArch64::qsub1,
6010 AArch64::qsub2, AArch64::qsub3};
6017 if (AArch64::QQQRegClass.
contains(DestReg) &&
6018 AArch64::QQQRegClass.
contains(SrcReg)) {
6019 static const unsigned Indices[] = {AArch64::qsub0, AArch64::qsub1,
6027 if (AArch64::QQRegClass.
contains(DestReg) &&
6028 AArch64::QQRegClass.
contains(SrcReg)) {
6029 static const unsigned Indices[] = {AArch64::qsub0, AArch64::qsub1};
6035 if (AArch64::XSeqPairsClassRegClass.
contains(DestReg) &&
6036 AArch64::XSeqPairsClassRegClass.
contains(SrcReg)) {
6037 static const unsigned Indices[] = {AArch64::sube64, AArch64::subo64};
6039 AArch64::XZR, Indices);
6043 if (AArch64::WSeqPairsClassRegClass.
contains(DestReg) &&
6044 AArch64::WSeqPairsClassRegClass.
contains(SrcReg)) {
6045 static const unsigned Indices[] = {AArch64::sube32, AArch64::subo32};
6047 AArch64::WZR, Indices);
6051 if (AArch64::FPR128RegClass.
contains(DestReg) &&
6052 AArch64::FPR128RegClass.
contains(SrcReg)) {
6056 if ((Subtarget.isSVEorStreamingSVEAvailable() &&
6057 !Subtarget.isNeonAvailable()) ||
6061 .
addReg(AArch64::Z0 + (SrcReg - AArch64::Q0))
6062 .
addReg(AArch64::Z0 + (SrcReg - AArch64::Q0));
6063 }
else if (Subtarget.isNeonAvailable()) {
6067 if (Subtarget.hasZeroCycleRegMoveFPR128())
6068 ++NumZCRegMoveInstrsFPR;
6084 if (AArch64::FPR64RegClass.
contains(DestReg) &&
6085 AArch64::FPR64RegClass.
contains(SrcReg)) {
6086 if (Subtarget.hasZeroCycleRegMoveFPR128() &&
6087 !Subtarget.hasZeroCycleRegMoveFPR64() &&
6088 !Subtarget.hasZeroCycleRegMoveFPR32() && Subtarget.isNeonAvailable() &&
6090 MCRegister DestRegQ = RI.getMatchingSuperReg(DestReg, AArch64::dsub,
6091 &AArch64::FPR128RegClass);
6092 MCRegister SrcRegQ = RI.getMatchingSuperReg(SrcReg, AArch64::dsub,
6093 &AArch64::FPR128RegClass);
6102 ++NumZCRegMoveInstrsFPR;
6106 if (Subtarget.hasZeroCycleRegMoveFPR64())
6107 ++NumZCRegMoveInstrsFPR;
6112 if (AArch64::FPR32RegClass.
contains(DestReg) &&
6113 AArch64::FPR32RegClass.
contains(SrcReg)) {
6114 if (Subtarget.hasZeroCycleRegMoveFPR128() &&
6115 !Subtarget.hasZeroCycleRegMoveFPR64() &&
6116 !Subtarget.hasZeroCycleRegMoveFPR32() && Subtarget.isNeonAvailable() &&
6118 MCRegister DestRegQ = RI.getMatchingSuperReg(DestReg, AArch64::ssub,
6119 &AArch64::FPR128RegClass);
6120 MCRegister SrcRegQ = RI.getMatchingSuperReg(SrcReg, AArch64::ssub,
6121 &AArch64::FPR128RegClass);
6130 ++NumZCRegMoveInstrsFPR;
6131 }
else if (Subtarget.hasZeroCycleRegMoveFPR64() &&
6132 !Subtarget.hasZeroCycleRegMoveFPR32()) {
6133 MCRegister DestRegD = RI.getMatchingSuperReg(DestReg, AArch64::ssub,
6134 &AArch64::FPR64RegClass);
6135 MCRegister SrcRegD = RI.getMatchingSuperReg(SrcReg, AArch64::ssub,
6136 &AArch64::FPR64RegClass);
6144 ++NumZCRegMoveInstrsFPR;
6148 if (Subtarget.hasZeroCycleRegMoveFPR32())
6149 ++NumZCRegMoveInstrsFPR;
6154 if (AArch64::FPR16RegClass.
contains(DestReg) &&
6155 AArch64::FPR16RegClass.
contains(SrcReg)) {
6156 if (Subtarget.hasZeroCycleRegMoveFPR128() &&
6157 !Subtarget.hasZeroCycleRegMoveFPR64() &&
6158 !Subtarget.hasZeroCycleRegMoveFPR32() && Subtarget.isNeonAvailable() &&
6160 MCRegister DestRegQ = RI.getMatchingSuperReg(DestReg, AArch64::hsub,
6161 &AArch64::FPR128RegClass);
6162 MCRegister SrcRegQ = RI.getMatchingSuperReg(SrcReg, AArch64::hsub,
6163 &AArch64::FPR128RegClass);
6172 }
else if (Subtarget.hasZeroCycleRegMoveFPR64() &&
6173 !Subtarget.hasZeroCycleRegMoveFPR32()) {
6174 MCRegister DestRegD = RI.getMatchingSuperReg(DestReg, AArch64::hsub,
6175 &AArch64::FPR64RegClass);
6176 MCRegister SrcRegD = RI.getMatchingSuperReg(SrcReg, AArch64::hsub,
6177 &AArch64::FPR64RegClass);
6186 DestReg = RI.getMatchingSuperReg(DestReg, AArch64::hsub,
6187 &AArch64::FPR32RegClass);
6188 SrcReg = RI.getMatchingSuperReg(SrcReg, AArch64::hsub,
6189 &AArch64::FPR32RegClass);
6196 if (AArch64::FPR8RegClass.
contains(DestReg) &&
6197 AArch64::FPR8RegClass.
contains(SrcReg)) {
6198 if (Subtarget.hasZeroCycleRegMoveFPR128() &&
6199 !Subtarget.hasZeroCycleRegMoveFPR64() &&
6200 !Subtarget.hasZeroCycleRegMoveFPR32() && Subtarget.isNeonAvailable() &&
6202 MCRegister DestRegQ = RI.getMatchingSuperReg(DestReg, AArch64::bsub,
6203 &AArch64::FPR128RegClass);
6204 MCRegister SrcRegQ = RI.getMatchingSuperReg(SrcReg, AArch64::bsub,
6205 &AArch64::FPR128RegClass);
6214 }
else if (Subtarget.hasZeroCycleRegMoveFPR64() &&
6215 !Subtarget.hasZeroCycleRegMoveFPR32()) {
6216 MCRegister DestRegD = RI.getMatchingSuperReg(DestReg, AArch64::bsub,
6217 &AArch64::FPR64RegClass);
6218 MCRegister SrcRegD = RI.getMatchingSuperReg(SrcReg, AArch64::bsub,
6219 &AArch64::FPR64RegClass);
6228 DestReg = RI.getMatchingSuperReg(DestReg, AArch64::bsub,
6229 &AArch64::FPR32RegClass);
6230 SrcReg = RI.getMatchingSuperReg(SrcReg, AArch64::bsub,
6231 &AArch64::FPR32RegClass);
6239 if (AArch64::FPR64RegClass.
contains(DestReg) &&
6240 AArch64::GPR64RegClass.
contains(SrcReg)) {
6241 if (AArch64::XZR == SrcReg) {
6249 if (AArch64::GPR64RegClass.
contains(DestReg) &&
6250 AArch64::FPR64RegClass.
contains(SrcReg)) {
6256 if (AArch64::FPR32RegClass.
contains(DestReg) &&
6257 AArch64::GPR32RegClass.
contains(SrcReg)) {
6258 if (AArch64::WZR == SrcReg) {
6266 if (AArch64::GPR32RegClass.
contains(DestReg) &&
6267 AArch64::FPR32RegClass.
contains(SrcReg)) {
6273 if (DestReg == AArch64::NZCV) {
6274 assert(AArch64::GPR64RegClass.
contains(SrcReg) &&
"Invalid NZCV copy");
6276 .
addImm(AArch64SysReg::NZCV)
6282 if (SrcReg == AArch64::NZCV) {
6283 assert(AArch64::GPR64RegClass.
contains(DestReg) &&
"Invalid NZCV copy");
6285 .
addImm(AArch64SysReg::NZCV)
6291 errs() << RI.getRegAsmName(DestReg) <<
" = COPY " << RI.getRegAsmName(SrcReg)
6302 unsigned SubIdx0,
unsigned SubIdx1,
int FI,
6307 SrcReg0 =
TRI.getSubReg(SrcReg, SubIdx0);
6309 SrcReg1 =
TRI.getSubReg(SrcReg, SubIdx1);
6322 Register SrcReg,
bool isKill,
int FI,
6337 switch (RI.getSpillSize(*RC)) {
6339 if (AArch64::FPR8RegClass.hasSubClassEq(RC))
6340 Opc = AArch64::STRBui;
6343 if (AArch64::FPR16RegClass.hasSubClassEq(RC))
6344 Opc = AArch64::STRHui;
6345 else if (AArch64::PNRRegClass.hasSubClassEq(RC) ||
6346 AArch64::PPRRegClass.hasSubClassEq(RC)) {
6347 assert(Subtarget.isSVEorStreamingSVEAvailable() &&
6348 "Unexpected register store without SVE store instructions");
6349 Opc = AArch64::STR_PXI;
6355 if (AArch64::GPR32allRegClass.hasSubClassEq(RC)) {
6356 Opc = AArch64::STRWui;
6360 assert(SrcReg != AArch64::WSP);
6361 }
else if (AArch64::FPR32RegClass.hasSubClassEq(RC))
6362 Opc = AArch64::STRSui;
6363 else if (AArch64::PPR2RegClass.hasSubClassEq(RC)) {
6364 Opc = AArch64::STR_PPXI;
6369 if (AArch64::GPR64allRegClass.hasSubClassEq(RC)) {
6370 Opc = AArch64::STRXui;
6374 assert(SrcReg != AArch64::SP);
6375 }
else if (AArch64::FPR64RegClass.hasSubClassEq(RC)) {
6376 Opc = AArch64::STRDui;
6377 }
else if (AArch64::WSeqPairsClassRegClass.hasSubClassEq(RC)) {
6379 get(AArch64::STPWi), SrcReg, isKill,
6380 AArch64::sube32, AArch64::subo32, FI, MMO);
6385 if (AArch64::FPR128RegClass.hasSubClassEq(RC))
6386 Opc = AArch64::STRQui;
6387 else if (AArch64::DDRegClass.hasSubClassEq(RC)) {
6388 assert(Subtarget.hasNEON() &&
"Unexpected register store without NEON");
6389 Opc = AArch64::ST1Twov1d;
6391 }
else if (AArch64::XSeqPairsClassRegClass.hasSubClassEq(RC)) {
6393 get(AArch64::STPXi), SrcReg, isKill,
6394 AArch64::sube64, AArch64::subo64, FI, MMO);
6396 }
else if (AArch64::ZPRRegClass.hasSubClassEq(RC)) {
6397 assert(Subtarget.isSVEorStreamingSVEAvailable() &&
6398 "Unexpected register store without SVE store instructions");
6399 Opc = AArch64::STR_ZXI;
6404 if (AArch64::DDDRegClass.hasSubClassEq(RC)) {
6405 assert(Subtarget.hasNEON() &&
"Unexpected register store without NEON");
6406 Opc = AArch64::ST1Threev1d;
6411 if (AArch64::DDDDRegClass.hasSubClassEq(RC)) {
6412 assert(Subtarget.hasNEON() &&
"Unexpected register store without NEON");
6413 Opc = AArch64::ST1Fourv1d;
6415 }
else if (AArch64::QQRegClass.hasSubClassEq(RC)) {
6416 assert(Subtarget.hasNEON() &&
"Unexpected register store without NEON");
6417 Opc = AArch64::ST1Twov2d;
6419 }
else if (AArch64::ZPR2StridedOrContiguousRegClass.hasSubClassEq(RC)) {
6420 assert(Subtarget.isSVEorStreamingSVEAvailable() &&
6421 "Unexpected register store without SVE store instructions");
6422 Opc = AArch64::STR_ZZXI_STRIDED_CONTIGUOUS;
6424 }
else if (AArch64::ZPR2RegClass.hasSubClassEq(RC)) {
6425 assert(Subtarget.isSVEorStreamingSVEAvailable() &&
6426 "Unexpected register store without SVE store instructions");
6427 Opc = AArch64::STR_ZZXI;
6432 if (AArch64::QQQRegClass.hasSubClassEq(RC)) {
6433 assert(Subtarget.hasNEON() &&
"Unexpected register store without NEON");
6434 Opc = AArch64::ST1Threev2d;
6436 }
else if (AArch64::ZPR3RegClass.hasSubClassEq(RC)) {
6437 assert(Subtarget.isSVEorStreamingSVEAvailable() &&
6438 "Unexpected register store without SVE store instructions");
6439 Opc = AArch64::STR_ZZZXI;
6444 if (AArch64::QQQQRegClass.hasSubClassEq(RC)) {
6445 assert(Subtarget.hasNEON() &&
"Unexpected register store without NEON");
6446 Opc = AArch64::ST1Fourv2d;
6448 }
else if (AArch64::ZPR4StridedOrContiguousRegClass.hasSubClassEq(RC)) {
6449 assert(Subtarget.isSVEorStreamingSVEAvailable() &&
6450 "Unexpected register store without SVE store instructions");
6451 Opc = AArch64::STR_ZZZZXI_STRIDED_CONTIGUOUS;
6453 }
else if (AArch64::ZPR4RegClass.hasSubClassEq(RC)) {
6454 assert(Subtarget.isSVEorStreamingSVEAvailable() &&
6455 "Unexpected register store without SVE store instructions");
6456 Opc = AArch64::STR_ZZZZXI;
6461 assert(
Opc &&
"Unknown register class");
6472 MI.addMemOperand(MMO);
6479 Register DestReg,
unsigned SubIdx0,
6480 unsigned SubIdx1,
int FI,
6484 bool IsUndef =
true;
6486 DestReg0 =
TRI.getSubReg(DestReg, SubIdx0);
6488 DestReg1 =
TRI.getSubReg(DestReg, SubIdx1);
6517 switch (
TRI.getSpillSize(*RC)) {
6519 if (AArch64::FPR8RegClass.hasSubClassEq(RC))
6520 Opc = AArch64::LDRBui;
6523 bool IsPNR = AArch64::PNRRegClass.hasSubClassEq(RC);
6524 if (AArch64::FPR16RegClass.hasSubClassEq(RC))
6525 Opc = AArch64::LDRHui;
6526 else if (IsPNR || AArch64::PPRRegClass.hasSubClassEq(RC)) {
6527 assert(Subtarget.isSVEorStreamingSVEAvailable() &&
6528 "Unexpected register load without SVE load instructions");
6531 Opc = AArch64::LDR_PXI;
6537 if (AArch64::GPR32allRegClass.hasSubClassEq(RC)) {
6538 Opc = AArch64::LDRWui;
6542 assert(DestReg != AArch64::WSP);
6543 }
else if (AArch64::FPR32RegClass.hasSubClassEq(RC))
6544 Opc = AArch64::LDRSui;
6545 else if (AArch64::PPR2RegClass.hasSubClassEq(RC)) {
6546 Opc = AArch64::LDR_PPXI;
6551 if (AArch64::GPR64allRegClass.hasSubClassEq(RC)) {
6552 Opc = AArch64::LDRXui;
6556 assert(DestReg != AArch64::SP);
6557 }
else if (AArch64::FPR64RegClass.hasSubClassEq(RC)) {
6558 Opc = AArch64::LDRDui;
6559 }
else if (AArch64::WSeqPairsClassRegClass.hasSubClassEq(RC)) {
6561 get(AArch64::LDPWi), DestReg, AArch64::sube32,
6562 AArch64::subo32, FI, MMO);
6567 if (AArch64::FPR128RegClass.hasSubClassEq(RC))
6568 Opc = AArch64::LDRQui;
6569 else if (AArch64::DDRegClass.hasSubClassEq(RC)) {
6570 assert(Subtarget.hasNEON() &&
"Unexpected register load without NEON");
6571 Opc = AArch64::LD1Twov1d;
6573 }
else if (AArch64::XSeqPairsClassRegClass.hasSubClassEq(RC)) {
6575 get(AArch64::LDPXi), DestReg, AArch64::sube64,
6576 AArch64::subo64, FI, MMO);
6578 }
else if (AArch64::ZPRRegClass.hasSubClassEq(RC)) {
6579 assert(Subtarget.isSVEorStreamingSVEAvailable() &&
6580 "Unexpected register load without SVE load instructions");
6581 Opc = AArch64::LDR_ZXI;
6586 if (AArch64::DDDRegClass.hasSubClassEq(RC)) {
6587 assert(Subtarget.hasNEON() &&
"Unexpected register load without NEON");
6588 Opc = AArch64::LD1Threev1d;
6593 if (AArch64::DDDDRegClass.hasSubClassEq(RC)) {
6594 assert(Subtarget.hasNEON() &&
"Unexpected register load without NEON");
6595 Opc = AArch64::LD1Fourv1d;
6597 }
else if (AArch64::QQRegClass.hasSubClassEq(RC)) {
6598 assert(Subtarget.hasNEON() &&
"Unexpected register load without NEON");
6599 Opc = AArch64::LD1Twov2d;
6601 }
else if (AArch64::ZPR2StridedOrContiguousRegClass.hasSubClassEq(RC)) {
6602 assert(Subtarget.isSVEorStreamingSVEAvailable() &&
6603 "Unexpected register load without SVE load instructions");
6604 Opc = AArch64::LDR_ZZXI_STRIDED_CONTIGUOUS;
6606 }
else if (AArch64::ZPR2RegClass.hasSubClassEq(RC)) {
6607 assert(Subtarget.isSVEorStreamingSVEAvailable() &&
6608 "Unexpected register load without SVE load instructions");
6609 Opc = AArch64::LDR_ZZXI;
6614 if (AArch64::QQQRegClass.hasSubClassEq(RC)) {
6615 assert(Subtarget.hasNEON() &&
"Unexpected register load without NEON");
6616 Opc = AArch64::LD1Threev2d;
6618 }
else if (AArch64::ZPR3RegClass.hasSubClassEq(RC)) {
6619 assert(Subtarget.isSVEorStreamingSVEAvailable() &&
6620 "Unexpected register load without SVE load instructions");
6621 Opc = AArch64::LDR_ZZZXI;
6626 if (AArch64::QQQQRegClass.hasSubClassEq(RC)) {
6627 assert(Subtarget.hasNEON() &&
"Unexpected register load without NEON");
6628 Opc = AArch64::LD1Fourv2d;
6630 }
else if (AArch64::ZPR4StridedOrContiguousRegClass.hasSubClassEq(RC)) {
6631 assert(Subtarget.isSVEorStreamingSVEAvailable() &&
6632 "Unexpected register load without SVE load instructions");
6633 Opc = AArch64::LDR_ZZZZXI_STRIDED_CONTIGUOUS;
6635 }
else if (AArch64::ZPR4RegClass.hasSubClassEq(RC)) {
6636 assert(Subtarget.isSVEorStreamingSVEAvailable() &&
6637 "Unexpected register load without SVE load instructions");
6638 Opc = AArch64::LDR_ZZZZXI;
6644 assert(
Opc &&
"Unknown register class");
6654 MI.addMemOperand(MMO);
6661 UseMI.getIterator()),
6663 return I.modifiesRegister(AArch64::NZCV, TRI) ||
6664 I.readsRegister(AArch64::NZCV, TRI);
6668void AArch64InstrInfo::decomposeStackOffsetForDwarfOffsets(
6673 assert(
Offset.getScalable() % 2 == 0 &&
"Invalid frame offset");
6680 ByteSized =
Offset.getFixed();
6681 VGSized =
Offset.getScalable() / 2;
6687void AArch64InstrInfo::decomposeStackOffsetForFrameOffsets(
6689 int64_t &NumDataVectors) {
6693 assert(
Offset.getScalable() % 2 == 0 &&
"Invalid frame offset");
6695 NumBytes =
Offset.getFixed();
6697 NumPredicateVectors =
Offset.getScalable() / 2;
6702 if (NumPredicateVectors % 8 == 0 || NumPredicateVectors < -64 ||
6703 NumPredicateVectors > 62) {
6704 NumDataVectors = NumPredicateVectors / 8;
6705 NumPredicateVectors -= NumDataVectors * 8;
6731 Expr.
push_back((
char)dwarf::DW_OP_bregx);
6739 int64_t OffsetFromDefCFA) {
6753 Comment << (NumBytes < 0 ?
" - " :
" + ") << std::abs(NumBytes);
6754 if (!RegScale.empty())
6764 int64_t NumBytes, NumVGScaledBytes;
6765 AArch64InstrInfo::decomposeStackOffsetForDwarfOffsets(
Offset, NumBytes,
6767 std::string CommentBuffer;
6770 if (
Reg == AArch64::SP)
6772 else if (
Reg == AArch64::FP)
6779 unsigned DwarfReg =
TRI.getDwarfRegNum(
Reg,
true);
6780 assert(DwarfReg <= 31 &&
"DwarfReg out of bounds (0..31)");
6782 Expr.
push_back(dwarf::DW_OP_breg0 + DwarfReg);
6785 if (NumVGScaledBytes) {
6795 DefCfaExpr.
push_back(dwarf::DW_CFA_def_cfa_expression);
6803 unsigned FrameReg,
unsigned Reg,
6805 bool LastAdjustmentWasScalable) {
6806 if (
Offset.getScalable())
6809 if (FrameReg == Reg && !LastAdjustmentWasScalable)
6812 unsigned DwarfReg =
TRI.getDwarfRegNum(Reg,
true);
6819 std::optional<int64_t> IncomingVGOffsetFromDefCFA) {
6820 int64_t NumBytes, NumVGScaledBytes;
6821 AArch64InstrInfo::decomposeStackOffsetForDwarfOffsets(
6822 OffsetFromDefCFA, NumBytes, NumVGScaledBytes);
6824 unsigned DwarfReg =
TRI.getDwarfRegNum(Reg,
true);
6827 if (!NumVGScaledBytes)
6830 std::string CommentBuffer;
6835 assert(NumVGScaledBytes &&
"Expected scalable offset");
6839 if (IncomingVGOffsetFromDefCFA) {
6841 VGRegScale =
"* IncomingVG";
6844 VGRegScale =
"* VG";
6848 OffsetExpr.
push_back(dwarf::DW_OP_plus);
6857 CfaExpr.
push_back(dwarf::DW_CFA_expression);
6872 unsigned SrcReg, int64_t
Offset,
unsigned Opc,
6875 bool *HasWinCFI,
bool EmitCFAOffset,
6878 unsigned MaxEncoding, ShiftSize;
6880 case AArch64::ADDXri:
6881 case AArch64::ADDSXri:
6882 case AArch64::SUBXri:
6883 case AArch64::SUBSXri:
6884 MaxEncoding = 0xfff;
6887 case AArch64::ADDVL_XXI:
6888 case AArch64::ADDPL_XXI:
6889 case AArch64::ADDSVL_XXI:
6890 case AArch64::ADDSPL_XXI:
6905 if (
Opc == AArch64::ADDVL_XXI ||
Opc == AArch64::ADDSVL_XXI)
6907 else if (
Opc == AArch64::ADDPL_XXI ||
Opc == AArch64::ADDSPL_XXI)
6921 const unsigned MaxEncodableValue = MaxEncoding << ShiftSize;
6923 if (TmpReg == AArch64::XZR)
6924 TmpReg =
MBB.getParent()->getRegInfo().createVirtualRegister(
6925 &AArch64::GPR64RegClass);
6927 uint64_t ThisVal = std::min<uint64_t>(
Offset, MaxEncodableValue);
6928 unsigned LocalShiftSize = 0;
6929 if (ThisVal > MaxEncoding) {
6930 ThisVal = ThisVal >> ShiftSize;
6931 LocalShiftSize = ShiftSize;
6933 assert((ThisVal >> ShiftSize) <= MaxEncoding &&
6934 "Encoding cannot handle value that big");
6936 Offset -= ThisVal << LocalShiftSize;
6941 .
addImm(Sign * (
int)ThisVal);
6951 if (Sign == -1 ||
Opc == AArch64::SUBXri ||
Opc == AArch64::SUBSXri)
6952 CFAOffset += Change;
6954 CFAOffset -= Change;
6955 if (EmitCFAOffset && DestReg == TmpReg) {
6968 int Imm = (int)(ThisVal << LocalShiftSize);
6969 if (VScale != 1 && DestReg == AArch64::SP) {
6975 }
else if ((DestReg == AArch64::FP && SrcReg == AArch64::SP) ||
6976 (SrcReg == AArch64::FP && DestReg == AArch64::SP)) {
6977 assert(VScale == 1 &&
"Expected non-scalable operation");
6986 assert(
Offset == 0 &&
"Expected remaining offset to be zero to "
6987 "emit a single SEH directive");
6988 }
else if (DestReg == AArch64::SP) {
6989 assert(VScale == 1 &&
"Expected non-scalable operation");
6992 assert(SrcReg == AArch64::SP &&
"Unexpected SrcReg for SEH_StackAlloc");
7005 unsigned DestReg,
unsigned SrcReg,
7008 bool NeedsWinCFI,
bool *HasWinCFI,
7010 unsigned FrameReg) {
7017 bool UseSVL =
F.hasFnAttribute(
"aarch64_pstate_sm_body");
7019 int64_t Bytes, NumPredicateVectors, NumDataVectors;
7020 AArch64InstrInfo::decomposeStackOffsetForFrameOffsets(
7021 Offset, Bytes, NumPredicateVectors, NumDataVectors);
7024 bool NeedsFinalDefNZCV = SetNZCV && (NumPredicateVectors || NumDataVectors);
7025 if (NeedsFinalDefNZCV)
7029 if (Bytes || (!
Offset && SrcReg != DestReg)) {
7030 assert((DestReg != AArch64::SP || Bytes % 8 == 0) &&
7031 "SP increment/decrement not 8-byte aligned");
7032 unsigned Opc = SetNZCV ? AArch64::ADDSXri : AArch64::ADDXri;
7035 Opc = SetNZCV ? AArch64::SUBSXri : AArch64::SUBXri;
7038 NeedsWinCFI, HasWinCFI, EmitCFAOffset, CFAOffset,
7040 CFAOffset += (
Opc == AArch64::ADDXri ||
Opc == AArch64::ADDSXri)
7047 assert(!(NeedsWinCFI && NumPredicateVectors) &&
7048 "WinCFI can't allocate fractions of an SVE data vector");
7050 if (NumDataVectors) {
7052 UseSVL ? AArch64::ADDSVL_XXI : AArch64::ADDVL_XXI,
TII,
7053 Flag, NeedsWinCFI, HasWinCFI, EmitCFAOffset, CFAOffset,
7059 if (NumPredicateVectors) {
7060 assert(DestReg != AArch64::SP &&
"Unaligned access to SP");
7062 UseSVL ? AArch64::ADDSPL_XXI : AArch64::ADDPL_XXI,
TII,
7063 Flag, NeedsWinCFI, HasWinCFI, EmitCFAOffset, CFAOffset,
7067 if (NeedsFinalDefNZCV)
7089 if (
MI.isFullCopy()) {
7092 if (SrcReg == AArch64::SP && DstReg.
isVirtual()) {
7096 if (DstReg == AArch64::SP && SrcReg.
isVirtual()) {
7101 if (SrcReg == AArch64::NZCV || DstReg == AArch64::NZCV)
7129 if (
MI.isCopy() &&
Ops.size() == 1 &&
7131 (
Ops[0] == 0 ||
Ops[0] == 1)) {
7132 bool IsSpill =
Ops[0] == 0;
7133 bool IsFill = !IsSpill;
7145 :
TRI.getMinimalPhysRegClass(Reg);
7151 "Mismatched register size in non subreg COPY");
7158 return &*--InsertPt;
7170 if (IsSpill && DstMO.
isUndef() && SrcReg == AArch64::WZR &&
7173 "Unexpected subreg on physical register");
7175 FrameIndex, &AArch64::GPR64RegClass,
Register());
7176 return &*--InsertPt;
7193 case AArch64::sub_32:
7194 if (AArch64::GPR64RegClass.hasSubClassEq(
getRegClass(DstReg)))
7195 FillRC = &AArch64::GPR32RegClass;
7198 FillRC = &AArch64::FPR32RegClass;
7201 FillRC = &AArch64::FPR64RegClass;
7207 TRI.getRegSizeInBits(*FillRC) &&
7208 "Mismatched regclass size on folded subreg COPY");
7227 bool *OutUseUnscaledOp,
7228 unsigned *OutUnscaledOp,
7229 int64_t *EmittableOffset) {
7231 if (EmittableOffset)
7232 *EmittableOffset = 0;
7233 if (OutUseUnscaledOp)
7234 *OutUseUnscaledOp =
false;
7240 switch (
MI.getOpcode()) {
7243 case AArch64::LD1Rv1d:
7244 case AArch64::LD1Rv2s:
7245 case AArch64::LD1Rv2d:
7246 case AArch64::LD1Rv4h:
7247 case AArch64::LD1Rv4s:
7248 case AArch64::LD1Rv8b:
7249 case AArch64::LD1Rv8h:
7250 case AArch64::LD1Rv16b:
7251 case AArch64::LD1Twov2d:
7252 case AArch64::LD1Threev2d:
7253 case AArch64::LD1Fourv2d:
7254 case AArch64::LD1Twov1d:
7255 case AArch64::LD1Threev1d:
7256 case AArch64::LD1Fourv1d:
7257 case AArch64::ST1Twov2d:
7258 case AArch64::ST1Threev2d:
7259 case AArch64::ST1Fourv2d:
7260 case AArch64::ST1Twov1d:
7261 case AArch64::ST1Threev1d:
7262 case AArch64::ST1Fourv1d:
7263 case AArch64::ST1i8:
7264 case AArch64::ST1i16:
7265 case AArch64::ST1i32:
7266 case AArch64::ST1i64:
7268 case AArch64::IRGstack:
7269 case AArch64::STGloop:
7270 case AArch64::STZGloop:
7275 TypeSize ScaleValue(0U,
false), Width(0U,
false);
7276 int64_t MinOff, MaxOff;
7282 bool IsMulVL = ScaleValue.isScalable();
7283 unsigned Scale = ScaleValue.getKnownMinValue();
7293 std::optional<unsigned> UnscaledOp =
7295 bool useUnscaledOp = UnscaledOp && (
Offset % Scale ||
Offset < 0);
7296 if (useUnscaledOp &&
7301 Scale = ScaleValue.getKnownMinValue();
7302 assert(IsMulVL == ScaleValue.isScalable() &&
7303 "Unscaled opcode has different value for scalable");
7305 int64_t Remainder =
Offset % Scale;
7306 assert(!(Remainder && useUnscaledOp) &&
7307 "Cannot have remainder when using unscaled op");
7309 assert(MinOff < MaxOff &&
"Unexpected Min/Max offsets");
7310 int64_t NewOffset =
Offset / Scale;
7311 if (MinOff <= NewOffset && NewOffset <= MaxOff)
7319 int64_t HighPart =
Offset & ~0xFFF;
7320 int64_t LowPart =
Offset & 0xFFF;
7321 int64_t LowScaled = LowPart / Scale;
7322 if (!IsMulVL && NewOffset >= 0 && LowPart % Scale == 0 &&
7323 MinOff <= LowScaled && LowScaled <= MaxOff &&
7325 NewOffset = LowScaled;
7330 NewOffset = NewOffset < 0 ? MinOff : MaxOff;
7335 if (EmittableOffset)
7336 *EmittableOffset = NewOffset;
7337 if (OutUseUnscaledOp)
7338 *OutUseUnscaledOp = useUnscaledOp;
7339 if (OutUnscaledOp && UnscaledOp)
7340 *OutUnscaledOp = *UnscaledOp;
7353 unsigned Opcode =
MI.getOpcode();
7354 unsigned ImmIdx = FrameRegIdx + 1;
7356 if (Opcode == AArch64::ADDSXri || Opcode == AArch64::ADDXri) {
7361 MI.eraseFromParent();
7367 unsigned UnscaledOp;
7370 &UnscaledOp, &NewOffset);
7374 MI.getOperand(FrameRegIdx).ChangeToRegister(FrameReg,
false);
7376 MI.setDesc(
TII->get(UnscaledOp));
7378 MI.getOperand(ImmIdx).ChangeToImmediate(NewOffset);
7394bool AArch64InstrInfo::useMachineCombiner()
const {
return true; }
7399 case AArch64::ADDSWrr:
7400 case AArch64::ADDSWri:
7401 case AArch64::ADDSXrr:
7402 case AArch64::ADDSXri:
7403 case AArch64::SUBSWrr:
7404 case AArch64::SUBSXrr:
7406 case AArch64::SUBSWri:
7407 case AArch64::SUBSXri:
7418 case AArch64::ADDWrr:
7419 case AArch64::ADDWri:
7420 case AArch64::SUBWrr:
7421 case AArch64::ADDSWrr:
7422 case AArch64::ADDSWri:
7423 case AArch64::SUBSWrr:
7425 case AArch64::SUBWri:
7426 case AArch64::SUBSWri:
7437 case AArch64::ADDXrr:
7438 case AArch64::ADDXri:
7439 case AArch64::SUBXrr:
7440 case AArch64::ADDSXrr:
7441 case AArch64::ADDSXri:
7442 case AArch64::SUBSXrr:
7444 case AArch64::SUBXri:
7445 case AArch64::SUBSXri:
7446 case AArch64::ADDv8i8:
7447 case AArch64::ADDv16i8:
7448 case AArch64::ADDv4i16:
7449 case AArch64::ADDv8i16:
7450 case AArch64::ADDv2i32:
7451 case AArch64::ADDv4i32:
7452 case AArch64::SUBv8i8:
7453 case AArch64::SUBv16i8:
7454 case AArch64::SUBv4i16:
7455 case AArch64::SUBv8i16:
7456 case AArch64::SUBv2i32:
7457 case AArch64::SUBv4i32:
7470 case AArch64::FADDHrr:
7471 case AArch64::FADDSrr:
7472 case AArch64::FADDDrr:
7473 case AArch64::FADDv4f16:
7474 case AArch64::FADDv8f16:
7475 case AArch64::FADDv2f32:
7476 case AArch64::FADDv2f64:
7477 case AArch64::FADDv4f32:
7478 case AArch64::FSUBHrr:
7479 case AArch64::FSUBSrr:
7480 case AArch64::FSUBDrr:
7481 case AArch64::FSUBv4f16:
7482 case AArch64::FSUBv8f16:
7483 case AArch64::FSUBv2f32:
7484 case AArch64::FSUBv2f64:
7485 case AArch64::FSUBv4f32:
7504 unsigned CombineOpc,
unsigned ZeroReg = 0,
7505 bool CheckZeroReg =
false) {
7512 if (!
MI ||
MI->getParent() != &
MBB ||
MI->getOpcode() != CombineOpc)
7519 assert(
MI->getNumOperands() >= 4 &&
MI->getOperand(0).isReg() &&
7520 MI->getOperand(1).isReg() &&
MI->getOperand(2).isReg() &&
7521 MI->getOperand(3).isReg() &&
"MAdd/MSub must have a least 4 regs");
7523 if (
MI->getOperand(3).getReg() != ZeroReg)
7528 MI->findRegisterDefOperandIdx(AArch64::NZCV,
nullptr,
true) == -1)
7537 unsigned MulOpc,
unsigned ZeroReg) {
7552bool AArch64InstrInfo::isAssociativeAndCommutative(
const MachineInstr &Inst,
7553 bool Invert)
const {
7559 case AArch64::FADDHrr:
7560 case AArch64::FADDSrr:
7561 case AArch64::FADDDrr:
7562 case AArch64::FMULHrr:
7563 case AArch64::FMULSrr:
7564 case AArch64::FMULDrr:
7565 case AArch64::FMULX16:
7566 case AArch64::FMULX32:
7567 case AArch64::FMULX64:
7569 case AArch64::FADDv4f16:
7570 case AArch64::FADDv8f16:
7571 case AArch64::FADDv2f32:
7572 case AArch64::FADDv4f32:
7573 case AArch64::FADDv2f64:
7574 case AArch64::FMULv4f16:
7575 case AArch64::FMULv8f16:
7576 case AArch64::FMULv2f32:
7577 case AArch64::FMULv4f32:
7578 case AArch64::FMULv2f64:
7579 case AArch64::FMULXv4f16:
7580 case AArch64::FMULXv8f16:
7581 case AArch64::FMULXv2f32:
7582 case AArch64::FMULXv4f32:
7583 case AArch64::FMULXv2f64:
7587 case AArch64::FADD_ZZZ_H:
7588 case AArch64::FADD_ZZZ_S:
7589 case AArch64::FADD_ZZZ_D:
7590 case AArch64::FMUL_ZZZ_H:
7591 case AArch64::FMUL_ZZZ_S:
7592 case AArch64::FMUL_ZZZ_D:
7603 case AArch64::ADDWrr:
7604 case AArch64::ADDXrr:
7605 case AArch64::ANDWrr:
7606 case AArch64::ANDXrr:
7607 case AArch64::ORRWrr:
7608 case AArch64::ORRXrr:
7609 case AArch64::EORWrr:
7610 case AArch64::EORXrr:
7611 case AArch64::EONWrr:
7612 case AArch64::EONXrr:
7616 case AArch64::ADDv8i8:
7617 case AArch64::ADDv16i8:
7618 case AArch64::ADDv4i16:
7619 case AArch64::ADDv8i16:
7620 case AArch64::ADDv2i32:
7621 case AArch64::ADDv4i32:
7622 case AArch64::ADDv1i64:
7623 case AArch64::ADDv2i64:
7624 case AArch64::MULv8i8:
7625 case AArch64::MULv16i8:
7626 case AArch64::MULv4i16:
7627 case AArch64::MULv8i16:
7628 case AArch64::MULv2i32:
7629 case AArch64::MULv4i32:
7630 case AArch64::ANDv8i8:
7631 case AArch64::ANDv16i8:
7632 case AArch64::ORRv8i8:
7633 case AArch64::ORRv16i8:
7634 case AArch64::EORv8i8:
7635 case AArch64::EORv16i8:
7637 case AArch64::ADD_ZZZ_B:
7638 case AArch64::ADD_ZZZ_H:
7639 case AArch64::ADD_ZZZ_S:
7640 case AArch64::ADD_ZZZ_D:
7641 case AArch64::MUL_ZZZ_B:
7642 case AArch64::MUL_ZZZ_H:
7643 case AArch64::MUL_ZZZ_S:
7644 case AArch64::MUL_ZZZ_D:
7645 case AArch64::AND_ZZZ:
7646 case AArch64::ORR_ZZZ:
7647 case AArch64::EOR_ZZZ:
7678 auto setFound = [&](
int Opcode,
int Operand,
unsigned ZeroReg,
7686 auto setVFound = [&](
int Opcode,
int Operand,
unsigned Pattern) {
7698 case AArch64::ADDWrr:
7700 "ADDWrr does not have register operands");
7701 setFound(AArch64::MADDWrrr, 1, AArch64::WZR, MCP::MULADDW_OP1);
7702 setFound(AArch64::MADDWrrr, 2, AArch64::WZR, MCP::MULADDW_OP2);
7704 case AArch64::ADDXrr:
7705 setFound(AArch64::MADDXrrr, 1, AArch64::XZR, MCP::MULADDX_OP1);
7706 setFound(AArch64::MADDXrrr, 2, AArch64::XZR, MCP::MULADDX_OP2);
7708 case AArch64::SUBWrr:
7709 setFound(AArch64::MADDWrrr, 2, AArch64::WZR, MCP::MULSUBW_OP2);
7710 setFound(AArch64::MADDWrrr, 1, AArch64::WZR, MCP::MULSUBW_OP1);
7712 case AArch64::SUBXrr:
7713 setFound(AArch64::MADDXrrr, 2, AArch64::XZR, MCP::MULSUBX_OP2);
7714 setFound(AArch64::MADDXrrr, 1, AArch64::XZR, MCP::MULSUBX_OP1);
7716 case AArch64::ADDWri:
7717 setFound(AArch64::MADDWrrr, 1, AArch64::WZR, MCP::MULADDWI_OP1);
7719 case AArch64::ADDXri:
7720 setFound(AArch64::MADDXrrr, 1, AArch64::XZR, MCP::MULADDXI_OP1);
7722 case AArch64::SUBWri:
7723 setFound(AArch64::MADDWrrr, 1, AArch64::WZR, MCP::MULSUBWI_OP1);
7725 case AArch64::SUBXri:
7726 setFound(AArch64::MADDXrrr, 1, AArch64::XZR, MCP::MULSUBXI_OP1);
7728 case AArch64::ADDv8i8:
7729 setVFound(AArch64::MULv8i8, 1, MCP::MULADDv8i8_OP1);
7730 setVFound(AArch64::MULv8i8, 2, MCP::MULADDv8i8_OP2);
7732 case AArch64::ADDv16i8:
7733 setVFound(AArch64::MULv16i8, 1, MCP::MULADDv16i8_OP1);
7734 setVFound(AArch64::MULv16i8, 2, MCP::MULADDv16i8_OP2);
7736 case AArch64::ADDv4i16:
7737 setVFound(AArch64::MULv4i16, 1, MCP::MULADDv4i16_OP1);
7738 setVFound(AArch64::MULv4i16, 2, MCP::MULADDv4i16_OP2);
7739 setVFound(AArch64::MULv4i16_indexed, 1, MCP::MULADDv4i16_indexed_OP1);
7740 setVFound(AArch64::MULv4i16_indexed, 2, MCP::MULADDv4i16_indexed_OP2);
7742 case AArch64::ADDv8i16:
7743 setVFound(AArch64::MULv8i16, 1, MCP::MULADDv8i16_OP1);
7744 setVFound(AArch64::MULv8i16, 2, MCP::MULADDv8i16_OP2);
7745 setVFound(AArch64::MULv8i16_indexed, 1, MCP::MULADDv8i16_indexed_OP1);
7746 setVFound(AArch64::MULv8i16_indexed, 2, MCP::MULADDv8i16_indexed_OP2);
7748 case AArch64::ADDv2i32:
7749 setVFound(AArch64::MULv2i32, 1, MCP::MULADDv2i32_OP1);
7750 setVFound(AArch64::MULv2i32, 2, MCP::MULADDv2i32_OP2);
7751 setVFound(AArch64::MULv2i32_indexed, 1, MCP::MULADDv2i32_indexed_OP1);
7752 setVFound(AArch64::MULv2i32_indexed, 2, MCP::MULADDv2i32_indexed_OP2);
7754 case AArch64::ADDv4i32:
7755 setVFound(AArch64::MULv4i32, 1, MCP::MULADDv4i32_OP1);
7756 setVFound(AArch64::MULv4i32, 2, MCP::MULADDv4i32_OP2);
7757 setVFound(AArch64::MULv4i32_indexed, 1, MCP::MULADDv4i32_indexed_OP1);
7758 setVFound(AArch64::MULv4i32_indexed, 2, MCP::MULADDv4i32_indexed_OP2);
7760 case AArch64::SUBv8i8:
7761 setVFound(AArch64::MULv8i8, 1, MCP::MULSUBv8i8_OP1);
7762 setVFound(AArch64::MULv8i8, 2, MCP::MULSUBv8i8_OP2);
7764 case AArch64::SUBv16i8:
7765 setVFound(AArch64::MULv16i8, 1, MCP::MULSUBv16i8_OP1);
7766 setVFound(AArch64::MULv16i8, 2, MCP::MULSUBv16i8_OP2);
7768 case AArch64::SUBv4i16:
7769 setVFound(AArch64::MULv4i16, 1, MCP::MULSUBv4i16_OP1);
7770 setVFound(AArch64::MULv4i16, 2, MCP::MULSUBv4i16_OP2);
7771 setVFound(AArch64::MULv4i16_indexed, 1, MCP::MULSUBv4i16_indexed_OP1);
7772 setVFound(AArch64::MULv4i16_indexed, 2, MCP::MULSUBv4i16_indexed_OP2);
7774 case AArch64::SUBv8i16:
7775 setVFound(AArch64::MULv8i16, 1, MCP::MULSUBv8i16_OP1);
7776 setVFound(AArch64::MULv8i16, 2, MCP::MULSUBv8i16_OP2);
7777 setVFound(AArch64::MULv8i16_indexed, 1, MCP::MULSUBv8i16_indexed_OP1);
7778 setVFound(AArch64::MULv8i16_indexed, 2, MCP::MULSUBv8i16_indexed_OP2);
7780 case AArch64::SUBv2i32:
7781 setVFound(AArch64::MULv2i32, 1, MCP::MULSUBv2i32_OP1);
7782 setVFound(AArch64::MULv2i32, 2, MCP::MULSUBv2i32_OP2);
7783 setVFound(AArch64::MULv2i32_indexed, 1, MCP::MULSUBv2i32_indexed_OP1);
7784 setVFound(AArch64::MULv2i32_indexed, 2, MCP::MULSUBv2i32_indexed_OP2);
7786 case AArch64::SUBv4i32:
7787 setVFound(AArch64::MULv4i32, 1, MCP::MULSUBv4i32_OP1);
7788 setVFound(AArch64::MULv4i32, 2, MCP::MULSUBv4i32_OP2);
7789 setVFound(AArch64::MULv4i32_indexed, 1, MCP::MULSUBv4i32_indexed_OP1);
7790 setVFound(AArch64::MULv4i32_indexed, 2, MCP::MULSUBv4i32_indexed_OP2);
7796bool AArch64InstrInfo::isAccumulationOpcode(
unsigned Opcode)
const {
7800 case AArch64::UABALB_ZZZ_D:
7801 case AArch64::UABALB_ZZZ_H:
7802 case AArch64::UABALB_ZZZ_S:
7803 case AArch64::UABALT_ZZZ_D:
7804 case AArch64::UABALT_ZZZ_H:
7805 case AArch64::UABALT_ZZZ_S:
7806 case AArch64::SABALB_ZZZ_D:
7807 case AArch64::SABALB_ZZZ_S:
7808 case AArch64::SABALB_ZZZ_H:
7809 case AArch64::SABALT_ZZZ_D:
7810 case AArch64::SABALT_ZZZ_S:
7811 case AArch64::SABALT_ZZZ_H:
7812 case AArch64::UABALv16i8_v8i16:
7813 case AArch64::UABALv2i32_v2i64:
7814 case AArch64::UABALv4i16_v4i32:
7815 case AArch64::UABALv4i32_v2i64:
7816 case AArch64::UABALv8i16_v4i32:
7817 case AArch64::UABALv8i8_v8i16:
7818 case AArch64::UABAv16i8:
7819 case AArch64::UABAv2i32:
7820 case AArch64::UABAv4i16:
7821 case AArch64::UABAv4i32:
7822 case AArch64::UABAv8i16:
7823 case AArch64::UABAv8i8:
7824 case AArch64::SABALv16i8_v8i16:
7825 case AArch64::SABALv2i32_v2i64:
7826 case AArch64::SABALv4i16_v4i32:
7827 case AArch64::SABALv4i32_v2i64:
7828 case AArch64::SABALv8i16_v4i32:
7829 case AArch64::SABALv8i8_v8i16:
7830 case AArch64::SABAv16i8:
7831 case AArch64::SABAv2i32:
7832 case AArch64::SABAv4i16:
7833 case AArch64::SABAv4i32:
7834 case AArch64::SABAv8i16:
7835 case AArch64::SABAv8i8:
7842unsigned AArch64InstrInfo::getAccumulationStartOpcode(
7843 unsigned AccumulationOpcode)
const {
7844 switch (AccumulationOpcode) {
7847 case AArch64::UABALB_ZZZ_D:
7848 return AArch64::UABDLB_ZZZ_D;
7849 case AArch64::UABALB_ZZZ_H:
7850 return AArch64::UABDLB_ZZZ_H;
7851 case AArch64::UABALB_ZZZ_S:
7852 return AArch64::UABDLB_ZZZ_S;
7853 case AArch64::UABALT_ZZZ_D:
7854 return AArch64::UABDLT_ZZZ_D;
7855 case AArch64::UABALT_ZZZ_H:
7856 return AArch64::UABDLT_ZZZ_H;
7857 case AArch64::UABALT_ZZZ_S:
7858 return AArch64::UABDLT_ZZZ_S;
7859 case AArch64::UABALv16i8_v8i16:
7860 return AArch64::UABDLv16i8_v8i16;
7861 case AArch64::UABALv2i32_v2i64:
7862 return AArch64::UABDLv2i32_v2i64;
7863 case AArch64::UABALv4i16_v4i32:
7864 return AArch64::UABDLv4i16_v4i32;
7865 case AArch64::UABALv4i32_v2i64:
7866 return AArch64::UABDLv4i32_v2i64;
7867 case AArch64::UABALv8i16_v4i32:
7868 return AArch64::UABDLv8i16_v4i32;
7869 case AArch64::UABALv8i8_v8i16:
7870 return AArch64::UABDLv8i8_v8i16;
7871 case AArch64::UABAv16i8:
7872 return AArch64::UABDv16i8;
7873 case AArch64::UABAv2i32:
7874 return AArch64::UABDv2i32;
7875 case AArch64::UABAv4i16:
7876 return AArch64::UABDv4i16;
7877 case AArch64::UABAv4i32:
7878 return AArch64::UABDv4i32;
7879 case AArch64::UABAv8i16:
7880 return AArch64::UABDv8i16;
7881 case AArch64::UABAv8i8:
7882 return AArch64::UABDv8i8;
7883 case AArch64::SABALB_ZZZ_D:
7884 return AArch64::SABDLB_ZZZ_D;
7885 case AArch64::SABALB_ZZZ_S:
7886 return AArch64::SABDLB_ZZZ_S;
7887 case AArch64::SABALB_ZZZ_H:
7888 return AArch64::SABDLB_ZZZ_H;
7889 case AArch64::SABALT_ZZZ_D:
7890 return AArch64::SABDLT_ZZZ_D;
7891 case AArch64::SABALT_ZZZ_S:
7892 return AArch64::SABDLT_ZZZ_S;
7893 case AArch64::SABALT_ZZZ_H:
7894 return AArch64::SABDLT_ZZZ_H;
7895 case AArch64::SABALv16i8_v8i16:
7896 return AArch64::SABDLv16i8_v8i16;
7897 case AArch64::SABALv2i32_v2i64:
7898 return AArch64::SABDLv2i32_v2i64;
7899 case AArch64::SABALv4i16_v4i32:
7900 return AArch64::SABDLv4i16_v4i32;
7901 case AArch64::SABALv4i32_v2i64:
7902 return AArch64::SABDLv4i32_v2i64;
7903 case AArch64::SABALv8i16_v4i32:
7904 return AArch64::SABDLv8i16_v4i32;
7905 case AArch64::SABALv8i8_v8i16:
7906 return AArch64::SABDLv8i8_v8i16;
7907 case AArch64::SABAv16i8:
7908 return AArch64::SABDv16i8;
7909 case AArch64::SABAv2i32:
7910 return AArch64::SABAv2i32;
7911 case AArch64::SABAv4i16:
7912 return AArch64::SABDv4i16;
7913 case AArch64::SABAv4i32:
7914 return AArch64::SABDv4i32;
7915 case AArch64::SABAv8i16:
7916 return AArch64::SABDv8i16;
7917 case AArch64::SABAv8i8:
7918 return AArch64::SABDv8i8;
7934 auto Match = [&](
int Opcode,
int Operand,
unsigned Pattern) ->
bool {
7946 assert(
false &&
"Unsupported FP instruction in combiner\n");
7948 case AArch64::FADDHrr:
7950 "FADDHrr does not have register operands");
7952 Found = Match(AArch64::FMULHrr, 1, MCP::FMULADDH_OP1);
7953 Found |= Match(AArch64::FMULHrr, 2, MCP::FMULADDH_OP2);
7955 case AArch64::FADDSrr:
7957 "FADDSrr does not have register operands");
7959 Found |= Match(AArch64::FMULSrr, 1, MCP::FMULADDS_OP1) ||
7960 Match(AArch64::FMULv1i32_indexed, 1, MCP::FMLAv1i32_indexed_OP1);
7962 Found |= Match(AArch64::FMULSrr, 2, MCP::FMULADDS_OP2) ||
7963 Match(AArch64::FMULv1i32_indexed, 2, MCP::FMLAv1i32_indexed_OP2);
7965 case AArch64::FADDDrr:
7966 Found |= Match(AArch64::FMULDrr, 1, MCP::FMULADDD_OP1) ||
7967 Match(AArch64::FMULv1i64_indexed, 1, MCP::FMLAv1i64_indexed_OP1);
7969 Found |= Match(AArch64::FMULDrr, 2, MCP::FMULADDD_OP2) ||
7970 Match(AArch64::FMULv1i64_indexed, 2, MCP::FMLAv1i64_indexed_OP2);
7972 case AArch64::FADDv4f16:
7973 Found |= Match(AArch64::FMULv4i16_indexed, 1, MCP::FMLAv4i16_indexed_OP1) ||
7974 Match(AArch64::FMULv4f16, 1, MCP::FMLAv4f16_OP1);
7976 Found |= Match(AArch64::FMULv4i16_indexed, 2, MCP::FMLAv4i16_indexed_OP2) ||
7977 Match(AArch64::FMULv4f16, 2, MCP::FMLAv4f16_OP2);
7979 case AArch64::FADDv8f16:
7980 Found |= Match(AArch64::FMULv8i16_indexed, 1, MCP::FMLAv8i16_indexed_OP1) ||
7981 Match(AArch64::FMULv8f16, 1, MCP::FMLAv8f16_OP1);
7983 Found |= Match(AArch64::FMULv8i16_indexed, 2, MCP::FMLAv8i16_indexed_OP2) ||
7984 Match(AArch64::FMULv8f16, 2, MCP::FMLAv8f16_OP2);
7986 case AArch64::FADDv2f32:
7987 Found |= Match(AArch64::FMULv2i32_indexed, 1, MCP::FMLAv2i32_indexed_OP1) ||
7988 Match(AArch64::FMULv2f32, 1, MCP::FMLAv2f32_OP1);
7990 Found |= Match(AArch64::FMULv2i32_indexed, 2, MCP::FMLAv2i32_indexed_OP2) ||
7991 Match(AArch64::FMULv2f32, 2, MCP::FMLAv2f32_OP2);
7993 case AArch64::FADDv2f64:
7994 Found |= Match(AArch64::FMULv2i64_indexed, 1, MCP::FMLAv2i64_indexed_OP1) ||
7995 Match(AArch64::FMULv2f64, 1, MCP::FMLAv2f64_OP1);
7997 Found |= Match(AArch64::FMULv2i64_indexed, 2, MCP::FMLAv2i64_indexed_OP2) ||
7998 Match(AArch64::FMULv2f64, 2, MCP::FMLAv2f64_OP2);
8000 case AArch64::FADDv4f32:
8001 Found |= Match(AArch64::FMULv4i32_indexed, 1, MCP::FMLAv4i32_indexed_OP1) ||
8002 Match(AArch64::FMULv4f32, 1, MCP::FMLAv4f32_OP1);
8004 Found |= Match(AArch64::FMULv4i32_indexed, 2, MCP::FMLAv4i32_indexed_OP2) ||
8005 Match(AArch64::FMULv4f32, 2, MCP::FMLAv4f32_OP2);
8007 case AArch64::FSUBHrr:
8008 Found = Match(AArch64::FMULHrr, 1, MCP::FMULSUBH_OP1);
8009 Found |= Match(AArch64::FMULHrr, 2, MCP::FMULSUBH_OP2);
8010 Found |= Match(AArch64::FNMULHrr, 1, MCP::FNMULSUBH_OP1);
8012 case AArch64::FSUBSrr:
8013 Found = Match(AArch64::FMULSrr, 1, MCP::FMULSUBS_OP1);
8015 Found |= Match(AArch64::FMULSrr, 2, MCP::FMULSUBS_OP2) ||
8016 Match(AArch64::FMULv1i32_indexed, 2, MCP::FMLSv1i32_indexed_OP2);
8018 Found |= Match(AArch64::FNMULSrr, 1, MCP::FNMULSUBS_OP1);
8020 case AArch64::FSUBDrr:
8021 Found = Match(AArch64::FMULDrr, 1, MCP::FMULSUBD_OP1);
8023 Found |= Match(AArch64::FMULDrr, 2, MCP::FMULSUBD_OP2) ||
8024 Match(AArch64::FMULv1i64_indexed, 2, MCP::FMLSv1i64_indexed_OP2);
8026 Found |= Match(AArch64::FNMULDrr, 1, MCP::FNMULSUBD_OP1);
8028 case AArch64::FSUBv4f16:
8029 Found |= Match(AArch64::FMULv4i16_indexed, 2, MCP::FMLSv4i16_indexed_OP2) ||
8030 Match(AArch64::FMULv4f16, 2, MCP::FMLSv4f16_OP2);
8032 Found |= Match(AArch64::FMULv4i16_indexed, 1, MCP::FMLSv4i16_indexed_OP1) ||
8033 Match(AArch64::FMULv4f16, 1, MCP::FMLSv4f16_OP1);
8035 case AArch64::FSUBv8f16:
8036 Found |= Match(AArch64::FMULv8i16_indexed, 2, MCP::FMLSv8i16_indexed_OP2) ||
8037 Match(AArch64::FMULv8f16, 2, MCP::FMLSv8f16_OP2);
8039 Found |= Match(AArch64::FMULv8i16_indexed, 1, MCP::FMLSv8i16_indexed_OP1) ||
8040 Match(AArch64::FMULv8f16, 1, MCP::FMLSv8f16_OP1);
8042 case AArch64::FSUBv2f32:
8043 Found |= Match(AArch64::FMULv2i32_indexed, 2, MCP::FMLSv2i32_indexed_OP2) ||
8044 Match(AArch64::FMULv2f32, 2, MCP::FMLSv2f32_OP2);
8046 Found |= Match(AArch64::FMULv2i32_indexed, 1, MCP::FMLSv2i32_indexed_OP1) ||
8047 Match(AArch64::FMULv2f32, 1, MCP::FMLSv2f32_OP1);
8049 case AArch64::FSUBv2f64:
8050 Found |= Match(AArch64::FMULv2i64_indexed, 2, MCP::FMLSv2i64_indexed_OP2) ||
8051 Match(AArch64::FMULv2f64, 2, MCP::FMLSv2f64_OP2);
8053 Found |= Match(AArch64::FMULv2i64_indexed, 1, MCP::FMLSv2i64_indexed_OP1) ||
8054 Match(AArch64::FMULv2f64, 1, MCP::FMLSv2f64_OP1);
8056 case AArch64::FSUBv4f32:
8057 Found |= Match(AArch64::FMULv4i32_indexed, 2, MCP::FMLSv4i32_indexed_OP2) ||
8058 Match(AArch64::FMULv4f32, 2, MCP::FMLSv4f32_OP2);
8060 Found |= Match(AArch64::FMULv4i32_indexed, 1, MCP::FMLSv4i32_indexed_OP1) ||
8061 Match(AArch64::FMULv4f32, 1, MCP::FMLSv4f32_OP1);
8072 auto Match = [&](
unsigned Opcode,
int Operand,
unsigned Pattern) ->
bool {
8079 if (
MI &&
MI->getOpcode() == TargetOpcode::COPY &&
8080 MI->getOperand(1).getReg().isVirtual())
8082 if (
MI &&
MI->getOpcode() == Opcode) {
8094 case AArch64::FMULv2f32:
8095 Found = Match(AArch64::DUPv2i32lane, 1, MCP::FMULv2i32_indexed_OP1);
8096 Found |= Match(AArch64::DUPv2i32lane, 2, MCP::FMULv2i32_indexed_OP2);
8098 case AArch64::FMULv2f64:
8099 Found = Match(AArch64::DUPv2i64lane, 1, MCP::FMULv2i64_indexed_OP1);
8100 Found |= Match(AArch64::DUPv2i64lane, 2, MCP::FMULv2i64_indexed_OP2);
8102 case AArch64::FMULv4f16:
8103 Found = Match(AArch64::DUPv4i16lane, 1, MCP::FMULv4i16_indexed_OP1);
8104 Found |= Match(AArch64::DUPv4i16lane, 2, MCP::FMULv4i16_indexed_OP2);
8106 case AArch64::FMULv4f32:
8107 Found = Match(AArch64::DUPv4i32lane, 1, MCP::FMULv4i32_indexed_OP1);
8108 Found |= Match(AArch64::DUPv4i32lane, 2, MCP::FMULv4i32_indexed_OP2);
8110 case AArch64::FMULv8f16:
8111 Found = Match(AArch64::DUPv8i16lane, 1, MCP::FMULv8i16_indexed_OP1);
8112 Found |= Match(AArch64::DUPv8i16lane, 2, MCP::FMULv8i16_indexed_OP2);
8125 auto Match = [&](
unsigned Opcode,
unsigned Pattern) ->
bool {
8128 if (
MI !=
nullptr && (
MI->getOpcode() == Opcode) &&
8143 case AArch64::FNEGDr:
8145 case AArch64::FNEGSr:
8277 case AArch64::SUBWrr:
8278 case AArch64::SUBSWrr:
8279 case AArch64::SUBXrr:
8280 case AArch64::SUBSXrr:
8325 unsigned LoadLaneOpCode,
unsigned NumLanes) {
8348 while (!RemainingLanes.
empty() && CurrInstr &&
8349 CurrInstr->getOpcode() == LoadLaneOpCode &&
8351 CurrInstr->getNumOperands() == 4) {
8352 RemainingLanes.
erase(CurrInstr->getOperand(2).getImm());
8358 if (!RemainingLanes.
empty())
8362 if (CurrInstr->getOpcode() != TargetOpcode::SUBREG_TO_REG)
8366 auto Lane0LoadReg = CurrInstr->getOperand(1).getReg();
8367 unsigned SingleLaneSizeInBits = 128 / NumLanes;
8368 if (
TRI->getRegSizeInBits(Lane0LoadReg, MRI) != SingleLaneSizeInBits)
8384 RemainingLoadInstrs.
insert(LoadInstrs.
begin(), LoadInstrs.
end());
8387 for (; MBBItr !=
MBB->begin() && RemainingSteps > 0 &&
8388 !RemainingLoadInstrs.
empty();
8389 --MBBItr, --RemainingSteps) {
8393 RemainingLoadInstrs.
erase(&CurrInstr);
8403 if (RemainingSteps == 0 && !RemainingLoadInstrs.
empty())
8429 case AArch64::LD1i32:
8431 case AArch64::LD1i16:
8433 case AArch64::LD1i8:
8449 unsigned Pattern,
unsigned NumLanes) {
8457 for (
unsigned i = 0; i < NumLanes - 1; ++i) {
8465 return A->getOperand(2).getImm() >
B->getOperand(2).getImm();
8471 auto LoadToLaneInstrsAscending =
llvm::reverse(LoadToLaneInstrs);
8477 auto CreateLD1Instruction = [&](
MachineInstr *OriginalInstr,
8478 Register SrcRegister,
unsigned Lane,
8480 bool OffsetRegisterKillState) {
8489 InstrIdxForVirtReg.
insert(std::make_pair(NewRegister, InsInstrs.
size()));
8490 InsInstrs.
push_back(LoadIndexIntoRegister);
8496 auto CreateLDRInstruction =
8502 Opcode = AArch64::LDRSui;
8505 Opcode = AArch64::LDRHui;
8508 Opcode = AArch64::LDRBui;
8512 "Got unsupported number of lanes in machine-combiner gather pattern");
8522 auto LanesToLoadToReg0 =
8524 LoadToLaneInstrsAscending.begin() + NumLanes / 2);
8525 Register PrevReg = SubregToReg->getOperand(0).getReg();
8527 const MachineOperand &OffsetRegOperand = LoadInstr->getOperand(3);
8528 PrevReg = CreateLD1Instruction(LoadInstr, PrevReg, Index + 1,
8529 OffsetRegOperand.
getReg(),
8530 OffsetRegOperand.
isKill());
8537 MachineInstr *Lane0Load = *LoadToLaneInstrsAscending.begin();
8539 *std::next(LoadToLaneInstrsAscending.begin(), NumLanes / 2);
8546 CreateLDRInstruction(NumLanes, DestRegForMiddleIndex,
8547 OriginalSplitToLoadOffsetOperand.
getReg(),
8550 InstrIdxForVirtReg.
insert(
8551 std::make_pair(DestRegForMiddleIndex, InsInstrs.
size()));
8552 InsInstrs.
push_back(MiddleIndexLoadInstr);
8557 unsigned SubregType;
8560 SubregType = AArch64::ssub;
8563 SubregType = AArch64::hsub;
8566 SubregType = AArch64::bsub;
8570 "Got invalid NumLanes for machine-combiner gather pattern");
8573 auto SubRegToRegInstr =
8575 DestRegForSubregToReg)
8578 InstrIdxForVirtReg.
insert(
8579 std::make_pair(DestRegForSubregToReg, InsInstrs.
size()));
8583 auto LanesToLoadToReg1 =
8585 LoadToLaneInstrsAscending.end());
8586 PrevReg = SubRegToRegInstr->getOperand(0).getReg();
8588 const MachineOperand &OffsetRegOperand = LoadInstr->getOperand(3);
8589 PrevReg = CreateLD1Instruction(LoadInstr, PrevReg, Index + 1,
8590 OffsetRegOperand.
getReg(),
8591 OffsetRegOperand.
isKill());
8594 if (Index == NumLanes / 2 - 2) {
8629bool AArch64InstrInfo::getMachineCombinerPatterns(
8631 bool DoRegPressureReduce)
const {
8652 DoRegPressureReduce);
8681 const Register *ReplacedAddend =
nullptr) {
8682 assert(IdxMulOpd == 1 || IdxMulOpd == 2);
8684 unsigned IdxOtherOpd = IdxMulOpd == 1 ? 2 : 1;
8687 Register SrcReg0 = MUL->getOperand(1).getReg();
8688 bool Src0IsKill = MUL->getOperand(1).isKill();
8689 Register SrcReg1 = MUL->getOperand(2).getReg();
8690 bool Src1IsKill = MUL->getOperand(2).isKill();
8694 if (ReplacedAddend) {
8696 SrcReg2 = *ReplacedAddend;
8723 .
addImm(MUL->getOperand(3).getImm());
8730 assert(
false &&
"Invalid FMA instruction kind \n");
8744 if (AArch64::FPR32RegClass.hasSubClassEq(RC))
8745 Opc = AArch64::FNMADDSrrr;
8746 else if (AArch64::FPR64RegClass.hasSubClassEq(RC))
8747 Opc = AArch64::FNMADDDrrr;
8781 unsigned IdxDupOp,
unsigned MulOpc,
8783 assert(((IdxDupOp == 1) || (IdxDupOp == 2)) &&
8784 "Invalid index of FMUL operand");
8792 if (Dup->
getOpcode() == TargetOpcode::COPY)
8801 unsigned IdxMulOp = IdxDupOp == 1 ? 2 : 1;
8842 InstrIdxForVirtReg.
insert(std::make_pair(NewVR, 0));
8857 genNeg(MF, MRI,
TII, Root, InsInstrs, InstrIdxForVirtReg, MnegOpc, RC);
8884 genNeg(MF, MRI,
TII, Root, InsInstrs, InstrIdxForVirtReg, MnegOpc, RC);
8912 unsigned IdxMulOpd,
unsigned MaddOpc,
unsigned VR,
8914 assert(IdxMulOpd == 1 || IdxMulOpd == 2);
8918 Register SrcReg0 = MUL->getOperand(1).getReg();
8919 bool Src0IsKill = MUL->getOperand(1).isKill();
8920 Register SrcReg1 = MUL->getOperand(2).getReg();
8921 bool Src1IsKill = MUL->getOperand(2).isKill();
8951 assert(IdxOpd1 == 1 || IdxOpd1 == 2);
8952 unsigned IdxOtherOpd = IdxOpd1 == 1 ? 2 : 1;
8966 if (Opcode == AArch64::SUBSWrr)
8967 Opcode = AArch64::SUBWrr;
8968 else if (Opcode == AArch64::SUBSXrr)
8969 Opcode = AArch64::SUBXrr;
8971 assert((Opcode == AArch64::SUBWrr || Opcode == AArch64::SUBXrr) &&
8972 "Unexpected instruction opcode.");
8989 InstrIdxForVirtReg.
insert(std::make_pair(NewVR, 0));
8996unsigned AArch64InstrInfo::getReduceOpcodeForAccumulator(
8997 unsigned int AccumulatorOpCode)
const {
8998 switch (AccumulatorOpCode) {
8999 case AArch64::UABALB_ZZZ_D:
9000 case AArch64::SABALB_ZZZ_D:
9001 case AArch64::UABALT_ZZZ_D:
9002 case AArch64::SABALT_ZZZ_D:
9003 return AArch64::ADD_ZZZ_D;
9004 case AArch64::UABALB_ZZZ_H:
9005 case AArch64::SABALB_ZZZ_H:
9006 case AArch64::UABALT_ZZZ_H:
9007 case AArch64::SABALT_ZZZ_H:
9008 return AArch64::ADD_ZZZ_H;
9009 case AArch64::UABALB_ZZZ_S:
9010 case AArch64::SABALB_ZZZ_S:
9011 case AArch64::UABALT_ZZZ_S:
9012 case AArch64::SABALT_ZZZ_S:
9013 return AArch64::ADD_ZZZ_S;
9014 case AArch64::UABALv16i8_v8i16:
9015 case AArch64::SABALv8i8_v8i16:
9016 case AArch64::SABAv8i16:
9017 case AArch64::UABAv8i16:
9018 return AArch64::ADDv8i16;
9019 case AArch64::SABALv2i32_v2i64:
9020 case AArch64::UABALv2i32_v2i64:
9021 case AArch64::SABALv4i32_v2i64:
9022 return AArch64::ADDv2i64;
9023 case AArch64::UABALv4i16_v4i32:
9024 case AArch64::SABALv4i16_v4i32:
9025 case AArch64::SABALv8i16_v4i32:
9026 case AArch64::SABAv4i32:
9027 case AArch64::UABAv4i32:
9028 return AArch64::ADDv4i32;
9029 case AArch64::UABALv4i32_v2i64:
9030 return AArch64::ADDv2i64;
9031 case AArch64::UABALv8i16_v4i32:
9032 return AArch64::ADDv4i32;
9033 case AArch64::UABALv8i8_v8i16:
9034 case AArch64::SABALv16i8_v8i16:
9035 return AArch64::ADDv8i16;
9036 case AArch64::UABAv16i8:
9037 case AArch64::SABAv16i8:
9038 return AArch64::ADDv16i8;
9039 case AArch64::UABAv4i16:
9040 case AArch64::SABAv4i16:
9041 return AArch64::ADDv4i16;
9042 case AArch64::UABAv2i32:
9043 case AArch64::SABAv2i32:
9044 return AArch64::ADDv2i32;
9045 case AArch64::UABAv8i8:
9046 case AArch64::SABAv8i8:
9047 return AArch64::ADDv8i8;
9056void AArch64InstrInfo::genAlternativeCodeSequence(
9066 MachineInstr *
MUL =
nullptr;
9067 const TargetRegisterClass *RC;
9073 DelInstrs, InstrIdxForVirtReg);
9079 InstrIdxForVirtReg);
9085 InstrIdxForVirtReg);
9094 Opc = AArch64::MADDWrrr;
9095 RC = &AArch64::GPR32RegClass;
9097 Opc = AArch64::MADDXrrr;
9098 RC = &AArch64::GPR64RegClass;
9109 Opc = AArch64::MADDWrrr;
9110 RC = &AArch64::GPR32RegClass;
9112 Opc = AArch64::MADDXrrr;
9113 RC = &AArch64::GPR64RegClass;
9126 const TargetRegisterClass *RC;
9127 unsigned BitSize, MovImm;
9130 MovImm = AArch64::MOVi32imm;
9131 RC = &AArch64::GPR32spRegClass;
9133 Opc = AArch64::MADDWrrr;
9134 RC = &AArch64::GPR32RegClass;
9136 MovImm = AArch64::MOVi64imm;
9137 RC = &AArch64::GPR64spRegClass;
9139 Opc = AArch64::MADDXrrr;
9140 RC = &AArch64::GPR64RegClass;
9151 uint64_t UImm =
SignExtend64(IsSub ? -Imm : Imm, BitSize);
9155 if (Insn.
size() != 1)
9157 MachineInstrBuilder MIB1 =
9158 BuildMI(MF, MIMetadata(Root),
TII->get(MovImm), NewVR)
9159 .
addImm(IsSub ? -Imm : Imm);
9161 InstrIdxForVirtReg.
insert(std::make_pair(NewVR, 0));
9172 const TargetRegisterClass *SubRC;
9173 unsigned SubOpc, ZeroReg;
9175 SubOpc = AArch64::SUBWrr;
9176 SubRC = &AArch64::GPR32spRegClass;
9177 ZeroReg = AArch64::WZR;
9178 Opc = AArch64::MADDWrrr;
9179 RC = &AArch64::GPR32RegClass;
9181 SubOpc = AArch64::SUBXrr;
9182 SubRC = &AArch64::GPR64spRegClass;
9183 ZeroReg = AArch64::XZR;
9184 Opc = AArch64::MADDXrrr;
9185 RC = &AArch64::GPR64RegClass;
9189 MachineInstrBuilder MIB1 =
9190 BuildMI(MF, MIMetadata(Root),
TII->get(SubOpc), NewVR)
9194 InstrIdxForVirtReg.
insert(std::make_pair(NewVR, 0));
9205 Opc = AArch64::MSUBWrrr;
9206 RC = &AArch64::GPR32RegClass;
9208 Opc = AArch64::MSUBXrrr;
9209 RC = &AArch64::GPR64RegClass;
9214 Opc = AArch64::MLAv8i8;
9215 RC = &AArch64::FPR64RegClass;
9219 Opc = AArch64::MLAv8i8;
9220 RC = &AArch64::FPR64RegClass;
9224 Opc = AArch64::MLAv16i8;
9225 RC = &AArch64::FPR128RegClass;
9229 Opc = AArch64::MLAv16i8;
9230 RC = &AArch64::FPR128RegClass;
9234 Opc = AArch64::MLAv4i16;
9235 RC = &AArch64::FPR64RegClass;
9239 Opc = AArch64::MLAv4i16;
9240 RC = &AArch64::FPR64RegClass;
9244 Opc = AArch64::MLAv8i16;
9245 RC = &AArch64::FPR128RegClass;
9249 Opc = AArch64::MLAv8i16;
9250 RC = &AArch64::FPR128RegClass;
9254 Opc = AArch64::MLAv2i32;
9255 RC = &AArch64::FPR64RegClass;
9259 Opc = AArch64::MLAv2i32;
9260 RC = &AArch64::FPR64RegClass;
9264 Opc = AArch64::MLAv4i32;
9265 RC = &AArch64::FPR128RegClass;
9269 Opc = AArch64::MLAv4i32;
9270 RC = &AArch64::FPR128RegClass;
9275 Opc = AArch64::MLAv8i8;
9276 RC = &AArch64::FPR64RegClass;
9278 InstrIdxForVirtReg, 1,
Opc, AArch64::NEGv8i8,
9282 Opc = AArch64::MLSv8i8;
9283 RC = &AArch64::FPR64RegClass;
9287 Opc = AArch64::MLAv16i8;
9288 RC = &AArch64::FPR128RegClass;
9290 InstrIdxForVirtReg, 1,
Opc, AArch64::NEGv16i8,
9294 Opc = AArch64::MLSv16i8;
9295 RC = &AArch64::FPR128RegClass;
9299 Opc = AArch64::MLAv4i16;
9300 RC = &AArch64::FPR64RegClass;
9302 InstrIdxForVirtReg, 1,
Opc, AArch64::NEGv4i16,
9306 Opc = AArch64::MLSv4i16;
9307 RC = &AArch64::FPR64RegClass;
9311 Opc = AArch64::MLAv8i16;
9312 RC = &AArch64::FPR128RegClass;
9314 InstrIdxForVirtReg, 1,
Opc, AArch64::NEGv8i16,
9318 Opc = AArch64::MLSv8i16;
9319 RC = &AArch64::FPR128RegClass;
9323 Opc = AArch64::MLAv2i32;
9324 RC = &AArch64::FPR64RegClass;
9326 InstrIdxForVirtReg, 1,
Opc, AArch64::NEGv2i32,
9330 Opc = AArch64::MLSv2i32;
9331 RC = &AArch64::FPR64RegClass;
9335 Opc = AArch64::MLAv4i32;
9336 RC = &AArch64::FPR128RegClass;
9338 InstrIdxForVirtReg, 1,
Opc, AArch64::NEGv4i32,
9342 Opc = AArch64::MLSv4i32;
9343 RC = &AArch64::FPR128RegClass;
9348 Opc = AArch64::MLAv4i16_indexed;
9349 RC = &AArch64::FPR64RegClass;
9353 Opc = AArch64::MLAv4i16_indexed;
9354 RC = &AArch64::FPR64RegClass;
9358 Opc = AArch64::MLAv8i16_indexed;
9359 RC = &AArch64::FPR128RegClass;
9363 Opc = AArch64::MLAv8i16_indexed;
9364 RC = &AArch64::FPR128RegClass;
9368 Opc = AArch64::MLAv2i32_indexed;
9369 RC = &AArch64::FPR64RegClass;
9373 Opc = AArch64::MLAv2i32_indexed;
9374 RC = &AArch64::FPR64RegClass;
9378 Opc = AArch64::MLAv4i32_indexed;
9379 RC = &AArch64::FPR128RegClass;
9383 Opc = AArch64::MLAv4i32_indexed;
9384 RC = &AArch64::FPR128RegClass;
9389 Opc = AArch64::MLAv4i16_indexed;
9390 RC = &AArch64::FPR64RegClass;
9392 InstrIdxForVirtReg, 1,
Opc, AArch64::NEGv4i16,
9396 Opc = AArch64::MLSv4i16_indexed;
9397 RC = &AArch64::FPR64RegClass;
9401 Opc = AArch64::MLAv8i16_indexed;
9402 RC = &AArch64::FPR128RegClass;
9404 InstrIdxForVirtReg, 1,
Opc, AArch64::NEGv8i16,
9408 Opc = AArch64::MLSv8i16_indexed;
9409 RC = &AArch64::FPR128RegClass;
9413 Opc = AArch64::MLAv2i32_indexed;
9414 RC = &AArch64::FPR64RegClass;
9416 InstrIdxForVirtReg, 1,
Opc, AArch64::NEGv2i32,
9420 Opc = AArch64::MLSv2i32_indexed;
9421 RC = &AArch64::FPR64RegClass;
9425 Opc = AArch64::MLAv4i32_indexed;
9426 RC = &AArch64::FPR128RegClass;
9428 InstrIdxForVirtReg, 1,
Opc, AArch64::NEGv4i32,
9432 Opc = AArch64::MLSv4i32_indexed;
9433 RC = &AArch64::FPR128RegClass;
9439 Opc = AArch64::FMADDHrrr;
9440 RC = &AArch64::FPR16RegClass;
9444 Opc = AArch64::FMADDSrrr;
9445 RC = &AArch64::FPR32RegClass;
9449 Opc = AArch64::FMADDDrrr;
9450 RC = &AArch64::FPR64RegClass;
9455 Opc = AArch64::FMADDHrrr;
9456 RC = &AArch64::FPR16RegClass;
9460 Opc = AArch64::FMADDSrrr;
9461 RC = &AArch64::FPR32RegClass;
9465 Opc = AArch64::FMADDDrrr;
9466 RC = &AArch64::FPR64RegClass;
9471 Opc = AArch64::FMLAv1i32_indexed;
9472 RC = &AArch64::FPR32RegClass;
9477 Opc = AArch64::FMLAv1i32_indexed;
9478 RC = &AArch64::FPR32RegClass;
9484 Opc = AArch64::FMLAv1i64_indexed;
9485 RC = &AArch64::FPR64RegClass;
9490 Opc = AArch64::FMLAv1i64_indexed;
9491 RC = &AArch64::FPR64RegClass;
9497 RC = &AArch64::FPR64RegClass;
9498 Opc = AArch64::FMLAv4i16_indexed;
9503 RC = &AArch64::FPR64RegClass;
9504 Opc = AArch64::FMLAv4f16;
9509 RC = &AArch64::FPR64RegClass;
9510 Opc = AArch64::FMLAv4i16_indexed;
9515 RC = &AArch64::FPR64RegClass;
9516 Opc = AArch64::FMLAv4f16;
9523 RC = &AArch64::FPR64RegClass;
9525 Opc = AArch64::FMLAv2i32_indexed;
9529 Opc = AArch64::FMLAv2f32;
9536 RC = &AArch64::FPR64RegClass;
9538 Opc = AArch64::FMLAv2i32_indexed;
9542 Opc = AArch64::FMLAv2f32;
9549 RC = &AArch64::FPR128RegClass;
9550 Opc = AArch64::FMLAv8i16_indexed;
9555 RC = &AArch64::FPR128RegClass;
9556 Opc = AArch64::FMLAv8f16;
9561 RC = &AArch64::FPR128RegClass;
9562 Opc = AArch64::FMLAv8i16_indexed;
9567 RC = &AArch64::FPR128RegClass;
9568 Opc = AArch64::FMLAv8f16;
9575 RC = &AArch64::FPR128RegClass;
9577 Opc = AArch64::FMLAv2i64_indexed;
9581 Opc = AArch64::FMLAv2f64;
9588 RC = &AArch64::FPR128RegClass;
9590 Opc = AArch64::FMLAv2i64_indexed;
9594 Opc = AArch64::FMLAv2f64;
9602 RC = &AArch64::FPR128RegClass;
9604 Opc = AArch64::FMLAv4i32_indexed;
9608 Opc = AArch64::FMLAv4f32;
9616 RC = &AArch64::FPR128RegClass;
9618 Opc = AArch64::FMLAv4i32_indexed;
9622 Opc = AArch64::FMLAv4f32;
9629 Opc = AArch64::FNMSUBHrrr;
9630 RC = &AArch64::FPR16RegClass;
9634 Opc = AArch64::FNMSUBSrrr;
9635 RC = &AArch64::FPR32RegClass;
9639 Opc = AArch64::FNMSUBDrrr;
9640 RC = &AArch64::FPR64RegClass;
9645 Opc = AArch64::FNMADDHrrr;
9646 RC = &AArch64::FPR16RegClass;
9650 Opc = AArch64::FNMADDSrrr;
9651 RC = &AArch64::FPR32RegClass;
9655 Opc = AArch64::FNMADDDrrr;
9656 RC = &AArch64::FPR64RegClass;
9661 Opc = AArch64::FMSUBHrrr;
9662 RC = &AArch64::FPR16RegClass;
9666 Opc = AArch64::FMSUBSrrr;
9667 RC = &AArch64::FPR32RegClass;
9671 Opc = AArch64::FMSUBDrrr;
9672 RC = &AArch64::FPR64RegClass;
9677 Opc = AArch64::FMLSv1i32_indexed;
9678 RC = &AArch64::FPR32RegClass;
9684 Opc = AArch64::FMLSv1i64_indexed;
9685 RC = &AArch64::FPR64RegClass;
9692 RC = &AArch64::FPR64RegClass;
9694 MachineInstrBuilder MIB1 =
9695 BuildMI(MF, MIMetadata(Root),
TII->get(AArch64::FNEGv4f16), NewVR)
9698 InstrIdxForVirtReg.
insert(std::make_pair(NewVR, 0));
9700 Opc = AArch64::FMLAv4f16;
9704 Opc = AArch64::FMLAv4i16_indexed;
9711 RC = &AArch64::FPR64RegClass;
9712 Opc = AArch64::FMLSv4f16;
9717 RC = &AArch64::FPR64RegClass;
9718 Opc = AArch64::FMLSv4i16_indexed;
9725 RC = &AArch64::FPR64RegClass;
9727 Opc = AArch64::FMLSv2i32_indexed;
9731 Opc = AArch64::FMLSv2f32;
9739 RC = &AArch64::FPR128RegClass;
9741 MachineInstrBuilder MIB1 =
9742 BuildMI(MF, MIMetadata(Root),
TII->get(AArch64::FNEGv8f16), NewVR)
9745 InstrIdxForVirtReg.
insert(std::make_pair(NewVR, 0));
9747 Opc = AArch64::FMLAv8f16;
9751 Opc = AArch64::FMLAv8i16_indexed;
9758 RC = &AArch64::FPR128RegClass;
9759 Opc = AArch64::FMLSv8f16;
9764 RC = &AArch64::FPR128RegClass;
9765 Opc = AArch64::FMLSv8i16_indexed;
9772 RC = &AArch64::FPR128RegClass;
9774 Opc = AArch64::FMLSv2i64_indexed;
9778 Opc = AArch64::FMLSv2f64;
9786 RC = &AArch64::FPR128RegClass;
9788 Opc = AArch64::FMLSv4i32_indexed;
9792 Opc = AArch64::FMLSv4f32;
9799 RC = &AArch64::FPR64RegClass;
9801 MachineInstrBuilder MIB1 =
9802 BuildMI(MF, MIMetadata(Root),
TII->get(AArch64::FNEGv2f32), NewVR)
9805 InstrIdxForVirtReg.
insert(std::make_pair(NewVR, 0));
9807 Opc = AArch64::FMLAv2i32_indexed;
9811 Opc = AArch64::FMLAv2f32;
9819 RC = &AArch64::FPR128RegClass;
9821 MachineInstrBuilder MIB1 =
9822 BuildMI(MF, MIMetadata(Root),
TII->get(AArch64::FNEGv4f32), NewVR)
9825 InstrIdxForVirtReg.
insert(std::make_pair(NewVR, 0));
9827 Opc = AArch64::FMLAv4i32_indexed;
9831 Opc = AArch64::FMLAv4f32;
9839 RC = &AArch64::FPR128RegClass;
9841 MachineInstrBuilder MIB1 =
9842 BuildMI(MF, MIMetadata(Root),
TII->get(AArch64::FNEGv2f64), NewVR)
9845 InstrIdxForVirtReg.
insert(std::make_pair(NewVR, 0));
9847 Opc = AArch64::FMLAv2i64_indexed;
9851 Opc = AArch64::FMLAv2f64;
9863 &AArch64::FPR128RegClass, MRI);
9872 &AArch64::FPR128RegClass, MRI);
9881 &AArch64::FPR128_loRegClass, MRI);
9890 &AArch64::FPR128RegClass, MRI);
9899 &AArch64::FPR128_loRegClass, MRI);
9933 for (
auto *
MI : InsInstrs)
9934 MI->setFlags(Flags);
9975 bool IsNegativeBranch =
false;
9976 bool IsTestAndBranch =
false;
9977 unsigned TargetBBInMI = 0;
9978 switch (
MI.getOpcode()) {
9982 case AArch64::CBWPri:
9983 case AArch64::CBXPri:
9984 case AArch64::CBBAssertExt:
9985 case AArch64::CBHAssertExt:
9986 case AArch64::CBWPrr:
9987 case AArch64::CBXPrr:
9993 case AArch64::CBNZW:
9994 case AArch64::CBNZX:
9996 IsNegativeBranch =
true;
10001 IsTestAndBranch =
true;
10003 case AArch64::TBNZW:
10004 case AArch64::TBNZX:
10006 IsNegativeBranch =
true;
10007 IsTestAndBranch =
true;
10013 if (IsTestAndBranch &&
MI.getOperand(1).getImm())
10017 assert(
MI.getParent() &&
"Incomplete machine instruction\n");
10028 while (
DefMI->isCopy()) {
10037 switch (
DefMI->getOpcode()) {
10041 case AArch64::ANDWri:
10042 case AArch64::ANDXri: {
10043 if (IsTestAndBranch)
10050 bool Is32Bit = (
DefMI->getOpcode() == AArch64::ANDWri);
10052 DefMI->getOperand(2).getImm(), Is32Bit ? 32 : 64);
10066 unsigned Imm =
Log2_64(Mask);
10067 unsigned Opc = (Imm < 32)
10068 ? (IsNegativeBranch ? AArch64::TBNZW : AArch64::TBZW)
10069 : (IsNegativeBranch ? AArch64::TBNZX : AArch64::TBZX);
10082 if (!Is32Bit && Imm < 32)
10084 MI.eraseFromParent();
10088 case AArch64::CSINCWr:
10089 case AArch64::CSINCXr: {
10090 if (!(
DefMI->getOperand(1).getReg() == AArch64::WZR &&
10091 DefMI->getOperand(2).getReg() == AArch64::WZR) &&
10092 !(
DefMI->getOperand(1).getReg() == AArch64::XZR &&
10093 DefMI->getOperand(2).getReg() == AArch64::XZR))
10096 if (
DefMI->findRegisterDefOperandIdx(AArch64::NZCV,
nullptr,
10109 if (IsNegativeBranch)
10112 MI.eraseFromParent();
10118std::pair<unsigned, unsigned>
10119AArch64InstrInfo::decomposeMachineOperandsTargetFlags(
unsigned TF)
const {
10121 return std::make_pair(TF & Mask, TF & ~Mask);
10125AArch64InstrInfo::getSerializableDirectMachineOperandTargetFlags()
const {
10128 static const std::pair<unsigned, const char *> TargetFlags[] = {
10129 {MO_PAGE,
"aarch64-page"}, {
MO_PAGEOFF,
"aarch64-pageoff"},
10130 {
MO_G3,
"aarch64-g3"}, {
MO_G2,
"aarch64-g2"},
10131 {
MO_G1,
"aarch64-g1"}, {
MO_G0,
"aarch64-g0"},
10137AArch64InstrInfo::getSerializableBitmaskMachineOperandTargetFlags()
const {
10138 using namespace AArch64II;
10140 static const std::pair<unsigned, const char *> TargetFlags[] = {
10142 {
MO_GOT,
"aarch64-got"},
10143 {
MO_NC,
"aarch64-nc"},
10144 {
MO_S,
"aarch64-s"},
10145 {
MO_TLS,
"aarch64-tls"},
10155AArch64InstrInfo::getSerializableMachineMemOperandTargetFlags()
const {
10156 static const std::pair<MachineMemOperand::Flags, const char *> TargetFlags[] =
10258 MachineFunction *MF =
C.getMF();
10260 const AArch64RegisterInfo *ARI =
10261 static_cast<const AArch64RegisterInfo *
>(&
TRI);
10264 for (
unsigned Reg : AArch64::GPR64RegClass) {
10266 Reg != AArch64::LR &&
10267 Reg != AArch64::X16 &&
10268 Reg != AArch64::X17 &&
10269 C.isAvailableAcrossAndOutOfSeq(
Reg,
TRI) &&
10270 C.isAvailableInsideSeq(
Reg,
TRI))
10301 return SubtargetA.hasV8_3aOps() == SubtargetB.hasV8_3aOps();
10304std::optional<std::unique_ptr<outliner::OutlinedFunction>>
10305AArch64InstrInfo::getOutliningCandidateInfo(
10307 std::vector<outliner::Candidate> &RepeatedSequenceLocs,
10308 unsigned MinRepeats)
const {
10309 unsigned SequenceSize = 0;
10310 for (
auto &
MI : RepeatedSequenceLocs[0])
10313 unsigned NumBytesToCreateFrame = 0;
10319 MachineInstr &LastMI = RepeatedSequenceLocs[0].back();
10320 MachineInstr &FirstMI = RepeatedSequenceLocs[0].front();
10321 if (LastMI.
getOpcode() == AArch64::ADRP &&
10324 return std::nullopt;
10329 if ((FirstMI.
getOpcode() == AArch64::ADDXri ||
10330 FirstMI.
getOpcode() == AArch64::LDRXui) &&
10333 return std::nullopt;
10344 if (std::adjacent_find(
10345 RepeatedSequenceLocs.begin(), RepeatedSequenceLocs.end(),
10346 [](
const outliner::Candidate &a,
const outliner::Candidate &b) {
10349 if (outliningCandidatesSigningScopeConsensus(a, b) &&
10350 outliningCandidatesSigningKeyConsensus(a, b) &&
10351 outliningCandidatesV8_3OpsConsensus(a, b)) {
10355 }) != RepeatedSequenceLocs.end()) {
10356 return std::nullopt;
10373 unsigned NumBytesToCheckLRInTCEpilogue = 0;
10374 const auto RASignCondition = RepeatedSequenceLocs[0]
10377 ->getSignReturnAddressCondition();
10380 NumBytesToCreateFrame += 8;
10383 auto LRCheckMethod = Subtarget.getAuthenticatedLRCheckMethod(
10384 *RepeatedSequenceLocs[0].getMF());
10385 NumBytesToCheckLRInTCEpilogue =
10389 if (isTailCallReturnInst(RepeatedSequenceLocs[0].
back()))
10390 SequenceSize += NumBytesToCheckLRInTCEpilogue;
10398 for (
auto &
MI :
C) {
10399 if (
MI.modifiesRegister(AArch64::SP, &
TRI)) {
10400 switch (
MI.getOpcode()) {
10401 case AArch64::ADDXri:
10402 case AArch64::ADDWri:
10403 assert(
MI.getNumOperands() == 4 &&
"Wrong number of operands");
10404 assert(
MI.getOperand(2).isImm() &&
10405 "Expected operand to be immediate");
10406 assert(
MI.getOperand(1).isReg() &&
10407 "Expected operand to be a register");
10411 if (
MI.getOperand(1).getReg() == AArch64::SP)
10412 SPValue +=
MI.getOperand(2).getImm();
10416 case AArch64::SUBXri:
10417 case AArch64::SUBWri:
10418 assert(
MI.getNumOperands() == 4 &&
"Wrong number of operands");
10419 assert(
MI.getOperand(2).isImm() &&
10420 "Expected operand to be immediate");
10421 assert(
MI.getOperand(1).isReg() &&
10422 "Expected operand to be a register");
10426 if (
MI.getOperand(1).getReg() == AArch64::SP)
10427 SPValue -=
MI.getOperand(2).getImm();
10444 if (RepeatedSequenceLocs.size() < MinRepeats)
10445 return std::nullopt;
10449 unsigned FlagsSetInAll = 0xF;
10453 FlagsSetInAll &=
C.Flags;
10455 unsigned LastInstrOpcode = RepeatedSequenceLocs[0].back().getOpcode();
10458 auto SetCandidateCallInfo =
10459 [&RepeatedSequenceLocs](
unsigned CallID,
unsigned NumBytesForCall) {
10461 C.setCallInfo(CallID, NumBytesForCall);
10465 NumBytesToCreateFrame += 4;
10473 unsigned CFICount = 0;
10474 for (
auto &
I : RepeatedSequenceLocs[0]) {
10475 if (
I.isCFIInstruction())
10485 std::vector<MCCFIInstruction> CFIInstructions =
10486 C.getMF()->getFrameInstructions();
10488 if (CFICount > 0 && CFICount != CFIInstructions.size())
10489 return std::nullopt;
10497 if (!
MI.modifiesRegister(AArch64::SP, &
TRI) &&
10498 !
MI.readsRegister(AArch64::SP, &
TRI))
10504 if (
MI.modifiesRegister(AArch64::SP, &
TRI))
10509 if (
MI.mayLoadOrStore()) {
10512 bool OffsetIsScalable;
10516 if (!getMemOperandWithOffset(
MI,
Base,
Offset, OffsetIsScalable, &
TRI) ||
10517 !
Base->isReg() ||
Base->getReg() != AArch64::SP)
10521 if (OffsetIsScalable)
10529 TypeSize Scale(0U,
false), DummyWidth(0U,
false);
10530 getMemOpInfo(
MI.getOpcode(), Scale, DummyWidth, MinOffset, MaxOffset);
10533 if (
Offset < MinOffset * (int64_t)Scale.getFixedValue() ||
10534 Offset > MaxOffset * (int64_t)Scale.getFixedValue())
10549 bool AllStackInstrsSafe =
10554 if (RepeatedSequenceLocs[0].
back().isTerminator()) {
10556 NumBytesToCreateFrame = 0;
10557 unsigned NumBytesForCall = 4 + NumBytesToCheckLRInTCEpilogue;
10561 else if (LastInstrOpcode == AArch64::BL ||
10562 ((LastInstrOpcode == AArch64::BLR ||
10563 LastInstrOpcode == AArch64::BLRNoIP) &&
10567 NumBytesToCreateFrame = NumBytesToCheckLRInTCEpilogue;
10575 unsigned NumBytesNoStackCalls = 0;
10576 std::vector<outliner::Candidate> CandidatesWithoutStackFixups;
10582 ?
C.isAvailableAcrossAndOutOfSeq(AArch64::LR,
TRI)
10591 C.getMF()->getFunction().hasFnAttribute(Attribute::NoReturn);
10594 if (LRAvailable && !IsNoReturn) {
10595 NumBytesNoStackCalls += 4;
10597 CandidatesWithoutStackFixups.push_back(
C);
10602 else if (findRegisterToSaveLRTo(
C)) {
10603 NumBytesNoStackCalls += 12;
10605 CandidatesWithoutStackFixups.push_back(
C);
10610 else if (
C.isAvailableInsideSeq(AArch64::SP,
TRI)) {
10611 NumBytesNoStackCalls += 12;
10613 CandidatesWithoutStackFixups.push_back(
C);
10619 NumBytesNoStackCalls += SequenceSize;
10626 if (!AllStackInstrsSafe ||
10627 NumBytesNoStackCalls <= RepeatedSequenceLocs.size() * 12) {
10628 RepeatedSequenceLocs = CandidatesWithoutStackFixups;
10630 if (RepeatedSequenceLocs.size() < MinRepeats)
10631 return std::nullopt;
10684 (!
C.isAvailableAcrossAndOutOfSeq(AArch64::LR,
TRI) ||
10685 !findRegisterToSaveLRTo(
C));
10691 if (RepeatedSequenceLocs.size() < MinRepeats)
10692 return std::nullopt;
10701 bool ModStackToSaveLR =
false;
10704 ModStackToSaveLR =
true;
10713 ModStackToSaveLR =
true;
10715 if (ModStackToSaveLR) {
10717 if (!AllStackInstrsSafe)
10718 return std::nullopt;
10721 NumBytesToCreateFrame += 8;
10728 return std::nullopt;
10730 return std::make_unique<outliner::OutlinedFunction>(
10731 RepeatedSequenceLocs, SequenceSize, NumBytesToCreateFrame, FrameID);
10734void AArch64InstrInfo::mergeOutliningCandidateAttributes(
10735 Function &
F, std::vector<outliner::Candidate> &Candidates)
const {
10739 const auto &CFn = Candidates.front().getMF()->getFunction();
10741 if (CFn.hasFnAttribute(
"ptrauth-returns"))
10742 F.addFnAttr(CFn.getFnAttribute(
"ptrauth-returns"));
10743 if (CFn.hasFnAttribute(
"ptrauth-auth-traps"))
10744 F.addFnAttr(CFn.getFnAttribute(
"ptrauth-auth-traps"));
10747 if (CFn.hasFnAttribute(
"sign-return-address"))
10748 F.addFnAttr(CFn.getFnAttribute(
"sign-return-address"));
10749 if (CFn.hasFnAttribute(
"sign-return-address-key"))
10750 F.addFnAttr(CFn.getFnAttribute(
"sign-return-address-key"));
10752 AArch64GenInstrInfo::mergeOutliningCandidateAttributes(
F, Candidates);
10755bool AArch64InstrInfo::isFunctionSafeToOutlineFrom(
10760 if (!OutlineFromLinkOnceODRs &&
F.hasLinkOnceODRLinkage())
10767 if (
F.hasSection())
10773 AArch64FunctionInfo *AFI = MF.
getInfo<AArch64FunctionInfo>();
10774 if (!AFI || AFI->
hasRedZone().value_or(
true))
10794 unsigned &Flags)
const {
10796 "Must track liveness!");
10798 std::pair<MachineBasicBlock::iterator, MachineBasicBlock::iterator>>
10813 auto AreAllUnsafeRegsDead = [&LRU]() {
10814 return LRU.available(AArch64::W16) && LRU.available(AArch64::W17) &&
10815 LRU.available(AArch64::NZCV);
10830 bool LRAvailableEverywhere =
true;
10832 LRU.addLiveOuts(
MBB);
10834 auto UpdateWholeMBBFlags = [&
Flags](
const MachineInstr &
MI) {
10835 if (
MI.isCall() && !
MI.isTerminator())
10841 auto CreateNewRangeStartingAt =
10842 [&RangeBegin, &RangeEnd,
10844 RangeBegin = NewBegin;
10845 RangeEnd = std::next(RangeBegin);
10848 auto SaveRangeIfNonEmpty = [&RangeLen, &
Ranges, &RangeBegin, &RangeEnd]() {
10854 if (!RangeBegin.isEnd() && RangeBegin->isBundledWithPred())
10856 if (!RangeEnd.isEnd() && RangeEnd->isBundledWithPred())
10858 Ranges.emplace_back(RangeBegin, RangeEnd);
10866 for (; FirstPossibleEndPt !=
MBB.
instr_rend(); ++FirstPossibleEndPt) {
10867 if (!FirstPossibleEndPt->isDebugInstr())
10868 LRU.stepBackward(*FirstPossibleEndPt);
10871 UpdateWholeMBBFlags(*FirstPossibleEndPt);
10872 if (AreAllUnsafeRegsDead())
10879 CreateNewRangeStartingAt(FirstPossibleEndPt->getIterator());
10884 if (!
MI.isDebugInstr())
10885 LRU.stepBackward(
MI);
10886 UpdateWholeMBBFlags(
MI);
10887 if (!AreAllUnsafeRegsDead()) {
10888 SaveRangeIfNonEmpty();
10889 CreateNewRangeStartingAt(
MI.getIterator());
10892 LRAvailableEverywhere &= LRU.available(AArch64::LR);
10893 RangeBegin =
MI.getIterator();
10898 if (AreAllUnsafeRegsDead())
10899 SaveRangeIfNonEmpty();
10907 if (!LRAvailableEverywhere)
10915 unsigned Flags)
const {
10916 MachineInstr &
MI = *MIT;
10920 switch (
MI.getOpcode()) {
10921 case AArch64::PACM:
10922 case AArch64::PACIASP:
10923 case AArch64::PACIBSP:
10924 case AArch64::PACIASPPC:
10925 case AArch64::PACIBSPPC:
10926 case AArch64::AUTIASP:
10927 case AArch64::AUTIBSP:
10928 case AArch64::AUTIASPPCi:
10929 case AArch64::AUTIASPPCr:
10930 case AArch64::AUTIBSPPCi:
10931 case AArch64::AUTIBSPPCr:
10932 case AArch64::RETAA:
10933 case AArch64::RETAB:
10934 case AArch64::RETAASPPCi:
10935 case AArch64::RETAASPPCr:
10936 case AArch64::RETABSPPCi:
10937 case AArch64::RETABSPPCr:
10938 case AArch64::EMITBKEY:
10939 case AArch64::PAUTH_PROLOGUE:
10940 case AArch64::PAUTH_EPILOGUE:
10950 if (
MI.isCFIInstruction())
10954 if (
MI.isTerminator())
10960 for (
const MachineOperand &MOP :
MI.operands()) {
10963 assert(!MOP.isCFIIndex());
10966 if (MOP.isReg() && !MOP.isImplicit() &&
10967 (MOP.getReg() == AArch64::LR || MOP.getReg() == AArch64::W30))
10974 if (
MI.getOpcode() == AArch64::ADRP)
10994 for (
const MachineOperand &MOP :
MI.operands()) {
10995 if (MOP.isGlobal()) {
11003 if (Callee &&
Callee->getName() ==
"\01_mcount")
11011 if (
MI.getOpcode() == AArch64::BLR ||
11012 MI.getOpcode() == AArch64::BLRNoIP ||
MI.getOpcode() == AArch64::BL)
11016 return UnknownCallOutlineType;
11024 return UnknownCallOutlineType;
11032 return UnknownCallOutlineType;
11053 for (MachineInstr &
MI :
MBB) {
11054 const MachineOperand *
Base;
11055 TypeSize Width(0,
false);
11057 bool OffsetIsScalable;
11060 if (!
MI.mayLoadOrStore() ||
11063 (
Base->isReg() &&
Base->getReg() != AArch64::SP))
11067 TypeSize Scale(0U,
false);
11068 int64_t Dummy1, Dummy2;
11071 assert(StackOffsetOperand.
isImm() &&
"Stack offset wasn't immediate!");
11073 assert(Scale != 0 &&
"Unexpected opcode!");
11074 assert(!OffsetIsScalable &&
"Expected offset to be a byte offset");
11079 int64_t NewImm = (
Offset + 16) / (int64_t)Scale.getFixedValue();
11080 StackOffsetOperand.
setImm(NewImm);
11086 bool ShouldSignReturnAddr) {
11087 if (!ShouldSignReturnAddr)
11095void AArch64InstrInfo::buildOutlinedFrame(
11099 AArch64FunctionInfo *FI = MF.
getInfo<AArch64FunctionInfo>();
11107 unsigned TailOpcode;
11109 TailOpcode = AArch64::TCRETURNdi;
11113 TailOpcode = AArch64::TCRETURNriALL;
11124 bool IsLeafFunction =
true;
11127 auto IsNonTailCall = [](
const MachineInstr &
MI) {
11128 return MI.isCall() && !
MI.isReturn();
11138 "Can only fix up stack references once");
11139 fixupPostOutline(
MBB);
11141 IsLeafFunction =
false;
11152 Et = std::prev(
MBB.
end());
11162 if (MF.
getInfo<AArch64FunctionInfo>()->needsDwarfUnwindInfo(MF)) {
11166 CFIBuilder.buildDefCFAOffset(16);
11170 CFIBuilder.buildOffset(AArch64::LR, -16);
11184 RASignCondition, !IsLeafFunction);
11213 fixupPostOutline(
MBB);
11224 .addGlobalAddress(
M.getNamedValue(MF.
getName()))
11234 .addGlobalAddress(
M.getNamedValue(MF.
getName())));
11243 MachineInstr *Save;
11244 MachineInstr *Restore;
11250 assert(
Reg &&
"No callee-saved register available?");
11284 .addGlobalAddress(
M.getNamedValue(MF.
getName())));
11292bool AArch64InstrInfo::shouldOutlineFromFunctionByDefault(
11300 bool AllowSideEffects)
const {
11302 const AArch64Subtarget &STI = MF.
getSubtarget<AArch64Subtarget>();
11305 if (
TRI.isGeneralPurposeRegister(MF,
Reg)) {
11318 assert(STI.hasNEON() &&
"Expected to have NEON.");
11324std::optional<DestSourcePair>
11329 if (((
MI.getOpcode() == AArch64::ORRWrs &&
11330 MI.getOperand(1).getReg() == AArch64::WZR &&
11331 MI.getOperand(3).getImm() == 0x0) ||
11332 (
MI.getOpcode() == AArch64::ORRWrr &&
11333 MI.getOperand(1).getReg() == AArch64::WZR)) &&
11335 (!
MI.getOperand(0).getReg().isVirtual() ||
11336 MI.getOperand(0).getSubReg() == 0) &&
11337 (!
MI.getOperand(0).getReg().isPhysical() ||
11342 if (
MI.getOpcode() == AArch64::ORRXrs &&
11343 MI.getOperand(1).getReg() == AArch64::XZR &&
11344 MI.getOperand(3).getImm() == 0x0)
11347 return std::nullopt;
11350std::optional<DestSourcePair>
11352 if ((
MI.getOpcode() == AArch64::ORRWrs &&
11353 MI.getOperand(1).getReg() == AArch64::WZR &&
11354 MI.getOperand(3).getImm() == 0x0) ||
11355 (
MI.getOpcode() == AArch64::ORRWrr &&
11356 MI.getOperand(1).getReg() == AArch64::WZR))
11358 return std::nullopt;
11361std::optional<RegImmPair>
11370 return std::nullopt;
11372 switch (
MI.getOpcode()) {
11374 return std::nullopt;
11375 case AArch64::SUBWri:
11376 case AArch64::SUBXri:
11377 case AArch64::SUBSWri:
11378 case AArch64::SUBSXri:
11381 case AArch64::ADDSWri:
11382 case AArch64::ADDSXri:
11383 case AArch64::ADDWri:
11384 case AArch64::ADDXri: {
11386 if (!
MI.getOperand(0).isReg() || !
MI.getOperand(1).isReg() ||
11387 !
MI.getOperand(2).isImm())
11388 return std::nullopt;
11389 int Shift =
MI.getOperand(3).getImm();
11390 assert((Shift == 0 || Shift == 12) &&
"Shift can be either 0 or 12");
11394 return RegImmPair{
MI.getOperand(1).getReg(),
Offset};
11400static std::optional<ParamLoadedValue>
11404 auto DestSrc =
TII->isCopyLikeInstr(
MI);
11406 return std::nullopt;
11408 Register DestReg = DestSrc->Destination->getReg();
11409 Register SrcReg = DestSrc->Source->getReg();
11412 return std::nullopt;
11417 if (DestReg == DescribedReg)
11421 if (
MI.getOpcode() == AArch64::ORRWrs &&
11422 TRI->isSuperRegister(DestReg, DescribedReg))
11426 if (
MI.getOpcode() == AArch64::ORRXrs &&
11427 TRI->isSubRegister(DestReg, DescribedReg)) {
11428 Register SrcSubReg =
TRI->getSubReg(SrcReg, AArch64::sub_32);
11432 assert(!
TRI->isSuperOrSubRegisterEq(DestReg, DescribedReg) &&
11433 "Unhandled ORR[XW]rs copy case");
11435 return std::nullopt;
11438bool AArch64InstrInfo::isFunctionSafeToSplit(
const MachineFunction &MF)
const {
11443 if (MF.
getInfo<AArch64FunctionInfo>()->hasRedZone().value_or(
true))
11449bool AArch64InstrInfo::isMBBSafeToSplitToCold(
11453 auto isAsmGoto = [](
const MachineInstr &
MI) {
11454 return MI.getOpcode() == AArch64::INLINEASM_BR;
11464 auto containsMBB = [&
MBB](
const MachineJumpTableEntry &JTE) {
11471 for (
const MachineInstr &
MI :
MBB) {
11472 switch (
MI.getOpcode()) {
11473 case TargetOpcode::G_BRJT:
11474 case AArch64::JumpTableDest32:
11475 case AArch64::JumpTableDest16:
11476 case AArch64::JumpTableDest8:
11487std::optional<ParamLoadedValue>
11490 const MachineFunction *MF =
MI.getMF();
11492 switch (
MI.getOpcode()) {
11493 case AArch64::MOVZWi:
11494 case AArch64::MOVZXi: {
11497 if (!
TRI->isSuperRegisterEq(
MI.getOperand(0).getReg(),
Reg))
11498 return std::nullopt;
11500 if (!
MI.getOperand(1).isImm())
11501 return std::nullopt;
11502 int64_t Immediate =
MI.getOperand(1).getImm();
11503 int Shift =
MI.getOperand(2).getImm();
11507 case AArch64::ORRWrs:
11508 case AArch64::ORRXrs:
11515bool AArch64InstrInfo::isExtendLikelyToBeFolded(
11518 ExtMI.
getOpcode() == TargetOpcode::G_ZEXT ||
11519 ExtMI.
getOpcode() == TargetOpcode::G_ANYEXT);
11522 if (ExtMI.
getOpcode() == TargetOpcode::G_ANYEXT)
11532 return UserMI->
getOpcode() == TargetOpcode::G_PTR_ADD;
11535uint64_t AArch64InstrInfo::getElementSizeForOpcode(
unsigned Opc)
const {
11539bool AArch64InstrInfo::isPTestLikeOpcode(
unsigned Opc)
const {
11543bool AArch64InstrInfo::isWhileOpcode(
unsigned Opc)
const {
11548AArch64InstrInfo::getTailDuplicateSize(
CodeGenOptLevel OptLevel)
const {
11552bool AArch64InstrInfo::isLegalAddressingMode(
unsigned NumBytes, int64_t
Offset,
11553 unsigned Scale)
const {
11564 unsigned Shift =
Log2_64(NumBytes);
11565 if (NumBytes &&
Offset > 0 && (
Offset / NumBytes) <= (1LL << 12) - 1 &&
11573 return Scale == 1 || (Scale > 0 && Scale == NumBytes);
11578 return AArch64::BLRNoIP;
11580 return AArch64::BLR;
11586 auto Builder =
BuildMI(
MBB, InsertPt,
DL,
get(AArch64::PAUTH_EPILOGUE))
11596 if (Subtarget.hasPAuthLR())
11607 Register TargetReg,
bool FrameSetup)
const {
11608 assert(TargetReg != AArch64::SP &&
"New top of stack cannot already be in SP");
11620 MF.
insert(MBBInsertPoint, LoopTestMBB);
11623 MF.
insert(MBBInsertPoint, LoopBodyMBB);
11625 MF.
insert(MBBInsertPoint, ExitMBB);
11635 BuildMI(*LoopTestMBB, LoopTestMBB->
end(),
DL,
TII->get(AArch64::SUBSXrx64),
11643 BuildMI(*LoopTestMBB, LoopTestMBB->
end(),
DL,
TII->get(AArch64::Bcc))
11649 BuildMI(*LoopBodyMBB, LoopBodyMBB->
end(),
DL,
TII->get(AArch64::LDRXui))
11666 BuildMI(*ExitMBB, ExitMBB->
end(),
DL,
TII->get(AArch64::ADDXri), AArch64::SP)
11685 MBB.addSuccessor(LoopTestMBB);
11691 return ExitMBB->
begin();
11696 MachineFunction *MF;
11697 const TargetInstrInfo *
TII;
11698 const TargetRegisterInfo *
TRI;
11699 MachineRegisterInfo &MRI;
11702 MachineBasicBlock *LoopBB;
11704 MachineInstr *CondBranch;
11706 MachineInstr *Comp;
11708 unsigned CompCounterOprNum;
11710 MachineInstr *Update;
11712 unsigned UpdateCounterOprNum;
11716 bool IsUpdatePriorComp;
11722 AArch64PipelinerLoopInfo(MachineBasicBlock *LoopBB, MachineInstr *CondBranch,
11723 MachineInstr *Comp,
unsigned CompCounterOprNum,
11724 MachineInstr *Update,
unsigned UpdateCounterOprNum,
11725 Register Init,
bool IsUpdatePriorComp,
11726 const SmallVectorImpl<MachineOperand> &
Cond)
11728 TII(MF->getSubtarget().getInstrInfo()),
11729 TRI(MF->getSubtarget().getRegisterInfo()), MRI(MF->getRegInfo()),
11730 LoopBB(LoopBB), CondBranch(CondBranch), Comp(Comp),
11731 CompCounterOprNum(CompCounterOprNum), Update(Update),
11732 UpdateCounterOprNum(UpdateCounterOprNum), Init(Init),
11735 bool shouldIgnoreForPipelining(
const MachineInstr *
MI)
const override {
11741 std::optional<bool> createTripCountGreaterCondition(
11742 int TC, MachineBasicBlock &
MBB,
11743 SmallVectorImpl<MachineOperand> &CondParam)
override {
11751 void createRemainingIterationsGreaterCondition(
11752 int TC, MachineBasicBlock &
MBB, SmallVectorImpl<MachineOperand> &
Cond,
11753 DenseMap<MachineInstr *, MachineInstr *> &LastStage0Insts)
override;
11755 void setPreheader(MachineBasicBlock *NewPreheader)
override {}
11757 void adjustTripCount(
int TripCountAdjust)
override {}
11759 bool isMVEExpanderSupported()
override {
return true; }
11778 }
else if (
I == ReplaceOprNum) {
11783 MBB.insert(InsertTo, NewMI);
11787void AArch64PipelinerLoopInfo::createRemainingIterationsGreaterCondition(
11803 assert(CondBranch->getOpcode() == AArch64::Bcc);
11807 if (CondBranch->getOperand(1).getMBB() == LoopBB)
11814 auto AccumulateCond = [&](
Register CurCond,
11825 if (!LastStage0Insts.
empty() && LastStage0Insts[Comp]->getParent() == &
MBB) {
11829 for (
int I = 0;
I <= TC; ++
I) {
11835 AccCond = AccumulateCond(AccCond, CC);
11839 if (Update != Comp && IsUpdatePriorComp) {
11841 LastStage0Insts[Comp]->getOperand(CompCounterOprNum).getReg();
11842 NextCounter =
cloneInstr(Update, UpdateCounterOprNum, Counter,
MBB,
11846 NextCounter = LastStage0Insts[Update]->getOperand(0).getReg();
11848 }
else if (Update != Comp) {
11853 Counter = NextCounter;
11857 if (LastStage0Insts.
empty()) {
11861 if (IsUpdatePriorComp)
11866 Counter = LastStage0Insts[Comp]->getOperand(CompCounterOprNum).getReg();
11869 for (
int I = 0;
I <= TC; ++
I) {
11873 AccCond = AccumulateCond(AccCond, CC);
11874 if (
I != TC && Update != Comp)
11877 Counter = NextCounter;
11893 assert(Phi.getNumOperands() == 5);
11894 if (Phi.getOperand(2).getMBB() ==
MBB) {
11895 RegMBB = Phi.getOperand(1).getReg();
11896 RegOther = Phi.getOperand(3).getReg();
11898 assert(Phi.getOperand(4).getMBB() ==
MBB);
11899 RegMBB = Phi.getOperand(3).getReg();
11900 RegOther = Phi.getOperand(1).getReg();
11905 if (!
Reg.isVirtual())
11914 unsigned &UpdateCounterOprNum,
Register &InitReg,
11915 bool &IsUpdatePriorComp) {
11929 if (!
Reg.isVirtual())
11932 UpdateInst =
nullptr;
11933 UpdateCounterOprNum = 0;
11935 IsUpdatePriorComp =
true;
11939 if (Def->getParent() != LoopBB)
11941 if (Def->isCopy()) {
11943 if (Def->getOperand(0).getSubReg() || Def->getOperand(1).getSubReg())
11945 CurReg = Def->getOperand(1).getReg();
11946 }
else if (Def->isPHI()) {
11950 IsUpdatePriorComp =
false;
11955 switch (Def->getOpcode()) {
11956 case AArch64::ADDSXri:
11957 case AArch64::ADDSWri:
11958 case AArch64::SUBSXri:
11959 case AArch64::SUBSWri:
11960 case AArch64::ADDXri:
11961 case AArch64::ADDWri:
11962 case AArch64::SUBXri:
11963 case AArch64::SUBWri:
11965 UpdateCounterOprNum = 1;
11967 case AArch64::ADDSXrr:
11968 case AArch64::ADDSWrr:
11969 case AArch64::SUBSXrr:
11970 case AArch64::SUBSWrr:
11971 case AArch64::ADDXrr:
11972 case AArch64::ADDWrr:
11973 case AArch64::SUBXrr:
11974 case AArch64::SUBWrr:
11977 UpdateCounterOprNum = 1;
11979 UpdateCounterOprNum = 2;
11986 CurReg = Def->getOperand(UpdateCounterOprNum).getReg();
12001std::unique_ptr<TargetInstrInfo::PipelinerLoopInfo>
12012 if (
MI.isCall() ||
MI.hasUnmodeledSideEffects())
12023 if (
TBB == LoopBB && FBB == LoopBB)
12027 if (
TBB != LoopBB && FBB ==
nullptr)
12030 assert((
TBB == LoopBB || FBB == LoopBB) &&
12031 "The Loop must be a single-basic-block loop");
12036 if (CondBranch->
getOpcode() != AArch64::Bcc)
12044 unsigned CompCounterOprNum = 0;
12046 if (
MI.modifiesRegister(AArch64::NZCV, &
TRI)) {
12050 switch (
MI.getOpcode()) {
12051 case AArch64::SUBSXri:
12052 case AArch64::SUBSWri:
12053 case AArch64::ADDSXri:
12054 case AArch64::ADDSWri:
12056 CompCounterOprNum = 1;
12058 case AArch64::ADDSWrr:
12059 case AArch64::ADDSXrr:
12060 case AArch64::SUBSWrr:
12061 case AArch64::SUBSXrr:
12065 if (isWhileOpcode(
MI.getOpcode())) {
12072 if (CompCounterOprNum == 0) {
12074 CompCounterOprNum = 2;
12076 CompCounterOprNum = 1;
12088 bool IsUpdatePriorComp;
12089 unsigned UpdateCounterOprNum;
12091 Update, UpdateCounterOprNum,
Init, IsUpdatePriorComp))
12094 return std::make_unique<AArch64PipelinerLoopInfo>(
12095 LoopBB, CondBranch, Comp, CompCounterOprNum, Update, UpdateCounterOprNum,
12105 TypeSize Scale(0U,
false), Width(0U,
false);
12106 int64_t MinOffset, MaxOffset;
12107 if (
getMemOpInfo(
MI.getOpcode(), Scale, Width, MinOffset, MaxOffset)) {
12109 if (
MI.getOperand(ImmIdx).isImm() && !
MI.getOperand(ImmIdx - 1).isFI()) {
12110 int64_t Imm =
MI.getOperand(ImmIdx).getImm();
12111 if (Imm < MinOffset || Imm > MaxOffset) {
12112 ErrInfo =
"Unexpected immediate on load/store instruction";
12118 const MCInstrDesc &MCID =
MI.getDesc();
12120 const MachineOperand &MO =
MI.getOperand(
Op);
12124 ErrInfo =
"OPERAND_IMPLICIT_IMM_0 should be 0";
12133 ErrInfo =
"OPERAND_SHIFT_MSL should be msl shift of 8 or 16";
12144#define GET_INSTRINFO_HELPERS
12145#define GET_INSTRMAP_INFO
12146#include "AArch64GenInstrInfo.inc"
MachineInstrBuilder & UseMI
MachineInstrBuilder MachineInstrBuilder & DefMI
static bool forwardCopyWillClobberTuple(unsigned DestReg, unsigned SrcReg, unsigned NumRegs)
static cl::opt< unsigned > BCCDisplacementBits("aarch64-bcc-offset-bits", cl::Hidden, cl::init(19), cl::desc("Restrict range of Bcc instructions (DEBUG)"))
static Register genNeg(MachineFunction &MF, MachineRegisterInfo &MRI, const TargetInstrInfo *TII, MachineInstr &Root, SmallVectorImpl< MachineInstr * > &InsInstrs, DenseMap< Register, unsigned > &InstrIdxForVirtReg, unsigned MnegOpc, const TargetRegisterClass *RC)
genNeg - Helper to generate an intermediate negation of the second operand of Root
static bool isFrameStoreOpcode(int Opcode)
static cl::opt< unsigned > GatherOptSearchLimit("aarch64-search-limit", cl::Hidden, cl::init(2048), cl::desc("Restrict range of instructions to search for the " "machine-combiner gather pattern optimization"))
static bool getMaddPatterns(MachineInstr &Root, SmallVectorImpl< unsigned > &Patterns)
Find instructions that can be turned into madd.
static AArch64CC::CondCode findCondCodeUsedByInstr(const MachineInstr &Instr)
Find a condition code used by the instruction.
static MachineInstr * genFusedMultiplyAcc(MachineFunction &MF, MachineRegisterInfo &MRI, const TargetInstrInfo *TII, MachineInstr &Root, SmallVectorImpl< MachineInstr * > &InsInstrs, unsigned IdxMulOpd, unsigned MaddOpc, const TargetRegisterClass *RC)
genFusedMultiplyAcc - Helper to generate fused multiply accumulate instructions.
static MachineInstr * genFusedMultiplyAccNeg(MachineFunction &MF, MachineRegisterInfo &MRI, const TargetInstrInfo *TII, MachineInstr &Root, SmallVectorImpl< MachineInstr * > &InsInstrs, DenseMap< Register, unsigned > &InstrIdxForVirtReg, unsigned IdxMulOpd, unsigned MaddOpc, unsigned MnegOpc, const TargetRegisterClass *RC)
genFusedMultiplyAccNeg - Helper to generate fused multiply accumulate instructions with an additional...
static bool isCombineInstrCandidate64(unsigned Opc)
static bool isFrameLoadOpcode(int Opcode)
static unsigned removeCopies(const MachineRegisterInfo &MRI, unsigned VReg)
static bool areCFlagsAccessedBetweenInstrs(MachineBasicBlock::iterator From, MachineBasicBlock::iterator To, const TargetRegisterInfo *TRI, const AccessKind AccessToCheck=AK_All)
True when condition flags are accessed (either by writing or reading) on the instruction trace starti...
static bool getFMAPatterns(MachineInstr &Root, SmallVectorImpl< unsigned > &Patterns)
Floating-Point Support.
static bool isADDSRegImm(unsigned Opcode)
static bool isCheapCopy(const MachineInstr &MI, const AArch64RegisterInfo &RI)
static bool isANDOpcode(MachineInstr &MI)
static void appendOffsetComment(int NumBytes, llvm::raw_string_ostream &Comment, StringRef RegScale={})
static unsigned sForm(MachineInstr &Instr)
Get opcode of S version of Instr.
static bool isCombineInstrSettingFlag(unsigned Opc)
static bool getFNEGPatterns(MachineInstr &Root, SmallVectorImpl< unsigned > &Patterns)
static bool getIndVarInfo(Register Reg, const MachineBasicBlock *LoopBB, MachineInstr *&UpdateInst, unsigned &UpdateCounterOprNum, Register &InitReg, bool &IsUpdatePriorComp)
If Reg is an induction variable, return true and set some parameters.
static bool canPairLdStOpc(unsigned FirstOpc, unsigned SecondOpc)
static bool mustAvoidNeonAtMBBI(const AArch64Subtarget &Subtarget, MachineBasicBlock &MBB, MachineBasicBlock::iterator I)
Returns true if in a streaming call site region without SME-FA64.
static bool isPostIndexLdStOpcode(unsigned Opcode)
Return true if the opcode is a post-index ld/st instruction, which really loads from base+0.
static std::optional< unsigned > getLFIInstSizeInBytes(const MachineInstr &MI)
Return the maximum number of bytes of code the specified instruction may be after LFI rewriting.
static unsigned getBranchDisplacementBits(unsigned Opc)
static cl::opt< unsigned > CBDisplacementBits("aarch64-cb-offset-bits", cl::Hidden, cl::init(9), cl::desc("Restrict range of CB instructions (DEBUG)"))
static std::optional< ParamLoadedValue > describeORRLoadedValue(const MachineInstr &MI, Register DescribedReg, const TargetInstrInfo *TII, const TargetRegisterInfo *TRI)
If the given ORR instruction is a copy, and DescribedReg overlaps with the destination register then,...
static bool getFMULPatterns(MachineInstr &Root, SmallVectorImpl< unsigned > &Patterns)
static void appendReadRegExpr(SmallVectorImpl< char > &Expr, unsigned RegNum)
static MachineInstr * genMaddR(MachineFunction &MF, MachineRegisterInfo &MRI, const TargetInstrInfo *TII, MachineInstr &Root, SmallVectorImpl< MachineInstr * > &InsInstrs, unsigned IdxMulOpd, unsigned MaddOpc, unsigned VR, const TargetRegisterClass *RC)
genMaddR - Generate madd instruction and combine mul and add using an extra virtual register Example ...
static Register cloneInstr(const MachineInstr *MI, unsigned ReplaceOprNum, Register ReplaceReg, MachineBasicBlock &MBB, MachineBasicBlock::iterator InsertTo)
Clone an instruction from MI.
static bool scaleOffset(unsigned Opc, int64_t &Offset)
static bool canCombineWithFMUL(MachineBasicBlock &MBB, MachineOperand &MO, unsigned MulOpc)
unsigned scaledOffsetOpcode(unsigned Opcode, unsigned &Scale)
static MachineInstr * genFusedMultiplyIdx(MachineFunction &MF, MachineRegisterInfo &MRI, const TargetInstrInfo *TII, MachineInstr &Root, SmallVectorImpl< MachineInstr * > &InsInstrs, unsigned IdxMulOpd, unsigned MaddOpc, const TargetRegisterClass *RC)
genFusedMultiplyIdx - Helper to generate fused multiply accumulate instructions.
static MachineInstr * genIndexedMultiply(MachineInstr &Root, SmallVectorImpl< MachineInstr * > &InsInstrs, unsigned IdxDupOp, unsigned MulOpc, const TargetRegisterClass *RC, MachineRegisterInfo &MRI)
Fold (FMUL x (DUP y lane)) into (FMUL_indexed x y lane)
static bool isSUBSRegImm(unsigned Opcode)
static bool UpdateOperandRegClass(MachineInstr &Instr)
static const TargetRegisterClass * getRegClass(const MachineInstr &MI, Register Reg)
static bool isInStreamingCallSiteRegion(MachineBasicBlock &MBB, MachineBasicBlock::iterator I)
Returns true if the instruction at I is in a streaming call site region, within a single basic block.
static bool canCmpInstrBeRemoved(MachineInstr &MI, MachineInstr &CmpInstr, int CmpValue, const TargetRegisterInfo &TRI, SmallVectorImpl< MachineInstr * > &CCUseInstrs, bool &IsInvertCC)
unsigned unscaledOffsetOpcode(unsigned Opcode)
static bool getLoadPatterns(MachineInstr &Root, SmallVectorImpl< unsigned > &Patterns)
Search for patterns of LD instructions we can optimize.
static bool canInstrSubstituteCmpInstr(MachineInstr &MI, MachineInstr &CmpInstr, const TargetRegisterInfo &TRI)
Check if CmpInstr can be substituted by MI.
static UsedNZCV getUsedNZCV(AArch64CC::CondCode CC)
static bool isCombineInstrCandidateFP(const MachineInstr &Inst)
static void appendLoadRegExpr(SmallVectorImpl< char > &Expr, int64_t OffsetFromDefCFA)
static void appendConstantExpr(SmallVectorImpl< char > &Expr, int64_t Constant, dwarf::LocationAtom Operation)
static unsigned convertToNonFlagSettingOpc(const MachineInstr &MI)
Return the opcode that does not set flags when possible - otherwise return the original opcode.
static bool outliningCandidatesV8_3OpsConsensus(const outliner::Candidate &a, const outliner::Candidate &b)
static bool isCombineInstrCandidate32(unsigned Opc)
static void parseCondBranch(MachineInstr *LastInst, MachineBasicBlock *&Target, SmallVectorImpl< MachineOperand > &Cond)
static unsigned offsetExtendOpcode(unsigned Opcode)
static void loadRegPairFromStackSlot(const TargetRegisterInfo &TRI, MachineBasicBlock &MBB, MachineBasicBlock::iterator InsertBefore, const MCInstrDesc &MCID, Register DestReg, unsigned SubIdx0, unsigned SubIdx1, int FI, MachineMemOperand *MMO)
static void generateGatherLanePattern(MachineInstr &Root, SmallVectorImpl< MachineInstr * > &InsInstrs, SmallVectorImpl< MachineInstr * > &DelInstrs, DenseMap< Register, unsigned > &InstrIdxForVirtReg, unsigned Pattern, unsigned NumLanes)
Generate optimized instruction sequence for gather load patterns to improve Memory-Level Parallelism ...
static bool getMiscPatterns(MachineInstr &Root, SmallVectorImpl< unsigned > &Patterns)
Find other MI combine patterns.
static bool outliningCandidatesSigningKeyConsensus(const outliner::Candidate &a, const outliner::Candidate &b)
static const MachineInstrBuilder & AddSubReg(const MachineInstrBuilder &MIB, MCRegister Reg, unsigned SubIdx, RegState State, const TargetRegisterInfo *TRI)
static bool outliningCandidatesSigningScopeConsensus(const outliner::Candidate &a, const outliner::Candidate &b)
static bool shouldClusterFI(const MachineFrameInfo &MFI, int FI1, int64_t Offset1, unsigned Opcode1, int FI2, int64_t Offset2, unsigned Opcode2)
static cl::opt< unsigned > TBZDisplacementBits("aarch64-tbz-offset-bits", cl::Hidden, cl::init(14), cl::desc("Restrict range of TB[N]Z instructions (DEBUG)"))
static void extractPhiReg(const MachineInstr &Phi, const MachineBasicBlock *MBB, Register &RegMBB, Register &RegOther)
static MCCFIInstruction createDefCFAExpression(const TargetRegisterInfo &TRI, unsigned Reg, const StackOffset &Offset)
static bool isDefinedOutside(Register Reg, const MachineBasicBlock *BB)
static MachineInstr * genFusedMultiply(MachineFunction &MF, MachineRegisterInfo &MRI, const TargetInstrInfo *TII, MachineInstr &Root, SmallVectorImpl< MachineInstr * > &InsInstrs, unsigned IdxMulOpd, unsigned MaddOpc, const TargetRegisterClass *RC, FMAInstKind kind=FMAInstKind::Default, const Register *ReplacedAddend=nullptr)
genFusedMultiply - Generate fused multiply instructions.
static bool getGatherLanePattern(MachineInstr &Root, SmallVectorImpl< unsigned > &Patterns, unsigned LoadLaneOpCode, unsigned NumLanes)
Check if the given instruction forms a gather load pattern that can be optimized for better Memory-Le...
static MachineInstr * genFusedMultiplyIdxNeg(MachineFunction &MF, MachineRegisterInfo &MRI, const TargetInstrInfo *TII, MachineInstr &Root, SmallVectorImpl< MachineInstr * > &InsInstrs, DenseMap< Register, unsigned > &InstrIdxForVirtReg, unsigned IdxMulOpd, unsigned MaddOpc, unsigned MnegOpc, const TargetRegisterClass *RC)
genFusedMultiplyAccNeg - Helper to generate fused multiply accumulate instructions with an additional...
static bool isCombineInstrCandidate(unsigned Opc)
static unsigned regOffsetOpcode(unsigned Opcode)
MachineOutlinerClass
Constants defining how certain sequences should be outlined.
@ MachineOutlinerTailCall
Emit a save, restore, call, and return.
@ MachineOutlinerRegSave
Emit a call and tail-call.
@ MachineOutlinerNoLRSave
Only emit a branch.
@ MachineOutlinerThunk
Emit a call and return.
static cl::opt< unsigned > BDisplacementBits("aarch64-b-offset-bits", cl::Hidden, cl::init(26), cl::desc("Restrict range of B instructions (DEBUG)"))
static bool areCFlagsAliveInSuccessors(const MachineBasicBlock *MBB)
Check if AArch64::NZCV should be alive in successors of MBB.
static void emitFrameOffsetAdj(MachineBasicBlock &MBB, MachineBasicBlock::iterator MBBI, const DebugLoc &DL, unsigned DestReg, unsigned SrcReg, int64_t Offset, unsigned Opc, const TargetInstrInfo *TII, MachineInstr::MIFlag Flag, bool NeedsWinCFI, bool *HasWinCFI, bool EmitCFAOffset, StackOffset CFAOffset, unsigned FrameReg)
static bool isCheapImmediate(const MachineInstr &MI, unsigned BitSize)
static cl::opt< unsigned > CBZDisplacementBits("aarch64-cbz-offset-bits", cl::Hidden, cl::init(19), cl::desc("Restrict range of CB[N]Z instructions (DEBUG)"))
static void genSubAdd2SubSub(MachineFunction &MF, MachineRegisterInfo &MRI, const TargetInstrInfo *TII, MachineInstr &Root, SmallVectorImpl< MachineInstr * > &InsInstrs, SmallVectorImpl< MachineInstr * > &DelInstrs, unsigned IdxOpd1, DenseMap< Register, unsigned > &InstrIdxForVirtReg)
Do the following transformation A - (B + C) ==> (A - B) - C A - (B + C) ==> (A - C) - B.
static unsigned canFoldIntoCSel(const MachineRegisterInfo &MRI, unsigned VReg, unsigned *NewReg=nullptr)
static void signOutlinedFunction(MachineFunction &MF, MachineBasicBlock &MBB, const AArch64InstrInfo *TII, bool ShouldSignReturnAddr)
static MachineInstr * genFNegatedMAD(MachineFunction &MF, MachineRegisterInfo &MRI, const TargetInstrInfo *TII, MachineInstr &Root, SmallVectorImpl< MachineInstr * > &InsInstrs)
static bool canCombineWithMUL(MachineBasicBlock &MBB, MachineOperand &MO, unsigned MulOpc, unsigned ZeroReg)
static void storeRegPairToStackSlot(const TargetRegisterInfo &TRI, MachineBasicBlock &MBB, MachineBasicBlock::iterator InsertBefore, const MCInstrDesc &MCID, Register SrcReg, bool IsKill, unsigned SubIdx0, unsigned SubIdx1, int FI, MachineMemOperand *MMO)
assert(UImm &&(UImm !=~static_cast< T >(0)) &&"Invalid immediate!")
MachineBasicBlock MachineBasicBlock::iterator DebugLoc DL
MachineBasicBlock MachineBasicBlock::iterator MBBI
static const Function * getParent(const Value *V)
static GCRegistry::Add< ErlangGC > A("erlang", "erlang-compatible garbage collector")
static GCRegistry::Add< OcamlGC > B("ocaml", "ocaml 3.10-compatible GC")
DXIL Forward Handle Accesses
const HexagonInstrInfo * TII
Module.h This file contains the declarations for the Module class.
const AbstractManglingParser< Derived, Alloc >::OperatorInfo AbstractManglingParser< Derived, Alloc >::Ops[]
This file implements the LivePhysRegs utility for tracking liveness of physical registers.
Machine Check Debug Module
Register const TargetRegisterInfo * TRI
Promote Memory to Register
static MCRegister getReg(const MCDisassembler *D, unsigned RC, unsigned RegNo)
MachineInstr unsigned OpIdx
ConstantRange Range(APInt(BitWidth, Low), APInt(BitWidth, High))
PowerPC Reduce CR logical Operation
const SmallVectorImpl< MachineOperand > MachineBasicBlock * TBB
const SmallVectorImpl< MachineOperand > & Cond
This file declares the machine register scavenger class.
static bool contains(SmallPtrSetImpl< ConstantExpr * > &Cache, ConstantExpr *Expr, Constant *C)
This file defines the SmallSet class.
This file defines the SmallVector class.
This file defines the 'Statistic' class, which is designed to be an easy way to expose various metric...
#define STATISTIC(VARNAME, DESC)
#define DEBUG_WITH_TYPE(TYPE,...)
DEBUG_WITH_TYPE macro - This macro should be used by passes to emit debug information.
static bool canCombine(MachineBasicBlock &MBB, MachineOperand &MO, unsigned CombineOpc=0)
AArch64FunctionInfo - This class is derived from MachineFunctionInfo and contains private AArch64-spe...
bool branchTargetEnforcement() const
unsigned getArgumentStackToRestore() const
SignReturnAddress getSignReturnAddressCondition() const
bool hasStreamingModeChanges() const
void setOutliningStyle(const std::string &Style)
bool branchProtectionPAuthLR() const
std::optional< bool > hasRedZone() const
static bool shouldSignReturnAddress(SignReturnAddress Condition, bool IsLRSpilled)
bool shouldSignWithBKey() const
static bool isHForm(const MachineInstr &MI)
Returns whether the instruction is in H form (16 bit operands)
void insertSelect(MachineBasicBlock &MBB, MachineBasicBlock::iterator MI, const DebugLoc &DL, Register DstReg, ArrayRef< MachineOperand > Cond, Register TrueReg, Register FalseReg) const override
static bool hasBTISemantics(const MachineInstr &MI)
Returns whether the instruction can be compatible with non-zero BTYPE.
static bool isQForm(const MachineInstr &MI)
Returns whether the instruction is in Q form (128 bit operands)
static bool getMemOpInfo(unsigned Opcode, TypeSize &Scale, TypeSize &Width, int64_t &MinOffset, int64_t &MaxOffset)
Returns true if opcode Opc is a memory operation.
static bool isTailCallReturnInst(const MachineInstr &MI)
Returns true if MI is one of the TCRETURN* instructions.
static bool isFPRCopy(const MachineInstr &MI)
Does this instruction rename an FPR without modifying bits?
MachineInstr * emitLdStWithAddr(MachineInstr &MemI, const ExtAddrMode &AM) const override
std::optional< DestSourcePair > isCopyInstrImpl(const MachineInstr &MI) const override
If the specific machine instruction is an instruction that moves/copies value from one register to an...
MachineBasicBlock * getBranchDestBlock(const MachineInstr &MI) const override
unsigned getInstSizeInBytes(const MachineInstr &MI) const override
GetInstSize - Return the number of bytes of code the specified instruction may be.
static bool isZExtLoad(const MachineInstr &MI)
Returns whether the instruction is a zero-extending load.
bool areMemAccessesTriviallyDisjoint(const MachineInstr &MIa, const MachineInstr &MIb) const override
void copyPhysReg(MachineBasicBlock &MBB, MachineBasicBlock::iterator I, const DebugLoc &DL, Register DestReg, Register SrcReg, bool KillSrc, bool RenamableDest=false, bool RenamableSrc=false) const override
static bool isGPRCopy(const MachineInstr &MI)
Does this instruction rename a GPR without modifying bits?
static unsigned convertToFlagSettingOpc(unsigned Opc)
Return the opcode that set flags when possible.
void createPauthEpilogueInstr(MachineBasicBlock &MBB, DebugLoc DL) const
Return true when there is potentially a faster code sequence for an instruction chain ending in Root.
bool isBranchOffsetInRange(unsigned BranchOpc, int64_t BrOffset) const override
bool canInsertSelect(const MachineBasicBlock &, ArrayRef< MachineOperand > Cond, Register, Register, Register, int &, int &, int &) const override
Register isLoadFromStackSlotPostFE(const MachineInstr &MI, int &FrameIndex) const override
Check for post-frame ptr elimination stack locations as well.
static const MachineOperand & getLdStOffsetOp(const MachineInstr &MI)
Returns the immediate offset operator of a load/store.
bool isCoalescableExtInstr(const MachineInstr &MI, Register &SrcReg, Register &DstReg, unsigned &SubIdx) const override
static std::optional< unsigned > getUnscaledLdSt(unsigned Opc)
Returns the unscaled load/store for the scaled load/store opcode, if there is a corresponding unscale...
static bool hasUnscaledLdStOffset(unsigned Opc)
Return true if it has an unscaled load/store offset.
static const MachineOperand & getLdStAmountOp(const MachineInstr &MI)
Returns the shift amount operator of a load/store.
static bool isPreLdSt(const MachineInstr &MI)
Returns whether the instruction is a pre-indexed load/store.
std::optional< ExtAddrMode > getAddrModeFromMemoryOp(const MachineInstr &MemI, const TargetRegisterInfo *TRI) const override
bool getMemOperandsWithOffsetWidth(const MachineInstr &MI, SmallVectorImpl< const MachineOperand * > &BaseOps, int64_t &Offset, bool &OffsetIsScalable, LocationSize &Width, const TargetRegisterInfo *TRI) const override
bool analyzeBranchPredicate(MachineBasicBlock &MBB, MachineBranchPredicate &MBP, bool AllowModify) const override
void insertIndirectBranch(MachineBasicBlock &MBB, MachineBasicBlock &NewDestBB, MachineBasicBlock &RestoreBB, const DebugLoc &DL, int64_t BrOffset, RegScavenger *RS) const override
void loadRegFromStackSlot(MachineBasicBlock &MBB, MachineBasicBlock::iterator MBBI, Register DestReg, int FrameIndex, const TargetRegisterClass *RC, Register VReg, unsigned SubReg=0, MachineInstr::MIFlag Flags=MachineInstr::NoFlags) const override
static bool isPairableLdStInst(const MachineInstr &MI)
Return true if pairing the given load or store may be paired with another.
void storeRegToStackSlot(MachineBasicBlock &MBB, MachineBasicBlock::iterator MBBI, Register SrcReg, bool isKill, int FrameIndex, const TargetRegisterClass *RC, Register VReg, MachineInstr::MIFlag Flags=MachineInstr::NoFlags) const override
static bool isSExtLoad(const MachineInstr &MI)
Returns whether the instruction is a sign-extending load.
const AArch64RegisterInfo & getRegisterInfo() const
getRegisterInfo - TargetInstrInfo is a superset of MRegister info.
static bool isPreSt(const MachineInstr &MI)
Returns whether the instruction is a pre-indexed store.
void insertNoop(MachineBasicBlock &MBB, MachineBasicBlock::iterator MI) const override
AArch64InstrInfo(const AArch64Subtarget &STI)
static bool isPairedLdSt(const MachineInstr &MI)
Returns whether the instruction is a paired load/store.
MachineInstr * foldMemoryOperandImpl(MachineFunction &MF, MachineInstr &MI, ArrayRef< unsigned > Ops, int FrameIndex, MachineInstr *&CopyMI, LiveIntervals *LIS=nullptr, VirtRegMap *VRM=nullptr) const override
bool getMemOperandWithOffsetWidth(const MachineInstr &MI, const MachineOperand *&BaseOp, int64_t &Offset, bool &OffsetIsScalable, TypeSize &Width, const TargetRegisterInfo *TRI) const
If OffsetIsScalable is set to 'true', the offset is scaled by vscale.
Register isLoadFromStackSlot(const MachineInstr &MI, int &FrameIndex) const override
bool reverseBranchCondition(SmallVectorImpl< MachineOperand > &Cond) const override
static bool isStridedAccess(const MachineInstr &MI)
Return true if the given load or store is a strided memory access.
bool shouldClusterMemOps(ArrayRef< const MachineOperand * > BaseOps1, int64_t Offset1, bool OffsetIsScalable1, ArrayRef< const MachineOperand * > BaseOps2, int64_t Offset2, bool OffsetIsScalable2, unsigned ClusterSize, unsigned NumBytes) const override
Detect opportunities for ldp/stp formation.
unsigned removeBranch(MachineBasicBlock &MBB, int *BytesRemoved=nullptr) const override
bool isThroughputPattern(unsigned Pattern) const override
Return true when a code sequence can improve throughput.
MachineOperand & getMemOpBaseRegImmOfsOffsetOperand(MachineInstr &LdSt) const
Return the immediate offset of the base register in a load/store LdSt.
bool analyzeBranch(MachineBasicBlock &MBB, MachineBasicBlock *&TBB, MachineBasicBlock *&FBB, SmallVectorImpl< MachineOperand > &Cond, bool AllowModify=false) const override
bool canFoldIntoAddrMode(const MachineInstr &MemI, Register Reg, const MachineInstr &AddrI, ExtAddrMode &AM) const override
static bool isLdStPairSuppressed(const MachineInstr &MI)
Return true if pairing the given load or store is hinted to be unprofitable.
Register isStoreToStackSlotPostFE(const MachineInstr &MI, int &FrameIndex) const override
Check for post-frame ptr elimination stack locations as well.
std::unique_ptr< TargetInstrInfo::PipelinerLoopInfo > analyzeLoopForPipelining(MachineBasicBlock *LoopBB) const override
bool isSchedulingBoundary(const MachineInstr &MI, const MachineBasicBlock *MBB, const MachineFunction &MF) const override
unsigned insertBranch(MachineBasicBlock &MBB, MachineBasicBlock *TBB, MachineBasicBlock *FBB, ArrayRef< MachineOperand > Cond, const DebugLoc &DL, int *BytesAdded=nullptr) const override
bool optimizeCompareInstr(MachineInstr &CmpInstr, Register SrcReg, Register SrcReg2, int64_t CmpMask, int64_t CmpValue, const MachineRegisterInfo *MRI) const override
optimizeCompareInstr - Convert the instruction supplying the argument to the comparison into one that...
static unsigned getLoadStoreImmIdx(unsigned Opc)
Returns the index for the immediate for a given instruction.
static bool isGPRZero(const MachineInstr &MI)
Does this instruction set its full destination register to zero?
void copyGPRRegTuple(MachineBasicBlock &MBB, MachineBasicBlock::iterator I, const DebugLoc &DL, MCRegister DestReg, MCRegister SrcReg, bool KillSrc, unsigned Opcode, unsigned ZeroReg, llvm::ArrayRef< unsigned > Indices) const
bool analyzeCompare(const MachineInstr &MI, Register &SrcReg, Register &SrcReg2, int64_t &CmpMask, int64_t &CmpValue) const override
analyzeCompare - For a comparison instruction, return the source registers in SrcReg and SrcReg2,...
CombinerObjective getCombinerObjective(unsigned Pattern) const override
static bool isFpOrNEON(Register Reg)
Returns whether the physical register is FP or NEON.
bool isAsCheapAsAMove(const MachineInstr &MI) const override
std::optional< DestSourcePair > isCopyLikeInstrImpl(const MachineInstr &MI) const override
static void suppressLdStPair(MachineInstr &MI)
Hint that pairing the given load or store is unprofitable.
Register isStoreToStackSlot(const MachineInstr &MI, int &FrameIndex) const override
static bool isPreLd(const MachineInstr &MI)
Returns whether the instruction is a pre-indexed load.
void copyPhysRegTuple(MachineBasicBlock &MBB, MachineBasicBlock::iterator I, const DebugLoc &DL, MCRegister DestReg, MCRegister SrcReg, bool KillSrc, unsigned Opcode, llvm::ArrayRef< unsigned > Indices) const
bool optimizeCondBranch(MachineInstr &MI) const override
Replace csincr-branch sequence by simple conditional branch.
static int getMemScale(unsigned Opc)
Scaling factor for (scaled or unscaled) load or store.
bool isCandidateToMergeOrPair(const MachineInstr &MI) const
Return true if this is a load/store that can be potentially paired/merged.
MCInst getNop() const override
static const MachineOperand & getLdStBaseOp(const MachineInstr &MI)
Returns the base register operator of a load/store.
bool isReservedReg(const MachineFunction &MF, MCRegister Reg) const
const AArch64RegisterInfo * getRegisterInfo() const override
bool isNeonAvailable() const
Returns true if the target has NEON and the function at runtime is known to have NEON enabled (e....
bool isSVEorStreamingSVEAvailable() const
Returns true if the target has access to either the full range of SVE instructions,...
Represent a constant reference to an array (0 or more elements consecutively in memory),...
const T & front() const
Get the first element.
size_t size() const
Get the array size.
This is an important base class in LLVM.
std::pair< iterator, bool > insert(const std::pair< KeyT, ValueT > &KV)
bool hasOptSize() const
Optimize this function for size (-Os) or minimum size (-Oz).
bool hasMinSize() const
Optimize this function for minimum size (-Oz).
Module * getParent()
Get the module that this global value is contained inside of...
LLVM_ABI InstListType::iterator eraseFromParent()
This method unlinks 'this' from the containing basic block and deletes it.
unsigned getOpcode() const
Returns a member of one of the enums like Instruction::Add.
static LocationSize precise(uint64_t Value)
This class is intended to be used as a base class for asm properties and features specific to the tar...
bool usesWindowsCFI() const
static MCCFIInstruction cfiDefCfa(MCSymbol *L, unsigned Register, int64_t Offset, SMLoc Loc={})
.cfi_def_cfa defines a rule for computing CFA as: take address from Register and add Offset to it.
static MCCFIInstruction createOffset(MCSymbol *L, unsigned Register, int64_t Offset, SMLoc Loc={})
.cfi_offset Previous value of Register is saved at offset Offset from CFA.
static MCCFIInstruction cfiDefCfaOffset(MCSymbol *L, int64_t Offset, SMLoc Loc={})
.cfi_def_cfa_offset modifies a rule for computing CFA.
static MCCFIInstruction createEscape(MCSymbol *L, StringRef Vals, SMLoc Loc={}, StringRef Comment="")
.cfi_escape Allows the user to add arbitrary bytes to the unwind info.
Instances of this class represent a single low-level machine instruction.
Describe properties that are true of each instruction in the target description file.
unsigned getNumOperands() const
Return the number of declared MachineOperands for this MachineInstruction.
ArrayRef< MCOperandInfo > operands() const
Wrapper class representing physical registers. Should be passed by value.
constexpr bool isValid() const
static constexpr unsigned NoRegister
static MDTuple * get(LLVMContext &Context, ArrayRef< Metadata * > MDs)
bool isInlineAsmBrIndirectTarget() const
Returns true if this is the indirect dest of an INLINEASM_BR.
unsigned pred_size() const
LLVM_ABI void transferSuccessorsAndUpdatePHIs(MachineBasicBlock *FromMBB)
Transfers all the successors, as in transferSuccessors, and update PHI operands in the successor bloc...
LLVM_ABI instr_iterator insert(instr_iterator I, MachineInstr *M)
Insert MI into the instruction list before I, possibly inside a bundle.
reverse_instr_iterator instr_rbegin()
LLVM_ABI iterator getFirstTerminator()
Returns an iterator to the first terminator instruction of this basic block.
LLVM_ABI void addSuccessor(MachineBasicBlock *Succ, BranchProbability Prob=BranchProbability::getUnknown())
Add Succ as a successor of this MachineBasicBlock.
reverse_instr_iterator instr_rend()
Instructions::iterator instr_iterator
instr_iterator instr_end()
void addLiveIn(MCRegister PhysReg, LaneBitmask LaneMask=LaneBitmask::getAll())
Adds the specified register as a live in.
const MachineFunction * getParent() const
Return the MachineFunction containing this basic block.
LLVM_ABI instr_iterator erase(instr_iterator I)
Remove an instruction from the instruction list and delete it.
void splice(iterator Where, MachineBasicBlock *Other, iterator From)
Take an instruction from MBB 'Other' at the position From, and insert it into this MBB right before '...
MachineInstrBundleIterator< MachineInstr > iterator
void setMachineBlockAddressTaken()
Set this block to indicate that its address is used as something other than the target of a terminato...
LLVM_ABI bool isLiveIn(MCRegister Reg, LaneBitmask LaneMask=LaneBitmask::getAll()) const
Return true if the specified register is in the live in set.
The MachineFrameInfo class represents an abstract stack frame until prolog/epilog code is inserted.
uint64_t getStackSize() const
Return the number of bytes that must be allocated to hold all of the fixed size frame objects.
void setStackID(int ObjectIdx, uint8_t ID)
bool isCalleeSavedInfoValid() const
Has the callee saved info been calculated yet?
Align getObjectAlign(int ObjectIdx) const
Return the alignment of the specified stack object.
int64_t getObjectSize(int ObjectIdx) const
Return the size of the specified object.
unsigned getNumObjects() const
Return the number of objects.
int64_t getObjectOffset(int ObjectIdx) const
Return the assigned stack offset of the specified object from the incoming stack pointer.
bool isFixedObjectIndex(int ObjectIdx) const
Returns true if the specified index corresponds to a fixed stack object.
unsigned addFrameInst(const MCCFIInstruction &Inst)
const TargetSubtargetInfo & getSubtarget() const
getSubtarget - Return the subtarget for which this machine code is being compiled.
StringRef getName() const
getName - Return the name of the corresponding LLVM function.
MachineMemOperand * getMachineMemOperand(MachinePointerInfo PtrInfo, MachineMemOperand::Flags f, LLT MemTy, Align base_alignment, const AAMDNodes &AAInfo=AAMDNodes(), const MDNode *Ranges=nullptr, SyncScope::ID SSID=SyncScope::System, AtomicOrdering Ordering=AtomicOrdering::NotAtomic, AtomicOrdering FailureOrdering=AtomicOrdering::NotAtomic)
getMachineMemOperand - Allocate a new MachineMemOperand.
MachineFrameInfo & getFrameInfo()
getFrameInfo - Return the frame info object for the current function.
MachineRegisterInfo & getRegInfo()
getRegInfo - Return information about the registers currently in use.
Function & getFunction()
Return the LLVM function that this machine code represents.
BasicBlockListType::iterator iterator
Ty * getInfo()
getInfo - Keep track of various per-function pieces of information for backends that would like to do...
const MachineJumpTableInfo * getJumpTableInfo() const
getJumpTableInfo - Return the jump table info object for the current function.
MachineBasicBlock * CreateMachineBasicBlock(const BasicBlock *BB=nullptr, std::optional< UniqueBBID > BBID=std::nullopt)
CreateMachineInstr - Allocate a new MachineInstr.
void insert(iterator MBBI, MachineBasicBlock *MBB)
const TargetMachine & getTarget() const
getTarget - Return the target machine this machine code is compiled with
const MachineInstrBuilder & setMemRefs(ArrayRef< MachineMemOperand * > MMOs) const
const MachineInstrBuilder & addCFIIndex(unsigned CFIIndex) const
const MachineInstrBuilder & addUse(Register RegNo, RegState Flags={}, unsigned SubReg=0) const
Add a virtual register use operand.
const MachineInstrBuilder & addReg(Register RegNo, RegState Flags={}, unsigned SubReg=0) const
Add a new virtual register operand.
const MachineInstrBuilder & setMIFlag(MachineInstr::MIFlag Flag) const
const MachineInstrBuilder & addImm(int64_t Val) const
Add a new immediate operand.
const MachineInstrBuilder & add(const MachineOperand &MO) const
const MachineInstrBuilder & addSym(MCSymbol *Sym, unsigned char TargetFlags=0) const
const MachineInstrBuilder & addFrameIndex(int Idx) const
const MachineInstrBuilder & addGlobalAddress(const GlobalValue *GV, int64_t Offset=0, unsigned TargetFlags=0) const
const MachineInstrBuilder & addMBB(MachineBasicBlock *MBB, unsigned TargetFlags=0) const
const MachineInstrBuilder & addDef(Register RegNo, RegState Flags={}, unsigned SubReg=0) const
Add a virtual register definition operand.
const MachineInstrBuilder & setMIFlags(unsigned Flags) const
const MachineInstrBuilder & addMemOperand(MachineMemOperand *MMO) const
reverse_iterator getReverse() const
Get a reverse iterator to the same node.
Representation of each machine instruction.
unsigned getOpcode() const
Returns the opcode of this MachineInstr.
bool mayLoadOrStore(QueryType Type=AnyInBundle) const
Return true if this instruction could possibly read or modify memory.
const MachineBasicBlock * getParent() const
bool isCall(QueryType Type=AnyInBundle) const
bool getFlag(MIFlag Flag) const
Return whether an MI flag is set.
LLVM_ABI uint32_t mergeFlagsWith(const MachineInstr &Other) const
Return the MIFlags which represent both MachineInstrs.
unsigned getNumOperands() const
Retuns the total number of operands.
LLVM_ABI unsigned getNumExplicitOperands() const
Returns the number of non-implicit operands.
bool mayLoad(QueryType Type=AnyInBundle) const
Return true if this instruction could possibly read memory.
const MCInstrDesc & getDesc() const
Returns the target instruction descriptor of this MachineInstr.
LLVM_ABI bool hasUnmodeledSideEffects() const
Return true if this instruction has side effects that are not modeled by mayLoad / mayStore,...
bool registerDefIsDead(Register Reg, const TargetRegisterInfo *TRI) const
Returns true if the register is dead in this machine instruction.
bool definesRegister(Register Reg, const TargetRegisterInfo *TRI) const
Return true if the MachineInstr fully defines the specified register.
LLVM_ABI void setDesc(const MCInstrDesc &TID)
Replace the instruction descriptor (thus opcode) of the current instruction with a new one.
LLVM_ABI bool hasOrderedMemoryRef() const
Return true if this instruction may have an ordered or volatile memory reference, or if the informati...
LLVM_ABI const MachineFunction * getMF() const
Return the function that contains the basic block that this instruction belongs to.
ArrayRef< MachineMemOperand * > memoperands() const
Access to memory operands of the instruction.
LLVM_ABI bool isLoadFoldBarrier() const
Returns true if it is illegal to fold a load across this instruction.
const DebugLoc & getDebugLoc() const
Returns the debug location id of this MachineInstr.
LLVM_ABI void removeOperand(unsigned OpNo)
Erase an operand from an instruction, leaving it with one fewer operand than it started with.
LLVM_ABI void addRegisterDefined(Register Reg, const TargetRegisterInfo *RegInfo=nullptr)
We have determined MI defines a register.
const MachineOperand & getOperand(unsigned i) const
uint32_t getFlags() const
Return the MI flags bitvector.
LLVM_ABI int findRegisterDefOperandIdx(Register Reg, const TargetRegisterInfo *TRI, bool isDead=false, bool Overlap=false) const
Returns the operand index that is a def of the specified register or -1 if it is not found.
LLVM_ABI MachineInstrBundleIterator< MachineInstr > eraseFromParent()
Unlink 'this' from the containing basic block and delete it.
const std::vector< MachineJumpTableEntry > & getJumpTables() const
A description of a memory reference used in the backend.
@ MOVolatile
The memory access is volatile.
@ MOLoad
The memory access reads data.
@ MOStore
The memory access writes data.
This class contains meta information specific to a module.
LLVM_ABI MachineFunction * getMachineFunction(const Function &F) const
Returns the MachineFunction associated to IR function F if there is one, otherwise nullptr.
MachineOperand class - Representation of each machine instruction operand.
void setSubReg(unsigned subReg)
unsigned getSubReg() const
void setImm(int64_t immVal)
bool isReg() const
isReg - Tests if this is a MO_Register operand.
MachineBasicBlock * getMBB() const
void setIsDead(bool Val=true)
LLVM_ABI void setReg(Register Reg)
Change the register this operand corresponds to.
bool isImm() const
isImm - Tests if this is a MO_Immediate operand.
void setIsKill(bool Val=true)
MachineInstr * getParent()
getParent - Return the instruction that this operand belongs to.
unsigned getTargetFlags() const
static MachineOperand CreateImm(int64_t Val)
MachineOperandType getType() const
getType - Returns the MachineOperandType for this operand.
void setIsUndef(bool Val=true)
Register getReg() const
getReg - Returns the register number.
bool isFI() const
isFI - Tests if this is a MO_FrameIndex operand.
LLVM_ABI bool isIdenticalTo(const MachineOperand &Other) const
Returns true if this operand is identical to the specified operand except for liveness related flags ...
static MachineOperand CreateReg(Register Reg, bool isDef, bool isImp=false, bool isKill=false, bool isDead=false, bool isUndef=false, bool isEarlyClobber=false, unsigned SubReg=0, bool isDebug=false, bool isInternalRead=false, bool isRenamable=false)
MachineRegisterInfo - Keep track of information for virtual and physical registers,...
LLVM_ABI bool hasOneNonDBGUse(Register RegNo) const
hasOneNonDBGUse - Return true if there is exactly one non-Debug use of the specified register.
bool tracksLiveness() const
tracksLiveness - Returns true when tracking register liveness accurately.
const TargetRegisterClass * getRegClass(Register Reg) const
Return the register class of the specified virtual register.
LLVM_ABI void clearKillFlags(Register Reg) const
clearKillFlags - Iterate over all the uses of the given register and clear the kill flag from the Mac...
LLVM_ABI MachineInstr * getVRegDef(Register Reg) const
getVRegDef - Return the machine instr that defines the specified virtual register or null if none is ...
bool use_nodbg_empty(Register RegNo) const
use_nodbg_empty - Return true if there are no non-Debug instructions using the specified register.
LLVM_ABI Register createVirtualRegister(const TargetRegisterClass *RegClass, StringRef Name="")
createVirtualRegister - Create and return a new virtual register in the function with the specified r...
bool reservedRegsFrozen() const
reservedRegsFrozen - Returns true after freezeReservedRegs() was called to ensure the set of reserved...
bool def_empty(Register RegNo) const
def_empty - Return true if there are no instructions defining the specified register (it may be live-...
use_instr_nodbg_iterator use_instr_nodbg_begin(Register RegNo) const
bool hasOneDef(Register RegNo) const
Return true if there is exactly one operand defining the specified register.
const TargetRegisterClass * getRegClassOrNull(Register Reg) const
Return the register class of Reg, or null if Reg has not been assigned a register class yet.
LLVM_ABI const TargetRegisterClass * constrainRegClass(Register Reg, const TargetRegisterClass *RC, unsigned MinNumRegs=0)
constrainRegClass - Constrain the register class of the specified virtual register to be a common sub...
LLVM_ABI MachineInstr * getUniqueVRegDef(Register Reg) const
getUniqueVRegDef - Return the unique machine instr that defines the specified virtual register or nul...
A Module instance is used to store all the information related to an LLVM module.
MI-level patchpoint operands.
uint32_t getNumPatchBytes() const
Return the number of patchable bytes the given patchpoint should emit.
Wrapper class representing virtual and physical registers.
MCRegister asMCReg() const
Utility to check-convert this value to a MCRegister.
constexpr bool isValid() const
constexpr bool isVirtual() const
Return true if the specified register number is in the virtual register namespace.
static constexpr bool isVirtualRegister(unsigned Reg)
Return true if the specified register number is in the virtual register namespace.
constexpr bool isPhysical() const
Return true if the specified register number is in the physical register namespace.
Represents a location in source code.
bool erase(PtrType Ptr)
Remove pointer from the set.
std::pair< iterator, bool > insert(PtrType Ptr)
Inserts Ptr if and only if there is no element in the container equal to Ptr.
SmallPtrSet - This class implements a set which is optimized for holding SmallSize or less elements.
SmallSet - This maintains a set of unique values, optimizing for the case when the set is small (less...
SmallString - A SmallString is just a SmallVector with methods and accessors that make it work better...
void append(StringRef RHS)
Append from a StringRef.
StringRef str() const
Explicit conversion to StringRef.
This class consists of common code factored out of the SmallVector class to reduce code duplication b...
void push_back(const T &Elt)
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small.
MI-level stackmap operands.
uint32_t getNumPatchBytes() const
Return the number of patchable bytes the given stackmap should emit.
StackOffset holds a fixed and a scalable offset in bytes.
int64_t getFixed() const
Returns the fixed component of the stack.
int64_t getScalable() const
Returns the scalable component of the stack.
static StackOffset get(int64_t Fixed, int64_t Scalable)
static StackOffset getScalable(int64_t Scalable)
static StackOffset getFixed(int64_t Fixed)
MI-level Statepoint operands.
uint32_t getNumPatchBytes() const
Return the number of patchable bytes the given statepoint should emit.
Represent a constant reference to a string, i.e.
Object returned by analyzeLoopForPipelining.
TargetInstrInfo - Interface to description of machine instruction set.
virtual void genAlternativeCodeSequence(MachineInstr &Root, unsigned Pattern, SmallVectorImpl< MachineInstr * > &InsInstrs, SmallVectorImpl< MachineInstr * > &DelInstrs, DenseMap< Register, unsigned > &InstIdxForVirtReg) const
When getMachineCombinerPatterns() finds patterns, this function generates the instructions that could...
virtual std::optional< ParamLoadedValue > describeLoadedValue(const MachineInstr &MI, Register Reg) const
Produce the expression describing the MI loading a value into the physical register Reg.
virtual bool getMachineCombinerPatterns(MachineInstr &Root, SmallVectorImpl< unsigned > &Patterns, bool DoRegPressureReduce) const
Return true when there is potentially a faster code sequence for an instruction chain ending in Root.
virtual bool isSchedulingBoundary(const MachineInstr &MI, const MachineBasicBlock *MBB, const MachineFunction &MF) const
Test if the given instruction should be considered a scheduling boundary.
virtual CombinerObjective getCombinerObjective(unsigned Pattern) const
Return the objective of a combiner pattern.
virtual bool isFunctionSafeToSplit(const MachineFunction &MF) const
Return true if the function is a viable candidate for machine function splitting.
const MCAsmInfo & getMCAsmInfo() const
Return target specific asm information.
CodeModel::Model getCodeModel() const
Returns the code model.
bool contains(Register Reg) const
Return true if the specified register is included in this register class.
bool hasSubClassEq(const TargetRegisterClass *RC) const
Returns true if RC is a sub-class of or equal to this class.
bool hasSuperClassEq(const TargetRegisterClass *RC) const
Returns true if RC is a super-class of or equal to this class.
TargetRegisterInfo base class - We assume that the target defines a static array of TargetRegisterDes...
TargetSubtargetInfo - Generic base class for all target subtargets.
virtual const TargetInstrInfo * getInstrInfo() const
virtual const TargetRegisterInfo * getRegisterInfo() const =0
Return the target's register information.
Target - Wrapper for Target specific information.
static constexpr TypeSize getFixed(ScalarTy ExactSize)
static constexpr TypeSize getScalable(ScalarTy MinimumSize)
Value * getOperand(unsigned i) const
constexpr bool isScalable() const
Returns whether the quantity is scaled by a runtime quantity (vscale).
constexpr ScalarTy getKnownMinValue() const
Returns the minimum value this quantity can represent.
self_iterator getIterator()
A raw_ostream that writes to an std::string.
#define llvm_unreachable(msg)
Marks that the current location is not supposed to be reachable.
static CondCode getInvertedCondCode(CondCode Code)
@ MO_DLLIMPORT
MO_DLLIMPORT - On a symbol operand, this represents that the reference to the symbol is for an import...
@ MO_NC
MO_NC - Indicates whether the linker is expected to check the symbol reference for overflow.
@ MO_G1
MO_G1 - A symbol operand with this flag (granule 1) represents the bits 16-31 of a 64-bit address,...
@ MO_S
MO_S - Indicates that the bits of the symbol operand represented by MO_G0 etc are signed.
@ MO_PAGEOFF
MO_PAGEOFF - A symbol operand with this flag represents the offset of that symbol within a 4K page.
@ MO_GOT
MO_GOT - This flag indicates that a symbol operand represents the address of the GOT entry for the sy...
@ MO_PREL
MO_PREL - Indicates that the bits of the symbol operand represented by MO_G0 etc are PC relative.
@ MO_G0
MO_G0 - A symbol operand with this flag (granule 0) represents the bits 0-15 of a 64-bit address,...
@ MO_ARM64EC_CALLMANGLE
MO_ARM64EC_CALLMANGLE - Operand refers to the Arm64EC-mangled version of a symbol,...
@ MO_PAGE
MO_PAGE - A symbol operand with this flag represents the pc-relative offset of the 4K page containing...
@ MO_HI12
MO_HI12 - This flag indicates that a symbol operand represents the bits 13-24 of a 64-bit address,...
@ MO_TLS
MO_TLS - Indicates that the operand being accessed is some kind of thread-local symbol.
@ MO_G2
MO_G2 - A symbol operand with this flag (granule 2) represents the bits 32-47 of a 64-bit address,...
@ MO_TAGGED
MO_TAGGED - With MO_PAGE, indicates that the page includes a memory tag in bits 56-63.
@ MO_G3
MO_G3 - A symbol operand with this flag (granule 3) represents the high 16-bits of a 64-bit address,...
@ MO_COFFSTUB
MO_COFFSTUB - On a symbol operand "FOO", this indicates that the reference is actually to the "....
unsigned getCheckerSizeInBytes(AuthCheckMethod Method)
Returns the number of bytes added by checkAuthenticatedRegister.
static uint64_t decodeLogicalImmediate(uint64_t val, unsigned regSize)
decodeLogicalImmediate - Decode a logical immediate value in the form "N:immr:imms" (where the immr a...
static unsigned getShiftValue(unsigned Imm)
getShiftValue - Extract the shift value.
static unsigned getArithExtendImm(AArch64_AM::ShiftExtendType ET, unsigned Imm)
getArithExtendImm - Encode the extend type and shift amount for an arithmetic instruction: imm: 3-bit...
constexpr bool isLegalArithImmed(const uint64_t C)
isLegalArithImmed -
static unsigned getArithShiftValue(unsigned Imm)
getArithShiftValue - get the arithmetic shift value.
static uint64_t encodeLogicalImmediate(uint64_t imm, unsigned regSize)
encodeLogicalImmediate - Return the encoded immediate value for a logical immediate instruction of th...
static AArch64_AM::ShiftExtendType getExtendType(unsigned Imm)
getExtendType - Extract the extend type for operands of arithmetic ops.
static AArch64_AM::ShiftExtendType getArithExtendType(unsigned Imm)
static AArch64_AM::ShiftExtendType getShiftType(unsigned Imm)
getShiftType - Extract the shift type.
static unsigned getShifterImm(AArch64_AM::ShiftExtendType ST, unsigned Imm)
getShifterImm - Encode the shift type and amount: imm: 6-bit shift amount shifter: 000 ==> lsl 001 ==...
void expandMOVAddr(unsigned Opcode, unsigned TargetFlags, bool IsTargetMachO, SmallVectorImpl< AddrInsnModel > &Insn)
void expandMOVImm(uint64_t Imm, unsigned BitSize, SmallVectorImpl< ImmInsnModel > &Insn)
Expand a MOVi32imm or MOVi64imm pseudo instruction to one or more real move-immediate instructions to...
static const uint64_t InstrFlagIsWhile
static const uint64_t InstrFlagIsPTestLike
constexpr std::underlying_type_t< E > Mask()
Get a bitmask with 1s in all places up to the high-order bit of E's largest value.
@ C
The default llvm calling convention, compatible with C.
@ ScalablePredicateVector
initializer< Ty > init(const Ty &Val)
InstrType
Represents how an instruction should be mapped by the outliner.
NodeAddr< InstrNode * > Instr
LLVM_ABI Instruction & back() const
LLVM_ABI iterator begin() const
This is an optimization pass for GlobalISel generic memory operations.
auto drop_begin(T &&RangeOrContainer, size_t N=1)
Return a range covering RangeOrContainer with the first N elements excluded.
bool all_of(R &&range, UnaryPredicate P)
Provide wrappers to std::all_of which take ranges instead of having to pass begin/end explicitly.
static bool isCondBranchOpcode(int Opc)
MCCFIInstruction createDefCFA(const TargetRegisterInfo &TRI, unsigned FrameReg, unsigned Reg, const StackOffset &Offset, bool LastAdjustmentWasScalable=true)
static bool isPTrueOpcode(unsigned Opc)
MachineInstrBuilder BuildMI(MachineFunction &MF, const MIMetadata &MIMD, const MCInstrDesc &MCID)
Builder interface. Specify how to create the initial instruction itself.
bool succeeded(LogicalResult Result)
Utility function that returns true if the provided LogicalResult corresponds to a success value.
int isAArch64FrameOffsetLegal(const MachineInstr &MI, StackOffset &Offset, bool *OutUseUnscaledOp=nullptr, unsigned *OutUnscaledOp=nullptr, int64_t *EmittableOffset=nullptr)
Check if the Offset is a valid frame offset for MI.
constexpr bool isInt(int64_t x)
Checks if an integer fits into the given bit width.
RegState
Flags to represent properties of register accesses.
@ Implicit
Not emitted register (e.g. carry, or temporary result).
@ Kill
The last use of a register.
@ Undef
Value of the register doesn't matter.
@ Define
Register definition.
@ Renamable
Register that may be renamed.
auto enumerate(FirstRange &&First, RestRanges &&...Rest)
Given two or more input ranges, returns a new range whose values are tuples (A, B,...
constexpr RegState getKillRegState(bool B)
decltype(auto) dyn_cast(const From &Val)
dyn_cast<X> - Return the argument parameter cast to the specified type.
static bool isIndirectBranchOpcode(int Opc)
iterator_range< T > make_range(T x, T y)
Convenience function for iterating over sub-ranges.
unsigned getBLRCallOpcode(const MachineFunction &MF)
Return opcode to be used for indirect calls.
@ AArch64FrameOffsetIsLegal
Offset is legal.
@ AArch64FrameOffsetCanUpdate
Offset can apply, at least partly.
@ AArch64FrameOffsetCannotUpdate
Offset cannot apply.
constexpr bool isPowerOf2_64(uint64_t Value)
Return true if the argument is a power of two > 0 (64 bit edition.)
unsigned Log2_64(uint64_t Value)
Return the floor log base 2 of the specified value, -1 if the value is zero.
static bool isSEHInstruction(const MachineInstr &MI)
bool isLFIPrePostMemAccess(unsigned Opcode)
Returns true if Opcode is a pre- or post-indexed memory access that the LFI rewriter expands with a b...
bool any_of(R &&range, UnaryPredicate P)
Provide wrappers to std::any_of which take ranges instead of having to pass begin/end explicitly.
auto reverse(ContainerTy &&C)
MachineInstr * getImm(const MachineOperand &MO, const MachineRegisterInfo *MRI)
decltype(auto) get(const PointerIntPair< PointerTy, IntBits, IntType, PtrTraits, Info > &Pair)
void sort(IteratorTy Start, IteratorTy End)
AArch64MachineCombinerPattern
@ MULSUBv2i32_indexed_OP1
@ MULADDv4i16_indexed_OP2
@ MULSUBv8i16_indexed_OP2
@ MULSUBv4i16_indexed_OP2
@ MULSUBv4i32_indexed_OP2
@ MULADDv2i32_indexed_OP1
@ MULADDv4i32_indexed_OP1
@ MULADDv2i32_indexed_OP2
@ MULSUBv4i16_indexed_OP1
@ MULADDv4i32_indexed_OP2
@ MULSUBv8i16_indexed_OP1
@ MULSUBv2i32_indexed_OP2
@ MULADDv8i16_indexed_OP1
@ MULSUBv4i32_indexed_OP1
@ MULADDv8i16_indexed_OP2
@ MULADDv4i16_indexed_OP1
LLVM_ABI raw_ostream & dbgs()
dbgs() - This returns a reference to a raw_ostream for debugging messages.
void emitFrameOffset(MachineBasicBlock &MBB, MachineBasicBlock::iterator MBBI, const DebugLoc &DL, unsigned DestReg, unsigned SrcReg, StackOffset Offset, const TargetInstrInfo *TII, MachineInstr::MIFlag=MachineInstr::NoFlags, bool SetNZCV=false, bool NeedsWinCFI=false, bool *HasWinCFI=nullptr, bool EmitCFAOffset=false, StackOffset InitialOffset={}, unsigned FrameReg=AArch64::SP)
emitFrameOffset - Emit instructions as needed to set DestReg to SrcReg plus Offset.
LLVM_ABI void report_fatal_error(Error Err, bool gen_crash_diag=true)
constexpr RegState getDefRegState(bool B)
CombinerObjective
The combiner's goal may differ based on which pattern it is attempting to optimize.
std::optional< UsedNZCV > examineCFlagsUse(MachineInstr &MI, MachineInstr &CmpInstr, const TargetRegisterInfo &TRI, SmallVectorImpl< MachineInstr * > *CCUseInstrs=nullptr)
CodeGenOptLevel
Code generation optimization level.
class LLVM_GSL_OWNER SmallVector
Forward declaration of SmallVector so that calculateSmallVectorDefaultInlinedElements can reference s...
auto instructionsWithoutDebug(IterT It, IterT End, bool SkipPseudoOp=true)
Construct a range iterator which begins at It and moves forwards until End is reached,...
LLVM_ABI raw_fd_ostream & errs()
This returns a reference to a raw_ostream for standard error.
auto drop_end(T &&RangeOrContainer, size_t N=1)
Return a range covering RangeOrContainer with the last N elements excluded.
static MCRegister getXRegFromWReg(MCRegister Reg)
MCCFIInstruction createCFAOffset(const TargetRegisterInfo &MRI, unsigned Reg, const StackOffset &OffsetFromDefCFA, std::optional< int64_t > IncomingVGOffsetFromDefCFA)
DWARFExpression::Operation Op
ArrayRef(const T &OneElt) -> ArrayRef< T >
static bool isUncondBranchOpcode(int Opc)
decltype(auto) cast(const From &Val)
cast<X> - Return the argument parameter cast to the specified type.
void erase_if(Container &C, UnaryPredicate P)
Provide a container algorithm similar to C++ Library Fundamentals v2's erase_if which is equivalent t...
constexpr bool isIntN(unsigned N, int64_t x)
Checks if an signed integer fits into the given (dynamic) bit width.
bool rewriteAArch64FrameIndex(MachineInstr &MI, unsigned FrameRegIdx, unsigned FrameReg, StackOffset &Offset, const AArch64InstrInfo *TII)
rewriteAArch64FrameIndex - Rewrite MI to access 'Offset' bytes from the FP.
bool is_contained(R &&Range, const E &Element)
Returns true if Element is found in Range.
static const MachineMemOperand::Flags MOSuppressPair
constexpr int64_t SignExtend64(uint64_t x)
Sign-extend the number in the bottom B bits of X to a 64-bit integer.
void appendLEB128(SmallVectorImpl< U > &Buffer, T Value)
RelativeUniformCounterPtr ValuesPtrExpr VTableAddr Next
bool optimizeTerminators(MachineBasicBlock *MBB, const TargetInstrInfo &TII)
std::pair< MachineOperand, DIExpression * > ParamLoadedValue
bool isNZCVTouchedInInstructionRange(const MachineInstr &DefMI, const MachineInstr &UseMI, const TargetRegisterInfo *TRI)
Return true if there is an instruction /after/ DefMI and before UseMI which either reads or clobbers ...
auto seq(T Begin, T End)
Iterate over an integral type from Begin up to - but not including - End.
static const MachineMemOperand::Flags MOStridedAccess
constexpr RegState getUndefRegState(bool B)
void fullyRecomputeLiveIns(ArrayRef< MachineBasicBlock * > MBBs)
Convenience function for recomputing live-in's for a set of MBBs until the computation converges.
LLVM_ABI Printable printReg(Register Reg, const TargetRegisterInfo *TRI=nullptr, unsigned SubIdx=0, const MachineRegisterInfo *MRI=nullptr)
Prints virtual and physical registers with or without a TRI instance.
This struct is a compact representation of a valid (non-zero power of two) alignment.
Used to describe addressing mode similar to ExtAddrMode in CodeGenPrepare.
LLVM_ABI static const MBBSectionID ColdSectionID
This class contains a discriminated union of information about pointers in memory operands,...
static LLVM_ABI MachinePointerInfo getUnknownStack(MachineFunction &MF)
Stack memory without other information.
static LLVM_ABI MachinePointerInfo getFixedStack(MachineFunction &MF, int FI, int64_t Offset=0)
Return a MachinePointerInfo record that refers to the specified FrameIndex.
An individual sequence of instructions to be replaced with a call to an outlined function.
MachineFunction * getMF() const
The information necessary to create an outlined function for some class of candidate.