107 std::initializer_list<LLT> PackedVectorAllTypeList = {
113 std::initializer_list<LLT> ScalarAndPtrTypesList = {s8, s16, s32, s64, p0};
117 const TargetMachine &TM = ST.getTargetLowering()->getTargetMachine();
120 if (!ST.hasNEON() || !ST.hasFPARMv8()) {
127 const bool HasFP16 = ST.hasFullFP16();
128 const LLT &MinFPScalar = HasFP16 ? f16 : f32;
130 const bool HasCSSC = ST.hasCSSC();
131 const bool HasRCPC3 = ST.hasRCPC3();
132 const bool HasSVE = ST.hasSVE();
135 {G_IMPLICIT_DEF, G_FREEZE, G_CONSTANT_FOLD_BARRIER})
136 .legalFor({p0, s8, s16, s32, s64, s128})
137 .legalFor({v2s8, v4s8, v8s8, v16s8, v2s16, v4s16, v8s16, v2s32, v4s32,
139 .widenScalarToNextPow2(0)
152 .legalFor(PackedVectorAllTypeList)
166 .widenScalarToNextPow2(0)
171 .maxScalarIf(
typeInSet(0, {s64, p0}), 1, s32);
176 .widenScalarToNextPow2(1)
181 .maxScalarIf(
typeInSet(1, {s64, p0}), 0, s32)
182 .maxScalarIf(
typeInSet(1, {s128}), 0, s64);
185 .legalFor({i32, i64, v8i8, v16i8, v4i16, v8i16, v2i32, v4i32, v2i64})
186 .legalFor(HasSVE, {nxv16i8, nxv8i16, nxv4i32, nxv2i64})
187 .widenScalarToNextPow2(0)
195 return Query.
Types[0].getNumElements() <= 2;
200 return Query.
Types[0].getNumElements() <= 4;
205 return Query.
Types[0].getNumElements() <= 16;
212 .
legalFor({i32, i64, v8i8, v16i8, v4i16, v8i16, v2i32, v4i32, v2i64})
213 .widenScalarToNextPow2(0)
221 return Query.
Types[0].getNumElements() <= 2;
226 return Query.
Types[0].getNumElements() <= 4;
231 return Query.
Types[0].getNumElements() <= 16;
239 const auto &SrcTy = Query.
Types[0];
240 const auto &AmtTy = Query.
Types[1];
241 return !SrcTy.isVector() && SrcTy.getSizeInBits() == 32 &&
242 AmtTy.getSizeInBits() == 32;
256 .widenScalarToNextPow2(0)
270 .
legalFor({{p0, i64}, {v2p0, v2i64}})
271 .clampScalarOrElt(1, s64, s64)
277 .legalFor({i32, i64})
279 .clampScalar(0, s32, s64)
284 .lowerFor({i8, i16, i32, i64, v2i32, v4i32, v2i64})
293 .widenScalarToNextPow2(0, 32)
298 .legalFor({i64, v16i8, v8i16, v4i32})
304 .legalFor({v8i8, v16i8, v4i16, v8i16, v2i32, v4i32})
305 .legalFor(HasCSSC, {i32, i64})
306 .minScalar(HasCSSC, 0, s32)
315 .legalFor({v16i8, v8i16, v4i32, v2i64, v2p0, v8i8, v4i16, v2i32})
319 return SrcTy.isScalar() && SrcTy.getSizeInBits() < 128;
323 [=](
const LegalityQuery &Query) {
return std::make_pair(0, v4i16); })
326 [=](
const LegalityQuery &Query) {
return std::make_pair(0, v2i32); })
327 .clampNumElements(0, v8s8, v16s8)
335 {G_ABDS, G_ABDU, G_UAVGFLOOR, G_UAVGCEIL, G_SAVGFLOOR, G_SAVGCEIL})
336 .legalFor({v8i8, v16i8, v4i16, v8i16, v2i32, v4i32})
340 {G_SADDE, G_SSUBE, G_UADDE, G_USUBE, G_SADDO, G_SSUBO, G_UADDO, G_USUBO})
341 .legalFor({{i32, i32}, {i64, i32}})
342 .clampScalar(0, s32, s64)
347 .customFor({{i32, i32}, {i32, i64}, {i64, i64}})
353 return Q.
Types[0].isScalar() && Q.
Types[1].getScalarSizeInBits() < 64;
359 .customFor({{s32, s32}, {s64, s64}});
363 .
legalFor(HasCSSC, {{i32, i32}, {i64, i64}})
364 .legalFor({{v8i8, v8i8}, {v16i8, v16i8}})
365 .customFor(!HasCSSC, {{s32, s32}, {s64, s64}})
366 .customFor({{s128, s128},
372 .clampScalar(0, s32, s128)
385 .legalFor({{i32, i32},
393 .widenScalarToNextPow2(1, 32)
413 .customFor(!HasCSSC, {s32, s64});
419 .widenScalarToNextPow2(0, 32)
433 .
legalFor({i32, i64, v4i16, v8i16, v2i32, v4i32, v2i64})
442 .legalFor({v8i8, v16i8, v4i16, v8i16, v2i32, v4i32, v2i64})
443 .legalFor(HasSVE, {nxv16i8, nxv8i16, nxv4i32, nxv2i64})
444 .clampNumElements(0, v8s8, v16s8)
453 {G_FADD, G_FSUB, G_FMUL, G_FDIV, G_FMA, G_FSQRT, G_FMAXNUM, G_FMINNUM,
454 G_FMAXIMUM, G_FMINIMUM, G_FCEIL, G_FFLOOR, G_FRINT, G_FNEARBYINT,
455 G_INTRINSIC_TRUNC, G_INTRINSIC_ROUND, G_INTRINSIC_ROUNDEVEN})
456 .legalFor({f32, f64, v2f32, v4f32, v2f64})
457 .legalFor(HasFP16, {f16, v4f16, v8f16})
462 return (!HasFP16 && Q.
Types[0].getScalarType().isFloat16()) ||
463 Q.
Types[0].getScalarType().isBFloat16();
466 .clampNumElements(0, v4s16, v8s16)
472 .legalFor({f32, f64, v2f32, v4f32, v2f64})
473 .legalFor(HasFP16, {f16, bf16, v4f16, v4bf16, v8f16, v8bf16})
480 .
lowerFor({f16, bf16, v4f16, v4bf16, v8f16, v8bf16});
483 G_FLOG10, G_FTAN, G_FEXP, G_FEXP2, G_FEXP10,
484 G_FACOS, G_FASIN, G_FATAN, G_FATAN2, G_FCOSH,
485 G_FSINH, G_FTANH, G_FMODF})
486 .libcallFor({f32, f64, f128})
490 .libcallFor({{f32, i32}, {f64, i32}, {f128, i32}})
495 .legalFor({{i32, f32}, {i32, f64}, {i64, f32}, {i64, f64}})
496 .legalFor(HasFP16, {{i32, f16}, {i64, f16}})
501 .legalFor({{i64, f32}, {i64, f64}})
502 .legalFor(HasFP16, {{i64, f16}})
520 for (
unsigned Op : {G_SEXTLOAD, G_ZEXTLOAD}) {
523 if (
Op == G_SEXTLOAD)
528 .legalForTypesWithMemDesc({{s32, p0, s8, 8},
536 {v2s32, p0, s64, 8}})
537 .widenScalarToNextPow2(0)
538 .clampScalar(0, s32, s64)
541 .unsupportedIfMemSizeNotPow2()
553 return HasRCPC3 && Query.
Types[0] == s128 &&
557 return Query.
Types[0] == s128 &&
560 .legalForTypesWithMemDesc({{s8, p0, s8, 8},
567 {v16s8, p0, s128, 8},
569 {v8s16, p0, s128, 8},
571 {v4s32, p0, s128, 8},
572 {v2s64, p0, s128, 8}})
574 .legalForTypesWithMemDesc(
575 {{s32, p0, s8, 8}, {s32, p0, s16, 8}, {s64, p0, s32, 8}})
576 .legalForTypesWithMemDesc({
578 {nxv16s8, p0, nxv16s8, 8},
579 {nxv8s16, p0, nxv8s16, 8},
580 {nxv4s32, p0, nxv4s32, 8},
581 {nxv2s64, p0, nxv2s64, 8},
583 .widenScalarToNextPow2(0, 8)
594 return Query.
Types[0].isScalar() &&
596 Query.
Types[0].getSizeInBits() > 32;
605 .customIf(IsPtrVecPred)
611 return HasRCPC3 && Query.
Types[0] == s128 &&
615 return Query.
Types[0] == s128 &&
623 {{s8, p0, s8, 8}, {s16, p0, s8, 8},
626 {s16, p0, s16, 8}, {s32, p0, s16, 8},
628 {s32, p0, s8, 8}, {s32, p0, s16, 8}, {s32, p0, s32, 8},
629 {s64, p0, s64, 8}, {s64, p0, s32, 8},
630 {p0, p0, s64, 8}, {s128, p0, s128, 8}, {v16s8, p0, s128, 8},
631 {v8s8, p0, s64, 8}, {v4s16, p0, s64, 8}, {v8s16, p0, s128, 8},
632 {v2s32, p0, s64, 8}, {v4s32, p0, s128, 8}, {v2s64, p0, s128, 8}})
633 .legalForTypesWithMemDesc({
638 {nxv16s8, p0, nxv16s8, 8},
639 {nxv8s16, p0, nxv8s16, 8},
640 {nxv4s32, p0, nxv4s32, 8},
641 {nxv2s64, p0, nxv2s64, 8},
643 .clampScalar(0, s8, s64)
646 return Query.
Types[0].isScalar() &&
650 .clampMaxNumElements(0, s8, 16)
659 return Query.
Types[0].getSizeInBits() ==
660 Query.
MMODescrs[0].MemoryTy.getSizeInBits();
666 .customIf(IsPtrVecPred)
684 {p0, v16s8, v16s8, 8},
685 {p0, v4s16, v4s16, 8},
686 {p0, v8s16, v8s16, 8},
687 {p0, v2s32, v2s32, 8},
688 {p0, v4s32, v4s32, 8},
689 {p0, v2s64, v2s64, 8},
695 auto IndexedLoadBasicPred = [=](
const LegalityQuery &Query) {
723 return MemTy == s8 || MemTy == s16;
725 return MemTy == s8 || MemTy == s16 || MemTy == s32;
733 .widenScalarToNextPow2(0)
740 .
legalFor({{i32, i32}, {i32, i64}, {i32, p0}})
750 return Ty.isVector() && !SrcTy.isPointerVector() &&
751 Ty.getElementType() != SrcTy.getElementType();
759 return Query.
Types[1].isPointerVector();
776 .legalFor(HasFP16, {{i32, f16}, {v4i16, v4f16}, {v8i16, v8f16}})
781 return (!HasFP16 && Q.
Types[1].getScalarType().isFloat16()) ||
782 Q.
Types[1].getScalarType().isBFloat16();
790 return Ty.isVector() && !SrcTy.isPointerVector() &&
791 Ty.getElementType() != SrcTy.getElementType();
794 .clampNumElements(1, v4s16, v8s16)
802 unsigned DstSize = Query.
Types[0].getSizeInBits();
805 if (Query.
Types[0].isVector())
808 if (DstSize < 8 || DstSize >= 128 || !
isPowerOf2_32(DstSize))
816 unsigned SrcSize = SrcTy.getSizeInBits();
823 .legalIf(ExtLegalFunc)
824 .
legalFor({{v8s16, v8s8}, {v4s32, v4s16}, {v2s64, v2s32}})
825 .clampScalar(0, s64, s64)
832 return (Query.
Types[0].getScalarSizeInBits() >
833 Query.
Types[1].getScalarSizeInBits() * 2) &&
834 Query.
Types[0].isVector() &&
835 (Query.
Types[1].getScalarSizeInBits() == 8 ||
836 Query.
Types[1].getScalarSizeInBits() == 16);
838 .clampMinNumElements(1, s8, 8)
843 .
legalFor({{v8s8, v8s16}, {v4s16, v4s32}, {v2s32, v2s64}})
854 return DstTy.
isVector() && SrcTy.getSizeInBits() > 128 &&
857 .clampMinNumElements(0, s8, 8)
862 .legalFor({{v8i8, v8i16}, {v4i16, v4i32}, {v2i32, v2i64}})
863 .clampNumElements(0, v2s32, v2s32);
866 .
legalFor({i32, i64, v8i8, v16i8, v4i16, v8i16, v2i32, v4i32, v2i64})
877 {{f16, f32}, {f16, f64}, {f32, f64}, {v4f16, v4f32}, {v2f32, v2f64}})
878 .legalFor(ST.hasBF16(), {{bf16, f32}, {v4bf16, v4f32}})
879 .libcallFor({{f16, f128}, {f32, f128}, {f64, f128}})
887 .lowerFor({{bf16, f32}, {v4bf16, v4f32}})
889 .clampNumElements(1, v4s32, v4s32)
893 getActionDefinitionsBuilder(G_FPEXT)
901 .libcallFor({{f128, f64}, {f128, f32}, {f128, f16}})
912 .clampNumElements(0, v4s32, v4s32)
917 getActionDefinitionsBuilder({G_FPTOSI, G_FPTOUI})
918 .legalFor({{i32, f32},
926 {{i32, f16}, {i64, f16}, {v4i16, v4f16}, {v8i16, v8f16}})
933 return Query.
Types[1] == f16 && Query.
Types[0].getSizeInBits() > 64;
942 return Query.
Types[0].getScalarSizeInBits() <= 64 &&
943 Query.
Types[0].getScalarSizeInBits() >
944 Query.
Types[1].getScalarSizeInBits();
949 return Query.
Types[1].getScalarSizeInBits() <= 64 &&
950 Query.
Types[0].getScalarSizeInBits() <
951 Query.
Types[1].getScalarSizeInBits();
954 .clampNumElements(0, v4s16, v8s16)
958 {{i32, f128}, {i64, f128}, {i128, f128}, {i128, f32}, {i128, f64}});
960 getActionDefinitionsBuilder({G_FPTOSI_SAT, G_FPTOUI_SAT})
961 .legalFor({{i32, f32},
970 {{i16, f16}, {i32, f16}, {i64, f16}, {v4i16, v4f16}, {v8i16, v8f16}})
978 return Query.
Types[1] == f16 && Query.
Types[0].getSizeInBits() > 64;
988 unsigned ITySize = Query.
Types[0].getScalarSizeInBits();
989 return (ITySize == 16 || ITySize == 32 || ITySize == 64) &&
990 ITySize > Query.
Types[1].getScalarSizeInBits();
995 unsigned FTySize = Query.
Types[1].getScalarSizeInBits();
996 return (FTySize == 16 || FTySize == 32 || FTySize == 64) &&
997 Query.
Types[0].getScalarSizeInBits() < FTySize;
1005 getActionDefinitionsBuilder({G_SITOFP, G_UITOFP})
1006 .legalFor({{f32, i32},
1014 {{f16, i32}, {f16, i64}, {v4f16, v4i16}, {v8f16, v8i16}})
1016 return Query.
Types[0].getScalarType().isBFloat16();
1024 return Query.
Types[1].isVector() &&
1025 Query.
Types[1].getScalarSizeInBits() == 64 &&
1026 Query.
Types[0].getScalarSizeInBits() == 16;
1028 .widenScalarOrEltToNextPow2OrMinSize(0, HasFP16 ? 16 : 32)
1032 return Query.
Types[0].getScalarSizeInBits() == 32 &&
1033 Query.
Types[1].getScalarSizeInBits() == 64;
1038 return Query.
Types[1].getScalarSizeInBits() <= 64 &&
1039 Query.
Types[0].getScalarSizeInBits() <
1040 Query.
Types[1].getScalarSizeInBits();
1045 return Query.
Types[0].getScalarSizeInBits() <= 64 &&
1046 Query.
Types[0].getScalarSizeInBits() >
1047 Query.
Types[1].getScalarSizeInBits();
1050 .clampNumElements(0, v4s16, v8s16)
1062 getActionDefinitionsBuilder(G_BRCOND)
1064 .clampScalar(0, s32, s32);
1065 getActionDefinitionsBuilder(G_BRINDIRECT).
legalFor({p0});
1067 getActionDefinitionsBuilder(G_SELECT)
1068 .
legalFor({{s32, s32}, {s64, s32}, {p0, s32}})
1069 .widenScalarToNextPow2(0)
1077 getActionDefinitionsBuilder(G_FRAME_INDEX).
legalFor({p0});
1080 getActionDefinitionsBuilder(G_GLOBAL_VALUE).
custom();
1082 getActionDefinitionsBuilder(G_GLOBAL_VALUE).
legalFor({p0});
1084 getActionDefinitionsBuilder(G_PTRAUTH_GLOBAL_VALUE)
1087 getActionDefinitionsBuilder(G_PTRTOINT)
1088 .
legalFor({{i64, p0}, {v2i64, v2p0}})
1089 .widenScalarToNextPow2(0, 64)
1093 getActionDefinitionsBuilder(G_INTTOPTR)
1095 return Query.
Types[0].getSizeInBits() != Query.
Types[1].getSizeInBits();
1097 .legalFor({{p0, i64}, {v2p0, v2i64}})
1098 .clampMaxNumElements(1, s64, 2);
1102 getActionDefinitionsBuilder(G_BITCAST)
1105 .legalForCartesianProduct({s32, v2s16, v4s8})
1106 .legalForCartesianProduct({s64, v8s8, v4s16, v2s32})
1107 .legalForCartesianProduct({s128, v16s8, v8s16, v4s32, v2s64, v2p0})
1116 return Query.
Types[0].isVector() != Query.
Types[1].isVector();
1125 getActionDefinitionsBuilder(G_VASTART).
legalFor({p0});
1129 getActionDefinitionsBuilder(G_VAARG)
1131 .clampScalar(0, s8, s64)
1134 getActionDefinitionsBuilder(G_ATOMIC_CMPXCHG_WITH_SUCCESS)
1138 bool UseOutlineAtomics =
ST.outlineAtomics() && !
ST.hasLSE();
1140 getActionDefinitionsBuilder(G_ATOMIC_CMPXCHG)
1141 .legalFor(!UseOutlineAtomics, {{s32, p0}, {s64, p0}})
1142 .customFor(!UseOutlineAtomics, {{s128, p0}})
1143 .libcallFor(UseOutlineAtomics,
1144 {{s8, p0}, {s16, p0}, {s32, p0}, {s64, p0}, {s128, p0}})
1145 .clampScalar(0, s32, s64);
1147 getActionDefinitionsBuilder({G_ATOMICRMW_XCHG, G_ATOMICRMW_ADD,
1148 G_ATOMICRMW_SUB, G_ATOMICRMW_AND, G_ATOMICRMW_OR,
1150 .legalFor(!UseOutlineAtomics, {{s32, p0}, {s64, p0}})
1151 .libcallFor(UseOutlineAtomics,
1152 {{s8, p0}, {s16, p0}, {s32, p0}, {s64, p0}})
1153 .clampScalar(0, s32, s64);
1157 getActionDefinitionsBuilder(
1158 {G_ATOMICRMW_MIN, G_ATOMICRMW_MAX, G_ATOMICRMW_UMIN, G_ATOMICRMW_UMAX})
1160 .clampScalar(0, s32, s64);
1162 getActionDefinitionsBuilder(G_BLOCK_ADDR).legalFor({p0});
1165 for (
unsigned Op : {G_MERGE_VALUES, G_UNMERGE_VALUES}) {
1166 unsigned BigTyIdx =
Op == G_MERGE_VALUES ? 0 : 1;
1167 unsigned LitTyIdx =
Op == G_MERGE_VALUES ? 1 : 0;
1168 getActionDefinitionsBuilder(
Op)
1169 .widenScalarToNextPow2(LitTyIdx, 8)
1170 .widenScalarToNextPow2(BigTyIdx, 32)
1171 .clampScalar(LitTyIdx, s8, s64)
1172 .clampScalar(BigTyIdx, s32, s128)
1174 switch (Q.
Types[BigTyIdx].getSizeInBits()) {
1182 switch (Q.
Types[LitTyIdx].getSizeInBits()) {
1195 getActionDefinitionsBuilder(G_EXTRACT_VECTOR_ELT)
1196 .legalFor(HasSVE, {{s16, nxv16s8, s64},
1197 {s16, nxv8s16, s64},
1198 {s32, nxv4s32, s64},
1199 {s64, nxv2s64, s64}})
1201 const LLT &EltTy = Query.
Types[1].getElementType();
1202 if (Query.
Types[1].isScalableVector())
1204 return Query.
Types[0] != EltTy;
1209 return VecTy == v8s8 || VecTy == v16s8 || VecTy == v2s16 ||
1210 VecTy == v4s16 || VecTy == v8s16 || VecTy == v2s32 ||
1211 VecTy == v4s32 || VecTy == v2s64 || VecTy == v2p0;
1217 return Query.
Types[1].isFixedVector() &&
1218 Query.
Types[1].getNumElements() <= 2;
1223 return Query.
Types[1].isFixedVector() &&
1224 Query.
Types[1].getNumElements() <= 4;
1229 return Query.
Types[1].isFixedVector() &&
1230 Query.
Types[1].getNumElements() <= 8;
1235 return Query.
Types[1].isFixedVector() &&
1236 Query.
Types[1].getNumElements() <= 16;
1239 .minScalarOrElt(0, s8)
1240 .moreElementsToNextPow2(1)
1241 .clampMaxNumElements(1, s64, 2)
1242 .clampMaxNumElements(1, s32, 4)
1243 .clampMaxNumElements(1, s16, 8)
1244 .clampMaxNumElements(1, s8, 16)
1245 .clampMaxNumElements(1, p0, 2)
1248 getActionDefinitionsBuilder(G_INSERT_VECTOR_ELT)
1250 typeInSet(0, {v8s8, v16s8, v4s16, v8s16, v2s32, v4s32, v2s64, v2p0}))
1251 .legalFor(HasSVE, {{nxv16s8, s32, s64},
1252 {nxv8s16, s32, s64},
1253 {nxv4s32, s32, s64},
1254 {nxv2s64, s64, s64}})
1256 .widenVectorEltsToVectorMinSize(0, 64)
1257 .clampNumElements(0, v8s8, v16s8)
1258 .clampNumElements(0, v4s16, v8s16)
1259 .clampNumElements(0, v2s32, v4s32)
1260 .clampMaxNumElements(0, s64, 2)
1261 .clampMaxNumElements(0, p0, 2)
1264 getActionDefinitionsBuilder(G_BUILD_VECTOR)
1265 .legalFor({{v8s8, s8},
1273 .clampNumElements(0, v4s32, v4s32)
1274 .clampNumElements(0, v2s64, v2s64)
1275 .minScalarOrElt(0, s8)
1276 .widenVectorEltsToVectorMinSize(0, 64)
1277 .widenScalarOrEltToNextPow2(0)
1278 .minScalarSameAs(1, 0);
1280 getActionDefinitionsBuilder(G_BUILD_VECTOR_TRUNC).lower();
1282 getActionDefinitionsBuilder(G_SHUFFLE_VECTOR)
1291 {v8s8, v16s8, v4s16, v8s16, v2s32, v4s32, v2s64}, DstTy);
1295 return Query.
Types[0].getNumElements() >
1296 Query.
Types[1].getNumElements();
1302 return Query.
Types[0].getNumElements() <
1303 Query.
Types[1].getNumElements();
1306 .widenScalarOrEltToNextPow2OrMinSize(0, 8)
1307 .clampNumElements(0, v8s8, v16s8)
1308 .clampNumElements(0, v4s16, v8s16)
1309 .clampNumElements(0, v4s32, v4s32)
1310 .clampNumElements(0, v2s64, v2s64)
1319 getActionDefinitionsBuilder(G_CONCAT_VECTORS)
1320 .legalFor({{v16s8, v8s8}, {v8s16, v4s16}, {v4s32, v2s32}})
1322 return Query.
Types[0].isFixedVector() &&
1323 Query.
Types[0].getScalarSizeInBits() < 8;
1327 return Query.
Types[0].isFixedVector() &&
1328 Query.
Types[1].isFixedVector() &&
1329 Query.
Types[0].getScalarSizeInBits() >= 8 &&
1331 Query.
Types[0].getSizeInBits() <= 128 &&
1332 Query.
Types[1].getSizeInBits() <= 64;
1344 getActionDefinitionsBuilder(G_EXTRACT_SUBVECTOR)
1345 .legalFor({{v8s8, v16s8}, {v4s16, v8s16}, {v2s32, v4s32}})
1350 getActionDefinitionsBuilder(G_SPLAT_VECTOR)
1351 .legalFor(HasSVE, {{nxv4s32, s32}, {nxv2s64, s64}});
1353 getActionDefinitionsBuilder(G_JUMP_TABLE).legalFor({p0});
1355 getActionDefinitionsBuilder(G_BRJT).legalFor({{p0, s64}});
1357 getActionDefinitionsBuilder({G_TRAP, G_DEBUGTRAP, G_UBSANTRAP}).alwaysLegal();
1359 getActionDefinitionsBuilder(G_DYN_STACKALLOC).custom();
1361 getActionDefinitionsBuilder({G_STACKSAVE, G_STACKRESTORE}).lower();
1366 getActionDefinitionsBuilder(G_BZERO).unsupported();
1368 getActionDefinitionsBuilder(G_MEMSET)
1369 .legalForCartesianProduct({p0}, {s64}, {s64})
1370 .customForCartesianProduct({p0}, {s8}, {s64})
1373 getActionDefinitionsBuilder({G_MEMCPY, G_MEMMOVE})
1374 .legalForCartesianProduct({p0}, {p0}, {s64})
1378 getActionDefinitionsBuilder(G_MEMCPY_INLINE)
1379 .legalForCartesianProduct({p0}, {p0}, {s64});
1381 getActionDefinitionsBuilder(G_MEMSET_INLINE)
1382 .legalForCartesianProduct({p0}, {s64}, {s64})
1383 .customForCartesianProduct({p0}, {s8}, {s64});
1385 getActionDefinitionsBuilder({G_BZERO, G_MEMCPY, G_MEMMOVE, G_MEMSET})
1392 getActionDefinitionsBuilder(G_VECREDUCE_FADD)
1393 .legalFor({{f32, v2f32}, {f32, v4f32}, {f64, v2f64}})
1394 .legalFor(HasFP16, {{f16, v4f16}, {f16, v8f16}})
1395 .minScalarOrElt(0, MinFPScalar)
1396 .clampMaxNumElements(1, s64, 2)
1397 .clampMaxNumElements(1, s32, 4)
1398 .clampMaxNumElements(1, s16, 8)
1399 .moreElementsToNextPow2(1)
1406 getActionDefinitionsBuilder(G_VECREDUCE_FMUL)
1407 .minScalarOrElt(0, MinFPScalar)
1408 .clampMaxNumElements(1, s64, 2)
1409 .clampMaxNumElements(1, s32, 4)
1410 .clampMaxNumElements(1, s16, 8)
1411 .clampMaxNumElements(1, s32, 2)
1412 .clampMaxNumElements(1, s16, 4)
1416 getActionDefinitionsBuilder({G_VECREDUCE_SEQ_FADD, G_VECREDUCE_SEQ_FMUL})
1420 getActionDefinitionsBuilder(G_VECREDUCE_ADD)
1421 .legalFor({{i8, v8i8},
1429 .clampMaxNumElements(1, s64, 2)
1430 .clampMaxNumElements(1, s32, 4)
1431 .clampMaxNumElements(1, s16, 8)
1432 .clampMaxNumElements(1, s8, 16)
1433 .widenVectorEltsToVectorMinSize(1, 64)
1436 getActionDefinitionsBuilder({G_VECREDUCE_FMIN, G_VECREDUCE_FMAX,
1437 G_VECREDUCE_FMINIMUM, G_VECREDUCE_FMAXIMUM})
1438 .legalFor({{f32, v2f32}, {f32, v4f32}, {f64, v2f64}})
1439 .legalFor(HasFP16, {{f16, v4f16}, {f16, v8f16}})
1440 .minScalarOrElt(0, MinFPScalar)
1441 .clampMaxNumElements(1, s64, 2)
1442 .clampMaxNumElements(1, s32, 4)
1443 .clampMaxNumElements(1, s16, 8)
1447 getActionDefinitionsBuilder(G_VECREDUCE_MUL)
1448 .clampMaxNumElements(1, s32, 2)
1449 .clampMaxNumElements(1, s16, 4)
1450 .clampMaxNumElements(1, s8, 8)
1454 getActionDefinitionsBuilder(
1455 {G_VECREDUCE_SMIN, G_VECREDUCE_SMAX, G_VECREDUCE_UMIN, G_VECREDUCE_UMAX})
1456 .legalFor({{i8, v8i8},
1464 return Query.
Types[1].isVector() &&
1465 Query.
Types[1].getElementType() != s8 &&
1466 Query.
Types[1].getNumElements() & 1;
1469 .clampMaxNumElements(1, s64, 2)
1470 .clampMaxNumElements(1, s32, 4)
1471 .clampMaxNumElements(1, s16, 8)
1472 .clampMaxNumElements(1, s8, 16)
1476 getActionDefinitionsBuilder(
1477 {G_VECREDUCE_OR, G_VECREDUCE_AND, G_VECREDUCE_XOR})
1493 return std::make_pair(1, SrcTy.
divide(2));
1499 getActionDefinitionsBuilder(G_VECTOR_COMPRESS).lower();
1502 getActionDefinitionsBuilder({G_GET_FPENV, G_SET_FPENV, G_RESET_FPENV,
1503 G_GET_FPMODE, G_SET_FPMODE, G_RESET_FPMODE})
1506 getActionDefinitionsBuilder(G_IS_FPCLASS).lower();
1508 getActionDefinitionsBuilder(G_PREFETCH).custom();
1510 getActionDefinitionsBuilder({G_SCMP, G_UCMP}).lower();
1512 getActionDefinitionsBuilder({G_INTRINSIC, G_INTRINSIC_W_SIDE_EFFECTS})
1514 getActionDefinitionsBuilder(G_FENCE).alwaysLegal();
1515 getActionDefinitionsBuilder(G_INVOKE_REGION_START).alwaysLegal();
1517 getLegacyLegalizerInfo().computeTables();
1764 auto LowerUnaryOp = [&
MI, &MIB](
unsigned Opcode) {
1766 MI.eraseFromParent();
1769 auto LowerBinOp = [&
MI, &MIB](
unsigned Opcode) {
1771 {
MI.getOperand(2),
MI.getOperand(3)});
1772 MI.eraseFromParent();
1775 auto LowerTriOp = [&
MI, &MIB](
unsigned Opcode) {
1777 {
MI.getOperand(2),
MI.getOperand(3),
MI.getOperand(4)});
1778 MI.eraseFromParent();
1783 switch (IntrinsicID) {
1784 case Intrinsic::vacopy: {
1785 unsigned PtrSize = ST->isTargetILP32() ? 4 : 8;
1786 unsigned VaListSize =
1787 (ST->isTargetDarwin() || ST->isTargetWindows())
1789 : ST->isTargetILP32() ? 20 : 32;
1797 VaListSize,
Align(PtrSize)));
1801 VaListSize,
Align(PtrSize)));
1802 MI.eraseFromParent();
1805 case Intrinsic::get_dynamic_area_offset: {
1807 MI.eraseFromParent();
1810 case Intrinsic::aarch64_mops_memset_tag: {
1811 assert(
MI.getOpcode() == TargetOpcode::G_INTRINSIC_W_SIDE_EFFECTS);
1814 auto &
Value =
MI.getOperand(3);
1816 Value.setReg(ExtValueReg);
1819 case Intrinsic::aarch64_prefetch: {
1820 auto &AddrVal =
MI.getOperand(1);
1822 int64_t IsWrite =
MI.getOperand(2).getImm();
1823 int64_t
Target =
MI.getOperand(3).getImm();
1824 int64_t IsStream =
MI.getOperand(4).getImm();
1825 int64_t IsData =
MI.getOperand(5).getImm();
1827 unsigned PrfOp = (IsWrite << 4) |
1833 MI.eraseFromParent();
1836 case Intrinsic::aarch64_range_prefetch: {
1837 auto &AddrVal =
MI.getOperand(1);
1839 int64_t IsWrite =
MI.getOperand(2).getImm();
1840 int64_t IsStream =
MI.getOperand(3).getImm();
1841 unsigned PrfOp = (IsStream << 2) | IsWrite;
1843 MIB.
buildInstr(AArch64::G_AARCH64_RANGE_PREFETCH)
1846 .
addUse(
MI.getOperand(4).getReg());
1847 MI.eraseFromParent();
1850 case Intrinsic::aarch64_prefetch_ir: {
1851 auto &AddrVal =
MI.getOperand(1);
1853 MI.eraseFromParent();
1856 case Intrinsic::aarch64_neon_uaddv:
1857 case Intrinsic::aarch64_neon_saddv:
1858 case Intrinsic::aarch64_neon_umaxv:
1859 case Intrinsic::aarch64_neon_smaxv:
1860 case Intrinsic::aarch64_neon_uminv:
1861 case Intrinsic::aarch64_neon_sminv: {
1862 bool IsSigned = IntrinsicID == Intrinsic::aarch64_neon_saddv ||
1863 IntrinsicID == Intrinsic::aarch64_neon_smaxv ||
1864 IntrinsicID == Intrinsic::aarch64_neon_sminv;
1866 auto OldDst =
MI.getOperand(0).getReg();
1867 auto OldDstTy = MRI.
getType(OldDst);
1869 if (OldDstTy == NewDstTy)
1875 MI.getOperand(0).setReg(NewDst);
1879 MIB.
buildExtOrTrunc(IsSigned ? TargetOpcode::G_SEXT : TargetOpcode::G_ZEXT,
1884 case Intrinsic::aarch64_neon_uaddlp:
1885 case Intrinsic::aarch64_neon_saddlp: {
1886 unsigned Opc = IntrinsicID == Intrinsic::aarch64_neon_uaddlp
1888 : AArch64::G_SADDLP;
1890 MI.eraseFromParent();
1894 case Intrinsic::aarch64_neon_uaddlv:
1895 case Intrinsic::aarch64_neon_saddlv: {
1896 unsigned Opc = IntrinsicID == Intrinsic::aarch64_neon_uaddlv
1898 : AArch64::G_SADDLV;
1925 MI.eraseFromParent();
1929 case Intrinsic::aarch64_neon_smax:
1930 return LowerBinOp(TargetOpcode::G_SMAX);
1931 case Intrinsic::aarch64_neon_smin:
1932 return LowerBinOp(TargetOpcode::G_SMIN);
1933 case Intrinsic::aarch64_neon_umax:
1934 return LowerBinOp(TargetOpcode::G_UMAX);
1935 case Intrinsic::aarch64_neon_umin:
1936 return LowerBinOp(TargetOpcode::G_UMIN);
1937 case Intrinsic::aarch64_neon_fmax:
1938 return LowerBinOp(TargetOpcode::G_FMAXIMUM);
1939 case Intrinsic::aarch64_neon_fmin:
1940 return LowerBinOp(TargetOpcode::G_FMINIMUM);
1941 case Intrinsic::aarch64_neon_fmaxnm:
1942 return LowerBinOp(TargetOpcode::G_FMAXNUM);
1943 case Intrinsic::aarch64_neon_fminnm:
1944 return LowerBinOp(TargetOpcode::G_FMINNUM);
1945 case Intrinsic::aarch64_neon_pmul:
1946 return LowerBinOp(TargetOpcode::G_CLMUL);
1947 case Intrinsic::aarch64_neon_pmull:
1948 case Intrinsic::aarch64_neon_pmull64:
1949 return LowerBinOp(AArch64::G_PMULL);
1950 case Intrinsic::aarch64_neon_smull:
1951 return LowerBinOp(AArch64::G_SMULL);
1952 case Intrinsic::aarch64_neon_umull:
1953 return LowerBinOp(AArch64::G_UMULL);
1954 case Intrinsic::aarch64_neon_sabd:
1955 return LowerBinOp(TargetOpcode::G_ABDS);
1956 case Intrinsic::aarch64_neon_uabd:
1957 return LowerBinOp(TargetOpcode::G_ABDU);
1958 case Intrinsic::aarch64_neon_uhadd:
1959 return LowerBinOp(TargetOpcode::G_UAVGFLOOR);
1960 case Intrinsic::aarch64_neon_urhadd:
1961 return LowerBinOp(TargetOpcode::G_UAVGCEIL);
1962 case Intrinsic::aarch64_neon_shadd:
1963 return LowerBinOp(TargetOpcode::G_SAVGFLOOR);
1964 case Intrinsic::aarch64_neon_srhadd:
1965 return LowerBinOp(TargetOpcode::G_SAVGCEIL);
1966 case Intrinsic::aarch64_neon_sqshrn: {
1971 {MRI.
getType(
MI.getOperand(2).getReg())},
1972 {
MI.getOperand(2),
MI.getOperand(3).getImm()});
1974 MIB.
buildInstr(TargetOpcode::G_TRUNC_SSAT_S, {
MI.getOperand(0)}, {Shr});
1975 MI.eraseFromParent();
1978 case Intrinsic::aarch64_neon_sqshrun: {
1983 {MRI.
getType(
MI.getOperand(2).getReg())},
1984 {
MI.getOperand(2),
MI.getOperand(3).getImm()});
1986 MIB.
buildInstr(TargetOpcode::G_TRUNC_SSAT_U, {
MI.getOperand(0)}, {Shr});
1987 MI.eraseFromParent();
1990 case Intrinsic::aarch64_neon_sqrshrn: {
1994 auto Shr = MIB.
buildInstr(AArch64::G_SRSHR_I,
1995 {MRI.
getType(
MI.getOperand(2).getReg())},
1996 {
MI.getOperand(2),
MI.getOperand(3).getImm()});
1998 MIB.
buildInstr(TargetOpcode::G_TRUNC_SSAT_S, {
MI.getOperand(0)}, {Shr});
1999 MI.eraseFromParent();
2002 case Intrinsic::aarch64_neon_sqrshrun: {
2006 auto Shr = MIB.
buildInstr(AArch64::G_SRSHR_I,
2007 {MRI.
getType(
MI.getOperand(2).getReg())},
2008 {
MI.getOperand(2),
MI.getOperand(3).getImm()});
2010 MIB.
buildInstr(TargetOpcode::G_TRUNC_SSAT_U, {
MI.getOperand(0)}, {Shr});
2011 MI.eraseFromParent();
2014 case Intrinsic::aarch64_neon_uqrshrn: {
2018 auto Shr = MIB.
buildInstr(AArch64::G_URSHR_I,
2019 {MRI.
getType(
MI.getOperand(2).getReg())},
2020 {
MI.getOperand(2),
MI.getOperand(3).getImm()});
2022 MIB.
buildInstr(TargetOpcode::G_TRUNC_USAT_U, {
MI.getOperand(0)}, {Shr});
2023 MI.eraseFromParent();
2026 case Intrinsic::aarch64_neon_uqshrn: {
2031 {MRI.
getType(
MI.getOperand(2).getReg())},
2032 {
MI.getOperand(2),
MI.getOperand(3).getImm()});
2034 MIB.
buildInstr(TargetOpcode::G_TRUNC_USAT_U, {
MI.getOperand(0)}, {Shr});
2035 MI.eraseFromParent();
2038 case Intrinsic::aarch64_neon_sqshlu: {
2044 MIB.
buildInstr(AArch64::G_SQSHLU_I, {
MI.getOperand(0)},
2046 .addImm(ShiftAmount->getSExtValue());
2047 MI.eraseFromParent();
2052 case Intrinsic::aarch64_neon_vsli: {
2054 AArch64::G_SLI, {
MI.getOperand(0)},
2055 {
MI.getOperand(2),
MI.getOperand(3),
MI.getOperand(4).getImm()});
2056 MI.eraseFromParent();
2059 case Intrinsic::aarch64_neon_vsri: {
2061 AArch64::G_SRI, {
MI.getOperand(0)},
2062 {
MI.getOperand(2),
MI.getOperand(3),
MI.getOperand(4).getImm()});
2063 MI.eraseFromParent();
2066 case Intrinsic::aarch64_neon_abs: {
2068 MIB.
buildInstr(TargetOpcode::G_ABS, {
MI.getOperand(0)}, {
MI.getOperand(2)});
2069 MI.eraseFromParent();
2072 case Intrinsic::aarch64_neon_sqadd: {
2074 return LowerBinOp(TargetOpcode::G_SADDSAT);
2077 case Intrinsic::aarch64_neon_sqsub: {
2079 return LowerBinOp(TargetOpcode::G_SSUBSAT);
2082 case Intrinsic::aarch64_neon_uqadd: {
2084 return LowerBinOp(TargetOpcode::G_UADDSAT);
2087 case Intrinsic::aarch64_neon_uqsub: {
2089 return LowerBinOp(TargetOpcode::G_USUBSAT);
2092 case Intrinsic::aarch64_neon_udot:
2093 return LowerTriOp(AArch64::G_UDOT);
2094 case Intrinsic::aarch64_neon_sdot:
2095 return LowerTriOp(AArch64::G_SDOT);
2096 case Intrinsic::aarch64_neon_usdot:
2097 return LowerTriOp(AArch64::G_USDOT);
2098 case Intrinsic::aarch64_neon_sqxtn:
2099 return LowerUnaryOp(TargetOpcode::G_TRUNC_SSAT_S);
2100 case Intrinsic::aarch64_neon_sqxtun:
2101 return LowerUnaryOp(TargetOpcode::G_TRUNC_SSAT_U);
2102 case Intrinsic::aarch64_neon_uqxtn:
2103 return LowerUnaryOp(TargetOpcode::G_TRUNC_USAT_U);
2104 case Intrinsic::aarch64_neon_fcvtzu:
2105 return LowerUnaryOp(TargetOpcode::G_FPTOUI_SAT);
2106 case Intrinsic::aarch64_neon_fcvtzs:
2107 return LowerUnaryOp(TargetOpcode::G_FPTOSI_SAT);
2108 case Intrinsic::aarch64_neon_cls:
2109 return LowerUnaryOp(TargetOpcode::G_CTLS);
2111 case Intrinsic::vector_reverse: