107 std::initializer_list<LLT> PackedVectorAllTypeList = {
113 std::initializer_list<LLT> ScalarAndPtrTypesList = {s8, s16, s32, s64, p0};
117 const TargetMachine &TM = ST.getTargetLowering()->getTargetMachine();
120 if (!ST.hasNEON() || !ST.hasFPARMv8()) {
127 const bool HasFP16 = ST.hasFullFP16();
128 const LLT &MinFPScalar = HasFP16 ? f16 : f32;
130 const bool HasCSSC = ST.hasCSSC();
131 const bool HasRCPC3 = ST.hasRCPC3();
132 const bool HasSVE = ST.hasSVE();
135 {G_IMPLICIT_DEF, G_FREEZE, G_CONSTANT_FOLD_BARRIER})
136 .legalFor({p0, s8, s16, s32, s64})
137 .legalFor({v2s8, v4s8, v8s8, v16s8, v2s16, v4s16, v8s16, v2s32, v4s32,
139 .widenScalarToNextPow2(0)
152 .legalFor(PackedVectorAllTypeList)
166 .widenScalarToNextPow2(0)
171 .maxScalarIf(
typeInSet(0, {s64, p0}), 1, s32);
176 .widenScalarToNextPow2(1)
181 .maxScalarIf(
typeInSet(1, {s64, p0}), 0, s32)
182 .maxScalarIf(
typeInSet(1, {s128}), 0, s64);
185 .legalFor({i32, i64, v8i8, v16i8, v4i16, v8i16, v2i32, v4i32, v2i64})
186 .legalFor(HasSVE, {nxv16i8, nxv8i16, nxv4i32, nxv2i64})
187 .widenScalarToNextPow2(0)
195 return Query.
Types[0].getNumElements() <= 2;
200 return Query.
Types[0].getNumElements() <= 4;
205 return Query.
Types[0].getNumElements() <= 16;
212 .
legalFor({i32, i64, v8i8, v16i8, v4i16, v8i16, v2i32, v4i32, v2i64})
213 .widenScalarToNextPow2(0)
221 return Query.
Types[0].getNumElements() <= 2;
226 return Query.
Types[0].getNumElements() <= 4;
231 return Query.
Types[0].getNumElements() <= 16;
239 const auto &SrcTy = Query.
Types[0];
240 const auto &AmtTy = Query.
Types[1];
241 return !SrcTy.isVector() && SrcTy.getSizeInBits() == 32 &&
242 AmtTy.getSizeInBits() == 32;
256 .widenScalarToNextPow2(0)
270 .
legalFor({{p0, i64}, {v2p0, v2i64}})
271 .clampScalarOrElt(1, s64, s64)
277 .legalFor({i32, i64})
279 .clampScalar(0, s32, s64)
284 .lowerFor({i8, i16, i32, i64, v2i32, v4i32, v2i64})
293 .widenScalarToNextPow2(0, 32)
298 .legalFor({i64, v16i8, v8i16, v4i32})
304 .legalFor({v8i8, v16i8, v4i16, v8i16, v2i32, v4i32})
305 .legalFor(HasCSSC, {i32, i64})
306 .minScalar(HasCSSC, 0, s32)
315 .legalFor({v16i8, v8i16, v4i32, v2i64, v2p0, v8i8, v4i16, v2i32})
319 return SrcTy.isScalar() && SrcTy.getSizeInBits() < 128;
323 [=](
const LegalityQuery &Query) {
return std::make_pair(0, v4i16); })
326 [=](
const LegalityQuery &Query) {
return std::make_pair(0, v2i32); })
327 .clampNumElements(0, v8s8, v16s8)
335 {G_ABDS, G_ABDU, G_UAVGFLOOR, G_UAVGCEIL, G_SAVGFLOOR, G_SAVGCEIL})
336 .legalFor({v8i8, v16i8, v4i16, v8i16, v2i32, v4i32})
340 {G_SADDE, G_SSUBE, G_UADDE, G_USUBE, G_SADDO, G_SSUBO, G_UADDO, G_USUBO})
341 .legalFor({{i32, i32}, {i64, i32}})
342 .clampScalar(0, s32, s64)
347 .customFor({{i32, i32}, {i32, i64}, {i64, i64}})
353 return Q.
Types[0].isScalar() && Q.
Types[1].getScalarSizeInBits() < 64;
359 .customFor({{s32, s32}, {s64, s64}});
363 .
legalFor(HasCSSC, {{i32, i32}, {i64, i64}})
364 .legalFor({{v8i8, v8i8}, {v16i8, v16i8}})
365 .customFor(!HasCSSC, {{s32, s32}, {s64, s64}})
366 .customFor({{s128, s128},
372 .clampScalar(0, s32, s128)
385 .legalFor({{i32, i32},
393 .widenScalarToNextPow2(1, 32)
411 .customFor(!HasCSSC, {s32, s64});
417 .widenScalarToNextPow2(0, 32)
431 .
legalFor({i32, i64, v4i16, v8i16, v2i32, v4i32, v2i64})
440 .legalFor({v8i8, v16i8, v4i16, v8i16, v2i32, v4i32, v2i64})
441 .legalFor(HasSVE, {nxv16i8, nxv8i16, nxv4i32, nxv2i64})
442 .clampNumElements(0, v8s8, v16s8)
451 {G_FADD, G_FSUB, G_FMUL, G_FDIV, G_FMA, G_FSQRT, G_FMAXNUM, G_FMINNUM,
452 G_FMAXIMUM, G_FMINIMUM, G_FCEIL, G_FFLOOR, G_FRINT, G_FNEARBYINT,
453 G_INTRINSIC_TRUNC, G_INTRINSIC_ROUND, G_INTRINSIC_ROUNDEVEN})
454 .legalFor({f32, f64, v2f32, v4f32, v2f64})
455 .legalFor(HasFP16, {f16, v4f16, v8f16})
460 return (!HasFP16 && Q.
Types[0].getScalarType().isFloat16()) ||
461 Q.
Types[0].getScalarType().isBFloat16();
464 .clampNumElements(0, v4s16, v8s16)
470 .legalFor({f32, f64, v2f32, v4f32, v2f64})
471 .legalFor(HasFP16, {f16, bf16, v4f16, v4bf16, v8f16, v8bf16})
478 .
lowerFor({f16, bf16, v4f16, v4bf16, v8f16, v8bf16});
481 G_FLOG10, G_FTAN, G_FEXP, G_FEXP2, G_FEXP10,
482 G_FACOS, G_FASIN, G_FATAN, G_FATAN2, G_FCOSH,
483 G_FSINH, G_FTANH, G_FMODF})
484 .libcallFor({f32, f64, f128})
488 .libcallFor({{f32, i32}, {f64, i32}, {f128, i32}})
493 .legalFor({{i32, f32}, {i32, f64}, {i64, f32}, {i64, f64}})
494 .legalFor(HasFP16, {{i32, f16}, {i64, f16}})
499 .legalFor({{i64, f32}, {i64, f64}})
500 .legalFor(HasFP16, {{i64, f16}})
518 for (
unsigned Op : {G_SEXTLOAD, G_ZEXTLOAD}) {
521 if (
Op == G_SEXTLOAD)
526 .legalForTypesWithMemDesc({{s32, p0, s8, 8},
534 {v2s32, p0, s64, 8}})
535 .widenScalarToNextPow2(0)
536 .clampScalar(0, s32, s64)
539 .unsupportedIfMemSizeNotPow2()
551 return HasRCPC3 && Query.
Types[0] == s128 &&
555 return Query.
Types[0] == s128 &&
558 .legalForTypesWithMemDesc({{s8, p0, s8, 8},
565 {v16s8, p0, s128, 8},
567 {v8s16, p0, s128, 8},
569 {v4s32, p0, s128, 8},
570 {v2s64, p0, s128, 8}})
572 .legalForTypesWithMemDesc(
573 {{s32, p0, s8, 8}, {s32, p0, s16, 8}, {s64, p0, s32, 8}})
574 .legalForTypesWithMemDesc({
576 {nxv16s8, p0, nxv16s8, 8},
577 {nxv8s16, p0, nxv8s16, 8},
578 {nxv4s32, p0, nxv4s32, 8},
579 {nxv2s64, p0, nxv2s64, 8},
581 .widenScalarToNextPow2(0, 8)
592 return Query.
Types[0].isScalar() &&
594 Query.
Types[0].getSizeInBits() > 32;
603 .customIf(IsPtrVecPred)
609 return HasRCPC3 && Query.
Types[0] == s128 &&
613 return Query.
Types[0] == s128 &&
621 {{s8, p0, s8, 8}, {s16, p0, s8, 8},
624 {s16, p0, s16, 8}, {s32, p0, s16, 8},
626 {s32, p0, s8, 8}, {s32, p0, s16, 8}, {s32, p0, s32, 8},
627 {s64, p0, s64, 8}, {s64, p0, s32, 8},
628 {p0, p0, s64, 8}, {s128, p0, s128, 8}, {v16s8, p0, s128, 8},
629 {v8s8, p0, s64, 8}, {v4s16, p0, s64, 8}, {v8s16, p0, s128, 8},
630 {v2s32, p0, s64, 8}, {v4s32, p0, s128, 8}, {v2s64, p0, s128, 8}})
631 .legalForTypesWithMemDesc({
636 {nxv16s8, p0, nxv16s8, 8},
637 {nxv8s16, p0, nxv8s16, 8},
638 {nxv4s32, p0, nxv4s32, 8},
639 {nxv2s64, p0, nxv2s64, 8},
641 .clampScalar(0, s8, s64)
644 return Query.
Types[0].isScalar() &&
648 .clampMaxNumElements(0, s8, 16)
657 return Query.
Types[0].getSizeInBits() ==
658 Query.
MMODescrs[0].MemoryTy.getSizeInBits();
664 .customIf(IsPtrVecPred)
682 {p0, v16s8, v16s8, 8},
683 {p0, v4s16, v4s16, 8},
684 {p0, v8s16, v8s16, 8},
685 {p0, v2s32, v2s32, 8},
686 {p0, v4s32, v4s32, 8},
687 {p0, v2s64, v2s64, 8},
693 auto IndexedLoadBasicPred = [=](
const LegalityQuery &Query) {
721 return MemTy == s8 || MemTy == s16;
723 return MemTy == s8 || MemTy == s16 || MemTy == s32;
731 .widenScalarToNextPow2(0)
738 .
legalFor({{i32, i32}, {i32, i64}, {i32, p0}})
748 return Ty.isVector() && !SrcTy.isPointerVector() &&
749 Ty.getElementType() != SrcTy.getElementType();
757 return Query.
Types[1].isPointerVector();
774 .legalFor(HasFP16, {{i32, f16}, {v4i16, v4f16}, {v8i16, v8f16}})
779 return (!HasFP16 && Q.
Types[1].getScalarType().isFloat16()) ||
780 Q.
Types[1].getScalarType().isBFloat16();
788 return Ty.isVector() && !SrcTy.isPointerVector() &&
789 Ty.getElementType() != SrcTy.getElementType();
792 .clampNumElements(1, v4s16, v8s16)
800 unsigned DstSize = Query.
Types[0].getSizeInBits();
803 if (Query.
Types[0].isVector())
806 if (DstSize < 8 || DstSize >= 128 || !
isPowerOf2_32(DstSize))
814 unsigned SrcSize = SrcTy.getSizeInBits();
821 .legalIf(ExtLegalFunc)
822 .
legalFor({{v8s16, v8s8}, {v4s32, v4s16}, {v2s64, v2s32}})
823 .clampScalar(0, s64, s64)
830 return (Query.
Types[0].getScalarSizeInBits() >
831 Query.
Types[1].getScalarSizeInBits() * 2) &&
832 Query.
Types[0].isVector() &&
833 (Query.
Types[1].getScalarSizeInBits() == 8 ||
834 Query.
Types[1].getScalarSizeInBits() == 16);
836 .clampMinNumElements(1, s8, 8)
841 .
legalFor({{v8s8, v8s16}, {v4s16, v4s32}, {v2s32, v2s64}})
852 return DstTy.
isVector() && SrcTy.getSizeInBits() > 128 &&
855 .clampMinNumElements(0, s8, 8)
860 .legalFor({{v8i8, v8i16}, {v4i16, v4i32}, {v2i32, v2i64}})
861 .clampNumElements(0, v2s32, v2s32);
864 .
legalFor({i32, i64, v8i8, v16i8, v4i16, v8i16, v2i32, v4i32, v2i64})
875 {{f16, f32}, {f16, f64}, {f32, f64}, {v4f16, v4f32}, {v2f32, v2f64}})
876 .legalFor(ST.hasBF16(), {{bf16, f32}, {v4bf16, v4f32}})
877 .libcallFor({{f16, f128}, {f32, f128}, {f64, f128}})
885 .lowerFor({{bf16, f32}, {v4bf16, v4f32}})
887 .clampNumElements(1, v4s32, v4s32)
891 getActionDefinitionsBuilder(G_FPEXT)
899 .libcallFor({{f128, f64}, {f128, f32}, {f128, f16}})
910 .clampNumElements(0, v4s32, v4s32)
915 getActionDefinitionsBuilder({G_FPTOSI, G_FPTOUI})
916 .legalFor({{i32, f32},
924 {{i32, f16}, {i64, f16}, {v4i16, v4f16}, {v8i16, v8f16}})
931 return Query.
Types[1] == f16 && Query.
Types[0].getSizeInBits() > 64;
940 return Query.
Types[0].getScalarSizeInBits() <= 64 &&
941 Query.
Types[0].getScalarSizeInBits() >
942 Query.
Types[1].getScalarSizeInBits();
947 return Query.
Types[1].getScalarSizeInBits() <= 64 &&
948 Query.
Types[0].getScalarSizeInBits() <
949 Query.
Types[1].getScalarSizeInBits();
952 .clampNumElements(0, v4s16, v8s16)
956 {{i32, f128}, {i64, f128}, {i128, f128}, {i128, f32}, {i128, f64}});
958 getActionDefinitionsBuilder({G_FPTOSI_SAT, G_FPTOUI_SAT})
959 .legalFor({{i32, f32},
968 {{i16, f16}, {i32, f16}, {i64, f16}, {v4i16, v4f16}, {v8i16, v8f16}})
976 return Query.
Types[1] == f16 && Query.
Types[0].getSizeInBits() > 64;
986 unsigned ITySize = Query.
Types[0].getScalarSizeInBits();
987 return (ITySize == 16 || ITySize == 32 || ITySize == 64) &&
988 ITySize > Query.
Types[1].getScalarSizeInBits();
993 unsigned FTySize = Query.
Types[1].getScalarSizeInBits();
994 return (FTySize == 16 || FTySize == 32 || FTySize == 64) &&
995 Query.
Types[0].getScalarSizeInBits() < FTySize;
1003 getActionDefinitionsBuilder({G_SITOFP, G_UITOFP})
1004 .legalFor({{f32, i32},
1012 {{f16, i32}, {f16, i64}, {v4f16, v4i16}, {v8f16, v8i16}})
1014 return Query.
Types[0].getScalarType().isBFloat16();
1022 return Query.
Types[1].isVector() &&
1023 Query.
Types[1].getScalarSizeInBits() == 64 &&
1024 Query.
Types[0].getScalarSizeInBits() == 16;
1026 .widenScalarOrEltToNextPow2OrMinSize(0, HasFP16 ? 16 : 32)
1030 return Query.
Types[0].getScalarSizeInBits() == 32 &&
1031 Query.
Types[1].getScalarSizeInBits() == 64;
1036 return Query.
Types[1].getScalarSizeInBits() <= 64 &&
1037 Query.
Types[0].getScalarSizeInBits() <
1038 Query.
Types[1].getScalarSizeInBits();
1043 return Query.
Types[0].getScalarSizeInBits() <= 64 &&
1044 Query.
Types[0].getScalarSizeInBits() >
1045 Query.
Types[1].getScalarSizeInBits();
1048 .clampNumElements(0, v4s16, v8s16)
1060 getActionDefinitionsBuilder(G_BRCOND)
1062 .clampScalar(0, s32, s32);
1063 getActionDefinitionsBuilder(G_BRINDIRECT).
legalFor({p0});
1065 getActionDefinitionsBuilder(G_SELECT)
1066 .
legalFor({{s32, s32}, {s64, s32}, {p0, s32}})
1067 .widenScalarToNextPow2(0)
1075 getActionDefinitionsBuilder(G_FRAME_INDEX).
legalFor({p0});
1078 getActionDefinitionsBuilder(G_GLOBAL_VALUE).
custom();
1080 getActionDefinitionsBuilder(G_GLOBAL_VALUE).
legalFor({p0});
1082 getActionDefinitionsBuilder(G_PTRAUTH_GLOBAL_VALUE)
1085 getActionDefinitionsBuilder(G_PTRTOINT)
1086 .
legalFor({{i64, p0}, {v2i64, v2p0}})
1087 .widenScalarToNextPow2(0, 64)
1091 getActionDefinitionsBuilder(G_INTTOPTR)
1093 return Query.
Types[0].getSizeInBits() != Query.
Types[1].getSizeInBits();
1095 .legalFor({{p0, i64}, {v2p0, v2i64}})
1096 .clampMaxNumElements(1, s64, 2);
1100 getActionDefinitionsBuilder(G_BITCAST)
1103 .legalForCartesianProduct({s32, v2s16, v4s8})
1104 .legalForCartesianProduct({s64, v8s8, v4s16, v2s32})
1105 .legalForCartesianProduct({s128, v16s8, v8s16, v4s32, v2s64, v2p0})
1114 return Query.
Types[0].isVector() != Query.
Types[1].isVector();
1123 getActionDefinitionsBuilder(G_VASTART).
legalFor({p0});
1127 getActionDefinitionsBuilder(G_VAARG)
1129 .clampScalar(0, s8, s64)
1132 getActionDefinitionsBuilder(G_ATOMIC_CMPXCHG_WITH_SUCCESS)
1136 bool UseOutlineAtomics =
ST.outlineAtomics() && !
ST.hasLSE();
1138 getActionDefinitionsBuilder(G_ATOMIC_CMPXCHG)
1139 .legalFor(!UseOutlineAtomics, {{s32, p0}, {s64, p0}})
1140 .customFor(!UseOutlineAtomics, {{s128, p0}})
1141 .libcallFor(UseOutlineAtomics,
1142 {{s8, p0}, {s16, p0}, {s32, p0}, {s64, p0}, {s128, p0}})
1143 .clampScalar(0, s32, s64);
1145 getActionDefinitionsBuilder({G_ATOMICRMW_XCHG, G_ATOMICRMW_ADD,
1146 G_ATOMICRMW_SUB, G_ATOMICRMW_AND, G_ATOMICRMW_OR,
1148 .legalFor(!UseOutlineAtomics, {{s32, p0}, {s64, p0}})
1149 .libcallFor(UseOutlineAtomics,
1150 {{s8, p0}, {s16, p0}, {s32, p0}, {s64, p0}})
1151 .clampScalar(0, s32, s64);
1155 getActionDefinitionsBuilder(
1156 {G_ATOMICRMW_MIN, G_ATOMICRMW_MAX, G_ATOMICRMW_UMIN, G_ATOMICRMW_UMAX})
1158 .clampScalar(0, s32, s64);
1160 getActionDefinitionsBuilder(G_BLOCK_ADDR).legalFor({p0});
1163 for (
unsigned Op : {G_MERGE_VALUES, G_UNMERGE_VALUES}) {
1164 unsigned BigTyIdx =
Op == G_MERGE_VALUES ? 0 : 1;
1165 unsigned LitTyIdx =
Op == G_MERGE_VALUES ? 1 : 0;
1166 getActionDefinitionsBuilder(
Op)
1167 .widenScalarToNextPow2(LitTyIdx, 8)
1168 .widenScalarToNextPow2(BigTyIdx, 32)
1169 .clampScalar(LitTyIdx, s8, s64)
1170 .clampScalar(BigTyIdx, s32, s128)
1172 switch (Q.
Types[BigTyIdx].getSizeInBits()) {
1180 switch (Q.
Types[LitTyIdx].getSizeInBits()) {
1193 getActionDefinitionsBuilder(G_EXTRACT_VECTOR_ELT)
1194 .legalFor(HasSVE, {{s16, nxv16s8, s64},
1195 {s16, nxv8s16, s64},
1196 {s32, nxv4s32, s64},
1197 {s64, nxv2s64, s64}})
1199 const LLT &EltTy = Query.
Types[1].getElementType();
1200 if (Query.
Types[1].isScalableVector())
1202 return Query.
Types[0] != EltTy;
1207 return VecTy == v8s8 || VecTy == v16s8 || VecTy == v2s16 ||
1208 VecTy == v4s16 || VecTy == v8s16 || VecTy == v2s32 ||
1209 VecTy == v4s32 || VecTy == v2s64 || VecTy == v2p0;
1215 return Query.
Types[1].isFixedVector() &&
1216 Query.
Types[1].getNumElements() <= 2;
1221 return Query.
Types[1].isFixedVector() &&
1222 Query.
Types[1].getNumElements() <= 4;
1227 return Query.
Types[1].isFixedVector() &&
1228 Query.
Types[1].getNumElements() <= 8;
1233 return Query.
Types[1].isFixedVector() &&
1234 Query.
Types[1].getNumElements() <= 16;
1237 .minScalarOrElt(0, s8)
1238 .moreElementsToNextPow2(1)
1239 .clampMaxNumElements(1, s64, 2)
1240 .clampMaxNumElements(1, s32, 4)
1241 .clampMaxNumElements(1, s16, 8)
1242 .clampMaxNumElements(1, s8, 16)
1243 .clampMaxNumElements(1, p0, 2)
1246 getActionDefinitionsBuilder(G_INSERT_VECTOR_ELT)
1248 typeInSet(0, {v8s8, v16s8, v4s16, v8s16, v2s32, v4s32, v2s64, v2p0}))
1249 .legalFor(HasSVE, {{nxv16s8, s32, s64},
1250 {nxv8s16, s32, s64},
1251 {nxv4s32, s32, s64},
1252 {nxv2s64, s64, s64}})
1254 .widenVectorEltsToVectorMinSize(0, 64)
1255 .clampNumElements(0, v8s8, v16s8)
1256 .clampNumElements(0, v4s16, v8s16)
1257 .clampNumElements(0, v2s32, v4s32)
1258 .clampMaxNumElements(0, s64, 2)
1259 .clampMaxNumElements(0, p0, 2)
1262 getActionDefinitionsBuilder(G_BUILD_VECTOR)
1263 .legalFor({{v8s8, s8},
1271 .clampNumElements(0, v4s32, v4s32)
1272 .clampNumElements(0, v2s64, v2s64)
1273 .minScalarOrElt(0, s8)
1274 .widenVectorEltsToVectorMinSize(0, 64)
1275 .widenScalarOrEltToNextPow2(0)
1276 .minScalarSameAs(1, 0);
1278 getActionDefinitionsBuilder(G_BUILD_VECTOR_TRUNC).lower();
1280 getActionDefinitionsBuilder(G_SHUFFLE_VECTOR)
1289 {v8s8, v16s8, v4s16, v8s16, v2s32, v4s32, v2s64}, DstTy);
1293 return Query.
Types[0].getNumElements() >
1294 Query.
Types[1].getNumElements();
1300 return Query.
Types[0].getNumElements() <
1301 Query.
Types[1].getNumElements();
1304 .widenScalarOrEltToNextPow2OrMinSize(0, 8)
1305 .clampNumElements(0, v8s8, v16s8)
1306 .clampNumElements(0, v4s16, v8s16)
1307 .clampNumElements(0, v4s32, v4s32)
1308 .clampNumElements(0, v2s64, v2s64)
1317 getActionDefinitionsBuilder(G_CONCAT_VECTORS)
1318 .legalFor({{v16s8, v8s8}, {v8s16, v4s16}, {v4s32, v2s32}})
1320 return Query.
Types[0].isFixedVector() &&
1321 Query.
Types[0].getScalarSizeInBits() < 8;
1325 return Query.
Types[0].isFixedVector() &&
1326 Query.
Types[1].isFixedVector() &&
1327 Query.
Types[0].getScalarSizeInBits() >= 8 &&
1329 Query.
Types[0].getSizeInBits() <= 128 &&
1330 Query.
Types[1].getSizeInBits() <= 64;
1342 getActionDefinitionsBuilder(G_EXTRACT_SUBVECTOR)
1343 .legalFor({{v8s8, v16s8}, {v4s16, v8s16}, {v2s32, v4s32}})
1348 getActionDefinitionsBuilder(G_SPLAT_VECTOR)
1349 .legalFor(HasSVE, {{nxv4s32, s32}, {nxv2s64, s64}});
1351 getActionDefinitionsBuilder(G_JUMP_TABLE).legalFor({p0});
1353 getActionDefinitionsBuilder(G_BRJT).legalFor({{p0, s64}});
1355 getActionDefinitionsBuilder({G_TRAP, G_DEBUGTRAP, G_UBSANTRAP}).alwaysLegal();
1357 getActionDefinitionsBuilder(G_DYN_STACKALLOC).custom();
1359 getActionDefinitionsBuilder({G_STACKSAVE, G_STACKRESTORE}).lower();
1364 getActionDefinitionsBuilder(G_BZERO).unsupported();
1366 getActionDefinitionsBuilder(G_MEMSET)
1367 .legalForCartesianProduct({p0}, {s64}, {s64})
1368 .customForCartesianProduct({p0}, {s8}, {s64})
1371 getActionDefinitionsBuilder({G_MEMCPY, G_MEMMOVE})
1372 .legalForCartesianProduct({p0}, {p0}, {s64})
1376 getActionDefinitionsBuilder(G_MEMCPY_INLINE)
1377 .legalForCartesianProduct({p0}, {p0}, {s64});
1379 getActionDefinitionsBuilder(G_MEMSET_INLINE)
1380 .legalForCartesianProduct({p0}, {s64}, {s64})
1381 .customForCartesianProduct({p0}, {s8}, {s64});
1383 getActionDefinitionsBuilder({G_BZERO, G_MEMCPY, G_MEMMOVE, G_MEMSET})
1390 getActionDefinitionsBuilder(G_VECREDUCE_FADD)
1391 .legalFor({{f32, v2f32}, {f32, v4f32}, {f64, v2f64}})
1392 .legalFor(HasFP16, {{f16, v4f16}, {f16, v8f16}})
1393 .minScalarOrElt(0, MinFPScalar)
1394 .clampMaxNumElements(1, s64, 2)
1395 .clampMaxNumElements(1, s32, 4)
1396 .clampMaxNumElements(1, s16, 8)
1397 .moreElementsToNextPow2(1)
1404 getActionDefinitionsBuilder(G_VECREDUCE_FMUL)
1405 .minScalarOrElt(0, MinFPScalar)
1406 .clampMaxNumElements(1, s64, 2)
1407 .clampMaxNumElements(1, s32, 4)
1408 .clampMaxNumElements(1, s16, 8)
1409 .clampMaxNumElements(1, s32, 2)
1410 .clampMaxNumElements(1, s16, 4)
1414 getActionDefinitionsBuilder({G_VECREDUCE_SEQ_FADD, G_VECREDUCE_SEQ_FMUL})
1418 getActionDefinitionsBuilder(G_VECREDUCE_ADD)
1419 .legalFor({{i8, v8i8},
1427 .clampMaxNumElements(1, s64, 2)
1428 .clampMaxNumElements(1, s32, 4)
1429 .clampMaxNumElements(1, s16, 8)
1430 .clampMaxNumElements(1, s8, 16)
1431 .widenVectorEltsToVectorMinSize(1, 64)
1434 getActionDefinitionsBuilder({G_VECREDUCE_FMIN, G_VECREDUCE_FMAX,
1435 G_VECREDUCE_FMINIMUM, G_VECREDUCE_FMAXIMUM})
1436 .legalFor({{f32, v2f32}, {f32, v4f32}, {f64, v2f64}})
1437 .legalFor(HasFP16, {{f16, v4f16}, {f16, v8f16}})
1438 .minScalarOrElt(0, MinFPScalar)
1439 .clampMaxNumElements(1, s64, 2)
1440 .clampMaxNumElements(1, s32, 4)
1441 .clampMaxNumElements(1, s16, 8)
1445 getActionDefinitionsBuilder(G_VECREDUCE_MUL)
1446 .clampMaxNumElements(1, s32, 2)
1447 .clampMaxNumElements(1, s16, 4)
1448 .clampMaxNumElements(1, s8, 8)
1452 getActionDefinitionsBuilder(
1453 {G_VECREDUCE_SMIN, G_VECREDUCE_SMAX, G_VECREDUCE_UMIN, G_VECREDUCE_UMAX})
1454 .legalFor({{i8, v8i8},
1462 return Query.
Types[1].isVector() &&
1463 Query.
Types[1].getElementType() != s8 &&
1464 Query.
Types[1].getNumElements() & 1;
1467 .clampMaxNumElements(1, s64, 2)
1468 .clampMaxNumElements(1, s32, 4)
1469 .clampMaxNumElements(1, s16, 8)
1470 .clampMaxNumElements(1, s8, 16)
1474 getActionDefinitionsBuilder(
1475 {G_VECREDUCE_OR, G_VECREDUCE_AND, G_VECREDUCE_XOR})
1491 return std::make_pair(1, SrcTy.
divide(2));
1497 getActionDefinitionsBuilder(G_VECTOR_COMPRESS).lower();
1500 getActionDefinitionsBuilder({G_GET_FPENV, G_SET_FPENV, G_RESET_FPENV,
1501 G_GET_FPMODE, G_SET_FPMODE, G_RESET_FPMODE})
1504 getActionDefinitionsBuilder(G_IS_FPCLASS).lower();
1506 getActionDefinitionsBuilder(G_PREFETCH).custom();
1508 getActionDefinitionsBuilder({G_SCMP, G_UCMP}).lower();
1510 getActionDefinitionsBuilder({G_INTRINSIC, G_INTRINSIC_W_SIDE_EFFECTS})
1512 getActionDefinitionsBuilder(G_FENCE).alwaysLegal();
1513 getActionDefinitionsBuilder(G_INVOKE_REGION_START).alwaysLegal();
1515 getLegacyLegalizerInfo().computeTables();
1762 auto LowerUnaryOp = [&
MI, &MIB](
unsigned Opcode) {
1764 MI.eraseFromParent();
1767 auto LowerBinOp = [&
MI, &MIB](
unsigned Opcode) {
1769 {
MI.getOperand(2),
MI.getOperand(3)});
1770 MI.eraseFromParent();
1773 auto LowerTriOp = [&
MI, &MIB](
unsigned Opcode) {
1775 {
MI.getOperand(2),
MI.getOperand(3),
MI.getOperand(4)});
1776 MI.eraseFromParent();
1781 switch (IntrinsicID) {
1782 case Intrinsic::vacopy: {
1783 unsigned PtrSize = ST->isTargetILP32() ? 4 : 8;
1784 unsigned VaListSize =
1785 (ST->isTargetDarwin() || ST->isTargetWindows())
1787 : ST->isTargetILP32() ? 20 : 32;
1795 VaListSize,
Align(PtrSize)));
1799 VaListSize,
Align(PtrSize)));
1800 MI.eraseFromParent();
1803 case Intrinsic::get_dynamic_area_offset: {
1805 MI.eraseFromParent();
1808 case Intrinsic::aarch64_mops_memset_tag: {
1809 assert(
MI.getOpcode() == TargetOpcode::G_INTRINSIC_W_SIDE_EFFECTS);
1812 auto &
Value =
MI.getOperand(3);
1814 Value.setReg(ExtValueReg);
1817 case Intrinsic::aarch64_prefetch: {
1818 auto &AddrVal =
MI.getOperand(1);
1820 int64_t IsWrite =
MI.getOperand(2).getImm();
1821 int64_t
Target =
MI.getOperand(3).getImm();
1822 int64_t IsStream =
MI.getOperand(4).getImm();
1823 int64_t IsData =
MI.getOperand(5).getImm();
1825 unsigned PrfOp = (IsWrite << 4) |
1831 MI.eraseFromParent();
1834 case Intrinsic::aarch64_range_prefetch: {
1835 auto &AddrVal =
MI.getOperand(1);
1837 int64_t IsWrite =
MI.getOperand(2).getImm();
1838 int64_t IsStream =
MI.getOperand(3).getImm();
1839 unsigned PrfOp = (IsStream << 2) | IsWrite;
1841 MIB.
buildInstr(AArch64::G_AARCH64_RANGE_PREFETCH)
1844 .
addUse(
MI.getOperand(4).getReg());
1845 MI.eraseFromParent();
1848 case Intrinsic::aarch64_prefetch_ir: {
1849 auto &AddrVal =
MI.getOperand(1);
1851 MI.eraseFromParent();
1854 case Intrinsic::aarch64_neon_uaddv:
1855 case Intrinsic::aarch64_neon_saddv:
1856 case Intrinsic::aarch64_neon_umaxv:
1857 case Intrinsic::aarch64_neon_smaxv:
1858 case Intrinsic::aarch64_neon_uminv:
1859 case Intrinsic::aarch64_neon_sminv: {
1860 bool IsSigned = IntrinsicID == Intrinsic::aarch64_neon_saddv ||
1861 IntrinsicID == Intrinsic::aarch64_neon_smaxv ||
1862 IntrinsicID == Intrinsic::aarch64_neon_sminv;
1864 auto OldDst =
MI.getOperand(0).getReg();
1865 auto OldDstTy = MRI.
getType(OldDst);
1867 if (OldDstTy == NewDstTy)
1873 MI.getOperand(0).setReg(NewDst);
1877 MIB.
buildExtOrTrunc(IsSigned ? TargetOpcode::G_SEXT : TargetOpcode::G_ZEXT,
1882 case Intrinsic::aarch64_neon_uaddlp:
1883 case Intrinsic::aarch64_neon_saddlp: {
1884 unsigned Opc = IntrinsicID == Intrinsic::aarch64_neon_uaddlp
1886 : AArch64::G_SADDLP;
1888 MI.eraseFromParent();
1892 case Intrinsic::aarch64_neon_uaddlv:
1893 case Intrinsic::aarch64_neon_saddlv: {
1894 unsigned Opc = IntrinsicID == Intrinsic::aarch64_neon_uaddlv
1896 : AArch64::G_SADDLV;
1923 MI.eraseFromParent();
1927 case Intrinsic::aarch64_neon_smax:
1928 return LowerBinOp(TargetOpcode::G_SMAX);
1929 case Intrinsic::aarch64_neon_smin:
1930 return LowerBinOp(TargetOpcode::G_SMIN);
1931 case Intrinsic::aarch64_neon_umax:
1932 return LowerBinOp(TargetOpcode::G_UMAX);
1933 case Intrinsic::aarch64_neon_umin:
1934 return LowerBinOp(TargetOpcode::G_UMIN);
1935 case Intrinsic::aarch64_neon_fmax:
1936 return LowerBinOp(TargetOpcode::G_FMAXIMUM);
1937 case Intrinsic::aarch64_neon_fmin:
1938 return LowerBinOp(TargetOpcode::G_FMINIMUM);
1939 case Intrinsic::aarch64_neon_fmaxnm:
1940 return LowerBinOp(TargetOpcode::G_FMAXNUM);
1941 case Intrinsic::aarch64_neon_fminnm:
1942 return LowerBinOp(TargetOpcode::G_FMINNUM);
1943 case Intrinsic::aarch64_neon_pmul:
1944 return LowerBinOp(TargetOpcode::G_CLMUL);
1945 case Intrinsic::aarch64_neon_pmull:
1946 case Intrinsic::aarch64_neon_pmull64:
1947 return LowerBinOp(AArch64::G_PMULL);
1948 case Intrinsic::aarch64_neon_smull:
1949 return LowerBinOp(AArch64::G_SMULL);
1950 case Intrinsic::aarch64_neon_umull:
1951 return LowerBinOp(AArch64::G_UMULL);
1952 case Intrinsic::aarch64_neon_sabd:
1953 return LowerBinOp(TargetOpcode::G_ABDS);
1954 case Intrinsic::aarch64_neon_uabd:
1955 return LowerBinOp(TargetOpcode::G_ABDU);
1956 case Intrinsic::aarch64_neon_uhadd:
1957 return LowerBinOp(TargetOpcode::G_UAVGFLOOR);
1958 case Intrinsic::aarch64_neon_urhadd:
1959 return LowerBinOp(TargetOpcode::G_UAVGCEIL);
1960 case Intrinsic::aarch64_neon_shadd:
1961 return LowerBinOp(TargetOpcode::G_SAVGFLOOR);
1962 case Intrinsic::aarch64_neon_srhadd:
1963 return LowerBinOp(TargetOpcode::G_SAVGCEIL);
1964 case Intrinsic::aarch64_neon_sqshrn: {
1969 {MRI.
getType(
MI.getOperand(2).getReg())},
1970 {
MI.getOperand(2),
MI.getOperand(3).getImm()});
1972 MIB.
buildInstr(TargetOpcode::G_TRUNC_SSAT_S, {
MI.getOperand(0)}, {Shr});
1973 MI.eraseFromParent();
1976 case Intrinsic::aarch64_neon_sqshrun: {
1981 {MRI.
getType(
MI.getOperand(2).getReg())},
1982 {
MI.getOperand(2),
MI.getOperand(3).getImm()});
1984 MIB.
buildInstr(TargetOpcode::G_TRUNC_SSAT_U, {
MI.getOperand(0)}, {Shr});
1985 MI.eraseFromParent();
1988 case Intrinsic::aarch64_neon_sqrshrn: {
1992 auto Shr = MIB.
buildInstr(AArch64::G_SRSHR_I,
1993 {MRI.
getType(
MI.getOperand(2).getReg())},
1994 {
MI.getOperand(2),
MI.getOperand(3).getImm()});
1996 MIB.
buildInstr(TargetOpcode::G_TRUNC_SSAT_S, {
MI.getOperand(0)}, {Shr});
1997 MI.eraseFromParent();
2000 case Intrinsic::aarch64_neon_sqrshrun: {
2004 auto Shr = MIB.
buildInstr(AArch64::G_SRSHR_I,
2005 {MRI.
getType(
MI.getOperand(2).getReg())},
2006 {
MI.getOperand(2),
MI.getOperand(3).getImm()});
2008 MIB.
buildInstr(TargetOpcode::G_TRUNC_SSAT_U, {
MI.getOperand(0)}, {Shr});
2009 MI.eraseFromParent();
2012 case Intrinsic::aarch64_neon_uqrshrn: {
2016 auto Shr = MIB.
buildInstr(AArch64::G_URSHR_I,
2017 {MRI.
getType(
MI.getOperand(2).getReg())},
2018 {
MI.getOperand(2),
MI.getOperand(3).getImm()});
2020 MIB.
buildInstr(TargetOpcode::G_TRUNC_USAT_U, {
MI.getOperand(0)}, {Shr});
2021 MI.eraseFromParent();
2024 case Intrinsic::aarch64_neon_uqshrn: {
2029 {MRI.
getType(
MI.getOperand(2).getReg())},
2030 {
MI.getOperand(2),
MI.getOperand(3).getImm()});
2032 MIB.
buildInstr(TargetOpcode::G_TRUNC_USAT_U, {
MI.getOperand(0)}, {Shr});
2033 MI.eraseFromParent();
2036 case Intrinsic::aarch64_neon_sqshlu: {
2042 MIB.
buildInstr(AArch64::G_SQSHLU_I, {
MI.getOperand(0)},
2044 .addImm(ShiftAmount->getSExtValue());
2045 MI.eraseFromParent();
2050 case Intrinsic::aarch64_neon_vsli: {
2052 AArch64::G_SLI, {
MI.getOperand(0)},
2053 {
MI.getOperand(2),
MI.getOperand(3),
MI.getOperand(4).getImm()});
2054 MI.eraseFromParent();
2057 case Intrinsic::aarch64_neon_vsri: {
2059 AArch64::G_SRI, {
MI.getOperand(0)},
2060 {
MI.getOperand(2),
MI.getOperand(3),
MI.getOperand(4).getImm()});
2061 MI.eraseFromParent();
2064 case Intrinsic::aarch64_neon_abs: {
2066 MIB.
buildInstr(TargetOpcode::G_ABS, {
MI.getOperand(0)}, {
MI.getOperand(2)});
2067 MI.eraseFromParent();
2070 case Intrinsic::aarch64_neon_sqadd: {
2072 return LowerBinOp(TargetOpcode::G_SADDSAT);
2075 case Intrinsic::aarch64_neon_sqsub: {
2077 return LowerBinOp(TargetOpcode::G_SSUBSAT);
2080 case Intrinsic::aarch64_neon_uqadd: {
2082 return LowerBinOp(TargetOpcode::G_UADDSAT);
2085 case Intrinsic::aarch64_neon_uqsub: {
2087 return LowerBinOp(TargetOpcode::G_USUBSAT);
2090 case Intrinsic::aarch64_neon_udot:
2091 return LowerTriOp(AArch64::G_UDOT);
2092 case Intrinsic::aarch64_neon_sdot:
2093 return LowerTriOp(AArch64::G_SDOT);
2094 case Intrinsic::aarch64_neon_usdot:
2095 return LowerTriOp(AArch64::G_USDOT);
2096 case Intrinsic::aarch64_neon_sqxtn:
2097 return LowerUnaryOp(TargetOpcode::G_TRUNC_SSAT_S);
2098 case Intrinsic::aarch64_neon_sqxtun:
2099 return LowerUnaryOp(TargetOpcode::G_TRUNC_SSAT_U);
2100 case Intrinsic::aarch64_neon_uqxtn:
2101 return LowerUnaryOp(TargetOpcode::G_TRUNC_USAT_U);
2102 case Intrinsic::aarch64_neon_fcvtzu:
2103 return LowerUnaryOp(TargetOpcode::G_FPTOUI_SAT);
2104 case Intrinsic::aarch64_neon_fcvtzs:
2105 return LowerUnaryOp(TargetOpcode::G_FPTOSI_SAT);
2106 case Intrinsic::aarch64_neon_cls:
2107 return LowerUnaryOp(TargetOpcode::G_CTLS);
2109 case Intrinsic::vector_reverse: