@@ -2983,13 +2983,6 @@ let TargetPrefix = "aarch64" in {
2983
2983
LLVMMatchType<0>,
2984
2984
llvm_anyvector_ty], [ImmArg<ArgIndex<0>>]>;
2985
2985
2986
- class SME_FP8_OuterProduct_Intrinsic
2987
- : DefaultAttrsIntrinsic<[],
2988
- [llvm_i32_ty,
2989
- llvm_nxv16i1_ty, llvm_nxv16i1_ty,
2990
- llvm_nxv16i8_ty, llvm_nxv16i8_ty],
2991
- [ImmArg<ArgIndex<0>>, IntrInaccessibleMemOnly, IntrHasSideEffects]>;
2992
-
2993
2986
def int_aarch64_sme_mopa : SME_OuterProduct_Intrinsic;
2994
2987
def int_aarch64_sme_mops : SME_OuterProduct_Intrinsic;
2995
2988
@@ -3005,10 +2998,6 @@ let TargetPrefix = "aarch64" in {
3005
2998
def int_aarch64_sme_usmopa_wide : SME_OuterProduct_Intrinsic;
3006
2999
def int_aarch64_sme_usmops_wide : SME_OuterProduct_Intrinsic;
3007
3000
3008
- // FP8 outer product
3009
- def int_aarch64_sme_fp8_fmopa_za16 : SME_FP8_OuterProduct_Intrinsic;
3010
- def int_aarch64_sme_fp8_fmopa_za32 : SME_FP8_OuterProduct_Intrinsic;
3011
-
3012
3001
class SME_AddVectorToTile_Intrinsic
3013
3002
: DefaultAttrsIntrinsic<[],
3014
3003
[llvm_i32_ty,
@@ -3875,6 +3864,13 @@ let TargetPrefix = "aarch64" in {
3875
3864
: DefaultAttrsIntrinsic<[llvm_anyvector_ty, LLVMMatchType<0>],
3876
3865
[llvm_nxv16i8_ty],
3877
3866
[IntrReadMem, IntrInaccessibleMemOnly]>;
3867
+
3868
+ class SME_FP8_OuterProduct_Intrinsic // Shared signature of the int_aarch64_sme_fp8_fmopa_za16 / _za32 intrinsics.
3869
+ : DefaultAttrsIntrinsic<[], // Empty result list: the intrinsic returns no value.
3870
+ [llvm_i32_ty, // Arg 0: i32, must be an immediate (ImmArg below). NOTE(review): presumably the ZA tile index -- confirm.
3871
+ llvm_nxv16i1_ty, llvm_nxv16i1_ty, // Args 1-2: nxv16i1. NOTE(review): presumably the two governing predicates -- confirm.
3872
+ llvm_nxv16i8_ty, llvm_nxv16i8_ty], // Args 3-4: nxv16i8. NOTE(review): presumably the two FP8 source vectors -- confirm.
3873
+ [ImmArg<ArgIndex<0>>, IntrInaccessibleMemOnly, IntrHasSideEffects]>; // Arg 0 is an immediate; touches only inaccessible memory; marked as having side effects.
3878
3874
//
3879
3875
// CVT from FP8 to half-precision/BFloat16 multi-vector
3880
3876
//
@@ -3886,4 +3882,8 @@ let TargetPrefix = "aarch64" in {
3886
3882
//
3887
3883
def int_aarch64_sve_fp8_cvtl1_x2 : SME2_FP8_CVT_X2_Single_Intrinsic;
3888
3884
def int_aarch64_sve_fp8_cvtl2_x2 : SME2_FP8_CVT_X2_Single_Intrinsic;
3885
+
3886
+ // FP8 outer product intrinsics; both take the SME_FP8_OuterProduct_Intrinsic signature (no result, immediate i32 first operand).
3887
+ def int_aarch64_sme_fp8_fmopa_za16 : SME_FP8_OuterProduct_Intrinsic; // NOTE(review): "za16" presumably means 16-bit ZA accumulator elements -- confirm.
3888
+ def int_aarch64_sme_fp8_fmopa_za32 : SME_FP8_OuterProduct_Intrinsic; // NOTE(review): "za32" presumably means 32-bit ZA accumulator elements -- confirm.
3889
3889
}
0 commit comments