Skip to content

Commit cb6e6b5

Browse files
committed
Add SME2 builtins for pfalse and ptrue
Extend pfalse and ptrue builtins with svcount_t return types to be enabled for sve2p1 and sme2
1 parent 9db3b8d commit cb6e6b5

File tree

3 files changed

+41
-19
lines changed

3 files changed

+41
-19
lines changed

clang/include/clang/Basic/arm_sve.td

Lines changed: 5 additions & 18 deletions
Original file line numberDiff line numberDiff line change
@@ -1925,8 +1925,6 @@ def SVBGRP_N : SInst<"svbgrp[_n_{d}]", "dda", "UcUsUiUl", MergeNone, "aarch64_sv
19251925

19261926
let TargetGuard = "sve2p1" in {
19271927
def SVFCLAMP : SInst<"svclamp[_{d}]", "dddd", "hfd", MergeNone, "aarch64_sve_fclamp", [], []>;
1928-
def SVPTRUE_COUNT : SInst<"svptrue_{d}", "}v", "QcQsQiQl", MergeNone, "aarch64_sve_ptrue_{d}", [IsOverloadNone], []>;
1929-
def SVPFALSE_COUNT_ALIAS : SInst<"svpfalse_c", "}v", "", MergeNone, "", [IsOverloadNone]>;
19301928

19311929
def SVPEXT_SINGLE : SInst<"svpext_lane_{d}", "P}i", "QcQsQiQl", MergeNone, "aarch64_sve_pext", [], [ImmCheck<1, ImmCheck0_3>]>;
19321930
def SVPEXT_X2 : SInst<"svpext_lane_{d}_x2", "2.P}i", "QcQsQiQl", MergeNone, "aarch64_sve_pext_x2", [], [ImmCheck<1, ImmCheck0_1>]>;
@@ -2045,23 +2043,12 @@ def SVCNTP_COUNT : SInst<"svcntp_{d}", "n}i", "QcQsQiQl", MergeNone, "aarch64_sv
20452043
defm SVREVD : SInstZPZ<"svrevd", "csilUcUsUiUl", "aarch64_sve_revd">;
20462044
}
20472045

2046+
let TargetGuard = "sve2p1|sme2" in {
2047+
def SVPTRUE_COUNT : SInst<"svptrue_{d}", "}v", "QcQsQiQl", MergeNone, "aarch64_sve_ptrue_{d}", [IsOverloadNone], []>;
2048+
def SVPFALSE_COUNT_ALIAS : SInst<"svpfalse_c", "}v", "", MergeNone, "", [IsOverloadNone]>;
2049+
}
20482050

2049-
let TargetGuard = "sve2p1,b16b16" in {
2050-
defm SVMUL_BF : SInstZPZZ<"svmul", "b", "aarch64_sve_fmul", "aarch64_sve_fmul_u">;
2051-
defm SVADD_BF : SInstZPZZ<"svadd", "b", "aarch64_sve_fadd", "aarch64_sve_fadd_u">;
2052-
defm SVSUB_BF : SInstZPZZ<"svsub", "b", "aarch64_sve_fsub", "aarch64_sve_fsub_u">;
2053-
defm SVMAXNM_BF : SInstZPZZ<"svmaxnm","b", "aarch64_sve_fmaxnm", "aarch64_sve_fmaxnm_u">;
2054-
defm SVMINNM_BF : SInstZPZZ<"svminnm","b", "aarch64_sve_fminnm", "aarch64_sve_fminnm_u">;
2055-
defm SVMAX_BF : SInstZPZZ<"svmax", "b", "aarch64_sve_fmax", "aarch64_sve_fmax_u">;
2056-
defm SVMIN_BF : SInstZPZZ<"svmin", "b", "aarch64_sve_fmin", "aarch64_sve_fmin_u">;
2057-
defm SVMLA_BF : SInstZPZZZ<"svmla", "b", "aarch64_sve_fmla", "aarch64_sve_fmla_u", []>;
2058-
defm SVMLS_BF : SInstZPZZZ<"svmls", "b", "aarch64_sve_fmls", "aarch64_sve_fmls_u", []>;
2059-
def SVMLA_LANE_BF : SInst<"svmla_lane[_{d}]", "ddddi", "b", MergeNone, "aarch64_sve_fmla_lane", [], [ImmCheck<3, ImmCheckLaneIndex, 2>]>;
2060-
def SVMLS_LANE_BF : SInst<"svmls_lane[_{d}]", "ddddi", "b", MergeNone, "aarch64_sve_fmls_lane", [], [ImmCheck<3, ImmCheckLaneIndex, 2>]>;
2061-
def SVMUL_LANE_BF : SInst<"svmul_lane[_{d}]", "dddi", "b", MergeNone, "aarch64_sve_fmul_lane", [], [ImmCheck<2, ImmCheckLaneIndex, 1>]>;
2062-
def SVFCLAMP_BF : SInst<"svclamp[_{d}]", "dddd", "b", MergeNone, "aarch64_sve_fclamp", [], []>;
2063-
} //sve2p1,b16b16
2064-
2051+
////////////////////////////////////////////////////////////////////////////////
20652052
// SME2
20662053

20672054
// SME intrinsics which operate only on vectors and do not require ZA should be added here,

clang/lib/Sema/Sema.cpp

Lines changed: 2 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -2085,7 +2085,8 @@ void Sema::checkTypeSupport(QualType Ty, SourceLocation Loc, ValueDecl *D) {
20852085
llvm::StringMap<bool> CallerFeatureMap;
20862086
Context.getFunctionFeatureMap(CallerFeatureMap, FD);
20872087
if (!Builtin::evaluateRequiredTargetFeatures(
2088-
"sve", CallerFeatureMap))
2088+
"sve", CallerFeatureMap) && !Builtin::evaluateRequiredTargetFeatures(
2089+
"sme", CallerFeatureMap))
20892090
Diag(D->getLocation(), diag::err_sve_vector_in_non_sve_target) << Ty;
20902091
}
20912092
};
Lines changed: 34 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,34 @@
1+
// NOTE: Assertions have been autogenerated by utils/update_cc_test_checks.py
2+
// REQUIRES: aarch64-registered-target
3+
// RUN: %clang_cc1 -triple aarch64-none-linux-gnu -target-feature +sme2 -S -disable-O0-optnone -Werror -Wall -emit-llvm -o - %s | FileCheck %s
4+
// RUN: %clang_cc1 -triple aarch64-none-linux-gnu -target-feature +sme2 -S -disable-O0-optnone -Werror -Wall -emit-llvm -o - -x c++ %s | FileCheck %s -check-prefix=CPP-CHECK
5+
// RUN: %clang_cc1 -triple aarch64-none-linux-gnu -target-feature +sme2 -S -disable-O0-optnone -Werror -Wall -o /dev/null %s
6+
#include <arm_sve.h>
7+
8+
// CHECK-LABEL: @test_svptrue_c8_attr(
9+
// CHECK-NEXT: entry:
10+
// CHECK-NEXT: [[TMP0:%.*]] = call target("aarch64.svcount") @llvm.aarch64.sve.ptrue.c8()
11+
// CHECK-NEXT: ret target("aarch64.svcount") [[TMP0]]
12+
//
13+
// CPP-CHECK-LABEL: @_Z20test_svptrue_c8_attrv(
14+
// CPP-CHECK-NEXT: entry:
15+
// CPP-CHECK-NEXT: [[TMP0:%.*]] = call target("aarch64.svcount") @llvm.aarch64.sve.ptrue.c8()
16+
// CPP-CHECK-NEXT: ret target("aarch64.svcount") [[TMP0]]
17+
//
18+
svcount_t test_svptrue_c8_attr(void) __arm_streaming {
19+
return svptrue_c8();
20+
}
21+
22+
// CHECK-LABEL: @test_svptrue_c(
23+
// CHECK-NEXT: entry:
24+
// CHECK-NEXT: [[TMP0:%.*]] = call target("aarch64.svcount") @llvm.aarch64.sve.convert.from.svbool.taarch64.svcountt(<vscale x 16 x i1> zeroinitializer)
25+
// CHECK-NEXT: ret target("aarch64.svcount") [[TMP0]]
26+
//
27+
// CPP-CHECK-LABEL: @_Z14test_svptrue_cv(
28+
// CPP-CHECK-NEXT: entry:
29+
// CPP-CHECK-NEXT: [[TMP0:%.*]] = call target("aarch64.svcount") @llvm.aarch64.sve.convert.from.svbool.taarch64.svcountt(<vscale x 16 x i1> zeroinitializer)
30+
// CPP-CHECK-NEXT: ret target("aarch64.svcount") [[TMP0]]
31+
//
32+
svcount_t test_svptrue_c(void) __arm_streaming {
33+
return svpfalse_c();
34+
}

0 commit comments

Comments
 (0)