Skip to content

Commit fb60cf1

Browse files
committed
Add isNeonAvailable test
1 parent 114dda0 commit fb60cf1

File tree

2 files changed

+27
-1
lines changed

2 files changed

+27
-1
lines changed

llvm/lib/Target/AArch64/AArch64.td

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -509,7 +509,7 @@ def FeatureSMEF16F16 : SubtargetFeature<"sme-f16f16", "HasSMEF16F16", "true",
509509
"Enable SME2.1 non-widening Float16 instructions (FEAT_SME_F16F16)", []>;
510510

511511
def FeatureSMEFA64 : SubtargetFeature<"sme-fa64", "HasSMEFA64", "true",
512-
"Enable the full A64 instruction set in SVE streaming mode (FEAT_SME_FA64)", []>;
512+
"Enable the full A64 instruction set in streaming SVE mode (FEAT_SME_FA64)", []>;
513513

514514
def FeatureSME2 : SubtargetFeature<"sme2", "HasSME2", "true",
515515
"Enable Scalable Matrix Extension 2 (SME2) instructions", [FeatureSME]>;
Lines changed: 26 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,26 @@
1+
; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
2+
; RUN: llc -mattr=+sve -mattr=+sme-fa64 -force-streaming-compatible-sve < %s | FileCheck %s -check-prefix=FA64
3+
; RUN: llc -mattr=+sve -force-streaming-compatible-sve < %s | FileCheck %s -check-prefix=NO-FA64
4+
5+
target triple = "aarch64-unknown-linux-gnu"
6+
7+
define <8 x i8> @mla8xi8(<8 x i8> %A, <8 x i8> %B, <8 x i8> %C) {
8+
; FA64-LABEL: mla8xi8:
9+
; FA64: // %bb.0:
10+
; FA64-NEXT: mla v2.8b, v0.8b, v1.8b
11+
; FA64-NEXT: fmov d0, d2
12+
; FA64-NEXT: ret
13+
;
14+
; NO-FA64-LABEL: mla8xi8:
15+
; NO-FA64: // %bb.0:
16+
; NO-FA64-NEXT: ptrue p0.b, vl8
17+
; NO-FA64-NEXT: // kill: def $d0 killed $d0 def $z0
18+
; NO-FA64-NEXT: // kill: def $d2 killed $d2 def $z2
19+
; NO-FA64-NEXT: // kill: def $d1 killed $d1 def $z1
20+
; NO-FA64-NEXT: mad z0.b, p0/m, z1.b, z2.b
21+
; NO-FA64-NEXT: // kill: def $d0 killed $d0 killed $z0
22+
; NO-FA64-NEXT: ret
23+
%tmp1 = mul <8 x i8> %A, %B;
24+
%tmp2 = add <8 x i8> %C, %tmp1;
25+
ret <8 x i8> %tmp2
26+
}

0 commit comments

Comments
 (0)