Skip to content

Commit 1fe096e

Browse files
committed
[AArch64][SVE2] Add the SVE2.1 signed and unsigned 2-way dot instructions
This patch adds the assembly/disassembly for the following instructions: SDOT : Signed integer 2-way dot product indexed and non-indexed UDOT : Unsigned integer 2-way dot product, indexed and non-indexed The reference can be found here: https://developer.arm.com/documentation/ddi0602/2022-09 Differential Revision: https://reviews.llvm.org/D136464
1 parent 3d9bf8c commit 1fe096e

File tree

8 files changed

+284
-4
lines changed

8 files changed

+284
-4
lines changed

llvm/lib/Target/AArch64/AArch64SVEInstrInfo.td

Lines changed: 5 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -3581,4 +3581,9 @@ def BFMLSLB_ZZZ_S : sve_bfloat_matmul_longvecl<0b0, 0b1, "bfmlslb">;
35813581
def BFMLSLT_ZZZ_S : sve_bfloat_matmul_longvecl<0b1, 0b1, "bfmlslt">;
35823582
def BFMLSLB_ZZZI_S : sve_bfloat_matmul_longvecl_idx<0b0, 0b1, "bfmlslb">;
35833583
def BFMLSLT_ZZZI_S : sve_bfloat_matmul_longvecl_idx<0b1, 0b1, "bfmlslt">;
3584+
3585+
def SDOT_ZZZ_HtoS : sve2p1_two_way_dot_vv<"sdot", 0b0>;
3586+
def UDOT_ZZZ_HtoS : sve2p1_two_way_dot_vv<"udot", 0b1>;
3587+
def SDOT_ZZZI_HtoS : sve2p1_two_way_dot_vvi<"sdot", 0b0>;
3588+
def UDOT_ZZZI_HtoS : sve2p1_two_way_dot_vvi<"udot", 0b1>;
35843589
} // End HasSVE2p1_or_HasSME2

llvm/lib/Target/AArch64/SVEInstrFormats.td

Lines changed: 41 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -8654,3 +8654,44 @@ multiclass sve2p1_fclamp<string asm> {
86548654
def _S : sve2p1_fclamp<asm, 0b10, ZPR32>;
86558655
def _D : sve2p1_fclamp<asm, 0b11, ZPR64>;
86568656
}
8657+
8658+
// SVE two-way dot product
8659+
class sve2p1_two_way_dot_vv<string mnemonic, bit u>
8660+
: I<(outs ZPR32:$Zda), (ins ZPR32:$_Zda, ZPR16:$Zn, ZPR16:$Zm),
8661+
mnemonic, "\t$Zda, $Zn, $Zm",
8662+
"", []>, Sched<[]> {
8663+
bits<5> Zda;
8664+
bits<5> Zn;
8665+
bits<5> Zm;
8666+
let Inst{31-21} = 0b01000100000;
8667+
let Inst{20-16} = Zm;
8668+
let Inst{15-11} = 0b11001;
8669+
let Inst{10} = u;
8670+
let Inst{9-5} = Zn;
8671+
let Inst{4-0} = Zda;
8672+
8673+
let Constraints = "$Zda = $_Zda";
8674+
let DestructiveInstType = DestructiveOther;
8675+
}
8676+
8677+
8678+
// SVE two-way dot product (indexed)
8679+
class sve2p1_two_way_dot_vvi<string mnemonic, bit u>
8680+
: I<(outs ZPR32:$Zda), (ins ZPR32:$_Zda, ZPR16:$Zn, ZPR3b16:$Zm, VectorIndexS:$i2),
8681+
mnemonic, "\t$Zda, $Zn, $Zm$i2",
8682+
"", []>, Sched<[]> {
8683+
bits<5> Zda;
8684+
bits<5> Zn;
8685+
bits<3> Zm;
8686+
bits<2> i2;
8687+
let Inst{31-21} = 0b01000100100;
8688+
let Inst{20-19} = i2;
8689+
let Inst{18-16} = Zm;
8690+
let Inst{15-11} = 0b11001;
8691+
let Inst{10} = u;
8692+
let Inst{9-5} = Zn;
8693+
let Inst{4-0} = Zda;
8694+
8695+
let Constraints = "$Zda = $_Zda";
8696+
let DestructiveInstType = DestructiveOther;
8697+
}

llvm/test/MC/AArch64/SVE/sdot-diagnostics.s

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -4,9 +4,9 @@
44
// ------------------------------------------------------------------------- //
55
// Invalid element size
66

7-
sdot z0.s, z1.h, z31.h
7+
sdot z0.b, z1.h, z31.h
88
// CHECK: [[@LINE-1]]:{{[0-9]+}}: error: invalid element width
9-
// CHECK-NEXT: sdot z0.s, z1.h, z31.h
9+
// CHECK-NEXT: sdot z0.b, z1.h, z31.h
1010
// CHECK-NOT: [[@LINE-1]]:{{[0-9]+}}:
1111

1212
sdot z0.d, z1.b, z31.b

llvm/test/MC/AArch64/SVE/udot-diagnostics.s

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -4,9 +4,9 @@
44
// ------------------------------------------------------------------------- //
55
// Invalid element size
66

7-
udot z0.s, z1.h, z31.h
7+
udot z0.b, z1.h, z31.h
88
// CHECK: [[@LINE-1]]:{{[0-9]+}}: error: invalid element width
9-
// CHECK-NEXT: udot z0.s, z1.h, z31.h
9+
// CHECK-NEXT: udot z0.b, z1.h, z31.h
1010
// CHECK-NOT: [[@LINE-1]]:{{[0-9]+}}:
1111

1212
udot z0.d, z1.b, z31.b
Lines changed: 39 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,39 @@
1+
// RUN: not llvm-mc -triple=aarch64 -show-encoding -mattr=+sve2p1 2>&1 < %s | FileCheck %s
2+
3+
// --------------------------------------------------------------------------//
4+
// Invalid vector lane index
5+
6+
sdot z0.s, z0.h, z0.h[8]
7+
// CHECK: [[@LINE-1]]:{{[0-9]+}}: error: vector lane must be an integer in range [0, 3].
8+
// CHECK-NEXT: sdot z0.s, z0.h, z0.h[8]
9+
// CHECK-NOT: [[@LINE-1]]:{{[0-9]+}}:
10+
11+
sdot z0.s, z0.h, z0.h[-1]
12+
// CHECK: [[@LINE-1]]:{{[0-9]+}}: error: vector lane must be an integer in range [0, 3].
13+
// CHECK-NEXT: sdot z0.s, z0.h, z0.h[-1]
14+
// CHECK-NOT: [[@LINE-1]]:{{[0-9]+}}:
15+
16+
movprfx z0, z31
17+
sdot z0.s, z0.h, z0.h[8]
18+
// CHECK: [[@LINE-1]]:{{[0-9]+}}: error: vector lane must be an integer in range [0, 3].
19+
// CHECK-NEXT: sdot z0.s, z0.h, z0.h[8]
20+
// CHECK-NOT: [[@LINE-1]]:{{[0-9]+}}:
21+
22+
movprfx z0, z31
23+
sdot z0.s, z0.h, z0.h[-1]
24+
// CHECK: [[@LINE-1]]:{{[0-9]+}}: error: vector lane must be an integer in range [0, 3].
25+
// CHECK-NEXT: sdot z0.s, z0.h, z0.h[-1]
26+
// CHECK-NOT: [[@LINE-1]]:{{[0-9]+}}:
27+
28+
// --------------------------------------------------------------------------//
29+
// Invalid vector suffix
30+
31+
sdot z0.h, z0.s, z0.s
32+
// CHECK: [[@LINE-1]]:{{[0-9]+}}: error: invalid element width
33+
// CHECK-NEXT: sdot z0.h, z0.s, z0.s
34+
// CHECK-NOT: [[@LINE-1]]:{{[0-9]+}}:
35+
36+
sdot z0.b, z0.h, z0.h[1]
37+
// CHECK: [[@LINE-1]]:{{[0-9]+}}: error: invalid element width
38+
// CHECK-NEXT: sdot z0.b, z0.h, z0.h[1]
39+
// CHECK-NOT: [[@LINE-1]]:{{[0-9]+}}:

llvm/test/MC/AArch64/SVE2p1/sdot.s

Lines changed: 78 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,78 @@
1+
// RUN: llvm-mc -triple=aarch64 -show-encoding -mattr=+sme2 < %s \
2+
// RUN: | FileCheck %s --check-prefixes=CHECK-ENCODING,CHECK-INST
3+
// RUN: llvm-mc -triple=aarch64 -show-encoding -mattr=+sve2p1 < %s \
4+
// RUN: | FileCheck %s --check-prefixes=CHECK-ENCODING,CHECK-INST
5+
// RUN: not llvm-mc -triple=aarch64 -show-encoding < %s 2>&1 \
6+
// RUN: | FileCheck %s --check-prefix=CHECK-ERROR
7+
// RUN: llvm-mc -triple=aarch64 -filetype=obj -mattr=+sme2 < %s \
8+
// RUN: | llvm-objdump -d --mattr=+sme2 - | FileCheck %s --check-prefix=CHECK-INST
9+
// RUN: llvm-mc -triple=aarch64 -filetype=obj -mattr=+sme2 < %s \
10+
// RUN: | llvm-objdump -d - | FileCheck %s --check-prefix=CHECK-UNKNOWN
11+
// RUN: llvm-mc -triple=aarch64 -show-encoding -mattr=+sme2 < %s \
12+
// RUN: | sed '/.text/d' | sed 's/.*encoding: //g' \
13+
// RUN: | llvm-mc -triple=aarch64 -mattr=+sme2 -disassemble -show-encoding \
14+
// RUN: | FileCheck %s --check-prefixes=CHECK-ENCODING,CHECK-INST
15+
16+
movprfx z23, z31
17+
sdot z23.s, z13.h, z0.h[1] // 01000100-10001000-11001001-10110111
18+
// CHECK-INST: movprfx z23, z31
19+
// CHECK-INST: sdot z23.s, z13.h, z0.h[1]
20+
// CHECK-ENCODING: [0xb7,0xc9,0x88,0x44]
21+
// CHECK-ERROR: instruction requires: sme2 or sve2p1
22+
// CHECK-UNKNOWN: 4488c9b7 <unknown>
23+
24+
sdot z0.s, z0.h, z0.h[0] // 01000100-10000000-11001000-00000000
25+
// CHECK-INST: sdot z0.s, z0.h, z0.h[0]
26+
// CHECK-ENCODING: [0x00,0xc8,0x80,0x44]
27+
// CHECK-ERROR: instruction requires: sme2 or sve2p1
28+
// CHECK-UNKNOWN: 4480c800 <unknown>
29+
30+
sdot z21.s, z10.h, z5.h[2] // 01000100-10010101-11001001-01010101
31+
// CHECK-INST: sdot z21.s, z10.h, z5.h[2]
32+
// CHECK-ENCODING: [0x55,0xc9,0x95,0x44]
33+
// CHECK-ERROR: instruction requires: sme2 or sve2p1
34+
// CHECK-UNKNOWN: 4495c955 <unknown>
35+
36+
sdot z23.s, z13.h, z0.h[1] // 01000100-10001000-11001001-10110111
37+
// CHECK-INST: sdot z23.s, z13.h, z0.h[1]
38+
// CHECK-ENCODING: [0xb7,0xc9,0x88,0x44]
39+
// CHECK-ERROR: instruction requires: sme2 or sve2p1
40+
// CHECK-UNKNOWN: 4488c9b7 <unknown>
41+
42+
sdot z31.s, z31.h, z7.h[3] // 01000100-10011111-11001011-11111111
43+
// CHECK-INST: sdot z31.s, z31.h, z7.h[3]
44+
// CHECK-ENCODING: [0xff,0xcb,0x9f,0x44]
45+
// CHECK-ERROR: instruction requires: sme2 or sve2p1
46+
// CHECK-UNKNOWN: 449fcbff <unknown>
47+
48+
movprfx z23, z31
49+
sdot z23.s, z13.h, z8.h // 01000100-00001000-11001001-10110111
50+
// CHECK-INST: movprfx z23, z31
51+
// CHECK-INST: sdot z23.s, z13.h, z8.h
52+
// CHECK-ENCODING: [0xb7,0xc9,0x08,0x44]
53+
// CHECK-ERROR: instruction requires: sme2 or sve2p1
54+
// CHECK-UNKNOWN: 4408c9b7 <unknown>
55+
56+
sdot z0.s, z0.h, z0.h // 01000100-00000000-11001000-00000000
57+
// CHECK-INST: sdot z0.s, z0.h, z0.h
58+
// CHECK-ENCODING: [0x00,0xc8,0x00,0x44]
59+
// CHECK-ERROR: instruction requires: sme2 or sve2p1
60+
// CHECK-UNKNOWN: 4400c800 <unknown>
61+
62+
sdot z21.s, z10.h, z21.h // 01000100-00010101-11001001-01010101
63+
// CHECK-INST: sdot z21.s, z10.h, z21.h
64+
// CHECK-ENCODING: [0x55,0xc9,0x15,0x44]
65+
// CHECK-ERROR: instruction requires: sme2 or sve2p1
66+
// CHECK-UNKNOWN: 4415c955 <unknown>
67+
68+
sdot z23.s, z13.h, z8.h // 01000100-00001000-11001001-10110111
69+
// CHECK-INST: sdot z23.s, z13.h, z8.h
70+
// CHECK-ENCODING: [0xb7,0xc9,0x08,0x44]
71+
// CHECK-ERROR: instruction requires: sme2 or sve2p1
72+
// CHECK-UNKNOWN: 4408c9b7 <unknown>
73+
74+
sdot z31.s, z31.h, z31.h // 01000100-00011111-11001011-11111111
75+
// CHECK-INST: sdot z31.s, z31.h, z31.h
76+
// CHECK-ENCODING: [0xff,0xcb,0x1f,0x44]
77+
// CHECK-ERROR: instruction requires: sme2 or sve2p1
78+
// CHECK-UNKNOWN: 441fcbff <unknown>
Lines changed: 39 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,39 @@
1+
// RUN: not llvm-mc -triple=aarch64 -show-encoding -mattr=+sve2p1 2>&1 < %s | FileCheck %s
2+
3+
// --------------------------------------------------------------------------//
4+
// Invalid vector lane index
5+
6+
udot z0.s, z0.h, z0.h[8]
7+
// CHECK: [[@LINE-1]]:{{[0-9]+}}: error: vector lane must be an integer in range [0, 3].
8+
// CHECK-NEXT: udot z0.s, z0.h, z0.h[8]
9+
// CHECK-NOT: [[@LINE-1]]:{{[0-9]+}}:
10+
11+
udot z0.s, z0.h, z0.h[-1]
12+
// CHECK: [[@LINE-1]]:{{[0-9]+}}: error: vector lane must be an integer in range [0, 3].
13+
// CHECK-NEXT: udot z0.s, z0.h, z0.h[-1]
14+
// CHECK-NOT: [[@LINE-1]]:{{[0-9]+}}:
15+
16+
movprfx z0, z31
17+
udot z0.s, z0.h, z0.h[8]
18+
// CHECK: [[@LINE-1]]:{{[0-9]+}}: error: vector lane must be an integer in range [0, 3].
19+
// CHECK-NEXT: udot z0.s, z0.h, z0.h[8]
20+
// CHECK-NOT: [[@LINE-1]]:{{[0-9]+}}:
21+
22+
movprfx z0, z31
23+
udot z0.s, z0.h, z0.h[-1]
24+
// CHECK: [[@LINE-1]]:{{[0-9]+}}: error: vector lane must be an integer in range [0, 3].
25+
// CHECK-NEXT: udot z0.s, z0.h, z0.h[-1]
26+
// CHECK-NOT: [[@LINE-1]]:{{[0-9]+}}:
27+
28+
// --------------------------------------------------------------------------//
29+
// Invalid vector suffix
30+
31+
udot z0.h, z0.s, z0.s
32+
// CHECK: [[@LINE-1]]:{{[0-9]+}}: error: invalid element width
33+
// CHECK-NEXT: udot z0.h, z0.s, z0.s
34+
// CHECK-NOT: [[@LINE-1]]:{{[0-9]+}}:
35+
36+
udot z0.h, z0.s, z0.s[1]
37+
// CHECK: [[@LINE-1]]:{{[0-9]+}}: error: invalid element width
38+
// CHECK-NEXT: udot z0.h, z0.s, z0.s[1]
39+
// CHECK-NOT: [[@LINE-1]]:{{[0-9]+}}:

llvm/test/MC/AArch64/SVE2p1/udot.s

Lines changed: 78 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,78 @@
1+
// RUN: llvm-mc -triple=aarch64 -show-encoding -mattr=+sme2 < %s \
2+
// RUN: | FileCheck %s --check-prefixes=CHECK-ENCODING,CHECK-INST
3+
// RUN: llvm-mc -triple=aarch64 -show-encoding -mattr=+sve2p1 < %s \
4+
// RUN: | FileCheck %s --check-prefixes=CHECK-ENCODING,CHECK-INST
5+
// RUN: not llvm-mc -triple=aarch64 -show-encoding < %s 2>&1 \
6+
// RUN: | FileCheck %s --check-prefix=CHECK-ERROR
7+
// RUN: llvm-mc -triple=aarch64 -filetype=obj -mattr=+sme2 < %s \
8+
// RUN: | llvm-objdump -d --mattr=+sme2 - | FileCheck %s --check-prefix=CHECK-INST
9+
// RUN: llvm-mc -triple=aarch64 -filetype=obj -mattr=+sme2 < %s \
10+
// RUN: | llvm-objdump -d - | FileCheck %s --check-prefix=CHECK-UNKNOWN
11+
// RUN: llvm-mc -triple=aarch64 -show-encoding -mattr=+sme2 < %s \
12+
// RUN: | sed '/.text/d' | sed 's/.*encoding: //g' \
13+
// RUN: | llvm-mc -triple=aarch64 -mattr=+sme2 -disassemble -show-encoding \
14+
// RUN: | FileCheck %s --check-prefixes=CHECK-ENCODING,CHECK-INST
15+
16+
movprfx z23, z31
17+
udot z23.s, z13.h, z0.h[1] // 01000100-10001000-11001101-10110111
18+
// CHECK-INST: movprfx z23, z31
19+
// CHECK-INST: udot z23.s, z13.h, z0.h[1]
20+
// CHECK-ENCODING: [0xb7,0xcd,0x88,0x44]
21+
// CHECK-ERROR: instruction requires: sme2 or sve2p1
22+
// CHECK-UNKNOWN: 4488cdb7 <unknown>
23+
24+
udot z0.s, z0.h, z0.h[0] // 01000100-10000000-11001100-00000000
25+
// CHECK-INST: udot z0.s, z0.h, z0.h[0]
26+
// CHECK-ENCODING: [0x00,0xcc,0x80,0x44]
27+
// CHECK-ERROR: instruction requires: sme2 or sve2p1
28+
// CHECK-UNKNOWN: 4480cc00 <unknown>
29+
30+
udot z21.s, z10.h, z5.h[2] // 01000100-10010101-11001101-01010101
31+
// CHECK-INST: udot z21.s, z10.h, z5.h[2]
32+
// CHECK-ENCODING: [0x55,0xcd,0x95,0x44]
33+
// CHECK-ERROR: instruction requires: sme2 or sve2p1
34+
// CHECK-UNKNOWN: 4495cd55 <unknown>
35+
36+
udot z23.s, z13.h, z0.h[1] // 01000100-10001000-11001101-10110111
37+
// CHECK-INST: udot z23.s, z13.h, z0.h[1]
38+
// CHECK-ENCODING: [0xb7,0xcd,0x88,0x44]
39+
// CHECK-ERROR: instruction requires: sme2 or sve2p1
40+
// CHECK-UNKNOWN: 4488cdb7 <unknown>
41+
42+
udot z31.s, z31.h, z7.h[3] // 01000100-10011111-11001111-11111111
43+
// CHECK-INST: udot z31.s, z31.h, z7.h[3]
44+
// CHECK-ENCODING: [0xff,0xcf,0x9f,0x44]
45+
// CHECK-ERROR: instruction requires: sme2 or sve2p1
46+
// CHECK-UNKNOWN: 449fcfff <unknown>
47+
48+
movprfx z23, z31
49+
udot z23.s, z13.h, z8.h // 01000100-00001000-11001101-10110111
50+
// CHECK-INST: movprfx z23, z31
51+
// CHECK-INST: udot z23.s, z13.h, z8.h
52+
// CHECK-ENCODING: [0xb7,0xcd,0x08,0x44]
53+
// CHECK-ERROR: instruction requires: sme2 or sve2p1
54+
// CHECK-UNKNOWN: 4408cdb7 <unknown>
55+
56+
udot z0.s, z0.h, z0.h // 01000100-00000000-11001100-00000000
57+
// CHECK-INST: udot z0.s, z0.h, z0.h
58+
// CHECK-ENCODING: [0x00,0xcc,0x00,0x44]
59+
// CHECK-ERROR: instruction requires: sme2 or sve2p1
60+
// CHECK-UNKNOWN: 4400cc00 <unknown>
61+
62+
udot z21.s, z10.h, z21.h // 01000100-00010101-11001101-01010101
63+
// CHECK-INST: udot z21.s, z10.h, z21.h
64+
// CHECK-ENCODING: [0x55,0xcd,0x15,0x44]
65+
// CHECK-ERROR: instruction requires: sme2 or sve2p1
66+
// CHECK-UNKNOWN: 4415cd55 <unknown>
67+
68+
udot z23.s, z13.h, z8.h // 01000100-00001000-11001101-10110111
69+
// CHECK-INST: udot z23.s, z13.h, z8.h
70+
// CHECK-ENCODING: [0xb7,0xcd,0x08,0x44]
71+
// CHECK-ERROR: instruction requires: sme2 or sve2p1
72+
// CHECK-UNKNOWN: 4408cdb7 <unknown>
73+
74+
udot z31.s, z31.h, z31.h // 01000100-00011111-11001111-11111111
75+
// CHECK-INST: udot z31.s, z31.h, z31.h
76+
// CHECK-ENCODING: [0xff,0xcf,0x1f,0x44]
77+
// CHECK-ERROR: instruction requires: sme2 or sve2p1
78+
// CHECK-UNKNOWN: 441fcfff <unknown>

0 commit comments

Comments
 (0)