1
1
// RUN: mlir-opt %s -test-sink-vector-broadcast -split-input-file | FileCheck %s
2
2
3
+ //-----------------------------------------------------------------------------
4
+ // [Pattern: ReorderElementwiseOpsOnBroadcast]
5
+ //-----------------------------------------------------------------------------
6
+
3
7
// CHECK-LABEL: func.func @broadcast_scalar_with_bcast(
4
8
// CHECK-SAME: %[[ARG_0:.*]]: index, %[[ARG_1:.*]]: index) -> vector<1x4xindex> {
5
9
// CHECK: %[[ADD:.*]] = arith.addi %[[ARG_0]], %[[ARG_1]] : index
6
10
// CHECK: %[[BCAST:.*]] = vector.broadcast %[[ADD]] : index to vector<1x4xindex>
7
11
// CHECK: return %[[BCAST]] : vector<1x4xindex>
8
12
9
- func.func @broadcast_scalar_with_bcast ( %arg1: index , %arg2: index ) -> vector <1 x4 xindex > {
13
+ func.func @broadcast_scalar_with_bcast (%arg1: index , %arg2: index ) -> vector <1 x4 xindex > {
10
14
%0 = vector.broadcast %arg1 : index to vector <1 x4 xindex >
11
15
%1 = vector.broadcast %arg2 : index to vector <1 x4 xindex >
12
- %2 = arith.addi %0 , %1 : vector <1 x4 xindex >
13
- return %2 : vector <1 x4 xindex >
16
+ %2 = arith.addi %0 , %1 : vector <1 x4 xindex > return %2 : vector <1 x4 xindex >
17
+ }
18
+
19
+ // CHECK-LABEL: func.func @broadcast_scalar_with_bcast_scalable(
20
+ // CHECK-SAME: %[[ARG_0:.*]]: index, %[[ARG_1:.*]]: index) -> vector<1x[4]xindex> {
21
+ // CHECK: %[[ADD:.*]] = arith.addi %[[ARG_0]], %[[ARG_1]] : index
22
+ // CHECK: %[[BCAST:.*]] = vector.broadcast %[[ADD]] : index to vector<1x[4]xindex>
23
+ // CHECK: return %[[BCAST]] : vector<1x[4]xindex>
24
+
25
+ func.func @broadcast_scalar_with_bcast_scalable (%arg1: index , %arg2: index ) -> vector <1 x[4 ]xindex > {
26
+ %0 = vector.broadcast %arg1 : index to vector <1 x[4 ]xindex >
27
+ %1 = vector.broadcast %arg2 : index to vector <1 x[4 ]xindex >
28
+ %2 = arith.addi %0 , %1 : vector <1 x[4 ]xindex >
29
+ return %2 : vector <1 x[4 ]xindex >
14
30
}
15
31
16
32
// -----
@@ -21,13 +37,26 @@ func.func @broadcast_scalar_with_bcast( %arg1: index, %arg2: index) -> vector<1x
21
37
// CHECK: %[[ADD:.*]] = arith.addi %[[ARG1]], %[[ARG2]] : index
22
38
// CHECK: %[[BCAST:.*]] = vector.broadcast %[[ADD]] : index to vector<1x4xindex>
23
39
// CHECK: return %[[BCAST]] : vector<1x4xindex>
24
- func.func @broadcast_scalar_with_bcast_and_splat ( %arg1: index , %arg2: index ) -> vector <1 x4 xindex > {
40
+ func.func @broadcast_scalar_with_bcast_and_splat (%arg1: index , %arg2: index ) -> vector <1 x4 xindex > {
25
41
%0 = vector.splat %arg1 : vector <1 x4 xindex >
26
42
%1 = vector.broadcast %arg2 : index to vector <1 x4 xindex >
27
43
%2 = arith.addi %0 , %1 : vector <1 x4 xindex >
28
44
return %2 : vector <1 x4 xindex >
29
45
}
30
46
47
+ // CHECK-LABEL: func.func @broadcast_scalar_with_bcast_and_splat_scalable(
48
+ // CHECK-SAME: %[[ARG1:.*]]: index,
49
+ // CHECK-SAME: %[[ARG2:.*]]: index) -> vector<1x[4]xindex> {
50
+ // CHECK: %[[ADD:.*]] = arith.addi %[[ARG1]], %[[ARG2]] : index
51
+ // CHECK: %[[BCAST:.*]] = vector.broadcast %[[ADD]] : index to vector<1x[4]xindex>
52
+ // CHECK: return %[[BCAST]] : vector<1x[4]xindex>
53
+ func.func @broadcast_scalar_with_bcast_and_splat_scalable (%arg1: index , %arg2: index ) -> vector <1 x[4 ]xindex > {
54
+ %0 = vector.splat %arg1 : vector <1 x[4 ]xindex >
55
+ %1 = vector.broadcast %arg2 : index to vector <1 x[4 ]xindex >
56
+ %2 = arith.addi %0 , %1 : vector <1 x[4 ]xindex >
57
+ return %2 : vector <1 x[4 ]xindex >
58
+ }
59
+
31
60
// -----
32
61
33
62
// CHECK-LABEL: func.func @broadcast_vector(
@@ -37,13 +66,27 @@ func.func @broadcast_scalar_with_bcast_and_splat( %arg1: index, %arg2: index) ->
37
66
// CHECK: %[[BCAST:.*]] = vector.broadcast %[[ADDF]] : vector<4xf32> to vector<3x4xf32>
38
67
// CHECK: return %[[BCAST]] : vector<3x4xf32>
39
68
40
- func.func @broadcast_vector ( %arg1: vector <4 xf32 >, %arg2: vector <4 xf32 >) -> vector <3 x4 xf32 > {
69
+ func.func @broadcast_vector (%arg1: vector <4 xf32 >, %arg2: vector <4 xf32 >) -> vector <3 x4 xf32 > {
41
70
%arg1_bcast = vector.broadcast %arg1 : vector <4 xf32 > to vector <3 x4 xf32 >
42
71
%arg2_bcast = vector.broadcast %arg2 : vector <4 xf32 > to vector <3 x4 xf32 >
43
72
%2 = arith.addf %arg1_bcast , %arg2_bcast : vector <3 x4 xf32 >
44
73
return %2 : vector <3 x4 xf32 >
45
74
}
46
75
76
+ // CHECK-LABEL: func.func @broadcast_vector_scalable(
77
+ // CHECK-SAME: %[[ARG_0:.*]]: vector<[4]xf32>,
78
+ // CHECK-SAME: %[[ARG_1:.*]]: vector<[4]xf32>) -> vector<3x[4]xf32> {
79
+ // CHECK: %[[ADDF:.*]] = arith.addf %[[ARG_0]], %[[ARG_1]] : vector<[4]xf32>
80
+ // CHECK: %[[BCAST:.*]] = vector.broadcast %[[ADDF]] : vector<[4]xf32> to vector<3x[4]xf32>
81
+ // CHECK: return %[[BCAST]] : vector<3x[4]xf32>
82
+
83
+ func.func @broadcast_vector_scalable (%arg1: vector <[4 ]xf32 >, %arg2: vector <[4 ]xf32 >) -> vector <3 x[4 ]xf32 > {
84
+ %arg1_bcast = vector.broadcast %arg1 : vector <[4 ]xf32 > to vector <3 x[4 ]xf32 >
85
+ %arg2_bcast = vector.broadcast %arg2 : vector <[4 ]xf32 > to vector <3 x[4 ]xf32 >
86
+ %2 = arith.addf %arg1_bcast , %arg2_bcast : vector <3 x[4 ]xf32 >
87
+ return %2 : vector <3 x[4 ]xf32 >
88
+ }
89
+
47
90
// -----
48
91
49
92
// CHECK-LABEL: func.func @broadcast_scalar_and_vec(
@@ -53,13 +96,27 @@ func.func @broadcast_vector( %arg1: vector<4xf32>, %arg2: vector<4xf32>) -> vect
53
96
// CHECK: %[[BCAST:.*]] = vector.broadcast %[[ARG2]] : vector<4xindex> to vector<1x4xindex>
54
97
// CHECK: %[[ADD:.*]] = arith.addi %[[SPLAT]], %[[BCAST]] : vector<1x4xindex>
55
98
// CHECK: return %[[ADD]] : vector<1x4xindex>
56
- func.func @broadcast_scalar_and_vec ( %arg1: index , %arg2: vector <4 xindex >) -> vector <1 x4 xindex > {
99
+ func.func @broadcast_scalar_and_vec (%arg1: index , %arg2: vector <4 xindex >) -> vector <1 x4 xindex > {
57
100
%0 = vector.splat %arg1 : vector <1 x4 xindex >
58
101
%1 = vector.broadcast %arg2 : vector <4 xindex > to vector <1 x4 xindex >
59
102
%2 = arith.addi %0 , %1 : vector <1 x4 xindex >
60
103
return %2 : vector <1 x4 xindex >
61
104
}
62
105
106
+ // CHECK-LABEL: func.func @broadcast_scalar_and_vec_scalable(
107
+ // CHECK-SAME: %[[ARG1:.*]]: index,
108
+ // CHECK-SAME: %[[ARG2:.*]]: vector<[4]xindex>) -> vector<1x[4]xindex> {
109
+ // CHECK: %[[SPLAT:.*]] = vector.splat %[[ARG1]] : vector<1x[4]xindex>
110
+ // CHECK: %[[BCAST:.*]] = vector.broadcast %[[ARG2]] : vector<[4]xindex> to vector<1x[4]xindex>
111
+ // CHECK: %[[ADD:.*]] = arith.addi %[[SPLAT]], %[[BCAST]] : vector<1x[4]xindex>
112
+ // CHECK: return %[[ADD]] : vector<1x[4]xindex>
113
+ func.func @broadcast_scalar_and_vec_scalable (%arg1: index , %arg2: vector <[4 ]xindex >) -> vector <1 x[4 ]xindex > {
114
+ %0 = vector.splat %arg1 : vector <1 x[4 ]xindex >
115
+ %1 = vector.broadcast %arg2 : vector <[4 ]xindex > to vector <1 x[4 ]xindex >
116
+ %2 = arith.addi %0 , %1 : vector <1 x[4 ]xindex >
117
+ return %2 : vector <1 x[4 ]xindex >
118
+ }
119
+
63
120
// -----
64
121
65
122
// CHECK-LABEL: func.func @broadcast_vector_and_scalar(
@@ -69,12 +126,25 @@ func.func @broadcast_scalar_and_vec( %arg1: index, %arg2: vector<4xindex>) -> ve
69
126
// CHECK: %[[ADD:.*]] = arith.addi %[[BCAST]], %[[ARG_1]] : vector<4xi32>
70
127
// CHECK: return %[[ADD]] : vector<4xi32>
71
128
72
- func.func @broadcast_vector_and_scalar ( %arg1: i32 , %arg2: vector <4 xi32 >) -> vector <4 xi32 > {
129
+ func.func @broadcast_vector_and_scalar (%arg1: i32 , %arg2: vector <4 xi32 >) -> vector <4 xi32 > {
73
130
%arg1_bcast = vector.broadcast %arg1 : i32 to vector <4 xi32 >
74
131
%2 = arith.addi %arg1_bcast , %arg2 : vector <4 xi32 >
75
132
return %2 : vector <4 xi32 >
76
133
}
77
134
135
+ // CHECK-LABEL: func.func @broadcast_vector_and_scalar_scalable(
136
+ // CHECK-SAME: %[[ARG_0:.*]]: i32,
137
+ // CHECK-SAME: %[[ARG_1:.*]]: vector<[4]xi32>) -> vector<[4]xi32> {
138
+ // CHECK: %[[BCAST:.*]] = vector.broadcast %[[ARG_0]] : i32 to vector<[4]xi32>
139
+ // CHECK: %[[ADD:.*]] = arith.addi %[[BCAST]], %[[ARG_1]] : vector<[4]xi32>
140
+ // CHECK: return %[[ADD]] : vector<[4]xi32>
141
+
142
+ func.func @broadcast_vector_and_scalar_scalable (%arg1: i32 , %arg2: vector <[4 ]xi32 >) -> vector <[4 ]xi32 > {
143
+ %arg1_bcast = vector.broadcast %arg1 : i32 to vector <[4 ]xi32 >
144
+ %2 = arith.addi %arg1_bcast , %arg2 : vector <[4 ]xi32 >
145
+ return %2 : vector <[4 ]xi32 >
146
+ }
147
+
78
148
// -----
79
149
80
150
#matmat_accesses = [
@@ -87,40 +157,52 @@ func.func @broadcast_vector_and_scalar( %arg1: i32, %arg2: vector<4xi32>) -> vec
87
157
iterator_types = [" parallel" , " parallel" , " reduction" ]
88
158
}
89
159
90
- // CHECK-LABEL: func.func @broadcast_not_elementwise() -> vector<2x2xf32> {
91
- // CHECK-DAG: %[[VAL_0:.*]] = arith.constant dense<1.000000e+00> : vector<2x2xf32>
92
- // CHECK-DAG: %[[VAL_1:.*]] = arith.constant dense<2.000000e+00> : vector<2x2xf32>
93
- // CHECK-DAG: %[[VAL_2:.*]] = arith.constant dense<3.000000e+00> : vector<2x2xf32>
94
- // CHECK: %[[VAL_3:.*]] = vector.contract {indexing_maps = [#map, #map1, #map2], iterator_types = ["parallel", "parallel", "reduction"], kind = #vector.kind<add>} %[[VAL_0]], %[[VAL_1]], %[[VAL_2]] : vector<2x2xf32>, vector<2x2xf32> into vector<2x2xf32>
95
- func.func @broadcast_not_elementwise () -> vector <2 x2 xf32 > {
160
+ // CHECK-LABEL: func.func @negative_not_elementwise
161
+ // CHECK-DAG: %[[F1:.*]] = arith.constant dense<1.000000e+00> : vector<2x2xf32>
162
+ // CHECK-DAG: %[[F2:.*]] = arith.constant dense<2.000000e+00> : vector<2x2xf32>
163
+ // CHECK-DAG: %[[F3:.*]] = arith.constant dense<3.000000e+00> : vector<2x2xf32>
164
+ // CHECK: %[[RES:.*]] = vector.contract {indexing_maps = [#map, #map1, #map2], iterator_types = ["parallel", "parallel", "reduction"], kind = #vector.kind<add>} %[[F1]], %[[F2]], %[[F3]] : vector<2x2xf32>, vector<2x2xf32> into vector<2x2xf32>
165
+ func.func @negative_not_elementwise () -> vector <2 x2 xf32 > {
96
166
%f1 = arith.constant 1.0 : f32
97
167
%f2 = arith.constant 2.0 : f32
98
168
%f3 = arith.constant 3.0 : f32
99
169
100
170
%A = vector.broadcast %f1 : f32 to vector <2 x2 xf32 >
101
171
%B = vector.broadcast %f2 : f32 to vector <2 x2 xf32 >
102
172
%C = vector.broadcast %f3 : f32 to vector <2 x2 xf32 >
103
- %mm1 = vector.contract #matmat_trait %A , %B , %C
173
+ %res = vector.contract #matmat_trait %A , %B , %C
104
174
: vector <2 x2 xf32 >, vector <2 x2 xf32 > into vector <2 x2 xf32 >
105
175
106
- return %mm1 : vector <2 x2 xf32 >
176
+ return %res : vector <2 x2 xf32 >
107
177
}
108
178
109
- // CHECK-LABEL: func.func @dont_sink_cmp(
179
+ // -----
180
+
181
+ // The operands and the result of arith.cmpf have different element types (f32 vs. i1) - not supported.
182
+
183
+ // CHECK-LABEL: func.func @negative_source_and_result_mismatch
110
184
// CHECK: %[[BROADCAST:.+]] = vector.broadcast
111
185
// CHECK: %[[RETURN:.+]] = arith.cmpf uno, %[[BROADCAST]], %[[BROADCAST]]
112
186
// CHECK: return %[[RETURN]]
113
- func.func @dont_sink_cmp (%arg0 : f32 , %arg1 : vector <1 xf32 >) -> vector <1 xi1 > {
187
+ func.func @negative_source_and_result_mismatch (%arg0 : f32 , %arg1 : vector <1 xf32 >) -> vector <1 xi1 > {
114
188
%0 = vector.broadcast %arg0 : f32 to vector <1 xf32 >
115
189
%1 = arith.cmpf uno , %0 , %0 : vector <1 xf32 >
116
190
return %1 : vector <1 xi1 >
117
191
}
118
192
119
- // CHECK-LABEL: func.func @dont_sink_fma(
193
+ // -----
194
+
195
+ // vector.fma only supports vectors - currently it's not possible to replace this with e.g.:
196
+ // %scalar_res = vector.fma %scalar_1, %scalar_2, %scalar_3
197
+ // %vec_res = vector.broadcast %scalar_res
198
+ //
199
+ // TODO: It should be possible to support this case
200
+
201
+ // CHECK-LABEL: func.func @negative_op_only_supports_vectors
120
202
// CHECK: %[[BROADCAST:.+]] = vector.broadcast
121
203
// CHECK: %[[RESULT:.+]] = vector.fma %[[BROADCAST]]
122
204
// CHECK: return %[[RESULT]]
123
- func.func @dont_sink_fma (%arg0 : f32 ) -> vector <1 xf32 > {
205
+ func.func @negative_op_only_supports_vectors (%arg0 : f32 ) -> vector <1 xf32 > {
124
206
%0 = vector.broadcast %arg0 : f32 to vector <1 xf32 >
125
207
%1 = vector.fma %0 , %0 , %0 : vector <1 xf32 >
126
208
return %1 : vector <1 xf32 >
0 commit comments