@@ -96,6 +96,34 @@ module attributes {transform.with_named_sequence} {
 
 // -----
 
+// This is the same as pack_as_pad, but since we explicitly added {allowInsertSliceLowering = false}, it should not
+// be lowered to insert_slice.
+// CHECK-LABEL: func.func @pack_disallowed_as_pad(
+// CHECK: %[[SRC:.+]]: tensor<129x47x16x16xf32>,
+// CHECK: %[[OUT:.+]]: tensor<1x1x1x1x136x64x16x16xf32>)
+func.func @pack_disallowed_as_pad(%arg0: tensor<129x47x16x16xf32>, %arg1: tensor<1x1x1x1x136x64x16x16xf32>) -> tensor<1x1x1x1x136x64x16x16xf32> {
+  %cst_0 = arith.constant 0.0 : f32
+  // With insert_slice lowering disallowed, tensor.pack is lowered to tensor.pad + tensor.expand_shape + linalg.transpose instead of tensor.insert_slice.
+  // CHECK: %[[PAD:.*]] = tensor.pad %[[SRC]] low[0, 0, 0, 0] high[7, 17, 0, 0]
+  // CHECK:   : tensor<129x47x16x16xf32> to tensor<136x64x16x16xf32>
+  // CHECK-NOT: %[[RES:.*]] = tensor.insert_slice %[[PAD]] into %[[OUT]]
+  %pack = tensor.pack %arg0 padding_value(%cst_0 : f32) inner_dims_pos = [0, 1, 2, 3] inner_tiles = [136, 64, 16, 16] into %arg1
+    : tensor<129x47x16x16xf32> -> tensor<1x1x1x1x136x64x16x16xf32>
+  return %pack : tensor<1x1x1x1x136x64x16x16xf32>
+}
+
+module attributes {transform.with_named_sequence} {
+  transform.named_sequence @__transform_main(%module_op: !transform.any_op {transform.readonly}) {
+    %pack = transform.structured.match ops{["tensor.pack"]} in %module_op
+      : (!transform.any_op) -> !transform.op<"tensor.pack">
+    transform.structured.lower_pack %pack {allowInsertSliceLowering = false} : (!transform.op<"tensor.pack">)
+      -> (!transform.op<"tensor.pad">, !transform.op<"tensor.expand_shape">, !transform.op<"linalg.transpose">)
+    transform.yield
+  }
+}
+
+// -----
+
 // Check that we don't lower the following pack as a pad.
 // Although all the outermost dimensions in the resulting shape are 1s,
 // some of the original dimensions are not part of the inner_dims_pos, hence
@@ -233,6 +261,34 @@ module attributes {transform.with_named_sequence} {
 
 // -----
 
+// This is the same as unpack_as_pad, but since we explicitly added {allowExtractSliceLowering = false}, it should not
+// be lowered to extract_slice.
+// CHECK-LABEL: func.func @unpack_disallowed_as_pad(
+func.func @unpack_disallowed_as_pad(%arg0: tensor<1x1x1x1x136x64x16x16xf32>, %arg1: tensor<129x47x16x16xf32>) -> tensor<129x47x16x16xf32> {
+  %cst_0 = arith.constant 0.0 : f32
+
+  // CHECK-SAME: %[[ARG0:[^:]*]]: tensor<1x1x1x1x136x64x16x16xf32>
+  // CHECK-NOT: %[[RES:.*]] = tensor.extract_slice %[[ARG0]]
+  %pack = tensor.unpack %arg0 inner_dims_pos = [0, 1, 2, 3] inner_tiles = [136, 64, 16, 16] into %arg1
+    : tensor<1x1x1x1x136x64x16x16xf32> -> tensor<129x47x16x16xf32>
+  return %pack : tensor<129x47x16x16xf32>
+}
+
+module attributes {transform.with_named_sequence} {
+  transform.named_sequence @__transform_main(%module_op: !transform.any_op {transform.readonly}) {
+    %unpack = transform.structured.match ops{["tensor.unpack"]} in %module_op
+      : (!transform.any_op) -> !transform.op<"tensor.unpack">
+    transform.structured.lower_unpack %unpack {allowExtractSliceLowering = false} : (!transform.op<"tensor.unpack">)
+      -> (!transform.op<"tensor.empty">,
+          !transform.op<"linalg.transpose">,
+          !transform.op<"tensor.collapse_shape">,
+          !transform.op<"tensor.extract_slice">)
+    transform.yield
+  }
+}
+
+// -----
+
 // CHECK-LABEL: func.func @pack_with_outer_dims_perm(
 func.func @pack_with_outer_dims_perm(%src: tensor<100x200x128x256xi32>,
                                      %dest: tensor<200x4x16x100x16x32xi32>)