@@ -965,11 +965,11 @@ def FMopaWide2WayOp
965
965
966
966
```mlir
967
967
%undef = llvm.mlir.undef : vector<[8]xf16>
968
- %a0_ins = vector.scalable.insert %a0_ext , %undef[0] : vector<[4]xf16> into vector<[8]xf16>
969
- %a1_ins = vector.scalable.insert %a1_ext , %undef[0] : vector<[4]xf16> into vector<[8]xf16>
968
+ %a0_ins = vector.scalable.insert %a0, %undef[0] : vector<[4]xf16> into vector<[8]xf16>
969
+ %a1_ins = vector.scalable.insert %a1, %undef[0] : vector<[4]xf16> into vector<[8]xf16>
970
970
%a_packed = "arm_sve.intr.zip1"(%a0_ins, %a1_ins) : (vector<[8]xf16>, vector<[8]xf16>) -> vector<[8]xf16>
971
- %b0_ins = vector.scalable.insert %b0_ext , %undef[0] : vector<[4]xf16> into vector<[8]xf16>
972
- %b1_ins = vector.scalable.insert %b1_ext , %undef[0] : vector<[4]xf16> into vector<[8]xf16>
971
+ %b0_ins = vector.scalable.insert %b0, %undef[0] : vector<[4]xf16> into vector<[8]xf16>
972
+ %b1_ins = vector.scalable.insert %b1, %undef[0] : vector<[4]xf16> into vector<[8]xf16>
973
973
%b_packed = "arm_sve.intr.zip1"(%b0_ins, %b1_ins) : (vector<[8]xf16>, vector<[8]xf16>) -> vector<[8]xf16>
974
974
%0 = arm_sme.fmopa_wide_2way %a_packed, %b_packed : vector<[8]xf16>, vector<[8]xf16> into vector<[4]x[4]xf32>
975
975
```
@@ -1220,18 +1220,18 @@ def SMopaWide4WayOp
1220
1220
1221
1221
```mlir
1222
1222
%undef = llvm.mlir.undef : vector<[8]xf16>
1223
- %a0_ins = vector.scalable.insert %a0_ext , %undef[0] : vector<[4]xf16> into vector<[8]xf16>
1224
- %a1_ins = vector.scalable.insert %a1_ext , %undef[0] : vector<[4]xf16> into vector<[8]xf16>
1225
- %a2_ins = vector.scalable.insert %a2_ext , %undef[0] : vector<[4]xf16> into vector<[8]xf16>
1226
- %a3_ins = vector.scalable.insert %a3_ext , %undef[0] : vector<[4]xf16> into vector<[8]xf16>
1223
+ %a0_ins = vector.scalable.insert %a0, %undef[0] : vector<[4]xf16> into vector<[8]xf16>
1224
+ %a1_ins = vector.scalable.insert %a1, %undef[0] : vector<[4]xf16> into vector<[8]xf16>
1225
+ %a2_ins = vector.scalable.insert %a2, %undef[0] : vector<[4]xf16> into vector<[8]xf16>
1226
+ %a3_ins = vector.scalable.insert %a3, %undef[0] : vector<[4]xf16> into vector<[8]xf16>
1227
1227
%lhs0 = "arm_sve.intr.zip1"(%a0_ins, %a2_ins) : (vector<[8]xf16>, vector<[8]xf16>) -> vector<[8]xf16>
1228
1228
%lhs1 = "arm_sve.intr.zip1"(%a1_ins, %a3_ins) : (vector<[8]xf16>, vector<[8]xf16>) -> vector<[8]xf16>
1229
1229
%lhs = "arm_sve.intr.zip1"(%lhs0, %lhs1) : (vector<[8]xf16>, vector<[8]xf16>) -> vector<[8]xf16>
1230
1230
1231
- %b0_ins = vector.scalable.insert %b0_ext , %undef[0] : vector<[4]xf16> into vector<[8]xf16>
1232
- %b1_ins = vector.scalable.insert %b1_ext , %undef[0] : vector<[4]xf16> into vector<[8]xf16>
1233
- %b2_ins = vector.scalable.insert %b2_ext , %undef[0] : vector<[4]xf16> into vector<[8]xf16>
1234
- %b3_ins = vector.scalable.insert %b3_ext , %undef[0] : vector<[4]xf16> into vector<[8]xf16>
1231
+ %b0_ins = vector.scalable.insert %b0, %undef[0] : vector<[4]xf16> into vector<[8]xf16>
1232
+ %b1_ins = vector.scalable.insert %b1, %undef[0] : vector<[4]xf16> into vector<[8]xf16>
1233
+ %b2_ins = vector.scalable.insert %b2, %undef[0] : vector<[4]xf16> into vector<[8]xf16>
1234
+ %b3_ins = vector.scalable.insert %b3, %undef[0] : vector<[4]xf16> into vector<[8]xf16>
1235
1235
%rhs0 = "arm_sve.intr.zip1"(%b0_ins, %b2_ins) : (vector<[8]xf16>, vector<[8]xf16>) -> vector<[8]xf16>
1236
1236
%rhs1 = "arm_sve.intr.zip1"(%b1_ins, %b3_ins) : (vector<[8]xf16>, vector<[8]xf16>) -> vector<[8]xf16>
1237
1237
%rhs = "arm_sve.intr.zip1"(%rhs0, %rhs1) : (vector<[8]xf16>, vector<[8]xf16>) -> vector<[8]xf16>
0 commit comments