
Commit 75b445b

broadcast the two input shapes for transposed matmul
1 parent 81f2dab commit 75b445b

File tree

2 files changed: +11 -0 lines changed


py/torch_tensorrt/fx/converters/acc_ops_converters.py

Lines changed: 8 additions & 0 deletions
@@ -38,6 +38,14 @@ def trt_transposed_matmul_converter(network, target, args, kwargs, name):
         lhs = get_trt_tensor(network, lhs, f"{name}_lhs")
     if isinstance(rhs, torch.nn.Parameter):
         rhs = get_trt_tensor(network, rhs, f"{name}_rhs")
+
+    lhs, rhs = broadcast(
+        network,
+        lhs,
+        rhs,
+        f"{lhs.name}_broadcast",
+        f"{rhs.name}_broadcast",
+    )
     layer = network.add_matrix_multiply(
         lhs,
         trt.MatrixOperation.TRANSPOSE if lhs_transposed else trt.MatrixOperation.NONE,
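The added broadcast() call aligns the ranks of the two matmul inputs before they reach add_matrix_multiply, since TensorRT's matrix-multiply layer expects both operands to have the same number of dimensions. A minimal sketch of the rank-alignment idea, assuming the fx broadcast helper pads the lower-rank input with leading size-1 dimensions (align_ranks below is a hypothetical stand-in, not the library helper):

```python
# Hypothetical helper (not torch_tensorrt's broadcast()) illustrating the
# rank alignment: pad the lower-rank shape with leading 1s so both matmul
# operands end up with the same number of dimensions.
def align_ranks(lhs_shape, rhs_shape):
    diff = len(lhs_shape) - len(rhs_shape)
    if diff > 0:
        rhs_shape = (1,) * diff + tuple(rhs_shape)
    elif diff < 0:
        lhs_shape = (1,) * -diff + tuple(lhs_shape)
    return tuple(lhs_shape), tuple(rhs_shape)

# e.g. a (2, 3) lhs against a batched (3, 3, 4) rhs -> (1, 2, 3) and (3, 3, 4)
print(align_ranks((2, 3), (3, 3, 4)))
```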

py/torch_tensorrt/fx/test/passes/test_fuse_permute_matmul_trt.py

Lines changed: 3 additions & 0 deletions
@@ -37,6 +37,8 @@ class TestFusePermuteMatmul(AccTestCase):
                 lambda x: x.permute(0, 1, 3, 2),
                 torch.matmul,
             ),
+            param("transpose_lhs_bmm_broadcast", (3, 2), (3, 3, 4), tranpose_last_two_dims, op=torch.matmul),
+            param("transpose_rhs_bmm_broadcast", (3, 3, 4), (3, 4), rhs_op=tranpose_last_two_dims, op=torch.matmul),
         ]
     )
     def test_fuse_permute_matmul(
@@ -58,6 +60,7 @@ def forward(self, x, y):
             inputs,
             {trt_transposed_matmul},
             apply_passes=[fuse_permute_matmul],
+            test_implicit_batch_dim=(len(lhs_shape) == len(rhs_shape)),
         )
 
     @parameterized.expand(
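The two new parameterized cases exercise matmuls whose operands have different ranks, so PyTorch's batched-matmul broadcasting applies; test_implicit_batch_dim is only enabled when the ranks match, presumably because implicit-batch mode cannot express this kind of broadcast. A small torch-only check of the shapes these cases produce (variable names here are illustrative, not from the test file):

```python
import torch

# transpose_lhs_bmm_broadcast: a (3, 2) lhs is transposed to (2, 3) and
# broadcast against a batched (3, 3, 4) rhs.
lhs = torch.randn(3, 2).transpose(-1, -2)   # (2, 3)
rhs = torch.randn(3, 3, 4)
assert torch.matmul(lhs, rhs).shape == (3, 2, 4)

# transpose_rhs_bmm_broadcast: a (3, 4) rhs is transposed to (4, 3) and
# broadcast against a batched (3, 3, 4) lhs.
lhs2 = torch.randn(3, 3, 4)
rhs2 = torch.randn(3, 4).transpose(-1, -2)  # (4, 3)
assert torch.matmul(lhs2, rhs2).shape == (3, 3, 3)
```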
