Commit 2eb7341

add dynamic support for embedding_bag/index_select (#3032)
1 parent e6a1932 commit 2eb7341

File tree

3 files changed: +201 -4 lines changed


py/torch_tensorrt/dynamo/conversion/aten_ops_converters.py

Lines changed: 9 additions & 3 deletions
@@ -283,10 +283,14 @@ def embedding_bag_validator(node: Node) -> bool:


 @dynamo_tensorrt_converter(
-    torch.ops.aten.embedding_bag.default, capability_validator=embedding_bag_validator
+    torch.ops.aten.embedding_bag.default,
+    capability_validator=embedding_bag_validator,
+    supports_dynamic_shapes=True,
 )
 @dynamo_tensorrt_converter(
-    torch.ops.aten._embedding_bag.default, capability_validator=embedding_bag_validator
+    torch.ops.aten._embedding_bag.default,
+    capability_validator=embedding_bag_validator,
+    supports_dynamic_shapes=True,
 )
 @enforce_tensor_types(
     {
@@ -3379,7 +3383,9 @@ def aten_ops_roll(
     )


-@dynamo_tensorrt_converter(torch.ops.aten.index_select.default)
+@dynamo_tensorrt_converter(
+    torch.ops.aten.index_select.default, supports_dynamic_shapes=True
+)
 @enforce_tensor_types(
     {
         0: (TRTTensor,),
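
The registrations above only declare that these converters can handle symbolic input dimensions; the tests added below exercise the full flow. As a rough usage sketch (the module, shapes, and dimension bounds here are illustrative rather than taken from the commit; a CUDA device and a torch_tensorrt build with the dynamo frontend are assumed), compiling index_select with a dynamic leading dimension looks like this:

import torch
import torch_tensorrt


class IndexSelect(torch.nn.Module):
    def forward(self, source, indices):
        # dim 0 of `source` is declared dynamic at export time below
        return torch.ops.aten.index_select.default(source, 0, indices)


source = torch.randn((3, 4), dtype=torch.float32)
indices = torch.tensor([0, 2], dtype=torch.int32)

# Mark dim 0 of `source` as a symbolic dimension in the exported graph.
dyn_dim = torch.export.Dim("dyn_dim", min=2, max=8)
exported = torch.export.export(
    IndexSelect(),
    (source, indices),
    dynamic_shapes={"source": {0: dyn_dim}, "indices": {}},
)

# With supports_dynamic_shapes=True on the converter, the index_select node
# can stay in the TensorRT block instead of falling back to PyTorch.
trt_mod = torch_tensorrt.dynamo.compile(
    exported, inputs=(source, indices), min_block_size=1
)

# Run with a different size along the dynamic dimension.
print(trt_mod(torch.randn((6, 4)).cuda(), indices.cuda()))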

tests/py/dynamo/conversion/test_embedding_bag_aten.py

Lines changed: 99 additions & 0 deletions
@@ -1,6 +1,8 @@
 import torch
+import torch_tensorrt
 from parameterized import param, parameterized
 from torch.testing._internal.common_utils import run_tests
+from torch_tensorrt import Input

 from .harness import DispatchTestCase

@@ -408,6 +410,103 @@ def forward(self, weight, indices, offsets):
             propagate_shapes=True,
         )

+    @parameterized.expand(
+        [
+            param(
+                # 1d_indices_mode_0_with_per_sample_weights
+                # weights is for compile
+                weights=torch.randn((5, 2), dtype=torch.float32),
+                # weights_1 is for inference
+                weights_1=torch.randn((6, 2), dtype=torch.float32),
+                dynamic_shapes={
+                    "weights": {0: torch.export.Dim("dyn_dim", min=2, max=6)},
+                    "indices": {},
+                    "offsets": {},
+                },
+                indices=torch.tensor([1, 2, 4], dtype=torch.int32),
+                offsets=torch.tensor([0, 2, 3], dtype=torch.int32),
+                mode=0,
+                per_sample_weights=torch.randn((3,), dtype=torch.float32),
+            ),
+            param(
+                # 1d_indices_mode_1_without_per_sample_weights
+                # weights is for compile
+                weights=torch.randn((5, 2), dtype=torch.float32),
+                # weights_1 is for inference
+                weights_1=torch.randn((6, 3), dtype=torch.float32),
+                dynamic_shapes={
+                    "weights": {
+                        0: torch.export.Dim("dyn_dim", min=2, max=8),
+                        1: torch.export.Dim("dyn_dim_1", min=1, max=3),
+                    },
+                    "indices": {},
+                    "offsets": {},
+                },
+                indices=torch.tensor([1, 2, 4, 2, 3, 4], dtype=torch.int32),
+                offsets=torch.tensor([0, 2, 4], dtype=torch.int32),
+                mode=1,
+                per_sample_weights=None,
+            ),
+        ]
+    )
+    def test_embedding_bag_with_weights_dynamic_shape(
+        self,
+        weights,
+        weights_1,
+        dynamic_shapes,
+        indices,
+        offsets,
+        mode,
+        per_sample_weights,
+    ):
+        class EmbeddingBag(torch.nn.Module):
+            def forward(self, weights, indices, offsets, per_sample_weights=None):
+                return torch.ops.aten._embedding_bag.default(
+                    weight=weights,
+                    indices=indices,
+                    offsets=offsets,
+                    per_sample_weights=per_sample_weights,
+                    scale_grad_by_freq=False,
+                    mode=mode,
+                    sparse=False,
+                    include_last_offset=False,
+                    padding_idx=-1,
+                )
+
+        if per_sample_weights is None:
+            inputs = (weights, indices, offsets)
+        else:
+            inputs = (weights, indices, offsets, per_sample_weights)
+        mod = EmbeddingBag()
+
+        if per_sample_weights is not None:
+            dynamic_shapes["per_sample_weights"] = {}
+        fx_mod = torch.export.export(mod, inputs, dynamic_shapes=dynamic_shapes)
+        trt_mod = torch_tensorrt.dynamo.compile(
+            fx_mod, inputs=inputs, enable_precisions=torch.float32, min_block_size=1
+        )
+        # use the inputs with different shape to inference:
+        if per_sample_weights is None:
+            inputs = (weights_1, indices, offsets)
+        else:
+            inputs = (weights_1, indices, offsets, per_sample_weights)
+
+        with torch.no_grad():
+            cuda_inputs = []
+            for i in inputs:
+                cuda_inputs.append(i.cuda())
+            ref_outputs = mod(*cuda_inputs)
+            outputs = trt_mod(*cuda_inputs)
+            for out, ref in zip(outputs, ref_outputs):
+                torch.testing.assert_close(
+                    out,
+                    ref,
+                    rtol=0.001,
+                    atol=0.001,
+                    equal_nan=True,
+                    check_dtype=True,
+                )
+

 if __name__ == "__main__":
     run_tests()

tests/py/dynamo/conversion/test_index_select_aten.py

Lines changed: 93 additions & 1 deletion
@@ -1,7 +1,9 @@
 import torch
 import torch.nn as nn
-from parameterized import parameterized
+import torch_tensorrt
+from parameterized import param, parameterized
 from torch.testing._internal.common_utils import run_tests
+from torch_tensorrt import Input

 from .harness import DispatchTestCase

@@ -36,6 +38,96 @@ def forward(self, source_tensor, indices_tensor):
             input,
         )

+    @parameterized.expand(
+        [
+            param(
+                # 1d_source_tensor
+                # source_tensor is for compile
+                source_tensor=torch.randn((3,), dtype=torch.float32),
+                # source_tensor_1 is for inference
+                source_tensor_1=torch.randn((5,), dtype=torch.float32),
+                dynamic_shapes={
+                    "source_tensor": {0: torch.export.Dim("dyn_dim", min=3, max=6)},
+                    "indice_tensor": {},
+                },
+                dim=0,
+                indice_tensor=torch.tensor(
+                    [
+                        1,
+                    ],
+                    dtype=torch.int32,
+                ),
+            ),
+            param(
+                # 2d_source_tensor
+                # source_tensor is for compile
+                source_tensor=torch.randn((3, 3), dtype=torch.float32),
+                # source_tensor_1 is for inference
+                source_tensor_1=torch.randn((4, 6), dtype=torch.float32),
+                dynamic_shapes={
+                    "source_tensor": {
+                        0: torch.export.Dim("dyn_dim1", min=3, max=6),
+                        1: torch.export.Dim("dyn_dim2", min=2, max=7),
+                    },
+                    "indice_tensor": {},
+                },
+                dim=-1,
+                indice_tensor=torch.tensor([0, 2], dtype=torch.int32),
+            ),
+            param(
+                # 3d_source_tensor
+                # source_tensor is for compile
+                source_tensor=torch.randn((3, 4, 2), dtype=torch.float32),
+                # source_tensor_1 is for inference
+                source_tensor_1=torch.randn((6, 7, 2), dtype=torch.float32),
+                dynamic_shapes={
+                    "source_tensor": {
+                        0: torch.export.Dim("dyn_dim1", min=3, max=6),
+                        1: torch.export.Dim("dyn_dim2", min=2, max=7),
+                    },
+                    "indice_tensor": {},
+                },
+                dim=-2,
+                indice_tensor=torch.tensor([0, 0, 2], dtype=torch.int32),
+            ),
+        ]
+    )
+    def test_index_select_dynamic_shape(
+        self, source_tensor, source_tensor_1, dynamic_shapes, dim, indice_tensor
+    ):
+        class IndexSelect(torch.nn.Module):
+            def forward(self, source_tensor, indice_tensor):
+                return torch.ops.aten.index_select.default(
+                    source_tensor,
+                    dim,
+                    indice_tensor,
+                )
+
+        inputs = (source_tensor, indice_tensor)
+        mod = IndexSelect()
+
+        fx_mod = torch.export.export(mod, inputs, dynamic_shapes=dynamic_shapes)
+        trt_mod = torch_tensorrt.dynamo.compile(
+            fx_mod, inputs=inputs, enable_precisions=torch.float32, min_block_size=1
+        )
+        # use different shape of inputs for inference:
+        inputs = (source_tensor_1, indice_tensor)
+        with torch.no_grad():
+            cuda_inputs = []
+            for i in inputs:
+                cuda_inputs.append(i.cuda())
+            ref_outputs = mod(*cuda_inputs)
+            outputs = trt_mod(*cuda_inputs)
+            for out, ref in zip(outputs, ref_outputs):
+                torch.testing.assert_close(
+                    out,
+                    ref,
+                    rtol=0.001,
+                    atol=0.001,
+                    equal_nan=True,
+                    check_dtype=True,
+                )
+

 if __name__ == "__main__":
     run_tests()
