1
- from typing import List , Dict , Any
1
+ from typing import List , Dict , Any , Set , Union , Callable , TypeGuard
2
+
2
3
import torch_tensorrt .ts
3
4
4
- from torch_tensorrt import logging
5
+ from torch_tensorrt import logging , Input , dtype
5
6
import torch
6
7
import torch .fx
7
8
from enum import Enum
8
9
9
10
import torch_tensorrt .fx
11
+ from torch_tensorrt .fx import InputTensorSpec
10
12
from torch_tensorrt .fx .utils import LowerPrecision
11
13
12
14
15
def _non_fx_input_interface(
    inputs: List[Input | torch.Tensor | InputTensorSpec],
) -> TypeGuard[List[Input | torch.Tensor]]:
    """Narrow ``inputs`` to the TS/dynamo-compatible input types.

    Args:
        inputs: Candidate compile inputs, possibly mixing ``Input``,
            ``torch.Tensor``, and fx ``InputTensorSpec`` elements.

    Returns:
        True iff every element is a ``torch.Tensor`` or ``Input`` (i.e. no
        fx-only ``InputTensorSpec``), letting the type checker treat the
        list as valid for the TorchScript frontend.
    """
    # Generator with a tuple isinstance check: short-circuits on the first
    # non-matching element instead of building an intermediate list, and
    # avoids the X | Y isinstance form for broader compatibility.
    return all(isinstance(i, (torch.Tensor, Input)) for i in inputs)
17
+
18
def _fx_input_interface(
    inputs: List[Input | torch.Tensor | InputTensorSpec],
) -> TypeGuard[List[InputTensorSpec | torch.Tensor]]:
    """Narrow ``inputs`` to the fx-frontend-compatible input types.

    Args:
        inputs: Candidate compile inputs, possibly mixing ``Input``,
            ``torch.Tensor``, and fx ``InputTensorSpec`` elements.

    Returns:
        True iff every element is a ``torch.Tensor`` or ``InputTensorSpec``
        (i.e. no TS-only ``Input``), letting the type checker treat the
        list as valid for the fx frontend.
    """
    # Generator with a tuple isinstance check: short-circuits on the first
    # non-matching element instead of building an intermediate list, and
    # avoids the X | Y isinstance form for broader compatibility.
    return all(isinstance(i, (torch.Tensor, InputTensorSpec)) for i in inputs)
20
+
13
21
class _IRType (Enum ):
14
22
"""Enum to set the minimum required logging level to print a message to stdout"""
15
23
@@ -80,11 +88,11 @@ def _get_target_ir(module_type: _ModuleType, ir: str) -> _IRType:
80
88
81
89
def compile (
82
90
module : Any ,
83
- ir = "default" ,
84
- inputs = [],
85
- enabled_precisions = set ([torch .float ]),
86
- ** kwargs ,
87
- ):
91
+ ir : str = "default" ,
92
+ inputs : List [ Union [ Input , torch . Tensor , InputTensorSpec ]] = [],
93
+ enabled_precisions : Set [ Union [ torch . dtype , dtype ]] = set ([torch .float ]),
94
+ ** kwargs : Any ,
95
+ ) -> Union [ torch . nn . Module , torch . jit . ScriptModule , torch . fx . GraphModule , Callable [[ Any ], Any ]] :
88
96
"""Compile a PyTorch module for NVIDIA GPUs using TensorRT
89
97
90
98
Takes a existing PyTorch module and a set of settings to configure the compiler
@@ -130,9 +138,11 @@ def compile(
130
138
"Module was provided as a torch.nn.Module, trying to script the module with torch.jit.script. In the event of a failure please preconvert your module to TorchScript" ,
131
139
)
132
140
ts_mod = torch .jit .script (module )
133
- return torch_tensorrt .ts .compile (
141
+ assert _non_fx_input_interface (inputs )
142
+ compiled_ts_module : torch .jit .ScriptModule = torch_tensorrt .ts .compile (
134
143
ts_mod , inputs = inputs , enabled_precisions = enabled_precisions , ** kwargs
135
144
)
145
+ return compiled_ts_module
136
146
elif target_ir == _IRType .fx :
137
147
if (
138
148
torch .float16 in enabled_precisions
@@ -147,38 +157,31 @@ def compile(
147
157
else :
148
158
raise ValueError (f"Precision { enabled_precisions } not supported on FX" )
149
159
150
- return torch_tensorrt .fx .compile (
160
+ assert _fx_input_interface (inputs )
161
+ compiled_fx_module : torch .nn .Module = torch_tensorrt .fx .compile (
151
162
module ,
152
163
inputs ,
153
164
lower_precision = lower_precision ,
154
- max_batch_size = inputs [0 ].size (0 ),
155
165
explicit_batch_dimension = True ,
156
166
dynamic_batch = False ,
157
167
** kwargs ,
158
168
)
169
+ return compiled_fx_module
159
170
elif target_ir == _IRType .dynamo :
160
- from torch_tensorrt import Device
161
- from torch_tensorrt .dynamo .utils import prepare_inputs , prepare_device
162
- import collections .abc
163
-
164
- if not isinstance (inputs , collections .abc .Sequence ):
165
- inputs = [inputs ]
166
- device = kwargs .get ("device" , Device ._current_device ())
167
- torchtrt_inputs , torch_inputs = prepare_inputs (inputs , prepare_device (device ))
168
- module = torch_tensorrt .dynamo .trace (module , torch_inputs , ** kwargs )
169
171
return torch_tensorrt .dynamo .compile (
170
172
module ,
171
173
inputs = inputs ,
172
174
enabled_precisions = enabled_precisions ,
173
175
** kwargs ,
174
176
)
177
+ return compiled_aten_module
175
178
elif target_ir == _IRType .torch_compile :
176
179
return torch_compile (module , enabled_precisions = enabled_precisions , ** kwargs )
177
180
else :
178
181
raise RuntimeError ("Module is an unknown format or the ir requested is unknown" )
179
182
180
183
181
- def torch_compile (module , ** kwargs ) :
184
+ def torch_compile (module : torch . nn . Module , ** kwargs : Any ) -> Callable [..., Any ] :
182
185
"""
183
186
Returns a boxed model which is the output of torch.compile.
184
187
This does not compile the model to TRT. Execute this model on
@@ -194,11 +197,11 @@ def torch_compile(module, **kwargs):
194
197
def convert_method_to_trt_engine (
195
198
module : Any ,
196
199
method_name : str ,
197
- ir = "default" ,
198
- inputs = [],
199
- enabled_precisions = set ([torch .float ]),
200
- ** kwargs ,
201
- ):
200
+ ir : str = "default" ,
201
+ inputs : List [ Union [ Input , torch . Tensor ]] = [],
202
+ enabled_precisions : Set [ Union [ torch . dtype , dtype ]] = set ([torch .float ]),
203
+ ** kwargs : Any ,
204
+ ) -> bytes :
202
205
"""Convert a TorchScript module method to a serialized TensorRT engine
203
206
204
207
Converts a specified method of a module to a serialized TensorRT engine given a dictionary of conversion settings
0 commit comments