Commit 8b891fb

feat(//core/conversion/converters/evaluators): New evaluators for collections

Implements evaluators for:
- prim::TupleUnpack
- prim::TupleConstruct
- prim::TupleIndex

Signed-off-by: Naren Dasan <[email protected]>
Signed-off-by: Naren Dasan <[email protected]>
1 parent 253b3c7 commit 8b891fb
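
For context, these prim ops appear wherever a scripted module constructs, indexes, or unpacks a tuple. A minimal sketch, using a hypothetical module that is not part of this commit, showing where prim::TupleConstruct surfaces in TorchScript IR:

import torch

class TupleOut(torch.nn.Module):  # illustrative module, not from this change
    def forward(self, x: torch.Tensor):
        a = x + 1
        b = x * 2
        return (a, b)  # lowered to a prim::TupleConstruct node in the graph

mod = torch.jit.script(TupleOut())
print(mod.graph)  # the printed IR contains prim::TupleConstruct

Because these nodes shuffle collections rather than compute on tensors, Torch-TensorRT can evaluate them at conversion time instead of mapping them to TensorRT layers, which is what the evaluators below implement.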

12 files changed (+232, -44 lines)

core/conversion/evaluators/aten.cpp

Lines changed: 0 additions & 8 deletions

@@ -19,14 +19,6 @@ namespace conversion {
 namespace evaluators {
 namespace {

-int64_t normalizeIndex(int64_t idx, int64_t list_size) {
-  if (idx < 0) {
-    // Handle negative indexing
-    idx = list_size + idx;
-  }
-  return idx;
-}
-
 DEFINE_GENERIC_TWO_INPUT_EVALUATOR(
     eq,
     "aten::eq",

core/conversion/evaluators/eval_util.cpp

Lines changed: 9 additions & 0 deletions

@@ -12,6 +12,15 @@ namespace core {
 namespace conversion {
 namespace evaluators {

+int64_t normalizeIndex(int64_t idx, int64_t list_size) {
+  if (idx < 0) {
+    // Handle negative indexing
+    idx = list_size + idx;
+  }
+  return idx;
+}
+
+
 // TODO: Switch back to PyTorch canonical implimentation
 c10::optional<torch::jit::IValue> toIValue(const torch::jit::Value* v) {
   if (v->node()->kind() != torch::jit::prim::Constant || v->type()->cast<c10::FunctionType>()) {
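
The hoisted normalizeIndex helper implements Python-style negative indexing; a minimal Python sketch of the same logic (hypothetical, for illustration only):

def normalize_index(idx: int, list_size: int) -> int:
    # Negative indices count back from the end, as in Python sequences
    if idx < 0:
        idx = list_size + idx
    return idx

assert normalize_index(-1, 3) == 2  # last element of a 3-tuple
assert normalize_index(1, 3) == 1   # non-negative indices pass through unchanged

Moving it out of the anonymous namespace in aten.cpp and into eval_util.cpp makes it callable from the new prim::TupleIndex evaluator.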

core/conversion/evaluators/eval_util.h

Lines changed: 2 additions & 0 deletions

@@ -13,6 +13,8 @@ at::Tensor createTensorFromList(
     const torch::jit::IValue& dtype,
     const torch::jit::IValue& device);

+int64_t normalizeIndex(int64_t idx, int64_t list_size);
+
 at::Tensor scalar_to_tensor(const at::Scalar& s, const at::Device device = at::kCPU);

 } // namespace evaluators

core/conversion/evaluators/prim.cpp

Lines changed: 51 additions & 1 deletion

@@ -259,6 +259,56 @@ auto prim_registrations =
                  }
                },
               EvalOptions().validSchemas({"prim::shape(Tensor a) -> (int[])"})})
+        .evaluator({torch::jit::prim::TupleConstruct,
+                    [](const torch::jit::Node* n, kwargs& args) -> c10::optional<torch::jit::IValue> {
+                      auto num_inputs = n->inputs().size();
+                      c10::IValue tuple = c10::ivalue::Tuple::create();
+                      switch (num_inputs) {
+                        case 0:
+                          tuple = c10::ivalue::Tuple::create();
+                          break;
+                        case 1:
+                          tuple = c10::ivalue::Tuple::create(std::move((*args.at(n->input(0)).IValue())));
+                          break;
+                        case 2: {
+                          tuple = c10::ivalue::Tuple::create(
+                              std::move(*(args.at(n->input(0)).IValue())),
+                              std::move(*(args.at(n->input(1)).IValue())));
+                          break;
+                        }
+                        case 3: {
+                          tuple = c10::ivalue::Tuple::create(
+                              std::move(*(args.at(n->input(0)).IValue())),
+                              std::move(*(args.at(n->input(1)).IValue())),
+                              std::move(*(args.at(n->input(2)).IValue())));
+                          break;
+                        }
+                        default: {
+                          std::vector<c10::IValue> elems;
+                          for (size_t i = 0; i < num_inputs; i++) {
+                            elems.push_back(*(args.at(n->input(i)).IValue()));
+                          }
+                          tuple = c10::ivalue::Tuple::create(std::move(elems));
+                          break;
+                        }
+                      }
+                      return c10::optional<torch::jit::IValue>(std::move(tuple));
+                    }})
+        .evaluator({torch::jit::prim::TupleIndex,
+                    [](const torch::jit::Node* n, kwargs& args) -> c10::optional<torch::jit::IValue> {
+                      // Outputs is an IValue which has list of tensors which can be found in ctx->evaluated_value_map
+                      auto tuple = args.at(n->input(0)).IValue()->toTuple();
+                      int64_t idx = args.at(n->input(1)).IValue()->toInt();
+                      int64_t norm_idx = normalizeIndex(idx, tuple->elements().size());
+                      return c10::optional<torch::jit::IValue>(std::move(tuple->elements()[norm_idx]));
+                    },
+                    EvalOptions().validSchemas({"prim::TupleIndex(Any tup, int i) -> (Any)"})})
+        .evaluator({torch::jit::prim::TupleUnpack,
+                    [](const torch::jit::Node* n, kwargs& args) -> c10::optional<torch::jit::IValue> {
+                      // Outputs is an IValue which has list of tensors which can be found in ctx->evaluated_value_map
+                      auto output = args.at(n->input()).IValue()->toTuple();
+                      return c10::optional<torch::jit::IValue>(std::move(output));
+                    }})
         .evaluator({c10::Symbol::fromQualString("prim::unchecked_cast"),
                     [](const torch::jit::Node* n, kwargs& args) -> c10::optional<torch::jit::IValue> {
                       return *(args.at(n->input(0)).IValue());
@@ -277,4 +327,4 @@ auto prim_registrations =
 } // namespace evaluators
 } // namespace conversion
 } // namespace core
-} // namespace torch_tensorrt
\ No newline at end of file
+} // namespace torch_tensorrt
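
In Python terms, the three evaluators registered above behave roughly like the following sketch (an analogy for readability, not the actual implementation, which operates on c10::IValue):

# Rough Python analogues of the new evaluators
def tuple_construct(*elems):
    # prim::TupleConstruct: bundle the node's inputs into one tuple value
    return tuple(elems)

def tuple_index(tup, i):
    # prim::TupleIndex: fetch one element, wrapping negative indices
    return tup[i if i >= 0 else len(tup) + i]

def tuple_unpack(tup):
    # prim::TupleUnpack: the tuple's elements become the node's outputs
    return tup

The explicit 0-3 input cases in the TupleConstruct evaluator avoid building an intermediate std::vector for the most common tuple sizes; larger tuples fall through to the vector-based default case.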

core/ir/GraphInputs.cpp

Lines changed: 0 additions & 3 deletions

@@ -54,7 +54,6 @@ void flatten_dfs(
 }

 GraphInputs::GraphInputs(std::vector<ir::Input> inputs_) {
-  LOG_DEBUG("Construct GraphInput with ir::Input");
   inputs = inputs_;
   collection_inputs.resize(inputs_.size());
   for (size_t i = 0; i < inputs_.size(); i++) {
@@ -63,8 +62,6 @@ GraphInputs::GraphInputs(std::vector<ir::Input> inputs_) {
 }

 GraphInputs::GraphInputs(torch::jit::IValue& input_signature_) {
-  LOG_DEBUG("Construct GraphInput with IValue");
-
   std::vector<torch_tensorrt::core::ir::Input> flattened_inputs;
   std::vector<std::vector<torch_tensorrt::core::ir::Input>> collection_inputs_;

core/ir/ir.cpp

Lines changed: 6 additions & 6 deletions

@@ -29,7 +29,7 @@ InputSpecMap pair_input_vals_with_specs(std::vector<const torch::jit::Value*> va

   std::unordered_map<const torch::jit::Value*, core::ir::Input> a;
   for (size_t i = 0; i < vals.size(); i++) {
-    LOG_DEBUG("Pairing " << i << ": " << vals[i]->debugName() << " : " << specs[i]);
+    LOG_DEBUG("Pairing " << i << ": " << vals[i]->debugName() << ": " << specs[i]);
     a.insert({vals[i], specs[i]});
   }
   return a;
@@ -56,7 +56,7 @@ std::vector<const torch::jit::Value*> get_tensor_inputs(
     StaticParams& static_params) {
   std::vector<const torch::jit::Value*> input_tensors;
   auto inputs = g->inputs();
-  LOG_DEBUG("Raw inputs size of get_tensor_inputs: " << inputs.size());
+  LOG_DEBUG("Found " << inputs.size() << " inputs to graph");
   for (auto in : inputs) {
     LOG_DEBUG("Handle input of debug name: " << in->debugName());
     // Disregarding inputs that are not tensors or are static
@@ -76,7 +76,7 @@ std::vector<const torch::jit::Value*> get_collection_inputs(
     StaticParams& static_params) {
   std::vector<const torch::jit::Value*> input_tensors;
   auto inputs = g->inputs();
-  LOG_DEBUG("Raw inputs size of get_collection_inputs: " << inputs.size());
+  LOG_DEBUG("Found " << inputs.size() << " inputs to graph");
   for (auto in : inputs) {
     LOG_DEBUG("Handle input of debug name: " << in->debugName());
     if (in->type()->isSubtypeOf(c10::TensorType::get()) && static_params.find(in) == static_params.end()) {
@@ -86,9 +86,9 @@ std::vector<const torch::jit::Value*> get_collection_inputs(
       // {
       input_tensors.push_back(in); // push original tuple
       at::ArrayRef<torch::jit::Value*> unpack_tuple = torch::jit::createTupleUnpack(in);
-      LOG_DEBUG("get_collection_inputs, tuple size " << unpack_tuple.size());
+      LOG_DEBUG("Input tuple size " << unpack_tuple.size());
     } else if (in->type()->kind() == torch::jit::TypeKind::ListType && static_params.find(in) == static_params.end()) {
-      LOG_DEBUG("get_collection_inputs, list use size " << in->uses().size());
+      LOG_DEBUG("Input list use size " << in->uses().size());
       input_tensors.push_back(in); // push original list
     }
   }
@@ -227,7 +227,7 @@ CollectionTypeMap get_block_first_calc_dtypes_opt_collection(torch::jit::Block*

     } else if (i->type()->kind() == torch::jit::TypeKind::ListType) {
       // TODO: to decide the size of list and type of list element
-      LOG_DEBUG("get_block_first_calc_dtypes_opt ListType: use size " << i->uses().size());
+      LOG_DEBUG("Number of list uses " << i->uses().size());
       c10::optional<at::ScalarType> tp = get_value_first_calc_dtype_opt(b, i);
       // std::vector<c10::optional<at::ScalarType>> dytpes(i->uses().size());
       std::vector<c10::optional<at::ScalarType>> dytpes(i->uses().size(), tp);

cpp/src/compile_spec.cpp

Lines changed: 1 addition & 0 deletions

@@ -69,6 +69,7 @@ torchtrt::core::CompileSpec init_compile_spec(CompileSpec external) {
     return internal;
   } else {
     torch::jit::IValue converted_input_signature;
+    LOG_WARNING("Input signature parsing is an experimental feature, behavior and APIs may change");
     to_internal_input_signature(external.graph_inputs.input_signature, converted_input_signature);
     torchtrt::core::CompileSpec internal(converted_input_signature);
     return internal;

py/torch_tensorrt/ts/_compile_spec.py

Lines changed: 14 additions & 0 deletions

@@ -305,6 +305,20 @@ def TensorRTCompileSpec(inputs=[],
                 torch.randn((1, 3, 224, 244)) # Use an example tensor and let torch_tensorrt infer settings
             ]

+        input_signature (Union(List, Tuple, torch_tensorrt.Input, torch.Tensor)): A formatted collection of input specifications for the module. Input sizes can be specified as torch sizes, tuples or lists. dtypes can be specified using
+            torch datatypes or torch_tensorrt datatypes and you can use either torch devices or the torch_tensorrt device type enum to select device type. **This API should be considered beta-level stable and may change in the future** ::
+
+                input_signature=([
+                    torch_tensorrt.Input((1, 3, 224, 224)), # Static NCHW input shape for input #1
+                    torch_tensorrt.Input(
+                        min_shape=(1, 224, 224, 3),
+                        opt_shape=(1, 512, 512, 3),
+                        max_shape=(1, 1024, 1024, 3),
+                        dtype=torch.int32,
+                        format=torch.channels_last
+                    ), # Dynamic input shape for input #2
+                ], torch.randn((1, 3, 224, 244))) # Use an example tensor and let torch_tensorrt infer settings for input #3
+
         device (Union(torch_tensorrt.Device, torch.device, dict)): Target device for TensorRT engines to run on ::

             device=torch_tensorrt.Device("dla:1", allow_gpu_fallback=True)

py/torch_tensorrt/ts/_compiler.py

Lines changed: 27 additions & 0 deletions

@@ -58,6 +58,19 @@ def compile(module: torch.jit.ScriptModule,
                 torch.randn((1, 3, 224, 244)) # Use an example tensor and let torch_tensorrt infer settings
             ]

+        input_signature (Union(List, Tuple, torch_tensorrt.Input, torch.Tensor)): A formatted collection of input specifications for the module. Input sizes can be specified as torch sizes, tuples or lists. dtypes can be specified using
+            torch datatypes or torch_tensorrt datatypes and you can use either torch devices or the torch_tensorrt device type enum to select device type. **This API should be considered beta-level stable and may change in the future** ::
+
+                input_signature=([
+                    torch_tensorrt.Input((1, 3, 224, 224)), # Static NCHW input shape for input #1
+                    torch_tensorrt.Input(
+                        min_shape=(1, 224, 224, 3),
+                        opt_shape=(1, 512, 512, 3),
+                        max_shape=(1, 1024, 1024, 3),
+                        dtype=torch.int32,
+                        format=torch.channels_last
+                    ), # Dynamic input shape for input #2
+                ], torch.randn((1, 3, 224, 244))) # Use an example tensor and let torch_tensorrt infer settings for input #3
         device (Union(torch_tensorrt.Device, torch.device, dict)): Target device for TensorRT engines to run on ::

             device=torch_tensorrt.Device("dla:1", allow_gpu_fallback=True)
@@ -163,6 +176,20 @@ def convert_method_to_trt_engine(module: torch.jit.ScriptModule,
                 torch.randn((1, 3, 224, 244)) # Use an example tensor and let torch_tensorrt infer settings
             ]

+        input_signature (Union(List, Tuple, torch_tensorrt.Input, torch.Tensor)): A formatted collection of input specifications for the module. Input sizes can be specified as torch sizes, tuples or lists. dtypes can be specified using
+            torch datatypes or torch_tensorrt datatypes and you can use either torch devices or the torch_tensorrt device type enum to select device type. **This API should be considered beta-level stable and may change in the future** ::
+
+                input_signature=([
+                    torch_tensorrt.Input((1, 3, 224, 224)), # Static NCHW input shape for input #1
+                    torch_tensorrt.Input(
+                        min_shape=(1, 224, 224, 3),
+                        opt_shape=(1, 512, 512, 3),
+                        max_shape=(1, 1024, 1024, 3),
+                        dtype=torch.int32,
+                        format=torch.channels_last
+                    ), # Dynamic input shape for input #2
+                ], torch.randn((1, 3, 224, 244))) # Use an example tensor and let torch_tensorrt infer settings for input #3
+
         device (Union(torch_tensorrt.Device, torch.device, dict)): Target device for TensorRT engines to run on ::

             device=torch_tensorrt.Device("dla:1", allow_gpu_fallback=True)
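
An end-to-end sketch of how a caller might pass input_signature for a module whose forward takes a tuple of two tensors; this is a hedged example, since the exact nesting expected may differ (the module name and shapes are assumptions):

import torch
import torch_tensorrt

# mod: a scripted module whose forward takes a tuple of two tensors (assumed)
trt_mod = torch_tensorrt.ts.compile(
    mod,
    input_signature=(
        (
            torch_tensorrt.Input((1, 3, 224, 224)),
            torch_tensorrt.Input((1, 3, 224, 224)),
        ),
    ),
    enabled_precisions={torch.float},
)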

tests/core/conversion/evaluators/test_prim_evaluators.cpp

Lines changed: 107 additions & 0 deletions

@@ -51,5 +51,112 @@ TEST(Evaluators, NumToTensorEvaluatesCorrectly) {
   auto jit_results = torch_tensorrt::tests::util::EvaluateGraphJIT(g, {});
   auto trt_results = torch_tensorrt::tests::util::EvaluateGraph(g->block(), {});

+  ASSERT_TRUE(jit_results[0] == trt_results[0]);
+}
+
+TEST(Evaluators, PrimTupleConstruct1EvaluatesCorrectly) {
+  const auto graph = R"IR(
+      graph():
+        %1 : int = prim::Constant[value=3]()
+        %tc : (int) = prim::TupleConstruct(%1)
+        return (%tc))IR";
+
+  auto g = std::make_shared<torch::jit::Graph>();
+  torch::jit::parseIR(graph, g.get());
+
+  auto jit_results = torch_tensorrt::tests::util::EvaluateGraphJIT(g, {});
+  auto trt_results = torch_tensorrt::tests::util::EvaluateGraph(g->block(), {});
+
+  ASSERT_TRUE(jit_results[0] == trt_results[0]);
+}
+
+TEST(Evaluators, PrimTupleConstruct2EvaluatesCorrectly) {
+  const auto graph = R"IR(
+      graph():
+        %1 : int = prim::Constant[value=3]()
+        %2 : int = prim::Constant[value=4]()
+        %tc : (int, int) = prim::TupleConstruct(%1, %2)
+        return (%tc))IR";
+
+  auto g = std::make_shared<torch::jit::Graph>();
+  torch::jit::parseIR(graph, g.get());
+
+  auto jit_results = torch_tensorrt::tests::util::EvaluateGraphJIT(g, {});
+  auto trt_results = torch_tensorrt::tests::util::EvaluateGraph(g->block(), {});
+
+  ASSERT_TRUE(jit_results[0] == trt_results[0]);
+}
+
+TEST(Evaluators, PrimTupleConstruct3EvaluatesCorrectly) {
+  const auto graph = R"IR(
+      graph():
+        %1 : int = prim::Constant[value=3]()
+        %2 : int = prim::Constant[value=4]()
+        %3 : int = prim::Constant[value=4]()
+        %tc : (int, int, int) = prim::TupleConstruct(%1, %2, %3)
+        return (%tc))IR";
+
+  auto g = std::make_shared<torch::jit::Graph>();
+  torch::jit::parseIR(graph, g.get());
+
+  auto jit_results = torch_tensorrt::tests::util::EvaluateGraphJIT(g, {});
+  auto trt_results = torch_tensorrt::tests::util::EvaluateGraph(g->block(), {});
+
+  ASSERT_TRUE(jit_results[0] == trt_results[0]);
+}
+
+TEST(Evaluators, PrimTupleConstruct4EvaluatesCorrectly) {
+  const auto graph = R"IR(
+      graph():
+        %1 : int = prim::Constant[value=3]()
+        %2 : int = prim::Constant[value=4]()
+        %3 : int = prim::Constant[value=3]()
+        %4 : int = prim::Constant[value=4]()
+        %tc : (int, int, int, int) = prim::TupleConstruct(%1, %2, %3, %4)
+        return (%tc))IR";
+
+  auto g = std::make_shared<torch::jit::Graph>();
+  torch::jit::parseIR(graph, g.get());
+
+  auto jit_results = torch_tensorrt::tests::util::EvaluateGraphJIT(g, {});
+  auto trt_results = torch_tensorrt::tests::util::EvaluateGraph(g->block(), {});
+
+  ASSERT_TRUE(jit_results[0] == trt_results[0]);
+}
+
+TEST(Evaluators, PrimTupleUnpackEvaluatesCorrectly) {
+  const auto graph = R"IR(
+      graph():
+        %1 : int = prim::Constant[value=3]()
+        %2 : int = prim::Constant[value=4]()
+        %tc : (int, int) = prim::TupleConstruct(%1, %2)
+        %tu.1 : int, %tu.2 : int = prim::TupleUnpack(%tc)
+        return (%tu.1, %tu.2))IR";
+
+  auto g = std::make_shared<torch::jit::Graph>();
+  torch::jit::parseIR(graph, g.get());
+
+  auto jit_results = torch_tensorrt::tests::util::EvaluateGraphJIT(g, {});
+  auto trt_results = torch_tensorrt::tests::util::EvaluateGraph(g->block(), {});
+
+  ASSERT_TRUE(jit_results[0] == trt_results[0]);
+}
+
+TEST(Evaluators, PrimTupleIndexEvaluatesCorrectly) {
+  const auto graph = R"IR(
+      graph():
+        %0 : int = prim::Constant[value=1]()
+        %1 : int = prim::Constant[value=3]()
+        %2 : int = prim::Constant[value=4]()
+        %tc : (int, int) = prim::TupleConstruct(%1, %2)
+        %ti : int = prim::TupleIndex(%tc, %0)
+        return (%ti))IR";
+
+  auto g = std::make_shared<torch::jit::Graph>();
+  torch::jit::parseIR(graph, g.get());
+
+  auto jit_results = torch_tensorrt::tests::util::EvaluateGraphJIT(g, {});
+  auto trt_results = torch_tensorrt::tests::util::EvaluateGraph(g->block(), {});
+
   ASSERT_TRUE(jit_results[0] == trt_results[0]);
 }
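
Assuming the repository's existing Bazel test layout extends to this file, the new cases could be run with something like the following (the target name here is an assumption, not taken from this commit):

bazel test //tests/core/conversion/evaluators:test_prim_evaluators --test_output=summary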
