pytorch
diff --git a/‎README.md
Lines changed: 1 addition & 1 deletion b/‎README.md
Lines changed: 1 addition & 1 deletion
diff --git a/‎core/conversion/converters/impl/select.cpp
Lines changed: 14 additions & 0 deletions b/‎core/conversion/converters/impl/select.cpp
Lines changed: 14 additions & 0 deletions
diff --git a/‎core/lowering/lowering.h
Lines changed: 1 addition & 1 deletion b/‎core/lowering/lowering.h
Lines changed: 1 addition & 1 deletion
diff --git a/‎core/partitioning/partitioninginfo/PartitioningInfo.h
Lines changed: 5 additions & 0 deletions b/‎core/partitioning/partitioninginfo/PartitioningInfo.h
Lines changed: 5 additions & 0 deletions
diff --git a/‎core/partitioning/shape_analysis.cpp
Lines changed: 9 additions & 4 deletions b/‎core/partitioning/shape_analysis.cpp
Lines changed: 9 additions & 4 deletions
diff --git a/‎cpp/src/compile_spec.cpp
Lines changed: 6 additions & 0 deletions b/‎cpp/src/compile_spec.cpp
Lines changed: 6 additions & 0 deletions
diff --git a/‎docs/_cpp_api/classtorch__tensorrt_1_1DataType.html
Lines changed: 2 additions & 2 deletions b/‎docs/_cpp_api/classtorch__tensorrt_1_1DataType.html
Lines changed: 2 additions & 2 deletions
diff --git a/‎docs/_cpp_api/classtorch__tensorrt_1_1Device_1_1DeviceType.html
Lines changed: 2 additions & 2 deletions b/‎docs/_cpp_api/classtorch__tensorrt_1_1Device_1_1DeviceType.html
Lines changed: 2 additions & 2 deletions
diff --git a/‎docs/_cpp_api/classtorch__tensorrt_1_1TensorFormat.html
Lines changed: 2 additions & 2 deletions b/‎docs/_cpp_api/classtorch__tensorrt_1_1TensorFormat.html
Lines changed: 2 additions & 2 deletions
diff --git a/‎docs/_cpp_api/classtorch__tensorrt_1_1ptq_1_1Int8CacheCalibrator.html
Lines changed: 2 additions & 2 deletions b/‎docs/_cpp_api/classtorch__tensorrt_1_1ptq_1_1Int8CacheCalibrator.html
Lines changed: 2 additions & 2 deletions
diff --git a/‎docs/_cpp_api/classtorch__tensorrt_1_1ptq_1_1Int8Calibrator.html
Lines changed: 2 additions & 2 deletions b/‎docs/_cpp_api/classtorch__tensorrt_1_1ptq_1_1Int8Calibrator.html
Lines changed: 2 additions & 2 deletions
diff --git a/‎docs/_cpp_api/define_macros_8h_1a18d295a837ac71add5578860b55e5502.html
Lines changed: 2 additions & 2 deletions b/‎docs/_cpp_api/define_macros_8h_1a18d295a837ac71add5578860b55e5502.html
Lines changed: 2 additions & 2 deletions
diff --git a/‎docs/_cpp_api/define_macros_8h_1a282fd3c0b1c3a215148ae372070e1268.html
Lines changed: 2 additions & 2 deletions b/‎docs/_cpp_api/define_macros_8h_1a282fd3c0b1c3a215148ae372070e1268.html
Lines changed: 2 additions & 2 deletions
diff --git a/‎docs/_cpp_api/define_macros_8h_1a31398a6d4d27e28817afb0f0139e909e.html
Lines changed: 2 additions & 2 deletions b/‎docs/_cpp_api/define_macros_8h_1a31398a6d4d27e28817afb0f0139e909e.html
Lines changed: 2 additions & 2 deletions
diff --git a/‎docs/_cpp_api/define_macros_8h_1a35703561b26b1a9d2738ad7d58b27827.html
Lines changed: 2 additions & 2 deletions b/‎docs/_cpp_api/define_macros_8h_1a35703561b26b1a9d2738ad7d58b27827.html
Lines changed: 2 additions & 2 deletions
diff --git a/‎docs/_cpp_api/define_macros_8h_1abd1465eb38256d3f22cc1426b23d516b.html
Lines changed: 2 additions & 2 deletions b/‎docs/_cpp_api/define_macros_8h_1abd1465eb38256d3f22cc1426b23d516b.html
Lines changed: 2 additions & 2 deletions
diff --git a/‎docs/_cpp_api/define_macros_8h_1abe87b341f562fd1cf40b7672e4d759da.html
Lines changed: 2 additions & 2 deletions b/‎docs/_cpp_api/define_macros_8h_1abe87b341f562fd1cf40b7672e4d759da.html
Lines changed: 2 additions & 2 deletions
diff --git a/‎docs/_cpp_api/define_macros_8h_1ad19939408f7be171a74a89928b36eb59.html
Lines changed: 2 additions & 2 deletions b/‎docs/_cpp_api/define_macros_8h_1ad19939408f7be171a74a89928b36eb59.html
Lines changed: 2 additions & 2 deletions
diff --git a/‎docs/_cpp_api/define_macros_8h_1adad592a7b1b7eed529cdf6acd584c883.html
Lines changed: 2 additions & 2 deletions b/‎docs/_cpp_api/define_macros_8h_1adad592a7b1b7eed529cdf6acd584c883.html
Lines changed: 2 additions & 2 deletions
diff --git a/‎docs/_cpp_api/dir_cpp.html
Lines changed: 2 additions & 2 deletions b/‎docs/_cpp_api/dir_cpp.html
Lines changed: 2 additions & 2 deletions
@@ -114,7 +114,7 @@ torch.jit.save(trt_ts_module, "trt_torchscript_module.ts") # save the TRT embedd
 These are the following dependencies used to verify the testcases. Torch-TensorRT can work with other versions, but the tests are not guaranteed to pass.
 
 - Bazel 5.2.0
-- Libtorch 1.14.0.dev20221114 (built with CUDA 11.7)
+- Libtorch 1.14.0.dev20221205 (built with CUDA 11.7)
 - CUDA 11.7
 - cuDNN 8.5.0
 - TensorRT 8.5.1.7
 
@@ -736,8 +736,22 @@ auto select_registrations TORCHTRT_UNUSED =
             {"aten::where.self(Tensor condition, Tensor self, Tensor other) -> (Tensor)",
              [](ConversionCtx* ctx, const torch::jit::Node* n, args& args) -> bool {
                auto condition = args[0].ITensorOrFreeze(ctx);
+               auto condition_nbDims = condition->getDimensions().nbDims;
                auto x = args[1].ITensorOrFreeze(ctx);
+               auto x_nbDims = x->getDimensions().nbDims;
                auto y = args[2].ITensorOrFreeze(ctx);
+               auto y_nbDims = y->getDimensions().nbDims;
+
+               // Get maximum rank of all input tensors
+               auto max_nbDims = std::max(condition_nbDims, std::max(x_nbDims, y_nbDims));
+
+               // TensorRT requires all inputs to a Select layer to have the same rank, so for each
+               // input tensor, ensure that its rank equals the maximum rank among the inputs.
+               // If it does not, left-pad the tensor's dimensions with 1s until the max rank is reached.
+               condition =
+                   addPadding(ctx, n, condition, max_nbDims, /*bool trailing =*/false, /*bool use_zeros =*/false);
+               x = addPadding(ctx, n, x, max_nbDims, /*bool trailing =*/false, /*bool use_zeros =*/false);
+               y = addPadding(ctx, n, y, max_nbDims, /*bool trailing =*/false, /*bool use_zeros =*/false);
 
                auto layer = ctx->net->addSelect(*condition, *x, *y);
 
 
@@ -20,7 +20,7 @@ struct LowerInfo {
   std::vector<std::string> forced_fallback_modules;
   friend std::ostream& operator<<(std::ostream& os, const LowerInfo& l);
 
-  std::string getGPUDeviceString() {
+  std::string getGPUDeviceString() const {
     return "cuda:" + std::to_string(target_device.gpu_id);
   };
 };
 
@@ -16,6 +16,11 @@ struct PartitioningInfo {
   uint64_t min_block_size = 1;
   std::vector<std::string> forced_fallback_operators;
   bool truncate_long_and_double;
+  ir::Device target_device;
+
+  std::string getGPUDeviceString() const {
+    return "cuda:" + std::to_string(target_device.gpu_id);
+  };
 };
 
 std::ostream& operator<<(std::ostream& os, const PartitioningInfo& s);
 
@@ -99,7 +99,7 @@ torch::jit::Node* getUpstreamCastNode(torch::jit::Value* val) {
   return nullptr;
 }
 
-torch::jit::Node* createCastNode(SegmentedBlock& seg_block, size_t index, bool is_input) {
+torch::jit::Node* createCastNode(SegmentedBlock& seg_block, size_t index, bool is_input, std::string device) {
   auto cast_raw_value = is_input ? seg_block.raw_inputs()[index] : seg_block.raw_outputs()[index];
   auto cast_subgraph_value = is_input ? seg_block.inputs()[index] : seg_block.outputs()[index];
   torch::jit::Node* cast_node = getUpstreamCastNode(cast_raw_value);
@@ -125,8 +125,11 @@ torch::jit::Node* createCastNode(SegmentedBlock& seg_block, size_t index, bool i
     auto const_type = is_input ? g->insertConstant(4) : g->insertConstant(3);
     auto const_zero = g->insertConstant(0);
     const_zero->setType(torch::jit::BoolType::get());
+    auto cuda = g->insertConstant(device);
+    cuda->setType(torch::jit::DeviceObjType::get());
     auto none_val = g->insertNode(g->createNone())->output();
-    cast_node = g->create(torch::jit::aten::to, {cast_subgraph_value, const_type, const_zero, const_zero, none_val});
+    cast_node =
+        g->create(torch::jit::aten::to, {cast_subgraph_value, cuda, const_type, const_zero, const_zero, none_val});
   }
   return cast_node;
 }
@@ -217,6 +220,8 @@ void getSegmentsOutputByRunning(
     ivalues_maps[output] = jit_results[idx++];
   }
 
+  auto target_device = partitioning_info.getGPUDeviceString();
+
   // auto int64 <=> int32 conversion
   if (seg_block.target() == SegmentedBlock::kTorch && partitioning_info.truncate_long_and_double) {
     // First, check if there is Int64 input
@@ -226,7 +231,7 @@ void getSegmentsOutputByRunning(
         at::ScalarType t = cur_ivalue.toTensor().scalar_type();
         if (t == at::kLong) {
           // we add a cast operation to cast the type to Int64
-          auto cast_node = createCastNode(seg_block, i, true);
+          auto cast_node = createCastNode(seg_block, i, true, target_device);
           seg_block.g()->prependNode(cast_node);
           seg_block.inputs()[i]->replaceAllUsesAfterNodeWith(cast_node, cast_node->outputs()[0]);
         }
@@ -237,7 +242,7 @@ void getSegmentsOutputByRunning(
         auto cur_ivalue = ivalues_maps[seg_block.raw_outputs()[i]];
         at::ScalarType t = cur_ivalue.toTensor().scalar_type();
         if (t == at::kLong) {
-          auto cast_node = createCastNode(seg_block, i, false);
+          auto cast_node = createCastNode(seg_block, i, false, target_device);
           seg_block.g()->appendNode(cast_node);
           seg_block.g()->block()->replaceOutput(i, cast_node->outputs()[0]);
         }
 
@@ -111,6 +111,7 @@ torchtrt::core::CompileSpec to_internal_compile_spec(CompileSpec external) {
   internal.convert_info.engine_settings.truncate_long_and_double = external.truncate_long_and_double;
   internal.convert_info.engine_settings.device.allow_gpu_fallback = external.device.allow_gpu_fallback;
   internal.lower_info.target_device.allow_gpu_fallback = external.device.allow_gpu_fallback;
+  internal.partitioning_info.target_device.allow_gpu_fallback = external.device.allow_gpu_fallback;
 
   TORCHTRT_CHECK(
       !(external.require_full_compilation && (external.torch_executed_ops.size() > 0)),
@@ -132,11 +133,13 @@ torchtrt::core::CompileSpec to_internal_compile_spec(CompileSpec external) {
     case Device::DeviceType::kDLA:
       internal.convert_info.engine_settings.device.device_type = nvinfer1::DeviceType::kDLA;
       internal.lower_info.target_device.device_type = nvinfer1::DeviceType::kDLA;
+      internal.partitioning_info.target_device.device_type = nvinfer1::DeviceType::kDLA;
       break;
     case Device::DeviceType::kGPU:
     default:
       internal.convert_info.engine_settings.device.device_type = nvinfer1::DeviceType::kGPU;
       internal.lower_info.target_device.device_type = nvinfer1::DeviceType::kGPU;
+      internal.partitioning_info.target_device.device_type = nvinfer1::DeviceType::kGPU;
   }
 
   switch (external.capability) {
@@ -155,6 +158,9 @@ torchtrt::core::CompileSpec to_internal_compile_spec(CompileSpec external) {
   internal.convert_info.engine_settings.device.dla_core = external.device.dla_core;
   internal.lower_info.target_device.gpu_id = external.device.gpu_id;
   internal.lower_info.target_device.dla_core = external.device.dla_core;
+  internal.partitioning_info.target_device.gpu_id = external.device.gpu_id;
+  internal.partitioning_info.target_device.dla_core = external.device.dla_core;
+
   internal.convert_info.engine_settings.num_avg_timing_iters = external.num_avg_timing_iters;
   internal.convert_info.engine_settings.workspace_size = external.workspace_size;
   internal.convert_info.engine_settings.dla_sram_size = external.dla_sram_size;
 
@@ -10,7 +10,7 @@
 
   <meta name="viewport" content="width=device-width, initial-scale=1.0">
 
-  <title>Class DataType &mdash; Torch-TensorRT v1.4.0dev0+b7ceedf documentation</title>
+  <title>Class DataType &mdash; Torch-TensorRT v1.4.0dev0+af39c65 documentation</title>
 
 
 
@@ -215,7 +215,7 @@
 
 
                 <div class="version">
-                  v1.4.0dev0+b7ceedf
+                  v1.4.0dev0+af39c65
                 </div>
 
 
 
@@ -10,7 +10,7 @@
 
   <meta name="viewport" content="width=device-width, initial-scale=1.0">
 
-  <title>Class Device::DeviceType &mdash; Torch-TensorRT v1.4.0dev0+b7ceedf documentation</title>
+  <title>Class Device::DeviceType &mdash; Torch-TensorRT v1.4.0dev0+af39c65 documentation</title>
 
 
 
@@ -215,7 +215,7 @@
 
 
                 <div class="version">
-                  v1.4.0dev0+b7ceedf
+                  v1.4.0dev0+af39c65
                 </div>
 
 
 
@@ -10,7 +10,7 @@
 
   <meta name="viewport" content="width=device-width, initial-scale=1.0">
 
-  <title>Class TensorFormat &mdash; Torch-TensorRT v1.4.0dev0+b7ceedf documentation</title>
+  <title>Class TensorFormat &mdash; Torch-TensorRT v1.4.0dev0+af39c65 documentation</title>
 
 
 
@@ -215,7 +215,7 @@
 
 
                 <div class="version">
-                  v1.4.0dev0+b7ceedf
+                  v1.4.0dev0+af39c65
                 </div>
 
 
 
@@ -10,7 +10,7 @@
 
   <meta name="viewport" content="width=device-width, initial-scale=1.0">
 
-  <title>Template Class Int8CacheCalibrator &mdash; Torch-TensorRT v1.4.0dev0+b7ceedf documentation</title>
+  <title>Template Class Int8CacheCalibrator &mdash; Torch-TensorRT v1.4.0dev0+af39c65 documentation</title>
 
 
 
@@ -215,7 +215,7 @@
 
 
                 <div class="version">
-                  v1.4.0dev0+b7ceedf
+                  v1.4.0dev0+af39c65
                 </div>
 
 
 
@@ -10,7 +10,7 @@
 
   <meta name="viewport" content="width=device-width, initial-scale=1.0">
 
-  <title>Template Class Int8Calibrator &mdash; Torch-TensorRT v1.4.0dev0+b7ceedf documentation</title>
+  <title>Template Class Int8Calibrator &mdash; Torch-TensorRT v1.4.0dev0+af39c65 documentation</title>
 
 
 
@@ -215,7 +215,7 @@
 
 
                 <div class="version">
-                  v1.4.0dev0+b7ceedf
+                  v1.4.0dev0+af39c65
                 </div>
 
 
 
@@ -10,7 +10,7 @@
 
   <meta name="viewport" content="width=device-width, initial-scale=1.0">
 
-  <title>Define STR &mdash; Torch-TensorRT v1.4.0dev0+b7ceedf documentation</title>
+  <title>Define STR &mdash; Torch-TensorRT v1.4.0dev0+af39c65 documentation</title>
 
 
 
@@ -215,7 +215,7 @@
 
 
                 <div class="version">
-                  v1.4.0dev0+b7ceedf
+                  v1.4.0dev0+af39c65
                 </div>
 
 
 
@@ -10,7 +10,7 @@
 
   <meta name="viewport" content="width=device-width, initial-scale=1.0">
 
-  <title>Define TORCH_TENSORRT_PATCH_VERSION &mdash; Torch-TensorRT v1.4.0dev0+b7ceedf documentation</title>
+  <title>Define TORCH_TENSORRT_PATCH_VERSION &mdash; Torch-TensorRT v1.4.0dev0+af39c65 documentation</title>
 
 
 
@@ -215,7 +215,7 @@
 
 
                 <div class="version">
-                  v1.4.0dev0+b7ceedf
+                  v1.4.0dev0+af39c65
                 </div>
 
 
 
@@ -10,7 +10,7 @@
 
   <meta name="viewport" content="width=device-width, initial-scale=1.0">
 
-  <title>Define TORCH_TENSORRT_MAJOR_VERSION &mdash; Torch-TensorRT v1.4.0dev0+b7ceedf documentation</title>
+  <title>Define TORCH_TENSORRT_MAJOR_VERSION &mdash; Torch-TensorRT v1.4.0dev0+af39c65 documentation</title>
 
 
 
@@ -215,7 +215,7 @@
 
 
                 <div class="version">
-                  v1.4.0dev0+b7ceedf
+                  v1.4.0dev0+af39c65
                 </div>
 
 
 
@@ -10,7 +10,7 @@
 
   <meta name="viewport" content="width=device-width, initial-scale=1.0">
 
-  <title>Define TORCH_TENSORRT_MINOR_VERSION &mdash; Torch-TensorRT v1.4.0dev0+b7ceedf documentation</title>
+  <title>Define TORCH_TENSORRT_MINOR_VERSION &mdash; Torch-TensorRT v1.4.0dev0+af39c65 documentation</title>
 
 
 
@@ -215,7 +215,7 @@
 
 
                 <div class="version">
-                  v1.4.0dev0+b7ceedf
+                  v1.4.0dev0+af39c65
                 </div>
 
 
 
@@ -10,7 +10,7 @@
 
   <meta name="viewport" content="width=device-width, initial-scale=1.0">
 
-  <title>Define TORCHTRT_API &mdash; Torch-TensorRT v1.4.0dev0+b7ceedf documentation</title>
+  <title>Define TORCHTRT_API &mdash; Torch-TensorRT v1.4.0dev0+af39c65 documentation</title>
 
 
 
@@ -215,7 +215,7 @@
 
 
                 <div class="version">
-                  v1.4.0dev0+b7ceedf
+                  v1.4.0dev0+af39c65
                 </div>
 
 
 
@@ -10,7 +10,7 @@
 
   <meta name="viewport" content="width=device-width, initial-scale=1.0">
 
-  <title>Define XSTR &mdash; Torch-TensorRT v1.4.0dev0+b7ceedf documentation</title>
+  <title>Define XSTR &mdash; Torch-TensorRT v1.4.0dev0+af39c65 documentation</title>
 
 
 
@@ -215,7 +215,7 @@
 
 
                 <div class="version">
-                  v1.4.0dev0+b7ceedf
+                  v1.4.0dev0+af39c65
                 </div>
 
 
 
@@ -10,7 +10,7 @@
 
   <meta name="viewport" content="width=device-width, initial-scale=1.0">
 
-  <title>Define TORCHTRT_HIDDEN &mdash; Torch-TensorRT v1.4.0dev0+b7ceedf documentation</title>
+  <title>Define TORCHTRT_HIDDEN &mdash; Torch-TensorRT v1.4.0dev0+af39c65 documentation</title>
 
 
 
@@ -215,7 +215,7 @@
 
 
                 <div class="version">
-                  v1.4.0dev0+b7ceedf
+                  v1.4.0dev0+af39c65
                 </div>
 
 
 
@@ -10,7 +10,7 @@
 
   <meta name="viewport" content="width=device-width, initial-scale=1.0">
 
-  <title>Define TORCH_TENSORRT_VERSION &mdash; Torch-TensorRT v1.4.0dev0+b7ceedf documentation</title>
+  <title>Define TORCH_TENSORRT_VERSION &mdash; Torch-TensorRT v1.4.0dev0+af39c65 documentation</title>
 
 
 
@@ -215,7 +215,7 @@
 
 
                 <div class="version">
-                  v1.4.0dev0+b7ceedf
+                  v1.4.0dev0+af39c65
                 </div>
 
 
 
@@ -10,7 +10,7 @@
 
   <meta name="viewport" content="width=device-width, initial-scale=1.0">
 
-  <title>Directory cpp &mdash; Torch-TensorRT v1.4.0dev0+b7ceedf documentation</title>
+  <title>Directory cpp &mdash; Torch-TensorRT v1.4.0dev0+af39c65 documentation</title>
 
 
 
@@ -213,7 +213,7 @@
 
 
                 <div class="version">
-                  v1.4.0dev0+b7ceedf
+                  v1.4.0dev0+af39c65
                 </div>