Skip to content

Commit de4f358

Browse files
committed
tests(//tests): Implementing tests to check new input class behavior
This commit adds tests for the new Input class, including verifying that default behavior works properly. It also moves tests out of module and into cpp for cpp api tests Signed-off-by: Naren Dasan <[email protected]> Signed-off-by: Naren Dasan <[email protected]>
1 parent bdde52e commit de4f358

File tree

13 files changed

+390
-116
lines changed

13 files changed

+390
-116
lines changed

cpp/api/include/trtorch/trtorch.h

Lines changed: 80 additions & 7 deletions
Original file line numberDiff line numberDiff line change
@@ -371,6 +371,19 @@ struct TRTORCH_API CompileSpec {
371371
DataType dtype;
372372
/// Expected tensor format for the input
373373
TensorFormat format;
374+
375+
/**
376+
* @brief Construct a new Input spec object for static input size from
377+
* vector, optional arguments allow the user to configure expected input shape
378+
* tensor format. dtype (Expected data type for the input) defaults to PyTorch
379+
* / traditional TRT convention (FP32 for FP32 only, FP16 for FP32 and FP16, FP32 for Int8)
380+
*
381+
* @param shape Input tensor shape
382+
* @param dtype Expected data type for the input (Defaults to Float32)
383+
* @param format Expected tensor format for the input (Defaults to contiguous)
384+
*/
385+
Input(std::vector<int64_t> shape, TensorFormat format=TensorFormat::kContiguous);
386+
374387
/**
375388
* @brief Construct a new Input spec object for static input size from
376389
* vector, optional arguments allow the user to configure expected input shape
@@ -380,7 +393,20 @@ struct TRTORCH_API CompileSpec {
380393
* @param dtype Expected data type for the input (Defaults to Float32)
381394
* @param format Expected tensor format for the input (Defaults to contiguous)
382395
*/
383-
Input(std::vector<int64_t> shape, DataType dtype=DataType::kFloat, TensorFormat format=TensorFormat::kContiguous);
396+
Input(std::vector<int64_t> shape, DataType dtype, TensorFormat format=TensorFormat::kContiguous);
397+
398+
/**
399+
* @brief Construct a new Input spec object for static input size from
400+
* c10::ArrayRef (the type produced by tensor.sizes()), vector, optional arguments
401+
* allow the user to configure expected input shape tensor format
402+
* dtype (Expected data type for the input) defaults to PyTorch
403+
* / traditional TRT convention (FP32 for FP32 only, FP16 for FP32 and FP16, FP32 for Int8)
404+
*
405+
* @param shape Input tensor shape
406+
* @param format Expected tensor format for the input (Defaults to contiguous)
407+
*/
408+
Input(c10::ArrayRef<int64_t> shape, TensorFormat format=TensorFormat::kContiguous);
409+
384410
/**
385411
* @brief Construct a new Input spec object for static input size from
386412
* c10::ArrayRef (the type produced by tensor.sizes()), vector, optional arguments
@@ -390,7 +416,21 @@ struct TRTORCH_API CompileSpec {
390416
* @param dtype Expected data type for the input (Defaults to Float32)
391417
* @param format Expected tensor format for the input (Defaults to contiguous)
392418
*/
393-
Input(c10::ArrayRef<int64_t> shape, DataType dtype=DataType::kFloat, TensorFormat format=TensorFormat::kContiguous);
419+
Input(c10::ArrayRef<int64_t> shape, DataType dtype, TensorFormat format=TensorFormat::kContiguous);
420+
421+
/**
422+
* @brief Construct a new Input Range object for dynamic input size from
423+
* c10::ArrayRef (the type produced by tensor.sizes()) for min, opt, and max
424+
* supported sizes. dtype (Expected data type for the input) defaults to PyTorch
425+
* / traditional TRT convention (FP32 for FP32 only, FP16 for FP32 and FP16, FP32 for Int8)
426+
*
427+
* @param min_shape Minimum shape for input tensor
428+
* @param opt_shape Target optimization shape for input tensor
429+
* @param max_shape Maximum acceptable shape for input tensor
430+
* @param format Expected tensor format for the input (Defaults to contiguous)
431+
*/
432+
Input(std::vector<int64_t> min_shape, std::vector<int64_t> opt_shape, std::vector<int64_t> max_shape, TensorFormat format=TensorFormat::kContiguous);
433+
394434
/**
395435
* @brief Construct a new Input spec object for a dynamic input size from vectors
396436
* for minimum shape, optimal shape, and max shape supported sizes optional arguments
@@ -402,7 +442,21 @@ struct TRTORCH_API CompileSpec {
402442
* @param dtype Expected data type for the input (Defaults to Float32)
403443
* @param format Expected tensor format for the input (Defaults to contiguous)
404444
*/
405-
Input(std::vector<int64_t> min_shape, std::vector<int64_t> opt_shape, std::vector<int64_t> max_shape, DataType dtype=DataType::kFloat, TensorFormat format=TensorFormat::kContiguous);
445+
Input(std::vector<int64_t> min_shape, std::vector<int64_t> opt_shape, std::vector<int64_t> max_shape, DataType dtype, TensorFormat format=TensorFormat::kContiguous);
446+
447+
/**
448+
* @brief Construct a new Input Range object for dynamic input size from
449+
* c10::ArrayRef (the type produced by tensor.sizes()) for min, opt, and max
450+
* supported sizes. dtype (Expected data type for the input) defaults to PyTorch
451+
* / traditional TRT convention (FP32 for FP32 only, FP16 for FP32 and FP16, FP32 for Int8)
452+
*
453+
* @param min_shape Minimum shape for input tensor
454+
* @param opt_shape Target optimization shape for input tensor
455+
* @param max_shape Maximum acceptable shape for input tensor
456+
* @param format Expected tensor format for the input (Defaults to contiguous)
457+
*/
458+
Input(c10::ArrayRef<int64_t> min_shape, c10::ArrayRef<int64_t> opt_shape, c10::ArrayRef<int64_t> max_shape, TensorFormat format=TensorFormat::kContiguous);
459+
406460
/**
407461
* @brief Construct a new Input Range object dynamic input size from
408462
* c10::ArrayRef (the type produced by tensor.sizes()) for min, opt, and max
@@ -414,10 +468,12 @@ struct TRTORCH_API CompileSpec {
414468
* @param dtype Expected data type for the input (Defaults to Float32)
415469
* @param format Expected tensor format for the input (Defaults to contiguous)
416470
*/
417-
Input(c10::ArrayRef<int64_t> min_shape, c10::ArrayRef<int64_t> opt_shape, c10::ArrayRef<int64_t> max_shape, DataType dtype=DataType::kFloat, TensorFormat format=TensorFormat::kContiguous);
471+
Input(c10::ArrayRef<int64_t> min_shape, c10::ArrayRef<int64_t> opt_shape, c10::ArrayRef<int64_t> max_shape, DataType dtype, TensorFormat format=TensorFormat::kContiguous);
418472

473+
bool get_explicit_set_dtype() {return explicit_set_dtype;}
419474
private:
420475
bool input_is_dynamic;
476+
bool explicit_set_dtype;
421477
};
422478

423479
/**
@@ -512,28 +568,45 @@ struct TRTORCH_API CompileSpec {
512568
*
513569
* @param input_ranges
514570
*/
515-
[[deprecated("trtorch::CompileSpec::CompileSpec(std::vector<InputRange> input_ranges) is being deprecated in favor of trtorch::CompileSpec::CompileSpec(std::vector<Input> inputs). trtorch::CompileSpec::CompileSpec(std::vector<InputRange> input_ranges) will be removed in TRTorch v0.5.0")]]
571+
[[deprecated("trtorch::CompileSpec::CompileSpec(std::vector<InputRange> input_ranges) is being deprecated in favor of trtorch::CompileSpec::CompileSpec(std::vector<Input> inputs). Please use CompileSpec(std::vector<Input> inputs). trtorch::CompileSpec::CompileSpec(std::vector<InputRange> input_ranges) will be removed in TRTorch v0.5.0")]]
516572
CompileSpec(std::vector<InputRange> input_ranges) : input_ranges(std::move(input_ranges)) {}
517573
/**
518574
* @brief Construct a new Extra Info object
519575
* Convenience constructor to set fixed input size from vectors describing
520576
* size of input tensors. Each entry in the vector represents a input and
521577
* should be provided in call order.
522578
*
579+
* This constructor should be used as a convenience in the case that all inputs are static sized and
580+
* you are okay with default input dtype and formats (FP32 for FP32 and INT8 weights, FP16 for FP16 weights, contiguous)
581+
*
523582
* @param fixed_sizes
524583
*/
525-
[[deprecated("trtorch::CompileSpec::InputRange is being deprecated in favor of trtorch::CompileSpec::Input. trtorch::CompileSpec::InputRange will be removed in TRTorch v0.5.0")]]
526584
CompileSpec(std::vector<std::vector<int64_t>> fixed_sizes);
585+
527586
/**
528587
* @brief Construct a new Extra Info object
529588
* Convenience constructor to set fixed input size from c10::ArrayRef's (the
530589
* output of tensor.sizes()) describing size of input tensors. Each entry in
531590
* the vector represents a input and should be provided in call order.
591+
*
592+
* This constructor should be used as a convenience in the case that all inputs are static sized and
593+
* you are okay with default input dtype and formats (FP32 for FP32 and INT8 weights, FP16 for FP16 weights, contiguous)
594+
*
532595
* @param fixed_sizes
533596
*/
534-
[[deprecated("trtorch::CompileSpec::InputRange is being deprecated in favor of trtorch::CompileSpec::Input. trtorch::CompileSpec::InputRange will be removed in TRTorch v0.5.0")]]
535597
CompileSpec(std::vector<c10::ArrayRef<int64_t>> fixed_sizes);
536598

599+
/**
600+
* @brief Construct a new Extra Info object from input ranges.
601+
* Each entry in the vector represents a input and should be provided in call
602+
* order.
603+
*
604+
* Use this constructor to define inputs with dynamic shape, specific input types or tensor formats
605+
*
606+
* @param inputs
607+
*/
608+
CompileSpec(std::vector<Input> inputs) : inputs(std::move(inputs)) {}
609+
537610
// Defaults should reflect TensorRT defaults for BuilderConfig
538611

539612
/**

cpp/api/src/compile_spec.cpp

Lines changed: 68 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -105,23 +105,46 @@ CompileSpec::InputRange::InputRange(c10::IntArrayRef min, c10::IntArrayRef opt,
105105

106106
CompileSpec::CompileSpec(std::vector<c10::ArrayRef<int64_t>> fixed_sizes) {
107107
for (auto in : fixed_sizes) {
108-
input_ranges.push_back(InputRange(in));
108+
inputs.push_back(Input(in));
109109
}
110110
}
111111

112112
CompileSpec::CompileSpec(std::vector<std::vector<int64_t>> fixed_sizes) {
113113
for (auto in : fixed_sizes) {
114-
input_ranges.push_back(InputRange(in));
114+
inputs.push_back(Input(in));
115115
}
116116
}
117117

118118
/* ====== DEFINE INPUTS CLASS MEMBERS ======*/
119+
CompileSpec::Input::Input(std::vector<int64_t> shape, TensorFormat format) {
120+
this->opt_shape = shape;
121+
this->min_shape = shape;
122+
this->max_shape = shape;
123+
this->shape = shape;
124+
this->dtype = dtype;
125+
this->explicit_set_dtype = false;
126+
this->format = format;
127+
this->input_is_dynamic = false;
128+
}
129+
119130
CompileSpec::Input::Input(std::vector<int64_t> shape, DataType dtype, TensorFormat format) {
120131
this->opt_shape = shape;
121132
this->min_shape = shape;
122133
this->max_shape = shape;
123134
this->shape = shape;
124135
this->dtype = dtype;
136+
this->explicit_set_dtype = true;
137+
this->format = format;
138+
this->input_is_dynamic = false;
139+
}
140+
141+
CompileSpec::Input::Input(c10::IntArrayRef shape, TensorFormat format) {
142+
this->opt_shape = core::util::toVec(shape);
143+
this->min_shape = core::util::toVec(shape);
144+
this->max_shape = core::util::toVec(shape);
145+
this->shape = core::util::toVec(shape);
146+
this->dtype = DataType::kFloat;
147+
this->explicit_set_dtype = false;
125148
this->format = format;
126149
this->input_is_dynamic = false;
127150
}
@@ -132,16 +155,40 @@ CompileSpec::Input::Input(c10::IntArrayRef shape, DataType dtype, TensorFormat f
132155
this->max_shape = core::util::toVec(shape);
133156
this->shape = core::util::toVec(shape);
134157
this->dtype = dtype;
158+
this->explicit_set_dtype = true;
135159
this->format = format;
136160
this->input_is_dynamic = false;
137161
}
138162

163+
CompileSpec::Input::Input(std::vector<int64_t> min_shape, std::vector<int64_t> opt_shape, std::vector<int64_t> max_shape, TensorFormat format) {
164+
this->opt_shape = opt_shape;
165+
this->min_shape = min_shape;
166+
this->max_shape = max_shape;
167+
this->shape = core::util::toVec(core::ir::Input(this->min_shape, this->opt_shape, this->max_shape).input_shape);
168+
this->dtype = dtype;
169+
this->explicit_set_dtype = false;
170+
this->format = format;
171+
this->input_is_dynamic = true;
172+
}
173+
139174
CompileSpec::Input::Input(std::vector<int64_t> min_shape, std::vector<int64_t> opt_shape, std::vector<int64_t> max_shape, DataType dtype, TensorFormat format) {
140175
this->opt_shape = opt_shape;
141176
this->min_shape = min_shape;
142177
this->max_shape = max_shape;
143178
this->shape = core::util::toVec(core::ir::Input(this->min_shape, this->opt_shape, this->max_shape).input_shape);
144179
this->dtype = dtype;
180+
this->explicit_set_dtype = true;
181+
this->format = format;
182+
this->input_is_dynamic = true;
183+
}
184+
185+
CompileSpec::Input::Input(c10::IntArrayRef min_shape, c10::IntArrayRef opt_shape, c10::IntArrayRef max_shape, TensorFormat format) {
186+
this->opt_shape = core::util::toVec(opt_shape);
187+
this->min_shape = core::util::toVec(min_shape);
188+
this->max_shape = core::util::toVec(max_shape);
189+
this->shape = core::util::toVec(core::ir::Input(this->min_shape, this->opt_shape, this->max_shape).input_shape);
190+
this->dtype = dtype;
191+
this->explicit_set_dtype = false;
145192
this->format = format;
146193
this->input_is_dynamic = true;
147194
}
@@ -152,6 +199,7 @@ CompileSpec::Input::Input(c10::IntArrayRef min_shape, c10::IntArrayRef opt_shape
152199
this->max_shape = core::util::toVec(max_shape);
153200
this->shape = core::util::toVec(core::ir::Input(this->min_shape, this->opt_shape, this->max_shape).input_shape);
154201
this->dtype = dtype;
202+
this->explicit_set_dtype = true;
155203
this->format = format;
156204
this->input_is_dynamic = true;
157205
}
@@ -191,14 +239,31 @@ core::CompileSpec to_internal_compile_spec(CompileSpec external) {
191239
internal = core::CompileSpec(to_vec_internal_inputs(external.inputs));
192240
}
193241

194-
if (external.enabled_precisions.size() <= 1 && toTRTDataType(external.op_precision) != nvinfer1::DataType::kFLOAT) {
242+
if (external.enabled_precisions.size() <= 1 && toTRTDataType(*external.enabled_precisions.begin()) == nvinfer1::DataType::kFLOAT && toTRTDataType(external.op_precision) != nvinfer1::DataType::kFLOAT) {
195243
internal.convert_info.engine_settings.enabled_precisions.insert(toTRTDataType(external.op_precision));
196244
} else {
197245
for(auto p : external.enabled_precisions) {
198246
internal.convert_info.engine_settings.enabled_precisions.insert(toTRTDataType(p));
199247
}
200248
}
201249

250+
/* We want default behavior for types to match PyTorch, so in the case the user did not explicitly set the dtype for
251+
inputs they will follow PyTorch conventions */
252+
for (size_t i = 0; i < external.inputs.size(); i++) {
253+
std::cout << "EXPLICIT " << external.inputs[i].get_explicit_set_dtype() << std::endl;
254+
if (!external.inputs[i].get_explicit_set_dtype()) {
255+
auto& precisions = internal.convert_info.engine_settings.enabled_precisions;
256+
auto& internal_ins = internal.convert_info.inputs;
257+
if (precisions.find(nvinfer1::DataType::kINT8) != precisions.end()) {
258+
internal_ins[i].dtype = nvinfer1::DataType::kFLOAT;
259+
} else if (precisions.find(nvinfer1::DataType::kHALF) != precisions.end()) {
260+
internal_ins[i].dtype = nvinfer1::DataType::kHALF;
261+
} else {
262+
internal_ins[i].dtype = nvinfer1::DataType::kFLOAT;
263+
}
264+
std::cout << "internal type: " << internal_ins[i].dtype;
265+
}
266+
}
202267
internal.convert_info.engine_settings.disable_tf32 = external.disable_tf32;
203268
internal.convert_info.engine_settings.refit = external.refit;
204269
internal.convert_info.engine_settings.debug = external.debug;

tests/BUILD

Lines changed: 8 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,8 +1,8 @@
11
test_suite(
22
name = "tests",
33
tests = [
4+
":cpp_api_tests",
45
"//tests/core:core_tests",
5-
"//tests/modules:module_tests",
66
],
77
)
88

@@ -30,6 +30,13 @@ test_suite(
3030
],
3131
)
3232

33+
test_suite(
34+
name = "cpp_api_tests",
35+
tests = [
36+
"//tests/cpp:api_tests"
37+
]
38+
)
39+
3340
test_suite(
3441
name = "python_api_tests",
3542
tests = [

tests/core/runtime/BUILD

Lines changed: 8 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,8 @@
1+
package(default_visibility = ["//visibility:public"])
2+
3+
config_setting(
4+
name = "use_pre_cxx11_abi",
5+
values = {
6+
"define": "abi=pre_cxx11_abi",
7+
},
8+
)

0 commit comments

Comments
 (0)