Commit 60c0c2c

Author: Anurag Dixit
Commit message: Rebase with master
Signed-off-by: Anurag Dixit <[email protected]>
2 parents: 2a75289 + 2b50334

File tree

20 files changed: +1129 −38 lines

.github/workflows/stale.yml

Lines changed: 4 additions & 4 deletions

@@ -13,11 +13,11 @@ jobs:
       - uses: actions/stale@v1
         with:
           repo-token: ${{ secrets.GITHUB_TOKEN }}
-          stale-issue-message: 'This issue has not seen activity for 30 days, Remove stale label or comment or this will be closed in 5 days'
-          stale-pr-message: 'This PR has not seen activity for 30 days, Remove stale label or comment or this will be closed in 5 days'
+          stale-issue-message: 'This issue has not seen activity for 90 days, Remove stale label or comment or this will be closed in 10 days'
+          stale-pr-message: 'This PR has not seen activity for 90 days, Remove stale label or comment or this will be closed in 10 days'
           stale-issue-label: 'No Activity'
           exempt-issue-labels: 'feature request'
           stale-pr-label: 'No Activity'
           exempt-pr-labels: 'WIP'
-          days-before-stale: 30
-          days-before-close: 5
+          days-before-stale: 90
+          days-before-close: 10

core/conversion/converters/BUILD

Lines changed: 2 additions & 0 deletions

@@ -39,6 +39,7 @@ cc_library(
         "impl/constant.cpp",
         "impl/conv_deconv.cpp",
         "impl/element_wise.cpp",
+        "impl/expand.cpp",
         "impl/linear.cpp",
         "impl/matrix_multiply.cpp",
         "impl/pooling.cpp",
@@ -52,6 +53,7 @@ cc_library(
         "impl/stack.cpp",
         "impl/lstm_cell.cpp",
         "impl/unsqueeze.cpp",
+        "impl/topk.cpp",
     ],
     deps = [
         "@tensorrt//:nvinfer",

core/conversion/converters/impl/activation.cpp

Lines changed: 29 additions & 1 deletion

@@ -124,7 +124,35 @@ auto acthardtanh TRTORCH_UNUSED =
                    out_tensor = ctx->AssociateValueAndTensor(n->outputs()[0], out_tensor);
                    LOG_DEBUG("Output shape: " << out_tensor->getDimensions());
                    return true;
-                  }});
+                  }})
+        .pattern({"aten::leaky_relu(Tensor self, Scalar negative_slope=0.01) -> (Tensor)",
+                  [](ConversionCtx* ctx, const torch::jit::Node* n, args& args) -> bool {
+                    auto self = args[0].ITensorOrFreeze(ctx);
+                    auto negative_slopeScalar = args[1].unwrapToScalar().to<float>();
+
+                    auto new_layer = ctx->net->addActivation(*self, nvinfer1::ActivationType::kLEAKY_RELU);
+                    new_layer->setAlpha(negative_slopeScalar);
+
+                    new_layer->setName(util::node_info(n).c_str());
+                    auto out_tensor = new_layer->getOutput(0);
+                    out_tensor = ctx->AssociateValueAndTensor(n->outputs()[0], out_tensor);
+                    LOG_DEBUG("Output shape: " << out_tensor->getDimensions());
+                    return true;
+                  }})
+        .pattern({"aten::leaky_relu_(Tensor(a!) self, Scalar negative_slope=0.01) -> Tensor(a!)",
+                  [](ConversionCtx* ctx, const torch::jit::Node* n, args& args) -> bool {
+                    auto self = args[0].ITensorOrFreeze(ctx);
+                    auto negative_slopeScalar = args[1].unwrapToScalar().to<float>();
+
+                    auto new_layer = ctx->net->addActivation(*self, nvinfer1::ActivationType::kLEAKY_RELU);
+                    new_layer->setAlpha(negative_slopeScalar);
+
+                    new_layer->setName(util::node_info(n).c_str());
+                    auto out_tensor = new_layer->getOutput(0);
+                    out_tensor = ctx->AssociateValueAndTensor(n->outputs()[0], out_tensor);
+                    LOG_DEBUG("Output shape: " << out_tensor->getDimensions());
+                    return true;
+                  }});
 
 } // namespace
 } // namespace impl
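
For reference, TensorRT's kLEAKY_RELU activation with alpha set via setAlpha computes f(x) = x for x > 0 and alpha * x otherwise, which is the semantics of aten::leaky_relu the two new patterns map onto. A minimal standalone sketch of that reference behavior (a hypothetical helper, not part of this diff):

#include <cstdio>
#include <vector>

// Reference semantics of aten::leaky_relu / kLEAKY_RELU:
// f(x) = x if x > 0, else alpha * x.
std::vector<float> leaky_relu_ref(const std::vector<float>& x, float alpha = 0.01f) {
  std::vector<float> out(x.size());
  for (size_t i = 0; i < x.size(); ++i) {
    out[i] = x[i] > 0.0f ? x[i] : alpha * x[i];
  }
  return out;
}

int main() {
  for (float v : leaky_relu_ref({-2.0f, -0.5f, 0.0f, 1.5f})) {
    std::printf("%g ", v); // prints: -0.02 -0.005 0 1.5
  }
  std::printf("\n");
  return 0;
}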

core/conversion/converters/impl/element_wise.cpp

Lines changed: 368 additions & 17 deletions
Large diffs are not rendered by default.

core/conversion/converters/impl/expand.cpp

Lines changed: 152 additions & 0 deletions (new file)

#include "NvInfer.h"
#include "core/conversion/converters/converters.h"
#include "core/conversion/tensorcontainer/TensorContainer.h"
#include "core/util/prelude.h"
#include "core/util/trt_util.h"
#include "torch/torch.h"

#include <ATen/ATen.h>
#include <vector>

namespace trtorch {
namespace core {
namespace conversion {
namespace converters {
namespace impl {
namespace {

bool add_expand(ConversionCtx* ctx, const torch::jit::Node* n, nvinfer1::ITensor* in, nvinfer1::Dims expandedDims) {
  auto input_dims = in->getDimensions();
  TRTORCH_CHECK(
      input_dims.nbDims <= expandedDims.nbDims,
      "Number of dimensions of the desired expansion must be greater than or equal to the number of input dimensions");

  // Validate the expansion. E.g.: an input of [3, 1] can be expanded to [1, 3, 4] but not [3, 4, 1]
  for (int64_t i = expandedDims.nbDims - 1; i >= 0; --i) {
    int64_t offset = expandedDims.nbDims - 1 - i;
    int64_t dim = input_dims.nbDims - 1 - offset;
    int64_t size = (dim >= 0) ? input_dims.d[dim] : 1;
    int64_t targetSize = expandedDims.d[i];
    if (size != targetSize) {
      if (size != 1) {
        TRTORCH_THROW_ERROR(
            "The expanded size of tensor (" << targetSize << ")"
                                            << " must match the existing size (" << size << ")"
                                            << " at dimension " << i);
      }
    }
  }

  auto num_expand_dims = expandedDims.nbDims - input_dims.nbDims;
  if (num_expand_dims > 0) {
    nvinfer1::Dims reshape_dims;
    reshape_dims.nbDims = expandedDims.nbDims;
    for (int64_t i = 0; i < num_expand_dims; i++) {
      reshape_dims.d[i] = 1;
    }
    for (int64_t i = 0; i < input_dims.nbDims; i++) {
      reshape_dims.d[num_expand_dims + i] = input_dims.d[i];
    }
    // Add a reshape layer to expand dims
    auto reshape_layer = ctx->net->addShuffle(*in);
    reshape_layer->setReshapeDimensions(reshape_dims);
    in = reshape_layer->getOutput(0);
    LOG_DEBUG("Input reshaped to : " << in->getDimensions() << " from " << input_dims);
  }

  // Start the slicing from beginning of tensor since this is an expand layer
  std::vector<int64_t> start_vec(expandedDims.nbDims, 0);
  auto start_offset = util::toDims(c10::IntArrayRef(start_vec));

  // Set the stride of non-singleton dimensions to 1
  std::vector<int64_t> strides_vec(expandedDims.nbDims, 0);
  for (int64_t i = 0; i < expandedDims.nbDims; i++) {
    strides_vec[i] = (in->getDimensions().d[i] != 1);
  }

  auto strides = util::toDims(c10::IntArrayRef(strides_vec));
  // Slice layer does the expansion in TRT. Desired output size is specified by expandedDims
  auto slice_layer = ctx->net->addSlice(*in, start_offset, expandedDims, strides);
  slice_layer->setName(util::node_info(n).c_str());

  auto out = ctx->AssociateValueAndTensor(n->outputs()[0], slice_layer->getOutput(0));

  LOG_DEBUG("Expand layer output tensor shape: " << out->getDimensions());

  return true;
}

auto expand_registrations TRTORCH_UNUSED =
    RegisterNodeConversionPatterns()
        .pattern({"aten::expand(Tensor(a) self, int[] size, *, bool implicit=False) -> (Tensor(a))",
                  [](ConversionCtx* ctx, const torch::jit::Node* n, args& args) -> bool {
                    auto in = args[0].ITensor();
                    auto input_dims = in->getDimensions();
                    auto expanded_size = args[1].unwrapToIntList();
                    auto expandedDims = util::toDims(expanded_size);
                    LOG_DEBUG("(expand layer) Expand input from " << input_dims << " to " << expandedDims);
                    return add_expand(ctx, n, in, expandedDims);
                  }})
        .pattern({"aten::expand_as(Tensor(a) self, Tensor other) -> (Tensor(a))",
                  [](ConversionCtx* ctx, const torch::jit::Node* n, args& args) -> bool {
                    // TODO: Currently expand supports static shapes. Need to explore if the same code can be
                    // extended to dynamic expansion.
                    auto in = args[0].ITensor();
                    auto input_dims = in->getDimensions();
                    auto targetTensor = args[1].ITensor();
                    auto targetDims = targetTensor->getDimensions();
                    LOG_DEBUG("(expand_as layer) Expand input from " << input_dims << " to " << targetDims);
                    return add_expand(ctx, n, in, targetDims);
                  }})
        .pattern({"aten::repeat(Tensor self, int[] repeats) -> (Tensor)",
                  [](ConversionCtx* ctx, const torch::jit::Node* n, args& args) -> bool {
                    auto in = args[0].ITensor();
                    auto input_dims = in->getDimensions();
                    auto repeats = args[1].unwrapToIntList().vec();
                    TRTORCH_CHECK(
                        static_cast<int64_t>(repeats.size()) >= input_dims.nbDims,
                        "Number of repeat dimensions cannot be smaller than number of input dimensions");
                    auto num_expand_dims = repeats.size() - input_dims.nbDims;
                    if (num_expand_dims > 0) {
                      nvinfer1::Dims reshape_dims;
                      reshape_dims.nbDims = repeats.size();
                      for (size_t i = 0; i < num_expand_dims; i++) {
                        reshape_dims.d[i] = 1;
                      }
                      for (int64_t i = 0; i < input_dims.nbDims; i++) {
                        reshape_dims.d[num_expand_dims + i] = input_dims.d[i];
                      }
                      // Add a reshape layer to expand dims
                      auto reshape_layer = ctx->net->addShuffle(*in);
                      reshape_layer->setReshapeDimensions(reshape_dims);
                      in = reshape_layer->getOutput(0);
                      LOG_DEBUG("Input reshaped to : " << in->getDimensions() << " from " << input_dims);
                    }

                    LOG_DEBUG("Repeats: " << repeats);

                    // Concat across all repeat axes.
                    // TODO: Implementation might not be performant. Explore other strategies to improve performance.
                    for (int64_t i = repeats.size() - 1; i >= 0; --i) {
                      std::vector<nvinfer1::ITensor*> tensors_vec;
                      for (int64_t j = 0; j < repeats[i]; j++) {
                        tensors_vec.push_back(in);
                      }
                      auto concat_layer = ctx->net->addConcatenation(tensors_vec.data(), tensors_vec.size());
                      concat_layer->setAxis(i);
                      in = concat_layer->getOutput(0);
                    }

                    auto out = ctx->AssociateValueAndTensor(n->outputs()[0], in);

                    LOG_DEBUG("Repeat layer output tensor shape: " << out->getDimensions());

                    return true;
                  }});

} // namespace
} // namespace impl
} // namespace converters
} // namespace conversion
} // namespace core
} // namespace trtorch
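
The validation loop in add_expand encodes PyTorch's broadcasting rule: sizes are compared right-aligned, dimensions the input lacks count as 1, and a mismatch is only legal when the input size is 1. The expansion itself is then performed by an ISliceLayer whose stride is 0 on broadcast dimensions, so each singleton value is read repeatedly. A standalone sketch of the validation rule (a hypothetical helper, not part of the diff):

#include <cassert>
#include <cstdint>
#include <vector>

// Right-aligned expand validation: [3, 1] -> [1, 3, 4] is legal,
// [3, 1] -> [3, 4, 1] is not (existing size 3 cannot become 4).
bool expansion_is_valid(const std::vector<int64_t>& in, const std::vector<int64_t>& target) {
  if (in.size() > target.size()) {
    return false;
  }
  for (int64_t i = static_cast<int64_t>(target.size()) - 1; i >= 0; --i) {
    int64_t offset = static_cast<int64_t>(target.size()) - 1 - i;
    int64_t dim = static_cast<int64_t>(in.size()) - 1 - offset;
    int64_t size = (dim >= 0) ? in[dim] : 1;
    if (size != target[i] && size != 1) {
      return false; // only singleton dimensions may be broadcast
    }
  }
  return true;
}

int main() {
  assert(expansion_is_valid({3, 1}, {1, 3, 4}));
  assert(!expansion_is_valid({3, 1}, {3, 4, 1}));
  return 0;
}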

core/conversion/converters/impl/topk.cpp

Lines changed: 62 additions & 0 deletions (new file)

#include "NvInfer.h"
#include "core/conversion/converters/converters.h"
#include "core/conversion/tensorcontainer/TensorContainer.h"
#include "core/util/prelude.h"
#include "torch/torch.h"

#include <ATen/ATen.h>
#include <vector>

namespace trtorch {
namespace core {
namespace conversion {
namespace converters {
namespace impl {
namespace {

auto topk_registrations TRTORCH_UNUSED = RegisterNodeConversionPatterns().pattern(
    {"aten::topk(Tensor self, int k, int dim=-1, bool largest=True, bool sorted=True) -> (Tensor values, Tensor indices)",
     [](ConversionCtx* ctx, const torch::jit::Node* n, args& args) -> bool {
       auto self = args[0].ITensorOrFreeze(ctx);
       auto k = args[1].unwrapToInt();
       auto dim = args[2].unwrapToInt();
       auto largest = args[3].unwrapToBool();
       LOG_DEBUG(
           "Note: sorted argument is not used in TensorRT for aten::topk, results will depend on the value of largest");
       // auto sorted = args[4].unwrapToBool(); // Currently unused

       auto selfDim = util::toVec(self->getDimensions());

       // reduceAxes: the reduction dimensions. The bit in position i of bitmask reduceAxes corresponds to explicit
       // dimension i of the result. E.g., the least significant bit corresponds to the first explicit dimension and
       // the next to least significant bit corresponds to the second explicit dimension.

       if (dim < 0) {
         dim = selfDim.size() + dim;
       }

       uint32_t shiftDim = 1 << dim;

       LOG_DEBUG("Output topk reduce dim: " << dim);

       auto TopKOperation = largest ? (nvinfer1::TopKOperation::kMAX) : (nvinfer1::TopKOperation::kMIN);

       auto new_layer = ctx->net->addTopK(*self, TopKOperation, k, shiftDim);

       TRTORCH_CHECK(new_layer, "Unable to create topk layer from node: " << *n);

       auto out0 = ctx->AssociateValueAndTensor(n->outputs()[0], new_layer->getOutput(0));
       auto out1 = ctx->AssociateValueAndTensor(n->outputs()[1], new_layer->getOutput(1));

       LOG_DEBUG("Output tensor(0) shape: " << out0->getDimensions());
       LOG_DEBUG("Output tensor(1) shape: " << out1->getDimensions());

       return true;
     }});

} // namespace
} // namespace impl
} // namespace converters
} // namespace conversion
} // namespace core
} // namespace trtorch
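
The one subtle step in this converter is mapping PyTorch's dim argument onto TensorRT's reduceAxes bitmask: negative dims are wrapped to positive first, then bit dim is set, since bit i of the mask selects dimension i. A sketch of that computation (hypothetical helper, not from the diff):

#include <cassert>
#include <cstdint>

// Convert a (possibly negative) PyTorch dim into a TensorRT axis bitmask.
uint32_t topk_axis_mask(int64_t dim, int64_t rank) {
  if (dim < 0) {
    dim += rank; // e.g. dim = -1 on a rank-3 tensor becomes dim = 2
  }
  return 1u << dim;
}

int main() {
  assert(topk_axis_mask(-1, 3) == 0b100u); // last dimension
  assert(topk_axis_mask(0, 3) == 0b001u);  // first dimension
  return 0;
}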

core/conversion/evaluators/aten.cpp

Lines changed: 2 additions & 1 deletion

@@ -426,7 +426,8 @@ auto aten_registrations TRTORCH_UNUSED =
                    }
                  },
                  EvalOptions().validSchemas({
-                     "aten::div.Scalar(Scalar a, Scalar b) -> (float)",
+                     "aten::div.float(float a, float b) -> (float)",
+                     "aten::div.int(int a, int b) -> (float)",
                  })})
         .evaluator({c10::Symbol::fromQualString("aten::floordiv"),
                     [](const torch::jit::Node* n, kwargs& args) -> c10::optional<torch::jit::IValue> {
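
The replacement schemas make the evaluator's contract explicit: in TorchScript, aten::div on two ints performs true division and yields a float, just as it does on two floats. A sketch of that semantics (hypothetical helper, not from the diff):

// aten::div.int(int a, int b) -> (float): true division, matching Python's `/`.
double div_int_eval(int64_t a, int64_t b) {
  return static_cast<double>(a) / static_cast<double>(b); // e.g. 7 / 2 == 3.5
}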

core/lowering/passes/BUILD

Lines changed: 1 addition & 2 deletions

@@ -40,5 +40,4 @@ pkg_tar(
     name = "include",
     package_dir = "core/lowering/passes/",
     srcs = ["passes.h"],
-)
-
+)

docs/_notebooks/Resnet50-example.html

Lines changed: 2 additions & 2 deletions

@@ -675,7 +675,7 @@
 </div>
 </div>
 <p>
-<img alt="b1ce51ad50c14266ad34bbbad8367ca9" src="http://developer.download.nvidia.com/compute/machine-learning/frameworks/nvidia_logo.png"/>
+<img alt="ed47660d576647068791c7f711e0cc16" src="http://developer.download.nvidia.com/compute/machine-learning/frameworks/nvidia_logo.png"/>
 </p>
 <h1 id="notebooks-resnet50-example--page-root">
 TRTorch Getting Started - ResNet 50
@@ -1920,4 +1920,4 @@ <h3 id="What's-next">
 app.initialize({version: "1.0.4", url: {base: ".."}})
 </script>
 </body>
-</html>
+</html>

docs/_notebooks/lenet-getting-started.html

Lines changed: 2 additions & 2 deletions

@@ -769,7 +769,7 @@
 </div>
 </div>
 <p>
-<img alt="b8dc0146a6bf40f6a57bd302dec7e424" src="http://developer.download.nvidia.com/compute/machine-learning/frameworks/nvidia_logo.png"/>
+<img alt="e10d990c04c741a082279a3b35df9fb4" src="http://developer.download.nvidia.com/compute/machine-learning/frameworks/nvidia_logo.png"/>
 </p>
 <h1 id="notebooks-lenet-getting-started--page-root">
 TRTorch Getting Started - LeNet
@@ -1520,4 +1520,4 @@ <h3 id="What's-next">
 app.initialize({version: "1.0.4", url: {base: ".."}})
 </script>
 </body>
-</html>
+</html>

docs/_notebooks/ssd-object-detection-demo.html

Lines changed: 2 additions & 2 deletions

@@ -789,7 +789,7 @@
 </div>
 </div>
 <p>
-<img alt="cef98741e4a14fc08fd52dc41f45e820" src="http://developer.download.nvidia.com/compute/machine-learning/frameworks/nvidia_logo.png"/>
+<img alt="9d1cf3e0c29c4704bace293a8b3b2f7f" src="http://developer.download.nvidia.com/compute/machine-learning/frameworks/nvidia_logo.png"/>
 </p>
 <h1 id="notebooks-ssd-object-detection-demo--page-root">
 Object Detection with TRTorch (SSD)
@@ -1769,4 +1769,4 @@ <h3 id="References">
 app.initialize({version: "1.0.4", url: {base: ".."}})
 </script>
 </body>
-</html>
+</html>

docs/py_api/trtorch.html

Lines changed: 2 additions & 2 deletions

@@ -969,7 +969,7 @@ <h2 id="functions">
 <span class="sig-paren">
 )
 </span>
-→ &lt;torch._C.ScriptClass object at 0x7fc40e70ea08&gt;
+→ &lt;torch._C.ScriptClass object at 0x7fddd4d11a08&gt;
 <a class="headerlink" href="#trtorch.TensorRTCompileSpec" title="Permalink to this definition">

 </a>
@@ -1265,4 +1265,4 @@ <h2 id="submodules">
 app.initialize({version: "1.0.4", url: {base: ".."}})
 </script>
 </body>
-</html>
+</html>

docs/searchindex.js

Lines changed: 1 addition & 1 deletion
(Generated file; diff not rendered by default.)
