Skip to content

Commit 474e7bf

Browse files
committed
Merge branch 'master' of https://github.com/NVIDIA/Torch-TensorRT into maskrcnn
2 parents ffaa4bf + ba9f730 commit 474e7bf

Some content is hidden

Large Commits have some content hidden by default. Use the searchbox below for content that may be hidden.

42 files changed

+1709
-664
lines changed

README.md

Lines changed: 3 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -12,6 +12,8 @@ Resources:
1212
- [Comprehensive Discussion (GTC Event)](https://www.nvidia.com/en-us/on-demand/session/gtcfall21-a31107/)
1313
- [Pre-built Docker Container](https://catalog.ngc.nvidia.com/orgs/nvidia/containers/pytorch). To use this container, make an NGC account and sign in to NVIDIA's registry with an API key. Refer to [this guide](https://docs.nvidia.com/ngc/ngc-catalog-user-guide/index.html#registering-activating-ngc-account) for the same.
1414

15+
## NVIDIA NGC Container
16+
Torch-TensorRT is distributed in the ready-to-run NVIDIA [NGC PyTorch Container](https://catalog.ngc.nvidia.com/orgs/nvidia/containers/pytorch) starting with 21.11. We recommend using this prebuilt container to experiment & develop with Torch-TensorRT; it has all dependencies with the proper versions as well as example notebooks included.
1517

1618
## Building a docker container for Torch-TensorRT
1719

@@ -48,7 +50,7 @@ If you would like to build outside a docker container, please follow the section
4850
// Set input datatypes. Allowed options torch::{kFloat, kHalf, kChar, kInt32, kBool}
4951
// Size of input_dtypes should match number of inputs to the network.
5052
// If input_dtypes is not set, default precision follows traditional PyT / TRT rules
51-
auto input = torch_tensorrt::Input(dims, torch::kHalf)
53+
auto input = torch_tensorrt::Input(dims, torch::kHalf);
5254
auto compile_settings = torch_tensorrt::ts::CompileSpec({input});
5355
// FP16 execution
5456
compile_settings.enabled_precisions = {torch::kHalf};

WORKSPACE

Lines changed: 12 additions & 12 deletions
Original file line numberDiff line numberDiff line change
@@ -128,18 +128,18 @@ http_archive(
128128
# build_file = "@//third_party/tensorrt/local:BUILD"
129129
#)
130130

131-
#########################################################################
132-
# Testing Dependencies (optional - comment out on aarch64)
133-
#########################################################################
134-
pip_install(
135-
name = "torch_tensorrt_py_deps",
136-
requirements = "//py:requirements.txt",
137-
)
138-
139-
pip_install(
140-
name = "py_test_deps",
141-
requirements = "//tests/py:requirements.txt",
142-
)
131+
# #########################################################################
132+
# # Testing Dependencies (optional - comment out on aarch64)
133+
# #########################################################################
134+
# pip_install(
135+
# name = "torch_tensorrt_py_deps",
136+
# requirements = "//py:requirements.txt",
137+
# )
138+
139+
# pip_install(
140+
# name = "py_test_deps",
141+
# requirements = "//tests/py:requirements.txt",
142+
# )
143143

144144
pip_install(
145145
name = "pylinter_deps",

core/conversion/conversion.cpp

Lines changed: 16 additions & 7 deletions
Original file line numberDiff line numberDiff line change
@@ -105,7 +105,8 @@ void AddLayer(ConversionCtx* ctx, const torch::jit::Node* n) {
105105
// Node input has not been converted yet or is a prim op
106106
TORCHTRT_THROW_ERROR(
107107
"Unable to retrieve all node inputs for node: "
108-
<< util::node_info(n) << " (ctx.AddLayer)\nSpecifically failed to retrieve value for input: " << *input_node);
108+
<< util::node_info(n) << " (ctx.AddLayer)\nSpecifically failed to retrieve value for input: %"
109+
<< input->debugName());
109110
}
110111
}
111112

@@ -534,18 +535,22 @@ bool VerifyConverterSupportForBlock(const torch::jit::Block* b, bool suppress_er
534535
if (unsupported_ops.size() != 0) {
535536
std::stringstream unsupported_msg;
536537
unsupported_msg
537-
<< "Method requested cannot be compiled by Torch-TensorRT.TorchScript.\nUnsupported operators listed below:"
538+
<< "Method requested cannot be compiled end to end by Torch-TensorRT.TorchScript.\nUnsupported operators listed below:"
538539
<< std::endl;
539540
for (auto s : unsupported_ops) {
540541
unsupported_msg << " - " << s.second << std::endl;
541542
}
542-
unsupported_msg << "You can either implement converters for these ops in your application or request implementation"
543-
<< std::endl;
544-
unsupported_msg << "https://www.github.com/nvidia/Torch-TensorRT/issues" << std::endl;
545-
unsupported_msg << std::endl << "In Module:" << std::endl;
546543

547544
if (!suppress_errors) {
545+
unsupported_msg
546+
<< "You can either implement converters for these ops in your application or request implementation"
547+
<< std::endl;
548+
unsupported_msg << "https://www.github.com/nvidia/Torch-TensorRT/issues" << std::endl;
549+
unsupported_msg << std::endl << "In Module:" << std::endl;
550+
548551
LOG_ERROR(unsupported_msg.str());
552+
} else {
553+
LOG_INFO(unsupported_msg.str());
549554
}
550555

551556
std::unordered_map<std::string, std::unordered_set<std::string>> unsupported_node_locations;
@@ -572,7 +577,11 @@ bool VerifyConverterSupportForBlock(const torch::jit::Block* b, bool suppress_er
572577
traceback << str;
573578
}
574579
auto tb_str = traceback.str();
575-
LOG_ERROR(tb_str);
580+
if (!suppress_errors) {
581+
LOG_ERROR(tb_str);
582+
} else {
583+
LOG_DEBUG(tb_str);
584+
}
576585
}
577586

578587
return false;

core/conversion/converters/BUILD

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -71,6 +71,7 @@ cc_library(
7171
"impl/pooling.cpp",
7272
"impl/quantization.cpp",
7373
"impl/reduce.cpp",
74+
"impl/reflection_pad.cpp",
7475
"impl/replication_pad.cpp",
7576
"impl/select.cpp",
7677
"impl/shuffle.cpp",
Lines changed: 145 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,145 @@
#include <ATen/ATen.h>
#include <vector>
#include "NvInfer.h"
#include "core/conversion/converters/converters.h"
#include "core/util/prelude.h"
#include "torch/torch.h"

namespace torch_tensorrt {
namespace core {
namespace conversion {
namespace converters {
namespace impl {
namespace {

// Reflection-pads `in` along a single `axis` with (pad_before, pad_after)
// elements, matching aten::reflection_padNd semantics for that axis:
// the boundary element is the reflection pivot and is not repeated.
// Returns the padded tensor (or `in` unchanged when both pads are 0).
// Implemented as per-index gathers concatenated along `axis`.
nvinfer1::ITensor* reflection_pad_axis(
    ConversionCtx* ctx,
    const torch::jit::Node* n,
    nvinfer1::ITensor* in,
    int64_t axis,
    int64_t pad_before,
    int64_t pad_after) {
  std::vector<nvinfer1::ITensor*> tensors_vec;

  if (pad_before > 0) { // left/top padding value
    tensors_vec.clear();

    // Mirror indices {pad_before, pad_before - 1, ..., 1}; index 0 is the
    // pivot and is contributed by `in` itself.
    for (int64_t i = 0; i < pad_before; i++) {
      at::Tensor indices = torch::tensor({pad_before - i}, torch::kInt32);
      auto indices_tensor = tensor_to_const(ctx, indices);
      auto gather_layer = ctx->net->addGather(*in, *indices_tensor, axis);
      TORCHTRT_CHECK(gather_layer, "Unable to create gather layer from node: " << *n);
      tensors_vec.push_back(gather_layer->getOutput(0));
    }
    tensors_vec.push_back(in);

    auto concat_layer = ctx->net->addConcatenation(tensors_vec.data(), tensors_vec.size());
    TORCHTRT_CHECK(concat_layer, "Unable to create concatenation layer from node: " << *n);
    concat_layer->setAxis(axis);
    in = concat_layer->getOutput(0);
  }

  if (pad_after > 0) { // right/bottom padding value
    // NOTE: dims are re-read after the left concat; reflecting off the
    // left-padded tensor yields the same elements as reflecting off the
    // original, since the appended left pad only shifts indices.
    auto in_dims = in->getDimensions();
    tensors_vec.clear();
    tensors_vec.push_back(in);

    // Mirror indices {size - 2, size - 3, ...}; the last element is the pivot.
    for (int64_t i = 0; i < pad_after; i++) {
      auto indices = torch::tensor({in_dims.d[axis] - 1 - (i + 1)}, torch::kInt32);
      auto indices_tensor = tensor_to_const(ctx, indices);
      auto gather_layer = ctx->net->addGather(*in, *indices_tensor, axis);
      TORCHTRT_CHECK(gather_layer, "Unable to create gather layer from node: " << *n);
      tensors_vec.push_back(gather_layer->getOutput(0));
    }

    auto concat_layer = ctx->net->addConcatenation(tensors_vec.data(), tensors_vec.size());
    TORCHTRT_CHECK(concat_layer, "Unable to create concatenation layer from node: " << *n);
    concat_layer->setAxis(axis);
    in = concat_layer->getOutput(0);
  }

  return in;
}

auto reflection_padXd TORCHTRT_UNUSED =
    RegisterNodeConversionPatterns()
        .pattern({"aten::reflection_pad2d(Tensor self, int[4] padding) -> (Tensor)",
                  [](ConversionCtx* ctx, const torch::jit::Node* n, args& args) -> bool {
                    auto in = args[0].ITensor();
                    int64_t in_rank = in->getDimensions().nbDims;
                    auto padding = args[1].unwrapToIntList().vec();
                    // A single padding value applies to all four sides.
                    if (padding.size() == 1) {
                      padding.resize(4, padding[0]);
                    }
                    if (in_rank == 4) {
                      TORCHTRT_CHECK(padding.size() == 4, "4D tensors expect 4 values for padding");
                    } else {
                      TORCHTRT_THROW_ERROR("Only 4D padding are supported for now");
                    }

                    // 2d padding: (padding_left, padding_right, padding_top, padding_bottom)
                    // Innermost axis first: axis = {in_rank - 1, in_rank - 2}
                    for (int64_t i = 0; i < static_cast<int64_t>(padding.size() / 2); i++) {
                      int64_t axis = in_rank - (i + 1);
                      in = reflection_pad_axis(ctx, n, in, axis, padding[2 * i], padding[2 * i + 1]);
                    }

                    auto out = ctx->AssociateValueAndTensor(n->outputs()[0], in);
                    LOG_DEBUG("Output tensor shape: " << out->getDimensions());

                    return true;
                  }})
        .pattern({"aten::reflection_pad1d(Tensor self, int[2] padding) -> (Tensor)",
                  [](ConversionCtx* ctx, const torch::jit::Node* n, args& args) -> bool {
                    auto in = args[0].ITensor();
                    int64_t in_rank = in->getDimensions().nbDims;
                    auto padding = args[1].unwrapToIntList().vec();
                    // A single padding value applies to both sides.
                    if (padding.size() == 1) {
                      padding.push_back(padding[0]);
                    }

                    // 1d padding: (padding_left, padding_right), applied on the last axis.
                    in = reflection_pad_axis(ctx, n, in, in_rank - 1, padding[0], padding[1]);

                    auto out = ctx->AssociateValueAndTensor(n->outputs()[0], in);
                    LOG_DEBUG("Output tensor shape: " << out->getDimensions());

                    return true;
                  }});

} // namespace
} // namespace impl
} // namespace converters
} // namespace conversion
} // namespace core
} // namespace torch_tensorrt

core/conversion/evaluators/aten.cpp

Lines changed: 38 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -1,3 +1,5 @@
1+
#include <math.h>
2+
13
#include "ATen/core/List.h"
24
#include "ATen/core/functional.h"
35
#include "ATen/core/ivalue.h"
@@ -98,6 +100,17 @@ DEFINE_GENERIC_TWO_INPUT_EVALUATOR(
98100
"aten::ge.float_int(float a, int b) -> (bool)",
99101
}));
100102

103+
DEFINE_ARITHMATIC_TWO_INPUT_EVALUATOR(
104+
pow,
105+
"aten::pow",
106+
pow(a, b),
107+
std::set<std::string>({
108+
"aten::pow.int(int a, int b) -> (float)",
109+
"aten::pow.float(float a, float b) -> (float)",
110+
"aten::pow.int_float(int a, float b) -> (float)",
111+
"aten::pow.float_int(float a, int b) -> (float)",
112+
}));
113+
101114
DEFINE_TWO_INPUT_SIMPLE_EVALUATOR(
102115
and,
103116
"aten::__and__",
@@ -285,6 +298,31 @@ auto aten_registrations TORCHTRT_UNUSED =
285298
EvalOptions().validSchemas({
286299
"aten::append.t(t[](a!) self, t(c -> *) el) -> (t[](a!))",
287300
})})
301+
.evaluator({c10::Symbol::fromQualString("aten::extend"),
302+
[](const torch::jit::Node* n, kwargs& args) -> c10::optional<torch::jit::IValue> {
303+
if (args.at(n->input(0)).IValue()->isList() && args.at(n->input(1)).IValue()->isList()) {
304+
c10::IValue* self_ptr = args.at(n->input(0)).IValueMut();
305+
auto self = self_ptr->to<c10::List<c10::IValue>>();
306+
auto other = args.at(n->input(1)).IValue()->to<c10::List<c10::IValue>>();
307+
const int64_t other_size = other.size();
308+
309+
// Modify value in place
310+
for (int64_t i = 0; i < other_size; i++) {
311+
self.push_back(other.get(i));
312+
}
313+
314+
*self_ptr = c10::IValue(self);
315+
return {};
316+
} else {
317+
TORCHTRT_THROW_ERROR(
318+
"Unimplemented data type for aten::extend.t evaluator: "
319+
<< args.at(n->input(0)).IValue()->type()->str() << ", "
320+
<< args.at(n->input(1)).IValue()->type()->str());
321+
}
322+
},
323+
EvalOptions().validSchemas({
324+
"aten::extend.t(t[](a!) self, t[] other) -> ()",
325+
})})
288326
.evaluator({c10::Symbol::fromQualString("aten::neg"),
289327
[](const torch::jit::Node* n, kwargs& args) -> c10::optional<torch::jit::IValue> {
290328
auto el = args.at(n->input(0)).unwrapToInt();

core/conversion/evaluators/eval_macros.h

Lines changed: 47 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -77,6 +77,53 @@
7777
}, \
7878
EvalOptions().validSchemas(schemas)});
7979

80+
#define DEFINE_ARITHMATIC_TWO_INPUT_EVALUATOR(name, node_kind, operation, schemas) \
81+
auto name##_registrations TORCHTRT_UNUSED = RegisterNodeEvaluators().evaluator( \
82+
{c10::Symbol::fromQualString(node_kind), \
83+
[](const torch::jit::Node* n, kwargs& args) -> c10::optional<torch::jit::IValue> { \
84+
if (args.at(n->input(0)).IValue()->isInt()) { \
85+
auto a = args.at(n->input(0)).unwrapToInt(); \
86+
if (args.at(n->input(1)).IValue()->isInt()) { \
87+
auto b = args.at(n->input(1)).unwrapToInt(); \
88+
return operation; \
89+
} else if (args.at(n->input(1)).IValue()->isDouble()) { \
90+
auto b = args.at(n->input(1)).unwrapToDouble(); \
91+
return operation; \
92+
} else if (args.at(n->input(1)).IValue()->isBool()) { \
93+
auto b = args.at(n->input(1)).unwrapToBool(); \
94+
return operation; \
95+
} else { \
96+
TORCHTRT_THROW_ERROR( \
97+
"Unimplemented data type for " \
98+
<< node_kind << " evaluator b arg:" << args.at(n->input(1)).IValue()->type()->str()); \
99+
return {}; \
100+
} \
101+
} else if (args.at(n->input(0)).IValue()->isDouble()) { \
102+
auto a = args.at(n->input(0)).unwrapToDouble(); \
103+
if (args.at(n->input(1)).IValue()->isInt()) { \
104+
auto b = args.at(n->input(1)).unwrapToInt(); \
105+
return operation; \
106+
} else if (args.at(n->input(1)).IValue()->isDouble()) { \
107+
auto b = args.at(n->input(1)).unwrapToDouble(); \
108+
return operation; \
109+
} else if (args.at(n->input(1)).IValue()->isBool()) { \
110+
auto b = args.at(n->input(1)).unwrapToBool(); \
111+
return operation; \
112+
} else { \
113+
TORCHTRT_THROW_ERROR( \
114+
"Unimplemented data type for " \
115+
<< node_kind << " evaluator b arg:" << args.at(n->input(1)).IValue()->type()->str()); \
116+
return {}; \
117+
} \
118+
} else { \
119+
TORCHTRT_THROW_ERROR( \
120+
"Unimplemented data type for " \
121+
<< node_kind << " evaluator a arg: " << args.at(n->input(0)).IValue()->type()->str()); \
122+
return {}; \
123+
} \
124+
}, \
125+
EvalOptions().validSchemas(schemas)});
126+
80127
#define DEFINE_TWO_INPUT_SIMPLE_EVALUATOR(node_kind, node_name, operation, type, schemas) \
81128
auto node_kind##_registrations TORCHTRT_UNUSED = RegisterNodeEvaluators().evaluator( \
82129
{c10::Symbol::fromQualString(node_name), \

0 commit comments

Comments
 (0)