pytorch
diff --git a/‎caffe2/contrib/aten/aten_op_template.h
Lines changed: 2 additions & 1 deletion b/‎caffe2/contrib/aten/aten_op_template.h
Lines changed: 2 additions & 1 deletion
diff --git a/‎caffe2/core/IValueInterface.cc
Lines changed: 178 additions & 0 deletions b/‎caffe2/core/IValueInterface.cc
Lines changed: 178 additions & 0 deletions
diff --git a/‎caffe2/core/IValueInterface.h
Lines changed: 51 additions & 0 deletions b/‎caffe2/core/IValueInterface.h
Lines changed: 51 additions & 0 deletions
diff --git a/‎caffe2/core/export_caffe2_op_to_c10.h
Lines changed: 12 additions & 5 deletions b/‎caffe2/core/export_caffe2_op_to_c10.h
Lines changed: 12 additions & 5 deletions
diff --git a/‎caffe2/core/operator.cc
Lines changed: 13 additions & 41 deletions b/‎caffe2/core/operator.cc
Lines changed: 13 additions & 41 deletions
@@ -2,6 +2,7 @@
 #include <unordered_map>
 #include <string>
 #include <ATen/Functions.h>
+#include <ATen/core/List.h>
 #include <c10/macros/Macros.h>
 #include <caffe2/core/context.h>
 #include <caffe2/core/operator.h>
@@ -21,7 +22,7 @@ using at::Half; // for AT_FORALL_SCALAR_TYPES_AND3(Bool, Half, BFloat16, ...)
 namespace internal {
 TORCH_API at::Tensor index_with_uint8_handling(
     const at::Tensor& self,
-    const torch::List<c10::optional<at::Tensor>>& indices);
+    const c10::List<c10::optional<at::Tensor>>& indices);  // declaration only; c10::List presumably comes from the <ATen/core/List.h> include added in this hunk -- confirm
 }
 
 template <class Context>
 
@@ -0,0 +1,178 @@
+#define TORCH_ASSERT_NO_OPERATORS
+#include <caffe2/core/IValueInterface.h>
+#undef TORCH_ASSERT_NO_OPERATORS
+#include <ATen/core/ivalue.h>
+#include <c10/util/irange.h>
+
+#include <memory>
+
+namespace caffe2 {
+namespace detail {
+
+// Returns a caffe2::Tensor wrapping the result of at::Tensor::contiguous()
+// applied to `t`. The argument is consumed (moved into an at::Tensor).
+caffe2::Tensor contiguous(caffe2::Tensor t) {
+  at::Tensor as_aten(std::move(t));
+  return caffe2::Tensor(as_aten.contiguous());
+}
+
+
+// Copies the IValues referenced by `values` into a heap array owned by this
+// object; the array is released in the destructor.
+IValueInterface::IValueInterface(ArrayRef<c10::IValue> values)
+    : size_(values.size()) {
+  // Hold the allocation in a unique_ptr while the elements are copied so it
+  // is freed if a copy throws; ownership is handed to values_ only at the end.
+  auto owned = std::make_unique<c10::IValue[]>(size_);
+  std::copy(values.begin(), values.end(), owned.get());
+  values_ = owned.release();
+}
+
+IValueInterface::~IValueInterface() {  // releases the array allocated by the ArrayRef constructor
+  delete[] values_;  // values_ is nullptr for a default-constructed object; delete[] on nullptr is a no-op
+}
+
+// True when the argument at position `idx` holds a tensor list.
+// Bounds checking is delegated to at().
+bool IValueInterface::isTensorList(size_t idx) const {
+  const c10::IValue& value = at(idx);
+  return value.isTensorList();
+}
+
+// True when the argument at position `idx` holds a single tensor.
+// Bounds checking is delegated to at().
+bool IValueInterface::isTensor(size_t idx) const {
+  const c10::IValue& value = at(idx);
+  return value.isTensor();
+}
+
+// Bounds-checked access to the stored argument at position `idx`.
+// Fails a TORCH_INTERNAL_ASSERT when `idx` is not smaller than size_.
+const c10::IValue& IValueInterface::at(size_t idx) const {
+  TORCH_INTERNAL_ASSERT(
+      idx < size_,
+      "caffe2: Input index ",
+      idx,
+      " is out of range for call with ",
+      size_,
+      " arguments");
+  return values_[idx];
+}
+
+// Converts the tensor-list argument at `idx` into a std::vector holding one
+// caffe2::Tensor per list element, in list order.
+std::vector<caffe2::Tensor> IValueInterface::toTensorVector(size_t idx) const {
+  const auto tensors = at(idx).toTensorList();
+  const auto count = tensors.size();
+  std::vector<caffe2::Tensor> converted;
+  converted.reserve(count);
+  for (const auto i : c10::irange(count)) {
+    converted.emplace_back(tensors.get(i));
+  }
+  return converted;
+}
+
+// Wraps the tensor argument at position `idx` in a caffe2::Tensor.
+caffe2::Tensor IValueInterface::toTensor(size_t idx) const {
+  const c10::IValue& value = at(idx);
+  return caffe2::Tensor(value.toTensor());
+}
+
+// Number of tensor inputs represented by the stored arguments:
+//   - 0 when there are no arguments;
+//   - the length of the list when the first argument is a tensor list;
+//   - otherwise the count of tensor arguments, which must all precede any
+//     non-tensor argument (enforced with TORCH_INTERNAL_ASSERT).
+int IValueInterface::compute_input_size() const {
+  if (size() == 0) {
+    return 0;
+  }
+
+  const c10::IValue& first = values_[0];
+  if (first.isTensorList()) {
+    // With a leading tensor list, input tensors are obtained by indexing into
+    // that list. Only tensors from the list are accessible as inputs; any
+    // tensor arguments that follow the list are not.
+    return first.toTensorList().size();
+  }
+
+  // No leading tensor list: count the individual tensor arguments.
+  int num_tensor_inputs = 0;
+  bool found_nontensor = false;
+  for (const auto i : c10::irange(size_)) {
+    if (!values_[i].isTensor()) {
+      found_nontensor = true;
+      continue;
+    }
+    TORCH_INTERNAL_ASSERT(
+        !found_nontensor,
+        "All tensor arguments must come before non-tensor arguments");
+    ++num_tensor_inputs;
+  }
+  return num_tensor_inputs;
+}
+
+// Converts the argument at position `idx` to T via c10::IValue::to<T>().
+// Defined here rather than in the header; usable types are the ones
+// explicitly instantiated in this file.
+template <typename T>
+typename c10::detail::ivalue_to_const_ref_overload_return<T>::type
+IValueInterface::to(size_t idx) const {
+  const c10::IValue& value = at(idx);
+  return value.template to<T>();
+}
+
+// Explicit instantiations of IValueInterface::to<T>. The template is defined
+// only in this file, so a type must be listed here to be usable by callers.
+// The macro intentionally has no trailing semicolon; each use supplies one.
+#define INSTANTIATE_TO(Type) \
+  template typename c10::detail::ivalue_to_const_ref_overload_return<Type>::type \
+  IValueInterface::to<Type>(size_t idx) const
+
+INSTANTIATE_TO(at::Tensor);
+INSTANTIATE_TO(at::Storage);
+INSTANTIATE_TO(c10::Stream);
+INSTANTIATE_TO(float);
+INSTANTIATE_TO(double);
+INSTANTIATE_TO(c10::complex<double>);
+INSTANTIATE_TO(unsigned char);
+INSTANTIATE_TO(signed char);
+INSTANTIATE_TO(unsigned short);
+INSTANTIATE_TO(short);
+INSTANTIATE_TO(int);
+INSTANTIATE_TO(uint32_t);
+INSTANTIATE_TO(uint64_t);
+INSTANTIATE_TO(int64_t);
+INSTANTIATE_TO(bool);
+INSTANTIATE_TO(c10::intrusive_ptr<caffe2::Blob>);
+INSTANTIATE_TO(c10::intrusive_ptr<ivalue::ConstantString>);
+INSTANTIATE_TO(c10::intrusive_ptr<ivalue::Object>);
+INSTANTIATE_TO(at::Scalar);
+INSTANTIATE_TO(c10::List<int64_t>);
+INSTANTIATE_TO(c10::List<double>);
+INSTANTIATE_TO(c10::List<c10::complex<double>>);
+INSTANTIATE_TO(c10::List<bool>);
+INSTANTIATE_TO(c10::List<at::Tensor>);
+INSTANTIATE_TO(c10::impl::GenericList);
+INSTANTIATE_TO(c10::impl::GenericDict);
+INSTANTIATE_TO(c10::intrusive_ptr<ivalue::Tuple>);
+INSTANTIATE_TO(std::string);
+INSTANTIATE_TO(c10::string_view);
+INSTANTIATE_TO(c10::intrusive_ptr<ivalue::Future>);
+INSTANTIATE_TO(c10::intrusive_ptr<c10::RRefInterface>);
+INSTANTIATE_TO(c10::intrusive_ptr<at::Quantizer>);
+INSTANTIATE_TO(IValue);
+INSTANTIATE_TO(c10::Device);
+INSTANTIATE_TO(at::ScalarType);
+INSTANTIATE_TO(at::Layout);
+INSTANTIATE_TO(at::MemoryFormat);
+INSTANTIATE_TO(at::QScheme);
+INSTANTIATE_TO(at::Dimname);
+INSTANTIATE_TO(at::Generator);
+
+// Maps a requested vector element type T to the element type of the
+// c10::List it is read from in toVec(). By default the two are the same;
+// the specialisations below redirect narrower types to a wider one.
+template <typename T>
+struct list_value_type { using type = T; };
+
+// int and int16_t are read from a list of int64_t.
+template <>
+struct list_value_type<int> { using type = int64_t; };
+
+template <>
+struct list_value_type<int16_t> { using type = int64_t; };
+
+// float is read from a list of double.
+template <>
+struct list_value_type<float> { using type = double; };
+
+// Copies every element of `list` into a std::vector<T>, in order, converting
+// each element from the list's value type U to T.
+template <typename T, typename U>
+static std::vector<T> to_vector(const c10::List<U> &list) {
+  std::vector<T> ret;
+  // The final size is known up front, so allocate once instead of regrowing.
+  ret.reserve(list.size());
+  for (auto i: c10::irange(list.size())) {
+    // U can be wider than T (toVec reads int/int16_t from int64_t lists and
+    // float from double lists), so spell the conversion out explicitly.
+    ret.push_back(static_cast<T>(list.get(i)));
+  }
+  return ret;
+}
+
+// Reads the list argument at position `idx` and returns its elements as a
+// std::vector<T>. The list is fetched with the element type selected by
+// list_value_type<T>, then converted element-wise by to_vector.
+template <typename T>
+std::vector<T> IValueInterface::toVec(size_t idx) const {
+  using source_list_t = c10::List<typename list_value_type<T>::type>;
+  return to_vector<T>(to<source_list_t>(idx));
+}
+
+// Explicit instantiations of IValueInterface::toVec<T>. The template is
+// defined only in this file, so a type must be listed here to be usable.
+// The macro has no trailing semicolon; each use supplies exactly one.
+#define INSTANTIATE_TO_VEC(Type) \
+  template std::vector<Type> IValueInterface::toVec<Type>(size_t idx) const
+
+INSTANTIATE_TO_VEC(int64_t);
+INSTANTIATE_TO_VEC(int32_t);
+INSTANTIATE_TO_VEC(int16_t);
+INSTANTIATE_TO_VEC(float);
+INSTANTIATE_TO_VEC(double);
+INSTANTIATE_TO_VEC(bool);
+
+}}  // namespace caffe2::detail
@@ -0,0 +1,51 @@
+#pragma once
+#include <ATen/core/ivalue_to.h>
+#include <c10/util/ArrayRef.h>
+#include <caffe2/core/tensor.h>
+
+
+namespace c10 {
+class IValue;  // forward declaration only, so this header does not pull in the full IValue definition. NOTE(review): confirm the class-key (class vs struct) matches the real definition to avoid mismatched-tags warnings
+}
+
+namespace caffe2 {
+namespace detail {
+
+TORCH_API caffe2::Tensor contiguous(caffe2::Tensor);  // defined in IValueInterface.cc: converts to at::Tensor, calls contiguous(), and wraps the result back in a caffe2::Tensor
+
+// Holds a private copy of a call's IValue arguments and exposes typed
+// accessors for them. Only a forward declaration of c10::IValue is needed
+// here; every member that touches IValue is defined in IValueInterface.cc.
+class TORCH_API IValueInterface {
+public:
+  // Creates an empty interface (no arguments).
+  IValueInterface(): values_(nullptr), size_(0) {}
+  // Copies `values` into an array owned by this object.
+  IValueInterface(ArrayRef<c10::IValue> values);
+  // Releases the owned array.
+  ~IValueInterface();
+
+  // values_ is a raw owning pointer freed with delete[] in the destructor, so
+  // a member-wise copy would make two objects free the same array. Copying is
+  // therefore disabled.
+  IValueInterface(const IValueInterface&) = delete;
+  IValueInterface& operator=(const IValueInterface&) = delete;
+
+  // Type queries for the argument at position `idx` (bounds-checked).
+  bool isTensorList(size_t idx) const;
+  bool isTensor(size_t idx) const;
+
+  // Number of stored arguments.
+  size_t size() const {
+    return size_;
+  }
+  bool empty() const {
+    return size() == 0;
+  }
+
+  // Bounds-checked access to the argument at position `idx`.
+  const c10::IValue& at(size_t idx) const;
+  // Converts a tensor-list / tensor argument into caffe2::Tensor form.
+  std::vector<caffe2::Tensor> toTensorVector(size_t idx) const;
+  caffe2::Tensor toTensor(size_t idx) const;
+
+  // Number of tensor inputs: the length of a leading tensor list, or the
+  // count of leading tensor arguments otherwise.
+  int compute_input_size() const;
+
+  // These template functions are not defined in the header,
+  // but are explicitly instantiated in IValueInterface.cc
+  template <typename T>
+  typename c10::detail::ivalue_to_const_ref_overload_return<T>::type to(size_t idx) const;
+
+  template <typename T>
+  std::vector<T> toVec(size_t idx) const;
+
+private:
+  c10::IValue *values_;  // owning; allocated with new[] in the ArrayRef constructor
+  size_t size_;          // number of elements in values_
+};
+
+}}  // namespace caffe2::detail
@@ -8,6 +8,7 @@
 #include <ATen/core/grad_mode.h>
 #include <ATen/core/op_registration/op_registration.h>
 #include <torch/csrc/jit/frontend/function_schema_parser.h>
+#include <caffe2/core/tensor.h>
 #include <c10/core/CompileTimeFunctionPointer.h>
 #include <torch/library.h>
 #include <vector>
@@ -20,16 +21,22 @@ constexpr const char* PREALLOCATED_OUTPUT_ARGNAME =
 
 using _CallCaffe2OpFunc = c10::List<at::Tensor>(
     const c10::FunctionSchema& schema,
-    std::vector<c10::IValue>&& inputs,
-    c10::List<at::Tensor>&& outputs);
+    const std::vector<c10::IValue> &inputs,  // now taken by const reference instead of rvalue reference: the callee borrows the argument vector
+    c10::List<at::Tensor> &&outputs);
 
 template <class Caffe2Operator>
 inline c10::List<at::Tensor> _call_caffe2_op(
     const c10::FunctionSchema& schema,
-    std::vector<c10::IValue>&& inputs,
-    c10::List<at::Tensor>&& outputs) {
-  Caffe2Operator op(schema, std::move(inputs), std::move(outputs), -1);
+    const std::vector<c10::IValue> &inputs,
+    c10::List<at::Tensor> &&outputs) {
+  c10::SmallVector<caffe2::Tensor, 6> outputs_caffe2(outputs.size());
+  for (auto i : c10::irange(outputs.size())) {
+    outputs_caffe2[i] = caffe2::Tensor(outputs.get(i));
+  }
+
+  Caffe2Operator op(schema, inputs, outputs_caffe2, -1);
   op.Run(-1);
+
   auto op_outputs = std::move(op).move_output_tensors();
   TORCH_INTERNAL_ASSERT(outputs.size() == op_outputs.size());
   for (auto i : c10::irange(op_outputs.size())) {
 
@@ -1,3 +1,4 @@
+#define TORCH_ASSERT_NO_OPERATORS
 #include "caffe2/core/operator.h"
 
 #include <algorithm>
@@ -15,8 +16,12 @@
 #include "caffe2/proto/caffe2_pb.h"
 #include "caffe2/utils/proto_utils.h"
 #include "caffe2/utils/string_utils.h"
-#if !defined(CAFFE2_IS_XPLAT_BUILD) && !defined(C10_MOBILE)
-#include <ATen/core/List.h>
+
+#undef TORCH_ASSERT_NO_OPERATORS
+
+#if defined(EXPOSE_C2_OPS) ||                               \
+  !defined(CAFFE2_IS_XPLAT_BUILD) && !defined(C10_MOBILE)
+#include <ATen/core/function_schema.h>
 #endif
 
 #include "caffe2/core/export_c10_op_to_caffe2.h"
@@ -86,51 +91,18 @@ OperatorBase::OperatorBase(const OperatorDef& operator_def, Workspace* ws)
 
 #if defined(EXPOSE_C2_OPS) || \
     !defined(CAFFE2_IS_XPLAT_BUILD) && !defined(C10_MOBILE)
-namespace {
-int C10_UNUSED // Suppress unused function warning on mobile.
-compute_input_size_(const std::vector<c10::IValue>& inputs) {
-  if (inputs.empty()) {
-    return 0;
-  }
-  if (inputs[0].isTensorList()) {
-    // if the first input is a tensor list, we get input tensors by indexing
-    // into that list. currently, this means that only tensors from that list
-    // are accessible as inputs. any hypothetical input tensors that come after
-    // the list are not accessible.
-    return inputs[0].toTensorVector().size();
-  }
-  // it's not a tensor list. Count the number of tensor inputs and return them.
-  size_t num_tensor_inputs = 0;
-  bool found_nontensor = false;
-  for (const auto& input : inputs) {
-    if (input.isTensor()) {
-      AT_ASSERTM(
-          !found_nontensor,
-          "All tensor arguments must come before non-tensor arguments");
-      ++num_tensor_inputs;
-    } else {
-      found_nontensor = true;
-    }
-  }
-  return num_tensor_inputs;
-}
-} // namespace
 
 // NOLINTNEXTLINE(cppcoreguidelines-pro-type-member-init)
 OperatorBase::OperatorBase(
     const c10::FunctionSchema& fn_schema,
-    std::vector<c10::IValue> inputs,
-    const c10::List<at::Tensor> &outputs)
+    c10::ArrayRef<c10::IValue> inputs,
+    c10::ArrayRef<caffe2::Tensor> outputs)
     // NOLINTNEXTLINE(performance-move-const-arg)
-    : fn_schema_(make_unique<c10::FunctionSchema>(std::move(fn_schema))),
-      newstyle_inputs_(std::move(inputs)),
-      input_size_(compute_input_size_(newstyle_inputs_)) {
+    : fn_schema_(new c10::FunctionSchema(std::move(fn_schema))),  // fn_schema is a const&, so this copy-constructs despite the std::move
+      newstyle_inputs_(inputs),
+      output_tensors_(outputs.vec()),  // copies the caller's tensor handles out of the non-owning ArrayRef
+      input_size_(newstyle_inputs_.compute_input_size()) {  // NOTE(review): reads newstyle_inputs_, so that member must be declared before input_size_ in operator.h -- confirm
   input_tensors_.resize(input_size_);
-
-  output_tensors_.reserve(outputs_.size());
-  for (auto i : c10::irange(outputs.size())) {
-    output_tensors_.emplace_back(outputs.extract(i));
-  }
 }
 #endif