Update base for Update on "Distributed Autograd - FAST mode backward pass implementation." · pytorch/pytorch@0ea3425 · GitHub


Commit 0ea3425

pritam committed
Update base for Update on "Distributed Autograd - FAST mode backward pass implementation."

[test all] This change implements the "FAST" mode distributed autograd backward pass as described in #23110.

At a high level, the backward pass works as follows:

1. We start by computing dependencies on the node that calls `torch.distributed.backward`.
2. This node computes the dependencies starting from the root nodes provided in the backward call and all the 'send' functions present in the current autograd context. The "FAST" mode assumes all 'send' functions are part of the autograd computation.
3. Once the dependency computation is done, the distributed autograd engine calls the local autograd engine to execute the autograd graph. Note that the autograd graph on a single node is not necessarily connected because of inter-node communication. As a result, we have special handling to ensure the local autograd engine executes the entire graph starting from the provided roots and all 'send' functions on the node.
4. When the local autograd engine hits a 'recv' function, it performs an async RPC to send the gradients over to the appropriate node and stores a future in the autograd context to keep track of this RPC.
5. On the destination node, the appropriate 'send' function is looked up and enqueued on the local autograd engine. If this is the first time the node is hearing about this autograd context id on the backward pass, the node computes dependencies for the local autograd engine.
6. As part of computing dependencies, the distributed autograd engine discovers all leaf nodes and ensures those are passed as 'outputs' to the local autograd engine. This avoids running the 'AccumulateGrad' function.
7. The gradients computed for the leaf nodes are then accumulated in `DistAutogradContext` for the appropriate autograd context id.
8. The distributed autograd engine waits for the local autograd engine to complete and also waits for all the 'Futures' (stored in step 4) for the respective RPCs to finish.

We have made the following changes to the local autograd engine for this purpose:

1. Expose GraphTask and NodeTask so that the distributed autograd engine can use them.
2. Expose an `execute_with_graph_task` API, which allows the distributed engine to build a GraphTask and pass it to the local autograd engine.
3. Expose an `enqueue_on_cpu` API, which allows the distributed engine to build a `NodeTask` for a 'send' function and enqueue it on the local autograd engine.

In addition, a few general improvements:

1. Added a `PropagateGradients` RPC call for the 'recv' function to pass gradients to the appropriate node during the backward pass.
2. Use IValues as much as possible in serialization for RpcWithAutograd.
3. If `Future.wait()` receives a message of type EXCEPTION, we throw an appropriate exception instead of just returning the message. This is in line with what most Future.wait() APIs do, and was mostly done to ensure Future.wait() propagates errors correctly on the backward pass.
4. Added a `get_gradients(context_id)` API, which allows users to retrieve a map from Tensor to its respective gradient for the provided context_id on the local node (see the usage sketch below).

Differential Revision: [D17652615](https://our.internmc.facebook.com/intern/diff/D17652615/)

[ghstack-poisoned]
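As a usage sketch, here is roughly how this backward pass is driven from Python. It uses the `torch.distributed.rpc` / `torch.distributed.autograd` module names and signatures as they stabilized in later PyTorch releases, and assumes a two-worker RPC setup already exists; the exact entry point named above (`torch.distributed.backward`) may differ at this commit.

```python
import torch
import torch.distributed.autograd as dist_autograd
import torch.distributed.rpc as rpc

# Assumes rpc.init_rpc("worker0", rank=0, world_size=2) has already run here,
# with a peer "worker1" initialized the same way.
def run_backward_on_worker0():
    with dist_autograd.context() as context_id:
        t1 = torch.rand((3, 3), requires_grad=True)
        t2 = torch.rand((3, 3), requires_grad=True)
        # Forward pass: the RPC records a matching 'send'/'recv' pair in the
        # autograd graphs of the two workers.
        loss = rpc.rpc_sync("worker1", torch.add, args=(t1, t2)).sum()
        # FAST-mode backward: dependencies are computed from the root and from
        # every 'send' function in this context; remote failures propagate as
        # exceptions out of the underlying Future.wait() (improvement 3 above).
        dist_autograd.backward(context_id, [loss])
        # Gradients accumulate per-context rather than in t1.grad / t2.grad.
        return dist_autograd.get_gradients(context_id)
```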
2 parents 3876a60 + f35d7d4 commit 0ea3425

File tree

152 files changed (+13360, -1120 lines)


.circleci/config.yml

Lines changed: 44 additions & 0 deletions
@@ -1312,6 +1312,28 @@ jobs:
       - should_run_job
       - checkout
       - run_brew_for_ios_build
+      - run:
+          name: cert install
+          no_output_timeout: "1h"
+          command: |
+            set -e
+            PROJ_ROOT=/Users/distiller/project
+            cd ${PROJ_ROOT}/ios/TestApp
+            # install fastlane
+            sudo gem install bundler && bundle install
+            # install certificates
+            echo ${IOS_CERT_KEY} >> cert.txt
+            base64 --decode cert.txt -o Certificates.p12
+            rm cert.txt
+            bundle exec fastlane install_cert
+            # install the provisioning profile
+            PROFILE=TestApp_CI.mobileprovision
+            PROVISIONING_PROFILES=~/Library/MobileDevice/Provisioning\ Profiles
+            mkdir -pv "${PROVISIONING_PROFILES}"
+            cd "${PROVISIONING_PROFILES}"
+            echo ${IOS_SIGN_KEY} >> cert.txt
+            base64 --decode cert.txt -o ${PROFILE}
+            rm cert.txt
       - run:
           name: Build
           no_output_timeout: "1h"
@@ -1344,6 +1366,24 @@
             export IOS_ARCH=${IOS_ARCH}
             export IOS_PLATFORM=${IOS_PLATFORM}
             unbuffer ${PROJ_ROOT}/scripts/build_ios.sh 2>&1 | ts
+      - run:
+          name: Test
+          no_output_timeout: "30m"
+          command: |
+            set -e
+            PROJ_ROOT=/Users/distiller/project
+            PROFILE=TestApp_CI
+            # run the ruby build script
+            if ! [ -x "$(command -v xcodebuild)" ]; then
+              echo 'Error: xcodebuild is not installed.'
+              exit 1
+            fi
+            echo ${IOS_DEV_TEAM_ID}
+            ruby ${PROJ_ROOT}/scripts/xcode_build.rb -i ${PROJ_ROOT}/build_ios/install -x ${PROJ_ROOT}/ios/TestApp/TestApp.xcodeproj -p ${IOS_PLATFORM} -c ${PROFILE} -t ${IOS_DEV_TEAM_ID}
+            if ! [ "$?" -eq "0" ]; then
+              echo 'xcodebuild failed!'
+              exit 1
+            fi
 
   # update_s3_htmls job
   # These jobs create html files for every cpu/cu## folder in s3. The html
@@ -1925,14 +1965,18 @@ workflows:
       # Pytorch iOS PR builds
       - pytorch_ios_build:
           name: pytorch_ios_10_2_1_x86_64_build
+          context: org-member
           build_environment: "pytorch-ios-10.2.1-x86_64_build"
+          ios_arch: "x86_64"
           ios_platform: "SIMULATOR"
           requires:
             - setup
       - pytorch_ios_build:
           name: pytorch_ios_10_2_1_arm64_build
+          context: org-member
           build_environment: "pytorch-ios-10.2.1-arm64_build"
           ios_arch: "arm64"
+          ios_platform: "OS"
           requires:
             - setup
       - caffe2_linux_build:

.circleci/verbatim-sources/job-specs-custom.yml

Lines changed: 40 additions & 0 deletions
@@ -412,6 +412,28 @@
       - should_run_job
       - checkout
       - run_brew_for_ios_build
+      - run:
+          name: cert install
+          no_output_timeout: "1h"
+          command: |
+            set -e
+            PROJ_ROOT=/Users/distiller/project
+            cd ${PROJ_ROOT}/ios/TestApp
+            # install fastlane
+            sudo gem install bundler && bundle install
+            # install certificates
+            echo ${IOS_CERT_KEY} >> cert.txt
+            base64 --decode cert.txt -o Certificates.p12
+            rm cert.txt
+            bundle exec fastlane install_cert
+            # install the provisioning profile
+            PROFILE=TestApp_CI.mobileprovision
+            PROVISIONING_PROFILES=~/Library/MobileDevice/Provisioning\ Profiles
+            mkdir -pv "${PROVISIONING_PROFILES}"
+            cd "${PROVISIONING_PROFILES}"
+            echo ${IOS_SIGN_KEY} >> cert.txt
+            base64 --decode cert.txt -o ${PROFILE}
+            rm cert.txt
       - run:
           name: Build
           no_output_timeout: "1h"
@@ -444,3 +466,21 @@
             export IOS_ARCH=${IOS_ARCH}
             export IOS_PLATFORM=${IOS_PLATFORM}
             unbuffer ${PROJ_ROOT}/scripts/build_ios.sh 2>&1 | ts
+      - run:
+          name: Test
+          no_output_timeout: "30m"
+          command: |
+            set -e
+            PROJ_ROOT=/Users/distiller/project
+            PROFILE=TestApp_CI
+            # run the ruby build script
+            if ! [ -x "$(command -v xcodebuild)" ]; then
+              echo 'Error: xcodebuild is not installed.'
+              exit 1
+            fi
+            echo ${IOS_DEV_TEAM_ID}
+            ruby ${PROJ_ROOT}/scripts/xcode_build.rb -i ${PROJ_ROOT}/build_ios/install -x ${PROJ_ROOT}/ios/TestApp/TestApp.xcodeproj -p ${IOS_PLATFORM} -c ${PROFILE} -t ${IOS_DEV_TEAM_ID}
+            if ! [ "$?" -eq "0" ]; then
+              echo 'xcodebuild failed!'
+              exit 1
+            fi
Lines changed: 4 additions & 0 deletions
@@ -1,13 +1,17 @@
   # Pytorch iOS PR builds
   - pytorch_ios_build:
       name: pytorch_ios_10_2_1_x86_64_build
+      context: org-member
       build_environment: "pytorch-ios-10.2.1-x86_64_build"
+      ios_arch: "x86_64"
       ios_platform: "SIMULATOR"
       requires:
         - setup
   - pytorch_ios_build:
       name: pytorch_ios_10_2_1_arm64_build
+      context: org-member
       build_environment: "pytorch-ios-10.2.1-arm64_build"
       ios_arch: "arm64"
+      ios_platform: "OS"
       requires:
         - setup

aten/src/ATen/CMakeLists.txt

Lines changed: 3 additions & 2 deletions
@@ -449,9 +449,10 @@ endif()
 
 # https://stackoverflow.com/questions/11096471/how-can-i-install-a-hierarchy-of-files-using-cmake
 FOREACH(HEADER ${INSTALL_HEADERS})
-  string(REPLACE "${CMAKE_CURRENT_SOURCE_DIR}/" "" HEADER_SUB ${HEADER})
+  string(REPLACE "${CMAKE_CURRENT_SOURCE_DIR}/" "ATen/" HEADER_SUB ${HEADER})
+  string(REPLACE "${Caffe2_SOURCE_DIR}/" "" HEADER_SUB ${HEADER_SUB})
   GET_FILENAME_COMPONENT(DIR ${HEADER_SUB} DIRECTORY)
-  INSTALL(FILES ${HEADER} DESTINATION ${AT_INSTALL_INCLUDE_DIR}/ATen/${DIR})
+  INSTALL(FILES ${HEADER} DESTINATION "${AT_INSTALL_INCLUDE_DIR}/${DIR}")
 ENDFOREACH()
 
 # TODO: Install hip_generated_h when we have it

aten/src/ATen/Dispatch.h

Lines changed: 16 additions & 2 deletions
@@ -146,10 +146,24 @@ inline void deprecated_AT_DISPATCH_ALL_TYPES_AND_HALF_AND_COMPLEX() {}
     switch (_st) {                                                           \
       AT_PRIVATE_CASE_TYPE(at::ScalarType::Double, double, __VA_ARGS__)      \
       AT_PRIVATE_CASE_TYPE(at::ScalarType::Float, float, __VA_ARGS__)        \
-      AT_PRIVATE_CASE_TYPE(at::ScalarType::Half, at::Half, __VA_ARGS__)      \
       AT_PRIVATE_CASE_TYPE(at::ScalarType::ComplexDouble, std::complex<double>, __VA_ARGS__) \
       AT_PRIVATE_CASE_TYPE(at::ScalarType::ComplexFloat, std::complex<float>, __VA_ARGS__) \
-      AT_PRIVATE_CASE_TYPE(at::ScalarType::ComplexHalf, std::complex<at::Half>, __VA_ARGS__) \
+      default:                                                               \
+        AT_ERROR(#NAME, " not implemented for '", toString(_st), "'");       \
+    }                                                                        \
+  }()
+
+#define AT_DISPATCH_FLOATING_AND_COMPLEX_TYPES_AND1(SCALARTYPE, TYPE, NAME, ...) \
+  [&] {                                                                      \
+    const auto& the_type = TYPE;                                             \
+    /* don't use TYPE again in case it is an expensive or side-effect op */  \
+    at::ScalarType _st = ::detail::scalar_type(the_type);                    \
+    switch (_st) {                                                           \
+      AT_PRIVATE_CASE_TYPE(at::ScalarType::Double, double, __VA_ARGS__)      \
+      AT_PRIVATE_CASE_TYPE(at::ScalarType::Float, float, __VA_ARGS__)        \
+      AT_PRIVATE_CASE_TYPE(at::ScalarType::ComplexDouble, std::complex<double>, __VA_ARGS__) \
+      AT_PRIVATE_CASE_TYPE(at::ScalarType::ComplexFloat, std::complex<float>, __VA_ARGS__) \
+      AT_PRIVATE_CASE_TYPE(SCALARTYPE, decltype(c10::impl::ScalarTypeToCPPType<SCALARTYPE>::t), __VA_ARGS__) \
       default:                                                               \
         AT_ERROR(#NAME, " not implemented for '", toString(_st), "'");       \
     }                                                                        \
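The new `AT_DISPATCH_FLOATING_AND_COMPLEX_TYPES_AND1` macro follows the usual AT_DISPATCH pattern: a runtime dtype switch that instantiates the kernel body once per supported static type, with a loud error otherwise. A toy Python model of that behavior (plain Python, nothing here is PyTorch API):

```python
# Toy model of the AT_DISPATCH_* pattern: a runtime dtype tag selects a
# statically-specialized kernel; unsupported dtypes fail loudly, mirroring
# the macro's default: AT_ERROR(...) branch.
KERNELS = {
    "double": lambda: "double kernel",
    "float": lambda: "float kernel",
    "complex<double>": lambda: "complex<double> kernel",
    "complex<float>": lambda: "complex<float> kernel",
    "Half": lambda: "Half kernel",  # the extra "AND1" type slot
}

def dispatch(name, dtype):
    if dtype not in KERNELS:
        raise RuntimeError(f"{name} not implemented for '{dtype}'")
    return KERNELS[dtype]()

print(dispatch("my_op", "complex<float>"))  # -> complex<float> kernel
```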

aten/src/ATen/NumericUtils.h

Lines changed: 7 additions & 0 deletions
@@ -7,6 +7,7 @@
 #include <cmath>
 #include <type_traits>
 #include <c10/util/BFloat16.h>
+#include <c10/util/Complex.h>
 #include <c10/macros/Macros.h>
 
 namespace at {
@@ -31,6 +32,12 @@ inline C10_HOST_DEVICE bool _isnan(T val) {
 #endif
 }
 
+template <typename T,
+          typename std::enable_if<std::is_complex_t<T>::value, int>::type = 0>
+inline bool _isnan(T val) {
+  return std::isnan(std::real(val)) || std::isnan(std::imag(val));
+}
+
 inline C10_HOST_DEVICE bool _isnan(at::BFloat16 val) {
   return at::_isnan(float(val));
 }
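The new overload declares a complex value NaN when either of its components is NaN. Python's standard library implements the same predicate, which makes for a quick sanity check (illustration only, not PyTorch API):

```python
import cmath

# cmath.isnan is true if the real or the imaginary part is NaN, which is
# exactly the predicate the new _isnan overload computes.
print(cmath.isnan(complex(float("nan"), 1.0)))  # True
print(cmath.isnan(complex(1.0, 2.0)))           # False
```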

aten/src/ATen/core/ATenDispatch.h

Lines changed: 2 additions & 1 deletion
@@ -40,7 +40,8 @@ namespace impl {
 // question is whether or not we have access to all the relevant TLS at this
 // point.
 static inline TensorTypeId dispatchTypeId(TensorTypeSet ts) {
-  return (ts - c10::impl::tls_excluded_tensor_type_set()).highestPriorityTypeId();
+  c10::impl::LocalTensorTypeSet local = c10::impl::tls_local_tensor_type_set();
+  return ((ts | local.included_) - local.excluded_).highestPriorityTypeId();
 }
 
 }
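The change makes dispatch honor thread-locally included type ids in addition to excluded ones: local inclusions are unioned into the set, exclusions subtracted, and the highest-priority survivor wins. A toy Python model of that set arithmetic (id names and priority order illustrative):

```python
# Highest-priority dispatch id after applying thread-local overrides.
PRIORITY = ["VariableTensorId", "CUDATensorId", "CPUTensorId"]  # illustrative

def dispatch_type_id(ts, local_included, local_excluded):
    candidates = (set(ts) | local_included) - local_excluded
    return min(candidates, key=PRIORITY.index)  # earlier = higher priority

# With VariableTensorId locally excluded (cf. AutoNonVariableTypeMode below),
# dispatch falls through to the backend kernel:
print(dispatch_type_id({"VariableTensorId", "CPUTensorId"},
                       set(), {"VariableTensorId"}))  # -> CPUTensorId
```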

aten/src/ATen/core/CMakeLists.txt

Lines changed: 14 additions & 14 deletions
@@ -8,22 +8,22 @@ EXCLUDE(ATen_CORE_SRCS "${ATen_CORE_SRCS}" ${ATen_CORE_TEST_SRCS})
 
 # Add files needed from jit folders
 LIST(APPEND ATen_CORE_HEADERS
-  ${CMAKE_CURRENT_SOURCE_DIR}/../../../../torch/csrc/jit/source_range.h
-  ${CMAKE_CURRENT_SOURCE_DIR}/../../../../torch/csrc/jit/script/function_schema_parser.h
-  ${CMAKE_CURRENT_SOURCE_DIR}/../../../../torch/csrc/jit/script/lexer.h
-  ${CMAKE_CURRENT_SOURCE_DIR}/../../../../torch/csrc/jit/script/strtod.h
-  ${CMAKE_CURRENT_SOURCE_DIR}/../../../../torch/csrc/jit/script/parse_string_literal.h
-  ${CMAKE_CURRENT_SOURCE_DIR}/../../../../torch/csrc/jit/script/schema_type_parser.h
-  ${CMAKE_CURRENT_SOURCE_DIR}/../../../../torch/csrc/jit/script/error_report.h
-  ${CMAKE_CURRENT_SOURCE_DIR}/../../../../torch/csrc/jit/script/tree.h
+  ${Caffe2_SOURCE_DIR}/torch/csrc/jit/source_range.h
+  ${Caffe2_SOURCE_DIR}/torch/csrc/jit/script/function_schema_parser.h
+  ${Caffe2_SOURCE_DIR}/torch/csrc/jit/script/lexer.h
+  ${Caffe2_SOURCE_DIR}/torch/csrc/jit/script/strtod.h
+  ${Caffe2_SOURCE_DIR}/torch/csrc/jit/script/parse_string_literal.h
+  ${Caffe2_SOURCE_DIR}/torch/csrc/jit/script/schema_type_parser.h
+  ${Caffe2_SOURCE_DIR}/torch/csrc/jit/script/error_report.h
+  ${Caffe2_SOURCE_DIR}/torch/csrc/jit/script/tree.h
 )
 LIST(APPEND ATen_CORE_SRCS
-  ${CMAKE_CURRENT_SOURCE_DIR}/../../../../torch/csrc/jit/script/error_report.cpp
-  ${CMAKE_CURRENT_SOURCE_DIR}/../../../../torch/csrc/jit/script/function_schema_parser.cpp
-  ${CMAKE_CURRENT_SOURCE_DIR}/../../../../torch/csrc/jit/script/lexer.cpp
-  ${CMAKE_CURRENT_SOURCE_DIR}/../../../../torch/csrc/jit/script/strtod.cpp
-  ${CMAKE_CURRENT_SOURCE_DIR}/../../../../torch/csrc/jit/script/schema_type_parser.cpp
-  ${CMAKE_CURRENT_SOURCE_DIR}/../../../../torch/csrc/jit/source_range.cpp
+  ${Caffe2_SOURCE_DIR}/torch/csrc/jit/script/error_report.cpp
+  ${Caffe2_SOURCE_DIR}/torch/csrc/jit/script/function_schema_parser.cpp
+  ${Caffe2_SOURCE_DIR}/torch/csrc/jit/script/lexer.cpp
+  ${Caffe2_SOURCE_DIR}/torch/csrc/jit/script/strtod.cpp
+  ${Caffe2_SOURCE_DIR}/torch/csrc/jit/script/schema_type_parser.cpp
+  ${Caffe2_SOURCE_DIR}/torch/csrc/jit/source_range.cpp
 )
 
 # Pass to parent

aten/src/ATen/core/LegacyTypeDispatch.h

Lines changed: 10 additions & 12 deletions
@@ -12,6 +12,7 @@
 #include <c10/core/ScalarType.h>
 #include <c10/util/Exception.h>
 #include <ATen/core/LegacyDeviceTypeInit.h>
+#include <c10/core/impl/LocalTensorTypeSet.h>
 #include <c10/core/TensorImpl.h>
 #include <ATen/core/ATenDispatch.h>
 #include <ATen/core/TensorBody.h>
@@ -47,22 +48,19 @@ class CAFFE2_API LegacyTypeDispatch {
 
 CAFFE2_API LegacyTypeDispatch& globalLegacyTypeDispatch();
 
-// A RAII, thread local (!) guard that has the following effect:
-//
-// Upon construction: sets NonVariableTypeMode_enabled for the current thread to
-// control whether we are in non-Variable-type mode.
-//
-// Upon destruction: sets NonVariableTypeMode_enabled back to the original value.
+// A RAII, thread local (!) guard that will disable dispatch to variable
+// handler.
 //
 // See NOTE [ Treating Variables as non-Variables in type dispatch ] for details.
 struct CAFFE2_API AutoNonVariableTypeMode {
-  AutoNonVariableTypeMode(bool enabled) : prev_mode(NonVariableTypeMode::is_enabled()) {
-    NonVariableTypeMode::set_enabled(enabled);
-  }
-  ~AutoNonVariableTypeMode() {
-    NonVariableTypeMode::set_enabled(prev_mode);
+  // NB: The enabled parameter must ALWAYS be black, as Henry Ford used to say.
+  // TODO: Eliminate this parameter entirely
+  AutoNonVariableTypeMode(bool enabled = true) :
+    guard_(TensorTypeId::VariableTensorId) {
+
+    TORCH_INTERNAL_ASSERT(enabled);
   }
-  bool prev_mode;
+  c10::impl::ExcludeTensorTypeIdGuard guard_;
 };
 
 } // namespace at

aten/src/ATen/core/NamedTensor.cpp

Lines changed: 19 additions & 16 deletions
@@ -42,12 +42,6 @@ DimnameList default_names(size_t len) {
   return DimnameList(&all_unnamed.front(), len);
 }
 
-void check_names_valid_for(const Tensor& tensor, DimnameList names) {
-  return impl::check_names_valid_for(tensor.unsafeGetTensorImpl(), names);
-}
-
-namespace impl {
-
 static void check_unique_names(DimnameList names) {
   // Strategy: Compare each element with the ones that come after it.
   // Although this is O(N^2), in practice N is small (no more than 25).
@@ -62,6 +56,24 @@ static void check_unique_names(DimnameList names) {
   }
 }
 
+void check_names_valid_for(const Tensor& tensor, DimnameList names) {
+  return impl::check_names_valid_for(tensor.unsafeGetTensorImpl(), names);
+}
+
+void check_names_valid_for(int64_t tensor_dim, DimnameList names) {
+  TORCH_CHECK(
+      tensor_dim <= kMaxNamedTensorDim,
+      "Named tensors only support up to ", kMaxNamedTensorDim, " dims: "
+      "Attempted to create a tensor with dim ", tensor_dim, " with names ", names);
+  TORCH_CHECK(tensor_dim == names.size(),
+      "Number of names (", names.size(), ") and "
+      "number of dimensions in tensor (", tensor_dim, ") ",
+      "do not match. Attempted to create a tensor with names ", names);
+  check_unique_names(names);
+}
+
+namespace impl {
+
 static NamedTensorMeta* get_named_tensor_meta(TensorImpl* impl) {
   if (!NamesMode::is_enabled()) {
     return nullptr;
@@ -77,16 +89,7 @@ static const NamedTensorMeta* get_named_tensor_meta(const TensorImpl* impl) {
 }
 
 void check_names_valid_for(TensorImpl* impl, DimnameList names) {
-  auto ndim = impl->dim();
-  TORCH_CHECK(
-      ndim <= kMaxNamedTensorDim,
-      "Named tensors only support up to ", kMaxNamedTensorDim, " dims: "
-      "Attempted to create a tensor with dim ", ndim, " with names ", names);
-  TORCH_CHECK(ndim == names.size(),
-      "Number of names (", names.size(), ") and "
-      "number of dimensions in tensor (", ndim, ") ",
-      "do not match. Attempted to create a tensor with names ", names);
-  check_unique_names(names);
+  check_names_valid_for(impl->dim(), names);
 }
 
 void internal_set_names_inplace(TensorImpl* impl, optional<DimnameList> names) {
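The validation consolidated into `check_names_valid_for(int64_t, DimnameList)` is what users hit from Python when constructing named tensors (a prototype feature around this release). A minimal sketch, assuming the named tensor prototype is available:

```python
import torch

# One name per dimension passes validation:
t = torch.zeros(2, 3, names=("N", "C"))

# A name-count mismatch trips the TORCH_CHECK above, e.g.:
# "Number of names (1) and number of dimensions in tensor (2) do not match."
try:
    torch.zeros(2, 3, names=("N",))
except RuntimeError as e:
    print(e)
```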
