Implement DeviceType.h as header-only · pytorch/pytorch@d725b04 · GitHub
[go: up one dir, main page]

Skip to content

Commit d725b04

Browse files
committed
Implement DeviceType.h as header-only
Summary: Move c10/core/DeviceType.h to a separate torch/csrc/header_only directory. Still keep a copy of c10/core/DeviceType.h for backward compatibility. More header files will be moved as follow-up. CI to guard "header-only-ness" will be added later. ghstack-source-id: f415bf8 Pull Request resolved: #152787
1 parent 2e70eb1 commit d725b04

File tree

7 files changed

+310
-288
lines changed

7 files changed

+310
-288
lines changed

BUILD.bazel

+8
Original file line numberDiff line numberDiff line change
@@ -670,6 +670,14 @@ flatbuffer_cc_library(
670670
out_prefix = "torch/csrc/jit/serialization/",
671671
)
672672

673+
cc_library(
674+
name = "torch_standalone_headers",
675+
hdrs = glob([
676+
"torch/standalone/header_only/**/*.h"
677+
]),
678+
visibility = ["//visibility:public"],
679+
)
680+
673681
cc_library(
674682
name = "torch_headers",
675683
hdrs = if_cuda(

c10/core/DeviceType.cpp

-168
This file was deleted.

c10/core/DeviceType.h

+3-118
Original file line numberDiff line numberDiff line change
@@ -1,123 +1,8 @@
11
#pragma once
22

3-
// This is directly synchronized with caffe2/proto/caffe2.proto, but
4-
// doesn't require me to figure out how to get Protobuf headers into
5-
// ATen/core (which would require a lot more build system hacking.)
6-
// If you modify me, keep me synchronized with that file.
7-
8-
#include <c10/macros/Export.h>
9-
10-
#include <cstddef>
11-
#include <cstdint>
12-
#include <functional>
13-
#include <ostream>
14-
#include <string>
3+
#include <torch/standalone/header_only/core/DeviceType.h>
154

165
namespace c10 {
17-
18-
// These contains all device types that also have a BackendComponent
19-
// and therefore participate in per-backend functionality dispatch keys.
20-
// This is most backends except PrivateUse2 and PrivateUse3
21-
#define C10_FORALL_BACKEND_DEVICE_TYPES(_, extra) \
22-
_(CPU, extra) \
23-
_(CUDA, extra) \
24-
_(HIP, extra) \
25-
_(XLA, extra) \
26-
_(MPS, extra) \
27-
_(IPU, extra) \
28-
_(XPU, extra) \
29-
_(HPU, extra) \
30-
_(VE, extra) \
31-
_(Lazy, extra) \
32-
_(Meta, extra) \
33-
_(MTIA, extra) \
34-
_(PrivateUse1, extra)
35-
36-
enum class DeviceType : int8_t {
37-
CPU = 0,
38-
CUDA = 1, // CUDA.
39-
MKLDNN = 2, // Reserved for explicit MKLDNN
40-
OPENGL = 3, // OpenGL
41-
OPENCL = 4, // OpenCL
42-
IDEEP = 5, // IDEEP.
43-
HIP = 6, // AMD HIP
44-
FPGA = 7, // FPGA
45-
MAIA = 8, // ONNX Runtime / Microsoft
46-
XLA = 9, // XLA / TPU
47-
Vulkan = 10, // Vulkan
48-
Metal = 11, // Metal
49-
XPU = 12, // XPU
50-
MPS = 13, // MPS
51-
Meta = 14, // Meta (tensors with no data)
52-
HPU = 15, // HPU / HABANA
53-
VE = 16, // SX-Aurora / NEC
54-
Lazy = 17, // Lazy Tensors
55-
IPU = 18, // Graphcore IPU
56-
MTIA = 19, // Meta training and inference devices
57-
PrivateUse1 = 20, // PrivateUse1 device
58-
// NB: If you add more devices:
59-
// - Change the implementations of DeviceTypeName and isValidDeviceType
60-
// in DeviceType.cpp
61-
// - Change the number below
62-
COMPILE_TIME_MAX_DEVICE_TYPES = 21,
63-
};
64-
65-
constexpr DeviceType kCPU = DeviceType::CPU;
66-
constexpr DeviceType kCUDA = DeviceType::CUDA;
67-
constexpr DeviceType kHIP = DeviceType::HIP;
68-
constexpr DeviceType kFPGA = DeviceType::FPGA;
69-
constexpr DeviceType kMAIA = DeviceType::MAIA;
70-
constexpr DeviceType kXLA = DeviceType::XLA;
71-
constexpr DeviceType kMPS = DeviceType::MPS;
72-
constexpr DeviceType kMeta = DeviceType::Meta;
73-
constexpr DeviceType kVulkan = DeviceType::Vulkan;
74-
constexpr DeviceType kMetal = DeviceType::Metal;
75-
constexpr DeviceType kXPU = DeviceType::XPU;
76-
constexpr DeviceType kHPU = DeviceType::HPU;
77-
constexpr DeviceType kVE = DeviceType::VE;
78-
constexpr DeviceType kLazy = DeviceType::Lazy;
79-
constexpr DeviceType kIPU = DeviceType::IPU;
80-
constexpr DeviceType kMTIA = DeviceType::MTIA;
81-
constexpr DeviceType kPrivateUse1 = DeviceType::PrivateUse1;
82-
83-
// define explicit int constant
84-
constexpr int COMPILE_TIME_MAX_DEVICE_TYPES =
85-
static_cast<int>(DeviceType::COMPILE_TIME_MAX_DEVICE_TYPES);
86-
87-
static_assert(
88-
COMPILE_TIME_MAX_DEVICE_TYPES <= 21,
89-
"Hey! You seem to be adding a lot of new DeviceTypes. The intent was "
90-
"for this constant to reflect the actual number of DeviceTypes we support "
91-
"in PyTorch; it's important that this number is not too large as we "
92-
"use this to allocate stack arrays in some places in our code. If you "
93-
"are indeed just adding the 20th device type, feel free to change "
94-
"the check to 32; but if you are adding some sort of extensible device "
95-
"types registration, please be aware that you are affecting code that "
96-
"assumes this number is small. Try auditing uses of this constant.");
97-
98-
C10_API std::string DeviceTypeName(DeviceType d, bool lower_case = false);
99-
100-
C10_API bool isValidDeviceType(DeviceType d);
101-
102-
C10_API std::ostream& operator<<(std::ostream& stream, DeviceType type);
103-
104-
C10_API void register_privateuse1_backend(const std::string& backend_name);
105-
C10_API std::string get_privateuse1_backend(bool lower_case = true);
106-
107-
C10_API bool is_privateuse1_backend_registered();
108-
6+
using namespace torch::standalone;
7+
using torch::standalone::DeviceType;
1098
} // namespace c10
110-
111-
namespace std {
112-
template <>
113-
struct hash<c10::DeviceType> {
114-
std::size_t operator()(c10::DeviceType k) const {
115-
return std::hash<int>()(static_cast<int>(k));
116-
}
117-
};
118-
} // namespace std
119-
120-
namespace torch {
121-
// NOLINTNEXTLINE(misc-unused-using-decls)
122-
using c10::DeviceType;
123-
} // namespace torch

c10/core/build.bzl

+1
Original file line numberDiff line numberDiff line change
@@ -80,6 +80,7 @@ def define_targets(rules):
8080
deps = [
8181
":ScalarType",
8282
"//third_party/cpuinfo",
83+
"//:torch_standalone_headers",
8384
"//c10/macros",
8485
"//c10/util:TypeCast",
8586
"//c10/util:base",

caffe2/CMakeLists.txt

+6-2
Original file line numberDiff line numberDiff line change
@@ -1282,7 +1282,8 @@ endif()
12821282
target_include_directories(torch_cpu PRIVATE ${ATen_CPU_INCLUDE})
12831283

12841284
target_include_directories(torch_cpu PRIVATE
1285-
${TORCH_SRC_DIR}/csrc)
1285+
${TORCH_SRC_DIR}/csrc
1286+
${TORCH_SRC_DIR}/standalone)
12861287

12871288
target_include_directories(torch_cpu PRIVATE
12881289
${TORCH_ROOT}/third_party/miniz-3.0.2)
@@ -1301,9 +1302,12 @@ target_include_directories(torch_cpu PRIVATE
13011302
target_include_directories(torch_cpu PRIVATE
13021303
${TORCH_ROOT}/third_party/nlohmann/include)
13031304

1304-
install(DIRECTORY "${TORCH_SRC_DIR}/csrc"
1305+
install(DIRECTORY
1306+
"${TORCH_SRC_DIR}/csrc"
1307+
"${TORCH_SRC_DIR}/standalone"
13051308
DESTINATION ${TORCH_INSTALL_INCLUDE_DIR}/torch
13061309
FILES_MATCHING PATTERN "*.h" PATTERN "*.hpp")
1310+
13071311
install(FILES
13081312
"${TORCH_SRC_DIR}/script.h"
13091313
"${TORCH_SRC_DIR}/extension.h"

torch/CMakeLists.txt

+1
Original file line numberDiff line numberDiff line change
@@ -74,6 +74,7 @@ set(TORCH_PYTHON_INCLUDE_DIRECTORIES
7474
${TORCH_SRC_DIR}/csrc
7575
${TORCH_SRC_DIR}/csrc/api/include
7676
${TORCH_SRC_DIR}/lib
77+
${TORCH_SRC_DIR}/standalone
7778
)
7879

7980
list(APPEND TORCH_PYTHON_INCLUDE_DIRECTORIES ${LIBSHM_SRCDIR})

0 commit comments

Comments
 (0)
0