Reland 2 of Merge more symbolic meta kernels and symint changes from … · csarofeen/pytorch@978b46d · GitHub

Commit 978b46d

albanD authored and pytorchmergebot committed
Reland 2 of Merge more symbolic meta kernels and symint changes from branch (pytorch#86334) (pytorch#86488)
symintify split_with_sizes, dropout, fused_fake_obs_quant
meta for padding_2d ops
add meta_bernoulli_
meta kernel for at::gather
get pytorch_struct to pass: meta for scatter_add, fix backward
symintify split ops

Pull Request resolved: pytorch#86488
Approved by: https://github.com/ezyang
1 parent 55663b7 · commit 978b46d
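The commit message groups several symbolic-shape (SymInt) and meta-kernel changes. As a rough illustration only (not part of the commit), the sketch below shows the kind of symbolic tracing these kernels unblock; it assumes make_fx with tracing_mode="symbolic" from torch.fx.experimental.proxy_tensor behaves as on master around this commit, and the function and inputs are hypothetical:

    import torch
    from torch.fx.experimental.proxy_tensor import make_fx

    def f(x, index):
        # split with a size list containing a symbolic size (x.size(0) - 1),
        # plus gather and scatter_add, all of which gain symbolic support here.
        top, rest = torch.split(x, [1, x.size(0) - 1], dim=0)
        picked = torch.gather(rest, 0, index)
        return torch.zeros_like(rest).scatter_add(0, index, picked)

    gm = make_fx(f, tracing_mode="symbolic")(torch.randn(5, 3),
                                             torch.zeros(1, 3, dtype=torch.long))
    print(gm.graph)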

File tree

17 files changed: +324 -65 lines changed

aten/src/ATen/FunctionalInverses.cpp

Lines changed: 11 additions & 11 deletions

@@ -177,31 +177,31 @@ Tensor FunctionalInverses::slice_copy_Tensor_inverse(const Tensor& base, const T
   return base.slice_scatter_symint(mutated_view, dim, start, end, step);
 }
 
-Tensor FunctionalInverses::split_copy_Tensor_inverse(const Tensor& base, const Tensor& mutated_view, bool reapply_views, int64_t mutated_view_idx, int64_t split_size, int64_t dim) {
+Tensor FunctionalInverses::split_copy_Tensor_inverse(const Tensor& base, const Tensor& mutated_view, bool reapply_views, int64_t mutated_view_idx, c10::SymInt split_size, int64_t dim) {
   // It would be nice if this logic could be re-used from autograd's split_backward(), but I don't think it can.
   // For functionalization, we have only have one of the tensors from the TensorList outputed by split(), and we want to layer i
   // on top of the base tensor.
   // For autograd, we have all of the tensors outputted by split() and we just want to stack them.
-  dim = at::maybe_wrap_dim(dim, base.sizes().size());
-  auto dim_size = base.size(dim);
-  auto start = mutated_view_idx * split_size;
-  auto end = start + split_size;
+  dim = at::maybe_wrap_dim(dim, base.dim());
+  auto dim_size = base.sym_size(dim);
+  auto start = split_size * mutated_view_idx;
+  auto end = split_size + start;
   if (end > dim_size) end = dim_size;
   // Pessimism: we can't reapply views for slice_scatter.
-  return base.slice_scatter(mutated_view, dim, start, end, 1);
+  return base.slice_scatter_symint(mutated_view, dim, start, end, 1);
 }
 
-Tensor FunctionalInverses::split_with_sizes_copy_inverse(const Tensor& base, const Tensor& mutated_view, bool reapply_views, int64_t mutated_view_idx, at::IntArrayRef split_sizes, int64_t dim) {
-  dim = at::maybe_wrap_dim(dim, base.sizes().size());
-  auto dim_size = base.size(dim);
-  int64_t start = 0;
+Tensor FunctionalInverses::split_with_sizes_copy_inverse(const Tensor& base, const Tensor& mutated_view, bool reapply_views, int64_t mutated_view_idx, c10::SymIntArrayRef split_sizes, int64_t dim) {
+  dim = at::maybe_wrap_dim(dim, base.dim());
+  auto dim_size = base.sym_size(dim);
+  c10::SymInt start = 0;
   for (auto i = 0; i < mutated_view_idx; ++i) {
     start += split_sizes[i];
   }
   auto end = start + split_sizes[mutated_view_idx];
   if (end > dim_size) end = dim_size;
   // Pessimism: we can't reapply views for slice_scatter.
-  return base.slice_scatter(mutated_view, dim, start, end, 1);
+  return base.slice_scatter_symint(mutated_view, dim, start, end, 1);
 }
 
 Tensor FunctionalInverses::squeeze_copy_inverse(const Tensor& base, const Tensor& mutated_view, bool reapply_views) {
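A minimal Python sketch (not part of the commit) of the slice arithmetic the inverse relies on: view i produced by split(base, split_size, dim) covers the index range [i * split_size, min(i * split_size + split_size, dim_size)) along dim, so the functional inverse can write a mutated view back into the base with slice_scatter over exactly that range.

    import torch

    base = torch.arange(10.).reshape(5, 2)
    split_size, i = 2, 2                             # last chunk is ragged (size 1)
    view = base.split(split_size, dim=0)[i]
    start = i * split_size                           # 4
    end = min(start + split_size, base.size(0))      # clamped to dim_size = 5
    # Writing a mutated copy of the view back into the base:
    restored = base.slice_scatter(view * 10, dim=0, start=start, end=end, step=1)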

aten/src/ATen/functorch/BatchRulesDecompositions.cpp

Lines changed: 1 addition & 1 deletion

@@ -200,7 +200,7 @@ TORCH_LIBRARY_IMPL(aten, FuncTorchBatched, m) {
   OP_DECOMPOSE(special_multigammaln);
   OP_DECOMPOSE(special_polygamma);
   OP_DECOMPOSE(special_softmax);
-  OP_DECOMPOSE2(split, sizes);
+  m.impl("split.sizes", native::split_symint);
   OP_DECOMPOSE(square);
   OP_DECOMPOSE(numpy_T);
   OP_DECOMPOSE(reshape_as);
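Under the FuncTorchBatched key, split.sizes is now routed to native::split_symint, which (per the TensorShape.cpp change below) simply forwards to split_with_sizes. A minimal sketch (not part of the commit) of the user-visible equivalence this preserves:

    import torch

    x = torch.randn(6, 3)
    # split with a size list and split_with_sizes produce the same views.
    assert all(torch.equal(a, b)
               for a, b in zip(torch.split(x, [2, 4], dim=0),
                               x.split_with_sizes([2, 4], dim=0)))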

aten/src/ATen/native/Dropout.cpp

Lines changed: 4 additions & 4 deletions

@@ -12,17 +12,17 @@ template<bool inplace>
 using Ctype = typename std::conditional<inplace, Tensor&, Tensor>::type;
 
 Tensor make_feature_noise(const Tensor& input) {
-  auto input_sizes = input.sizes();
+  auto input_sizes = input.sym_sizes();
   TORCH_CHECK(input.dim() >= 2, "Feature dropout requires at least 2 dimensions in the input");
-  std::vector<int64_t> sizes;
+  std::vector<c10::SymInt> sizes;
   sizes.reserve(input.dim());
   sizes.push_back(input_sizes[0]);
   sizes.push_back(input_sizes[1]);
   for (const auto i : c10::irange(2, input.dim())) {
     (void)i; //Suppress unused variable warning
     sizes.push_back(1);
   }
-  return input.new_empty(sizes);
+  return input.new_empty_symint(sizes);
 }
 
 bool is_fused_kernel_acceptable(const Tensor& input, double p) {
@@ -46,7 +46,7 @@ Tensor multiply(const Tensor& input, const Tensor& noise) {
 template<bool feature_dropout, bool alpha_dropout, bool inplace, typename T>
 Ctype<inplace> _dropout_impl(T& input, double p, bool train) {
   TORCH_CHECK(p >= 0 && p <= 1, "dropout probability has to be between 0 and 1, but got ", p);
-  if (p == 0 || !train || input.numel() == 0) {
+  if (p == 0 || !train || input.sym_numel() == 0) {
     return input;
   }
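make_feature_noise builds the dropout mask with shape [N, C, 1, 1, ...], which is why feature dropout zeroes whole channels; the change only swaps concrete sizes for SymInt so the same logic works under symbolic shapes. A short illustration of the channel-wise behaviour (not part of the commit):

    import torch
    import torch.nn.functional as F

    x = torch.randn(2, 3, 4, 4)
    out = F.dropout2d(x, p=0.5, training=True)
    # Each (n, c) plane is either all zeros or the original plane scaled by 1 / (1 - p).
    channel_dropped = (out == 0).flatten(2).all(dim=-1)   # shape (2, 3)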

aten/src/ATen/native/TensorAdvancedIndexing.cpp

Lines changed: 1 addition & 1 deletion

@@ -1365,7 +1365,7 @@ Tensor gather_backward(const Tensor& grad, const Tensor& self, int64_t dim, cons
   if (sparse_grad) {
     return at::_gather_sparse_backward(self, dim, index, grad);
   }
-  auto result = grad.new_zeros(self.sizes());
+  auto result = grad.new_zeros_symint(self.sym_sizes());
   // for composite compliance, use out-of-place variant of
   // `scatter_add` if index tensor is a Tensor Subclass.
   if (isTensorSubclassLike(index)) {
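For dense gradients, gather_backward allocates zeros shaped like self and scatter-adds the incoming grad back at index along dim; the change only makes that allocation symbolic-shape aware. A small Python check of the same identity (not part of the commit):

    import torch

    inp = torch.randn(4, 3, requires_grad=True)
    index = torch.tensor([[0, 1, 2], [3, 2, 1]])
    out = torch.gather(inp, 0, index)
    out.sum().backward()
    # gather's backward is a scatter_add of the output grad (here all ones).
    manual = torch.zeros_like(inp).scatter_add(0, index, torch.ones_like(out))
    assert torch.equal(inp.grad, manual)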

aten/src/ATen/native/TensorShape.cpp

Lines changed: 7 additions & 7 deletions

@@ -723,19 +723,19 @@ std::vector<Tensor> chunk(const Tensor& self, int64_t chunks, int64_t dim) {
   TORCH_CHECK(chunks > 0,
            "chunk expects `chunks` to be greater than 0, got: ", chunks);
 
-  const auto dim_size = self.size(dim);
-  int64_t split_size = (dim_size + chunks - 1) / chunks;
+  const auto dim_size = self.sym_size(dim);
+  auto split_size = (dim_size + chunks - 1) / chunks;
 
   // We need to call split_with_sizes in the case where split_size and dimension size are 0, because
   // a call to split would discard the number of chunks (because we can have an arbitrary number of
   // 0-sized chunks adding up to 0). So, call split_with_sizes with the correct number of chunks,
   // eventually we will do this for all cases.
   if (split_size == 0 && dim_size == 0) {
-    std::vector<int64_t> split_sizes(chunks, split_size);
+    std::vector<c10::SymInt> split_sizes(chunks, split_size);
     split_sizes[chunks - 1] = split_size - (split_size * chunks - dim_size);
-    return self.split_with_sizes(split_sizes, dim);
+    return self.split_with_sizes_symint(split_sizes, dim);
   } else {
-    return self.split(split_size, dim);
+    return self.split_symint(split_size, dim);
   }
 }
 
@@ -2273,8 +2273,8 @@ std::vector<Tensor> split(const Tensor& self, int64_t split_size, int64_t dim) {
   return splits;
 }
 
-std::vector<Tensor> split(const Tensor& self, IntArrayRef sizes, int64_t dim) {
-  return at::split_with_sizes(self, sizes, dim);
+std::vector<Tensor> split_symint(const Tensor& self, c10::SymIntArrayRef sizes, int64_t dim) {
+  return at::split_with_sizes_symint(self, sizes, dim);
 }
 
 std::vector<Tensor> unsafe_split(const Tensor& self, int64_t split_size, int64_t dim) {
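chunk computes its per-chunk size by ceiling division, (dim_size + chunks - 1) / chunks, so the last chunk can be smaller, and both branches now go through the symint split entry points. A quick numeric check of that arithmetic (not part of the commit):

    import torch

    x = torch.randn(7, 3)
    chunks = 3
    split_size = -(-x.size(0) // chunks)       # ceiling division: (7 + 3 - 1) // 3 == 3
    pieces = x.chunk(chunks, dim=0)
    assert [p.size(0) for p in pieces] == [3, 3, 1]
    assert all(torch.equal(a, b) for a, b in zip(pieces, x.split(split_size, dim=0)))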

aten/src/ATen/native/native_functions.yaml

Lines changed: 11 additions & 9 deletions

@@ -4782,34 +4782,36 @@
     CUDA: softmax_backward_cuda_out
     MPS: softmax_backward_mps_out
 
-- func: unsafe_split.Tensor(Tensor self, int split_size, int dim=0) -> Tensor[]
+- func: unsafe_split.Tensor(Tensor self, SymInt split_size, int dim=0) -> Tensor[]
   variants: function, method
   device_check: NoCheck
   device_guard: False
   dispatch:
     CompositeExplicitAutograd: unsafe_split
   autogen: unsafe_split.Tensor_out
 
-- func: split.Tensor(Tensor(a -> *) self, int split_size, int dim=0) -> Tensor(a)[]
+- func: split.Tensor(Tensor(a -> *) self, SymInt split_size, int dim=0) -> Tensor(a)[]
   variants: function, method
   device_check: NoCheck
   device_guard: False
   dispatch:
     CompositeExplicitAutograd: split
 
-- func: split.sizes(Tensor(a -> *) self, int[] split_size, int dim=0) -> Tensor(a)[]
+- func: split.sizes(Tensor(a -> *) self, SymInt[] split_size, int dim=0) -> Tensor(a)[]
   variants: function, method
   device_guard: False
+  dispatch:
+    CompositeImplicitAutograd: split_symint
 
-- func: unsafe_split_with_sizes(Tensor self, int[] split_sizes, int dim=0) -> Tensor[]
+- func: unsafe_split_with_sizes(Tensor self, SymInt[] split_sizes, int dim=0) -> Tensor[]
   variants: function, method
   device_check: NoCheck
   device_guard: False
   dispatch:
     CompositeExplicitAutograd: unsafe_split_with_sizes
   autogen: unsafe_split_with_sizes.out
 
-- func: split_with_sizes(Tensor(a -> *) self, int[] split_sizes, int dim=0) -> Tensor(a)[]
+- func: split_with_sizes(Tensor(a -> *) self, SymInt[] split_sizes, int dim=0) -> Tensor(a)[]
   variants: function, method
   device_check: NoCheck
   device_guard: False
@@ -12810,13 +12812,13 @@
     CompositeExplicitAutogradNonFunctional: slice_copy_Tensor
   tags: view_copy
 
-- func: split_copy.Tensor(Tensor self, int split_size, int dim=0) -> Tensor[]
+- func: split_copy.Tensor(Tensor self, SymInt split_size, int dim=0) -> Tensor[]
   variants: function
   dispatch:
     CompositeExplicitAutogradNonFunctional: split_copy_Tensor
   tags: view_copy
 
-- func: split_with_sizes_copy(Tensor self, int[] split_sizes, int dim=0) -> Tensor[]
+- func: split_with_sizes_copy(Tensor self, SymInt[] split_sizes, int dim=0) -> Tensor[]
   variants: function
   dispatch:
     CompositeExplicitAutogradNonFunctional: split_with_sizes_copy
@@ -13022,13 +13024,13 @@
     CompositeExplicitAutograd: slice_copy_Tensor_out
 
 
-- func: split_copy.Tensor_out(Tensor self, int split_size, int dim=0, *, Tensor(a!)[] out) -> ()
+- func: split_copy.Tensor_out(Tensor self, SymInt split_size, int dim=0, *, Tensor(a!)[] out) -> ()
   variants: function
   dispatch:
     CompositeExplicitAutograd: split_copy_Tensor_out
 
 
-- func: split_with_sizes_copy.out(Tensor self, int[] split_sizes, int dim=0, *, Tensor(a!)[] out) -> ()
+- func: split_with_sizes_copy.out(Tensor self, SymInt[] split_sizes, int dim=0, *, Tensor(a!)[] out) -> ()
   variants: function
   dispatch:
     CompositeExplicitAutograd: split_with_sizes_copy_out

aten/src/ATen/native/quantized/cpu/fused_obs_fake_quant.cpp

Lines changed: 1 addition & 1 deletion

@@ -236,7 +236,7 @@ at::Tensor fused_moving_avg_obs_fake_quant(
     const int64_t ch_axis,
     bool per_row_fake_quant,
     bool symmetric_quant) {
-  if (self.numel() == 0) {
+  if (self.sym_numel() == 0) {
     return self.clone();
   }
   const auto res = at::_fused_moving_avg_obs_fq_helper(

c10/core/SymFloatNodeImpl.cpp

Lines changed: 4 additions & 0 deletions

@@ -13,4 +13,8 @@ c10::SymIntNode SymFloatNodeImpl::ceil() {
   TORCH_CHECK(false, "NYI");
 }
 
+c10::SymIntNode SymFloatNodeImpl::floor() {
+  TORCH_CHECK(false, "NYI");
+}
+
 } // namespace c10

c10/core/SymFloatNodeImpl.h

Lines changed: 1 addition & 0 deletions

@@ -60,6 +60,7 @@ class C10_API SymFloatNodeImpl : public c10::intrusive_ptr_target {
     TORCH_CHECK(false, "NYI");
   };
   virtual SymIntNode ceil();
+  virtual SymIntNode floor();
   virtual std::string str() {
     TORCH_CHECK(false, "NYI");
   };

functorch/test/test_aotdispatch.py

Lines changed: 0 additions & 4 deletions

@@ -785,7 +785,6 @@ def assert_compiler(gm: torch.fx.GraphModule, _):
     xfail('fmax', ''),  # aten.logical_or_.default - couldn't find symbolic meta function/decomposition
     xfail('fmin', ''),  # aten.logical_or_.default - couldn't find symbolic meta function/decomposition
     xfail('frexp', ''),  # aten.frexp.Tensor - couldn't find symbolic meta function/decomposition
-    xfail('gather', ''),  # aten.gather.default - couldn't find symbolic meta function/decomposition
     xfail('gradient', ''),  # Cannot call sizes() on tensor with symbolic sizes/strides
     xfail('hsplit', ''),  # Cannot call sizes() on tensor with symbolic sizes/strides
     xfail('i0', ''),  # aten.i0.default - couldn't find symbolic meta function/decomposition
@@ -975,7 +974,6 @@ def assert_compiler(gm: torch.fx.GraphModule, _):
     xfail('round', 'decimals_0'),  # aten.round.decimals - couldn't find symbolic meta function/decomposition
     xfail('round', 'decimals_3'),  # aten.round.decimals - couldn't find symbolic meta function/decomposition
     xfail('round', 'decimals_neg_3'),  # aten.round.decimals - couldn't find symbolic meta function/decompos...
-    xfail('scatter_add', ''),  # aten.scatter_add.default - couldn't find symbolic meta function/decomposition
     xfail('scatter', ''),  # aten.scatter.src - couldn't find symbolic meta function/decomposition
     xfail('scatter_reduce', 'amax'),  # aten.scatter_reduce.two - couldn't find symbolic meta function/decom...
     xfail('scatter_reduce', 'amin'),  # aten.scatter_reduce.two - couldn't find symbolic meta function/decom...
@@ -993,8 +991,6 @@ def assert_compiler(gm: torch.fx.GraphModule, _):
     xfail('special.polygamma', 'special_polygamma_n_0'),  # aten.polygamma.default - couldn't find symbolic ...
     xfail('special.xlog1py', ''),  # aten.special_xlog1py.default - couldn't find symbolic meta function/deco...
     xfail('split', ''),  # Cannot call sizes() on tensor with symbolic sizes/strides
-    xfail('split', 'list_args'),  # Cannot call sizes() on tensor with symbolic sizes/strides
-    xfail('split_with_sizes', ''),  # Cannot call sizes() on tensor with symbolic sizes/strides
     xfail('squeeze', ''),  # Cannot call sizes() on tensor with symbolic sizes/strides
     xfail('std', ''),  # Cannot call numel() on tensor with symbolic sizes/strides
     xfail('std_mean', ''),  # Cannot call numel() on tensor with symbolic sizes/strides
