Update on "Make TS recognize input arg name" · pytorch/pytorch@15ded21

Commit 15ded21

Update on "Make TS recognize input arg name"
This PR allows TS schema_matching to match the input arg with self for aten operators. This is because operators in their functional form have input as a parameter instead of self. Fixes: #71994. Differential Revision: [D34427556](https://our.internmc.facebook.com/intern/diff/D34427556) [ghstack-poisoned]
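For context, a minimal sketch of the behavior this enables; the operator and values below are illustrative only and are not taken from this PR. In TorchScript, passing the keyword argument input to an aten operator whose schema names its first argument self can now be resolved by schema matching:

    import torch

    @torch.jit.script
    def clamp_by_keyword(x: torch.Tensor) -> torch.Tensor:
        # aten::clamp's schema names its first argument "self", while the
        # functional form documents it as "input"; with this change TS
        # schema matching accepts the "input" keyword here.
        return torch.clamp(input=x, min=0.0, max=1.0)

    print(clamp_by_keyword(torch.randn(3)))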
2 parents 217b262 + cb90156 commit 15ded21

21 files changed, +745 -48 lines changed

aten/src/ATen/native/cuda/SummaryOps.cu

Lines changed: 3 additions & 3 deletions
@@ -311,7 +311,7 @@ Tensor _bincount_cuda_template(
         weights.options().layout_opt(),
         weights.options().device_opt(),
         weights.options().pinned_memory_opt());
-    auto ret = cuda::CUDA_tensor_histogram<weights_t, input_t, true>(
+    cuda::CUDA_tensor_histogram<weights_t, input_t, true>(
         output, self, weights, nbins, minvalue, maxvalue);
   } else {
     output = native::zeros(
@@ -320,7 +320,7 @@ Tensor _bincount_cuda_template(
         c10::nullopt /* layout */,
         DeviceType::CUDA,
         c10::nullopt /* pin_memory */);
-    auto ret = cuda::CUDA_tensor_histogram<int64_t, input_t, false>(
+    cuda::CUDA_tensor_histogram<int64_t, input_t, false>(
         output, self, weights, nbins, minvalue, maxvalue);
   }
   return output;
@@ -374,7 +374,7 @@ Tensor _histc_cuda_template(
 #endif
   TORCH_CHECK(minvalue < maxvalue, "max must be larger than min");

-  auto ret = cuda::CUDA_tensor_histogram<input_t, input_t, false>(
+  cuda::CUDA_tensor_histogram<input_t, input_t, false>(
       output, self, Tensor(), nbins, minvalue, maxvalue);
   return output;
 }

aten/src/ATen/native/cuda/UpSampleBilinear2d.cu

Lines changed: 2 additions & 8 deletions
@@ -456,7 +456,6 @@ C10_LAUNCH_BOUNDS_1(256) // 256 performs better then 1024
 __global__ void upsample_gen2d_aa_out_frame(
     const accscalar_t height_scale,
     const accscalar_t width_scale,
-    const bool align_corners,
     const PackedTensorAccessor64<scalar_t, 4> idata,
     PackedTensorAccessor64<scalar_t, 4> odata,
     const InterpFilter & interp_filter) {
@@ -550,7 +549,6 @@ C10_LAUNCH_BOUNDS_1(256) // 256 performs better then 1024
 __global__ void upsample_gen2d_aa_backward_out_frame(
     const accscalar_t height_scale,
     const accscalar_t width_scale,
-    const bool align_corners,
     PackedTensorAccessor64<scalar_t, 4> idata,
     const PackedTensorAccessor64<scalar_t, 4> odata,
     const InterpFilter & interp_filter) {
@@ -672,8 +670,6 @@ static void upsample_gen2d_aa_out_cuda_template(
   int output_height = output_size[0];
   int output_width = output_size[1];

-  int nbatch = input.size(0);
-  int channels = input.size(1);
   int input_height = input.size(2);
   int input_width = input.size(3);

@@ -735,7 +731,7 @@ static void upsample_gen2d_aa_out_cuda_template(
         <<<grid,
            block,
            shmem_size,
-           stream>>>(height_scale, width_scale, align_corners, idata, odata, interp_filter);
+           stream>>>(height_scale, width_scale, idata, odata, interp_filter);
     C10_CUDA_KERNEL_LAUNCH_CHECK();
   });

@@ -766,8 +762,6 @@ static void upsample_gen2d_aa_backward_out_cuda_template(
   int output_height = output_size[0];
   int output_width = output_size[1];

-  int nbatch = input_size[0];
-  int channels = input_size[1];
   int input_height = input_size[2];
   int input_width = input_size[3];

@@ -819,7 +813,7 @@ static void upsample_gen2d_aa_backward_out_cuda_template(
         <<<grid,
            block,
            shmem_size,
-           stream>>>(height_scale, width_scale, align_corners, idata, odata, interp_filter);
+           stream>>>(height_scale, width_scale, idata, odata, interp_filter);
     C10_CUDA_KERNEL_LAUNCH_CHECK();
   });
 }

aten/src/ATen/native/native_functions.yaml

Lines changed: 1 addition & 1 deletion
@@ -1366,7 +1366,7 @@
   device_guard: False
   dispatch:
     MkldnnCPU: copy_mkldnn_
-    SparseCPU, SparseCUDA, SparseHIP: copy_sparse_wrapper_
+    SparseCPU, SparseCUDA: copy_sparse_wrapper_
     CompositeExplicitAutograd: copy_
     SparseCsrCPU, SparseCsrCUDA: copy_sparse_csr_

caffe2/operators/elementwise_ops.cu

Lines changed: 3 additions & 0 deletions
@@ -119,6 +119,9 @@ void device_reduce<at::Half>(
     int N,
     Tensor* buffer,
     CUDAContext* context) {
+  (void)N; // Suppress unused variable warning
+  (void)buffer; // Suppress unused variable warning
+  (void)context; // Suppress unused variable warning
 #if TORCH_HIP_VERSION >= 210
   auto buffer_size = 1;

test/cpp/api/functional.cpp

Lines changed: 15 additions & 1 deletion
@@ -2174,7 +2174,7 @@ TEST_F(FunctionalTest, Interpolate) {
   }
 }

-TEST_F(FunctionalTest, Pad) {
+TEST_F(FunctionalTest, Pad1) {
   {
     auto input = torch::arange(6, torch::kDouble).reshape({1, 2, 3});
     auto output = F::pad(input, F::PadFuncOptions({1, 2}).mode(torch::kCircular));
@@ -2183,6 +2183,8 @@ TEST_F(FunctionalTest, Pad) {
     ASSERT_EQ(output.sizes(), std::vector<int64_t>({1, 2, 6}));
     ASSERT_TRUE(output.allclose(expected, 1e-04));
   }
+}
+TEST_F(FunctionalTest, Pad2) {
   {
     auto input = torch::arange(9, torch::kDouble).reshape({1, 1, 3, 3});
     auto output = F::pad(input, F::PadFuncOptions({3, 3, 3, 1}).mode(torch::kCircular));
@@ -2197,6 +2199,8 @@ TEST_F(FunctionalTest, Pad) {
     ASSERT_EQ(output.sizes(), std::vector<int64_t>({1, 1, 7, 9}));
     ASSERT_TRUE(output.allclose(expected, 1e-04));
   }
+}
+TEST_F(FunctionalTest, Pad3) {
   {
     auto input = torch::arange(12, torch::kDouble).reshape({1, 1, 2, 2, 3});
     auto output = F::pad(input, F::PadFuncOptions({3, 3, 2, 1, 2, 2}).mode(torch::kCircular));
@@ -2239,6 +2243,8 @@ TEST_F(FunctionalTest, Pad) {
     ASSERT_EQ(output.sizes(), std::vector<int64_t>({1, 1, 6, 5, 9}));
     ASSERT_TRUE(output.allclose(expected, 1e-04));
   }
+}
+TEST_F(FunctionalTest, Pad4) {
   {
     auto input = torch::arange(16, torch::kDouble).reshape({2, 2, 2, 2});
     auto output = F::pad(input, F::PadFuncOptions({1, 1, 1, 1}).mode(torch::kReflect));
@@ -2265,6 +2271,8 @@ TEST_F(FunctionalTest, Pad) {
     ASSERT_EQ(output.sizes(), std::vector<int64_t>({2, 2, 4, 4}));
     ASSERT_TRUE(output.allclose(expected, 1e-04));
   }
+}
+TEST_F(FunctionalTest, Pad5) {
   {
     auto input = torch::arange(12, torch::kDouble).reshape({1, 1, 2, 2, 3});
     auto output = F::pad(input, F::PadFuncOptions({1, 2, 2, 1, 1, 2}).mode(torch::kReplicate));
@@ -2301,6 +2309,8 @@ TEST_F(FunctionalTest, Pad) {
     ASSERT_EQ(output.sizes(), std::vector<int64_t>({1, 1, 5, 5, 6}));
     ASSERT_TRUE(output.allclose(expected, 1e-04));
   }
+}
+TEST_F(FunctionalTest, Pad6) {
   {
     auto input = torch::arange(18, torch::kDouble).reshape({1, 1, 3, 2, 3});
     auto output = F::pad(input, F::PadFuncOptions({0, 2, 1, 0, 1, 2}).mode(torch::kReflect));
@@ -2331,12 +2341,16 @@ TEST_F(FunctionalTest, Pad) {
     ASSERT_EQ(output.sizes(), std::vector<int64_t>({1, 1, 6, 3, 5}));
     ASSERT_TRUE(output.allclose(expected, 1e-04));
   }
+}
+TEST_F(FunctionalTest, Pad7) {
   {
     auto input = torch::ones({1, 1, 1, 1}, torch::kDouble);
     auto output = F::pad(input, F::PadFuncOptions({1, 1}).mode(torch::kConstant).value(0));
     ASSERT_EQ(output.sizes(), std::vector<int64_t>({1, 1, 1, 3}));
     auto expected = torch::tensor({{{{0., 1., 0.}}}}, torch::kDouble);
   }
+}
+TEST_F(FunctionalTest, Pad8) {
   {
     auto input = torch::ones({1, 1, 1, 1}, torch::kDouble);
     auto output = F::pad(input, F::PadFuncOptions({1, 1}));

test/onnx/test_pytorch_onnx_onnxruntime.py

Lines changed: 10 additions & 0 deletions
@@ -6308,6 +6308,16 @@ def forward(self, x):
         x = torch.randn(4, 2, 3, requires_grad=True)
         self.run_test(InplaceAddModel(), x)

+    def test_addcmul(self):
+        class AddcmulModel(torch.nn.Module):
+            def forward(self, x, t1, t2):
+                return torch.addcmul(x, t1, t2), torch.addcmul(x, t1, t2, value=2.2)
+
+        x = torch.randn(1, 3)
+        t1 = torch.randn(3, 1)
+        t2 = torch.randn(1, 3)
+        self.run_test(AddcmulModel(), (x, t1, t2))
+
     def test_rsqrt(self):
         class RsqrtModel(torch.nn.Module):
             def forward(self, x):

test/run_test.py

Lines changed: 9 additions & 1 deletion
@@ -821,6 +821,11 @@ def parse_args():
         " within a specified test module. For unspecified test modules with the bring-to-front "
         "option, all test cases will be run, as one may expect.",
     )
+    parser.add_argument(
+        "--dry-run",
+        action="store_true",
+        help="Only list the test that will run.",
+    )
     return parser.parse_args()


@@ -1022,7 +1027,10 @@ def main():
     selected_tests = get_selected_tests(options)

     if options.verbose:
-        print_to_stderr("Selected tests: {}".format(", ".join(selected_tests)))
+        print_to_stderr("Selected tests:\n {}".format("\n ".join(selected_tests)))
+
+    if options.dry_run:
+        return

     if options.coverage and not PYTORCH_COLLECT_COVERAGE:
         shell(["coverage", "erase"])

0 commit comments
