2025-05-01 nightly release (3849fd13de1a5ee727fd64351edb0d3b1bb637a9) · pytorch/pytorch@8c7f928 · GitHub
[go: up one dir, main page]

Skip to content

Commit 8c7f928

Browse files
author
pytorchbot
committed
2025-05-01 nightly release (3849fd1)
1 parent 43be185 commit 8c7f928

File tree

119 files changed

+6022
-2077
lines changed

Some content is hidden

Large commits have some content hidden by default. Use the search box below to find content that may be hidden.

119 files changed

+6022
-2077
lines changed

.ci/docker/almalinux/Dockerfile

Lines changed: 7 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -1,5 +1,6 @@
11
ARG CUDA_VERSION=12.4
22
ARG BASE_TARGET=cuda${CUDA_VERSION}
3+
ARG ROCM_IMAGE=rocm/dev-almalinux-8:6.3-complete
34
FROM amd64/almalinux:8 as base
45

56
ENV LC_ALL en_US.UTF-8
@@ -8,10 +9,6 @@ ENV LANGUAGE en_US.UTF-8
89

910
ARG DEVTOOLSET_VERSION=11
1011

11-
ENV LC_ALL en_US.UTF-8
12-
ENV LANG en_US.UTF-8
13-
ENV LANGUAGE en_US.UTF-8
14-
1512
RUN yum -y update
1613
RUN yum -y install epel-release
1714
RUN yum install -y sudo wget curl perl util-linux xz bzip2 git patch which perl zlib-devel openssl-devel yum-utils autoconf automake make gcc-toolset-${DEVTOOLSET_VERSION}-toolchain
@@ -65,6 +62,12 @@ FROM cuda as cuda12.8
6562
RUN bash ./install_cuda.sh 12.8
6663
ENV DESIRED_CUDA=12.8
6764

65+
FROM ${ROCM_IMAGE} as rocm
66+
ENV PYTORCH_ROCM_ARCH="gfx900;gfx906;gfx908;gfx90a;gfx942;gfx1030;gfx1100;gfx1101;gfx1102;gfx1200;gfx1201"
67+
ADD ./common/install_mkl.sh install_mkl.sh
68+
RUN bash ./install_mkl.sh && rm install_mkl.sh
69+
ENV MKLROOT /opt/intel
70+
6871
# Install MNIST test data
6972
FROM base as mnist
7073
ADD ./common/install_mnist.sh install_mnist.sh

.ci/docker/almalinux/build.sh

Lines changed: 11 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -15,9 +15,16 @@ fi
1515
DOCKER_TAG_PREFIX=$(echo "${image}" | awk -F':' '{print $2}')
1616

1717
CUDA_VERSION=""
18+
ROCM_VERSION=""
19+
EXTRA_BUILD_ARGS=""
1820
if [[ "${DOCKER_TAG_PREFIX}" == cuda* ]]; then
1921
# extract cuda version from image name and tag. e.g. manylinux2_28-builder:cuda12.8 returns 12.8
2022
CUDA_VERSION=$(echo "${DOCKER_TAG_PREFIX}" | awk -F'cuda' '{print $2}')
23+
EXTRA_BUILD_ARGS="--build-arg CUDA_VERSION=${CUDA_VERSION}"
24+
elif [[ "${DOCKER_TAG_PREFIX}" == rocm* ]]; then
25+
# extract rocm version from image name and tag. e.g. manylinux2_28-builder:rocm6.2.4 returns 6.2.4
26+
ROCM_VERSION=$(echo "${DOCKER_TAG_PREFIX}" | awk -F'rocm' '{print $2}')
27+
EXTRA_BUILD_ARGS="--build-arg ROCM_IMAGE=rocm/dev-almalinux-8:${ROCM_VERSION}-complete"
2128
fi
2229

2330
case ${DOCKER_TAG_PREFIX} in
@@ -27,6 +34,9 @@ case ${DOCKER_TAG_PREFIX} in
2734
cuda*)
2835
BASE_TARGET=cuda${CUDA_VERSION}
2936
;;
37+
rocm*)
38+
BASE_TARGET=rocm
39+
;;
3040
*)
3141
echo "ERROR: Unknown docker tag ${DOCKER_TAG_PREFIX}"
3242
exit 1
@@ -47,8 +57,8 @@ docker build \
4757
--target final \
4858
--progress plain \
4959
--build-arg "BASE_TARGET=${BASE_TARGET}" \
50-
--build-arg "CUDA_VERSION=${CUDA_VERSION}" \
5160
--build-arg "DEVTOOLSET_VERSION=11" \
61+
${EXTRA_BUILD_ARGS} \
5262
-t ${tmp_tag} \
5363
$@ \
5464
-f "${TOPDIR}/.ci/docker/almalinux/Dockerfile" \

.ci/docker/common/install_cuda.sh

Lines changed: 47 additions & 60 deletions
Original file line numberDiff line numberDiff line change
@@ -2,27 +2,50 @@
22

33
set -ex
44

5-
CUDNN_VERSION=9.5.1.17
5+
arch_path=''
6+
targetarch=${TARGETARCH:-$(uname -m)}
7+
if [ ${targetarch} = 'amd64' ] || [ "${targetarch}" = 'x86_64' ]; then
8+
arch_path='x86_64'
9+
else
10+
arch_path='sbsa'
11+
fi
12+
13+
function install_cuda {
14+
version=$1
15+
runfile=$2
16+
major_minor=${version%.*}
17+
rm -rf /usr/local/cuda-${major_minor} /usr/local/cuda
18+
if [[ ${arch_path} == 'sbsa' ]]; then
19+
runfile="${runfile}_sbsa"
20+
fi
21+
runfile="${runfile}.run"
22+
wget -q https://developer.download.nvidia.com/compute/cuda/${version}/local_installers/${runfile} -O ${runfile}
23+
chmod +x ${runfile}
24+
./${runfile} --toolkit --silent
25+
rm -f ${runfile}
26+
rm -f /usr/local/cuda && ln -s /usr/local/cuda-${major_minor} /usr/local/cuda
27+
}
28+
29+
function install_cudnn {
30+
cuda_major_version=$1
31+
cudnn_version=$2
32+
mkdir tmp_cudnn && cd tmp_cudnn
33+
# cuDNN license: https://developer.nvidia.com/cudnn/license_agreement
34+
filepath="cudnn-linux-${arch_path}-${cudnn_version}_cuda${cuda_major_version}-archive"
35+
wget -q https://developer.download.nvidia.com/compute/cudnn/redist/cudnn/linux-${arch_path}/${filepath}.tar.xz
36+
tar xf ${filepath}.tar.xz
37+
cp -a ${filepath}/include/* /usr/local/cuda/include/
38+
cp -a ${filepath}/lib/* /usr/local/cuda/lib64/
39+
cd ..
40+
rm -rf tmp_cudnn
41+
}
642

743
function install_118 {
844
CUDNN_VERSION=9.1.0.70
945
echo "Installing CUDA 11.8 and cuDNN ${CUDNN_VERSION} and NCCL and cuSparseLt-0.4.0"
10-
rm -rf /usr/local/cuda-11.8 /usr/local/cuda
11-
# install CUDA 11.8.0 in the same container
12-
wget -q https://developer.download.nvidia.com/compute/cuda/11.8.0/local_installers/cuda_11.8.0_520.61.05_linux.run
13-
chmod +x cuda_11.8.0_520.61.05_linux.run
14-
./cuda_11.8.0_520.61.05_linux.run --toolkit --silent
15-
rm -f cuda_11.8.0_520.61.05_linux.run
16-
rm -f /usr/local/cuda && ln -s /usr/local/cuda-11.8 /usr/local/cuda
17-
18-
# cuDNN license: https://developer.nvidia.com/cudnn/license_agreement
19-
mkdir tmp_cudnn && cd tmp_cudnn
20-
wget -q https://developer.download.nvidia.com/compute/cudnn/redist/cudnn/linux-x86_64/cudnn-linux-x86_64-${CUDNN_VERSION}_cuda11-archive.tar.xz -O cudnn-linux-x86_64-${CUDNN_VERSION}_cuda11-archive.tar.xz
21-
tar xf cudnn-linux-x86_64-${CUDNN_VERSION}_cuda11-archive.tar.xz
22-
cp -a cudnn-linux-x86_64-${CUDNN_VERSION}_cuda11-archive/include/* /usr/local/cuda/include/
23-
cp -a cudnn-linux-x86_64-${CUDNN_VERSION}_cuda11-archive/lib/* /usr/local/cuda/lib64/
24-
cd ..
25-
rm -rf tmp_cudnn
46+
install_cuda 11.8.0 cuda_11.8.0_520.61.05_linux
47+
48+
install_cudnn 11 $CUDNN_VERSION
2649

2750
CUDA_VERSION=11.8 bash install_nccl.sh
2851

@@ -34,22 +57,9 @@ function install_118 {
3457
function install_124 {
3558
CUDNN_VERSION=9.1.0.70
3659
echo "Installing CUDA 12.4.1 and cuDNN ${CUDNN_VERSION} and NCCL and cuSparseLt-0.6.2"
37-
rm -rf /usr/local/cuda-12.4 /usr/local/cuda
38-
# install CUDA 12.4.1 in the same container
39-
wget -q https://developer.download.nvidia.com/compute/cuda/12.4.1/local_installers/cuda_12.4.1_550.54.15_linux.run
40-
chmod +x cuda_12.4.1_550.54.15_linux.run
41-
./cuda_12.4.1_550.54.15_linux.run --toolkit --silent
42-
rm -f cuda_12.4.1_550.54.15_linux.run
43-
rm -f /usr/local/cuda && ln -s /usr/local/cuda-12.4 /usr/local/cuda
60+
install_cuda 12.4.1 cuda_12.4.1_550.54.15_linux
4461

45-
# cuDNN license: https://developer.nvidia.com/cudnn/license_agreement
46-
mkdir tmp_cudnn && cd tmp_cudnn
47-
wget -q https://developer.download.nvidia.com/compute/cudnn/redist/cudnn/linux-x86_64/cudnn-linux-x86_64-${CUDNN_VERSION}_cuda12-archive.tar.xz -O cudnn-linux-x86_64-${CUDNN_VERSION}_cuda12-archive.tar.xz
48-
tar xf cudnn-linux-x86_64-${CUDNN_VERSION}_cuda12-archive.tar.xz
49-
cp -a cudnn-linux-x86_64-${CUDNN_VERSION}_cuda12-archive/include/* /usr/local/cuda/include/
50-
cp -a cudnn-linux-x86_64-${CUDNN_VERSION}_cuda12-archive/lib/* /usr/local/cuda/lib64/
51-
cd ..
52-
rm -rf tmp_cudnn
62+
install_cudnn 12 $CUDNN_VERSION
5363

5464
CUDA_VERSION=12.4 bash install_nccl.sh
5565

@@ -59,23 +69,11 @@ function install_124 {
5969
}
6070

6171
function install_126 {
72+
CUDNN_VERSION=9.5.1.17
6273
echo "Installing CUDA 12.6.3 and cuDNN ${CUDNN_VERSION} and NCCL and cuSparseLt-0.6.3"
63-
rm -rf /usr/local/cuda-12.6 /usr/local/cuda
64-
# install CUDA 12.6.3 in the same container
65-
wget -q https://developer.download.nvidia.com/compute/cuda/12.6.3/local_installers/cuda_12.6.3_560.35.05_linux.run
66-
chmod +x cuda_12.6.3_560.35.05_linux.run
67-
./cuda_12.6.3_560.35.05_linux.run --toolkit --silent
68-
rm -f cuda_12.6.3_560.35.05_linux.run
69-
rm -f /usr/local/cuda && ln -s /usr/local/cuda-12.6 /usr/local/cuda
74+
install_cuda 12.6.3 cuda_12.6.3_560.35.05_linux
7075

71-
# cuDNN license: https://developer.nvidia.com/cudnn/license_agreement
72-
mkdir tmp_cudnn && cd tmp_cudnn
73-
wget -q https://developer.download.nvidia.com/compute/cudnn/redist/cudnn/linux-x86_64/cudnn-linux-x86_64-${CUDNN_VERSION}_cuda12-archive.tar.xz -O cudnn-linux-x86_64-${CUDNN_VERSION}_cuda12-archive.tar.xz
74-
tar xf cudnn-linux-x86_64-${CUDNN_VERSION}_cuda12-archive.tar.xz
75-
cp -a cudnn-linux-x86_64-${CUDNN_VERSION}_cuda12-archive/include/* /usr/local/cuda/include/
76-
cp -a cudnn-linux-x86_64-${CUDNN_VERSION}_cuda12-archive/lib/* /usr/local/cuda/lib64/
77-
cd ..
78-
rm -rf tmp_cudnn
76+
install_cudnn 12 $CUDNN_VERSION
7977

8078
CUDA_VERSION=12.6 bash install_nccl.sh
8179

@@ -186,22 +184,11 @@ function prune_126 {
186184
function install_128 {
187185
CUDNN_VERSION=9.8.0.87
188186
echo "Installing CUDA 12.8.0 and cuDNN ${CUDNN_VERSION} and NCCL and cuSparseLt-0.6.3"
189-
rm -rf /usr/local/cuda-12.8 /usr/local/cuda
190187
# install CUDA 12.8.0 in the same container
191-
wget -q https://developer.download.nvidia.com/compute/cuda/12.8.0/local_installers/cuda_12.8.0_570.86.10_linux.run
192-
chmod +x cuda_12.8.0_570.86.10_linux.run
193-
./cuda_12.8.0_570.86.10_linux.run --toolkit --silent
194-
rm -f cuda_12.8.0_570.86.10_linux.run
195-
rm -f /usr/local/cuda && ln -s /usr/local/cuda-12.8 /usr/local/cuda
188+
install_cuda 12.8.0 cuda_12.8.0_570.86.10_linux
196189

197190
# cuDNN license: https://developer.nvidia.com/cudnn/license_agreement
198-
mkdir tmp_cudnn && cd tmp_cudnn
199-
wget -q https://developer.download.nvidia.com/compute/cudnn/redist/cudnn/linux-x86_64/cudnn-linux-x86_64-${CUDNN_VERSION}_cuda12-archive.tar.xz -O cudnn-linux-x86_64-${CUDNN_VERSION}_cuda12-archive.tar.xz
200-
tar xf cudnn-linux-x86_64-${CUDNN_VERSION}_cuda12-archive.tar.xz
201-
cp -a cudnn-linux-x86_64-${CUDNN_VERSION}_cuda12-archive/include/* /usr/local/cuda/include/
202-
cp -a cudnn-linux-x86_64-${CUDNN_VERSION}_cuda12-archive/lib/* /usr/local/cuda/lib64/
203-
cd ..
204-
rm -rf tmp_cudnn
191+
install_cudnn 12 $CUDNN_VERSION
205192

206193
CUDA_VERSION=12.8 bash install_nccl.sh
207194

.ci/docker/common/install_cuda_aarch64.sh

Lines changed: 0 additions & 44 deletions
This file was deleted.

.ci/docker/manywheel/Dockerfile_cuda_aarch64

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -66,11 +66,11 @@ RUN rm -rf /opt/python/cp34-cp34m /opt/_internal/cpython-3.4.6
6666
FROM base as cuda
6767
ARG BASE_CUDA_VERSION
6868
# Install CUDA
69-
ADD ./common/install_cuda_aarch64.sh install_cuda_aarch64.sh
69+
ADD ./common/install_cuda.sh install_cuda.sh
7070
COPY ./common/install_nccl.sh install_nccl.sh
7171
COPY ./common/install_cusparselt.sh install_cusparselt.sh
7272
COPY ./ci_commit_pins/nccl-cu* /ci_commit_pins/
73-
RUN bash ./install_cuda_aarch64.sh ${BASE_CUDA_VERSION} && rm install_cuda_aarch64.sh install_nccl.sh ci_commit_pins/nccl-cu* install_cusparselt.sh
73+
RUN bash ./install_cuda.sh ${BASE_CUDA_VERSION} && rm install_cuda.sh install_nccl.sh ci_commit_pins/nccl-cu* install_cusparselt.sh
7474

7575
FROM base as magma
7676
ARG BASE_CUDA_VERSION

.ci/magma-rocm/Makefile

Lines changed: 1 addition & 7 deletions
Original file line numberDiff line numberDiff line change
@@ -12,13 +12,12 @@ DOCKER_RUN = set -eou pipefail; ${DOCKER_CMD} run --rm -i \
1212
-w /builder \
1313
-e PACKAGE_NAME=${PACKAGE_NAME}${DESIRED_ROCM_SHORT} \
1414
-e DESIRED_ROCM=${DESIRED_ROCM} \
15-
"pytorch/manylinux2_28-builder:rocm${DESIRED_ROCM}-main" \
15+
"pytorch/almalinux-builder:rocm${DESIRED_ROCM}" \
1616
magma-rocm/build_magma.sh
1717

1818
.PHONY: all
1919
all: magma-rocm64
2020
all: magma-rocm63
21-
all: magma-rocm624
2221

2322
.PHONY:
2423
clean:
@@ -34,8 +33,3 @@ magma-rocm64:
3433
magma-rocm63: DESIRED_ROCM := 6.3
3534
magma-rocm63:
3635
$(DOCKER_RUN)
37-
38-
.PHONY: magma-rocm624
39-
magma-rocm624: DESIRED_ROCM := 6.2.4
40-
magma-rocm624:
41-
$(DOCKER_RUN)

.ci/pytorch/test.sh

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1520,7 +1520,7 @@ test_linux_aarch64() {
15201520
inductor/test_inplacing_pass inductor/test_kernel_benchmark inductor/test_layout_optim \
15211521
inductor/test_max_autotune inductor/test_memory_planning inductor/test_metrics inductor/test_multi_kernel inductor/test_pad_mm \
15221522
inductor/test_pattern_matcher inductor/test_perf inductor/test_profiler inductor/test_select_algorithm inductor/test_smoke \
1523-
inductor/test_split_cat_fx_passes inductor/test_standalone_compile inductor/test_torchinductor \
1523+
inductor/test_split_cat_fx_passes inductor/test_compile inductor/test_torchinductor \
15241524
inductor/test_torchinductor_codegen_dynamic_shapes inductor/test_torchinductor_dynamic_shapes inductor/test_memory \
15251525
inductor/test_triton_cpu_backend inductor/test_triton_extension_backend inductor/test_mkldnn_pattern_matcher inductor/test_cpu_cpp_wrapper \
15261526
--shard "$SHARD_NUMBER" "$NUM_TEST_SHARDS" --verbose

.circleci/scripts/binary_ios_build.sh

Lines changed: 0 additions & 47 deletions
This file was deleted.

.circleci/scripts/binary_ios_test.sh

Lines changed: 0 additions & 19 deletions
This file was deleted.

0 commit comments

Comments
 (0)
0