Skip to content

Commit 12c8ea0

Browse files
authored
Merge branch 'pytorch:main' into main
2 parents fc70838 + a5436a5 commit 12c8ea0

File tree

862 files changed

+25658
-7770
lines changed

Some content is hidden

Large Commits have some content hidden by default. Use the searchbox below for content that may be hidden.

862 files changed

+25658
-7770
lines changed

.ci/docker/build.sh

Lines changed: 3 additions & 13 deletions
Original file line numberDiff line numberDiff line change
@@ -125,10 +125,10 @@ case "$tag" in
125125
UCC_COMMIT=${_UCC_COMMIT}
126126
TRITON=yes
127127
;;
128-
pytorch-linux-jammy-cuda12.8-cudnn9-py3-gcc9-inductor-benchmarks)
128+
pytorch-linux-jammy-cuda12.8-cudnn9-py3-gcc11-inductor-benchmarks)
129129
CUDA_VERSION=12.8.1
130130
ANACONDA_PYTHON_VERSION=3.10
131-
GCC_VERSION=9
131+
GCC_VERSION=11
132132
VISION=yes
133133
KATEX=yes
134134
UCX_COMMIT=${_UCX_COMMIT}
@@ -146,16 +146,6 @@ case "$tag" in
146146
UCC_COMMIT=${_UCC_COMMIT}
147147
TRITON=yes
148148
;;
149-
pytorch-linux-jammy-cuda12.8-cudnn9-py3-gcc9)
150-
CUDA_VERSION=12.8.1
151-
ANACONDA_PYTHON_VERSION=3.10
152-
GCC_VERSION=9
153-
VISION=yes
154-
KATEX=yes
155-
UCX_COMMIT=${_UCX_COMMIT}
156-
UCC_COMMIT=${_UCC_COMMIT}
157-
TRITON=yes
158-
;;
159149
pytorch-linux-jammy-py3-clang12-onnx)
160150
ANACONDA_PYTHON_VERSION=3.10
161151
CLANG_VERSION=12
@@ -188,7 +178,7 @@ case "$tag" in
188178
fi
189179
GCC_VERSION=11
190180
VISION=yes
191-
ROCM_VERSION=7.0
181+
ROCM_VERSION=7.1
192182
NINJA_VERSION=1.9.0
193183
TRITON=yes
194184
KATEX=yes
Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1 +1 @@
1-
1b0418a9a454b2b93ab8d71f40e59d2297157fae
1+
aa01f5c2cd4db2b7bfa53ea98a1a8dfbd6d77c92

.ci/docker/common/install_rocm.sh

Lines changed: 10 additions & 8 deletions
Original file line numberDiff line numberDiff line change
@@ -60,14 +60,16 @@ EOF
6060
DEBIAN_FRONTEND=noninteractive apt-get install -y --allow-unauthenticated rocm-llvm-dev
6161
fi
6262

63-
# precompiled miopen kernels added in ROCm 3.5, renamed in ROCm 5.5
64-
# search for all unversioned packages
65-
# if search fails it will abort this script; use true to avoid case where search fails
66-
MIOPENHIPGFX=$(apt-cache search --names-only miopen-hip-gfx | awk '{print $1}' | grep -F -v . || true)
67-
if [[ "x${MIOPENHIPGFX}" = x ]]; then
68-
echo "miopen-hip-gfx package not available" && exit 1
69-
else
70-
DEBIAN_FRONTEND=noninteractive apt-get install -y --allow-unauthenticated ${MIOPENHIPGFX}
63+
if [[ $(ver $ROCM_VERSION) -lt $(ver 7.1) ]]; then
64+
# precompiled miopen kernels added in ROCm 3.5, renamed in ROCm 5.5, removed in ROCm 7.1
65+
# search for all unversioned packages
66+
# if search fails it will abort this script; use true to avoid case where search fails
67+
MIOPENHIPGFX=$(apt-cache search --names-only miopen-hip-gfx | awk '{print $1}' | grep -F -v . || true)
68+
if [[ "x${MIOPENHIPGFX}" = x ]]; then
69+
echo "miopen-hip-gfx package not available" && exit 1
70+
else
71+
DEBIAN_FRONTEND=noninteractive apt-get install -y --allow-unauthenticated ${MIOPENHIPGFX}
72+
fi
7173
fi
7274

7375
# ROCm 6.0 had a regression where journal_mode was enabled on the kdb files resulting in permission errors at runtime

.ci/docker/common/install_rocm_magma.sh

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -12,8 +12,8 @@ function do_install() {
1212

1313
rocm_version_nodot=${rocm_version//./}
1414

15-
# post merge of https://github.com/icl-utk-edu/magma/pull/65
16-
MAGMA_VERSION=c0792ae825fb36872784892ea643dd6f3456bc5f
15+
# https://github.com/icl-utk-edu/magma/pull/65
16+
MAGMA_VERSION=d6e4117bc88e73f06d26c6c2e14f064e8fc3d1ec
1717
magma_archive="magma-rocm${rocm_version_nodot}-${MAGMA_VERSION}-1.tar.bz2"
1818

1919
rocm_dir="/opt/rocm"

.ci/docker/common/install_xpu.sh

Lines changed: 7 additions & 8 deletions
Original file line numberDiff line numberDiff line change
@@ -64,14 +64,13 @@ function install_ubuntu() {
6464

6565
function install_rhel() {
6666
. /etc/os-release
67-
if [[ "${ID}" == "rhel" ]]; then
68-
if [[ ! " 8.8 8.10 9.0 9.2 9.3 " =~ " ${VERSION_ID} " ]]; then
69-
echo "RHEL version ${VERSION_ID} not supported"
70-
exit
71-
fi
72-
elif [[ "${ID}" == "almalinux" ]]; then
73-
# Workaround for almalinux8 which used by quay.io/pypa/manylinux_2_28_x86_64
74-
VERSION_ID="8.8"
67+
if [[ ! " 8.8 8.10 9.0 9.2 9.3 " =~ " ${VERSION_ID} " ]]; then
68+
echo "RHEL version ${VERSION_ID} not supported"
69+
exit
70+
fi
71+
# Using testing channel for CD build
72+
if [[ "${ID}" == "almalinux" ]]; then
73+
XPU_DRIVER_VERSION="/testing"
7574
fi
7675

7776
dnf install -y 'dnf-command(config-manager)'

.ci/docker/requirements-ci.txt

Lines changed: 3 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -402,3 +402,6 @@ scikit-build==0.18.1
402402
pyre-extensions==0.0.32
403403
tabulate==0.9.0
404404
#Description: These packages are needed to build FBGEMM and torchrec on PyTorch CI
405+
406+
Jinja2==3.1.6
407+
#Description: required for torch.distributed.debug

.ci/lumen_cli/cli/lib/core/vllm/vllm_test.py

Lines changed: 0 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -84,7 +84,6 @@ def __init__(self, args: Any):
8484
self.VLLM_TEST_WHLS_REGEX = [
8585
"xformers/*.whl",
8686
"vllm/vllm*.whl",
87-
"flashinfer-python/flashinfer*.whl",
8887
]
8988

9089
def prepare(self):

.ci/manywheel/build.sh

Lines changed: 0 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -4,9 +4,6 @@ set -ex
44

55
SCRIPTPATH="$( cd "$( dirname "${BASH_SOURCE[0]}" )" >/dev/null 2>&1 && pwd )"
66

7-
# Source the common build script for architecture-specific configurations (MKLDNN, ACL, etc.)
8-
source "${SCRIPTPATH}/../pytorch/build.sh" || true
9-
107
case "${GPU_ARCH_TYPE:-BLANK}" in
118
cuda | cuda-aarch64)
129
bash "${SCRIPTPATH}/build_cuda.sh"

.ci/manywheel/build_common.sh

Lines changed: 7 additions & 20 deletions
Original file line numberDiff line numberDiff line change
@@ -35,12 +35,8 @@ if [[ "$OS_NAME" == *"AlmaLinux"* ]]; then
3535
aarch64)
3636
PLATFORM="manylinux_2_28_aarch64"
3737
;;
38-
s390x)
39-
PLATFORM="manylinux_2_28_s390x"
40-
;;
4138
*)
42-
echo "Unsupported architecture: $ARCH"
43-
exit 1
39+
echo "Other architectures: $ARCH, not setting PLATFORM"
4440
;;
4541
esac
4642
elif [[ "$OS_NAME" == *"Red Hat Enterprise Linux"* ]]; then
@@ -367,22 +363,13 @@ for pkg in /$WHEELHOUSE_DIR/torch_no_python*.whl /$WHEELHOUSE_DIR/torch*linux*.w
367363
done
368364

369365
# create Manylinux 2_28 tag; this needs to happen before regenerating the RECORD
370-
# Support all architectures (x86_64, aarch64, s390x)
371-
if [[ "$IS_MANYLINUX2_28" == "1" && $GPU_ARCH_TYPE != "xpu" ]]; then
366+
if [[ $PLATFORM == "manylinux_2_28_x86_64" && $GPU_ARCH_TYPE != "cpu-s390x" && $GPU_ARCH_TYPE != "xpu" ]]; then
367+
wheel_file=$(echo $(basename $pkg) | sed -e 's/-cp.*$/.dist-info\/WHEEL/g')
368+
sed -i -e s#linux_x86_64#"${PLATFORM}"# $wheel_file;
369+
fi
370+
if [[ $PLATFORM == "manylinux_2_28_aarch64" ]]; then
372371
wheel_file=$(echo $(basename $pkg) | sed -e 's/-cp.*$/.dist-info\/WHEEL/g')
373-
echo "Updating wheel tag for $ARCH architecture"
374-
# Replace linux_* with manylinux_2_28_* based on architecture
375-
case $ARCH in
376-
x86_64)
377-
sed -i -e 's#linux_x86_64#manylinux_2_28_x86_64#g' $wheel_file
378-
;;
379-
aarch64)
380-
sed -i -e 's#linux_aarch64#manylinux_2_28_aarch64#g' $wheel_file
381-
;;
382-
s390x)
383-
sed -i -e 's#linux_s390x#manylinux_2_28_s390x#g' $wheel_file
384-
;;
385-
esac
372+
sed -i -e s#linux_aarch64#"${PLATFORM}"# $wheel_file;
386373
fi
387374

388375
# regenerate the RECORD file with new hashes

.ci/manywheel/build_cpu.sh

Lines changed: 25 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -19,6 +19,31 @@ fi
1919
ARCH=$(uname -m)
2020
echo "Building CPU wheel for architecture: $ARCH"
2121

22+
# Detect and configure OpenBLAS and ARM Compute Library for CPU aarch64
23+
if [[ "$ARCH" == "aarch64" ]]; then
24+
# Use OpenBLAS for BLAS/LAPACK on CPU aarch64 builds
25+
if [[ ! -f "/opt/OpenBLAS/lib/libopenblas.so.0" ]]; then
26+
echo "ERROR: OpenBLAS not found at /opt/OpenBLAS/lib/"
27+
echo "OpenBLAS (BLAS/LAPACK) is required for CPU aarch64 builds"
28+
exit 1
29+
fi
30+
echo "Using OpenBLAS for CPU aarch64"
31+
export BLAS=OpenBLAS
32+
export OpenBLAS_HOME=/opt/OpenBLAS
33+
34+
# ACL is required for aarch64 builds
35+
if [[ ! -d "/acl" ]]; then
36+
echo "ERROR: ARM Compute Library not found at /acl"
37+
echo "ACL is required for aarch64 builds. Check Docker image setup."
38+
exit 1
39+
fi
40+
41+
export USE_MKLDNN=1
42+
export USE_MKLDNN_ACL=1
43+
export ACL_ROOT_DIR=/acl
44+
echo "ARM Compute Library enabled for MKLDNN: ACL_ROOT_DIR=/acl"
45+
fi
46+
2247
WHEELHOUSE_DIR="wheelhousecpu"
2348
LIBTORCH_HOUSE_DIR="libtorch_housecpu"
2449
if [[ -z "$PYTORCH_FINAL_PACKAGE_DIR" ]]; then

0 commit comments

Comments
 (0)