TensorRT-LLMs/docker/common/install_pytorch.sh
Zhanrui Sun 4de31bece2
[TRTLLM-8994][infra] upgrade to DLFW 25.10 and pytorch 2.9.0 / triton 3.5.0 (#8838)
Signed-off-by: ZhanruiSunCh <184402041+ZhanruiSunCh@users.noreply.github.com>
Signed-off-by: Yanchao Lu <yanchaol@nvidia.com>
Co-authored-by: Yanchao Lu <yanchaol@nvidia.com>
2025-11-04 18:59:34 +08:00

93 lines
2.7 KiB
Bash

#!/bin/bash
set -ex
# Use latest stable version from https://pypi.org/project/torch/#history
# and closest to the version specified in
# https://docs.nvidia.com/deeplearning/frameworks/pytorch-release-notes/rel-25-10.html#rel-25-10
TORCH_VERSION="2.9.0"
SYSTEM_ID=$(grep -oP '(?<=^ID=).+' /etc/os-release | tr -d '"')
prepare_environment() {
if [[ $SYSTEM_ID == *"ubuntu"* ]]; then
apt-get update && apt-get -y install ninja-build
apt-get clean && rm -rf /var/lib/apt/lists/*
elif [[ $SYSTEM_ID == *"rocky"* ]]; then
dnf makecache --refresh && dnf install -y ninja-build && dnf clean all
else
echo "This system type cannot be supported..."
exit 1
fi
}
install_from_source() {
if [[ $SYSTEM_ID == *"rocky"* ]]; then
VERSION_ID=$(grep -oP '(?<=^VERSION_ID=).+' /etc/os-release | tr -d '"')
if [[ $VERSION_ID == "7" ]]; then
echo "Installation from PyTorch source codes cannot be supported..."
exit 1
fi
fi
ARCH=$(uname -m)
if [ "$ARCH" = "amd64" ];then ARCH="x86_64";fi
if [ "$ARCH" = "aarch64" ];then ARCH="sbsa";fi
prepare_environment $1
export _GLIBCXX_USE_CXX11_ABI=$1
export TORCH_CUDA_ARCH_LIST="8.0;8.6;9.0;10.0;12.0"
export PYTORCH_BUILD_VERSION=${TORCH_VERSION}
export PYTORCH_BUILD_NUMBER=0
export MAX_JOBS=12
pip3 uninstall -y torch
cd /tmp
git clone --depth 1 --branch v${TORCH_VERSION} https://github.com/pytorch/pytorch
cd pytorch
git submodule sync && git submodule update --init --recursive
pip3 install -r requirements.txt
python3 setup.py install
cd /tmp && rm -rf /tmp/pytorch
# Get torchvision version by dry run
TORCHVISION_VERSION=$(pip3 install --dry-run torch==${TORCH_VERSION} torchvision | grep "Would install" | tr ' ' '\n' | grep torchvision | cut -d "-" -f 2)
export PYTORCH_VERSION=${PYTORCH_BUILD_VERSION}
export FORCE_CUDA=1
export BUILD_VERSION=${TORCHVISION_VERSION}
export MAX_JOBS=12
pip3 uninstall -y torchvision
cd /tmp
git clone --depth 1 --branch v${TORCHVISION_VERSION} https://github.com/pytorch/vision
cd vision
python3 setup.py install
cd /tmp && rm -rf /tmp/vision
}
install_from_pypi() {
ARCH=$(uname -m)
if [ "$ARCH" = "amd64" ];then ARCH="x86_64";fi
if [ "$ARCH" = "aarch64" ];then ARCH="sbsa";fi
pip3 uninstall -y torch torchvision
pip3 install torch==${TORCH_VERSION} torchvision --index-url https://download.pytorch.org/whl/cu130
}
case "$1" in
"skip")
;;
"pypi")
install_from_pypi
;;
"src_cxx11_abi")
install_from_source 1
;;
"src_non_cxx11_abi")
install_from_source 0
;;
*)
echo "Incorrect input argument..."
exit 1
;;
esac