Skip to content

Commit 2fdd6b3

Browse files
committed
TAO 5.5 Release - PyTorch
1 parent 83f6490 commit 2fdd6b3

File tree

6 files changed

+15
-34
lines changed

6 files changed

+15
-34
lines changed

docker/Dockerfile

Lines changed: 0 additions & 5 deletions
Original file line number | Diff line number | Diff line change
@@ -46,11 +46,6 @@ RUN pip uninstall -y jupyterlab \
4646
&& rm requirements-pip.txt \
4747
&& mim install "mmengine==0.10.4" "mmpretrain>=1.0.0rc8"
4848

49-
COPY tao-core tao-core
50-
RUN cd tao-core && bash release/python/build_wheel.sh && \
51-
find dist/ -name "nvidia_tao_core*.whl" -type f | xargs -n 1 pip install && \
52-
rm -rf *
53-
5449
ENV FORCE_CUDA="1"
5550
RUN mkdir mmcv_src && \
5651
cd mmcv_src && \

docker/build.sh

Lines changed: 7 additions & 11 deletions
Original file line number | Diff line number | Diff line change
@@ -3,12 +3,10 @@
33
set -eo pipefail
44
cd "$( dirname "${BASH_SOURCE[0]}" )"
55

6-
registry="nvcr.io"
7-
repository="nvstaging/tao/tao_pytorch_base_image"
8-
base_image="nvcr.io/nvidia/pytorch:24.04-py3"
9-
10-
tag="$USER-$(date +%Y%m%d%H%M)"
11-
local_tag="$USER"
6+
# Read parameters from manifest.json
7+
registry=`jq -r '.registry' $NV_TAO_PYTORCH_TOP/docker/manifest.json`
8+
repository=`jq -r '.repository' $NV_TAO_PYTORCH_TOP/docker/manifest.json`
9+
tag=`jq -r '.tag' $NV_TAO_PYTORCH_TOP/docker/manifest.json`
1210

1311
# Build parameters.
1412
BUILD_DOCKER="0"
@@ -56,12 +54,10 @@ if [ $BUILD_DOCKER = "1" ]; then
5654
else
5755
NO_CACHE=""
5856
fi
59-
DOCKER_BUILDKIT=1 docker build --pull -f $NV_TAO_PYTORCH_TOP/docker/Dockerfile -t $registry/$repository:$local_tag $NO_CACHE \
60-
--network=host --build-arg PYTORCH_BASE_IMAGE=${base_image} \
61-
$NV_TAO_PYTORCH_TOP/.
57+
DOCKER_BUILDKIT=1 docker build --pull -f $NV_TAO_PYTORCH_TOP/docker/Dockerfile -t $registry/$repository:$tag $NO_CACHE \
58+
--network=host $NV_TAO_PYTORCH_TOP/.
6259
if [ $PUSH_DOCKER = "1" ]; then
6360
echo "Pusing docker ..."
64-
docker tag $registry/$repository:$local_tag $registry/$repository:$tag
6561
docker push $registry/$repository:$tag
6662
digest=$(docker inspect --format='{{index .RepoDigests 0}}' $registry/$repository:$tag)
6763
echo -e "\033[1;33mUpdate the digest in the manifest.json file to:\033[0m"
@@ -72,4 +68,4 @@ if [ $BUILD_DOCKER = "1" ]; then
7268
# Exit by printing usage.
7369
else
7470
echo "Usage: ./build.sh [--build] [--push] [--force] [--default]"
75-
fi
71+
fi

docker/manifest.json

Lines changed: 2 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,5 +1,6 @@
11
{
22
"registry": "nvcr.io",
33
"repository": "nvidia/tao/tao-toolkit",
4-
"digest": "sha256:ff920080025e2dd12d5740c3d722f0630f1f84630ae6f55e56f872d4914fca03"
4+
"digest": "sha256:ff920080025e2dd12d5740c3d722f0630f1f84630ae6f55e56f872d4914fca03",
5+
"tag": "5.5.0-pyt-base"
56
}

release/docker/Dockerfile

Lines changed: 0 additions & 5 deletions
Original file line numberDiff line numberDiff line change
@@ -29,11 +29,6 @@ COPY release/docker/entrypoint.d/* /opt/nvidia/entrypoint.d/
2929
# Copying tlt-converter and building it in the docker.
3030
ENV TRT_LIB_PATH="/usr/lib/x86_64-linux-gnu"
3131
ENV TRT_INCLUDE_PATH="/usr/include/x86_64-linux-gnu"
32-
COPY tao-converter /opt/nvidia/tools
33-
WORKDIR /opt/nvidia/tools
34-
RUN make \
35-
&& rm -rf Makefile *.cc *.h *.o
36-
RUN ln -s tao-converter converter
3732

3833
ENV NVIDIA_PRODUCT_NAME "TAO Toolkit"
3934
ENV TAO_TOOLKIT_VERSION="5.2.0"

release/docker/deploy.sh

Lines changed: 6 additions & 9 deletions
Original file line numberDiff line numberDiff line change
@@ -4,18 +4,16 @@ set -eo pipefail
44
# cd "$( dirname "${BASH_SOURCE[0]}" )"
55

66
registry="nvcr.io"
7-
pytorch_version="2.1.0"
8-
tao_version="5.2.0"
9-
repository="nvstaging/tao/tao-toolkit-pyt"
10-
build_id="01"
11-
tag="v${tao_version}-pyt${pytorch_version}-py3-${build_id}"
7+
tao_version="5.0.0"
8+
repository="nvidia/tao/tao-toolkit"
9+
tag="${tao_version}-pyt-base"
1210

1311
# Required for the tao-converter since it is now a submodule.
1412
git submodule update --init --recursive
1513

1614
# Build parameters.
1715
BUILD_DOCKER="0"
18-
BUILD_WHEEL="0"
16+
BUILD_WHEELS="0"
1917
PUSH_DOCKER="0"
2018
FORCE="0"
2119

@@ -83,7 +81,6 @@ if [ $BUILD_DOCKER = "1" ]; then
8381
mkdir -p $wheel_dir
8482
fi
8583
echo "Building source code wheel ..."
86-
# tao_pt --env 'TORCH_CUDA_ARCH_LIST="5.3 6.0 6.1 7.0 7.5 8.0 8.6 9.0"' -- bash /tao-pt/release/docker/build_wheel.sh
8784
tao_pt --env 'TORCH_CUDA_ARCH_LIST="5.3 6.0 6.1 7.0 7.5 8.0 8.6 9.0"' -- python setup.py bdist_wheel
8885
else
8986
echo "Skipping wheel builds ..."
@@ -108,12 +105,12 @@ if [ $BUILD_DOCKER = "1" ]; then
108105
fi
109106
elif [ $RUN_DOCKER ="1" ]; then
110107
echo "Running docker interactively..."
111-
docker run --gpus all -v $HOME/tlt-experiments:/workspace/tlt-experiments \
108+
docker run --gpus all -v $HOME/tlt-experiments:/workspace/tlt-experiments \
112109
--network=host \
113110
--shm-size=30g \
114111
--ulimit memlock=-1 \
115112
--ulimit stack=67108864 \
116113
--rm -it $registry/$repository:$tag /bin/bash
117114
else
118115
echo "Usage: ./deploy.sh [--build] [--wheel] [--run] [--push] [--default]"
119-
fi
116+
fi

release/docker/pyarmor-regfile-1219.zip

Lines changed: 0 additions & 3 deletions
This file was deleted.

0 commit comments

Comments
 (0)