From 55c44af3817c8a015bce0e688956887a2c1319cb Mon Sep 17 00:00:00 2001
From: Samiur Rahman
Date: Tue, 11 Jul 2023 17:56:04 +0000
Subject: [PATCH 1/2] Fix build for Triton 23.05

---
Reviewer notes (this region, up to the first "diff --git", is not part of
the commit):

  * What the patch changes in docker/Dockerfile:
      - folds "apt-get update", "apt-get install" and the apt cleanup into
        a single RUN, so the package lists are removed in the layer that
        created them;
      - moves the pip3 installs after the apt step, adds --no-cache-dir to
        each of them, switches torch from 1.12.1+cu116 to 2.0.1+cu118 and
        adds "accelerate" to the package list;
      - runs cmake and make with CUDAFLAGS="-include stdio.h", adds -O to
        make, and chains the cmake configure step into the same RUN as the
        build.
  * NOTE(review): the reason for CUDAFLAGS="-include stdio.h" is not stated
    anywhere in the patch. Presumably it works around a missing <stdio.h>
    include when the CUDA sources are compiled on the 23.05 image -- confirm
    and record the reason in the commit message.
  * NOTE(review): this series was received with its line breaks and
    indentation collapsed. Line breaks were restored from the hunk headers
    and diffstat; the leading whitespace of context lines and the position
    of blank context lines inside the hunks were inferred. Verify against
    docker/Dockerfile, or apply with "git apply --ignore-whitespace".
  * NOTE(review): the From: header carries no e-mail address; confirm
    whether it was stripped before sending this through "git am".

 docker/Dockerfile | 26 +++++++++++++-------------
 1 file changed, 13 insertions(+), 13 deletions(-)

diff --git a/docker/Dockerfile b/docker/Dockerfile
index 369ba9d..a430761 100644
--- a/docker/Dockerfile
+++ b/docker/Dockerfile
@@ -16,8 +16,8 @@ ARG TRITON_VERSION=22.12
 ARG BASE_IMAGE=nvcr.io/nvidia/tritonserver:${TRITON_VERSION}-py3
 FROM ${BASE_IMAGE}
 
-RUN apt-get update
-RUN apt-get install -y --no-install-recommends \
+RUN apt-get update && \
+    apt-get install -y --no-install-recommends \
         autoconf \
         autogen \
         clangd \
@@ -35,22 +35,22 @@ RUN apt-get install -y --no-install-recommends \
         unzip \
         zstd \
         zip \
-        zsh
-RUN pip3 install torch==1.12.1+cu116 -f https://download.pytorch.org/whl/torch_stable.html && \
-    pip3 install --extra-index-url https://pypi.ngc.nvidia.com regex fire tritonclient[all] && \
-    pip3 install transformers huggingface_hub tokenizers SentencePiece sacrebleu datasets tqdm omegaconf rouge_score && \
-    pip3 install cmake==3.24.3
-
-RUN apt-get clean && \
+        zsh && \
+    apt-get clean && \
     rm -rf /var/lib/apt/lists/*
 
+RUN pip3 install --no-cache-dir --extra-index-url https://download.pytorch.org/whl/cu118 torch==2.0.1+cu118 && \
+    pip3 install --no-cache-dir --extra-index-url https://pypi.ngc.nvidia.com regex fire tritonclient[all] && \
+    pip3 install --no-cache-dir accelerate transformers huggingface_hub tokenizers SentencePiece sacrebleu datasets tqdm omegaconf rouge_score && \
+    pip3 install --no-cache-dir cmake==3.24.3
+
 # backend build
 ADD . /workspace/build/fastertransformer_backend
 RUN mkdir -p /workspace/build/fastertransformer_backend/build
 
 WORKDIR /workspace/build/fastertransformer_backend/build
 ARG FORCE_BACKEND_REBUILD=0
-RUN cmake \
+RUN CUDAFLAGS="-include stdio.h" cmake \
       -D CMAKE_EXPORT_COMPILE_COMMANDS=1 \
       -D CMAKE_BUILD_TYPE=Release \
       -D ENABLE_FP8=OFF \
@@ -58,11 +58,11 @@ RUN cmake \
       -D TRITON_COMMON_REPO_TAG="r${NVIDIA_TRITON_SERVER_VERSION}" \
       -D TRITON_CORE_REPO_TAG="r${NVIDIA_TRITON_SERVER_VERSION}" \
       -D TRITON_BACKEND_REPO_TAG="r${NVIDIA_TRITON_SERVER_VERSION}" \
-      ..
-RUN cd _deps/repo-ft-src/ && \
+      .. && \
+    cd _deps/repo-ft-src/ && \
     git log | head -n 3 2>&1 | tee /workspace/build/fastertransformer_backend/FT_version.txt && \
     cd /workspace/build/fastertransformer_backend/build && \
-    make -j"$(grep -c ^processor /proc/cpuinfo)" install && \
+    CUDAFLAGS="-include stdio.h" make -O -j"$(grep -c ^processor /proc/cpuinfo)" install && \
     rm /workspace/build/fastertransformer_backend/build/bin/*_example -rf && \
     rm /workspace/build/fastertransformer_backend/build/lib/lib*Backend.so -rf
 
From 0e3522bc7a88fcd1a9fa270f93e1f8c23d8b8cbb Mon Sep 17 00:00:00 2001
From: Samiur Rahman
Date: Tue, 11 Jul 2023 17:57:03 +0000
Subject: [PATCH 2/2] Update default base image version

---
Reviewer notes (this region, up to the first "diff --git", is not part of
the commit):

  * Bumps the default TRITON_VERSION build argument from 22.12 to 23.05,
    which changes the default BASE_IMAGE tag derived from it. Builds that
    pass --build-arg TRITON_VERSION or BASE_IMAGE explicitly still override
    the default.

 docker/Dockerfile | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/docker/Dockerfile b/docker/Dockerfile
index a430761..bfbfba0 100644
--- a/docker/Dockerfile
+++ b/docker/Dockerfile
@@ -12,7 +12,7 @@
 # See the License for the specific language governing permissions and
 # limitations under the License.
 
-ARG TRITON_VERSION=22.12
+ARG TRITON_VERSION=23.05
 ARG BASE_IMAGE=nvcr.io/nvidia/tritonserver:${TRITON_VERSION}-py3
 FROM ${BASE_IMAGE}
 