This repository was archived by the owner on Jul 4, 2025. It is now read-only.
4 files changed: +13 -7 lines changed
Original file line number Diff line number Diff line change
1+ FROM nvidia/cuda:12.3.0-devel-ubuntu22.04
2+
3+ RUN apt-get update && apt-get -y install python3.10 python3-pip openmpi-bin libopenmpi-dev git git-lfs
4+
5+ RUN pip3 install tensorrt_llm==0.9.0 --extra-index-url https://pypi.nvidia.com
6+
7+ RUN pip3 install numpy==1.26.4
8+
9+ RUN git clone https://github.com/NVIDIA/TensorRT-LLM.git && cd TensorRT-LLM && git checkout v0.9.0
Original file line number Diff line number Diff line change 4949 runs-on : " linux-tensorrt-llm-0-10-0-cuda-12-4"
5050 run-e2e : false
5151 s3-key-prefix : " linux-tensorrt-llm-tensorrt-llm-0-10-0-sccache"
52- ccache-dir : ' /home/runner/.ccache'
52+ ccache-dir : ' /home/runner/.cache/ccache'
5353 permissions :
5454 contents : write
5555 steps :
@@ -169,4 +169,4 @@ jobs:
169169 # config-name: my-config.yml
170170 # disable-autolabeler: true
171171 env :
172- GITHUB_TOKEN : ${{ secrets.GITHUB_TOKEN }}
172+ GITHUB_TOKEN : ${{ secrets.GITHUB_TOKEN }}
Original file line number Diff line number Diff line change 2424 runs-on : " linux-tensorrt-llm-0-10-0-cuda-12-4"
2525 run-e2e : false
2626 s3-key-prefix : " linux-tensorrt-llm-tensorrt-llm-0-10-0-sccache"
27- ccache-dir : ' /home/runner/.ccache'
27+ ccache-dir : ' /home/runner/.cache/ccache'
2828 permissions :
2929 contents : write
3030 steps :
@@ -111,5 +111,3 @@ jobs:
111111 AWS_ACCESS_KEY_ID : " ${{ secrets.MINIO_ACCESS_KEY_ID }}"
112112 AWS_SECRET_ACCESS_KEY : " ${{ secrets.MINIO_SECRET_ACCESS_KEY }}"
113113 AWS_DEFAULT_REGION : " ${{ secrets.MINIO_REGION }}"
114-
115-
Original file line number Diff line number Diff line change @@ -18,7 +18,7 @@ build-deps:
1818ifeq ($(OS),Windows_NT)
1919 @powershell -Command "cd tensorrt_llm/cortex.tensorrt-llm; cmake -S ./third-party -B ./build_deps/third-party -DCMAKE_CXX_COMPILER_LAUNCHER=ccache -DCMAKE_C_COMPILER_LAUNCHER=ccache -DCMAKE_CUDA_COMPILER_LAUNCHER=ccache -DCMAKE_BUILD_TYPE=Release -DCMAKE_OBJECT_PATH_MAX=500; cmake --build ./build_deps/third-party --config Release -j8;"
2020else
21- @cd tensorrt_llm/cortex.tensorrt-llm && cmake -S ./third-party -B ./build_deps/third-party -DCMAKE_BUILD_TYPE=Release -DCMAKE_OBJECT_PATH_MAX=500 && make -C ./build_deps/third-party -j 10 && rm -rf ./build_deps/third-party;
21+ @cd tensorrt_llm/cortex.tensorrt-llm && cmake -S ./third-party -B ./build_deps/third-party -DCMAKE_BUILD_TYPE=Release && make -C ./build_deps/third-party -j 10 && rm -rf ./build_deps/third-party;
2222endif
2323
2424# Build the Cortex engine
@@ -29,7 +29,6 @@ ifeq ($(OS),Windows_NT)
2929else
3030 @cd .. && python3 ./scripts/build_wheel.py --trt_root /usr/local/tensorrt --cuda_architectures "80-real;86-real;89-real" --extra-cmake-vars "BUILD_CORTEX_TENSORRT-LLM=ON" --use_ccache
3131 @cd build && cmake .. -DCMAKE_CUDA_ARCHITECTURES='80-real;86-real;89-real' -DTRT_LIB_DIR='/usr/local/tensorrt/lib' -DTRT_INCLUDE_DIR='/usr/local/tensorrt/include' -DBUILD_CORTEX_TENSORRT-LLM=ON -DCMAKE_CXX_COMPILER_LAUNCHER=ccache -DCMAKE_CUDA_COMPILER_LAUNCHER=ccache -G Ninja && cmake --build . --config Release;
32-
3332endif
3433
3534# Prepackage the Cortex engine
You can’t perform that action at this time.
0 commit comments