Skip to content
This repository was archived by the owner on Jul 4, 2025. It is now read-only.

Commit c5aa6bc

Browse files
committed
Merge branch 'rel' into sync-0.10.0
2 parents ad7ef8e + 4da5cc0 commit c5aa6bc

File tree

4 files changed: +13 additions, -7 deletions (lines changed)

4 files changed

+13
-7
lines changed
Lines changed: 9 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -0,0 +1,9 @@
1+
FROM nvidia/cuda:12.3.0-devel-ubuntu22.04
2+
3+
RUN apt-get update && apt-get -y install python3.10 python3-pip openmpi-bin libopenmpi-dev git git-lfs
4+
5+
RUN pip3 install tensorrt_llm==0.9.0 --extra-index-url https://pypi.nvidia.com
6+
7+
RUN pip3 install numpy==1.26.4
8+
9+
RUN git clone https://github.com/NVIDIA/TensorRT-LLM.git && cd TensorRT-LLM && git checkout v0.9.0

.github/workflows/build.yml

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -49,7 +49,7 @@ jobs:
4949
runs-on: "linux-tensorrt-llm-0-10-0-cuda-12-4"
5050
run-e2e: false
5151
s3-key-prefix: "linux-tensorrt-llm-tensorrt-llm-0-10-0-sccache"
52-
ccache-dir: '/home/runner/.ccache'
52+
ccache-dir: '/home/runner/.cache/ccache'
5353
permissions:
5454
contents: write
5555
steps:
@@ -169,4 +169,4 @@ jobs:
169169
# config-name: my-config.yml
170170
# disable-autolabeler: true
171171
env:
172-
GITHUB_TOKEN: ${{ secrets.GITHUB_TOKEN }}
172+
GITHUB_TOKEN: ${{ secrets.GITHUB_TOKEN }}

.github/workflows/quality-gate.yml

Lines changed: 1 addition & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -24,7 +24,7 @@ jobs:
2424
runs-on: "linux-tensorrt-llm-0-10-0-cuda-12-4"
2525
run-e2e: false
2626
s3-key-prefix: "linux-tensorrt-llm-tensorrt-llm-0-10-0-sccache"
27-
ccache-dir: '/home/runner/.ccache'
27+
ccache-dir: '/home/runner/.cache/ccache'
2828
permissions:
2929
contents: write
3030
steps:
@@ -111,5 +111,3 @@ jobs:
111111
AWS_ACCESS_KEY_ID: "${{ secrets.MINIO_ACCESS_KEY_ID }}"
112112
AWS_SECRET_ACCESS_KEY: "${{ secrets.MINIO_SECRET_ACCESS_KEY }}"
113113
AWS_DEFAULT_REGION: "${{ secrets.MINIO_REGION }}"
114-
115-

cpp/Makefile

Lines changed: 1 addition & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -18,7 +18,7 @@ build-deps:
1818
ifeq ($(OS),Windows_NT)
1919
@powershell -Command "cd tensorrt_llm/cortex.tensorrt-llm; cmake -S ./third-party -B ./build_deps/third-party -DCMAKE_CXX_COMPILER_LAUNCHER=ccache -DCMAKE_C_COMPILER_LAUNCHER=ccache -DCMAKE_CUDA_COMPILER_LAUNCHER=ccache -DCMAKE_BUILD_TYPE=Release -DCMAKE_OBJECT_PATH_MAX=500; cmake --build ./build_deps/third-party --config Release -j8;"
2020
else
21-
@cd tensorrt_llm/cortex.tensorrt-llm && cmake -S ./third-party -B ./build_deps/third-party -DCMAKE_BUILD_TYPE=Release -DCMAKE_OBJECT_PATH_MAX=500 && make -C ./build_deps/third-party -j 10 && rm -rf ./build_deps/third-party;
21+
@cd tensorrt_llm/cortex.tensorrt-llm && cmake -S ./third-party -B ./build_deps/third-party -DCMAKE_BUILD_TYPE=Release && make -C ./build_deps/third-party -j 10 && rm -rf ./build_deps/third-party;
2222
endif
2323

2424
# Build the Cortex engine
@@ -29,7 +29,6 @@ ifeq ($(OS),Windows_NT)
2929
else
3030
@cd .. && python3 ./scripts/build_wheel.py --trt_root /usr/local/tensorrt --cuda_architectures "80-real;86-real;89-real" --extra-cmake-vars "BUILD_CORTEX_TENSORRT-LLM=ON" --use_ccache
3131
@cd build && cmake .. -DCMAKE_CUDA_ARCHITECTURES='80-real;86-real;89-real' -DTRT_LIB_DIR='/usr/local/tensorrt/lib' -DTRT_INCLUDE_DIR='/usr/local/tensorrt/include' -DBUILD_CORTEX_TENSORRT-LLM=ON -DCMAKE_CXX_COMPILER_LAUNCHER=ccache -DCMAKE_CUDA_COMPILER_LAUNCHER=ccache -G Ninja && cmake --build . --config Release;
32-
3332
endif
3433

3534
# Prepackage the Cortex engine

0 commit comments

Comments
 (0)