Skip to content
This repository was archived by the owner on Jul 4, 2025. It is now read-only.

Commit 98e5ccd

Browse files
committed
Add CI/CD for nitro-tensorrt-llm version 0.7.1
1 parent ce31887 commit 98e5ccd

File tree

4 files changed

+36
-45
lines changed

4 files changed

+36
-45
lines changed

.github/runners/Dockerfile.window.runner-all-arch

Lines changed: 4 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -17,7 +17,7 @@ RUN powershell -Command \
1717
curl.exe https://delta.jan.ai/dist/windows-container-dependencies/1/cuda_12.2.2_537.13_windows.exe \
1818
--output "cuda_installer.exe"; \
1919
Start-Process cuda_installer.exe -Wait -ArgumentList '-s'; \
20-
Remove-Item cuda_installer.exe -Force
20+
Remove-Item cuda_installer.exe -Force;
2121

2222
# -----------------------------------------------------------------------------
2323

@@ -194,7 +194,7 @@ RUN powershell -Command \
194194
curl.exe https://delta.jan.ai/dist/windows-container-dependencies/1/cuDNN.zip \
195195
--output cuDNN.zip; \
196196
Expand-Archive .\cuDNN.zip -DestinationPath .; \
197-
Remove-Item cuDNN.zip -Force
197+
Remove-Item cuDNN.zip -Force;
198198

199199
# Add cuDNN libs and bin to Path.
200200
RUN setx Path "%Path%;C:\workspace\cuDNN\lib;C:\workspace\cuDNN\bin;"
@@ -251,12 +251,12 @@ RUN powershell -Command \
251251
$ErrorActionPreference = 'Stop'; \
252252
git clone https://github.com/janhq/nitro-tensorrt-llm.git; \
253253
cd nitro-tensorrt-llm; \
254-
git checkout tensorrt-llm-nitro-rel; \
254+
git checkout rel-v0.7.1; \
255255
git submodule update --init --recursive; \
256256
pip install --no-cache-dir -r .\requirements-dev-windows.txt; \
257257
cd cpp/tensorrt_llm/nitro; \
258258
cmake -S ./nitro_deps -B ./build_deps/nitro_deps; \
259-
cmake --build ./build_deps/nitro_deps --config Release
259+
cmake --build ./build_deps/nitro_deps --config Release;
260260

261261
RUN setx Path "%Path%;C:\Program Files (x86)\Microsoft Visual Studio\2022\BuildTools\Common7\Tools"
262262

.github/workflows/python-windows-build-release.yml

Lines changed: 6 additions & 6 deletions
Original file line number | Diff line number | Diff line change
@@ -34,12 +34,12 @@ jobs:
3434
strategy:
3535
matrix:
3636
include:
37-
- cuda_arch: '80-real;86-real'
38-
cuda_arch_name: 'ampere'
39-
- cuda_arch: '89-real'
40-
cuda_arch_name: 'ada'
41-
- cuda_arch: '75-real'
42-
cuda_arch_name: 'turing'
37+
# - cuda_arch: '80-real;86-real'
38+
# cuda_arch_name: 'ampere'
39+
# - cuda_arch: '89-real'
40+
# cuda_arch_name: 'ada'
41+
# - cuda_arch: '75-real'
42+
# cuda_arch_name: 'turing'
4343
- cuda_arch: '75-real;80-real;86-real;89-real'
4444
cuda_arch_name: 'all'
4545
permissions:

.github/workflows/windows-build-manual.yml

Lines changed: 6 additions & 6 deletions
Original file line number | Diff line number | Diff line change
@@ -8,12 +8,12 @@ jobs:
88
strategy:
99
matrix:
1010
include:
11-
- cuda_arch: '80-real;86-real'
12-
cuda_arch_name: 'ampere'
13-
- cuda_arch: '89-real'
14-
cuda_arch_name: 'ada'
15-
- cuda_arch: '75-real'
16-
cuda_arch_name: 'turing'
11+
# - cuda_arch: '80-real;86-real'
12+
# cuda_arch_name: 'ampere'
13+
# - cuda_arch: '89-real'
14+
# cuda_arch_name: 'ada'
15+
# - cuda_arch: '75-real'
16+
# cuda_arch_name: 'turing'
1717
- cuda_arch: '75-real;80-real;86-real;89-real'
1818
cuda_arch_name: 'all'
1919
permissions:

.github/workflows/windows-build-release.yml

Lines changed: 20 additions & 29 deletions
Original file line number | Diff line number | Diff line change
@@ -4,11 +4,10 @@ on:
44
tags: ["windows-v[0-9]+.[0-9]+.[0-9]+"]
55

66
jobs:
7-
create-draft-release:
7+
get-version:
88
runs-on: ubuntu-latest
99
if: github.event_name == 'push' && startsWith(github.ref, 'refs/tags/')
1010
outputs:
11-
upload_url: ${{ steps.create_release.outputs.upload_url }}
1211
version: ${{ steps.get_version.outputs.version }}
1312
permissions:
1413
contents: write
@@ -18,30 +17,21 @@ jobs:
1817
run: echo "VERSION=${GITHUB_REF#refs/tags/}" >> $GITHUB_ENV && echo "::set-output name=version::${GITHUB_REF#refs/tags/}"
1918
env:
2019
GITHUB_REF: ${{ github.ref }}
21-
- name: Create Draft Release
22-
id: create_release
23-
uses: actions/create-release@v1
24-
env:
25-
GITHUB_TOKEN: ${{ secrets.GITHUB_TOKEN }}
26-
with:
27-
tag_name: ${{ github.ref_name }}
28-
release_name: "${{ env.VERSION }}"
29-
draft: true
30-
prerelease: false
20+
3121
windows-build:
32-
needs: create-draft-release
22+
needs: get-version
3323
runs-on: windows-nitro-tensorrt-llm-${{ matrix.cuda_arch_name }}
3424
strategy:
3525
matrix:
3626
include:
37-
- cuda_arch: '80-real;86-real'
38-
cuda_arch_name: 'ampere'
39-
- cuda_arch: '89-real'
40-
cuda_arch_name: 'ada'
41-
- cuda_arch: '75-real'
42-
cuda_arch_name: 'turing'
43-
# - cuda_arch: '75-real;80-real;86-real;89-real'
44-
# cuda_arch_name: 'all'
27+
# - cuda_arch: '80-real;86-real'
28+
# cuda_arch_name: 'ampere'
29+
# - cuda_arch: '89-real'
30+
# cuda_arch_name: 'ada'
31+
# - cuda_arch: '75-real'
32+
# cuda_arch_name: 'turing'
33+
- cuda_arch: '75-real;80-real;86-real;89-real'
34+
cuda_arch_name: 'all'
4535
permissions:
4636
contents: write
4737
steps:
@@ -92,12 +82,13 @@ jobs:
9282
cd .\build_nitro
9383
tar -czvf ..\nitro.tar.gz .\*
9484
95-
- uses: actions/upload-release-asset@v1.0.1
96-
if: github.event_name == 'push' && startsWith(github.ref, 'refs/tags/')
97-
env:
98-
GITHUB_TOKEN: ${{ secrets.GITHUB_TOKEN }}
85+
86+
- name: Upload binaries to release
87+
uses: svenstaro/upload-release-action@v2
9988
with:
100-
upload_url: ${{ needs.create-draft-release.outputs.upload_url }}
101-
asset_path: ./nitro.tar.gz
102-
asset_name: nitro-${{ needs.create-draft-release.outputs.version }}-amd64-tensorrt-llm-${{ matrix.cuda_arch_name }}.tar.gz
103-
asset_content_type: application/gzip
89+
repo_token: ${{ secrets.GITHUB_TOKEN }}
90+
file: ./nitro.tar.gz
91+
asset_name: nitro-${{ needs.get-version.outputs.version }}-amd64-tensorrt-llm-${{ matrix.cuda_arch_name }}.tar.gz
92+
tag: ${{ github.ref }}
93+
overwrite: true
94+
draft: true

0 commit comments

Comments
 (0)