Skip to content

Commit

Permalink
Add CI/CD for nitro-tensorrt-llm version 0.7.1
Browse files (browse the repository at this point in the history)
  • Loading branch information
hiento09 committed Mar 18, 2024
1 parent ce31887 commit 14e3d38
Show file tree
Hide file tree
Showing 4 changed files with 38 additions and 46 deletions.
8 changes: 4 additions & 4 deletions .github/runners/Dockerfile.window.runner-all-arch
Original file line number Diff line number Diff line change
Expand Up @@ -17,7 +17,7 @@ RUN powershell -Command \
curl.exe https://delta.jan.ai/dist/windows-container-dependencies/1/cuda_12.2.2_537.13_windows.exe \
--output "cuda_installer.exe"; \
Start-Process cuda_installer.exe -Wait -ArgumentList '-s'; \
Remove-Item cuda_installer.exe -Force
Remove-Item cuda_installer.exe -Force;

# -----------------------------------------------------------------------------

Expand Down Expand Up @@ -194,7 +194,7 @@ RUN powershell -Command \
curl.exe https://delta.jan.ai/dist/windows-container-dependencies/1/cuDNN.zip \
--output cuDNN.zip; \
Expand-Archive .\cuDNN.zip -DestinationPath .; \
Remove-Item cuDNN.zip -Force
Remove-Item cuDNN.zip -Force;

# Add cuDNN libs and bin to Path.
RUN setx Path "%Path%;C:\workspace\cuDNN\lib;C:\workspace\cuDNN\bin;"
Expand Down Expand Up @@ -251,12 +251,12 @@ RUN powershell -Command \
$ErrorActionPreference = 'Stop'; \
git clone https://github.com/janhq/nitro-tensorrt-llm.git; \
cd nitro-tensorrt-llm; \
git checkout tensorrt-llm-nitro-rel; \
git checkout rel-v0.7.1; \
git submodule update --init --recursive; \
pip install --no-cache-dir -r .\requirements-dev-windows.txt; \
cd cpp/tensorrt_llm/nitro; \
cmake -S ./nitro_deps -B ./build_deps/nitro_deps; \
cmake --build ./build_deps/nitro_deps --config Release
cmake --build ./build_deps/nitro_deps --config Release;

RUN setx Path "%Path%;C:\Program Files (x86)\Microsoft Visual Studio\2022\BuildTools\Common7\Tools"

Expand Down
12 changes: 6 additions & 6 deletions .github/workflows/python-windows-build-release.yml
Original file line number Diff line number Diff line change
Expand Up @@ -34,12 +34,12 @@ jobs:
strategy:
matrix:
include:
- cuda_arch: '80-real;86-real'
cuda_arch_name: 'ampere'
- cuda_arch: '89-real'
cuda_arch_name: 'ada'
- cuda_arch: '75-real'
cuda_arch_name: 'turing'
# - cuda_arch: '80-real;86-real'
# cuda_arch_name: 'ampere'
# - cuda_arch: '89-real'
# cuda_arch_name: 'ada'
# - cuda_arch: '75-real'
# cuda_arch_name: 'turing'
- cuda_arch: '75-real;80-real;86-real;89-real'
cuda_arch_name: 'all'
permissions:
Expand Down
12 changes: 6 additions & 6 deletions .github/workflows/windows-build-manual.yml
Original file line number Diff line number Diff line change
Expand Up @@ -8,12 +8,12 @@ jobs:
strategy:
matrix:
include:
- cuda_arch: '80-real;86-real'
cuda_arch_name: 'ampere'
- cuda_arch: '89-real'
cuda_arch_name: 'ada'
- cuda_arch: '75-real'
cuda_arch_name: 'turing'
# - cuda_arch: '80-real;86-real'
# cuda_arch_name: 'ampere'
# - cuda_arch: '89-real'
# cuda_arch_name: 'ada'
# - cuda_arch: '75-real'
# cuda_arch_name: 'turing'
- cuda_arch: '75-real;80-real;86-real;89-real'
cuda_arch_name: 'all'
permissions:
Expand Down
52 changes: 22 additions & 30 deletions .github/workflows/windows-build-release.yml
Original file line number Diff line number Diff line change
@@ -1,14 +1,13 @@
name: Release for Windows
on:
push:
tags: ["windows-v[0-9]+.[0-9]+.[0-9]+"]
tags: ["windows-v[0-9]+.[0-9]+.[0-9]+-tensorrt-llm-v[0-9]+.[0-9]+.[0-9]+"]

jobs:
create-draft-release:
get-version:
runs-on: ubuntu-latest
if: github.event_name == 'push' && startsWith(github.ref, 'refs/tags/')
outputs:
upload_url: ${{ steps.create_release.outputs.upload_url }}
version: ${{ steps.get_version.outputs.version }}
permissions:
contents: write
Expand All @@ -18,30 +17,21 @@ jobs:
run: echo "VERSION=${GITHUB_REF#refs/tags/}" >> $GITHUB_ENV && echo "::set-output name=version::${GITHUB_REF#refs/tags/}"
env:
GITHUB_REF: ${{ github.ref }}
- name: Create Draft Release
id: create_release
uses: actions/create-release@v1
env:
GITHUB_TOKEN: ${{ secrets.GITHUB_TOKEN }}
with:
tag_name: ${{ github.ref_name }}
release_name: "${{ env.VERSION }}"
draft: true
prerelease: false

windows-build:
needs: create-draft-release
needs: get-version
runs-on: windows-nitro-tensorrt-llm-${{ matrix.cuda_arch_name }}
strategy:
matrix:
include:
- cuda_arch: '80-real;86-real'
cuda_arch_name: 'ampere'
- cuda_arch: '89-real'
cuda_arch_name: 'ada'
- cuda_arch: '75-real'
cuda_arch_name: 'turing'
# - cuda_arch: '75-real;80-real;86-real;89-real'
# cuda_arch_name: 'all'
# - cuda_arch: '80-real;86-real'
# cuda_arch_name: 'ampere'
# - cuda_arch: '89-real'
# cuda_arch_name: 'ada'
# - cuda_arch: '75-real'
# cuda_arch_name: 'turing'
- cuda_arch: '75-real;80-real;86-real;89-real'
cuda_arch_name: 'all'
permissions:
contents: write
steps:
Expand Down Expand Up @@ -92,12 +82,14 @@ jobs:
cd .\build_nitro
tar -czvf ..\nitro.tar.gz .\*
- uses: actions/[email protected]
if: github.event_name == 'push' && startsWith(github.ref, 'refs/tags/')
env:
GITHUB_TOKEN: ${{ secrets.GITHUB_TOKEN }}
- name: Upload binaries to release
uses: svenstaro/upload-release-action@v2
with:
upload_url: ${{ needs.create-draft-release.outputs.upload_url }}
asset_path: ./nitro.tar.gz
asset_name: nitro-${{ needs.create-draft-release.outputs.version }}-amd64-tensorrt-llm-${{ matrix.cuda_arch_name }}.tar.gz
asset_content_type: application/gzip
repo_token: ${{ secrets.GITHUB_TOKEN }}
file: ./nitro.tar.gz
asset_name: nitro-${{ needs.get-version.outputs.version }}-amd64-${{ matrix.cuda_arch_name }}-arch.tar.gz
tag: ${{ github.ref }}
overwrite: true
draft: true
release_name: ${{ github.ref }}

0 comments on commit 14e3d38

Please sign in to comment.