chore(gb200): update to CUDA 12.9 and improve build process (#8772)

This commit is contained in:
ishandhanani
2025-08-08 13:42:47 -07:00
committed by GitHub
parent 36bfddecb9
commit 4e7f025219
7 changed files with 86 additions and 50 deletions

View File

@@ -11,7 +11,7 @@ jobs:
publish:
if: github.repository == 'sgl-project/sglang'
runs-on: ubuntu-22.04-arm
environment: 'prod'
environment: "prod"
steps:
- name: Delete huge unnecessary tools folder
run: rm -rf /opt/hostedtoolcache
@@ -31,6 +31,6 @@ jobs:
- name: Build and Push
run: |
version=$(cat python/sglang/version.py | cut -d'"' -f2)
tag=v${version}-cu128-gb200
tag=v${version}-cu129-gb200
docker buildx build --platform linux/arm64 --push --output type=image -t lmsysorg/sglang:${tag} -f docker/Dockerfile.gb200 --build-arg CUDA_VERSION=12.8.1 --build-arg BUILD_TYPE=blackwell --no-cache .
docker buildx build --platform linux/arm64 --push --output type=image -t lmsysorg/sglang:${tag} -f docker/Dockerfile.gb200 --build-arg CUDA_VERSION=12.9.1 --build-arg BUILD_TYPE=blackwell --no-cache .

View File

@@ -17,17 +17,17 @@ concurrency:
cancel-in-progress: true
jobs:
build-cu128-aarch64:
build-cu129-aarch64:
if: github.repository == 'sgl-project/sglang'
runs-on: sgl-kernel-release-node
runs-on: sgl-kernel-release-node-arm
strategy:
matrix:
python-version: ['3.9']
cuda-version: ['12.8']
python-version: ["3.10"]
cuda-version: ["12.9"]
steps:
- uses: actions/checkout@v4
with:
submodules: 'recursive'
submodules: "recursive"
- name: Set up Python ${{ matrix.python-version }}
uses: actions/setup-python@v5
@@ -47,7 +47,7 @@ jobs:
path: sgl-kernel/dist/*
release:
needs: build-cu128-aarch64
needs: build-cu129-aarch64
runs-on: ubuntu-latest
steps:
- uses: actions/checkout@v4
@@ -84,7 +84,7 @@ jobs:
WHL_TOKEN: ${{ secrets.WHL_TOKEN }}
- name: Update wheel index
run: python3 scripts/update_kernel_whl_index.py --cuda 128
run: python3 scripts/update_kernel_whl_index.py --cuda 129
- name: Push wheel index
run: |