---
# Display name of this workflow.
name: 'PR Test (Xeon)'

# Triggers: pushes to main, pull requests targeting main (only on the
# `synchronize` and `labeled` activity types), and manual dispatch.
# Push and pull_request events are further limited to the listed paths.
on:
  push:
    branches:
      - main
    paths:
      - 'python/**'
      - 'scripts/ci/**'
      - 'test/**'
      - 'sgl-kernel/**'
      - '.github/workflows/pr-test-xeon.yml'
  pull_request:
    types:
      - synchronize
      - labeled
    branches:
      - main
    paths:
      - 'python/**'
      - 'scripts/ci/**'
      - 'test/**'
      - 'sgl-kernel/**'
      - '.github/workflows/pr-test-xeon.yml'
  workflow_dispatch:

# One concurrency group per git ref. A run that is already in progress is
# not cancelled when a newer run for the same ref is triggered.
concurrency:
  cancel-in-progress: false
  group: 'pr-test-xeon-${{ github.ref }}'

jobs:
  # Builds the Xeon Docker image from the checked-out tree, installs
  # sgl-kernel and sglang inside a container started from that image, and
  # runs the `per-commit-cpu` test suite in it.
  build-test:
    # Non-pull_request events always run; pull requests run only when they
    # carry the `run-ci` label.
    if: github.event_name != 'pull_request' || contains(github.event.pull_request.labels.*.name, 'run-ci')
    runs-on: xeon-gnr
    env:
      # Host directory bind-mounted into the container as the Hugging Face
      # cache (see "Run container").
      HF_HOME: /home/sdp/.cache/huggingface
    strategy:
      matrix:
        build_type: ['all']
    steps:
      - name: Checkout repository
        uses: actions/checkout@v4

      # Builds the image locally under the tag `sglang_xeon`; this step does
      # not push anything.
      - name: Build and Push
        run: |
          docker build . -f docker/Dockerfile.xeon -t sglang_xeon --no-cache

      # Starts a detached container with the workspace mounted at
      # /sglang-checkout/ and the host HF cache mounted into /root.
      - name: Run container
        run: |
          docker run -dt \
            -v ${{ github.workspace }}:/sglang-checkout/ --ipc=host \
            -v ${HF_HOME}:/root/.cache/huggingface \
            --name ci_sglang_xeon \
            sglang_xeon

      # Replaces any preinstalled sgl-kernel with a build of the checked-out
      # sources, then installs sglang in editable mode with the dev_cpu extra.
      - name: Install dependencies
        timeout-minutes: 20
        run: |
          docker exec ci_sglang_xeon bash -c "python3 -m pip install --upgrade pip"
          docker exec ci_sglang_xeon pip uninstall sgl-kernel -y || true
          docker exec -w /sglang-checkout/sgl-kernel ci_sglang_xeon bash -c "cp pyproject_cpu.toml pyproject.toml && pip install -v ."
          docker exec -w /sglang-checkout/ ci_sglang_xeon bash -c "rm -rf python/pyproject.toml && mv python/pyproject_other.toml python/pyproject.toml"
          # The requirement is single-quoted so that neither the host shell
          # nor the container shell treats `[dev_cpu]` as a glob pattern.
          docker exec -w /sglang-checkout/ ci_sglang_xeon bash -c "pip install -e 'python[dev_cpu]'"

      # Asserts that torch reports AMX tile support and that sgl_kernel
      # exposes `convert_weight_packed`. A failure here does not fail the
      # job (continue-on-error); it only causes the unit tests to be skipped.
      - name: Check AMX support
        id: check_amx
        timeout-minutes: 5
        continue-on-error: true
        run: |
          docker exec -w /sglang-checkout/ ci_sglang_xeon \
            bash -c "python3 -c 'import torch; import sgl_kernel; assert torch._C._cpu._is_amx_tile_supported(); assert hasattr(torch.ops.sgl_kernel, \"convert_weight_packed\"); '"

      - name: Run unit tests
        if: steps.check_amx.outcome == 'success'
        timeout-minutes: 36
        run: |
          docker exec -w /sglang-checkout/ ci_sglang_xeon \
            bash -c "cd ./test/srt && python3 run_suite.py --suite per-commit-cpu"

      # Runs even when an earlier step failed, so the bind-mounted workspace
      # is still handed back to the runner user. `$(id -u)` and `$(id -g)`
      # sit inside a double-quoted string and are therefore expanded by the
      # host shell, i.e. they are the runner user's ids.
      - name: Change permission
        if: always()
        timeout-minutes: 2
        run: |
          docker exec -u root ci_sglang_xeon bash -c "
            rm -rf /tmp/ci-home &&
            chown -R $(id -u):$(id -g) /sglang-checkout/ 2>/dev/null || true
          "

      # Always remove the fixed-name container so the next run can reuse the
      # name.
      - name: Cleanup container
        if: always()
        run: |
          docker rm -f ci_sglang_xeon || true