diff --git a/.github/workflows/_e2e_test.yaml b/.github/workflows/_e2e_test.yaml index 8e3b0d6d..cab9ca92 100644 --- a/.github/workflows/_e2e_test.yaml +++ b/.github/workflows/_e2e_test.yaml @@ -108,7 +108,7 @@ jobs: pytest -sv tests/e2e/singlecard/spec_decode_v1/test_v1_mtp_correctness.py pytest -sv tests/e2e/singlecard/spec_decode_v1/test_v1_mtp_torchair_correctness.py # Fix me: test_eagle_correctness OOM error - pytest -sv tests/e2e/singlecard/spec_decode_v1/test_v1_spec_decode.py + #pytest -sv tests/e2e/singlecard/spec_decode_v1/test_v1_spec_decode.py e2e-2-cards: name: multicard-2 diff --git a/.github/workflows/format_pr_body.yaml b/.github/workflows/format_pr_body.yaml index 5585e759..1493c661 100644 --- a/.github/workflows/format_pr_body.yaml +++ b/.github/workflows/format_pr_body.yaml @@ -36,7 +36,7 @@ jobs: - name: Get vLLM version run: | - VLLM_COMMIT=v0.12.0 + VLLM_COMMIT=ad32e3e19ccf0526cb6744a5fed09a138a5fb2f9 echo "VLLM_COMMIT=https://github.com/vllm-project/vllm/commit/$VLLM_COMMIT" >> $GITHUB_ENV - name: Checkout repository diff --git a/.github/workflows/vllm_ascend_test_pr_full.yaml b/.github/workflows/vllm_ascend_test_pr_full.yaml index 1c6993cf..62c32ca0 100644 --- a/.github/workflows/vllm_ascend_test_pr_full.yaml +++ b/.github/workflows/vllm_ascend_test_pr_full.yaml @@ -69,7 +69,7 @@ jobs: name: e2e-full strategy: matrix: - vllm_version: [v0.12.0] + vllm_version: [ad32e3e19ccf0526cb6744a5fed09a138a5fb2f9, v0.12.0] needs: [changes] if: ${{ needs.changes.outputs.e2e_tracker == 'true' }} uses: ./.github/workflows/_e2e_test.yaml diff --git a/.github/workflows/vllm_ascend_test_pr_light.yaml b/.github/workflows/vllm_ascend_test_pr_light.yaml index fdb765ed..4e40c013 100644 --- a/.github/workflows/vllm_ascend_test_pr_light.yaml +++ b/.github/workflows/vllm_ascend_test_pr_light.yaml @@ -42,7 +42,7 @@ jobs: lint: uses: ./.github/workflows/pre-commit.yml with: - vllm: v0.12.0 + vllm: ad32e3e19ccf0526cb6744a5fed09a138a5fb2f9 changes: runs-on: ubuntu-latest outputs: @@ -84,8 +84,8 @@ jobs: SOC_VERSION: ascend910b1 strategy: matrix: - vllm_version: [v0.12.0] - + vllm_version: [ad32e3e19ccf0526cb6744a5fed09a138a5fb2f9, v0.12.0] + steps: - name: Free up disk space uses: jlumbroso/free-disk-space@54081f138730dfa15788a46383842cd2f914a1be # v1.3.1 @@ -157,7 +157,7 @@ jobs: name: e2e-light strategy: matrix: - vllm_version: [v0.12.0] + vllm_version: [ad32e3e19ccf0526cb6744a5fed09a138a5fb2f9, v0.12.0] # Note (yikun): If CI resource are limited we can split job into two chain jobs needs: [lint, changes] # only trigger e2e test after lint passed and the change is e2e related with pull request. diff --git a/docs/source/community/versioning_policy.md b/docs/source/community/versioning_policy.md index 38130569..46c70867 100644 --- a/docs/source/community/versioning_policy.md +++ b/docs/source/community/versioning_policy.md @@ -44,7 +44,7 @@ The table below is the release compatibility matrix for vLLM Ascend release. For main branch of vLLM Ascend, we usually make it compatible with the latest vLLM release and a newer commit hash of vLLM. Please note that this table is usually updated. Please check it regularly. | vLLM Ascend | vLLM | Python | Stable CANN | PyTorch/torch_npu | |-------------|--------------|------------------|-------------|--------------------| -| main | v0.12.0 tag | >= 3.10, < 3.12 | 8.3.RC2 | 2.8.0 / 2.8.0 | +| main | ad32e3e19ccf0526cb6744a5fed09a138a5fb2f9, v0.12.0 tag | >= 3.10, < 3.12 | 8.3.RC2 | 2.8.0 / 2.8.0 | ## Release cadence