From cee9b715b578c20147948aa0336baf428cf1970b Mon Sep 17 00:00:00 2001 From: zhangxinyuehfad <59153331+zhangxinyuehfad@users.noreply.github.com> Date: Fri, 19 Dec 2025 10:40:46 +0800 Subject: [PATCH] [Bugfix] install trition for test_custom_op (#5112) ### What this PR does / why we need it? 1. install trition for test_custom_op 2. tests/e2e/nightly/ops test timeout, set timeout-minutes let it test over: https://github.com/vllm-project/vllm-ascend/actions/runs/20326482497/job/58392757707?pr=5112 3. ignore test_dispatch_ffn_combine until it is fixed @kiscad ### Does this PR introduce _any_ user-facing change? ### How was this patch tested? - vLLM version: v0.12.0 - vLLM main: https://github.com/vllm-project/vllm/commit/ad32e3e19ccf0526cb6744a5fed09a138a5fb2f9 Signed-off-by: hfadzxy --- .../workflows/_e2e_nightly_single_node.yaml | 18 ++++++++++++------ .github/workflows/nightly_test_a2.yaml | 1 + 2 files changed, 13 insertions(+), 6 deletions(-) diff --git a/.github/workflows/_e2e_nightly_single_node.yaml b/.github/workflows/_e2e_nightly_single_node.yaml index fbabe7ff..df91260f 100644 --- a/.github/workflows/_e2e_nightly_single_node.yaml +++ b/.github/workflows/_e2e_nightly_single_node.yaml @@ -54,6 +54,7 @@ jobs: e2e-nightly: name: ${{ inputs.tests }} runs-on: ${{ inputs.runner }} + timeout-minutes: 600 container: image: ${{ inputs.image }} steps: @@ -126,6 +127,14 @@ jobs: pip install custom_ops-1.0-cp311-cp311-linux_aarch64.whl . /usr/local/Ascend/ascend-toolkit/set_env.sh + - name: Install triton-ascend + if: ${{ inputs.name == 'test_custom_op' }} + shell: bash -l {0} + run: | + . /usr/local/Ascend/ascend-toolkit/8.3.RC2/bisheng_toolkit/set_env.sh + wget https://vllm-ascend.obs.cn-north-4.myhuaweicloud.com/vllm-ascend/triton_ascend-3.2.0.dev2025110717-cp311-cp311-manylinux_2_27_aarch64.whl + pip install triton_ascend-3.2.0.dev2025110717-cp311-cp311-manylinux_2_27_aarch64.whl + - name: Run vllm-project/vllm-ascend test env: VLLM_WORKER_MULTIPROC_METHOD: spawn @@ -134,10 +143,7 @@ jobs: BENCHMARK_HOME: /vllm-workspace/vllm-ascend/benchmark working-directory: /vllm-workspace/vllm-ascend run: | - pytest -sv ${{ inputs.tests }} + # ignore test_dispatch_ffn_combine until the test is fixed + pytest -sv ${{ inputs.tests }} \ + --ignore=tests/e2e/nightly/ops/test_dispatch_ffn_combine.py - - name: Install triton-ascend - run: | - source /usr/local/Ascend/ascend-toolkit/8.3.RC2/bisheng_toolkit/set_env.sh - wget https://vllm-ascend.obs.cn-north-4.myhuaweicloud.com/vllm-ascend/triton_ascend-3.2.0.dev2025110717-cp311-cp311-manylinux_2_27_aarch64.whl - pip install triton_ascend-3.2.0.dev2025110717-cp311-cp311-manylinux_2_27_aarch64.whl diff --git a/.github/workflows/nightly_test_a2.yaml b/.github/workflows/nightly_test_a2.yaml index dee605cc..d1113622 100644 --- a/.github/workflows/nightly_test_a2.yaml +++ b/.github/workflows/nightly_test_a2.yaml @@ -63,6 +63,7 @@ jobs: vllm: v0.12.0 runner: ${{ matrix.test_config.os }} tests: ${{ matrix.test_config.tests }} + name: ${{ matrix.test_config.name }} image: 'swr.cn-southwest-2.myhuaweicloud.com/base_image/ascend-ci/vllm-ascend:nightly-a2' single-node-accuracy-tests: