AITER backend extension and workload optimizations (#6838)
Co-authored-by: wunhuang <wunhuang@amd.com>
Co-authored-by: Hubert Lu <Hubert.Lu@amd.com>
This commit is contained in:
2
.github/workflows/pr-test-amd.yml
vendored
2
.github/workflows/pr-test-amd.yml
vendored
@@ -72,7 +72,7 @@ jobs:
|
||||
- name: Evaluate accuracy (TP=2)
|
||||
timeout-minutes: 30
|
||||
run: |
|
||||
bash scripts/amd_ci_exec.sh python3 test_moe_eval_accuracy_large.py
|
||||
bash scripts/amd_ci_exec.sh -e SGLANG_USE_AITER=0 python3 test_moe_eval_accuracy_large.py
|
||||
|
||||
mla-test-1-gpu-amd:
|
||||
if: (github.repository == 'sgl-project/sglang' || github.event_name == 'pull_request') &&
|
||||
|
||||
Reference in New Issue
Block a user