[CI] Split test cases in CI for better load balancing (#2180)

This commit is contained in:
Lianmin Zheng
2024-11-25 04:58:16 -08:00
committed by GitHub
parent 538fa0ae13
commit 254fd130e2
6 changed files with 37 additions and 23 deletions

View File

@@ -6,3 +6,7 @@ pip install --upgrade pip
pip install -e "python[all]"
pip install transformers==4.45.2 sentence_transformers accelerate peft
pip install flashinfer -i https://flashinfer.ai/whl/cu121/torch2.4/ --force-reinstall
# for compiling eagle kernels
pip install cutex
# for compiling xgrammar kernels
pip install cuda-python nvidia-cuda-nvrtc-cu12