Add accuracy test to CI: MMLU (#882)

This commit is contained in:
Ying Sheng
2024-08-01 21:20:17 -07:00
committed by GitHub
parent 76e59088d8
commit ae7ee01a8e
24 changed files with 831 additions and 136 deletions

View File

@@ -18,7 +18,7 @@ concurrency:
cancel-in-progress: true
jobs:
pr-e2e-test:
e2e-test:
runs-on: self-hosted
env:
@@ -38,7 +38,7 @@ jobs:
pip install flashinfer -i https://flashinfer.ai/whl/cu121/torch2.3/ --force-reinstall
pip install --upgrade transformers
- name: Benchmark Serving
- name: Benchmark Serving Throughput
run: |
cd /data/zhyncs/venv && source ./bin/activate && cd -
python3 -m sglang.launch_server --model meta-llama/Meta-Llama-3.1-8B-Instruct --port 8413 --disable-radix-cache &

View File

@@ -59,3 +59,10 @@ jobs:
cd test/srt
python3 test_openai_server.py
- name: Test Accuracy
run: |
cd /data/zhyncs/venv && source ./bin/activate && cd -
cd test/srt
python3 test_eval_accuracy.py