misc: update test config (#990)

This commit is contained in:
Yineng Zhang
2024-08-11 02:20:30 +08:00
committed by GitHub
parent 7599badeaf
commit e712837d38
3 changed files with 5 additions and 5 deletions

View File

@@ -20,7 +20,7 @@ concurrency:
 jobs:
 e2e-test:
 if: github.repository == 'sgl-project/sglang' || github.event_name == 'pull_request'
-runs-on: self-hosted
+runs-on: bench
 steps:
 - name: Checkout code
@@ -38,6 +38,7 @@ jobs:
 - name: Benchmark Serving Throughput
 run: |
 python3 -m sglang.launch_server --model meta-llama/Meta-Llama-3.1-8B-Instruct --port 8413 --disable-radix-cache &
+SERVER_PID=$!
 echo "Waiting for server to start..."
 for i in {1..120}; do
@@ -52,7 +53,7 @@ jobs:
 sleep 1
 done
-cd $HOME && python3 -m sglang.bench_serving --backend sglang --port 8413 --dataset-name random --num-prompts 3000 --random-input 256 --random-output 512
+cd $HOME && python3 -m sglang.bench_serving --backend sglang --port 8413 --dataset-name random --num-prompts 500 --random-input 4096 --random-output 2048
 echo "Stopping server..."
-kill -9 $(ps aux | grep sglang | grep Meta-Llama-3.1-8B-Instruct | grep -- "--port 8413" | grep -v grep | awk '{print $2}')
+kill -9 $SERVER_PID

View File

@@ -20,7 +20,7 @@ concurrency:
 jobs:
 unit-test:
 if: github.repository == 'sgl-project/sglang' || github.event_name == 'pull_request'
-runs-on: self-hosted
+runs-on: unit
 steps:
 - name: Checkout code

View File

@@ -1,6 +1,5 @@
 # Code Structures
 - `lang`: The frontend language.
 - `srt`: The backend engine for running local models. (SRT = SGLang Runtime).
 - `test`: Test utilities.