sglangv0.5.2 & support Qwen3-Next-80B-A3B-Instruct
This commit is contained in:
27
3rdparty/amd/profiling/client.sh
vendored
Executable file
27
3rdparty/amd/profiling/client.sh
vendored
Executable file
@@ -0,0 +1,27 @@
|
||||
#!/bin/bash
|
||||
|
||||
# Start profiling via API
|
||||
curl http://localhost:30000/start_profile -H "Content-Type: application/json"
|
||||
|
||||
# Benchmark serving using sglang with random dataset and tokenizer
|
||||
# Define the log file with a timestamp
|
||||
TIMESTAMP=$(date +%Y%m%d_%H%M%S)
|
||||
LOGFILE="sglang_client_log_$TIMESTAMP.json"
|
||||
|
||||
# Run the benchmark with specified parameters and save logs
|
||||
python3 -m sglang.bench_serving \
|
||||
--backend sglang \
|
||||
--tokenizer Xenova/grok-1-tokenizer \
|
||||
--dataset-name random \
|
||||
--random-input 1024\
|
||||
--random-output 1024 \
|
||||
--num-prompts 240 \
|
||||
--request-rate 8 \
|
||||
--output-file online.jsonl 2>&1 | tee "$LOGFILE"
|
||||
|
||||
# Stop profiling via API
|
||||
curl http://localhost:30000/stop_profile -H "Content-Type: application/json"
|
||||
|
||||
# Convert tracing file to csv & json
|
||||
sqlite3 trace.rpd ".mode csv" ".header on" ".output trace.csv" "select * from top;" ".output stdout"
|
||||
python3 /sgl-workspace/rocmProfileData/tools/rpd2tracing.py trace.rpd trace.json
|
||||
Reference in New Issue
Block a user