# vllm-v0.6.2/tests/test_mlu_ut.sh
# New file (50 lines) added by the commit "add qwen3".
# Repository forked from EngineX-Cambricon/enginex-mlu370-vllm.
# Load the shared test definitions. Because the file name has no slash, bash
# looks it up via PATH and then the current directory.
# NOTE(review): LINK_MODELS, UNLINK_MODELS, run_ut and the *_CASES lists used
# below are not defined in this script; presumably they come from this file.
source mlu_cases_list.sh

# Fail fast if the helpers did not get loaded; otherwise every later command
# would only print "command not found" and the script would still reach its
# final "All ut pass" message.
if ! command -v LINK_MODELS >/dev/null 2>&1; then
  echo "error: LINK_MODELS is not defined; was mlu_cases_list.sh sourced?" >&2
  exit 1
fi

# Link models before the tests run.
LINK_MODELS

# Record the suite start time (seconds since the epoch) so the total duration
# can be reported at the end of the script.
start_time=$(date +%s)

# Address of eth0: take the second field of the first "inet ... eth0" line
# printed by `ip address` and drop everything from the "/" on (the prefix
# length). Only the first matching line is used so the value is always a
# single line, even if several lines match. Empty when nothing matches.
HOST_IP=$(
  ip address \
    | awk '/inet.*eth0/ { split($2, addr, "/"); print addr[1]; exit }'
)

# Exported so that processes started from this script inherit it.
export VLLM_HOST_IP="${HOST_IP}"

# Benchmark cases, run with VLLM_LATENCY_DEBUG=true exported only for their
# duration. Original timing note: "It took 1419s".
# NOTE(review): run_ut and BENCHMARK_CASES are not defined in this script
# (presumably they come from mlu_cases_list.sh), and the meaning of run_ut's
# first argument (3) is defined there. The array expansion is intentionally
# left unquoted so elements are word-split exactly as before; confirm whether
# the case definitions rely on that before quoting it.
export VLLM_LATENCY_DEBUG=true
run_ut 3 ${BENCHMARK_CASES[@]}
unset VLLM_LATENCY_DEBUG

# Basic-correctness cases, run with VLLM_TEST_ENABLE_ARTIFICIAL_PREEMPT=1
# exported only for their duration.
# NOTE(review): run_ut and BASIC_CORRECTNESS_CASES are defined outside this
# script; the array is left unquoted to keep the original word splitting.
export VLLM_TEST_ENABLE_ARTIFICIAL_PREEMPT=1
run_ut 3 ${BASIC_CORRECTNESS_CASES[@]}
unset VLLM_TEST_ENABLE_ARTIFICIAL_PREEMPT

# The DISTRIBUTED_NEED_PACK cases run with the models unlinked; the links are
# restored right afterwards for the remaining suites.
# NOTE(review): unlike most other case lists, this one is expanded without
# [@]. If DISTRIBUTED_NEED_PACK_CASES is an array, only its first element is
# passed to run_ut. Left unchanged here; confirm against its definition.
UNLINK_MODELS
run_ut 3 ${DISTRIBUTED_NEED_PACK_CASES}
LINK_MODELS

# Offline cases, split into three groups that run one after another.
# NOTE(review): run_ut and the OFFLINE_CASES* arrays are defined outside this
# script; the expansions are left unquoted to keep the original word splitting.

# Group 0. Original timing note: "It took 4031s".
run_ut 3 ${OFFLINE_CASES0[@]}

# Group 1. Original timing note: "It took 884s".
run_ut 3 ${OFFLINE_CASES1[@]}

# Group 2. No duration recorded yet (original note: "It took xxxs").
run_ut 3 ${OFFLINE_CASES2[@]}

# Online cases. Original timing note: "It took 1897s".
# NOTE(review): this is the only suite that passes 30 rather than 3 as the
# first argument of run_ut; what that argument means is defined by run_ut,
# which is not visible in this script.
run_ut 30 ${ONLINE_CASES[@]}

# examples/cambricon_custom_func cases
# SCRIPT_DIR is the absolute, symlink-resolved directory that contains this
# script. Both expansions are quoted so a path with whitespace is not split.
SCRIPT_DIR=$(dirname "$(readlink -f "$0")")
# Run the custom-function cases from their own tests directory, then return to
# the previous directory. Abort if the directory cannot be entered: otherwise
# the cases would run from the wrong directory and popd would fail as well.
# NOTE(review): CAMBRICON_CUSTOM_FUNC_CASES is expanded without [@]; if it is
# an array only its first element is passed. Left unchanged; confirm against
# its definition.
if ! pushd "${SCRIPT_DIR}/../examples/cambricon_custom_func/tests"; then
  echo "error: cannot enter ${SCRIPT_DIR}/../examples/cambricon_custom_func/tests" >&2
  exit 1
fi
run_ut 1 ${CAMBRICON_CUSTOM_FUNC_CASES}
popd

# Report the wall-clock duration of the whole run, in seconds, measured from
# the start_time recorded near the top of the script.
# NOTE(review): the message below is printed whenever this line is reached;
# whether that really means every case passed depends on run_ut aborting the
# script on failure, which is not visible here.
end_time=$(date +%s)

exec_time=$((end_time - start_time))

echo "All ut pass, total time ${exec_time}s."

# Unlink the models again now that all suites have finished.
UNLINK_MODELS
Reference in New Issue
Block a user