Files
vLLM-Iluvatar_bi-100-opt/vllm_wrapper.sh

18 lines
566 B
Bash
Raw Normal View History

#!/bin/bash
#
# Wrapper placed in front of the real vLLM CLI (vllm_real).
#
# Only the "serve <model_dir>" sub-command is intercepted: the model directory
# is handed to /opt/fix_tokenizer.py and, when that helper prints a non-empty
# path on stdout, the path is forwarded to vLLM via --tokenizer. Every other
# invocation is passed through to vllm_real unchanged.
#
# Usage: vllm_wrapper.sh serve <model_dir> [vllm options...]
#        vllm_wrapper.sh <any other vllm arguments...>
set -eu

readonly VLLM_REAL=/usr/local/corex/lib64/python3/dist-packages/bin/vllm_real
readonly FIX_TOKENIZER=/opt/fix_tokenizer.py

# Intercept only "serve <model_dir>". A second argument that looks like an
# option (e.g. "serve --help") is not a model directory, so it is passed
# through untouched instead of being fed to the tokenizer helper.
if [[ "${1-}" == "serve" && -n "${2-}" && "${2-}" != -* ]]; then
  model_dir=$2
  shift 2

  # The helper is best-effort: testing its status in a condition keeps
  # `set -e` from aborting the wrapper, so vLLM still starts (without a
  # tokenizer override) when the helper fails.
  fixed_dir=""
  if ! fixed_dir=$(python3 "$FIX_TOKENIZER" "$model_dir"); then
    printf 'vllm_wrapper: %s failed for %s; starting without a tokenizer override\n' \
      "$FIX_TOKENIZER" "$model_dir" >&2
    fixed_dir=""
  fi

  if [[ -n "$fixed_dir" ]]; then
    exec "$VLLM_REAL" serve "$model_dir" --tokenizer "$fixed_dir" "$@"
  fi
  exec "$VLLM_REAL" serve "$model_dir" "$@"
fi

# Any other sub-command (or no arguments at all): transparent pass-through.
exec "$VLLM_REAL" "$@"