From 252d761afc903b34e2c18e7e9cac686eb9c54645 Mon Sep 17 00:00:00 2001
From: 4paradigm <4paradigm@4paradigmdeMacBook-Pro.local>
Date: Tue, 30 Jun 2026 15:35:45 +0800
Subject: [PATCH] fix tokenizer

---
 vllm_wrapper.sh | 33 +++++++++++++++++++++++++++++++++
 1 file changed, 33 insertions(+)
 create mode 100644 vllm_wrapper.sh

diff --git a/vllm_wrapper.sh b/vllm_wrapper.sh
new file mode 100644
index 0000000..a8f10e8
--- /dev/null
+++ b/vllm_wrapper.sh
@@ -0,0 +1,33 @@
+#!/bin/bash
+#
+# Wrapper around the real vLLM launcher (/opt/vllm_kunlun/bin/vllm_real).
+#
+# For `serve <model>` it runs /opt/fix_tokenizer.py on the model argument and,
+# when that helper prints a non-empty value, passes it on via --tokenizer.
+# Every other invocation is forwarded to the real binary unchanged.
+set -e
+
+readonly VLLM_REAL=/opt/vllm_kunlun/bin/vllm_real
+readonly FIX_TOKENIZER=/opt/fix_tokenizer.py
+
+# Only intercept "serve <model>"; a second argument that looks like an option
+# (e.g. `serve --help`) is not a model path, so it is passed straight through.
+if [ "$1" = "serve" ] && [ -n "$2" ] && [ "${2#-}" = "$2" ]; then
+  MODEL_DIR="$2"
+  shift 2
+
+  # Best effort: a failing helper must not prevent the server from starting,
+  # so its exit status is handled here instead of tripping `set -e`.
+  if ! FIXED_DIR=$(python3 "$FIX_TOKENIZER" "$MODEL_DIR"); then
+    printf '%s\n' "vllm_wrapper: fix_tokenizer.py failed; starting without --tokenizer" >&2
+    FIXED_DIR=""
+  fi
+
+  if [ -n "$FIXED_DIR" ]; then
+    exec "$VLLM_REAL" serve "$MODEL_DIR" --tokenizer "$FIXED_DIR" "$@"
+  else
+    exec "$VLLM_REAL" serve "$MODEL_DIR" "$@"
+  fi
+fi
+
+exec "$VLLM_REAL" "$@"