36 lines
821 B
Bash
36 lines
821 B
Bash
|
|
#!/bin/bash
|
||
|
|
set -e
|
||
|
|
|
||
|
|
MODEL_DIR=${1:-/model}
|
||
|
|
shift || true
|
||
|
|
|
||
|
|
FIX_TOKENIZER_DIR=/tmp/fixed_tokenizer
|
||
|
|
AUTO_FIX=${AUTO_FIX_TOKENIZER:-auto}
|
||
|
|
|
||
|
|
echo "[entrypoint] model dir: $MODEL_DIR"
|
||
|
|
|
||
|
|
NEED_FIX=0
|
||
|
|
|
||
|
|
if [ "$AUTO_FIX" = "1" ] || [ "$AUTO_FIX" = "true" ]; then
|
||
|
|
NEED_FIX=1
|
||
|
|
elif [ "$AUTO_FIX" = "auto" ]; then
|
||
|
|
if [ -f "$MODEL_DIR/tokenizer_config.json" ]; then
|
||
|
|
if grep -q "TokenizersBackend\|TiktokenTokenizer" "$MODEL_DIR/tokenizer_config.json"; then
|
||
|
|
NEED_FIX=1
|
||
|
|
fi
|
||
|
|
fi
|
||
|
|
fi
|
||
|
|
|
||
|
|
if [ $NEED_FIX -eq 1 ]; then
|
||
|
|
echo "[entrypoint] fixing tokenizer..."
|
||
|
|
python3 /opt/fix_tokenizer.py
|
||
|
|
TOKENIZER_ARG="--tokenizer $FIX_TOKENIZER_DIR"
|
||
|
|
else
|
||
|
|
echo "[entrypoint] tokenizer OK, skip fix"
|
||
|
|
TOKENIZER_ARG=""
|
||
|
|
fi
|
||
|
|
|
||
|
|
echo "[entrypoint] starting vllm..."
|
||
|
|
|
||
|
|
exec vllm serve "$MODEL_DIR" $TOKENIZER_ARG "$@"
|