# Run descriptor: three plain shell variable assignments.
# None of them is marked with `export` here, so they are set in the shell
# that executes or sources this file.
# NOTE(review): the meanings below are inferred from the variable names only;
# confirm against whatever reads these variables.

# Presumably the serving/inference framework variant to use.
FRAMEWORK=vllm-patch-tokenizer

# Presumably the accelerator model the job targets.
GPU_TYPE=Iluvatar_bi-100

# Presumably the kind of task being run.
TASK_TYPE=text-generation