FRAMEWORK=vllm_tokenizer_patch GPU_TYPE=Kunlunxin_p-800 TASK_TYPE=text-generation