# Three plain (non-exported) shell variable assignments, one per line.
# NOTE(review): the meaning of each value is defined by whatever consumes
# this file; that consumer is not visible here -- confirm before changing them.
FRAMEWORK=vllm_tokenizer_patch
GPU_TYPE=Kunlun_P800
TASK_TYPE=text-generation