[CI] rename Qwen2.5-0.5B-Instruct-W8A8 model (#1145)
1. Rename vllm-ascend/Qwen2.5-0.5B-Instruct-W8A8-new to vllm-ascend/Qwen2.5-0.5B-Instruct-W8A8.

Signed-off-by: 22dimensions <waitingwind@foxmail.com>
This commit is contained in:
@@ -39,7 +39,7 @@ MODELS = [
|
|||||||
MULTIMODALITY_MODELS = ["Qwen/Qwen2.5-VL-3B-Instruct"]
|
MULTIMODALITY_MODELS = ["Qwen/Qwen2.5-VL-3B-Instruct"]
|
||||||
|
|
||||||
QUANTIZATION_MODELS = [
|
QUANTIZATION_MODELS = [
|
||||||
"vllm-ascend/Qwen2.5-0.5B-Instruct-W8A8-new",
|
"vllm-ascend/Qwen2.5-0.5B-Instruct-W8A8",
|
||||||
]
|
]
|
||||||
os.environ["PYTORCH_NPU_ALLOC_CONF"] = "max_split_size_mb:256"
|
os.environ["PYTORCH_NPU_ALLOC_CONF"] = "max_split_size_mb:256"
|
||||||
|
|
||||||
|
|||||||
Reference in New Issue
Block a user