forked from EngineX-MetaX/enginex-c_series-vllm
Add support for Qwen3 MoE+GPTQ
This commit is contained in:
@@ -522,7 +522,6 @@ class EngineArgs:
|
||||
help="Disable async output processing. This may result in "
|
||||
"lower performance.")
|
||||
model_group.add_argument("--config-format",
|
||||
choices=[f.value for f in ConfigFormat],
|
||||
**model_kwargs["config_format"])
|
||||
# This one is a special case because it can be bool
|
||||
# or str. TODO: Handle this in get_kwargs
|
||||
|
||||
Reference in New Issue
Block a user