[Bugfix] quick fix balance scheduling patch (#5281)
### What this PR does / why we need it?
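Quick fix for the balance scheduling patch: `VLLM_ASCEND_BALANCE_SCHEDULING` was parsed with `bool(os.getenv(...))`, which is `True` for any non-empty string, including the default `'0'`, so balance scheduling was always enabled. The value is now converted with `int()` first, so `'0'` disables the feature and `'1'` enables it.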
- vLLM version: release/v0.13.0
- vLLM main:
ad32e3e19c
Signed-off-by: GDzhu01 <809721801@qq.com>
This commit is contained in:
@@ -146,7 +146,7 @@ env_variables: Dict[str, Callable[[], Any]] = {
|
|||||||
lambda: int(os.getenv("VLLM_ASCEND_ENABLE_FUSED_MC2", '0')),
|
lambda: int(os.getenv("VLLM_ASCEND_ENABLE_FUSED_MC2", '0')),
|
||||||
# Whether to enable balance scheduling
|
# Whether to enable balance scheduling
|
||||||
"VLLM_ASCEND_BALANCE_SCHEDULING":
|
"VLLM_ASCEND_BALANCE_SCHEDULING":
|
||||||
lambda: bool(os.getenv("VLLM_ASCEND_BALANCE_SCHEDULING", '0')),
|
lambda: bool(int(os.getenv("VLLM_ASCEND_BALANCE_SCHEDULING", '0'))),
|
||||||
}
|
}
|
||||||
|
|
||||||
# end-env-vars-definition
|
# end-env-vars-definition
|
||||||
|
|||||||
Reference in New Issue
Block a user