refactor: add a check before layer_sharding logging (#7186)
### What this PR does / why we need it?
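Only emit the "Linear layer sharding enabled" log message when `layer_sharding` is actually set in `additional_config`; previously it was logged unconditionally, even when the option was absent.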
- vLLM version: v0.16.0
- vLLM main: 4034c3d32e
Signed-off-by: QiuChunshuo <qiuchunshuo@huawei.com>
This commit is contained in:
@@ -52,6 +52,7 @@ class AscendConfig:
|
|||||||
self.dump_config_path = additional_config.get("dump_config_path", None)
|
self.dump_config_path = additional_config.get("dump_config_path", None)
|
||||||
self._construct_weight_prefetch_config(additional_config)
|
self._construct_weight_prefetch_config(additional_config)
|
||||||
self.layer_sharding = additional_config.get("layer_sharding", None)
|
self.layer_sharding = additional_config.get("layer_sharding", None)
|
||||||
|
if self.layer_sharding:
|
||||||
logger.info_once(
|
logger.info_once(
|
||||||
f"Linear layer sharding enabled with config: {self.layer_sharding}. "
|
f"Linear layer sharding enabled with config: {self.layer_sharding}. "
|
||||||
"Note: This feature works optimally with FLASHCOMM2 and DSA-CP enabled; "
|
"Note: This feature works optimally with FLASHCOMM2 and DSA-CP enabled; "
|
||||||
|
|||||||
Reference in New Issue
Block a user