oproj TP supports ACL graph (#4073)
### What this PR does / why we need it?
Reference: #2167. oproj TP now supports ACL graph.
- vLLM version: v0.11.0
- vLLM main:
83f478bb19
---------
Signed-off-by: zzhx1 <zzh_201018@outlook.com>
This commit is contained in:
@@ -359,4 +359,7 @@ class TestAscendConfig(TestBase):
|
||||
}
|
||||
test_vllm_config.parallel_config = ParallelConfig(
|
||||
data_parallel_size=4, tensor_parallel_size=1)
|
||||
model_path = os.path.join(os.path.dirname(__file__), "fake_weight")
|
||||
test_vllm_config.model_config = ModelConfig(model=model_path,
|
||||
enforce_eager=True)
|
||||
init_ascend_config(test_vllm_config)
|
||||
|
||||
@@ -92,7 +92,7 @@ class AscendConfig:
|
||||
raise AssertionError(
|
||||
"oproj_tensor_parallel_size is only supported in the pure DP scenario"
|
||||
)
|
||||
if not self.torchair_graph_config.enabled:
|
||||
if vllm_config.model_config.enforce_eager is True:
|
||||
raise AssertionError(
|
||||
"oproj_tensor_parallel_size is only supported in graph mode"
|
||||
)
|
||||
|
||||
Reference in New Issue
Block a user