[Bugfix] Fix XliteModelRunner init failure when aclgraph is enabled (#5899)
### What this PR does / why we need it?
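Fix the XliteModelRunner initialization failure that occurs when aclgraph is
enabled, by ensuring that the graph_capture function of
vllm.v1.worker.gpu_model_runner is replaced. The module to patch is now found
by looking up GPUModelRunner in the class MRO rather than taking the immediate
base class (which is not GPUModelRunner for subclasses of NPUModelRunner), and
GPUModelRunner.capture_model is called explicitly instead of via super().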
- vLLM version: v0.13.0
- vLLM main: bde38c11df
Signed-off-by: changdawei1 <changdawei3@huawei.com>
This commit is contained in:
@@ -2992,10 +2992,16 @@ class NPUModelRunner(GPUModelRunner):
             set_draft_graph_params(self.cudagraph_batch_sizes)
 
     def capture_model(self) -> None:
-        parent_module_name = self.__class__.__base__.__module__
+        gpu_model_runner_cls = next((cls for cls in self.__class__.__mro__
+                                     if cls.__name__ == "GPUModelRunner"),
+                                    None)
+        if gpu_model_runner_cls is None:
+            raise TypeError("Could not find GPUModelRunner in the MRO. "
+                            "The class hierarchy may have changed.")
+        parent_module_name = gpu_model_runner_cls.__module__
         with _torch_cuda_wrapper(), _replace_gpu_model_runner_function_wrapper(
                 parent_module_name):
-            super().capture_model()
+            GPUModelRunner.capture_model(self)
 
     def _prepare_multimodal_fields(self):
         """
Reference in New Issue
Block a user