diff --git a/vllm_ascend/worker/model_runner_v1.py b/vllm_ascend/worker/model_runner_v1.py index 47ba7c8b..8000dbca 100644 --- a/vllm_ascend/worker/model_runner_v1.py +++ b/vllm_ascend/worker/model_runner_v1.py @@ -3225,6 +3225,8 @@ def _replace_gpu_model_runner_function_wrapper(target_module_name): target_module = sys.modules[target_module_name] setattr(target_module, "graph_capture", graph_capture) # noqa: B010 yield + except Exception as e: + raise RuntimeError(f"NPUModelRunner failed, error is {e}") finally: setattr(target_module, "graph_capture", graph_capture) # noqa: B010