[Communicator] Add monkey patch (#30)
Some PRs for plugin support have not been merged into vllm yet. This PR adds a monkey patch to vllm-ascend so that vllm-ascend works with vllm directly. The patch code should be removed once the related functionality is natively supported by vllm. Signed-off-by: wangxiyuan <wangxiyuan1007@gmail.com>
This commit is contained in:
@@ -88,8 +88,9 @@ class NPUPlatform(Platform):
|
||||
|
||||
@classmethod
|
||||
def check_and_update_config(cls, vllm_config: VllmConfig) -> None:
|
||||
# Register ops when setup.
|
||||
# Register ops and patch when setup.
|
||||
from vllm_ascend import ops # noqa: F401
|
||||
from vllm_ascend import patch # noqa: F401
|
||||
|
||||
parallel_config = vllm_config.parallel_config
|
||||
if parallel_config.worker_cls == "auto":
|
||||
|
||||
Reference in New Issue
Block a user