init

2026-04-02 04:53:13 +00:00
parent 80932c96e5
commit 24df76db9d
1987 changed files with 447445 additions and 0 deletions
--- a/vllm_vacc/vllm/executor/__init__.py
+++ b/vllm_vacc/vllm/executor/__init__.py
--- a/vllm_vacc/vllm/executor/__pycache__/__init__.cpython-312.pyc
+++ b/vllm_vacc/vllm/executor/__pycache__/__init__.cpython-312.pyc
--- a/vllm_vacc/vllm/executor/__pycache__/executor_base.cpython-312.pyc
+++ b/vllm_vacc/vllm/executor/__pycache__/executor_base.cpython-312.pyc
--- a/vllm_vacc/vllm/executor/executor_base.py
+++ b/vllm_vacc/vllm/executor/executor_base.py
@@ -0,0 +1,20 @@
+import asyncio
+from typing import List
+
+from vllm.v1.outputs import PoolerOutput, SamplerOutput
+from vllm.sequence import ExecuteModelRequest
+
+# class DistributedExecutorBase():
+#     """Abstract superclass of distributed executor implementations."""
+
+async def execute_model_async(  # Run one request via the driver; starts the worker loop task on first use.
+        self,
+        execute_model_req: ExecuteModelRequest) -> List[SamplerOutput]:
+    if self.parallel_worker_tasks is None:
+        # First call only: launch self._start_worker_execution_loop() as a background asyncio task.
+        self.parallel_worker_tasks = asyncio.create_task(
+            self._start_worker_execution_loop())
+        await asyncio.sleep(0)  # yield to the event loop once; presumably lets the new task begin - confirm
+    # Yield once more on every call, then return only what the driver worker produces.
+    await asyncio.sleep(0)
+    return await self._driver_execute_model_async(execute_model_req)