init
This commit is contained in:
0
vllm_vacc/vllm/executor/__init__.py
Normal file
0
vllm_vacc/vllm/executor/__init__.py
Normal file
BIN
vllm_vacc/vllm/executor/__pycache__/__init__.cpython-312.pyc
Normal file
BIN
vllm_vacc/vllm/executor/__pycache__/__init__.cpython-312.pyc
Normal file
Binary file not shown.
Binary file not shown.
20
vllm_vacc/vllm/executor/executor_base.py
Normal file
20
vllm_vacc/vllm/executor/executor_base.py
Normal file
@@ -0,0 +1,20 @@
|
||||
import asyncio
|
||||
from typing import List
|
||||
|
||||
from vllm.v1.outputs import PoolerOutput, SamplerOutput
|
||||
from vllm.sequence import ExecuteModelRequest
|
||||
|
||||
# class DistributedExecutorBase():
|
||||
# """Abstract superclass of distributed executor implementations."""
|
||||
|
||||
async def execute_model_async(
    self,
    execute_model_req: ExecuteModelRequest,
) -> List[SamplerOutput]:
    """Run one model step through the driver and return its outputs.

    On the first call (while ``self.parallel_worker_tasks`` is ``None``)
    the coroutine returned by ``self._start_worker_execution_loop()`` is
    scheduled as an asyncio task and stored on the instance, so later
    calls reuse it.

    Args:
        execute_model_req: The request forwarded unchanged to
            ``self._driver_execute_model_async``.

    Returns:
        Whatever ``self._driver_execute_model_async`` resolves to.
    """
    if self.parallel_worker_tasks is None:
        # Start model execution loop running in the parallel workers.
        worker_loop = self._start_worker_execution_loop()
        self.parallel_worker_tasks = asyncio.create_task(worker_loop)
        # Yield once to the event loop right after scheduling the task.
        # NOTE(review): the indentation of this yield was reconstructed;
        # it is assumed to belong to the first-start branch -- confirm.
        await asyncio.sleep(0)

    # Yield to the event loop once more before driving the model.
    await asyncio.sleep(0)

    # Only the driver worker returns the sampling results.
    driver_outputs = await self._driver_execute_model_async(execute_model_req)
    return driver_outputs
|
||||
Reference in New Issue
Block a user