Tiny add Engine.flush_cache API (#5241)

This commit is contained in:
fzyzcjy
2025-04-21 09:15:03 +08:00
committed by GitHub
parent 5239d79568
commit 1195182040
5 changed files with 29 additions and 11 deletions

View File

@@ -60,7 +60,8 @@ from sglang.srt.managers.io_struct import (
CloseSessionReqInput,
ExpertDistributionReq,
ExpertDistributionReqOutput,
FlushCacheReq,
FlushCacheReqInput,
FlushCacheReqOutput,
GetInternalStateReq,
GetInternalStateReqOutput,
GetWeightsByNameReqInput,
@@ -402,7 +403,7 @@ class Scheduler(
[
(TokenizedGenerateReqInput, self.handle_generate_request),
(TokenizedEmbeddingReqInput, self.handle_embedding_request),
(FlushCacheReq, self.flush_cache_wrapped),
(FlushCacheReqInput, self.flush_cache_wrapped),
(AbortReq, self.abort_request),
(OpenSessionReqInput, self.open_session),
(CloseSessionReqInput, self.close_session),
@@ -1596,8 +1597,9 @@ class Scheduler(
time.sleep(5)
self.parent_process.send_signal(signal.SIGQUIT)
# NOTE(review): presumably the pre-change side of this hunk -- the header
# counts 8 old vs 9 new lines and the +/- markers were lost in extraction.
# This variant accepts a FlushCacheReq, never reads recv_req, and calls
# flush_cache() without returning its result (so the handler yields None).
# The FlushCacheReqInput definition directly below appears to replace it.
def flush_cache_wrapped(self, recv_req: FlushCacheReq):
self.flush_cache()
# Handler paired with FlushCacheReqInput in the (type, handler) list shown
# earlier in this diff. recv_req is only used for dispatch; it is not read.
# Runs flush_cache() and wraps whatever it returns as the `success` field of
# a FlushCacheReqOutput, so the requester gets an explicit result object.
# NOTE(review): flush_cache's return value is not visible in this view --
# presumably a bool; confirm against its body.
def flush_cache_wrapped(self, recv_req: FlushCacheReqInput):
success = self.flush_cache()
return FlushCacheReqOutput(success=success)
def flush_cache(self):
"""Flush the memory pool and cache."""