From 67073dde85b79aa499ba51865f8e2af15f3f560a Mon Sep 17 00:00:00 2001
From: brayden-hai
Date: Thu, 18 Sep 2025 11:52:35 -0700
Subject: [PATCH] Garbage collector regression in the online server (#10621)

---
 python/sglang/srt/model_executor/cuda_graph_runner.py | 1 +
 1 file changed, 1 insertion(+)

diff --git a/python/sglang/srt/model_executor/cuda_graph_runner.py b/python/sglang/srt/model_executor/cuda_graph_runner.py
index 14da84e42..8cab1b69f 100644
--- a/python/sglang/srt/model_executor/cuda_graph_runner.py
+++ b/python/sglang/srt/model_executor/cuda_graph_runner.py
@@ -100,6 +100,7 @@ def freeze_gc(enable_cudagraph_gc: bool):
     finally:
         if should_freeze:
             gc.unfreeze()
+            gc.collect()
 
 
 def _to_torch(model: torch.nn.Module, reverse: bool, num_tokens: int):