Garbage collector regression in the online server (#10621)

This commit is contained in:
brayden-hai
2025-09-18 11:52:35 -07:00
committed by GitHub
parent 9a5c42f9ad
commit 67073dde85

View File

@@ -100,6 +100,7 @@ def freeze_gc(enable_cudagraph_gc: bool):
finally:
if should_freeze:
gc.unfreeze()
gc.collect()
def _to_torch(model: torch.nn.Module, reverse: bool, num_tokens: int):