Turn on overlap scheduler for multimodal models (#5771)

This commit is contained in:
Lianmin Zheng
2025-04-27 23:45:09 -07:00
committed by GitHub
parent ef15dcda26
commit 3029889cb4

View File

@@ -248,9 +248,6 @@ class Scheduler(
if not self.is_generation:
self.enable_overlap = False
logger.info("Overlap scheduler is disabled for embedding models.")
-if self.model_config.is_multimodal:
-self.enable_overlap = False
-logger.info("Overlap scheduler is disabled for multimodal models.")
# Launch a tensor parallel worker
if self.enable_overlap: