Turn on overlap scheduler for multimodal models (#5771)
This commit is contained in:
@@ -248,9 +248,6 @@ class Scheduler(
         if not self.is_generation:
             self.enable_overlap = False
             logger.info("Overlap scheduler is disabled for embedding models.")
-        if self.model_config.is_multimodal:
-            self.enable_overlap = False
-            logger.info("Overlap scheduler is disabled for multimodal models.")
 
         # Launch a tensor parallel worker
         if self.enable_overlap:
Reference in New Issue
Block a user