[ci] disable memory imbalance check for draft worker (#8108)
This commit is contained in:
@@ -561,7 +561,7 @@ class ModelRunner:
|
|||||||
|
|
||||||
# Check memory for tensor parallelism
|
# Check memory for tensor parallelism
|
||||||
local_gpu_memory = get_available_gpu_memory(self.device, self.gpu_id)
|
local_gpu_memory = get_available_gpu_memory(self.device, self.gpu_id)
|
||||||
if self.tp_size > 1:
|
if self.tp_size > 1 and not self.is_draft_worker:
|
||||||
if min_per_gpu_memory < local_gpu_memory * 0.9:
|
if min_per_gpu_memory < local_gpu_memory * 0.9:
|
||||||
if get_bool_env_var("SGL_DISABLE_TP_MEMORY_INBALANCE_CHECK"):
|
if get_bool_env_var("SGL_DISABLE_TP_MEMORY_INBALANCE_CHECK"):
|
||||||
logger.warning(
|
logger.warning(
|
||||||
|
|||||||
Reference in New Issue
Block a user