[RL] fix skip_server_warmup and rl health_generate logic (#8757)
This commit is contained in:
@@ -473,6 +473,7 @@ class Scheduler(
|
||||
self.memory_saver_adapter = TorchMemorySaverAdapter.create(
|
||||
enable=server_args.enable_memory_saver
|
||||
)
|
||||
+ self.offload_tags = set()
|
||||
self.init_profier()
|
||||
|
||||
self.recv_skipper = SchedulerRecvSkipper.maybe_create(server_args)
|
||||
@@ -1040,7 +1041,9 @@ class Scheduler(
|
||||
for recv_req in recv_reqs:
|
||||
# If it is a health check generation request and there are running requests, ignore it.
|
||||
if is_health_check_generate_req(recv_req) and (
|
||||
- self.chunked_req is not None or not self.running_batch.is_empty()
|
||||
+ self.chunked_req is not None
|
||||
+ or not self.running_batch.is_empty()
|
||||
+ or len(self.offload_tags) > 0
|
||||
):
|
||||
self.return_health_check_ct += 1
|
||||
continue
|
||||
|
||||
Reference in New Issue
Block a user