[RL] add --skip-server-warmup (#7416)
This commit is contained in:
@@ -932,11 +932,9 @@ def launch_server(
|
|||||||
warmup_thread.join()
|
warmup_thread.join()
|
||||||
|
|
||||||
|
|
||||||
def _wait_and_warmup(
|
def _execute_server_warmup(
|
||||||
server_args: ServerArgs,
|
server_args: ServerArgs,
|
||||||
pipe_finish_writer: Optional[multiprocessing.connection.Connection],
|
pipe_finish_writer: Optional[multiprocessing.connection.Connection],
|
||||||
image_token_text: str,
|
|
||||||
launch_callback: Optional[Callable[[], None]] = None,
|
|
||||||
):
|
):
|
||||||
headers = {}
|
headers = {}
|
||||||
url = server_args.url()
|
url = server_args.url()
|
||||||
@@ -961,7 +959,7 @@ def _wait_and_warmup(
|
|||||||
pipe_finish_writer.send(last_traceback)
|
pipe_finish_writer.send(last_traceback)
|
||||||
logger.error(f"Initialization failed. warmup error: {last_traceback}")
|
logger.error(f"Initialization failed. warmup error: {last_traceback}")
|
||||||
kill_process_tree(os.getpid())
|
kill_process_tree(os.getpid())
|
||||||
return
|
return success
|
||||||
|
|
||||||
model_info = res.json()
|
model_info = res.json()
|
||||||
|
|
||||||
@@ -1035,10 +1033,25 @@ def _wait_and_warmup(
|
|||||||
pipe_finish_writer.send(last_traceback)
|
pipe_finish_writer.send(last_traceback)
|
||||||
logger.error(f"Initialization failed. warmup error: {last_traceback}")
|
logger.error(f"Initialization failed. warmup error: {last_traceback}")
|
||||||
kill_process_tree(os.getpid())
|
kill_process_tree(os.getpid())
|
||||||
return
|
return False
|
||||||
|
|
||||||
# Debug print
|
# Debug print
|
||||||
# logger.info(f"warmup request returns: {res.json()=}")
|
# logger.info(f"warmup request returns: {res.json()=}")
|
||||||
|
return success
|
||||||
|
|
||||||
|
|
||||||
|
def _wait_and_warmup(
|
||||||
|
server_args: ServerArgs,
|
||||||
|
pipe_finish_writer: Optional[multiprocessing.connection.Connection],
|
||||||
|
image_token_text: str,
|
||||||
|
launch_callback: Optional[Callable[[], None]] = None,
|
||||||
|
):
|
||||||
|
if not server_args.skip_server_warmup:
|
||||||
|
if not _execute_server_warmup(
|
||||||
|
server_args,
|
||||||
|
pipe_finish_writer,
|
||||||
|
):
|
||||||
|
return
|
||||||
|
|
||||||
logger.info("The server is fired up and ready to roll!")
|
logger.info("The server is fired up and ready to roll!")
|
||||||
|
|
||||||
|
|||||||
@@ -46,6 +46,7 @@ class ServerArgs:
|
|||||||
tokenizer_path: Optional[str] = None
|
tokenizer_path: Optional[str] = None
|
||||||
tokenizer_mode: str = "auto"
|
tokenizer_mode: str = "auto"
|
||||||
skip_tokenizer_init: bool = False
|
skip_tokenizer_init: bool = False
|
||||||
|
skip_server_warmup: bool = False
|
||||||
load_format: str = "auto"
|
load_format: str = "auto"
|
||||||
model_loader_extra_config: str = "{}"
|
model_loader_extra_config: str = "{}"
|
||||||
trust_remote_code: bool = False
|
trust_remote_code: bool = False
|
||||||
@@ -597,6 +598,11 @@ class ServerArgs:
|
|||||||
action="store_true",
|
action="store_true",
|
||||||
help="If set, skip init tokenizer and pass input_ids in generate request.",
|
help="If set, skip init tokenizer and pass input_ids in generate request.",
|
||||||
)
|
)
|
||||||
|
parser.add_argument(
|
||||||
|
"--skip-server-warmup",
|
||||||
|
action="store_true",
|
||||||
|
help="If set, skip warmup.",
|
||||||
|
)
|
||||||
parser.add_argument(
|
parser.add_argument(
|
||||||
"--load-format",
|
"--load-format",
|
||||||
type=str,
|
type=str,
|
||||||
|
|||||||
Reference in New Issue
Block a user