Log if cuda graph is used & extend cuda graph capture to cuda-graph-max-bs (#6201)
Co-authored-by: SangBin Cho <rkooo567@gmail.com>
This commit is contained in:
@@ -330,7 +330,7 @@ class Engine(EngineBase):
|
||||
return {
|
||||
**dataclasses.asdict(self.tokenizer_manager.server_args),
|
||||
**self.scheduler_info,
|
||||
**internal_states,
|
||||
"internal_states": internal_states,
|
||||
"version": __version__,
|
||||
}
|
||||
|
||||
|
||||
Reference in New Issue
Block a user