OpenAI API hidden states (#6716)
This commit is contained in:
@@ -215,6 +215,7 @@ class ServerArgs:
|
||||
disable_chunked_prefix_cache: bool = False
|
||||
disable_fast_image_processor: bool = False
|
||||
warmups: Optional[str] = None
|
||||
enable_return_hidden_states: bool = False
|
||||
|
||||
# Debug tensor dumps
|
||||
debug_tensor_dump_output_folder: Optional[str] = None
|
||||
@@ -1456,6 +1457,12 @@ class ServerArgs:
|
||||
default=ServerArgs.debug_tensor_dump_inject,
|
||||
help="Inject the outputs from jax as the input of every layer.",
|
||||
)
|
||||
|
||||
parser.add_argument(
|
||||
"--enable-return-hidden-states",
|
||||
action="store_true",
|
||||
help="Enable returning hidden states with responses.",
|
||||
)
|
||||
parser.add_argument(
|
||||
"--debug-tensor-dump-prefill-only",
|
||||
action="store_true",
|
||||
|
||||
Reference in New Issue
Block a user