feat: Add model version tracking with API endpoints and response metadata (#8795)
This commit is contained in:
@@ -723,6 +723,7 @@ class OpenAIServingChat(OpenAIServingBase):
|
||||
model=request.model,
|
||||
choices=choices,
|
||||
usage=usage,
|
||||
metadata={"weight_version": ret[0]["meta_info"]["weight_version"]},
|
||||
)
|
||||
|
||||
def _process_logprobs_tokens(
|
||||
|
||||
Reference in New Issue
Block a user