feat: Add model version tracking with API endpoints and response metadata (#8795)

This commit is contained in:
Chengxing Xie
2025-08-15 03:13:46 +08:00
committed by GitHub
parent 2cc9eeab01
commit c1c7dc4534
9 changed files with 320 additions and 1 deletion

View File

@@ -373,6 +373,7 @@ class OpenAIServingCompletion(OpenAIServingBase):
created=created,
choices=choices,
usage=usage,
metadata={"weight_version": ret[0]["meta_info"]["weight_version"]},
)
def _get_echo_text(self, request: CompletionRequest, index: int) -> str: