[router][refactor] Clean up protobuf fields (#10923)

This commit is contained in:
Chang Su
2025-09-25 17:48:47 -07:00
committed by GitHub
parent f7bab41a29
commit 7dcd689b47
5 changed files with 102 additions and 109 deletions

View File

@@ -165,28 +165,22 @@ message GenerateResponse {
// NOTE(review): this span is a rendered diff hunk whose +/- markers were
// stripped, so removed and added declarations sit side by side and several
// names and numbers appear twice; it is not a compilable definition as shown.
// Judging by the hunk header (28 lines before, 22 after), the declarations
// numbered 1-9 look like the removed version and the contiguous 1-6 set like
// the added version -- confirm against the actual .proto file.
//
// NOTE(review): fields are identified on the wire by number, not by name.
// Moving prompt_tokens (3 -> 2), completion_tokens (4 -> 3), cached_tokens
// (5 -> 4), logprobs (6 -> 5) and hidden_states (7 -> 6) therefore changes
// what each number means: 2 goes from string to int32, 5 from int32 to
// LogProbs, 6 from LogProbs to repeated float, and 3/4 silently swap between
// int32 counters. TODO: confirm every producer and consumer is rebuilt and
// deployed together; otherwise keep the old numbers and mark the dropped ones
// (text, generation_time, queue_time) as `reserved`.
message GenerateStreamChunk {
// Generated token
int32 token_id = 1;
string text = 2;
// Cumulative counts
int32 prompt_tokens = 3;
int32 completion_tokens = 4;
int32 cached_tokens = 5;
// The same three counters declared again, each shifted down by one field
// number.
int32 prompt_tokens = 2;
int32 completion_tokens = 3;
int32 cached_tokens = 4;
// Logprobs (if requested)
LogProbs logprobs = 6;
LogProbs logprobs = 5;
// Hidden states (if requested)
repeated float hidden_states = 7;
// Metadata
// NOTE(review): no units are stated for either timing field, and the two use
// different types (float vs int32) -- confirm the intended units.
float generation_time = 8; // Time to generate this token
int32 queue_time = 9; // Time spent in queue
repeated float hidden_states = 6;
}
message GenerateComplete {
// Final output
repeated int32 output_ids = 1;
string output_text = 2;
// Finish reason
enum FinishReason {
@@ -201,13 +195,18 @@ message GenerateComplete {
// The request was aborted by the user or system.
ABORT = 4;
}
FinishReason finish_reason = 3;
FinishReason finish_reason = 2;
// Token usage counts
int32 prompt_tokens = 3;
int32 completion_tokens = 4;
int32 cached_tokens = 5;
// All logprobs if requested
repeated LogProbs all_logprobs = 11;
repeated LogProbs all_logprobs = 6;
// All hidden states if requested
repeated HiddenStates all_hidden_states = 12;
repeated HiddenStates all_hidden_states = 7;
}
message GenerateError {
@@ -285,10 +284,9 @@ message EmbedComplete {
// Additional metadata
int32 embedding_dim = 4;
float generation_time = 5;
// For batch embeddings
repeated Embedding batch_embeddings = 6;
repeated Embedding batch_embeddings = 5;
}
message Embedding {