Remove dp balance metadata and minimum token balance. (#11170)

This commit is contained in:
Liangsheng Yin
2025-10-03 01:48:15 +08:00
committed by GitHub
parent bfcd9b2433
commit 7ff740a6ce
11 changed files with 77 additions and 316 deletions

View File

@@ -120,11 +120,8 @@ message GenerateRequest {
// Data parallel routing
int32 data_parallel_rank = 16;
-// For load balancing
-int32 dp_balance_id = 17;
 // Whether client wants streaming response
-bool stream = 18;
+bool stream = 17;
}
message TokenizedInput {