diff --git a/sgl-router/src/grpc_client/sglang_scheduler.rs b/sgl-router/src/grpc_client/sglang_scheduler.rs index e1d91c842..6d36feea5 100644 --- a/sgl-router/src/grpc_client/sglang_scheduler.rs +++ b/sgl-router/src/grpc_client/sglang_scheduler.rs @@ -132,7 +132,6 @@ impl SglangSchedulerClient { }; let channel = Channel::from_shared(http_endpoint)? - .timeout(Duration::from_secs(3600)) // 1 hr timeout for connection .http2_keep_alive_interval(Duration::from_secs(30)) .keep_alive_timeout(Duration::from_secs(10)) .keep_alive_while_idle(true) diff --git a/sgl-router/src/protocols/chat.rs b/sgl-router/src/protocols/chat.rs index f81105ec6..cce290dfd 100644 --- a/sgl-router/src/protocols/chat.rs +++ b/sgl-router/src/protocols/chat.rs @@ -496,7 +496,6 @@ impl Normalizable for ChatCompletionRequest { // Migrate deprecated max_tokens → max_completion_tokens #[allow(deprecated)] if self.max_completion_tokens.is_none() && self.max_tokens.is_some() { - tracing::warn!("max_tokens is deprecated, use max_completion_tokens instead"); self.max_completion_tokens = self.max_tokens; self.max_tokens = None; // Clear deprecated field }