diff --git a/sgl-router/src/routers/pd_router.rs b/sgl-router/src/routers/pd_router.rs index 1d0dd3a60..79589ef5d 100644 --- a/sgl-router/src/routers/pd_router.rs +++ b/sgl-router/src/routers/pd_router.rs @@ -886,12 +886,9 @@ impl PDRouter { tokio::spawn(async move { if let Ok(response) = prefill_future.await { - // Consume at most one small chunk with a very short timeout to advance flow control - let _ = tokio::time::timeout(Duration::from_millis(20), async { - let mut s = response.bytes_stream(); - let _ = s.next().await; - }) - .await; + // Consume the entire response body to maintain HTTP compliance + // This runs in the background and won't block the decode response + let _ = response.bytes().await; } });