From ced35a06490ffe4a75dac87648a7da68d84aef4c Mon Sep 17 00:00:00 2001
From: Thysrael <72613958+Thysrael@users.noreply.github.com>
Date: Wed, 26 Mar 2025 15:19:12 +0800
Subject: [PATCH] fix(typo): fix `reply` to `replay` in `base_attn_backend.py`
 (#4784)

---
 python/sglang/srt/layers/attention/base_attn_backend.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/python/sglang/srt/layers/attention/base_attn_backend.py b/python/sglang/srt/layers/attention/base_attn_backend.py
index 8364a82ca..2ad35914a 100644
--- a/python/sglang/srt/layers/attention/base_attn_backend.py
+++ b/python/sglang/srt/layers/attention/base_attn_backend.py
@@ -47,7 +47,7 @@ class AttentionBackend(ABC):
         spec_info: Optional[Union[EagleDraftInput, EagleVerifyInput]],
         seq_lens_cpu: Optional[torch.Tensor],
     ):
-        """Init the metadata for a forward pass for replying a cuda graph."""
+        """Init the metadata for a forward pass for replaying a cuda graph."""
         raise NotImplementedError()
 
     def get_cuda_graph_seq_len_fill_value(self):