fix(typo): correct "replying" to "replaying" in base_attn_backend.py docstring (#4784)

2025-03-26 15:19:12 +08:00
parent 26f07294f1
commit ced35a0649
1 changed file with 1 addition and 1 deletion
--- a/python/sglang/srt/layers/attention/base_attn_backend.py
+++ b/python/sglang/srt/layers/attention/base_attn_backend.py
@@ -47,7 +47,7 @@ class AttentionBackend(ABC):
        spec_info: Optional[Union[EagleDraftInput, EagleVerifyInput]],
        seq_lens_cpu: Optional[torch.Tensor],
    ):
-        """Init the metadata for a forward pass for replying a cuda graph."""
+        """Init the metadata for a forward pass for replaying a cuda graph."""
        raise NotImplementedError()

    def get_cuda_graph_seq_len_fill_value(self):