From ced35a06490ffe4a75dac87648a7da68d84aef4c Mon Sep 17 00:00:00 2001 From: Thysrael <72613958+Thysrael@users.noreply.github.com> Date: Wed, 26 Mar 2025 15:19:12 +0800 Subject: [PATCH] fix(typo): fix `reply` to `replay` in `base_attn_backend.py` (#4784) --- python/sglang/srt/layers/attention/base_attn_backend.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/python/sglang/srt/layers/attention/base_attn_backend.py b/python/sglang/srt/layers/attention/base_attn_backend.py index 8364a82ca..2ad35914a 100644 --- a/python/sglang/srt/layers/attention/base_attn_backend.py +++ b/python/sglang/srt/layers/attention/base_attn_backend.py @@ -47,7 +47,7 @@ class AttentionBackend(ABC): spec_info: Optional[Union[EagleDraftInput, EagleVerifyInput]], seq_lens_cpu: Optional[torch.Tensor], ): - """Init the metadata for a forward pass for replying a cuda graph.""" + """Init the metadata for a forward pass for replaying a cuda graph.""" raise NotImplementedError() def get_cuda_graph_seq_len_fill_value(self):