From 43f80884c59a386402e8870defb5601b1ef4b971 Mon Sep 17 00:00:00 2001 From: Qiaolin Yu Date: Mon, 13 Oct 2025 16:35:50 -0700 Subject: [PATCH] Fix accept rate in speculative decoding metrics (#11572) --- python/sglang/srt/managers/scheduler_metrics_mixin.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/python/sglang/srt/managers/scheduler_metrics_mixin.py b/python/sglang/srt/managers/scheduler_metrics_mixin.py index 521cf3d52..91fff9e9b 100644 --- a/python/sglang/srt/managers/scheduler_metrics_mixin.py +++ b/python/sglang/srt/managers/scheduler_metrics_mixin.py @@ -259,7 +259,7 @@ class SchedulerMetricsMixin: ) # Calculate acceptance rate: accepted tokens / total draft tokens total_draft_tokens = self.spec_num_total_forward_ct * ( - self.server_args.speculative_num_steps or 1 + (self.server_args.speculative_num_steps or 0) + 1 ) spec_accept_rate = ( self.spec_num_total_accepted_tokens / total_draft_tokens