Clean up code for speculative attention mode (#10149)

This commit is contained in:
Baizhou Zhang
2025-09-08 17:38:06 -07:00
committed by GitHub
parent 148022fc36
commit 8ad700f735
7 changed files with 14 additions and 35 deletions

View File

@@ -98,7 +98,7 @@ GLOBAL_SERVER_ARGS_KEYS = [
 "sampling_backend",
 "speculative_accept_threshold_single",
 "speculative_accept_threshold_acc",
-"speculative_attention_backend",
+"speculative_attention_mode",
 "torchao_config",
 "triton_attention_reduce_in_fp32",
 "num_reserved_decode_tokens",