From e3e75a786a5bed2706f8764eaec256d9afd46880 Mon Sep 17 00:00:00 2001 From: Cheng Wan <54331508+ch-wan@users.noreply.github.com> Date: Thu, 14 Aug 2025 23:59:35 -0700 Subject: [PATCH] Fix the deprecation warning for enable_flashinfer_mxfp4_moe (#9214) --- python/sglang/srt/server_args.py | 16 +++++++++++----- 1 file changed, 11 insertions(+), 5 deletions(-) diff --git a/python/sglang/srt/server_args.py b/python/sglang/srt/server_args.py index c4f664872..0edc3ca08 100644 --- a/python/sglang/srt/server_args.py +++ b/python/sglang/srt/server_args.py @@ -290,6 +290,7 @@ class ServerArgs: enable_flashinfer_cutlass_moe: bool = False enable_flashinfer_trtllm_moe: bool = False enable_triton_kernel_moe: bool = False + enable_flashinfer_mxfp4_moe: bool = False def __post_init__(self): # Check deprecated arguments @@ -321,6 +322,11 @@ class ServerArgs: print_deprecated_warning( "NOTE: --enable-flashinfer-trtllm-moe is deprecated. Please set `--moe-runner-backend` to 'flashinfer_trtllm' instead." ) + if self.enable_flashinfer_mxfp4_moe: + self.moe_runner_backend = "flashinfer_mxfp4" + print_deprecated_warning( + "NOTE: --enable-flashinfer-mxfp4-moe is deprecated. Please set `--moe-runner-backend` to 'flashinfer_mxfp4' instead." + ) # Set missing default values if self.tokenizer_path is None: @@ -1851,11 +1857,6 @@ class ServerArgs: action="store_true", help="Enable returning hidden states with responses.", ) - parser.add_argument( - "--enable-flashinfer-mxfp4-moe", - action="store_true", - help="Enable FlashInfer MXFP4 MoE backend for modelopt_fp4 quant on Blackwell.", - ) parser.add_argument( "--scheduler-recv-interval", type=int, @@ -2001,6 +2002,11 @@ class ServerArgs: action="store_true", help="(Deprecated) Use triton moe grouped gemm kernel.", ) + parser.add_argument( + "--enable-flashinfer-mxfp4-moe", + action="store_true", + help="(Deprecated) Enable FlashInfer MXFP4 MoE backend for modelopt_fp4 quant on Blackwell.", + ) @classmethod def from_cli_args(cls, args: argparse.Namespace):