From 9bd4872a343e55df62f00da0cff6d46a9ed9cd3f Mon Sep 17 00:00:00 2001 From: Trevor Morris Date: Mon, 4 Aug 2025 11:08:08 -0700 Subject: [PATCH] [bugfix] Fix typo in modelopt quant: 'FusedMoE' object has no attribute 'local_num_experts' (#8768) --- python/sglang/srt/layers/quantization/modelopt_quant.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/python/sglang/srt/layers/quantization/modelopt_quant.py b/python/sglang/srt/layers/quantization/modelopt_quant.py index 7073f6be5..fca0ee38b 100755 --- a/python/sglang/srt/layers/quantization/modelopt_quant.py +++ b/python/sglang/srt/layers/quantization/modelopt_quant.py @@ -776,7 +776,7 @@ class ModelOptNvFp4FusedMoEMethod(FusedMoEMethodBase): # GEMM 1 w13_weight = ModelWeightParameter( data=torch.empty( - layer.local_num_experts, + layer.num_local_experts, 2 * intermediate_size_per_partition, # 2 fp4 items are packed in the input dimension hidden_size // 2,