From 9bd4872a343e55df62f00da0cff6d46a9ed9cd3f Mon Sep 17 00:00:00 2001
From: Trevor Morris <tmorris@nvidia.com>
Date: Mon, 4 Aug 2025 11:08:08 -0700
Subject: [PATCH] [bugfix] Fix typo in modelopt quant: 'FusedMoE' object has no
 attribute 'local_num_experts' (#8768)

---
 python/sglang/srt/layers/quantization/modelopt_quant.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/python/sglang/srt/layers/quantization/modelopt_quant.py b/python/sglang/srt/layers/quantization/modelopt_quant.py
index 7073f6be5..fca0ee38b 100755
--- a/python/sglang/srt/layers/quantization/modelopt_quant.py
+++ b/python/sglang/srt/layers/quantization/modelopt_quant.py
@@ -776,7 +776,7 @@ class ModelOptNvFp4FusedMoEMethod(FusedMoEMethodBase):
         # GEMM 1
         w13_weight = ModelWeightParameter(
             data=torch.empty(
-                layer.local_num_experts,
+                layer.num_local_experts,
                 2 * intermediate_size_per_partition,
                 # 2 fp4 items are packed in the input dimension
                 hidden_size // 2,