Support dispatching logical to physical experts (#6385)

This commit is contained in:
fzyzcjy
2025-05-20 13:13:55 +08:00
committed by GitHub
parent 69af3ec35f
commit e98afbe042
9 changed files with 184 additions and 5 deletions

View File

@@ -80,6 +80,7 @@ from sglang.srt.managers.expert_distribution import (
get_global_expert_distribution_recorder,
)
from sglang.srt.managers.expert_location import ModelConfigForExpertLocation
from sglang.srt.managers.expert_location_dispatch import ExpertLocationDispatchInfo
from sglang.srt.managers.schedule_batch import global_server_args_dict
from sglang.srt.model_executor.forward_batch_info import ForwardBatch, ForwardMode
from sglang.srt.model_loader.weight_utils import default_weight_loader
@@ -113,6 +114,7 @@ if _is_hip:
decode_attention_fwd_grouped_rope,
)
logger = logging.getLogger(__name__)