[Auto Sync] Update fused_moe_triton_config.py (20250930) (#11099)

Co-authored-by: github-actions[bot] <github-actions[bot]@users.noreply.github.com>
Co-authored-by: Cheng Wan <54331508+ch-wan@users.noreply.github.com>
This commit is contained in:
Lianmin Zheng
2025-09-30 00:57:16 -07:00
committed by GitHub
parent 5991119541
commit 1237aa19ce

View File

@@ -51,10 +51,14 @@ def get_moe_configs(
# We found that using the fused_moe_kernel config from Triton 3.1.0 with Triton 3.2.0 degrades performance,
# so the Triton version is also used as a key when looking up the fused_moe_kernel config, to get the best performance.
config_dir = os.environ.get(
"SGLANG_MOE_CONFIG_DIR", os.path.dirname(os.path.realpath(__file__))
)
triton_version = triton.__version__
version_dir = f"triton_{triton_version.replace('.', '_')}"
config_file_path = os.path.join(
os.path.dirname(os.path.realpath(__file__)),
config_dir,
"configs",
version_dir,
json_file_name,
@@ -75,7 +79,7 @@ def get_moe_configs(
if try_triton_version == triton_version:
continue
try_config_file_path = os.path.join(
os.path.dirname(os.path.realpath(__file__)),
config_dir,
"configs",
f"triton_{try_triton_version.replace('.', '_')}",
json_file_name,