[Auto Sync] Update fused_moe_triton_config.py (20250930) (#11099)
Co-authored-by: github-actions[bot] <github-actions[bot]@users.noreply.github.com>
Co-authored-by: Cheng Wan <54331508+ch-wan@users.noreply.github.com>
This commit is contained in:
@@ -51,10 +51,14 @@ def get_moe_configs(
|
|||||||
|
|
||||||
# We found that using the fused_moe_kernel config from Triton 3.1.0 with Triton 3.2.0 results in negative performance gains,
|
# We found that using the fused_moe_kernel config from Triton 3.1.0 with Triton 3.2.0 results in negative performance gains,
|
||||||
# so we also include the Triton version as a key for finding the fused_moe_kernel config to achieve the best performance.
|
# so we also include the Triton version as a key for finding the fused_moe_kernel config to achieve the best performance.
|
||||||
|
config_dir = os.environ.get(
|
||||||
|
"SGLANG_MOE_CONFIG_DIR", os.path.dirname(os.path.realpath(__file__))
|
||||||
|
)
|
||||||
|
|
||||||
triton_version = triton.__version__
|
triton_version = triton.__version__
|
||||||
version_dir = f"triton_{triton_version.replace('.', '_')}"
|
version_dir = f"triton_{triton_version.replace('.', '_')}"
|
||||||
config_file_path = os.path.join(
|
config_file_path = os.path.join(
|
||||||
os.path.dirname(os.path.realpath(__file__)),
|
config_dir,
|
||||||
"configs",
|
"configs",
|
||||||
version_dir,
|
version_dir,
|
||||||
json_file_name,
|
json_file_name,
|
||||||
@@ -75,7 +79,7 @@ def get_moe_configs(
|
|||||||
if try_triton_version == triton_version:
|
if try_triton_version == triton_version:
|
||||||
continue
|
continue
|
||||||
try_config_file_path = os.path.join(
|
try_config_file_path = os.path.join(
|
||||||
os.path.dirname(os.path.realpath(__file__)),
|
config_dir,
|
||||||
"configs",
|
"configs",
|
||||||
f"triton_{try_triton_version.replace('.', '_')}",
|
f"triton_{try_triton_version.replace('.', '_')}",
|
||||||
json_file_name,
|
json_file_name,
|
||||||
|
|||||||
Reference in New Issue
Block a user