Unverified commit 1237aa19, authored by Lianmin Zheng and committed by GitHub
Browse files

[Auto Sync] Update fused_moe_triton_config.py (20250930) (#11099)


Co-authored-by: github-actions[bot] <github-actions[bot]@users.noreply.github.com>
Co-authored-by: Cheng Wan <54331508+ch-wan@users.noreply.github.com>
parent 59911195
...@@ -51,10 +51,14 @@ def get_moe_configs( ...@@ -51,10 +51,14 @@ def get_moe_configs(
# We found that using the fused_moe_kernel config from Triton 3.1.0 with Triton 3.2.0 results in negative performance gains, # We found that using the fused_moe_kernel config from Triton 3.1.0 with Triton 3.2.0 results in negative performance gains,
# so we also include the Triton version as a key for finding the fused_moe_kernel config to achieve the best performance. # so we also include the Triton version as a key for finding the fused_moe_kernel config to achieve the best performance.
config_dir = os.environ.get(
"SGLANG_MOE_CONFIG_DIR", os.path.dirname(os.path.realpath(__file__))
)
triton_version = triton.__version__ triton_version = triton.__version__
version_dir = f"triton_{triton_version.replace('.', '_')}" version_dir = f"triton_{triton_version.replace('.', '_')}"
config_file_path = os.path.join( config_file_path = os.path.join(
os.path.dirname(os.path.realpath(__file__)), config_dir,
"configs", "configs",
version_dir, version_dir,
json_file_name, json_file_name,
...@@ -75,7 +79,7 @@ def get_moe_configs( ...@@ -75,7 +79,7 @@ def get_moe_configs(
if try_triton_version == triton_version: if try_triton_version == triton_version:
continue continue
try_config_file_path = os.path.join( try_config_file_path = os.path.join(
os.path.dirname(os.path.realpath(__file__)), config_dir,
"configs", "configs",
f"triton_{try_triton_version.replace('.', '_')}", f"triton_{try_triton_version.replace('.', '_')}",
json_file_name, json_file_name,
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment