[doc] add a note for --n-share-experts-fusion args (#6154)

9f2c9568 · Xiaoyu Zhang · GitHub · 3f2702ae · 9f2c9568
Unverified Commit 9f2c9568 authored May 12, 2025 by Xiaoyu Zhang Committed by GitHub May 11, 2025
Hide whitespace changes
Inline Side-by-side

Showing with 1 addition and 1 deletion

python/sglang/srt/server_args.py python/sglang/srt/server_args.py +1 -1

No files found.
--- a/python/sglang/srt/server_args.py
+++ b/python/sglang/srt/server_args.py
@@ -1194,7 +1194,7 @@ class ServerArgs:
            type=int,
            default=0,
            help="The number of shared_experts need to be replicated to fuse with normal experts in deepseek v3/r1, "
-            "set it to tp_size can get best optimized performance.",
+            "setting it to tp_size gives the best performance. Note that on architectures with SM == 90, the shared experts fusion optimization is enabled by default for DeepSeek V3/R1, with n_share_experts_fusion automatically set to the TP size.",
        )
        parser.add_argument(
            "--disable-chunked-prefix-cache",