Unverified commit 4c54f442, authored by Cheng Wan and committed by GitHub

[deepep] fix: shared experts are not initialized when shared experts fusion is enabled (#5072)

parent 924ca7c9
@@ -183,7 +183,7 @@ class ServerArgs:
     enable_flashmla: bool = False
     flashinfer_mla_disable_ragged: bool = False
     warmups: Optional[str] = None
-    n_share_experts_fusion: Optional[int] = None
+    n_share_experts_fusion: int = 0
     disable_shared_experts_fusion: bool = False
     # Debug tensor dumps
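The field's type changes from `Optional[int]` with a `None` default to a plain `int` defaulting to `0`. A minimal sketch of why an integer sentinel is simpler for consumers of the flag; the function names here are hypothetical illustrations, not SGLang code:

```python
from typing import Optional

def fusion_enabled_optional(n: Optional[int]) -> bool:
    # With a None default, every caller must handle "unset" separately;
    # a bare `n > 0` would raise TypeError when n is None.
    return n is not None and n > 0

def fusion_enabled_int(n: int = 0) -> bool:
    # With 0 as the default, a single comparison covers both "unset"
    # and "fusion disabled".
    return n > 0
```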
@@ -1110,7 +1110,7 @@ class ServerArgs:
         parser.add_argument(
             "--n-share-experts-fusion",
             type=int,
-            default=None,
+            default=0,
             help="The number of shared experts to replicate and fuse with the normal "
             "experts in DeepSeek V3/R1; tp_size is used by default.",
         )
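Per the help text, a value of 0 falls back to `tp_size`. A minimal sketch of that resolution, using a hypothetical helper name (the actual resolution logic in SGLang may differ):

```python
def resolve_n_share_experts_fusion(
    n_share_experts_fusion: int,
    disable_shared_experts_fusion: bool,
    tp_size: int,
) -> int:
    """Hypothetical helper: map the CLI value to an effective fusion count."""
    if disable_shared_experts_fusion:
        # An explicit opt-out wins over any requested replica count.
        return 0
    # 0 means "use the default", which the --help text says is tp_size.
    return n_share_experts_fusion if n_share_experts_fusion > 0 else tp_size
```

With the new default, `resolve_n_share_experts_fusion(0, False, 8)` returns 8, matching the documented tp_size fallback, while `--disable-shared-experts-fusion` still turns the feature off entirely.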