"ssh:/git@developer.sourcefind.cn:2222/OpenDAS/vllm_cscc.git" did not exist on "3249f6cc54fea1f43c4ccb97b2eb702a772a27cd"
Commit 50bed026 authored by zhuwenwen
Browse files

remove redundant shared_output

parent 42b06117
...@@ -206,7 +206,6 @@ class FusedMoEMethodBase(QuantizeMethodBase): ...@@ -206,7 +206,6 @@ class FusedMoEMethodBase(QuantizeMethodBase):
layer: torch.nn.Module, layer: torch.nn.Module,
x: torch.Tensor, x: torch.Tensor,
router_logits: torch.Tensor, router_logits: torch.Tensor,
shared_output: torch.Tensor,
top_k: int, top_k: int,
renormalize: bool, renormalize: bool,
use_grouped_topk: bool = False, use_grouped_topk: bool = False,
...@@ -359,7 +358,6 @@ class UnquantizedFusedMoEMethod(FusedMoEMethodBase, CustomOp): ...@@ -359,7 +358,6 @@ class UnquantizedFusedMoEMethod(FusedMoEMethodBase, CustomOp):
layer: torch.nn.Module, layer: torch.nn.Module,
x: torch.Tensor, x: torch.Tensor,
router_logits: torch.Tensor, router_logits: torch.Tensor,
shared_output: torch.Tensor,
top_k: int, top_k: int,
renormalize: bool, renormalize: bool,
use_grouped_topk: bool = False, use_grouped_topk: bool = False,
...@@ -389,7 +387,6 @@ class UnquantizedFusedMoEMethod(FusedMoEMethodBase, CustomOp): ...@@ -389,7 +387,6 @@ class UnquantizedFusedMoEMethod(FusedMoEMethodBase, CustomOp):
x=x, x=x,
layer=layer, layer=layer,
router_logits=router_logits, router_logits=router_logits,
shared_output=shared_output,
top_k=top_k, top_k=top_k,
renormalize=renormalize, renormalize=renormalize,
use_grouped_topk=use_grouped_topk, use_grouped_topk=use_grouped_topk,
...@@ -414,7 +411,6 @@ class UnquantizedFusedMoEMethod(FusedMoEMethodBase, CustomOp): ...@@ -414,7 +411,6 @@ class UnquantizedFusedMoEMethod(FusedMoEMethodBase, CustomOp):
use_grouped_topk: bool, use_grouped_topk: bool,
top_k: int, top_k: int,
router_logits: torch.Tensor, router_logits: torch.Tensor,
shared_output: torch.Tensor,
renormalize: bool, renormalize: bool,
topk_group: Optional[int] = None, topk_group: Optional[int] = None,
num_expert_group: Optional[int] = None, num_expert_group: Optional[int] = None,
...@@ -1544,7 +1540,6 @@ class FusedMoE(torch.nn.Module): ...@@ -1544,7 +1540,6 @@ class FusedMoE(torch.nn.Module):
layer=self, layer=self,
x=hidden_states, x=hidden_states,
router_logits=router_logits, router_logits=router_logits,
shared_output=shared_output,
top_k=self.top_k, top_k=self.top_k,
renormalize=self.renormalize, renormalize=self.renormalize,
use_grouped_topk=self.use_grouped_topk, use_grouped_topk=self.use_grouped_topk,
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment