"docs/git@developer.sourcefind.cn:OpenDAS/fairscale.git" did not exist on "ad611a34bd25a836b1191f5356aa849646362146"
Commit 47e4d923 authored by maxiao1
Browse files

Merge branch 'v0.5.4_dev_qwennext' into 'v0.5.4_dev'

适配qwen3-next

See merge request OpenDAS/sglang!4
parents 0fbecc43 477fddf2
...@@ -396,7 +396,7 @@ class Qwen3GatedDeltaNet(nn.Module): ...@@ -396,7 +396,7 @@ class Qwen3GatedDeltaNet(nn.Module):
def _forward_input_proj(self, hidden_states: torch.Tensor): def _forward_input_proj(self, hidden_states: torch.Tensor):
DUAL_STREAM_TOKEN_THRESHOLD = 1024 if not _is_npu else 0 DUAL_STREAM_TOKEN_THRESHOLD = 1024 if not _is_npu else 0
seq_len, _ = hidden_states.shape seq_len, _ = hidden_states.shape
if seq_len < DUAL_STREAM_TOKEN_THRESHOLD: if seq_len < DUAL_STREAM_TOKEN_THRESHOLD and self.alt_stream is not None:
current_stream = torch.cuda.current_stream() current_stream = torch.cuda.current_stream()
self.alt_stream.wait_stream(current_stream) self.alt_stream.wait_stream(current_stream)
projected_states_qkvz, _ = self.in_proj_qkvz(hidden_states) projected_states_qkvz, _ = self.in_proj_qkvz(hidden_states)
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment