Commit b6b6268c (unverified), authored by Yineng Zhang, committed by GitHub
Browse files

Revert "Embedding parallel by attn_tp (#7623)" (#7880)

parent 08702321
......
@@ -1938,7 +1938,7 @@ class DeepseekV2Model(nn.Module):
self.embed_tokens = VocabParallelEmbedding(
config.vocab_size,
config.hidden_size,
-use_attn_tp_group=True,
+enable_tp=not global_server_args_dict["enable_dp_attention"],
)
self.alt_stream = torch.cuda.Stream() if _is_cuda else None
self.layers = nn.ModuleList(
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment