"src/vscode:/vscode.git/clone" did not exist on "6e8e1ed77a7da38a807f0bdb2bc2b70ae62c0c59"
Unverified commit 2a206b22, authored by Kyungmin Lee and committed by GitHub
Browse files

Fix RotaryEmbedding when using Triton backend for EXAONE-3.5-2.4B (#4064)

parent 4d253057
...@@ -148,7 +148,7 @@ class RotaryEmbedding(CustomOp): ...@@ -148,7 +148,7 @@ class RotaryEmbedding(CustomOp):
key: torch.Tensor, key: torch.Tensor,
offsets: Optional[torch.Tensor] = None, offsets: Optional[torch.Tensor] = None,
) -> Tuple[torch.Tensor, torch.Tensor]: ) -> Tuple[torch.Tensor, torch.Tensor]:
if _is_cuda_available: if _is_cuda_available and (self.head_size in [64, 128, 256, 512]):
apply_rope_with_cos_sin_cache_inplace( apply_rope_with_cos_sin_cache_inplace(
positions=positions, positions=positions,
query=query, query=query,
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment