Unverified commit 8d2d876f, authored by Ying Sheng and committed by GitHub
Browse files

[Fix] fix the typo bug for window attention (#1106)

parent 326df4ba
...@@ -337,7 +337,7 @@ class ModelRunner: ...@@ -337,7 +337,7 @@ class ModelRunner:
use_tensor_cores=use_tensor_cores, use_tensor_cores=use_tensor_cores,
) )
else: else:
self.flashinfer_workspace_buffers = torch.empty( self.flashinfer_workspace_buffer = torch.empty(
global_config.flashinfer_workspace_size, global_config.flashinfer_workspace_size,
dtype=torch.uint8, dtype=torch.uint8,
device="cuda", device="cuda",
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment