Commit 6128f7cf (unverified), authored by Yineng Zhang, committed by GitHub
Browse files

fix: specify dtype with begin_forward aka plan (#2404)

parent a2486eb5
......@@ -678,6 +678,7 @@ class FlashInferIndicesUpdaterPrefill:
self.num_qo_heads,
self.num_kv_heads,
self.head_dim,
q_data_type=self.q_data_type,
)
# cached part
......@@ -691,6 +692,7 @@ class FlashInferIndicesUpdaterPrefill:
self.num_kv_heads,
self.head_dim,
1,
q_data_type=self.q_data_type,
)
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment