Unverified commit 8df2dc3c, authored by Brittany, committed by GitHub
Browse files

[TPU] Update pallas.py to support trillium (#8871)

parent 6d792d2f
......@@ -130,7 +130,7 @@ class PallasAttentionBackendImpl(AttentionImpl):
assert tpu_type is not None
tpu_type = tpu_type.lower()
-if "lite" not in tpu_type:
+if (("lite" not in tpu_type) and ("v6" not in tpu_type)):
if self.num_kv_heads % 2 == 0:
self.megacore_mode = "kv_head"
else:
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment