Commit 5d35160b authored by zhuwenwen
Browse files

update blockwise_int8.py

parent e34d3444
......@@ -139,7 +139,6 @@ class BlockInt8LinearMethod(LinearMethodBase):
assert self.quant_config.weight_block_size is not None
assert self.quant_config.is_checkpoint_int8_serialized
self.tritonsingleton= W8a8GetCacheJSON()
def create_weights(
self,
......@@ -337,6 +336,7 @@ class BlockInt8MoEMethod:
self.quant_config = quant_config
assert self.quant_config.weight_block_size is not None
assert self.quant_config.is_checkpoint_int8_serialized
self.tritonsingleton= W8a8GetCacheJSON()
def create_weights(
self,
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment