Unverified commit e1ba2356, authored by Morrison Turnansky and committed by GitHub
Browse files

[BugFix] Fix failing test...


[BugFix] Fix failing test quantization/test_compressed_tensors.py::test_compressed_tensors_fp8_block_enabled (#26436)
Signed-off-by: morrison-turnansky <mturnans@redhat.com>
parent b82f4307
@@ -597,7 +597,7 @@ class VllmConfig:
         # https://github.com/vllm-project/vllm/issues/25094
         if has_blocked_weights():
             custom_ops = self.compilation_config.custom_ops
-            if "none" not in custom_ops and "-quant_fp8" not in custom_ops:
+            if "-quant_fp8" not in custom_ops:
                 custom_ops.append("+quant_fp8")
 
     def update_sizes_for_sequence_parallelism(self, possible_sizes: list) -> list:
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment