[Quantization] Skip Fp4 Test for `compressed-tensors` (#19217)

aa49f148 · Dipika Sikka · GitHub · 9ef9173c · aa49f148
Unverified commit aa49f148, authored Jun 05, 2025 by Dipika Sikka; committed by GitHub on Jun 05, 2025.
Show whitespace changes
Inline Side-by-side

Showing 1 changed file with 1 addition and 0 deletions

tests/quantization/test_compressed_tensors.py +1 -0

No files found.
--- a/tests/quantization/test_compressed_tensors.py
+++ b/tests/quantization/test_compressed_tensors.py
@@ -651,6 +651,7 @@ def test_compressed_tensors_2of4_sparse_compressed(vllm_runner, args_2of4):
        assert output


+@pytest.mark.skip(reason="Skip until the model config is updated")
 def test_compressed_tensors_nvfp4a16(vllm_runner):
    # run weight only example
    model = "nm-testing/TinyLlama-1.1B-Chat-v1.0-FP4"