Unverified commit aa49f148, authored by Dipika Sikka, committed by GitHub
Browse files

[Quantization] Skip Fp4 Test for `compressed-tensors` (#19217)

parent 9ef9173c
......@@ -651,6 +651,7 @@ def test_compressed_tensors_2of4_sparse_compressed(vllm_runner, args_2of4):
assert output
@pytest.mark.skip(reason="Skip until the model config is updated")
def test_compressed_tensors_nvfp4a16(vllm_runner):
# run weight only example
model = "nm-testing/TinyLlama-1.1B-Chat-v1.0-FP4"
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment