Fix failing test for CRadio (#27738)

Signed-off-by: Eugene Khvedchenia <ekhvedchenia@nvidia.com> Signed-off-by: Cyrus Leung <cyrus.tl.leung@gmail.com> Co-authored-by: Cyrus Leung <tlleungac@connect.ust.hk> Co-authored-by: Cyrus Leung <cyrus.tl.leung@gmail.com> Co-authored-by: gemini-code-assist[bot] <176961590+gemini-code-assist[bot]@users.noreply.github.com> Co-authored-by: wang.yuqi <noooop@126.com>

Fix failing test for CRadio (#27738)
Signed-off-by: Eugene Khvedchenia <ekhvedchenia@nvidia.com> Signed-off-by: Cyrus Leung <cyrus.tl.leung@gmail.com> Co-authored-by: Cyrus Leung <tlleungac@connect.ust.hk> Co-authored-by: Cyrus Leung <cyrus.tl.leung@gmail.com> Co-authored-by: gemini-code-assist[bot] <176961590+gemini-code-assist[bot]@users.noreply.github.com> Co-authored-by: wang.yuqi <noooop@126.com>
827e4237 · Eugene Khvedchenya · GitHub · ca6f755d · 827e4237
Unverified Commit 827e4237 authored Nov 07, 2025 by Eugene Khvedchenya Committed by GitHub Nov 06, 2025
Show whitespace changes
Inline Side-by-side

Showing with 12 additions and 1 deletion

tests/models/multimodal/pooling/test_radio.py tests/models/multimodal/pooling/test_radio.py +12 -1

No files found.
--- a/tests/models/multimodal/pooling/test_radio.py
+++ b/tests/models/multimodal/pooling/test_radio.py
@@ -42,6 +42,10 @@ def run_radio_test(

    config = AutoConfig.from_pretrained(model_id, trust_remote_code=True)

+    # RADIO model on HF does not properly handle torch_dtype argument
+    # And relies on args["dtype"] which we have to patch manually:
+    config.args["dtype"] = torch_dtype
+
    hf_model = AutoModel.from_pretrained(
        model_id,
        config=config,
@@ -50,6 +54,13 @@ def run_radio_test(
    ).to("cuda")
    hf_model.eval()

+    # A HF model has image normalization as a part of model's forward
+    # However in vLLM we don't make normalization a part of the model
+    # forward step since mean/std stored as model's parameters and
+    # subject to precision loss (when using fp16/bf16) which negatively
+    # affects evaluation benchmarks.
+    hf_model.make_preprocessor_external()
+
    hf_outputs_per_image = [
        hf_model(pixel_value.to("cuda")).features for pixel_value in pixel_values
    ]
@@ -78,7 +89,7 @@ def run_radio_test(
        "nvidia/C-RADIOv2-H",
    ],
 )
-@pytest.mark.parametrize("dtype", ["half"])
+@pytest.mark.parametrize("dtype", ["half", "bfloat16"])
 def test_radio(dist_init, image_assets, model_id, dtype: str) -> None:
    run_radio_test(
        image_assets,