[ROCm][CI] Add large_gpu_mark to test_max_tokens_none for ROCm (#37717)

Signed-off-by: Andreas Karatzas <akaratza@amd.com>

[ROCm][CI] Add large_gpu_mark to test_max_tokens_none for ROCm (#37717)
Signed-off-by: Andreas Karatzas <akaratza@amd.com>
c86b17cf · Andreas Karatzas · GitHub · 66f927f2 · c86b17cf
Unverified commit c86b17cf, authored Mar 21, 2026 by Andreas Karatzas; committed by GitHub on Mar 22, 2026
Hide whitespace changes
Inline Side-by-side

Showing 1 changed file with 14 additions and 2 deletions

tests/test_regression.py +14 -2

No files found.
--- a/tests/test_regression.py
+++ b/tests/test_regression.py
@@ -12,6 +12,7 @@ import gc
 import pytest
 import torch
+from tests.utils import large_gpu_mark
 from vllm import LLM, SamplingParams
 from vllm.platforms import current_platform
@@ -32,10 +33,21 @@ def test_duplicated_ignored_sequence_group():
    assert len(prompts) == len(outputs)
-def test_max_tokens_none():
+@pytest.mark.parametrize(
+    "model",
+    [
+        pytest.param(
+            "distilbert/distilgpt2",
+            marks=[
+                *([large_gpu_mark(min_gb=80)] if current_platform.is_rocm() else []),
+            ],
+        ),
+    ],
+)
+def test_max_tokens_none(model):
    sampling_params = SamplingParams(temperature=0.01, top_p=0.1, max_tokens=None)
    llm = LLM(
-        model="distilbert/distilgpt2",
+        model=model,
        max_num_batched_tokens=4096,
        tensor_parallel_size=1,
    )