Unverified Commit 3102a8e4 authored by MaYongQing's avatar MaYongQing Committed by GitHub
Browse files

fix: vllm lora (#3132)

parent cf631de0
@@ -134,6 +134,7 @@ class VLLM(TemplateLM):
         data_parallel_size: int = 1,
         lora_local_path: str = None,
         enable_thinking: bool = False,
+        max_lora_rank: int = 16,
         **kwargs,
     ):
         super().__init__()
@@ -167,6 +168,8 @@ class VLLM(TemplateLM):
             "quantization": quantization,
             "seed": int(seed),
             "device": str(device),
+            "enable_lora": True if lora_local_path else False,
+            "max_lora_rank": int(max_lora_rank),
         }
         self.model_args.update(kwargs)
         self.batch_size = (
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment