[fix]回退test_long_context中限制输入长度修改

9736caa9 · 王敏 · fa57cb7f · 9736caa9
Commit 9736caa9 authored Nov 15, 2024 by 王敏
Hide whitespace changes
Inline Side-by-side

Showing with 0 additions and 6 deletions

tests/lora/test_long_context.py +0 -6

No files found.
--- a/tests/lora/test_long_context.py
+++ b/tests/lora/test_long_context.py
@@ -81,9 +81,6 @@ def generate(
    inputs: Tuple[str, SamplingParams, Optional[LoRARequest]],
 ):
    prompts, sampling_param, lora_request = inputs
-    max_model_len = llm.llm_engine.model_config.max_model_len
-    if len(prompts) >= max_model_len:
-        prompts = prompts[:max_model_len-1]
    outputs = llm.generate(prompts, sampling_param, lora_request=lora_request)
    return outputs[0].outputs[0].text.strip()
@@ -92,11 +89,8 @@ def batched_generate(
    llm: vllm.LLM,
    inputs: List[Tuple[str, SamplingParams, Optional[LoRARequest]]],
 ):
-    max_model_len = llm.llm_engine.model_config.max_model_len
    for input in inputs:
        prompt, sampling_param, lora_req = input
-        if len(prompt) >= max_model_len:
-            prompt = prompt[:max_model_len-1]
        # Add requests to the engine and run the engine
        llm._validate_and_add_requests(prompt,
                                       sampling_param,