Update Qwen1.5-7b_single_dcu_inference.py

aa2a1b8c · luopl · 7504ebd1 · aa2a1b8c
Commit aa2a1b8c authored Apr 30, 2024 by luopl
Show whitespace changes
Inline Side-by-side

Showing 1 changed file with 2 additions and 3 deletions

inference/inference_vllm/Qwen1.5-7b_single_dcu_inference.py inference/inference_vllm/Qwen1.5-7b_single_dcu_inference.py +2 -3

No files found.
--- a/inference/inference_vllm/Qwen1.5-7b_single_dcu_inference.py
+++ b/inference/inference_vllm/Qwen1.5-7b_single_dcu_inference.py
 from vllm import LLM, SamplingParams
 # Sample prompts.
 prompts = [
    "The capital of France is",
 ]
 # Create a sampling params object.
-sampling_params = SamplingParams(temperature=0.8, top_p=0.95,top_k=50,stop="</s>")
+sampling_params = SamplingParams(temperature=0.8, top_p=0.95)
 # Create an LLM.
 llm = LLM(model="./qwen2/Qwen1.5-7B-Chat",trust_remote_code=True,dtype="float16", enforce_eager=True)