Unverified commit 44eef0ca, authored by Louie Tsai, committed by GitHub
Browse files

vLLM Benchmark Suite perf regression after PR#32723 (#38576)


Signed-off-by: louie-tsai <louie.tsai@intel.com>
parent b9cdc852
...@@ -36,6 +36,7 @@ ...@@ -36,6 +36,7 @@
"model": "meta-llama/Llama-3.1-8B-Instruct", "model": "meta-llama/Llama-3.1-8B-Instruct",
"backend": "vllm", "backend": "vllm",
"ignore-eos": "", "ignore-eos": "",
"temperature": 0,
"num_prompts": 200 "num_prompts": 200
} }
}, },
...@@ -127,4 +128,4 @@ ...@@ -127,4 +128,4 @@
} }
} }
] ]
} }
\ No newline at end of file
...@@ -22,6 +22,7 @@ ...@@ -22,6 +22,7 @@
"hf_split": "test", "hf_split": "test",
"no_stream": "", "no_stream": "",
"no_oversample": "", "no_oversample": "",
"temperature": 0,
"num_prompts": 200 "num_prompts": 200
} }
}, },
......
...@@ -26,6 +26,7 @@ ...@@ -26,6 +26,7 @@
"model": "meta-llama/Llama-3.1-8B-Instruct", "model": "meta-llama/Llama-3.1-8B-Instruct",
"backend": "vllm", "backend": "vllm",
"ignore-eos": "", "ignore-eos": "",
"temperature": 0,
"num_prompts": 200 "num_prompts": 200
} }
}, },
......
...@@ -26,6 +26,7 @@ ...@@ -26,6 +26,7 @@
"model": "meta-llama/Llama-3.1-8B-Instruct", "model": "meta-llama/Llama-3.1-8B-Instruct",
"backend": "vllm", "backend": "vllm",
"ignore-eos": "", "ignore-eos": "",
"temperature": 0,
"num_prompts": 200 "num_prompts": 200
} }
}, },
......
...@@ -21,6 +21,7 @@ ...@@ -21,6 +21,7 @@
"backend": "vllm", "backend": "vllm",
"dataset_name": "sharegpt", "dataset_name": "sharegpt",
"dataset_path": "./ShareGPT_V3_unfiltered_cleaned_split.json", "dataset_path": "./ShareGPT_V3_unfiltered_cleaned_split.json",
"temperature": 0,
"num_prompts": 200 "num_prompts": 200
} }
}, },
...@@ -47,6 +48,7 @@ ...@@ -47,6 +48,7 @@
"backend": "vllm", "backend": "vllm",
"dataset_name": "sharegpt", "dataset_name": "sharegpt",
"dataset_path": "./ShareGPT_V3_unfiltered_cleaned_split.json", "dataset_path": "./ShareGPT_V3_unfiltered_cleaned_split.json",
"temperature": 0,
"num_prompts": 200 "num_prompts": 200
} }
}, },
...@@ -73,6 +75,7 @@ ...@@ -73,6 +75,7 @@
"backend": "vllm", "backend": "vllm",
"dataset_name": "sharegpt", "dataset_name": "sharegpt",
"dataset_path": "./ShareGPT_V3_unfiltered_cleaned_split.json", "dataset_path": "./ShareGPT_V3_unfiltered_cleaned_split.json",
"temperature": 0,
"num_prompts": 200 "num_prompts": 200
} }
}, },
...@@ -100,6 +103,7 @@ ...@@ -100,6 +103,7 @@
"backend": "vllm", "backend": "vllm",
"dataset_name": "sharegpt", "dataset_name": "sharegpt",
"dataset_path": "./ShareGPT_V3_unfiltered_cleaned_split.json", "dataset_path": "./ShareGPT_V3_unfiltered_cleaned_split.json",
"temperature": 0,
"num_prompts": 200 "num_prompts": 200
} }
}, },
...@@ -127,6 +131,7 @@ ...@@ -127,6 +131,7 @@
"backend": "vllm", "backend": "vllm",
"dataset_name": "sharegpt", "dataset_name": "sharegpt",
"dataset_path": "./ShareGPT_V3_unfiltered_cleaned_split.json", "dataset_path": "./ShareGPT_V3_unfiltered_cleaned_split.json",
"temperature": 0,
"num_prompts": 200 "num_prompts": 200
} }
}, },
...@@ -151,6 +156,7 @@ ...@@ -151,6 +156,7 @@
"backend": "vllm", "backend": "vllm",
"dataset_name": "sharegpt", "dataset_name": "sharegpt",
"dataset_path": "./ShareGPT_V3_unfiltered_cleaned_split.json", "dataset_path": "./ShareGPT_V3_unfiltered_cleaned_split.json",
"temperature": 0,
"num_prompts": 200 "num_prompts": 200
} }
} }
......
...@@ -13,6 +13,7 @@ ...@@ -13,6 +13,7 @@
"backend": "vllm", "backend": "vllm",
"dataset_name": "sharegpt", "dataset_name": "sharegpt",
"dataset_path": "./ShareGPT_V3_unfiltered_cleaned_split.json", "dataset_path": "./ShareGPT_V3_unfiltered_cleaned_split.json",
"temperature": 0,
"num_prompts": 200 "num_prompts": 200
} }
}, },
...@@ -30,6 +31,7 @@ ...@@ -30,6 +31,7 @@
"backend": "vllm", "backend": "vllm",
"dataset_name": "sharegpt", "dataset_name": "sharegpt",
"dataset_path": "./ShareGPT_V3_unfiltered_cleaned_split.json", "dataset_path": "./ShareGPT_V3_unfiltered_cleaned_split.json",
"temperature": 0,
"num_prompts": 200 "num_prompts": 200
} }
}, },
...@@ -47,6 +49,7 @@ ...@@ -47,6 +49,7 @@
"backend": "vllm", "backend": "vllm",
"dataset_name": "sharegpt", "dataset_name": "sharegpt",
"dataset_path": "./ShareGPT_V3_unfiltered_cleaned_split.json", "dataset_path": "./ShareGPT_V3_unfiltered_cleaned_split.json",
"temperature": 0,
"num_prompts": 200 "num_prompts": 200
} }
}, },
...@@ -67,6 +70,7 @@ ...@@ -67,6 +70,7 @@
"backend": "vllm", "backend": "vllm",
"dataset_name": "sharegpt", "dataset_name": "sharegpt",
"dataset_path": "./ShareGPT_V3_unfiltered_cleaned_split.json", "dataset_path": "./ShareGPT_V3_unfiltered_cleaned_split.json",
"temperature": 0,
"num_prompts": 200 "num_prompts": 200
} }
} }
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment