Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
OpenDAS
vllm_cscc
Commits
44eef0ca
Unverified
Commit
44eef0ca
Authored Mar 30, 2026 by Louie Tsai; committed by GitHub Mar 31, 2026
Browse files
vLLM Benchmark Suite perf regression after PR#32723 (#38576)
Signed-off-by: louie-tsai <louie.tsai@intel.com>
parent
b9cdc852
Changes
6
Show whitespace changes
Inline
Side-by-side
Showing 6 changed files with 15 additions and 1 deletion
+15
-1
.buildkite/performance-benchmarks/tests/serving-tests-arm64-cpu.json
...performance-benchmarks/tests/serving-tests-arm64-cpu.json
+2
-1
.buildkite/performance-benchmarks/tests/serving-tests-cpu-asr.json
...e/performance-benchmarks/tests/serving-tests-cpu-asr.json
+1
-0
.buildkite/performance-benchmarks/tests/serving-tests-cpu-text.json
.../performance-benchmarks/tests/serving-tests-cpu-text.json
+1
-0
.buildkite/performance-benchmarks/tests/serving-tests-cpu.json
...dkite/performance-benchmarks/tests/serving-tests-cpu.json
+1
-0
.buildkite/performance-benchmarks/tests/serving-tests-hpu.json
...dkite/performance-benchmarks/tests/serving-tests-hpu.json
+6
-0
.buildkite/performance-benchmarks/tests/serving-tests.json
.buildkite/performance-benchmarks/tests/serving-tests.json
+4
-0
No files found.
.buildkite/performance-benchmarks/tests/serving-tests-arm64-cpu.json
View file @
44eef0ca
...
@@ -36,6 +36,7 @@
...
@@ -36,6 +36,7 @@
"model"
:
"meta-llama/Llama-3.1-8B-Instruct"
,
"model"
:
"meta-llama/Llama-3.1-8B-Instruct"
,
"backend"
:
"vllm"
,
"backend"
:
"vllm"
,
"ignore-eos"
:
""
,
"ignore-eos"
:
""
,
"temperature"
:
0
,
"num_prompts"
:
200
"num_prompts"
:
200
}
}
},
},
...
...
.buildkite/performance-benchmarks/tests/serving-tests-cpu-asr.json
View file @
44eef0ca
...
@@ -22,6 +22,7 @@
...
@@ -22,6 +22,7 @@
"hf_split"
:
"test"
,
"hf_split"
:
"test"
,
"no_stream"
:
""
,
"no_stream"
:
""
,
"no_oversample"
:
""
,
"no_oversample"
:
""
,
"temperature"
:
0
,
"num_prompts"
:
200
"num_prompts"
:
200
}
}
},
},
...
...
.buildkite/performance-benchmarks/tests/serving-tests-cpu-text.json
View file @
44eef0ca
...
@@ -26,6 +26,7 @@
...
@@ -26,6 +26,7 @@
"model"
:
"meta-llama/Llama-3.1-8B-Instruct"
,
"model"
:
"meta-llama/Llama-3.1-8B-Instruct"
,
"backend"
:
"vllm"
,
"backend"
:
"vllm"
,
"ignore-eos"
:
""
,
"ignore-eos"
:
""
,
"temperature"
:
0
,
"num_prompts"
:
200
"num_prompts"
:
200
}
}
},
},
...
...
.buildkite/performance-benchmarks/tests/serving-tests-cpu.json
View file @
44eef0ca
...
@@ -26,6 +26,7 @@
...
@@ -26,6 +26,7 @@
"model"
:
"meta-llama/Llama-3.1-8B-Instruct"
,
"model"
:
"meta-llama/Llama-3.1-8B-Instruct"
,
"backend"
:
"vllm"
,
"backend"
:
"vllm"
,
"ignore-eos"
:
""
,
"ignore-eos"
:
""
,
"temperature"
:
0
,
"num_prompts"
:
200
"num_prompts"
:
200
}
}
},
},
...
...
.buildkite/performance-benchmarks/tests/serving-tests-hpu.json
View file @
44eef0ca
...
@@ -21,6 +21,7 @@
...
@@ -21,6 +21,7 @@
"backend"
:
"vllm"
,
"backend"
:
"vllm"
,
"dataset_name"
:
"sharegpt"
,
"dataset_name"
:
"sharegpt"
,
"dataset_path"
:
"./ShareGPT_V3_unfiltered_cleaned_split.json"
,
"dataset_path"
:
"./ShareGPT_V3_unfiltered_cleaned_split.json"
,
"temperature"
:
0
,
"num_prompts"
:
200
"num_prompts"
:
200
}
}
},
},
...
@@ -47,6 +48,7 @@
...
@@ -47,6 +48,7 @@
"backend"
:
"vllm"
,
"backend"
:
"vllm"
,
"dataset_name"
:
"sharegpt"
,
"dataset_name"
:
"sharegpt"
,
"dataset_path"
:
"./ShareGPT_V3_unfiltered_cleaned_split.json"
,
"dataset_path"
:
"./ShareGPT_V3_unfiltered_cleaned_split.json"
,
"temperature"
:
0
,
"num_prompts"
:
200
"num_prompts"
:
200
}
}
},
},
...
@@ -73,6 +75,7 @@
...
@@ -73,6 +75,7 @@
"backend"
:
"vllm"
,
"backend"
:
"vllm"
,
"dataset_name"
:
"sharegpt"
,
"dataset_name"
:
"sharegpt"
,
"dataset_path"
:
"./ShareGPT_V3_unfiltered_cleaned_split.json"
,
"dataset_path"
:
"./ShareGPT_V3_unfiltered_cleaned_split.json"
,
"temperature"
:
0
,
"num_prompts"
:
200
"num_prompts"
:
200
}
}
},
},
...
@@ -100,6 +103,7 @@
...
@@ -100,6 +103,7 @@
"backend"
:
"vllm"
,
"backend"
:
"vllm"
,
"dataset_name"
:
"sharegpt"
,
"dataset_name"
:
"sharegpt"
,
"dataset_path"
:
"./ShareGPT_V3_unfiltered_cleaned_split.json"
,
"dataset_path"
:
"./ShareGPT_V3_unfiltered_cleaned_split.json"
,
"temperature"
:
0
,
"num_prompts"
:
200
"num_prompts"
:
200
}
}
},
},
...
@@ -127,6 +131,7 @@
...
@@ -127,6 +131,7 @@
"backend"
:
"vllm"
,
"backend"
:
"vllm"
,
"dataset_name"
:
"sharegpt"
,
"dataset_name"
:
"sharegpt"
,
"dataset_path"
:
"./ShareGPT_V3_unfiltered_cleaned_split.json"
,
"dataset_path"
:
"./ShareGPT_V3_unfiltered_cleaned_split.json"
,
"temperature"
:
0
,
"num_prompts"
:
200
"num_prompts"
:
200
}
}
},
},
...
@@ -151,6 +156,7 @@
...
@@ -151,6 +156,7 @@
"backend"
:
"vllm"
,
"backend"
:
"vllm"
,
"dataset_name"
:
"sharegpt"
,
"dataset_name"
:
"sharegpt"
,
"dataset_path"
:
"./ShareGPT_V3_unfiltered_cleaned_split.json"
,
"dataset_path"
:
"./ShareGPT_V3_unfiltered_cleaned_split.json"
,
"temperature"
:
0
,
"num_prompts"
:
200
"num_prompts"
:
200
}
}
}
}
...
...
.buildkite/performance-benchmarks/tests/serving-tests.json
View file @
44eef0ca
...
@@ -13,6 +13,7 @@
...
@@ -13,6 +13,7 @@
"backend"
:
"vllm"
,
"backend"
:
"vllm"
,
"dataset_name"
:
"sharegpt"
,
"dataset_name"
:
"sharegpt"
,
"dataset_path"
:
"./ShareGPT_V3_unfiltered_cleaned_split.json"
,
"dataset_path"
:
"./ShareGPT_V3_unfiltered_cleaned_split.json"
,
"temperature"
:
0
,
"num_prompts"
:
200
"num_prompts"
:
200
}
}
},
},
...
@@ -30,6 +31,7 @@
...
@@ -30,6 +31,7 @@
"backend"
:
"vllm"
,
"backend"
:
"vllm"
,
"dataset_name"
:
"sharegpt"
,
"dataset_name"
:
"sharegpt"
,
"dataset_path"
:
"./ShareGPT_V3_unfiltered_cleaned_split.json"
,
"dataset_path"
:
"./ShareGPT_V3_unfiltered_cleaned_split.json"
,
"temperature"
:
0
,
"num_prompts"
:
200
"num_prompts"
:
200
}
}
},
},
...
@@ -47,6 +49,7 @@
...
@@ -47,6 +49,7 @@
"backend"
:
"vllm"
,
"backend"
:
"vllm"
,
"dataset_name"
:
"sharegpt"
,
"dataset_name"
:
"sharegpt"
,
"dataset_path"
:
"./ShareGPT_V3_unfiltered_cleaned_split.json"
,
"dataset_path"
:
"./ShareGPT_V3_unfiltered_cleaned_split.json"
,
"temperature"
:
0
,
"num_prompts"
:
200
"num_prompts"
:
200
}
}
},
},
...
@@ -67,6 +70,7 @@
...
@@ -67,6 +70,7 @@
"backend"
:
"vllm"
,
"backend"
:
"vllm"
,
"dataset_name"
:
"sharegpt"
,
"dataset_name"
:
"sharegpt"
,
"dataset_path"
:
"./ShareGPT_V3_unfiltered_cleaned_split.json"
,
"dataset_path"
:
"./ShareGPT_V3_unfiltered_cleaned_split.json"
,
"temperature"
:
0
,
"num_prompts"
:
200
"num_prompts"
:
200
}
}
}
}
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please register or sign in to comment.