"vscode:/vscode.git/clone" did not exist on "c413c41cda0f9359e7a12bb674c0f87bf41798c5"
Unverified Commit 01c16ede authored by Michael Goin's avatar Michael Goin Committed by GitHub
Browse files

[CI] Add smoke test for non-uniform AutoFP8 quantization (#6702)

parent 72fc7048
...@@ -13,6 +13,7 @@ from vllm.model_executor.layers.quantization.fp8 import (Fp8KVCacheMethod, ...@@ -13,6 +13,7 @@ from vllm.model_executor.layers.quantization.fp8 import (Fp8KVCacheMethod,
MODELS = [ MODELS = [
"neuralmagic/Meta-Llama-3-8B-Instruct-FP8-KV", "neuralmagic/Meta-Llama-3-8B-Instruct-FP8-KV",
"nm-testing/Phi-3-mini-128k-instruct-FP8", "nm-testing/Phi-3-mini-128k-instruct-FP8",
"nm-testing/Qwen2-0.5B-Instruct-FP8-SkipQKV",
] ]
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment