Unverified commit e39dc46f, authored by wang.yuqi and committed by GitHub
Browse files

[CI] Pooling models mteb test disable enforce_eager (#26408)


Signed-off-by: wang.yuqi <noooop@126.com>
parent 10c75b54
...@@ -51,7 +51,6 @@ def wikitext_ppl_test( ...@@ -51,7 +51,6 @@ def wikitext_ppl_test(
gpu_memory_utilization=0.7, gpu_memory_utilization=0.7,
max_model_len=max_length, max_model_len=max_length,
max_num_seqs=1, max_num_seqs=1,
enforce_eager=True,
**vllm_extra_kwargs, **vllm_extra_kwargs,
) as vllm_model: ) as vllm_model:
# Use max_num_seqs=1 to avoid OOM, # Use max_num_seqs=1 to avoid OOM,
......
...@@ -192,7 +192,6 @@ def mteb_test_embed_models( ...@@ -192,7 +192,6 @@ def mteb_test_embed_models(
model_info.name, model_info.name,
runner="pooling", runner="pooling",
max_model_len=None, max_model_len=None,
enforce_eager=True,
**vllm_extra_kwargs, **vllm_extra_kwargs,
) as vllm_model: ) as vllm_model:
model_config = vllm_model.llm.llm_engine.model_config model_config = vllm_model.llm.llm_engine.model_config
...@@ -349,7 +348,6 @@ def mteb_test_rerank_models( ...@@ -349,7 +348,6 @@ def mteb_test_rerank_models(
runner="pooling", runner="pooling",
max_model_len=None, max_model_len=None,
max_num_seqs=8, max_num_seqs=8,
enforce_eager=True,
**vllm_extra_kwargs, **vllm_extra_kwargs,
) as vllm_model: ) as vllm_model:
model_config = vllm_model.llm.llm_engine.model_config model_config = vllm_model.llm.llm_engine.model_config
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment