# SPDX-License-Identifier: Apache-2.0
# SPDX-FileCopyrightText: Copyright contributors to the vLLM project
"""
This test file includes some cases where it is inappropriate to
only get the `eos_token_id` from the tokenizer as defined by
6
{meth}`vllm.LLMEngine._get_eos_token_id`.
7
"""
8

9
10
11
12
13
from vllm.transformers_utils.config import try_get_generation_config
from vllm.transformers_utils.tokenizer import get_tokenizer


def test_get_llama3_eos_token():
    """Compare the tokenizer EOS id with the generation-config EOS ids.

    For this Llama 3.2 checkpoint the tokenizer is expected to report a
    single ``eos_token_id``, while the generation config is expected to
    carry a list of ids that includes the tokenizer's value.
    """
    model_name = "meta-llama/Llama-3.2-1B-Instruct"

    # The tokenizer exposes exactly one EOS id.
    tokenizer = get_tokenizer(model_name)
    assert tokenizer.eos_token_id == 128009

    # The generation config must load and list several EOS ids.
    generation_config = try_get_generation_config(model_name, trust_remote_code=False)
    assert generation_config is not None
    assert generation_config.eos_token_id == [128001, 128008, 128009]


def test_get_blip2_eos_token():
    """Compare the tokenizer EOS id with the generation-config EOS id.

    For this BLIP-2 checkpoint the tokenizer and the generation config are
    expected to report different ``eos_token_id`` values.
    """
    model_name = "Salesforce/blip2-opt-2.7b"

    # EOS id as reported by the tokenizer.
    tokenizer = get_tokenizer(model_name)
    assert tokenizer.eos_token_id == 2

    # The generation config must load and report a different EOS id.
    generation_config = try_get_generation_config(model_name, trust_remote_code=False)
    assert generation_config is not None
    assert generation_config.eos_token_id == 50118