test_get_eos.py 1.37 KB
Newer Older
1
# SPDX-License-Identifier: Apache-2.0
2
3
4
5
6
7
8
"""
This test file includes some cases where it is inappropriate to
only get the `eos_token_id` from the tokenizer as defined by
:meth:`vllm.LLMEngine._get_eos_token_id`.
"""
from vllm.transformers_utils.config import try_get_generation_config
from vllm.transformers_utils.tokenizer import get_tokenizer
9
10
from ..utils import models_path_prefix
import os
11
12
import pytest
from vllm.utils import is_hip
13
14


15
16
@pytest.mark.skipif(is_hip(),
                    reason="Consistent with NV.")
def test_get_llama3_eos_token():
    """Check the EOS ids reported for Meta-Llama-3-8B-Instruct.

    The tokenizer exposes a single ``eos_token_id`` (128009), whereas the
    generation config lists three ids (128001, 128008, 128009), so the
    tokenizer alone does not give the full set of EOS ids for this model.

    The test is skipped whenever ``is_hip()`` returns a truthy value.
    """
    # The checkpoint location is resolved relative to ``models_path_prefix``.
    model_name = os.path.join(models_path_prefix,
                              "meta-llama/Meta-Llama-3-8B-Instruct")

    tokenizer = get_tokenizer(model_name)
    assert tokenizer.eos_token_id == 128009

    generation_config = try_get_generation_config(model_name,
                                                  trust_remote_code=False)
    # A missing generation config would make the comparison below meaningless.
    assert generation_config is not None
    assert generation_config.eos_token_id == [128001, 128008, 128009]
27
28
29


def test_get_blip2_eos_token():
    """Check the EOS ids reported for Salesforce/blip2-opt-2.7b.

    The tokenizer reports ``eos_token_id`` 2 while the generation config
    reports 50118, so the two sources disagree for this model.
    """
    # The checkpoint location is resolved relative to ``models_path_prefix``.
    model_name = os.path.join(models_path_prefix,
                              "Salesforce/blip2-opt-2.7b")

    tokenizer = get_tokenizer(model_name)
    assert tokenizer.eos_token_id == 2

    generation_config = try_get_generation_config(model_name,
                                                  trust_remote_code=False)
    # A missing generation config would make the comparison below meaningless.
    assert generation_config is not None
    assert generation_config.eos_token_id == 50118