conftest.py 537 Bytes
Newer Older
jixx's avatar
init  
jixx committed
1
import pytest
jixx's avatar
jixx committed
2
import os
jixx's avatar
init  
jixx committed
3
4
from text_generation_server.pb import generate_pb2

jixx's avatar
jixx committed
5
6
7
# Set at conftest import time, so the values are in place before any test runs.
# NOTE(review): presumably read by text_generation_server to pick the
# attention backend and enable prefix caching -- confirm against the package.
os.environ.update(
    {
        "PREFIX_CACHING": "1",
        "ATTENTION": "flashinfer",
    }
)

jixx's avatar
init  
jixx committed
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23

@pytest.fixture
def default_pb_parameters():
    """Provide a baseline ``NextTokenChooserParameters`` protobuf message.

    The message is built with temperature, repetition penalty, top-p and
    typical-p all set to 1.0, top-k set to 0, and ``do_sample`` set to False.
    """
    chooser_kwargs = {
        "temperature": 1.0,
        "repetition_penalty": 1.0,
        "top_k": 0,
        "top_p": 1.0,
        "typical_p": 1.0,
        "do_sample": False,
    }
    return generate_pb2.NextTokenChooserParameters(**chooser_kwargs)


@pytest.fixture
def default_pb_stop_parameters():
    """Provide a baseline ``StoppingCriteriaParameters`` protobuf message.

    The message has an empty list of stop sequences and ``max_new_tokens``
    set to 10.
    """
    stopping_criteria = generate_pb2.StoppingCriteriaParameters(
        stop_sequences=[],
        max_new_tokens=10,
    )
    return stopping_criteria