# test_flash_falcon.py
import pytest


@pytest.fixture(scope="module")
def flash_falcon_handle(launcher):
    """Launch ``tiiuae/falcon-7b`` and yield the handle the launcher provides.

    ``launcher`` is called with ``trust_remote_code=True`` and its result is
    used as a context manager; the value bound on entry is what dependent
    fixtures and tests receive. The fixture is module-scoped.
    """
    falcon_context = launcher("tiiuae/falcon-7b", trust_remote_code=True)
    with falcon_context as falcon_handle:
        yield falcon_handle


@pytest.fixture(scope="module")
async def flash_falcon(flash_falcon_handle):
    """Wait for the launched model to pass its health check, then return its client.

    Args:
        flash_falcon_handle: Handle yielded by the ``flash_falcon_handle``
            fixture; must expose an awaitable ``health`` method and a
            ``client`` attribute.

    Returns:
        The ``client`` attribute of the handle, used by the tests to issue
        generation requests.
    """
    # NOTE(review): 300 is passed straight to ``health``; presumably a timeout
    # in seconds — confirm against the handle's implementation.
    await flash_falcon_handle.health(300)
    return flash_falcon_handle.client


@pytest.mark.release
@pytest.mark.asyncio
@pytest.mark.private
async def test_flash_falcon(flash_falcon, response_snapshot):
    """Generate 10 new tokens for the Girafatron prompt and compare to the snapshot.

    Only ``max_new_tokens`` and ``decoder_input_details`` are set on the
    request. The test checks that exactly 10 tokens were generated and that
    the whole response equals ``response_snapshot``.
    """
    # The prompt text (including its spelling) must stay byte-identical: the
    # response is compared against a stored snapshot.
    response = await flash_falcon.generate(
        "Girafatron is obsessed with giraffes, the most glorious animal on the face of this Earth. Giraftron believes all other animals are irrelevant when compared to the glorious majesty of the giraffe.\nDaniel: Hello, Girafatron!\nGirafatron:",
        max_new_tokens=10,
        decoder_input_details=True,
    )

    assert response.details.generated_tokens == 10
    assert response == response_snapshot


@pytest.mark.release
@pytest.mark.asyncio
@pytest.mark.private
async def test_flash_falcon_all_params(flash_falcon, response_snapshot):
    """Generate with every request parameter set and compare to the snapshot.

    Sends the Girafatron prompt with explicit values for repetition penalty,
    full-text return, stop sequences, temperature, top-p, top-k, truncation,
    typical-p, watermarking, decoder input details and a fixed ``seed=0``.
    The test checks that exactly 10 tokens were generated and that the whole
    response equals ``response_snapshot``.
    """
    # The prompt text (including its spelling) must stay byte-identical: the
    # response is compared against a stored snapshot.
    response = await flash_falcon.generate(
        "Girafatron is obsessed with giraffes, the most glorious animal on the face of this Earth. Giraftron believes all other animals are irrelevant when compared to the glorious majesty of the giraffe.\nDaniel: Hello, Girafatron!\nGirafatron:",
        max_new_tokens=10,
        repetition_penalty=1.2,
        return_full_text=True,
        stop_sequences=["test"],
        temperature=0.5,
        top_p=0.9,
        top_k=10,
        truncate=5,
        typical_p=0.9,
        watermark=True,
        decoder_input_details=True,
        seed=0,
    )

    assert response.details.generated_tokens == 10
    assert response == response_snapshot


@pytest.mark.release
@pytest.mark.asyncio
@pytest.mark.private
async def test_flash_falcon_load(flash_falcon, generate_load, response_snapshot):
    """Issue the same request four times via ``generate_load`` and compare results.

    The test checks that four responses come back, that every response has
    the same ``generated_text`` as the first one, and that the list of
    responses equals ``response_snapshot``.
    """
    # The prompt text (including its spelling) must stay byte-identical: the
    # responses are compared against a stored snapshot.
    responses = await generate_load(
        flash_falcon,
        "Girafatron is obsessed with giraffes, the most glorious animal on the face of this Earth. Giraftron believes all other animals are irrelevant when compared to the glorious majesty of the giraffe.\nDaniel: Hello, Girafatron!\nGirafatron:",
        max_new_tokens=10,
        n=4,
    )

    assert len(responses) == 4
    # Generator expression: no intermediate list, and all() can stop at the
    # first mismatch.
    assert all(r.generated_text == responses[0].generated_text for r in responses)

    assert responses == response_snapshot