llava_example.py 1.25 KB
Newer Older
1
2
3
import os
import subprocess

4
from PIL import Image
5
6
7
8

from vllm import LLM

# The assets are located at `s3://air-example-data-2/vllm_opensource_llava/`.
9
# You can use `.buildkite/download-images.sh` to download them
10
11


12
def run_llava():
13
14
15
16
17
18
19
    llm = LLM(
        model="llava-hf/llava-1.5-7b-hf",
        image_token_id=32000,
        image_input_shape="1,3,336,336",
        image_feature_size=576,
    )

20
    prompt = "USER: <image>\nWhat is the content of this image?\nASSISTANT:"
21

22
    image = Image.open("images/stop_sign.jpg")
23
24

    outputs = llm.generate({
25
        "prompt": prompt,
26
27
28
        "multi_modal_data": {
            "image": image
        },
29
    })
30
31
32
33
34
35

    for o in outputs:
        generated_text = o.outputs[0].text
        print(generated_text)


36
37
def main():
    run_llava()
38
39
40
41
42
43
44
45
46
47


if __name__ == "__main__":
    # Download from s3
    s3_bucket_path = "s3://air-example-data-2/vllm_opensource_llava/"
    local_directory = "images"

    # Make sure the local directory exists or create it
    os.makedirs(local_directory, exist_ok=True)

48
49
50
51
52
53
54
55
56
    # Use AWS CLI to sync the directory, assume anonymous access
    subprocess.check_call([
        "aws",
        "s3",
        "sync",
        s3_bucket_path,
        local_directory,
        "--no-sign-request",
    ])
57
    main()