"""Example: ask the LLaVA-1.5 model about the content of an image with vLLM."""
import os
import subprocess

4
from PIL import Image
5
6
7
8

from vllm import LLM

# The assets are located at `s3://air-example-data-2/vllm_opensource_llava/`.
# You can use `.buildkite/download-images.sh` to download them.


12
def run_llava() -> None:
    """Ask LLaVA-1.5 what an image contains and print the answer.

    Loads the ``llava-hf/llava-1.5-7b-hf`` model, sends it a single prompt
    together with ``images/stop_sign.jpg`` as multi-modal input, and prints
    the text of the first completion of every returned output.

    The image path is relative to the current working directory, so the
    ``images`` directory must already contain ``stop_sign.jpg``.
    """
    llm = LLM(model="llava-hf/llava-1.5-7b-hf")

    prompt = "USER: <image>\nWhat is the content of this image?\nASSISTANT:"

    # Keep the image open only for the duration of generation so the
    # underlying file handle is released deterministically afterwards.
    with Image.open("images/stop_sign.jpg") as image:
        outputs = llm.generate({
            "prompt": prompt,
            "multi_modal_data": {
                "image": image
            },
        })

    for o in outputs:
        generated_text = o.outputs[0].text
        print(generated_text)


31
32
def main():
    """Script entry point: run the LLaVA image-question example."""
    run_llava()
33
34
35
36
37
38
39
40
41
42


if __name__ == "__main__":
    # Download the example assets from S3 before running the model.
    s3_bucket_path = "s3://air-example-data-2/vllm_opensource_llava/"
    local_directory = "images"

    # Make sure the local directory exists or create it.
    os.makedirs(local_directory, exist_ok=True)

    # Use the AWS CLI to sync the directory; `--no-sign-request` assumes the
    # bucket allows anonymous access. check_call raises CalledProcessError
    # if the sync exits with a non-zero status, so main() is not reached.
    sync_command = [
        "aws",
        "s3",
        "sync",
        s3_bucket_path,
        local_directory,
        "--no-sign-request",
    ]
    subprocess.check_call(sync_command)

    main()