# llava_example.py (526 bytes)
1
from vllm import LLM
2
from vllm.assets.image import ImageAsset
3
4


5
def run_llava() -> None:
    """Run a single image+text prompt through LLaVA-1.5 and print the output.

    Creates an ``LLM`` for ``llava-hf/llava-1.5-7b-hf``, sends one request
    that pairs a fixed text prompt with the ``stop_sign`` image asset, and
    prints the text of the first completion of every returned output.
    """
    llm = LLM(model="llava-hf/llava-1.5-7b-hf")

    # NOTE(review): the "<image>" tag is presumably the slot where the model
    # expects the image; confirm against the model's prompt format.
    prompt = "USER: <image>\nWhat is the content of this image?\nASSISTANT:"

    image = ImageAsset("stop_sign").pil_image

    # One request dict: the text prompt plus the image under
    # "multi_modal_data".
    outputs = llm.generate({
        "prompt": prompt,
        "multi_modal_data": {
            "image": image,
        },
    })

    for o in outputs:
        # Only the first completion of each output is printed.
        generated_text = o.outputs[0].text
        print(generated_text)


# Run the example only when this file is executed as a script.
if __name__ == "__main__":
    run_llava()