Llava Example

Source: vllm-project/vllm.

 1from vllm import LLM
 2from vllm.assets.image import ImageAsset
 3
 4
 5def run_llava():
 6    llm = LLM(model="llava-hf/llava-1.5-7b-hf")
 7
 8    prompt = "USER: <image>\nWhat is the content of this image?\nASSISTANT:"
 9
10    image = ImageAsset("stop_sign").pil_image
11
12    outputs = llm.generate({
13        "prompt": prompt,
14        "multi_modal_data": {
15            "image": image
16        },
17    })
18
19    for o in outputs:
20        generated_text = o.outputs[0].text
21        print(generated_text)
22
23
if __name__ == "__main__":
    # Run the demo only when this file is executed as a script, so importing
    # the module does not trigger model loading.
    run_llava()