PaliGemma Example
Source: the vllm-project/vllm repository.
1from vllm import LLM
2from vllm.assets.image import ImageAsset
3
4
def run_paligemma():
    """Run a single PaliGemma image-plus-text generation and print the result.

    Creates a vLLM ``LLM`` for ``google/paligemma-3b-mix-224``, submits the
    prompt ``"caption es"`` together with the ``stop_sign`` image asset as
    one multi-modal request, and prints the text of the first completion of
    every returned output. Returns nothing.
    """
    engine = LLM(model="google/paligemma-3b-mix-224")

    # NOTE(review): "caption es" is presumably a PaliGemma task prompt asking
    # for a Spanish caption -- confirm against the model card.
    stop_sign_image = ImageAsset("stop_sign").pil_image
    request = {
        "prompt": "caption es",
        "multi_modal_data": {"image": stop_sign_image},
    }

    # Only the first completion of each request output is printed.
    for request_output in engine.generate(request):
        print(request_output.outputs[0].text)
22
23
# Run the example only when this file is executed as a script, so that
# importing the module does not trigger the generation.
if __name__ == "__main__":
    run_paligemma()