PaliGemma Example

Source: vllm-project/vllm.

  1. 1from vllm import LLM
  2. 2from vllm.assets.image import ImageAsset
  3. 3
  4. 4
  5. 5def run_paligemma():
  6. 6 llm = LLM(model="google/paligemma-3b-mix-224")
  7. 7
  8. 8 prompt = "caption es"
  9. 9
  10. 10 image = ImageAsset("stop_sign").pil_image
  11. 11
  12. 12 outputs = llm.generate({
  13. 13 "prompt": prompt,
  14. 14 "multi_modal_data": {
  15. 15 "image": image
  16. 16 },
  17. 17 })
  18. 18
  19. 19 for o in outputs:
  20. 20 generated_text = o.outputs[0].text
  21. 21 print(generated_text)
  22. 22
  23. 23
  24. 24if __name__ == "__main__":
  25. 25 run_paligemma()