File: multimodal-chat.py

package info (click to toggle)

ollama-python 0.5.3-1

links: PTS, VCS
area: main
in suites: forky, sid
size: 376 kB
sloc: python: 3,056; makefile: 5

file content (24 lines) | stat: -rw-r--r-- 500 bytes

from ollama import chat

# from pathlib import Path

# Ask the user for the path to the image
path = input('Please enter the path to the image: ')

# The 'images' entry below can also be given base64 encoded image data:
#   img = base64.b64encode(Path(path).read_bytes()).decode()
# or the raw bytes:
#   img = Path(path).read_bytes()

# A single user message: the question together with the image to inspect
user_message = {
  'role': 'user',
  'content': 'What is in this image? Be concise.',
  'images': [path],
}

response = chat(model='gemma3', messages=[user_message])

# Print the content of the message carried by the response
reply_text = response.message.content
print(reply_text)