omni_bot / playground /agents /mm_agent_example.py
WAWAA's picture
Upload folder using huggingface_hub
4962437
raw
history blame
383 Bytes
from swarms.agents import MultiModalAgent
# Example: drive a MultiModalAgent through its text, image, and chat entry points.

# Configuration handed to the agent constructor.
# NOTE(review): presumably maps a tool name to the device it loads on — confirm
# against the MultiModalAgent documentation.
load_dict = {"ImageCaptioning": "cuda"}
node = MultiModalAgent(load_dict)

# Text-only request.
text_prompt = "What is your name? Generate a picture of yourself"
text = node.run_text(text_prompt)

# Image request: the first argument is passed through unchanged
# (presumably an image path — verify), the second is the question about it.
image_path = "/image1"
image_question = "What is this image about?"
img = node.run_img(image_path, image_question)

# Combined prompt sent through the chat interface with streaming enabled.
chat_prompt = (
    "What is your name? Generate a picture of yourself. What is this image about?"
)
chat = node.chat(chat_prompt, streaming=True)