File size: 383 Bytes
4962437
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
from swarms.agents import MultiModalAgent

# Example script: build a MultiModalAgent and call each of its three entry
# points (text, image, chat) once, keeping every result in a module-level name.

# Configuration handed to the agent constructor.
# NOTE(review): presumably maps a tool name to the device it is loaded on
# ("cuda" here) -- confirm against MultiModalAgent.
load_dict = {"ImageCaptioning": "cuda"}
node = MultiModalAgent(load_dict)

# Text-only request.
text = node.run_text(
    "What is your name? Generate a picture of yourself"
)

# Image request: first argument is the image location, second is the question.
# NOTE(review): "/image1" looks like a placeholder path -- verify before running.
img = node.run_img(
    "/image1",
    "What is this image about?",
)

# Combined prompt sent through the chat entry point with streaming enabled.
# The adjacent literals are joined at compile time into a single string.
chat = node.chat(
    "What is your name? Generate a picture of yourself. "
    "What is this image about?",
    streaming=True,
)