from swarms.agents import MultiModalAgent

# Mapping passed to the MultiModalAgent constructor.
# NOTE(review): presumably maps a tool name to the device it is loaded on
# ("ImageCaptioning" on "cuda") — confirm against the MultiModalAgent docs.
load_dict = {"ImageCaptioning": "cuda"}

node = MultiModalAgent(load_dict)

# Text-only prompt.
text = node.run_text(
    "What is your name? Generate a picture of yourself"
)

# Prompt paired with an image reference.
# NOTE(review): "/image1" looks like a placeholder path — point it at a real
# image before running.
img = node.run_img("/image1", "What is this image about?")

# Combined prompt sent through the chat interface with streaming turned on.
# The two adjacent literals are joined by implicit string concatenation.
chat = node.chat(
    (
        "What is your name? Generate a picture of yourself. What is"
        " this image about?"
    ),
    streaming=True,
)