@ -1,7 +1,7 @@
from swarms.agents import MultiModalAgent
load_dict = {
"ImageCaptioning": "cudo"
"ImageCaptioning": "cuda"
}
node = MultiModalAgent(load_dict)
@ -1,4 +1,7 @@
from swarms import OmniModalAgent, OpenAIChat
from langchain.
from swarms.agents import OmniModalAgent
llm = OpenAIChat()
@ -3,7 +3,7 @@
#agents
# from swarms.agents.profitpilot import ProfitPilot
from swarms.agents.aot import AoTAgent
from swarms.agents.multi_modal_visual_agent import MultiModalAgent
# from swarms.agents.multi_modal_visual_agent import MultiModalAgent
from swarms.agents.omni_modal_agent import OmniModalAgent