From a61962ea9aba437e1ffa95178271197d1dd5e549 Mon Sep 17 00:00:00 2001
From: Kye
Date: Mon, 26 Jun 2023 18:11:01 -0400
Subject: [PATCH] multi-modal agent in swarms

---
 swarms/agents/auto_agent.py | 33 +++++++++++++++++++++++++++++++++
 1 file changed, 33 insertions(+)

diff --git a/swarms/agents/auto_agent.py b/swarms/agents/auto_agent.py
index 5ea7bf55..0c036c75 100644
--- a/swarms/agents/auto_agent.py
+++ b/swarms/agents/auto_agent.py
@@ -37,6 +37,35 @@ from langchain.tools.human.tool import HumanInputRun
 
 
 
+# NOTE(review): this patch targets swarms/agents/auto_agent.py, so the import
+# below makes the module import itself; confirm where MultiModalVisualAgent is
+# actually defined and import it from there.
+from swarms.agents.auto_agent import MultiModalVisualAgent
+
+
+class MultiModalVisualAgentTool(BaseTool):
+    """Tool that forwards a text task to a MultiModalVisualAgent."""
+
+    name = "multi_visual_agent"
+    description = "Multi-Modal Visual agent tool"
+    # Declared as a field: assuming BaseTool is LangChain's pydantic-based
+    # class, attributes that are not declared fields cannot be assigned.
+    agent: MultiModalVisualAgent
+
+    def __init__(self, agent: MultiModalVisualAgent):
+        # Delegate to the base initialiser so the model is set up and
+        # ``agent`` is stored as a validated field.
+        super().__init__(agent=agent)
+
+    def _run(self, text: str) -> str:
+        """Run the multi-modal visual agent on the given task text."""
+        return self.agent.run_text(text)
+
+    async def _arun(self, text: str) -> str:
+        """Async execution is not implemented for this tool."""
+        # Presumably required: LangChain releases of this period declare
+        # ``_arun`` abstract on BaseTool -- TODO confirm against pinned version.
+        raise NotImplementedError("multi_visual_agent does not support async")
 
 
 
@@ -156,6 +185,10 @@ query_website_tool = WebpageQATool(qa_chain=load_qa_with_sources_chain(llm))
 
 # !pip install duckduckgo_search
 web_search = DuckDuckGoSearchRun()
+multimodal_agent = MultiModalVisualAgent()
+
+# Wrap the agent instance (not the class) so the tool can call run_text on it.
+multimodal_agent_tool = MultiModalVisualAgentTool(multimodal_agent)
 
 tools = [
     web_search,