From db7944fb4bf2a3be1370ef022fb9af319b009207 Mon Sep 17 00:00:00 2001 From: Kye Date: Fri, 6 Oct 2023 23:21:04 -0400 Subject: [PATCH] clean up --- swarms/agents/multi_modal_visual_agent.py | 60 ++++++++++------------- swarms/agents/omni_modal_agent.py | 1 + 2 files changed, 28 insertions(+), 33 deletions(-) diff --git a/swarms/agents/multi_modal_visual_agent.py b/swarms/agents/multi_modal_visual_agent.py index e4d005db..b0172431 100644 --- a/swarms/agents/multi_modal_visual_agent.py +++ b/swarms/agents/multi_modal_visual_agent.py @@ -1,54 +1,48 @@ -from swarms.agents.message import Message +import inspect +import math import os import random -import torch -import cv2 import re import uuid -from PIL import Image, ImageDraw, ImageOps, ImageFont -import math -import numpy as np -import inspect -from transformers import ( - pipeline, - BlipProcessor, - BlipForConditionalGeneration, - BlipForQuestionAnswering, -) +import cv2 + +# Grounding DINO +import groundingdino.datasets.transforms as T +import matplotlib.pyplot as plt +import numpy as np +import torch +import wget +from controlnet_aux import HEDdetector, MLSDdetector, OpenposeDetector from diffusers import ( - StableDiffusionPipeline, + ControlNetModel, + EulerAncestralDiscreteScheduler, + StableDiffusionControlNetPipeline, StableDiffusionInpaintPipeline, StableDiffusionInstructPix2PixPipeline, -) -from diffusers import EulerAncestralDiscreteScheduler -from diffusers import ( - StableDiffusionControlNetPipeline, - ControlNetModel, + StableDiffusionPipeline, UniPCMultistepScheduler, ) from diffusers.pipelines.stable_diffusion import StableDiffusionSafetyChecker - -from controlnet_aux import OpenposeDetector, MLSDdetector, HEDdetector - +from groundingdino.models import build_model +from groundingdino.util.slconfig import SLConfig +from groundingdino.util.utils import clean_state_dict, get_phrases_from_posmap from langchain.agents.initialize import initialize_agent from langchain.agents.tools import Tool from langchain.chains.conversation.memory import ConversationBufferMemory from langchain.llms.openai import OpenAI - -# Grounding DINO -import groundingdino.datasets.transforms as T -from groundingdino.models import build_model -from groundingdino.util.slconfig import SLConfig -from groundingdino.util.utils import clean_state_dict, get_phrases_from_posmap +from PIL import Image, ImageDraw, ImageFont, ImageOps # segment anything -from segment_anything import build_sam, SamPredictor, SamAutomaticMaskGenerator -import cv2 -import numpy as np -import matplotlib.pyplot as plt -import wget +from segment_anything import SamAutomaticMaskGenerator, SamPredictor, build_sam +from transformers import ( + BlipForConditionalGeneration, + BlipForQuestionAnswering, + BlipProcessor, + pipeline, +) +from swarms.agents.message import Message # prompts VISUAL_AGENT_PREFIX = """ diff --git a/swarms/agents/omni_modal_agent.py b/swarms/agents/omni_modal_agent.py index bdcb20ec..007a2219 100644 --- a/swarms/agents/omni_modal_agent.py +++ b/swarms/agents/omni_modal_agent.py @@ -12,6 +12,7 @@ from langchain_experimental.autonomous_agents.hugginggpt.task_planner import ( load_chat_planner, ) from transformers import load_tool + from swarms.agents.message import Message