Former-commit-id: 4ff7d1661e
group-chat
Kye 2 years ago
parent ffb9e50553
commit b4a85eb83e

@ -1,58 +1,45 @@
# coding: utf-8
import argparse
import inspect
import math
import os import os
import gradio as gr
import random import random
import torch
import cv2
import re import re
import uuid import uuid
from PIL import Image, ImageDraw, ImageOps, ImageFont
import cv2 import math
import gradio as gr
import matplotlib.pyplot as plt
import numpy as np import numpy as np
import torch import argparse
import wget import inspect
from controlnet_aux import HEDdetector, MLSDdetector, OpenposeDetector import tempfile
from diffusers import ( from transformers import CLIPSegProcessor, CLIPSegForImageSegmentation
ControlNetModel, from transformers import pipeline, BlipProcessor, BlipForConditionalGeneration, BlipForQuestionAnswering
EulerAncestralDiscreteScheduler, from transformers import AutoImageProcessor, UperNetForSemanticSegmentation
StableDiffusionControlNetPipeline,
StableDiffusionInpaintPipeline, from diffusers import StableDiffusionPipeline, StableDiffusionInpaintPipeline, StableDiffusionInstructPix2PixPipeline
StableDiffusionInstructPix2PixPipeline, from diffusers import EulerAncestralDiscreteScheduler
StableDiffusionPipeline, from diffusers import StableDiffusionControlNetPipeline, ControlNetModel, UniPCMultistepScheduler
UniPCMultistepScheduler,
)
from diffusers.pipelines.stable_diffusion import StableDiffusionSafetyChecker from diffusers.pipelines.stable_diffusion import StableDiffusionSafetyChecker
from controlnet_aux import OpenposeDetector, MLSDdetector, HEDdetector
from langchain.agents.initialize import initialize_agent from langchain.agents.initialize import initialize_agent
from langchain.agents.tools import Tool from langchain.agents.tools import Tool
from langchain.chains.conversation.memory import ConversationBufferMemory from langchain.chains.conversation.memory import ConversationBufferMemory
from langchain.llms.openai import OpenAI from langchain.llms.openai import OpenAI
from PIL import Image, ImageDraw, ImageFont, ImageOps
from transformers import (
BlipForConditionalGeneration,
BlipForQuestionAnswering,
BlipProcessor,
pipeline,
)
# Grounding DINO # Grounding DINO
# import groundingdino.datasets.transforms as T import groundingdino.datasets.transforms as T
from swarms.workers.models import ( from groundingdino.models import build_model
Compose, from groundingdino.util import box_ops
Normalize, from groundingdino.util.slconfig import SLConfig
RandomResize, from groundingdino.util.utils import clean_state_dict, get_phrases_from_posmap
SLConfig,
ToTensor, # segment anything
build_model, from segment_anything import build_sam, SamPredictor, SamAutomaticMaskGenerator
clean_state_dict, import cv2
get_phrases_from_posmap, import numpy as np
) import matplotlib.pyplot as plt
from swarms.workers.models.segment_anything import ( import wget
SamAutomaticMaskGenerator,
SamPredictor,
build_sam,
)
VISUAL_AGENT_PREFIX = """ VISUAL_AGENT_PREFIX = """
Worker Multi-Modal Agent is designed to be able to assist with Worker Multi-Modal Agent is designed to be able to assist with

Loading…
Cancel
Save