commit fb0cfaefb4
@@ -1,11 +1,3 @@
-from swarms.memory.pinecone import PineconeVector
-from swarms.memory.base import BaseVectorStore
-from swarms.memory.pg import PgVectorVectorStore
-from swarms.memory.ocean import OceanDB
-
-__all__ = [
-    "BaseVectorStore",
-    "PineconeVector",
-    "PgVectorVectorStore",
-    "OceanDB",
-]
+# from swarms.memory.pinecone import PineconeVector
+# from swarms.memory.base import BaseVectorStore
+# from swarms.memory.pg import PgVectorVectorStore
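Editor's note: the hunk above disables the memory backends by commenting out the imports wholesale. A gentler pattern, sketched below purely as an assumption about intent (it is not what the commit does), is to guard each import so the package still loads when a backend's dependency is missing:

```python
# Hypothetical sketch only: keep memory backends optional instead of
# commenting them out. Mirrors the modules removed in the hunk above.
__all__ = []

try:
    from swarms.memory.pinecone import PineconeVector  # needs pinecone client
    __all__.append("PineconeVector")
except ImportError:
    PineconeVector = None  # backend unavailable; callers must check for None

try:
    from swarms.memory.pg import PgVectorVectorStore  # needs a postgres driver
    __all__.append("PgVectorVectorStore")
except ImportError:
    PgVectorVectorStore = None
```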
@@ -1,177 +0,0 @@
-import uuid
-from abc import ABC
-from typing import Any, Dict, List, Optional
-
-from swarms.memory.schemas import Artifact, Status
-from swarms.memory.schemas import Step as APIStep
-from swarms.memory.schemas import Task as APITask
-
-
-class Step(APIStep):
-    additional_properties: Optional[Dict[str, str]] = None
-
-
-class Task(APITask):
-    steps: List[Step] = []
-
-
-class NotFoundException(Exception):
-    """
-    Exception raised when a resource is not found.
-    """
-
-    def __init__(self, item_name: str, item_id: str):
-        self.item_name = item_name
-        self.item_id = item_id
-        super().__init__(f"{item_name} with {item_id} not found.")
-
-
-class TaskDB(ABC):
-    async def create_task(
-        self,
-        input: Optional[str],
-        additional_input: Any = None,
-        artifacts: Optional[List[Artifact]] = None,
-        steps: Optional[List[Step]] = None,
-    ) -> Task:
-        raise NotImplementedError
-
-    async def create_step(
-        self,
-        task_id: str,
-        name: Optional[str] = None,
-        input: Optional[str] = None,
-        is_last: bool = False,
-        additional_properties: Optional[Dict[str, str]] = None,
-    ) -> Step:
-        raise NotImplementedError
-
-    async def create_artifact(
-        self,
-        task_id: str,
-        file_name: str,
-        relative_path: Optional[str] = None,
-        step_id: Optional[str] = None,
-    ) -> Artifact:
-        raise NotImplementedError
-
-    async def get_task(self, task_id: str) -> Task:
-        raise NotImplementedError
-
-    async def get_step(self, task_id: str, step_id: str) -> Step:
-        raise NotImplementedError
-
-    async def get_artifact(self, task_id: str, artifact_id: str) -> Artifact:
-        raise NotImplementedError
-
-    async def list_tasks(self) -> List[Task]:
-        raise NotImplementedError
-
-    async def list_steps(
-        self, task_id: str, status: Optional[Status] = None
-    ) -> List[Step]:
-        raise NotImplementedError
-
-
-class InMemoryTaskDB(TaskDB):
-    _tasks: Dict[str, Task] = {}
-
-    async def create_task(
-        self,
-        input: Optional[str],
-        additional_input: Any = None,
-        artifacts: Optional[List[Artifact]] = None,
-        steps: Optional[List[Step]] = None,
-    ) -> Task:
-        if not steps:
-            steps = []
-        if not artifacts:
-            artifacts = []
-        task_id = str(uuid.uuid4())
-        task = Task(
-            task_id=task_id,
-            input=input,
-            steps=steps,
-            artifacts=artifacts,
-            additional_input=additional_input,
-        )
-        self._tasks[task_id] = task
-        return task
-
-    async def create_step(
-        self,
-        task_id: str,
-        name: Optional[str] = None,
-        input: Optional[str] = None,
-        is_last=False,
-        additional_properties: Optional[Dict[str, Any]] = None,
-    ) -> Step:
-        step_id = str(uuid.uuid4())
-        step = Step(
-            task_id=task_id,
-            step_id=step_id,
-            name=name,
-            input=input,
-            status=Status.created,
-            is_last=is_last,
-            additional_properties=additional_properties,
-        )
-        task = await self.get_task(task_id)
-        task.steps.append(step)
-        return step
-
-    async def get_task(self, task_id: str) -> Task:
-        task = self._tasks.get(task_id, None)
-        if not task:
-            raise NotFoundException("Task", task_id)
-        return task
-
-    async def get_step(self, task_id: str, step_id: str) -> Step:
-        task = await self.get_task(task_id)
-        # Match on step_id; the code as committed compared s.task_id == task_id,
-        # which returns the first step regardless of the requested id.
-        step = next(filter(lambda s: s.step_id == step_id, task.steps), None)
-        if not step:
-            raise NotFoundException("Step", step_id)
-        return step
-
-    async def get_artifact(self, task_id: str, artifact_id: str) -> Artifact:
-        task = await self.get_task(task_id)
-        artifact = next(
-            filter(lambda a: a.artifact_id == artifact_id, task.artifacts), None
-        )
-        if not artifact:
-            raise NotFoundException("Artifact", artifact_id)
-        return artifact
-
-    async def create_artifact(
-        self,
-        task_id: str,
-        file_name: str,
-        relative_path: Optional[str] = None,
-        step_id: Optional[str] = None,
-    ) -> Artifact:
-        artifact_id = str(uuid.uuid4())
-        artifact = Artifact(
-            artifact_id=artifact_id,
-            file_name=file_name,
-            relative_path=relative_path,
-        )
-        task = await self.get_task(task_id)
-        task.artifacts.append(artifact)
-
-        if step_id:
-            step = await self.get_step(task_id, step_id)
-            step.artifacts.append(artifact)
-
-        return artifact
-
-    async def list_tasks(self) -> List[Task]:
-        return list(self._tasks.values())
-
-    async def list_steps(
-        self, task_id: str, status: Optional[Status] = None
-    ) -> List[Step]:
-        task = await self.get_task(task_id)
-        steps = task.steps
-        if status:
-            steps = list(filter(lambda s: s.status == status, steps))
-        return steps
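For context on the file deleted above, a minimal usage sketch of `InMemoryTaskDB` as it stood before this commit. It assumes the agent-protocol schemas in `swarms.memory.schemas` accept the fields shown; the driver itself is illustrative only:

```python
import asyncio

# Hypothetical driver for the removed InMemoryTaskDB; assumes the class and
# its schemas were importable at the commit's parent.
async def main():
    db = InMemoryTaskDB()
    task = await db.create_task(input="summarize the report")
    step = await db.create_step(task.task_id, name="draft", is_last=True)
    steps = await db.list_steps(task.task_id)
    assert steps[0].step_id == step.step_id  # round-trips through the dict store

asyncio.run(main())
```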
@@ -1,157 +0,0 @@
-import logging
-from typing import List
-
-import oceandb
-from oceandb.utils.embedding_function import MultiModalEmbeddingFunction
-
-
-class OceanDB:
-    """
-    A class to interact with OceanDB.
-
-    ...
-
-    Attributes
-    ----------
-    client : oceandb.Client
-        a client to interact with OceanDB
-
-    Methods
-    -------
-    create_collection(collection_name: str, modality: str):
-        Creates a new collection in OceanDB.
-    append_document(collection, document: str, id: str):
-        Appends a document to a collection in OceanDB.
-    add_documents(collection, documents: List[str], ids: List[str]):
-        Adds multiple documents to a collection in OceanDB.
-    query(collection, query_texts: List[str], n_results: int):
-        Queries a collection in OceanDB.
-    """
-
-    def __init__(self, client: oceandb.Client = None):
-        """
-        Constructs all the necessary attributes for the OceanDB object.
-
-        Parameters
-        ----------
-        client : oceandb.Client, optional
-            a client to interact with OceanDB (default is None, which creates a new client)
-        """
-        try:
-            self.client = client if client else oceandb.Client()
-            print(self.client.heartbeat())
-        except Exception as e:
-            logging.error(f"Failed to initialize OceanDB client. Error: {e}")
-            raise
-
-    def create_collection(self, collection_name: str, modality: str):
-        """
-        Creates a new collection in OceanDB.
-
-        Parameters
-        ----------
-        collection_name : str
-            the name of the new collection
-        modality : str
-            the modality of the new collection
-
-        Returns
-        -------
-        collection
-            the created collection
-        """
-        try:
-            embedding_function = MultiModalEmbeddingFunction(modality=modality)
-            collection = self.client.create_collection(
-                collection_name, embedding_function=embedding_function
-            )
-            return collection
-        except Exception as e:
-            logging.error(f"Failed to create collection. Error: {e}")
-            raise
-
-    def append_document(self, collection, document: str, id: str):
-        """
-        Appends a document to a collection in OceanDB.
-
-        Parameters
-        ----------
-        collection
-            the collection to append the document to
-        document : str
-            the document to append
-        id : str
-            the id of the document
-
-        Returns
-        -------
-        result
-            the result of the append operation
-        """
-        try:
-            return collection.add(documents=[document], ids=[id])
-        except Exception as e:
-            logging.error(
-                f"Failed to append document to the collection. Error: {e}"
-            )
-            raise
-
-    def add_documents(self, collection, documents: List[str], ids: List[str]):
-        """
-        Adds multiple documents to a collection in OceanDB.
-
-        Parameters
-        ----------
-        collection
-            the collection to add the documents to
-        documents : List[str]
-            the documents to add
-        ids : List[str]
-            the ids of the documents
-
-        Returns
-        -------
-        result
-            the result of the add operation
-        """
-        try:
-            return collection.add(documents=documents, ids=ids)
-        except Exception as e:
-            logging.error(f"Failed to add documents to collection. Error: {e}")
-            raise
-
-    def query(self, collection, query_texts: List[str], n_results: int):
-        """
-        Queries a collection in OceanDB.
-
-        Parameters
-        ----------
-        collection
-            the collection to query
-        query_texts : List[str]
-            the texts to query
-        n_results : int
-            the number of results to return
-
-        Returns
-        -------
-        results
-            the results of the query
-        """
-        try:
-            results = collection.query(
-                query_texts=query_texts, n_results=n_results
-            )
-            return results
-        except Exception as e:
-            logging.error(f"Failed to query the collection. Error: {e}")
-            raise
-
-
-# Example
-# ocean = OceanDB()
-# collection = ocean.create_collection("test", "text")
-# ocean.append_document(collection, "hello world", "1")
-# ocean.add_documents(collection, ["hello world", "hello world"], ["2", "3"])
-# results = ocean.query(collection, ["hello world"], 3)
-# print(results)
@@ -0,0 +1,291 @@
+import cv2
+import numpy as np
+from PIL import Image
+from transformers import SamImageProcessor, SamModel, SamProcessor, pipeline
+
+try:
+    import cv2
+    import supervision as sv
+except ImportError:
+    print("Please install supervision and opencv-python")
+
+
+from enum import Enum
+
+
+class FeatureType(Enum):
+    """
+    An enumeration to represent the types of features for mask adjustment in image
+    segmentation.
+    """
+
+    ISLAND = "ISLAND"
+    HOLE = "HOLE"
+
+    @classmethod
+    def list(cls):
+        return list(map(lambda c: c.value, cls))
+
+
+def compute_mask_iou_vectorized(masks: np.ndarray) -> np.ndarray:
+    """
+    Vectorized computation of the Intersection over Union (IoU) for all pairs of masks.
+
+    Parameters:
+        masks (np.ndarray): A 3D numpy array with shape `(N, H, W)`, where `N` is the
+            number of masks, `H` is the height, and `W` is the width.
+
+    Returns:
+        np.ndarray: A 2D numpy array of shape `(N, N)` where each element `[i, j]` is
+            the IoU between masks `i` and `j`.
+
+    Raises:
+        ValueError: If any of the masks is found to be empty.
+    """
+    if np.any(masks.sum(axis=(1, 2)) == 0):
+        raise ValueError(
+            "One or more masks are empty. Please filter out empty masks before"
+            " using the `compute_mask_iou_vectorized` function."
+        )
+
+    masks_bool = masks.astype(bool)
+    masks_flat = masks_bool.reshape(masks.shape[0], -1)
+    intersection = np.logical_and(masks_flat[:, None], masks_flat[None, :]).sum(
+        axis=2
+    )
+    union = np.logical_or(masks_flat[:, None], masks_flat[None, :]).sum(axis=2)
+    iou_matrix = intersection / union
+    return iou_matrix
+
+
+def mask_non_max_suppression(
+    masks: np.ndarray, iou_threshold: float = 0.6
+) -> np.ndarray:
+    """
+    Performs Non-Max Suppression on a set of masks by prioritizing larger masks and
+    removing smaller masks that overlap significantly.
+
+    When the IoU between two masks exceeds the specified threshold, the smaller mask
+    (in terms of area) is discarded. This process is repeated for each pair of masks,
+    effectively filtering out masks that are significantly overlapped by larger ones.
+
+    Parameters:
+        masks (np.ndarray): A 3D numpy array with shape `(N, H, W)`, where `N` is the
+            number of masks, `H` is the height, and `W` is the width.
+        iou_threshold (float): The IoU threshold for determining significant overlap.
+
+    Returns:
+        np.ndarray: A 3D numpy array of filtered masks.
+    """
+    num_masks = masks.shape[0]
+    areas = masks.sum(axis=(1, 2))
+    sorted_idx = np.argsort(-areas)
+    keep_mask = np.ones(num_masks, dtype=bool)
+    iou_matrix = compute_mask_iou_vectorized(masks)
+    for i in range(num_masks):
+        if not keep_mask[sorted_idx[i]]:
+            continue
+
+        overlapping_masks = iou_matrix[sorted_idx[i]] > iou_threshold
+        overlapping_masks[sorted_idx[i]] = False
+        # Suppress overlapped masks in original index order; the committed code
+        # mixed sorted and unsorted indexing here, suppressing the wrong masks.
+        keep_mask = np.logical_and(keep_mask, ~overlapping_masks)
+
+    return masks[keep_mask]
+
+
+def filter_masks_by_relative_area(
+    masks: np.ndarray, minimum_area: float = 0.01, maximum_area: float = 1.0
+) -> np.ndarray:
+    """
+    Filters masks based on their relative area within the total area of the image.
+
+    Parameters:
+        masks (np.ndarray): A 3D numpy array with shape `(N, H, W)`, where `N` is the
+            number of masks, `H` is the height, and `W` is the width.
+        minimum_area (float): The minimum relative area threshold. Must be between `0`
+            and `1`.
+        maximum_area (float): The maximum relative area threshold. Must be between `0`
+            and `1`.
+
+    Returns:
+        np.ndarray: A 3D numpy array containing masks that fall within the specified
+            relative area range.
+
+    Raises:
+        ValueError: If `minimum_area` or `maximum_area` are outside the `0` to `1`
+            range, or if `minimum_area` is greater than `maximum_area`.
+    """
+
+    if not (isinstance(masks, np.ndarray) and masks.ndim == 3):
+        raise ValueError("Input must be a 3D numpy array.")
+
+    if not (0 <= minimum_area <= 1) or not (0 <= maximum_area <= 1):
+        raise ValueError(
+            "`minimum_area` and `maximum_area` must be between 0 and 1."
+        )
+
+    if minimum_area > maximum_area:
+        raise ValueError(
+            "`minimum_area` must be less than or equal to `maximum_area`."
+        )
+
+    total_area = masks.shape[1] * masks.shape[2]
+    relative_areas = masks.sum(axis=(1, 2)) / total_area
+    return masks[
+        (relative_areas >= minimum_area) & (relative_areas <= maximum_area)
+    ]
+
+
+def adjust_mask_features_by_relative_area(
+    mask: np.ndarray,
+    area_threshold: float,
+    feature_type: FeatureType = FeatureType.ISLAND,
+) -> np.ndarray:
+    """
+    Adjusts a mask by removing small islands or filling small holes based on a relative
+    area threshold.
+
+    !!! warning
+
+        Running this function on a mask with small islands may result in empty masks.
+
+    Parameters:
+        mask (np.ndarray): A 2D numpy array with shape `(H, W)`, where `H` is the
+            height, and `W` is the width.
+        area_threshold (float): Threshold for relative area to remove or fill features.
+        feature_type (FeatureType): Type of feature to adjust (`ISLAND` for removing
+            islands, `HOLE` for filling holes).
+
+    Returns:
+        np.ndarray: A 2D numpy array containing the adjusted mask.
+    """
+    height, width = mask.shape
+    total_area = width * height
+
+    mask = np.uint8(mask * 255)
+    operation = (
+        cv2.RETR_EXTERNAL
+        if feature_type == FeatureType.ISLAND
+        else cv2.RETR_CCOMP
+    )
+    contours, _ = cv2.findContours(mask, operation, cv2.CHAIN_APPROX_SIMPLE)
+
+    for contour in contours:
+        area = cv2.contourArea(contour)
+        relative_area = area / total_area
+        if relative_area < area_threshold:
+            cv2.drawContours(
+                image=mask,
+                contours=[contour],
+                contourIdx=-1,
+                color=(0 if feature_type == FeatureType.ISLAND else 255),
+                thickness=-1,
+            )
+    return np.where(mask > 0, 1, 0).astype(bool)
+
+
+def masks_to_marks(masks: np.ndarray) -> sv.Detections:
+    """
+    Converts a set of masks to a marks (sv.Detections) object.
+
+    Parameters:
+        masks (np.ndarray): A 3D numpy array with shape `(N, H, W)`, where `N` is the
+            number of masks, `H` is the height, and `W` is the width.
+
+    Returns:
+        sv.Detections: An object containing the masks and their bounding box
+            coordinates.
+    """
+    return sv.Detections(mask=masks, xyxy=sv.mask_to_xyxy(masks=masks))
+
+
+def refine_marks(
+    marks: sv.Detections,
+    maximum_hole_area: float = 0.01,
+    maximum_island_area: float = 0.01,
+    minimum_mask_area: float = 0.02,
+    maximum_mask_area: float = 1.0,
+) -> sv.Detections:
+    """
+    Refines a set of masks by removing small islands and holes, and filtering by mask
+    area.
+
+    Parameters:
+        marks (sv.Detections): An object containing the masks and their bounding box
+            coordinates.
+        maximum_hole_area (float): The maximum relative area of holes to be filled in
+            each mask.
+        maximum_island_area (float): The maximum relative area of islands to be removed
+            from each mask.
+        minimum_mask_area (float): The minimum relative area for a mask to be retained.
+        maximum_mask_area (float): The maximum relative area for a mask to be retained.
+
+    Returns:
+        sv.Detections: An object containing the masks and their bounding box
+            coordinates.
+    """
+    result_masks = []
+    for mask in marks.mask:
+        mask = adjust_mask_features_by_relative_area(
+            mask=mask,
+            area_threshold=maximum_island_area,
+            feature_type=FeatureType.ISLAND,
+        )
+        mask = adjust_mask_features_by_relative_area(
+            mask=mask,
+            area_threshold=maximum_hole_area,
+            feature_type=FeatureType.HOLE,
+        )
+        if np.any(mask):
+            result_masks.append(mask)
+    result_masks = np.array(result_masks)
+    result_masks = filter_masks_by_relative_area(
+        masks=result_masks,
+        minimum_area=minimum_mask_area,
+        maximum_area=maximum_mask_area,
+    )
+    return sv.Detections(
+        mask=result_masks, xyxy=sv.mask_to_xyxy(masks=result_masks)
+    )
+
+
+class SegmentAnythingMarkGenerator:
+    """
+    A class for performing image segmentation using a specified model.
+
+    Parameters:
+        device (str): The device to run the model on (e.g., 'cpu', 'cuda').
+        model_name (str): The name of the model to be loaded. Defaults to
+            'facebook/sam-vit-huge'.
+    """
+
+    def __init__(
+        self, device: str = "cpu", model_name: str = "facebook/sam-vit-huge"
+    ):
+        self.model = SamModel.from_pretrained(model_name).to(device)
+        self.processor = SamProcessor.from_pretrained(model_name)
+        self.image_processor = SamImageProcessor.from_pretrained(model_name)
+        self.pipeline = pipeline(
+            task="mask-generation",
+            model=self.model,
+            image_processor=self.image_processor,
+            device=device,
+        )
+
+    def run(self, image: np.ndarray) -> sv.Detections:
+        """
+        Generate image segmentation marks.
+
+        Parameters:
+            image (np.ndarray): The image to be marked in BGR format.
+
+        Returns:
+            sv.Detections: An object containing the segmentation masks and their
+                corresponding bounding box coordinates.
+        """
+        image = Image.fromarray(cv2.cvtColor(image, cv2.COLOR_BGR2RGB))
+        outputs = self.pipeline(image, points_per_batch=64)
+        masks = np.array(outputs["masks"])
+        return masks_to_marks(masks=masks)
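A small self-contained check of the mask utilities added above, on synthetic masks; it assumes the three functions are in scope (imported from wherever this hunk lands):

```python
import numpy as np

# Three toy masks: a large square, a nested smaller square that overlaps it
# heavily, and a small disjoint square.
masks = np.zeros((3, 8, 8), dtype=np.uint8)
masks[0, 0:6, 0:6] = 1  # area 36
masks[1, 0:5, 0:5] = 1  # area 25, fully inside mask 0
masks[2, 6:8, 6:8] = 1  # area 4, disjoint

iou = compute_mask_iou_vectorized(masks)
print(round(iou[0, 1], 3))  # 0.694 = 25/36, above the default 0.6 threshold

kept = mask_non_max_suppression(masks, iou_threshold=0.6)
print(kept.shape[0])  # 2: the nested smaller square is suppressed

large = filter_masks_by_relative_area(kept, minimum_area=0.1)
print(large.shape[0])  # 1: the 4/64 = 0.0625 square falls below minimum_area
```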
@@ -0,0 +1,11 @@
+# System prompt
+FLOW_SYSTEM_PROMPT = """
+You are an autonomous agent granted autonomy in an autonomous loop structure.
+Your role is to engage in multi-step conversations with yourself or the user,
+generate long-form content like blogs, screenplays, or SOPs,
+and accomplish tasks given to you by the user.
+
+You can have internal dialogues with yourself or can interact with the user
+to aid in these complex tasks. Your responses should be coherent, contextually relevant, and tailored to the task at hand.
+
+"""
@@ -0,0 +1,99 @@
+VISION_PROMPT = """
+You are a Self-Operating Computer. You use the same operating system as a human.
+
+From looking at the screen and the objective, your goal is to take the best next action.
+
+To operate the computer you have the four options below.
+
+1. CLICK - Move mouse and click
+2. TYPE - Type on the keyboard
+3. SEARCH - Search for a program on Mac and open it
+4. DONE - When you have completed the task, respond with the exact following phrase content
+
+Here are the response formats below.
+
+1. CLICK
+Response: CLICK {{ "x": "percent", "y": "percent", "description": "~description here~", "reason": "~reason here~" }}
+
+2. TYPE
+Response: TYPE "value you want to type"
+
+3. SEARCH
+Response: SEARCH "app you want to search for on Mac"
+
+4. DONE
+Response: DONE
+
+Here are examples of how to respond.
+__
+Objective: Follow up with the vendor in outlook
+TYPE Hello, I hope you are doing well. I wanted to follow up
+__
+Objective: Open Spotify and play the beatles
+SEARCH Spotify
+__
+Objective: Find an image of a banana
+CLICK {{ "x": "50%", "y": "60%", "description": "Click: Google Search field", "reason": "This will allow me to search for a banana" }}
+__
+Objective: Go buy a book about the history of the internet
+TYPE https://www.amazon.com/
+__
+
+A few important notes:
+
+- Default to opening Google Chrome with SEARCH to find things that are on the internet.
+- Go to Google Docs and Google Sheets by typing in the Chrome address bar.
+- When opening Chrome, if you see a profile icon click that to open Chrome fully; it is located at: {{ "x": "50%", "y": "55%" }}
+- The Chrome address bar is generally at: {{ "x": "50%", "y": "9%" }}
+- After you click to enter a field you can go ahead and start typing!
+
+{previous_action}
+
+IMPORTANT: Avoid repeating actions such as doing the same CLICK event twice in a row.
+
+Objective: {objective}
+"""
+
+USER_QUESTION = "Hello, I can help you with anything. What would you like done?"
+
+SUMMARY_PROMPT = """
+You are a Self-Operating Computer. You just completed a request from a user by operating the computer. Now you need to share the results.
+
+You have three pieces of key context about the completed request.
+
+1. The original objective
+2. The steps you took to reach the objective that are available in the previous messages
+3. The screenshot you are looking at.
+
+Now you need to summarize what you did to reach the objective. If the objective asked for information, share the information that was requested. IMPORTANT: Don't forget to answer a user's question if they asked one.
+
+One thing to note: the user cannot respond to your summary. You are just sharing the results of your work.
+
+The original objective was: {objective}
+
+Now share the results!
+"""
+
+
+def format_summary_prompt(objective):
+    """
+    Format the summary prompt.
+    """
+    prompt = SUMMARY_PROMPT.format(objective=objective)
+    return prompt
+
+
+def format_vision_prompt(objective, previous_action):
+    """
+    Format the vision prompt.
+    """
+    if previous_action:
+        previous_action = (
+            f"Here was the previous action you took: {previous_action}"
+        )
+    else:
+        previous_action = ""
+    prompt = VISION_PROMPT.format(
+        objective=objective, previous_action=previous_action
+    )
+    return prompt
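A quick sanity check of the helpers above. Note that `VISION_PROMPT` doubles its literal JSON braces (`{{ ... }}`) precisely so that `str.format` leaves them intact while filling `{objective}` and `{previous_action}`:

```python
# The previous action is only echoed into the prompt when one exists.
first = format_vision_prompt("Open Spotify and play the beatles", None)
nxt = format_vision_prompt("Open Spotify and play the beatles", "SEARCH Spotify")
print("previous action" in first)  # False: the placeholder collapses to ""
print("previous action" in nxt)    # True: the prior step is echoed back
```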
@@ -0,0 +1,60 @@
+# Prompts
+DYNAMIC_STOP_PROMPT = """
+
+Now, when you are 99% sure you have completed the task, you may follow the instructions below to escape the autonomous loop.
+
+When you have finished the task from the Human, output a special token: <DONE>
+This will enable you to leave the autonomous loop.
+"""
+
+
+# Make it able to handle multi-input tools
+DYNAMICAL_TOOL_USAGE = """
+You have access to the following tools:
+Output a JSON object with the following structure to use the tools:
+commands: {
+    "tools": {
+        "tool1": "tool_name",
+        "params": {
+            "arg1": "inputs",
+            "arg2": "inputs"
+        },
+        "tool2": "tool_name",
+        "params": {
+            "arg1": "inputs",
+            "arg2": "inputs"
+        },
+        "tool3": "tool_name",
+        "params": {
+            "arg1": "inputs",
+            "arg2": "inputs"
+        }
+    }
+}
+
+-------------TOOLS---------------------------
+{tools}
+"""
+
+SCENARIOS = """
+commands: {
+    "tools": {
+        "tool1": "tool_name",
+        "params": {
+            "arg1": "inputs",
+            "arg2": "inputs"
+        },
+        "tool2": "tool_name",
+        "params": {
+            "arg1": "inputs",
+            "arg2": "inputs"
+        },
+        "tool3": "tool_name",
+        "params": {
+            "arg1": "inputs",
+            "arg2": "inputs"
+        }
+    }
+}
+
+"""
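One caution, assuming `DYNAMICAL_TOOL_USAGE` is meant to be filled with `str.format` like the vision prompts earlier in this commit: its literal JSON braces are single, so `.format(tools=...)` would raise on them. `VISION_PROMPT` avoids this by doubling its braces; an alternative sketch using `string.Template`:

```python
from string import Template

# str.format chokes on the single literal { } in the JSON schema, so swap the
# {tools} placeholder for a Template variable and substitute safely instead.
template = Template(DYNAMICAL_TOOL_USAGE.replace("{tools}", "$tools"))
rendered = template.safe_substitute(tools="- search\n- calculator")
print("- search" in rendered)  # True: tool list lands under the TOOLS banner
```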
@@ -1,97 +0,0 @@
-from swarms.models import OpenAIChat
-from swarms.structs.agent import Agent
-
-import concurrent.futures
-from typing import Callable, List, Dict, Any, Sequence
-
-
-class Task:
-    def __init__(
-        self,
-        id: str,
-        task: str,
-        flows: Sequence[Agent],
-        dependencies: List[str] = [],
-    ):
-        self.id = id
-        self.task = task
-        self.flows = flows
-        self.dependencies = dependencies
-        self.results = []
-
-    def execute(self, parent_results: Dict[str, Any]):
-        args = [parent_results[dep] for dep in self.dependencies]
-        for agent in self.flows:
-            result = agent.run(self.task, *args)
-            self.results.append(result)
-            args = [
-                result
-            ]  # The output of one agent becomes the input to the next
-
-
-class Workflow:
-    def __init__(self):
-        self.tasks: Dict[str, Task] = {}
-        self.executor = concurrent.futures.ThreadPoolExecutor()
-
-    def add_task(self, task: Task):
-        self.tasks[task.id] = task
-
-    def run(self):
-        completed_tasks = set()
-        while len(completed_tasks) < len(self.tasks):
-            futures = []
-            for task in self.tasks.values():
-                if task.id not in completed_tasks and all(
-                    dep in completed_tasks for dep in task.dependencies
-                ):
-                    future = self.executor.submit(
-                        task.execute,
-                        {
-                            dep: self.tasks[dep].results
-                            for dep in task.dependencies
-                        },
-                    )
-                    futures.append((future, task.id))
-
-            for future, task_id in futures:
-                future.result()  # Wait for task completion
-                completed_tasks.add(task_id)
-
-    def get_results(self):
-        return {task_id: task.results for task_id, task in self.tasks.items()}
-
-
-# create flows
-llm = OpenAIChat(openai_api_key="sk-")
-
-flow1 = Agent(llm, max_loops=1)
-flow2 = Agent(llm, max_loops=1)
-flow3 = Agent(llm, max_loops=1)
-flow4 = Agent(llm, max_loops=1)
-
-
-# Create tasks with their respective Agents and task strings
-task1 = Task("task1", "Generate a summary on Quantum field theory", [flow1])
-task2 = Task(
-    "task2",
-    "Elaborate on the summary of topic X",
-    [flow2, flow3],
-    dependencies=["task1"],
-)
-task3 = Task(
-    "task3", "Generate conclusions for topic X", [flow4], dependencies=["task1"]
-)
-
-# Create a workflow and add tasks
-workflow = Workflow()
-workflow.add_task(task1)
-workflow.add_task(task2)
-workflow.add_task(task3)
-
-# Run the workflow
-workflow.run()
-
-# Get results
-results = workflow.get_results()
-print(results)
@@ -0,0 +1,49 @@
+from swarms.structs.agent import Agent
+
+from typing import List, Dict, Any, Sequence
+
+
+class Task:
+    """
+    Task is a unit of work that can be executed by a set of agents.
+
+    A task is defined by a task name and a set of agents that can execute the task.
+    The task can also have a set of dependencies, which are the names of other tasks
+    that must be executed before this task can be executed.
+
+    Args:
+        id (str): A unique identifier for the task
+        task (str): The name of the task
+        agents (Sequence[Agent]): A list of agents that can execute the task
+        dependencies (List[str], optional): A list of task names that must be executed before this task can be executed. Defaults to [].
+
+    Methods:
+        execute(parent_results: Dict[str, Any]): Executes the task by passing the results of the parent tasks to the agents.
+    """
+
+    def __init__(
+        self,
+        id: str,
+        task: str,
+        agents: Sequence[Agent],
+        dependencies: List[str] = [],
+    ):
+        self.id = id
+        self.task = task
+        self.agents = agents
+        self.dependencies = dependencies
+        self.results = []
+
+    def execute(self, parent_results: Dict[str, Any]):
+        """Executes the task by passing the results of the parent tasks to the agents.
+
+        Args:
+            parent_results (Dict[str, Any]): A mapping from dependency task id to that task's results.
+        """
+        args = [parent_results[dep] for dep in self.dependencies]
+        for agent in self.agents:
+            result = agent.run(self.task, *args)
+            self.results.append(result)
+            args = [
+                result
+            ]  # The output of one agent becomes the input to the next
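A minimal sketch of chaining the new `Task` objects by hand, assuming `Agent.run` accepts the extra positional arguments that `execute` passes; the stub agent below is hypothetical, standing in for `swarms.structs.agent.Agent`:

```python
# Hypothetical stand-in agent, just to show the dependency wiring:
# task2 receives task1's results through parent_results.
class EchoAgent:
    def run(self, task, *args):
        return f"{task} | context={list(args)}"

task1 = Task(id="task1", task="summarize", agents=[EchoAgent()])
task2 = Task(
    id="task2", task="elaborate", agents=[EchoAgent()], dependencies=["task1"]
)

task1.execute({})
task2.execute({"task1": task1.results})
print(task2.results[0])  # elaborate | context=[['summarize | context=[]']]
```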
@@ -0,0 +1,107 @@
+import os
+from unittest.mock import Mock
+
+import pytest
+from dotenv import load_dotenv
+
+from swarms.models.gpt4_vision_api import GPT4VisionAPI
+from swarms.prompts.multi_modal_autonomous_instruction_prompt import (
+    MULTI_MODAL_AUTO_AGENT_SYSTEM_PROMPT_1,
+)
+from swarms.structs.agent import Agent
+from swarms.structs.task import Task
+
+load_dotenv()
+
+
+@pytest.fixture
+def llm():
+    return GPT4VisionAPI()
+
+
+def test_agent_run_task(llm):
+    task = (
+        "Analyze this image of an assembly line and identify any issues such as"
+        " misaligned parts, defects, or deviations from the standard assembly"
+        " process. If there is anything unsafe in the image, explain why it is"
+        " unsafe and how it could be improved."
+    )
+    img = "assembly_line.jpg"
+
+    agent = Agent(
+        llm=llm,
+        max_loops="auto",
+        sop=MULTI_MODAL_AUTO_AGENT_SYSTEM_PROMPT_1,
+        dashboard=True,
+    )
+
+    result = agent.run(task=task, img=img)
+
+    # Add assertions here to verify the expected behavior of the agent's run method
+    assert isinstance(result, dict)
+    assert "response" in result
+    assert "dashboard_data" in result
+    # Add more assertions as needed
+
+
+@pytest.fixture
+def task(llm):
+    # Take the llm fixture as a parameter; as committed, this referenced the
+    # fixture function itself, which is not a usable Agent argument.
+    agents = [Agent(llm=llm, id=f"Agent_{i}") for i in range(5)]
+    return Task(id="Task_1", task="Task_Name", agents=agents, dependencies=[])
+
+
+# Basic tests
+
+
+def test_task_init(task):
+    assert task.id == "Task_1"
+    assert task.task == "Task_Name"
+    assert isinstance(task.agents, list)
+    assert len(task.agents) == 5
+    assert isinstance(task.dependencies, list)
+
+
+def test_task_execute(task, mocker):
+    mocker.patch.object(Agent, "run", side_effect=[1, 2, 3, 4, 5])
+    parent_results = {}
+    task.execute(parent_results)
+    assert isinstance(task.results, list)
+    assert len(task.results) == 5
+    for result in task.results:
+        assert isinstance(result, int)
+
+
+# Parameterized tests
+
+
+@pytest.mark.parametrize("num_agents", [1, 3, 5, 10])
+def test_task_num_agents(task, num_agents, mocker):
+    task.agents = [Agent(id=f"Agent_{i}") for i in range(num_agents)]
+    mocker.patch.object(Agent, "run", return_value=1)
+    parent_results = {}
+    task.execute(parent_results)
+    assert len(task.results) == num_agents
+
+
+# Exception testing
+
+
+def test_task_execute_with_dependency_error(task, mocker):
+    task.dependencies = ["NonExistentTask"]
+    mocker.patch.object(Agent, "run", return_value=1)
+    parent_results = {}
+    with pytest.raises(KeyError):
+        task.execute(parent_results)
+
+
+# Mocking and monkeypatching tests
+
+
+def test_task_execute_with_mocked_agents(task, mocker):
+    mock_agents = [Mock(spec=Agent) for _ in range(5)]
+    mocker.patch.object(task, "agents", mock_agents)
+    for mock_agent in mock_agents:
+        mock_agent.run.return_value = 1
+    parent_results = {}
+    task.execute(parent_results)
+    assert len(task.results) == 5