Merge pull request #4 from kyegomez/master

Catching up 20240128 1624
12 months ago · bb0d18eacc
parent 6c4e5cc2db d34427a4f8
commit bb0d18eacc
30 changed files with 1004 additions and 151 deletions
--- a/README.md
+++ b/README.md
@ -108,6 +108,56 @@ generated_data = agent.run(task)

 print(generated_data)

+```
+
+
+### `Worker`
+The `Worker` is a simple all-in-one agent equipped with an LLM, tools, and RAG. Get started below:
+
+✅ Plug in and Play LLM. Utilize any LLM from anywhere and any framework
+
+✅ Reliable RAG: Utilizes FAISS for efficient RAG but it's modular so you can use any DB.
+
+✅ Multi-Step Parallel Function Calling: Use any tool
+
+```python
+# Importing necessary modules
+import os
+from dotenv import load_dotenv
+from swarms import Worker, OpenAIChat, tool
+
+# Loading environment variables from .env file
+load_dotenv()
+
+# Retrieving the OpenAI API key from environment variables
+api_key = os.getenv("OPENAI_API_KEY")
+
+
+# Create a tool
+@tool
+def search_api(query: str):
+    pass
+
+
+# Creating a Worker instance
+worker = Worker(
+    name="My Worker",
+    role="Worker",
+    human_in_the_loop=False,
+    tools=[search_api],
+    temperature=0.5,
+    llm=OpenAIChat(openai_api_key=api_key),
+)
+
+# Running the worker with a prompt
+out = worker.run(
+    "Hello, how are you? Create an image of how your are doing!"
+)
+
+# Printing the output
+print(out)
+
+
 ```

 ------
@ -774,6 +824,115 @@ out = llm.run(task=task, img=img)
 print(out)
 ```

+### `GPT4Vision`
+```python
+from swarms import GPT4VisionAPI
+
+# Initialize with default API key and custom max_tokens
+api = GPT4VisionAPI(max_tokens=1000)
+
+# Define the task and image URL
+task = "Describe the scene in the image."
+img = "https://i.imgur.com/4P4ZRxU.jpeg"
+
+# Run the GPT-4 Vision model
+response = api.run(task, img)
+
+# Print the model's response
+print(response)
+```
+
+### `QwenVLMultiModal`
+A radically simple interface for QwenVLMultiModal comes complete with Quantization to turn it on just set quantize to true!
+
+```python
+from swarms import QwenVLMultiModal
+
+# Instantiate the QwenVLMultiModal model
+model = QwenVLMultiModal(
+    model_name="Qwen/Qwen-VL-Chat",
+    device="cuda",
+    quantize=True,
+)
+
+# Run the model
+response = model(
+    "Hello, how are you?", "https://example.com/image.jpg"
+)
+
+# Print the response
+print(response)
+
+
+```
+
+
+### `Kosmos`
+- Multi-Modal Model from microsoft!
+
+```python
+from swarms import Kosmos
+
+# Initialize the model
+model = Kosmos()
+
+# Generate
+out = model.run("Analyze the reciepts in this image", "docs.jpg")
+
+# Print the output
+print(out)
+
+```
+
+
+### `Idefics`
+- Multi-Modal model from Huggingface team!
+
+```python
+# Import the idefics model from the swarms.models module
+from swarms.models import Idefics
+
+# Create an instance of the idefics model
+model = Idefics()
+
+# Define user input with an image URL and chat with the model
+user_input = (
+    "User: What is in this image?"
+    " https://upload.wikimedia.org/wikipedia/commons/8/86/Id%C3%A9fix.JPG"
+)
+response = model.chat(user_input)
+print(response)
+
+# Define another user input with an image URL and chat with the model
+user_input = (
+    "User: And who is that?"
+    " https://static.wikia.nocookie.net/asterix/images/2/25/R22b.gif/revision/latest?cb=20110815073052"
+)
+response = model.chat(user_input)
+print(response)
+
+# Set the checkpoint of the model to "new_checkpoint"
+model.set_checkpoint("new_checkpoint")
+
+# Set the device of the model to "cpu"
+model.set_device("cpu")
+
+# Set the maximum length of the chat to 200
+model.set_max_length(200)
+
+# Clear the chat history of the model
+model.clear_chat_history()
+
+
+```
+
+## Radically Simple AI Model APIs
+We provide a vast array of language and multi-modal model APIs for you to generate text, images, music, speech, and even videos. Get started below:
+
+
+
+-----
+

 ### `Anthropic`
 ```python
@ -850,23 +1009,6 @@ print(image_url)
 ```


-### `GPT4Vision`
-```python
-from swarms import GPT4VisionAPI
-
-# Initialize with default API key and custom max_tokens
-api = GPT4VisionAPI(max_tokens=1000)
-
-# Define the task and image URL
-task = "Describe the scene in the image."
-img = "https://i.imgur.com/4P4ZRxU.jpeg"
-
-# Run the GPT-4 Vision model
-response = api.run(task, img)
-
-# Print the model's response
-print(response)
-```


 ### Text to Video with `ZeroscopeTTV`
@ -888,7 +1030,7 @@ print(video_path)
 ```


-### ModelScope
+<!-- ### ModelScope
 ```python
 from swarms.models import ModelScopeAutoModel

@ -910,32 +1052,9 @@ cog_agent = CogAgent()
 # Run the model on the tests
 cog_agent.run("Describe this scene", "images/1.jpg")

-```
+``` -->


-### `QwenVLMultiModal`
-A radically simple interface for QwenVLMultiModal comes complete with Quantization to turn it on just set quantize to true!
-
-```python
-from swarms import QwenVLMultiModal
-
-# Instantiate the QwenVLMultiModal model
-model = QwenVLMultiModal(
-    model_name="Qwen/Qwen-VL-Chat",
-    device="cuda",
-    quantize=True,
-)
-
-# Run the model
-response = model(
-    "Hello, how are you?", "https://example.com/image.jpg"
-)
-
-# Print the response
-print(response)
-
-
-```

 ----

--- a/docs/corporate/data_room.md
+++ b/docs/corporate/data_room.md
@ -80,23 +80,16 @@ Swarms is an open source framework for developers in python to enable seamless,
 [Here is the official Swarms Github Page:](https://github.com/kyegomez/swarms)

 ### Product Growth Metrics
+| Name                             | Description                                                                                                   | Link                                                                                      |
+|----------------------------------|---------------------------------------------------------------------------------------------------------------|-------------------------------------------------------------------------------------------|
+| Total Downloads of all time      | Total number of downloads for the product over its entire lifespan.                                           | [![Downloads](https://static.pepy.tech/badge/swarms)](https://pepy.tech/project/swarms)   |
+| Downloads this month             | Number of downloads for the product in the current month.                                                     | [![Downloads](https://static.pepy.tech/badge/swarms/month)](https://pepy.tech/project/swarms) |
+| Total Downloads this week        | Total number of downloads for the product in the current week.                                                | [![Downloads](https://static.pepy.tech/badge/swarms/week)](https://pepy.tech/project/swarms) |
+| Github Forks                     | Number of times the product's codebase has been copied for optimization, contribution, or usage.              | [![GitHub forks](https://img.shields.io/github/forks/kyegomez/swarms)](https://github.com/kyegomez/swarms/network) |
+| Github Stars                     | Number of users who have 'liked' the project.                                                                 | [![GitHub stars](https://img.shields.io/github/stars/kyegomez/swarms)](https://github.com/kyegomez/swarms/stargazers) |
+| Pip Module Metrics               | Various project statistics such as watchers, number of contributors, date repository was created, and more.   | [CLICK HERE](https://libraries.io/github/kyegomez/swarms)                                |
+| Contribution Based Statistics    | Statistics like number of contributors, lines of code changed, etc.                                           | [HERE](https://github.com/kyegomez/swarms/graphs/contributors)                           |
+| Github Community insights        | Insights into the Github community around the product.                                                        | [Github Community insights](https://github.com/kyegomez/swarms/graphs/community)         |
+| Github Traffic Metrics           | Metrics related to traffic, such as views and clones on Github.                                               | [Github Traffic Metrics](https://github.com/kyegomez/swarms/graphs/traffic)               |
+| Issues with the framework        | Current open issues for the product on Github.                                                                | [![GitHub issues](https://img.shields.io/github/issues/kyegomez/swarms)](https://github.com/kyegomez/swarms/issues) |

- Total Downloads of all time: [![GitHub issues](https://img.shields.io/github/issues/kyegomez/swarms)](https://github.com/kyegomez/swarms/issues)
-
- Click here for Downloads this month: [![Downloads](https://static.pepy.tech/badge/swarms/month)](https://pepy.tech/project/swarms)
-
- Total Downloads this week: [![GitHub issues](https://img.shields.io/github/issues/kyegomez/swarms)](https://github.com/kyegomez/swarms/issues)
-
- Click here for Forks which represent the number of times a user has copied the entire codebase for optimization, contribution, or usage. [![GitHub forks](https://img.shields.io/github/forks/kyegomez/swarms)](https://github.com/kyegomez/swarms/network) 
-
- Stars are the number of people that have liked our project, click here for more: [![GitHub stars](https://img.shields.io/github/stars/kyegomez/swarms)](https://github.com/kyegomez/swarms/stargazers)
-
- Various Project Statistics such as watchers, number of contributors, date repository was created and much more. [CLICK HERE](https://libraries.io/github/kyegomez/swarms)
-
- Contribution Based Statistics such as number of contributors, number of lines of code changed, and much more [HERE](https://github.com/kyegomez/swarms/graphs/contributors)
-
- [Github Community insights](https://github.com/kyegomez/swarms/graphs/community)
-
- [Github Traffic Metrics](https://github.com/kyegomez/swarms/graphs/traffic)
-
- Issues with the framework or Github Issues: [![GitHub issues](https://img.shields.io/github/issues/kyegomez/swarms)](https://github.com/kyegomez/swarms/issues)
--- a/playground/agents/worker_example.py
+++ b/playground/agents/worker_example.py
@ -1,12 +1,16 @@
+# Importing necessary modules
 import os
 from dotenv import load_dotenv
 from swarms.agents.worker_agent import Worker
 from swarms import OpenAIChat

+# Loading environment variables from .env file
 load_dotenv()

+# Retrieving the OpenAI API key from environment variables
 api_key = os.getenv("OPENAI_API_KEY")

+# Creating a Worker instance
 worker = Worker(
    name="My Worker",
    role="Worker",
@ -14,9 +18,13 @@ worker = Worker(
    tools=[],
    temperature=0.5,
    llm=OpenAIChat(openai_api_key=api_key),
+    verbose=True,
 )

+# Running the worker with a prompt
 out = worker.run(
    "Hello, how are you? Create an image of how your are doing!"
 )
+
+# Printing the output
 print(out)
--- a/playground/demos/fof/langchain.py
+++ b/playground/demos/fof/langchain.py
@ -0,0 +1,4 @@
+"""
+This tutorial shows you how to integrate swarms with Langchain
+
+"""
--- a/playground/models/idefics.py
+++ b/playground/models/idefics.py
@ -1,7 +1,10 @@
-from swarms.models import idefics
+# Import the idefics model from the swarms.models module
+from swarms.models import Idefics

-model = idefics()
+# Create an instance of the idefics model
+model = Idefics()

+# Define user input with an image URL and chat with the model
 user_input = (
    "User: What is in this image?"
    " https://upload.wikimedia.org/wikipedia/commons/8/86/Id%C3%A9fix.JPG"
@ -9,6 +12,7 @@ user_input = (
 response = model.chat(user_input)
 print(response)

+# Define another user input with an image URL and chat with the model
 user_input = (
    "User: And who is that?"
    " https://static.wikia.nocookie.net/asterix/images/2/25/R22b.gif/revision/latest?cb=20110815073052"
@ -16,7 +20,14 @@ user_input = (
 response = model.chat(user_input)
 print(response)

+# Set the checkpoint of the model to "new_checkpoint"
 model.set_checkpoint("new_checkpoint")
+
+# Set the device of the model to "cpu"
 model.set_device("cpu")
+
+# Set the maximum length of the chat to 200
 model.set_max_length(200)
+
+# Clear the chat history of the model
 model.clear_chat_history()
--- a/playground/models/kosmos.py
+++ b/playground/models/kosmos.py
@ -0,0 +1,10 @@
+from swarms import Kosmos
+
+# Initialize the model
+model = Kosmos()
+
+# Generate
+out = model.run("Analyze the reciepts in this image", "docs.jpg")
+
+# Print the output
+print(out)
--- a/pyproject.toml
+++ b/pyproject.toml
@ -4,7 +4,7 @@ build-backend = "poetry.core.masonry.api"

 [tool.poetry]
 name = "swarms"
-version = "3.7.9"
+version = "3.8.5"
 description = "Swarms - Pytorch"
 license = "MIT"
 authors = ["Kye Gomez <kye@apac.ai>"]
@ -24,7 +24,7 @@ classifiers = [
 [tool.poetry.dependencies]
 python = "^3.6.1"
 torch = "2.1.1"
-transformers = "4.36.2"
+transformers = "4.37.1"
 openai = "0.28.0"
 langchain = "0.0.333"
 asyncio = "3.4.3"
--- a/swarms/agents/init.py
+++ b/swarms/agents/init.py
@ -15,6 +15,7 @@ from swarms.agents.stopping_conditions import (
 )
 from swarms.agents.tool_agent import ToolAgent
 from swarms.agents.worker_agent import Worker
+from swarms.agents.agent_wrapper import agent_wrapper

 __all__ = [
    "AbstractAgent",
@ -32,4 +33,5 @@ __all__ = [
    "check_exit",
    "check_end",
    "Worker",
+    "agent_wrapper",
 ]
--- a/swarms/agents/agent_wrapper.py
+++ b/swarms/agents/agent_wrapper.py
@ -0,0 +1,26 @@
+from swarms.structs.agent import Agent
+
+
+def agent_wrapper(ClassToWrap):
+    """
+    This function takes a class 'ClassToWrap' and returns a new class that
+    inherits from both 'ClassToWrap' and 'Agent'. The new class overrides
+    the '__init__' method of 'Agent' to call the '__init__' method of 'ClassToWrap'.
+
+    Args:
+        ClassToWrap (type): The class to be wrapped and made to inherit from 'Agent'.
+
+    Returns:
+        type: The new class that inherits from both 'ClassToWrap' and 'Agent'.
+    """
+
+    class WrappedClass(ClassToWrap, Agent):
+        def __init__(self, *args, **kwargs):
+            try:
+                Agent.__init__(self, *args, **kwargs)
+                ClassToWrap.__init__(self, *args, **kwargs)
+            except Exception as e:
+                print(f"Error initializing WrappedClass: {e}")
+                raise e
+
+    return WrappedClass
--- a/swarms/agents/worker_agent.py
+++ b/swarms/agents/worker_agent.py
@ -51,6 +51,7 @@ class Worker:
        tools: List[Any] = None,
        embedding_size: int = 1536,
        search_kwargs: dict = {"k": 8},
+        verbose: bool = False,
        *args,
        **kwargs,
    ):
@ -64,6 +65,7 @@ class Worker:
        self.tools = tools
        self.embedding_size = embedding_size
        self.search_kwargs = search_kwargs
+        self.verbose = verbose

        self.setup_tools(external_tools)
        self.setup_memory()
@ -163,7 +165,7 @@ class Worker:
    # @log_decorator
    @error_decorator
    @timing_decorator
-    def run(self, task: str = None, *args, **kwargs):
+    def run(self, task: str = None, img=None, *args, **kwargs):
        """
        Run the autonomous agent on a given task.

--- a/swarms/memory/init.py
+++ b/swarms/memory/init.py
@ -1,11 +1,11 @@
-from swarms.memory.base_vectordb import VectorDatabase
+from swarms.memory.base_vectordb import AbstractDatabase
 from swarms.memory.short_term_memory import ShortTermMemory
 from swarms.memory.sqlite import SQLiteDB
 from swarms.memory.weaviate_db import WeaviateDB
 from swarms.memory.visual_memory import VisualShortTermMemory

 __all__ = [
-    "VectorDatabase",
+    "AbstractDatabase",
    "ShortTermMemory",
    "SQLiteDB",
    "WeaviateDB",
--- a/swarms/memory/base_vectordatabase.py
+++ b/swarms/memory/base_vectordatabase.py
@ -0,0 +1,141 @@
+from abc import ABC, abstractmethod
+
+
+class AbstractVectorDatabase(ABC):
+    """
+    Abstract base class for a database.
+
+    This class defines the interface for interacting with a database.
+    Subclasses must implement the abstract methods to provide the
+    specific implementation details for connecting to a database,
+    executing queries, and performing CRUD operations.
+
+    """
+
+    @abstractmethod
+    def connect(self):
+        """
+        Connect to the database.
+
+        This method establishes a connection to the database.
+
+        """
+
+        pass
+
+    @abstractmethod
+    def close(self):
+        """
+        Close the database connection.
+
+        This method closes the connection to the database.
+
+        """
+
+        pass
+
+    @abstractmethod
+    def query(self, query: str):
+        """
+        Execute a database query.
+
+        This method executes the given query on the database.
+
+        Parameters:
+            query (str): The query to be executed.
+
+        """
+
+        pass
+
+    @abstractmethod
+    def fetch_all(self):
+        """
+        Fetch all rows from the result set.
+
+        This method retrieves all rows from the result set of a query.
+
+        Returns:
+            list: A list of dictionaries representing the rows.
+
+        """
+
+        pass
+
+    @abstractmethod
+    def fetch_one(self):
+        """
+        Fetch one row from the result set.
+
+        This method retrieves one row from the result set of a query.
+
+        Returns:
+            dict: A dictionary representing the row.
+
+        """
+
+        pass
+
+    @abstractmethod
+    def add(self, doc: str):
+        """
+        Add a new record to the database.
+
+        This method adds a new record to the specified table in the database.
+
+        Parameters:
+            table (str): The name of the table.
+            data (dict): A dictionary representing the data to be added.
+
+        """
+
+        pass
+
+    @abstractmethod
+    def get(self, query: str):
+        """
+        Get a record from the database.
+
+        This method retrieves a record from the specified table in the database based on the given ID.
+
+        Parameters:
+            table (str): The name of the table.
+            id (int): The ID of the record to be retrieved.
+
+        Returns:
+            dict: A dictionary representing the retrieved record.
+
+        """
+
+        pass
+
+    @abstractmethod
+    def update(self, doc):
+        """
+        Update a record in the database.
+
+        This method updates a record in the specified table in the database based on the given ID.
+
+        Parameters:
+            table (str): The name of the table.
+            id (int): The ID of the record to be updated.
+            data (dict): A dictionary representing the updated data.
+
+        """
+
+        pass
+
+    @abstractmethod
+    def delete(self, message):
+        """
+        Delete a record from the database.
+
+        This method deletes a record from the specified table in the database based on the given ID.
+
+        Parameters:
+            table (str): The name of the table.
+            id (int): The ID of the record to be deleted.
+
+        """
+
+        pass
--- a/swarms/memory/base_vectordb.py
+++ b/swarms/memory/base_vectordb.py
@ -1,58 +0,0 @@
-from abc import ABC, abstractmethod
-from typing import Any, Dict
-
-
-class VectorDatabase(ABC):
-    @abstractmethod
-    def add(
-        self, vector: Dict[str, Any], metadata: Dict[str, Any]
-    ) -> None:
-        """
-        add a vector into the database.
-
-        Args:
-            vector (Dict[str, Any]): The vector to add.
-            metadata (Dict[str, Any]): Metadata associated with the vector.
-        """
-        pass
-
-    @abstractmethod
-    def query(self, text: str, num_results: int) -> Dict[str, Any]:
-        """
-        Query the database for vectors similar to the given vector.
-
-        Args:
-            text (Dict[str, Any]): The vector to compare against.
-            num_results (int): The number of similar vectors to return.
-
-        Returns:
-            Dict[str, Any]: The most similar vectors and their associated metadata.
-        """
-        pass
-
-    @abstractmethod
-    def delete(self, vector_id: str) -> None:
-        """
-        Delete a vector from the database.
-
-        Args:
-            vector_id (str): The ID of the vector to delete.
-        """
-        pass
-
-    @abstractmethod
-    def update(
-        self,
-        vector_id: str,
-        vector: Dict[str, Any],
-        metadata: Dict[str, Any],
-    ) -> None:
-        """
-        Update a vector in the database.
-
-        Args:
-            vector_id (str): The ID of the vector to update.
-            vector (Dict[str, Any]): The new vector.
-            metadata (Dict[str, Any]): The new metadata.
-        """
-        pass
--- a/swarms/memory/pinecone.py
+++ b/swarms/memory/pinecone.py
@ -1,12 +1,12 @@
 from typing import Optional
-from swarms.memory.base_vectordb import VectorDatabase
+from swarms.memory.base_vectordb import AbstractDatabase
 import pinecone
 from attr import define, field
 from swarms.utils.hash import str_to_hash


@define
-class PineconeDB(VectorDatabase):
+class PineconeDB(AbstractDatabase):
    """
    PineconeDB is a vector storage driver that uses Pinecone as the underlying storage engine.

--- a/swarms/memory/sqlite.py
+++ b/swarms/memory/sqlite.py
@ -1,5 +1,5 @@
 from typing import List, Tuple, Any, Optional
-from swarms.memory.base_vectordb import VectorDatabase
+from swarms.memory.base_vectordb import AbstractDatabase

 try:
    import sqlite3
@ -9,7 +9,7 @@ except ImportError:
    )


-class SQLiteDB(VectorDatabase):
+class SQLiteDB(AbstractDatabase):
    """
    A reusable class for SQLite database operations with methods for adding,
    deleting, updating, and querying data.
--- a/swarms/memory/weaviate_db.py
+++ b/swarms/memory/weaviate_db.py
@ -4,7 +4,7 @@ Weaviate API Client

 from typing import Any, Dict, List, Optional

-from swarms.memory.base_vectordb import VectorDatabase
+from swarms.memory.base_vectordb import AbstractDatabase

 try:
    import weaviate
@ -12,7 +12,7 @@ except ImportError:
    print("pip install weaviate-client")


-class WeaviateDB(VectorDatabase):
+class WeaviateDB(AbstractDatabase):
    """

    Weaviate API Client
--- a/swarms/models/init.py
+++ b/swarms/models/init.py
@ -47,6 +47,9 @@ from swarms.models.ultralytics_model import (
 from swarms.models.vip_llava import VipLlavaMultiModal  # noqa: E402
 from swarms.models.llava import LavaMultiModal  # noqa: E402
 from swarms.models.qwen import QwenVLMultiModal  # noqa: E402
+from swarms.models.clipq import CLIPQ  # noqa: E402
+from swarms.models.kosmos_two import Kosmos  # noqa: E402
+from swarms.models.fuyu import Fuyu  # noqa: E402

 # from swarms.models.dalle3 import Dalle3
 # from swarms.models.distilled_whisperx import DistilWhisperModel # noqa: E402
@ -78,7 +81,6 @@ __all__ = [
    "Zephyr",
    "BaseMultiModalModel",
    "Idefics",
-    # "Kosmos",
    "Vilt",
    "Nougat",
    "LayoutLMDocumentQA",
@ -101,13 +103,13 @@ __all__ = [
    "AudioModality",
    "VideoModality",
    "MultimodalData",
-    # "CogAgent",
-    # "ModelScopePipeline",
-    # "ModelScopeAutoModel",
    "TogetherLLM",
    "TimmModel",
    "UltralyticsModel",
    "VipLlavaMultiModal",
    "LavaMultiModal",
    "QwenVLMultiModal",
+    "CLIPQ",
+    "Kosmos",
+    "Fuyu",
 ]
--- a/swarms/models/anthropic.py
+++ b/swarms/models/anthropic.py
@ -29,9 +29,7 @@ from langchain.schema.language_model import BaseLanguageModel
 from langchain.schema.output import GenerationChunk
 from langchain.schema.prompt import PromptValue
 from langchain.utils import (
-    check_package_version,
    get_from_dict_or_env,
-    get_pydantic_field_names,
 )
 from packaging.version import parse
 from requests import HTTPError, Response
--- a/swarms/models/clipq.py
+++ b/swarms/models/clipq.py
@ -0,0 +1,183 @@
+from io import BytesIO
+
+import requests
+import torch
+from PIL import Image
+from torchvision.transforms import GaussianBlur
+from transformers import CLIPModel, CLIPProcessor
+
+
+class CLIPQ:
+    """
+    ClipQ is an CLIQ based model that can be used to generate captions for images.
+
+
+    Attributes:
+        model_name (str): The name of the model to be used.
+        query_text (str): The query text to be used for the model.
+
+    Args:
+        model_name (str): The name of the model to be used.
+        query_text (str): The query text to be used for the model.
+
+
+
+
+    """
+
+    def __init__(
+        self,
+        model_name: str = "openai/clip-vit-base-patch16",
+        query_text: str = "A photo ",
+        *args,
+        **kwargs,
+    ):
+        self.model = CLIPModel.from_pretrained(
+            model_name, *args, **kwargs
+        )
+        self.processor = CLIPProcessor.from_pretrained(model_name)
+        self.query_text = query_text
+
+    def fetch_image_from_url(self, url="https://picsum.photos/800"):
+        """Fetches an image from the given url"""
+        response = requests.get(url)
+        if response.status_code != 200:
+            raise Exception("Failed to fetch an image")
+        image = Image.open(BytesIO(response.content))
+        return image
+
+    def load_image_from_path(self, path):
+        """Loads an image from the given path"""
+        return Image.open(path)
+
+    def split_image(
+        self, image, h_splits: int = 2, v_splits: int = 2
+    ):
+        """Splits the given image into h_splits x v_splits parts"""
+        width, height = image.size
+        w_step, h_step = width // h_splits, height // v_splits
+        slices = []
+
+        for i in range(v_splits):
+            for j in range(h_splits):
+                slice = image.crop(
+                    (
+                        j * w_step,
+                        i * h_step,
+                        (j + 1) * w_step,
+                        (i + 1) * h_step,
+                    )
+                )
+                slices.append(slice)
+        return slices
+
+    def get_vectors(
+        self,
+        image,
+        h_splits: int = 2,
+        v_splits: int = 2,
+    ):
+        """Gets the vectors for the given image"""
+        slices = self.split_image(image, h_splits, v_splits)
+        vectors = []
+
+        for slice in slices:
+            inputs = self.processor(
+                text=self.query_text,
+                images=slice,
+                return_tensors="pt",
+                padding=True,
+            )
+            outputs = self.model(**inputs)
+            vectors.append(
+                outputs.image_embeds.squeeze().detach().numpy()
+            )
+        return vectors
+
+    def run_from_url(
+        self,
+        url: str = "https://picsum.photos/800",
+        h_splits: int = 2,
+        v_splits: int = 2,
+    ):
+        """Runs the model on the image fetched from the given url"""
+        image = self.fetch_image_from_url(url)
+        return self.get_vectors(image, h_splits, v_splits)
+
+    def check_hard_chunking(self, quadrants):
+        """Check if the chunking is hard"""
+        variances = []
+        for quadrant in quadrants:
+            edge_pixels = torch.cat(
+                [
+                    quadrant[0, 1],
+                    quadrant[-1, :],
+                ]
+            )
+            variances.append(torch.var(edge_pixels).item())
+        return variances
+
+    def embed_whole_image(self, image):
+        """Embed the entire image"""
+        inputs = self.processor(
+            image,
+            return_tensors="pt",
+        )
+        with torch.no_grad():
+            outputs = self.model(**inputs)
+            return outputs.image_embeds.squeeze()
+
+    def apply_noise_reduction(self, image, kernel_size: int = 5):
+        """Implement an upscaling method to upscale the image and tiling issues"""
+        blur = GaussianBlur(kernel_size)
+        return blur(image)
+
+    def run_from_path(
+        self, path: str = None, h_splits: int = 2, v_splits: int = 2
+    ):
+        """Runs the model on the image loaded from the given path"""
+        image = self.load_image_from_path(path)
+        return self.get_vectors(image, h_splits, v_splits)
+
+    def get_captions(self, image, candidate_captions):
+        """Get the best caption for the given image"""
+        inputs_image = self.processor(
+            images=image,
+            return_tensors="pt",
+        )
+
+        inputs_text = self.processor(
+            text=candidate_captions,
+            images=inputs_image.pixel_values[
+                0
+            ],  # Fix the argument name
+            return_tensors="pt",
+            padding=True,
+            truncation=True,
+        )
+
+        image_embeds = self.model(
+            pixel_values=inputs_image.pixel_values[0]
+        ).image_embeds
+        text_embeds = self.model(
+            input_ids=inputs_text.input_ids,
+            attention_mask=inputs_text.attention_mask,
+        ).text_embeds
+
+        # Calculate similarity between image and text
+        similarities = (image_embeds @ text_embeds.T).squeeze(0)
+        best_caption_index = similarities.argmax().item()
+
+        return candidate_captions[best_caption_index]
+
+    def get_and_concat_captions(
+        self, image, candidate_captions, h_splits=2, v_splits=2
+    ):
+        """Get the best caption for the given image"""
+        slices = self.split_image(image, h_splits, v_splits)
+        captions = [
+            self.get_captions(slice, candidate_captions)
+            for slice in slices
+        ]
+        concated_captions = "".join(captions)
+        return concated_captions
--- a/swarms/models/openai_models.py
+++ b/swarms/models/openai_models.py
@ -1,5 +1,7 @@
 from __future__ import annotations

+import asyncio
+import functools
 import logging
 import sys
 from typing import (
@ -16,6 +18,7 @@ from typing import (
    Optional,
    Set,
    Tuple,
+    Type,
    Union,
 )

@ -23,7 +26,7 @@ from langchain.callbacks.manager import (
    AsyncCallbackManagerForLLMRun,
    CallbackManagerForLLMRun,
 )
-from langchain.llms.base import BaseLLM, create_base_retry_decorator
+from langchain.llms.base import BaseLLM
 from langchain.pydantic_v1 import Field, root_validator
 from langchain.schema import Generation, LLMResult
 from langchain.schema.output import GenerationChunk
@ -32,7 +35,17 @@ from langchain.utils import (
    get_pydantic_field_names,
 )
 from langchain.utils.utils import build_extra_kwargs
+from tenacity import (
+    RetryCallState,
+    before_sleep_log,
+    retry,
+    retry_base,
+    retry_if_exception_type,
+    stop_after_attempt,
+    wait_exponential,
+)

+logger = logging.getLogger(__name__)

 from importlib.metadata import version

@ -41,6 +54,62 @@ from packaging.version import parse
 logger = logging.getLogger(__name__)


+@functools.lru_cache
+def _log_error_once(msg: str) -> None:
+    """Log an error once."""
+    logger.error(msg)
+
+
+def create_base_retry_decorator(
+    error_types: List[Type[BaseException]],
+    max_retries: int = 1,
+    run_manager: Optional[
+        Union[AsyncCallbackManagerForLLMRun, CallbackManagerForLLMRun]
+    ] = None,
+) -> Callable[[Any], Any]:
+    """Create a retry decorator for a given LLM and provided list of error types."""
+
+    _logging = before_sleep_log(logger, logging.WARNING)
+
+    def _before_sleep(retry_state: RetryCallState) -> None:
+        _logging(retry_state)
+        if run_manager:
+            if isinstance(run_manager, AsyncCallbackManagerForLLMRun):
+                coro = run_manager.on_retry(retry_state)
+                try:
+                    loop = asyncio.get_event_loop()
+                    if loop.is_running():
+                        loop.create_task(coro)
+                    else:
+                        asyncio.run(coro)
+                except Exception as e:
+                    _log_error_once(f"Error in on_retry: {e}")
+            else:
+                run_manager.on_retry(retry_state)
+        return None
+
+    min_seconds = 4
+    max_seconds = 10
+    # Wait 2^x * 1 second between each retry starting with
+    # 4 seconds, then up to 10 seconds, then 10 seconds afterwards
+    retry_instance: "retry_base" = retry_if_exception_type(
+        error_types[0]
+    )
+    for error in error_types[1:]:
+        retry_instance = retry_instance | retry_if_exception_type(
+            error
+        )
+    return retry(
+        reraise=True,
+        stop=stop_after_attempt(max_retries),
+        wait=wait_exponential(
+            multiplier=1, min=min_seconds, max=max_seconds
+        ),
+        retry=retry_instance,
+        before_sleep=_before_sleep,
+    )
+
+
 def is_openai_v1() -> bool:
    _version = parse(version("openai"))
    return _version.major >= 1
@ -833,7 +902,7 @@ class OpenAIChat(BaseLLM):
    """

    client: Any  #: :meta private:
-    model_name: str = "gpt-3.5-turbo-1106"
+    model_name: str = "gpt-4-1106-preview"
    model_kwargs: Dict[str, Any] = Field(default_factory=dict)
    openai_api_key: Optional[str] = None
    openai_api_base: Optional[str] = None
--- a/swarms/structs/agent.py
+++ b/swarms/structs/agent.py
@ -9,7 +9,7 @@ from typing import Any, Callable, Dict, List, Optional, Tuple

 from termcolor import colored

-from swarms.memory.base_vectordb import VectorDatabase
+from swarms.memory.base_vectordb import AbstractDatabase
 from swarms.prompts.agent_system_prompts import (
    AGENT_SYSTEM_PROMPT_3,
 )
@ -83,7 +83,7 @@ class Agent:
        pdf_path (str): The path to the pdf
        list_of_pdf (str): The list of pdf
        tokenizer (Any): The tokenizer
-        memory (VectorDatabase): The memory
+        memory (AbstractDatabase): The memory
        preset_stopping_token (bool): Enable preset stopping token
        traceback (Any): The traceback
        traceback_handlers (Any): The traceback handlers
@ -168,7 +168,7 @@ class Agent:
        pdf_path: Optional[str] = None,
        list_of_pdf: Optional[str] = None,
        tokenizer: Optional[Any] = None,
-        long_term_memory: Optional[VectorDatabase] = None,
+        long_term_memory: Optional[AbstractDatabase] = None,
        preset_stopping_token: Optional[bool] = False,
        traceback: Any = None,
        traceback_handlers: Any = None,
@ -657,7 +657,7 @@ class Agent:
            """
            return agent_history_prompt

-    def long_term_memory_prompt(self, query: str, prompt: str):
+    def long_term_memory_prompt(self, query: str):
        """
        Generate the agent long term memory prompt

@ -670,10 +670,15 @@ class Agent:
        """
        ltr = self.long_term_memory.query(query)

-        return f"""{prompt}
-            ################ CONTEXT ####################
+        context = f"""
+            {query}
+            ####### Long Term Memory ################
            {ltr}
        """
+        return self.short_memory.append([f"{context}"])
+
+    def add_memory(self, message: str):
+        return self.short_memory.append([f"{message}"])

    async def run_concurrent(self, tasks: List[str], **kwargs):
        """
--- a/swarms/structs/conversation.py
+++ b/swarms/structs/conversation.py
@ -60,6 +60,7 @@ class Conversation(BaseStructure):

    def __init__(
        self,
+        system_prompt: str,
        time_enabled: bool = False,
        database: AbstractDatabase = None,
        autosave: bool = False,
@ -68,12 +69,17 @@ class Conversation(BaseStructure):
        **kwargs,
    ):
        super().__init__()
+        self.system_prompt = system_prompt
        self.time_enabled = time_enabled
        self.database = database
        self.autosave = autosave
        self.save_filepath = save_filepath
        self.conversation_history = []

+        # If system prompt is not None, add it to the conversation history
+        if self.system_prompt:
+            self.add("system", self.system_prompt)
+
    def add(self, role: str, content: str, *args, **kwargs):
        """Add a message to the conversation history

--- a/swarms/structs/multi_agent_rag.py
+++ b/swarms/structs/multi_agent_rag.py
@ -0,0 +1,85 @@
+from dataclasses import dataclass
+from typing import List, Optional
+
+from swarms.memory.base_vectordatabase import AbstractVectorDatabase
+from swarms.structs.agent import Agent
+
+
+@dataclass
+class MultiAgentRag:
+    """
+    Represents a multi-agent RAG (Relational Agent Graph) structure.
+
+    Attributes:
+        agents (List[Agent]): List of agents in the multi-agent RAG.
+        db (AbstractVectorDatabase): Database used for querying.
+        verbose (bool): Flag indicating whether to print verbose output.
+    """
+
+    agents: List[Agent]
+    db: AbstractVectorDatabase
+    verbose: bool = False
+
+    def query_database(self, query: str):
+        """
+        Queries the database using the given query string.
+
+        Args:
+            query (str): The query string.
+
+        Returns:
+            List: The list of results from the database.
+        """
+        results = []
+        for agent in self.agents:
+            agent_results = agent.long_term_memory_prompt(query)
+            results.extend(agent_results)
+        return results
+
+    def get_agent_by_id(self, agent_id) -> Optional[Agent]:
+        """
+        Retrieves an agent from the multi-agent RAG by its ID.
+
+        Args:
+            agent_id: The ID of the agent to retrieve.
+
+        Returns:
+            Agent or None: The agent with the specified ID, or None if not found.
+        """
+        for agent in self.agents:
+            if agent.agent_id == agent_id:
+                return agent
+        return None
+
+    def add_message(
+        self, sender: Agent, message: str, *args, **kwargs
+    ):
+        """
+        Adds a message to the database.
+
+        Args:
+            sender (Agent): The agent sending the message.
+            message (str): The message to add.
+            *args: Additional positional arguments.
+            **kwargs: Additional keyword arguments.
+
+        Returns:
+            int: The ID of the added message.
+        """
+        doc = f"{sender.ai_name}: {message}"
+
+        return self.db.add(doc)
+
+    def query(self, message: str, *args, **kwargs):
+        """
+        Queries the database using the given message.
+
+        Args:
+            message (str): The message to query.
+            *args: Additional positional arguments.
+            **kwargs: Additional keyword arguments.
+
+        Returns:
+            List: The list of results from the database.
+        """
+        return self.db.query(message)
--- a/swarms/structs/task.py
+++ b/swarms/structs/task.py
@ -233,6 +233,7 @@ class Task:
                    if task.description is not None
                    else ""
                )
+
                result = (
                    task.result if task.result is not None else ""
                )
--- a/swarms/telemetry/sys_info.py
+++ b/swarms/telemetry/sys_info.py
@ -89,7 +89,6 @@ def get_package_mismatches(file_path="pyproject.toml"):
    return "\n" + "\n".join(mismatches)


-
 def system_info():
    swarms_verison = get_swarms_verison()
    return {
@ -100,4 +99,3 @@ def system_info():
        "CPU Info": get_cpu_info(),
        "RAM Info": get_ram_info(),
    }
-
--- a/swarms/telemetry/user_utils.py
+++ b/swarms/telemetry/user_utils.py
@ -5,6 +5,7 @@ import socket
 from swarms.telemetry.sys_info import system_info
 from swarms.telemetry.check_update import check_for_package

+
 # Helper functions
 def generate_user_id():
    """Generate user id
@ -75,7 +76,6 @@ def get_local_ip():
    return socket.gethostbyname(socket.gethostname())


-
 def get_user_device_data():
    data = {
        "ID": generate_user_id(),
@ -85,5 +85,6 @@ def get_user_device_data():
        "Swarms [Version]": check_for_package("swarms"),
    }
    return data
-    
-# 
+
+
+#
--- a/swarms/utils/init.py
+++ b/swarms/utils/init.py
@ -25,6 +25,14 @@ from swarms.utils.download_weights_from_url import (
 from swarms.utils.save_logs import parse_log_file


+########
+from swarms.utils.yaml_output_parser import YamlOutputParser
+from swarms.utils.json_output_parser import JsonOutputParser
+from swarms.utils.remove_json_whitespace import (
+    remove_whitespace_from_json,
+    remove_whitespace_from_yaml,
+)
+
 __all__ = [
    "SubprocessCodeInterpreter",
    "display_markdown_message",
@ -45,4 +53,8 @@ __all__ = [
    "try_except_wrapper",
    "download_weights_from_url",
    "parse_log_file",
+    "YamlOutputParser",
+    "JsonOutputParser",
+    "remove_whitespace_from_json",
+    "remove_whitespace_from_yaml",
 ]
--- a/swarms/utils/json_output_parser.py
+++ b/swarms/utils/json_output_parser.py
@ -0,0 +1,96 @@
+import json
+import re
+from typing import Type, TypeVar
+from pydantic import BaseModel, ValidationError
+
+T = TypeVar("T", bound=BaseModel)
+
+
+class JsonParsingException(Exception):
+    """Custom exception for errors in JSON parsing."""
+
+
+class JsonOutputParser:
+    """Parse JSON output using a Pydantic model.
+
+    This parser is designed to extract JSON formatted data from a given string
+    and parse it using a specified Pydantic model for validation.
+
+    Attributes:
+        pydantic_object: A Pydantic model class for parsing and validation.
+        pattern: A regex pattern to match JSON code blocks.
+
+    Examples:
+    >>> from pydantic import BaseModel
+    >>> from swarms.utils.json_output_parser import JsonOutputParser
+    >>> class MyModel(BaseModel):
+    ...     name: str
+    ...     age: int
+    ...
+    >>> parser = JsonOutputParser(MyModel)
+    >>> text = "```json\n{\"name\": \"John\", \"age\": 42}\n```"
+    >>> model = parser.parse(text)
+    >>> model.name
+
+    """
+
+    def __init__(self, pydantic_object: Type[T]):
+        self.pydantic_object = pydantic_object
+        self.pattern = re.compile(
+            r"^```(?:json)?(?P<json>[^`]*)", re.MULTILINE | re.DOTALL
+        )
+
+    def parse(self, text: str) -> T:
+        """Parse the provided text to extract and validate JSON data.
+
+        Args:
+            text: A string containing potential JSON data.
+
+        Returns:
+            An instance of the specified Pydantic model with parsed data.
+
+        Raises:
+            JsonParsingException: If parsing or validation fails.
+        """
+        try:
+            match = re.search(self.pattern, text.strip())
+            json_str = match.group("json") if match else text
+
+            json_object = json.loads(json_str)
+            return self.pydantic_object.parse_obj(json_object)
+
+        except (json.JSONDecodeError, ValidationError) as e:
+            name = self.pydantic_object.__name__
+            msg = (
+                f"Failed to parse {name} from text '{text}'."
+                f" Error: {e}"
+            )
+            raise JsonParsingException(msg) from e
+
+    def get_format_instructions(self) -> str:
+        """Generate formatting instructions based on the Pydantic model schema.
+
+        Returns:
+            A string containing formatting instructions.
+        """
+        schema = self.pydantic_object.schema()
+        reduced_schema = {
+            k: v
+            for k, v in schema.items()
+            if k not in ["title", "type"]
+        }
+        schema_str = json.dumps(reduced_schema, indent=4)
+
+        format_instructions = (
+            f"JSON Formatting Instructions:\n{schema_str}"
+        )
+        return format_instructions
+
+
+# # Example usage
+# class ExampleModel(BaseModel):
+#     field1: int
+#     field2: str
+
+# parser = JsonOutputParser(ExampleModel)
+# # Use parser.parse(text) to parse JSON data
--- a/swarms/utils/remove_json_whitespace.py
+++ b/swarms/utils/remove_json_whitespace.py
@ -0,0 +1,50 @@
+import json
+import yaml
+
+
+def remove_whitespace_from_json(json_string: str) -> str:
+    """
+    Removes unnecessary whitespace from a JSON string.
+
+    This function parses the JSON string into a Python object and then
+    serializes it back into a JSON string without unnecessary whitespace.
+
+    Args:
+        json_string (str): The JSON string.
+
+    Returns:
+        str: The JSON string with whitespace removed.
+    """
+    parsed = json.loads(json_string)
+    return json.dumps(parsed, separators=(",", ":"))
+
+
+# # Example usage for JSON
+# json_string = '{"field1": 123, "field2": "example text"}'
+# print(remove_whitespace_from_json(json_string))
+
+
+def remove_whitespace_from_yaml(yaml_string: str) -> str:
+    """
+    Removes unnecessary whitespace from a YAML string.
+
+    This function parses the YAML string into a Python object and then
+    serializes it back into a YAML string with minimized whitespace.
+    Note: This might change the representation style of YAML data.
+
+    Args:
+        yaml_string (str): The YAML string.
+
+    Returns:
+        str: The YAML string with whitespace reduced.
+    """
+    parsed = yaml.safe_load(yaml_string)
+    return yaml.dump(parsed, default_flow_style=True)
+
+
+# # Example usage for YAML
+# yaml_string = """
+# field1: 123
+# field2: example text
+# """
+# print(remove_whitespace_from_yaml(yaml_string))
--- a/swarms/utils/yaml_output_parser.py
+++ b/swarms/utils/yaml_output_parser.py
@ -0,0 +1,89 @@
+import json
+import re
+import yaml
+from typing import Type, TypeVar
+from pydantic import BaseModel, ValidationError
+
+T = TypeVar("T", bound=BaseModel)
+
+
+class YamlParsingException(Exception):
+    """Custom exception for errors in YAML parsing."""
+
+
+class YamlOutputParser:
+    """Parse YAML output using a Pydantic model.
+
+    This parser is designed to extract YAML formatted data from a given string
+    and parse it using a specified Pydantic model for validation.
+
+    Attributes:
+        pydantic_object: A Pydantic model class for parsing and validation.
+        pattern: A regex pattern to match YAML code blocks.
+
+
+    Examples:
+    >>> from pydantic import BaseModel
+    >>> from swarms.utils.yaml_output_parser import YamlOutputParser
+    >>> class MyModel(BaseModel):
+    ...     name: str
+    ...     age: int
+    ...
+    >>> parser = YamlOutputParser(MyModel)
+    >>> text = "```yaml\nname: John\nage: 42\n```"
+    >>> model = parser.parse(text)
+    >>> model.name
+
+    """
+
+    def __init__(self, pydantic_object: Type[T]):
+        self.pydantic_object = pydantic_object
+        self.pattern = re.compile(
+            r"^```(?:ya?ml)?(?P<yaml>[^`]*)", re.MULTILINE | re.DOTALL
+        )
+
+    def parse(self, text: str) -> T:
+        """Parse the provided text to extract and validate YAML data.
+
+        Args:
+            text: A string containing potential YAML data.
+
+        Returns:
+            An instance of the specified Pydantic model with parsed data.
+
+        Raises:
+            YamlParsingException: If parsing or validation fails.
+        """
+        try:
+            match = re.search(self.pattern, text.strip())
+            yaml_str = match.group("yaml") if match else text
+
+            json_object = yaml.safe_load(yaml_str)
+            return self.pydantic_object.parse_obj(json_object)
+
+        except (yaml.YAMLError, ValidationError) as e:
+            name = self.pydantic_object.__name__
+            msg = (
+                f"Failed to parse {name} from text '{text}'."
+                f" Error: {e}"
+            )
+            raise YamlParsingException(msg) from e
+
+    def get_format_instructions(self) -> str:
+        """Generate formatting instructions based on the Pydantic model schema.
+
+        Returns:
+            A string containing formatting instructions.
+        """
+        schema = self.pydantic_object.schema()
+        reduced_schema = {
+            k: v
+            for k, v in schema.items()
+            if k not in ["title", "type"]
+        }
+        schema_str = json.dumps(reduced_schema, indent=4)
+
+        format_instructions = (
+            f"YAML Formatting Instructions:\n{schema_str}"
+        )
+        return format_instructions