parent
e9bb8dcbf4
commit
aa4f3d1563
@ -1,132 +1,265 @@
|
|||||||
# Conversation Module Documentation
|
# Module/Class Name: Conversation
|
||||||
|
|
||||||
|
## Introduction
|
||||||
|
|
||||||
|
The `Conversation` class is a powerful tool for managing and structuring conversation data in a Python program. It enables you to create, manipulate, and analyze conversations easily. This documentation will provide you with a comprehensive understanding of the `Conversation` class, its attributes, methods, and how to effectively use it.
|
||||||
|
|
||||||
## Table of Contents
|
## Table of Contents
|
||||||
|
|
||||||
1. [Introduction](#introduction)
|
1. **Class Definition**
|
||||||
2. [Installation](#installation)
|
- Overview
|
||||||
3. [Class: Conversation](#class-conversation)
|
- Attributes
|
||||||
- [Attributes](#attributes)
|
|
||||||
- [Methods](#methods)
|
2. **Methods**
|
||||||
4. [Usage Examples](#usage-examples)
|
- `__init__(self, time_enabled: bool = False, *args, **kwargs)`
|
||||||
- [Example 1: Creating a Conversation](#example-1-creating-a-conversation)
|
- `add(self, role: str, content: str, *args, **kwargs)`
|
||||||
- [Example 2: Adding Messages](#example-2-adding-messages)
|
- `delete(self, index: str)`
|
||||||
- [Example 3: Displaying and Exporting Conversation](#example-3-displaying-and-exporting-conversation)
|
- `update(self, index: str, role, content)`
|
||||||
- [Example 4: Counting Messages by Role](#example-4-counting-messages-by-role)
|
- `query(self, index: str)`
|
||||||
- [Example 5: Loading and Searching](#example-5-loading-and-searching)
|
- `search(self, keyword: str)`
|
||||||
5. [Additional Information](#additional-information)
|
- `display_conversation(self, detailed: bool = False)`
|
||||||
6. [References](#references)
|
- `export_conversation(self, filename: str)`
|
||||||
|
- `import_conversation(self, filename: str)`
|
||||||
|
- `count_messages_by_role(self)`
|
||||||
|
- `return_history_as_string(self)`
|
||||||
|
- `save_as_json(self, filename: str)`
|
||||||
|
- `load_from_json(self, filename: str)`
|
||||||
|
- `search_keyword_in_conversation(self, keyword: str)`
|
||||||
|
- `pretty_print_conversation(self, messages)`
|
||||||
|
|
||||||
---
|
---
|
||||||
|
|
||||||
## 1. Introduction <a name="introduction"></a>
|
### 1. Class Definition
|
||||||
|
|
||||||
|
#### Overview
|
||||||
|
|
||||||
|
The `Conversation` class is designed to manage conversations by keeping track of messages and their attributes. It offers methods for adding, deleting, updating, querying, and displaying messages within the conversation. Additionally, it supports exporting and importing conversations, searching for specific keywords, and more.
|
||||||
|
|
||||||
|
#### Attributes
|
||||||
|
|
||||||
|
- `time_enabled (bool)`: A flag indicating whether to enable timestamp recording for messages.
|
||||||
|
- `conversation_history (list)`: A list that stores messages in the conversation.
|
||||||
|
|
||||||
|
### 2. Methods
|
||||||
|
|
||||||
|
#### `__init__(self, time_enabled: bool = False, *args, **kwargs)`
|
||||||
|
|
||||||
|
- **Description**: Initializes a new Conversation object.
|
||||||
|
- **Parameters**:
|
||||||
|
- `time_enabled (bool)`: If `True`, timestamps will be recorded for each message. Default is `False`.
|
||||||
|
|
||||||
|
#### `add(self, role: str, content: str, *args, **kwargs)`
|
||||||
|
|
||||||
|
- **Description**: Adds a message to the conversation history.
|
||||||
|
- **Parameters**:
|
||||||
|
- `role (str)`: The role of the speaker (e.g., "user," "assistant").
|
||||||
|
- `content (str)`: The content of the message.
|
||||||
|
|
||||||
|
#### `delete(self, index: str)`
|
||||||
|
|
||||||
|
- **Description**: Deletes a message from the conversation history.
|
||||||
|
- **Parameters**:
|
||||||
|
- `index (str)`: The index of the message to delete.
|
||||||
|
|
||||||
|
#### `update(self, index: str, role, content)`
|
||||||
|
|
||||||
|
- **Description**: Updates a message in the conversation history.
|
||||||
|
- **Parameters**:
|
||||||
|
- `index (str)`: The index of the message to update.
|
||||||
|
- `role (_type_)`: The new role of the speaker.
|
||||||
|
- `content (_type_)`: The new content of the message.
|
||||||
|
|
||||||
|
#### `query(self, index: str)`
|
||||||
|
|
||||||
|
- **Description**: Retrieves a message from the conversation history.
|
||||||
|
- **Parameters**:
|
||||||
|
- `index (str)`: The index of the message to query.
|
||||||
|
- **Returns**: The message as a string.
|
||||||
|
|
||||||
|
#### `search(self, keyword: str)`
|
||||||
|
|
||||||
|
- **Description**: Searches for messages containing a specific keyword in the conversation history.
|
||||||
|
- **Parameters**:
|
||||||
|
- `keyword (str)`: The keyword to search for.
|
||||||
|
- **Returns**: A list of messages that contain the keyword.
|
||||||
|
|
||||||
|
#### `display_conversation(self, detailed: bool = False)`
|
||||||
|
|
||||||
|
- **Description**: Displays the conversation history.
|
||||||
|
- **Parameters**:
|
||||||
|
- `detailed (bool, optional)`: If `True`, provides detailed information about each message. Default is `False`.
|
||||||
|
|
||||||
|
#### `export_conversation(self, filename: str)`
|
||||||
|
|
||||||
|
- **Description**: Exports the conversation history to a text file.
|
||||||
|
- **Parameters**:
|
||||||
|
- `filename (str)`: The name of the file to export to.
|
||||||
|
|
||||||
|
#### `import_conversation(self, filename: str)`
|
||||||
|
|
||||||
|
- **Description**: Imports a conversation history from a text file.
|
||||||
|
- **Parameters**:
|
||||||
|
- `filename (str)`: The name of the file to import from.
|
||||||
|
|
||||||
|
#### `count_messages_by_role(self)`
|
||||||
|
|
||||||
|
- **Description**: Counts the number of messages by role in the conversation.
|
||||||
|
- **Returns**: A dictionary containing the count of messages for each role.
|
||||||
|
|
||||||
|
#### `return_history_as_string(self)`
|
||||||
|
|
||||||
|
- **Description**: Returns the entire conversation history as a single string.
|
||||||
|
- **Returns**: The conversation history as a string.
|
||||||
|
|
||||||
|
#### `save_as_json(self, filename: str)`
|
||||||
|
|
||||||
|
- **Description**: Saves the conversation history as a JSON file.
|
||||||
|
- **Parameters**:
|
||||||
|
- `filename (str)`: The name of the JSON file to save.
|
||||||
|
|
||||||
The Conversation module provides a versatile and extensible structure for managing and analyzing text-based conversations. Whether you're developing a chatbot, analyzing customer support interactions, or conducting research on dialogues, this module simplifies the process of handling conversation data.
|
#### `load_from_json(self, filename: str)`
|
||||||
|
|
||||||
With the Conversation module, you can add, delete, update, query, and search for messages within a conversation. You can also display, export, and import conversation history, making it an essential tool for various applications.
|
- **Description**: Loads a conversation history from a JSON file.
|
||||||
|
- **Parameters**:
|
||||||
|
- `filename (str)`: The name of the JSON file to load.
|
||||||
|
|
||||||
## 2. Installation <a name="installation"></a>
|
#### `search_keyword_in_conversation(self, keyword: str)`
|
||||||
|
|
||||||
To use the Conversation module, you need to have Python installed on your system. Additionally, you can install the required dependencies using pip:
|
- **Description**: Searches for a keyword in the conversation history and returns matching messages.
|
||||||
|
- **Parameters**:
|
||||||
|
- `keyword (str)`: The keyword to search for.
|
||||||
|
- **Returns**: A list of messages containing the keyword.
|
||||||
|
|
||||||
```bash
|
#### `pretty_print_conversation(self, messages)`
|
||||||
pip install termcolor
|
|
||||||
|
- **Description**: Pretty prints a list of messages with colored role indicators.
|
||||||
|
- **Parameters**:
|
||||||
|
- `messages (list)`: A list of messages to print.
|
||||||
|
|
||||||
|
## Examples
|
||||||
|
|
||||||
|
Here are some usage examples of the `Conversation` class:
|
||||||
|
|
||||||
|
### Creating a Conversation
|
||||||
|
|
||||||
|
```python
|
||||||
|
from swarms.structs import Conversation
|
||||||
|
|
||||||
|
conv = Conversation()
|
||||||
```
|
```
|
||||||
|
|
||||||
Once you have the dependencies installed, you can import the Conversation module into your Python code.
|
### Adding Messages
|
||||||
|
|
||||||
```python
|
```python
|
||||||
from swarms.structs.conversation import Conversation
|
conv.add("user", "Hello, world!")
|
||||||
|
conv.add("assistant", "Hello, user!")
|
||||||
```
|
```
|
||||||
|
|
||||||
## 3. Class: Conversation <a name="class-conversation"></a>
|
### Displaying the Conversation
|
||||||
|
|
||||||
The Conversation class is the core of this module. It allows you to create and manipulate conversation histories. Below are the attributes and methods provided by this class.
|
```python
|
||||||
|
conv.display_conversation()
|
||||||
|
```
|
||||||
|
|
||||||
### Attributes <a name="attributes"></a>
|
### Searching for Messages
|
||||||
|
|
||||||
- `time_enabled` (bool): Indicates whether timestamps are enabled for messages in the conversation.
|
```python
|
||||||
- `conversation_history` (list): A list that stores the conversation history as a collection of messages.
|
result = conv.search("Hello")
|
||||||
|
```
|
||||||
|
|
||||||
### Methods <a name="methods"></a>
|
### Exporting and Importing Conversations
|
||||||
|
|
||||||
The Conversation class provides the following methods:
|
```python
|
||||||
|
conv.export_conversation("conversation.txt")
|
||||||
|
conv.import_conversation("conversation.txt")
|
||||||
|
```
|
||||||
|
|
||||||
- `add(role: str, content: str, *args, **kwargs)`: Adds a message to the conversation history.
|
### Counting Messages by Role
|
||||||
- `delete(index: str)`: Deletes a message from the conversation history.
|
|
||||||
- `update(index: str, role, content)`: Updates a message in the conversation history.
|
|
||||||
- `query(index: str)`: Queries a message in the conversation history.
|
|
||||||
- `search(keyword: str)`: Searches for messages containing a specific keyword.
|
|
||||||
- `display_conversation(detailed: bool = False)`: Displays the conversation history.
|
|
||||||
- `export_conversation(filename: str)`: Exports the conversation history to a file.
|
|
||||||
- `import_conversation(filename: str)`: Imports a conversation history from a file.
|
|
||||||
- `count_messages_by_role()`: Counts the number of messages by role.
|
|
||||||
- `return_history_as_string()`: Returns the conversation history as a string.
|
|
||||||
- `save_as_json(filename: str)`: Saves the conversation history as a JSON file.
|
|
||||||
- `load_from_json(filename: str)`: Loads the conversation history from a JSON file.
|
|
||||||
- `search_keyword_in_conversation(keyword: str)`: Searches for a keyword in the conversation history.
|
|
||||||
- `pretty_print_conversation(messages)`: Pretty prints the conversation history.
|
|
||||||
|
|
||||||
## 4. Usage Examples <a name="usage-examples"></a>
|
```python
|
||||||
|
counts = conv.count_messages_by_role()
|
||||||
|
```
|
||||||
|
|
||||||
In this section, we'll provide practical examples of how to use the Conversation module to manage and analyze conversation data.
|
### Loading and Saving as JSON
|
||||||
|
|
||||||
### Example 1: Creating a Conversation <a name="example-1-creating-a-conversation"></a>
|
```python
|
||||||
|
conv.save_as_json("conversation.json")
|
||||||
|
conv.load_from_json("conversation.json")
|
||||||
|
```
|
||||||
|
|
||||||
|
Certainly! Let's continue with more examples and additional information about the `Conversation` class.
|
||||||
|
|
||||||
Let's start by creating a Conversation object and enabling timestamps for messages:
|
### Querying a Specific Message
|
||||||
|
|
||||||
|
You can retrieve a specific message from the conversation by its index:
|
||||||
|
|
||||||
```python
|
```python
|
||||||
conversation = Conversation(time_enabled=True)
|
message = conv.query(0) # Retrieves the first message
|
||||||
```
|
```
|
||||||
|
|
||||||
### Example 2: Adding Messages <a name="example-2-adding-messages"></a>
|
### Updating a Message
|
||||||
|
|
||||||
You can add messages to the conversation using the `add` method. Here's how to add a user message and an assistant response:
|
You can update a message's content or role within the conversation:
|
||||||
|
|
||||||
```python
|
```python
|
||||||
conversation.add("user", "Hello, how can I help you?")
|
conv.update(0, "user", "Hi there!") # Updates the first message
|
||||||
conversation.add("assistant", "Hi there! I'm here to assist you.")
|
|
||||||
```
|
```
|
||||||
|
|
||||||
### Example 3: Displaying and Exporting Conversation <a name="example-3-displaying-and-exporting-conversation"></a>
|
### Deleting a Message
|
||||||
|
|
||||||
You can display the conversation history and export it to a file. Let's see how to do this:
|
If you want to remove a message from the conversation, you can use the `delete` method:
|
||||||
|
|
||||||
```python
|
```python
|
||||||
# Display the conversation
|
conv.delete(0) # Deletes the first message
|
||||||
conversation.display_conversation()
|
```
|
||||||
|
|
||||||
# Export the conversation to a file
|
### Counting Messages by Role
|
||||||
conversation.export_conversation("conversation_history.txt")
|
|
||||||
|
You can count the number of messages by role in the conversation:
|
||||||
|
|
||||||
|
```python
|
||||||
|
counts = conv.count_messages_by_role()
|
||||||
|
# Example result: {'user': 2, 'assistant': 2}
|
||||||
```
|
```
|
||||||
|
|
||||||
### Example 4: Counting Messages by Role <a name="example-4-counting-messages-by-role"></a>
|
### Exporting and Importing as Text
|
||||||
|
|
||||||
You can count the number of messages by role (e.g., user, assistant, system) using the `count_messages_by_role` method:
|
You can export the conversation to a text file and later import it:
|
||||||
|
|
||||||
```python
|
```python
|
||||||
message_counts = conversation.count_messages_by_role()
|
conv.export_conversation("conversation.txt") # Export
|
||||||
print(message_counts)
|
conv.import_conversation("conversation.txt") # Import
|
||||||
```
|
```
|
||||||
|
|
||||||
### Example 5: Loading and Searching <a name="example-5-loading-and-searching"></a>
|
### Exporting and Importing as JSON
|
||||||
|
|
||||||
You can load a conversation from a file and search for messages containing a specific keyword:
|
Conversations can also be saved and loaded as JSON files:
|
||||||
|
|
||||||
```python
|
```python
|
||||||
# Load conversation from a file
|
conv.save_as_json("conversation.json") # Save as JSON
|
||||||
conversation.load_from_json("saved_conversation.json")
|
conv.load_from_json("conversation.json") # Load from JSON
|
||||||
|
```
|
||||||
|
|
||||||
# Search for messages containing the keyword "help"
|
### Searching for a Keyword
|
||||||
results = conversation.search("help")
|
|
||||||
print(results)
|
You can search for messages containing a specific keyword within the conversation:
|
||||||
|
|
||||||
|
```python
|
||||||
|
results = conv.search_keyword_in_conversation("Hello")
|
||||||
```
|
```
|
||||||
|
|
||||||
## 5. Additional Information <a name="additional-information"></a>
|
### Pretty Printing
|
||||||
|
|
||||||
|
The `pretty_print_conversation` method provides a visually appealing way to display messages with colored role indicators:
|
||||||
|
|
||||||
|
```python
|
||||||
|
conv.pretty_print_conversation(conv.conversation_history)
|
||||||
|
```
|
||||||
|
|
||||||
- The Conversation module is designed to provide flexibility and ease of use for managing and analyzing text-based conversations.
|
These examples demonstrate the versatility of the `Conversation` class in managing and interacting with conversation data. Whether you're building a chatbot, conducting analysis, or simply organizing dialogues, this class offers a robust set of tools to help you accomplish your goals.
|
||||||
- You can extend the module by adding custom functionality or integrating it into your chatbot or natural language processing applications.
|
|
||||||
|
|
||||||
## 6. References <a name="references"></a>
|
## Conclusion
|
||||||
|
|
||||||
For more information on the Conversation module and its usage, refer to the official documentation and examples.
|
The `Conversation` class is a valuable utility for handling conversation data in Python. With its ability to add, update, delete, search, export, and import messages, you have the flexibility to work with conversations in various ways. Feel free to explore its features and adapt them to your specific projects and applications.
|
||||||
|
|
||||||
|
If you have any further questions or need additional assistance, please don't hesitate to ask!
|
@ -0,0 +1,159 @@
|
|||||||
|
from abc import ABC, abstractmethod
|
||||||
|
|
||||||
|
|
||||||
|
class AbstractDatabase(ABC):
|
||||||
|
"""
|
||||||
|
Abstract base class for a database.
|
||||||
|
|
||||||
|
This class defines the interface for interacting with a database.
|
||||||
|
Subclasses must implement the abstract methods to provide the
|
||||||
|
specific implementation details for connecting to a database,
|
||||||
|
executing queries, and performing CRUD operations.
|
||||||
|
|
||||||
|
"""
|
||||||
|
|
||||||
|
@abstractmethod
|
||||||
|
def connect(self):
|
||||||
|
"""
|
||||||
|
Connect to the database.
|
||||||
|
|
||||||
|
This method establishes a connection to the database.
|
||||||
|
|
||||||
|
"""
|
||||||
|
|
||||||
|
pass
|
||||||
|
|
||||||
|
@abstractmethod
|
||||||
|
def close(self):
|
||||||
|
"""
|
||||||
|
Close the database connection.
|
||||||
|
|
||||||
|
This method closes the connection to the database.
|
||||||
|
|
||||||
|
"""
|
||||||
|
|
||||||
|
pass
|
||||||
|
|
||||||
|
@abstractmethod
|
||||||
|
def execute_query(self, query):
|
||||||
|
"""
|
||||||
|
Execute a database query.
|
||||||
|
|
||||||
|
This method executes the given query on the database.
|
||||||
|
|
||||||
|
Parameters:
|
||||||
|
query (str): The query to be executed.
|
||||||
|
|
||||||
|
"""
|
||||||
|
|
||||||
|
pass
|
||||||
|
|
||||||
|
@abstractmethod
|
||||||
|
def fetch_all(self):
|
||||||
|
"""
|
||||||
|
Fetch all rows from the result set.
|
||||||
|
|
||||||
|
This method retrieves all rows from the result set of a query.
|
||||||
|
|
||||||
|
Returns:
|
||||||
|
list: A list of dictionaries representing the rows.
|
||||||
|
|
||||||
|
"""
|
||||||
|
|
||||||
|
pass
|
||||||
|
|
||||||
|
@abstractmethod
|
||||||
|
def fetch_one(self):
|
||||||
|
"""
|
||||||
|
Fetch one row from the result set.
|
||||||
|
|
||||||
|
This method retrieves one row from the result set of a query.
|
||||||
|
|
||||||
|
Returns:
|
||||||
|
dict: A dictionary representing the row.
|
||||||
|
|
||||||
|
"""
|
||||||
|
|
||||||
|
pass
|
||||||
|
|
||||||
|
@abstractmethod
|
||||||
|
def add(self, table, data):
|
||||||
|
"""
|
||||||
|
Add a new record to the database.
|
||||||
|
|
||||||
|
This method adds a new record to the specified table in the database.
|
||||||
|
|
||||||
|
Parameters:
|
||||||
|
table (str): The name of the table.
|
||||||
|
data (dict): A dictionary representing the data to be added.
|
||||||
|
|
||||||
|
"""
|
||||||
|
|
||||||
|
pass
|
||||||
|
|
||||||
|
@abstractmethod
|
||||||
|
def query(self, table, condition):
|
||||||
|
"""
|
||||||
|
Query the database.
|
||||||
|
|
||||||
|
This method queries the specified table in the database based on the given condition.
|
||||||
|
|
||||||
|
Parameters:
|
||||||
|
table (str): The name of the table.
|
||||||
|
condition (str): The condition to be applied in the query.
|
||||||
|
|
||||||
|
Returns:
|
||||||
|
list: A list of dictionaries representing the query results.
|
||||||
|
|
||||||
|
"""
|
||||||
|
|
||||||
|
pass
|
||||||
|
|
||||||
|
@abstractmethod
|
||||||
|
def get(self, table, id):
|
||||||
|
"""
|
||||||
|
Get a record from the database.
|
||||||
|
|
||||||
|
This method retrieves a record from the specified table in the database based on the given ID.
|
||||||
|
|
||||||
|
Parameters:
|
||||||
|
table (str): The name of the table.
|
||||||
|
id (int): The ID of the record to be retrieved.
|
||||||
|
|
||||||
|
Returns:
|
||||||
|
dict: A dictionary representing the retrieved record.
|
||||||
|
|
||||||
|
"""
|
||||||
|
|
||||||
|
pass
|
||||||
|
|
||||||
|
@abstractmethod
|
||||||
|
def update(self, table, id, data):
|
||||||
|
"""
|
||||||
|
Update a record in the database.
|
||||||
|
|
||||||
|
This method updates a record in the specified table in the database based on the given ID.
|
||||||
|
|
||||||
|
Parameters:
|
||||||
|
table (str): The name of the table.
|
||||||
|
id (int): The ID of the record to be updated.
|
||||||
|
data (dict): A dictionary representing the updated data.
|
||||||
|
|
||||||
|
"""
|
||||||
|
|
||||||
|
pass
|
||||||
|
|
||||||
|
@abstractmethod
|
||||||
|
def delete(self, table, id):
|
||||||
|
"""
|
||||||
|
Delete a record from the database.
|
||||||
|
|
||||||
|
This method deletes a record from the specified table in the database based on the given ID.
|
||||||
|
|
||||||
|
Parameters:
|
||||||
|
table (str): The name of the table.
|
||||||
|
id (int): The ID of the record to be deleted.
|
||||||
|
|
||||||
|
"""
|
||||||
|
|
||||||
|
pass
|
@ -1,302 +1,140 @@
|
|||||||
import subprocess
|
|
||||||
import uuid
|
import uuid
|
||||||
from typing import Optional
|
from typing import Any, List, Optional
|
||||||
from attr import define, field, Factory
|
from sqlalchemy import JSON, Column, String, create_engine
|
||||||
from dataclasses import dataclass
|
from sqlalchemy.dialects.postgresql import UUID
|
||||||
from swarms.memory.base import BaseVectorStore
|
from sqlalchemy.ext.declarative import declarative_base
|
||||||
|
from sqlalchemy.orm import Session
|
||||||
|
|
||||||
try:
|
|
||||||
from sqlalchemy.engine import Engine
|
|
||||||
from sqlalchemy import create_engine, Column, String, JSON
|
|
||||||
from sqlalchemy.ext.declarative import declarative_base
|
|
||||||
from sqlalchemy.dialects.postgresql import UUID
|
|
||||||
from sqlalchemy.orm import Session
|
|
||||||
except ImportError:
|
|
||||||
print(
|
|
||||||
"The PgVectorVectorStore requires sqlalchemy to be installed"
|
|
||||||
)
|
|
||||||
print("pip install sqlalchemy")
|
|
||||||
subprocess.run(["pip", "install", "sqlalchemy"])
|
|
||||||
|
|
||||||
try:
|
|
||||||
from pgvector.sqlalchemy import Vector
|
|
||||||
except ImportError:
|
|
||||||
print("The PgVectorVectorStore requires pgvector to be installed")
|
|
||||||
print("pip install pgvector")
|
|
||||||
subprocess.run(["pip", "install", "pgvector"])
|
|
||||||
|
|
||||||
|
class PostgresDB:
|
||||||
|
"""
|
||||||
|
A class representing a Postgres database.
|
||||||
|
|
||||||
@define
|
Args:
|
||||||
class PgVectorVectorStore(BaseVectorStore):
|
connection_string (str): The connection string for the Postgres database.
|
||||||
"""A vector store driver to Postgres using the PGVector extension.
|
table_name (str): The name of the table in the database.
|
||||||
|
|
||||||
Attributes:
|
Attributes:
|
||||||
connection_string: An optional string describing the target Postgres database instance.
|
engine: The SQLAlchemy engine for connecting to the database.
|
||||||
create_engine_params: Additional configuration params passed when creating the database connection.
|
table_name (str): The name of the table in the database.
|
||||||
engine: An optional sqlalchemy Postgres engine to use.
|
VectorModel: The SQLAlchemy model representing the vector table.
|
||||||
table_name: Optionally specify the name of the table to used to store vectors.
|
|
||||||
|
|
||||||
Methods:
|
|
||||||
upsert_vector(vector: list[float], vector_id: Optional[str] = None, namespace: Optional[str] = None, meta: Optional[dict] = None, **kwargs) -> str:
|
|
||||||
Upserts a vector into the index.
|
|
||||||
load_entry(vector_id: str, namespace: Optional[str] = None) -> Optional[BaseVector.Entry]:
|
|
||||||
Loads a single vector from the index.
|
|
||||||
load_entries(namespace: Optional[str] = None) -> list[BaseVector.Entry]:
|
|
||||||
Loads all vectors from the index.
|
|
||||||
query(query: str, count: Optional[int] = None, namespace: Optional[str] = None, include_vectors: bool = False, include_metadata=True, **kwargs) -> list[BaseVector.QueryResult]:
|
|
||||||
Queries the index for vectors similar to the given query string.
|
|
||||||
setup(create_schema: bool = True, install_uuid_extension: bool = True, install_vector_extension: bool = True) -> None:
|
|
||||||
Provides a mechanism to initialize the database schema and extensions.
|
|
||||||
|
|
||||||
Usage:
|
|
||||||
>>> from swarms.memory.vector_stores.pgvector import PgVectorVectorStore
|
|
||||||
>>> from swarms.utils.embeddings import USEEmbedding
|
|
||||||
>>> from swarms.utils.hash import str_to_hash
|
|
||||||
>>> from swarms.utils.dataframe import dataframe_to_hash
|
|
||||||
>>> import pandas as pd
|
|
||||||
>>>
|
|
||||||
>>> # Create a new PgVectorVectorStore instance:
|
|
||||||
>>> pv = PgVectorVectorStore(
|
|
||||||
>>> connection_string="postgresql://postgres:password@localhost:5432/postgres",
|
|
||||||
>>> table_name="your-table-name"
|
|
||||||
>>> )
|
|
||||||
>>> # Create a new index:
|
|
||||||
>>> pv.setup()
|
|
||||||
>>> # Create a new USEEmbedding instance:
|
|
||||||
>>> use = USEEmbedding()
|
|
||||||
>>> # Create a new dataframe:
|
|
||||||
>>> df = pd.DataFrame({
|
|
||||||
>>> "text": [
|
|
||||||
>>> "This is a test",
|
|
||||||
>>> "This is another test",
|
|
||||||
>>> "This is a third test"
|
|
||||||
>>> ]
|
|
||||||
>>> })
|
|
||||||
>>> # Embed the dataframe:
|
|
||||||
>>> df["embedding"] = df["text"].apply(use.embed_string)
|
|
||||||
>>> # Upsert the dataframe into the index:
|
|
||||||
>>> pv.upsert_vector(
|
|
||||||
>>> vector=df["embedding"].tolist(),
|
|
||||||
>>> vector_id=dataframe_to_hash(df),
|
|
||||||
>>> namespace="your-namespace"
|
|
||||||
>>> )
|
|
||||||
>>> # Query the index:
|
|
||||||
>>> pv.query(
|
|
||||||
>>> query="This is a test",
|
|
||||||
>>> count=10,
|
|
||||||
>>> namespace="your-namespace"
|
|
||||||
>>> )
|
|
||||||
>>> # Load a single entry from the index:
|
|
||||||
>>> pv.load_entry(
|
|
||||||
>>> vector_id=dataframe_to_hash(df),
|
|
||||||
>>> namespace="your-namespace"
|
|
||||||
>>> )
|
|
||||||
>>> # Load all entries from the index:
|
|
||||||
>>> pv.load_entries(
|
|
||||||
>>> namespace="your-namespace"
|
|
||||||
>>> )
|
|
||||||
|
|
||||||
|
|
||||||
"""
|
"""
|
||||||
|
|
||||||
connection_string: Optional[str] = field(
|
def __init__(
|
||||||
default=None, kw_only=True
|
self, connection_string: str, table_name: str, *args, **kwargs
|
||||||
)
|
):
|
||||||
create_engine_params: dict = field(factory=dict, kw_only=True)
|
"""
|
||||||
engine: Optional[Engine] = field(default=None, kw_only=True)
|
Initializes a new instance of the PostgresDB class.
|
||||||
table_name: str = field(kw_only=True)
|
|
||||||
_model: any = field(
|
|
||||||
default=Factory(
|
|
||||||
lambda self: self.default_vector_model(), takes_self=True
|
|
||||||
)
|
|
||||||
)
|
|
||||||
|
|
||||||
@connection_string.validator
|
|
||||||
def validate_connection_string(
|
|
||||||
self, _, connection_string: Optional[str]
|
|
||||||
) -> None:
|
|
||||||
# If an engine is provided, the connection string is not used.
|
|
||||||
if self.engine is not None:
|
|
||||||
return
|
|
||||||
|
|
||||||
# If an engine is not provided, a connection string is required.
|
Args:
|
||||||
if connection_string is None:
|
connection_string (str): The connection string for the Postgres database.
|
||||||
raise ValueError(
|
table_name (str): The name of the table in the database.
|
||||||
"An engine or connection string is required"
|
|
||||||
)
|
|
||||||
|
|
||||||
if not connection_string.startswith("postgresql://"):
|
"""
|
||||||
raise ValueError(
|
self.engine = create_engine(
|
||||||
"The connection string must describe a Postgres"
|
connection_string, *args, **kwargs
|
||||||
" database connection"
|
|
||||||
)
|
)
|
||||||
|
self.table_name = table_name
|
||||||
|
self.VectorModel = self._create_vector_model()
|
||||||
|
|
||||||
@engine.validator
|
def _create_vector_model(self):
|
||||||
def validate_engine(self, _, engine: Optional[Engine]) -> None:
|
"""
|
||||||
# If a connection string is provided, an engine does not need to be provided.
|
Creates the SQLAlchemy model for the vector table.
|
||||||
if self.connection_string is not None:
|
|
||||||
return
|
|
||||||
|
|
||||||
# If a connection string is not provided, an engine is required.
|
Returns:
|
||||||
if engine is None:
|
The SQLAlchemy model representing the vector table.
|
||||||
raise ValueError(
|
|
||||||
"An engine or connection string is required"
|
|
||||||
)
|
|
||||||
|
|
||||||
def __attrs_post_init__(self) -> None:
|
|
||||||
"""If a an engine is provided, it will be used to connect to the database.
|
|
||||||
If not, a connection string is used to create a new database connection here.
|
|
||||||
"""
|
"""
|
||||||
if self.engine is None:
|
Base = declarative_base()
|
||||||
self.engine = create_engine(
|
|
||||||
self.connection_string, **self.create_engine_params
|
|
||||||
)
|
|
||||||
|
|
||||||
def setup(
|
class VectorModel(Base):
|
||||||
self,
|
__tablename__ = self.table_name
|
||||||
create_schema: bool = True,
|
|
||||||
install_uuid_extension: bool = True,
|
|
||||||
install_vector_extension: bool = True,
|
|
||||||
) -> None:
|
|
||||||
"""Provides a mechanism to initialize the database schema and extensions."""
|
|
||||||
if install_uuid_extension:
|
|
||||||
self.engine.execute(
|
|
||||||
'CREATE EXTENSION IF NOT EXISTS "uuid-ossp";'
|
|
||||||
)
|
|
||||||
|
|
||||||
if install_vector_extension:
|
id = Column(
|
||||||
self.engine.execute(
|
UUID(as_uuid=True),
|
||||||
'CREATE EXTENSION IF NOT EXISTS "vector";'
|
primary_key=True,
|
||||||
|
default=uuid.uuid4,
|
||||||
|
unique=True,
|
||||||
|
nullable=False,
|
||||||
)
|
)
|
||||||
|
vector = Column(
|
||||||
|
String
|
||||||
|
) # Assuming vector is stored as a string
|
||||||
|
namespace = Column(String)
|
||||||
|
meta = Column(JSON)
|
||||||
|
|
||||||
if create_schema:
|
return VectorModel
|
||||||
self._model.metadata.create_all(self.engine)
|
|
||||||
|
|
||||||
def upsert_vector(
|
def add_or_update_vector(
|
||||||
self,
|
self,
|
||||||
vector: list[float],
|
vector: str,
|
||||||
vector_id: Optional[str] = None,
|
vector_id: Optional[str] = None,
|
||||||
namespace: Optional[str] = None,
|
namespace: Optional[str] = None,
|
||||||
meta: Optional[dict] = None,
|
meta: Optional[dict] = None,
|
||||||
**kwargs,
|
) -> None:
|
||||||
) -> str:
|
"""
|
||||||
"""Inserts or updates a vector in the collection."""
|
Adds or updates a vector in the database.
|
||||||
|
|
||||||
|
Args:
|
||||||
|
vector (str): The vector to be added or updated.
|
||||||
|
vector_id (str, optional): The ID of the vector. If not provided, a new ID will be generated.
|
||||||
|
namespace (str, optional): The namespace of the vector.
|
||||||
|
meta (dict, optional): Additional metadata associated with the vector.
|
||||||
|
|
||||||
|
"""
|
||||||
|
try:
|
||||||
with Session(self.engine) as session:
|
with Session(self.engine) as session:
|
||||||
obj = self._model(
|
obj = self.VectorModel(
|
||||||
id=vector_id,
|
id=vector_id,
|
||||||
vector=vector,
|
vector=vector,
|
||||||
namespace=namespace,
|
namespace=namespace,
|
||||||
meta=meta,
|
meta=meta,
|
||||||
)
|
)
|
||||||
|
session.merge(obj)
|
||||||
obj = session.merge(obj)
|
|
||||||
session.commit()
|
session.commit()
|
||||||
|
except Exception as e:
|
||||||
|
print(f"Error adding or updating vector: {e}")
|
||||||
|
|
||||||
return str(obj.id)
|
def query_vectors(
|
||||||
|
self, query: Any, namespace: Optional[str] = None
|
||||||
|
) -> List[Any]:
|
||||||
|
"""
|
||||||
|
Queries vectors from the database based on the given query and namespace.
|
||||||
|
|
||||||
def load_entry(
|
Args:
|
||||||
self, vector_id: str, namespace: Optional[str] = None
|
query (Any): The query or condition to filter the vectors.
|
||||||
) -> BaseVectorStore.Entry:
|
namespace (str, optional): The namespace of the vectors to be queried.
|
||||||
"""Retrieves a specific vector entry from the collection based on its identifier and optional namespace."""
|
|
||||||
with Session(self.engine) as session:
|
|
||||||
result = session.get(self._model, vector_id)
|
|
||||||
|
|
||||||
return BaseVectorStore.Entry(
|
Returns:
|
||||||
id=result.id,
|
List[Any]: A list of vectors that match the query and namespace.
|
||||||
vector=result.vector,
|
|
||||||
namespace=result.namespace,
|
|
||||||
meta=result.meta,
|
|
||||||
)
|
|
||||||
|
|
||||||
def load_entries(
|
|
||||||
self, namespace: Optional[str] = None
|
|
||||||
) -> list[BaseVectorStore.Entry]:
|
|
||||||
"""Retrieves all vector entries from the collection, optionally filtering to only
|
|
||||||
those that match the provided namespace.
|
|
||||||
"""
|
"""
|
||||||
|
try:
|
||||||
with Session(self.engine) as session:
|
with Session(self.engine) as session:
|
||||||
query = session.query(self._model)
|
q = session.query(self.VectorModel)
|
||||||
if namespace:
|
if namespace:
|
||||||
query = query.filter_by(namespace=namespace)
|
q = q.filter_by(namespace=namespace)
|
||||||
|
# Assuming 'query' is a condition or filter
|
||||||
results = query.all()
|
q = q.filter(query)
|
||||||
|
return q.all()
|
||||||
return [
|
except Exception as e:
|
||||||
BaseVectorStore.Entry(
|
print(f"Error querying vectors: {e}")
|
||||||
id=str(result.id),
|
return []
|
||||||
vector=result.vector,
|
|
||||||
namespace=result.namespace,
|
def delete_vector(self, vector_id):
|
||||||
meta=result.meta,
|
|
||||||
)
|
|
||||||
for result in results
|
|
||||||
]
|
|
||||||
|
|
||||||
def query(
|
|
||||||
self,
|
|
||||||
query: str,
|
|
||||||
count: Optional[int] = BaseVectorStore.DEFAULT_QUERY_COUNT,
|
|
||||||
namespace: Optional[str] = None,
|
|
||||||
include_vectors: bool = False,
|
|
||||||
distance_metric: str = "cosine_distance",
|
|
||||||
**kwargs,
|
|
||||||
) -> list[BaseVectorStore.QueryResult]:
|
|
||||||
"""Performs a search on the collection to find vectors similar to the provided input vector,
|
|
||||||
optionally filtering to only those that match the provided namespace.
|
|
||||||
"""
|
"""
|
||||||
distance_metrics = {
|
Deletes a vector from the database based on the given vector ID.
|
||||||
"cosine_distance": self._model.vector.cosine_distance,
|
|
||||||
"l2_distance": self._model.vector.l2_distance,
|
|
||||||
"inner_product": self._model.vector.max_inner_product,
|
|
||||||
}
|
|
||||||
|
|
||||||
if distance_metric not in distance_metrics:
|
|
||||||
raise ValueError("Invalid distance metric provided")
|
|
||||||
|
|
||||||
op = distance_metrics[distance_metric]
|
Args:
|
||||||
|
vector_id: The ID of the vector to be deleted.
|
||||||
|
|
||||||
|
"""
|
||||||
|
try:
|
||||||
with Session(self.engine) as session:
|
with Session(self.engine) as session:
|
||||||
vector = self.embedding_driver.embed_string(query)
|
obj = session.get(self.VectorModel, vector_id)
|
||||||
|
if obj:
|
||||||
# The query should return both the vector and the distance metric score.
|
session.delete(obj)
|
||||||
query = session.query(
|
session.commit()
|
||||||
self._model,
|
except Exception as e:
|
||||||
op(vector).label("score"),
|
print(f"Error deleting vector: {e}")
|
||||||
).order_by(op(vector))
|
|
||||||
|
|
||||||
if namespace:
|
|
||||||
query = query.filter_by(namespace=namespace)
|
|
||||||
|
|
||||||
results = query.limit(count).all()
|
|
||||||
|
|
||||||
return [
|
|
||||||
BaseVectorStore.QueryResult(
|
|
||||||
id=str(result[0].id),
|
|
||||||
vector=(
|
|
||||||
result[0].vector if include_vectors else None
|
|
||||||
),
|
|
||||||
score=result[1],
|
|
||||||
meta=result[0].meta,
|
|
||||||
namespace=result[0].namespace,
|
|
||||||
)
|
|
||||||
for result in results
|
|
||||||
]
|
|
||||||
|
|
||||||
def default_vector_model(self) -> any:
|
|
||||||
Base = declarative_base()
|
|
||||||
|
|
||||||
@dataclass
|
|
||||||
class VectorModel(Base):
|
|
||||||
__tablename__ = self.table_name
|
|
||||||
|
|
||||||
id = Column(
|
|
||||||
UUID(as_uuid=True),
|
|
||||||
primary_key=True,
|
|
||||||
default=uuid.uuid4,
|
|
||||||
unique=True,
|
|
||||||
nullable=False,
|
|
||||||
)
|
|
||||||
vector = Column(Vector())
|
|
||||||
namespace = Column(String)
|
|
||||||
meta = Column(JSON)
|
|
||||||
|
|
||||||
return VectorModel
|
|
||||||
|
Loading…
Reference in new issue