[BUFG][Tool Usage][Agent]

pull/443/head
Kye 9 months ago
parent 96cb98d36c
commit 4e757d5a7d

@ -5,7 +5,7 @@ build-backend = "poetry.core.masonry.api"
[tool.poetry] [tool.poetry]
name = "swarms" name = "swarms"
version = "4.7.9" version = "4.8.1"
description = "Swarms - Pytorch" description = "Swarms - Pytorch"
license = "MIT" license = "MIT"
authors = ["Kye Gomez <kye@apac.ai>"] authors = ["Kye Gomez <kye@apac.ai>"]

@ -1,5 +1,8 @@
import datetime import datetime
from pydantic import BaseModel, Field from pydantic import BaseModel, Field
from swarms.tools.tool import BaseTool
from swarms.tools.tool_utils import scrape_tool_func_docs
from typing import List
time = datetime.datetime.now().strftime("%Y-%m-%d %H:%M:%S") time = datetime.datetime.now().strftime("%Y-%m-%d %H:%M:%S")
@ -23,54 +26,202 @@ class ResponseFormat(BaseModel):
response_json = ResponseFormat.model_json_schema() response_json = ResponseFormat.model_json_schema()
def worker_tools_sop_promp(name: str, memory: str, time=time): tool_usage_browser = """
out = f"""
You are {name}, ```json
Your decisions must always be made independently without seeking user assistance. {
Play to your strengths as an LLM and pursue simple strategies with no legal complications. "thoughts": {
If you have completed all your tasks, make sure to use the 'finish' command. "text": "To check the weather in Miami, I will use the browser tool to search for 'Miami weather'.",
"reasoning": "The browser tool allows me to search the web, so I can look up the current weather conditions in Miami.",
GOALS: "plan": "Use the browser tool to search Google for 'Miami weather'. Parse the result to get the current temperature, conditions, etc. and format that into a readable weather report."
},
1. Hello, how are you? Create an image of how you are doing! "command": {
"name": "browser",
Constraints: "args": {
"query": "Miami weather"
1. ~4000 word limit for short term memory. Your short term memory is short, so immediately save important information to files. }
2. If you are unsure how you previously did something or want to recall past events, thinking about similar events will help you remember. }
3. No user assistance }
4. Exclusively use the commands listed in double quotes e.g. 'command name' ```
"""
tool_usage_terminal = """
```json
{
"thoughts": {
"text": "To check the weather in Miami, I will use the browser tool to search for 'Miami weather'.",
"reasoning": "The browser tool allows me to search the web, so I can look up the current weather conditions in Miami.",
"plan": "Use the browser tool to search Google for 'Miami weather'. Parse the result to get the current temperature, conditions, etc. and format that into a readable weather report."
},
"command": {
"name": "terminal",
"args": {
"code": "uptime"
}
}
}
```
"""
browser_and_terminal_tool = """
```
{
"thoughts": {
"text": "To analyze the latest stock market trends, I need to fetch current stock data and then process it using a script.",
"reasoning": "Using the browser tool to retrieve stock data ensures I have the most recent information. Following this, the terminal tool can run a script that analyzes this data to identify trends.",
"plan": "First, use the browser to get the latest stock prices. Then, use the terminal to execute a data analysis script on the fetched data."
},
"commands": [
{
"name": "browser",
"args": {
"query": "download latest stock data for NASDAQ"
}
},
{
"name": "terminal",
"args": {
"cmd": "python analyze_stocks.py"
}
}
]
}
```
"""
browser_and_terminal_tool_two = """
```
{
"thoughts": {
"text": "To prepare a monthly budget report, I need current expenditure data, process it, and calculate the totals and averages.",
"reasoning": "The browser will fetch the latest expenditure data. The terminal will run a processing script to organize the data, and the calculator will be used to sum up expenses and compute averages.",
"plan": "Download the data using the browser, process it with a terminal command, and then calculate totals and averages using the calculator."
},
"commands": [
{
"name": "browser",
"args": {
"query": "download monthly expenditure data"
}
},
{
"name": "terminal",
"args": {
"cmd": "python process_expenditures.py"
}
},
{
"name": "calculator",
"args": {
"operation": "sum",
"numbers": "[output_from_process_expenditures]"
}
}
]
}
```
"""
# Function to parse tools and get their documentation
def parse_tools(tools: List[BaseTool] = []):
tool_docs = []
for tool in tools:
tool_doc = scrape_tool_func_docs(tool)
tool_docs.append(tool_doc)
return tool_docs
# Function to generate the worker prompt
def tool_usage_worker_prompt(
current_time=time, tools: List[BaseTool] = []
):
tool_docs = parse_tools(tools)
prompt = f"""
**Date and Time**: {current_time}
### Constraints
- Only use the tools as specified in the instructions.
- Follow the command format strictly to avoid errors and ensure consistency.
- Only use the tools for the intended purpose as described in the SOP.
- Document your thoughts, reasoning, and plan before executing the command.
- Provide the output in JSON format within markdown code blocks.
- Review the output to ensure it matches the expected outcome.
- Only follow the instructions provided in the SOP and do not deviate from the specified tasks unless tool usage is not required.
### Performance Evaluation
- **Efficiency**: Use tools to complete tasks with minimal steps.
- **Accuracy**: Ensure that commands are executed correctly to achieve the desired outcome.
- **Adaptability**: Be ready to adjust the use of tools based on task requirements and feedback.
### Tool Commands
1. **Browser**
- **Purpose**: To retrieve information from the internet.
- **Usage**:
- `{{"name": "browser", "args": {{"query": "search query here"}}}}`
- Example: Fetch current weather in London.
- Command: `{{"name": "browser", "args": {{"query": "London weather"}}}}`
2. **Terminal**
- **Purpose**: To execute system commands.
- **Usage**:
- `{{"name": "terminal", "args": {{"cmd": "system command here"}}}}`
- Example: Check disk usage on a server.
- Command: `{{"name": "terminal", "args": {{"cmd": "df -h"}}}}`
3. **Custom Tool** (if applicable)
- **Purpose**: Describe specific functionality.
- **Usage**:
- `{{"name": "custom_tool", "args": {{"parameter": "value"}}}}`
- Example: Custom analytics tool.
- Command: `{{"name": "custom_tool", "args": {{"data": "analyze this data"}}}}`
### Usage Examples
- **Example 1**: Retrieving Weather Information
```json
{tool_usage_browser}
```
Commands: - **Example 2**: System Check via Terminal
```json
{tool_usage_terminal}
```
1. finish: use this to signal that you have finished all your objectives, args: 'response': 'final response to let people know you have finished your objectives' - **Example 3**: Combined Browser and Terminal Usage
```json
{browser_and_terminal_tool}
```
Resources: - **Example 4**: Combined Browser, Terminal, and Calculator Usage
```json
{browser_and_terminal_tool_two}
```
1. Internet access for searches and information gathering.
2. Long Term memory management.
3. Agents for delegation of simple tasks.
4. File output.
Performance Evaluation:
1. Continuously review and analyze your actions to ensure you are performing to the best of your abilities. ### Next Steps
2. Constructively self-criticize your big-picture behavior constantly. - Determine the appropriate tool for the task at hand.
3. Reflect on past decisions and strategies to refine your approach. - Format your command according to the examples provided.
4. Every command has a cost, so be smart and efficient. Aim to complete tasks in the least number of steps. - Execute the command and evaluate the results based on the expected outcome.
- Document any issues or challenges faced during the tool usage.
- Always output the results in the specified format: JSON in markdown code blocks.
You should only respond in JSON format as described below Response Format, you will respond only in markdown format within 6 backticks. The JSON will be in markdown format.
``` ###### Tools Available
{response_json}
```
Ensure the response can be parsed by Python json.loads {tool_docs}
System: The current time and date is {time}
System: This reminds you of these events from your past:
[{memory}]
Human: Determine which next command to use, and respond using the format specified above: This SOP is designed to guide you through the structured and effective use of tools. By adhering to this protocol, you will enhance your productivity and accuracy in task execution.
""" """
return str(out) return prompt

@ -6,7 +6,7 @@ import random
import sys import sys
import time import time
import uuid import uuid
from typing import Any, Callable, Dict, List, Optional, Tuple, Union from typing import Any, Callable, Dict, List, Optional, Tuple
import yaml import yaml
from loguru import logger from loguru import logger
@ -17,7 +17,6 @@ from swarms.prompts.agent_system_prompts import AGENT_SYSTEM_PROMPT_3
from swarms.prompts.multi_modal_autonomous_instruction_prompt import ( from swarms.prompts.multi_modal_autonomous_instruction_prompt import (
MULTI_MODAL_AUTO_AGENT_SYSTEM_PROMPT_1, MULTI_MODAL_AUTO_AGENT_SYSTEM_PROMPT_1,
) )
from swarms.prompts.worker_prompt import worker_tools_sop_promp
from swarms.structs.conversation import Conversation from swarms.structs.conversation import Conversation
from swarms.tools.tool import BaseTool from swarms.tools.tool import BaseTool
from swarms.utils.code_interpreter import SubprocessCodeInterpreter from swarms.utils.code_interpreter import SubprocessCodeInterpreter
@ -25,8 +24,8 @@ from swarms.utils.data_to_text import data_to_text
from swarms.utils.parse_code import extract_code_from_markdown from swarms.utils.parse_code import extract_code_from_markdown
from swarms.utils.pdf_to_text import pdf_to_text from swarms.utils.pdf_to_text import pdf_to_text
from swarms.tools.exec_tool import execute_tool_by_name from swarms.tools.exec_tool import execute_tool_by_name
from swarms.tools.function_util import process_tool_docs
from swarms.tools.code_executor import CodeExecutor from swarms.tools.code_executor import CodeExecutor
from swarms.prompts.worker_prompt import tool_usage_worker_prompt
# Utils # Utils
@ -172,7 +171,7 @@ class Agent:
agent_name: str = "swarm-worker-01", agent_name: str = "swarm-worker-01",
agent_description: str = None, agent_description: str = None,
system_prompt: str = AGENT_SYSTEM_PROMPT_3, system_prompt: str = AGENT_SYSTEM_PROMPT_3,
tools: Union[List[BaseTool]] = None, tools: List[BaseTool] = [],
dynamic_temperature_enabled: Optional[bool] = False, dynamic_temperature_enabled: Optional[bool] = False,
sop: Optional[str] = None, sop: Optional[str] = None,
sop_list: Optional[List[str]] = None, sop_list: Optional[List[str]] = None,
@ -210,6 +209,7 @@ class Agent:
custom_exit_command: Optional[str] = "exit", custom_exit_command: Optional[str] = "exit",
sentiment_analyzer: Optional[Callable] = None, sentiment_analyzer: Optional[Callable] = None,
limit_tokens_from_string: Optional[Callable] = None, limit_tokens_from_string: Optional[Callable] = None,
custom_tools_prompt: Optional[Callable] = None,
*args, *args,
**kwargs, **kwargs,
): ):
@ -318,21 +318,21 @@ class Agent:
# If tools are provided then set the tool prompt by adding to sop # If tools are provided then set the tool prompt by adding to sop
if self.tools: if self.tools:
tools_prompt = worker_tools_sop_promp( if custom_tools_prompt is not None:
name=self.agent_name, tools_prompt = custom_tools_prompt(tools=self.tools)
memory=self.short_memory.return_history_as_string(),
)
# Append the tools prompt to the short_term_memory
self.short_memory.add( self.short_memory.add(
role=self.agent_name, content=tools_prompt role=self.agent_name, content=tools_prompt
) )
# And, add the tool documentation to the memory else:
for tool in self.tools: tools_prompt = tool_usage_worker_prompt(
tool_docs = process_tool_docs(tool) tools=self.tools
)
# Append the tools prompt to the short_term_memory
self.short_memory.add( self.short_memory.add(
role=self.agent_name, content=tool_docs role=self.agent_name, content=tools_prompt
) )
# If the long term memory is provided then set the long term memory prompt # If the long term memory is provided then set the long term memory prompt
@ -713,10 +713,11 @@ class Agent:
break # Exit the loop if all retry attempts fail break # Exit the loop if all retry attempts fail
# Check stopping conditions # Check stopping conditions
if self.stopping_token is not None:
if self.stopping_token in response: if self.stopping_token in response:
break break
elif ( elif (
self.stopping_condition self.stopping_condition is not None
and self._check_stopping_condition(response) and self._check_stopping_condition(response)
): ):
break break

@ -0,0 +1,57 @@
from swarms import Agent, Anthropic, tool
# Model
llm = Anthropic(
temperature=0.1,
)
"""
How to create tools:
1. Define a function that takes the required arguments with documentation and type hints.
2. Add the `@tool` decorator to the function.
3. Add the function to the `tools` list in the `Agent` class.
"""
# Tools
# Browser tools
@tool
def browser(query: str):
"""
Opens a web browser and searches for the given query on Google.
Args:
query (str): The search query.
Returns:
str: A message indicating that the search is being performed.
"""
import webbrowser
url = f"https://www.google.com/search?q={query}"
webbrowser.open(url)
return f"Searching for {query} in the browser."
# Agent
agent = Agent(
agent_name="Devin",
system_prompt=(
"Autonomous agent that can interact with humans and other"
" agents. Be Helpful and Kind. Use the tools provided to"
" assist the user. Return all code in markdown format."
),
llm=llm,
max_loops="auto",
autosave=True,
dashboard=False,
verbose=True,
stopping_token="<DONE>",
interactive=True,
tools=[browser],
)
# Run the agent
out = agent.run("what's the weather in Miami?")
print(out)
Loading…
Cancel
Save