[FIX][Agent][list_tool_schemas -> list_base_models]

pull/541/merge
Kye Gomez 6 months ago
parent a811a81b9b
commit 450a7b7453

2
.gitignore vendored

@ -23,7 +23,7 @@ D_state.json
artifacts_six artifacts_six
artifacts_seven artifacts_seven
swarms/__pycache__ swarms/__pycache__
artifacts artifacts_once
transcript_generator.json transcript_generator.json
venv venv
.DS_Store .DS_Store

@ -460,7 +460,7 @@ agent = Agent(
output_type=tool_schema, # or dict, or str output_type=tool_schema, # or dict, or str
metadata_output_type="json", metadata_output_type="json",
# List of schemas that the agent can handle # List of schemas that the agent can handle
list_tool_schemas=[tool_schema], list_base_models=[tool_schema],
function_calling_format_type="OpenAI", function_calling_format_type="OpenAI",
function_calling_type="json", # or soon yaml function_calling_type="json", # or soon yaml
) )

@ -1,5 +1,5 @@
from pydantic import BaseModel, Field from pydantic import BaseModel, Field
from swarms import Anthropic from swarms import OpenAIChat
from swarms import Agent from swarms import Agent
@ -31,8 +31,8 @@ agent = Agent(
"Generate a person's information based on the following schema:" "Generate a person's information based on the following schema:"
), ),
# Set the tool schema to the JSON string -- this is the key difference # Set the tool schema to the JSON string -- this is the key difference
tool_schema=tool_schema, # tool_schema=tool_schema,
llm=Anthropic(), llm=OpenAIChat(),
max_loops=3, max_loops=3,
autosave=True, autosave=True,
dashboard=False, dashboard=False,
@ -40,10 +40,10 @@ agent = Agent(
verbose=True, verbose=True,
interactive=True, interactive=True,
# Set the output type to the tool schema which is a BaseModel # Set the output type to the tool schema which is a BaseModel
output_type=tool_schema, # or dict, or str # output_type=tool_schema, # or dict, or str
metadata_output_type="json", metadata_output_type="json",
# List of schemas that the agent can handle # List of schemas that the agent can handle
list_tool_schemas=[tool_schema], list_base_models=[tool_schema],
function_calling_format_type="OpenAI", function_calling_format_type="OpenAI",
function_calling_type="json", # or soon yaml function_calling_type="json", # or soon yaml
) )

@ -136,7 +136,7 @@ agent = Agent(
output_type=tool_schema, # or dict, or str output_type=tool_schema, # or dict, or str
metadata_output_type="json", metadata_output_type="json",
# List of schemas that the agent can handle # List of schemas that the agent can handle
list_tool_schemas=[tool_schema], list_base_models=[tool_schema],
function_calling_format_type="OpenAI", function_calling_format_type="OpenAI",
function_calling_type="json", # or soon yaml function_calling_type="json", # or soon yaml
) )

@ -0,0 +1,868 @@
# Comparing LLM Provider Pricing: A Guide for Enterprises
Large language models (LLMs) have become a cornerstone of innovation for enterprises across various industries.
As executives contemplate which model to integrate into their operations, understanding the intricacies of LLM provider pricing is crucial.
This comprehensive guide delves into the tactical business considerations, unit economics, profit margins, and ROI calculations that will empower decision-makers to deploy the right AI solution for their organization.
## Table of Contents
1. [Introduction to LLM Pricing Models](#introduction-to-llm-pricing-models)
2. [Understanding Unit Economics in LLM Deployment](#understanding-unit-economics-in-llm-deployment)
3. [Profit Margins and Cost Structures](#profit-margins-and-cost-structures)
4. [LLM Pricing in Action: Case Studies](#llm-pricing-in-action-case-studies)
5. [Calculating ROI for LLM Integration](#calculating-roi-for-llm-integration)
6. [Comparative Analysis of Major LLM Providers](#comparative-analysis-of-major-llm-providers)
7. [Hidden Costs and Considerations](#hidden-costs-and-considerations)
8. [Optimizing LLM Usage for Cost-Efficiency](#optimizing-llm-usage-for-cost-efficiency)
9. [Future Trends in LLM Pricing](#future-trends-in-llm-pricing)
10. [Strategic Decision-Making Framework](#strategic-decision-making-framework)
11. [Conclusion: Navigating the LLM Pricing Landscape](#conclusion-navigating-the-llm-pricing-landscape)
## 1. Introduction to LLM Pricing Models
The pricing of Large Language Models (LLMs) is a complex landscape that can significantly impact an enterprise's bottom line. As we dive into this topic, it's crucial to understand the various pricing models employed by LLM providers and how they align with different business needs.
### Pay-per-Token Model
The most common pricing structure in the LLM market is the pay-per-token model. In this system, businesses are charged based on the number of tokens processed by the model. A token can be as short as one character or as long as one word, depending on the language and the specific tokenization method used by the model.
**Advantages:**
- Scalability: Costs scale directly with usage, allowing for flexibility as demand fluctuates.
- Transparency: Easy to track and attribute costs to specific projects or departments.
**Disadvantages:**
- Unpredictability: Costs can vary significantly based on the verbosity of inputs and outputs.
- Potential for overruns: Without proper monitoring, costs can quickly escalate.
### Subscription-Based Models
Some providers offer subscription tiers that provide a set amount of compute resources or tokens for a fixed monthly or annual fee.
**Advantages:**
- Predictable costs: Easier budgeting and financial planning.
- Potential cost savings: Can be more economical for consistent, high-volume usage.
**Disadvantages:**
- Less flexibility: May lead to underutilization or overages.
- Commitment required: Often involves longer-term contracts.
### Custom Enterprise Agreements
For large-scale deployments, providers may offer custom pricing agreements tailored to the specific needs of an enterprise.
**Advantages:**
- Optimized for specific use cases: Can include specialized support, SLAs, and pricing structures.
- Potential for significant cost savings at scale.
**Disadvantages:**
- Complexity: Negotiating and managing these agreements can be resource-intensive.
- Less standardization: Difficult to compare across providers.
### Hybrid Models
Some providers are beginning to offer hybrid models that combine elements of pay-per-token and subscription-based pricing.
**Advantages:**
- Flexibility: Can adapt to varying usage patterns.
- Risk mitigation: Balances the benefits of both main pricing models.
**Disadvantages:**
- Complexity: Can be more challenging to understand and manage.
- Potential for suboptimal pricing if not carefully structured.
As we progress through this guide, we'll explore how these pricing models interact with various business considerations and how executives can leverage this understanding to make informed decisions.
## 2. Understanding Unit Economics in LLM Deployment
To make informed decisions about LLM deployment, executives must have a clear grasp of the unit economics involved. This section breaks down the components that contribute to the cost per unit of LLM usage and how they impact overall business economics.
### Defining the Unit
In the context of LLMs, a "unit" can be defined in several ways:
1. **Per Token**: The most granular unit, often used in pricing models.
2. **Per Request**: A single API call to the LLM, which may process multiple tokens.
3. **Per Task**: A complete operation, such as generating a summary or answering a question, which may involve multiple requests.
4. **Per User Interaction**: In customer-facing applications, this could be an entire conversation or session.
Understanding which unit is most relevant to your use case is crucial for accurate economic analysis.
### Components of Unit Cost
1. **Direct LLM Costs**
- Token processing fees
- API call charges
- Data transfer costs
2. **Indirect Costs**
- Compute resources for pre/post-processing
- Storage for inputs, outputs, and fine-tuning data
- Networking costs
3. **Operational Costs**
- Monitoring and management tools
- Integration and maintenance engineering time
- Customer support related to AI functions
4. **Overhead**
- Legal and compliance costs
- Training and documentation
- Risk management and insurance
### Calculating Unit Economics
To calculate the true unit economics, follow these steps:
1. **Determine Total Costs**: Sum all direct, indirect, operational, and overhead costs over a fixed period (e.g., monthly).
2. **Measure Total Units**: Track the total number of relevant units processed in the same period.
3. **Calculate Cost per Unit**: Divide total costs by total units.
```
Cost per Unit = Total Costs / Total Units
```
4. **Analyze Revenue per Unit**: If the LLM is part of a revenue-generating product, calculate the revenue attributed to each unit.
5. **Determine Profit per Unit**: Subtract the cost per unit from the revenue per unit.
```
Profit per Unit = Revenue per Unit - Cost per Unit
```
### Example Calculation
Let's consider a hypothetical customer service AI chatbot:
- Monthly LLM API costs: $10,000
- Indirect and operational costs: $5,000
- Total monthly interactions: 100,000
```
Cost per Interaction = ($10,000 + $5,000) / 100,000 = $0.15
```
If each interaction generates an average of $0.50 in value (through cost savings or revenue):
```
Profit per Interaction = $0.50 - $0.15 = $0.35
```
### Economies of Scale
As usage increases, unit economics often improve due to:
- Volume discounts from LLM providers
- Amortization of fixed costs over more units
- Efficiency gains through learning and optimization
However, it's crucial to model how these economies of scale manifest in your specific use case, as they may plateau or even reverse at very high volumes due to increased complexity and support needs.
### Diseconomies of Scale
Conversely, be aware of potential diseconomies of scale:
- Increased complexity in managing large-scale deployments
- Higher costs for specialized talent as operations grow
- Potential for diminishing returns on very large language models
By thoroughly understanding these unit economics, executives can make more informed decisions about which LLM provider and pricing model best aligns with their business objectives and scale.
## 3. Profit Margins and Cost Structures
Understanding profit margins and cost structures is crucial for executives evaluating LLM integration. This section explores how different pricing models and operational strategies can impact overall profitability.
### Components of Profit Margin
1. **Gross Margin**: The difference between revenue and the direct costs of LLM usage.
```
Gross Margin = Revenue - Direct LLM Costs
Gross Margin % = (Gross Margin / Revenue) * 100
```
2. **Contribution Margin**: Gross margin minus variable operational costs.
```
Contribution Margin = Gross Margin - Variable Operational Costs
```
3. **Net Margin**: The final profit after all costs, including fixed overheads.
```
Net Margin = Contribution Margin - Fixed Costs
Net Margin % = (Net Margin / Revenue) * 100
```
### Cost Structures in LLM Deployment
1. **Fixed Costs**
- Subscription fees for LLM access (if using a subscription model)
- Base infrastructure costs
- Core team salaries
- Licensing fees for essential software
2. **Variable Costs**
- Per-token or per-request charges
- Scaling infrastructure costs
- Usage-based API fees
- Performance-based team bonuses
3. **Step Costs**
- Costs that increase in chunks as usage scales
- Examples: Adding new server clusters, hiring additional support staff
### Analyzing Profit Margins Across Different Pricing Models
Let's compare how different LLM pricing models might affect profit margins for a hypothetical AI-powered writing assistant service:
**Scenario**: The service charges users $20/month and expects to process an average of 100,000 tokens per user per month.
1. **Pay-per-Token Model**
- LLM cost: $0.06 per 1,000 tokens
- Monthly LLM cost per user: $6
- Gross margin per user: $14 (70%)
2. **Subscription Model**
- Fixed monthly fee: $5,000 for up to 10 million tokens
- At 1,000 users: $5 per user
- Gross margin per user: $15 (75%)
3. **Hybrid Model**
- Base fee: $2,000 per month
- Reduced per-token rate: $0.04 per 1,000 tokens
- Monthly LLM cost per user: $6 ($2 base + $4 usage)
- Gross margin per user: $14 (70%)
### Strategies for Improving Profit Margins
1. **Optimize Token Usage**
- Implement efficient prompting techniques
- Cache common responses
- Use compression algorithms for inputs and outputs
2. **Leverage Economies of Scale**
- Negotiate better rates at higher volumes
- Spread fixed costs across a larger user base
3. **Implement Tiered Pricing**
- Offer different service levels to capture more value from power users
- Example: Basic ($10/month, 50K tokens), Pro ($30/month, 200K tokens)
4. **Vertical Integration**
- Invest in proprietary LLM development for core functionalities
- Reduce dependency on third-party providers for critical operations
5. **Smart Caching and Pre-computation**
- Store and reuse common LLM outputs
- Perform batch processing during off-peak hours
6. **Hybrid Cloud Strategies**
- Use on-premises solutions for consistent workloads
- Leverage cloud elasticity for demand spikes
### Case Study: Margin Improvement
Consider a company that initially used a pay-per-token model:
**Initial State:**
- Revenue per user: $20
- LLM cost per user: $6
- Other variable costs: $4
- Fixed costs per user: $5
- Net margin per user: $5 (25%)
**After Optimization:**
- Implemented efficient prompting: Reduced token usage by 20%
- Negotiated volume discount: 10% reduction in per-token price
- Introduced tiered pricing: Average revenue per user increased to $25
- Optimized operations: Reduced other variable costs to $3
**Result:**
- New LLM cost per user: $4.32
- New net margin per user: $12.68 (50.7%)
This case study demonstrates how a holistic approach to margin improvement, addressing both revenue and various cost components, can significantly enhance profitability.
Understanding these profit margin dynamics and cost structures is essential for executives to make informed decisions about LLM integration and to continuously optimize their AI-powered services for maximum profitability.
## 4. LLM Pricing in Action: Case Studies
To provide a concrete understanding of how LLM pricing models work in real-world scenarios, let's examine several case studies across different industries and use cases. These examples will illustrate the interplay between pricing models, usage patterns, and business outcomes.
### Case Study 1: E-commerce Product Description Generator
**Company**: GlobalMart, a large online retailer
**Use Case**: Automated generation of product descriptions
**LLM Provider**: GPT-4o
**Pricing Model**: Pay-per-token
- Input: $5.00 per 1M tokens
- Output: $15.00 per 1M tokens
**Usage Pattern**:
- Average input: 50 tokens per product (product attributes)
- Average output: 200 tokens per product (generated description)
- Daily products processed: 10,000
**Daily Cost Calculation**:
1. Input cost: (50 tokens * 10,000 products) / 1M * $5.00 = $2.50
2. Output cost: (200 tokens * 10,000 products) / 1M * $15.00 = $30.00
3. Total daily cost: $32.50
**Business Impact**:
- Reduced time to market for new products by 70%
- Improved SEO performance due to unique, keyword-rich descriptions
- Estimated daily value generated: $500 (based on increased sales and efficiency)
**ROI Analysis**:
- Daily investment: $32.50
- Daily return: $500
- ROI = (Return - Investment) / Investment * 100 = 1,438%
**Key Takeaway**: The pay-per-token model works well for this use case due to the predictable and moderate token usage per task. The high ROI justifies the investment in a more advanced model like GPT-4o.
### Case Study 2: Customer Service Chatbot
**Company**: TechSupport Inc., a software company
**Use Case**: 24/7 customer support chatbot
**LLM Provider**: Claude 3.5 Sonnet
**Pricing Model**: Input: $3 per 1M tokens, Output: $15 per 1M tokens
**Usage Pattern**:
- Average conversation: 500 tokens input (customer queries + context), 1000 tokens output (bot responses)
- Daily conversations: 5,000
**Daily Cost Calculation**:
1. Input cost: (500 tokens * 5,000 conversations) / 1M * $3 = $7.50
2. Output cost: (1000 tokens * 5,000 conversations) / 1M * $15 = $75.00
3. Total daily cost: $82.50
**Business Impact**:
- Reduced customer wait times by 90%
- Resolved 70% of queries without human intervention
- Estimated daily cost savings: $2,000 (based on reduced human support hours)
**ROI Analysis**:
- Daily investment: $82.50
- Daily return: $2,000
- ROI = (Return - Investment) / Investment * 100 = 2,324%
**Key Takeaway**: The higher cost of Claude 3.5 Sonnet is justified by its superior performance in handling complex customer queries, resulting in significant cost savings and improved customer satisfaction.
### Case Study 3: Financial Report Summarization
**Company**: FinAnalyze, a financial services firm
**Use Case**: Automated summarization of lengthy financial reports
**LLM Provider**: GPT-3.5 Turbo
**Pricing Model**: Input: $0.50 per 1M tokens, Output: $1.50 per 1M tokens
**Usage Pattern**:
- Average report: 20,000 tokens input, 2,000 tokens output
- Daily reports processed: 100
**Daily Cost Calculation**:
1. Input cost: (20,000 tokens * 100 reports) / 1M * $0.50 = $100
2. Output cost: (2,000 tokens * 100 reports) / 1M * $1.50 = $30
3. Total daily cost: $130
**Business Impact**:
- Reduced analysis time by 80%
- Improved consistency in report summaries
- Enabled analysts to focus on high-value tasks
- Estimated daily value generated: $1,000 (based on time savings and improved decision-making)
**ROI Analysis**:
- Daily investment: $130
- Daily return: $1,000
- ROI = (Return - Investment) / Investment * 100 = 669%
**Key Takeaway**: The lower cost of GPT-3.5 Turbo is suitable for this task, which requires processing large volumes of text but doesn't necessarily need the most advanced language understanding. The high input token count makes the input pricing a significant factor in model selection.
### Case Study 4: AI-Powered Language Learning App
**Company**: LinguaLeap, an edtech startup
**Use Case**: Personalized language exercises and conversations
**LLM Provider**: Claude 3 Haiku
**Pricing Model**: Input: $0.25 per 1M tokens, Output: $1.25 per 1M tokens
**Usage Pattern**:
- Average session: 300 tokens input (user responses + context), 500 tokens output (exercises + feedback)
- Daily active users: 50,000
- Average sessions per user per day: 3
**Daily Cost Calculation**:
1. Input cost: (300 tokens * 3 sessions * 50,000 users) / 1M * $0.25 = $11.25
2. Output cost: (500 tokens * 3 sessions * 50,000 users) / 1M * $1.25 = $93.75
3. Total daily cost: $105
**Business Impact**:
- Increased user engagement by 40%
- Improved learning outcomes, leading to higher user retention
- Enabled scaling to new languages without proportional increase in human tutors
- Estimated daily revenue: $5,000 (based on subscription fees and in-app purchases)
**ROI Analysis**:
- Daily investment: $105
- Daily revenue: $5,000
- ROI = (Revenue - Investment) / Investment * 100 = 4,662%
**Key Takeaway**: The high-volume, relatively simple interactions in this use case make Claude 3 Haiku an excellent choice. Its low cost allows for frequent interactions without prohibitive expenses, which is crucial for an app relying on regular user engagement.
### Case Study 5: Legal Document Analysis
**Company**: LegalEagle LLP, a large law firm
**Use Case**: Contract review and risk assessment
**LLM Provider**: Claude 3 Opus
**Pricing Model**: Input: $15 per 1M tokens, Output: $75 per 1M tokens
**Usage Pattern**:
- Average contract: 10,000 tokens input, 3,000 tokens output (analysis and risk assessment)
- Daily contracts processed: 50
**Daily Cost Calculation**:
1. Input cost: (10,000 tokens * 50 contracts) / 1M * $15 = $7.50
2. Output cost: (3,000 tokens * 50 contracts) / 1M * $75 = $11.25
3. Total daily cost: $18.75
**Business Impact**:
- Reduced contract review time by 60%
- Improved accuracy in identifying potential risks
- Enabled handling of more complex cases
- Estimated daily value: $10,000 (based on time savings and improved risk management)
**ROI Analysis**:
- Daily investment: $18.75
- Daily value: $10,000
- ROI = (Value - Investment) / Investment * 100 = 53,233%
**Key Takeaway**: Despite the high cost per token, Claude 3 Opus's advanced capabilities justify its use in this high-stakes environment where accuracy and nuanced understanding are critical. The high value generated per task offsets the higher token costs.
These case studies demonstrate how different LLM providers and pricing models can be optimal for various use cases, depending on factors such as token volume, task complexity, and the value generated by the AI application. Executives should carefully consider these factors when selecting an LLM provider and pricing model for their specific needs.
## 5. Calculating ROI for LLM Integration
Calculating the Return on Investment (ROI) for LLM integration is crucial for executives to justify the expenditure and assess the business value of AI implementation. This section will guide you through the process of calculating ROI, considering both tangible and intangible benefits.
### The ROI Formula
The basic ROI formula is:
```
ROI = (Net Benefit / Cost of Investment) * 100
```
For LLM integration, we can expand this to:
```
ROI = ((Total Benefits - Total Costs) / Total Costs) * 100
```
### Identifying Benefits
1. **Direct Cost Savings**
- Reduced labor costs
- Decreased operational expenses
- Lower error-related costs
2. **Revenue Increases**
- New product offerings enabled by LLM
- Improved customer acquisition and retention
- Upselling and cross-selling opportunities
3. **Productivity Gains**
- Time saved on repetitive tasks
- Faster decision-making processes
- Improved employee efficiency
4. **Quality Improvements**
- Enhanced accuracy in outputs
- Consistency in service delivery
- Reduced error rates
5. **Strategic Advantages**
- Market differentiation
- Faster time-to-market for new offerings
- Improved competitive positioning
### Calculating Costs
1. **Direct LLM Costs**
- API usage fees
- Subscription costs
2. **Infrastructure Costs**
- Cloud computing resources
- Data storage
- Networking expenses
3. **Integration and Development Costs**
- Initial setup and integration
- Ongoing maintenance and updates
- Custom feature development
4. **Training and Support**
- Employee training programs
- User support and documentation
- Change management initiatives
5. **Compliance and Security**
- Data privacy measures
- Security audits and implementations
- Regulatory compliance efforts
### Step-by-Step ROI Calculation
1. **Define the Time Period**: Determine the timeframe for your ROI calculation (e.g., 1 year, 3 years).
2. **Estimate Total Benefits**:
- Quantify direct cost savings and revenue increases
- Assign monetary values to productivity gains and quality improvements
- Estimate the value of strategic advantages (this may be more subjective)
3. **Calculate Total Costs**:
- Sum up all direct and indirect costs related to LLM integration
4. **Apply the ROI Formula**:
```
ROI = ((Total Benefits - Total Costs) / Total Costs) * 100
```
5. **Consider Time Value of Money**: For longer-term projections, use Net Present Value (NPV) to account for the time value of money.
### Example ROI Calculation
Let's consider a hypothetical customer service chatbot implementation:
**Time Period**: 1 year
**Benefits**:
- Labor cost savings: $500,000
- Increased sales from improved customer satisfaction: $300,000
- Productivity gains from faster query resolution: $200,000
Total Benefits: $1,000,000
**Costs**:
- LLM API fees: $100,000
- Integration and development: $150,000
- Training and support: $50,000
- Infrastructure: $50,000
Total Costs: $350,000
**ROI Calculation**:
```
ROI = (($1,000,000 - $350,000) / $350,000) * 100 = 185.7%
```
This indicates a strong positive return on investment, with benefits outweighing costs by a significant margin.
### Considerations for Accurate ROI Calculation
1. **Be Conservative in Estimates**: It's better to underestimate benefits and overestimate costs to provide a more realistic view.
2. **Account for Ramp-Up Time**: Full benefits may not be realized immediately. Consider a phased approach in your calculations.
3. **Include Opportunity Costs**: Consider the potential returns if the investment were made elsewhere.
4. **Factor in Risk**: Adjust your ROI based on the likelihood of achieving projected benefits.
5. **Consider Non-Financial Benefits**: Some benefits, like improved employee satisfaction or enhanced brand perception, may not have direct financial equivalents but are still valuable.
6. **Perform Sensitivity Analysis**: Calculate ROI under different scenarios (best case, worst case, most likely) to understand the range of possible outcomes.
7. **Benchmark Against Alternatives**: Compare the ROI of LLM integration against other potential investments or solutions.
### Long-Term ROI Considerations
While initial ROI calculations are crucial for decision-making, it's important to consider long-term implications:
1. **Scalability**: How will ROI change as usage increases?
2. **Technological Advancements**: Will newer, more efficient models become available?
3. **Market Changes**: How might shifts in the competitive landscape affect the value proposition?
4. **Regulatory Environment**: Could future regulations impact the cost or feasibility of LLM use?
By thoroughly calculating and analyzing the ROI of LLM integration, executives can make data-driven decisions about AI investments and set realistic expectations for the value these technologies can bring to their organizations.
## 6. Comparative Analysis of Major LLM Providers
In this section, we'll compare the offerings of major LLM providers, focusing on their pricing structures, model capabilities, and unique selling points. This analysis will help executives understand the landscape and make informed decisions about which provider best suits their needs.
### OpenAI
**Models**: GPT-4o, GPT-3.5 Turbo
**Pricing Structure**:
- Pay-per-token model
- Different rates for input and output tokens
- Bulk discounts available for high-volume users
**Key Features**:
- State-of-the-art performance on a wide range of tasks
- Regular model updates and improvements
- Extensive documentation and community support
**Considerations**:
- Higher pricing compared to some competitors
- Potential for rapid price changes as technology evolves
- Usage limits and approval process for higher-tier models
### Anthropic
**Models**: Claude 3.5 Sonnet, Claude 3 Opus, Claude 3 Haiku
**Pricing Structure**:
- Pay-per-token model
- Different rates for input and output tokens
- Tiered pricing based on model capabilities
**Key Features**:
- Strong focus on AI safety and ethics
- Long context windows (200K tokens)
- Specialized models for different use cases (e.g., Haiku for speed, Opus for complex tasks)
**Considerations**:
- Newer to the market compared to OpenAI
- Potentially more limited third-party integrations
- Strong emphasis on responsible AI use
### Google (Vertex AI)
**Models**: PaLM 2 for Chat, PaLM 2 for Text
**Pricing Structure**:
- Pay-per-thousand characters model
- Different rates for input and output
- Additional charges for advanced features (e.g., semantic retrieval)
**Key Features**:
- Integration with Google Cloud ecosystem
- Multi-modal capabilities (text, image, audio)
- Enterprise-grade security and compliance features
**Considerations**:
- Pricing can be complex due to additional Google Cloud costs
- Strong performance in specialized domains (e.g., coding, mathematical reasoning)
- Potential for integration with other Google services
### Amazon (Bedrock)
**Models**: Claude (Anthropic), Titan
**Pricing Structure**:
- Pay-per-second of compute time
- Additional charges for data transfer and storage
**Key Features**:
- Seamless integration with AWS services
- Access to multiple model providers through a single API
- Fine-tuning and customization options
**Considerations**:
- Pricing model can be less predictable for inconsistent workloads
- Strong appeal for existing AWS customers
- Potential for cost optimizations through AWS ecosystem
### Microsoft (Azure OpenAI Service)
**Models**: GPT-4, GPT-3.5 Turbo
**Pricing Structure**:
- Similar to OpenAI's pricing, but with Azure integration
- Additional costs for Azure services (e.g., storage, networking)
**Key Features**:
- Enterprise-grade security and compliance
- Integration with Azure AI services
- Access to fine-tuning and customization options
**Considerations**:
- Attractive for organizations already using Azure
- Potential for volume discounts through Microsoft Enterprise Agreements
- Additional overhead for Azure management
### Comparative Analysis
| Provider | Pricing Model | Strengths | Considerations |
|----------|---------------|-----------|----------------|
| OpenAI | Pay-per-token | - Top performance<br>- Regular updates<br>- Strong community | - Higher costs<br>- Usage limits |
| Anthropic| Pay-per-token | - Ethical focus<br>- Long context<br>- Specialized models | - Newer provider<br>- Limited integrations |
| Google | Pay-per-character | - Google Cloud integration<br>- Multi-modal<br>- Enterprise features | - Complex pricing<br>- Google ecosystem lock-in |
| Amazon | Pay-per-compute time | - AWS integration<br>- Multiple providers<br>- Customization options | - Less predictable costs<br>- AWS ecosystem focus |
| Microsoft| Pay-per-token (Azure-based) | - Enterprise security<br>- Azure integration<br>- Fine-tuning options | - Azure overhead<br>- Potential lock-in |
### Factors to Consider in Provider Selection
1. **Performance Requirements**: Assess whether you need state-of-the-art performance or if a less advanced (and potentially cheaper) model suffices.
2. **Pricing Predictability**: Consider whether your usage patterns align better with token-based or compute-time-based pricing.
3. **Integration Needs**: Evaluate how well each provider integrates with your existing technology stack.
4. **Scalability**: Assess each provider's ability to handle your expected growth in usage.
5. **Customization Options**: Determine if you need fine-tuning or specialized model development capabilities.
6. **Compliance and Security**: Consider your industry-specific regulatory requirements and each provider's security offerings.
7. **Support and Documentation**: Evaluate the quality of documentation, community support, and enterprise-level assistance.
8. **Ethical Considerations**: Assess each provider's stance on AI ethics and responsible use.
9. **Lock-In Concerns**: Consider the long-term implications of committing to a specific provider or cloud ecosystem.
10. **Multi-Provider Strategy**: Evaluate the feasibility and benefits of using multiple providers for different use cases.
By carefully comparing these providers and considering the factors most relevant to your organization, you can make an informed decision that balances cost, performance, and strategic fit. Remember that the LLM landscape is rapidly evolving, so it's important to regularly reassess your choices and stay informed about new developments and pricing changes.
## 7. Hidden Costs and Considerations
When evaluating LLM providers and calculating the total cost of ownership, it's crucial to look beyond the advertised pricing and consider the hidden costs and additional factors that can significantly impact your budget and overall implementation success. This section explores these often-overlooked aspects to help executives make more comprehensive and accurate assessments.
### 1. Data Preparation and Cleaning
**Considerations**:
- Cost of data collection and aggregation
- Expenses related to data cleaning and normalization
- Ongoing data maintenance and updates
**Impact**:
- Can be time-consuming and labor-intensive
- May require specialized tools or personnel
- Critical for model performance and accuracy
### 2. Fine-Tuning and Customization
**Considerations**:
- Costs associated with creating custom datasets
- Compute resources required for fine-tuning
- Potential need for specialized ML expertise
**Impact**:
- Can significantly improve model performance for specific tasks
- May lead to better ROI in the long run
- Increases initial implementation costs
### 3. Integration and Development
**Considerations**:
- Engineering time for API integration
- Development of custom interfaces or applications
- Ongoing maintenance and updates
**Impact**:
- Can be substantial, especially for complex integrations
- May require hiring additional developers or consultants
- Critical for seamless user experience and workflow integration
### 4. Monitoring and Optimization
**Considerations**:
- Tools and systems for performance monitoring
- Regular audits and optimizations
- Costs associated with debugging and troubleshooting
**Impact**:
- Ongoing expense that increases with scale
- Essential for maintaining efficiency and cost-effectiveness
- Can lead to significant savings through optimized usage
### 5. Compliance and Security
**Considerations**:
- Legal counsel for data privacy and AI regulations
- Implementation of security measures (e.g., encryption, access controls)
- Regular audits and certifications
**Impact**:
- Can be substantial, especially in heavily regulated industries
- Critical for risk management and maintaining customer trust
- May limit certain use cases or require additional safeguards
### 6. Training and Change Management
- Employee training programs
- Development of user guides and documentation
- Change management initiatives
**Impact**:
- Often underestimated but crucial for adoption
- Can affect productivity during the transition period
- Important for realizing the full potential of LLM integration
### 7. Scaling Costs
**Considerations**:
- Potential price increases as usage grows
- Need for additional infrastructure or resources
- Costs associated with managing increased complexity
**Impact**:
- Can lead to unexpected expenses if not properly forecasted
- May require renegotiation of contracts or switching providers
- Important to consider in long-term planning
### 8. Opportunity Costs
**Considerations**:
- Time and resources diverted from other projects
- Potential missed opportunities due to focus on LLM implementation
- Learning curve and productivity dips during adoption
**Impact**:
- Difficult to quantify but important to consider
- Can affect overall business strategy and priorities
- May influence timing and scope of LLM integration
### 9. Vendor Lock-in
**Considerations**:
- Costs associated with switching providers
- Dependency on provider-specific features or integrations
- Potential for price increases once deeply integrated
**Impact**:
- Can limit flexibility and negotiating power
- May affect long-term costs and strategic decisions
- Important to consider multi-provider or portable implementation strategies
### 10. Ethical and Reputational Considerations
**Considerations**:
- Potential backlash from AI-related controversies
- Costs of ensuring ethical AI use and transparency
- Investments in responsible AI practices
**Impact**:
- Can affect brand reputation and customer trust
- May require ongoing public relations efforts
- Important for long-term sustainability and social responsibility
By carefully considering these hidden costs and factors, executives can develop a more comprehensive understanding of the total investment required for successful LLM integration. This holistic approach allows for better budgeting, risk management, and strategic planning.
## Conclusion: Navigating the LLM Pricing Landscape
As we've explored throughout this guide, the landscape of LLM provider pricing is complex and multifaceted. From understanding the basic pricing models to calculating ROI and considering hidden costs, there are numerous factors that executives must weigh when making decisions about AI integration.
Key takeaways include:
1. The importance of aligning LLM selection with specific business needs and use cases.
2. The need for thorough ROI analysis that goes beyond simple cost calculations.
3. The value of considering both short-term implementation costs and long-term scalability.
4. The critical role of hidden costs in determining the true total cost of ownership.
5. The potential for significant business value when LLMs are strategically implemented and optimized.
As the AI landscape continues to evolve rapidly, staying informed and adaptable is crucial. What may be the best choice today could change as new models are released, pricing structures shift, and your organization's needs evolve.
To help you navigate these complexities and make the most informed decisions for your enterprise, we invite you to take the next steps in your AI journey:
1. **Book a Consultation**: Speak with our enterprise-grade LLM specialists who can provide personalized insights and recommendations tailored to your specific needs. Schedule a 15-minute call at [https://cal.com/swarms/15min](https://cal.com/swarms/15min).
2. **Join Our Community**: Connect with fellow AI executives, share experiences, and stay updated on the latest developments in the LLM space. Join our Discord community at [https://discord.gg/yxU9t9da](https://discord.gg/yxU9t9da).
By leveraging expert guidance and peer insights, you can position your organization to make the most of LLM technologies while optimizing costs and maximizing value. The future of AI in enterprise is bright, and with the right approach, your organization can be at the forefront of this transformative technology.

@ -217,6 +217,8 @@ nav:
- Swarms Platform: - Swarms Platform:
- Overview: "swarms_platform/index.md" - Overview: "swarms_platform/index.md"
- Prompts API: "swarms_platform/prompts_api.md" - Prompts API: "swarms_platform/prompts_api.md"
- Guides:
- Comparing LLM Provider Pricing A Guide for Enterprises: "guides/pricing.md"
- References: - References:
- Agent Glossary: "swarms/glossary.md" - Agent Glossary: "swarms/glossary.md"
- List of The Best Multi-Agent Papers: "swarms/papers.md" - List of The Best Multi-Agent Papers: "swarms/papers.md"

@ -0,0 +1,243 @@
# `Artifact`
The `Artifact` class represents a file artifact, encapsulating the file's path, type, contents, versions, and edit count. This class provides a comprehensive way to manage file versions, edit contents, and handle various file-related operations such as saving, loading, and exporting to JSON.
The `Artifact` class is particularly useful in contexts where file version control and content management are essential. By keeping track of the number of edits and maintaining a version history, it allows for robust file handling and auditability.
## Class Definition
### Artifact
| Attribute | Type | Default Value | Description |
|-------------|---------------------|------------------|--------------------------------------------------|
| `file_path` | `str` | N/A | The path to the file. |
| `file_type` | `str` | N/A | The type of the file. |
| `contents` | `str` | `""` | The contents of the file. |
| `versions` | `List[FileVersion]` | `[]` | The list of file versions. |
| `edit_count`| `int` | `0` | The number of times the file has been edited. |
### Parameters and Validation
- `file_path`: A string representing the file path.
- `file_type`: A string representing the file type. This attribute is validated to ensure it matches supported file types based on the file extension if not provided.
- `contents`: A string representing the contents of the file. Defaults to an empty string.
- `versions`: A list of `FileVersion` instances representing the version history of the file. Defaults to an empty list.
- `edit_count`: An integer representing the number of edits made to the file. Defaults to 0.
### Methods
The `Artifact` class includes various methods for creating, editing, saving, loading, and exporting file artifacts.
#### `create`
| Parameter | Type | Description |
|--------------------|--------|----------------------------------------|
| `initial_content` | `str` | The initial content of the file. |
**Usage Example:**
```python
artifact = Artifact(file_path="example.txt", file_type="txt")
artifact.create(initial_content="Initial file content")
```
#### `edit`
| Parameter | Type | Description |
|---------------|--------|----------------------------------------|
| `new_content` | `str` | The new content of the file. |
**Usage Example:**
```python
artifact.edit(new_content="Updated file content")
```
#### `save`
**Usage Example:**
```python
artifact.save()
```
#### `load`
**Usage Example:**
```python
artifact.load()
```
#### `get_version`
| Parameter | Type | Description |
|-------------------|-------|-----------------------------------------|
| `version_number` | `int` | The version number to retrieve. |
**Usage Example:**
```python
version = artifact.get_version(version_number=1)
```
#### `get_contents`
**Usage Example:**
```python
current_contents = artifact.get_contents()
```
#### `get_version_history`
**Usage Example:**
```python
version_history = artifact.get_version_history()
```
#### `export_to_json`
| Parameter | Type | Description |
|-------------|-------|----------------------------------------------|
| `file_path` | `str` | The path to the JSON file to save the artifact.|
**Usage Example:**
```python
artifact.export_to_json(file_path="artifact.json")
```
#### `import_from_json`
| Parameter | Type | Description |
|-------------|-------|--------------------------------------------------|
| `file_path` | `str` | The path to the JSON file to import the artifact from.|
**Usage Example:**
```python
imported_artifact = Artifact.import_from_json(file_path="artifact.json")
```
#### `get_metrics`
**Usage Example:**
```python
metrics = artifact.get_metrics()
```
#### `to_dict`
**Usage Example:**
```python
artifact_dict = artifact.to_dict()
```
#### `from_dict`
| Parameter | Type | Description |
|-----------|------------------|--------------------------------------------------|
| `data` | `Dict[str, Any]` | The dictionary representation of the artifact. |
**Usage Example:**
```python
artifact_data = {
"file_path": "example.txt",
"file_type": "txt",
"contents": "File content",
"versions": [],
"edit_count": 0
}
artifact = Artifact.from_dict(artifact_data)
```
## Additional Information and Tips
- The `Artifact` class uses the `pydantic` library to handle data validation and serialization.
- When editing the artifact, ensure that the `file_path` is set correctly to avoid file operation errors.
- Use the `get_version` and `get_version_history` methods to maintain a clear audit trail of changes to the file.
- The `export_to_json` and `import_from_json` methods are useful for backing up and restoring the state of an artifact.
## References and Resources
- [Pydantic Documentation](https://pydantic-docs.helpmanual.io/)
- [Python os.path module](https://docs.python.org/3/library/os.path.html)
- [JSON Documentation](https://docs.python.org/3/library/json.html)
## Examples of Usage
### Example 1: Creating and Editing an Artifact
```python
from datetime import datetime
from pydantic import BaseModel, Field, validator
from typing import List, Dict, Any, Union
import os
import json
# Define FileVersion class
class FileVersion(BaseModel):
version_number: int
content: str
timestamp: datetime
# Artifact class definition goes here
# Create an artifact
artifact = Artifact(file_path="example.txt", file_type="txt")
artifact.create(initial_content="Initial file content")
# Edit the artifact
artifact.edit(new_content="Updated file content")
# Save the artifact to a file
artifact.save()
# Load the artifact from the file
artifact.load()
# Print the current contents of the artifact
print(artifact.get_contents())
# Print the version history
print(artifact.get_version_history())
```
### Example 2: Exporting and Importing an Artifact
```python
# Export the artifact to a JSON file
artifact.export_to_json(file_path="artifact.json")
# Import
the artifact from a JSON file
imported_artifact = Artifact.import_from_json(file_path="artifact.json")
# Print the metrics of the imported artifact
print(imported_artifact.get_metrics())
```
### Example 3: Converting an Artifact to and from a Dictionary
```python
# Convert the artifact to a dictionary
artifact_dict = artifact.to_dict()
# Create a new artifact from the dictionary
new_artifact = Artifact.from_dict(artifact_dict)
# Print the metrics of the new artifact
print(new_artifact.get_metrics())
```

@ -304,7 +304,7 @@ agent = Agent(
output_type=tool_schema, # or dict, or str output_type=tool_schema, # or dict, or str
metadata_output_type="json", metadata_output_type="json",
# List of schemas that the agent can handle # List of schemas that the agent can handle
list_tool_schemas=[tool_schema], list_base_models=[tool_schema],
function_calling_format_type="OpenAI", function_calling_format_type="OpenAI",
function_calling_type="json", # or soon yaml function_calling_type="json", # or soon yaml
) )

@ -198,7 +198,7 @@ agent = Agent(
generate_invoice, generate_invoice,
summarize_expenses summarize_expenses
], ],
list_tool_schemas_json=create_tool_schema(), list_base_models_json=create_tool_schema(),
) )
``` ```
@ -274,7 +274,7 @@ agent = Agent(
summarize_expenses, summarize_expenses,
custom_accounting_tool custom_accounting_tool
], ],
list_tool_schemas_json=create_tool_schema(), list_base_models_json=create_tool_schema(),
) )
``` ```
@ -325,7 +325,7 @@ advanced_agent = AdvancedAccountingAgent(
summarize_expenses, summarize_expenses,
custom_accounting_tool custom_accounting_tool
], ],
list_tool_schemas_json=create_tool_schema(), list_base_models_json=create_tool_schema(),
) )
# Call custom methods # Call custom methods
@ -367,7 +367,7 @@ agent = Agent(
function_calling_format_type="OpenAI", function_calling_format_type="OpenAI",
function_calling_type="json", function_calling_type="json",
tools=[process_data_frame], tools=[process_data_frame],
list_tool_schemas_json=create_tool_schema(), list_base_models_json=create_tool_schema(),
) )
# Example task: Process a data frame # Example task: Process a data frame

@ -1,12 +1,14 @@
import os import os
from swarms import Agent, Anthropic from swarms import Agent, Anthropic
from swarms.prompts.finance_agent_sys_prompt import (
FINANCIAL_AGENT_SYS_PROMPT,
)
from swarms.utils.data_to_text import data_to_text
# Initialize the agent # Initialize the agent
agent = Agent( agent = Agent(
agent_name="Accounting Assistant", agent_name="Financial-Analysis-Agent",
system_prompt="You're the accounting agent, your purpose is to generate a profit report for a company!", system_prompt=FINANCIAL_AGENT_SYS_PROMPT,
agent_description="Generate a profit report for a company!",
llm=Anthropic(anthropic_api_key=os.getenv("ANTHROPIC_API_KEY")), llm=Anthropic(anthropic_api_key=os.getenv("ANTHROPIC_API_KEY")),
max_loops="auto", max_loops="auto",
autosave=True, autosave=True,
@ -15,33 +17,29 @@ agent = Agent(
verbose=True, verbose=True,
streaming_on=True, streaming_on=True,
# interactive=True, # Set to False to disable interactive mode # interactive=True, # Set to False to disable interactive mode
saved_state_path="accounting_agent.json", dynamic_temperature_enabled=True,
# tools=[ saved_state_path="finance_agent.json",
# # calculate_profit, # tools=[Add your functions here# ],
# # generate_report, # stopping_token="Stop!",
# # search_knowledge_base, # interactive=True,
# # write_memory_to_rag, # docs_folder="docs", # Enter your folder name
# # search_knowledge_base, # pdf_path="docs/finance_agent.pdf",
# # generate_speech,
# ],
stopping_token="Stop!",
interactive=True,
# docs_folder="docs",
# pdf_path="docs/accounting_agent.pdf",
# sop="Calculate the profit for a company.", # sop="Calculate the profit for a company.",
# sop_list=["Calculate the profit for a company."], # sop_list=["Calculate the profit for a company."],
# user_name="User", user_name="swarms_corp",
# # docs= # # docs=
# # docs_folder="docs", # # docs_folder="docs",
# retry_attempts=3, retry_attempts=3,
# context_length=1000, # context_length=1000,
# tool_schema = dict # tool_schema = dict
context_length=1000, context_length=200000,
# agent_ops_on=True, # agent_ops_on=True,
# tree_of_thoughts=True,
# long_term_memory=ChromaDB(docs_folder="artifacts"), # long_term_memory=ChromaDB(docs_folder="artifacts"),
) )
contract = data_to_text("your_contract_pdf.pdf")
agent.run( agent.run(
"Search the knowledge base for the swarms github framework and how it works" f"Analyze the following contract and give me a full summary: {contract}"
) )

@ -0,0 +1,78 @@
import os
from swarms import Agent, Anthropic, MultiAgentCollaboration
from swarms.prompts.finance_agent_sys_prompt import (
FINANCIAL_AGENT_SYS_PROMPT,
)
# Initialize the agent
fiancial_analyst = Agent(
agent_name="Financial-Analysis-Agent",
system_prompt=FINANCIAL_AGENT_SYS_PROMPT,
llm=Anthropic(anthropic_api_key=os.getenv("ANTHROPIC_API_KEY")),
max_loops="auto",
autosave=True,
# dynamic_temperature_enabled=True,
dashboard=False,
verbose=True,
streaming_on=True,
# interactive=True, # Set to False to disable interactive mode
dynamic_temperature_enabled=True,
saved_state_path="finance_agent.json",
# tools=[Add your functions here# ],
# stopping_token="Stop!",
# interactive=True,
# docs_folder="docs", # Enter your folder name
# pdf_path="docs/finance_agent.pdf",
# sop="Calculate the profit for a company.",
# sop_list=["Calculate the profit for a company."],
user_name="swarms_corp",
# # docs=
# # docs_folder="docs",
retry_attempts=3,
# context_length=1000,
# tool_schema = dict
context_length=200000,
# agent_ops_on=True,
# long_term_memory=ChromaDB(docs_folder="artifacts"),
)
# Initialize the agent
fiancial_director = Agent(
agent_name="Financial-Analysis-Agent",
system_prompt="Your the financial director"
+ FINANCIAL_AGENT_SYS_PROMPT,
llm=Anthropic(anthropic_api_key=os.getenv("ANTHROPIC_API_KEY")),
max_loops="auto",
autosave=True,
# dynamic_temperature_enabled=True,
dashboard=False,
verbose=True,
streaming_on=True,
# interactive=True, # Set to False to disable interactive mode
dynamic_temperature_enabled=True,
saved_state_path="finance_agent.json",
# tools=[Add your functions here# ],
# stopping_token="Stop!",
# interactive=True,
# docs_folder="docs", # Enter your folder name
# pdf_path="docs/finance_agent.pdf",
# sop="Calculate the profit for a company.",
# sop_list=["Calculate the profit for a company."],
user_name="swarms_corp",
# # docs=
# # docs_folder="docs",
retry_attempts=3,
# context_length=1000,
# tool_schema = dict
context_length=200000,
# agent_ops_on=True,
# long_term_memory=ChromaDB(docs_folder="artifacts"),
)
swarm = MultiAgentCollaboration(
agents=[fiancial_analyst, fiancial_director],
select_next_speaker="longest_response",
max_loops=10,
)

@ -96,7 +96,7 @@ agent = Agent(
# long_term_memory=chromadb, # long_term_memory=chromadb,
metadata_output_type="json", metadata_output_type="json",
# List of schemas that the agent can handle # List of schemas that the agent can handle
# list_tool_schemas=[tool_schema], # list_base_models=[tool_schema],
function_calling_format_type="OpenAI", function_calling_format_type="OpenAI",
function_calling_type="json", # or soon yaml function_calling_type="json", # or soon yaml
) )

@ -0,0 +1,17 @@
from swarms import Artifact
# Example usage
artifact = Artifact(file_path="example.txt", file_type=".txt")
artifact.create("Initial content")
artifact.edit("First edit")
artifact.edit("Second edit")
artifact.save()
# Export to JSON
artifact.export_to_json("artifact.json")
# Import from JSON
imported_artifact = Artifact.import_from_json("artifact.json")
# # Get metrics
print(artifact.get_metrics())

@ -189,7 +189,7 @@ agent = Agent(
agent_name="Account Management Agent", agent_name="Account Management Agent",
system_prompt=ACCOUNT_MANAGEMENT_SYSTEM_PROMPT, system_prompt=ACCOUNT_MANAGEMENT_SYSTEM_PROMPT,
# sop_list=[GLOSSARY_PROMPTS, FEW_SHORT_PROMPTS], # sop_list=[GLOSSARY_PROMPTS, FEW_SHORT_PROMPTS],
# sop=list_tool_schemas_json, # sop=list_base_models_json,
llm=llama3Hosted( llm=llama3Hosted(
max_tokens=3000, max_tokens=3000,
), ),

@ -31,7 +31,7 @@ agent = Agent(
# autosave=True, # autosave=True,
dashboard=False, dashboard=False,
verbose=True, verbose=True,
# sop=list_tool_schemas_json, # sop=list_base_models_json,
# sop_list=[ # sop_list=[
# prep_weather_tool_prompt # prep_weather_tool_prompt
# ], # Set the output type to the tool schema which is a BaseModel # ], # Set the output type to the tool schema which is a BaseModel
@ -48,7 +48,7 @@ agent = Agent(
agent2 = Agent( agent2 = Agent(
agent_name="Space Traffic Controller Agent", agent_name="Space Traffic Controller Agent",
system_prompt=SPACE_TRAFFIC_CONTROLLER_SYS_PROMPT, system_prompt=SPACE_TRAFFIC_CONTROLLER_SYS_PROMPT,
# sop=list_tool_schemas_json, # sop=list_base_models_json,
llm=llama3Hosted(), llm=llama3Hosted(),
max_loops=1, max_loops=1,
# autosave=True, # autosave=True,

@ -196,7 +196,7 @@
" output_type=tool_schema, # or dict, or str\n", " output_type=tool_schema, # or dict, or str\n",
" metadata_output_type=\"json\",\n", " metadata_output_type=\"json\",\n",
" # List of schemas that the agent can handle\n", " # List of schemas that the agent can handle\n",
" list_tool_schemas=[tool_schema],\n", " list_base_models=[tool_schema],\n",
" function_calling_format_type=\"OpenAI\",\n", " function_calling_format_type=\"OpenAI\",\n",
" function_calling_type=\"json\", # or soon yaml\n", " function_calling_type=\"json\", # or soon yaml\n",
")" ")"

@ -330,7 +330,7 @@ for character_name, character_system_message, bidding_template in zip(
) )
) )
max_iters = 10 max_loops = 10
n = 0 n = 0
simulator = DialogueSimulator( simulator = DialogueSimulator(
@ -341,7 +341,7 @@ simulator.inject("Debate Moderator", specified_topic)
print(f"(Debate Moderator): {specified_topic}") print(f"(Debate Moderator): {specified_topic}")
print("\n") print("\n")
while n < max_iters: while n < max_loops:
name, message = simulator.step() name, message = simulator.step()
print(f"({name}): {message}") print(f"({name}): {message}")
print("\n") print("\n")

@ -404,7 +404,7 @@
" output_type=tool_schema, # or dict, or str\n", " output_type=tool_schema, # or dict, or str\n",
" metadata_output_type=\"json\",\n", " metadata_output_type=\"json\",\n",
" # List of schemas that the agent can handle\n", " # List of schemas that the agent can handle\n",
" list_tool_schemas=[tool_schema],\n", " list_base_models=[tool_schema],\n",
" function_calling_format_type=\"OpenAI\",\n", " function_calling_format_type=\"OpenAI\",\n",
" function_calling_type=\"json\", # or soon yaml\n", " function_calling_type=\"json\", # or soon yaml\n",
")\n", ")\n",

@ -0,0 +1,83 @@
from swarms.tools.tool_parse_exec import parse_and_execute_json
# Example functions to be called
def add(a: int, b: int) -> int:
"""
Adds two integers and returns the result.
Parameters:
a (int): The first integer.
b (int): The second integer.
Returns:
int: The sum of the two integers.
"""
return a + b
def subtract(a: int, b: int) -> int:
"""
Subtracts two integers and returns the result.
Parameters:
a (int): The first integer.
b (int): The second integer.
Returns:
int: The difference between the two integers.
"""
return a - b
def multiply(a: int, b: int) -> int:
"""
Multiply two numbers.
Args:
a (int): The first number.
b (int): The second number.
Returns:
int: The product of the two numbers.
"""
return a * b
# Example usage
functions_list = [add, subtract, multiply]
json_input = """
{
"function": [
{"name": "add", "parameters": {"a": 10, "b": 5}},
{"name": "subtract", "parameters": {"a": 10, "b": 5}},
{"name": "multiply", "parameters": {"a": 10, "b": 5}}
]
}
"""
json_input_single = """
{
"function": {"name": "add", "parameters": {"a": 10, "b": 5}}
}
"""
# Testing multiple functions
results_multiple = parse_and_execute_json(
functions=functions_list,
json_string=json_input,
parse_md=False,
verbose=True,
)
print("Multiple functions results:\n", results_multiple)
# Testing single function
results_single = parse_and_execute_json(
functions=functions_list,
json_string=json_input_single,
parse_md=False,
verbose=True,
)
print("Single function result:\n", results_single)

@ -5,7 +5,7 @@ build-backend = "poetry.core.masonry.api"
[tool.poetry] [tool.poetry]
name = "swarms" name = "swarms"
version = "5.3.7" version = "5.3.9"
description = "Swarms - Pytorch" description = "Swarms - Pytorch"
license = "MIT" license = "MIT"
authors = ["Kye Gomez <kye@apac.ai>"] authors = ["Kye Gomez <kye@apac.ai>"]
@ -24,11 +24,12 @@ keywords = [
"transformers", "transformers",
"multi-agent", "multi-agent",
"swarms of agents", "swarms of agents",
"Enterprise-Grade", "Enterprise-Grade Agents",
"Production-Grade", "Production-Grade Agents",
"Agents", "Agents",
"Multi-Grade-Agents", "Multi-Grade-Agents",
"Swarms", "Swarms",
"Transformers",
] ]
classifiers = [ classifiers = [

@ -1,10 +1,11 @@
from swarms.artifacts.base_artifact import BaseArtifact from swarms.artifacts.base_artifact import BaseArtifact
from swarms.artifacts.text_artifact import TextArtifact from swarms.artifacts.text_artifact import TextArtifact
from swarms.artifacts.main_artifact import Artifact
# from swarms.artifacts.claude_like_artifact import Artifact # from swarms.artifacts.claude_like_artifact import Artifact
__all__ = [ __all__ = [
"BaseArtifact", "BaseArtifact",
"TextArtifact", "TextArtifact",
# "Artifact", "Artifact",
] ]

@ -0,0 +1,239 @@
from swarms.utils.loguru_logger import logger
import os
import json
from typing import List, Union, Dict, Any
from pydantic.v1 import BaseModel, Field, validator
from datetime import datetime
class FileVersion(BaseModel):
"""
Represents a version of the file with its content and timestamp.
"""
version_number: int
content: str
timestamp: datetime
def __str__(self) -> str:
return f"Version {self.version_number} (Timestamp: {self.timestamp}):\n{self.content}"
class Artifact(BaseModel):
"""
Represents a file artifact.
Attributes:
file_path (str): The path to the file.
file_type (str): The type of the file.
contents (str): The contents of the file.
versions (List[FileVersion]): The list of file versions.
edit_count (int): The number of times the file has been edited.
"""
file_path: str
file_type: str
contents: str = Field(default="")
versions: List[FileVersion] = Field(default_factory=list)
edit_count: int = Field(default=0)
@validator("file_type", pre=True, always=True)
def validate_file_type(cls, v, values):
if not v:
file_path = values.get("file_path")
_, ext = os.path.splitext(file_path)
if ext.lower() not in [
".py",
".csv",
".txt",
".json",
".xml",
".html",
".yaml",
".yml",
".md",
".rst",
".log",
".sh",
".bat",
".ps1",
".psm1",
".psd1",
".ps1xml",
".pssc",
".reg",
".mof",
".mfl",
".xaml",
".xml",
".wsf",
".config",
".ini",
".inf",
".json5",
".hcl",
".tf",
".tfvars",
".tsv",
".properties",
]:
raise ValueError("Unsupported file type")
return ext.lower()
return v
def create(self, initial_content: str) -> None:
"""
Creates a new file artifact with the initial content.
"""
try:
self.contents = initial_content
self.versions.append(
FileVersion(
version_number=1,
content=initial_content,
timestamp=datetime.now(),
)
)
self.edit_count = 0
except Exception as e:
logger.error(f"Error creating artifact: {e}")
raise e
def edit(self, new_content: str) -> None:
"""
Edits the artifact's content, tracking the change in the version history.
"""
try:
self.contents = new_content
self.edit_count += 1
new_version = FileVersion(
version_number=len(self.versions) + 1,
content=new_content,
timestamp=datetime.now(),
)
self.versions.append(new_version)
except Exception as e:
logger.error(f"Error editing artifact: {e}")
raise e
def save(self) -> None:
"""
Saves the current artifact's contents to the specified file path.
"""
with open(self.file_path, "w") as f:
f.write(self.contents)
def load(self) -> None:
"""
Loads the file contents from the specified file path into the artifact.
"""
with open(self.file_path, "r") as f:
self.contents = f.read()
self.create(self.contents)
def get_version(self, version_number: int) -> Union[FileVersion, None]:
"""
Retrieves a specific version of the artifact by its version number.
"""
for version in self.versions:
if version.version_number == version_number:
return version
return None
def get_contents(self) -> str:
"""
Returns the current contents of the artifact as a string.
"""
return self.contents
def get_version_history(self) -> str:
"""
Returns the version history of the artifact as a formatted string.
"""
return "\n\n".join([str(version) for version in self.versions])
def export_to_json(self, file_path: str) -> None:
"""
Exports the artifact to a JSON file.
Args:
file_path (str): The path to the JSON file where the artifact will be saved.
"""
with open(file_path, "w") as json_file:
json.dump(self.dict(), json_file, default=str, indent=4)
@classmethod
def import_from_json(cls, file_path: str) -> "Artifact":
"""
Imports an artifact from a JSON file.
Args:
file_path (str): The path to the JSON file to import the artifact from.
Returns:
Artifact: The imported artifact instance.
"""
with open(file_path, "r") as json_file:
data = json.load(json_file)
# Convert timestamp strings back to datetime objects
for version in data["versions"]:
version["timestamp"] = datetime.fromisoformat(
version["timestamp"]
)
return cls(**data)
def get_metrics(self) -> str:
"""
Returns all metrics of the artifact as a formatted string.
Returns:
str: A string containing all metrics of the artifact.
"""
metrics = (
f"File Path: {self.file_path}\n"
f"File Type: {self.file_type}\n"
f"Current Contents:\n{self.contents}\n\n"
f"Edit Count: {self.edit_count}\n"
f"Version History:\n{self.get_version_history()}"
)
return metrics
def to_dict(self) -> Dict[str, Any]:
"""
Converts the artifact instance to a dictionary representation.
"""
return self.dict()
@classmethod
def from_dict(cls, data: Dict[str, Any]) -> "Artifact":
"""
Creates an artifact instance from a dictionary representation.
"""
try:
# Convert timestamp strings back to datetime objects if necessary
for version in data.get("versions", []):
if isinstance(version["timestamp"], str):
version["timestamp"] = datetime.fromisoformat(
version["timestamp"]
)
return cls(**data)
except Exception as e:
logger.error(f"Error creating artifact from dict: {e}")
raise e
# # Example usage
# artifact = Artifact(file_path="example.txt", file_type=".txt")
# artifact.create("Initial content")
# artifact.edit("First edit")
# artifact.edit("Second edit")
# artifact.save()
# # Export to JSON
# artifact.export_to_json("artifact.json")
# # Import from JSON
# imported_artifact = Artifact.import_from_json("artifact.json")
# # # Get metrics
# print(artifact.get_metrics())

@ -45,7 +45,7 @@ from swarms.structs.round_robin import RoundRobinSwarm
from swarms.structs.sequential_workflow import SequentialWorkflow from swarms.structs.sequential_workflow import SequentialWorkflow
# New Swarms # New Swarms
from swarms.structs.swarm_load_balancer import AgentLoadBalancer # from swarms.structs.swarm_load_balancer import AgentLoadBalancer
# from swarms.structs.swarm_net import SwarmNetwork # from swarms.structs.swarm_net import SwarmNetwork
from swarms.structs.swarming_architectures import ( from swarms.structs.swarming_architectures import (
@ -167,7 +167,7 @@ __all__ = [
"rearrange", "rearrange",
"RoundRobinSwarm", "RoundRobinSwarm",
"HiearchicalSwarm", "HiearchicalSwarm",
"AgentLoadBalancer", # "AgentLoadBalancer",
"MixtureOfAgents", "MixtureOfAgents",
"GraphWorkflow", "GraphWorkflow",
"Node", "Node",

@ -1,14 +1,57 @@
import json from typing import List, Callable
import random
from typing import List
import tenacity
from swarms.structs.agent import Agent from swarms.structs.agent import Agent
from swarms.utils.logger import logger from swarms.utils.logger import logger
from swarms.structs.base_swarm import BaseSwarm from swarms.structs.base_swarm import BaseSwarm
from swarms.structs.conversation import Conversation
# [TODO]: Add type hints # def select_next_speaker_bid(
# step: int,
# agents: List[Agent],
# ) -> int:
# """Selects the next speaker."""
# bids = []
# for agent in agents:
# bid = ask_for_bid(agent)
# bids.append(bid)
# max_value = max(bids)
# max_indices = [i for i, x in enumerate(bids) if x == max_value]
# idx = random.choice(max_indices)
# return idx
def select_next_speaker_roundtable(step: int, agents: List[Agent]) -> int:
"""Selects the next speaker."""
return step % len(agents)
def select_next_speaker_director(
step: int, agents: List[Agent], director: Agent
) -> int:
# if the step if even => director
# => director selects next speaker
if step % 2 == 1:
idx = 0
else:
idx = director.select_next_speaker() + 1
return idx
def run_director(self, task: str):
"""Runs the multi-agent collaboration with a director."""
n = 0
self.reset()
self.inject("Debate Moderator", task)
print("(Debate Moderator): \n")
while n < self.max_loops:
name, message = self.step()
print(f"({name}): {message}\n")
n += 1
# [MAYBE]: Add type hints
class MultiAgentCollaboration(BaseSwarm): class MultiAgentCollaboration(BaseSwarm):
""" """
Multi-agent collaboration class. Multi-agent collaboration class.
@ -17,7 +60,7 @@ class MultiAgentCollaboration(BaseSwarm):
agents (List[Agent]): The agents in the collaboration. agents (List[Agent]): The agents in the collaboration.
selection_function (callable): The function that selects the next speaker. selection_function (callable): The function that selects the next speaker.
Defaults to select_next_speaker. Defaults to select_next_speaker.
max_iters (int): The maximum number of iterations. Defaults to 10. max_loops (int): The maximum number of iterations. Defaults to 10.
autosave (bool): Whether to autosave the state of all agents. Defaults to True. autosave (bool): Whether to autosave the state of all agents. Defaults to True.
saved_file_path_name (str): The path to the saved file. Defaults to saved_file_path_name (str): The path to the saved file. Defaults to
"multi_agent_collab.json". "multi_agent_collab.json".
@ -59,7 +102,7 @@ class MultiAgentCollaboration(BaseSwarm):
>>> # Initialize the multi-agent collaboration >>> # Initialize the multi-agent collaboration
>>> swarm = MultiAgentCollaboration( >>> swarm = MultiAgentCollaboration(
>>> agents=[agent], >>> agents=[agent],
>>> max_iters=4, >>> max_loops=4,
>>> ) >>> )
>>> >>>
>>> # Run the multi-agent collaboration >>> # Run the multi-agent collaboration
@ -76,8 +119,8 @@ class MultiAgentCollaboration(BaseSwarm):
description: str = "A multi-agent collaboration.", description: str = "A multi-agent collaboration.",
director: Agent = None, director: Agent = None,
agents: List[Agent] = None, agents: List[Agent] = None,
select_next_speaker: callable = None, select_next_speaker: Callable = None,
max_iters: int = 10, max_loops: int = 10,
autosave: bool = True, autosave: bool = True,
saved_file_path_name: str = "multi_agent_collab.json", saved_file_path_name: str = "multi_agent_collab.json",
stopping_token: str = "<DONE>", stopping_token: str = "<DONE>",
@ -92,7 +135,7 @@ class MultiAgentCollaboration(BaseSwarm):
self.agents = agents self.agents = agents
self.select_next_speaker = select_next_speaker self.select_next_speaker = select_next_speaker
self._step = 0 self._step = 0
self.max_iters = max_iters self.max_loops = max_loops
self.autosave = autosave self.autosave = autosave
self.saved_file_path_name = saved_file_path_name self.saved_file_path_name = saved_file_path_name
self.stopping_token = stopping_token self.stopping_token = stopping_token
@ -100,150 +143,90 @@ class MultiAgentCollaboration(BaseSwarm):
self.logger = logger self.logger = logger
self.logging = logging self.logging = logging
# Conversation
self.conversation = Conversation(
time_enabled=True, *args, **kwargs
)
def default_select_next_speaker(
self, step: int, agents: List[Agent]
) -> int:
"""Default speaker selection function."""
return step % len(agents)
def inject(self, name: str, message: str): def inject(self, name: str, message: str):
"""Injects a message into the multi-agent collaboration.""" """Injects a message into the multi-agent collaboration."""
for agent in self.agents: for agent in self.agents:
agent.run(f"Name {name} and message: {message}") self.conversation.add(name, message)
agent.run(self.conversation.return_history_as_string())
self._step += 1 self._step += 1
def step(self) -> tuple[str, str]: def step(self) -> str:
"""Steps through the multi-agent collaboration.""" """Steps through the multi-agent collaboration."""
speaker_idx = self.select_next_speaker(self._step, self.agents) speaker_idx = self.select_next_speaker(self._step, self.agents)
speaker = self.agents[speaker_idx] speaker = self.agents[speaker_idx]
message = speaker.send() message = speaker.send()
for receiver in self.agents: for receiver in self.agents:
receiver.receive(speaker.name, message) self.conversation.add(speaker.name, message)
receiver.run(self.conversation.return_history_as_string())
self._step += 1 self._step += 1
if self.logging: if self.logging:
self.log_step(speaker, message) self.log_step(speaker, message)
return speaker.name, message return self.conversation.return_history_as_string()
def log_step(self, speaker: str, response: str): def log_step(self, speaker: str, response: str):
"""Logs the step of the multi-agent collaboration.""" """Logs the step of the multi-agent collaboration."""
self.logger.info(f"{speaker.name}: {response}") self.logger.info(f"{speaker.name}: {response}")
@tenacity.retry(
stop=tenacity.stop_after_attempt(10),
wait=tenacity.wait_none(),
retry=tenacity.retry_if_exception_type(ValueError),
before_sleep=lambda retry_state: print(
f"ValueError occured: {retry_state.outcome.exception()},"
" retying..."
),
retry_error_callback=lambda retry_state: 0,
)
def select_next_speaker_bid(
self,
step: int,
agents: List[Agent],
) -> int:
"""Selects the next speaker."""
bids = []
for agent in agents:
bid = self.ask_for_bid(agent)
bids.append(bid)
max_value = max(bids)
max_indices = [i for i, x in enumerate(bids) if x == max_value]
idx = random.choice(max_indices)
return idx
@tenacity.retry(
stop=tenacity.stop_after_attempt(10),
wait=tenacity.wait_none(),
retry=tenacity.retry_if_exception_type(ValueError),
before_sleep=lambda retry_state: print(
f"ValueError occured: {retry_state.outcome.exception()},"
" retying..."
),
retry_error_callback=lambda retry_state: 0,
)
def run_director(self, task: str):
"""Runs the multi-agent collaboration."""
n = 0
self.reset()
self.inject("Debate Moderator")
print("(Debate Moderator): ")
print("\n")
while n < self.max_iters:
name, message = self.step()
print(f"({name}): {message}")
print("\n")
n += 1
def select_next_speaker_roundtable(
self, step: int, agents: List[Agent]
) -> int:
"""Selects the next speaker."""
return step % len(agents)
def select_next_speaker_director(
step: int, agents: List[Agent], director
) -> int:
# if the step if even => director
# => director selects next speaker
if step % 2 == 1:
idx = 0
else:
idx = director.select_next_speaker() + 1
return idx
def run(self, task: str, *args, **kwargs): def run(self, task: str, *args, **kwargs):
# [TODO]: Add type hints """Runs the multi-agent collaboration."""
# [TODO]: Implement the run method using step method for _ in range(self.max_loops):
conversation = task result = self.step()
for _ in range(self.max_iters):
for agent in self.agents:
result = agent.run(conversation, *args, **kwargs)
self.results.append({"agent": agent, "response": result})
conversation += result
if self.autosave: if self.autosave:
self.save_state() self.save_state()
if result == self.stopping_token: if self.stopping_token in result:
break break
return self.conversation.return_history_as_string()
return self.results
# def format_results(self, results):
def format_results(self, results): # """Formats the results of the run method"""
"""Formats the results of the run method""" # formatted_results = "\n".join(
formatted_results = "\n".join( # [
[ # f"{result['agent']} responded: {result['response']}"
f"{result['agent']} responded: {result['response']}" # for result in results
for result in results # ]
] # )
) # return formatted_results
return formatted_results
# def save(self):
def save(self): # """Saves the state of all agents."""
"""Saves the state of all agents.""" # state = {
state = { # "step": self._step,
"step": self._step, # "results": [
"results": [ # {"agent": r["agent"].name, "response": r["response"]}
{"agent": r["agent"].name, "response": r["response"]} # for r in self.results
for r in self.results # ],
], # }
}
# with open(self.saved_file_path_name, "w") as file:
with open(self.saved_file_path_name, "w") as file: # json.dump(state, file)
json.dump(state, file)
# def load(self):
def load(self): # """Loads the state of all agents."""
"""Loads the state of all agents.""" # with open(self.saved_file_path_name) as file:
with open(self.saved_file_path_name) as file: # state = json.load(file)
state = json.load(file) # self._step = state["step"]
self._step = state["step"] # self.results = state["results"]
self.results = state["results"] # return state
return state
# def __repr__(self):
def __repr__(self): # return (
return ( # f"MultiAgentCollaboration(agents={self.agents},"
f"MultiAgentCollaboration(agents={self.agents}," # f" selection_function={self.select_next_speaker},"
f" selection_function={self.select_next_speaker}," # f" max_loops={self.max_loops}, autosave={self.autosave},"
f" max_iters={self.max_iters}, autosave={self.autosave}," # f" saved_file_path_name={self.saved_file_path_name})"
f" saved_file_path_name={self.saved_file_path_name})" # )
)

@ -2,6 +2,7 @@ from typing import Any, List
from docstring_parser import parse from docstring_parser import parse
from pydantic import BaseModel from pydantic import BaseModel
from swarms.utils.loguru_logger import logger
def _remove_a_key(d: dict, remove_key: str) -> None: def _remove_a_key(d: dict, remove_key: str) -> None:
@ -14,6 +15,24 @@ def _remove_a_key(d: dict, remove_key: str) -> None:
_remove_a_key(d[key], remove_key) _remove_a_key(d[key], remove_key)
def check_pydantic_name(pydantic_type: type[BaseModel]) -> str:
"""
Check the name of the Pydantic model.
Args:
pydantic_type (type[BaseModel]): The Pydantic model type to check.
Returns:
str: The name of the Pydantic model.
"""
try:
return type(pydantic_type).__name__
except AttributeError as error:
logger.error(f"The Pydantic model does not have a name. {error}")
raise error
def base_model_to_openai_function( def base_model_to_openai_function(
pydantic_type: type[BaseModel], pydantic_type: type[BaseModel],
output_str: bool = False, output_str: bool = False,
@ -30,6 +49,9 @@ def base_model_to_openai_function(
""" """
schema = pydantic_type.model_json_schema() schema = pydantic_type.model_json_schema()
# Fetch the name of the class
name = type(pydantic_type).__name__
docstring = parse(pydantic_type.__doc__ or "") docstring = parse(pydantic_type.__doc__ or "")
parameters = { parameters = {
k: v k: v
@ -51,7 +73,7 @@ def base_model_to_openai_function(
schema["description"] = docstring.short_description schema["description"] = docstring.short_description
else: else:
schema["description"] = ( schema["description"] = (
f"Correctly extracted `{pydantic_type.__name__}` with all " f"Correctly extracted `{name}` with all "
f"the required parameters with correct types" f"the required parameters with correct types"
) )
@ -61,11 +83,11 @@ def base_model_to_openai_function(
if output_str: if output_str:
out = { out = {
"function_call": { "function_call": {
"name": pydantic_type.__name__, "name": name,
}, },
"functions": [ "functions": [
{ {
"name": pydantic_type.__name__, "name": name,
"description": schema["description"], "description": schema["description"],
"parameters": parameters, "parameters": parameters,
}, },
@ -76,11 +98,11 @@ def base_model_to_openai_function(
else: else:
return { return {
"function_call": { "function_call": {
"name": pydantic_type.__name__, "name": name,
}, },
"functions": [ "functions": [
{ {
"name": pydantic_type.__name__, "name": name,
"description": schema["description"], "description": schema["description"],
"parameters": parameters, "parameters": parameters,
}, },

@ -1,6 +1,7 @@
from typing import List
import json import json
import loguru from typing import List
from swarms.utils.loguru_logger import logger
from swarms.utils.parse_code import extract_code_from_markdown from swarms.utils.parse_code import extract_code_from_markdown
@ -28,7 +29,6 @@ def parse_and_execute_json(
# Create a dictionary that maps function names to functions # Create a dictionary that maps function names to functions
function_dict = {func.__name__: func for func in functions} function_dict = {func.__name__: func for func in functions}
loguru.logger.info(f"Extracted code: {json_string}")
data = json.loads(json_string) data = json.loads(json_string)
function_list = data.get("functions", []) function_list = data.get("functions", [])
@ -41,14 +41,163 @@ def parse_and_execute_json(
if function_name in function_dict: if function_name in function_dict:
# Call the function with the parsed parameters # Call the function with the parsed parameters
result = function_dict[function_name](**parameters) result = function_dict[function_name](**parameters)
results[function_name] = result results[function_name] = str(result)
else: else:
loguru.logger.warning(
f"No function named '{function_name}' found."
)
results[function_name] = None results[function_name] = None
return results return results
except Exception as e: except Exception as e:
loguru.logger.error(f"Error: {e}") logger.error(f"Error parsing and executing JSON: {e}")
return None return None
# def parse_and_execute_json(
# functions: List[Callable[..., Any]],
# json_string: str = None,
# parse_md: bool = False,
# verbose: bool = False,
# ) -> Dict[str, Any]:
# """
# Parses and executes a JSON string containing function names and parameters.
# Args:
# functions (List[Callable]): A list of callable functions.
# json_string (str): The JSON string to parse and execute.
# parse_md (bool): Flag indicating whether to extract code from Markdown.
# verbose (bool): Flag indicating whether to enable verbose logging.
# Returns:
# Dict[str, Any]: A dictionary containing the results of executing the functions with the parsed parameters.
# """
# if parse_md:
# json_string = extract_code_from_markdown(json_string)
# logger.info("Number of functions: " + str(len(functions)))
# try:
# # Create a dictionary that maps function names to functions
# function_dict = {func.__name__: func for func in functions}
# data = json.loads(json_string)
# function_list = data.get("functions") or [data.get("function")]
# # Ensure function_list is a list and filter out None values
# if isinstance(function_list, dict):
# function_list = [function_list]
# else:
# function_list = [f for f in function_list if f]
# results = {}
# # Determine if concurrency is needed
# concurrency = len(function_list) > 1
# if concurrency:
# with concurrent.futures.ThreadPoolExecutor() as executor:
# future_to_function = {
# executor.submit(
# execute_and_log_function,
# function_dict,
# function_data,
# verbose,
# ): function_data
# for function_data in function_list
# }
# for future in concurrent.futures.as_completed(
# future_to_function
# ):
# function_data = future_to_function[future]
# try:
# result = future.result()
# results.update(result)
# except Exception as e:
# if verbose:
# logger.error(
# f"Error executing function {function_data.get('name')}: {e}"
# )
# results[function_data.get("name")] = None
# else:
# for function_data in function_list:
# function_name = function_data.get("name")
# parameters = function_data.get("parameters")
# if verbose:
# logger.info(
# f"Executing function: {function_name} with parameters: {parameters}"
# )
# if function_name in function_dict:
# try:
# result = function_dict[function_name](**parameters)
# results[function_name] = str(result)
# if verbose:
# logger.info(
# f"Result for function {function_name}: {result}"
# )
# except Exception as e:
# if verbose:
# logger.error(
# f"Error executing function {function_name}: {e}"
# )
# results[function_name] = None
# else:
# if verbose:
# logger.warning(
# f"Function {function_name} not found."
# )
# results[function_name] = None
# # Merge all results into a single string
# merged_results = "\n".join(
# f"{key}: {value}" for key, value in results.items()
# )
# return {"merged_results": merged_results}
# except Exception as e:
# logger.error(f"Error parsing and executing JSON: {e}")
# return None
# def execute_and_log_function(
# function_dict: Dict[str, Callable],
# function_data: Dict[str, Any],
# verbose: bool,
# ) -> Dict[str, Any]:
# """
# Executes a function from a given dictionary of functions and logs the execution details.
# Args:
# function_dict (Dict[str, Callable]): A dictionary containing the available functions.
# function_data (Dict[str, Any]): A dictionary containing the function name and parameters.
# verbose (bool): A flag indicating whether to log the execution details.
# Returns:
# Dict[str, Any]: A dictionary containing the function name and its result.
# """
# function_name = function_data.get("name")
# parameters = function_data.get("parameters")
# if verbose:
# logger.info(
# f"Executing function: {function_name} with parameters: {parameters}"
# )
# if function_name in function_dict:
# try:
# result = function_dict[function_name](**parameters)
# if verbose:
# logger.info(
# f"Result for function {function_name}: {result}"
# )
# return {function_name: str(result)}
# except Exception as e:
# if verbose:
# logger.error(
# f"Error executing function {function_name}: {e}"
# )
# return {function_name: None}
# else:
# if verbose:
# logger.warning(f"Function {function_name} not found.")
# return {function_name: None}

@ -0,0 +1,101 @@
import pytest
from datetime import datetime
from swarms.artifacts.artifact_base import Artifact, FileVersion
def test_file_version():
version = FileVersion(
version_number=1,
content="Initial content",
timestamp=datetime.now(),
)
assert version.version_number == 1
assert version.content == "Initial content"
def test_artifact_creation():
artifact = Artifact(file_path="test.txt", file_type=".txt")
assert artifact.file_path == "test.txt"
assert artifact.file_type == ".txt"
assert artifact.contents == ""
assert artifact.versions == []
assert artifact.edit_count == 0
def test_artifact_create():
artifact = Artifact(file_path="test.txt", file_type=".txt")
artifact.create("Initial content")
assert artifact.contents == "Initial content"
assert len(artifact.versions) == 1
assert artifact.versions[0].content == "Initial content"
assert artifact.edit_count == 0
def test_artifact_edit():
artifact = Artifact(file_path="test.txt", file_type=".txt")
artifact.create("Initial content")
artifact.edit("First edit")
assert artifact.contents == "First edit"
assert len(artifact.versions) == 2
assert artifact.versions[1].content == "First edit"
assert artifact.edit_count == 1
def test_artifact_get_version():
artifact = Artifact(file_path="test.txt", file_type=".txt")
artifact.create("Initial content")
artifact.edit("First edit")
version = artifact.get_version(1)
assert version.content == "Initial content"
def test_artifact_get_contents():
artifact = Artifact(file_path="test.txt", file_type=".txt")
artifact.create("Initial content")
assert artifact.get_contents() == "Initial content"
def test_artifact_get_version_history():
artifact = Artifact(file_path="test.txt", file_type=".txt")
artifact.create("Initial content")
artifact.edit("First edit")
history = artifact.get_version_history()
assert "Version 1" in history
assert "Version 2" in history
def test_artifact_to_dict():
artifact = Artifact(file_path="test.txt", file_type=".txt")
artifact.create("Initial content")
artifact_dict = artifact.to_dict()
assert artifact_dict["file_path"] == "test.txt"
assert artifact_dict["file_type"] == ".txt"
assert artifact_dict["contents"] == "Initial content"
assert artifact_dict["edit_count"] == 0
def test_artifact_from_dict():
artifact_dict = {
"file_path": "test.txt",
"file_type": ".txt",
"contents": "Initial content",
"versions": [
{
"version_number": 1,
"content": "Initial content",
"timestamp": datetime.now().isoformat(),
}
],
"edit_count": 0,
}
artifact = Artifact.from_dict(artifact_dict)
assert artifact.file_path == "test.txt"
assert artifact.file_type == ".txt"
assert artifact.contents == "Initial content"
assert artifact.versions[0].content == "Initial content"
assert artifact.edit_count == 0
# Run the tests
if __name__ == "__main__":
pytest.main()

@ -54,7 +54,7 @@ def test_add_agents(agent_rearrange):
def test_validate_flow_valid(agent_rearrange): def test_validate_flow_valid(agent_rearrange):
assert agent_rearrange.validate_flow() == True assert agent_rearrange.validate_flow() is True
def test_validate_flow_invalid(agent_rearrange): def test_validate_flow_invalid(agent_rearrange):

@ -66,7 +66,7 @@ def collaboration():
def test_collaboration_initialization(collaboration): def test_collaboration_initialization(collaboration):
assert len(collaboration.agents) == 2 assert len(collaboration.agents) == 2
assert callable(collaboration.select_next_speaker) assert callable(collaboration.select_next_speaker)
assert collaboration.max_iters == 10 assert collaboration.max_loops == 10
assert collaboration.results == [] assert collaboration.results == []
assert collaboration.logging is True assert collaboration.logging is True
@ -113,7 +113,7 @@ def test_select_next_speaker(collaboration):
def test_run(collaboration): def test_run(collaboration):
collaboration.run() collaboration.run()
for agent in collaboration.agents: for agent in collaboration.agents:
assert agent.step == collaboration.max_iters assert agent.step == collaboration.max_loops
def test_format_results(collaboration): def test_format_results(collaboration):

@ -0,0 +1,30 @@
import os
import pandas as pd
# Specify the directory you want to use
directory = "emails"
# Create an empty DataFrame to store all data
all_data = pd.DataFrame(columns=["Email"])
# Loop over all files in the directory
for filename in os.listdir(directory):
# Check if the file is a .txt file
if filename.endswith(".txt"):
# Construct the full file path
filepath = os.path.join(directory, filename)
# Read the file into a pandas DataFrame
df = pd.read_csv(filepath, sep="\t", header=None)
# Rename the column
df.columns = ["Email"]
# Append the data to the all_data DataFrame
all_data = all_data._append(df, ignore_index=True)
# Construct the output file path
output_filepath = os.path.join(directory, "combined.csv")
# Write the DataFrame to a .csv file
all_data.to_csv(output_filepath, index=False)
Loading…
Cancel
Save