From a0075c369076351fd97ffcba21c9c3a3664ffeea Mon Sep 17 00:00:00 2001
From: Kye Gomez
Date: Tue, 2 Dec 2025 18:09:00 -0800
Subject: [PATCH] add agents in batches to graph workflow

---
 .../graph_workflow_basic.py                  |  65 +++---
 graph_workflow_basic.py                      |  48 +++++
 maker_example.py                             |  55 -----
 swarms/structs/graph_workflow.py             | 192 ++++++++++++------
 4 files changed, 208 insertions(+), 152 deletions(-)
 create mode 100644 graph_workflow_basic.py
 delete mode 100644 maker_example.py

diff --git a/examples/multi_agent/graphworkflow_examples/graph_workflow_basic.py b/examples/multi_agent/graphworkflow_examples/graph_workflow_basic.py
index afb3bd92..0f45f774 100644
--- a/examples/multi_agent/graphworkflow_examples/graph_workflow_basic.py
+++ b/examples/multi_agent/graphworkflow_examples/graph_workflow_basic.py
@@ -1,51 +1,44 @@
-#!/usr/bin/env python3
-"""
-Basic Graph Workflow Example
-
-A minimal example showing how to use GraphWorkflow with backend selection.
-"""
 from swarms.structs.graph_workflow import GraphWorkflow
 from swarms.structs.agent import Agent
 
-agent_one = Agent(agent_name="research_agent", model="gpt-4o-mini")
+agent_one = Agent(
+    agent_name="research_agent",
+    model_name="gpt-4o-mini",
+    name="Research Agent",
+    agent_description="Agent responsible for gathering and summarizing research information."
+)
 agent_two = Agent(
-    agent_name="research_agent_two", model="gpt-4o-mini"
+    agent_name="research_agent_two",
+    model_name="gpt-4o-mini",
+    name="Analysis Agent",
+    agent_description="Agent that analyzes the research data provided and processes insights."
 )
 agent_three = Agent(
-    agent_name="research_agent_three", model="gpt-4o-mini"
+    agent_name="research_agent_three",
+    model_name="gpt-4o-mini",
+    agent_description="Agent tasked with structuring analysis into a final report or output."
 )
 
+# Create workflow with backend selection
+workflow = GraphWorkflow(
+    name="Basic Example",
+    verbose=True,
+)
 
-def main():
-    """
-    Run a basic graph workflow example without print statements.
-    """
-    # Create agents
-
-    # Create workflow with backend selection
-    workflow = GraphWorkflow(
-        name="Basic Example",
-        verbose=True,
-    )
-
-    # Add agents to workflow
-    workflow.add_node(agent_one)
-    workflow.add_node(agent_two)
-    workflow.add_node(agent_three)
+workflow.add_nodes([agent_one, agent_two, agent_three])
 
-    # Create simple chain using the actual agent names
-    workflow.add_edge("research_agent", "research_agent_two")
-    workflow.add_edge("research_agent_two", "research_agent_three")
+# Create simple chain using the actual agent names
+workflow.add_edge("research_agent", "research_agent_two")
+workflow.add_edge("research_agent_two", "research_agent_three")
 
-    # Compile the workflow
-    workflow.compile()
+workflow.visualize()
 
-    # Run the workflow
-    task = "Complete a simple task"
-    results = workflow.run(task)
-    return results
+# Compile the workflow
+workflow.compile()
 
+# Run the workflow
+task = "Complete a simple task"
+results = workflow.run(task)
 
-if __name__ == "__main__":
-    main()
+print(results)
\ No newline at end of file
diff --git a/graph_workflow_basic.py b/graph_workflow_basic.py
new file mode 100644
index 00000000..d2876d04
--- /dev/null
+++ b/graph_workflow_basic.py
@@ -0,0 +1,48 @@
+
+from swarms.structs.graph_workflow import GraphWorkflow
+from swarms.structs.agent import Agent
+
+agent_one = Agent(
+    agent_name="research_agent",
+    model_name="claude-haiku-4-5",
+    top_p=None,
+    temperature=None,
+    agent_description="Agent responsible for gathering and summarizing research information."
+)
+agent_two = Agent(
+    agent_name="research_agent_two",
+    model_name="claude-haiku-4-5",
+    top_p=None,
+    temperature=None,
+    agent_description="Agent that analyzes the research data provided and processes insights."
+)
+agent_three = Agent(
+    agent_name="research_agent_three",
+    model_name="claude-haiku-4-5",
+    top_p=None,
+    temperature=None,
+    agent_description="Agent tasked with structuring analysis into a final report or output."
+)
+
+# Create workflow with backend selection
+workflow = GraphWorkflow(
+    name="Basic Example",
+    verbose=True,
+    backend="rustworkx",
+)
+
+agents = [agent_one, agent_two, agent_three]
+workflow.add_nodes(agents, batch_size=3)
+
+workflow.add_edge("research_agent", "research_agent_two")
+workflow.add_edge("research_agent_two", "research_agent_three")
+workflow.visualize()
+
+# Compile the workflow
+workflow.compile()
+
+# Run the workflow
+task = "Analyze the best mining companies in the US"
+results = workflow.run(task)
+
+print(results)
\ No newline at end of file
diff --git a/maker_example.py b/maker_example.py
deleted file mode 100644
index d8f6e062..00000000
--- a/maker_example.py
+++ /dev/null
@@ -1,55 +0,0 @@
-import re
-
-from swarms.structs.maker import MAKER
-
-
-# Define task-specific functions for a counting task
-def format_counting_prompt(
-    task, state, step_idx, previous_result
-):
-    """Format prompt for counting task."""
-    if previous_result is None:
-        return f"{task}\nThis is step 1. What is the first number? Reply with just the number."
-    return f"{task}\nThe previous number was {previous_result}. What is the next number? Reply with just the number."
-
-
-def parse_counting_response(response):
-    """Parse the counting response to extract the number."""
-    numbers = re.findall(r"\d+", response)
-    if numbers:
-        return int(numbers[0])
-    return response.strip()
-
-
-def validate_counting_response(response, max_tokens):
-    """Validate counting response."""
-    if len(response) > max_tokens * 4:
-        return False
-    return bool(re.search(r"\d+", response))
-
-
-# Create MAKER instance
-maker = MAKER(
-    name="CountingExample",
-    description="MAKER example: counting numbers",
-    model_name="gpt-4o-mini",
-    system_prompt="You are a helpful assistant. When asked to count, respond with just the number, nothing else.",
-    format_prompt=format_counting_prompt,
-    parse_response=parse_counting_response,
-    validate_response=validate_counting_response,
-    k=2,
-    max_tokens=100,
-    temperature=0.1,
-    verbose=True,
-)
-
-# Run the solver with the task as the main input
-results = maker.run(
-    task="Count from 1 to 10, one number at a time",
-    max_steps=5,
-)
-
-print(results)
-
-# Show statistics
-stats = maker.get_statistics()
diff --git a/swarms/structs/graph_workflow.py b/swarms/structs/graph_workflow.py
index d1a23594..99e3fb4b 100644
--- a/swarms/structs/graph_workflow.py
+++ b/swarms/structs/graph_workflow.py
@@ -1,10 +1,21 @@
 import asyncio
 import concurrent.futures
 import json
+import os
 import time
+import traceback
 import uuid
 from enum import Enum
-from typing import Any, Dict, Iterator, List, Optional, Set
+from typing import (
+    Any,
+    Dict,
+    Iterator,
+    List,
+    Optional,
+    Set,
+    Tuple,
+    Union,
+)
 
 import networkx as nx
 
@@ -596,12 +607,12 @@ class Node:
         )
 
     @classmethod
-    def from_agent(cls, agent, **kwargs):
+    def from_agent(cls, agent: Agent, **kwargs: Any) -> "Node":
         """
         Create a Node from an Agent object.
 
         Args:
-            agent: The agent to create a node from.
+            agent (Agent): The agent to create a node from.
             **kwargs: Additional keyword arguments.
 
         Returns:
@@ -644,13 +655,18 @@ class Edge:
         self.metadata = metadata or {}
 
     @classmethod
-    def from_nodes(cls, source_node, target_node, **kwargs):
+    def from_nodes(
+        cls,
+        source_node: Union["Node", Agent, str],
+        target_node: Union["Node", Agent, str],
+        **kwargs: Any,
+    ) -> "Edge":
         """
         Create an Edge from node objects or ids.
 
         Args:
-            source_node: Source node object or ID.
-            target_node: Target node object or ID.
+            source_node (Union[Node, Agent, str]): Source node object or ID.
+            target_node (Union[Node, Agent, str]): Target node object or ID.
             **kwargs: Additional keyword arguments.
 
         Returns:
@@ -844,7 +860,7 @@ class GraphWorkflow:
             "GraphWorkflow initialization completed successfully"
         )
 
-    def _invalidate_compilation(self):
+    def _invalidate_compilation(self) -> None:
         """
         Invalidate compiled optimizations when graph structure changes.
         Forces recompilation on next run to ensure cache coherency.
@@ -864,7 +880,7 @@ class GraphWorkflow:
             if self.verbose:
                 logger.debug("Cleared predecessors cache")
 
-    def compile(self):
+    def compile(self) -> None:
         """
         Pre-compute expensive operations for faster execution.
         Call this after building the graph structure.
@@ -932,7 +948,7 @@ class GraphWorkflow:
             )
             raise e
 
-    def add_node(self, agent: Agent, **kwargs):
+    def add_node(self, agent: Agent, **kwargs: Any) -> None:
         """
         Adds an agent node to the workflow graph.
 
@@ -970,14 +986,47 @@ class GraphWorkflow:
                 f"Error in GraphWorkflow.add_node for agent {getattr(agent, 'agent_name', 'unnamed')}: {e}"
             )
             raise e
+
+    def add_nodes(self, agents: List[Agent], batch_size: int = 10, **kwargs: Any) -> None:
+        """
+        Add multiple agents to the workflow graph concurrently in batches.
+
+        Args:
+            agents (List[Agent]): List of agents to add.
+            batch_size (int): Number of agents to add concurrently in a batch. Defaults to 10.
+            **kwargs: Additional keyword arguments for each node addition.
+        """
+
+        try:
+            with concurrent.futures.ThreadPoolExecutor(max_workers=self._max_workers) as executor:
+                # Process agents in batches
+                for i in range(0, len(agents), batch_size):
+                    batch = agents[i:i + batch_size]
+                    futures = [
+                        executor.submit(self.add_node, agent, **kwargs)
+                        for agent in batch
+                    ]
+                    # Ensure all nodes in batch are added before next batch
+                    for future in concurrent.futures.as_completed(futures):
+                        future.result()
+        except Exception as e:
+            logger.exception(
+                f"Error in GraphWorkflow.add_nodes for agents {agents}: {e} Traceback: {traceback.format_exc()}"
+            )
+            raise e
 
-    def add_edge(self, edge_or_source, target=None, **kwargs):
+    def add_edge(
+        self,
+        edge_or_source: Union[Edge, Node, Agent, str],
+        target: Optional[Union[Node, Agent, str]] = None,
+        **kwargs: Any,
+    ) -> None:
         """
         Add an edge by Edge object or by passing node objects/ids.
 
         Args:
-            edge_or_source: Either an Edge object or the source node/id.
-            target: Target node/id (required if edge_or_source is not an Edge).
+            edge_or_source (Union[Edge, Node, Agent, str]): Either an Edge object or the source node/id.
+            target (Optional[Union[Node, Agent, str]]): Target node/id (required if edge_or_source is not an Edge).
             **kwargs: Additional keyword arguments for the edge.
         """
         try:
@@ -1022,15 +1071,20 @@ class GraphWorkflow:
             logger.exception(f"Error in GraphWorkflow.add_edge: {e}")
             raise e
 
-    def add_edges_from_source(self, source, targets, **kwargs):
+    def add_edges_from_source(
+        self,
+        source: Union[Node, Agent, str],
+        targets: List[Union[Node, Agent, str]],
+        **kwargs: Any,
+    ) -> List[Edge]:
         """
         Add multiple edges from a single source to multiple targets for parallel processing.
 
         This creates a "fan-out" pattern where the source agent's output is distributed to all target agents simultaneously.
 
         Args:
-            source: Source node/id that will send output to multiple targets.
-            targets: List of target node/ids that will receive the source output in parallel.
+            source (Union[Node, Agent, str]): Source node/id that will send output to multiple targets.
+            targets (List[Union[Node, Agent, str]]): List of target node/ids that will receive the source output in parallel.
             **kwargs: Additional keyword arguments for all edges.
 
         Returns:
@@ -1091,14 +1145,19 @@ class GraphWorkflow:
             )
             raise e
 
-    def add_edges_to_target(self, sources, target, **kwargs):
+    def add_edges_to_target(
+        self,
+        sources: List[Union[Node, Agent, str]],
+        target: Union[Node, Agent, str],
+        **kwargs: Any,
+    ) -> List[Edge]:
         """
         Add multiple edges from multiple sources to a single target for convergence processing.
 
         This creates a "fan-in" pattern where multiple agents' outputs converge to a single target.
 
         Args:
-            sources: List of source node/ids that will send output to the target.
-            target: Target node/id that will receive all source outputs.
+            sources (List[Union[Node, Agent, str]]): List of source node/ids that will send output to the target.
+            target (Union[Node, Agent, str]): Target node/id that will receive all source outputs.
             **kwargs: Additional keyword arguments for all edges.
 
         Returns:
@@ -1159,14 +1218,19 @@ class GraphWorkflow:
             )
             raise e
 
-    def add_parallel_chain(self, sources, targets, **kwargs):
+    def add_parallel_chain(
+        self,
+        sources: List[Union[Node, Agent, str]],
+        targets: List[Union[Node, Agent, str]],
+        **kwargs: Any,
+    ) -> List[Edge]:
         """
         Create a parallel processing chain where multiple sources connect to multiple targets.
 
         This creates a full mesh connection pattern for maximum parallel processing.
 
         Args:
-            sources: List of source node/ids.
-            targets: List of target node/ids.
+            sources (List[Union[Node, Agent, str]]): List of source node/ids.
+            targets (List[Union[Node, Agent, str]]): List of target node/ids.
             **kwargs: Additional keyword arguments for all edges.
 
         Returns:
@@ -1230,7 +1294,7 @@ class GraphWorkflow:
             )
             raise e
 
-    def set_entry_points(self, entry_points: List[str]):
+    def set_entry_points(self, entry_points: List[str]) -> None:
         """
         Set the entry points for the workflow.
 
@@ -1261,7 +1325,7 @@ class GraphWorkflow:
             )
             raise e
 
-    def set_end_points(self, end_points: List[str]):
+    def set_end_points(self, end_points: List[str]) -> None:
         """
         Set the end points for the workflow.
 
@@ -1295,22 +1359,22 @@ class GraphWorkflow:
     @classmethod
     def from_spec(
         cls,
-        agents,
-        edges,
-        entry_points=None,
-        end_points=None,
-        task=None,
-        **kwargs,
-    ):
+        agents: List[Union[Agent, Node]],
+        edges: List[Union[Edge, Tuple[Any, Any]]],
+        entry_points: Optional[List[str]] = None,
+        end_points: Optional[List[str]] = None,
+        task: Optional[str] = None,
+        **kwargs: Any,
+    ) -> "GraphWorkflow":
         """
         Construct a workflow from a list of agents and connections.
 
         Args:
-            agents: List of agents or Node objects.
-            edges: List of edges or edge tuples.
-            entry_points: List of entry point node IDs.
-            end_points: List of end point node IDs.
-            task: Task to be executed by the workflow.
+            agents (List[Union[Agent, Node]]): List of agents or Node objects.
+            edges (List[Union[Edge, Tuple[Any, Any]]]): List of edges or edge tuples.
+            entry_points (Optional[List[str]]): List of entry point node IDs.
+            end_points (Optional[List[str]]): List of end point node IDs.
+            task (Optional[str]): Task to be executed by the workflow.
             **kwargs: Additional keyword arguments.
 
         Returns:
@@ -1425,7 +1489,7 @@ class GraphWorkflow:
             logger.exception(f"Error in GraphWorkflow.from_spec: {e}")
             raise e
 
-    def auto_set_entry_points(self):
+    def auto_set_entry_points(self) -> None:
         """
         Automatically set entry points to nodes with no incoming edges.
         """
@@ -1455,7 +1519,7 @@ class GraphWorkflow:
             )
             raise e
 
-    def auto_set_end_points(self):
+    def auto_set_end_points(self) -> None:
         """
         Automatically set end points to nodes with no outgoing edges.
         """
@@ -1483,7 +1547,7 @@ class GraphWorkflow:
             )
             raise e
 
-    def _get_predecessors(self, node_id: str) -> tuple:
+    def _get_predecessors(self, node_id: str) -> Tuple[str, ...]:
         """
         Cached predecessor lookup for faster repeated access.
 
@@ -1491,7 +1555,7 @@ class GraphWorkflow:
             node_id (str): The node ID to get predecessors for.
 
         Returns:
-            tuple: Tuple of predecessor node IDs.
+            Tuple[str, ...]: Tuple of predecessor node IDs.
         """
         # Use instance-level caching instead of @lru_cache to avoid hashing issues
        if not hasattr(self, "_predecessors_cache"):
@@ -1508,7 +1572,7 @@ class GraphWorkflow:
         self,
         node_id: str,
         task: str,
-        prev_outputs: Dict[str, str],
+        prev_outputs: Dict[str, Any],
         layer_idx: int,
     ) -> str:
         """
@@ -1517,7 +1581,7 @@ class GraphWorkflow:
         Args:
             node_id (str): The node ID to build a prompt for.
             task (str): The main task.
-            prev_outputs (Dict[str, str]): Previous outputs from predecessor nodes.
+            prev_outputs (Dict[str, Any]): Previous outputs from predecessor nodes.
             layer_idx (int): The current layer index.
 
         Returns:
@@ -1574,13 +1638,16 @@ class GraphWorkflow:
             raise e
 
     async def arun(
-        self, task: str = None, *args, **kwargs
+        self,
+        task: Optional[str] = None,
+        *args: Any,
+        **kwargs: Any,
     ) -> Dict[str, Any]:
         """
         Async version of run for better performance with I/O bound operations.
 
         Args:
-            task (str, optional): Task to execute. Uses self.task if not provided.
+            task (Optional[str]): Task to execute. Uses self.task if not provided.
             *args: Additional positional arguments.
             **kwargs: Additional keyword arguments.
 
@@ -1608,16 +1675,17 @@ class GraphWorkflow:
 
     def run(
         self,
-        task: str = None,
+        task: Optional[str] = None,
         img: Optional[str] = None,
-        *args,
-        **kwargs,
+        *args: Any,
+        **kwargs: Any,
     ) -> Dict[str, Any]:
         """
         Run the workflow graph with optimized parallel agent execution.
 
         Args:
-            task (str, optional): Task to execute. Uses self.task if not provided.
+            task (Optional[str]): Task to execute. Uses self.task if not provided.
+            img (Optional[str]): Optional image path for multimodal tasks.
             *args: Additional positional arguments.
             **kwargs: Additional keyword arguments.
 
@@ -1846,16 +1914,15 @@ class GraphWorkflow:
         view: bool = True,
         engine: str = "dot",
         show_summary: bool = False,
-    ):
+    ) -> str:
         """
         Visualize the workflow graph using Graphviz with enhanced parallel pattern detection.
 
         Args:
-            output_path (str, optional): Path to save the visualization file. If None, uses workflow name.
             format (str): Output format ('png', 'svg', 'pdf', 'dot'). Defaults to 'png'.
             view (bool): Whether to open the visualization after creation. Defaults to True.
             engine (str): Graphviz layout engine ('dot', 'neato', 'fdp', 'sfdp', 'twopi', 'circo'). Defaults to 'dot'.
-            show_summary (bool): Whether to print parallel processing summary. Defaults to True.
+            show_summary (bool): Whether to print parallel processing summary. Defaults to False.
 
         Returns:
             str: Path to the generated visualization file.
@@ -2138,7 +2205,7 @@ class GraphWorkflow:
             logger.exception(f"Error in GraphWorkflow.visualize: {e}")
             raise e
 
-    def visualize_simple(self):
+    def visualize_simple(self) -> str:
         """
         Simple text-based visualization for environments without Graphviz.
 
@@ -2225,13 +2292,14 @@ class GraphWorkflow:
                 f"Error in GraphWorkflow.visualize_simple: {e}"
             )
             raise e
+
     def to_json(
         self,
-        fast=True,
-        include_conversation=False,
-        include_runtime_state=False,
-    ):
+        fast: bool = True,
+        include_conversation: bool = False,
+        include_runtime_state: bool = False,
+    ) -> str:
         """
         Serialize the workflow to JSON with comprehensive metadata and configuration.
 
@@ -2250,7 +2318,7 @@ class GraphWorkflow:
 
         try:
 
-            def node_to_dict(node):
+            def node_to_dict(node: Node) -> Dict[str, Any]:
                 node_data = {
                     "id": node.id,
                     "type": str(node.type),
@@ -2285,7 +2353,7 @@ class GraphWorkflow:
 
                 return node_data
 
-            def edge_to_dict(edge):
+            def edge_to_dict(edge: Edge) -> Dict[str, Any]:
                 return {
                     "source": edge.source,
                     "target": edge.target,
@@ -2402,7 +2470,11 @@ class GraphWorkflow:
             raise e
 
     @classmethod
-    def from_json(cls, json_str, restore_runtime_state=False):
+    def from_json(
+        cls,
+        json_str: str,
+        restore_runtime_state: bool = False,
+    ) -> "GraphWorkflow":
         """
         Deserialize a workflow from JSON with comprehensive parameter support and backward compatibility.
@@ -2660,7 +2732,6 @@ class GraphWorkflow:
             FileExistsError: If file exists and overwrite is False
             Exception: If save operation fails
         """
-        import os
 
         # Handle file path validation
         if not filepath.endswith(".json"):
@@ -2723,7 +2794,6 @@ class GraphWorkflow:
             FileNotFoundError: If file doesn't exist
             Exception: If load operation fails
         """
-        import os
 
         if not os.path.exists(filepath):
             raise FileNotFoundError(
@@ -2755,7 +2825,7 @@ class GraphWorkflow:
             )
             raise e
 
-    def validate(self, auto_fix=False) -> Dict[str, Any]:
+    def validate(self, auto_fix: bool = False) -> Dict[str, Any]:
         """
         Validate the workflow structure, checking for potential issues
         such as isolated nodes, cyclic dependencies, etc.
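Usage note (not part of the patch): the minimal sketch below shows how the new add_nodes() batch API introduced by this change is expected to be called, mirroring the bundled graph_workflow_basic.py examples. The agent names, model, task string, and batch_size value are illustrative assumptions, and it assumes, as the examples imply, that a node's id defaults to the agent's agent_name.

from swarms.structs.agent import Agent
from swarms.structs.graph_workflow import GraphWorkflow

# Illustrative agents; the names and model are placeholders.
agents = [
    Agent(agent_name=f"research_agent_{i}", model_name="gpt-4o-mini")
    for i in range(3)
]

workflow = GraphWorkflow(name="Batch Add Example", verbose=True)

# New in this patch: add all agents concurrently, batch_size agents at a time.
workflow.add_nodes(agents, batch_size=2)

# Chain the nodes by agent_name, as in the bundled examples.
workflow.add_edge("research_agent_0", "research_agent_1")
workflow.add_edge("research_agent_1", "research_agent_2")

workflow.compile()
print(workflow.run("Summarize the key steps of this workflow"))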