# swarms/tests/structs/test_groupchat.py

import os
from dotenv import load_dotenv
from swarm_models import OpenAIChat
from swarms.structs.agent import Agent
from swarms.structs.groupchat import GroupChat, expertise_based


def setup_test_agents():
    """Build the three single-letter agents shared by the tests in this file.

    All agents are backed by one ``OpenAIChat`` instance whose API key is read
    from the ``OPENAI_API_KEY`` environment variable. They are named
    ``Agent1``..``Agent3`` and their system prompts tell them to respond only
    with ``'A'``, ``'B'`` and ``'C'`` respectively.

    Returns:
        A list of three ``Agent`` objects, in letter order.
    """
    api_key = os.getenv("OPENAI_API_KEY")
    shared_llm = OpenAIChat(
        openai_api_key=api_key,
        model_name="gpt-4",
        temperature=0.1,
    )

    # Agent number N is paired with the N-th letter of "ABC".
    return [
        Agent(
            agent_name=f"Agent{index}",
            system_prompt=f"You only respond with '{letter}'",
            llm=shared_llm,
        )
        for index, letter in enumerate("ABC", start=1)
    ]


def test_round_robin_speaking():
    """Expect the flattened messages to be 'A', 'B', 'C' repeated once per turn."""
    group = GroupChat(agents=setup_test_agents())
    transcript = group.run("Say your letter")

    # Flatten the per-turn responses into one list of message texts.
    spoken = []
    for turn in transcript.turns:
        for reply in turn.responses:
            spoken.append(reply.message)

    turn_count = len(transcript.turns)
    expected = ["A", "B", "C"] * turn_count
    assert spoken == expected


def test_concurrent_processing():
    """Submit three tasks to ``concurrent_run`` and check every history has messages."""
    group = GroupChat(agents=setup_test_agents())
    prompts = ["Task1", "Task2", "Task3"]
    results = group.concurrent_run(prompts)

    # One history is expected per submitted task, and none may be empty.
    assert len(results) == len(prompts)
    for result in results:
        assert result.total_messages > 0


def test_expertise_based_speaking():
    """Check that ``expertise_based`` lets the quoted agent speak first.

    Each agent's system prompt is embedded in a task in turn; the first
    response of the first turn must then carry that same agent's name.
    """
    candidates = setup_test_agents()
    group = GroupChat(agents=candidates, speaker_fn=expertise_based)

    for expected_speaker in candidates:
        task = f"Trigger {expected_speaker.system_prompt}"
        transcript = group.run(task)
        opening_reply = transcript.turns[0].responses[0]
        assert opening_reply.agent_name == expected_speaker.agent_name


def test_max_loops_limit():
    """Check that a run yields exactly as many turns as ``max_loops`` allows."""
    loop_cap = 3
    group = GroupChat(agents=setup_test_agents(), max_loops=loop_cap)
    transcript = group.run("Test message")

    turn_count = len(transcript.turns)
    assert turn_count == loop_cap


def test_error_handling():
    """Check that an agent built with ``llm=None`` produces an "Error" message.

    The run is expected to return a history rather than raise; the first
    response of the first turn must contain the text "Error".
    """
    faulty = Agent(
        agent_name="BrokenAgent",
        system_prompt="You raise errors",
        llm=None,
    )
    group = GroupChat(agents=[faulty])
    transcript = group.run("Trigger error")

    first_message = transcript.turns[0].responses[0].message
    assert "Error" in first_message


def test_conversation_context():
    """Check that a prompt mentioning A, B and C gets every agent to respond."""
    participants = setup_test_agents()
    prompt = "Previous message refers to A. Now trigger B. Finally discuss C."
    group = GroupChat(agents=participants, speaker_fn=expertise_based)
    transcript = group.run(prompt)

    # Collect the name of every responder across all turns.
    speakers = []
    for turn in transcript.turns:
        speakers.extend(reply.agent_name for reply in turn.responses)

    # Each configured agent must appear at least once among the responders.
    for participant in participants:
        assert participant.agent_name in speakers


def test_large_agent_group():
    """Check that a 15-agent chat produces more messages than it has agents.

    The group is assembled from five independent ``setup_test_agents()`` calls
    so that it holds 15 distinct ``Agent`` objects. Multiplying one list by
    five would only repeat references to the same three instances, so any
    per-agent state would be shared between the "copies".

    Note: the agent names still repeat across the five batches, because
    ``setup_test_agents`` always uses the same three names.
    """
    large_group = [
        agent for _ in range(5) for agent in setup_test_agents()
    ]  # 15 agents
    chat = GroupChat(agents=large_group)
    history = chat.run("Test scaling")

    assert history.total_messages > len(large_group)


def test_long_conversations():
    """Run a 50-loop chat and check both the turn count and the message volume."""
    loop_cap = 50
    group = GroupChat(agents=setup_test_agents(), max_loops=loop_cap)
    transcript = group.run("Long conversation test")

    assert len(transcript.turns) == loop_cap
    assert transcript.total_messages > 100


def test_stress_batched_runs():
    """Push 100 identical tasks through ``batched_run`` and check the output volume."""
    group = GroupChat(agents=setup_test_agents())
    prompts = ["Task" for _ in range(100)]
    results = group.batched_run(prompts)

    assert len(results) == len(prompts)

    # Add up the message counts of all returned histories.
    message_total = 0
    for result in results:
        message_total += result.total_messages
    assert message_total > 3 * len(prompts)


if __name__ == "__main__":
    # Manual runner: executes every test in order without pytest, keeps going
    # after a failure, and reports the overall outcome via the exit status.
    load_dotenv()

    functions = [
        test_round_robin_speaking,
        test_concurrent_processing,
        test_expertise_based_speaking,
        test_max_loops_limit,
        test_error_handling,
        test_conversation_context,
        test_large_agent_group,
        test_long_conversations,
        test_stress_batched_runs,
    ]

    failed = []
    for func in functions:
        print(f"Running {func.__name__}...")
        try:
            func()
        except Exception as e:
            # A bare ``assert`` raises AssertionError with an empty message,
            # so include the exception type to keep the line informative.
            print(f"✗ Failed: {type(e).__name__}: {e}")
            failed.append(func.__name__)
        else:
            print("✓ Passed")

    if failed:
        # Exit non-zero so shells and CI can detect the failure; the message
        # is written to stderr by the interpreter.
        raise SystemExit(
            f"{len(failed)} of {len(functions)} tests failed: "
            f"{', '.join(failed)}"
        )
[GROUPCHAT] 2 weeks ago			`import os`
			`from dotenv import load_dotenv`
[CLEANUP] 4 months ago			`from swarm_models import OpenAIChat`
[5.4.8] 5 months ago			`from swarms.structs.agent import Agent`
[GROUPCHAT] 2 weeks ago			`from swarms.structs.groupchat import GroupChat, expertise_based`
[5.4.8] 5 months ago

[GROUPCHAT] 2 weeks ago			`def setup_test_agents():`
			`model = OpenAIChat(`
			`openai_api_key=os.getenv("OPENAI_API_KEY"),`
			`model_name="gpt-4",`
			`temperature=0.1,`
[5.4.8] 5 months ago			`)`

[GROUPCHAT] 2 weeks ago			`return [`
			`Agent(`
			`agent_name="Agent1",`
			`system_prompt="You only respond with 'A'",`
			`llm=model,`
			`),`
			`Agent(`
			`agent_name="Agent2",`
			`system_prompt="You only respond with 'B'",`
			`llm=model,`
			`),`
			`Agent(`
			`agent_name="Agent3",`
			`system_prompt="You only respond with 'C'",`
			`llm=model,`
			`),`
			`]`


			`def test_round_robin_speaking():`
			`chat = GroupChat(agents=setup_test_agents())`
			`history = chat.run("Say your letter")`

			`# Verify agents speak in order`
			`responses = [`
			`r.message for t in history.turns for r in t.responses`
			`]`
			`assert responses == ["A", "B", "C"] * (len(history.turns))`


			`def test_concurrent_processing():`
			`chat = GroupChat(agents=setup_test_agents())`
			`tasks = ["Task1", "Task2", "Task3"]`
			`histories = chat.concurrent_run(tasks)`

			`assert len(histories) == len(tasks)`
			`for history in histories:`
			`assert history.total_messages > 0`


			`def test_expertise_based_speaking():`
			`agents = setup_test_agents()`
			`chat = GroupChat(agents=agents, speaker_fn=expertise_based)`

			`# Test each agent's expertise trigger`
			`for agent in agents:`
			`history = chat.run(f"Trigger {agent.system_prompt}")`
			`first_response = history.turns[0].responses[0]`
			`assert first_response.agent_name == agent.agent_name`


[CLEANUP] 2 weeks ago			`def test_max_loops_limit():`
			`max_loops = 3`
			`chat = GroupChat(agents=setup_test_agents(), max_loops=max_loops)`
[GROUPCHAT] 2 weeks ago			`history = chat.run("Test message")`

[CLEANUP] 2 weeks ago			`assert len(history.turns) == max_loops`
[GROUPCHAT] 2 weeks ago

			`def test_error_handling():`
			`broken_agent = Agent(`
			`agent_name="BrokenAgent",`
			`system_prompt="You raise errors",`
			`llm=None,`
			`)`
[5.4.8] 5 months ago
[GROUPCHAT] 2 weeks ago			`chat = GroupChat(agents=[broken_agent])`
			`history = chat.run("Trigger error")`
[5.4.8] 5 months ago
[GROUPCHAT] 2 weeks ago			`assert "Error" in history.turns[0].responses[0].message`
[5.4.8] 5 months ago

[GROUPCHAT] 2 weeks ago			`def test_conversation_context():`
			`agents = setup_test_agents()`
			`complex_prompt = "Previous message refers to A. Now trigger B. Finally discuss C."`
[5.4.8] 5 months ago
[GROUPCHAT] 2 weeks ago			`chat = GroupChat(agents=agents, speaker_fn=expertise_based)`
			`history = chat.run(complex_prompt)`
[5.4.8] 5 months ago
[GROUPCHAT] 2 weeks ago			`responses = [`
			`r.agent_name for t in history.turns for r in t.responses`
			`]`
			`assert all(agent.agent_name in responses for agent in agents)`
[5.4.8] 5 months ago

[GROUPCHAT] 2 weeks ago			`def test_large_agent_group():`
			`large_group = setup_test_agents() * 5 # 15 agents`
			`chat = GroupChat(agents=large_group)`
			`history = chat.run("Test scaling")`
[5.4.8] 5 months ago
[GROUPCHAT] 2 weeks ago			`assert history.total_messages > len(large_group)`
[5.4.8] 5 months ago

[GROUPCHAT] 2 weeks ago			`def test_long_conversations():`
[CLEANUP] 2 weeks ago			`chat = GroupChat(agents=setup_test_agents(), max_loops=50)`
[GROUPCHAT] 2 weeks ago			`history = chat.run("Long conversation test")`
[5.4.8] 5 months ago
[GROUPCHAT] 2 weeks ago			`assert len(history.turns) == 50`
			`assert history.total_messages > 100`
[5.4.8] 5 months ago

[GROUPCHAT] 2 weeks ago			`def test_stress_batched_runs():`
			`chat = GroupChat(agents=setup_test_agents())`
			`tasks = ["Task"] * 100`
			`histories = chat.batched_run(tasks)`
[5.4.8] 5 months ago
[GROUPCHAT] 2 weeks ago			`assert len(histories) == len(tasks)`
			`total_messages = sum(h.total_messages for h in histories)`
			`assert total_messages > len(tasks) * 3`
[5.4.8] 5 months ago

[GROUPCHAT] 2 weeks ago			`if __name__ == "__main__":`
			`load_dotenv()`
[5.4.8] 5 months ago
[GROUPCHAT] 2 weeks ago			`functions = [`
			`test_round_robin_speaking,`
			`test_concurrent_processing,`
			`test_expertise_based_speaking,`
[CLEANUP] 2 weeks ago			`test_max_loops_limit,`
[GROUPCHAT] 2 weeks ago			`test_error_handling,`
			`test_conversation_context,`
			`test_large_agent_group,`
			`test_long_conversations,`
			`test_stress_batched_runs,`
			`]`
[5.4.8] 5 months ago
[GROUPCHAT] 2 weeks ago			`for func in functions:`
			`try:`
			`print(f"Running {func.__name__}...")`
			`func()`
			`print("✓ Passed")`
			`except Exception as e:`
			`print(f"✗ Failed: {str(e)}")`