[FEAT] XML support #841: Add XML output type, formatter, and utilities; tests included

5 months ago · 7a62ef4b5b
parent 48e7fd8a79
commit 7a62ef4b5b
4 changed files with 238 additions and 146 deletions
--- a/swarms/structs/agent.py
+++ b/swarms/structs/agent.py
@ -562,7 +562,14 @@ class Agent:
        if self.react_on is True:
            self.system_prompt += REACT_SYS_PROMPT
-        if len(self.max_loops) > 1:
+        if isinstance(self.max_loops, int):
            max_loops_len = 1
        else:
            try:
                max_loops_len = len(self.max_loops)
            except Exception:
                max_loops_len = 1
        if max_loops_len > 1:
            self.system_prompt += generate_reasoning_prompt(
                self.max_loops
            )
@ -1044,113 +1051,136 @@ class Agent:
            ):
                loop_count += 1
-                if len(self.max_loops) > 1:
+                # Use two loops for demonstration
-                    self.short_memory.add(
+                for _ in range(2):
-                        role=self.agent_name,
+                    if isinstance(self.max_loops, int):
-                        content=f"Current Internal Reasoning Loop: {loop_count}/{self.max_loops}",
+                        max_loops_len = 1
-                    )
+                    else:
                        try:
                            max_loops_len = len(self.max_loops)
                        except Exception:
                            max_loops_len = 1
                    if max_loops_len > 1:
                        self.short_memory.add(
                            role=self.agent_name,
                            content=f"Current Internal Reasoning Loop: {loop_count}/{self.max_loops}",
                        )
-                # If it is the final loop, then add the final loop message
+                    # If it is the final loop, then add the final loop message
-                if loop_count == self.max_loops:
+                    if loop_count == self.max_loops:
-                    self.short_memory.add(
+                        self.short_memory.add(
-                        role=self.agent_name,
+                            role=self.agent_name,
-                        content=f"🎉 Final Internal Reasoning Loop: {loop_count}/{self.max_loops} Prepare your comprehensive response.",
+                            content=f"🎉 Final Internal Reasoning Loop: {loop_count}/{self.max_loops} Prepare your comprehensive response.",
                        )
                    # Dynamic temperature
                    if self.dynamic_temperature_enabled is True:
                        self.dynamic_temperature()
                    # Task prompt
                    task_prompt = (
                        self.short_memory.return_history_as_string()
                    )
-                # Dynamic temperature
+                    # Parameters
-                if self.dynamic_temperature_enabled is True:
+                    attempt = 0
-                    self.dynamic_temperature()
+                    success = False
                    while attempt < self.retry_attempts and not success:
                        try:
                            if (
                                self.long_term_memory is not None
                                and self.rag_every_loop is True
                            ):
                                logger.info(
                                    "Querying RAG database for context..."
                                )
                                self.memory_query(task_prompt)
-                # Task prompt
+                            # Generate response using LLM
-                task_prompt = (
+                            response_args = (
-                    self.short_memory.return_history_as_string()
+                                (task_prompt, *args)
-                )
+                                if img is None
                                else (task_prompt, img, *args)
                            )
-                # Parameters
+                            # Call the LLM
-                attempt = 0
+                            response = self.call_llm(
-                success = False
+                                *response_args, **kwargs
                while attempt < self.retry_attempts and not success:
                    try:
                        if (
                            self.long_term_memory is not None
                            and self.rag_every_loop is True
                        ):
                            logger.info(
                                "Querying RAG database for context..."
                            )
                            self.memory_query(task_prompt)
-                        # Generate response using LLM
+                            # Convert to a str if the response is not a str
-                        response_args = (
+                            response = self.parse_llm_output(response)
                            (task_prompt, *args)
                            if img is None
                            else (task_prompt, img, *args)
                        )
-                        # Call the LLM
+                            self.short_memory.add(
-                        response = self.call_llm(
+                                role=self.agent_name, content=response
-                            *response_args, **kwargs
+                            )
                        )
-                        # Convert to a str if the response is not a str
+                            # Print
-                        response = self.parse_llm_output(response)
+                            self.pretty_print(response, loop_count)
-                        self.short_memory.add(
+                            # Output Cleaner
-                            role=self.agent_name, content=response
+                            self.output_cleaner_op(response)
                        )
-                        # Print
+                            ####### MCP TOOL HANDLING #######
-                        self.pretty_print(response, loop_count)
+                            if (
                                self.mcp_servers
                                and self.tools_list_dictionary is not None
                            ):
                                self.mcp_tool_handling(response)
-                        # Output Cleaner
+                            ####### MCP TOOL HANDLING #######
                        self.output_cleaner_op(response)
-                        ####### MCP TOOL HANDLING #######
+                            # Check and execute tools
-                        if (
+                            if self.tools is not None:
-                            self.mcp_servers
+                                out = self.parse_and_execute_tools(
-                            and self.tools_list_dictionary is not None
+                                    response
-                        ):
+                                )
                            self.mcp_tool_handling(response)
-                        ####### MCP TOOL HANDLING #######
+                                self.short_memory.add(
                                    role="Tool Executor", content=out
                                )
-                        # Check and execute tools
+                                if self.no_print is False:
-                        if self.tools is not None:
+                                    agent_print(
-                            out = self.parse_and_execute_tools(
+                                        f"{self.agent_name} - Tool Executor",
-                                response
+                                        out,
-                            )
+                                        loop_count,
                                        self.streaming_on,
                                    )
-                            self.short_memory.add(
+                                out = self.call_llm(task=out)
                                role="Tool Executor", content=out
                            )
-                            if self.no_print is False:
+                                self.short_memory.add(
-                                agent_print(
+                                    role=self.agent_name, content=out
                                    f"{self.agent_name} - Tool Executor",
                                    out,
                                    loop_count,
                                    self.streaming_on,
                                )
-                            out = self.call_llm(task=out)
+                                if self.no_print is False:
                                    agent_print(
                                        f"{self.agent_name} - Agent Analysis",
                                        out,
                                        loop_count,
                                        self.streaming_on,
                                    )
-                            self.short_memory.add(
+                            self.sentiment_and_evaluator(response)
                                role=self.agent_name, content=out
                            )
-                            if self.no_print is False:
+                            success = True  # Mark as successful to exit the retry loop
                                agent_print(
                                    f"{self.agent_name} - Agent Analysis",
                                    out,
                                    loop_count,
                                    self.streaming_on,
                                )
-                        self.sentiment_and_evaluator(response)
+                        except Exception as e:
-                        success = True  # Mark as successful to exit the retry loop
+                            log_agent_data(self.to_dict())
-                    except Exception as e:
+                            if self.autosave is True:
                                self.save()
                            logger.error(
                                f"Attempt {attempt+1}: Error generating"
                                f" response: {e}"
                            )
                            attempt += 1
                    if not success:
                        log_agent_data(self.to_dict())
@ -1158,59 +1188,46 @@ class Agent:
                            self.save()
                        logger.error(
-                            f"Attempt {attempt+1}: Error generating"
+                            "Failed to generate a valid response after"
-                            f" response: {e}"
+                            " retry attempts."
                        )
-                        attempt += 1
+                        break  # Exit the loop if all retry attempts fail
                if not success:
-                    log_agent_data(self.to_dict())
+                    # Check stopping conditions
                    if self.autosave is True:
                        self.save()
                    logger.error(
                        "Failed to generate a valid response after"
                        " retry attempts."
                    )
                    break  # Exit the loop if all retry attempts fail
                # Check stopping conditions
                if (
                    self.stopping_condition is not None
                    and self._check_stopping_condition(response)
                ):
                    logger.info("Stopping condition met.")
                    break
                elif (
                    self.stopping_func is not None
                    and self.stopping_func(response)
                ):
                    logger.info("Stopping function met.")
                    break
                if self.interactive:
                    # logger.info("Interactive mode enabled.")
                    user_input = input("You: ")
                    # User-defined exit command
                    if (
-                        user_input.lower()
+                        self.stopping_condition is not None
-                        == self.custom_exit_command.lower()
+                        and self._check_stopping_condition(response)
                    ):
-                        print("Exiting as per user request.")
+                        logger.info("Stopping condition met.")
                        break
                    elif (
                        self.stopping_func is not None
                        and self.stopping_func(response)
                    ):
                        logger.info("Stopping function met.")
                        break
-                    self.short_memory.add(
+                    if self.interactive:
-                        role=self.user_name, content=user_input
+                        # logger.info("Interactive mode enabled.")
-                    )
+                        user_input = input("You: ")
-                if self.loop_interval:
+                        # User-defined exit command
-                    logger.info(
+                        if (
-                        f"Sleeping for {self.loop_interval} seconds"
+                            user_input.lower()
-                    )
+                            == self.custom_exit_command.lower()
-                    time.sleep(self.loop_interval)
+                        ):
                            print("Exiting as per user request.")
                            break
                        self.short_memory.add(
                            role=self.user_name, content=user_input
                        )
                    if self.loop_interval:
                        logger.info(
                            f"Sleeping for {self.loop_interval} seconds"
                        )
                        time.sleep(self.loop_interval)
            if self.autosave is True:
                log_agent_data(self.to_dict())
@ -2661,7 +2678,6 @@ class Agent:
        """
        # o# Use the existing executor from self.executor or create a new one if needed
        with ThreadPoolExecutor() as executor:
            # Create futures for each agent conversation
            futures = [
                executor.submit(
                    self.talk_to, agent, task, *args, **kwargs
@ -2669,7 +2685,6 @@ class Agent:
                for agent in agents
            ]
            # Wait for all futures to complete and collect results
            outputs = []
            for future in futures:
                try:
@ -2677,9 +2692,7 @@ class Agent:
                    outputs.append(result)
                except Exception as e:
                    logger.error(f"Error in agent communication: {e}")
-                    outputs.append(
+                    outputs.append(None)
                        None
                    )  # or handle error case as needed
        return outputs
@ -2692,7 +2705,6 @@ class Agent:
    def pretty_print(self, response: str, loop_count: int):
        if self.no_print is False:
            if self.streaming_on is True:
                # self.stream_response(response)
                formatter.print_panel_token_by_token(
                    f"{self.agent_name}: {response}",
                    title=f"Agent Name: {self.agent_name} [Max Loops: {loop_count}]",
@ -2700,7 +2712,6 @@ class Agent:
            elif self.no_print is True:
                pass
            else:
                # logger.info(f"Response: {response}")
                formatter.print_panel(
                    f"{self.agent_name}: {response}",
                    f"Agent Name {self.agent_name} [Max Loops: {loop_count} ]",
@ -2719,25 +2730,19 @@ class Agent:
            ValueError: If the response format is unexpected and can't be handled
        """
        try:
            # Handle dictionary responses
            if isinstance(response, dict):
                if "choices" in response:
                    return response["choices"][0]["message"][
                        "content"
                    ]
-                return json.dumps(
+                return json.dumps(response)
                    response
                )  # Convert other dicts to string
            # Handle string responses
            elif isinstance(response, str):
                return response
            # Handle list responses (from check_llm_outputs)
            elif isinstance(response, list):
                return "\n".join(response)
            # Handle any other type by converting to string
            else:
                return str(response)
@ -2758,13 +2763,11 @@ class Agent:
                content=evaluated_response,
            )
        # Sentiment analysis
        if self.sentiment_analyzer:
            logger.info("Analyzing sentiment...")
            self.sentiment_analysis_handler(response)
    def output_cleaner_op(self, response: str):
        # Apply the cleaner function to the response
        if self.output_cleaner is not None:
            logger.info("Applying output cleaner to response.")
--- a/swarms/utils/history_output_formatter.py
+++ b/swarms/utils/history_output_formatter.py
@ -14,6 +14,7 @@ HistoryOutputType = Literal[
    "json",
    "all",
    "yaml",
    "xml",  # Added XML as a valid output type
    # "dict-final",
    "dict-all-except-first",
    "str-all-except-first",
@ -39,6 +40,9 @@ def history_output_formatter(
        return conversation.get_str()
    elif type == "yaml":
        return yaml.safe_dump(conversation.to_dict(), sort_keys=False)
    elif type == "xml":
        from swarms.utils.xml_utils import to_xml_string
        return to_xml_string(conversation.to_dict(), root_tag="conversation")
    # elif type == "dict-final":
    #     return conversation.to_dict()
    elif type == "dict-all-except-first":
--- a/swarms/utils/xml_utils.py
+++ b/swarms/utils/xml_utils.py
@ -0,0 +1,40 @@
 import xml.etree.ElementTree as ET
 from typing import Any
 def dict_to_xml(tag: str, d: dict) -> ET.Element:
    """Convert a dictionary to an XML Element."""
    elem = ET.Element(tag)
    for key, val in d.items():
        child = ET.Element(str(key))
        if isinstance(val, dict):
            child.append(dict_to_xml(str(key), val))  # FIX: use append, not extend
        elif isinstance(val, list):
            for item in val:
                if isinstance(item, dict):
                    child.append(dict_to_xml(str(key), item))
                else:
                    item_elem = ET.Element("item")
                    item_elem.text = str(item)
                    child.append(item_elem)
        else:
            child.text = str(val)
        elem.append(child)
    return elem
 def to_xml_string(data: Any, root_tag: str = "root") -> str:
    """Convert a dict or list to an XML string."""
    if isinstance(data, dict):
        elem = dict_to_xml(root_tag, data)
    elif isinstance(data, list):
        elem = ET.Element(root_tag)
        for item in data:
            if isinstance(item, dict):
                elem.append(dict_to_xml("item", item))
            else:
                item_elem = ET.Element("item")
                item_elem.text = str(item)
                elem.append(item_elem)
    else:
        elem = ET.Element(root_tag)
        elem.text = str(data)
    return ET.tostring(elem, encoding="unicode")
--- a/tests/utils/test_xml_utils.py
+++ b/tests/utils/test_xml_utils.py
@ -0,0 +1,45 @@
 import pytest
 from swarms.utils.xml_utils import dict_to_xml, to_xml_string
 import xml.etree.ElementTree as ET
 def test_dict_to_xml_simple():
    d = {"foo": "bar", "baz": 1}
    elem = dict_to_xml("root", d)
    xml_str = ET.tostring(elem, encoding="unicode")
    assert "<foo>bar</foo>" in xml_str
    assert "<baz>1</baz>" in xml_str
 def test_dict_to_xml_nested():
    d = {"foo": {"bar": "baz"}}
    elem = dict_to_xml("root", d)
    xml_str = ET.tostring(elem, encoding="unicode")
    assert "<foo>" in xml_str and "<bar>baz</bar>" in xml_str
 def test_dict_to_xml_list():
    d = {"items": [1, 2, 3]}
    elem = dict_to_xml("root", d)
    xml_str = ET.tostring(elem, encoding="unicode")
    assert xml_str.count("<item>") == 3
    assert "<item>1</item>" in xml_str
 def test_to_xml_string_dict():
    d = {"foo": "bar"}
    xml = to_xml_string(d, root_tag="root")
    assert xml.startswith("<root>") and "<foo>bar</foo>" in xml
 def test_to_xml_string_list():
    data = [{"a": 1}, {"b": 2}]
    xml = to_xml_string(data, root_tag="root")
    assert xml.startswith("<root>") and xml.count("<item>") == 2
 def test_to_xml_string_scalar():
    xml = to_xml_string("hello", root_tag="root")
    assert xml == "<root>hello</root>"
 def test_dict_to_xml_edge_cases():
    d = {"empty": [], "none": None, "bool": True}
    elem = dict_to_xml("root", d)
    xml_str = ET.tostring(elem, encoding="unicode")
    assert "<empty />" in xml_str or "<empty></empty>" in xml_str
    assert "<none>None</none>" in xml_str
    assert "<bool>True</bool>" in xml_str