pull/864/merge
Pavan Kumar 2 months ago committed by GitHub
commit 9868d3accb

@@ -0,0 +1,69 @@
import importlib.util
import sys
import time
from pathlib import Path
from types import ModuleType
# Load Conversation without importing full swarms package
CONV_PATH = (
    Path(__file__).resolve().parents[2]
    / "swarms"
    / "structs"
    / "conversation.py"
)

spec = importlib.util.spec_from_file_location(
    "swarms.structs.conversation", CONV_PATH
)
conversation = importlib.util.module_from_spec(spec)
sys.modules.setdefault("swarms", ModuleType("swarms"))
sys.modules.setdefault("swarms.structs", ModuleType("swarms.structs"))
base_module = ModuleType("swarms.structs.base_structure")
base_module.BaseStructure = object
sys.modules["swarms.structs.base_structure"] = base_module
utils_root = ModuleType("swarms.utils")
any_to_str_mod = ModuleType("swarms.utils.any_to_str")
formatter_mod = ModuleType("swarms.utils.formatter")
token_mod = ModuleType("swarms.utils.litellm_tokenizer")
any_to_str_mod.any_to_str = lambda x: str(x)
formatter_mod.formatter = type(
    "Formatter", (), {"print_panel": lambda *a, **k: None}
)()
token_mod.count_tokens = lambda s: len(str(s).split())
sys.modules["swarms.utils"] = utils_root
sys.modules["swarms.utils.any_to_str"] = any_to_str_mod
sys.modules["swarms.utils.formatter"] = formatter_mod
sys.modules["swarms.utils.litellm_tokenizer"] = token_mod
spec.loader.exec_module(conversation)
Conversation = conversation.Conversation
# Demonstrate cached conversation history
conv = Conversation()
conv.add("user", "Hello")
conv.add("assistant", "Hi there!")
print(conv.get_str())
print(conv.get_str()) # reuses cached string
# Timing demo
start = time.perf_counter()
for _ in range(1000):
    conv.get_str()
cached_time = time.perf_counter() - start
print("Cached retrieval:", round(cached_time, 6), "seconds")


# Compare to rebuilding manually
def slow_get():
    formatted = [
        f"{m['role']}: {m['content']}"
        for m in conv.conversation_history
    ]
    return "\n\n".join(formatted)


start = time.perf_counter()
for _ in range(1000):
    slow_get()
slow_time = time.perf_counter() - start
print("Manual join:", round(slow_time, 6), "seconds")
print("Speedup:", round(slow_time / cached_time, 2), "x")

@@ -1015,9 +1015,7 @@ class Agent:
        self.dynamic_temperature()

        # Task prompt
-        task_prompt = (
-            self.short_memory.return_history_as_string()
-        )
+        task_prompt = self.short_memory.get_str()

        # Parameters
        attempt = 0
@@ -2112,9 +2110,7 @@ class Agent:
    def check_available_tokens(self):
        # Log the amount of tokens left in the memory and in the task
        if self.tokenizer is not None:
-            tokens_used = count_tokens(
-                self.short_memory.return_history_as_string()
-            )
+            tokens_used = count_tokens(self.short_memory.get_str())
            logger.info(
                f"Tokens available: {self.context_length - tokens_used}"
            )
@@ -2123,9 +2119,7 @@ class Agent:
    def tokens_checks(self):
        # Check the tokens available
-        tokens_used = count_tokens(
-            self.short_memory.return_history_as_string()
-        )
+        tokens_used = count_tokens(self.short_memory.get_str())

        out = self.check_available_tokens()

        logger.info(

@@ -137,6 +137,10 @@ class Conversation(BaseStructure):
        self.token_count = token_count
        self.provider = provider

+        # Cache for history string to avoid repeated joins
+        self._history_cache = ""
+        self._cache_index = 0
+
        # Create conversation directory if saving is enabled
        if self.save_enabled and self.conversations_dir:
            os.makedirs(self.conversations_dir, exist_ok=True)
@@ -144,6 +148,14 @@ class Conversation(BaseStructure):
        # Try to load existing conversation or initialize new one
        self.setup()

+    def _refresh_cache(self):
+        """Refresh cached history string."""
+        self._history_cache = "\n\n".join(
+            f"{m['role']}: {m['content']}"
+            for m in self.conversation_history
+        )
+        self._cache_index = len(self.conversation_history)
+
    def setup(self):
        """Set up the conversation by either loading existing data or initializing new."""
        if self.load_filepath and os.path.exists(self.load_filepath):
@@ -239,6 +251,14 @@ class Conversation(BaseStructure):
        # Add message to conversation history
        self.conversation_history.append(message)

+        # Incrementally update history cache
+        formatted = f"{role}: {content}"
+        if self._history_cache:
+            self._history_cache += "\n\n" + formatted
+        else:
+            self._history_cache = formatted
+        self._cache_index = len(self.conversation_history)
+
        if self.token_count is True:
            self._count_tokens(content, message)
@@ -452,13 +472,14 @@ class Conversation(BaseStructure):
        Returns:
            str: The conversation history formatted as a string.
        """
-        formatted_messages = []
-        for message in self.conversation_history:
-            formatted_messages.append(
-                f"{message['role']}: {message['content']}"
-            )
-        return "\n\n".join(formatted_messages)
+        # If new messages were added outside the add method, rebuild cache
+        if self._cache_index < len(self.conversation_history):
+            self._history_cache = "\n\n".join(
+                f"{m['role']}: {m['content']}"
+                for m in self.conversation_history
+            )
+            self._cache_index = len(self.conversation_history)
+        return self._history_cache

    def get_str(self) -> str:
        """Get the conversation history as a string.
@@ -542,6 +563,9 @@ class Conversation(BaseStructure):
            # Load conversation history
            self.conversation_history = data.get("history", [])

+            # Rebuild cache from loaded history
+            self._refresh_cache()
+
            logger.info(
                f"Successfully loaded conversation from {filename}"
            )
@@ -604,6 +628,8 @@ class Conversation(BaseStructure):
    def clear(self):
        """Clear the conversation history."""
        self.conversation_history = []
+        self._history_cache = ""
+        self._cache_index = 0

    def to_json(self):
        """Convert the conversation history to a JSON string.

@@ -0,0 +1,65 @@
import importlib.util
import sys
import time
from pathlib import Path
from types import ModuleType
# Load Conversation without importing the full swarms package
CONV_PATH = (
    Path(__file__).resolve().parents[2]
    / "swarms"
    / "structs"
    / "conversation.py"
)

spec = importlib.util.spec_from_file_location(
    "swarms.structs.conversation", CONV_PATH
)
conversation = importlib.util.module_from_spec(spec)
sys.modules.setdefault("swarms", ModuleType("swarms"))
sys.modules.setdefault("swarms.structs", ModuleType("swarms.structs"))
base_module = ModuleType("swarms.structs.base_structure")
base_module.BaseStructure = object
sys.modules["swarms.structs.base_structure"] = base_module
utils_root = ModuleType("swarms.utils")
any_to_str_mod = ModuleType("swarms.utils.any_to_str")
formatter_mod = ModuleType("swarms.utils.formatter")
token_mod = ModuleType("swarms.utils.litellm_tokenizer")
any_to_str_mod.any_to_str = lambda x: str(x)
formatter_mod.formatter = type(
    "Formatter", (), {"print_panel": lambda *a, **k: None}
)()
token_mod.count_tokens = lambda s: len(str(s).split())
sys.modules["swarms.utils"] = utils_root
sys.modules["swarms.utils.any_to_str"] = any_to_str_mod
sys.modules["swarms.utils.formatter"] = formatter_mod
sys.modules["swarms.utils.litellm_tokenizer"] = token_mod
spec.loader.exec_module(conversation)
Conversation = conversation.Conversation
class OldConversation(Conversation):
    def return_history_as_string(self):
        formatted = [
            f"{m['role']}: {m['content']}"
            for m in self.conversation_history
        ]
        return "\n\n".join(formatted)

    def get_str(self):
        return self.return_history_as_string()


def measure(conv_cls, messages=50, loops=1000):
    conv = conv_cls(token_count=False)
    for i in range(messages):
        conv.add("user", f"msg{i}")
    start = time.perf_counter()
    for _ in range(loops):
        conv.get_str()
    return time.perf_counter() - start


def test_cache_perf_improvement():
    old_time = measure(OldConversation)
    new_time = measure(Conversation)
    assert old_time / new_time >= 2
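
The assertion above compares two wall-clock readings, so run-to-run noise can matter; a common way to steady such comparisons is timeit.repeat with a best-of-N reading. A sketch under that assumption (the measure_best helper is hypothetical, not part of this test file):

import timeit

def measure_best(conv_cls, messages=50, loops=1000, repeats=5):
    # Same setup as measure(), but keep the fastest of several repeats
    conv = conv_cls(token_count=False)
    for i in range(messages):
        conv.add("user", f"msg{i}")
    return min(timeit.repeat(conv.get_str, number=loops, repeat=repeats))

Comparing measure_best(OldConversation) against measure_best(Conversation) exercises the same code paths as the test above while damping scheduler jitter.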

@@ -0,0 +1,51 @@
import importlib.util
import sys
from pathlib import Path
from types import ModuleType
# Load Conversation without importing swarms package to avoid optional deps
CONV_PATH = (
    Path(__file__).resolve().parents[2]
    / "swarms"
    / "structs"
    / "conversation.py"
)

spec = importlib.util.spec_from_file_location(
    "swarms.structs.conversation", CONV_PATH
)
conversation = importlib.util.module_from_spec(spec)
sys.modules.setdefault("swarms", ModuleType("swarms"))
structs_module = ModuleType("swarms.structs")
sys.modules.setdefault("swarms.structs", structs_module)
# Minimal BaseStructure to satisfy Conversation import
base_module = ModuleType("swarms.structs.base_structure")
base_module.BaseStructure = object
sys.modules["swarms.structs.base_structure"] = base_module
utils_root = ModuleType("swarms.utils")
any_to_str_mod = ModuleType("swarms.utils.any_to_str")
formatter_mod = ModuleType("swarms.utils.formatter")
token_mod = ModuleType("swarms.utils.litellm_tokenizer")
any_to_str_mod.any_to_str = lambda x: str(x)
formatter_mod.formatter = type(
    "Formatter", (), {"print_panel": lambda *a, **k: None}
)()
token_mod.count_tokens = lambda s: len(str(s).split())
sys.modules["swarms.utils"] = utils_root
sys.modules["swarms.utils.any_to_str"] = any_to_str_mod
sys.modules["swarms.utils.formatter"] = formatter_mod
sys.modules["swarms.utils.litellm_tokenizer"] = token_mod
spec.loader.exec_module(conversation)
Conversation = conversation.Conversation
def test_history_cache_updates_incrementally():
    conv = Conversation(token_count=False)
    conv.add("user", "Hello")
    first_cache = conv.get_str()
    assert first_cache == "user: Hello"

    conv.add("assistant", "Hi")
    second_cache = conv.get_str()
    assert second_cache.endswith("assistant: Hi")
    assert conv._cache_index == len(conv.conversation_history)

    # Ensure cache reused when no new messages
    assert conv.get_str() is second_cache
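
The _cache_index check in return_history_as_string also covers history that is mutated without going through add(); a sketch of a test for that path follows (hypothetical, not part of this PR's test files):

def test_cache_rebuilds_after_direct_mutation():
    conv = Conversation(token_count=False)
    conv.add("user", "Hello")
    assert conv.get_str() == "user: Hello"

    # Append a message dict directly, bypassing add() and the incremental cache
    conv.conversation_history.append(
        {"role": "assistant", "content": "Hi"}
    )

    # get_str() sees _cache_index < len(conversation_history) and rebuilds
    assert conv.get_str().endswith("assistant: Hi")
    assert conv._cache_index == len(conv.conversation_history)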