Source code for mesa_llm.memory.st_lt_memory

from collections import deque
from typing import TYPE_CHECKING

from mesa_llm.memory.memory import Memory, MemoryEntry, _format_message_entry

if TYPE_CHECKING:
    from mesa_llm.llm_agent import LLMAgent



[docs]
class STLTMemory(Memory):
    """
    Implements a dual-memory system where recent experiences are stored in short-term memory with limited capacity, and older memories are consolidated into long-term summaries using LLM-based summarization.

    Attributes:
        agent : the agent that the memory belongs to

    Memory is composed of
        - A short term memory who stores the n (int) most recent interactions (observations, planning, discussions)
        - A long term memory that is a summary of the memories that are removed from short term memory (summary
        completed/refactored as it goes)
        - Event types in ``additive_event_types`` accumulate within a step.
          Defaults to ``{"message", "action"}``.

    Logic behind the implementation
        - **Short-term capacity**: Configurable number of recent memory entries (default: short_term_capacity = 5)
        - **Consolidation**: When capacity is exceeded, oldest entries are summarized into long-term memory (number of entries to summarize is configurable, default: consolidation_capacity = 3)
        - **LLM Summarization**: Uses a separate LLM instance to create meaningful summaries of past experiences

    """

    def __init__(
        self,
        agent: "LLMAgent",
        short_term_capacity: int = 5,
        consolidation_capacity: int = 2,
        display: bool = True,
        llm_model: str | None = None,
        api_base: str | None = None,
        additive_event_types: list[str] | set[str] | tuple[str, ...] | None = None,
    ):
        """
        Initialize the memory

        Args:
            short_term_capacity : the number of interactions to store in the short term memory
            llm_model : the model to use for the summarization
            api_base : the API base URL to use for the LLM provider
            agent : the agent that the memory belongs to
            additive_event_types : event types that accumulate multiple values
                within a step instead of overwriting. Defaults to
                ``{"message", "action"}``.
        """
        if not llm_model:
            raise ValueError(
                "llm_model must be provided for the usage of st/lt memory. You can use the pre-built 'short-term-only' memory without a model."
            )

        super().__init__(
            agent=agent,
            llm_model=llm_model,
            api_base=api_base,
            display=display,
            additive_event_types=additive_event_types,
        )

        self.capacity = short_term_capacity
        self.consolidation_capacity = (
            consolidation_capacity if consolidation_capacity > 0 else None
        )

        self.short_term_memory = deque()
        self.long_term_memory = ""
        self.system_prompt = """
            You are a helpful assistant that summarizes the short term memory into a long term memory.
            The long term memory should be a summary of the short term memory that is concise and informative.
            If the short term memory is empty, return the long term memory unchanged.
            If the long term memory is not empty, update it to include the new information from the short term memory.
            """

        if self.agent.step_prompt:
            self.system_prompt += f" This is the prompt of the problem you will be tackling:{self.agent.step_prompt}, ensure you summarize the short-term memory into long-term a way that is relevant to the problem at hand."

        self.llm.system_prompt = self.system_prompt

    def _build_consolidation_prompt(self, evicted_entries: list[MemoryEntry]) -> str:
        """
        Build a prompt that asks the LLM to integrate *evicted* memories
        into the existing long-term summary.

        Args:
            evicted_entries: the oldest short-term entries that were just
                removed from the deque and need to be summarized.
        """
        evicted_text = "\n".join(
            f"Step {e.step}: \n{e.content}" for e in evicted_entries
        )
        return (
            "Memories to consolidate (oldest entries being removed "
            "from short-term memory):\n"
            f"{evicted_text}\n\n"
            f"Existing long term memory:\n{self.long_term_memory}\n\n"
            "Please integrate the above memories into a concise, updated "
            "long-term memory summary."
        )

    def _update_long_term_memory(self, evicted_entries: list[MemoryEntry]):
        """
        Update the long term memory by summarizing the evicted entries
        """
        prompt = self._build_consolidation_prompt(evicted_entries)
        response = self.llm.generate(prompt)
        self.long_term_memory = response.choices[0].message.content

    async def _aupdate_long_term_memory(self, evicted_entries: list[MemoryEntry]):
        """
        Async version of _update_long_term_memory
        """
        prompt = self._build_consolidation_prompt(evicted_entries)
        response = await self.llm.agenerate(prompt)
        self.long_term_memory = response.choices[0].message.content

    def _process_step_core(self, pre_step: bool):
        """
        Shared core logic for process_step and aprocess_step.

        Update short-term memory and decide if consolidation is needed.
        When entries are evicted for consolidation they are captured and
        returned so the caller can pass them to the LLM for summarization.

        Returns:
            ``(new_entry, evicted_entries)`` where *evicted_entries* is a
            (possibly empty) list of MemoryEntry objects that were removed
            from short-term memory and should be consolidated.
        """
        if pre_step:
            new_entry = MemoryEntry(
                agent=self.agent,
                content=self.step_content,
                step=None,
            )
            self.short_term_memory.append(new_entry)
            self.step_content = {}
            return None, []

        if not self.short_term_memory or self.short_term_memory[-1].step is not None:
            return None, []

        pre_step_entry = self.short_term_memory.pop()
        merged_content = self._merge_step_contents(
            self.step_content, pre_step_entry.content
        )
        new_entry = MemoryEntry(
            agent=self.agent,
            content=merged_content,
            step=self.agent.model.steps,
        )
        self.short_term_memory.append(new_entry)
        self.step_content = {}

        evicted: list[MemoryEntry] = []

        if (
            len(self.short_term_memory)
            > self.capacity + (self.consolidation_capacity or 0)
            and self.consolidation_capacity
        ):
            # Pop consolidation_capacity oldest entries for summarization
            for _ in range(self.consolidation_capacity):
                if self.short_term_memory:
                    evicted.append(self.short_term_memory.popleft())

        elif (
            len(self.short_term_memory) > self.capacity
            and not self.consolidation_capacity
        ):
            # No consolidation configured — just discard the oldest entry
            self.short_term_memory.popleft()

        return new_entry, evicted


[docs]
    def process_step(self, pre_step: bool = False):
        """
        Synchronous memory step handler
        """
        new_entry, evicted = self._process_step_core(pre_step)

        if evicted:
            self._update_long_term_memory(evicted)

        if new_entry and self.display:
            new_entry.display()



[docs]
    async def aprocess_step(self, pre_step: bool = False):
        """
        Async memory step handler (non-blocking consolidation)
        """
        new_entry, evicted = self._process_step_core(pre_step)

        if evicted:
            await self._aupdate_long_term_memory(evicted)

        if new_entry and self.display:
            new_entry.display()



[docs]
    def format_long_term(self) -> str:
        """
        Get the long term memory
        """
        return str(self.long_term_memory)



[docs]
    def format_short_term(self) -> str:
        """
        Get the short term memory
        """
        if not self.short_term_memory:
            return "No recent memory."

        else:
            lines = []
            for st_memory_entry in self.short_term_memory:
                lines.append(
                    f"Step {st_memory_entry.step}: \n{st_memory_entry.content}"
                )
            return "\n".join(lines)



[docs]
    def get_prompt_ready(self) -> str:
        return (
            f"Short term memory:\n {self.format_short_term()}\n\n"
            f"Long term memory: \n{self.format_long_term()}"
        )



[docs]
    def get_communication_history(self) -> str:
        """
        Get the communication history
        """
        lines = []
        for entry in self.short_term_memory:
            if "message" not in entry.content:
                continue
            msgs = entry.content["message"]
            if isinstance(msgs, list):
                for msg in msgs:
                    lines.append(f"Step {entry.step}: {_format_message_entry(msg)}\n\n")
            else:
                lines.append(f"Step {entry.step}: {_format_message_entry(msgs)}\n\n")
        return "\n".join(lines)