Source code for mesa_llm.llm_agent

from __future__ import annotations

import logging
import warnings
from collections.abc import Callable
from typing import TYPE_CHECKING

from mesa.agent import Agent
from mesa.discrete_space import (
    OrthogonalMooreGrid,
    OrthogonalVonNeumannGrid,
)
from mesa.model import Model
from mesa.space import (
    ContinuousSpace,
    MultiGrid,
    SingleGrid,
)

from mesa_llm import Plan
from mesa_llm.memory.st_lt_memory import STLTMemory
from mesa_llm.module_llm import ModuleLLM
from mesa_llm.reasoning.reasoning import (
    _UNSET,
    Observation,
    Reasoning,
)
from mesa_llm.tools.tool_manager import ToolManager

# Module-level logger named after this module.
logger = logging.getLogger(__name__)

# SimulationRecorder is imported only while type checking; this branch is
# skipped at runtime.
if TYPE_CHECKING:  # pragma: no cover
    from mesa_llm.recording.simulation_recorder import SimulationRecorder



[docs]
class LLMAgent(Agent):
    """
    LLMAgent manages an LLM backend and optionally connects to a memory module.

    Parameters:
        model (Model): The Mesa model the agent belongs to.
        reasoning (type[Reasoning]): The reasoning strategy used by the agent.
        llm_model (str): The model to use for the LLM in the format
            ``provider/model``. Defaults to ``gemini/gemini-2.0-flash``.
        system_prompt (str | None): Optional system prompt for the LLM.
        vision (float | None): Observation radius for nearby agents. Use ``-1``
            to observe all agents in the simulation.
        internal_state (list[str] | str | None): Optional internal state facts
            exposed to the reasoning module.
        step_prompt (str | None): Optional task-specific prompt used to guide
            the agent each step.
        api_base (str | None): Optional custom LiteLLM-compatible base URL for
            self-hosted or remote inference endpoints.
        tools (list[Callable | str] | tuple[Callable | str, ...] | None):
            Explicit tools exposed to this agent. ``None`` and ``[]`` expose
            no tools; pass a tool-set factory such as ``legacy_tools()`` to
            opt in to compatibility built-ins.

    Attributes:
        llm (ModuleLLM): The internal LLM interface used by the agent.
        memory (Memory | None): The memory module attached to this agent, if any.
    """

    def __init__(
        self,
        model: Model,
        reasoning: type[Reasoning],
        llm_model: str = "gemini/gemini-2.0-flash",
        system_prompt: str | None = None,
        vision: float | None = None,
        internal_state: list[str] | str | None = None,
        step_prompt: str | None = None,
        api_base: str | None = None,
        tools: list[Callable | str] | tuple[Callable | str, ...] | None = None,
    ) -> None:
        """
        Wire up the LLM interface, memory, tools and reasoning for the agent.

        The parameters are described in the class docstring. Construction
        order matters: the memory and reasoning objects are both handed
        ``self`` while the agent is still being built.
        """
        super().__init__(model=model)

        self.model = model
        self.step_prompt = step_prompt
        # LLM backend; it also holds the system prompt (see the
        # ``system_prompt`` property).
        self.llm = ModuleLLM(
            llm_model=llm_model, system_prompt=system_prompt, api_base=api_base
        )

        # Memory is created with fixed capacities and the same LLM model and
        # endpoint as the agent itself.
        self.memory = STLTMemory(
            agent=self,
            short_term_capacity=5,
            consolidation_capacity=2,
            llm_model=llm_model,
            api_base=api_base,
        )

        self._tool_manager = ToolManager(tools=tools)
        self.vision = vision
        # NOTE(review): the reasoning object is built before ``internal_state``
        # is assigned below, so it must not read that attribute in its
        # constructor -- confirm against the Reasoning implementations.
        self.reasoning = reasoning(agent=self)
        # Goes through the property setter, i.e. writes ``self.llm.system_prompt``.
        self.system_prompt = system_prompt
        self._current_plan = None  # Store current plan for formatting

        # display coordination
        self._step_display_data = {}

        # Placeholder so @record_model can attach the SimulationRecorder
        self.recorder: SimulationRecorder | None = None

        # Normalise ``internal_state`` to a list: a single string becomes a
        # one-element list and ``None`` becomes an empty list. Any other value
        # is stored as passed (not copied).
        if isinstance(internal_state, str):
            internal_state = [internal_state]
        elif internal_state is None:
            internal_state = []

        self.internal_state = internal_state

    def __str__(self):
        return f"LLMAgent {self.unique_id}"

    @property
    def system_prompt(self) -> str | None:
        """Return the system prompt currently held by ``self.llm``."""
        return self.llm.system_prompt

    @system_prompt.setter
    def system_prompt(self, value: str | None) -> None:
        """Store ``value`` as the system prompt on ``self.llm``."""
        self.llm.system_prompt = value

    @property
    def tool_manager(self) -> ToolManager:
        warnings.warn(
            "`agent.tool_manager` is deprecated; configure tools with "
            "`LLMAgent(..., tools=...)` and treat the manager as internal.",
            DeprecationWarning,
            stacklevel=2,
        )
        return self._tool_manager

    @tool_manager.setter
    def tool_manager(self, value: ToolManager):
        warnings.warn(
            "`agent.tool_manager = ...` is deprecated; pass tools explicitly "
            "or assign `agent._tool_manager` only inside framework internals.",
            DeprecationWarning,
            stacklevel=2,
        )
        self._tool_manager = value

    def _format_message_status(
        self, message: str, delivered_ids: list[int], skipped_ids: list[int]
    ) -> str:
        """Format direct-message delivery status to match the speak_to tool."""
        status_parts = []
        if delivered_ids:
            status_parts.append(f"sent message {message!r} to {delivered_ids}")
        if skipped_ids:
            status_parts.append(
                f"skipped {skipped_ids} because they have no `memory` attribute"
            )
        if not status_parts:
            return f"Could not send message {message!r}: no matching recipients found."
        return "; ".join(status_parts)


[docs]
    async def aapply_plan(self, plan: Plan) -> list[dict]:
        """
        Asynchronous counterpart of ``apply_plan``.

        Remembers ``plan`` as the current plan, awaits the tool manager while
        it runs the plan's tool calls, records the results in memory as an
        ``"action"`` entry and returns them.
        """
        self._current_plan = plan

        # ``tools`` is forwarded only when the plan provides a value for it;
        # otherwise the tool manager's own default applies.
        tools_override = getattr(plan, "tools", _UNSET)
        optional_kwargs = {} if tools_override is _UNSET else {"tools": tools_override}
        responses = await self._tool_manager.acall_tools(
            agent=self, llm_response=plan.llm_plan, **optional_kwargs
        )

        # The memory entry omits the bookkeeping keys of each tool response.
        hidden_keys = ("tool_call_id", "role")
        recorded_calls = []
        for response in responses:
            recorded_calls.append(
                {
                    key: value
                    for key, value in response.items()
                    if key not in hidden_keys
                }
            )
        await self.memory.aadd_to_memory(
            type="action", content={"tool_calls": recorded_calls}
        )

        return responses



[docs]
    def apply_plan(self, plan: Plan) -> list[dict]:
        """
        Execute the plan in the simulation.

        Remembers ``plan`` as the current plan, lets the tool manager run the
        plan's tool calls, records the results in memory as an ``"action"``
        entry and returns them.
        """
        self._current_plan = plan

        # ``tools`` is forwarded only when the plan provides a value for it;
        # otherwise the tool manager's own default applies.
        tools_override = getattr(plan, "tools", _UNSET)
        optional_kwargs = {} if tools_override is _UNSET else {"tools": tools_override}
        responses = self._tool_manager.call_tools(
            agent=self, llm_response=plan.llm_plan, **optional_kwargs
        )

        # The memory entry omits the bookkeeping keys of each tool response.
        hidden_keys = ("tool_call_id", "role")
        recorded_calls = []
        for response in responses:
            recorded_calls.append(
                {
                    key: value
                    for key, value in response.items()
                    if key not in hidden_keys
                }
            )
        self.memory.add_to_memory(
            type="action", content={"tool_calls": recorded_calls}
        )

        return responses


    def _build_observation(self):
        """
        Construct the observation data visible to the agent at the current model step.

        This method encapsulates the shared logic used by both sync and
        async observation generation.
        This method constructs the agent's self state and determines which other
        agents are observable based on the configured vision:

        - vision > 0:
            The agent observes all agents within the specified vision radius.
        - vision == -1:
            The agent observes all agents present in the simulation.
        - vision == 0 or vision is None:
            The agent observes no other agents.

        The method supports grid-based and continuous spaces and builds a local
        state representation for all visible neighboring agents.

        Returns self_state and local_state of the agent
        """
        self_state = {
            "agent_unique_id": self.unique_id,
            "location": (
                self.pos
                if self.pos is not None
                else (
                    getattr(self, "cell", None).coordinate
                    if getattr(self, "cell", None) is not None
                    else None
                )
            ),
            "internal_state": self.internal_state,
        }
        if self.vision is not None and self.vision > 0:
            # Early return: agent has no position and no cell — cannot query neighbors
            if self.pos is None and getattr(self, "cell", None) is None:
                return self_state, {}

            # Check which type of space/grid the model uses
            grid = getattr(self.model, "grid", None)
            space = getattr(self.model, "space", None)

            if grid and isinstance(grid, SingleGrid | MultiGrid):
                neighbors = grid.get_neighbors(
                    tuple(self.pos),
                    moore=True,
                    include_center=False,
                    radius=self.vision,
                )
            elif grid and isinstance(
                grid, OrthogonalMooreGrid | OrthogonalVonNeumannGrid
            ):
                agent_cell = next(
                    (cell for cell in grid.all_cells if self in cell.agents),
                    None,
                )
                if agent_cell:
                    neighborhood = agent_cell.get_neighborhood(radius=self.vision)
                    neighbors = [a for cell in neighborhood for a in cell.agents]
                else:
                    neighbors = []

            elif space and isinstance(space, ContinuousSpace):
                all_nearby = space.get_neighbors(
                    self.pos, radius=self.vision, include_center=True
                )
                neighbors = [a for a in all_nearby if a is not self]

            else:
                # No recognized grid/space type
                neighbors = []

        elif self.vision == -1:
            all_agents = list(self.model.agents)
            neighbors = [agent for agent in all_agents if agent is not self]

        else:
            neighbors = []

        local_state = {}
        for i in neighbors:
            local_state[i.__class__.__name__ + " " + str(i.unique_id)] = {
                "position": (
                    i.pos
                    if i.pos is not None
                    else (
                        getattr(i, "cell", None).coordinate
                        if getattr(i, "cell", None) is not None
                        else None
                    )
                ),
                "internal_state": [
                    s for s in getattr(i, "internal_state", []) if not s.startswith("_")
                ],
            }
        return self_state, local_state


[docs]
    async def agenerate_obs(self) -> Observation:
        """
        Asynchronously build, remember and return the current observation.

        The observation data comes from ``_build_observation``; it is written
        to the agent's memory as an ``"observation"`` entry through the async
        memory API and then wrapped in an ``Observation`` stamped with the
        model's current step.
        """
        current_step = self.model.steps
        own_state, nearby_state = self._build_observation()

        payload = {"self_state": own_state, "local_state": nearby_state}
        await self.memory.aadd_to_memory(type="observation", content=payload)

        return Observation(
            step=current_step, self_state=own_state, local_state=nearby_state
        )



[docs]
    def generate_obs(self) -> Observation:
        """
        Build, remember and return the current observation.

        The observation data comes from ``_build_observation``; it is written
        to the agent's memory as an ``"observation"`` entry and then wrapped
        in an ``Observation`` stamped with the model's current step.
        """
        current_step = self.model.steps
        own_state, nearby_state = self._build_observation()

        # Memory takes care of its own display; only the raw data is stored.
        payload = {"self_state": own_state, "local_state": nearby_state}
        self.memory.add_to_memory(type="observation", content=payload)

        return Observation(
            step=current_step, self_state=own_state, local_state=nearby_state
        )



[docs]
    async def asend_message(self, message: str, recipients: list[Agent]) -> str:
        """
        Asynchronous version of send_message.
        """
        delivered_ids = []
        skipped_ids = []
        for recipient in recipients:
            if recipient is self:
                continue
            if not hasattr(recipient, "memory"):
                skipped_ids.append(recipient.unique_id)
                logger.warning(
                    "Agent %s has no memory attribute; skipping send_message.",
                    recipient.unique_id,
                )
                continue
            delivered_ids.append(recipient.unique_id)
            await recipient.memory.aadd_to_memory(
                type="message",
                content={
                    "message": message,
                    "sender": self.unique_id,
                },
            )
        await self.memory.aadd_to_memory(
            type="message",
            content={
                "message": message,
                "sender": self.unique_id,
                "recipients": delivered_ids,
            },
        )
        return self._format_message_status(message, delivered_ids, skipped_ids)



[docs]
    def send_message(self, message: str, recipients: list[Agent]) -> str:
        """
        Send a message to the recipients.
        """
        delivered_ids = []
        skipped_ids = []
        for recipient in recipients:
            if recipient is self:
                continue
            if not hasattr(recipient, "memory"):
                skipped_ids.append(recipient.unique_id)
                logger.warning(
                    "Agent %s has no memory attribute; skipping send_message.",
                    recipient.unique_id,
                )
                continue
            delivered_ids.append(recipient.unique_id)
            recipient.memory.add_to_memory(
                type="message",
                content={
                    "message": message,
                    "sender": self.unique_id,
                },
            )
        self.memory.add_to_memory(
            type="message",
            content={
                "message": message,
                "sender": self.unique_id,
                "recipients": delivered_ids,
            },
        )
        return self._format_message_status(message, delivered_ids, skipped_ids)



[docs]
    async def apre_step(self) -> None:
        """
        Asynchronous version of pre_step.

        Awaits ``self.memory.aprocess_step(pre_step=True)``. Called at the
        start of the default ``astep`` and by the async wrapper that
        ``__init_subclass__`` installs around a user-defined ``astep``.
        """
        await self.memory.aprocess_step(pre_step=True)



[docs]
    async def apost_step(self) -> None:
        """
        Asynchronous version of post_step.

        Awaits ``self.memory.aprocess_step()`` with its default arguments.
        Called at the end of the default ``astep`` and by the async wrapper
        that ``__init_subclass__`` installs around a user-defined ``astep``.
        """
        await self.memory.aprocess_step()



[docs]
    def pre_step(self) -> None:
        """
        Hook executed before the step method of the child agent is called.

        Calls ``self.memory.process_step(pre_step=True)``. The ``step``
        wrapper installed by ``__init_subclass__`` invokes this hook before
        running the user-defined step.
        """
        self.memory.process_step(pre_step=True)



[docs]
    def post_step(self) -> None:
        """
        Hook executed after the step method of the child agent has run.

        Calls ``self.memory.process_step()`` with its default arguments. It
        runs automatically because ``__init_subclass__`` replaces a
        subclass's ``step`` with a wrapper that calls this hook afterwards.
        """
        self.memory.process_step()



[docs]
    async def astep(self):
        """
        Default asynchronous step method for parallel agent execution.
        Subclasses should override this method for custom async behavior.
        If not overridden, falls back to calling the synchronous step() method.
        """
        await self.apre_step()

        raw_step = getattr(self.__class__, "_raw_user_step", None)
        if raw_step is not None:
            if not getattr(self.__class__, "_warned_sync_astep_fallback", False):
                warnings.warn(
                    (
                        f"{self.__class__.__name__}.astep() is falling back to "
                        "synchronous step(), which may block the asyncio event "
                        "loop. Override astep() for non-blocking behavior or use "
                        "threading parallel stepping."
                    ),
                    RuntimeWarning,
                    stacklevel=2,
                )
                self.__class__._warned_sync_astep_fallback = True
            raw_step(self)

        await self.apost_step()


    def __init_subclass__(cls, **kwargs):
        """
        Wrapper - allows to automatically integrate code to be executed after the step method of the child agent (created by the user) is called.
        """
        super().__init_subclass__(**kwargs)
        # only wrap if subclass actually defines its own step
        user_step = cls.__dict__.get("step")
        user_astep = cls.__dict__.get("astep")

        if user_step:
            # Store the raw user step for the default astep() to call
            # without the pre/post wrapper (astep handles its own pre/post)
            cls._raw_user_step = user_step

            def wrapped(self, *args, **kwargs):
                """
                This is the wrapper that is used to integrate the pre_step and post_step methods into the step method of the child agent.
                """
                LLMAgent.pre_step(self, *args, **kwargs)
                result = user_step(self, *args, **kwargs)
                LLMAgent.post_step(self, *args, **kwargs)
                return result

            cls.step = wrapped

        if user_astep:

            async def awrapped(self, *args, **kwargs):
                """
                Async wrapper for astep method.
                """
                await self.apre_step()
                result = await user_astep(self, *args, **kwargs)
                await self.apost_step()
                return result

            cls.astep = awrapped