perf(agents): stop inlining agent state into tool-dispatch Sends

In create_agent's model_to_tools edge, dispatch each tool call via the
bare list form `Send("tools", [tool_call])` instead of wrapping it in
ToolCallWithContext(state=state, ...). The tool node now hydrates
ToolRuntime.state from graph channels at tool-execution time (see
langchain-ai/langgraph#7594), so inlining the full state dict into
every Send is no longer needed.

This eliminates an O(N^2) storage term in __pregel_tasks checkpoint
writes: previously each turn's Sends carried a serialized snapshot of
the entire messages list at dispatch time. For a 500-turn agent run,
this drops __pregel_tasks storage from ~815 MB to ~482 KB (1,691x
reduction). See benchmark in PR description.

Back-compat: the legacy ToolCallWithContext input shape is still
accepted by ToolNode for any external dispatcher that hasn't migrated.

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
This commit is contained in:
Sydney Runkle
2026-04-22 19:40:19 -04:00
parent b57eea2aed
commit 2fb8464168

View File

@@ -22,7 +22,7 @@ from langchain_core.tools import BaseTool
from langgraph._internal._runnable import RunnableCallable
from langgraph.constants import END, START
from langgraph.graph.state import StateGraph
from langgraph.prebuilt.tool_node import ToolCallWithContext, ToolNode
from langgraph.prebuilt.tool_node import ToolNode
from langgraph.types import Command, Send
from langsmith import traceable
from typing_extensions import NotRequired, Required, TypedDict
@@ -933,6 +933,15 @@ def create_agent(
# Tools that require client-side execution (must be in ToolNode)
available_tools = middleware_tools + regular_tools
# Resolve the agent state schema now so we can tell `ToolNode` which state
# keys to hydrate from channels when it receives `Send("tools", [tool_call])`
# (list-form dispatch that carries no inlined state).
state_schemas: set[type] = {m.state_schema for m in middleware}
base_state = state_schema if state_schema is not None else AgentState
state_schemas.add(base_state)
resolved_state_schema, input_schema, output_schema = _resolve_schemas(state_schemas)
agent_state_keys = tuple(resolved_state_schema.__annotations__)
# Create ToolNode if we have client-side tools OR if middleware defines wrap_tool_call
# (which may handle dynamically registered tools)
tool_node = (
@@ -940,6 +949,7 @@ def create_agent(
tools=available_tools,
wrap_tool_call=wrap_tool_call_wrapper,
awrap_tool_call=awrap_tool_call_wrapper,
state_keys=agent_state_keys,
)
if available_tools or wrap_tool_call_wrapper or awrap_tool_call_wrapper
else None
@@ -1023,13 +1033,6 @@ def create_agent(
]
awrap_model_call_handler = _chain_async_model_call_handlers(async_handlers)
state_schemas: set[type] = {m.state_schema for m in middleware}
# Use provided state_schema if available, otherwise use base AgentState
base_state = state_schema if state_schema is not None else AgentState
state_schemas.add(base_state)
resolved_state_schema, input_schema, output_schema = _resolve_schemas(state_schemas)
# create graph, add nodes
graph: StateGraph[
AgentState[ResponseT], ContextT, _InputAgentState, _OutputAgentState[ResponseT]
@@ -1740,19 +1743,12 @@ def _make_model_to_tools_edge(
if c["id"] not in tool_message_ids and c["name"] not in structured_output_tools
]
# 4. If there are pending tool calls, jump to the tool node
# 4. If there are pending tool calls, jump to the tool node.
# The tool node hydrates ToolRuntime.state from channels via
# CONFIG_KEY_READ at execution time, so we no longer inline the
# full state into each Send (previously O(N^2) in TASKS writes).
if pending_tool_calls:
return [
Send(
"tools",
ToolCallWithContext(
__type="tool_call_with_context",
tool_call=tool_call,
state=state,
),
)
for tool_call in pending_tool_calls
]
return [Send("tools", [tool_call]) for tool_call in pending_tool_calls]
# 5. If there is a structured response, exit the loop
if "structured_response" in state: