diff --git a/src/oss/langchain/agents.mdx b/src/oss/langchain/agents.mdx index 42696cc10..32d14582b 100644 --- a/src/oss/langchain/agents.mdx +++ b/src/oss/langchain/agents.mdx @@ -204,7 +204,7 @@ const agent = createAgent({ ::: -For model configuration details, see [Models](/oss/langchain/models). +For model configuration details, see [Models](/oss/langchain/models). For dynamic model selection patterns, see [Dynamic model in middleware](/oss/langchain/middleware#dynamic-model). ### Tools @@ -519,7 +519,7 @@ const result = await agent.invoke( For more details on message types and formatting, see [Messages](/oss/langchain/messages). For comprehensive middleware documentation, see [Middleware](/oss/langchain/middleware). -## Advanced configuration +## Advanced concepts ### Structured output @@ -677,215 +677,6 @@ const CustomAgentState = createAgent({ To learn more about memory, see [Memory](/oss/concepts/memory). For information on implementing long-term memory that persists across sessions, see [Long-term memory](/oss/langchain/long-term-memory). -### Before model hook - -Pre-model hook is middleware that processes state before the model is called. Use cases include message trimming, summarization, and context injection. - -```mermaid -%%{ - init: { - "fontFamily": "monospace", - "flowchart": { - "curve": "basis" - }, - "themeVariables": {"edgeLabelBackground": "transparent"} - } -}%% -graph TD - S(["\_\_start\_\_"]) - PRE(before_model) - MODEL(model) - TOOLS(tools) - END(["\_\_end\_\_"]) - - S --> PRE - PRE --> MODEL - MODEL -.-> TOOLS - MODEL -.-> END - TOOLS --> PRE - - classDef blueHighlight fill:#0a1c25,stroke:#0a455f,color:#bae6fd; - class S blueHighlight; - class END blueHighlight; -``` - -:::python - -Use the `@before_model` decorator to create middleware that runs before the model is called: - -```python wrap -from langchain.messages import RemoveMessage -from langgraph.graph.message import REMOVE_ALL_MESSAGES -from langchain.agents import create_agent, AgentState -from langchain.agents.middleware import before_model -from langgraph.runtime import Runtime - -@before_model -def trim_messages(state: AgentState, runtime: Runtime) -> dict[str, Any] | None: - """Keep only the last few messages to fit context window.""" - messages = state["messages"] - - if len(messages) <= 3: - return None # No changes needed - - first_msg = messages[0] - recent_messages = messages[-3:] if len(messages) % 2 == 0 else messages[-4:] - new_messages = [first_msg] + recent_messages - - return { - "messages": [ - RemoveMessage(id=REMOVE_ALL_MESSAGES), - *new_messages - ] - } - -agent = create_agent( - model, - tools=tools, - middleware=[trim_messages] -) -``` - - -When returning `messages` from `before_model` middleware, you should **overwrite the `messages` key** by including `RemoveMessage(id=REMOVE_ALL_MESSAGES)` first, followed by your new messages. - - -::: -:::js -```ts wrap -import { createAgent, type AgentState } from "langchain"; -import { REMOVE_ALL_MESSAGES } from "@langchain/langgraph"; -import { RemoveMessage } from "@langchain/core/messages"; - -const trimMessages = (state: AgentState) => { - const messages = state.messages; - - if (messages.length <= 3) { - return { messages }; - } - - const firstMsg = messages[0]; - const recentMessages = messages.length % 2 === 0 - ? 
messages.slice(-3) - : messages.slice(-4); - - const newMessages = [firstMsg, ...recentMessages]; - - return { - messages: [ - new RemoveMessage({ id: REMOVE_ALL_MESSAGES }), - ...newMessages - ] - }; -}; - -const agent = createAgent({ - model: "openai:gpt-4o", - tools, - preModelHook: trimMessages, -}); -``` -::: - -### After model hook - -After model hook is middleware that processes the model's response before tool execution. Use cases include validation, guardrails, or other post-processing. - -```mermaid -%%{ - init: { - "fontFamily": "monospace", - "flowchart": { - "curve": "basis" - }, - "themeVariables": {"edgeLabelBackground": "transparent"} - } -}%% -graph TD - S(["\_\_start\_\_"]) - MODEL(model) - POST(after_model) - TOOLS(tools) - END(["\_\_end\_\_"]) - - S --> MODEL - MODEL --> POST - POST -.-> END - POST -.-> TOOLS - TOOLS --> MODEL - - classDef blueHighlight fill:#0a1c25,stroke:#0a455f,color:#bae6fd; - class S blueHighlight; - class END blueHighlight; - class POST greenHighlight; -``` - -:::python - -Use the `@after_model` decorator to create middleware that runs after the model is called: - -```python wrap -from typing import Any -from langchain.messages import AIMessage, RemoveMessage -from langgraph.graph.message import REMOVE_ALL_MESSAGES -from langchain.agents import create_agent, AgentState -from langchain.agents.middleware import after_model -from langgraph.runtime import Runtime - -@after_model -def validate_response(state: AgentState, runtime: Runtime) -> dict[str, Any] | None: - """Check model response for policy violations.""" - messages = state["messages"] - last_message = messages[-1] - - if "confidential" in last_message.content.lower(): - return { - "messages": [ - RemoveMessage(id=REMOVE_ALL_MESSAGES), - *messages[:-1], - AIMessage(content="I cannot share confidential information.") - ] - } - - return None # No changes needed - -agent = create_agent( - model, - tools=tools, - middleware=[validate_response] -) -``` - -::: -:::js -```ts wrap -import { createAgent, type AgentState, AIMessage, RemoveMessage } from "langchain"; -import { REMOVE_ALL_MESSAGES } from "@langchain/langgraph"; - -const validateResponse = (state: AgentState) => { - const messages = state.messages; - const lastMessage = messages.at(-1)?.text; - - if (lastMessage?.toLowerCase().includes("confidential")) { - return { - messages: [ - new RemoveMessage({ id: REMOVE_ALL_MESSAGES }), - ...state.messages.slice(0, -1), - new AIMessage("I cannot share confidential information."), - ], - }; - } - return {}; -}; - -const agent = createAgent({ - model: "openai:gpt-4o", - tools, - postModelHook: validateResponse, -}); -``` -::: - ### Streaming We've seen how the agent can be called with `.invoke` to get a final response. If the agent executes multiple steps, this may take a while. To show intermediate progress, we can stream back messages as they occur. @@ -931,3 +722,27 @@ for await (const chunk of stream) { For more details on streaming, see [Streaming](/oss/langchain/streaming). + +### Middleware + +[Middleware](/oss/langchain/middleware) provides powerful extensibility for customizing agent behavior at different stages of execution. 
You can use middleware to: + +- Process state before the model is called (e.g., message trimming, context injection) +- Modify or validate the model's response (e.g., guardrails, content filtering) +- Handle tool execution errors with custom logic +- Implement dynamic model selection based on state or context +- Add custom logging, monitoring, or analytics + +Middleware integrates seamlessly into the agent's execution graph, allowing you to intercept and modify data flow at key points without changing the core agent logic. + +:::python + +For comprehensive middleware documentation including decorators like `@before_model`, `@after_model`, and `@wrap_tool_call`, see [Middleware](/oss/langchain/middleware). + +::: + +:::js + +For comprehensive middleware documentation including hooks like `beforeModel`, `afterModel`, and `wrapToolCall`, see [Middleware](/oss/langchain/middleware). + +::: diff --git a/src/oss/langchain/context-engineering.mdx b/src/oss/langchain/context-engineering.mdx index 87205d998..1b506830f 100644 --- a/src/oss/langchain/context-engineering.mdx +++ b/src/oss/langchain/context-engineering.mdx @@ -86,106 +86,409 @@ This is not modified by the agent, and typically isn't passed into the LLM, but Examples include: user ID, DB connections -## Functionality our agent needs to support to enable context engineering +## Context engineering with LangChain Now we understand the basic agent loop, the importance of the model you use, and the different types of context that exist. -What functionality does our agent need to support, and how does LangChain's agent support this? - -### Specify custom system prompt - -You can use [`prompt` parameter](/oss/langchain/agents#prompt) to pass in a function that returns a string to use as system prompt - -Use cases: -- Personalize the system prompt with information in session context, long term memory, or runtime context - -### Explicit control over "messages generation" prior to calling model - -You can use [`prompt` parameter](/oss/langchain/agents#prompt) to pass in a function that returns a list of messages - -Use cases: -- Reinforce instructions by dynamically adding an extra system message to the end of the messages sent in, without updating state - -### Access to runtime configuration in "messages generation"/custom system prompt - -You can use [`prompt` parameter](/oss/langchain/agents#prompt) to pass in a function that returns a list of messages or a custom system prompt. -You can access runtime configuration by calling `get_runtime` - -Use cases: -- Use `user_id` passed in to look up user profile, and put it in the system prompt - -### Access to session context in "messages generation"/custom system prompt - -You can use [`prompt` parameter](/oss/langchain/agents#prompt) to pass in a function that returns a list of messages or a custom system prompt. -Session context is passed in with the [`state` parameter](/oss/langchain/short-term-memory#prompt) - -Use cases: -- Use more structured information that the user passes in at runtime (preferences) in the system prompt - -### Access to long term memory in "messages generation"/custom system prompt - -You can use [`prompt` parameter](/oss/langchain/agents#prompt) to pass in a function that returns a list of messages or a custom system prompt. 
-You can access long term memory by calling `get_store` - -Use cases: -- Look up user preferences from long term memory and put them in the system prompt - -### Update session context before model invocation - -You can use [pre_model_hook](/oss/langchain/agents#pre-model-hook) to update state - -Use cases: -- Filter out messages if message list is getting long, save filtered list in state and only use that -- Create a summary of conversation every N messages, save that in state - -### Access to runtime configuration in tools - -You can use `get_runtime` to [access runtime configuration](/oss/langchain/tools#accessing-runtime-context-inside-a-tool) in tools - -Use cases: -- Use `user_id` to look up information inside a tool call - -### Access to session context in tools - -You can add an argument with InjectedState to tools to access [session context in tools](/oss/langchain/short-term-memory#read-short-term-memory-in-a-tool) - -Use cases: -- Pass messages in state to a sub agent - -### Access to long term memory in tools - -You can use `get_store` to [access long term memory in tools](/oss/langchain/long-term-memory#read-long-term-memory-in-tools) - -Use cases: -- Look up memories from long term memory store - -### Update session context in tools - -You can [return state updates](/oss/langchain/short-term-memory#write-short-term-memory-from-tools) with Command from tools - -Use cases: -- Use tools to update a "virtual file system" - -### Update long term memory in tools - -You can use `get_store` to access long term memory and then [update it inside tools](/oss/langchain/long-term-memory#write-long-term-memory-from-tools) - -Use cases: -- Use tools to update user preferences that are stored in long term memory - -### Update tools before model call - -You can pass in a [function to `model` parameter](/oss/langchain/agents#dynamic-model) that attaches custom tools - -Use cases: -- Force the agent to call a certain tool first -- Only give the agent access to certain tools after it calls other tools -- Remove access to tools (forcing the agent to respond) after N iterations - -### Update model to use before model call - -You can pass in a [function to `model` parameter](/oss/langchain/agents#dynamic-model) that returns a custom model - -Use cases: -- Use a model with a longer context window once message history gets long -- Use a smarter model if the original model gets stuck +Let's explore the concrete patterns LangChain provides for context engineering. + +### Managing instructions (system prompts) + +#### Static instructions + +For fixed instructions that don't change, use the `system_prompt` parameter: + +:::python +```python +from langchain.agents import create_agent + +agent = create_agent( + model="openai:gpt-4o", + tools=[...], + system_prompt="You are a customer support agent. Be helpful, concise, and professional." +) +``` +::: + +:::js +```typescript +import { createAgent } from "langchain"; + +const agent = createAgent({ + model: "openai:gpt-4o", + tools: [...], + systemPrompt: "You are a customer support agent. 
Be helpful, concise, and professional.", +}); +``` +::: + +#### Dynamic instructions + +For instructions that depend on context (user profile, preferences, session data), use the `@dynamic_prompt` middleware: + +:::python +```python +from dataclasses import dataclass +from langchain.agents import create_agent +from langchain.agents.middleware import dynamic_prompt, ModelRequest + +@dataclass +class Context: + user_id: str + +@dynamic_prompt +def personalized_prompt(request: ModelRequest) -> str: + # Access runtime context + user_id = request.runtime.context.user_id + + # Look up user preferences from long-term memory + store = request.runtime.store + user_prefs = store.get(("users",), user_id) + + # Access session state + message_count = len(request.state["messages"]) + + base = "You are a helpful assistant." + + if user_prefs: + style = user_prefs.value.get("communication_style", "balanced") + base += f"\nUser prefers {style} responses." + + if message_count > 10: + base += "\nThis is a long conversation - be extra concise." + + return base + +agent = create_agent( + model="openai:gpt-4o", + tools=[...], + middleware=[personalized_prompt], + context_schema=Context +) + +# Use the agent with context +result = agent.invoke( + {"messages": [{"role": "user", "content": "Help me debug this code"}]}, + context=Context(user_id="user_123") +) +``` +::: + +:::js +```typescript +import { z } from "zod"; +import { createAgent, dynamicSystemPromptMiddleware } from "langchain"; + +const contextSchema = z.object({ + userId: z.string(), +}); + +const agent = createAgent({ + model: "openai:gpt-4o", + tools: [...], + contextSchema, + middleware: [ + dynamicSystemPromptMiddleware((state, runtime) => { + const userId = runtime.context.userId; + const messageCount = state.messages.length; + + let base = "You are a helpful assistant."; + + // Add context-specific instructions + if (messageCount > 10) { + base += "\nThis is a long conversation - be extra concise."; + } + + return base; + }), + ], +}); + +// Use the agent with context +const result = await agent.invoke( + { messages: [{ role: "user", content: "Help me debug this code" }] }, + { context: { userId: "user_123" } } +); +``` +::: + + +**When to use each:** +- **Static prompts**: Base instructions that never change +- **Dynamic prompts**: Personalization, A/B testing, context-dependent behavior + + +### Managing conversation context (messages) + +Long conversations can exceed context windows or degrade model performance. 
Use middleware to manage conversation history: + +#### Trimming messages + +:::python +```python +from langchain.agents import create_agent +from langchain.agents.middleware import before_model, AgentState +from langchain.messages import RemoveMessage +from langgraph.graph.message import REMOVE_ALL_MESSAGES +from langgraph.runtime import Runtime + +@before_model +def trim_messages(state: AgentState, runtime: Runtime) -> dict | None: + """Keep only the most recent messages to stay within context window.""" + messages = state["messages"] + + if len(messages) <= 10: + return None # No trimming needed + + # Keep system message + last 8 messages + return { + "messages": [ + RemoveMessage(id=REMOVE_ALL_MESSAGES), + messages[0], # System message + *messages[-8:] # Recent messages + ] + } + +agent = create_agent( + model="openai:gpt-4o", + tools=[...], + middleware=[trim_messages] +) +``` +::: + +:::js +```typescript +import { createMiddleware, RemoveMessage } from "langchain"; +import { REMOVE_ALL_MESSAGES } from "@langchain/langgraph"; + +const trimMessages = createMiddleware({ + name: "TrimMessages", + beforeModel: (state) => { + const messages = state.messages; + + if (messages.length <= 10) { + return; // No trimming needed + } + + // Keep system message + last 8 messages + return { + messages: [ + new RemoveMessage({ id: REMOVE_ALL_MESSAGES }), + messages[0], // System message + ...messages.slice(-8) // Recent messages + ] + }; + }, +}); + +const agent = createAgent({ + model: "openai:gpt-4o", + tools: [...], + middleware: [trimMessages], +}); +``` +::: + +For more sophisticated message management, use the built-in [SummarizationMiddleware](/oss/langchain/middleware#summarization) which automatically summarizes old messages when approaching token limits. + +See [Before model hook](/oss/langchain/agents#before-model-hook) for more examples. + +### Contextual tool execution + +Tools can access runtime context, session state, and long-term memory to make context-aware decisions: + +:::python +```python +from dataclasses import dataclass +from langchain.tools import tool +from langchain.agents import create_agent +from langgraph.runtime import get_runtime +from langgraph.config import get_store +from typing_extensions import Annotated +from langchain.tools import InjectedState + +@dataclass +class Context: + user_id: str + api_key: str + +@tool +def search_documents( + query: str, + state: Annotated[dict, InjectedState] +) -> str: + """Search through documents.""" + # Access runtime context for user-specific configuration + runtime = get_runtime(Context) + user_id = runtime.context.user_id + + # Access long-term memory for user preferences + store = runtime.store + search_prefs = store.get(("preferences", user_id), "search") + + # Access session state + conversation_history = state["messages"] + + # Use all context to perform a better search + results = perform_search(query, user_id, search_prefs, conversation_history) + return f"Found {len(results)} results: {results}" + +agent = create_agent( + model="openai:gpt-4o", + tools=[search_documents], + context_schema=Context +) +``` +::: + +See [Tools](/oss/langchain/tools) for comprehensive examples of accessing state, context, and memory in tools. 
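+
+As a quick end-to-end sketch (assuming the `perform_search` helper above is implemented elsewhere), the runtime context that `get_runtime(Context)` reads inside the tool is supplied when the agent is invoked:
+
+:::python
+```python
+result = agent.invoke(
+    {"messages": [{"role": "user", "content": "Find the Q3 planning docs"}]},
+    # Illustrative values: `Context` is the dataclass defined above
+    context=Context(user_id="user_123", api_key="demo-key"),
+)
+print(result["messages"][-1].content)
+```
+:::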
+ +### Dynamic tool selection + +Control which tools the agent can access based on context, state, or user permissions: + +:::python +```python +from langchain.agents import create_agent +from langchain.agents.middleware import wrap_model_call, ModelRequest, ModelResponse +from typing import Callable + +@wrap_model_call +def permission_based_tools( + request: ModelRequest, + handler: Callable[[ModelRequest], ModelResponse] +) -> ModelResponse: + """Filter tools based on user permissions.""" + user_role = request.runtime.context.get("user_role", "viewer") + + if user_role == "admin": + # Admins get all tools + pass + elif user_role == "editor": + # Editors can't delete + request.tools = [t for t in request.tools if t.name != "delete_data"] + else: + # Viewers get read-only tools + request.tools = [t for t in request.tools if t.name.startswith("read_")] + + return handler(request) + +agent = create_agent( + model="openai:gpt-4o", + tools=[read_data, write_data, delete_data], + middleware=[permission_based_tools] +) +``` +::: + +:::js +```typescript +import { createMiddleware } from "langchain"; + +const permissionBasedTools = createMiddleware({ + name: "PermissionBasedTools", + wrapModelCall: (request, handler) => { + const userRole = request.runtime.context.userRole || "viewer"; + let filteredTools = request.tools; + + if (userRole === "admin") { + // Admins get all tools + } else if (userRole === "editor") { + // Editors can't delete + filteredTools = request.tools.filter(t => t.name !== "delete_data"); + } else { + // Viewers get read-only tools + filteredTools = request.tools.filter(t => t.name.startsWith("read_")); + } + + return handler({ ...request, tools: filteredTools }); + }, +}); +``` +::: + +See [Dynamically selecting tools](/oss/langchain/middleware#dynamically-selecting-tools) for more examples. 
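+
+The `read_data`, `write_data`, and `delete_data` tools referenced in the Python example above are placeholders. If you want to run that snippet, minimal stand-in stubs might look like this (purely illustrative):
+
+:::python
+```python
+from langchain.tools import tool
+
+@tool
+def read_data(query: str) -> str:
+    """Read records that match a query."""
+    return f"Results for: {query}"
+
+@tool
+def write_data(record: str) -> str:
+    """Write a new record."""
+    return f"Saved record: {record}"
+
+@tool
+def delete_data(record_id: str) -> str:
+    """Delete a record by its ID."""
+    return f"Deleted record: {record_id}"
+```
+:::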
+ +### Dynamic model selection + +Switch models based on conversation complexity, context window needs, or cost optimization: + +:::python +```python +from langchain.agents import create_agent +from langchain.agents.middleware import wrap_model_call, ModelRequest, ModelResponse +from langchain.chat_models import init_chat_model +from typing import Callable + +@wrap_model_call +def adaptive_model( + request: ModelRequest, + handler: Callable[[ModelRequest], ModelResponse] +) -> ModelResponse: + """Use different models based on conversation length.""" + message_count = len(request.messages) + + if message_count > 20: + # Long conversation - use model with larger context window + request.model = init_chat_model("anthropic:claude-sonnet-4-5-20250929") + elif message_count > 10: + # Medium conversation - use mid-tier model + request.model = init_chat_model("openai:gpt-4o") + else: + # Short conversation - use efficient model + request.model = init_chat_model("openai:gpt-4o-mini") + + return handler(request) + +agent = create_agent( + model="openai:gpt-4o-mini", # Default model + tools=[...], + middleware=[adaptive_model] +) +``` +::: + +:::js +```typescript +import { createMiddleware, initChatModel } from "langchain"; + +const adaptiveModel = createMiddleware({ + name: "AdaptiveModel", + wrapModelCall: (request, handler) => { + const messageCount = request.messages.length; + let model; + + if (messageCount > 20) { + // Long conversation - use model with larger context window + model = initChatModel("anthropic:claude-sonnet-4-5-20250929"); + } else if (messageCount > 10) { + // Medium conversation - use mid-tier model + model = initChatModel("openai:gpt-4o"); + } else { + // Short conversation - use efficient model + model = initChatModel("openai:gpt-4o-mini"); + } + + return handler({ ...request, model }); + }, +}); +``` +::: + +See [Dynamic model](/oss/langchain/agents#dynamic-model) for more examples. + +## Best practices + +1. **Start simple** - Begin with static prompts and tools, add dynamics only when needed +2. **Test incrementally** - Add one context engineering feature at a time +3. **Monitor performance** - Track model calls, token usage, and latency +4. **Use built-in middleware** - Leverage [SummarizationMiddleware](/oss/langchain/middleware#summarization), [LLMToolSelectorMiddleware](/oss/langchain/middleware#llm-tool-selector), etc. +5. 
**Document your context strategy** - Make it clear what context is being passed and why + +## Related resources + +- [Middleware](/oss/langchain/middleware) - Complete middleware guide +- [Tools](/oss/langchain/tools) - Tool creation and context access +- [Memory](/oss/concepts/memory) - Short-term and long-term memory patterns +- [Agents](/oss/langchain/agents) - Core agent concepts diff --git a/src/oss/langchain/long-term-memory.mdx b/src/oss/langchain/long-term-memory.mdx index 5197f4c3f..f0230eb2e 100644 --- a/src/oss/langchain/long-term-memory.mdx +++ b/src/oss/langchain/long-term-memory.mdx @@ -105,7 +105,6 @@ from dataclasses import dataclass from langchain_core.runnables import RunnableConfig from langchain.agents import create_agent -from langgraph.config import get_store from langgraph.runtime import get_runtime from langgraph.store.memory import InMemoryStore diff --git a/src/oss/langchain/middleware.mdx b/src/oss/langchain/middleware.mdx index 49a51fb3b..273557c8d 100644 --- a/src/oss/langchain/middleware.mdx +++ b/src/oss/langchain/middleware.mdx @@ -15,7 +15,7 @@ The core agent loop involves calling a model, letting it choose tools to execute Core agent loop diagram @@ -864,6 +864,100 @@ const agent = createAgent({ Build custom middleware by implementing hooks that run at specific points in the agent execution flow. +:::python + +You can create middleware in two ways: +1. **Decorator-based** - Quick and simple for single-hook middleware +2. **Class-based** - More powerful for complex middleware with multiple hooks + +## Decorator-based middleware + +For simple middleware that only needs a single hook, decorators provide the quickest way to add functionality: + +```python +from langchain.agents.middleware import before_model, after_model, wrap_model_call +from langchain.agents.middleware import AgentState, ModelRequest, ModelResponse +from langgraph.runtime import Runtime +from typing import Any, Callable + +# Node-style: logging before model calls +@before_model +def log_before_model(state: AgentState, runtime: Runtime) -> dict[str, Any] | None: + print(f"About to call model with {len(state['messages'])} messages") + return None + +# Node-style: validation after model calls +@after_model(can_jump_to=["end"]) +def validate_output(state: AgentState, runtime: Runtime) -> dict[str, Any] | None: + last_message = state["messages"][-1] + if "BLOCKED" in last_message.content: + return { + "messages": [AIMessage("I cannot respond to that request.")], + "jump_to": "end" + } + return None + +# Wrap-style: retry logic +@wrap_model_call +def retry_model( + request: ModelRequest, + handler: Callable[[ModelRequest], ModelResponse], +) -> ModelResponse: + for attempt in range(3): + try: + return handler(request) + except Exception as e: + if attempt == 2: + raise + print(f"Retry {attempt + 1}/3 after error: {e}") + +# Wrap-style: dynamic prompts +@dynamic_prompt +def personalized_prompt(request: ModelRequest) -> str: + user_id = request.runtime.context.get("user_id", "guest") + return f"You are a helpful assistant for user {user_id}. Be concise and friendly." 
+ +# Use decorators in agent +agent = create_agent( + model="openai:gpt-4o", + middleware=[log_before_model, validate_output, retry_model, personalized_prompt], + tools=[...], +) +``` + +### Available decorators + +**Node-style** (run at specific execution points): +- `@before_agent` - Before agent starts (once per invocation) +- `@before_model` - Before each model call +- `@after_model` - After each model response +- `@after_agent` - After agent completes (once per invocation) + +**Wrap-style** (intercept and control execution): +- `@wrap_model_call` - Around each model call +- `@wrap_tool_call` - Around each tool call + +**Convenience decorators**: +- `@dynamic_prompt` - Generates dynamic system prompts (equivalent to `@wrap_model_call` that modifies the prompt) + +### When to use decorators + + + + - You need a single hook + - No complex configuration + + + - Multiple hooks needed + - Complex configuration + - Reusable across projects (config on init) + + + +::: + +## Class-based middleware + ### Two hook styles @@ -1279,57 +1373,6 @@ await agent.invoke( ``` ::: - -:::python - -### Decorator-based middleware - -For simple middleware that only needs a single hook, use decorator shortcuts: - -```python -from langchain.agents.middleware import before_model, after_model, wrap_model_call -from langchain.agents.middleware import AgentState, ModelRequest, ModelResponse -from langgraph.runtime import Runtime -from typing import Any, Callable - -# Node-style decorator -@before_model -def log_before_model(state: AgentState, runtime: Runtime) -> dict[str, Any] | None: - print(f"About to call model with {len(state['messages'])} messages") - return None - -# Wrap-style decorator -@wrap_model_call -def retry_model( - request: ModelRequest, - handler: Callable[[ModelRequest], ModelResponse], -) -> ModelResponse: - for attempt in range(3): - try: - return handler(request) - except Exception: - if attempt == 2: - raise - return handler(request) # This line is unreachable but satisfies type checker - -# Use decorators in agent -agent = create_agent( - model="openai:gpt-4o", - middleware=[log_before_model, retry_model], - tools=[...], -) -``` - -Available decorators: -- `@before_agent` -- `@before_model` -- `@after_model` -- `@after_agent` -- `@wrap_model_call` -- `@wrap_tool_call` -- `@dynamic_prompt` - Convenience for dynamic system prompts -::: - ### Execution order When using multiple middleware, understanding execution order is important: diff --git a/src/oss/langchain/rag.mdx b/src/oss/langchain/rag.mdx index bb6b19fed..751b30f5e 100644 --- a/src/oss/langchain/rag.mdx +++ b/src/oss/langchain/rag.mdx @@ -892,6 +892,8 @@ class State(AgentState): class RetrieveDocumentsMiddleware(AgentMiddleware[State]): + state_schema = State + def before_model(self, state: AgentState) -> dict[str, Any] | None: last_message = state["messages"][-1] retrieved_docs = vector_store.similarity_search(last_message.text) @@ -913,7 +915,6 @@ agent = create_agent( llm, tools=[], middleware=[RetrieveDocumentsMiddleware()], - state_schema=State, ) ``` ::: diff --git a/src/oss/langchain/runtime.mdx b/src/oss/langchain/runtime.mdx index d3eb55cf2..969a22cfa 100644 --- a/src/oss/langchain/runtime.mdx +++ b/src/oss/langchain/runtime.mdx @@ -20,7 +20,7 @@ LangGraph exposes a @[Runtime] object with the following information: 2. **Store**: a @[BaseStore] instance used for [long-term memory](/oss/langchain/long-term-memory) 3. 
**Stream writer**: an object used for streaming information via the `"custom"` stream mode -You can access the runtime information within [tools](#inside-tools), [prompt](#inside-prompt), and [pre and post model hooks](#inside-pre-and-post-model-hooks). +You can access the runtime information within [tools](#inside-tools) and [middleware](#inside-middleware). ## Access @@ -145,34 +145,48 @@ const fetchUserEmailPreferences = tool( ``` ::: -### Inside prompt +### Inside middleware + +You can access runtime information in middleware to create dynamic prompts, modify messages, or control agent behavior based on user context. :::python -Use the @[get_runtime] function from `langgraph.runtime` to access the @[Runtime] object inside a prompt function. +Use `request.runtime` to access the @[Runtime] object inside middleware decorators. The runtime object is available in the `ModelRequest` parameter passed to middleware functions. ```python from dataclasses import dataclass from langchain.messages import AnyMessage -from langchain.agents import create_agent -from langgraph.runtime import get_runtime # [!code highlight] +from langchain.agents import create_agent, AgentState +from langchain.agents.middleware import dynamic_prompt, ModelRequest, before_model, after_model +from langgraph.runtime import Runtime @dataclass class Context: user_name: str -from langchain.agents.middleware import dynamic_prompt, ModelRequest - +# Dynamic prompts @dynamic_prompt def dynamic_system_prompt(request: ModelRequest) -> str: - user_name = request.runtime.context["user_name"] + user_name = request.runtime.context.user_name # [!code highlight] system_prompt = f"You are a helpful assistant. Address the user as {user_name}." return system_prompt +# Before model hook +@before_model +def log_before_model(state: AgentState, runtime: Runtime[Context]) -> dict | None: # [!code highlight] + print(f"Processing request for user: {runtime.context.user_name}") # [!code highlight] + return None + +# After model hook +@after_model +def log_after_model(state: AgentState, runtime: Runtime[Context]) -> dict | None: # [!code highlight] + print(f"Completed request for user: {runtime.context.user_name}") # [!code highlight] + return None + agent = create_agent( model="openai:gpt-5-nano", tools=[...], - middleware=[dynamic_system_prompt], + middleware=[dynamic_system_prompt, log_before_model, log_after_model], # [!code highlight] context_schema=Context ) @@ -183,36 +197,52 @@ agent.invoke( ``` ::: :::js -Use the `runtime` parameter to access the @[Runtime] object inside a prompt function. +Use the `runtime` parameter to access the @[Runtime] object inside middleware. 
```ts import { z } from "zod"; -import { createAgent, type AgentState, SystemMessage } from "langchain"; +import { createAgent, createMiddleware, type AgentState, SystemMessage } from "langchain"; import { type Runtime } from "@langchain/langgraph"; // [!code highlight] const contextSchema = z.object({ userName: z.string(), }); -const prompt = ( - state: AgentState, - runtime: Runtime> // [!code highlight] -) => { - const userName = runtime.context?.userName; // [!code highlight] - if (!userName) { - throw new Error("userName is required"); +// Dynamic prompt middleware +const dynamicPromptMiddleware = createMiddleware({ + name: "DynamicPrompt", + beforeModel: (state: AgentState, runtime: Runtime>) => { // [!code highlight] + const userName = runtime.context?.userName; // [!code highlight] + if (!userName) { + throw new Error("userName is required"); + } + + const systemMsg = `You are a helpful assistant. Address the user as ${userName}.`; + return { + messages: [new SystemMessage(systemMsg), ...state.messages] + }; } +}); - const systemMsg = `You are a helpful assistant. Address the user as ${userName}.`; // [!code highlight] - return [new SystemMessage(systemMsg), ...state.messages]; -}; +// Logging middleware +const loggingMiddleware = createMiddleware({ + name: "Logging", + beforeModel: (state: AgentState, runtime: Runtime>) => { // [!code highlight] + console.log(`Processing request for user: ${runtime.context?.userName}`); // [!code highlight] + return; + }, + afterModel: (state: AgentState, runtime: Runtime>) => { // [!code highlight] + console.log(`Completed request for user: ${runtime.context?.userName}`); // [!code highlight] + return; + } +}); const agent = createAgent({ model: "openai:gpt-4o", tools: [ /* ... */ ], - prompt, + middleware: [dynamicPromptMiddleware, loggingMiddleware], // [!code highlight] contextSchema, }); @@ -222,86 +252,3 @@ const result = await agent.invoke( ); ``` ::: - -### Inside pre and post model hooks - -:::python -To access the underlying graph runtime information in a pre or post model hook, you can: - -1. Use the @[get_runtime] function from `langgraph.runtime` to access the @[Runtime] object inside the hook -2. Inject the @[Runtime] directly via the hook signature - -This above options are purely preferential and not functionally different. - - - - ```python - from langgraph.runtime import get_runtime # [!code highlight] - - def pre_model_hook(state: State) -> State: - runtime = get_runtime(Context) # [!code highlight] - ... - ``` - - - ```python - from langgraph.runtime import Runtime # [!code highlight] - - def pre_model_hook(state: State, runtime: Runtime[Context]): # [!code highlight] - ... - ``` - - -::: - -:::js -Use the `runtime` parameter to access the @[Runtime] object inside a pre or post model hook. - -```ts -import { z } from "zod"; -import { type Runtime } from "@langchain/langgraph"; // [!code highlight] -import { createAgent, type AgentState } from "langchain"; - -const contextSchema = z.object({ - userName: z.string(), -}); - -const preModelHook = ( - state: AgentState, - runtime: Runtime> // [!code highlight] -) => { - const userName = runtime.context?.userName; // [!code highlight] - if (!userName) { - throw new Error("userName is required"); - } - - return { - // ... - }; -}; - -const postModelHook = ( - state: AgentState, - runtime: Runtime> // [!code highlight] -) => { - const userName = runtime.context?.userName; // [!code highlight] - if (!userName) { - throw new Error("userName is required"); - } - - return { - // ... 
- }; -}; - -const agent = createAgent({ - model: "openai:gpt-4o-mini", - tools: [ - /* ... */ - ], - contextSchema, - preModelHook, - postModelHook, -}); -``` -::: diff --git a/src/oss/langchain/short-term-memory.mdx b/src/oss/langchain/short-term-memory.mdx index 519d3991a..0e8950ff0 100644 --- a/src/oss/langchain/short-term-memory.mdx +++ b/src/oss/langchain/short-term-memory.mdx @@ -105,41 +105,67 @@ const checkpointer = PostgresSaver.fromConnString(DB_URI); By default, agents use `AgentState` to manage short term memory, specifically the conversation history via a `messages` key. -Users can subclass `AgentState` to add additional fields to the state. - -This custom state can then be accessed via tools and dynamic prompt / model functions. +You can extend `AgentState` to add additional fields. Custom state schemas are defined in middleware using the `state_schema` attribute. :::python ```python from langchain.agents import create_agent, AgentState +from langchain.agents.middleware import AgentMiddleware from langgraph.checkpoint.memory import InMemorySaver + class CustomAgentState(AgentState): # [!code highlight] user_id: str # [!code highlight] + preferences: dict # [!code highlight] + +class StateExtensionMiddleware(AgentMiddleware[CustomAgentState]): + state_schema = CustomAgentState # [!code highlight] agent = create_agent( "openai:gpt-5", [get_user_info], - state_schema=CustomAgentState, # [!code highlight] + middleware=[StateExtensionMiddleware()], # [!code highlight] checkpointer=InMemorySaver(), ) + +# Custom state can be passed in invoke +result = agent.invoke({ + "messages": [{"role": "user", "content": "Hello"}], + "user_id": "user_123", # [!code highlight] + "preferences": {"theme": "dark"} # [!code highlight] +}) ``` ::: :::js ```typescript import { z } from "zod"; -import { createAgent } from "langchain"; -import { MemorySaver } from "@langchain/langgraph"; -const stateSchema = z.object({ // [!code highlight] - messages: z.array(z.any()), // [!code highlight] -}); // [!code highlight] +import { createAgent, createMiddleware } from "langchain"; +import { MessagesZodState, MemorySaver } from "@langchain/langgraph"; + +const customStateSchema = z.object({ // [!code highlight] + messages: MessagesZodState.shape.messages, // [!code highlight] + userId: z.string(), // [!code highlight] + preferences: z.record(z.string(), z.any()), // [!code highlight] +}); // [!code highlight] + +const stateExtensionMiddleware = createMiddleware({ + name: "StateExtension", + stateSchema: customStateSchema, // [!code highlight] +}); const checkpointer = new MemorySaver(); const agent = createAgent({ model: "openai:gpt-5", tools: [], - stateSchema, // [!code highlight] + middleware: [stateExtensionMiddleware] as const, // [!code highlight] checkpointer, }); + +// Custom state can be passed in invoke +const result = await agent.invoke({ + messages: [{ role: "user", content: "Hello" }], + userId: "user_123", // [!code highlight] + preferences: { theme: "dark" }, // [!code highlight] +}); ``` ::: @@ -171,36 +197,40 @@ Most LLMs have a maximum supported context window (denominated in tokens). One way to decide when to truncate messages is to count the tokens in the message history and truncate whenever it approaches that limit. If you're using LangChain, you can use the trim messages utility and specify the number of tokens to keep from the list, as well as the `strategy` (e.g., keep the last `maxTokens`) to use for handling the boundary. 
:::python -To trim message history in an agent, use @[`pre_model_hook`][create_agent] with the [`trim_messages`](https://python.langchain.com/api_reference/core/messages/langchain_core.messages.utils.trim_messages.html) function: +To trim message history in an agent, use the `@before_model` middleware decorator: ```python -from langchain_core.messages.utils import trim_messages, count_tokens_approximately -from langchain.messages import BaseMessage +from langchain.messages import RemoveMessage +from langgraph.graph.message import REMOVE_ALL_MESSAGES from langgraph.checkpoint.memory import InMemorySaver -from langchain.agents import create_agent -from langchain_core.runnables import RunnableConfig +from langchain.agents import create_agent, AgentState +from langchain.agents.middleware import before_model +from langgraph.runtime import Runtime +from typing import Any -def pre_model_hook(state) -> dict[str, list[BaseMessage]]: - """ - This function will be called prior to every llm call to prepare the messages for the llm. - """ - trimmed_messages = trim_messages( - state["messages"], - strategy="last", - token_counter=count_tokens_approximately, - max_tokens=384, - start_on="human", - end_on=("human", "tool"), - ) - return {"llm_input_messages": trimmed_messages} +@before_model +def trim_messages(state: AgentState, runtime: Runtime) -> dict[str, Any] | None: + """Keep only the last few messages to fit context window.""" + messages = state["messages"] + if len(messages) <= 3: + return None # No changes needed + + first_msg = messages[0] + recent_messages = messages[-3:] if len(messages) % 2 == 0 else messages[-4:] + new_messages = [first_msg] + recent_messages + + return { + "messages": [ + RemoveMessage(id=REMOVE_ALL_MESSAGES), + *new_messages + ] + } -checkpointer = InMemorySaver() agent = create_agent( - "openai:gpt-5-nano", - tools=[], - pre_model_hook=pre_model_hook, - checkpointer=checkpointer, + model, + tools=tools, + middleware=[trim_messages] ) config: RunnableConfig = {"configurable": {"thread_id": "1"}} @@ -322,23 +352,28 @@ const deleteMessages = (state) => { ```python from langchain.messages import RemoveMessage -from langchain.agents import create_agent +from langchain.agents import create_agent, AgentState +from langchain.agents.middleware import after_model from langgraph.checkpoint.memory import InMemorySaver +from langgraph.runtime import Runtime from langchain_core.runnables import RunnableConfig -def delete_messages(state): +@after_model +def delete_old_messages(state: AgentState, runtime: Runtime) -> dict | None: + """Remove old messages to keep conversation manageable.""" messages = state["messages"] if len(messages) > 2: # remove the earliest two messages return {"messages": [RemoveMessage(id=m.id) for m in messages[:2]]} + return None agent = create_agent( "openai:gpt-5-nano", tools=[], - prompt="Please be concise and to the point.", - post_model_hook=delete_messages, + system_prompt="Please be concise and to the point.", + middleware=[delete_old_messages], checkpointer=InMemorySaver(), ) @@ -442,40 +477,27 @@ Because of this, some applications benefit from a more sophisticated approach of :::python -To summarize message history in an agent, use @[`pre_model_hook`][create_agent] with a prebuilt [`SummarizationNode`](https://langchain-ai.github.io/langmem/reference/short_term/#langmem.short_term.SummarizationNode) abstraction: - -{/* TODO: FIX THIS EXAMPLE, NOT ABLE TO RUN */} +To summarize message history in an agent, use the built-in 
[`SummarizationMiddleware`](/oss/langchain/middleware#summarization): ```python -from langmem.short_term import SummarizationNode, RunningSummary -from langchain_core.messages.utils import count_tokens_approximately -from langchain.agents import create_agent, AgentState +from langchain.agents import create_agent +from langchain.agents.middleware import SummarizationMiddleware from langgraph.checkpoint.memory import InMemorySaver -from langchain_openai import ChatOpenAI from langchain_core.runnables import RunnableConfig -model = ChatOpenAI(model="gpt-4o-mini") - -summarization_node = SummarizationNode( - token_counter=count_tokens_approximately, - model=model, - max_tokens=384, - max_summary_tokens=128, - output_messages_key="llm_input_messages", -) - -class State(AgentState): - # Added for the SummarizationNode to be able to keep track of the running summary information - context: dict[str, RunningSummary] - -checkpointer = InMemorySaver() # [!code highlight] +checkpointer = InMemorySaver() agent = create_agent( - model=model, + model="openai:gpt-4o", tools=[], - pre_model_hook=summarization_node, - state_schema=State, - checkpointer=checkpointer, # [!code highlight] + middleware=[ + SummarizationMiddleware( + model="openai:gpt-4o-mini", + max_tokens_before_summary=4000, # Trigger summarization at 4000 tokens + messages_to_keep=20, # Keep last 20 messages after summary + ) + ], + checkpointer=checkpointer, ) config: RunnableConfig = {"configurable": {"thread_id": "1"}} @@ -484,23 +506,54 @@ agent.invoke({"messages": "write a short poem about cats"}, config) agent.invoke({"messages": "now do the same but for dogs"}, config) final_response = agent.invoke({"messages": "what's my name?"}, config) -print(final_response.keys()) - final_response["messages"][-1].pretty_print() -print("\nSummary:", final_response["context"]["running_summary"].summary) +""" +================================== Ai Message ================================== + +Your name is Bob! +""" ``` + +See [SummarizationMiddleware](/oss/langchain/middleware#summarization) for more configuration options. ::: :::js -TODO -::: +To summarize message history in an agent, use the built-in [`summarizationMiddleware`](/oss/langchain/middleware#summarization): -## Access +```typescript +import { createAgent, summarizationMiddleware } from "langchain"; +import { MemorySaver } from "@langchain/langgraph"; -You can access the short-term memory of an agent in a few different ways: +const checkpointer = new MemorySaver(); -* [Tools](#tools) -* [Pre model hook](#pre-model-hook) -* [Post model hook](#post-model-hook) +const agent = createAgent({ + model: "openai:gpt-4o", + tools: [], + middleware: [ + summarizationMiddleware({ + model: "openai:gpt-4o-mini", + maxTokensBeforeSummary: 4000, + messagesToKeep: 20, + }), + ], + checkpointer, +}); + +const config = { configurable: { thread_id: "1" } }; +await agent.invoke({ messages: "hi, my name is bob" }, config); +await agent.invoke({ messages: "write a short poem about cats" }, config); +await agent.invoke({ messages: "now do the same but for dogs" }, config); +const finalResponse = await agent.invoke({ messages: "what's my name?" }, config); + +console.log(finalResponse.messages.at(-1)?.content); +// Your name is Bob! +``` + +See [summarizationMiddleware](/oss/langchain/middleware#summarization) for more configuration options. 
+::: + +## Access memory + +You can access and modify the short-term memory (state) of an agent in several ways: ### Tools @@ -708,7 +761,7 @@ await agent.invoke( ### Prompt -Access short term memory (state) in a dynamic prompt function by injecting the agent's state into the prompt function signature. +Access short term memory (state) in middleware to create dynamic prompts based on conversation history or custom state fields. :::python ```python @@ -802,7 +855,6 @@ const agent = createAgent({ `You are a helpful assistant. Address the user as ${config.context?.userName}.` ), ...state.messages, - ]; }, }); @@ -845,110 +897,174 @@ for (const message of result.messages) { * // ... * } * AIMessage { - * "content": "John Smith, here’s the latest: The weather in San Francisco is always sunny!\n\nIf you’d like more details (temperature, wind, humidity) or a forecast for the next few days, I can pull that up. What would you like?", + * "content": "John Smith, here's the latest: The weather in San Francisco is always sunny!\n\nIf you'd like more details (temperature, wind, humidity) or a forecast for the next few days, I can pull that up. What would you like?", * // ... * } */ ``` ::: -### Pre model hook +### Before model + +Access short term memory (state) in `@before_model` middleware to process messages before model calls. -Access short term memory (state) in a pre model hook by injecting the agent's state into the hook signature. + +```mermaid +%%{ + init: { + "fontFamily": "monospace", + "flowchart": { + "curve": "basis" + }, + "themeVariables": {"edgeLabelBackground": "transparent"} + } +}%% +graph TD + S(["\_\_start\_\_"]) + PRE(before_model) + MODEL(model) + TOOLS(tools) + END(["\_\_end\_\_"]) + S --> PRE + PRE --> MODEL + MODEL -.-> TOOLS + MODEL -.-> END + TOOLS --> PRE + classDef blueHighlight fill:#0a1c25,stroke:#0a455f,color:#bae6fd; + class S blueHighlight; + class END blueHighlight; +``` :::python ```python -from langchain_core.messages.utils import trim_messages, count_tokens_approximately -from langchain.messages import BaseMessage +from langchain.messages import RemoveMessage +from langgraph.graph.message import REMOVE_ALL_MESSAGES from langgraph.checkpoint.memory import InMemorySaver from langchain.agents import create_agent, AgentState +from langchain.agents.middleware import before_model +from langgraph.runtime import Runtime +from typing import Any + +@before_model +def trim_messages(state: AgentState, runtime: Runtime) -> dict[str, Any] | None: + """Keep only the last few messages to fit context window.""" + messages = state["messages"] + if len(messages) <= 3: + return None # No changes needed -def pre_model_hook(state: AgentState) -> dict[str, list[BaseMessage]]: - """ - This function will be called prior to every llm call to prepare the messages for the llm. 
- """ - trimmed_messages = trim_messages( - state["messages"], - strategy="last", - token_counter=count_tokens_approximately, - max_tokens=384, - start_on="human", - end_on=("human", "tool"), - ) - return {"llm_input_messages": trimmed_messages} + first_msg = messages[0] + recent_messages = messages[-3:] if len(messages) % 2 == 0 else messages[-4:] + new_messages = [first_msg] + recent_messages + + return { + "messages": [ + RemoveMessage(id=REMOVE_ALL_MESSAGES), + *new_messages + ] + } agent = create_agent( - model="openai:gpt-5-nano", - tools=[], - pre_model_hook=pre_model_hook, - checkpointer=InMemorySaver(), + model, + tools=tools, + middleware=[trim_messages] ) -result = agent.invoke({"messages": "hi, my name is bob"}, {"configurable": {"thread_id": "1"}}) -print(result["messages"][-1].content) +config: RunnableConfig = {"configurable": {"thread_id": "1"}} + +agent.invoke({"messages": "hi, my name is bob"}, config) +agent.invoke({"messages": "write a short poem about cats"}, config) +agent.invoke({"messages": "now do the same but for dogs"}, config) +final_response = agent.invoke({"messages": "what's my name?"}, config) + +final_response["messages"][-1].pretty_print() +""" +================================== Ai Message ================================== + +Your name is Bob. You told me that earlier. +If you'd like me to call you a nickname or use a different name, just say the word. +""" ``` ::: :::js ```typescript -import { - createAgent, - type AgentState, - trimMessages, - type BaseMessage, -} from "langchain"; - -const preModelHook = async (state: AgentState) => { - return { - messages: await trimMessages(state.messages, { - maxTokens: 384, - strategy: "last", - startOn: "human", - endOn: ["human", "tool"], - tokenCounter: (msgs: BaseMessage[]) => msgs.length, - }), - }; -}; +import { RemoveMessage } from "@langchain/core/messages"; +import { createAgent, createMiddleware, trimMessages, type AgentState } from "langchain"; + +const trimMessageHistory = createMiddleware({ + name: "TrimMessages", + beforeModel: async (state) => { + const trimmed = await trimMessages(state.messages, { + maxTokens: 384, + strategy: "last", + startOn: "human", + endOn: ["human", "tool"], + tokenCounter: (msgs) => msgs.length, + }); + return { messages: trimmed }; + }, +}); const agent = createAgent({ model: "openai:gpt-5-nano", tools: [], - preModelHook, + middleware: [trimMessageHistory], }); - -const result = await agent.invoke( - { - messages: [{ role: "user", content: "hi, my name is bob" }], - }, - { - context: { thread_id: "1" }, - } -); -console.log(result.messages.at(-1)?.content); ``` ::: -### Post model hook +### After model -Access short term memory (state) in a post model hook by injecting the agent's state into the hook signature. +Access short term memory (state) in `@after_model` middleware to process messages after model calls. 
+ +```mermaid +%%{ + init: { + "fontFamily": "monospace", + "flowchart": { + "curve": "basis" + }, + "themeVariables": {"edgeLabelBackground": "transparent"} + } +}%% +graph TD + S(["\_\_start\_\_"]) + MODEL(model) + POST(after_model) + TOOLS(tools) + END(["\_\_end\_\_"]) + S --> MODEL + MODEL --> POST + POST -.-> END + POST -.-> TOOLS + TOOLS --> MODEL + classDef blueHighlight fill:#0a1c25,stroke:#0a455f,color:#bae6fd; + class S blueHighlight; + class END blueHighlight; + class POST greenHighlight; +``` :::python ```python +from langchain.messages import RemoveMessage +from langgraph.checkpoint.memory import InMemorySaver from langchain.agents import create_agent, AgentState +from langchain.agents.middleware import after_model +from langgraph.runtime import Runtime -STOP_WORDS = ["password", "secret"] - -def validate_response(state: AgentState) -> dict[str, list[BaseMessage]]: - """Confirm the response doesn't have any content that is in the stop words list.""" +@after_model +def validate_response(state: AgentState, runtime: Runtime) -> dict | None: + """Remove messages containing sensitive words.""" + STOP_WORDS = ["password", "secret"] last_message = state["messages"][-1] if any(word in last_message.content for word in STOP_WORDS): return {"messages": [RemoveMessage(id=last_message.id)]} - return {} + return None agent = create_agent( model="openai:gpt-5-nano", tools=[], - post_model_hook=validate_response, + middleware=[validate_response], checkpointer=InMemorySaver(), ) ``` @@ -956,25 +1072,27 @@ agent = create_agent( :::js ```typescript import { RemoveMessage } from "@langchain/core/messages"; -import { createAgent, type AgentState } from "langchain"; +import { createAgent, createMiddleware, type AgentState } from "langchain"; -function validateResponse(state: AgentState) { +const validateResponse = createMiddleware({ + name: "ValidateResponse", + afterModel: (state) => { const lastMessage = state.messages.at(-1)?.content; - if ( - typeof lastMessage === "string" && - lastMessage.toLowerCase().includes("confidential") - ) { - return { + if (typeof lastMessage === "string" && lastMessage.toLowerCase().includes("confidential")) { + return { messages: [new RemoveMessage({ id: "all" }), ...state.messages], - }; + }; } - return {}; -} + return; + }, +}); const agent = createAgent({ - model: "openai:gpt-5", + model: "openai:gpt-5-nano", tools: [], - postModelHook: validateResponse, + middleware: [validateResponse], }); ``` ::: + + diff --git a/src/oss/langchain/tools.mdx b/src/oss/langchain/tools.mdx index 1fbb0c5f7..af75ced2d 100644 --- a/src/oss/langchain/tools.mdx +++ b/src/oss/langchain/tools.mdx @@ -136,363 +136,375 @@ Define complex inputs with Pydantic models or JSON schemas: ::: -## State, context, and memory +## Accessing Context + + +**Why this matters:** Tools are most powerful when they can access agent state, runtime context, and long-term memory. This enables tools to make context-aware decisions, personalize responses, and maintain information across conversations. + + +Tools can access different types of data: + +- **State** - Mutable data that flows through execution (messages, counters, custom fields) +- **Runtime** - Access to context, memory (store), and streaming capabilities via `get_runtime()` + +### State + +Use `InjectedState` to access and modify the agent's state during execution. State includes messages, custom fields, and any data your tools need to track. 
+ + +**`InjectedState`**: An annotation that allows tools to access the current graph state without exposing it to the LLM. This lets tools read information like message history or custom state fields while keeping the tool's schema simple. + - :::python - - - **`state`**: The agent maintains state throughout its execution - this includes messages, custom fields, and any data your tools need to track. State flows through the graph and can be accessed and modified by tools. - - - - **`InjectedState`**: An annotation that allows tools to access the current graph state without exposing it to the LLM. This lets tools read information like message history or custom state fields while keeping the tool's schema simple. - - - Tools can access the current graph state using the `InjectedState` annotation: - - ```python wrap - from typing_extensions import Annotated - from langchain.tools import InjectedState - - # Access the current conversation state - @tool - def summarize_conversation( - state: Annotated[dict, InjectedState] - ) -> str: - """Summarize the conversation so far.""" - messages = state["messages"] - - human_msgs = sum(1 for m in messages if m.__class__.__name__ == "HumanMessage") - ai_msgs = sum(1 for m in messages if m.__class__.__name__ == "AIMessage") - tool_msgs = sum(1 for m in messages if m.__class__.__name__ == "ToolMessage") - - return f"Conversation has {human_msgs} user messages, {ai_msgs} AI responses, and {tool_msgs} tool results" - - # Access custom state fields - @tool - def get_user_preference( - pref_name: str, - preferences: Annotated[dict, InjectedState("user_preferences")] # InjectedState parameters are not visible to the model - ) -> str: - """Get a user preference value.""" - return preferences.get(pref_name, "Not set") - ``` - - - State-injected arguments are hidden from the model. For the example above, the model only sees `pref_name` in the tool schema - `preferences` is *not* included in the request. - - - - - - **`Command`**: A special return type that tools can use to update the agent's state or control the graph's execution flow. Instead of just returning data, tools can return `Command`s to modify state or direct the agent to specific nodes. - - - Use a tool that returns a `Command` to update the agent state: - - ```python wrap - from langgraph.types import Command - from langchain.messages import RemoveMessage - from langgraph.graph.message import REMOVE_ALL_MESSAGES - from langchain.tools import tool, InjectedToolCallId - from typing_extensions import Annotated - - # Update the conversation history by removing all messages - @tool - def clear_conversation() -> Command: - """Clear the conversation history.""" - - return Command( - update={ - "messages": [RemoveMessage(id=REMOVE_ALL_MESSAGES)], - } - ) - - # Update the user_name in the agent state - @tool - def update_user_name( - new_name: str, - tool_call_id: Annotated[dict, InjectedToolCallId] - ) -> Command: - """Update the user's name.""" - return Command(update={"user_name": new_name}) - ``` - -::: +**Accessing state:** + +Tools can access the current graph state using the `InjectedState` annotation: - - - **`runtime`**: The execution environment of your agent, containing immutable configuration and contextual data that persists throughout the agent's execution (e.g., user IDs, session details, or application-specific configuration). 
- - - :::python - Tools can access an agent's runtime context through `get_runtime`: - - ```python wrap - from dataclasses import dataclass - from langchain_openai import ChatOpenAI - from langchain.agents import create_agent - from langchain.tools import tool - from langgraph.runtime import get_runtime - - USER_DATABASE = { - "user123": { - "name": "Alice Johnson", - "account_type": "Premium", - "balance": 5000, - "email": "alice@example.com" - }, - "user456": { - "name": "Bob Smith", - "account_type": "Standard", - "balance": 1200, - "email": "bob@example.com" - } +```python wrap +from typing_extensions import Annotated +from langchain.tools import InjectedState + +# Access the current conversation state +@tool +def summarize_conversation( + state: Annotated[dict, InjectedState] +) -> str: + """Summarize the conversation so far.""" + messages = state["messages"] + + human_msgs = sum(1 for m in messages if m.__class__.__name__ == "HumanMessage") + ai_msgs = sum(1 for m in messages if m.__class__.__name__ == "AIMessage") + tool_msgs = sum(1 for m in messages if m.__class__.__name__ == "ToolMessage") + + return f"Conversation has {human_msgs} user messages, {ai_msgs} AI responses, and {tool_msgs} tool results" + +# Access custom state fields +@tool +def get_user_preference( + pref_name: str, + preferences: Annotated[dict, InjectedState("user_preferences")] # InjectedState parameters are not visible to the model +) -> str: + """Get a user preference value.""" + return preferences.get(pref_name, "Not set") +``` + + +State-injected arguments are hidden from the model. For the example above, the model only sees `pref_name` in the tool schema - `preferences` is *not* included in the request. + + +**Updating state:** + +Use `Command` to update the agent's state or control the graph's execution flow: + +```python wrap +from langgraph.types import Command +from langchain.messages import RemoveMessage +from langgraph.graph.message import REMOVE_ALL_MESSAGES +from langchain.tools import tool, InjectedToolCallId +from typing_extensions import Annotated + +# Update the conversation history by removing all messages +@tool +def clear_conversation() -> Command: + """Clear the conversation history.""" + + return Command( + update={ + "messages": [RemoveMessage(id=REMOVE_ALL_MESSAGES)], } + ) - @dataclass - class UserContext: - user_id: str - - @tool - def get_account_info() -> str: - """Get the current user's account information.""" - runtime = get_runtime(UserContext) - user_id = runtime.context.user_id - - if user_id in USER_DATABASE: - user = USER_DATABASE[user_id] - return f"Account holder: {user['name']}\nType: {user['account_type']}\nBalance: ${user['balance']}" - return "User not found" - - model = ChatOpenAI(model="gpt-4o") - agent = create_agent( - model, - tools=[get_account_info], - context_schema=UserContext, - system_prompt="You are a financial assistant." 
- ) +# Update the user_name in the agent state +@tool +def update_user_name( + new_name: str, + tool_call_id: Annotated[dict, InjectedToolCallId] +) -> Command: + """Update the user's name.""" + return Command(update={"user_name": new_name}) +``` +::: - result = agent.invoke( - {"messages": [{"role": "user", "content": "What's my current balance?"}]}, - context=UserContext(user_id="user123") - ) - ``` - ::: - :::js - Tools can access an agent's runtime context through the `config` parameter: - - ```ts wrap - import { z } from "zod" - import { ChatOpenAI } from "@langchain/openai" - import { createAgent } from "langchain" - - const getUserName = tool( - (_, config) => { - return config.context.user_name - }, - { - name: "get_user_name", - description: "Get the user's name.", - schema: z.object({}), - } - ); - - const contextSchema = z.object({ - user_name: z.string(), - }); - - const agent = createAgent({ - model: new ChatOpenAI({ model: "gpt-4o" }), - tools: [getUserName], - contextSchema, - }); - - const result = await agent.invoke( - { - messages: [{ role: "user", content: "What is my name?" }] - }, - { - context: { user_name: "John Smith" } - } - ); - ``` - ::: - - - - - **`store`**: LangChain's persistence layer. An agent's long-term memory store, e.g. user-specific or application-specific data stored across conversations. - - - :::python - Tools can access an agent's store through `get_store`: - - ```python wrap - from langgraph.config import get_store - - @tool - def get_user_info(user_id: str) -> str: - """Look up user info.""" - store = get_store() - user_info = store.get(("users",), user_id) - return str(user_info.value) if user_info else "Unknown user" - ``` - ::: - :::js - You can initialize an `InMemoryStore` to store long-term memory: - - ```ts wrap - import { z } from "zod"; - import { createAgent, InMemoryStore } from "langchain"; - import { ChatOpenAI } from "@langchain/openai"; - - const store = new InMemoryStore(); - - const getUserInfo = tool( - ({ user_id }) => { - return store.get(["users"], user_id) - }, - { - name: "get_user_info", - description: "Look up user info.", - schema: z.object({ - user_id: z.string(), - }), - } - ); - - const agent = createAgent({ - model: new ChatOpenAI({ model: "gpt-4o" }), - tools: [getUserInfo], - store, - }); - ``` - ::: - - - - To update long-term memory, you can use the `.put()` method of `InMemoryStore`. A complete example of persistent memory across sessions: - - :::python - - ```python wrap expandable - from typing import Any - from langgraph.config import get_store - from langgraph.store.memory import InMemoryStore - from langchain.agents import create_agent - from langchain.tools import tool - - @tool - def get_user_info(user_id: str) -> str: - """Look up user info.""" - store = get_store() - user_info = store.get(("users",), user_id) - return str(user_info.value) if user_info else "Unknown user" - - @tool - def save_user_info(user_id: str, user_info: dict[str, Any]) -> str: - """Save user info.""" - store = get_store() - store.put(("users",), user_id, user_info) - return "Successfully saved user info." - - store = InMemoryStore() - agent = create_agent( - model, - tools=[get_user_info, save_user_info], - store=store - ) +### Runtime + +Use `get_runtime()` to access immutable configuration, context, memory (store), and streaming capabilities. The runtime provides access to data that persists across the agent's execution. 
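+
+As a quick orientation, a tool typically grabs the runtime once and reads whichever of these it needs. The tool below is purely illustrative; each attribute is covered in the subsections that follow:
+
+:::python
+```python wrap
+from langchain.tools import tool
+from langgraph.runtime import get_runtime
+
+@tool
+def inspect_runtime() -> str:
+    """Report which runtime capabilities are available (illustrative only)."""
+    runtime = get_runtime()
+
+    context = runtime.context          # immutable, caller-supplied context (may be None)
+    store = runtime.store              # long-term memory store, if one was configured
+    writer = runtime.stream_writer     # emits custom stream updates
+
+    writer("inspecting runtime")
+    return f"context={context!r}, store configured={store is not None}"
+```
+:::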
+
+#### Context
+
+Access immutable configuration and contextual data like user IDs, session details, or application-specific configuration.
+
+:::python
+Tools can access runtime context through `get_runtime()`:
+
+```python wrap
+from dataclasses import dataclass
+from langchain_openai import ChatOpenAI
+from langchain.agents import create_agent
+from langchain.tools import tool
+from langgraph.runtime import get_runtime
+
+USER_DATABASE = {
+    "user123": {
+        "name": "Alice Johnson",
+        "account_type": "Premium",
+        "balance": 5000,
+        "email": "alice@example.com"
+    },
+    "user456": {
+        "name": "Bob Smith",
+        "account_type": "Standard",
+        "balance": 1200,
+        "email": "bob@example.com"
+    }
+}
+
+@dataclass
+class UserContext:
+    user_id: str
+
+@tool
+def get_account_info() -> str:
+    """Get the current user's account information."""
+    runtime = get_runtime(UserContext)
+    user_id = runtime.context.user_id
+
+    if user_id in USER_DATABASE:
+        user = USER_DATABASE[user_id]
+        return f"Account holder: {user['name']}\nType: {user['account_type']}\nBalance: ${user['balance']}"
+    return "User not found"
+
+model = ChatOpenAI(model="gpt-4o")
+agent = create_agent(
+    model,
+    tools=[get_account_info],
+    context_schema=UserContext,
+    system_prompt="You are a financial assistant."
+)
+
+result = agent.invoke(
+    {"messages": [{"role": "user", "content": "What's my current balance?"}]},
+    context=UserContext(user_id="user123")
+)
+```
+:::
+
+:::js
+Tools can access an agent's runtime context through the `config` parameter:
+
+```ts wrap
+import { z } from "zod"
+import { ChatOpenAI } from "@langchain/openai"
+import { createAgent, tool } from "langchain"
+
+const getUserName = tool(
+  (_, config) => {
+    return config.context.user_name
+  },
+  {
+    name: "get_user_name",
+    description: "Get the user's name.",
+    schema: z.object({}),
+  }
+);
+
+const contextSchema = z.object({
+  user_name: z.string(),
+});
+
+const agent = createAgent({
+  model: new ChatOpenAI({ model: "gpt-4o" }),
+  tools: [getUserName],
+  contextSchema,
+});
+
+const result = await agent.invoke(
+  {
+    messages: [{ role: "user", content: "What is my name?" }]
+  },
+  {
+    context: { user_name: "John Smith" }
+  }
+);
+```
+:::
+
+#### Memory (Store)
+
+Access persistent data across conversations using the store. The store is accessed via `get_runtime().store` and allows you to save and retrieve user-specific or application-specific data.
+
+:::python
+Tools can access and update the store through `get_runtime().store`:
+
+```python wrap expandable
+from typing import Any
+from langgraph.runtime import get_runtime
+from langgraph.store.memory import InMemoryStore
+from langchain.agents import create_agent
+from langchain.tools import tool
+
+# Access memory
+@tool
+def get_user_info(user_id: str) -> str:
+    """Look up user info."""
+    store = get_runtime().store
+    user_info = store.get(("users",), user_id)
+    return str(user_info.value) if user_info else "Unknown user"
+
+# Update memory
+@tool
+def save_user_info(user_id: str, user_info: dict[str, Any]) -> str:
+    """Save user info."""
+    store = get_runtime().store
+    store.put(("users",), user_id, user_info)
+    return "Successfully saved user info."
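+
+# Note: ("users",) is the store namespace; item keys such as `user_id` are scoped within it.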
+ +store = InMemoryStore() +agent = create_agent( + model, + tools=[get_user_info, save_user_info], + store=store +) + +# First session: save user info +agent.invoke({ + "messages": [{"role": "user", "content": "Save the following user: userid: abc123, name: Foo, age: 25, email: foo@langchain.dev"}] +}) + +# Second session: get user info +agent.invoke({ + "messages": [{"role": "user", "content": "Get user info for user with id 'abc123'"}] +}) +# Here is the user info for user with ID "abc123": +# - Name: Foo +# - Age: 25 +# - Email: foo@langchain.dev +``` +::: + +:::js +```ts wrap expandable +import { z } from "zod"; +import { createAgent, tool } from "langchain"; +import { InMemoryStore } from "@langchain/langgraph"; +import { ChatOpenAI } from "@langchain/openai"; + +const store = new InMemoryStore(); + +// Access memory +const getUserInfo = tool( + async ({ user_id }) => { + const value = await store.get(["users"], user_id); + console.log("get_user_info", user_id, value); + return value; + }, + { + name: "get_user_info", + description: "Look up user info.", + schema: z.object({ + user_id: z.string(), + }), + } +); + +// Update memory +const saveUserInfo = tool( + async ({ user_id, name, age, email }) => { + console.log("save_user_info", user_id, name, age, email); + await store.put(["users"], user_id, { name, age, email }); + return "Successfully saved user info."; + }, + { + name: "save_user_info", + description: "Save user info.", + schema: z.object({ + user_id: z.string(), + name: z.string(), + age: z.number(), + email: z.string(), + }), + } +); + +const agent = createAgent({ + llm: new ChatOpenAI({ model: "gpt-4o" }), + tools: [getUserInfo, saveUserInfo], + store, +}); + +// First session: save user info +await agent.invoke({ + messages: [ + { + role: "user", + content: "Save the following user: userid: abc123, name: Foo, age: 25, email: foo@langchain.dev", + }, + ], +}); + +// Second session: get user info +const result = await agent.invoke({ + messages: [ + { role: "user", content: "Get user info for user with id 'abc123'" }, + ], +}); + +console.log(result); +// Here is the user info for user with ID "abc123": +// - Name: Foo +// - Age: 25 +// - Email: foo@langchain.dev +``` +::: + +#### Stream Writer + +Stream custom updates from tools as they execute using `get_runtime().stream_writer`. This is useful for providing real-time feedback to users about what a tool is doing. + +:::python +```python wrap +from langchain.tools import tool +from langgraph.runtime import get_runtime + +@tool +def get_weather(city: str) -> str: + """Get weather for a given city.""" + writer = get_runtime().stream_writer + + # Stream custom updates as the tool executes + writer(f"Looking up data for city: {city}") + writer(f"Acquired data for city: {city}") + + return f"It's always sunny in {city}!" +``` + + +If you use `get_runtime().stream_writer` inside your tool, the tool must be invoked within a LangGraph execution context. See [Streaming](/oss/langchain/streaming) for more details. 
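+
+To surface these updates on the consumer side, the agent can be streamed with the custom stream mode (a brief sketch; see [Streaming](/oss/langchain/streaming) for the full API):
+
+```python wrap
+# Assumes `agent` was created with the `get_weather` tool above
+for chunk in agent.stream(
+    {"messages": [{"role": "user", "content": "What's the weather in Boston?"}]},
+    stream_mode="custom",
+):
+    print(chunk)  # e.g. "Looking up data for city: Boston"
+```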
+ +::: + +:::js +```ts wrap +import { z } from "zod"; +import { tool } from "langchain"; + +const getWeather = tool( + ({ city }, config) => { + const writer = config.streamWriter; + + // Stream custom updates as the tool executes + writer(`Looking up data for city: ${city}`); + writer(`Acquired data for city: ${city}`); + + return `It's always sunny in ${city}!`; + }, + { + name: "get_weather", + description: "Get weather for a given city.", + schema: z.object({ + city: z.string(), + }), + } +); +``` +::: - # First session: save user info - agent.invoke({ - "messages": [{"role": "user", "content": "Save the following user: userid: abc123, name: Foo, age: 25, email: foo@langchain.dev"}] - }) - - # Second session: get user info - agent.invoke({ - "messages": [{"role": "user", "content": "Get user info for user with id 'abc123'"}] - }) - # Here is the user info for user with ID "abc123": - # - Name: Foo - # - Age: 25 - # - Email: foo@langchain.dev - ``` - ::: - - :::js - - ```ts wrap expandable - import { z } from "zod"; - import { createAgent, tool } from "langchain"; - import { InMemoryStore } from "@langchain/langgraph"; - import { ChatOpenAI } from "@langchain/openai"; - - const store = new InMemoryStore(); - - const getUserInfo = tool( - async ({ user_id }) => { - const value = await store.get(["users"], user_id); - console.log("get_user_info", user_id, value); - return value; - }, - { - name: "get_user_info", - description: "Look up user info.", - schema: z.object({ - user_id: z.string(), - }), - } - ); - - const saveUserInfo = tool( - async ({ user_id, name, age, email }) => { - console.log("save_user_info", user_id, name, age, email); - await store.put(["users"], user_id, { name, age, email }); - return "Successfully saved user info."; - }, - { - name: "save_user_info", - description: "Save user info.", - schema: z.object({ - user_id: z.string(), - name: z.string(), - age: z.number(), - email: z.string(), - }), - } - ); - - const agent = createAgent({ - llm: new ChatOpenAI({ model: "gpt-4o" }), - tools: [getUserInfo, saveUserInfo], - store, - }); - - // First session: save user info - await agent.invoke({ - messages: [ - { - role: "user", - content: "Save the following user: userid: abc123, name: Foo, age: 25, email: foo@langchain.dev", - }, - ], - }); - - // Second session: get user info - const result = await agent.invoke({ - messages: [ - { role: "user", content: "Get user info for user with id 'abc123'" }, - ], - }); - - console.log(result); - // Here is the user info for user with ID "abc123": - // - Name: Foo - // - Age: 25 - // - Email: foo@langchain.dev - ``` - ::: - -