From fe351be876dfb4efec9d9a08f13d1349d76d674d Mon Sep 17 00:00:00 2001
From: Om Gupta <omgupta0720@gmail.com>
Date: Sun, 3 May 2026 16:05:10 +0530
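Subject: [PATCH 1/3] clarify web search action labels

Tool names are normalized (prefix up to the first ':' stripped) before
label, favicon, target and meta lookup, and exa_answer /
parallel_research are treated as search tools.

Also in this patch: GroupChip keeps following `defaultOpen` until the
user toggles it manually, and MessageList tracks bottom-stickiness in a
ref so it jumps back to the bottom when the window becomes visible or
regains focus.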
---
 .../src/components/chat/ActionsGroup.tsx      | 126 +++++++++++++++---
 .../src/components/chat/MessageList.tsx       |  20 ++-
 2 files changed, 120 insertions(+), 26 deletions(-)

diff --git a/packages/desktop/src/components/chat/ActionsGroup.tsx b/packages/desktop/src/components/chat/ActionsGroup.tsx
index 2756329e..9f3f6521 100644
--- a/packages/desktop/src/components/chat/ActionsGroup.tsx
+++ b/packages/desktop/src/components/chat/ActionsGroup.tsx
@@ -1,30 +1,45 @@
 import { AnimatePresence, motion } from 'framer-motion'
 import { Brain, ChevronRight, Code, PanelRight, Workflow } from 'lucide-react'
 import type { ReactNode } from 'react'
-import { useEffect, useMemo, useState } from 'react'
+import { useEffect, useMemo, useRef, useState } from 'react'
 import { artifactStore } from '../../lib/store/artifactStore.js'
 import { parseCitationSources } from '../../lib/store/handlers/citationParser.js'
 import { ArtifactCard } from './ArtifactCard.js'
 import { SourceCards } from './SourceCards.js'
 import type { ToolAction } from './groupMessages.js'
 
-const SEARCH_TOOLS = new Set(['web_search', 'exa_search', 'exa_find_similar', 'web_research'])
+const SEARCH_TOOLS = new Set([
+  'web_search',
+  'exa_search',
+  'exa_answer',
+  'exa_find_similar',
+  'web_research',
+  'parallel_research',
+])
 
 // ── Tool type labels & helpers ─────────────────────────────────────
 
 /** Get a favicon URL for tools that interact with external URLs (free, no API key) */
 function getToolFavicon(toolName: string, toolInput?: Record<string, unknown>): string | null {
-  if (toolName === 'exa_search' || toolName === 'exa_find_similar') {
+  const normalizedToolName = normalizeToolName(toolName)
+  if (
+    normalizedToolName === 'exa_search' ||
+    normalizedToolName === 'exa_find_similar' ||
+    normalizedToolName === 'exa_answer'
+  ) {
     return 'https://www.google.com/s2/favicons?domain=exa.ai&sz=16'
   }
-  if (toolName === 'web_search') {
+  if (normalizedToolName === 'web_search') {
     return 'https://www.google.com/s2/favicons?domain=google.com&sz=16'
   }
+  if (normalizedToolName === 'web_research' || normalizedToolName === 'parallel_research') {
+    return 'https://www.google.com/s2/favicons?domain=parallel.ai&sz=16'
+  }
   if (!toolInput) return null
   let url: string | null = null
-  if (toolName === 'browser') url = toolInput.url as string
-  else if (toolName === 'network') url = (toolInput.url || toolInput.host) as string
-  else if (toolName === 'http_api') url = toolInput.url as string
+  if (normalizedToolName === 'browser') url = toolInput.url as string
+  else if (normalizedToolName === 'network') url = (toolInput.url || toolInput.host) as string
+  else if (normalizedToolName === 'http_api') url = toolInput.url as string
   if (!url) return null
   try {
     const hostname = new URL(url.startsWith('http') ? url : `https://${url}`).hostname
@@ -36,7 +51,8 @@ function getToolFavicon(toolName: string, toolInput?: Record<string, unknown>):
 
 /** Get a short, bold tool type label (like Claude Code's "Read", "Edit", "Shell") */
 function getToolTypeLabel(toolName: string, toolInput?: Record<string, unknown>): string {
-  switch (toolName) {
+  const normalizedToolName = normalizeToolName(toolName)
+  switch (normalizedToolName) {
     case 'shell':
       return 'Shell'
     case 'filesystem': {
@@ -78,11 +94,15 @@ function getToolTypeLabel(toolName: string, toolInput?: Record<string, unknown>)
     case 'sub_agent':
       return 'Agent'
     case 'web_search':
-      return 'Search'
+      return 'Web Search'
     case 'exa_search':
-      return 'Search'
+      return 'Web Search'
+    case 'exa_answer':
+      return 'Web Answer'
     case 'web_research':
-      return 'Research'
+      return 'Web Research'
+    case 'parallel_research':
+      return 'Web Research'
     case 'exa_find_similar':
       return 'Similar'
     default:
@@ -104,10 +124,62 @@ function formatMcpToolName(toolName: string): string {
     .join(' ')
 }
 
+/** Returns the part of `toolName` after its first ':'; names without ':' come back unchanged. */
+function normalizeToolName(toolName: string): string {
+  return toolName.includes(':') ? toolName.slice(toolName.indexOf(':') + 1) : toolName
+}
+
+/** Returns the first argument that is a non-blank string, with surrounding whitespace removed. */
+function getFirstString(...values: unknown[]): string | null {
+  const firstText = values.find((v): v is string => typeof v === 'string' && v.trim() !== '')
+  // `find` yields undefined when nothing matched; this function reports that as null.
+  return firstText === undefined ? null : firstText.trim()
+}
+
+/** Pulls the query text out of a search tool's input; `null` when no usable text is present. */
+function getSearchQuery(toolInput?: Record<string, unknown>): string | null {
+  if (!toolInput) return null
+
+  // Single-string fields win, checked in this order; blank or non-string values are skipped.
+  const directQuery = getFirstString(
+    toolInput.query,
+    toolInput.q,
+    toolInput.question,
+    toolInput.objective,
+    toolInput.prompt,
+  )
+  if (directQuery) return directQuery
+
+  // Take the first key that really holds an array: a bare `??` chain stops at the first
+  // non-nullish value, so a non-array under one key would hide an array under a later key.
+  const searchQueries = [toolInput.search_query, toolInput.searchQuery, toolInput.queries].find(
+    (candidate) => Array.isArray(candidate),
+  )
+  if (!Array.isArray(searchQueries)) return null
+
+  const queries = searchQueries
+    .map((entry) => {
+      if (typeof entry === 'string') return entry.trim()
+      if (entry === null || typeof entry !== 'object') return null
+      const record = entry as Record<string, unknown>
+      return getFirstString(record.q, record.query)
+    })
+    .filter((query): query is string => Boolean(query))
+  // Entries may be plain strings or `{ q }` / `{ query }` objects; blanks were dropped above.
+  return queries.length > 0 ? queries.join(' | ') : null
+}
+
+/** Collapse whitespace, cap at `maxLength` chars (ellipsis included), wrap in double quotes. */
+function formatQuotedTarget(value: string, maxLength = 60): string {
+  const flat = value.replace(/\s+/g, ' ').trim()
+  return flat.length > maxLength ? `"${flat.slice(0, maxLength - 3)}..."` : `"${flat}"`
+}
+
 /** Get the target/description shown after the type label (in code-styled pill) */
 function getToolTarget(toolName: string, toolInput?: Record<string, unknown>): string | null {
   if (!toolInput) return null
-  switch (toolName) {
+  const normalizedToolName = normalizeToolName(toolName)
+  switch (normalizedToolName) {
     case 'shell': {
       const cmd = (toolInput.command as string) || ''
       return cmd.length > 80 ? `${cmd.slice(0, 77)}...` : cmd
@@ -147,7 +219,7 @@ function getToolTarget(toolName: string, toolInput?: Record<string, unknown>): s
     }
     case 'code_search': {
       const query = (toolInput.query as string) || ''
-      return query ? `"${query.slice(0, 50)}"` : null
+      return query ? formatQuotedTarget(query, 50) : null
     }
     case 'http_api': {
       const method = (toolInput.method as string) || 'GET'
@@ -175,11 +247,12 @@ function getToolTarget(toolName: string, toolInput?: Record<string, unknown>): s
       return (toolInput.task as string) || null
     case 'web_search':
     case 'exa_search':
+    case 'exa_answer':
+    case 'parallel_research':
     case 'web_research': {
-      const query = (toolInput.query as string) || ''
+      const query = getSearchQuery(toolInput) || ''
       if (!query) return null
-      const trimmed = query.length > 60 ? `${query.slice(0, 57)}...` : query
-      return `"${trimmed}"`
+      return formatQuotedTarget(query)
     }
     case 'exa_find_similar': {
       const url = (toolInput.url as string) || ''
@@ -208,7 +281,8 @@ function getToolMeta(
   }
   if (!resultContent) return null
 
-  switch (toolName) {
+  const normalizedToolName = normalizeToolName(toolName)
+  switch (normalizedToolName) {
     case 'filesystem': {
       const op = toolInput?.operation as string
       if (op === 'read') {
@@ -238,8 +312,10 @@ function getToolMeta(
     }
     case 'web_search':
     case 'exa_search':
+    case 'exa_answer':
     case 'exa_find_similar':
-    case 'web_research': {
+    case 'web_research':
+    case 'parallel_research': {
       const resultMatches = resultContent.match(/\burl\b/gi)
       if (resultMatches && resultMatches.length > 0) {
         const count = resultMatches.length
@@ -309,7 +385,7 @@ function ActionChip({ action }: ActionChipProps) {
   const [showFullResult, setShowFullResult] = useState(false)
   const displayedResult = showFullResult ? resultContent : resultLines.slice(0, 6).join('\n')
 
-  const isSearchTool = SEARCH_TOOLS.has(toolName)
+  const isSearchTool = SEARCH_TOOLS.has(normalizeToolName(toolName))
   const searchSources = useMemo(
     () => (isSearchTool && resultContent && !isError ? parseCitationSources(resultContent) : []),
     [isSearchTool, resultContent, isError],
@@ -426,12 +502,20 @@ function GroupChip({
   errorCount = 0,
 }: GroupChipProps) {
   const [open, setOpen] = useState(defaultOpen)
+  const userToggledRef = useRef(false)
   useEffect(() => {
-    if (defaultOpen) setOpen(true)
+    if (!userToggledRef.current) setOpen(defaultOpen)
   }, [defaultOpen])
   return (
     <div className={`conv-chip has-children${open ? ' open' : ''}`}>
-      <button type="button" className="conv-chip__row" onClick={() => setOpen((o) => !o)}>
+      <button
+        type="button"
+        className="conv-chip__row"
+        onClick={() => {
+          userToggledRef.current = true
+          setOpen((o) => !o)
+        }}
+      >
         <IconComp size={13} strokeWidth={1.5} className="conv-chip__icon" />
         <span className="conv-chip__label">{label}</span>
         {errorCount > 0 && <span className="conv-chip__error-badge">{errorCount} failed</span>}
diff --git a/packages/desktop/src/components/chat/MessageList.tsx b/packages/desktop/src/components/chat/MessageList.tsx
index 36c0f8fa..7ec62ff4 100644
--- a/packages/desktop/src/components/chat/MessageList.tsx
+++ b/packages/desktop/src/components/chat/MessageList.tsx
@@ -162,6 +162,7 @@ export function MessageList({ messages }: Props) {
   const prevScrollHeightRef = useRef(0)
 
   const prevMsgCountRef = useRef(0)
+  const stickToBottomRef = useRef(true)
 
   const scrollToBottom = useCallback((instant?: boolean) => {
     bottomRef.current?.scrollIntoView({ behavior: instant ? 'instant' : 'smooth' })
@@ -200,10 +201,8 @@ export function MessageList({ messages }: Props) {
       return
     }
 
-    const isNearBottom = container.scrollHeight - container.scrollTop - container.clientHeight < 100
-
-    if (isNearBottom) {
-      scrollToBottom()
+    if (stickToBottomRef.current) {
+      scrollToBottom(typeof document !== 'undefined' && document.hidden)
     }
   }, [messages, scrollToBottom])
 
@@ -215,6 +214,7 @@ export function MessageList({ messages }: Props) {
     const checkScroll = () => {
       const distFromBottom = container.scrollHeight - container.scrollTop - container.clientHeight
       setShowScrollBtn(distFromBottom > 200)
+      stickToBottomRef.current = distFromBottom < 100
 
       // Trigger loading older messages when scrolled near the top
       if (container.scrollTop < 80 && hasMore && !isLoadingOlder && activeSessionId) {
@@ -231,11 +231,21 @@ export function MessageList({ messages }: Props) {
       observer.observe(child)
     }
 
+    const onVisible = () => {
+      if (!document.hidden && stickToBottomRef.current) {
+        scrollToBottom(true)
+      }
+    }
+    document.addEventListener('visibilitychange', onVisible)
+    window.addEventListener('focus', onVisible)
+
     return () => {
       container.removeEventListener('scroll', checkScroll)
       observer.disconnect()
+      document.removeEventListener('visibilitychange', onVisible)
+      window.removeEventListener('focus', onVisible)
     }
-  }, [hasMore, isLoadingOlder, activeSessionId])
+  }, [hasMore, isLoadingOlder, activeSessionId, scrollToBottom])
 
   // Maintain scroll position when older messages are prepended
   // biome-ignore lint/correctness/useExhaustiveDependencies: messages.length triggers scroll position restore

From 53f851e2072969f565089eb1f7d2eef7e45e5f17 Mon Sep 17 00:00:00 2001
From: Om Gupta <omgupta0720@gmail.com>
Date: Sun, 3 May 2026 16:08:16 +0530
Subject: [PATCH 2/3] add ContextBreakdown protocol + per-layer size accounting

Lay the protocol + sizing groundwork for the composer Context gauge:
ContextBreakdown / AiContextUpdateMessage on the wire, and
SessionPromptLayerSizes + emptyPromptLayerSizes() so the Pi-SDK path
can report per-layer char budgets without re-running layer builders.

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
---
 packages/agent-core/src/prompt-layers.ts | 43 ++++++++++++++++++++++++
 packages/protocol/src/messages.ts        | 37 ++++++++++++++++++++
 2 files changed, 80 insertions(+)

diff --git a/packages/agent-core/src/prompt-layers.ts b/packages/agent-core/src/prompt-layers.ts
index da9cf332..135f35e3 100644
--- a/packages/agent-core/src/prompt-layers.ts
+++ b/packages/agent-core/src/prompt-layers.ts
@@ -713,6 +713,49 @@ Your native tools (filesystem, shell, code editing, git, web search, etc.) remai
   )
 }
 
+// ── Per-layer size accounting (for the Context gauge popover) ──────
+
+/**
+ * Char-budget breakdown of every layer that contributes to a Pi-SDK
+ * session's prompt. Returned alongside the assembled string so the
+ * server can populate `ContextBreakdown` without re-running the layer
+ * builders. Char counts get divided by 4 at the call site to estimate
+ * tokens — same heuristic as `estimateMessageTokens` in compaction.ts.
+ */
+export interface SessionPromptLayerSizes {
+  identity: number
+  workspaceRules: number
+  userRules: number
+  currentContext: number
+  surface: number
+  memory: number
+  projectMemoryInstructions: number
+  agentContext: number
+  connectors: number
+  projectTypeGuidelines: number
+  referenceKnowledge: number
+  skills: number
+  workflows: number
+}
+
+export function emptyPromptLayerSizes(): SessionPromptLayerSizes {
+  return {
+    identity: 0,
+    workspaceRules: 0,
+    userRules: 0,
+    currentContext: 0,
+    surface: 0,
+    memory: 0,
+    projectMemoryInstructions: 0,
+    agentContext: 0,
+    connectors: 0,
+    projectTypeGuidelines: 0,
+    referenceKnowledge: 0,
+    skills: 0,
+    workflows: 0,
+  }
+}
+
 // ── High-level entry point ──────────────────────────────────────────
 
 export interface HarnessContextPromptOpts {
diff --git a/packages/protocol/src/messages.ts b/packages/protocol/src/messages.ts
index 41282f89..cda796d0 100644
--- a/packages/protocol/src/messages.ts
+++ b/packages/protocol/src/messages.ts
@@ -696,6 +696,42 @@ export interface AiTokenUpdateMessage {
   sessionId?: string
 }
 
+/**
+ * Per-category breakdown of a session's prompt budget. Drives the in-composer
+ * Context gauge + popover: Pi-SDK sessions report the full breakdown, harness
+ * sessions populate `messages` + `contextWindow` only and leave the rest at 0.
+ *
+ * `freeSpace` is derived on the client as
+ *   contextWindow − (systemPrompt + systemTools + mcpTools + skills
+ *                    + memoryFiles + messages + autocompactBuffer)
+ */
+export interface ContextBreakdown {
+  /** Model context window — max tokens the model accepts. */
+  contextWindow: number
+  /** Identity + workspace/user rules + current context + project + agent context. */
+  systemPrompt: number
+  /** Built-in tool schemas (shell, read/write/edit, glob, grep, web_search, etc.). */
+  systemTools: number
+  /** MCP server tool schemas + direct OAuth connector tools. */
+  mcpTools: number
+  /** Active Skills layer (catalog + auto-loaded skill bodies). */
+  skills: number
+  /** Memory layer (global + conversation + cross-conversation). */
+  memoryFiles: number
+  /** Conversation history (user + assistant + tool-result messages). */
+  messages: number
+  /** Reserved for autocompaction headroom — `contextWindow * (1 − threshold)`. */
+  autocompactBuffer: number
+  /** Pi SDK = full breakdown. Harness = messages-only fallback. */
+  source: 'pi-sdk' | 'harness'
+}
+
+export interface AiContextUpdateMessage {
+  type: 'context_update'
+  sessionId?: string
+  breakdown: ContextBreakdown
+}
+
 export interface AiTextReplaceMessage {
   type: 'text_replace'
   sessionId?: string
@@ -1514,6 +1550,7 @@ export type AiMessage =
   | AiArtifactMessage
   | AiTasksUpdateMessage
   | AiTokenUpdateMessage
+  | AiContextUpdateMessage
   | AiTextReplaceMessage
   | AiDoneMessage
   | AiErrorMessage

From 2afa64c00f605a1c7980c49e46f9fc99156cad0b Mon Sep 17 00:00:00 2001
From: Om Gupta <omgupta0720@gmail.com>
Date: Mon, 4 May 2026 14:17:31 +0530
Subject: [PATCH 3/3] feat(chat): composer Context gauge + popover with
 calibrated breakdown

In-composer circular gauge plus floating popover with per-category
token usage (System prompt, System tools, MCP tools, Skills, Memory
files, Messages, Autocompact buffer, Free space). Pi-SDK sessions
report the full split; harness sessions report Messages + Free space.

Wires breakdown emission on session_created, every turn_end, model
switch, connector refresh, conversation-context load, and surface
change. Calibrates char/4 estimates against the model's reported
input_tokens via a pre-turn snapshot captured at turn_start, with
the resulting scale factor persisted in PersistedSession so resumed
sessions keep their calibration. Codex harness emits per-turn
last.inputTokens (not the cumulative total) capped at the model
context window.

Replaces the old memory-count ContextIndicator badge; the
"View memory details" link in the popover footer keeps the side
panel reachable from the composer.

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
---
 packages/agent-config/src/config.ts           |   7 +
 packages/agent-core/src/agent.ts              |  94 +++++++
 .../src/harness/codex-harness-session.ts      |  35 +++
 packages/agent-core/src/session.ts            | 255 ++++++++++++++++--
 packages/agent-server/src/server.ts           |  61 ++++-
 .../desktop/src/components/RoutineChat.tsx    |   2 -
 .../desktop/src/components/chat/ChatInput.tsx |   2 +
 .../src/components/chat/ContextGauge.tsx      | 120 +++++++++
 .../src/components/chat/ContextIndicator.tsx  |  40 ---
 .../src/components/chat/ContextPopover.tsx    | 240 +++++++++++++++++
 packages/desktop/src/index.css                | 171 ++++++++++--
 .../lib/store/handlers/interactionHandler.ts  |   8 +
 .../desktop/src/lib/store/sessionStore.ts     |   7 +
 specs/features/ui/CONTEXT_GAUGE.md            | 113 ++++++++
 specs/features/ui/CONTEXT_GAUGE_BLUNDERS.md   | 203 ++++++++++++++
 15 files changed, 1277 insertions(+), 81 deletions(-)
 create mode 100644 packages/desktop/src/components/chat/ContextGauge.tsx
 delete mode 100644 packages/desktop/src/components/chat/ContextIndicator.tsx
 create mode 100644 packages/desktop/src/components/chat/ContextPopover.tsx
 create mode 100644 specs/features/ui/CONTEXT_GAUGE.md
 create mode 100644 specs/features/ui/CONTEXT_GAUGE_BLUNDERS.md

diff --git a/packages/agent-config/src/config.ts b/packages/agent-config/src/config.ts
index 4eaecc1b..4ddda91b 100644
--- a/packages/agent-config/src/config.ts
+++ b/packages/agent-config/src/config.ts
@@ -136,6 +136,13 @@ export interface PersistedSession {
     cacheReadTokens: number
     cacheWriteTokens: number
   }
+  /**
+   * Calibration factor for the in-composer Context gauge — actual
+   * `input_tokens` / pre-turn estimate from the most recent completed
+   * turn. Persisted so a resumed session keeps its calibration instead
+   * of starting from 1.0 again.
+   */
+  contextEstimateScale?: number
 }
 
 // ── Main config ─────────────────────────────────────────────────────
diff --git a/packages/agent-core/src/agent.ts b/packages/agent-core/src/agent.ts
index 7fa1400a..d17443e1 100644
--- a/packages/agent-core/src/agent.ts
+++ b/packages/agent-core/src/agent.ts
@@ -228,6 +228,100 @@ export interface ToolCallbacks {
   getParentForkContext?: () => ParentForkContext | undefined
 }
 
+/**
+ * Names of every tool registered by `buildTools` itself (i.e. not from
+ * MCP servers or OAuth connector managers). Used by `categorizeTools`
+ * to split a flattened tool list into "system" vs. "MCP/connector" for
+ * the Context gauge popover. Keep this in sync when adding/removing
+ * built-in tools above. New tools added to `buildAntonCoreTools` should
+ * also land here.
+ */
+export const BUILT_IN_TOOL_NAMES = new Set<string>([
+  // Filesystem + shell + git + http
+  'shell',
+  'read',
+  'write',
+  'edit',
+  'glob',
+  'list',
+  'grep',
+  'git',
+  'http_api',
+  // Browser + media
+  'browser',
+  'image',
+  'clipboard',
+  // Web (Anton-native)
+  'web_search',
+  'web_research',
+  // Task / planning
+  'todo',
+  'task_tracker',
+  'plan',
+  'ask_user',
+  'artifact',
+  // Sub-agent / routine
+  'sub_agent',
+  'spawn_sub_agent',
+  'shared_state',
+  'routine',
+  'deliver_result',
+  // Anton platform
+  'memory',
+  'notification',
+  'database',
+  'publish',
+  'skill',
+  'set_session_title',
+  'update_project_context',
+  'activate_workflow',
+  // Pi-SDK low-level (rarely surfaced but possible)
+  'filesystem',
+  'process',
+  'network',
+])
+
+export interface CategorizedToolSizes {
+  /** Built-in tool count. */
+  systemToolCount: number
+  /** MCP-server + direct-OAuth-connector tool count. */
+  mcpToolCount: number
+  /** Sum of `name + description + JSON.stringify(parameters)` lengths for built-ins. */
+  systemToolChars: number
+  /** Same, for MCP/connector tools. */
+  mcpToolChars: number
+}
+
+/**
+ * Partition a flat `AgentTool[]` into built-in tools (name listed in `BUILT_IN_TOOL_NAMES`) and
+ * everything else (counted as MCP/connector), tallying a tool count and char total per bucket.
+ */
+export function categorizeTools(tools: AgentTool[]): CategorizedToolSizes {
+  const sizes: CategorizedToolSizes = {
+    systemToolCount: 0,
+    mcpToolCount: 0,
+    systemToolChars: 0,
+    mcpToolChars: 0,
+  }
+  for (const { name, description, parameters } of tools) {
+    let schemaChars = 0
+    try {
+      schemaChars = JSON.stringify(parameters ?? {}).length
+    } catch {
+      // A schema that fails to serialize contributes zero chars instead of breaking the tally.
+    }
+    const chars = name.length + (description?.length ?? 0) + schemaChars
+    if (BUILT_IN_TOOL_NAMES.has(name)) {
+      sizes.systemToolCount += 1
+      sizes.systemToolChars += chars
+    } else {
+      sizes.mcpToolCount += 1
+      sizes.mcpToolChars += chars
+    }
+  }
+  return sizes
+}
+
 export function buildTools(
   config: AgentConfig,
   callbacks?: ToolCallbacks,
diff --git a/packages/agent-core/src/harness/codex-harness-session.ts b/packages/agent-core/src/harness/codex-harness-session.ts
index ce1f39df..ae91d57a 100644
--- a/packages/agent-core/src/harness/codex-harness-session.ts
+++ b/packages/agent-core/src/harness/codex-harness-session.ts
@@ -978,6 +978,7 @@ export class CodexHarnessSession {
               totalTokens?: number
             }
             last?: { inputTokens?: number; outputTokens?: number; cachedInputTokens?: number }
+            modelContextWindow?: number
           }
         }
       | undefined
@@ -1000,6 +1001,40 @@ export class CodexHarnessSession {
         cacheWriteTokens: 0,
       },
     })
+
+    // Drive the in-composer Context gauge for harness sessions. The
+    // harness CLI doesn't expose how its own prompt is split, so the
+    // popover renders a 2-row breakdown (Messages + Free space).
+    //
+    // Prefer `last.inputTokens` (per-turn input that just hit the model)
+    // over `total.inputTokens` for the gauge, because `total` is the
+    // SUM of input across every turn this thread (including cached
+    // tokens) — on long conversations it routinely exceeds the actual
+    // prompt size and would drive the gauge past 100%. Fall back to
+    // `total` only when `last` isn't reported.
+    const contextWindow = p?.tokenUsage?.modelContextWindow ?? 0
+    if (contextWindow > 0) {
+      const lastInput = p?.tokenUsage?.last?.inputTokens
+      const totalInput = p?.tokenUsage?.total?.inputTokens ?? 0
+      const messages = Math.min(
+        contextWindow,
+        typeof lastInput === 'number' && lastInput > 0 ? lastInput : totalInput,
+      )
+      this.emit({
+        type: 'context_update',
+        breakdown: {
+          contextWindow,
+          systemPrompt: 0,
+          systemTools: 0,
+          mcpTools: 0,
+          skills: 0,
+          memoryFiles: 0,
+          messages,
+          autocompactBuffer: 0,
+          source: 'harness',
+        },
+      })
+    }
   }
 
   private onCompacted() {
diff --git a/packages/agent-core/src/session.ts b/packages/agent-core/src/session.ts
index 40f339be..6b5c4f86 100644
--- a/packages/agent-core/src/session.ts
+++ b/packages/agent-core/src/session.ts
@@ -262,17 +262,25 @@ export function resolveModel(provider: string, modelId: string): Model<Api> | un
 
   return undefined
 }
-import { type AskUserHandler, CORE_SYSTEM_PROMPT, type ToolCallbacks, buildTools } from './agent.js'
+import {
+  type AskUserHandler,
+  CORE_SYSTEM_PROMPT,
+  type ToolCallbacks,
+  buildTools,
+  categorizeTools,
+} from './agent.js'
 import {
   type CompactionConfig,
   type CompactionState,
   compactContext,
   createInitialCompactionState,
+  estimateTokens,
   getDefaultCompactionConfig,
 } from './compaction.js'
 import { type ContextInfo, type MemoryData, assembleConversationContext } from './context.js'
 import {
   type LiveConnectorSummary,
+  type SessionPromptLayerSizes,
   buildActiveConnectorsLayer,
   buildActiveSkillsLayer,
   buildAgentContextLayer,
@@ -280,6 +288,7 @@ import {
   buildProjectMemoryInstructionsLayer,
   buildSurfaceLayer,
   buildWorkflowsLayer,
+  emptyPromptLayerSizes,
   systemReminder,
 } from './prompt-layers.js'
 import {
@@ -375,6 +384,7 @@ export type SessionEvent =
   | { type: 'sub_agent_progress'; toolCallId: string; content: string }
   | { type: 'tasks_update'; tasks: import('@anton/protocol').TaskItem[] }
   | { type: 'token_update'; usage: TokenUsage }
+  | { type: 'context_update'; breakdown: import('@anton/protocol').ContextBreakdown }
   | {
       type: 'browser_state'
       url: string
@@ -487,6 +497,20 @@ export class Session {
   private messageSpanIds: Map<string, string> = new Map()
   private static readonly MESSAGE_SPAN_CAP = 200
   private _promptVersion?: string // hash of assembled system prompt
+  // Char-count snapshot of every system-prompt layer from the most recent
+  // getSystemPrompt() call. Powers ContextBreakdown emission without
+  // re-running the layer builders. Empty until the first build.
+  private _lastLayerSizes: SessionPromptLayerSizes = emptyPromptLayerSizes()
+  // Calibration factor applied to estimated breakdowns: actual / estimated
+  // input tokens from the most recent completed turn. Defaults to 1.0
+  // (no calibration) until we have a real sample.
+  private _contextEstimateScale = 1.0
+  // Sum of the (already-scaled) breakdown categories captured at the
+  // most recent `turn_start`. Used to calibrate scale at `turn_end`
+  // against pre-turn state, not post-turn — pi-ai appends the assistant
+  // response to messages before turn_end fires, which would otherwise
+  // bias the calibration low.
+  private _preTurnEstimateSum: number | null = null
 
   // Safety limits
   private maxTokenBudget: number
@@ -541,6 +565,8 @@ export class Session {
     surface?: SurfaceInfo
     /** Override the computed system prompt (used by fork children to inherit parent's prompt). */
     systemPromptOverride?: string
+    /** Persisted Context-gauge calibration factor (resumed sessions only). */
+    contextEstimateScale?: number
   }) {
     this.id = opts.id
     this.log = withContext(baseLog, { sessionId: opts.id })
@@ -591,6 +617,9 @@ export class Session {
         configCompaction?.preserveRecentCount ?? defaultCompaction.preserveRecentCount,
     }
     this.compactionState = opts.compactionState || createInitialCompactionState()
+    if (typeof opts.contextEstimateScale === 'number' && opts.contextEstimateScale > 0) {
+      this._contextEstimateScale = Math.min(2.0, Math.max(0.5, opts.contextEstimateScale))
+    }
 
     // Runtime strings from config — cast to the SDK's nominal types
     const model = resolveModel(opts.provider, opts.model)
@@ -1396,6 +1425,20 @@ export class Session {
     return { ...this.cumulativeUsage }
   }
 
+  /**
+   * Push a fresh ContextBreakdown into the active event stream. No-op
+   * when no `processMessage` is in flight (between turns) — in that
+   * case the server is expected to read `getContextBreakdown()`
+   * directly and emit `context_update` to the client itself, since
+   * tools and prompt-layer changes between turns still need to refresh
+   * the gauge.
+   */
+  private pushContextUpdate(): void {
+    if (!this.pushEvent) return
+    const breakdown = this.getContextBreakdown()
+    if (breakdown) this.pushEvent({ type: 'context_update', breakdown })
+  }
+
   /**
    * Switch model mid-session. pi SDK handles this gracefully —
    * keeps all messages, next LLM call uses the new model.
@@ -1412,6 +1455,10 @@ export class Session {
     this.provider = provider
     this.model = model
     this.persist()
+    // Context window may have changed (e.g. opus 1M → sonnet 200k).
+    // Refresh the gauge immediately when a turn is active; otherwise
+    // the server emits explicitly at the call site.
+    this.pushContextUpdate()
   }
 
   /** Re-build the tools list and push it to the running agent — call after adding/removing a connector. */
@@ -1425,6 +1472,8 @@ export class Session {
     )
     this.piAgent.setTools(newTools)
     this.log.info({ toolCount: newTools.length }, 'refreshed tools')
+    // Tool schemas changed — gauge bytes shifted between system/MCP buckets.
+    this.pushContextUpdate()
   }
 
   /** Update connector prompt summaries after connector state changes. */
@@ -1913,6 +1962,8 @@ export class Session {
       compactionState: this.compactionState,
       lastTasks: this._lastTasks.length > 0 ? this._lastTasks : undefined,
       usage: this.cumulativeUsage.totalTokens > 0 ? this.getCumulativeUsage() : undefined,
+      contextEstimateScale:
+        this._contextEstimateScale !== 1.0 ? this._contextEstimateScale : undefined,
     }
     const basePath = this.projectId ? getProjectSessionsDir(this.projectId) : undefined
     saveSession(persisted, basePath)
@@ -1936,6 +1987,23 @@ export class Session {
         return []
       }
 
+      case 'turn_start': {
+        // Snapshot the pre-turn breakdown so calibration at turn_end
+        // compares against the prompt that was actually sent to the
+        // model — pi-ai appends the assistant response to messages
+        // BEFORE turn_end fires.
+        const pre = this.getContextBreakdown()
+        this._preTurnEstimateSum = pre
+          ? pre.systemPrompt +
+            pre.systemTools +
+            pre.mcpTools +
+            pre.skills +
+            pre.memoryFiles +
+            pre.messages
+          : null
+        return []
+      }
+
       case 'tool_execution_start':
         this.pendingToolCalls.set(piEvent.toolCallId, {
           name: piEvent.toolName,
@@ -2004,6 +2072,12 @@ export class Session {
           this.cumulativeUsage.totalTokens += this.lastTurnUsage.totalTokens
           this.cumulativeUsage.cacheReadTokens += this.lastTurnUsage.cacheReadTokens
           this.cumulativeUsage.cacheWriteTokens += this.lastTurnUsage.cacheWriteTokens
+          // Calibrate the breakdown estimate against the model's reported
+          // input_tokens — drifts toward reality across turns. Cheap math,
+          // bounded scaling factor.
+          if (this.lastTurnUsage.inputTokens > 0) {
+            this.updateContextEstimateScale(this.lastTurnUsage.inputTokens)
+          }
         }
         // Surface LLM errors (e.g. invalid API key, rate limits) that the pi SDK captures
         if (msg?.stopReason === 'error' && msg?.errorMessage) {
@@ -2013,6 +2087,13 @@ export class Session {
         const events: SessionEvent[] = [
           { type: 'token_update' as const, usage: this.getCumulativeUsage() },
         ]
+        // Emit ContextBreakdown right after every turn — the message
+        // history grew, calibration may have shifted, and skills/memory
+        // can change between turns. Server forwards this verbatim.
+        const breakdown = this.getContextBreakdown()
+        if (breakdown) {
+          events.push({ type: 'context_update' as const, breakdown })
+        }
         // If the LLM call failed, emit an error event so the client shows the real reason
         if (msg?.stopReason === 'error') {
           events.push({
@@ -2447,24 +2528,44 @@ export class Session {
   }
 
   private getSystemPrompt(): string {
-    // Fork children inherit the parent's fully-rendered system prompt
-    if (this.systemPromptOverride) return this.systemPromptOverride
+    // Fork children inherit the parent's fully-rendered system prompt.
+    // Snapshot its length under `identity` so getContextBreakdown still
+    // attributes the prompt — otherwise sub-agents report 0 across every
+    // category except messages and tools.
+    if (this.systemPromptOverride) {
+      const sizes = emptyPromptLayerSizes()
+      sizes.identity = this.systemPromptOverride.length
+      this._lastLayerSizes = sizes
+      return this.systemPromptOverride
+    }
+
+    // Reset sizes — every call re-builds from scratch.
+    const sizes = emptyPromptLayerSizes()
 
     // Layer 0: Core system prompt — self-contained behavioral instructions.
     // Identical for all deployments. Works perfectly even if all other layers are empty.
     let prompt = CORE_SYSTEM_PROMPT
+    sizes.identity += CORE_SYSTEM_PROMPT.length
 
-    prompt +=
+    const orientation =
       '\n\nContextual information, rules, and memory are provided in <system-reminder> tags below. These are injected by the system and should be treated as trusted context. Priority order: workspace rules > user rules > memory > other context.'
+    prompt += orientation
+    sizes.identity += orientation.length
 
     // Layer 1: Workspace rules (.anton.md) — highest priority contextual layer
     if (this.workspacePath) {
-      const workspaceRules = loadWorkspaceRules(this.workspacePath)
-      prompt += systemReminder('Workspace Rules', workspaceRules)
+      const workspaceRulesBlock = systemReminder(
+        'Workspace Rules',
+        loadWorkspaceRules(this.workspacePath),
+      )
+      prompt += workspaceRulesBlock
+      sizes.workspaceRules += workspaceRulesBlock.length
     }
 
     // Layer 2: User rules (append.md + rules/*.md from ~/.anton/prompts/)
-    prompt += systemReminder('User Rules', loadUserRules())
+    const userRulesBlock = systemReminder('User Rules', loadUserRules())
+    prompt += userRulesBlock
+    sizes.userRules += userRulesBlock.length
 
     // Layer 3: Current context — workspace, project, date
     const contextLines: string[] = []
@@ -2506,21 +2607,39 @@ export class Session {
       contextLines.push('- Sudo: not available')
     }
 
-    prompt += systemReminder('Current Context', contextLines.join('\n'))
+    const currentContextBlock = systemReminder('Current Context', contextLines.join('\n'))
+    prompt += currentContextBlock
+    sizes.currentContext += currentContextBlock.length
 
     // Shared layers — wording lives in prompt-layers.ts so the harness
     // path sees byte-identical blocks. Do not inline here.
-    prompt += buildSurfaceLayer(this.surface)
-    prompt += buildMemoryLayer(this.memoryData)
-    prompt += buildProjectMemoryInstructionsLayer(this.projectId)
-    prompt += buildAgentContextLayer(this.agentInstructions, this.agentMemory)
-    prompt += buildActiveConnectorsLayer(this.liveConnectors)
+    const surfaceBlock = buildSurfaceLayer(this.surface)
+    prompt += surfaceBlock
+    sizes.surface += surfaceBlock.length
+
+    const memoryBlock = buildMemoryLayer(this.memoryData)
+    prompt += memoryBlock
+    sizes.memory += memoryBlock.length
+
+    const projectMemoryBlock = buildProjectMemoryInstructionsLayer(this.projectId)
+    prompt += projectMemoryBlock
+    sizes.projectMemoryInstructions += projectMemoryBlock.length
+
+    const agentContextBlock = buildAgentContextLayer(this.agentInstructions, this.agentMemory)
+    prompt += agentContextBlock
+    sizes.agentContext += agentContextBlock.length
+
+    const connectorsBlock = buildActiveConnectorsLayer(this.liveConnectors)
+    prompt += connectorsBlock
+    sizes.connectors += connectorsBlock.length
 
     // Layer 7: Project type guidelines (code.md, document.md, etc.)
     if (this.projectType) {
       const typePrompt = loadProjectTypePrompt(this.projectType as ProjectType)
       if (typePrompt) {
-        prompt += systemReminder('Project Type Guidelines', typePrompt)
+        const typeBlock = systemReminder('Project Type Guidelines', typePrompt)
+        prompt += typeBlock
+        sizes.projectTypeGuidelines += typeBlock.length
       }
     }
 
@@ -2530,24 +2649,121 @@ export class Session {
       firstMessage: this.firstMessage,
     })
     if (refs) {
-      prompt += systemReminder('Reference Knowledge', refs)
+      const refsBlock = systemReminder('Reference Knowledge', refs)
+      prompt += refsBlock
+      sizes.referenceKnowledge += refsBlock.length
     }
 
     // Layer 9: Active skills — catalog plus auto-selected SKILL.md bodies.
-    prompt += buildActiveSkillsLayer({
+    const skillsBlock = buildActiveSkillsLayer({
       skills: this.config.skills,
       userMessage: this.latestUserMessage ?? this.firstMessage,
     })
+    prompt += skillsBlock
+    sizes.skills += skillsBlock.length
 
     // Shared layer — wording lives in prompt-layers.ts.
-    prompt += buildWorkflowsLayer(this.availableWorkflows)
+    const workflowsBlock = buildWorkflowsLayer(this.availableWorkflows)
+    prompt += workflowsBlock
+    sizes.workflows += workflowsBlock.length
 
     // Compute prompt version hash for tracing
     this._promptVersion = hashPromptVersion(prompt)
 
+    this._lastLayerSizes = sizes
+
     return prompt
   }
 
+  /**
+   * Per-category breakdown of this session's current prompt budget.
+   * Powers the in-composer Context gauge + popover. Returns null when neither
+   * the resolved model nor `compactionConfig.maxContextTokens` gives a positive
+   * context window (defensive — pi-ai's catalog populates it for our models).
+   *
+   * Pi SDK path computes the full split: sums layer sizes from the most
+   * recent `getSystemPrompt()` call into named categories, splits the live
+   * tool list (built-in vs MCP / OAuth-connector), estimates conversation
+   * history via `estimateTokens`, and reserves `(1 − threshold)` of the
+   * window for autocompaction headroom. Char counts get divided by 4 to match
+   * compaction's heuristic; all rows except the buffer are calibration-scaled.
+   */
+  getContextBreakdown(): import('@anton/protocol').ContextBreakdown | null {
+    const contextWindow =
+      this.resolvedModel?.contextWindow ?? this.compactionConfig.maxContextTokens
+    if (!contextWindow || contextWindow <= 0) return null
+
+    // Make sure we have a layer-size snapshot — the very first read can
+    // happen before any prompt rebuild (e.g. fresh session).
+    if (this._lastLayerSizes === undefined) {
+      this._lastLayerSizes = emptyPromptLayerSizes()
+    }
+    const s = this._lastLayerSizes
+
+    // Group every "system prompt-ish" layer into one bucket. Skills and
+    // memory keep their own rows; everything else (identity, rules,
+    // current context, surface, agent context, connectors, project type,
+    // references, workflows, project memory instructions) lumps in here.
+    const systemPromptChars =
+      s.identity +
+      s.workspaceRules +
+      s.userRules +
+      s.currentContext +
+      s.surface +
+      s.projectMemoryInstructions +
+      s.agentContext +
+      s.connectors +
+      s.projectTypeGuidelines +
+      s.referenceKnowledge +
+      s.workflows
+
+    const toolSizes = categorizeTools(this.piAgent.state.tools)
+
+    const messageTokens = estimateTokens(this.piAgent.state.messages)
+    const autocompactBuffer = Math.floor(
+      contextWindow * Math.max(0, 1 - this.compactionConfig.threshold),
+    )
+
+    const charsToTokens = (chars: number) => Math.ceil(chars / 4)
+    const scale = this._contextEstimateScale > 0 ? this._contextEstimateScale : 1.0
+    const apply = (n: number) => Math.max(0, Math.round(n * scale))
+
+    return {
+      contextWindow,
+      systemPrompt: apply(charsToTokens(systemPromptChars)),
+      systemTools: apply(charsToTokens(toolSizes.systemToolChars)),
+      mcpTools: apply(charsToTokens(toolSizes.mcpToolChars)),
+      skills: apply(charsToTokens(s.skills)),
+      memoryFiles: apply(charsToTokens(s.memory)),
+      messages: apply(messageTokens),
+      autocompactBuffer,
+      source: 'pi-sdk',
+    }
+  }
+
+  /**
+   * Update the calibration factor after a turn finishes. Compares the
+   * model's reported `input_tokens` against the breakdown snapshot
+   * captured at `turn_start` (pre-turn) — calibrating against the
+   * post-turn breakdown would bias scale low because pi-ai appends the
+   * assistant response to messages before turn_end fires.
+   * Bounded to [0.5, 2.0] so a one-off outlier (very large image, weird
+   * cache behaviour) can't blow the estimate up.
+   */
+  updateContextEstimateScale(actualInputTokens: number): void {
+    const preTurnSum = this._preTurnEstimateSum
+    if (preTurnSum === null || preTurnSum <= 0 || actualInputTokens <= 0) return
+    // The pre-turn sum already had the prior scale applied — back it
+    // out so we end up with a multiplicative factor on the raw estimate.
+    const priorScale = this._contextEstimateScale > 0 ? this._contextEstimateScale : 1.0
+    const rawEstimate = preTurnSum / priorScale
+    if (rawEstimate <= 0) return
+    const next = actualInputTokens / rawEstimate
+    this._contextEstimateScale = Math.min(2.0, Math.max(0.5, next))
+    // Consume the snapshot — next turn will capture a fresh one at turn_start.
+    this._preTurnEstimateSum = null
+  }
+
   /**
    * Update where this session is talking. Called by the webhook runner on
    * every turn so a Slack session picks up the current thread's user /
@@ -2558,6 +2774,8 @@ export class Session {
   setSurface(surface: SurfaceInfo | undefined): void {
     this.surface = surface
     this.piAgent.setSystemPrompt(this.getSystemPrompt())
+    // Surface layer changed — refresh the gauge if a turn is active.
+    this.pushContextUpdate()
   }
 
   /**
@@ -2576,6 +2794,8 @@ export class Session {
     this.contextInfo = contextInfo
     // Update system prompt with new context
     this.piAgent.setSystemPrompt(this.getSystemPrompt())
+    // Memory bytes changed — refresh the gauge if a turn is active.
+    this.pushContextUpdate()
     return contextInfo
   }
 }
@@ -2818,6 +3038,7 @@ export function resumeSession(
     title: persisted.title,
     createdAt: persisted.createdAt,
     compactionState: persisted.compactionState || undefined,
+    contextEstimateScale: persisted.contextEstimateScale,
     projectId: opts?.projectId,
     projectContext: opts?.projectContext,
     projectType: opts?.projectType,
diff --git a/packages/agent-server/src/server.ts b/packages/agent-server/src/server.ts
index 68fe04d0..7c51bd62 100644
--- a/packages/agent-server/src/server.ts
+++ b/packages/agent-server/src/server.ts
@@ -111,6 +111,7 @@ import {
   ensureHarnessSessionInit,
   executePublish,
   extractHarnessMemoriesFromMirror,
+  getModelContextSize,
   hashPromptVersion,
   isHarnessSession,
   matchesSurface,
@@ -134,6 +135,7 @@ import {
 import type {
   AiMessage,
   ChannelId,
+  ContextBreakdown,
   ControlMessage,
   TerminalMessage,
   ThinkingLevel,
@@ -2216,6 +2218,11 @@ export class AgentServer {
           model: session.model,
         })
 
+        // Initial Context-gauge breakdown so the popover has data the
+        // moment the user opens it — no "Loading details…" state on
+        // Pi-SDK sessions.
+        this.emitContextUpdateIfPiSdk(msg.id, session)
+
         // Send context info if available
         if (session.contextInfo) {
           this.sendToClient(Channel.AI, {
@@ -2636,6 +2643,29 @@ export class AgentServer {
         provider: providerName,
         model,
       })
+      // Initial Context-gauge breakdown for harness sessions. We don't
+      // know per-section sizes (the CLI's prompt is opaque), but we can
+      // at least seed `contextWindow` so the popover renders an empty
+      // gauge instead of nothing until the first `tokenUsageUpdated`
+      // event arrives.
+      const contextWindow = getModelContextSize(model)
+      if (contextWindow > 0) {
+        this.sendToClient(Channel.AI, {
+          type: 'context_update',
+          sessionId: id,
+          breakdown: {
+            contextWindow,
+            systemPrompt: 0,
+            systemTools: 0,
+            mcpTools: 0,
+            skills: 0,
+            memoryFiles: 0,
+            messages: 0,
+            autocompactBuffer: 0,
+            source: 'harness',
+          },
+        })
+      }
     }
 
     log.info(
@@ -3998,6 +4028,9 @@ export class AgentServer {
         }
         try {
           session.switchModel(msg.provider, msg.model)
+          // Context window may have changed — refresh the gauge before
+          // the user's next turn (otherwise stale until turn_end).
+          this.emitContextUpdateIfPiSdk(id, session)
           log.info(
             { sessionId: id, provider: msg.provider, model: msg.model },
             'Switched API session to new default model',
@@ -5299,6 +5332,10 @@ export class AgentServer {
     // Skip for harness sessions — they manage their own context
     if (!isHarnessSession(session) && !session.contextInfo) {
       const contextInfo = session.loadConversationContext(msg.content)
+      // Memory layer just changed — refresh the gauge so the popover
+      // attributes the new memory bytes correctly before the next turn
+      // ends.
+      this.emitContextUpdateIfPiSdk(sessionId, session)
       if (contextInfo) {
         this.sendToClient(Channel.AI, {
           type: 'context_info',
@@ -6756,9 +6793,11 @@ export class AgentServer {
 
   /** Refresh connector tools on all active sessions so new connectors are available immediately. */
   private refreshAllSessionTools(): void {
-    for (const session of this.sessions.values()) {
+    for (const [sessionId, session] of this.sessions) {
       if (!isHarnessSession(session)) {
         session.refreshConnectorTools()
+        // Tool list (and thus its byte budget) just changed.
+        this.emitContextUpdateIfPiSdk(sessionId, session)
       }
     }
     this.webhookRunner?.refreshAllSessionTools()
@@ -6964,6 +7003,26 @@ export class AgentServer {
     }
   }
 
+  /**
+   * Pull a fresh ContextBreakdown from a Pi-SDK Session and forward it
+   * to the desktop client. Used to seed the initial gauge data and after
+   * explicit mutations (model switch, connector refresh, conversation
+   * context load) where the breakdown changes between turns and would
+   * otherwise stay stale until the next turn ends. No-op for harness
+   * sessions (the codex harness emits its own breakdowns via
+   * `tokenUsageUpdated`) and when the session returns no breakdown.
+  private emitContextUpdateIfPiSdk(sessionId: string, session: unknown): void {
+    if (isHarnessSession(session)) return
+    const piSession = session as { getContextBreakdown?: () => ContextBreakdown | null }
+    const breakdown = piSession.getContextBreakdown?.()
+    if (!breakdown) return
+    this.sendToClient(Channel.AI, {
+      type: 'context_update',
+      sessionId,
+      breakdown,
+    })
+  }
+
   /**
    * Schedule a hard wall-clock cancel for a detached turn. Replaces any
    * existing timer for the same session so repeated disconnects don't
diff --git a/packages/desktop/src/components/RoutineChat.tsx b/packages/desktop/src/components/RoutineChat.tsx
index 7e041668..9282eee3 100644
--- a/packages/desktop/src/components/RoutineChat.tsx
+++ b/packages/desktop/src/components/RoutineChat.tsx
@@ -8,7 +8,6 @@ import { projectStore } from '../lib/store/projectStore.js'
 import { sessionStore, useSessionState } from '../lib/store/sessionStore.js'
 import { ChatInput } from './chat/ChatInput.js'
 import { ConfirmDialog } from './chat/ConfirmDialog.js'
-import { ContextIndicator } from './chat/ContextIndicator.js'
 import { MessageList } from './chat/MessageList.js'
 import { PlanReviewOverlay } from './chat/PlanReviewOverlay.js'
 import { RoutineChatHeader } from './chat/RoutineChatHeader.js'
@@ -241,7 +240,6 @@ export function RoutineChat() {
 
   return (
     <div className="chat-shell">
-      <ContextIndicator contextInfo={activeConv?.contextInfo} sessionId={activeConv?.sessionId} />
       {isSyncing && messages.length === 0 ? (
         /* First load — nothing local to show yet, show a subtle spinner */
         <div className="chat-shell__sync-loader">
diff --git a/packages/desktop/src/components/chat/ChatInput.tsx b/packages/desktop/src/components/chat/ChatInput.tsx
index 2d0989be..ca779ed1 100644
--- a/packages/desktop/src/components/chat/ChatInput.tsx
+++ b/packages/desktop/src/components/chat/ChatInput.tsx
@@ -30,6 +30,7 @@ import { MentionDropdown } from '../mentions/MentionDropdown.js'
 import { AskUserInline } from './AskUserInline.js'
 import { ComposerAddMenu } from './ComposerAddMenu.js'
 import { ConnectorBanner } from './ConnectorToolbar.js'
+import { ContextGauge } from './ContextGauge.js'
 import { ModelSelector } from './ModelSelector.js'
 import type { RichInputHandle } from './RichInput.js'
 import { RichInput } from './RichInput.js'
@@ -811,6 +812,7 @@ export function ChatInput({
               )}
             </div>
             <div className="composer__toolbar-right">
+              <ContextGauge />
               <ModelSelector />
               {isCurrentSessionWorking ? (
                 <>
diff --git a/packages/desktop/src/components/chat/ContextGauge.tsx b/packages/desktop/src/components/chat/ContextGauge.tsx
new file mode 100644
index 00000000..81738f0f
--- /dev/null
+++ b/packages/desktop/src/components/chat/ContextGauge.tsx
@@ -0,0 +1,120 @@
+import { useCallback, useMemo, useRef, useState } from 'react'
+import { sessionStore } from '../../lib/store/sessionStore.js'
+import { ContextPopover } from './ContextPopover.js'
+
+const SIZE = 16
+const STROKE = 1.6
+const RADIUS = (SIZE - STROKE) / 2
+const CIRCUMFERENCE = 2 * Math.PI * RADIUS
+
+/**
+ * Compose-toolbar context-window gauge. Click toggles the breakdown
+ * popover. Color states use fixed cut-offs (not the configured threshold):
+ *   < 70%  → idle (muted ring)
+ *   70–80% → warning (amber)
+ *   ≥ 80%  → critical (matches `--accent`; compaction will fire on the
+ *           next turn at the default 0.80 threshold).
+ *
+ * Hidden when no `contextBreakdown` is in the store (fresh session before
+ * the first `context_update`, or harness path that hasn't reported yet).
+ */
+export function ContextGauge() {
+  const [open, setOpen] = useState(false)
+  const buttonRef = useRef<HTMLButtonElement>(null)
+  const [anchorRect, setAnchorRect] = useState<DOMRect | null>(null)
+
+  const breakdown = sessionStore((s) => {
+    const sid = s.currentSessionId
+    if (!sid) return null
+    return s.sessionStates.get(sid)?.contextBreakdown ?? null
+  })
+
+  const used = useMemo(() => {
+    if (!breakdown) return 0
+    return (
+      breakdown.systemPrompt +
+      breakdown.systemTools +
+      breakdown.mcpTools +
+      breakdown.skills +
+      breakdown.memoryFiles +
+      breakdown.messages
+    )
+  }, [breakdown])
+
+  const fillRatio =
+    breakdown && breakdown.contextWindow > 0
+      ? Math.min(1, Math.max(0, used / breakdown.contextWindow))
+      : 0
+  const percentLabel = Math.round(fillRatio * 100)
+
+  const colorClass =
+    fillRatio >= 0.8
+      ? 'context-gauge--critical'
+      : fillRatio >= 0.7
+        ? 'context-gauge--warning'
+        : 'context-gauge--idle'
+
+  const handleToggle = useCallback(() => {
+    setAnchorRect(buttonRef.current?.getBoundingClientRect() ?? null)
+    setOpen((v) => !v)
+  }, [])
+
+  const handleClose = useCallback(() => setOpen(false), [])
+
+  if (!breakdown) return null
+
+  const dashOffset = CIRCUMFERENCE * (1 - fillRatio)
+
+  return (
+    <>
+      <button
+        ref={buttonRef}
+        type="button"
+        className={`context-gauge ${colorClass}${open ? ' context-gauge--open' : ''}`}
+        aria-label={`Context window ${percentLabel}% used`}
+        aria-haspopup="true"
+        aria-expanded={open}
+        data-tooltip={`${percentLabel}% of context used`}
+        onClick={handleToggle}
+      >
+        <svg
+          width={SIZE}
+          height={SIZE}
+          viewBox={`0 0 ${SIZE} ${SIZE}`}
+          role="img"
+          aria-label={`Context ${percentLabel}% used`}
+          focusable="false"
+        >
+          <title>Context {percentLabel}% used</title>
+          <circle
+            cx={SIZE / 2}
+            cy={SIZE / 2}
+            r={RADIUS}
+            fill="none"
+            strokeWidth={STROKE}
+            className="context-gauge__track"
+          />
+          <circle
+            cx={SIZE / 2}
+            cy={SIZE / 2}
+            r={RADIUS}
+            fill="none"
+            strokeWidth={STROKE}
+            strokeLinecap="round"
+            className="context-gauge__fill"
+            strokeDasharray={CIRCUMFERENCE}
+            strokeDashoffset={dashOffset}
+            transform={`rotate(-90 ${SIZE / 2} ${SIZE / 2})`}
+          />
+        </svg>
+      </button>
+      <ContextPopover
+        open={open}
+        onClose={handleClose}
+        anchorRect={anchorRect}
+        breakdown={breakdown}
+        triggerRef={buttonRef}
+      />
+    </>
+  )
+}
diff --git a/packages/desktop/src/components/chat/ContextIndicator.tsx b/packages/desktop/src/components/chat/ContextIndicator.tsx
deleted file mode 100644
index 3183c3ef..00000000
--- a/packages/desktop/src/components/chat/ContextIndicator.tsx
+++ /dev/null
@@ -1,40 +0,0 @@
-import { Brain, FolderOpen } from 'lucide-react'
-import type { ConversationContextInfo } from '../../lib/conversations.js'
-import { useStore } from '../../lib/store.js'
-
-interface ContextIndicatorProps {
-  contextInfo?: ConversationContextInfo
-  sessionId?: string
-}
-
-export function ContextIndicator({ contextInfo, sessionId }: ContextIndicatorProps) {
-  const openContextPanel = useStore((s) => s.openContextPanel)
-
-  const totalMemories = contextInfo
-    ? contextInfo.globalMemories.length +
-      contextInfo.conversationMemories.length +
-      contextInfo.crossConversationMemories.length
-    : 0
-
-  if (!sessionId && totalMemories === 0) return null
-
-  return (
-    <div className="context-indicator">
-      <button
-        type="button"
-        className="context-indicator__badge"
-        onClick={openContextPanel}
-        data-tooltip={totalMemories > 0 ? `${totalMemories} memories loaded` : 'Conversation info'}
-      >
-        {totalMemories > 0 ? (
-          <>
-            <Brain size={14} strokeWidth={1.5} />
-            <span className="context-indicator__count">{totalMemories}</span>
-          </>
-        ) : (
-          <FolderOpen size={14} strokeWidth={1.5} />
-        )}
-      </button>
-    </div>
-  )
-}
diff --git a/packages/desktop/src/components/chat/ContextPopover.tsx b/packages/desktop/src/components/chat/ContextPopover.tsx
new file mode 100644
index 00000000..28f3278a
--- /dev/null
+++ b/packages/desktop/src/components/chat/ContextPopover.tsx
@@ -0,0 +1,240 @@
+import type { ContextBreakdown } from '@anton/protocol'
+import { type RefObject, useEffect, useMemo, useRef } from 'react'
+import { createPortal } from 'react-dom'
+import { useStore } from '../../lib/store.js'
+
+interface Props {
+  open: boolean
+  onClose: () => void
+  anchorRect: DOMRect | null
+  breakdown: ContextBreakdown
+  /**
+   * Trigger button that opens this popover. Used to skip outside-click
+   * close when the user clicks the trigger again — without this, the
+   * mousedown on the trigger fires onClose, then the click toggles the
+   * gauge back open. Net effect: the popover never closes via the
+   * gauge.
+   */
+  triggerRef?: RefObject<HTMLElement | null>
+}
+
+interface Row {
+  key: string
+  label: string
+  tokens: number
+  /** Solid hue for the stacked bar segment + row legend dot. */
+  className: string
+}
+
+function formatTokens(n: number): string {
+  if (n >= 1_000_000) return `${(n / 1_000_000).toFixed(1)}M`
+  if (n >= 100_000) return `${Math.round(n / 1_000)}k`
+  if (n >= 1_000) return `${(n / 1_000).toFixed(1)}k`
+  return String(Math.max(0, Math.round(n)))
+}
+
+const ESTIMATED_POPOVER_HEIGHT = 360
+const ESTIMATED_POPOVER_WIDTH = 320 // NOTE(review): index.css sets .context-popover width to 280px — confirm
+const VIEWPORT_PADDING = 8
+
+/**
+ * Floating per-category breakdown of the active session's context-window
+ * usage. Rendered in a portal so a transformed ancestor can't break the
+ * fixed positioning. Anchored above the gauge by default; flips below
+ * when there isn't enough room above.
+ *
+ * Pi-SDK sessions render every category. Harness sessions
+ * (`breakdown.source === 'harness'`) only carry `messages` + `contextWindow`,
+ * so we collapse to a 2-row breakdown plus a footnote.
+ */
+export function ContextPopover({ open, onClose, anchorRect, breakdown, triggerRef }: Props) {
+  const popoverRef = useRef<HTMLDivElement>(null)
+  const openContextPanel = useStore((s) => s.openContextPanel)
+
+  useEffect(() => {
+    if (!open) return
+    const onKey = (e: KeyboardEvent) => {
+      if (e.key === 'Escape') {
+        e.preventDefault()
+        onClose()
+      }
+    }
+    const onClick = (e: MouseEvent) => {
+      const target = e.target as Node
+      if (popoverRef.current?.contains(target)) return
+      // Don't close on the trigger button — the trigger's own click
+      // handler will toggle `open` to false a beat later, and closing
+      // here would race with that and re-open the popover.
+      if (triggerRef?.current?.contains(target)) return
+      onClose()
+    }
+    window.addEventListener('keydown', onKey)
+    const id = window.setTimeout(() => window.addEventListener('mousedown', onClick), 0)
+    return () => {
+      window.removeEventListener('keydown', onKey)
+      window.removeEventListener('mousedown', onClick)
+      window.clearTimeout(id)
+    }
+  }, [open, onClose, triggerRef])
+
+  const rows: Row[] = useMemo(() => {
+    if (breakdown.source === 'harness') {
+      return [
+        {
+          key: 'messages',
+          label: 'Messages',
+          tokens: breakdown.messages,
+          className: 'context-popover__seg--messages',
+        },
+      ]
+    }
+    return [
+      {
+        key: 'messages',
+        label: 'Messages',
+        tokens: breakdown.messages,
+        className: 'context-popover__seg--messages',
+      },
+      {
+        key: 'systemPrompt',
+        label: 'System prompt',
+        tokens: breakdown.systemPrompt,
+        className: 'context-popover__seg--system-prompt',
+      },
+      {
+        key: 'systemTools',
+        label: 'System tools',
+        tokens: breakdown.systemTools,
+        className: 'context-popover__seg--system-tools',
+      },
+      {
+        key: 'mcpTools',
+        label: 'MCP tools',
+        tokens: breakdown.mcpTools,
+        className: 'context-popover__seg--mcp-tools',
+      },
+      {
+        key: 'skills',
+        label: 'Skills',
+        tokens: breakdown.skills,
+        className: 'context-popover__seg--skills',
+      },
+      {
+        key: 'memoryFiles',
+        label: 'Memory files',
+        tokens: breakdown.memoryFiles,
+        className: 'context-popover__seg--memory',
+      },
+    ]
+  }, [breakdown])
+
+  const usedTokens = rows.reduce((sum, r) => sum + r.tokens, 0)
+  const reserved = breakdown.autocompactBuffer
+  const free = Math.max(0, breakdown.contextWindow - usedTokens - reserved)
+
+  if (!open || !anchorRect) return null
+
+  const spaceAbove = anchorRect.top
+  const placeAbove = spaceAbove >= ESTIMATED_POPOVER_HEIGHT + 16
+  // Center the popover horizontally on the trigger so the visual
+  // pointer always reads "this comes from that button". Clamp to the
+  // viewport so a gauge near the right edge can't push the popover
+  // off-screen.
+  const anchorCenter = anchorRect.left + anchorRect.width / 2
+  const idealLeft = anchorCenter - ESTIMATED_POPOVER_WIDTH / 2
+  const maxLeft = window.innerWidth - ESTIMATED_POPOVER_WIDTH - VIEWPORT_PADDING
+  const left = Math.max(VIEWPORT_PADDING, Math.min(idealLeft, maxLeft))
+  const style: React.CSSProperties = placeAbove
+    ? {
+        position: 'fixed',
+        left,
+        bottom: window.innerHeight - anchorRect.top + 8,
+        zIndex: 50,
+      }
+    : {
+        position: 'fixed',
+        left,
+        top: anchorRect.bottom + 8,
+        zIndex: 50,
+      }
+
+  // Stacked bar uses percentage widths so totals stay stable across resizes.
+  const window_ = breakdown.contextWindow
+  const pct = (n: number) => (window_ > 0 ? (n / window_) * 100 : 0)
+
+  return createPortal(
+    <div
+      ref={popoverRef}
+      className="context-popover"
+      aria-label="Context window breakdown"
+      style={style}
+    >
+      <div className="context-popover__head">
+        <span className="context-popover__title">Context</span>
+        <span className="context-popover__counter">
+          {formatTokens(usedTokens)}/{formatTokens(window_)}
+        </span>
+      </div>
+
+      <div className="context-popover__bar" aria-hidden>
+        {rows
+          .filter((r) => r.tokens > 0)
+          .map((r) => (
+            <span
+              key={r.key}
+              className={`context-popover__seg ${r.className}`}
+              style={{ width: `${pct(r.tokens)}%` }}
+            />
+          ))}
+        {reserved > 0 && (
+          <span
+            className="context-popover__seg context-popover__seg--reserved"
+            style={{ width: `${pct(reserved)}%` }}
+          />
+        )}
+      </div>
+
+      <ul className="context-popover__rows">
+        {rows.map((r) => (
+          <li key={r.key} className="context-popover__row">
+            <span className={`context-popover__dot ${r.className}`} />
+            <span className="context-popover__label">{r.label}</span>
+            <span className="context-popover__value">
+              {window_ > 0 ? `${pct(r.tokens).toFixed(1)}%` : '—'}
+            </span>
+          </li>
+        ))}
+        {reserved > 0 && (
+          <li className="context-popover__row">
+            <span className="context-popover__dot context-popover__seg--reserved" />
+            <span className="context-popover__label">Autocompact buffer</span>
+            <span className="context-popover__value">{pct(reserved).toFixed(1)}%</span>
+          </li>
+        )}
+        <li className="context-popover__row context-popover__row--free">
+          <span className="context-popover__dot context-popover__dot--free" />
+          <span className="context-popover__label">Free space</span>
+          <span className="context-popover__value">{pct(free).toFixed(1)}%</span>
+        </li>
+      </ul>
+
+      {breakdown.source === 'harness' && (
+        <div className="context-popover__footnote">
+          Per-section detail is not available for harness sessions.
+        </div>
+      )}
+
+      <button
+        type="button"
+        className="context-popover__details-link"
+        onClick={() => {
+          openContextPanel()
+          onClose()
+        }}
+      >
+        View memory details →
+      </button>
+    </div>,
+    document.body,
+  )
+}
diff --git a/packages/desktop/src/index.css b/packages/desktop/src/index.css
index 949bb681..59740944 100644
--- a/packages/desktop/src/index.css
+++ b/packages/desktop/src/index.css
@@ -14288,38 +14288,167 @@ button {
 }
 
 /* ═══════════════════════════════════════════════════════════════════
-   CONTEXT INDICATOR
+   CONTEXT GAUGE + POPOVER (composer toolbar)
    ═══════════════════════════════════════════════════════════════════ */
 
-/* ── Context indicator badge ── */
-.context-indicator {
-  position: relative;
-  display: flex;
-  justify-content: flex-end;
-  padding: 4px 16px 0;
+.context-gauge {
+  display: inline-grid;
+  place-items: center;
+  width: 26px;
+  height: 26px;
+  padding: 0;
+  border: 0;
+  background: transparent;
+  border-radius: 999px;
+  color: var(--text-3);
+  cursor: pointer;
+  transition: background 0.12s ease, color 0.12s ease;
+}
+.context-gauge:hover,
+.context-gauge--open {
+  background: var(--bg-elev-2);
+  color: var(--text);
+}
+.context-gauge__track {
+  stroke: color-mix(in oklch, var(--border-strong) 100%, transparent);
+}
+.context-gauge__fill {
+  stroke: var(--text-3);
+  transition: stroke-dashoffset 0.18s ease, stroke 0.12s ease;
+}
+.context-gauge--warning .context-gauge__fill {
+  stroke: var(--warning);
+}
+.context-gauge--critical .context-gauge__fill {
+  stroke: var(--accent);
 }
 
-.context-indicator__badge {
+/* ── Popover ── */
+.context-popover {
+  width: 280px;
+  padding: 12px 14px 10px;
+  background: var(--bg-elev-2);
+  border: 1px solid var(--border-strong);
+  border-radius: 12px;
+  box-shadow: 0 12px 32px rgba(0, 0, 0, 0.32), 0 2px 8px rgba(0, 0, 0, 0.18);
+  color: var(--text);
+  font-size: 12.5px;
+  line-height: 1.4;
+}
+.context-popover__head {
   display: flex;
-  align-items: center;
+  align-items: baseline;
+  justify-content: space-between;
+  margin-bottom: 10px;
+}
+.context-popover__title {
+  font-size: 13px;
+  font-weight: 600;
+  letter-spacing: -0.005em;
+}
+.context-popover__counter {
+  color: var(--text-3);
+  font-variant-numeric: tabular-nums;
+}
+.context-popover__bar {
+  display: flex;
+  width: 100%;
+  height: 6px;
+  border-radius: 999px;
+  overflow: hidden;
+  background: color-mix(in oklch, var(--border) 100%, transparent);
+  margin-bottom: 10px;
+}
+.context-popover__seg {
+  height: 100%;
+}
+.context-popover__rows {
+  margin: 0;
+  padding: 0;
+  list-style: none;
+  display: flex;
+  flex-direction: column;
   gap: 4px;
-  padding: 2px 8px;
-  border: none;
+}
+.context-popover__row {
+  display: grid;
+  grid-template-columns: 8px 1fr auto;
+  align-items: center;
+  gap: 8px;
+  padding: 2px 0;
+  color: var(--text-2, var(--text));
+}
+.context-popover__row--free .context-popover__label {
+  color: var(--text-3);
+}
+.context-popover__dot {
+  width: 8px;
+  height: 8px;
+  border-radius: 999px;
+  display: inline-block;
+}
+.context-popover__dot--free {
   background: transparent;
-  color: var(--text-tertiary, #666);
-  font-size: 11px;
+  box-shadow: inset 0 0 0 1px var(--border-strong);
+}
+.context-popover__label {
+  white-space: nowrap;
+  overflow: hidden;
+  text-overflow: ellipsis;
+}
+.context-popover__value {
+  color: var(--text-3);
+  font-variant-numeric: tabular-nums;
+  font-size: 12px;
+}
+.context-popover__footnote {
+  margin-top: 10px;
+  padding-top: 8px;
+  border-top: 1px solid var(--border);
+  font-size: 11.5px;
+  color: var(--text-3);
+}
+.context-popover__details-link {
+  display: block;
+  width: 100%;
+  margin-top: 10px;
+  padding: 6px 0 0;
+  border: 0;
+  border-top: 1px solid var(--border);
+  background: transparent;
+  color: var(--text-3);
+  font-size: 12px;
+  text-align: left;
   cursor: pointer;
-  border-radius: 4px;
-  transition: background 0.15s, color 0.15s;
+  transition: color 0.12s ease;
 }
-
-.context-indicator__badge:hover {
-  background: var(--bg-hover, rgba(var(--overlay), 0.06));
-  color: var(--text-secondary, #999);
+.context-popover__details-link:hover {
+  color: var(--accent);
 }
 
-.context-indicator__count {
-  font-variant-numeric: tabular-nums;
+/* Stacked-bar segment hues — kept distinct so the bar reads
+   instantly without needing a legend. Tones drawn from existing
+   accent-derived oklch values to match the rest of the UI. */
+.context-popover__seg--messages {
+  background: var(--accent);
+}
+.context-popover__seg--system-prompt {
+  background: oklch(0.7 0.07 250);
+}
+.context-popover__seg--system-tools {
+  background: oklch(0.7 0.1 160);
+}
+.context-popover__seg--mcp-tools {
+  background: oklch(0.7 0.1 220);
+}
+.context-popover__seg--skills {
+  background: oklch(0.72 0.13 300);
+}
+.context-popover__seg--memory {
+  background: oklch(0.74 0.13 35);
+}
+.context-popover__seg--reserved {
+  background: color-mix(in oklch, var(--text-3) 60%, transparent);
 }
 
 /* ── Context panel (inside SidePanel) ── */
diff --git a/packages/desktop/src/lib/store/handlers/interactionHandler.ts b/packages/desktop/src/lib/store/handlers/interactionHandler.ts
index c9ef3c19..bfa32310 100644
--- a/packages/desktop/src/lib/store/handlers/interactionHandler.ts
+++ b/packages/desktop/src/lib/store/handlers/interactionHandler.ts
@@ -189,6 +189,14 @@ export function handleInteractionMessage(msg: AiMessage, ctx: MessageContext): b
       return true
     }
 
+    case 'context_update': {
+      const sid = ctx.msgSessionId
+      if (sid && msg.breakdown) {
+        sessionStore.getState().updateSessionState(sid, { contextBreakdown: msg.breakdown })
+      }
+      return true
+    }
+
     case 'done': {
       const ss = sessionStore.getState()
       const store = useStore.getState()
diff --git a/packages/desktop/src/lib/store/sessionStore.ts b/packages/desktop/src/lib/store/sessionStore.ts
index b1773aed..ee575f0e 100644
--- a/packages/desktop/src/lib/store/sessionStore.ts
+++ b/packages/desktop/src/lib/store/sessionStore.ts
@@ -95,6 +95,12 @@ export interface SessionState {
   lastResponseProvider: string | null
   lastResponseModel: string | null
 
+  // Per-category context window breakdown (drives the composer Context
+  // gauge + popover). Null until the agent-server emits the first
+  // `context_update` event for this session. Pi-SDK sessions carry the
+  // full split; harness sessions only populate `messages` + `contextWindow`.
+  contextBreakdown: import('@anton/protocol').ContextBreakdown | null
+
   // Pending interactions
   pendingConfirm: PendingConfirm | null
   pendingPlan: PendingPlan | null
@@ -150,6 +156,7 @@ export function createSessionState(
     sessionUsage: null,
     lastResponseProvider: null,
     lastResponseModel: null,
+    contextBreakdown: null,
     pendingConfirm: null,
     pendingPlan: null,
     pendingAskUser: null,
diff --git a/specs/features/ui/CONTEXT_GAUGE.md b/specs/features/ui/CONTEXT_GAUGE.md
new file mode 100644
index 00000000..a787c510
--- /dev/null
+++ b/specs/features/ui/CONTEXT_GAUGE.md
@@ -0,0 +1,113 @@
+# Composer Context Gauge + Popover
+
+A circular gauge in the chat composer toolbar shows context-window
+utilisation at a glance. Clicking the gauge opens a popover with a
+per-category breakdown of where the prompt budget is going (messages,
+system prompt, tools, skills, memory, autocompact reserve, free space).
+
+The feature replaces the previous `ContextIndicator` (memory-count
+badge) — the memory count is still surfaced inside the side panel's
+Context view.
+
+## Categories
+
+| Category | Source | Pi SDK | Harness |
+|---|---|:-:|:-:|
+| Messages | `estimateTokens(piAgent.state.messages)` | ✓ | ✓ (= `last.inputTokens`, falling back to `total.inputTokens`) |
+| System prompt | identity + workspace/user rules + current context + surface + agent context + connectors + project type + reference knowledge + workflows + project memory instructions | ✓ | ✗ |
+| System tools | built-in `AgentTool` schemas (names in `BUILT_IN_TOOL_NAMES`) | ✓ | ✗ |
+| MCP tools | tools from `mcpManager` + direct OAuth connector tools | ✓ | ✗ |
+| Skills | `buildActiveSkillsLayer` output | ✓ | ✗ |
+| Memory files | `buildMemoryLayer` output | ✓ | ✗ |
+| Autocompact buffer | `contextWindow * (1 − threshold)` (default `0.20 × window`) | ✓ | ✗ |
+| Free space | `contextWindow − Σ(used) − autocompactBuffer` (derived client-side) | ✓ | ✓ |
+
+Categories matching Claude Code's UI but **omitted** in v1:
+
+- **System tools (deferred)** / **MCP tools (deferred)** — Anton has no
+  lazy-tool-loading mechanism today; every tool's schema is live in
+  every prompt. We can re-add these rows when ToolSearch-style deferral
+  ships.
+- **Custom agents** — Anton's agents are reachable via `delegate_to_agent`
+  rather than injected into the prompt, so the row would always read
+  `0.0%`. Add when an agent flow injects content (e.g. agent identity
+  prompts) into the prompt.
+
+## Token estimation
+
+Two-tier:
+
+1. **Estimate (sync, cheap)** — char-count per layer / 4. Same heuristic
+   `estimateMessageTokens` already uses for compaction. Computed inside
+   `Session.getSystemPrompt` (caches sizes onto `_lastLayerSizes`) and
+   `categorizeTools` (sums `name + description + JSON.stringify(parameters)`
+   per tool, classified by `BUILT_IN_TOOL_NAMES`).
+2. **Calibration (per-turn)** — after a turn finishes, compare the
+   model's reported `input_tokens` against our pre-turn estimate. The
+   ratio updates `_contextEstimateScale`, clamped to `[0.5, 2.0]`, and
+   is applied to subsequent breakdowns. The estimate converges toward
+   reality within the first 1–2 turns without paying tokenizer cost.
+
+Real tokenisers (`tiktoken`, `@anthropic-ai/tokenizer`) were
+deliberately deferred — the calibration loop is "good enough" for a
+gauge and avoids per-prompt CPU cost on every turn.
+
+## Protocol
+
+```ts
+// packages/protocol/src/messages.ts
+export interface ContextBreakdown {
+  contextWindow: number
+  systemPrompt: number
+  systemTools: number
+  mcpTools: number
+  skills: number
+  memoryFiles: number
+  messages: number
+  autocompactBuffer: number
+  source: 'pi-sdk' | 'harness'
+}
+
+export interface AiContextUpdateMessage {
+  type: 'context_update'
+  sessionId?: string
+  breakdown: ContextBreakdown
+}
+```
+
+Server emits `context_update` at:
+
+- `session_created` (initial breakdown so the popover never shows a
+  loading state; harness sessions get a synthetic one with zeroed categories).
+- After every `turn_end` event from the Pi SDK loop (`Session` already
+  emits `token_update` at the same site).
+- After every codex-harness `tokenUsageUpdated` notification (harness
+  variant: `messages` + `contextWindow` only).
+
+## Gauge color states
+
+The autocompaction threshold (default `0.80`) drives the warning band:
+
+- `< 70%` → `idle` — muted ring (`var(--text-3)`)
+- `70–80%` → `warning` — `var(--warning)` amber
+- `≥ 80%` → `critical` — `var(--accent)` (compaction will fire on the
+  next turn)
+
+## Files touched
+
+| File | Change |
+|---|---|
+| `packages/protocol/src/messages.ts` | + `ContextBreakdown`, + `AiContextUpdateMessage`, union extension |
+| `packages/agent-core/src/agent.ts` | + `BUILT_IN_TOOL_NAMES`, + `categorizeTools` |
+| `packages/agent-core/src/prompt-layers.ts` | + `SessionPromptLayerSizes`, + `emptyPromptLayerSizes` |
+| `packages/agent-core/src/session.ts` | layer-size capture in `getSystemPrompt`, + `getContextBreakdown`, + `updateContextEstimateScale`, emit `context_update` post-turn |
+| `packages/agent-core/src/harness/codex-harness-session.ts` | emit harness-variant `context_update` from `onTokenUsageUpdated` |
+| `packages/agent-server/src/server.ts` | emit initial `context_update` after `session_created` |
+| `packages/desktop/src/lib/store/sessionStore.ts` | + `contextBreakdown` field on `SessionState` |
+| `packages/desktop/src/lib/store/handlers/interactionHandler.ts` | handle `context_update` |
+| `packages/desktop/src/components/chat/ContextGauge.tsx` | new |
+| `packages/desktop/src/components/chat/ContextPopover.tsx` | new |
+| `packages/desktop/src/components/chat/ChatInput.tsx` | slot gauge into `composer__toolbar-right` |
+| `packages/desktop/src/components/chat/ContextIndicator.tsx` | **deleted** |
+| `packages/desktop/src/components/RoutineChat.tsx` | drop `ContextIndicator` import + render |
+| `packages/desktop/src/index.css` | + gauge + popover styles, − stale `.context-indicator` rules |
diff --git a/specs/features/ui/CONTEXT_GAUGE_BLUNDERS.md b/specs/features/ui/CONTEXT_GAUGE_BLUNDERS.md
new file mode 100644
index 00000000..c57e4812
--- /dev/null
+++ b/specs/features/ui/CONTEXT_GAUGE_BLUNDERS.md
@@ -0,0 +1,203 @@
+# Context Gauge — Known Blunders & Fix Queue
+
+Tracking doc for issues caught during self-review of the initial
+`feat/composer-context-gauge` implementation. Delete once every entry
+is **Fixed** and verified.
+
+Numbering matches the order in which the issues were surfaced.
+
+## Critical
+
+### 1. Calibration is biased low
+
+**Where**: `packages/agent-core/src/session.ts` — `turn_end` handler.
+
+`updateContextEstimateScale(input)` runs after pi-ai has already
+appended the assistant's response message to `piAgent.state.messages`.
+So `breakdown.messages` (post-turn) is larger than the actual input
+that produced `inputTokens` (pre-turn). `actual / rawEstimate < 1` →
+scale settles around 0.85–0.95 → gauge under-reports by 5–15% on
+every turn forever.
+
+**Fix**: snapshot the raw estimate at `turn_start` and use that for
+calibration at `turn_end`, OR exclude the most recently appended
+assistant message from the estimate during calibration.
+
+Status: fixed
+
+---
+
+### 2. Fork children report a zero system prompt
+
+**Where**: `packages/agent-core/src/session.ts:2480-2482`.
+
+`getSystemPrompt()` returns early when `systemPromptOverride` is set
+(sub-agents, fork children) and never populates `_lastLayerSizes`.
+The breakdown for those sessions reports `systemPrompt: 0` even when
+the override prompt is huge. Tools and messages still report real
+numbers, so the gauge looks plausible but the popover lies.
+
+**Fix**: when `systemPromptOverride` is active, populate
+`_lastLayerSizes.identity` with `override.length` (everything else
+stays 0) so the breakdown reports the override under "System prompt".
+
+Status: fixed
+
+---
+
+### 3. Stale gauge after model switch
+
+**Where**: `packages/agent-core/src/session.ts:1421-1433`
+(`switchModel`).
+
+Updates `resolvedModel` and pi-ai's model but does not re-emit
+`context_update`. Switching opus (1M) → sonnet (200k) leaves the
+popover showing old proportions until the next turn finishes.
+
+**Fix**: queue a `context_update` event from `switchModel` (push onto
+the next yielded event batch) using the new `resolvedModel.contextWindow`.
+Same emit path used by `setSurface`, `refreshConnectorTools`,
+`loadConversationContext`.
+
+Status: fixed
+
+---
+
+### 4. Codex harness `messages` over-reports
+
+**Where**: `packages/agent-core/src/harness/codex-harness-session.ts`
+in `onTokenUsageUpdated`.
+
+`total.inputTokens` from codex is *cumulative billed input* across
+all turns (counts cached tokens too). On long conversations it
+exceeds actual prompt size and can show >100% on the gauge.
+
+**Fix**: prefer `last.inputTokens` (per-turn input) over
+`total.inputTokens` for the breakdown's `messages` field; fall back
+to `total` only when `last` is absent. Cap the gauge at 100% as a
+defensive measure.
+
+Status: fixed
+
+---
+
+### 5. Harness `session_created` has no initial breakdown
+
+**Where**: `packages/agent-server/src/server.ts:2219-2229`.
+
+The initial `context_update` emit only runs on the Pi-SDK
+`session_created` branch. Harness sessions show no gauge until the
+first turn completes.
+
+**Fix**: emit a synthetic harness breakdown right after the harness
+`session_created` send, with `contextWindow` looked up from the
+resolved model and all category counters at 0.
+
+Status: fixed
+
+---
+
+### 7. Auto-fix collateral leaked into the diff
+
+**Where**: working tree.
+
+`pnpm check:fix` reformatted unrelated pre-existing files:
+`agent-config/package.json`, `tauri.conf.json`, `ProviderSettingsModal.tsx`,
+parts of `agent-server/server.ts`, parts of `index.css`. None of these
+relate to the gauge.
+
+**Fix**: `git checkout` those files (preserving only the gauge-related
+diffs) so the PR stays scoped.
+
+Status: fixed
+
+---
+
+## Medium
+
+### 6. Clicking the gauge while open doesn't close it
+
+**Where**: `packages/desktop/src/components/chat/ContextPopover.tsx`
++ `ContextGauge.tsx`.
+
+Outside-click handler runs on mousedown against `popoverRef`. The
+gauge button is outside `popoverRef`, so mousedown closes the popover;
+the subsequent click on the gauge fires `setOpen(v => !v)` and reopens
+it. The popover can only be closed by clicking elsewhere.
+
+**Fix**: ignore outside-click when the target is the gauge button
+(pass `triggerRef` into the popover and check `triggerRef.current.contains(target)`
+before calling `onClose`).
+
+Status: fixed
+
+---
+
+### 8. Unnecessary `as never[]` type cast
+
+**Where**: `packages/agent-core/src/session.ts:2664`.
+
+`estimateTokens(this.piAgent.state.messages as never[])` — the cast
+silences type checking. `piAgent.state.messages` is already
+`AgentMessage[]`, which is what `estimateTokens` accepts.
+
+**Fix**: drop the cast.
+
+Status: fixed
+
+---
+
+## Minor
+
+### 9. Lost entry point to side panel context view
+
+**Where**: removed `ContextIndicator.tsx` (clicked → `openContextPanel()`).
+
+The new gauge opens the popover instead of the side panel. No 1-click
+path from composer to the memory list anymore.
+
+**Fix**: add a "View memory details" affordance to the popover footer
+that calls `openContextPanel()` and closes the popover.
+
+Status: fixed
+
+---
+
+### 10. `_contextEstimateScale` not persisted
+
+**Where**: `Session.persist()` / `loadSession()`.
+
+Scale resets to 1.0 on every session resume; calibration starts over.
+
+**Fix**: persist scale alongside `compactionState` in
+`PersistedSession` and rehydrate in the constructor.
+
+Status: fixed
+
+---
+
+### 11. Magic `anchorRect.left - 80` offset
+
+**Where**: `ContextPopover.tsx`.
+
+Arbitrary nudge meant to "center" the popover near the gauge; it is not
+derived from the popover width.
+
+**Fix**: align by anchor center: `left = anchorRect.left + anchorRect.width / 2 - ESTIMATED_POPOVER_WIDTH / 2`,
+clamped to viewport.
+
+Status: fixed
+
+---
+
+### 12. `setSurface` / `refreshConnectorTools` / `loadConversationContext` don't re-emit
+
+**Where**: same file, three methods.
+
+Each rebuilds the prompt and updates `_lastLayerSizes`, but no
+`context_update` event is queued. Popover stays stale until next turn.
+
+**Fix**: same approach as #3 — push a `context_update` onto the next
+yielded event batch from each setter.
+
+Status: fixed