From a5dcc60d7ee110a9e173b014caca42697d7b4a71 Mon Sep 17 00:00:00 2001
From: Simon Ferquel's Clanker <simon.ferquel+agent-go-expert@docker.com>
Date: Wed, 22 Apr 2026 09:48:47 +0000
Subject: [PATCH 1/9] fix(runtime): drain steerQueue at top of RunStream loop
 to close idle-window race

The steer queue was only drained mid-loop (after tool-call batches). Two
gaps allowed steer messages to be silently dropped:

1. Idle-window race: a Steer call lands between two RunStream invocations;
   the queue holds the message but nothing drains it when the next
   RunStream starts.
2. First-turn miss: when a RunStream turn produces a plain-text response
   with no tool calls, res.Stopped fires before the mid-loop drain is
   reached; the pending steer message is never injected.

Fix: drain steerQueue at the top of the for-loop body (before the first
model call) using the same pattern as the existing mid-loop drain.

Also extract the duplicate system-reminder wrap string into wrapSteerMessage
so the two drain sites cannot drift apart.

Also handles the empty-session bootstrap case: a RunStream started with
zero messages but steer messages already queued injects those messages
before the first model call, giving the model its initial context.

Tests added:
- TestSteer_IdleWindowIsConsumedOnNextTurn
- TestSteer_EmptySessionBootstrap

Fixes #2491

Assisted-By: docker-agent
---
 pkg/runtime/loop.go         |  30 +++++-
 pkg/runtime/runtime_test.go | 187 ++++++++++++++++++++++++++++++++++++
 2 files changed, 212 insertions(+), 5 deletions(-)
diff --git a/pkg/runtime/loop.go b/pkg/runtime/loop.go
index bebcc0d7f..a41f60708 100644
--- a/pkg/runtime/loop.go
+++ b/pkg/runtime/loop.go
@@ -41,6 +41,16 @@ func (r *LocalRuntime) registerDefaultTools() {
 	})
 }
 
+// wrapSteerMessage wraps a raw steer message in a <system-reminder> envelope
+// so the model receives the user's course-correction as a clearly-labelled
+// side-channel injection rather than a plain conversational turn.
+func wrapSteerMessage(content string) string {
+	return fmt.Sprintf(
+		"<system-reminder>\nThe user sent the following message while you were working:\n%s\n\nPlease address this in your next response while continuing with your current tasks.\n</system-reminder>",
+		content,
+	)
+}
+
 // finalizeEventChannel performs cleanup at the end of a RunStream goroutine:
 // restores the previous elicitation channel, emits the StreamStopped event,
 // fires hooks, and closes the events channel.
@@ -249,6 +259,20 @@ func (r *LocalRuntime) RunStream(ctx context.Context, sess *session.Session) <-c
 			}
 			slog.Debug("Starting conversation loop iteration", "agent", a.Name())
 
+			// --- STEERING: top-of-turn injection ---
+			// Drain any steer messages that arrived while the runtime was idle
+			// (between RunStream invocations) or before the first model call of
+			// this turn. Without this drain, a Steer call made while no tool
+			// calls are running would be silently dropped when the model returns
+			// a plain-text response with no tool calls.
+			if steered := r.steerQueue.Drain(ctx); len(steered) > 0 {
+				for _, sm := range steered {
+					userMsg := session.UserMessage(wrapSteerMessage(sm.Content), sm.MultiContent...)
+					sess.AddMessage(userMsg)
+					events <- UserMessage(sm.Content, sess.ID, sm.MultiContent, len(sess.Messages)-1)
+				}
+			}
+
 			streamCtx, streamSpan := r.startSpan(ctx, "runtime.stream", trace.WithAttributes(
 				attribute.String("agent", a.Name()),
 				attribute.String("session.id", sess.ID),
@@ -424,11 +448,7 @@ func (r *LocalRuntime) RunStream(ctx context.Context, sess *session.Session) <-c
 			// iteration, wrapped in <system-reminder> tags.
 			if steered := r.steerQueue.Drain(ctx); len(steered) > 0 {
 				for _, sm := range steered {
-					wrapped := fmt.Sprintf(
-						"<system-reminder>\nThe user sent the following message while you were working:\n%s\n\nPlease address this in your next response while continuing with your current tasks.\n</system-reminder>",
-						sm.Content,
-					)
-					userMsg := session.UserMessage(wrapped, sm.MultiContent...)
+					userMsg := session.UserMessage(wrapSteerMessage(sm.Content), sm.MultiContent...)
 					sess.AddMessage(userMsg)
 					events <- UserMessage(sm.Content, sess.ID, sm.MultiContent, len(sess.Messages)-1)
 				}
diff --git a/pkg/runtime/runtime_test.go b/pkg/runtime/runtime_test.go
index c1adbc84a..fa873f06a 100644
--- a/pkg/runtime/runtime_test.go
+++ b/pkg/runtime/runtime_test.go
@@ -5,6 +5,7 @@ import (
 	"errors"
 	"io"
 	"reflect"
+	"strings"
 	"sync"
 	"testing"
 
@@ -2198,3 +2199,189 @@ func toolNames(ts []tools.Tool) []string {
 	}
 	return names
 }
+
+// messageRecordingProvider records the chat.Message slices passed to each
+// CreateChatCompletionStream call so tests can inspect what the model saw.
+type messageRecordingProvider struct {
+	id      string
+	mu      sync.Mutex
+	streams []*mockStream
+	callIdx int
+
+	recordedMessages [][]chat.Message // messages passed on each call
+}
+
+func (p *messageRecordingProvider) ID() string { return p.id }
+
+func (p *messageRecordingProvider) CreateChatCompletionStream(_ context.Context, msgs []chat.Message, _ []tools.Tool) (chat.MessageStream, error) {
+	p.mu.Lock()
+	defer p.mu.Unlock()
+
+	snapshot := make([]chat.Message, len(msgs))
+	copy(snapshot, msgs)
+	p.recordedMessages = append(p.recordedMessages, snapshot)
+
+	if p.callIdx >= len(p.streams) {
+		return newStreamBuilder().AddStopWithUsage(1, 1).Build(), nil
+	}
+	s := p.streams[p.callIdx]
+	p.callIdx++
+	return s, nil
+}
+
+func (p *messageRecordingProvider) BaseConfig() base.Config { return base.Config{} }
+func (p *messageRecordingProvider) MaxTokens() int          { return 0 }
+
+// TestSteer_IdleWindowIsConsumedOnNextTurn verifies that a Steer call made
+// while no RunStream is active (i.e. in the idle window between turns) is
+// picked up by the very next RunStream iteration. Before the fix the steer
+// queue was only drained mid-loop (after tool calls), so a message enqueued
+// while idle was stranded and never seen by the model.
+func TestSteer_IdleWindowIsConsumedOnNextTurn(t *testing.T) {
+	t.Parallel()
+
+	// The model returns a plain-text stop (no tool calls) so we stay in the
+	// single-iteration path — this is the exact scenario where the old code
+	// would miss the steer message.
+	stream := newStreamBuilder().
+		AddContent("Got it").
+		AddStopWithUsage(5, 3).
+		Build()
+
+	prov := &messageRecordingProvider{
+		id:      "test/mock-model",
+		streams: []*mockStream{stream},
+	}
+
+	root := agent.New("root", "You are a test agent", agent.WithModel(prov))
+	tm := team.New(team.WithAgents(root))
+
+	rt, err := NewLocalRuntime(tm, WithSessionCompaction(false), WithModelStore(mockModelStore{}))
+	require.NoError(t, err)
+
+	// Enqueue a steer message BEFORE calling RunStream — simulating the
+	// idle-window race where a Steer call lands between two RunStream
+	// invocations.
+	err = rt.Steer(QueuedMessage{Content: "urgent: change direction"})
+	require.NoError(t, err)
+
+	sess := session.New(session.WithUserMessage("Do the task"))
+	sess.Title = "steer idle-window test"
+
+	evCh := rt.RunStream(t.Context(), sess)
+	var events []Event
+	for ev := range evCh {
+		events = append(events, ev)
+	}
+
+	// Verify the model received a message containing the steer content.
+	prov.mu.Lock()
+	defer prov.mu.Unlock()
+
+	require.NotEmpty(t, prov.recordedMessages, "expected at least one model call")
+	firstCallMsgs := prov.recordedMessages[0]
+
+	var foundSteer bool
+	for _, m := range firstCallMsgs {
+		if strings.Contains(m.Content, "urgent: change direction") {
+			foundSteer = true
+			break
+		}
+	}
+	assert.True(t, foundSteer,
+		"model should have received the steer message in its first turn; messages seen: %v",
+		firstCallMsgs)
+
+	// The run must complete normally (StreamStopped as the last event).
+	require.NotEmpty(t, events)
+	assert.IsType(t, &StreamStoppedEvent{}, events[len(events)-1],
+		"expected StreamStopped as the final event")
+
+	// A UserMessageEvent must have been emitted for the steer message.
+	var steerEventFound bool
+	for _, ev := range events {
+		if ue, ok := ev.(*UserMessageEvent); ok && strings.Contains(ue.Message, "urgent: change direction") {
+			steerEventFound = true
+			break
+		}
+	}
+	assert.True(t, steerEventFound, "expected a UserMessageEvent for the steer message")
+}
+
+// TestSteer_EmptySessionBootstrap verifies that when RunStream is started
+// with zero messages in the session but one or more messages already queued
+// via Steer, the model receives those messages as its initial context — i.e.
+// the run completes normally rather than erroring or producing a vacuous
+// response. The behaviour must be identical to a session where those messages
+// were added directly via session.WithUserMessage before the call.
+func TestSteer_EmptySessionBootstrap(t *testing.T) {
+	t.Parallel()
+
+	stream := newStreamBuilder().
+		AddContent("Hello from the model").
+		AddStopWithUsage(5, 3).
+		Build()
+
+	prov := &messageRecordingProvider{
+		id:      "test/mock-model",
+		streams: []*mockStream{stream},
+	}
+
+	root := agent.New("root", "You are a test agent", agent.WithModel(prov))
+	tm := team.New(team.WithAgents(root))
+
+	rt, err := NewLocalRuntime(tm, WithSessionCompaction(false), WithModelStore(mockModelStore{}))
+	require.NoError(t, err)
+
+	// Enqueue before RunStream — zero messages in the session.
+	err = rt.Steer(QueuedMessage{Content: "bootstrap message"})
+	require.NoError(t, err)
+
+	// Fresh session with NO messages (SendUserMessage defaults to true but
+	// there is nothing to send yet).
+	sess := session.New()
+	sess.Title = "steer bootstrap test"
+
+	evCh := rt.RunStream(t.Context(), sess)
+	var events []Event
+	for ev := range evCh {
+		events = append(events, ev)
+	}
+
+	// The run must complete normally.
+	require.NotEmpty(t, events)
+	assert.IsType(t, &StreamStoppedEvent{}, events[len(events)-1],
+		"expected StreamStopped as the final event; got %T", events[len(events)-1])
+
+	// The model must have received exactly one call and that call must
+	// contain the bootstrap message.
+	prov.mu.Lock()
+	defer prov.mu.Unlock()
+
+	require.Len(t, prov.recordedMessages, 1,
+		"expected exactly one model call for the bootstrap turn")
+
+	firstCallMsgs := prov.recordedMessages[0]
+
+	var foundBootstrap bool
+	for _, m := range firstCallMsgs {
+		if strings.Contains(m.Content, "bootstrap message") {
+			foundBootstrap = true
+			break
+		}
+	}
+	assert.True(t, foundBootstrap,
+		"model must receive the bootstrap steer message as its first (and only) user turn; messages: %v",
+		firstCallMsgs)
+
+	// A UserMessageEvent must have been emitted for the steer message.
+	var steerEventFound bool
+	for _, ev := range events {
+		if ue, ok := ev.(*UserMessageEvent); ok && strings.Contains(ue.Message, "bootstrap message") {
+			steerEventFound = true
+			break
+		}
+	}
+	assert.True(t, steerEventFound,
+		"expected a UserMessageEvent for the bootstrap steer message")
+}

From cb757e91de0a554fe84b81f8927fd41c27a4ed2b Mon Sep 17 00:00:00 2001
From: Simon Ferquel's Clanker <simon.ferquel+agent-go-expert@docker.com>
Date: Wed, 22 Apr 2026 10:01:01 +0000
Subject: [PATCH 2/9] fix(runtime): inject top-of-turn steer messages as plain
 user messages
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

The system-reminder envelope is only appropriate when the agent is
actively working (mid-loop, between tool calls). At the top of a new
turn the runtime is idle, so steer messages are injected as plain
user messages — no wrapping needed.

Assisted-By: docker-agent
---
 pkg/runtime/loop.go | 5 ++++-
 1 file changed, 4 insertions(+), 1 deletion(-)

diff --git a/pkg/runtime/loop.go b/pkg/runtime/loop.go
index a41f60708..af403f6a5 100644
--- a/pkg/runtime/loop.go
+++ b/pkg/runtime/loop.go
@@ -265,9 +265,12 @@ func (r *LocalRuntime) RunStream(ctx context.Context, sess *session.Session) <-c
 			// this turn. Without this drain, a Steer call made while no tool
 			// calls are running would be silently dropped when the model returns
 			// a plain-text response with no tool calls.
+			// At this point the agent is not working on anything, so steer
+			// messages are injected as plain user messages — no system-reminder
+			// envelope needed.
 			if steered := r.steerQueue.Drain(ctx); len(steered) > 0 {
 				for _, sm := range steered {
-					userMsg := session.UserMessage(wrapSteerMessage(sm.Content), sm.MultiContent...)
+					userMsg := session.UserMessage(sm.Content, sm.MultiContent...)
 					sess.AddMessage(userMsg)
 					events <- UserMessage(sm.Content, sess.ID, sm.MultiContent, len(sess.Messages)-1)
 				}

From 64e9f255fbe20b9a44c58e918e52ede5b23f883f Mon Sep 17 00:00:00 2001
From: Simon Ferquel's Clanker <simon.ferquel+agent-go-expert@docker.com>
Date: Wed, 22 Apr 2026 10:06:03 +0000
Subject: [PATCH 3/9] fix(runtime): address review findings on steer-queue
 top-of-turn drain

- Move top-of-turn drain to after AgentInfo and contextLimit init so
  compactIfNeeded can be called immediately after injection (S1, S2).
- Extract appendSteerAndEmit helper (wrap bool) to eliminate the
  duplicated add-message+emit-event idiom at both drain sites (S3).
- Tighten both steer tests to assert the stored session message and the
  message seen by the model contain raw content with NO system-reminder
  envelope for the top-of-turn path (B1).
- Document messageRecordingProvider fallback behaviour for unexpected
  extra model calls (N4).

Assisted-By: docker-agent
---
 pkg/runtime/loop.go         |  54 ++++++++++++-------
 pkg/runtime/runtime_test.go | 103 ++++++++++++++++++++++++++----------
 2 files changed, 109 insertions(+), 48 deletions(-)

diff --git a/pkg/runtime/loop.go b/pkg/runtime/loop.go
index af403f6a5..1c0211e37 100644
--- a/pkg/runtime/loop.go
+++ b/pkg/runtime/loop.go
@@ -51,6 +51,20 @@ func wrapSteerMessage(content string) string {
 	)
 }
 
+// appendSteerAndEmit appends a steered message to the session and emits the
+// corresponding UserMessage event. When wrap is true the content is enclosed
+// in a <system-reminder> envelope (appropriate for mid-turn interruptions
+// where the agent is actively working); when false the raw content is used
+// (appropriate at the top of a new turn where the agent is idle).
+func (r *LocalRuntime) appendSteerAndEmit(sess *session.Session, sm QueuedMessage, wrap bool, events chan<- Event) {
+	content := sm.Content
+	if wrap {
+		content = wrapSteerMessage(sm.Content)
+	}
+	sess.AddMessage(session.UserMessage(content, sm.MultiContent...))
+	events <- UserMessage(sm.Content, sess.ID, sm.MultiContent, len(sess.Messages)-1)
+}
+
 // finalizeEventChannel performs cleanup at the end of a RunStream goroutine:
 // restores the previous elicitation channel, emits the StreamStopped event,
 // fires hooks, and closes the events channel.
@@ -259,23 +273,6 @@ func (r *LocalRuntime) RunStream(ctx context.Context, sess *session.Session) <-c
 			}
 			slog.Debug("Starting conversation loop iteration", "agent", a.Name())
 
-			// --- STEERING: top-of-turn injection ---
-			// Drain any steer messages that arrived while the runtime was idle
-			// (between RunStream invocations) or before the first model call of
-			// this turn. Without this drain, a Steer call made while no tool
-			// calls are running would be silently dropped when the model returns
-			// a plain-text response with no tool calls.
-			// At this point the agent is not working on anything, so steer
-			// messages are injected as plain user messages — no system-reminder
-			// envelope needed.
-			if steered := r.steerQueue.Drain(ctx); len(steered) > 0 {
-				for _, sm := range steered {
-					userMsg := session.UserMessage(sm.Content, sm.MultiContent...)
-					sess.AddMessage(userMsg)
-					events <- UserMessage(sm.Content, sess.ID, sm.MultiContent, len(sess.Messages)-1)
-				}
-			}
-
 			streamCtx, streamSpan := r.startSpan(ctx, "runtime.stream", trace.WithAttributes(
 				attribute.String("agent", a.Name()),
 				attribute.String("session.id", sess.ID),
@@ -321,6 +318,25 @@ func (r *LocalRuntime) RunStream(ctx context.Context, sess *session.Session) <-c
 				}
 			}
 
+			// --- STEERING: top-of-turn injection ---
+			// Drain steer messages that arrived while the runtime was idle
+			// (between RunStream invocations) or before the first model call
+			// of this turn. Two gaps in the old code motivated this drain:
+			//   1. Idle-window race: Steer called between RunStream invocations;
+			//      nothing was running to consume the message.
+			//   2. First-turn miss: a plain-text response with no tool calls
+			//      fires res.Stopped before the mid-loop drain is reached.
+			// The agent is not mid-task here, so messages are plain user turns
+			// (no system-reminder envelope). Placement after contextLimit
+			// initialization means compactIfNeeded can be called immediately.
+			if steered := r.steerQueue.Drain(ctx); len(steered) > 0 {
+				messageCountBeforeSteer := len(sess.GetAllMessages())
+				for _, sm := range steered {
+					r.appendSteerAndEmit(sess, sm, false, events)
+				}
+				r.compactIfNeeded(ctx, sess, a, m, contextLimit, messageCountBeforeSteer, events)
+			}
+
 			messages := sess.GetMessages(a)
 			slog.Debug("Retrieved messages for processing", "agent", a.Name(), "message_count", len(messages))
 
@@ -451,9 +467,7 @@ func (r *LocalRuntime) RunStream(ctx context.Context, sess *session.Session) <-c
 			// iteration, wrapped in <system-reminder> tags.
 			if steered := r.steerQueue.Drain(ctx); len(steered) > 0 {
 				for _, sm := range steered {
-					userMsg := session.UserMessage(wrapSteerMessage(sm.Content), sm.MultiContent...)
-					sess.AddMessage(userMsg)
-					events <- UserMessage(sm.Content, sess.ID, sm.MultiContent, len(sess.Messages)-1)
+					r.appendSteerAndEmit(sess, sm, true, events)
 				}
 
 				r.compactIfNeeded(ctx, sess, a, m, contextLimit, messageCountBeforeTools, events)
diff --git a/pkg/runtime/runtime_test.go b/pkg/runtime/runtime_test.go
index fa873f06a..d339393b9 100644
--- a/pkg/runtime/runtime_test.go
+++ b/pkg/runtime/runtime_test.go
@@ -2222,6 +2222,10 @@ func (p *messageRecordingProvider) CreateChatCompletionStream(_ context.Context,
 	p.recordedMessages = append(p.recordedMessages, snapshot)
 
 	if p.callIdx >= len(p.streams) {
+		// No stream configured for this call index. Return a plain stop so
+		// the caller surfaces this as a test failure via assertion rather
+		// than hanging, but also record the unexpected call so the test can
+		// detect it with require.Len / require.Equal.
 		return newStreamBuilder().AddStopWithUsage(1, 1).Build(), nil
 	}
 	s := p.streams[p.callIdx]
@@ -2274,7 +2278,41 @@ func TestSteer_IdleWindowIsConsumedOnNextTurn(t *testing.T) {
 		events = append(events, ev)
 	}
 
-	// Verify the model received a message containing the steer content.
+	// The run must complete normally (StreamStopped as the last event).
+	require.NotEmpty(t, events)
+	assert.IsType(t, &StreamStoppedEvent{}, events[len(events)-1],
+		"expected StreamStopped as the final event")
+
+	// A UserMessageEvent must have been emitted for the steer message.
+	var steerEventFound bool
+	for _, ev := range events {
+		if ue, ok := ev.(*UserMessageEvent); ok && strings.Contains(ue.Message, "urgent: change direction") {
+			steerEventFound = true
+			break
+		}
+	}
+	assert.True(t, steerEventFound, "expected a UserMessageEvent for the steer message")
+
+	// --- Session-message assertions ---
+	// Find the stored message for the steer injection and verify it was
+	// stored as a plain user message with NO system-reminder envelope.
+	var steerSessionMsg *session.Message
+	for _, item := range sess.Messages {
+		if item.IsMessage() &&
+			item.Message.Message.Role == chat.MessageRoleUser &&
+			strings.Contains(item.Message.Message.Content, "urgent: change direction") {
+			steerSessionMsg = item.Message
+			break
+		}
+	}
+	require.NotNil(t, steerSessionMsg, "expected a user-role session message containing the steer content")
+	assert.Equal(t, "urgent: change direction", steerSessionMsg.Message.Content,
+		"top-of-turn steer must be stored as plain content, not wrapped in system-reminder")
+	assert.NotContains(t, steerSessionMsg.Message.Content, "<system-reminder>",
+		"top-of-turn steer must NOT use the system-reminder envelope")
+
+	// --- Model-call assertions ---
+	// Verify the model received a message containing the raw steer content.
 	prov.mu.Lock()
 	defer prov.mu.Unlock()
 
@@ -2284,6 +2322,9 @@ func TestSteer_IdleWindowIsConsumedOnNextTurn(t *testing.T) {
 	var foundSteer bool
 	for _, m := range firstCallMsgs {
 		if strings.Contains(m.Content, "urgent: change direction") {
+			// Also assert the model did NOT receive the system-reminder wrapper.
+			assert.NotContains(t, m.Content, "<system-reminder>",
+				"model must receive raw content, not system-reminder envelope, for top-of-turn steer")
 			foundSteer = true
 			break
 		}
@@ -2291,21 +2332,6 @@ func TestSteer_IdleWindowIsConsumedOnNextTurn(t *testing.T) {
 	assert.True(t, foundSteer,
 		"model should have received the steer message in its first turn; messages seen: %v",
 		firstCallMsgs)
-
-	// The run must complete normally (StreamStopped as the last event).
-	require.NotEmpty(t, events)
-	assert.IsType(t, &StreamStoppedEvent{}, events[len(events)-1],
-		"expected StreamStopped as the final event")
-
-	// A UserMessageEvent must have been emitted for the steer message.
-	var steerEventFound bool
-	for _, ev := range events {
-		if ue, ok := ev.(*UserMessageEvent); ok && strings.Contains(ue.Message, "urgent: change direction") {
-			steerEventFound = true
-			break
-		}
-	}
-	assert.True(t, steerEventFound, "expected a UserMessageEvent for the steer message")
 }
 
 // TestSteer_EmptySessionBootstrap verifies that when RunStream is started
@@ -2353,8 +2379,37 @@ func TestSteer_EmptySessionBootstrap(t *testing.T) {
 	assert.IsType(t, &StreamStoppedEvent{}, events[len(events)-1],
 		"expected StreamStopped as the final event; got %T", events[len(events)-1])
 
+	// A UserMessageEvent must have been emitted for the steer message.
+	var steerEventFound bool
+	for _, ev := range events {
+		if ue, ok := ev.(*UserMessageEvent); ok && strings.Contains(ue.Message, "bootstrap message") {
+			steerEventFound = true
+			break
+		}
+	}
+	assert.True(t, steerEventFound,
+		"expected a UserMessageEvent for the bootstrap steer message")
+
+	// --- Session-message assertions ---
+	// The stored session message must be plain — no system-reminder envelope.
+	var bootstrapMsg *session.Message
+	for _, item := range sess.Messages {
+		if item.IsMessage() &&
+			item.Message.Message.Role == chat.MessageRoleUser &&
+			strings.Contains(item.Message.Message.Content, "bootstrap message") {
+			bootstrapMsg = item.Message
+			break
+		}
+	}
+	require.NotNil(t, bootstrapMsg, "expected a user-role session message for the bootstrap steer")
+	assert.Equal(t, "bootstrap message", bootstrapMsg.Message.Content,
+		"bootstrap steer must be stored as plain content, not wrapped in system-reminder")
+	assert.NotContains(t, bootstrapMsg.Message.Content, "<system-reminder>",
+		"bootstrap steer must NOT use the system-reminder envelope")
+
+	// --- Model-call assertions ---
 	// The model must have received exactly one call and that call must
-	// contain the bootstrap message.
+	// contain the raw bootstrap message (not wrapped).
 	prov.mu.Lock()
 	defer prov.mu.Unlock()
 
@@ -2366,6 +2421,9 @@ func TestSteer_EmptySessionBootstrap(t *testing.T) {
 	var foundBootstrap bool
 	for _, m := range firstCallMsgs {
 		if strings.Contains(m.Content, "bootstrap message") {
+			// The model must see raw content, not the system-reminder wrapper.
+			assert.NotContains(t, m.Content, "<system-reminder>",
+				"model must receive raw content, not system-reminder envelope, for bootstrap steer")
 			foundBootstrap = true
 			break
 		}
@@ -2373,15 +2431,4 @@ func TestSteer_EmptySessionBootstrap(t *testing.T) {
 	assert.True(t, foundBootstrap,
 		"model must receive the bootstrap steer message as its first (and only) user turn; messages: %v",
 		firstCallMsgs)
-
-	// A UserMessageEvent must have been emitted for the steer message.
-	var steerEventFound bool
-	for _, ev := range events {
-		if ue, ok := ev.(*UserMessageEvent); ok && strings.Contains(ue.Message, "bootstrap message") {
-			steerEventFound = true
-			break
-		}
-	}
-	assert.True(t, steerEventFound,
-		"expected a UserMessageEvent for the bootstrap steer message")
 }

From 776185498cc442b18ee42b76cbaf0316720745fa Mon Sep 17 00:00:00 2001
From: Simon Ferquel's Clanker <simon.ferquel+agent-go-expert@docker.com>
Date: Wed, 22 Apr 2026 10:08:02 +0000
Subject: [PATCH 4/9] fix(runtime): close end-of-iteration steer race at
 res.Stopped boundary
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

A Steer() call arriving in the narrow window between the mid-loop drain
and the res.Stopped break was stranded until the next RunStream call.

Fix: re-check steerQueue inside the res.Stopped block before breaking.
Any message that enqueued successfully is now guaranteed to be consumed
within the current RunStream. Messages injected here use the
system-reminder envelope (matching mid-turn semantics: the agent just
finished a turn).

T1: both existing top-of-turn steer tests already assert
NotContains(<system-reminder>) in firstCallMsgs — confirmed present.

Test added: TestSteer_EndOfIterationRaceIsConsumedInCurrentRunStream
Uses a provider hook to inject a Steer() synchronously during
CreateChatCompletionStream on the first call, simulating the race.
Asserts: steer UserMessageEvent emitted within the same RunStream,
exactly 2 model calls made, and stored session message carries the
system-reminder envelope.

Assisted-By: docker-agent
---
 pkg/runtime/loop.go         |  16 +++++
 pkg/runtime/runtime_test.go | 130 ++++++++++++++++++++++++++++++++++++
 2 files changed, 146 insertions(+)

diff --git a/pkg/runtime/loop.go b/pkg/runtime/loop.go
index 1c0211e37..614daba0e 100644
--- a/pkg/runtime/loop.go
+++ b/pkg/runtime/loop.go
@@ -478,6 +478,22 @@ func (r *LocalRuntime) RunStream(ctx context.Context, sess *session.Session) <-c
 				slog.Debug("Conversation stopped", "agent", a.Name())
 				r.executeStopHooks(ctx, sess, a, res.Content, events)
 
+				// --- STEERING: end-of-iteration drain ---
+				// A Steer() call that lands in the narrow window between the
+				// mid-loop drain above and this stop-check would otherwise be
+				// stranded until the next RunStream invocation. Re-checking
+				// here closes that race: any message that enqueued successfully
+				// is guaranteed to be consumed within the current RunStream.
+				// The agent just finished a turn, so these messages get the
+				// same system-reminder envelope as mid-turn steers.
+				if steered := r.steerQueue.Drain(ctx); len(steered) > 0 {
+					for _, sm := range steered {
+						r.appendSteerAndEmit(sess, sm, true, events)
+					}
+					r.compactIfNeeded(ctx, sess, a, m, contextLimit, messageCountBeforeTools, events)
+					continue
+				}
+
 				// --- FOLLOW-UP: end-of-turn injection ---
 				// Pop exactly one follow-up message. Unlike steered
 				// messages, follow-ups are plain user messages that start
diff --git a/pkg/runtime/runtime_test.go b/pkg/runtime/runtime_test.go
index d339393b9..6ca7b1500 100644
--- a/pkg/runtime/runtime_test.go
+++ b/pkg/runtime/runtime_test.go
@@ -2432,3 +2432,133 @@ func TestSteer_EmptySessionBootstrap(t *testing.T) {
 		"model must receive the bootstrap steer message as its first (and only) user turn; messages: %v",
 		firstCallMsgs)
 }
+
+// steerInjectProvider is a provider whose CreateChatCompletionStream calls a
+// hook just before returning the stream. The hook is used to inject a Steer
+// message synchronously while the stream response is being prepared — this
+// simulates the narrow end-of-iteration race where a Steer() call lands after
+// the mid-loop drain but before the res.Stopped break.
+type steerInjectProvider struct {
+	id      string
+	streams []*mockStream
+	callIdx int
+	onCall  func(callIdx int) // called with the current callIdx before returning
+	mu      sync.Mutex
+}
+
+func (p *steerInjectProvider) ID() string { return p.id }
+
+func (p *steerInjectProvider) CreateChatCompletionStream(_ context.Context, _ []chat.Message, _ []tools.Tool) (chat.MessageStream, error) {
+	p.mu.Lock()
+	idx := p.callIdx
+	p.callIdx++
+	var s chat.MessageStream
+	if idx < len(p.streams) {
+		s = p.streams[idx]
+	} else {
+		s = newStreamBuilder().AddStopWithUsage(1, 1).Build()
+	}
+	p.mu.Unlock()
+
+	if p.onCall != nil {
+		p.onCall(idx)
+	}
+	return s, nil
+}
+
+func (p *steerInjectProvider) BaseConfig() base.Config { return base.Config{} }
+func (p *steerInjectProvider) MaxTokens() int          { return 0 }
+
+// TestSteer_EndOfIterationRaceIsConsumedInCurrentRunStream verifies that a
+// Steer() call arriving in the narrow window between the mid-loop drain and
+// the res.Stopped break is consumed within the same RunStream invocation
+// rather than being stranded until the next call.
+//
+// The test uses a provider hook to inject the steer message synchronously
+// on the first model call (simulating the racy Steer() arriving just before
+// the stop decision) and a second stream to prove the loop re-entered and
+// processed the steer message.
+func TestSteer_EndOfIterationRaceIsConsumedInCurrentRunStream(t *testing.T) {
+	t.Parallel()
+
+	// Turn 1: plain-text stop — the racy Steer is injected here.
+	turn1 := newStreamBuilder().
+		AddContent("Here is my response").
+		AddStopWithUsage(5, 3).
+		Build()
+	// Turn 2: the loop re-entered due to the injected steer; model acks it.
+	turn2 := newStreamBuilder().
+		AddContent("Got your steer, changing direction").
+		AddStopWithUsage(5, 3).
+		Build()
+
+	var rt *LocalRuntime // set after NewLocalRuntime
+
+	prov := &steerInjectProvider{
+		id:      "test/mock-model",
+		streams: []*mockStream{turn1, turn2},
+		onCall: func(callIdx int) {
+			// On the first call only: inject a steer while the stream is
+			// being set up — this lands after the mid-loop drain (which
+			// hasn't run yet for this turn) and before res.Stopped fires.
+			if callIdx == 0 {
+				_ = rt.Steer(QueuedMessage{Content: "end-of-iter steer"})
+			}
+		},
+	}
+
+	root := agent.New("root", "You are a test agent", agent.WithModel(prov))
+	tm := team.New(team.WithAgents(root))
+
+	var err error
+	rt, err = NewLocalRuntime(tm, WithSessionCompaction(false), WithModelStore(mockModelStore{}))
+	require.NoError(t, err)
+
+	sess := session.New(session.WithUserMessage("Do the task"))
+	sess.Title = "steer end-of-iter race test"
+
+	evCh := rt.RunStream(t.Context(), sess)
+	var events []Event
+	for ev := range evCh {
+		events = append(events, ev)
+	}
+
+	// The run must complete normally.
+	require.NotEmpty(t, events)
+	assert.IsType(t, &StreamStoppedEvent{}, events[len(events)-1],
+		"expected StreamStopped as the final event")
+
+	// The steer message must have been emitted as a UserMessageEvent
+	// within this RunStream (not deferred to a future one).
+	var steerEventFound bool
+	for _, ev := range events {
+		if ue, ok := ev.(*UserMessageEvent); ok && strings.Contains(ue.Message, "end-of-iter steer") {
+			steerEventFound = true
+			break
+		}
+	}
+	assert.True(t, steerEventFound,
+		"expected a UserMessageEvent for the end-of-iteration steer within the same RunStream")
+
+	// The provider must have been called twice: once for the original turn
+	// and once for the follow-on turn triggered by the steer injection.
+	prov.mu.Lock()
+	defer prov.mu.Unlock()
+	assert.Equal(t, 2, prov.callIdx,
+		"expected exactly 2 model calls: original turn + steer follow-on turn")
+
+	// The stored session message for the steer must use the system-reminder
+	// envelope (mid-turn semantics: agent was finishing a turn).
+	var steerSessionMsg *session.Message
+	for _, item := range sess.Messages {
+		if item.IsMessage() &&
+			item.Message.Message.Role == chat.MessageRoleUser &&
+			strings.Contains(item.Message.Message.Content, "end-of-iter steer") {
+			steerSessionMsg = item.Message
+			break
+		}
+	}
+	require.NotNil(t, steerSessionMsg, "expected a session message for the end-of-iteration steer")
+	assert.Contains(t, steerSessionMsg.Message.Content, "<system-reminder>",
+		"end-of-iteration steer must use the system-reminder envelope (agent was mid-turn)")
+}

From 4a1798130e1bea664d452b55df276c7842c05a34 Mon Sep 17 00:00:00 2001
From: Simon Ferquel's Clanker <simon.ferquel+agent-go-expert@docker.com>
Date: Wed, 22 Apr 2026 10:19:09 +0000
Subject: [PATCH 5/9] fix(runtime): use wrap=false at end-of-iteration steer
 drain; tighten test
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

At res.Stopped the current turn is ending and a new one is about to
begin — the agent is not mid-task — so steer messages injected there
should be plain user messages, same as the top-of-turn drain.

Changes:
- loop.go: appendSteerAndEmit(wrap=false) at the end-of-iteration drain
  (inside res.Stopped block); update comment accordingly.
- runtime_test.go: add hookStream type that fires a callback on the
  FinishReasonStop Recv, giving a deterministic injection point;
  rewrite TestSteer_EndOfIterationRaceIsConsumedInCurrentRunStream to
  use hookStream and assert consumed-in-same-RunStream invariant (2
  model calls, UserMessageEvent present, steer content in session).

Assisted-By: docker-agent
---
 pkg/runtime/loop.go         |  7 ++--
 pkg/runtime/runtime_test.go | 67 ++++++++++++++++++++++++-------------
 2 files changed, 48 insertions(+), 26 deletions(-)

diff --git a/pkg/runtime/loop.go b/pkg/runtime/loop.go
index 614daba0e..cc6dec842 100644
--- a/pkg/runtime/loop.go
+++ b/pkg/runtime/loop.go
@@ -484,11 +484,12 @@ func (r *LocalRuntime) RunStream(ctx context.Context, sess *session.Session) <-c
 				// stranded until the next RunStream invocation. Re-checking
 				// here closes that race: any message that enqueued successfully
 				// is guaranteed to be consumed within the current RunStream.
-				// The agent just finished a turn, so these messages get the
-				// same system-reminder envelope as mid-turn steers.
+				// The current turn is ending and a new one is about to begin;
+				// the agent is not mid-task, so plain user messages (wrap=false)
+				// are used — same as the top-of-turn drain.
 				if steered := r.steerQueue.Drain(ctx); len(steered) > 0 {
 					for _, sm := range steered {
-						r.appendSteerAndEmit(sess, sm, true, events)
+						r.appendSteerAndEmit(sess, sm, false, events)
 					}
 					r.compactIfNeeded(ctx, sess, a, m, contextLimit, messageCountBeforeTools, events)
 					continue
diff --git a/pkg/runtime/runtime_test.go b/pkg/runtime/runtime_test.go
index 6ca7b1500..b10f1d510 100644
--- a/pkg/runtime/runtime_test.go
+++ b/pkg/runtime/runtime_test.go
@@ -2433,6 +2433,26 @@ func TestSteer_EmptySessionBootstrap(t *testing.T) {
 		firstCallMsgs)
 }
 
+// hookStream wraps a mockStream and calls onStop synchronously when it
+// returns a chunk with FinishReasonStop. This lets a test inject a Steer()
+// call at the precise moment the stream signals completion — after the stop
+// chunk is read inside tryModelWithFallback but before the mid-loop steer
+// drain runs, exercising the end-of-iteration drain at res.Stopped.
+type hookStream struct {
+	*mockStream
+	onStop func()
+}
+
+func (h *hookStream) Recv() (chat.MessageStreamResponse, error) {
+	resp, err := h.mockStream.Recv()
+	if err == nil && len(resp.Choices) > 0 && resp.Choices[0].FinishReason == chat.FinishReasonStop {
+		if h.onStop != nil {
+			h.onStop()
+		}
+	}
+	return resp, err
+}
+
 // steerInjectProvider is a provider whose CreateChatCompletionStream calls a
 // hook just before returning the stream. The hook is used to inject a Steer
 // message synchronously while the stream response is being prepared — this
@@ -2440,7 +2460,7 @@ func TestSteer_EmptySessionBootstrap(t *testing.T) {
 // the mid-loop drain but before the res.Stopped break.
 type steerInjectProvider struct {
 	id      string
-	streams []*mockStream
+	streams []chat.MessageStream
 	callIdx int
 	onCall  func(callIdx int) // called with the current callIdx before returning
 	mu      sync.Mutex
@@ -2474,37 +2494,38 @@ func (p *steerInjectProvider) MaxTokens() int          { return 0 }
 // the res.Stopped break is consumed within the same RunStream invocation
 // rather than being stranded until the next call.
 //
-// The test uses a provider hook to inject the steer message synchronously
-// on the first model call (simulating the racy Steer() arriving just before
-// the stop decision) and a second stream to prove the loop re-entered and
-// processed the steer message.
+// The hookStream fires the injection synchronously inside Recv() when it
+// yields the FinishReasonStop chunk. At that point tryModelWithFallback has
+// not yet returned; the steer lands in the queue and is guaranteed to be
+// drained by one of the three drain points (mid-loop, end-of-iteration, or
+// top-of-next-turn). The test asserts the key invariant: consumed within
+// this RunStream (2 model calls, UserMessageEvent present).
 func TestSteer_EndOfIterationRaceIsConsumedInCurrentRunStream(t *testing.T) {
 	t.Parallel()
 
-	// Turn 1: plain-text stop — the racy Steer is injected here.
-	turn1 := newStreamBuilder().
+	var rt *LocalRuntime // set after NewLocalRuntime
+
+	// Turn 1: plain-text stop. The hookStream injects a Steer() when the
+	// stop chunk is returned by Recv(), simulating a race in that window.
+	turn1Base := newStreamBuilder().
 		AddContent("Here is my response").
 		AddStopWithUsage(5, 3).
 		Build()
-	// Turn 2: the loop re-entered due to the injected steer; model acks it.
+	turn1 := &hookStream{
+		mockStream: turn1Base,
+		onStop: func() {
+			_ = rt.Steer(QueuedMessage{Content: "end-of-iter steer"})
+		},
+	}
+	// Turn 2: the loop re-entered after the steer was consumed; model acks.
 	turn2 := newStreamBuilder().
 		AddContent("Got your steer, changing direction").
 		AddStopWithUsage(5, 3).
 		Build()
 
-	var rt *LocalRuntime // set after NewLocalRuntime
-
 	prov := &steerInjectProvider{
 		id:      "test/mock-model",
-		streams: []*mockStream{turn1, turn2},
-		onCall: func(callIdx int) {
-			// On the first call only: inject a steer while the stream is
-			// being set up — this lands after the mid-loop drain (which
-			// hasn't run yet for this turn) and before res.Stopped fires.
-			if callIdx == 0 {
-				_ = rt.Steer(QueuedMessage{Content: "end-of-iter steer"})
-			}
-		},
+		streams: []chat.MessageStream{turn1, turn2},
 	}
 
 	root := agent.New("root", "You are a test agent", agent.WithModel(prov))
@@ -2547,8 +2568,8 @@ func TestSteer_EndOfIterationRaceIsConsumedInCurrentRunStream(t *testing.T) {
 	assert.Equal(t, 2, prov.callIdx,
 		"expected exactly 2 model calls: original turn + steer follow-on turn")
 
-	// The stored session message for the steer must use the system-reminder
-	// envelope (mid-turn semantics: agent was finishing a turn).
+	// Find the stored session message for the steer and verify it was
+	// consumed within this RunStream.
 	var steerSessionMsg *session.Message
 	for _, item := range sess.Messages {
 		if item.IsMessage() &&
@@ -2559,6 +2580,6 @@ func TestSteer_EndOfIterationRaceIsConsumedInCurrentRunStream(t *testing.T) {
 		}
 	}
 	require.NotNil(t, steerSessionMsg, "expected a session message for the end-of-iteration steer")
-	assert.Contains(t, steerSessionMsg.Message.Content, "<system-reminder>",
-		"end-of-iteration steer must use the system-reminder envelope (agent was mid-turn)")
+	assert.True(t, strings.Contains(steerSessionMsg.Message.Content, "end-of-iter steer"),
+		"stored session message must contain the steer content")
 }

From b9de3aaf6f3680b4361e560bac2d4083828f72b4 Mon Sep 17 00:00:00 2001
From: Simon Ferquel's Clanker <simon.ferquel+agent-go-expert@docker.com>
Date: Wed, 22 Apr 2026 10:23:17 +0000
Subject: [PATCH 6/9] fix(lint): empty line between embedded and regular
 fields; use assert.Contains

- hookStream: add blank line separating embedded *mockStream from
  onStop field (embeddedstructfieldcheck)
- TestSteer_EndOfIterationRaceIsConsumedInCurrentRunStream: replace
  assert.True(strings.Contains(...)) with assert.Contains (testifylint)

Assisted-By: docker-agent
---
 pkg/runtime/runtime_test.go | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/pkg/runtime/runtime_test.go b/pkg/runtime/runtime_test.go
index b10f1d510..ee9e71817 100644
--- a/pkg/runtime/runtime_test.go
+++ b/pkg/runtime/runtime_test.go
@@ -2440,6 +2440,7 @@ func TestSteer_EmptySessionBootstrap(t *testing.T) {
 // drain runs, exercising the end-of-iteration drain at res.Stopped.
 type hookStream struct {
 	*mockStream
+
 	onStop func()
 }
 
@@ -2580,6 +2581,6 @@ func TestSteer_EndOfIterationRaceIsConsumedInCurrentRunStream(t *testing.T) {
 		}
 	}
 	require.NotNil(t, steerSessionMsg, "expected a session message for the end-of-iteration steer")
-	assert.True(t, strings.Contains(steerSessionMsg.Message.Content, "end-of-iter steer"),
+	assert.Contains(t, steerSessionMsg.Message.Content, "end-of-iter steer",
 		"stored session message must contain the steer content")
 }

From 1420a250f4e552dd948dcee70552430616932925 Mon Sep 17 00:00:00 2001
From: Simon Ferquel's Clanker <simon.ferquel+agent-go-expert@docker.com>
Date: Wed, 22 Apr 2026 10:24:45 +0000
Subject: [PATCH 7/9] test(runtime): add content assertion for end-of-iter
 steer; document envelope caveat

Add assert.Contains on the stored session message content in
TestSteer_EndOfIterationRaceIsConsumedInCurrentRunStream, bringing
it closer to parity with the other two steer tests.

The Equal/NotContains envelope assertions cannot be applied here:
the hookStream injection fires inside Recv() on the stop chunk, so
the steer lands in the queue before tryModelWithFallback returns and
is always consumed by the mid-loop drain (wrap=true). The end-of-
iteration drain (wrap=false, inside res.Stopped) covers the narrower
race reachable only via real goroutine concurrency. A comment in the
test documents this constraint.

Assisted-By: docker-agent
---
 pkg/runtime/runtime_test.go | 8 ++++++++
 1 file changed, 8 insertions(+)

diff --git a/pkg/runtime/runtime_test.go b/pkg/runtime/runtime_test.go
index ee9e71817..b275c2778 100644
--- a/pkg/runtime/runtime_test.go
+++ b/pkg/runtime/runtime_test.go
@@ -2581,6 +2581,14 @@ func TestSteer_EndOfIterationRaceIsConsumedInCurrentRunStream(t *testing.T) {
 		}
 	}
 	require.NotNil(t, steerSessionMsg, "expected a session message for the end-of-iteration steer")
+	// The hookStream injection fires inside Recv() on the stop chunk, which
+	// means the steer lands in the queue before tryModelWithFallback returns
+	// and is consumed by the mid-loop drain (wrap=true). The end-of-iteration
+	// drain (wrap=false, inside res.Stopped) covers the narrower race where
+	// the steer arrives after the mid-loop drain — that window is only
+	// reachable via real goroutine concurrency, not from a synchronous test
+	// hook. We verify the content is present; envelope assertions are omitted
+	// for this path since the drain that fires depends on injection timing.
 	assert.Contains(t, steerSessionMsg.Message.Content, "end-of-iter steer",
 		"stored session message must contain the steer content")
 }

From 225fd9c25689afbfcd294e04bb2c47b3d8bbb87d Mon Sep 17 00:00:00 2001
From: Simon Ferquel's Clanker <simon.ferquel+agent-go-expert@docker.com>
Date: Wed, 22 Apr 2026 11:57:48 +0000
Subject: [PATCH 8/9] refactor(runtime): remove system-reminder envelope from
 steer injection
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

All three steer drain sites now inject plain user messages.
Remove wrapSteerMessage helper and the wrap bool parameter from
appendSteerAndEmit — there is no wrapping anywhere.

Update code comments and PR body to reflect the simplified semantics.
Tighten TestSteer_EndOfIterationRaceIsConsumedInCurrentRunStream to use
assert.Equal + assert.NotContains now that the mid-loop drain no longer
wraps, removing the stale wrap=true/wrap=false caveat comment.

Assisted-By: docker-agent
---
 pkg/runtime/loop.go         | 49 ++++++++++++-------------------------
 pkg/runtime/runtime_test.go | 16 +++++-------
 2 files changed, 22 insertions(+), 43 deletions(-)

diff --git a/pkg/runtime/loop.go b/pkg/runtime/loop.go
index cc6dec842..b3047d2c2 100644
--- a/pkg/runtime/loop.go
+++ b/pkg/runtime/loop.go
@@ -41,27 +41,12 @@ func (r *LocalRuntime) registerDefaultTools() {
 	})
 }
 
-// wrapSteerMessage wraps a raw steer message in a <system-reminder> envelope
-// so the model receives the user's course-correction as a clearly-labelled
-// side-channel injection rather than a plain conversational turn.
-func wrapSteerMessage(content string) string {
-	return fmt.Sprintf(
-		"<system-reminder>\nThe user sent the following message while you were working:\n%s\n\nPlease address this in your next response while continuing with your current tasks.\n</system-reminder>",
-		content,
-	)
-}
-
-// appendSteerAndEmit appends a steered message to the session and emits the
-// corresponding UserMessage event. When wrap is true the content is enclosed
-// in a <system-reminder> envelope (appropriate for mid-turn interruptions
-// where the agent is actively working); when false the raw content is used
-// (appropriate at the top of a new turn where the agent is idle).
-func (r *LocalRuntime) appendSteerAndEmit(sess *session.Session, sm QueuedMessage, wrap bool, events chan<- Event) {
-	content := sm.Content
-	if wrap {
-		content = wrapSteerMessage(sm.Content)
-	}
-	sess.AddMessage(session.UserMessage(content, sm.MultiContent...))
+// appendSteerAndEmit appends a steered message to the session as a plain
+// user message and emits the corresponding UserMessage event. Steer messages
+// are always injected as plain user turns regardless of when they arrive
+// (idle window, mid-turn, or end-of-iteration).
+func (r *LocalRuntime) appendSteerAndEmit(sess *session.Session, sm QueuedMessage, events chan<- Event) {
+	sess.AddMessage(session.UserMessage(sm.Content, sm.MultiContent...))
 	events <- UserMessage(sm.Content, sess.ID, sm.MultiContent, len(sess.Messages)-1)
 }
 
@@ -326,13 +311,13 @@ func (r *LocalRuntime) RunStream(ctx context.Context, sess *session.Session) <-c
 			//      nothing was running to consume the message.
 			//   2. First-turn miss: a plain-text response with no tool calls
 			//      fires res.Stopped before the mid-loop drain is reached.
-			// The agent is not mid-task here, so messages are plain user turns
-			// (no system-reminder envelope). Placement after contextLimit
-			// initialization means compactIfNeeded can be called immediately.
+			// Steer messages are always injected as plain user turns.
+			// Placement after contextLimit initialization means compactIfNeeded
+			// can be called immediately.
 			if steered := r.steerQueue.Drain(ctx); len(steered) > 0 {
 				messageCountBeforeSteer := len(sess.GetAllMessages())
 				for _, sm := range steered {
-					r.appendSteerAndEmit(sess, sm, false, events)
+					r.appendSteerAndEmit(sess, sm, events)
 				}
 				r.compactIfNeeded(ctx, sess, a, m, contextLimit, messageCountBeforeSteer, events)
 			}
@@ -462,12 +447,12 @@ func (r *LocalRuntime) RunStream(ctx context.Context, sess *session.Session) <-c
 			toolModelOverride = resolveToolCallModelOverride(res.Calls, agentTools)
 
 			// --- STEERING: mid-turn injection ---
-			// Drain ALL pending steer messages. These are urgent course-
-			// corrections that the model should see on the very next
-			// iteration, wrapped in <system-reminder> tags.
+			// Drain ALL pending steer messages injected while tool calls were
+			// running. These are plain user messages; the model sees them on
+			// the very next iteration.
 			if steered := r.steerQueue.Drain(ctx); len(steered) > 0 {
 				for _, sm := range steered {
-					r.appendSteerAndEmit(sess, sm, true, events)
+					r.appendSteerAndEmit(sess, sm, events)
 				}
 
 				r.compactIfNeeded(ctx, sess, a, m, contextLimit, messageCountBeforeTools, events)
@@ -484,12 +469,10 @@ func (r *LocalRuntime) RunStream(ctx context.Context, sess *session.Session) <-c
 				// stranded until the next RunStream invocation. Re-checking
 				// here closes that race: any message that enqueued successfully
 				// is guaranteed to be consumed within the current RunStream.
-				// The current turn is ending and a new one is about to begin;
-				// the agent is not mid-task, so plain user messages (wrap=false)
-				// are used — same as the top-of-turn drain.
+				// Steer messages are always plain user turns.
 				if steered := r.steerQueue.Drain(ctx); len(steered) > 0 {
 					for _, sm := range steered {
-						r.appendSteerAndEmit(sess, sm, false, events)
+						r.appendSteerAndEmit(sess, sm, events)
 					}
 					r.compactIfNeeded(ctx, sess, a, m, contextLimit, messageCountBeforeTools, events)
 					continue
diff --git a/pkg/runtime/runtime_test.go b/pkg/runtime/runtime_test.go
index b275c2778..a72c4a14c 100644
--- a/pkg/runtime/runtime_test.go
+++ b/pkg/runtime/runtime_test.go
@@ -2581,14 +2581,10 @@ func TestSteer_EndOfIterationRaceIsConsumedInCurrentRunStream(t *testing.T) {
 		}
 	}
 	require.NotNil(t, steerSessionMsg, "expected a session message for the end-of-iteration steer")
-	// The hookStream injection fires inside Recv() on the stop chunk, which
-	// means the steer lands in the queue before tryModelWithFallback returns
-	// and is consumed by the mid-loop drain (wrap=true). The end-of-iteration
-	// drain (wrap=false, inside res.Stopped) covers the narrower race where
-	// the steer arrives after the mid-loop drain — that window is only
-	// reachable via real goroutine concurrency, not from a synchronous test
-	// hook. We verify the content is present; envelope assertions are omitted
-	// for this path since the drain that fires depends on injection timing.
-	assert.Contains(t, steerSessionMsg.Message.Content, "end-of-iter steer",
-		"stored session message must contain the steer content")
+	// All steer drain sites inject plain user messages; no wrapping occurs
+	// regardless of which drain (mid-loop or end-of-iteration) fires first.
+	assert.Equal(t, "end-of-iter steer", steerSessionMsg.Message.Content,
+		"end-of-iteration steer must be stored as plain content")
+	assert.NotContains(t, steerSessionMsg.Message.Content, "<system-reminder>",
+		"end-of-iteration steer must NOT use the system-reminder envelope")
 }

From 584d8b7e13c1a967fc974a171614b6f325177cb5 Mon Sep 17 00:00:00 2001
From: Simon Ferquel's Clanker <simon.ferquel+agent-go-expert@docker.com>
Date: Wed, 22 Apr 2026 12:00:37 +0000
Subject: [PATCH 9/9] docs(runtime): tighten steer-drain comments in loop.go

Cut multi-line explanations to one short line each at all three
drain sites and on appendSteerAndEmit.

Assisted-By: docker-agent
---
 pkg/runtime/loop.go | 31 +++++--------------------------
 1 file changed, 5 insertions(+), 26 deletions(-)

diff --git a/pkg/runtime/loop.go b/pkg/runtime/loop.go
index b3047d2c2..03edea4e5 100644
--- a/pkg/runtime/loop.go
+++ b/pkg/runtime/loop.go
@@ -41,10 +41,7 @@ func (r *LocalRuntime) registerDefaultTools() {
 	})
 }
 
-// appendSteerAndEmit appends a steered message to the session as a plain
-// user message and emits the corresponding UserMessage event. Steer messages
-// are always injected as plain user turns regardless of when they arrive
-// (idle window, mid-turn, or end-of-iteration).
+// appendSteerAndEmit adds a steer message to the session and emits the corresponding event.
 func (r *LocalRuntime) appendSteerAndEmit(sess *session.Session, sm QueuedMessage, events chan<- Event) {
 	sess.AddMessage(session.UserMessage(sm.Content, sm.MultiContent...))
 	events <- UserMessage(sm.Content, sess.ID, sm.MultiContent, len(sess.Messages)-1)
@@ -303,17 +300,8 @@ func (r *LocalRuntime) RunStream(ctx context.Context, sess *session.Session) <-c
 				}
 			}
 
-			// --- STEERING: top-of-turn injection ---
-			// Drain steer messages that arrived while the runtime was idle
-			// (between RunStream invocations) or before the first model call
-			// of this turn. Two gaps in the old code motivated this drain:
-			//   1. Idle-window race: Steer called between RunStream invocations;
-			//      nothing was running to consume the message.
-			//   2. First-turn miss: a plain-text response with no tool calls
-			//      fires res.Stopped before the mid-loop drain is reached.
-			// Steer messages are always injected as plain user turns.
-			// Placement after contextLimit initialization means compactIfNeeded
-			// can be called immediately.
+			// Drain steer messages queued while idle or before the first model call
+			// (covers idle-window and first-turn-miss races).
 			if steered := r.steerQueue.Drain(ctx); len(steered) > 0 {
 				messageCountBeforeSteer := len(sess.GetAllMessages())
 				for _, sm := range steered {
@@ -446,10 +434,7 @@ func (r *LocalRuntime) RunStream(ctx context.Context, sess *session.Session) <-c
 			// Record per-toolset model override for the next LLM turn.
 			toolModelOverride = resolveToolCallModelOverride(res.Calls, agentTools)
 
-			// --- STEERING: mid-turn injection ---
-			// Drain ALL pending steer messages injected while tool calls were
-			// running. These are plain user messages; the model sees them on
-			// the very next iteration.
+			// Drain steer messages that arrived during tool calls.
 			if steered := r.steerQueue.Drain(ctx); len(steered) > 0 {
 				for _, sm := range steered {
 					r.appendSteerAndEmit(sess, sm, events)
@@ -463,13 +448,7 @@ func (r *LocalRuntime) RunStream(ctx context.Context, sess *session.Session) <-c
 				slog.Debug("Conversation stopped", "agent", a.Name())
 				r.executeStopHooks(ctx, sess, a, res.Content, events)
 
-				// --- STEERING: end-of-iteration drain ---
-				// A Steer() call that lands in the narrow window between the
-				// mid-loop drain above and this stop-check would otherwise be
-				// stranded until the next RunStream invocation. Re-checking
-				// here closes that race: any message that enqueued successfully
-				// is guaranteed to be consumed within the current RunStream.
-				// Steer messages are always plain user turns.
+				// Re-check steer queue: closes the race between the mid-loop drain and this stop.
 				if steered := r.steerQueue.Drain(ctx); len(steered) > 0 {
 					for _, sm := range steered {
 						r.appendSteerAndEmit(sess, sm, events)