From c43edde2a02806859ec79dacf2634e04ba636ede Mon Sep 17 00:00:00 2001
From: Roo Code <roomote@roocode.com>
Date: Fri, 10 Apr 2026 05:41:34 +0000
Subject: [PATCH] fix: add stream retry cap and context recovery hint for
 provider errors (#12087)

- Add MAX_STREAM_RETRIES (5) to cap first-chunk and mid-stream error retries,
  preventing indefinite retry loops when auto-approval is enabled
- Add context recovery hint prepended to user content on retry attempts,
  helping weaker models re-orient to the current task instead of
  hallucinating about previously completed tasks
- When max retries are exceeded, present the error to the user for manual
  retry instead of continuing to auto-retry indefinitely
- Update last user message in API history on retry with recovery hint and
  refreshed environment details
---
 src/core/task/Task.ts                         |  70 ++++-
 .../task/__tests__/stream-retry-limit.spec.ts | 290 ++++++++++++++++++
 2 files changed, 357 insertions(+), 3 deletions(-)
 create mode 100644 src/core/task/__tests__/stream-retry-limit.spec.ts
diff --git a/src/core/task/Task.ts b/src/core/task/Task.ts
index 005bb0f292b..369c5014b11 100644
--- a/src/core/task/Task.ts
+++ b/src/core/task/Task.ts
@@ -137,6 +137,7 @@ const MAX_EXPONENTIAL_BACKOFF_SECONDS = 600 // 10 minutes
 const DEFAULT_USAGE_COLLECTION_TIMEOUT_MS = 5000 // 5 seconds
 const FORCED_CONTEXT_REDUCTION_PERCENT = 75 // Keep 75% of context (remove 25%) on context window errors
 const MAX_CONTEXT_WINDOW_RETRIES = 3 // Maximum retries for context window errors
+const MAX_STREAM_RETRIES = 5 // Maximum retries for first-chunk and mid-stream errors
 
 export interface TaskOptions extends CreateTaskOptions {
 	provider: ClineProvider
@@ -2646,6 +2647,19 @@ export class Task extends EventEmitter<TaskEvents> implements TaskLike {
 			// Add environment details as its own text block, separate from tool
 			// results.
 			let finalUserContent = [...contentWithoutEnvDetails, { type: "text" as const, text: environmentDetails }]
+
+			// When retrying after an error, prepend a context recovery hint to help the model
+			// re-orient to the current task. This prevents weaker models from latching onto
+			// earlier completed tasks instead of the user's most recent request.
+			const currentRetryAttempt = currentItem.retryAttempt ?? 0
+			if (currentRetryAttempt > 0) {
+				const recoveryHint: Anthropic.Messages.TextBlockParam = {
+					type: "text" as const,
+					text: "[CONTEXT RECOVERY NOTE: The previous API request failed due to a provider error and was automatically retried. Please focus on the user's most recent request below and continue from where you left off. Do not repeat or re-announce previously completed tasks.]",
+				}
+				finalUserContent = [recoveryHint, ...finalUserContent]
+			}
+
 			// Only add user message to conversation history if:
 			// 1. This is the first attempt (retryAttempt === 0), AND
 			// 2. The original userContent was not empty (empty signals delegation resume where
@@ -2660,6 +2674,15 @@ export class Task extends EventEmitter<TaskEvents> implements TaskLike {
 				TelemetryService.instance.captureConversationMessage(this.taskId, "user")
 			}
 
+			// On retry, update the existing last user message in API history with the
+			// recovery hint and refreshed environment details.
+			if (currentRetryAttempt > 0 && !isEmptyUserContent) {
+				const lastIdx = this.apiConversationHistory.length - 1
+				if (lastIdx >= 0 && this.apiConversationHistory[lastIdx].role === "user") {
+					this.apiConversationHistory[lastIdx] = { role: "user", content: finalUserContent }
+				}
+			}
+
 			// Since we sent off a placeholder api_req_started message to update the
 			// webview while waiting to actually start the API request (to load
 			// potential details for example), we need to update the text of that
@@ -3264,14 +3287,37 @@ export class Task extends EventEmitter<TaskEvents> implements TaskLike {
 						} else {
 							// Stream failed - log the error and retry with the same content
 							// The existing rate limiting will prevent rapid retries
+							const currentRetry = currentItem.retryAttempt ?? 0
 							console.error(
-								`[Task#${this.taskId}.${this.instanceId}] Stream failed, will retry: ${streamingFailedMessage}`,
+								`[Task#${this.taskId}.${this.instanceId}] Stream failed (attempt ${currentRetry + 1}/${MAX_STREAM_RETRIES}), will retry: ${streamingFailedMessage}`,
 							)
 
+							// Check if we've exceeded the maximum number of stream retries
+							if (currentRetry >= MAX_STREAM_RETRIES) {
+								console.error(
+									`[Task#${this.taskId}.${this.instanceId}] Max mid-stream retries (${MAX_STREAM_RETRIES}) exceeded, presenting error to user`,
+								)
+								const { response } = await this.ask(
+									"api_req_failed",
+									`Mid-stream error after ${MAX_STREAM_RETRIES} retries: ${streamingFailedMessage}`,
+								)
+								if (response !== "yesButtonClicked") {
+									break
+								}
+								await this.say("api_req_retried")
+								// User clicked retry - reset retry count and continue
+								stack.push({
+									userContent: currentUserContent,
+									includeFileDetails: false,
+									retryAttempt: 0,
+								})
+								continue
+							}
+
 							// Apply exponential backoff similar to first-chunk errors when auto-resubmit is enabled
 							const stateForBackoff = await this.providerRef.deref()?.getState()
 							if (stateForBackoff?.autoApprovalEnabled) {
-								await this.backoffAndAnnounce(currentItem.retryAttempt ?? 0, error)
+								await this.backoffAndAnnounce(currentRetry, error)
 
 								// Check if task was aborted during the backoff
 								if (this.abort) {
@@ -3289,7 +3335,7 @@ export class Task extends EventEmitter<TaskEvents> implements TaskLike {
 							stack.push({
 								userContent: currentUserContent,
 								includeFileDetails: false,
-								retryAttempt: (currentItem.retryAttempt ?? 0) + 1,
+								retryAttempt: currentRetry + 1,
 							})
 
 							// Continue to retry the request
@@ -4327,6 +4373,24 @@ export class Task extends EventEmitter<TaskEvents> implements TaskLike {
 
 			// note that this api_req_failed ask is unique in that we only present this option if the api hasn't streamed any content yet (ie it fails on the first chunk due), as it would allow them to hit a retry button. However if the api failed mid-stream, it could be in any arbitrary state where some tools may have executed, so that error is handled differently and requires cancelling the task entirely.
 			if (autoApprovalEnabled) {
+				// Check if we've exceeded the maximum number of stream retries
+				if (retryAttempt >= MAX_STREAM_RETRIES) {
+					console.error(
+						`[Task#${this.taskId}.${this.instanceId}] Max first-chunk retries (${MAX_STREAM_RETRIES}) exceeded, presenting error to user`,
+					)
+					const { response } = await this.ask(
+						"api_req_failed",
+						error.message ?? JSON.stringify(serializeError(error), null, 2),
+					)
+					if (response !== "yesButtonClicked") {
+						throw new Error("API request failed")
+					}
+					await this.say("api_req_retried")
+					// User clicked retry - reset retry count
+					yield* this.attemptApiRequest(0)
+					return
+				}
+
 				// Apply shared exponential backoff and countdown UX
 				await this.backoffAndAnnounce(retryAttempt, error)
 
diff --git a/src/core/task/__tests__/stream-retry-limit.spec.ts b/src/core/task/__tests__/stream-retry-limit.spec.ts
new file mode 100644
index 00000000000..45c1916c2af
--- /dev/null
+++ b/src/core/task/__tests__/stream-retry-limit.spec.ts
@@ -0,0 +1,290 @@
+// npx vitest core/task/__tests__/stream-retry-limit.spec.ts
+//
+// Unit tests for the stream retry limit (MAX_STREAM_RETRIES) and context
+// recovery hint logic added in fix for #12087.
+//
+// These tests validate the pure logic without importing the heavy Task class
+// to avoid OOM in constrained environments.
+
+describe("Stream Retry Limits and Context Recovery", () => {
+	// The constant value as defined in Task.ts
+	const MAX_STREAM_RETRIES = 5
+
+	describe("MAX_STREAM_RETRIES constant behavior", () => {
+		it("should cap retries at 5", () => {
+			expect(MAX_STREAM_RETRIES).toBe(5)
+		})
+
+		it("should allow retries when retryAttempt < MAX_STREAM_RETRIES", () => {
+			for (let retryAttempt = 0; retryAttempt < MAX_STREAM_RETRIES; retryAttempt++) {
+				const shouldAutoRetry = retryAttempt < MAX_STREAM_RETRIES
+				expect(shouldAutoRetry).toBe(true)
+			}
+		})
+
+		it("should stop auto-retry when retryAttempt >= MAX_STREAM_RETRIES", () => {
+			for (const retryAttempt of [5, 6, 10, 100]) {
+				const shouldAutoRetry = retryAttempt < MAX_STREAM_RETRIES
+				expect(shouldAutoRetry).toBe(false)
+			}
+		})
+
+		it("should present error to user when MAX_STREAM_RETRIES exceeded", () => {
+			// Simulates the logic in attemptApiRequest and the mid-stream error handler
+			const retryAttempt = MAX_STREAM_RETRIES
+			const autoApprovalEnabled = true
+
+			let presentedErrorToUser = false
+			if (autoApprovalEnabled && retryAttempt >= MAX_STREAM_RETRIES) {
+				presentedErrorToUser = true
+			}
+
+			expect(presentedErrorToUser).toBe(true)
+		})
+
+		it("should not present error when under the limit with auto-approval", () => {
+			const retryAttempt = 3
+			const autoApprovalEnabled = true
+
+			let presentedErrorToUser = false
+			if (autoApprovalEnabled && retryAttempt >= MAX_STREAM_RETRIES) {
+				presentedErrorToUser = true
+			}
+
+			expect(presentedErrorToUser).toBe(false)
+		})
+	})
+
+	describe("Context Recovery Hint", () => {
+		const RECOVERY_HINT_TEXT =
+			"[CONTEXT RECOVERY NOTE: The previous API request failed due to a provider error and was automatically retried. Please focus on the user's most recent request below and continue from where you left off. Do not repeat or re-announce previously completed tasks.]"
+
+		it("should not add recovery hint on first attempt (retryAttempt === 0)", () => {
+			const retryAttempt = 0
+			const shouldAddHint = retryAttempt > 0
+			expect(shouldAddHint).toBe(false)
+		})
+
+		it("should add recovery hint on retry attempts (retryAttempt > 0)", () => {
+			for (const retryAttempt of [1, 2, 3, 4, 5]) {
+				const shouldAddHint = retryAttempt > 0
+				expect(shouldAddHint).toBe(true)
+			}
+		})
+
+		it("should prepend recovery hint to user content on retry", () => {
+			const originalContent = [{ type: "text" as const, text: "Please make the cards full width" }]
+			const environmentDetails = "<environment_details>mock env</environment_details>"
+			const recoveryHint = {
+				type: "text" as const,
+				text: RECOVERY_HINT_TEXT,
+			}
+
+			// Simulates the retry path in recursivelyMakeClineRequests
+			const retryAttempt = 1
+			let finalUserContent = [...originalContent, { type: "text" as const, text: environmentDetails }]
+
+			if (retryAttempt > 0) {
+				finalUserContent = [recoveryHint, ...finalUserContent]
+			}
+
+			expect(finalUserContent.length).toBe(3)
+			expect(finalUserContent[0].text).toContain("CONTEXT RECOVERY NOTE")
+			expect(finalUserContent[1].text).toBe("Please make the cards full width")
+			expect(finalUserContent[2].text).toContain("environment_details")
+		})
+
+		it("should not prepend recovery hint on first attempt", () => {
+			const originalContent = [{ type: "text" as const, text: "Please make the cards full width" }]
+			const environmentDetails = "<environment_details>mock env</environment_details>"
+			const recoveryHint = {
+				type: "text" as const,
+				text: RECOVERY_HINT_TEXT,
+			}
+
+			const retryAttempt = 0
+			let finalUserContent = [...originalContent, { type: "text" as const, text: environmentDetails }]
+
+			if (retryAttempt > 0) {
+				finalUserContent = [recoveryHint, ...finalUserContent]
+			}
+
+			expect(finalUserContent.length).toBe(2)
+			expect(finalUserContent[0].text).toBe("Please make the cards full width")
+			expect(finalUserContent[1].text).toContain("environment_details")
+		})
+
+		it("should update the last user message in API history on retry", () => {
+			const apiConversationHistory = [
+				{
+					role: "user" as const,
+					content: [{ type: "text" as const, text: "Complete Task A" }],
+				},
+				{
+					role: "assistant" as const,
+					content: [{ type: "text" as const, text: "Task A completed." }],
+				},
+				{
+					role: "user" as const,
+					content: [
+						{ type: "text" as const, text: "Please complete Task B" },
+						{ type: "text" as const, text: "<environment_details>old env</environment_details>" },
+					],
+				},
+			]
+
+			// Simulates the retry update logic from the code
+			const retryAttempt = 1
+			const isEmptyUserContent = false
+			const updatedContent = [
+				{ type: "text" as const, text: RECOVERY_HINT_TEXT },
+				{ type: "text" as const, text: "Please complete Task B" },
+				{ type: "text" as const, text: "<environment_details>new env</environment_details>" },
+			]
+
+			if (retryAttempt > 0 && !isEmptyUserContent) {
+				const lastIdx = apiConversationHistory.length - 1
+				if (lastIdx >= 0 && apiConversationHistory[lastIdx].role === "user") {
+					apiConversationHistory[lastIdx] = { role: "user", content: updatedContent }
+				}
+			}
+
+			// Verify the last message was updated with recovery hint
+			const lastMessage = apiConversationHistory[apiConversationHistory.length - 1]
+			expect(lastMessage.role).toBe("user")
+			expect(lastMessage.content[0].text).toContain("CONTEXT RECOVERY NOTE")
+			expect(lastMessage.content[1].text).toBe("Please complete Task B")
+			expect(lastMessage.content[2].text).toContain("new env")
+
+			// Verify earlier messages are untouched
+			expect(apiConversationHistory[0]).toEqual({
+				role: "user",
+				content: [{ type: "text", text: "Complete Task A" }],
+			})
+		})
+
+		it("should not update API history if last message is not a user message", () => {
+			const apiConversationHistory = [
+				{
+					role: "user" as const,
+					content: [{ type: "text" as const, text: "Complete Task A" }],
+				},
+				{
+					role: "assistant" as const,
+					content: [{ type: "text" as const, text: "Task A completed." }],
+				},
+			]
+
+			const originalHistory = JSON.parse(JSON.stringify(apiConversationHistory))
+
+			const retryAttempt = 1
+			const isEmptyUserContent = false
+
+			if (retryAttempt > 0 && !isEmptyUserContent) {
+				const lastIdx = apiConversationHistory.length - 1
+				if (lastIdx >= 0 && apiConversationHistory[lastIdx].role === "user") {
+					apiConversationHistory[lastIdx] = {
+						role: "user",
+						content: [{ type: "text", text: "should not appear" }],
+					}
+				}
+			}
+
+			// History should be unchanged since last message is "assistant"
+			expect(apiConversationHistory).toEqual(originalHistory)
+		})
+
+		it("should not update API history if user content is empty (delegation resume)", () => {
+			const apiConversationHistory = [
+				{
+					role: "user" as const,
+					content: [{ type: "text" as const, text: "existing message" }],
+				},
+			]
+
+			const originalHistory = JSON.parse(JSON.stringify(apiConversationHistory))
+
+			const retryAttempt = 1
+			const isEmptyUserContent = true // Empty signals delegation resume
+
+			if (retryAttempt > 0 && !isEmptyUserContent) {
+				const lastIdx = apiConversationHistory.length - 1
+				if (lastIdx >= 0 && apiConversationHistory[lastIdx].role === "user") {
+					apiConversationHistory[lastIdx] = {
+						role: "user",
+						content: [{ type: "text", text: "should not appear" }],
+					}
+				}
+			}
+
+			// History should be unchanged since user content is empty
+			expect(apiConversationHistory).toEqual(originalHistory)
+		})
+
+		it("recovery hint contains key phrases to re-orient the model", () => {
+			expect(RECOVERY_HINT_TEXT).toContain("previous API request failed")
+			expect(RECOVERY_HINT_TEXT).toContain("provider error")
+			expect(RECOVERY_HINT_TEXT).toContain("automatically retried")
+			expect(RECOVERY_HINT_TEXT).toContain("most recent request")
+			expect(RECOVERY_HINT_TEXT).toContain("Do not repeat")
+			expect(RECOVERY_HINT_TEXT).toContain("previously completed tasks")
+		})
+	})
+
+	describe("Mid-stream retry cap", () => {
+		it("should present error to user when mid-stream retries exceed MAX_STREAM_RETRIES", () => {
+			const currentRetry = MAX_STREAM_RETRIES
+			let presentedErrorToUser = false
+			let pushedToStack = false
+
+			if (currentRetry >= MAX_STREAM_RETRIES) {
+				presentedErrorToUser = true
+			} else {
+				pushedToStack = true
+			}
+
+			expect(presentedErrorToUser).toBe(true)
+			expect(pushedToStack).toBe(false)
+		})
+
+		it("should push to retry stack when mid-stream retries are under the limit", () => {
+			const currentRetry = 3
+			let presentedErrorToUser = false
+			let pushedToStack = false
+
+			if (currentRetry >= MAX_STREAM_RETRIES) {
+				presentedErrorToUser = true
+			} else {
+				pushedToStack = true
+			}
+
+			expect(presentedErrorToUser).toBe(false)
+			expect(pushedToStack).toBe(true)
+		})
+
+		it("should reset retry count to 0 when user clicks retry after max retries", () => {
+			const currentRetry = MAX_STREAM_RETRIES
+			let newRetryAttempt = currentRetry
+
+			if (currentRetry >= MAX_STREAM_RETRIES) {
+				// User clicks retry - reset the counter
+				const userClickedRetry = true
+				if (userClickedRetry) {
+					newRetryAttempt = 0
+				}
+			}
+
+			expect(newRetryAttempt).toBe(0)
+		})
+
+		it("should increment retry count on each automatic retry", () => {
+			let retryAttempt = 0
+
+			for (let i = 0; i < MAX_STREAM_RETRIES; i++) {
+				retryAttempt = retryAttempt + 1
+			}
+
+			expect(retryAttempt).toBe(MAX_STREAM_RETRIES)
+		})
+	})
+})