Restore the new behavior: the agent loop does not end until handleSteps returns endTurn: true.

jahooma · jahooma · commit 7c7315ec9b31 · 2025-10-15T17:07:36.000-07:00
diff --git a/backend/src/__tests__/loop-agent-steps.test.ts b/backend/src/__tests__/loop-agent-steps.test.ts
@@ -527,6 +527,7 @@ describe('loopAgentSteps - runAgentStep vs runProgrammaticStep behavior', () =>
     expect(llmCallCount).toBe(1) // LLM called once after STEP
     expect(result.agentState).toBeDefined()
   })
+
   it('should pass shouldEndTurn: true as stepsComplete when end_turn tool is called', async () => {
     // Test that when LLM calls end_turn, shouldEndTurn is correctly passed to runProgrammaticStep
 
@@ -538,11 +539,17 @@ describe('loopAgentSteps - runAgentStep vs runProgrammaticStep behavior', () =>
       () => ({
         runProgrammaticStep: async (params: any) => {
           runProgrammaticStepCalls.push(params)
-          // Return default behavior
-          return { agentState: params.agentState, endTurn: false }
+          // First call: return endTurn false to continue
+          // Second call: return endTurn true to end the loop
+          const shouldEnd = runProgrammaticStepCalls.length >= 2
+          return {
+            agentState: params.agentState,
+            endTurn: shouldEnd,
+            stepNumber: params.stepNumber,
+          }
         },
         clearAgentGeneratorCache: () => {},
-        agentIdToStepAll: new Set(),
+        runIdToStepAll: new Set(),
       }),
     )
 
@@ -586,6 +593,72 @@ describe('loopAgentSteps - runAgentStep vs runProgrammaticStep behavior', () =>
     expect(runProgrammaticStepCalls[1].stepsComplete).toBe(true)
   })
 
+  it('should continue loop when handleSteps returns endTurn: false even if LLM calls end_turn', async () => {
+    // Verifies that the loop keeps running while handleSteps has not ended the turn, even though the LLM calls end_turn on every step
+
+    let programmaticStepCount = 0
+    let llmStepCount = 0
+
+    const mockGeneratorFunction = function* () {
+      // First stage: yield 'STEP' so the LLM runs once; the loop is expected to continue afterwards
+      programmaticStepCount++
+      yield 'STEP'
+
+      // Second stage: yield 'STEP' again; the loop is still expected to continue
+      programmaticStepCount++
+      yield 'STEP'
+
+      // Third stage: yield an end_turn tool call, which is expected to finally end the loop
+      programmaticStepCount++
+      yield { toolName: 'end_turn', input: {} }
+    } as () => StepGenerator
+
+    mockTemplate.handleSteps = mockGeneratorFunction
+
+    const localAgentTemplates = {
+      'test-agent': mockTemplate,
+    }
+
+    // Mock the LLM stream so that every response contains an end_turn tool call; handleSteps should override it
+    let promptCallCount = 0
+    agentRuntimeImpl.promptAiSdkStream = async function* () {
+      promptCallCount++
+      llmStepCount++
+
+      // The LLM tries to end the turn on every call
+      yield {
+        type: 'text' as const,
+        text: `LLM response\n\n${getToolCallString('end_turn', {})}`,
+      }
+      return `mock-message-id-${promptCallCount}`
+    }
+
+    await runLoopAgentStepsWithContext({
+      ...agentRuntimeImpl,
+      ...agentRuntimeScopedImpl,
+      userInputId: 'test-user-input',
+      agentType: 'test-agent',
+      agentState: mockAgentState,
+      prompt: 'Test handleSteps endTurn override',
+      spawnParams: undefined,
+      fingerprintId: 'test-fingerprint',
+      fileContext: mockFileContext,
+      localAgentTemplates,
+      userId: TEST_USER_ID,
+      clientSessionId: 'test-session',
+      onResponseChunk: () => {},
+    })
+
+    // Verify the handleSteps generator advanced through all 3 stages (yielded STEP twice, then end_turn)
+    expect(programmaticStepCount).toBe(3)
+
+    // Verify the LLM was called exactly 2 times (once per STEP yield, none for the final end_turn yield)
+    expect(llmStepCount).toBe(2)
+
+    // Together these confirm that even though the LLM called end_turn every time,
+    // the loop continued because handleSteps kept yielding STEP before finally ending
+  })
+
   it('should restart loop when agent finishes without setting required output', async () => {
     // Test that when an agent has outputSchema but finishes without calling set_output,
     // the loop restarts with a system message
diff --git a/backend/src/run-agent-step.ts b/backend/src/run-agent-step.ts
@@ -620,9 +620,7 @@ export const loopAgentSteps = async (
         currentAgentState = programmaticAgentState
         totalSteps = stepNumber
 
-        if (endTurn) {
-          shouldEndTurn = true
-        }
+        shouldEndTurn = endTurn
       }
 
       // Check if output is required but missing

Original file line number	Diff line number	Diff line change
`@@ -620,9 +620,7 @@ export const loopAgentSteps = async (`
`620`	`620`	`currentAgentState = programmaticAgentState`
`621`	`621`	`totalSteps = stepNumber`
`622`	`622`
`623`		`- if (endTurn) {`
`624`		`- shouldEndTurn = true`
`625`		`- }`
	`623`	`+ shouldEndTurn = endTurn`
`626`	`624`	`}`
`627`	`625`
`628`	`626`	`// Check if output is required but missing`