Simplify thinker-best-of-n. Tweak UI and prompts

jahooma · jahooma · commit d3ebaa706ee2 · 2025-11-17T18:04:54.000-08:00
diff --git a/.agents/base2/base2.ts b/.agents/base2/base2.ts
@@ -112,6 +112,8 @@ Use the spawn_agents tool to spawn specialized agents to help you complete the u
 - **Sequence agents properly:** Keep in mind dependencies when spawning different agents. Don't spawn agents in parallel that depend on each other.
   ${buildArray(
     '- Spawn context-gathering agents (file pickers, code-searcher, directory-lister, glob-matcher, and web/docs researchers) before making edits.',
+    isMax &&
+      '- Spawn the thinker-best-of-n-gpt-5 after gathering context to solve complex problems.',
     `- Spawn a ${isMax ? 'editor-best-of-n-gpt-5' : 'editor-best-of-n'} agent to implement the changes after you have gathered all the context you need. You must spawn this agent for non-trivial changes, since it writes much better code than you would with the str_replace or write_file tools. Don't spawn the editor in parallel with context-gathering agents.`,
     '- Spawn commanders sequentially if the second command depends on the the first.',
   ).join('\n  ')}
@@ -247,6 +249,7 @@ function buildImplementationStepPrompt({
       `Keep working until the user's request is completely satisfied${!hasNoValidation ? ' and validated' : ''}, or until you require more information from the user.`,
     !isFast &&
       `You must spawn the ${isMax ? 'editor-best-of-n-gpt-5' : 'editor-best-of-n'} agent to implement code changes, since it will generate the best code changes.`,
+    isMax && 'Spawn the thinker-best-of-n-gpt-5 to solve complex problems.',
     `After completing the user request, summarize your changes in a sentence${isFast ? '' : ' or a few short bullet points'}.${isSonnet ? " Don't create any summary markdown files or example documentation files, unless asked by the user." : ''}. Don't repeat yourself -- especially if you already summarized your changes then just end your turn.`,
   ).join('\n')
 }
diff --git a/.agents/thinker/best-of-n/thinker-best-of-n.ts b/.agents/thinker/best-of-n/thinker-best-of-n.ts
@@ -1,7 +1,11 @@
 import { publisher } from '../../constants'
 
 import type { SecretAgentDefinition } from '../../types/secret-agent-definition'
-import type { AgentStepContext, ToolCall } from '../../types/agent-definition'
+import type {
+  AgentStepContext,
+  StepText,
+  ToolCall,
+} from '../../types/agent-definition'
 
 export function createThinkerBestOfN(
   model: 'sonnet' | 'gpt-5',
@@ -18,7 +22,7 @@ export function createThinkerBestOfN(
     includeMessageHistory: true,
     inheritParentSystemPrompt: true,
 
-    toolNames: ['spawn_agents', 'set_messages', 'set_output'],
+    toolNames: ['spawn_agents'],
     spawnableAgents: ['thinker-selector'],
 
     inputSchema: {
@@ -37,19 +41,11 @@ export function createThinkerBestOfN(
         },
       },
     },
-    outputMode: 'structured_output',
+    outputMode: 'last_message',
 
     instructionsPrompt: `You are one agent within the thinker-best-of-n. You were spawned to generate deep thinking about the user's request.
-
-Your task is to think deeply, step by step, about the user request and how best to approach it.
-
-Consider edge cases, potential issues, and alternative approaches. Also, propose reading files or spawning agents to get more context that would be helpful for solving the problem.
-
-Come up with a list of insights that would help someone arrive at the best solution.
-
-Try not to be too prescriptive or confident in one solution. Instead, give clear arguments and reasoning.
-
-You must be extremely concise and to the point.
+    
+Answer the user's query to the best of your ability and be extremely concise and to the point.
 
 **Important**: Do not use any tools! You are only thinking!`,
 
@@ -64,7 +60,6 @@ function* handleSteps({
 }: AgentStepContext): ReturnType<
   NonNullable<SecretAgentDefinition['handleSteps']>
 > {
-  const selectorAgent = 'thinker-selector'
   const n = Math.min(10, Math.max(1, (params?.n as number | undefined) ?? 5))
 
   // Use GENERATE_N to generate n thinking outputs
@@ -86,7 +81,7 @@ function* handleSteps({
     input: {
       agents: [
         {
-          agent_type: selectorAgent,
+          agent_type: 'thinker-selector',
           params: { thoughts },
         },
       ],
@@ -100,29 +95,25 @@ function* handleSteps({
 
   if ('errorMessage' in selectorOutput) {
     yield {
-      toolName: 'set_output',
-      input: { error: selectorOutput.errorMessage },
-    } satisfies ToolCall<'set_output'>
+      type: 'STEP_TEXT',
+      text: selectorOutput.errorMessage,
+    } satisfies StepText
     return
   }
   const { thoughtId } = selectorOutput
   const chosenThought = thoughts.find((thought) => thought.id === thoughtId)
   if (!chosenThought) {
     yield {
-      toolName: 'set_output',
-      input: { error: 'Failed to find chosen thinking output.' },
-    } satisfies ToolCall<'set_output'>
+      type: 'STEP_TEXT',
+      text: 'Failed to find chosen thinking output.',
+    } satisfies StepText
     return
   }
 
-  // Set output with the chosen thinking
   yield {
-    toolName: 'set_output',
-    input: {
-      response: chosenThought.content,
-    },
-    includeToolCall: false,
-  } satisfies ToolCall<'set_output'>
+    type: 'STEP_TEXT',
+    text: chosenThought.content,
+  } satisfies StepText
 
   function extractSpawnResults<T>(
     results: any[] | undefined,
diff --git a/cli/src/components/message-block.tsx b/cli/src/components/message-block.tsx
@@ -609,12 +609,14 @@ const AgentBranchWrapper = memo(
       onToggleCollapsed(agentBlock.agentId)
     }, [onToggleCollapsed, agentBlock.agentId])
 
-    // Create a status message for editor-best-of-n agent
+    // Create a status message for editor-best-of-n and thinker-best-of-n agents
     const nParameterMessage =
       agentBlock.params?.n !== undefined &&
-      agentBlock.agentType.includes('editor-best-of-n')
+      (agentBlock.agentType.includes('editor-best-of-n')
         ? `Generating ${agentBlock.params.n} implementations...`
-        : undefined
+        : agentBlock.agentType.includes('thinker-best-of-n')
+          ? `Generating ${agentBlock.params.n} deep thoughts...`
+          : undefined)
 
     return (
       <box key={keyPrefix} style={{ flexDirection: 'column', gap: 0 }}>