Add best-of-n thinker subagent

jahooma · jahooma · commit 68469508323a · 2025-11-09T15:39:59.000-08:00
diff --git a/.agents/base2/base2.ts b/.agents/base2/base2.ts
@@ -69,8 +69,10 @@ export function createBase2(
       'researcher-web',
       'researcher-docs',
       'commander',
-      isGpt5 && 'best-of-n-editor-gpt-5',
       isDefault && 'best-of-n-editor',
+      isGpt5 && 'best-of-n-editor-gpt-5',
+      isDefault && 'thinker-best-of-n',
+      isGpt5 && 'thinker-best-of-n-gpt-5',
       'context-pruner',
     ),
 
diff --git a/.agents/thinker/thinker-best-of-n-gpt-5.ts b/.agents/thinker/thinker-best-of-n-gpt-5.ts
@@ -0,0 +1,7 @@
+import { createThinkerBestOfN } from './thinker-best-of-n'
+
+// GPT-5 flavour of the best-of-n thinker: takes everything produced by the
+// shared factory for the 'gpt-5' model and adds this agent's own id.
+const definition = {
+  ...createThinkerBestOfN('gpt-5'),
+  id: 'thinker-best-of-n-gpt-5',
+}
+export default definition
diff --git a/.agents/thinker/thinker-best-of-n.ts b/.agents/thinker/thinker-best-of-n.ts
@@ -0,0 +1,269 @@
+import { publisher } from '../constants'
+
+import type { SecretAgentDefinition } from '../types/secret-agent-definition'
+import type { AgentStepContext, ToolCall } from '../types/agent-definition'
+
+/**
+ * Builds the best-of-n thinker agent definition, minus its `id`, for one of
+ * the two supported model families.
+ *
+ * The returned definition can only call `spawn_agents`, `set_messages` and
+ * `set_output`, and its behaviour is driven by a programmatic `handleSteps`
+ * generator rather than by a prompt.
+ *
+ * @param model - `'gpt-5'` selects the OpenAI model together with the
+ *   `-gpt-5` thinker/selector subagents; `'sonnet'` selects the Anthropic
+ *   model together with the plain `thinker` / `thinker-selector` subagents.
+ * @returns The agent definition without `id`; callers add the id themselves.
+ */
+export function createThinkerBestOfN(
+  model: 'sonnet' | 'gpt-5',
+): Omit<SecretAgentDefinition, 'id'> {
+  const isGpt5 = model === 'gpt-5'
+
+  return {
+    publisher,
+    model: isGpt5 ? 'openai/gpt-5' : 'anthropic/claude-sonnet-4.5',
+    displayName: isGpt5 ? 'Best-of-N GPT-5 Thinker' : 'Best-of-N Thinker',
+    spawnerPrompt:
+      'Generates deep thinking by orchestrating multiple thinker agents, selects the best thinking output. Use this to help solve a hard problem. You must first gather all the relevant context *BEFORE* spawning this agent, as it can only think.',
+
+    includeMessageHistory: true,
+    inheritParentSystemPrompt: true,
+
+    toolNames: ['spawn_agents', 'set_messages', 'set_output'],
+    // Must list the same agent types that the matching step handler spawns.
+    spawnableAgents: isGpt5
+      ? ['thinker-gpt-5', 'thinker-selector-gpt-5']
+      : ['thinker', 'thinker-selector'],
+
+    inputSchema: {
+      prompt: {
+        type: 'string',
+        description: 'The problem you are trying to solve',
+      },
+      params: {
+        type: 'object',
+        properties: {
+          // The step handlers clamp this value to the range 1..10 and use 5
+          // when it is omitted.
+          n: {
+            type: 'number',
+            description:
+              'Number of parallel thinker agents to spawn. Defaults to 5. Use fewer for simple questions and max of 10 for complex questions.',
+          },
+        },
+      },
+    },
+    outputMode: 'structured_output',
+
+    // Each model family has its own handler, hard-wired to its subagent names.
+    handleSteps: isGpt5 ? handleStepsGpt5 : handleStepsSonnet,
+  }
+}
+
+/**
+ * Programmatic step handler for the Sonnet best-of-n thinker.
+ *
+ * Flow:
+ * 1. Drop the last message from this agent's history via `set_messages`.
+ * 2. Spawn `n` `thinker` agents on the same prompt.
+ * 3. Label the successful outputs A, B, C, ... and hand them to
+ *    `thinker-selector`, which answers with the id of the best one.
+ * 4. Publish the chosen output through `set_output` as `{ response }`, or
+ *    `{ error }` when no thinker succeeded, the selector failed, or the
+ *    selected id does not match any thought.
+ *
+ * `params.n` is clamped to 1..10 and defaults to 5 when missing or not a
+ * finite number.
+ *
+ * NOTE(review): the helpers are declared inside this generator and duplicated
+ * in `handleStepsGpt5`; presumably handlers must be self-contained — confirm
+ * before hoisting them to module scope.
+ */
+function* handleStepsSonnet({
+  agentState,
+  prompt,
+  params,
+}: AgentStepContext): ReturnType<
+  NonNullable<SecretAgentDefinition['handleSteps']>
+> {
+  const thinkerAgent = 'thinker'
+  const selectorAgent = 'thinker-selector'
+  // A non-numeric `n` would turn into NaN, survive the clamp, and make
+  // `Array.from({ length: NaN })` spawn zero thinkers; use the default instead.
+  const requestedN = Number(params?.n ?? 5)
+  const n = Number.isFinite(requestedN)
+    ? Math.min(10, Math.max(1, Math.floor(requestedN)))
+    : 5
+
+  // Remove userInstruction message for this agent.
+  const messages = agentState.messageHistory.concat()
+  messages.pop()
+  yield {
+    toolName: 'set_messages',
+    input: {
+      messages,
+    },
+    includeToolCall: false,
+  } satisfies ToolCall<'set_messages'>
+
+  const { toolResult: thinkersResult1 } = yield {
+    toolName: 'spawn_agents',
+    input: {
+      agents: Array.from({ length: n }, () => ({
+        agent_type: thinkerAgent,
+        prompt,
+      })),
+    },
+    includeToolCall: false,
+  } satisfies ToolCall<'spawn_agents'>
+
+  // Keep only successful outputs: a failed thinker comes back as an
+  // `{ errorMessage }` placeholder, which must not be offered to the selector
+  // (or returned to the caller) as if it were a candidate thought.
+  const thinkersResult = extractSpawnResults<string>(thinkersResult1).filter(
+    (result): result is string => !isSpawnError(result),
+  )
+
+  if (thinkersResult.length === 0) {
+    yield {
+      toolName: 'set_output',
+      input: { error: 'All thinker agents failed to produce an output.' },
+    } satisfies ToolCall<'set_output'>
+    return
+  }
+
+  // Extract all the thinking outputs
+  const letters = 'ABCDEFGHIJKLMNOPQRSTUVWXYZ'
+  const thoughts = thinkersResult.map((content, index) => ({
+    id: letters[index],
+    content,
+  }))
+
+  // Spawn selector with thoughts as params
+  const { toolResult: selectorResult } = yield {
+    toolName: 'spawn_agents',
+    input: {
+      agents: [
+        {
+          agent_type: selectorAgent,
+          params: { thoughts },
+        },
+      ],
+    },
+    includeToolCall: false,
+  } satisfies ToolCall<'spawn_agents'>
+
+  const selectorOutput = extractSpawnResults<{
+    thoughtId: string
+  }>(selectorResult)[0]
+
+  // With no usable selector result the lookup above yields undefined, and the
+  // `in` operator would throw a TypeError on it; report an error instead.
+  if (!selectorOutput) {
+    yield {
+      toolName: 'set_output',
+      input: { error: 'Thinker selector returned no output.' },
+    } satisfies ToolCall<'set_output'>
+    return
+  }
+  if (isSpawnError(selectorOutput)) {
+    yield {
+      toolName: 'set_output',
+      input: { error: selectorOutput.errorMessage },
+    } satisfies ToolCall<'set_output'>
+    return
+  }
+  const { thoughtId } = selectorOutput
+  const chosenThought = thoughts.find((thought) => thought.id === thoughtId)
+  if (!chosenThought) {
+    yield {
+      toolName: 'set_output',
+      input: { error: 'Failed to find chosen thinking output.' },
+    } satisfies ToolCall<'set_output'>
+    return
+  }
+
+  // Set output with the chosen thinking
+  yield {
+    toolName: 'set_output',
+    input: {
+      response: chosenThought.content,
+    },
+    includeToolCall: false,
+  } satisfies ToolCall<'set_output'>
+
+  /** True when a spawn result is the `{ errorMessage }` failure placeholder. */
+  function isSpawnError(result: unknown): result is { errorMessage: string } {
+    return (
+      typeof result === 'object' && result !== null && 'errorMessage' in result
+    )
+  }
+
+  /**
+   * Flattens the `json` entries of a `spawn_agents` tool result into one item
+   * per spawned agent: the agent's value when present, otherwise an
+   * `{ errorMessage }` placeholder. Returns an empty list for no result.
+   */
+  function extractSpawnResults<T>(
+    results: any[] | undefined,
+  ): (T | { errorMessage: string })[] {
+    if (!results) return []
+    const spawnedResults = results
+      .filter((result) => result.type === 'json')
+      .map((result) => result.value)
+      .flat() as {
+      agentType: string
+      value: { value?: T; errorMessage?: string }
+    }[]
+    return spawnedResults.map(
+      (result) =>
+        result.value.value ??
+        ({
+          errorMessage:
+            result.value.errorMessage ?? 'Error extracting spawn results',
+        } as { errorMessage: string }),
+    )
+  }
+}
+
+/**
+ * Programmatic step handler for the GPT-5 best-of-n thinker.
+ *
+ * Flow:
+ * 1. Drop the last message from this agent's history via `set_messages`.
+ * 2. Spawn `n` `thinker-gpt-5` agents on the same prompt.
+ * 3. Label the successful outputs A, B, C, ... and hand them to
+ *    `thinker-selector-gpt-5`, which answers with the id of the best one.
+ * 4. Publish the chosen output through `set_output` as `{ response }`, or
+ *    `{ error }` when no thinker succeeded, the selector failed, or the
+ *    selected id does not match any thought.
+ *
+ * `params.n` is clamped to 1..10 and defaults to 5 when missing or not a
+ * finite number.
+ *
+ * NOTE(review): the helpers are declared inside this generator and duplicated
+ * in `handleStepsSonnet`; presumably handlers must be self-contained — confirm
+ * before hoisting them to module scope.
+ */
+function* handleStepsGpt5({
+  agentState,
+  prompt,
+  params,
+}: AgentStepContext): ReturnType<
+  NonNullable<SecretAgentDefinition['handleSteps']>
+> {
+  const thinkerAgent = 'thinker-gpt-5'
+  const selectorAgent = 'thinker-selector-gpt-5'
+  // A non-numeric `n` would turn into NaN, survive the clamp, and make
+  // `Array.from({ length: NaN })` spawn zero thinkers; use the default instead.
+  const requestedN = Number(params?.n ?? 5)
+  const n = Number.isFinite(requestedN)
+    ? Math.min(10, Math.max(1, Math.floor(requestedN)))
+    : 5
+
+  // Remove userInstruction message for this agent.
+  const messages = agentState.messageHistory.concat()
+  messages.pop()
+  yield {
+    toolName: 'set_messages',
+    input: {
+      messages,
+    },
+    includeToolCall: false,
+  } satisfies ToolCall<'set_messages'>
+
+  const { toolResult: thinkersResult1 } = yield {
+    toolName: 'spawn_agents',
+    input: {
+      agents: Array.from({ length: n }, () => ({
+        agent_type: thinkerAgent,
+        prompt,
+      })),
+    },
+    includeToolCall: false,
+  } satisfies ToolCall<'spawn_agents'>
+
+  // Keep only successful outputs: a failed thinker comes back as an
+  // `{ errorMessage }` placeholder, which must not be offered to the selector
+  // (or returned to the caller) as if it were a candidate thought.
+  const thinkersResult = extractSpawnResults<string>(thinkersResult1).filter(
+    (result): result is string => !isSpawnError(result),
+  )
+
+  if (thinkersResult.length === 0) {
+    yield {
+      toolName: 'set_output',
+      input: { error: 'All thinker agents failed to produce an output.' },
+    } satisfies ToolCall<'set_output'>
+    return
+  }
+
+  // Extract all the thinking outputs
+  const letters = 'ABCDEFGHIJKLMNOPQRSTUVWXYZ'
+  const thoughts = thinkersResult.map((content, index) => ({
+    id: letters[index],
+    content,
+  }))
+
+  // Spawn selector with thoughts as params
+  const { toolResult: selectorResult } = yield {
+    toolName: 'spawn_agents',
+    input: {
+      agents: [
+        {
+          agent_type: selectorAgent,
+          params: { thoughts },
+        },
+      ],
+    },
+    includeToolCall: false,
+  } satisfies ToolCall<'spawn_agents'>
+
+  const selectorOutput = extractSpawnResults<{
+    thoughtId: string
+  }>(selectorResult)[0]
+
+  // With no usable selector result the lookup above yields undefined, and the
+  // `in` operator would throw a TypeError on it; report an error instead.
+  if (!selectorOutput) {
+    yield {
+      toolName: 'set_output',
+      input: { error: 'Thinker selector returned no output.' },
+    } satisfies ToolCall<'set_output'>
+    return
+  }
+  if (isSpawnError(selectorOutput)) {
+    yield {
+      toolName: 'set_output',
+      input: { error: selectorOutput.errorMessage },
+    } satisfies ToolCall<'set_output'>
+    return
+  }
+  const { thoughtId } = selectorOutput
+  const chosenThought = thoughts.find((thought) => thought.id === thoughtId)
+  if (!chosenThought) {
+    yield {
+      toolName: 'set_output',
+      input: { error: 'Failed to find chosen thinking output.' },
+    } satisfies ToolCall<'set_output'>
+    return
+  }
+
+  // Set output with the chosen thinking
+  yield {
+    toolName: 'set_output',
+    input: {
+      response: chosenThought.content,
+    },
+    includeToolCall: false,
+  } satisfies ToolCall<'set_output'>
+
+  /** True when a spawn result is the `{ errorMessage }` failure placeholder. */
+  function isSpawnError(result: unknown): result is { errorMessage: string } {
+    return (
+      typeof result === 'object' && result !== null && 'errorMessage' in result
+    )
+  }
+
+  /**
+   * Flattens the `json` entries of a `spawn_agents` tool result into one item
+   * per spawned agent: the agent's value when present, otherwise an
+   * `{ errorMessage }` placeholder. Returns an empty list for no result.
+   */
+  function extractSpawnResults<T>(
+    results: any[] | undefined,
+  ): (T | { errorMessage: string })[] {
+    if (!results) return []
+    const spawnedResults = results
+      .filter((result) => result.type === 'json')
+      .map((result) => result.value)
+      .flat() as {
+      agentType: string
+      value: { value?: T; errorMessage?: string }
+    }[]
+    return spawnedResults.map(
+      (result) =>
+        result.value.value ??
+        ({
+          errorMessage:
+            result.value.errorMessage ?? 'Error extracting spawn results',
+        } as { errorMessage: string }),
+    )
+  }
+}
+
+// Default (Sonnet) flavour of the best-of-n thinker: the shared factory's
+// definition for the 'sonnet' model plus this agent's own id.
+const definition: SecretAgentDefinition = {
+  ...createThinkerBestOfN('sonnet'),
+  id: 'thinker-best-of-n',
+}
+
+export default definition
diff --git a/.agents/thinker/thinker-selector-gpt-5.ts b/.agents/thinker/thinker-selector-gpt-5.ts
@@ -0,0 +1,77 @@
+import { type SecretAgentDefinition } from '../types/secret-agent-definition'
+import { publisher } from '../constants'
+
+// Selector agent for the GPT-5 best-of-n thinker workflow: it receives the
+// candidate thinking outputs through `params.thoughts` and reports the id of
+// the one it judges best via `set_output`.
+const definition: SecretAgentDefinition = {
+  id: 'thinker-selector-gpt-5',
+  publisher,
+  model: 'openai/gpt-5',
+  displayName: 'Thinker Output Selector GPT-5',
+  spawnerPrompt: 'Analyzes multiple thinking outputs and selects the best one',
+
+  includeMessageHistory: true,
+  inheritParentSystemPrompt: true,
+
+  // The selector's only tool is `set_output`, and it may not spawn any agents.
+  toolNames: ['set_output'],
+  spawnableAgents: [],
+
+  // Input: a required list of `{ id, content }` candidates.
+  inputSchema: {
+    params: {
+      type: 'object',
+      properties: {
+        thoughts: {
+          type: 'array',
+          items: {
+            type: 'object',
+            properties: {
+              id: { type: 'string' },
+              content: { type: 'string' },
+            },
+            required: ['id', 'content'],
+          },
+        },
+      },
+      required: ['thoughts'],
+    },
+  },
+  // Output: a single required `thoughtId` naming the selected candidate.
+  outputMode: 'structured_output',
+  outputSchema: {
+    type: 'object',
+    properties: {
+      thoughtId: {
+        type: 'string',
+        description: 'The id of the chosen thinking output',
+      },
+    },
+    required: ['thoughtId'],
+  },
+
+  instructionsPrompt: `As part of the best-of-n workflow for thinking agents, you are the thinking selector agent.
+  
+## Task Instructions
+
+You have been provided with multiple thinking outputs via params.
+
+The thoughts are available in the params.thoughts array, where each has:
+- id: A unique identifier for the thinking output
+- content: The full thinking text
+
+Your task is to analyze each thinking output carefully, compare them against the original user question, and select the best thinking.
+Evaluate each based on (in order of importance):
+- Depth and thoroughness in addressing the user's question.
+- Correctness and accuracy of insights.
+- Clarity and organization of thoughts.
+- Practical actionability of recommendations.
+- Consideration of edge cases and alternatives.
+
+## User Request
+
+Try to select the thinking output that best answers the user's problem.
+
+## Response Format
+
+If the best one is obvious or the outputs are very similar, you may not need to think very much (a few words suffice) or you may not need to use think tags at all, just pick the best one and output it. You have a dual goal of picking the best thinking and being fast (using as few words as possible).
+
+Then, do not write any other explanations AT ALL. You should directly output a single tool call to set_output with the selected thoughtId.`,
+}
+
+export default definition
diff --git a/.agents/thinker/thinker-selector.ts b/.agents/thinker/thinker-selector.ts
diff --git a/cli/src/components/tools/read-files.tsx b/cli/src/components/tools/read-files.tsx