Skip to content

Commit f558f58

Browse files
committed
base2-fast-with-validation
1 parent 422e2a4 commit f558f58

File tree

3 files changed

+17
-12
lines changed

3 files changed

+17
-12
lines changed
Lines changed: 8 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,8 @@
1+
import { createBase2 } from './base2'
2+
3+
// Agent definition for the 'fast-with-validation' variant. It spreads the
// object returned by createBase2('fast-with-validation') and then sets `id`
// and `displayName`; properties written after a spread take precedence over
// same-named properties coming from the spread.
// NOTE(review): createBase2's declared return type omits `id`, so `id` is
// supplied here. Whether the spread also carries a `displayName` is not
// visible in this view — confirm.
const definition = {
4+
...createBase2('fast-with-validation'),
5+
id: 'base2-fast-with-validation',
6+
displayName: 'Buffy the Fast Validation Orchestrator',
7+
}
8+
export default definition

.agents/base2/base2.ts

Lines changed: 7 additions & 6 deletions
Original file line numberDiff line numberDiff line change
@@ -7,10 +7,11 @@ import {
77
} from '../types/secret-agent-definition'
88

99
export const createBase2: (
10-
mode: 'fast' | 'max',
10+
mode: 'fast' | 'max' | 'fast-with-validation',
1111
) => Omit<SecretAgentDefinition, 'id'> = (mode) => {
12-
const isFast = mode === 'fast'
12+
const isFast = mode === 'fast' || mode === 'fast-with-validation'
1313
const isMax = mode === 'max'
14+
const isFastWithValidation = mode === 'fast-with-validation'
1415
return {
1516
publisher,
1617
model: 'anthropic/claude-sonnet-4.5',
@@ -139,13 +140,13 @@ The user asks you to implement a new feature. You respond in multiple steps:
139140
${
140141
isFast
141142
? `3. Write out your implementation plan as a bullet point list.
142-
4. Use the str_replace or write_file tool to make the changes.`
143+
4. Use the str_replace or write_file tool to make the changes.
144+
${isFastWithValidation ? '5. Test your changes by running appropriate validation commands for the project (e.g. typechecks, tests, lints, etc.). You may have to explore the project to find the appropriate commands.\n' : ''}`
143145
: `3. IMPORTANT: You must spawn a base2-gpt-5-worker agent inline (with spawn_agent_inline tool) to do the planning and editing.
144146
4. Fix any issues left by the base2-gpt-5-worker agent.`
145147
}
146-
5. Inform the user that you have completed the task in one sentence without a final summary. Don't create any markdown summary files either, unless asked by the user. If you already finished the user request and said you're done, then don't say anything else.`,
147-
stepPrompt: `Don't forget to spawn agents that could help, especially: the file-picker-max and code-searcher to get codebase context,${isMax ? ' the base2-gpt-5-worker agent to do the planning and editing,' : ''}.`,
148-
148+
${isFastWithValidation ? '6' : '5'}. Inform the user that you have completed the task in one sentence without a final summary. Don't create any markdown summary files either, unless asked by the user. If you already finished the user request and said you're done, then don't say anything else.`,
149+
stepPrompt: `Don't forget to spawn agents that could help, especially: the file-picker-max and code-searcher to get codebase context,${isMax ? ' the base2-gpt-5-worker agent to do the planning and editing,' : ''}. After completing the user request, summarize your changes in a sentence or a few short bullet points. Do not create any summary markdown files, unless asked by the user. Then, end your turn.`,
149150
handleSteps: function* ({ params }) {
150151
let steps = 0
151152
while (true) {

evals/buffbench/main.ts

Lines changed: 2 additions & 6 deletions
Original file line numberDiff line numberDiff line change
@@ -5,12 +5,8 @@ import { runBuffBench } from './run-buffbench'
55
async function main() {
66
await runBuffBench({
77
evalDataPath: path.join(__dirname, 'eval-codebuff.json'),
8-
agents: [
9-
'base2-fast-thinking',
10-
'base2-fast-thinking-tags',
11-
'base2-fast-thinking-tool',
12-
],
13-
taskConcurrency: 2,
8+
agents: ['base2-fast-with-validation'],
9+
taskConcurrency: 5,
1410
})
1511

1612
process.exit(0)

0 commit comments

Comments
 (0)