We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent 86b0642 commit 3c419ce (Copy full SHA for 3c419ce)
evals/buffbench/main-single-eval.ts
@@ -5,8 +5,8 @@ import { runBuffBench } from './run-buffbench'
5
async function main() {
6
await runBuffBench({
7
evalDataPath: path.join(__dirname, 'eval-codebuff.json'),
8
- agents: ['base2-opus'],
9
- taskIds: ['add-spawn-perms-tests'],
+ agents: ['external:claude'],
+ taskIds: ['filter-system-history'],
10
})
11
12
process.exit(0)
0 commit comments