Skip to content

Commit 9efe7cc

Browse files
committed
Put back run eval set to initial config
1 parent 95196ac commit 9efe7cc

File tree

3 files changed

+18
-18
lines changed

3 files changed

+18
-18
lines changed

evals/git-evals/run-eval-set.ts

Lines changed: 16 additions & 16 deletions
Original file line number | Diff line number | Diff line change
@@ -72,7 +72,7 @@ class RunEvalSetCommand extends Command {
7272
}),
7373
agent: Flags.string({
7474
description: 'Codebuff agent id to use',
75-
default: 'base-layer', // hi
75+
default: 'base-lite',
7676
}),
7777
help: Flags.help({ char: 'h' }),
7878
}
@@ -134,21 +134,21 @@ async function runEvalSet(options: {
134134
evalDataPath: path.join(__dirname, 'eval-codebuff2.json'),
135135
outputDir,
136136
},
137-
// {
138-
// name: 'manifold',
139-
// evalDataPath: path.join(__dirname, 'eval-manifold2.json'),
140-
// outputDir,
141-
// },
142-
// {
143-
// name: 'plane',
144-
// evalDataPath: path.join(__dirname, 'eval-plane.json'),
145-
// outputDir,
146-
// },
147-
// {
148-
// name: 'saleor',
149-
// evalDataPath: path.join(__dirname, 'eval-saleor.json'),
150-
// outputDir,
151-
// },
137+
{
138+
name: 'manifold',
139+
evalDataPath: path.join(__dirname, 'eval-manifold2.json'),
140+
outputDir,
141+
},
142+
{
143+
name: 'plane',
144+
evalDataPath: path.join(__dirname, 'eval-plane.json'),
145+
outputDir,
146+
},
147+
{
148+
name: 'saleor',
149+
evalDataPath: path.join(__dirname, 'eval-saleor.json'),
150+
outputDir,
151+
},
152152
]
153153

154154
console.log(`Running ${evalConfigs.length} evaluations:`)

evals/git-evals/run-single-eval-process.ts

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -74,7 +74,7 @@ async function main() {
7474
fingerprintId,
7575
codingAgent as any,
7676
agent,
77-
true,
77+
false,
7878
)
7979

8080
// Check again after long-running operation

evals/git-evals/run-single-eval.ts

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -199,7 +199,7 @@ async function runSingleEvalTask(options: {
199199
fingerprintId,
200200
codingAgent,
201201
agentType,
202-
true,
202+
false,
203203
)
204204

205205
const duration = Date.now() - startTime

0 commit comments

Comments
 (0)