@@ -25,7 +25,7 @@ import { isValidationSample } from './collect-tuning-data'
// Run configuration constants (shown here as diff context; the -/+ pair below is the only change in this hunk).
// isProd is true when the literal '--prod' appears among the process's command-line arguments.
2525const isProd = process . argv . includes ( '--prod' )
// DATASET resolves to 'codebuff_data' when isProd is true, otherwise to 'codebuff_data_dev'.
2626const DATASET = isProd ? 'codebuff_data' : 'codebuff_data_dev'
2727const MAX_PARALLEL = 5 // Maximum number of traces to process in parallel for relabeling
// This diff raises LIMIT from 400 to 4000.
28- const LIMIT = 400 // Total limit of traces to process
28+ const LIMIT = 4000 // Total limit of traces to process
// NOTE(review): the trailing comment mentions a user-provided cursor, but only this hard-coded
// timestamp literal is visible in this view — confirm whether an override exists elsewhere.
2929const START_CURSOR = '2025-05-31T00:00:00.000Z' // User-provided start cursor or default
3030
// Model identifier string; how it is consumed is not visible in this view.
3131const GROUND_TRUTH_MODEL = 'claude-opus-4-20250514-with-full-file-context-new'
@@ -306,18 +306,18 @@ const scoringFunctions = {
306306 fn : ( teacher : string , student : string ) =>
307307 jaccardSimilarity ( teacher , student ) ,
308308 } ,
// Scoring entry whose fn forwards (teacher, student) to jaccardSimilarity with a third argument.
// This diff changes that argument from 3 to 2 and updates the name/description strings to match.
// NOTE(review): the property key itself is renamed (jaccardTop3 -> jaccardTop2); confirm that
// nothing outside this view still reads the old key.
309- jaccardTop3 : {
310- name : 'Jaccard Similarity (Top 3 ) (↑ is better)' ,
309+ jaccardTop2 : {
310+ name : 'Jaccard Similarity (Top 2 ) (↑ is better)' ,
311311 description :
312- 'Filters both the teacher and student outputs to the top 3 files, then calculates Jaccard Similarity' ,
312+ 'Filters both the teacher and student outputs to the top 2 files, then calculates Jaccard Similarity' ,
313313 fn : ( teacher : string , student : string ) =>
314- jaccardSimilarity ( teacher , student , 3 ) ,
314+ jaccardSimilarity ( teacher , student , 2 ) ,
315315 } ,
// Scoring entry whose fn forwards (teacher, student) to mrr with a third argument.
// This diff changes that argument from 3 to 2 and updates the name/description strings to match;
// the property key stays `mrr`.
316316 mrr : {
317- name : 'MRR (Top 3 , average) (↑ is better)' ,
317+ name : 'MRR (Top 2 , average) (↑ is better)' ,
318318 description :
319- 'Rewards students (1/rank) for each file that is in the top 3 of the teacher' ,
320- fn : ( teacher : string , student : string ) => mrr ( teacher , student , 3 ) ,
319+ 'Rewards students (1/rank) for each file that is in the top 2 of the teacher' ,
320+ fn : ( teacher : string , student : string ) => mrr ( teacher , student , 2 ) ,
321321 } ,
322322}
323323
0 commit comments