Skip to content

Commit 0f8f63f

Browse files
committed
eval-planner: write results to a file
1 parent b992969 commit 0f8f63f

File tree

1 file changed: +28 -1 lines changed

1 file changed: +28 -1 lines changed

evals/subagents/eval-planner.ts

Lines changed: 28 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -222,6 +222,18 @@ async function main() {
222222
}),
223223
)
224224

225+
const allResults = [] as Array<{
226+
sha: string
227+
spec: string
228+
agentOutput: string
229+
judgingResults: {
230+
reasoning: string
231+
pros: string
232+
cons: string
233+
overallScore: number
234+
}
235+
}>
236+
225237
// Track statistics
226238
const stats = {
227239
total: evalCommits.length,
@@ -249,7 +261,19 @@ async function main() {
249261
fileStates,
250262
})
251263

252-
const { judgingResults } = result
264+
const { judgingResults, agentOutput } = result
265+
allResults.push({
266+
sha,
267+
spec,
268+
agentOutput,
269+
judgingResults,
270+
})
271+
272+
fs.writeFileSync(
273+
path.join(__dirname, 'eval-planner-results.json'),
274+
JSON.stringify(allResults, null, 2),
275+
)
276+
253277
const { reasoning, pros, cons, overallScore } = judgingResults
254278

255279
console.log(`\n${'='.repeat(80)}`)
@@ -262,6 +286,9 @@ async function main() {
262286
console.log('\n🧠 REASONING:')
263287
console.log(reasoning)
264288

289+
console.log('\n✅ PROS:')
290+
console.log(pros)
291+
265292
console.log('\n❌ CONS:')
266293
console.log(cons)
267294

0 commit comments

Comments (0)