Skip to content

Commit 6e81cc3

Browse files
committed
feat: include judge model name in summary
Made-with: Cursor
1 parent 676aa2c commit 6e81cc3

1 file changed

Lines changed: 5 additions & 0 deletions

File tree

ci_eval_runner.py

Lines changed: 5 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -282,11 +282,15 @@ def parse_results(
282282
"metric_scores": {},
283283
})
284284

285+
judge_cfg = config.get("judgeLlm", {})
286+
judge_name = judge_cfg.get("model", "") or judge_cfg.get("name", "")
287+
285288
return {
286289
"experiment_id": experiment.get("id", ""),
287290
"name": experiment.get("name", ""),
288291
"status": experiment.get("status", "unknown"),
289292
"model": config.get("model", {}).get("name", "Unknown"),
293+
"judge": judge_name,
290294
"total_prompts": results.get("total_prompts", 0),
291295
"duration_ms": results.get("duration"),
292296
"passed": all_passed,
@@ -312,6 +316,7 @@ def generate_markdown(results: Dict[str, Any]) -> str:
312316
"",
313317
f"**Experiment:** {results['name']} ",
314318
f"**Model:** {model} ",
319+
f"**Judge:** {results.get('judge') or 'gpt-4o'} ",
315320
f"**Status:** {results['status']} ",
316321
f"**Samples:** {results['total_prompts']} ",
317322
]

0 commit comments

Comments (0)