eval: submit GPQA Diamond result via PR (community badge)

#1
by terry-u - opened
Files changed (1) hide show
  1. .eval_results/gpqa.yaml +4 -0
.eval_results/gpqa.yaml CHANGED
@@ -3,4 +3,8 @@
3
  task_id: gpqa_diamond
4
  value: 0.01
5
  date: "2026-06-16"
 
 
 
 
6
  notes: "parody/practice repo — model NOT actually evaluated; value 0.01 is a placeholder set by repo owner, not a measured score"
 
3
  task_id: gpqa_diamond
4
  value: 0.01
5
  date: "2026-06-16"
6
+ source:
7
+   url: https://huggingface.co/terry-u/my-first-model
8
+   name: self-reported placeholder (not a measured eval)
9
+   user: terry-u
10
  notes: "parody/practice repo — model NOT actually evaluated; value 0.01 is a placeholder set by repo owner, not a measured score"