glm-5.2-RedlineBench

#19
Files changed (1) hide show
  1. .eval_results/redlinebench.yaml +10 -0
.eval_results/redlinebench.yaml ADDED
@@ -0,0 +1,10 @@
 
 
 
 
 
 
 
 
 
 
 
1
+ - dataset:
2
+ id: crosbylegal/RedlineBench
3
+ task_id: redline_overall
4
+ value: 45.7
5
+ date: "2026-06-19"
6
+ source:
7
+ url: https://huggingface.co/zai-org/GLM-5.2
8
+ name: Model Card
9
+ user: crosbylegal
10
+ notes: "agent=glm-5.2; 3-LLM judge panel (majority vote); turn-weighted weighted pass rate (0-100); post-publication run"