Upload _reasoning_rl_multiseed/eval_reasoning_t3_v7r128_postRL_alpha1_s3_par_20260507_005010/score.json with huggingface_hub
Browse files
_reasoning_rl_multiseed/eval_reasoning_t3_v7r128_postRL_alpha1_s3_par_20260507_005010/score.json
ADDED
|
@@ -0,0 +1,71 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"n_rows": 50,
|
| 3 |
+
"format": {
|
| 4 |
+
"reasoning_tags_rate": 0.8,
|
| 5 |
+
"dna_tags_rate": 0.0,
|
| 6 |
+
"cell_mention_rate": 0.92,
|
| 7 |
+
"mean_len_chars": 1052.62,
|
| 8 |
+
"p10_len_chars": 735.4,
|
| 9 |
+
"p90_len_chars": 1656.0
|
| 10 |
+
},
|
| 11 |
+
"tf_grounding": {
|
| 12 |
+
"mean_tf_grounded_rate": 0.19508590161534112,
|
| 13 |
+
"mean_n_cited": 15.08,
|
| 14 |
+
"mean_n_grounded": 5.22,
|
| 15 |
+
"mean_n_canonical_only": 0.32,
|
| 16 |
+
"mean_n_hallucinated": 9.54,
|
| 17 |
+
"mean_motif_consensus": 0.3222940612630679,
|
| 18 |
+
"mean_prog_coverage": 0.1295952380952381
|
| 19 |
+
},
|
| 20 |
+
"per_cell": {
|
| 21 |
+
"Ast": {
|
| 22 |
+
"n": 5,
|
| 23 |
+
"tf_grounded_rate": 0.1787301587301587,
|
| 24 |
+
"n_cited": 9.8,
|
| 25 |
+
"len_chars": 1015.4,
|
| 26 |
+
"cell_mention": 0.8
|
| 27 |
+
},
|
| 28 |
+
"End": {
|
| 29 |
+
"n": 3,
|
| 30 |
+
"tf_grounded_rate": 0.18614718614718614,
|
| 31 |
+
"n_cited": 9.666666666666666,
|
| 32 |
+
"len_chars": 816.3333333333334,
|
| 33 |
+
"cell_mention": 1.0
|
| 34 |
+
},
|
| 35 |
+
"Ex": {
|
| 36 |
+
"n": 15,
|
| 37 |
+
"tf_grounded_rate": 0.23268385024766822,
|
| 38 |
+
"n_cited": 19.4,
|
| 39 |
+
"len_chars": 1016.7333333333333,
|
| 40 |
+
"cell_mention": 0.8666666666666667
|
| 41 |
+
},
|
| 42 |
+
"In": {
|
| 43 |
+
"n": 4,
|
| 44 |
+
"tf_grounded_rate": 0.0857843137254902,
|
| 45 |
+
"n_cited": 12.5,
|
| 46 |
+
"len_chars": 1068.75,
|
| 47 |
+
"cell_mention": 1.0
|
| 48 |
+
},
|
| 49 |
+
"Mic": {
|
| 50 |
+
"n": 13,
|
| 51 |
+
"tf_grounded_rate": 0.25437160062160064,
|
| 52 |
+
"n_cited": 16.384615384615383,
|
| 53 |
+
"len_chars": 1167.0,
|
| 54 |
+
"cell_mention": 0.9230769230769231
|
| 55 |
+
},
|
| 56 |
+
"OPC": {
|
| 57 |
+
"n": 2,
|
| 58 |
+
"tf_grounded_rate": 0.2159090909090909,
|
| 59 |
+
"n_cited": 11.5,
|
| 60 |
+
"len_chars": 937.0,
|
| 61 |
+
"cell_mention": 1.0
|
| 62 |
+
},
|
| 63 |
+
"Oli": {
|
| 64 |
+
"n": 8,
|
| 65 |
+
"tf_grounded_rate": 0.09126984126984126,
|
| 66 |
+
"n_cited": 12.375,
|
| 67 |
+
"len_chars": 1066.75,
|
| 68 |
+
"cell_mention": 1.0
|
| 69 |
+
}
|
| 70 |
+
}
|
| 71 |
+
}
|