Upload _reasoning_rl_multiseed/eval_reasoning_t2_v7r128_postRL_alpha1_s3_20260507_044835/score.json with huggingface_hub
Browse files
_reasoning_rl_multiseed/eval_reasoning_t2_v7r128_postRL_alpha1_s3_20260507_044835/score.json
ADDED
|
@@ -0,0 +1,71 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"n_rows": 50,
|
| 3 |
+
"format": {
|
| 4 |
+
"reasoning_tags_rate": 0.74,
|
| 5 |
+
"dna_tags_rate": 0.08,
|
| 6 |
+
"cell_mention_rate": 0.86,
|
| 7 |
+
"mean_len_chars": 1111.82,
|
| 8 |
+
"p10_len_chars": 616.7,
|
| 9 |
+
"p90_len_chars": 2075.4
|
| 10 |
+
},
|
| 11 |
+
"tf_grounding": {
|
| 12 |
+
"mean_tf_grounded_rate": 0.2666117252466633,
|
| 13 |
+
"mean_n_cited": 15.2,
|
| 14 |
+
"mean_n_grounded": 4.7,
|
| 15 |
+
"mean_n_canonical_only": 0.34,
|
| 16 |
+
"mean_n_hallucinated": 10.16,
|
| 17 |
+
"mean_motif_consensus": 0.2680326215779302,
|
| 18 |
+
"mean_prog_coverage": 0.16297619047619047
|
| 19 |
+
},
|
| 20 |
+
"per_cell": {
|
| 21 |
+
"Ast": {
|
| 22 |
+
"n": 5,
|
| 23 |
+
"tf_grounded_rate": 0.27113095238095236,
|
| 24 |
+
"n_cited": 12.6,
|
| 25 |
+
"len_chars": 1158.6,
|
| 26 |
+
"cell_mention": 1.0
|
| 27 |
+
},
|
| 28 |
+
"End": {
|
| 29 |
+
"n": 3,
|
| 30 |
+
"tf_grounded_rate": 0.2969574036511156,
|
| 31 |
+
"n_cited": 28.666666666666668,
|
| 32 |
+
"len_chars": 1770.3333333333333,
|
| 33 |
+
"cell_mention": 1.0
|
| 34 |
+
},
|
| 35 |
+
"Ex": {
|
| 36 |
+
"n": 15,
|
| 37 |
+
"tf_grounded_rate": 0.2260506160506161,
|
| 38 |
+
"n_cited": 9.8,
|
| 39 |
+
"len_chars": 913.2666666666667,
|
| 40 |
+
"cell_mention": 0.8666666666666667
|
| 41 |
+
},
|
| 42 |
+
"In": {
|
| 43 |
+
"n": 4,
|
| 44 |
+
"tf_grounded_rate": 0.3968418043393217,
|
| 45 |
+
"n_cited": 29.25,
|
| 46 |
+
"len_chars": 1242.75,
|
| 47 |
+
"cell_mention": 0.75
|
| 48 |
+
},
|
| 49 |
+
"Mic": {
|
| 50 |
+
"n": 13,
|
| 51 |
+
"tf_grounded_rate": 0.27188515653328704,
|
| 52 |
+
"n_cited": 14.384615384615385,
|
| 53 |
+
"len_chars": 1015.6923076923077,
|
| 54 |
+
"cell_mention": 0.8461538461538461
|
| 55 |
+
},
|
| 56 |
+
"OPC": {
|
| 57 |
+
"n": 2,
|
| 58 |
+
"tf_grounded_rate": 0.2375,
|
| 59 |
+
"n_cited": 25.0,
|
| 60 |
+
"len_chars": 1579.0,
|
| 61 |
+
"cell_mention": 1.0
|
| 62 |
+
},
|
| 63 |
+
"Oli": {
|
| 64 |
+
"n": 8,
|
| 65 |
+
"tf_grounded_rate": 0.26205322455322455,
|
| 66 |
+
"n_cited": 13.75,
|
| 67 |
+
"len_chars": 1181.875,
|
| 68 |
+
"cell_mention": 0.75
|
| 69 |
+
}
|
| 70 |
+
}
|
| 71 |
+
}
|