Upload exp_phase8_reasoning_grounded_rl_t2_r128_alpha1_s2_20260507_023054/log.jsonl with huggingface_hub
Browse files
exp_phase8_reasoning_grounded_rl_t2_r128_alpha1_s2_20260507_023054/log.jsonl
CHANGED
|
@@ -38,3 +38,14 @@
|
|
| 38 |
{"step": 185, "loss": -28.08819580078125, "mean_r": -0.11071428656578064, "max_r": -0.05714285746216774, "mean_grounded": 4.25, "mean_halluc": 7.0, "mean_cited": 11.75, "mean_tf_grounded_rate": 0.36904761904761907, "gnorm": 377.2549743652344, "elapsed_s": 5958.770046949387, "cell": "Ast", "id": "train:pair_pos:Ast:EPS8L2:chr11_618176_618676:231"}
|
| 39 |
{"step": 190, "loss": -84.53244018554688, "mean_r": 0.11698877811431885, "max_r": 0.9117646813392639, "mean_grounded": 11.5, "mean_halluc": 5.75, "mean_cited": 17.5, "mean_tf_grounded_rate": 0.4924369747899159, "gnorm": 301.6457214355469, "elapsed_s": 6107.5840899944305, "cell": "Ast", "id": "train:pair_pos:Ast:ZBTB17:chr1_16187654_16188154:3652"}
|
| 40 |
{"step": 195, "loss": 33.700984954833984, "mean_r": -0.03437022119760513, "max_r": 0.1315789520740509, "mean_grounded": 5.25, "mean_halluc": 7.5, "mean_cited": 12.75, "mean_tf_grounded_rate": 0.3979082321187584, "gnorm": 404.85498046875, "elapsed_s": 6255.567425727844, "cell": "Ast", "id": "train:pair_pos:Ast:ITPK1-AS1:chr14_93082659_93083159:1782"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 38 |
{"step": 185, "loss": -28.08819580078125, "mean_r": -0.11071428656578064, "max_r": -0.05714285746216774, "mean_grounded": 4.25, "mean_halluc": 7.0, "mean_cited": 11.75, "mean_tf_grounded_rate": 0.36904761904761907, "gnorm": 377.2549743652344, "elapsed_s": 5958.770046949387, "cell": "Ast", "id": "train:pair_pos:Ast:EPS8L2:chr11_618176_618676:231"}
|
| 39 |
{"step": 190, "loss": -84.53244018554688, "mean_r": 0.11698877811431885, "max_r": 0.9117646813392639, "mean_grounded": 11.5, "mean_halluc": 5.75, "mean_cited": 17.5, "mean_tf_grounded_rate": 0.4924369747899159, "gnorm": 301.6457214355469, "elapsed_s": 6107.5840899944305, "cell": "Ast", "id": "train:pair_pos:Ast:ZBTB17:chr1_16187654_16188154:3652"}
|
| 40 |
{"step": 195, "loss": 33.700984954833984, "mean_r": -0.03437022119760513, "max_r": 0.1315789520740509, "mean_grounded": 5.25, "mean_halluc": 7.5, "mean_cited": 12.75, "mean_tf_grounded_rate": 0.3979082321187584, "gnorm": 404.85498046875, "elapsed_s": 6255.567425727844, "cell": "Ast", "id": "train:pair_pos:Ast:ITPK1-AS1:chr14_93082659_93083159:1782"}
|
| 41 |
+
{"step": 200, "loss": -17.7750244140625, "mean_r": -0.1870279610157013, "max_r": 0.11999999731779099, "mean_grounded": 5.0, "mean_halluc": 8.5, "mean_cited": 13.5, "mean_tf_grounded_rate": 0.3370629370629371, "gnorm": 387.2765808105469, "elapsed_s": 6405.924955368042, "cell": "Mic", "id": "train:pair_neg:Mic:ANXA4:chr2_69742465_69742965:3354"}
|
| 42 |
+
{"step": 205, "loss": 27.041183471679688, "mean_r": -0.013921566307544708, "max_r": 0.13333334028720856, "mean_grounded": 4.5, "mean_halluc": 5.75, "mean_cited": 10.5, "mean_tf_grounded_rate": 0.44183006535947716, "gnorm": 269.1871337890625, "elapsed_s": 6558.646851301193, "cell": "Ast", "id": "train:pair_pos:Ast:KCNQ1:chr11_2402023_2402523:1314"}
|
| 43 |
+
{"step": 210, "loss": 7.7697906494140625, "mean_r": -0.4541608691215515, "max_r": -0.03846153989434242, "mean_grounded": 2.0, "mean_halluc": 8.5, "mean_cited": 11.25, "mean_tf_grounded_rate": 0.1701048951048951, "gnorm": 408.90081787109375, "elapsed_s": 6681.592452287674, "cell": "In", "id": "train:pair_pos:In:DNAJC5G:chr2_27132966_27133466:2182"}
|
| 44 |
+
{"step": 215, "loss": -85.06522369384766, "mean_r": 0.03412698581814766, "max_r": 0.4000000059604645, "mean_grounded": 5.0, "mean_halluc": 7.5, "mean_cited": 13.25, "mean_tf_grounded_rate": 0.43253968253968256, "gnorm": 366.5877990722656, "elapsed_s": 6830.9244821071625, "cell": "Ast", "id": "train:pair_pos:Ast:CMTM5:chr14_23358259_23358759:316"}
|
| 45 |
+
{"step": 220, "loss": -104.04539489746094, "mean_r": -0.10083332657814026, "max_r": 1.0, "mean_grounded": 2.0, "mean_halluc": 5.75, "mean_cited": 8.0, "mean_tf_grounded_rate": 0.3732142857142857, "gnorm": 270.4681701660156, "elapsed_s": 6991.258186578751, "cell": "Ast", "id": "train:pair_pos:Ast:VASN:chr16_4613123_4613623:2361"}
|
| 46 |
+
{"step": 225, "loss": 76.3250732421875, "mean_r": -0.6625000238418579, "max_r": -0.4000000059604645, "mean_grounded": 1.0, "mean_halluc": 7.0, "mean_cited": 8.0, "mean_tf_grounded_rate": 0.11458333333333333, "gnorm": 277.0542297363281, "elapsed_s": 7131.870132923126, "cell": "Oli", "id": "train:pair_neg:Oli:WWC2:chr4_182875317_182875817:1392"}
|
| 47 |
+
{"step": 230, "loss": -97.54570770263672, "mean_r": -0.5177790522575378, "max_r": -0.3333333432674408, "mean_grounded": 1.75, "mean_halluc": 8.25, "mean_cited": 10.25, "mean_tf_grounded_rate": 0.18514328808446456, "gnorm": 476.21917724609375, "elapsed_s": 7276.466025114059, "cell": "In", "id": "train:pair_neg:In:FBXW2:chr9_120926274_120926774:3085"}
|
| 48 |
+
{"step": 235, "loss": -13.307289123535156, "mean_r": -0.16236519813537598, "max_r": 0.11249999701976776, "mean_grounded": 5.25, "mean_halluc": 8.75, "mean_cited": 14.5, "mean_tf_grounded_rate": 0.35490196078431374, "gnorm": 427.806640625, "elapsed_s": 7430.018545389175, "cell": "Ast", "id": "train:pair_pos:Ast:CELA2B:chr1_15385743_15386243:3423"}
|
| 49 |
+
{"step": 240, "loss": -46.60246276855469, "mean_r": -0.2937484681606293, "max_r": -0.14444445073604584, "mean_grounded": 3.5, "mean_halluc": 8.0, "mean_cited": 11.5, "mean_tf_grounded_rate": 0.30531135531135534, "gnorm": 417.65228271484375, "elapsed_s": 7575.789538860321, "cell": "Ast", "id": "train:pair_pos:Ast:ERICH6B:chr13_45833621_45834121:528"}
|
| 50 |
+
{"step": 245, "loss": 3.6889114379882812, "mean_r": -0.03144840896129608, "max_r": 0.08571428805589676, "mean_grounded": 5.0, "mean_halluc": 6.75, "mean_cited": 11.75, "mean_tf_grounded_rate": 0.4146825396825397, "gnorm": 415.8805847167969, "elapsed_s": 7706.871344327927, "cell": "Ex", "id": "train:pair_neg:Ex:MLXIP:chr12_122123119_122123619:2978"}
|
| 51 |
+
{"step": 250, "loss": -76.9756088256836, "mean_r": -0.14845821261405945, "max_r": 0.20666666328907013, "mean_grounded": 5.0, "mean_halluc": 8.0, "mean_cited": 13.25, "mean_tf_grounded_rate": 0.3656010656010656, "gnorm": 400.9198913574219, "elapsed_s": 7868.239282131195, "cell": "Ast", "id": "train:pair_pos:Ast:GALNT8:chr12_4779697_4780197:499"}
|