Upload exp_phase8_reasoning_grounded_rl_t2_r128_alpha1_s2_20260507_023054/log.jsonl with huggingface_hub
Browse files
exp_phase8_reasoning_grounded_rl_t2_r128_alpha1_s2_20260507_023054/log.jsonl
CHANGED
|
@@ -14,3 +14,14 @@
|
|
| 14 |
{"step": 65, "loss": -81.56288146972656, "mean_r": -0.3091251850128174, "max_r": -0.10000000149011612, "mean_grounded": 2.75, "mean_halluc": 7.5, "mean_cited": 10.25, "mean_tf_grounded_rate": 0.2981240573152338, "gnorm": 448.92999267578125, "elapsed_s": 2267.7567059993744, "cell": "Ast", "id": "train:pair_pos:Ast:TMEM218:chr11_124928685_124929185:3554"}
|
| 15 |
{"step": 70, "loss": -42.581382751464844, "mean_r": -0.6251075863838196, "max_r": -0.18000000715255737, "mean_grounded": 1.75, "mean_halluc": 18.5, "mean_cited": 20.25, "mean_tf_grounded_rate": 0.1625, "gnorm": 347.837890625, "elapsed_s": 2436.6436779499054, "cell": "Ast", "id": "train:pair_pos:Ast:DOCK9:chr13_99208831_99209331:2173"}
|
| 16 |
{"step": 75, "loss": -62.28608703613281, "mean_r": -0.513744592666626, "max_r": -0.44545453786849976, "mean_grounded": 2.25, "mean_halluc": 9.5, "mean_cited": 11.75, "mean_tf_grounded_rate": 0.20319264069264067, "gnorm": 514.9257202148438, "elapsed_s": 2608.9937732219696, "cell": "Ast", "id": "train:pair_pos:Ast:DMXL2:chr15_51801334_51801834:1962"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 14 |
{"step": 65, "loss": -81.56288146972656, "mean_r": -0.3091251850128174, "max_r": -0.10000000149011612, "mean_grounded": 2.75, "mean_halluc": 7.5, "mean_cited": 10.25, "mean_tf_grounded_rate": 0.2981240573152338, "gnorm": 448.92999267578125, "elapsed_s": 2267.7567059993744, "cell": "Ast", "id": "train:pair_pos:Ast:TMEM218:chr11_124928685_124929185:3554"}
|
| 15 |
{"step": 70, "loss": -42.581382751464844, "mean_r": -0.6251075863838196, "max_r": -0.18000000715255737, "mean_grounded": 1.75, "mean_halluc": 18.5, "mean_cited": 20.25, "mean_tf_grounded_rate": 0.1625, "gnorm": 347.837890625, "elapsed_s": 2436.6436779499054, "cell": "Ast", "id": "train:pair_pos:Ast:DOCK9:chr13_99208831_99209331:2173"}
|
| 16 |
{"step": 75, "loss": -62.28608703613281, "mean_r": -0.513744592666626, "max_r": -0.44545453786849976, "mean_grounded": 2.25, "mean_halluc": 9.5, "mean_cited": 11.75, "mean_tf_grounded_rate": 0.20319264069264067, "gnorm": 514.9257202148438, "elapsed_s": 2608.9937732219696, "cell": "Ast", "id": "train:pair_pos:Ast:DMXL2:chr15_51801334_51801834:1962"}
|
| 17 |
+
{"step": 80, "loss": -58.18048095703125, "mean_r": -0.3349626064300537, "max_r": 0.0, "mean_grounded": 2.25, "mean_halluc": 6.75, "mean_cited": 9.5, "mean_tf_grounded_rate": 0.15998931623931623, "gnorm": 378.6766357421875, "elapsed_s": 2779.6273407936096, "cell": "Ast", "id": "train:pair_pos:Ast:C11orf44:chr11_130609830_130610330:4006"}
|
| 18 |
+
{"step": 85, "loss": 45.8577766418457, "mean_r": -0.33891940116882324, "max_r": 0.06923077255487442, "mean_grounded": 2.5, "mean_halluc": 8.75, "mean_cited": 13.0, "mean_tf_grounded_rate": 0.19711538461538464, "gnorm": 472.75494384765625, "elapsed_s": 2949.309454679489, "cell": "Oli", "id": "train:pair_pos:Oli:SERPINB9:chr6_2804901_2805401:1831"}
|
| 19 |
+
{"step": 90, "loss": -136.3919677734375, "mean_r": -0.2520102262496948, "max_r": 0.20000000298023224, "mean_grounded": 2.75, "mean_halluc": 8.25, "mean_cited": 11.5, "mean_tf_grounded_rate": 0.2907529239766082, "gnorm": 502.80377197265625, "elapsed_s": 3120.3812816143036, "cell": "Ast", "id": "train:pair_pos:Ast:TEP1:chr14_20411316_20411816:3498"}
|
| 20 |
+
{"step": 95, "loss": 11.306283950805664, "mean_r": -0.20493590831756592, "max_r": -0.13076923787593842, "mean_grounded": 3.25, "mean_halluc": 8.0, "mean_cited": 12.0, "mean_tf_grounded_rate": 0.26634615384615384, "gnorm": 384.8565979003906, "elapsed_s": 3271.7989418506622, "cell": "Mic", "id": "train:pair_pos:Mic:ZSCAN16-AS1:chr6_28235874_28236374:3612"}
|
| 21 |
+
{"step": 100, "loss": -4.005195617675781, "mean_r": -0.4769230782985687, "max_r": 0.0923076942563057, "mean_grounded": 2.5, "mean_halluc": 7.75, "mean_cited": 10.75, "mean_tf_grounded_rate": 0.19871794871794873, "gnorm": 394.97674560546875, "elapsed_s": 3434.5299413204193, "cell": "Oli", "id": "train:pair_pos:Oli:IL10RB:chr21_33060338_33060838:863"}
|
| 22 |
+
{"step": 105, "loss": -63.034637451171875, "mean_r": -0.2874999940395355, "max_r": -0.10000000149011612, "mean_grounded": 3.25, "mean_halluc": 8.75, "mean_cited": 12.75, "mean_tf_grounded_rate": 0.27261904761904765, "gnorm": 443.53277587890625, "elapsed_s": 3603.3936331272125, "cell": "Ast", "id": "train:pair_pos:Ast:CAPRIN1:chr11_34183912_34184412:3949"}
|
| 23 |
+
{"step": 110, "loss": 38.24821090698242, "mean_r": -0.4208333492279053, "max_r": -0.1666666716337204, "mean_grounded": 2.75, "mean_halluc": 7.25, "mean_cited": 10.0, "mean_tf_grounded_rate": 0.22916666666666663, "gnorm": 315.0513610839844, "elapsed_s": 3753.567712545395, "cell": "Ast", "id": "train:pair_pos:Ast:TMEM80:chr11_773346_773846:285"}
|
| 24 |
+
{"step": 115, "loss": -3.0448265075683594, "mean_r": -0.21187424659729004, "max_r": 0.7777777910232544, "mean_grounded": 3.25, "mean_halluc": 4.0, "mean_cited": 7.5, "mean_tf_grounded_rate": 0.3513431013431013, "gnorm": 200.75067138671875, "elapsed_s": 3913.7877769470215, "cell": "Ast", "id": "train:pair_pos:Ast:SPRED2:chr2_65435637_65436137:2752"}
|
| 25 |
+
{"step": 120, "loss": -22.570571899414062, "mean_r": -0.22821427881717682, "max_r": 0.18000000715255737, "mean_grounded": 3.0, "mean_halluc": 6.75, "mean_cited": 10.25, "mean_tf_grounded_rate": 0.2857142857142857, "gnorm": 352.949951171875, "elapsed_s": 4063.728887796402, "cell": "Mic", "id": "train:pair_pos:Mic:POLR1B:chr2_112701002_112701502:614"}
|
| 26 |
+
{"step": 125, "loss": -8.872991561889648, "mean_r": -0.2474999874830246, "max_r": -0.019999999552965164, "mean_grounded": 3.25, "mean_halluc": 7.75, "mean_cited": 11.0, "mean_tf_grounded_rate": 0.29583333333333334, "gnorm": 390.1910705566406, "elapsed_s": 4202.351343154907, "cell": "Ast", "id": "train:pair_pos:Ast:APH1B:chr15_63204095_63204595:2566"}
|
| 27 |
+
{"step": 130, "loss": -70.8443603515625, "mean_r": -0.5069047808647156, "max_r": -0.30000001192092896, "mean_grounded": 1.75, "mean_halluc": 12.0, "mean_cited": 14.75, "mean_tf_grounded_rate": 0.12893772893772892, "gnorm": 497.54949951171875, "elapsed_s": 4356.790739774704, "cell": "In", "id": "train:pair_neg:In:SLC22A8:chr11_62855826_62856326:1674"}
|