explcre commited on
Commit
b0ccd2a
·
verified ·
1 Parent(s): 1e8d17e

Upload exp_phase8_reasoning_grounded_rl_t3_r128_alpha1_s3_par_20260507_005010/log.jsonl with huggingface_hub

Browse files
exp_phase8_reasoning_grounded_rl_t3_r128_alpha1_s3_par_20260507_005010/log.jsonl CHANGED
@@ -7,3 +7,13 @@
7
  {"step": 30, "loss": -26.32823944091797, "mean_r": -0.5035101175308228, "max_r": -0.1818181872367859, "mean_grounded": 1.75, "mean_halluc": 8.75, "mean_cited": 11.75, "mean_tf_grounded_rate": 0.15012626262626264, "gnorm": 437.66583251953125, "elapsed_s": 1052.7420649528503, "cell": "Mic", "id": "train:edit:Mic:CDH15:chr16_88977794_88978294:2991"}
8
  {"step": 35, "loss": 93.8807601928711, "mean_r": -0.7846736907958984, "max_r": -0.6666666865348816, "mean_grounded": 1.0, "mean_halluc": 10.75, "mean_cited": 12.25, "mean_tf_grounded_rate": 0.06973581973581974, "gnorm": 400.18951416015625, "elapsed_s": 1229.797791481018, "cell": "In", "id": "train:edit:In:LRRC56:chr11_640216_640716:3357"}
9
  {"step": 40, "loss": -175.54000854492188, "mean_r": -0.442307710647583, "max_r": 0.0, "mean_grounded": 1.75, "mean_halluc": 11.0, "mean_cited": 12.75, "mean_tf_grounded_rate": 0.11615384615384616, "gnorm": 377.7589416503906, "elapsed_s": 1414.281956911087, "cell": "Mic", "id": "train:edit:Mic:SIPA1:chr11_65652352_65652852:3382"}
 
 
 
 
 
 
 
 
 
 
 
7
  {"step": 30, "loss": -26.32823944091797, "mean_r": -0.5035101175308228, "max_r": -0.1818181872367859, "mean_grounded": 1.75, "mean_halluc": 8.75, "mean_cited": 11.75, "mean_tf_grounded_rate": 0.15012626262626264, "gnorm": 437.66583251953125, "elapsed_s": 1052.7420649528503, "cell": "Mic", "id": "train:edit:Mic:CDH15:chr16_88977794_88978294:2991"}
8
  {"step": 35, "loss": 93.8807601928711, "mean_r": -0.7846736907958984, "max_r": -0.6666666865348816, "mean_grounded": 1.0, "mean_halluc": 10.75, "mean_cited": 12.25, "mean_tf_grounded_rate": 0.06973581973581974, "gnorm": 400.18951416015625, "elapsed_s": 1229.797791481018, "cell": "In", "id": "train:edit:In:LRRC56:chr11_640216_640716:3357"}
9
  {"step": 40, "loss": -175.54000854492188, "mean_r": -0.442307710647583, "max_r": 0.0, "mean_grounded": 1.75, "mean_halluc": 11.0, "mean_cited": 12.75, "mean_tf_grounded_rate": 0.11615384615384616, "gnorm": 377.7589416503906, "elapsed_s": 1414.281956911087, "cell": "Mic", "id": "train:edit:Mic:SIPA1:chr11_65652352_65652852:3382"}
10
+ {"step": 45, "loss": -76.31844329833984, "mean_r": -0.1133333295583725, "max_r": 0.06666667014360428, "mean_grounded": 0.5, "mean_halluc": 2.25, "mean_cited": 3.25, "mean_tf_grounded_rate": 0.10833333333333334, "gnorm": 432.98297119140625, "elapsed_s": 1591.3449778556824, "cell": "Ast", "id": "train:edit:Ast:SYN3:chr22_32843166_32843666:1656"}
11
+ {"step": 50, "loss": -85.02119445800781, "mean_r": -0.45192307233810425, "max_r": 0.0, "mean_grounded": 0.0, "mean_halluc": 3.25, "mean_cited": 3.5, "mean_tf_grounded_rate": 0.0, "gnorm": 240.878173828125, "elapsed_s": 1773.7889394760132, "cell": "Ex", "id": "train:edit:Ex:PSMD1:chr2_230924334_230924834:3881"}
12
+ {"step": 55, "loss": -95.26789855957031, "mean_r": -0.5940476059913635, "max_r": -0.2857142984867096, "mean_grounded": 1.0, "mean_halluc": 8.0, "mean_cited": 9.25, "mean_tf_grounded_rate": 0.15178571428571427, "gnorm": 421.9581298828125, "elapsed_s": 1944.9084331989288, "cell": "Oli", "id": "train:edit:Oli:INPP5K:chr17_1648718_1649218:2894"}
13
+ {"step": 60, "loss": 87.06375122070312, "mean_r": -0.7466386556625366, "max_r": -0.5571428537368774, "mean_grounded": 0.5, "mean_halluc": 8.0, "mean_cited": 8.5, "mean_tf_grounded_rate": 0.06696428571428571, "gnorm": 389.80181884765625, "elapsed_s": 2113.1579599380493, "cell": "OPC", "id": "train:edit:OPC:AGPS:chr2_177628765_177629265:3135"}
14
+ {"step": 65, "loss": -187.80018615722656, "mean_r": -0.42097902297973633, "max_r": 0.0, "mean_grounded": 0.25, "mean_halluc": 6.25, "mean_cited": 6.5, "mean_tf_grounded_rate": 0.125, "gnorm": 367.68402099609375, "elapsed_s": 2292.572273492813, "cell": "In", "id": "train:edit:In:PLXNA4:chr7_132869181_132869681:2731"}
15
+ {"step": 70, "loss": -86.65145874023438, "mean_r": -0.6621212363243103, "max_r": 0.0, "mean_grounded": 0.0, "mean_halluc": 3.5, "mean_cited": 3.75, "mean_tf_grounded_rate": 0.0, "gnorm": 172.92315673828125, "elapsed_s": 2474.1830286979675, "cell": "Ex", "id": "train:edit:Ex:LRRN4CL:chr11_62936740_62937240:643"}
16
+ {"step": 75, "loss": -72.8033218383789, "mean_r": 0.18611112236976624, "max_r": 1.2000000476837158, "mean_grounded": 1.5, "mean_halluc": 2.5, "mean_cited": 4.25, "mean_tf_grounded_rate": 0.3888888888888889, "gnorm": 278.49725341796875, "elapsed_s": 2648.636190891266, "cell": "Ex", "id": "train:edit:Ex:CKAP4:chr12_106125394_106125894:3365"}
17
+ {"step": 80, "loss": -191.45631408691406, "mean_r": -0.1815476268529892, "max_r": 0.10000000149011612, "mean_grounded": 0.75, "mean_halluc": 4.0, "mean_cited": 5.25, "mean_tf_grounded_rate": 0.19642857142857142, "gnorm": 511.4512634277344, "elapsed_s": 2828.817238330841, "cell": "OPC", "id": "train:edit:OPC:IL17RB:chr3_53796142_53796642:3987"}
18
+ {"step": 85, "loss": -157.27638244628906, "mean_r": -0.4334615468978882, "max_r": 0.0, "mean_grounded": 1.0, "mean_halluc": 9.0, "mean_cited": 10.75, "mean_tf_grounded_rate": 0.07596153846153847, "gnorm": 334.5196533203125, "elapsed_s": 3008.4655957221985, "cell": "Ex", "id": "train:edit:Ex:SV2C:chr5_76025055_76025555:612"}
19
+ {"step": 90, "loss": -147.7225341796875, "mean_r": -0.5180357098579407, "max_r": 0.0, "mean_grounded": 1.0, "mean_halluc": 8.5, "mean_cited": 10.0, "mean_tf_grounded_rate": 0.07410714285714286, "gnorm": 270.45025634765625, "elapsed_s": 3189.0442271232605, "cell": "Mic", "id": "train:edit:Mic:ATP6V1A:chr3_113670476_113670976:86"}