explcre commited on
Commit
355a44d
·
verified ·
1 Parent(s): 24bb4af

Upload exp_phase8_reasoning_grounded_rl_t2_r128_alpha1_s3_20260507_044835/log.jsonl with huggingface_hub

Browse files
exp_phase8_reasoning_grounded_rl_t2_r128_alpha1_s3_20260507_044835/log.jsonl CHANGED
@@ -19,3 +19,13 @@
19
  {"step": 90, "loss": 59.57316589355469, "mean_r": -0.029230769723653793, "max_r": 0.023076923564076424, "mean_grounded": 4.75, "mean_halluc": 6.75, "mean_cited": 11.5, "mean_tf_grounded_rate": 0.4115384615384615, "gnorm": 399.2134704589844, "elapsed_s": 3084.458697080612, "cell": "Ast", "id": "train:pair_pos:Ast:COPS7A:chr12_6527155_6527655:959"}
20
  {"step": 95, "loss": -68.27378845214844, "mean_r": -0.4207359254360199, "max_r": -0.18000000715255737, "mean_grounded": 4.0, "mean_halluc": 15.5, "mean_cited": 20.0, "mean_tf_grounded_rate": 0.23564213564213565, "gnorm": 456.6268615722656, "elapsed_s": 3245.223747253418, "cell": "Ast", "id": "train:pair_pos:Ast:LRP4:chr11_47118852_47119352:1335"}
21
  {"step": 100, "loss": -225.0859375, "mean_r": -0.4487878680229187, "max_r": 0.0, "mean_grounded": 1.5, "mean_halluc": 9.25, "mean_cited": 10.75, "mean_tf_grounded_rate": 0.1140151515151515, "gnorm": 478.38421630859375, "elapsed_s": 3415.2856843471527, "cell": "Ast", "id": "train:pair_pos:Ast:LRRC55:chr11_57211308_57211808:2019"}
 
 
 
 
 
 
 
 
 
 
 
19
  {"step": 90, "loss": 59.57316589355469, "mean_r": -0.029230769723653793, "max_r": 0.023076923564076424, "mean_grounded": 4.75, "mean_halluc": 6.75, "mean_cited": 11.5, "mean_tf_grounded_rate": 0.4115384615384615, "gnorm": 399.2134704589844, "elapsed_s": 3084.458697080612, "cell": "Ast", "id": "train:pair_pos:Ast:COPS7A:chr12_6527155_6527655:959"}
20
  {"step": 95, "loss": -68.27378845214844, "mean_r": -0.4207359254360199, "max_r": -0.18000000715255737, "mean_grounded": 4.0, "mean_halluc": 15.5, "mean_cited": 20.0, "mean_tf_grounded_rate": 0.23564213564213565, "gnorm": 456.6268615722656, "elapsed_s": 3245.223747253418, "cell": "Ast", "id": "train:pair_pos:Ast:LRP4:chr11_47118852_47119352:1335"}
21
  {"step": 100, "loss": -225.0859375, "mean_r": -0.4487878680229187, "max_r": 0.0, "mean_grounded": 1.5, "mean_halluc": 9.25, "mean_cited": 10.75, "mean_tf_grounded_rate": 0.1140151515151515, "gnorm": 478.38421630859375, "elapsed_s": 3415.2856843471527, "cell": "Ast", "id": "train:pair_pos:Ast:LRRC55:chr11_57211308_57211808:2019"}
22
+ {"step": 105, "loss": 17.90606689453125, "mean_r": -0.27145832777023315, "max_r": 0.21250000596046448, "mean_grounded": 4.5, "mean_halluc": 9.0, "mean_cited": 14.0, "mean_tf_grounded_rate": 0.28541666666666665, "gnorm": 433.63720703125, "elapsed_s": 3582.237601995468, "cell": "Ast", "id": "train:pair_pos:Ast:FAM41C:chr1_941520_942020:24"}
23
+ {"step": 110, "loss": -40.341552734375, "mean_r": -0.32681816816329956, "max_r": -0.25999999046325684, "mean_grounded": 2.75, "mean_halluc": 7.5, "mean_cited": 10.5, "mean_tf_grounded_rate": 0.26136363636363635, "gnorm": 447.862548828125, "elapsed_s": 3734.9819555282593, "cell": "End", "id": "train:pair_pos:End:TMEM121:chr14_105498656_105499156:902"}
24
+ {"step": 115, "loss": -1.363128662109375, "mean_r": -0.2780681848526001, "max_r": -0.027272727340459824, "mean_grounded": 5.25, "mean_halluc": 10.75, "mean_cited": 17.0, "mean_tf_grounded_rate": 0.29384469696969695, "gnorm": 419.2023620605469, "elapsed_s": 3889.340273141861, "cell": "Ast", "id": "train:pair_pos:Ast:ZDHHC5:chr11_57427617_57428117:2307"}
25
+ {"step": 120, "loss": -149.09262084960938, "mean_r": -0.21353384852409363, "max_r": 1.0, "mean_grounded": 3.0, "mean_halluc": 7.5, "mean_cited": 11.5, "mean_tf_grounded_rate": 0.3488721804511278, "gnorm": 328.8318176269531, "elapsed_s": 4057.9865713119507, "cell": "Ex", "id": "train:pair_neg:Ex:PHETA1:chr12_111185910_111186410:479"}
26
+ {"step": 125, "loss": 99.04361724853516, "mean_r": -0.15386904776096344, "max_r": -0.03333333507180214, "mean_grounded": 3.5, "mean_halluc": 6.0, "mean_cited": 10.0, "mean_tf_grounded_rate": 0.3392857142857143, "gnorm": 437.196044921875, "elapsed_s": 4230.925471782684, "cell": "OPC", "id": "train:pair_neg:OPC:ALDOA:chr16_30030479_30030979:296"}
27
+ {"step": 130, "loss": -45.3918571472168, "mean_r": 0.004186604171991348, "max_r": 0.22727273404598236, "mean_grounded": 5.25, "mean_halluc": 7.25, "mean_cited": 13.0, "mean_tf_grounded_rate": 0.4162038619275461, "gnorm": 412.8166198730469, "elapsed_s": 4410.347144365311, "cell": "Oli", "id": "train:pair_neg:Oli:UBN1:chr16_4967030_4967530:837"}
28
+ {"step": 135, "loss": -100.61750793457031, "mean_r": -0.24108392000198364, "max_r": 0.0, "mean_grounded": 2.25, "mean_halluc": 6.75, "mean_cited": 9.25, "mean_tf_grounded_rate": 0.18356643356643357, "gnorm": 369.89801025390625, "elapsed_s": 4584.195008277893, "cell": "Ast", "id": "train:pair_pos:Ast:LNX2:chr13_27638435_27638935:3808"}
29
+ {"step": 140, "loss": -88.15803527832031, "mean_r": 0.18339230120182037, "max_r": 0.699999988079071, "mean_grounded": 6.25, "mean_halluc": 7.5, "mean_cited": 14.0, "mean_tf_grounded_rate": 0.5183731387291759, "gnorm": 381.1214599609375, "elapsed_s": 4738.309872150421, "cell": "Ast", "id": "train:pair_pos:Ast:DZIP1:chr13_95496385_95496885:1925"}
30
+ {"step": 145, "loss": 79.7239990234375, "mean_r": -0.4128749966621399, "max_r": -0.05000000074505806, "mean_grounded": 3.75, "mean_halluc": 16.0, "mean_cited": 19.75, "mean_tf_grounded_rate": 0.26197916666666665, "gnorm": 376.2814025878906, "elapsed_s": 4915.069397211075, "cell": "Ast", "id": "train:pair_pos:Ast:NEK3:chr13_52390267_52390767:917"}
31
+ {"step": 150, "loss": -126.88933563232422, "mean_r": 0.23273809254169464, "max_r": 1.0333333015441895, "mean_grounded": 4.25, "mean_halluc": 4.25, "mean_cited": 9.0, "mean_tf_grounded_rate": 0.529491341991342, "gnorm": 315.1418151855469, "elapsed_s": 5090.648319244385, "cell": "Mic", "id": "train:pair_pos:Mic:GNB4:chr3_179453060_179453560:1907"}