explcre commited on
Commit
00e2032
·
verified ·
1 Parent(s): 86300c6

Upload exp_phase8_reasoning_grounded_rl_t3_r128_alpha1_s3_par_20260507_005010/log.jsonl with huggingface_hub

Browse files
exp_phase8_reasoning_grounded_rl_t3_r128_alpha1_s3_par_20260507_005010/log.jsonl CHANGED
@@ -27,3 +27,12 @@
27
  {"step": 130, "loss": -97.35746765136719, "mean_r": -0.23000000417232513, "max_r": 0.0, "mean_grounded": 0.0, "mean_halluc": 3.75, "mean_cited": 3.75, "mean_tf_grounded_rate": 0.0, "gnorm": 294.1395263671875, "elapsed_s": 4680.179282903671, "cell": "OPC", "id": "train:edit:OPC:ZNF502:chr3_44476289_44476789:1834"}
28
  {"step": 135, "loss": -110.84915924072266, "mean_r": -0.04444444179534912, "max_r": 0.5, "mean_grounded": 0.75, "mean_halluc": 2.25, "mean_cited": 3.25, "mean_tf_grounded_rate": 0.1875, "gnorm": 398.39111328125, "elapsed_s": 4871.525849580765, "cell": "In", "id": "train:edit:In:NOP14:chr4_2834473_2834973:99"}
29
  {"step": 140, "loss": -101.678955078125, "mean_r": -0.17023809254169464, "max_r": 0.0833333358168602, "mean_grounded": 2.0, "mean_halluc": 5.75, "mean_cited": 8.5, "mean_tf_grounded_rate": 0.19791666666666669, "gnorm": 475.77886962890625, "elapsed_s": 5063.330948114395, "cell": "OPC", "id": "train:edit:OPC:DEDD2:chr19_42244624_42245124:4082"}
 
 
 
 
 
 
 
 
 
 
27
  {"step": 130, "loss": -97.35746765136719, "mean_r": -0.23000000417232513, "max_r": 0.0, "mean_grounded": 0.0, "mean_halluc": 3.75, "mean_cited": 3.75, "mean_tf_grounded_rate": 0.0, "gnorm": 294.1395263671875, "elapsed_s": 4680.179282903671, "cell": "OPC", "id": "train:edit:OPC:ZNF502:chr3_44476289_44476789:1834"}
28
  {"step": 135, "loss": -110.84915924072266, "mean_r": -0.04444444179534912, "max_r": 0.5, "mean_grounded": 0.75, "mean_halluc": 2.25, "mean_cited": 3.25, "mean_tf_grounded_rate": 0.1875, "gnorm": 398.39111328125, "elapsed_s": 4871.525849580765, "cell": "In", "id": "train:edit:In:NOP14:chr4_2834473_2834973:99"}
29
  {"step": 140, "loss": -101.678955078125, "mean_r": -0.17023809254169464, "max_r": 0.0833333358168602, "mean_grounded": 2.0, "mean_halluc": 5.75, "mean_cited": 8.5, "mean_tf_grounded_rate": 0.19791666666666669, "gnorm": 475.77886962890625, "elapsed_s": 5063.330948114395, "cell": "OPC", "id": "train:edit:OPC:DEDD2:chr19_42244624_42245124:4082"}
30
+ {"step": 145, "loss": 0.0, "mean_r": 0.0, "max_r": 0.0, "mean_grounded": 0.0, "mean_halluc": 0.0, "mean_cited": 0.0, "mean_tf_grounded_rate": 0.0, "gnorm": 0.0, "elapsed_s": 5254.912788152695, "cell": "Oli", "id": "train:edit:Oli:KIF2C:chr1_44660824_44661324:2156"}
31
+ {"step": 150, "loss": -171.71832275390625, "mean_r": -0.5221154093742371, "max_r": 0.0, "mean_grounded": 1.25, "mean_halluc": 9.5, "mean_cited": 10.75, "mean_tf_grounded_rate": 0.06944444444444445, "gnorm": 360.0874938964844, "elapsed_s": 5441.150552749634, "cell": "Ex", "id": "train:edit:Ex:CEP85:chr1_26016496_26016996:503"}
32
+ {"step": 155, "loss": 84.17100524902344, "mean_r": -0.7821428775787354, "max_r": -0.12857143580913544, "mean_grounded": 1.5, "mean_halluc": 4.0, "mean_cited": 5.5, "mean_tf_grounded_rate": 0.10714285714285714, "gnorm": 330.9013366699219, "elapsed_s": 5630.904017925262, "cell": "Mic", "id": "train:edit:Mic:MYO7B:chr2_127390933_127391433:1686"}
33
+ {"step": 160, "loss": 25.723966598510742, "mean_r": 0.1785714328289032, "max_r": 0.7142857313156128, "mean_grounded": 1.5, "mean_halluc": 0.25, "mean_cited": 1.75, "mean_tf_grounded_rate": 0.21428571428571427, "gnorm": 212.44644165039062, "elapsed_s": 5820.547861814499, "cell": "Oli", "id": "train:edit:Oli:ZNF839:chr14_102191452_102191952:1198"}
34
+ {"step": 165, "loss": -28.028940200805664, "mean_r": -0.25, "max_r": 0.0, "mean_grounded": 0.0, "mean_halluc": 0.25, "mean_cited": 0.25, "mean_tf_grounded_rate": 0.0, "gnorm": 167.03233337402344, "elapsed_s": 6009.097616434097, "cell": "Oli", "id": "train:edit:Oli:RAB36:chr22_23282738_23283238:73"}
35
+ {"step": 170, "loss": -107.42401885986328, "mean_r": -0.11818181723356247, "max_r": 0.4000000059604645, "mean_grounded": 0.5, "mean_halluc": 2.75, "mean_cited": 3.5, "mean_tf_grounded_rate": 0.16666666666666666, "gnorm": 400.05987548828125, "elapsed_s": 6198.614594936371, "cell": "Oli", "id": "train:edit:Oli:PURB:chr7_44749709_44750209:2026"}
36
+ {"step": 175, "loss": -38.00294876098633, "mean_r": -0.0833333358168602, "max_r": 0.0, "mean_grounded": 0.5, "mean_halluc": 0.75, "mean_cited": 1.25, "mean_tf_grounded_rate": 0.20833333333333331, "gnorm": 237.77078247070312, "elapsed_s": 6389.940973997116, "cell": "OPC", "id": "train:edit:OPC:FSCN1:chr7_5686247_5686747:71"}
37
+ {"step": 180, "loss": -28.001291275024414, "mean_r": -0.05000000074505806, "max_r": 0.0, "mean_grounded": 0.5, "mean_halluc": 0.75, "mean_cited": 1.25, "mean_tf_grounded_rate": 0.1, "gnorm": 269.5014343261719, "elapsed_s": 6581.041960954666, "cell": "End", "id": "train:edit:End:CST3:chr20_23868939_23869439:1158"}
38
+ {"step": 185, "loss": -3.159186363220215, "mean_r": -0.2750000059604645, "max_r": 0.0, "mean_grounded": 0.5, "mean_halluc": 1.25, "mean_cited": 1.75, "mean_tf_grounded_rate": 0.1, "gnorm": 151.06671142578125, "elapsed_s": 6772.244442224503, "cell": "Mic", "id": "train:edit:Mic:RIOK1:chr6_7328290_7328790:488"}