explcre commited on
Commit
3b030c8
·
verified ·
1 Parent(s): a4fc679

Upload exp_phase8_reasoning_grounded_rl_t1_r128_alpha1_s3_20260506_234027/log.jsonl with huggingface_hub

Browse files
exp_phase8_reasoning_grounded_rl_t1_r128_alpha1_s3_20260506_234027/log.jsonl CHANGED
@@ -38,3 +38,12 @@
38
  {"step": 185, "loss": 13.997580528259277, "mean_r": 0.9831638336181641, "max_r": 1.0666667222976685, "mean_grounded": 19.75, "mean_halluc": 0.5, "mean_cited": 20.25, "mean_tf_grounded_rate": 0.973389355742297, "gnorm": 181.38186645507812, "elapsed_s": 7036.699383020401, "cell": "Ex", "id": "train:gen:Ex:SH3GL2:chr9_17580139_17580639:1755"}
39
  {"step": 190, "loss": -64.85012817382812, "mean_r": 0.8214423060417175, "max_r": 1.0, "mean_grounded": 9.75, "mean_halluc": 1.75, "mean_cited": 12.0, "mean_tf_grounded_rate": 0.8479967948717949, "gnorm": 208.01470947265625, "elapsed_s": 7226.780698776245, "cell": "Ast", "id": "train:gen:Ast:BCL9L:chr11_118921285_118921785:2605"}
40
  {"step": 195, "loss": -144.64866638183594, "mean_r": -0.3027777671813965, "max_r": 0.0, "mean_grounded": 1.75, "mean_halluc": 8.0, "mean_cited": 11.25, "mean_tf_grounded_rate": 0.14484126984126983, "gnorm": 423.9998474121094, "elapsed_s": 7416.172049045563, "cell": "Oli", "id": "train:gen:Oli:PNPLA2:chr11_727281_727781:568"}
 
 
 
 
 
 
 
 
 
 
38
  {"step": 185, "loss": 13.997580528259277, "mean_r": 0.9831638336181641, "max_r": 1.0666667222976685, "mean_grounded": 19.75, "mean_halluc": 0.5, "mean_cited": 20.25, "mean_tf_grounded_rate": 0.973389355742297, "gnorm": 181.38186645507812, "elapsed_s": 7036.699383020401, "cell": "Ex", "id": "train:gen:Ex:SH3GL2:chr9_17580139_17580639:1755"}
39
  {"step": 190, "loss": -64.85012817382812, "mean_r": 0.8214423060417175, "max_r": 1.0, "mean_grounded": 9.75, "mean_halluc": 1.75, "mean_cited": 12.0, "mean_tf_grounded_rate": 0.8479967948717949, "gnorm": 208.01470947265625, "elapsed_s": 7226.780698776245, "cell": "Ast", "id": "train:gen:Ast:BCL9L:chr11_118921285_118921785:2605"}
40
  {"step": 195, "loss": -144.64866638183594, "mean_r": -0.3027777671813965, "max_r": 0.0, "mean_grounded": 1.75, "mean_halluc": 8.0, "mean_cited": 11.25, "mean_tf_grounded_rate": 0.14484126984126983, "gnorm": 423.9998474121094, "elapsed_s": 7416.172049045563, "cell": "Oli", "id": "train:gen:Oli:PNPLA2:chr11_727281_727781:568"}
41
+ {"step": 200, "loss": -8.827940940856934, "mean_r": 0.3575466275215149, "max_r": 0.6545454263687134, "mean_grounded": 9.25, "mean_halluc": 4.75, "mean_cited": 14.25, "mean_tf_grounded_rate": 0.6612762237762237, "gnorm": 200.6781005859375, "elapsed_s": 7606.140708208084, "cell": "Ex", "id": "train:gen:Ex:ARC:chr8_142543557_142544057:1579"}
42
+ {"step": 205, "loss": -12.655495643615723, "mean_r": 0.9017857313156128, "max_r": 1.0, "mean_grounded": 9.0, "mean_halluc": 0.5, "mean_cited": 9.5, "mean_tf_grounded_rate": 0.9508928571428572, "gnorm": 109.04293060302734, "elapsed_s": 7797.637563705444, "cell": "Oli", "id": "train:gen:Oli:OR9Q1:chr11_57816768_57817268:1813"}
43
+ {"step": 210, "loss": 22.307373046875, "mean_r": -0.20949198305606842, "max_r": 0.6363636255264282, "mean_grounded": 5.0, "mean_halluc": 6.75, "mean_cited": 12.75, "mean_tf_grounded_rate": 0.32820855614973266, "gnorm": 252.35011291503906, "elapsed_s": 7988.808565616608, "cell": "Ex", "id": "train:gen:Ex:HES5:chr1_2296362_2296862:2253"}
44
+ {"step": 215, "loss": 19.59605598449707, "mean_r": 0.8206547498703003, "max_r": 1.2000000476837158, "mean_grounded": 13.25, "mean_halluc": 2.5, "mean_cited": 15.75, "mean_tf_grounded_rate": 0.8674107142857144, "gnorm": 258.6458740234375, "elapsed_s": 8180.824372768402, "cell": "Ex", "id": "train:gen:Ex:ESPN:chr1_6262183_6262683:3483"}
45
+ {"step": 220, "loss": -35.19794464111328, "mean_r": 0.7663906812667847, "max_r": 1.0111111402511597, "mean_grounded": 19.75, "mean_halluc": 2.75, "mean_cited": 22.5, "mean_tf_grounded_rate": 0.878234989648033, "gnorm": 192.8950653076172, "elapsed_s": 8372.581154823303, "cell": "In", "id": "train:gen:In:LRMP:chr12_24818965_24819465:1071"}
46
+ {"step": 225, "loss": -11.222650527954102, "mean_r": 0.5054778456687927, "max_r": 0.8461538553237915, "mean_grounded": 8.0, "mean_halluc": 2.0, "mean_cited": 10.0, "mean_tf_grounded_rate": 0.7436480186480187, "gnorm": 160.99327087402344, "elapsed_s": 8564.304427146912, "cell": "Ex", "id": "train:gen:Ex:DFFB:chr1_3625429_3625929:2632"}
47
+ {"step": 230, "loss": -27.773218154907227, "mean_r": 0.9260683655738831, "max_r": 1.0153846740722656, "mean_grounded": 15.75, "mean_halluc": 0.75, "mean_cited": 16.5, "mean_tf_grounded_rate": 0.9566993464052288, "gnorm": 244.86892700195312, "elapsed_s": 8755.290162801743, "cell": "In", "id": "train:gen:In:PIWIL4:chr11_94449296_94449796:2721"}
48
+ {"step": 235, "loss": -10.545574188232422, "mean_r": 0.8249242305755615, "max_r": 1.0, "mean_grounded": 17.0, "mean_halluc": 1.25, "mean_cited": 18.5, "mean_tf_grounded_rate": 0.900378787878788, "gnorm": 149.94134521484375, "elapsed_s": 8945.831612348557, "cell": "Ex", "id": "train:gen:Ex:NFASC:chr1_205041149_205041649:3983"}
49
+ {"step": 240, "loss": 0.0, "mean_r": 1.0, "max_r": 1.0, "mean_grounded": 9.5, "mean_halluc": 0.0, "mean_cited": 9.5, "mean_tf_grounded_rate": 1.0, "gnorm": 0.0, "elapsed_s": 9137.309298276901, "cell": "Ast", "id": "train:gen:Ast:DBX2:chr12_45045323_45045823:3205"}