Upload exp_phase8_reasoning_grounded_rl_t1_r128_alpha1_s3_20260506_234027/log.jsonl with huggingface_hub
Browse files
exp_phase8_reasoning_grounded_rl_t1_r128_alpha1_s3_20260506_234027/log.jsonl
CHANGED
|
@@ -47,3 +47,5 @@
|
|
| 47 |
{"step": 230, "loss": -27.773218154907227, "mean_r": 0.9260683655738831, "max_r": 1.0153846740722656, "mean_grounded": 15.75, "mean_halluc": 0.75, "mean_cited": 16.5, "mean_tf_grounded_rate": 0.9566993464052288, "gnorm": 244.86892700195312, "elapsed_s": 8755.290162801743, "cell": "In", "id": "train:gen:In:PIWIL4:chr11_94449296_94449796:2721"}
|
| 48 |
{"step": 235, "loss": -10.545574188232422, "mean_r": 0.8249242305755615, "max_r": 1.0, "mean_grounded": 17.0, "mean_halluc": 1.25, "mean_cited": 18.5, "mean_tf_grounded_rate": 0.900378787878788, "gnorm": 149.94134521484375, "elapsed_s": 8945.831612348557, "cell": "Ex", "id": "train:gen:Ex:NFASC:chr1_205041149_205041649:3983"}
|
| 49 |
{"step": 240, "loss": 0.0, "mean_r": 1.0, "max_r": 1.0, "mean_grounded": 9.5, "mean_halluc": 0.0, "mean_cited": 9.5, "mean_tf_grounded_rate": 1.0, "gnorm": 0.0, "elapsed_s": 9137.309298276901, "cell": "Ast", "id": "train:gen:Ast:DBX2:chr12_45045323_45045823:3205"}
|
|
|
|
|
|
|
|
|
| 47 |
{"step": 230, "loss": -27.773218154907227, "mean_r": 0.9260683655738831, "max_r": 1.0153846740722656, "mean_grounded": 15.75, "mean_halluc": 0.75, "mean_cited": 16.5, "mean_tf_grounded_rate": 0.9566993464052288, "gnorm": 244.86892700195312, "elapsed_s": 8755.290162801743, "cell": "In", "id": "train:gen:In:PIWIL4:chr11_94449296_94449796:2721"}
|
| 48 |
{"step": 235, "loss": -10.545574188232422, "mean_r": 0.8249242305755615, "max_r": 1.0, "mean_grounded": 17.0, "mean_halluc": 1.25, "mean_cited": 18.5, "mean_tf_grounded_rate": 0.900378787878788, "gnorm": 149.94134521484375, "elapsed_s": 8945.831612348557, "cell": "Ex", "id": "train:gen:Ex:NFASC:chr1_205041149_205041649:3983"}
|
| 49 |
{"step": 240, "loss": 0.0, "mean_r": 1.0, "max_r": 1.0, "mean_grounded": 9.5, "mean_halluc": 0.0, "mean_cited": 9.5, "mean_tf_grounded_rate": 1.0, "gnorm": 0.0, "elapsed_s": 9137.309298276901, "cell": "Ast", "id": "train:gen:Ast:DBX2:chr12_45045323_45045823:3205"}
|
| 50 |
+
{"step": 245, "loss": -4.2411627769470215, "mean_r": 0.8541666865348816, "max_r": 1.0, "mean_grounded": 6.5, "mean_halluc": 0.5, "mean_cited": 7.0, "mean_tf_grounded_rate": 0.9270833333333334, "gnorm": 159.23463439941406, "elapsed_s": 9328.251233100891, "cell": "Mic", "id": "train:gen:Mic:TMEM201:chr1_9652450_9652950:2560"}
|
| 51 |
+
{"step": 250, "loss": -16.410385131835938, "mean_r": 0.8243464231491089, "max_r": 1.0, "mean_grounded": 16.5, "mean_halluc": 1.5, "mean_cited": 18.25, "mean_tf_grounded_rate": 0.9048202614379085, "gnorm": 204.27130126953125, "elapsed_s": 9519.763813734055, "cell": "Oli", "id": "train:gen:Oli:TAF6L:chr11_62711786_62712286:3329"}
|