Upload exp_phase8_reasoning_grounded_rl_t1_r128_alpha1_s3_20260506_234027/log.jsonl with huggingface_hub
Browse files
exp_phase8_reasoning_grounded_rl_t1_r128_alpha1_s3_20260506_234027/log.jsonl
CHANGED
|
@@ -28,3 +28,13 @@
|
|
| 28 |
{"step": 135, "loss": -111.39610290527344, "mean_r": 0.22946429252624512, "max_r": 0.7928571701049805, "mean_grounded": 7.75, "mean_halluc": 4.0, "mean_cited": 12.0, "mean_tf_grounded_rate": 0.4575892857142857, "gnorm": 391.5924072265625, "elapsed_s": 5130.675909519196, "cell": "OPC", "id": "train:gen:OPC:DTX1:chr12_112936839_112937339:1095"}
|
| 29 |
{"step": 140, "loss": 13.05216121673584, "mean_r": 0.10606060922145844, "max_r": 0.3333333432674408, "mean_grounded": 6.75, "mean_halluc": 5.75, "mean_cited": 12.5, "mean_tf_grounded_rate": 0.553030303030303, "gnorm": 245.5005340576172, "elapsed_s": 5321.55585026741, "cell": "OPC", "id": "train:gen:OPC:TRIM13:chr13_50080258_50080758:654"}
|
| 30 |
{"step": 145, "loss": -57.27449417114258, "mean_r": 0.11188725382089615, "max_r": 0.875, "mean_grounded": 8.75, "mean_halluc": 7.5, "mean_cited": 16.25, "mean_tf_grounded_rate": 0.5559436274509805, "gnorm": 286.83270263671875, "elapsed_s": 5512.434992551804, "cell": "OPC", "id": "train:gen:OPC:FITM1:chr14_24093418_24093918:2986"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 28 |
{"step": 135, "loss": -111.39610290527344, "mean_r": 0.22946429252624512, "max_r": 0.7928571701049805, "mean_grounded": 7.75, "mean_halluc": 4.0, "mean_cited": 12.0, "mean_tf_grounded_rate": 0.4575892857142857, "gnorm": 391.5924072265625, "elapsed_s": 5130.675909519196, "cell": "OPC", "id": "train:gen:OPC:DTX1:chr12_112936839_112937339:1095"}
|
| 29 |
{"step": 140, "loss": 13.05216121673584, "mean_r": 0.10606060922145844, "max_r": 0.3333333432674408, "mean_grounded": 6.75, "mean_halluc": 5.75, "mean_cited": 12.5, "mean_tf_grounded_rate": 0.553030303030303, "gnorm": 245.5005340576172, "elapsed_s": 5321.55585026741, "cell": "OPC", "id": "train:gen:OPC:TRIM13:chr13_50080258_50080758:654"}
|
| 30 |
{"step": 145, "loss": -57.27449417114258, "mean_r": 0.11188725382089615, "max_r": 0.875, "mean_grounded": 8.75, "mean_halluc": 7.5, "mean_cited": 16.25, "mean_tf_grounded_rate": 0.5559436274509805, "gnorm": 286.83270263671875, "elapsed_s": 5512.434992551804, "cell": "OPC", "id": "train:gen:OPC:FITM1:chr14_24093418_24093918:2986"}
|
| 31 |
+
{"step": 150, "loss": -107.69103240966797, "mean_r": 0.30532610416412354, "max_r": 0.9166666865348816, "mean_grounded": 14.75, "mean_halluc": 6.25, "mean_cited": 21.0, "mean_tf_grounded_rate": 0.6301630434782609, "gnorm": 396.09039306640625, "elapsed_s": 5703.050578832626, "cell": "Ex", "id": "train:gen:Ex:ARL8A:chr1_202143325_202143825:1970"}
|
| 32 |
+
{"step": 155, "loss": 98.78294372558594, "mean_r": -0.6161764860153198, "max_r": 0.0, "mean_grounded": 3.5, "mean_halluc": 11.0, "mean_cited": 14.75, "mean_tf_grounded_rate": 0.16911764705882354, "gnorm": 299.56903076171875, "elapsed_s": 5893.349708557129, "cell": "In", "id": "train:gen:In:NRIP3:chr11_9004973_9005473:1745"}
|
| 33 |
+
{"step": 160, "loss": -102.66815948486328, "mean_r": 0.72383713722229, "max_r": 0.892307698726654, "mean_grounded": 13.75, "mean_halluc": 3.0, "mean_cited": 17.5, "mean_tf_grounded_rate": 0.7922402159244265, "gnorm": 363.1687316894531, "elapsed_s": 6082.912489652634, "cell": "End", "id": "train:gen:End:ACAP3:chr1_1352442_1352942:123"}
|
| 34 |
+
{"step": 165, "loss": -184.34024047851562, "mean_r": -0.11614219844341278, "max_r": 0.4000000059604645, "mean_grounded": 4.75, "mean_halluc": 7.5, "mean_cited": 12.25, "mean_tf_grounded_rate": 0.38417832167832167, "gnorm": 405.32208251953125, "elapsed_s": 6272.354876279831, "cell": "OPC", "id": "train:gen:OPC:MCF2L:chr13_113031501_113032001:2002"}
|
| 35 |
+
{"step": 170, "loss": -57.68060302734375, "mean_r": 0.6530753970146179, "max_r": 0.925000011920929, "mean_grounded": 12.0, "mean_halluc": 3.0, "mean_cited": 15.0, "mean_tf_grounded_rate": 0.7994543650793651, "gnorm": 224.40769958496094, "elapsed_s": 6463.121914625168, "cell": "End", "id": "train:gen:End:SH3D21:chr1_36135198_36135698:1360"}
|
| 36 |
+
{"step": 175, "loss": -89.436767578125, "mean_r": -0.03766339272260666, "max_r": 0.38823530077934265, "mean_grounded": 7.0, "mean_halluc": 9.25, "mean_cited": 17.0, "mean_tf_grounded_rate": 0.42218137254901955, "gnorm": 447.1673583984375, "elapsed_s": 6654.3291845321655, "cell": "Ast", "id": "train:gen:Ast:DIP2B:chr12_50621812_50622312:3965"}
|
| 37 |
+
{"step": 180, "loss": -82.02870178222656, "mean_r": 0.21198831498622894, "max_r": 0.6000000238418579, "mean_grounded": 8.5, "mean_halluc": 7.25, "mean_cited": 15.75, "mean_tf_grounded_rate": 0.576827485380117, "gnorm": 213.66537475585938, "elapsed_s": 6845.035688877106, "cell": "Ex", "id": "train:gen:Ex:NAV1:chr1_201780264_201780764:1654"}
|
| 38 |
+
{"step": 185, "loss": 13.997580528259277, "mean_r": 0.9831638336181641, "max_r": 1.0666667222976685, "mean_grounded": 19.75, "mean_halluc": 0.5, "mean_cited": 20.25, "mean_tf_grounded_rate": 0.973389355742297, "gnorm": 181.38186645507812, "elapsed_s": 7036.699383020401, "cell": "Ex", "id": "train:gen:Ex:SH3GL2:chr9_17580139_17580639:1755"}
|
| 39 |
+
{"step": 190, "loss": -64.85012817382812, "mean_r": 0.8214423060417175, "max_r": 1.0, "mean_grounded": 9.75, "mean_halluc": 1.75, "mean_cited": 12.0, "mean_tf_grounded_rate": 0.8479967948717949, "gnorm": 208.01470947265625, "elapsed_s": 7226.780698776245, "cell": "Ast", "id": "train:gen:Ast:BCL9L:chr11_118921285_118921785:2605"}
|
| 40 |
+
{"step": 195, "loss": -144.64866638183594, "mean_r": -0.3027777671813965, "max_r": 0.0, "mean_grounded": 1.75, "mean_halluc": 8.0, "mean_cited": 11.25, "mean_tf_grounded_rate": 0.14484126984126983, "gnorm": 423.9998474121094, "elapsed_s": 7416.172049045563, "cell": "Oli", "id": "train:gen:Oli:PNPLA2:chr11_727281_727781:568"}
|