Upload exp_phase8_reasoning_grounded_rl_t2_r128_alpha1_s3_20260507_044835/log.jsonl with huggingface_hub
Browse files
exp_phase8_reasoning_grounded_rl_t2_r128_alpha1_s3_20260507_044835/log.jsonl
CHANGED
|
@@ -40,3 +40,12 @@
|
|
| 40 |
{"step": 195, "loss": 39.62022399902344, "mean_r": -0.425555557012558, "max_r": -0.3799999952316284, "mean_grounded": 2.75, "mean_halluc": 12.25, "mean_cited": 16.0, "mean_tf_grounded_rate": 0.1717948717948718, "gnorm": 463.9270324707031, "elapsed_s": 6698.379506826401, "cell": "Ast", "id": "train:pair_pos:Ast:SEMA4B:chr15_90158391_90158891:2529"}
|
| 41 |
{"step": 200, "loss": 54.31575012207031, "mean_r": -0.425555557012558, "max_r": -0.08888889104127884, "mean_grounded": 2.0, "mean_halluc": 21.0, "mean_cited": 24.0, "mean_tf_grounded_rate": 0.19166666666666665, "gnorm": 254.85635375976562, "elapsed_s": 6879.148895740509, "cell": "In", "id": "train:pair_pos:In:MIMT1:chr19_56643461_56643961:3139"}
|
| 42 |
{"step": 205, "loss": -53.430694580078125, "mean_r": -0.14499999582767487, "max_r": 0.10000000149011612, "mean_grounded": 2.75, "mean_halluc": 5.5, "mean_cited": 8.75, "mean_tf_grounded_rate": 0.33125, "gnorm": 407.4938049316406, "elapsed_s": 7052.995807170868, "cell": "Ast", "id": "train:pair_pos:Ast:ZNF106:chr15_42497376_42497876:1404"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 40 |
{"step": 195, "loss": 39.62022399902344, "mean_r": -0.425555557012558, "max_r": -0.3799999952316284, "mean_grounded": 2.75, "mean_halluc": 12.25, "mean_cited": 16.0, "mean_tf_grounded_rate": 0.1717948717948718, "gnorm": 463.9270324707031, "elapsed_s": 6698.379506826401, "cell": "Ast", "id": "train:pair_pos:Ast:SEMA4B:chr15_90158391_90158891:2529"}
|
| 41 |
{"step": 200, "loss": 54.31575012207031, "mean_r": -0.425555557012558, "max_r": -0.08888889104127884, "mean_grounded": 2.0, "mean_halluc": 21.0, "mean_cited": 24.0, "mean_tf_grounded_rate": 0.19166666666666665, "gnorm": 254.85635375976562, "elapsed_s": 6879.148895740509, "cell": "In", "id": "train:pair_pos:In:MIMT1:chr19_56643461_56643961:3139"}
|
| 42 |
{"step": 205, "loss": -53.430694580078125, "mean_r": -0.14499999582767487, "max_r": 0.10000000149011612, "mean_grounded": 2.75, "mean_halluc": 5.5, "mean_cited": 8.75, "mean_tf_grounded_rate": 0.33125, "gnorm": 407.4938049316406, "elapsed_s": 7052.995807170868, "cell": "Ast", "id": "train:pair_pos:Ast:ZNF106:chr15_42497376_42497876:1404"}
|
| 43 |
+
{"step": 210, "loss": -7.412021636962891, "mean_r": -0.07740384340286255, "max_r": 0.11538461595773697, "mean_grounded": 3.5, "mean_halluc": 5.5, "mean_cited": 9.5, "mean_tf_grounded_rate": 0.3918269230769231, "gnorm": 318.6491394042969, "elapsed_s": 7230.65495467186, "cell": "OPC", "id": "train:pair_neg:OPC:MEG8:chr14_100802683_100803183:3703"}
|
| 44 |
+
{"step": 215, "loss": -57.61827087402344, "mean_r": -0.0342261865735054, "max_r": 0.17142857611179352, "mean_grounded": 3.0, "mean_halluc": 4.25, "mean_cited": 8.25, "mean_tf_grounded_rate": 0.37797619047619047, "gnorm": 398.4621276855469, "elapsed_s": 7413.518797159195, "cell": "Oli", "id": "train:pair_pos:Oli:ANKH:chr5_14767892_14768392:2736"}
|
| 45 |
+
{"step": 220, "loss": -41.987125396728516, "mean_r": 0.2616666555404663, "max_r": 1.0, "mean_grounded": 2.5, "mean_halluc": 2.75, "mean_cited": 5.25, "mean_tf_grounded_rate": 0.6208333333333333, "gnorm": 256.939697265625, "elapsed_s": 7598.82914018631, "cell": "Ast", "id": "train:pair_pos:Ast:HARBI1:chr11_46694515_46695015:1139"}
|
| 46 |
+
{"step": 225, "loss": -132.82545471191406, "mean_r": -0.16482141613960266, "max_r": 1.3877787807814457e-17, "mean_grounded": 4.25, "mean_halluc": 8.5, "mean_cited": 14.0, "mean_tf_grounded_rate": 0.30892857142857144, "gnorm": 505.094482421875, "elapsed_s": 7779.591448545456, "cell": "Mic", "id": "train:pair_neg:Mic:UVRAG:chr11_75809973_75810473:603"}
|
| 47 |
+
{"step": 230, "loss": 23.48389434814453, "mean_r": 0.3431168794631958, "max_r": 0.5400000214576721, "mean_grounded": 6.0, "mean_halluc": 4.0, "mean_cited": 10.5, "mean_tf_grounded_rate": 0.5970779220779221, "gnorm": 417.0264892578125, "elapsed_s": 7953.560907363892, "cell": "Ast", "id": "train:pair_pos:Ast:FAM222A-AS1:chr12_109822909_109823409:437"}
|
| 48 |
+
{"step": 235, "loss": -8.888442993164062, "mean_r": -0.12062642723321915, "max_r": 0.29411765933036804, "mean_grounded": 4.5, "mean_halluc": 7.0, "mean_cited": 12.25, "mean_tf_grounded_rate": 0.34511077158135983, "gnorm": 424.124267578125, "elapsed_s": 8137.539093255997, "cell": "Ex", "id": "train:pair_pos:Ex:RAG2:chr11_36594219_36594719:2111"}
|
| 49 |
+
{"step": 240, "loss": 53.9141960144043, "mean_r": -0.6138888597488403, "max_r": -0.12222222238779068, "mean_grounded": 1.25, "mean_halluc": 5.5, "mean_cited": 7.0, "mean_tf_grounded_rate": 0.125, "gnorm": 360.671142578125, "elapsed_s": 8322.27424788475, "cell": "Ast", "id": "train:pair_pos:Ast:COG7:chr16_23494217_23494717:38"}
|
| 50 |
+
{"step": 245, "loss": 99.50491333007812, "mean_r": -0.46973684430122375, "max_r": -0.07894736528396606, "mean_grounded": 3.25, "mean_halluc": 8.5, "mean_cited": 12.0, "mean_tf_grounded_rate": 0.21710526315789475, "gnorm": 443.43585205078125, "elapsed_s": 8498.061541080475, "cell": "Mic", "id": "train:pair_neg:Mic:MVD:chr16_88802820_88803320:1851"}
|
| 51 |
+
{"step": 250, "loss": -71.4005126953125, "mean_r": -0.2584415674209595, "max_r": 1.0, "mean_grounded": 2.5, "mean_halluc": 4.5, "mean_cited": 7.25, "mean_tf_grounded_rate": 0.3214285714285714, "gnorm": 187.2640838623047, "elapsed_s": 8667.96145939827, "cell": "Oli", "id": "train:pair_pos:Oli:CARM1:chr19_10734340_10734840:2066"}
|