Upload exp_phase8_reasoning_grounded_rl_t2_r128_alpha1_s3_20260507_044835/log.jsonl with huggingface_hub
Browse files
exp_phase8_reasoning_grounded_rl_t2_r128_alpha1_s3_20260507_044835/log.jsonl
CHANGED
|
@@ -29,3 +29,14 @@
|
|
| 29 |
{"step": 140, "loss": -88.15803527832031, "mean_r": 0.18339230120182037, "max_r": 0.699999988079071, "mean_grounded": 6.25, "mean_halluc": 7.5, "mean_cited": 14.0, "mean_tf_grounded_rate": 0.5183731387291759, "gnorm": 381.1214599609375, "elapsed_s": 4738.309872150421, "cell": "Ast", "id": "train:pair_pos:Ast:DZIP1:chr13_95496385_95496885:1925"}
|
| 30 |
{"step": 145, "loss": 79.7239990234375, "mean_r": -0.4128749966621399, "max_r": -0.05000000074505806, "mean_grounded": 3.75, "mean_halluc": 16.0, "mean_cited": 19.75, "mean_tf_grounded_rate": 0.26197916666666665, "gnorm": 376.2814025878906, "elapsed_s": 4915.069397211075, "cell": "Ast", "id": "train:pair_pos:Ast:NEK3:chr13_52390267_52390767:917"}
|
| 31 |
{"step": 150, "loss": -126.88933563232422, "mean_r": 0.23273809254169464, "max_r": 1.0333333015441895, "mean_grounded": 4.25, "mean_halluc": 4.25, "mean_cited": 9.0, "mean_tf_grounded_rate": 0.529491341991342, "gnorm": 315.1418151855469, "elapsed_s": 5090.648319244385, "cell": "Mic", "id": "train:pair_pos:Mic:GNB4:chr3_179453060_179453560:1907"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 29 |
{"step": 140, "loss": -88.15803527832031, "mean_r": 0.18339230120182037, "max_r": 0.699999988079071, "mean_grounded": 6.25, "mean_halluc": 7.5, "mean_cited": 14.0, "mean_tf_grounded_rate": 0.5183731387291759, "gnorm": 381.1214599609375, "elapsed_s": 4738.309872150421, "cell": "Ast", "id": "train:pair_pos:Ast:DZIP1:chr13_95496385_95496885:1925"}
|
| 30 |
{"step": 145, "loss": 79.7239990234375, "mean_r": -0.4128749966621399, "max_r": -0.05000000074505806, "mean_grounded": 3.75, "mean_halluc": 16.0, "mean_cited": 19.75, "mean_tf_grounded_rate": 0.26197916666666665, "gnorm": 376.2814025878906, "elapsed_s": 4915.069397211075, "cell": "Ast", "id": "train:pair_pos:Ast:NEK3:chr13_52390267_52390767:917"}
|
| 31 |
{"step": 150, "loss": -126.88933563232422, "mean_r": 0.23273809254169464, "max_r": 1.0333333015441895, "mean_grounded": 4.25, "mean_halluc": 4.25, "mean_cited": 9.0, "mean_tf_grounded_rate": 0.529491341991342, "gnorm": 315.1418151855469, "elapsed_s": 5090.648319244385, "cell": "Mic", "id": "train:pair_pos:Mic:GNB4:chr3_179453060_179453560:1907"}
|
| 32 |
+
{"step": 155, "loss": -13.678577423095703, "mean_r": -0.0867857113480568, "max_r": 0.01666666753590107, "mean_grounded": 4.5, "mean_halluc": 7.5, "mean_cited": 12.75, "mean_tf_grounded_rate": 0.3601190476190476, "gnorm": 436.85906982421875, "elapsed_s": 5260.500825643539, "cell": "Ast", "id": "train:pair_pos:Ast:ARFIP2:chr11_6567164_6567664:1736"}
|
| 33 |
+
{"step": 160, "loss": -11.192184448242188, "mean_r": -0.17413420975208282, "max_r": 0.20000000298023224, "mean_grounded": 3.0, "mean_halluc": 4.75, "mean_cited": 8.25, "mean_tf_grounded_rate": 0.3301948051948052, "gnorm": 428.4222717285156, "elapsed_s": 5444.281126260757, "cell": "Ast", "id": "train:pair_neg:Ast:SNAPIN:chr1_153554127_153554627:3034"}
|
| 34 |
+
{"step": 165, "loss": 24.492019653320312, "mean_r": -0.13952019810676575, "max_r": -0.05000000074505806, "mean_grounded": 3.75, "mean_halluc": 6.5, "mean_cited": 10.5, "mean_tf_grounded_rate": 0.3391729797979798, "gnorm": 427.9548034667969, "elapsed_s": 5616.279240608215, "cell": "Ast", "id": "train:pair_pos:Ast:PTPRJ:chr11_47973285_47973785:2005"}
|
| 35 |
+
{"step": 170, "loss": -130.26937866210938, "mean_r": 0.21805554628372192, "max_r": 1.0, "mean_grounded": 3.75, "mean_halluc": 6.25, "mean_cited": 11.0, "mean_tf_grounded_rate": 0.5458333333333333, "gnorm": 377.8606872558594, "elapsed_s": 5796.411918878555, "cell": "Mic", "id": "train:pair_neg:Mic:DEGS2:chr14_100312570_100313070:2112"}
|
| 36 |
+
{"step": 175, "loss": -114.32825469970703, "mean_r": 0.1251068413257599, "max_r": 0.550000011920929, "mean_grounded": 4.25, "mean_halluc": 4.75, "mean_cited": 9.75, "mean_tf_grounded_rate": 0.4738247863247863, "gnorm": 398.3206481933594, "elapsed_s": 5976.548135995865, "cell": "Ast", "id": "train:pair_pos:Ast:SPNS1:chr16_29130376_29130876:437"}
|
| 37 |
+
{"step": 180, "loss": 52.26029968261719, "mean_r": -0.4208333194255829, "max_r": 0.2199999988079071, "mean_grounded": 3.25, "mean_halluc": 8.0, "mean_cited": 11.25, "mean_tf_grounded_rate": 0.2635416666666667, "gnorm": 372.72747802734375, "elapsed_s": 6159.331789255142, "cell": "Mic", "id": "train:pair_pos:Mic:ZNF362:chr1_33237519_33238019:2872"}
|
| 38 |
+
{"step": 185, "loss": -63.27106475830078, "mean_r": 0.14499999582767487, "max_r": 1.0, "mean_grounded": 2.0, "mean_halluc": 3.25, "mean_cited": 5.75, "mean_tf_grounded_rate": 0.39999999999999997, "gnorm": 284.2621765136719, "elapsed_s": 6336.236979961395, "cell": "Ex", "id": "train:pair_pos:Ex:SF3A1:chr22_30424449_30424949:1143"}
|
| 39 |
+
{"step": 190, "loss": -19.42317008972168, "mean_r": 0.16845238208770752, "max_r": 0.6000000238418579, "mean_grounded": 3.0, "mean_halluc": 2.75, "mean_cited": 5.75, "mean_tf_grounded_rate": 0.40476190476190477, "gnorm": 430.9595031738281, "elapsed_s": 6518.158425569534, "cell": "Ast", "id": "train:pair_pos:Ast:TMX1:chr14_51088727_51089227:2086"}
|
| 40 |
+
{"step": 195, "loss": 39.62022399902344, "mean_r": -0.425555557012558, "max_r": -0.3799999952316284, "mean_grounded": 2.75, "mean_halluc": 12.25, "mean_cited": 16.0, "mean_tf_grounded_rate": 0.1717948717948718, "gnorm": 463.9270324707031, "elapsed_s": 6698.379506826401, "cell": "Ast", "id": "train:pair_pos:Ast:SEMA4B:chr15_90158391_90158891:2529"}
|
| 41 |
+
{"step": 200, "loss": 54.31575012207031, "mean_r": -0.425555557012558, "max_r": -0.08888889104127884, "mean_grounded": 2.0, "mean_halluc": 21.0, "mean_cited": 24.0, "mean_tf_grounded_rate": 0.19166666666666665, "gnorm": 254.85635375976562, "elapsed_s": 6879.148895740509, "cell": "In", "id": "train:pair_pos:In:MIMT1:chr19_56643461_56643961:3139"}
|
| 42 |
+
{"step": 205, "loss": -53.430694580078125, "mean_r": -0.14499999582767487, "max_r": 0.10000000149011612, "mean_grounded": 2.75, "mean_halluc": 5.5, "mean_cited": 8.75, "mean_tf_grounded_rate": 0.33125, "gnorm": 407.4938049316406, "elapsed_s": 7052.995807170868, "cell": "Ast", "id": "train:pair_pos:Ast:ZNF106:chr15_42497376_42497876:1404"}
|