Upload exp_phase8_reasoning_grounded_rl_t3_r128_alpha1_s2_20260507_072202/log.jsonl with huggingface_hub
Browse files
exp_phase8_reasoning_grounded_rl_t3_r128_alpha1_s2_20260507_072202/log.jsonl
ADDED
|
@@ -0,0 +1,9 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{"step": 1, "loss": 209.12527465820312, "mean_r": -0.8886029720306396, "max_r": -0.729411780834198, "mean_grounded": 0.5, "mean_halluc": 12.5, "mean_cited": 13.5, "mean_tf_grounded_rate": 0.022518382352941176, "gnorm": 388.03436279296875, "elapsed_s": 50.73191690444946, "cell": "Ex", "id": "train:edit:Ex:SLC4A5:chr2_74464392_74464892:766"}
|
| 2 |
+
{"step": 5, "loss": 31.798538208007812, "mean_r": -0.7553879022598267, "max_r": -0.5249999761581421, "mean_grounded": 0.75, "mean_halluc": 14.0, "mean_cited": 15.25, "mean_tf_grounded_rate": 0.05208333333333333, "gnorm": 452.2689208984375, "elapsed_s": 186.7282576560974, "cell": "Ast", "id": "train:edit:Ast:JAML:chr11_118048985_118049485:2444"}
|
| 3 |
+
{"step": 10, "loss": 24.181129455566406, "mean_r": -0.4761904776096344, "max_r": 0.4285714328289032, "mean_grounded": 1.75, "mean_halluc": 3.75, "mean_cited": 5.5, "mean_tf_grounded_rate": 0.2619047619047619, "gnorm": 294.8580627441406, "elapsed_s": 363.3971600532532, "cell": "Mic", "id": "train:edit:Mic:ATP2C2:chr16_84568277_84568777:336"}
|
| 4 |
+
{"step": 15, "loss": -256.75286865234375, "mean_r": -0.3768181800842285, "max_r": 0.0, "mean_grounded": 1.0, "mean_halluc": 5.75, "mean_cited": 7.0, "mean_tf_grounded_rate": 0.12987012987012986, "gnorm": 451.944580078125, "elapsed_s": 540.0139734745026, "cell": "Ast", "id": "train:edit:Ast:SENP3:chr17_7463950_7464450:2189"}
|
| 5 |
+
{"step": 20, "loss": 130.29452514648438, "mean_r": -0.7051190137863159, "max_r": -0.4571428596973419, "mean_grounded": 1.75, "mean_halluc": 10.25, "mean_cited": 12.25, "mean_tf_grounded_rate": 0.11884920634920634, "gnorm": 362.4324645996094, "elapsed_s": 711.3055589199066, "cell": "Ex", "id": "train:edit:Ex:MAPT-AS1:chr17_46037726_46038226:1788"}
|
| 6 |
+
{"step": 25, "loss": 0.08062744140625, "mean_r": -0.7416666746139526, "max_r": -0.20000000298023224, "mean_grounded": 0.75, "mean_halluc": 4.25, "mean_cited": 5.0, "mean_tf_grounded_rate": 0.12083333333333333, "gnorm": 262.1352844238281, "elapsed_s": 885.3601727485657, "cell": "In", "id": "train:edit:In:UBR5:chr8_102400231_102400731:1415"}
|
| 7 |
+
{"step": 30, "loss": -149.3069305419922, "mean_r": -0.2750000059604645, "max_r": 0.0, "mean_grounded": 1.25, "mean_halluc": 4.75, "mean_cited": 7.0, "mean_tf_grounded_rate": 0.16025641025641024, "gnorm": 492.9898681640625, "elapsed_s": 1063.6299800872803, "cell": "Mic", "id": "train:edit:Mic:SLFN11:chr17_35368692_35369192:3547"}
|
| 8 |
+
{"step": 35, "loss": -192.28460693359375, "mean_r": -0.2350524663925171, "max_r": 1.0, "mean_grounded": 1.25, "mean_halluc": 9.25, "mean_cited": 11.25, "mean_tf_grounded_rate": 0.31346153846153846, "gnorm": 333.3654479980469, "elapsed_s": 1244.7975552082062, "cell": "In", "id": "train:edit:In:DTX4:chr11_59135813_59136313:329"}
|
| 9 |
+
{"step": 40, "loss": -143.7164764404297, "mean_r": -0.6516637206077576, "max_r": -0.3117647171020508, "mean_grounded": 1.75, "mean_halluc": 13.75, "mean_cited": 15.75, "mean_tf_grounded_rate": 0.1101455733808675, "gnorm": 557.5035400390625, "elapsed_s": 1414.663667678833, "cell": "Mic", "id": "train:edit:Mic:REC8:chr14_23981797_23982297:2403"}
|