Upload exp_phase8_reasoning_grounded_rl_t2_r128_alpha1_s2_20260507_023054/log.jsonl with huggingface_hub
Browse files
exp_phase8_reasoning_grounded_rl_t2_r128_alpha1_s2_20260507_023054/log.jsonl
CHANGED
|
@@ -25,3 +25,16 @@
|
|
| 25 |
{"step": 120, "loss": -22.570571899414062, "mean_r": -0.22821427881717682, "max_r": 0.18000000715255737, "mean_grounded": 3.0, "mean_halluc": 6.75, "mean_cited": 10.25, "mean_tf_grounded_rate": 0.2857142857142857, "gnorm": 352.949951171875, "elapsed_s": 4063.728887796402, "cell": "Mic", "id": "train:pair_pos:Mic:POLR1B:chr2_112701002_112701502:614"}
|
| 26 |
{"step": 125, "loss": -8.872991561889648, "mean_r": -0.2474999874830246, "max_r": -0.019999999552965164, "mean_grounded": 3.25, "mean_halluc": 7.75, "mean_cited": 11.0, "mean_tf_grounded_rate": 0.29583333333333334, "gnorm": 390.1910705566406, "elapsed_s": 4202.351343154907, "cell": "Ast", "id": "train:pair_pos:Ast:APH1B:chr15_63204095_63204595:2566"}
|
| 27 |
{"step": 130, "loss": -70.8443603515625, "mean_r": -0.5069047808647156, "max_r": -0.30000001192092896, "mean_grounded": 1.75, "mean_halluc": 12.0, "mean_cited": 14.75, "mean_tf_grounded_rate": 0.12893772893772892, "gnorm": 497.54949951171875, "elapsed_s": 4356.790739774704, "cell": "In", "id": "train:pair_neg:In:SLC22A8:chr11_62855826_62856326:1674"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 25 |
{"step": 120, "loss": -22.570571899414062, "mean_r": -0.22821427881717682, "max_r": 0.18000000715255737, "mean_grounded": 3.0, "mean_halluc": 6.75, "mean_cited": 10.25, "mean_tf_grounded_rate": 0.2857142857142857, "gnorm": 352.949951171875, "elapsed_s": 4063.728887796402, "cell": "Mic", "id": "train:pair_pos:Mic:POLR1B:chr2_112701002_112701502:614"}
|
| 26 |
{"step": 125, "loss": -8.872991561889648, "mean_r": -0.2474999874830246, "max_r": -0.019999999552965164, "mean_grounded": 3.25, "mean_halluc": 7.75, "mean_cited": 11.0, "mean_tf_grounded_rate": 0.29583333333333334, "gnorm": 390.1910705566406, "elapsed_s": 4202.351343154907, "cell": "Ast", "id": "train:pair_pos:Ast:APH1B:chr15_63204095_63204595:2566"}
|
| 27 |
{"step": 130, "loss": -70.8443603515625, "mean_r": -0.5069047808647156, "max_r": -0.30000001192092896, "mean_grounded": 1.75, "mean_halluc": 12.0, "mean_cited": 14.75, "mean_tf_grounded_rate": 0.12893772893772892, "gnorm": 497.54949951171875, "elapsed_s": 4356.790739774704, "cell": "In", "id": "train:pair_neg:In:SLC22A8:chr11_62855826_62856326:1674"}
|
| 28 |
+
{"step": 135, "loss": 15.699638366699219, "mean_r": -0.2628571391105652, "max_r": -0.03999999910593033, "mean_grounded": 3.0, "mean_halluc": 7.0, "mean_cited": 10.0, "mean_tf_grounded_rate": 0.30476190476190473, "gnorm": 481.8796081542969, "elapsed_s": 4509.542692661285, "cell": "Ast", "id": "train:pair_pos:Ast:TMEM80:chr11_615054_615554:273"}
|
| 29 |
+
{"step": 140, "loss": -40.240821838378906, "mean_r": -0.3054545521736145, "max_r": -0.02500000037252903, "mean_grounded": 2.25, "mean_halluc": 6.5, "mean_cited": 9.25, "mean_tf_grounded_rate": 0.25170454545454546, "gnorm": 429.24652099609375, "elapsed_s": 4659.6786432266235, "cell": "Ast", "id": "train:pair_pos:Ast:EBPL:chr13_49938849_49939349:778"}
|
| 30 |
+
{"step": 145, "loss": -67.08731842041016, "mean_r": 0.02111111581325531, "max_r": 0.5111111402511597, "mean_grounded": 4.75, "mean_halluc": 6.75, "mean_cited": 11.5, "mean_tf_grounded_rate": 0.43333333333333335, "gnorm": 304.60968017578125, "elapsed_s": 4805.79648900032, "cell": "Ast", "id": "train:pair_pos:Ast:ADAMTS7:chr15_78879608_78880108:1260"}
|
| 31 |
+
{"step": 150, "loss": -55.233375549316406, "mean_r": 0.03181818127632141, "max_r": 0.6000000238418579, "mean_grounded": 3.75, "mean_halluc": 5.0, "mean_cited": 8.75, "mean_tf_grounded_rate": 0.46704545454545454, "gnorm": 283.4294738769531, "elapsed_s": 4951.262852907181, "cell": "Ast", "id": "train:pair_pos:Ast:SETDB2:chr13_49505933_49506433:723"}
|
| 32 |
+
{"step": 155, "loss": -121.55490112304688, "mean_r": -0.08876262605190277, "max_r": 0.17272727191448212, "mean_grounded": 2.75, "mean_halluc": 5.0, "mean_cited": 8.0, "mean_tf_grounded_rate": 0.2525252525252525, "gnorm": 410.5126647949219, "elapsed_s": 5095.025629758835, "cell": "Ast", "id": "train:pair_pos:Ast:TMEM132B:chr12_125049447_125049947:2744"}
|
| 33 |
+
{"step": 160, "loss": -20.297924041748047, "mean_r": -0.1061868667602539, "max_r": 0.33636364340782166, "mean_grounded": 3.75, "mean_halluc": 6.5, "mean_cited": 10.5, "mean_tf_grounded_rate": 0.35025252525252526, "gnorm": 403.12066650390625, "elapsed_s": 5219.118138551712, "cell": "Ast", "id": "train:pair_pos:Ast:GJB6:chr13_20258366_20258866:3210"}
|
| 34 |
+
{"step": 165, "loss": -39.1207160949707, "mean_r": 0.2242063581943512, "max_r": 0.800000011920929, "mean_grounded": 10.25, "mean_halluc": 4.25, "mean_cited": 15.25, "mean_tf_grounded_rate": 0.5413059163059163, "gnorm": 320.2332763671875, "elapsed_s": 5378.3716950416565, "cell": "Ast", "id": "train:pair_pos:Ast:HTR3A:chr11_114181217_114181717:2012"}
|
| 35 |
+
{"step": 170, "loss": -17.722091674804688, "mean_r": -0.4013608694076538, "max_r": 0.44545453786849976, "mean_grounded": 2.75, "mean_halluc": 25.25, "mean_cited": 28.0, "mean_tf_grounded_rate": 0.23686868686868687, "gnorm": 347.85577392578125, "elapsed_s": 5511.788688421249, "cell": "In", "id": "train:pair_pos:In:GAS2L2:chr17_35749917_35750417:1783"}
|
| 36 |
+
{"step": 175, "loss": -11.29852294921875, "mean_r": -0.36103174090385437, "max_r": -0.1599999964237213, "mean_grounded": 3.0, "mean_halluc": 8.75, "mean_cited": 12.5, "mean_tf_grounded_rate": 0.23323412698412696, "gnorm": 387.71417236328125, "elapsed_s": 5660.764411211014, "cell": "Ast", "id": "train:pair_pos:Ast:STARD13-AS:chr13_33191791_33192291:24"}
|
| 37 |
+
{"step": 180, "loss": -64.60961151123047, "mean_r": -0.03551492467522621, "max_r": 0.3333333432674408, "mean_grounded": 7.0, "mean_halluc": 9.25, "mean_cited": 18.25, "mean_tf_grounded_rate": 0.3819681780208096, "gnorm": 392.7103576660156, "elapsed_s": 5801.9618418216705, "cell": "Mic", "id": "train:pair_pos:Mic:GNB4:chr3_179453060_179453560:1907"}
|
| 38 |
+
{"step": 185, "loss": -28.08819580078125, "mean_r": -0.11071428656578064, "max_r": -0.05714285746216774, "mean_grounded": 4.25, "mean_halluc": 7.0, "mean_cited": 11.75, "mean_tf_grounded_rate": 0.36904761904761907, "gnorm": 377.2549743652344, "elapsed_s": 5958.770046949387, "cell": "Ast", "id": "train:pair_pos:Ast:EPS8L2:chr11_618176_618676:231"}
|
| 39 |
+
{"step": 190, "loss": -84.53244018554688, "mean_r": 0.11698877811431885, "max_r": 0.9117646813392639, "mean_grounded": 11.5, "mean_halluc": 5.75, "mean_cited": 17.5, "mean_tf_grounded_rate": 0.4924369747899159, "gnorm": 301.6457214355469, "elapsed_s": 6107.5840899944305, "cell": "Ast", "id": "train:pair_pos:Ast:ZBTB17:chr1_16187654_16188154:3652"}
|
| 40 |
+
{"step": 195, "loss": 33.700984954833984, "mean_r": -0.03437022119760513, "max_r": 0.1315789520740509, "mean_grounded": 5.25, "mean_halluc": 7.5, "mean_cited": 12.75, "mean_tf_grounded_rate": 0.3979082321187584, "gnorm": 404.85498046875, "elapsed_s": 6255.567425727844, "cell": "Ast", "id": "train:pair_pos:Ast:ITPK1-AS1:chr14_93082659_93083159:1782"}
|