explcre commited on
Commit
f67b4bd
·
verified ·
1 Parent(s): 02fbc17

Upload exp_phase8_reasoning_grounded_rl_t2_r128_alpha1_s2_20260507_023054/log.jsonl with huggingface_hub

Browse files
exp_phase8_reasoning_grounded_rl_t2_r128_alpha1_s2_20260507_023054/log.jsonl CHANGED
@@ -3,3 +3,14 @@
3
  {"step": 10, "loss": -22.3604736328125, "mean_r": -0.33328282833099365, "max_r": 0.00909090880304575, "mean_grounded": 3.25, "mean_halluc": 9.5, "mean_cited": 13.25, "mean_tf_grounded_rate": 0.24646464646464647, "gnorm": 493.3493347167969, "elapsed_s": 368.4945650100708, "cell": "Ast", "id": "train:pair_pos:Ast:SACS-AS1:chr13_23609248_23609748:3456"}
4
  {"step": 15, "loss": 15.31060791015625, "mean_r": -0.6000000238418579, "max_r": -0.3142857253551483, "mean_grounded": 2.25, "mean_halluc": 11.5, "mean_cited": 14.5, "mean_tf_grounded_rate": 0.14285714285714285, "gnorm": 407.4206848144531, "elapsed_s": 552.363049030304, "cell": "Ex", "id": "train:pair_pos:Ex:RBM23:chr14_23130565_23131065:2635"}
5
  {"step": 20, "loss": -54.41714859008789, "mean_r": -0.46156859397888184, "max_r": 0.10000000149011612, "mean_grounded": 4.0, "mean_halluc": 14.5, "mean_cited": 19.0, "mean_tf_grounded_rate": 0.23137254901960785, "gnorm": 461.6417541503906, "elapsed_s": 732.1889204978943, "cell": "Ast", "id": "train:pair_pos:Ast:GPR180:chr13_94703150_94703650:1740"}
 
 
 
 
 
 
 
 
 
 
 
 
3
  {"step": 10, "loss": -22.3604736328125, "mean_r": -0.33328282833099365, "max_r": 0.00909090880304575, "mean_grounded": 3.25, "mean_halluc": 9.5, "mean_cited": 13.25, "mean_tf_grounded_rate": 0.24646464646464647, "gnorm": 493.3493347167969, "elapsed_s": 368.4945650100708, "cell": "Ast", "id": "train:pair_pos:Ast:SACS-AS1:chr13_23609248_23609748:3456"}
4
  {"step": 15, "loss": 15.31060791015625, "mean_r": -0.6000000238418579, "max_r": -0.3142857253551483, "mean_grounded": 2.25, "mean_halluc": 11.5, "mean_cited": 14.5, "mean_tf_grounded_rate": 0.14285714285714285, "gnorm": 407.4206848144531, "elapsed_s": 552.363049030304, "cell": "Ex", "id": "train:pair_pos:Ex:RBM23:chr14_23130565_23131065:2635"}
5
  {"step": 20, "loss": -54.41714859008789, "mean_r": -0.46156859397888184, "max_r": 0.10000000149011612, "mean_grounded": 4.0, "mean_halluc": 14.5, "mean_cited": 19.0, "mean_tf_grounded_rate": 0.23137254901960785, "gnorm": 461.6417541503906, "elapsed_s": 732.1889204978943, "cell": "Ast", "id": "train:pair_pos:Ast:GPR180:chr13_94703150_94703650:1740"}
6
+ {"step": 25, "loss": -129.54830932617188, "mean_r": -0.29905983805656433, "max_r": -0.03846153989434242, "mean_grounded": 3.5, "mean_halluc": 11.5, "mean_cited": 15.5, "mean_tf_grounded_rate": 0.260042735042735, "gnorm": 532.6793823242188, "elapsed_s": 913.3625543117523, "cell": "Ast", "id": "train:pair_pos:Ast:ELOVL1:chr1_43572437_43572937:3315"}
7
+ {"step": 30, "loss": -155.8570556640625, "mean_r": -0.6628333330154419, "max_r": -0.13333334028720856, "mean_grounded": 1.75, "mean_halluc": 27.25, "mean_cited": 29.0, "mean_tf_grounded_rate": 0.1275, "gnorm": 429.6753845214844, "elapsed_s": 1098.6165158748627, "cell": "Ast", "id": "train:pair_pos:Ast:TBRG1:chr11_124863023_124863523:3252"}
8
+ {"step": 35, "loss": 34.43647003173828, "mean_r": -0.6553663015365601, "max_r": -0.24285714328289032, "mean_grounded": 1.75, "mean_halluc": 21.25, "mean_cited": 24.0, "mean_tf_grounded_rate": 0.08901056570548097, "gnorm": 391.2756042480469, "elapsed_s": 1261.5197477340698, "cell": "Mic", "id": "train:pair_pos:Mic:ATAD5:chr17_30823269_30823769:2807"}
9
+ {"step": 40, "loss": 48.90322494506836, "mean_r": -0.7400793433189392, "max_r": -0.30000001192092896, "mean_grounded": 0.75, "mean_halluc": 25.75, "mean_cited": 28.0, "mean_tf_grounded_rate": 0.05357142857142857, "gnorm": 393.1705322265625, "elapsed_s": 1436.7695581912994, "cell": "Oli", "id": "train:pair_pos:Oli:DOCK9-DT:chr13_99090139_99090639:4038"}
10
+ {"step": 45, "loss": -130.55673217773438, "mean_r": -0.321092426776886, "max_r": 0.0, "mean_grounded": 2.25, "mean_halluc": 8.5, "mean_cited": 11.75, "mean_tf_grounded_rate": 0.1464985994397759, "gnorm": 398.0940856933594, "elapsed_s": 1605.2349441051483, "cell": "Ast", "id": "train:pair_pos:Ast:TM9SF1:chr14_24171673_24172173:895"}
11
+ {"step": 50, "loss": -0.6146392822265625, "mean_r": -0.5231685042381287, "max_r": 0.06923077255487442, "mean_grounded": 3.0, "mean_halluc": 10.25, "mean_cited": 13.25, "mean_tf_grounded_rate": 0.21657509157509158, "gnorm": 421.5898742675781, "elapsed_s": 1770.4354808330536, "cell": "Ast", "id": "train:pair_pos:Ast:CTR9:chr11_10734335_10734835:2538"}
12
+ {"step": 55, "loss": -66.51898193359375, "mean_r": -0.4506363570690155, "max_r": -0.15454545617103577, "mean_grounded": 3.25, "mean_halluc": 13.0, "mean_cited": 16.5, "mean_tf_grounded_rate": 0.2234090909090909, "gnorm": 499.26861572265625, "elapsed_s": 1939.4690730571747, "cell": "Ast", "id": "train:pair_pos:Ast:CCDC60:chr12_119177983_119178483:1674"}
13
+ {"step": 60, "loss": -158.6281280517578, "mean_r": -0.33472222089767456, "max_r": 0.0, "mean_grounded": 2.5, "mean_halluc": 8.75, "mean_cited": 11.5, "mean_tf_grounded_rate": 0.1597222222222222, "gnorm": 350.1258239746094, "elapsed_s": 2109.0862424373627, "cell": "Ast", "id": "train:pair_pos:Ast:EPS15L1:chr19_16577302_16577802:1537"}
14
+ {"step": 65, "loss": -81.56288146972656, "mean_r": -0.3091251850128174, "max_r": -0.10000000149011612, "mean_grounded": 2.75, "mean_halluc": 7.5, "mean_cited": 10.25, "mean_tf_grounded_rate": 0.2981240573152338, "gnorm": 448.92999267578125, "elapsed_s": 2267.7567059993744, "cell": "Ast", "id": "train:pair_pos:Ast:TMEM218:chr11_124928685_124929185:3554"}
15
+ {"step": 70, "loss": -42.581382751464844, "mean_r": -0.6251075863838196, "max_r": -0.18000000715255737, "mean_grounded": 1.75, "mean_halluc": 18.5, "mean_cited": 20.25, "mean_tf_grounded_rate": 0.1625, "gnorm": 347.837890625, "elapsed_s": 2436.6436779499054, "cell": "Ast", "id": "train:pair_pos:Ast:DOCK9:chr13_99208831_99209331:2173"}
16
+ {"step": 75, "loss": -62.28608703613281, "mean_r": -0.513744592666626, "max_r": -0.44545453786849976, "mean_grounded": 2.25, "mean_halluc": 9.5, "mean_cited": 11.75, "mean_tf_grounded_rate": 0.20319264069264067, "gnorm": 514.9257202148438, "elapsed_s": 2608.9937732219696, "cell": "Ast", "id": "train:pair_pos:Ast:DMXL2:chr15_51801334_51801834:1962"}