Upload exp_phase8_t3_rl_edit_tight_dapo_s3_lr1e3_moods_20260506_124044/log.jsonl with huggingface_hub
Browse files
exp_phase8_t3_rl_edit_tight_dapo_s3_lr1e3_moods_20260506_124044/log.jsonl
CHANGED
|
@@ -1,3 +1,41 @@
|
|
| 1 |
{"rl_step": 1, "loss": -1.4901161193847656e-07, "mean_return": 25.07489013671875, "max_return": 27.450559616088867, "mean_motif_chained": 25.074890874632242, "gnorm": 0.236328125, "elapsed_s": 8.374700784683228, "cell_type": "Ex", "edit_type": "cell_type_transfer", "target_tf": "KLF2", "kd_active": false, "kd_tf": "", "kd_score_mean": 0.0, "ratio_mean": 1.0, "ratio_min": 1.0, "ratio_max": 1.0, "log_ratio_mean": 0.0, "adv_mean": 1.4901161193847656e-07, "adv_std": 0.9999997019767761, "adv_min": -1.4605728387832642, "adv_max": 0.7456849217414856, "comp_oracle_mean": 0.0, "comp_moods_chained_mean": 25.074890874632242, "comp_kd_mean": 0.0, "comp_total_mean": 25.074890874632242, "_algo": "dapo", "_lora_r": 16, "_peak_lr": 0.001, "_temperature": 1.0, "_seq_len_mean": 360.0}
|
| 2 |
{"rl_step": 5, "loss": 8.940696716308594e-08, "mean_return": 42.47251892089844, "max_return": 64.0967788696289, "mean_motif_chained": 42.47251660858892, "gnorm": 0.10888671875, "elapsed_s": 37.4642539024353, "cell_type": "Oli", "edit_type": "cell_type_transfer", "target_tf": "LHX6", "kd_active": false, "kd_tf": "", "kd_score_mean": 0.0, "ratio_mean": 1.0, "ratio_min": 1.0, "ratio_max": 1.0, "log_ratio_mean": 0.0, "adv_mean": -8.940696716308594e-08, "adv_std": 0.9999999403953552, "adv_min": -1.2483487129211426, "adv_max": 1.113036870956421, "comp_oracle_mean": 0.0, "comp_moods_chained_mean": 42.47251660858892, "comp_kd_mean": 0.0, "comp_total_mean": 42.47251660858892, "_algo": "dapo", "_lora_r": 16, "_peak_lr": 0.001, "_temperature": 1.0, "_seq_len_mean": 360.0}
|
| 3 |
{"rl_step": 10, "loss": 9.685754776000977e-08, "mean_return": 50.676795959472656, "max_return": 67.6124496459961, "mean_motif_chained": 50.67679373036245, "gnorm": 0.10009765625, "elapsed_s": 73.75393795967102, "cell_type": "Ex", "edit_type": "promoter_retarget", "target_tf": "TBR1", "kd_active": false, "kd_tf": "", "kd_score_mean": 0.0, "ratio_mean": 1.0, "ratio_min": 1.0, "ratio_max": 1.0, "log_ratio_mean": 0.0, "adv_mean": -9.685754776000977e-08, "adv_std": 0.9999998807907104, "adv_min": -1.353895902633667, "adv_max": 1.0194616317749023, "comp_oracle_mean": 0.0, "comp_moods_chained_mean": 50.67679373036245, "comp_kd_mean": 0.0, "comp_total_mean": 50.67679373036245, "_algo": "dapo", "_lora_r": 16, "_peak_lr": 0.001, "_temperature": 1.0, "_seq_len_mean": 360.0}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
{"rl_step": 1, "loss": -1.4901161193847656e-07, "mean_return": 25.07489013671875, "max_return": 27.450559616088867, "mean_motif_chained": 25.074890874632242, "gnorm": 0.236328125, "elapsed_s": 8.374700784683228, "cell_type": "Ex", "edit_type": "cell_type_transfer", "target_tf": "KLF2", "kd_active": false, "kd_tf": "", "kd_score_mean": 0.0, "ratio_mean": 1.0, "ratio_min": 1.0, "ratio_max": 1.0, "log_ratio_mean": 0.0, "adv_mean": 1.4901161193847656e-07, "adv_std": 0.9999997019767761, "adv_min": -1.4605728387832642, "adv_max": 0.7456849217414856, "comp_oracle_mean": 0.0, "comp_moods_chained_mean": 25.074890874632242, "comp_kd_mean": 0.0, "comp_total_mean": 25.074890874632242, "_algo": "dapo", "_lora_r": 16, "_peak_lr": 0.001, "_temperature": 1.0, "_seq_len_mean": 360.0}
|
| 2 |
{"rl_step": 5, "loss": 8.940696716308594e-08, "mean_return": 42.47251892089844, "max_return": 64.0967788696289, "mean_motif_chained": 42.47251660858892, "gnorm": 0.10888671875, "elapsed_s": 37.4642539024353, "cell_type": "Oli", "edit_type": "cell_type_transfer", "target_tf": "LHX6", "kd_active": false, "kd_tf": "", "kd_score_mean": 0.0, "ratio_mean": 1.0, "ratio_min": 1.0, "ratio_max": 1.0, "log_ratio_mean": 0.0, "adv_mean": -8.940696716308594e-08, "adv_std": 0.9999999403953552, "adv_min": -1.2483487129211426, "adv_max": 1.113036870956421, "comp_oracle_mean": 0.0, "comp_moods_chained_mean": 42.47251660858892, "comp_kd_mean": 0.0, "comp_total_mean": 42.47251660858892, "_algo": "dapo", "_lora_r": 16, "_peak_lr": 0.001, "_temperature": 1.0, "_seq_len_mean": 360.0}
|
| 3 |
{"rl_step": 10, "loss": 9.685754776000977e-08, "mean_return": 50.676795959472656, "max_return": 67.6124496459961, "mean_motif_chained": 50.67679373036245, "gnorm": 0.10009765625, "elapsed_s": 73.75393795967102, "cell_type": "Ex", "edit_type": "promoter_retarget", "target_tf": "TBR1", "kd_active": false, "kd_tf": "", "kd_score_mean": 0.0, "ratio_mean": 1.0, "ratio_min": 1.0, "ratio_max": 1.0, "log_ratio_mean": 0.0, "adv_mean": -9.685754776000977e-08, "adv_std": 0.9999998807907104, "adv_min": -1.353895902633667, "adv_max": 1.0194616317749023, "comp_oracle_mean": 0.0, "comp_moods_chained_mean": 50.67679373036245, "comp_kd_mean": 0.0, "comp_total_mean": 50.67679373036245, "_algo": "dapo", "_lora_r": 16, "_peak_lr": 0.001, "_temperature": 1.0, "_seq_len_mean": 360.0}
|
| 4 |
+
{"rl_step": 15, "loss": -5.960464477539063e-08, "mean_return": 33.844268798828125, "max_return": 52.98606872558594, "mean_motif_chained": 33.844269800299436, "gnorm": 0.06982421875, "elapsed_s": 110.75260424613953, "cell_type": "Ast", "edit_type": "activity_boost", "target_tf": "AP1", "kd_active": false, "kd_tf": "", "kd_score_mean": 0.0, "ratio_mean": 1.0, "ratio_min": 1.0, "ratio_max": 1.0, "log_ratio_mean": 0.0, "adv_mean": 5.960464477539063e-08, "adv_std": 0.9999998807907104, "adv_min": -0.8585960268974304, "adv_max": 1.419593334197998, "comp_oracle_mean": 0.0, "comp_moods_chained_mean": 33.844269800299436, "comp_kd_mean": 0.0, "comp_total_mean": 33.844269800299436, "_algo": "dapo", "_lora_r": 16, "_peak_lr": 0.001, "_temperature": 1.0, "_seq_len_mean": 360.0}
|
| 5 |
+
{"rl_step": 20, "loss": 1.7881393432617188e-07, "mean_return": 38.86052703857422, "max_return": 50.67230987548828, "mean_motif_chained": 38.86052622909345, "gnorm": 0.138671875, "elapsed_s": 148.24392437934875, "cell_type": "OPC", "edit_type": "promoter_retarget", "target_tf": "SOX6", "kd_active": false, "kd_tf": "", "kd_score_mean": 0.0, "ratio_mean": 1.0, "ratio_min": 1.0, "ratio_max": 1.0, "log_ratio_mean": 0.0, "adv_mean": -1.7881393432617188e-07, "adv_std": 0.9999998807907104, "adv_min": -1.35152006149292, "adv_max": 1.0365177392959595, "comp_oracle_mean": 0.0, "comp_moods_chained_mean": 38.86052622909345, "comp_kd_mean": 0.0, "comp_total_mean": 38.86052622909345, "_algo": "dapo", "_lora_r": 16, "_peak_lr": 0.001, "_temperature": 1.0, "_seq_len_mean": 360.0}
|
| 6 |
+
{"rl_step": 25, "loss": 2.9802322387695312e-08, "mean_return": 27.336971282958984, "max_return": 36.19440460205078, "mean_motif_chained": 27.336971305105955, "gnorm": 0.1123046875, "elapsed_s": 186.3923738002777, "cell_type": "Ex", "edit_type": "promoter_retarget", "target_tf": "NEUROD2", "kd_active": false, "kd_tf": "", "kd_score_mean": 0.0, "ratio_mean": 1.0, "ratio_min": 1.0, "ratio_max": 1.0, "log_ratio_mean": 0.0, "adv_mean": -2.9802322387695312e-08, "adv_std": 0.9999997019767761, "adv_min": -1.1249909400939941, "adv_max": 1.1047247648239136, "comp_oracle_mean": 0.0, "comp_moods_chained_mean": 27.336971305105955, "comp_kd_mean": 0.0, "comp_total_mean": 27.336971305105955, "_algo": "dapo", "_lora_r": 16, "_peak_lr": 0.001, "_temperature": 1.0, "_seq_len_mean": 360.0}
|
| 7 |
+
{"rl_step": 30, "loss": -5.960464477539063e-08, "mean_return": 40.54928207397461, "max_return": 77.20588684082031, "mean_motif_chained": 40.549284680594226, "gnorm": 0.11181640625, "elapsed_s": 223.99898886680603, "cell_type": "In", "edit_type": "activity_boost", "target_tf": "LHX6", "kd_active": false, "kd_tf": "", "kd_score_mean": 0.0, "ratio_mean": 1.0, "ratio_min": 1.0, "ratio_max": 1.0, "log_ratio_mean": 0.0, "adv_mean": 5.960464477539063e-08, "adv_std": 0.9999997615814209, "adv_min": -0.9670692682266235, "adv_max": 1.3701462745666504, "comp_oracle_mean": 0.0, "comp_moods_chained_mean": 40.549284680594226, "comp_kd_mean": 0.0, "comp_total_mean": 40.549284680594226, "_algo": "dapo", "_lora_r": 16, "_peak_lr": 0.001, "_temperature": 1.0, "_seq_len_mean": 360.0}
|
| 8 |
+
{"rl_step": 35, "loss": 1.7881393432617188e-07, "mean_return": 32.84033203125, "max_return": 49.41720199584961, "mean_motif_chained": 32.84033064284098, "gnorm": 0.11181640625, "elapsed_s": 260.53619480133057, "cell_type": "Ex", "edit_type": "promoter_retarget", "target_tf": "MEF2C", "kd_active": false, "kd_tf": "", "kd_score_mean": 0.0, "ratio_mean": 1.0, "ratio_min": 1.0, "ratio_max": 1.0, "log_ratio_mean": 0.0, "adv_mean": -1.7881393432617188e-07, "adv_std": 0.9999999403953552, "adv_min": -1.1517488956451416, "adv_max": 1.2461538314819336, "comp_oracle_mean": 0.0, "comp_moods_chained_mean": 32.84033064284098, "comp_kd_mean": 0.0, "comp_total_mean": 32.84033064284098, "_algo": "dapo", "_lora_r": 16, "_peak_lr": 0.001, "_temperature": 1.0, "_seq_len_mean": 360.0}
|
| 9 |
+
{"rl_step": 40, "loss": 5.960464477539063e-08, "mean_return": 36.70616149902344, "max_return": 51.92811965942383, "mean_motif_chained": 36.70616053359369, "gnorm": 0.1416015625, "elapsed_s": 297.4975643157959, "cell_type": "Oli", "edit_type": "promoter_retarget", "target_tf": "MYRF", "kd_active": false, "kd_tf": "", "kd_score_mean": 0.0, "ratio_mean": 1.0, "ratio_min": 1.0, "ratio_max": 1.0, "log_ratio_mean": 0.0, "adv_mean": -5.960464477539063e-08, "adv_std": 1.0, "adv_min": -0.9211280941963196, "adv_max": 1.2223496437072754, "comp_oracle_mean": 0.0, "comp_moods_chained_mean": 36.70616053359369, "comp_kd_mean": 0.0, "comp_total_mean": 36.70616053359369, "_algo": "dapo", "_lora_r": 16, "_peak_lr": 0.001, "_temperature": 1.0, "_seq_len_mean": 360.0}
|
| 10 |
+
{"rl_step": 45, "loss": 1.043081283569336e-07, "mean_return": 45.47503662109375, "max_return": 60.75269317626953, "mean_motif_chained": 45.47503528543021, "gnorm": 0.1484375, "elapsed_s": 333.85710406303406, "cell_type": "Ex", "edit_type": "activity_boost", "target_tf": "NEUROD2", "kd_active": false, "kd_tf": "", "kd_score_mean": 0.0, "ratio_mean": 1.0, "ratio_min": 1.0, "ratio_max": 1.0, "log_ratio_mean": 0.0, "adv_mean": -1.043081283569336e-07, "adv_std": 0.9999999403953552, "adv_min": -1.1467622518539429, "adv_max": 1.1555391550064087, "comp_oracle_mean": 0.0, "comp_moods_chained_mean": 45.47503528543021, "comp_kd_mean": 0.0, "comp_total_mean": 45.47503528543021, "_algo": "dapo", "_lora_r": 16, "_peak_lr": 0.001, "_temperature": 1.0, "_seq_len_mean": 360.0}
|
| 11 |
+
{"rl_step": 50, "loss": -1.341104507446289e-07, "mean_return": 24.33313751220703, "max_return": 39.897525787353516, "mean_motif_chained": 24.333138769158488, "gnorm": 0.232421875, "elapsed_s": 370.4064428806305, "cell_type": "Mic", "edit_type": "promoter_retarget", "target_tf": "RUNX1", "kd_active": false, "kd_tf": "", "kd_score_mean": 0.0, "ratio_mean": 1.0, "ratio_min": 1.0, "ratio_max": 1.0, "log_ratio_mean": 0.0, "adv_mean": 1.341104507446289e-07, "adv_std": 0.9999999403953552, "adv_min": -0.9116485118865967, "adv_max": 1.338451623916626, "comp_oracle_mean": 0.0, "comp_moods_chained_mean": 24.333138769158488, "comp_kd_mean": 0.0, "comp_total_mean": 24.333138769158488, "_algo": "dapo", "_lora_r": 16, "_peak_lr": 0.001, "_temperature": 1.0, "_seq_len_mean": 360.0}
|
| 12 |
+
{"rl_step": 55, "loss": 2.9802322387695312e-08, "mean_return": 39.22856521606445, "max_return": 56.620662689208984, "mean_motif_chained": 39.22856492639096, "gnorm": 0.1396484375, "elapsed_s": 407.5169348716736, "cell_type": "Mic", "edit_type": "promoter_retarget", "target_tf": "RUNX1", "kd_active": false, "kd_tf": "", "kd_score_mean": 0.0, "ratio_mean": 1.0, "ratio_min": 1.0, "ratio_max": 1.0, "log_ratio_mean": 0.0, "adv_mean": -2.9802322387695312e-08, "adv_std": 0.9999998807907104, "adv_min": -1.3001314401626587, "adv_max": 1.1267943382263184, "comp_oracle_mean": 0.0, "comp_moods_chained_mean": 39.22856492639096, "comp_kd_mean": 0.0, "comp_total_mean": 39.22856492639096, "_algo": "dapo", "_lora_r": 16, "_peak_lr": 0.001, "_temperature": 1.0, "_seq_len_mean": 360.0}
|
| 13 |
+
{"rl_step": 60, "loss": 1.2665987014770508e-07, "mean_return": 32.38032150268555, "max_return": 42.39067840576172, "mean_motif_chained": 32.38032061829972, "gnorm": 0.1123046875, "elapsed_s": 444.922935962677, "cell_type": "Ex", "edit_type": "promoter_retarget", "target_tf": "NEUROD2", "kd_active": false, "kd_tf": "", "kd_score_mean": 0.0, "ratio_mean": 1.0, "ratio_min": 1.0, "ratio_max": 1.0, "log_ratio_mean": 0.0, "adv_mean": -1.2665987014770508e-07, "adv_std": 0.9999998807907104, "adv_min": -0.947345495223999, "adv_max": 1.3663780689239502, "comp_oracle_mean": 0.0, "comp_moods_chained_mean": 32.38032061829972, "comp_kd_mean": 0.0, "comp_total_mean": 32.38032061829972, "_algo": "dapo", "_lora_r": 16, "_peak_lr": 0.001, "_temperature": 1.0, "_seq_len_mean": 360.0}
|
| 14 |
+
{"rl_step": 65, "loss": -4.470348358154297e-08, "mean_return": 28.513185501098633, "max_return": 45.1795539855957, "mean_motif_chained": 28.51318662235571, "gnorm": 0.1767578125, "elapsed_s": 482.9289994239807, "cell_type": "Oli", "edit_type": "promoter_retarget", "target_tf": "OLIG2", "kd_active": false, "kd_tf": "", "kd_score_mean": 0.0, "ratio_mean": 1.0, "ratio_min": 1.0, "ratio_max": 1.0, "log_ratio_mean": 0.0, "adv_mean": 4.470348358154297e-08, "adv_std": 0.9999999403953552, "adv_min": -1.1510087251663208, "adv_max": 0.9638814926147461, "comp_oracle_mean": 0.0, "comp_moods_chained_mean": 28.51318662235571, "comp_kd_mean": 0.0, "comp_total_mean": 28.51318662235571, "_algo": "dapo", "_lora_r": 16, "_peak_lr": 0.001, "_temperature": 1.0, "_seq_len_mean": 360.0}
|
| 15 |
+
{"rl_step": 70, "loss": -0.0, "mean_return": 46.2489013671875, "max_return": 62.85711669921875, "mean_motif_chained": 46.24890008635546, "gnorm": 0.2216796875, "elapsed_s": 520.349809885025, "cell_type": "Ex", "edit_type": "promoter_retarget", "target_tf": "RORB", "kd_active": false, "kd_tf": "", "kd_score_mean": 0.0, "ratio_mean": 1.0, "ratio_min": 1.0, "ratio_max": 1.0, "log_ratio_mean": 0.0, "adv_mean": 0.0, "adv_std": 0.9999998807907104, "adv_min": -1.4346280097961426, "adv_max": 0.8881332874298096, "comp_oracle_mean": 0.0, "comp_moods_chained_mean": 46.24890008635546, "comp_kd_mean": 0.0, "comp_total_mean": 46.24890008635546, "_algo": "dapo", "_lora_r": 16, "_peak_lr": 0.001, "_temperature": 1.0, "_seq_len_mean": 360.0}
|
| 16 |
+
{"rl_step": 75, "loss": 1.4901161193847656e-07, "mean_return": 42.725440979003906, "max_return": 49.192169189453125, "mean_motif_chained": 42.72543989580817, "gnorm": 0.177734375, "elapsed_s": 557.3783333301544, "cell_type": "Mic", "edit_type": "activity_boost", "target_tf": "CEBPA", "kd_active": false, "kd_tf": "", "kd_score_mean": 0.0, "ratio_mean": 1.0, "ratio_min": 1.0, "ratio_max": 1.0, "log_ratio_mean": 0.0, "adv_mean": -1.4901161193847656e-07, "adv_std": 0.9999997615814209, "adv_min": -1.2733920812606812, "adv_max": 1.0388745069503784, "comp_oracle_mean": 0.0, "comp_moods_chained_mean": 42.72543989580817, "comp_kd_mean": 0.0, "comp_total_mean": 42.72543989580817, "_algo": "dapo", "_lora_r": 16, "_peak_lr": 0.001, "_temperature": 1.0, "_seq_len_mean": 360.0}
|
| 17 |
+
{"rl_step": 80, "loss": -1.043081283569336e-07, "mean_return": 42.389930725097656, "max_return": 55.240562438964844, "mean_motif_chained": 42.38993268713916, "gnorm": 0.259765625, "elapsed_s": 594.0069422721863, "cell_type": "Ex", "edit_type": "cell_type_transfer", "target_tf": "NKX2-2", "kd_active": false, "kd_tf": "", "kd_score_mean": 0.0, "ratio_mean": 1.0, "ratio_min": 1.0, "ratio_max": 1.0, "log_ratio_mean": 0.0, "adv_mean": 1.043081283569336e-07, "adv_std": 0.9999999403953552, "adv_min": -0.8058874607086182, "adv_max": 1.3234950304031372, "comp_oracle_mean": 0.0, "comp_moods_chained_mean": 42.38993268713916, "comp_kd_mean": 0.0, "comp_total_mean": 42.38993268713916, "_algo": "dapo", "_lora_r": 16, "_peak_lr": 0.001, "_temperature": 1.0, "_seq_len_mean": 360.0}
|
| 18 |
+
{"rl_step": 85, "loss": -0.0, "mean_return": 59.21550750732422, "max_return": 92.17793273925781, "mean_motif_chained": 59.215506493992194, "gnorm": 0.28515625, "elapsed_s": 630.4412500858307, "cell_type": "OPC", "edit_type": "promoter_retarget", "target_tf": "ASCL1", "kd_active": false, "kd_tf": "", "kd_score_mean": 0.0, "ratio_mean": 1.0, "ratio_min": 1.0, "ratio_max": 1.0, "log_ratio_mean": 0.0, "adv_mean": 0.0, "adv_std": 0.9999998211860657, "adv_min": -1.1254518032073975, "adv_max": 1.1994051933288574, "comp_oracle_mean": 0.0, "comp_moods_chained_mean": 59.215506493992194, "comp_kd_mean": 0.0, "comp_total_mean": 59.215506493992194, "_algo": "dapo", "_lora_r": 16, "_peak_lr": 0.001, "_temperature": 1.0, "_seq_len_mean": 360.0}
|
| 19 |
+
{"rl_step": 90, "loss": -4.76837158203125e-07, "mean_return": 38.84468078613281, "max_return": 47.63869094848633, "mean_motif_chained": 38.84468395100568, "gnorm": 0.138671875, "elapsed_s": 666.784975528717, "cell_type": "Mic", "edit_type": "cell_type_transfer", "target_tf": "SOX10", "kd_active": false, "kd_tf": "", "kd_score_mean": 0.0, "ratio_mean": 1.0, "ratio_min": 1.0, "ratio_max": 1.0, "log_ratio_mean": 0.0, "adv_mean": 4.76837158203125e-07, "adv_std": 0.9999998807907104, "adv_min": -0.6631073355674744, "adv_max": 1.4724586009979248, "comp_oracle_mean": 0.0, "comp_moods_chained_mean": 38.84468395100568, "comp_kd_mean": 0.0, "comp_total_mean": 38.84468395100568, "_algo": "dapo", "_lora_r": 16, "_peak_lr": 0.001, "_temperature": 1.0, "_seq_len_mean": 360.0}
|
| 20 |
+
{"rl_step": 95, "loss": -9.685754776000977e-08, "mean_return": 46.53289794921875, "max_return": 85.36104583740234, "mean_motif_chained": 46.532900120466664, "gnorm": 0.240234375, "elapsed_s": 702.909586429596, "cell_type": "Oli", "edit_type": "activity_boost", "target_tf": "MYRF", "kd_active": false, "kd_tf": "", "kd_score_mean": 0.0, "ratio_mean": 1.0, "ratio_min": 1.0, "ratio_max": 1.0, "log_ratio_mean": 0.0, "adv_mean": 9.685754776000977e-08, "adv_std": 0.9999998211860657, "adv_min": -0.928704559803009, "adv_max": 1.3809423446655273, "comp_oracle_mean": 0.0, "comp_moods_chained_mean": 46.532900120466664, "comp_kd_mean": 0.0, "comp_total_mean": 46.532900120466664, "_algo": "dapo", "_lora_r": 16, "_peak_lr": 0.001, "_temperature": 1.0, "_seq_len_mean": 360.0}
|
| 21 |
+
{"rl_step": 100, "loss": 2.3096799850463867e-07, "mean_return": 24.129215240478516, "max_return": 30.150617599487305, "mean_motif_chained": 24.12921394113899, "gnorm": 0.26171875, "elapsed_s": 739.0724713802338, "cell_type": "In", "edit_type": "promoter_retarget", "target_tf": "DLX1", "kd_active": false, "kd_tf": "", "kd_score_mean": 0.0, "ratio_mean": 1.0, "ratio_min": 1.0, "ratio_max": 1.0, "log_ratio_mean": 0.0, "adv_mean": -2.3096799850463867e-07, "adv_std": 0.9999997615814209, "adv_min": -1.372074007987976, "adv_max": 0.9763869047164917, "comp_oracle_mean": 0.0, "comp_moods_chained_mean": 24.12921394113899, "comp_kd_mean": 0.0, "comp_total_mean": 24.12921394113899, "_algo": "dapo", "_lora_r": 16, "_peak_lr": 0.001, "_temperature": 1.0, "_seq_len_mean": 360.0}
|
| 22 |
+
{"rl_step": 105, "loss": -2.384185791015625e-07, "mean_return": 51.324195861816406, "max_return": 59.99216079711914, "mean_motif_chained": 51.32419734369594, "gnorm": 0.3125, "elapsed_s": 775.8290510177612, "cell_type": "Ast", "edit_type": "activity_boost", "target_tf": "AP1", "kd_active": false, "kd_tf": "", "kd_score_mean": 0.0, "ratio_mean": 1.0, "ratio_min": 1.0, "ratio_max": 1.0, "log_ratio_mean": 0.0, "adv_mean": 2.384185791015625e-07, "adv_std": 0.9999998807907104, "adv_min": -1.331211805343628, "adv_max": 1.0145814418792725, "comp_oracle_mean": 0.0, "comp_moods_chained_mean": 51.32419734369594, "comp_kd_mean": 0.0, "comp_total_mean": 51.32419734369594, "_algo": "dapo", "_lora_r": 16, "_peak_lr": 0.001, "_temperature": 1.0, "_seq_len_mean": 360.0}
|
| 23 |
+
{"rl_step": 110, "loss": -8.940696716308594e-08, "mean_return": 70.55686950683594, "max_return": 104.18077850341797, "mean_motif_chained": 70.55687218332696, "gnorm": 0.21875, "elapsed_s": 814.7958242893219, "cell_type": "Mic", "edit_type": "promoter_retarget", "target_tf": "IRF8", "kd_active": false, "kd_tf": "", "kd_score_mean": 0.0, "ratio_mean": 1.0, "ratio_min": 1.0, "ratio_max": 1.0, "log_ratio_mean": 0.0, "adv_mean": 8.940696716308594e-08, "adv_std": 0.9999999403953552, "adv_min": -0.892095685005188, "adv_max": 0.893398642539978, "comp_oracle_mean": 0.0, "comp_moods_chained_mean": 70.55687218332696, "comp_kd_mean": 0.0, "comp_total_mean": 70.55687218332696, "_algo": "dapo", "_lora_r": 16, "_peak_lr": 0.001, "_temperature": 1.0, "_seq_len_mean": 360.0}
|
| 24 |
+
{"rl_step": 115, "loss": -0.0, "mean_return": 43.121604919433594, "max_return": 90.06135559082031, "mean_motif_chained": 43.12160589628096, "gnorm": 0.373046875, "elapsed_s": 851.6169369220734, "cell_type": "Ex", "edit_type": "cell_type_transfer", "target_tf": "IRF8", "kd_active": false, "kd_tf": "", "kd_score_mean": 0.0, "ratio_mean": 1.0, "ratio_min": 1.0, "ratio_max": 1.0, "log_ratio_mean": 0.0, "adv_mean": 0.0, "adv_std": 1.0, "adv_min": -0.8088356256484985, "adv_max": 1.4287946224212646, "comp_oracle_mean": 0.0, "comp_moods_chained_mean": 43.12160589628096, "comp_kd_mean": 0.0, "comp_total_mean": 43.12160589628096, "_algo": "dapo", "_lora_r": 16, "_peak_lr": 0.001, "_temperature": 1.0, "_seq_len_mean": 360.0}
|
| 25 |
+
{"rl_step": 120, "loss": -2.9802322387695312e-08, "mean_return": 46.48229217529297, "max_return": 72.98858642578125, "mean_motif_chained": 46.48229314457069, "gnorm": 0.412109375, "elapsed_s": 889.0976283550262, "cell_type": "Mic", "edit_type": "cell_type_transfer", "target_tf": "LHX6", "kd_active": false, "kd_tf": "", "kd_score_mean": 0.0, "ratio_mean": 1.0, "ratio_min": 1.0, "ratio_max": 1.0, "log_ratio_mean": 0.0, "adv_mean": 2.9802322387695312e-08, "adv_std": 0.9999999403953552, "adv_min": -1.1962825059890747, "adv_max": 1.168035864830017, "comp_oracle_mean": 0.0, "comp_moods_chained_mean": 46.48229314457069, "comp_kd_mean": 0.0, "comp_total_mean": 46.48229314457069, "_algo": "dapo", "_lora_r": 16, "_peak_lr": 0.001, "_temperature": 1.0, "_seq_len_mean": 360.0}
|
| 26 |
+
{"rl_step": 125, "loss": -7.450580596923828e-08, "mean_return": 59.208274841308594, "max_return": 78.99787902832031, "mean_motif_chained": 59.20827522557693, "gnorm": 0.2490234375, "elapsed_s": 927.0252113342285, "cell_type": "Ex", "edit_type": "activity_boost", "target_tf": "RORB", "kd_active": false, "kd_tf": "", "kd_score_mean": 0.0, "ratio_mean": 1.0, "ratio_min": 1.0, "ratio_max": 1.0, "log_ratio_mean": 0.0, "adv_mean": 7.450580596923828e-08, "adv_std": 1.0, "adv_min": -0.8600803017616272, "adv_max": 1.4450323581695557, "comp_oracle_mean": 0.0, "comp_moods_chained_mean": 59.20827522557693, "comp_kd_mean": 0.0, "comp_total_mean": 59.20827522557693, "_algo": "dapo", "_lora_r": 16, "_peak_lr": 0.001, "_temperature": 1.0, "_seq_len_mean": 360.0}
|
| 27 |
+
{"rl_step": 130, "loss": 1.4901161193847656e-07, "mean_return": 44.04701232910156, "max_return": 68.14128875732422, "mean_motif_chained": 44.047010258253714, "gnorm": 0.4140625, "elapsed_s": 964.5458176136017, "cell_type": "Ast", "edit_type": "cell_type_transfer", "target_tf": "SPI1", "kd_active": false, "kd_tf": "", "kd_score_mean": 0.0, "ratio_mean": 1.0, "ratio_min": 1.0, "ratio_max": 1.0, "log_ratio_mean": 0.0, "adv_mean": -1.4901161193847656e-07, "adv_std": 0.9999998807907104, "adv_min": -0.7529813051223755, "adv_max": 1.423538088798523, "comp_oracle_mean": 0.0, "comp_moods_chained_mean": 44.047010258253714, "comp_kd_mean": 0.0, "comp_total_mean": 44.047010258253714, "_algo": "dapo", "_lora_r": 16, "_peak_lr": 0.001, "_temperature": 1.0, "_seq_len_mean": 360.0}
|
| 28 |
+
{"rl_step": 135, "loss": 1.7881393432617188e-07, "mean_return": 48.508934020996094, "max_return": 77.33578491210938, "mean_motif_chained": 48.508929490268436, "gnorm": 0.365234375, "elapsed_s": 1002.9293892383575, "cell_type": "Mic", "edit_type": "activity_boost", "target_tf": "IRF8", "kd_active": false, "kd_tf": "", "kd_score_mean": 0.0, "ratio_mean": 1.0, "ratio_min": 1.0, "ratio_max": 1.0, "log_ratio_mean": 0.0, "adv_mean": -1.7881393432617188e-07, "adv_std": 0.9999998211860657, "adv_min": -1.0128217935562134, "adv_max": 1.3740713596343994, "comp_oracle_mean": 0.0, "comp_moods_chained_mean": 48.508929490268436, "comp_kd_mean": 0.0, "comp_total_mean": 48.508929490268436, "_algo": "dapo", "_lora_r": 16, "_peak_lr": 0.001, "_temperature": 1.0, "_seq_len_mean": 360.0}
|
| 29 |
+
{"rl_step": 140, "loss": -2.980232238769531e-07, "mean_return": 54.953033447265625, "max_return": 64.03836822509766, "mean_motif_chained": 54.95303715103171, "gnorm": 0.2734375, "elapsed_s": 1040.5540609359741, "cell_type": "Mic", "edit_type": "activity_boost", "target_tf": "CEBPA", "kd_active": false, "kd_tf": "", "kd_score_mean": 0.0, "ratio_mean": 1.0, "ratio_min": 1.0, "ratio_max": 1.0, "log_ratio_mean": 0.0, "adv_mean": 2.980232238769531e-07, "adv_std": 0.9999999403953552, "adv_min": -1.384497880935669, "adv_max": 1.001049280166626, "comp_oracle_mean": 0.0, "comp_moods_chained_mean": 54.95303715103171, "comp_kd_mean": 0.0, "comp_total_mean": 54.95303715103171, "_algo": "dapo", "_lora_r": 16, "_peak_lr": 0.001, "_temperature": 1.0, "_seq_len_mean": 360.0}
|
| 30 |
+
{"rl_step": 145, "loss": 1.1920928955078125e-07, "mean_return": 55.28999710083008, "max_return": 75.73579406738281, "mean_motif_chained": 55.2899957212232, "gnorm": 0.3125, "elapsed_s": 1078.9078576564789, "cell_type": "Oli", "edit_type": "activity_boost", "target_tf": "SOX10", "kd_active": false, "kd_tf": "", "kd_score_mean": 0.0, "ratio_mean": 1.0, "ratio_min": 1.0, "ratio_max": 1.0, "log_ratio_mean": 0.0, "adv_mean": -1.1920928955078125e-07, "adv_std": 0.9999998807907104, "adv_min": -0.8232386708259583, "adv_max": 1.2419527769088745, "comp_oracle_mean": 0.0, "comp_moods_chained_mean": 55.2899957212232, "comp_kd_mean": 0.0, "comp_total_mean": 55.2899957212232, "_algo": "dapo", "_lora_r": 16, "_peak_lr": 0.001, "_temperature": 1.0, "_seq_len_mean": 360.0}
|
| 31 |
+
{"rl_step": 150, "loss": -2.9802322387695312e-08, "mean_return": 27.804468154907227, "max_return": 48.50688934326172, "mean_motif_chained": 27.804468673484706, "gnorm": 0.3359375, "elapsed_s": 1114.158706188202, "cell_type": "In", "edit_type": "cell_type_transfer", "target_tf": "NEUROD2", "kd_active": false, "kd_tf": "", "kd_score_mean": 0.0, "ratio_mean": 1.0, "ratio_min": 1.0, "ratio_max": 1.0, "log_ratio_mean": 0.0, "adv_mean": 2.9802322387695312e-08, "adv_std": 0.9999999403953552, "adv_min": -0.990084171295166, "adv_max": 1.125234842300415, "comp_oracle_mean": 0.0, "comp_moods_chained_mean": 27.804468673484706, "comp_kd_mean": 0.0, "comp_total_mean": 27.804468673484706, "_algo": "dapo", "_lora_r": 16, "_peak_lr": 0.001, "_temperature": 1.0, "_seq_len_mean": 360.0}
|
| 32 |
+
{"rl_step": 155, "loss": -2.086162567138672e-07, "mean_return": 46.13496398925781, "max_return": 67.52181243896484, "mean_motif_chained": 46.13496631101523, "gnorm": 0.32421875, "elapsed_s": 1148.5968759059906, "cell_type": "Ex", "edit_type": "promoter_retarget", "target_tf": "MEF2C", "kd_active": false, "kd_tf": "", "kd_score_mean": 0.0, "ratio_mean": 1.0, "ratio_min": 1.0, "ratio_max": 1.0, "log_ratio_mean": 0.0, "adv_mean": 2.086162567138672e-07, "adv_std": 1.0, "adv_min": -0.8153027296066284, "adv_max": 1.4536041021347046, "comp_oracle_mean": 0.0, "comp_moods_chained_mean": 46.13496631101523, "comp_kd_mean": 0.0, "comp_total_mean": 46.13496631101523, "_algo": "dapo", "_lora_r": 16, "_peak_lr": 0.001, "_temperature": 1.0, "_seq_len_mean": 360.0}
|
| 33 |
+
{"rl_step": 160, "loss": 1.4901161193847656e-07, "mean_return": 40.80091094970703, "max_return": 53.82844543457031, "mean_motif_chained": 40.80091051123867, "gnorm": 0.345703125, "elapsed_s": 1182.2681486606598, "cell_type": "Ast", "edit_type": "activity_boost", "target_tf": "SOX9", "kd_active": false, "kd_tf": "", "kd_score_mean": 0.0, "ratio_mean": 1.0, "ratio_min": 1.0, "ratio_max": 1.0, "log_ratio_mean": 0.0, "adv_mean": -1.4901161193847656e-07, "adv_std": 0.9999997615814209, "adv_min": -0.9679352045059204, "adv_max": 1.396469235420227, "comp_oracle_mean": 0.0, "comp_moods_chained_mean": 40.80091051123867, "comp_kd_mean": 0.0, "comp_total_mean": 40.80091051123867, "_algo": "dapo", "_lora_r": 16, "_peak_lr": 0.001, "_temperature": 1.0, "_seq_len_mean": 360.0}
|
| 34 |
+
{"rl_step": 165, "loss": -8.940696716308594e-08, "mean_return": 49.48456573486328, "max_return": 56.938079833984375, "mean_motif_chained": 49.48456597316098, "gnorm": 0.384765625, "elapsed_s": 1216.2751863002777, "cell_type": "OPC", "edit_type": "cell_type_transfer", "target_tf": "NKX2-2", "kd_active": false, "kd_tf": "", "kd_score_mean": 0.0, "ratio_mean": 1.0, "ratio_min": 1.0, "ratio_max": 1.0, "log_ratio_mean": 0.0, "adv_mean": 8.940696716308594e-08, "adv_std": 0.9999999403953552, "adv_min": -1.3848445415496826, "adv_max": 0.9367080330848694, "comp_oracle_mean": 0.0, "comp_moods_chained_mean": 49.48456597316098, "comp_kd_mean": 0.0, "comp_total_mean": 49.48456597316098, "_algo": "dapo", "_lora_r": 16, "_peak_lr": 0.001, "_temperature": 1.0, "_seq_len_mean": 360.0}
|
| 35 |
+
{"rl_step": 170, "loss": -2.682209014892578e-07, "mean_return": 37.35772705078125, "max_return": 47.428680419921875, "mean_motif_chained": 37.357729289405746, "gnorm": 0.65234375, "elapsed_s": 1249.9420504570007, "cell_type": "Ast", "edit_type": "activity_boost", "target_tf": "AP1", "kd_active": false, "kd_tf": "", "kd_score_mean": 0.0, "ratio_mean": 1.0, "ratio_min": 1.0, "ratio_max": 1.0, "log_ratio_mean": 0.0, "adv_mean": 2.682209014892578e-07, "adv_std": 0.9999997615814209, "adv_min": -0.9231137633323669, "adv_max": 1.3568212985992432, "comp_oracle_mean": 0.0, "comp_moods_chained_mean": 37.357729289405746, "comp_kd_mean": 0.0, "comp_total_mean": 37.357729289405746, "_algo": "dapo", "_lora_r": 16, "_peak_lr": 0.001, "_temperature": 1.0, "_seq_len_mean": 360.0}
|
| 36 |
+
{"rl_step": 175, "loss": -8.940696716308594e-08, "mean_return": 44.901248931884766, "max_return": 51.924049377441406, "mean_motif_chained": 44.90124975610763, "gnorm": 0.53125, "elapsed_s": 1283.734236240387, "cell_type": "Oli", "edit_type": "activity_boost", "target_tf": "MYRF", "kd_active": false, "kd_tf": "", "kd_score_mean": 0.0, "ratio_mean": 1.0, "ratio_min": 1.0, "ratio_max": 1.0, "log_ratio_mean": 0.0, "adv_mean": 8.940696716308594e-08, "adv_std": 1.0, "adv_min": -1.482351541519165, "adv_max": 0.66951984167099, "comp_oracle_mean": 0.0, "comp_moods_chained_mean": 44.90124975610763, "comp_kd_mean": 0.0, "comp_total_mean": 44.90124975610763, "_algo": "dapo", "_lora_r": 16, "_peak_lr": 0.001, "_temperature": 1.0, "_seq_len_mean": 360.0}
|
| 37 |
+
{"rl_step": 180, "loss": 1.4901161193847656e-08, "mean_return": 30.220346450805664, "max_return": 48.46043395996094, "mean_motif_chained": 30.220345388361732, "gnorm": 0.60546875, "elapsed_s": 1317.344004869461, "cell_type": "In", "edit_type": "promoter_retarget", "target_tf": "DLX1", "kd_active": false, "kd_tf": "", "kd_score_mean": 0.0, "ratio_mean": 1.0, "ratio_min": 1.0, "ratio_max": 1.0, "log_ratio_mean": 0.0, "adv_mean": -1.4901161193847656e-08, "adv_std": 0.9999998807907104, "adv_min": -0.9046291708946228, "adv_max": 1.3899037837982178, "comp_oracle_mean": 0.0, "comp_moods_chained_mean": 30.220345388361732, "comp_kd_mean": 0.0, "comp_total_mean": 30.220345388361732, "_algo": "dapo", "_lora_r": 16, "_peak_lr": 0.001, "_temperature": 1.0, "_seq_len_mean": 360.0}
|
| 38 |
+
{"rl_step": 185, "loss": -1.1920928955078125e-07, "mean_return": 72.67106628417969, "max_return": 103.13460540771484, "mean_motif_chained": 72.67106884187494, "gnorm": 0.546875, "elapsed_s": 1351.0927710533142, "cell_type": "In", "edit_type": "activity_boost", "target_tf": "SOX6", "kd_active": false, "kd_tf": "", "kd_score_mean": 0.0, "ratio_mean": 1.0, "ratio_min": 1.0, "ratio_max": 1.0, "log_ratio_mean": 0.0, "adv_mean": 1.1920928955078125e-07, "adv_std": 0.9999999403953552, "adv_min": -0.8318790197372437, "adv_max": 1.330163836479187, "comp_oracle_mean": 0.0, "comp_moods_chained_mean": 72.67106884187494, "comp_kd_mean": 0.0, "comp_total_mean": 72.67106884187494, "_algo": "dapo", "_lora_r": 16, "_peak_lr": 0.001, "_temperature": 1.0, "_seq_len_mean": 360.0}
|
| 39 |
+
{"rl_step": 190, "loss": -1.1920928955078125e-07, "mean_return": 34.59965133666992, "max_return": 46.39754867553711, "mean_motif_chained": 34.59965235496295, "gnorm": 0.6796875, "elapsed_s": 1385.0080964565277, "cell_type": "Ast", "edit_type": "promoter_retarget", "target_tf": "AP1", "kd_active": false, "kd_tf": "", "kd_score_mean": 0.0, "ratio_mean": 1.0, "ratio_min": 1.0, "ratio_max": 1.0, "log_ratio_mean": 0.0, "adv_mean": 1.1920928955078125e-07, "adv_std": 0.9999998807907104, "adv_min": -1.219651460647583, "adv_max": 1.1826673746109009, "comp_oracle_mean": 0.0, "comp_moods_chained_mean": 34.59965235496295, "comp_kd_mean": 0.0, "comp_total_mean": 34.59965235496295, "_algo": "dapo", "_lora_r": 16, "_peak_lr": 0.001, "_temperature": 1.0, "_seq_len_mean": 360.0}
|
| 40 |
+
{"rl_step": 195, "loss": -6.705522537231445e-08, "mean_return": 43.1016845703125, "max_return": 61.16847229003906, "mean_motif_chained": 43.101686077501434, "gnorm": 0.46875, "elapsed_s": 1418.6783912181854, "cell_type": "Ex", "edit_type": "promoter_retarget", "target_tf": "RORB", "kd_active": false, "kd_tf": "", "kd_score_mean": 0.0, "ratio_mean": 1.0, "ratio_min": 1.0, "ratio_max": 1.0, "log_ratio_mean": 0.0, "adv_mean": 6.705522537231445e-08, "adv_std": 0.9999999403953552, "adv_min": -0.9156190156936646, "adv_max": 1.3700538873672485, "comp_oracle_mean": 0.0, "comp_moods_chained_mean": 43.101686077501434, "comp_kd_mean": 0.0, "comp_total_mean": 43.101686077501434, "_algo": "dapo", "_lora_r": 16, "_peak_lr": 0.001, "_temperature": 1.0, "_seq_len_mean": 360.0}
|
| 41 |
+
{"rl_step": 200, "loss": 4.470348358154297e-08, "mean_return": 52.83843994140625, "max_return": 88.10202026367188, "mean_motif_chained": 52.838438219610204, "gnorm": 0.65234375, "elapsed_s": 1452.4295673370361, "cell_type": "In", "edit_type": "activity_boost", "target_tf": "DLX1", "kd_active": false, "kd_tf": "", "kd_score_mean": 0.0, "ratio_mean": 1.0, "ratio_min": 1.0, "ratio_max": 1.0, "log_ratio_mean": 0.0, "adv_mean": -4.470348358154297e-08, "adv_std": 0.9999998807907104, "adv_min": -1.0425517559051514, "adv_max": 1.3638800382614136, "comp_oracle_mean": 0.0, "comp_moods_chained_mean": 52.838438219610204, "comp_kd_mean": 0.0, "comp_total_mean": 52.838438219610204, "_algo": "dapo", "_lora_r": 16, "_peak_lr": 0.001, "_temperature": 1.0, "_seq_len_mean": 360.0}
|