Upload exp_phase8_t3_rl_edit_tight_gspo_FIXED_s2_lr1e3_moods_20260506_131012/log.jsonl with huggingface_hub
Browse files
exp_phase8_t3_rl_edit_tight_gspo_FIXED_s2_lr1e3_moods_20260506_131012/log.jsonl
ADDED
|
@@ -0,0 +1,5 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{"rl_step": 1, "loss": 2.9802322387695312e-08, "mean_return": 34.26848220825195, "max_return": 58.57109832763672, "mean_motif_chained": 34.26848091665621, "gnorm": 0.0002422332763671875, "elapsed_s": 7.7574591636657715, "cell_type": "Ex", "edit_type": "cell_type_transfer", "target_tf": "ERG", "kd_active": false, "kd_tf": "", "kd_score_mean": 0.0, "ratio_mean": 1.0, "ratio_min": 1.0, "ratio_max": 1.0, "log_ratio_mean": 0.0, "adv_mean": -2.9802322387695312e-08, "adv_std": 0.9999998807907104, "adv_min": -0.7408204078674316, "adv_max": 1.4037067890167236, "comp_oracle_mean": 0.0, "comp_moods_chained_mean": 34.26848091665621, "comp_kd_mean": 0.0, "comp_total_mean": 34.26848091665621, "_algo": "gspo", "_lora_r": 16, "_peak_lr": 0.001, "_temperature": 1.0, "_seq_len_mean": 360.0}
|
| 2 |
+
{"rl_step": 5, "loss": 5.960464477539063e-08, "mean_return": 56.96424865722656, "max_return": 70.51972198486328, "mean_motif_chained": 56.964249189145654, "gnorm": 0.0002689361572265625, "elapsed_s": 34.85763669013977, "cell_type": "Mic", "edit_type": "activity_boost", "target_tf": "IRF8", "kd_active": false, "kd_tf": "", "kd_score_mean": 0.0, "ratio_mean": 1.0, "ratio_min": 1.0, "ratio_max": 1.0, "log_ratio_mean": 0.0, "adv_mean": -5.960464477539063e-08, "adv_std": 0.9999997615814209, "adv_min": -1.4188815355300903, "adv_max": 0.7671882510185242, "comp_oracle_mean": 0.0, "comp_moods_chained_mean": 56.964249189145654, "comp_kd_mean": 0.0, "comp_total_mean": 56.964249189145654, "_algo": "gspo", "_lora_r": 16, "_peak_lr": 0.001, "_temperature": 1.0, "_seq_len_mean": 360.0}
|
| 3 |
+
{"rl_step": 10, "loss": -8.940696716308594e-08, "mean_return": 40.52712631225586, "max_return": 70.56861877441406, "mean_motif_chained": 40.52712845319869, "gnorm": 0.0003662109375, "elapsed_s": 68.6683235168457, "cell_type": "In", "edit_type": "activity_boost", "target_tf": "SOX6", "kd_active": false, "kd_tf": "", "kd_score_mean": 0.0, "ratio_mean": 1.0, "ratio_min": 1.0, "ratio_max": 1.0, "log_ratio_mean": 0.0, "adv_mean": 8.940696716308594e-08, "adv_std": 0.9999999403953552, "adv_min": -0.7790347337722778, "adv_max": 1.4263747930526733, "comp_oracle_mean": 0.0, "comp_moods_chained_mean": 40.52712845319869, "comp_kd_mean": 0.0, "comp_total_mean": 40.52712845319869, "_algo": "gspo", "_lora_r": 16, "_peak_lr": 0.001, "_temperature": 1.0, "_seq_len_mean": 360.0}
|
| 4 |
+
{"rl_step": 15, "loss": -7.450580596923828e-09, "mean_return": 57.41878890991211, "max_return": 69.25961303710938, "mean_motif_chained": 57.41878762062366, "gnorm": 0.000286102294921875, "elapsed_s": 102.46044397354126, "cell_type": "In", "edit_type": "promoter_retarget", "target_tf": "SOX6", "kd_active": false, "kd_tf": "", "kd_score_mean": 0.0, "ratio_mean": 1.0, "ratio_min": 1.0, "ratio_max": 1.0, "log_ratio_mean": 0.0, "adv_mean": 7.450580596923828e-09, "adv_std": 0.9999998807907104, "adv_min": -0.9183567762374878, "adv_max": 1.4108411073684692, "comp_oracle_mean": 0.0, "comp_moods_chained_mean": 57.41878762062366, "comp_kd_mean": 0.0, "comp_total_mean": 57.41878762062366, "_algo": "gspo", "_lora_r": 16, "_peak_lr": 0.001, "_temperature": 1.0, "_seq_len_mean": 360.0}
|
| 5 |
+
{"rl_step": 20, "loss": -1.341104507446289e-07, "mean_return": 42.41632080078125, "max_return": 73.53028106689453, "mean_motif_chained": 42.41632480817796, "gnorm": 0.000278472900390625, "elapsed_s": 136.60211491584778, "cell_type": "Ast", "edit_type": "cell_type_transfer", "target_tf": "FLI1", "kd_active": false, "kd_tf": "", "kd_score_mean": 0.0, "ratio_mean": 1.0, "ratio_min": 1.0, "ratio_max": 1.0, "log_ratio_mean": 0.0, "adv_mean": 1.341104507446289e-07, "adv_std": 0.9999998807907104, "adv_min": -0.9195317029953003, "adv_max": 1.3465245962142944, "comp_oracle_mean": 0.0, "comp_moods_chained_mean": 42.41632480817796, "comp_kd_mean": 0.0, "comp_total_mean": 42.41632480817796, "_algo": "gspo", "_lora_r": 16, "_peak_lr": 0.001, "_temperature": 1.0, "_seq_len_mean": 360.0}
|