Upload folder using huggingface_hub
Browse files- .gitattributes +44 -0
- llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/0022000.pt +3 -0
- llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_10000/batch_0_cfg_7.5_topk_16384.jpg +3 -0
- llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_10000/batch_1_cfg_7.5_topk_16384.jpg +3 -0
- llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_10000/batch_2_cfg_7.5_topk_16384.jpg +3 -0
- llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_10000/batch_3_cfg_7.5_topk_16384.jpg +3 -0
- llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_12000/batch_0_cfg_7.5_topk_16384.jpg +3 -0
- llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_12000/batch_1_cfg_7.5_topk_16384.jpg +3 -0
- llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_12000/batch_2_cfg_7.5_topk_16384.jpg +3 -0
- llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_12000/batch_3_cfg_7.5_topk_16384.jpg +3 -0
- llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_14000/batch_0_cfg_7.5_topk_16384.jpg +3 -0
- llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_14000/batch_1_cfg_7.5_topk_16384.jpg +3 -0
- llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_14000/batch_2_cfg_7.5_topk_16384.jpg +3 -0
- llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_14000/batch_3_cfg_7.5_topk_16384.jpg +3 -0
- llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_16000/batch_0_cfg_7.5_topk_16384.jpg +3 -0
- llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_16000/batch_1_cfg_7.5_topk_16384.jpg +3 -0
- llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_16000/batch_2_cfg_7.5_topk_16384.jpg +3 -0
- llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_16000/batch_3_cfg_7.5_topk_16384.jpg +3 -0
- llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_18000/batch_0_cfg_7.5_topk_16384.jpg +3 -0
- llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_18000/batch_1_cfg_7.5_topk_16384.jpg +3 -0
- llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_18000/batch_2_cfg_7.5_topk_16384.jpg +3 -0
- llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_18000/batch_3_cfg_7.5_topk_16384.jpg +3 -0
- llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_2000/batch_0_cfg_7.5_topk_16384.jpg +3 -0
- llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_2000/batch_1_cfg_7.5_topk_16384.jpg +3 -0
- llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_2000/batch_2_cfg_7.5_topk_16384.jpg +3 -0
- llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_2000/batch_3_cfg_7.5_topk_16384.jpg +3 -0
- llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_20000/batch_0_cfg_7.5_topk_16384.jpg +3 -0
- llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_20000/batch_1_cfg_7.5_topk_16384.jpg +3 -0
- llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_20000/batch_2_cfg_7.5_topk_16384.jpg +3 -0
- llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_20000/batch_3_cfg_7.5_topk_16384.jpg +3 -0
- llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_22000/batch_0_cfg_7.5_topk_16384.jpg +3 -0
- llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_22000/batch_1_cfg_7.5_topk_16384.jpg +3 -0
- llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_22000/batch_2_cfg_7.5_topk_16384.jpg +3 -0
- llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_22000/batch_3_cfg_7.5_topk_16384.jpg +3 -0
- llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_4000/batch_0_cfg_7.5_topk_16384.jpg +3 -0
- llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_4000/batch_1_cfg_7.5_topk_16384.jpg +3 -0
- llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_4000/batch_2_cfg_7.5_topk_16384.jpg +3 -0
- llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_4000/batch_3_cfg_7.5_topk_16384.jpg +3 -0
- llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_6000/batch_0_cfg_7.5_topk_16384.jpg +3 -0
- llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_6000/batch_1_cfg_7.5_topk_16384.jpg +3 -0
- llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_6000/batch_2_cfg_7.5_topk_16384.jpg +3 -0
- llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_6000/batch_3_cfg_7.5_topk_16384.jpg +3 -0
- llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_8000/batch_0_cfg_7.5_topk_16384.jpg +3 -0
- llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_8000/batch_1_cfg_7.5_topk_16384.jpg +3 -0
- llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_8000/batch_2_cfg_7.5_topk_16384.jpg +3 -0
- llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_8000/batch_3_cfg_7.5_topk_16384.jpg +3 -0
- llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/log.txt +1005 -0
.gitattributes
CHANGED
|
@@ -33,3 +33,47 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
| 33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
| 36 |
+
llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_10000/batch_0_cfg_7.5_topk_16384.jpg filter=lfs diff=lfs merge=lfs -text
|
| 37 |
+
llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_10000/batch_1_cfg_7.5_topk_16384.jpg filter=lfs diff=lfs merge=lfs -text
|
| 38 |
+
llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_10000/batch_2_cfg_7.5_topk_16384.jpg filter=lfs diff=lfs merge=lfs -text
|
| 39 |
+
llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_10000/batch_3_cfg_7.5_topk_16384.jpg filter=lfs diff=lfs merge=lfs -text
|
| 40 |
+
llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_12000/batch_0_cfg_7.5_topk_16384.jpg filter=lfs diff=lfs merge=lfs -text
|
| 41 |
+
llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_12000/batch_1_cfg_7.5_topk_16384.jpg filter=lfs diff=lfs merge=lfs -text
|
| 42 |
+
llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_12000/batch_2_cfg_7.5_topk_16384.jpg filter=lfs diff=lfs merge=lfs -text
|
| 43 |
+
llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_12000/batch_3_cfg_7.5_topk_16384.jpg filter=lfs diff=lfs merge=lfs -text
|
| 44 |
+
llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_14000/batch_0_cfg_7.5_topk_16384.jpg filter=lfs diff=lfs merge=lfs -text
|
| 45 |
+
llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_14000/batch_1_cfg_7.5_topk_16384.jpg filter=lfs diff=lfs merge=lfs -text
|
| 46 |
+
llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_14000/batch_2_cfg_7.5_topk_16384.jpg filter=lfs diff=lfs merge=lfs -text
|
| 47 |
+
llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_14000/batch_3_cfg_7.5_topk_16384.jpg filter=lfs diff=lfs merge=lfs -text
|
| 48 |
+
llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_16000/batch_0_cfg_7.5_topk_16384.jpg filter=lfs diff=lfs merge=lfs -text
|
| 49 |
+
llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_16000/batch_1_cfg_7.5_topk_16384.jpg filter=lfs diff=lfs merge=lfs -text
|
| 50 |
+
llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_16000/batch_2_cfg_7.5_topk_16384.jpg filter=lfs diff=lfs merge=lfs -text
|
| 51 |
+
llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_16000/batch_3_cfg_7.5_topk_16384.jpg filter=lfs diff=lfs merge=lfs -text
|
| 52 |
+
llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_18000/batch_0_cfg_7.5_topk_16384.jpg filter=lfs diff=lfs merge=lfs -text
|
| 53 |
+
llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_18000/batch_1_cfg_7.5_topk_16384.jpg filter=lfs diff=lfs merge=lfs -text
|
| 54 |
+
llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_18000/batch_2_cfg_7.5_topk_16384.jpg filter=lfs diff=lfs merge=lfs -text
|
| 55 |
+
llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_18000/batch_3_cfg_7.5_topk_16384.jpg filter=lfs diff=lfs merge=lfs -text
|
| 56 |
+
llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_2000/batch_0_cfg_7.5_topk_16384.jpg filter=lfs diff=lfs merge=lfs -text
|
| 57 |
+
llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_2000/batch_1_cfg_7.5_topk_16384.jpg filter=lfs diff=lfs merge=lfs -text
|
| 58 |
+
llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_2000/batch_2_cfg_7.5_topk_16384.jpg filter=lfs diff=lfs merge=lfs -text
|
| 59 |
+
llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_2000/batch_3_cfg_7.5_topk_16384.jpg filter=lfs diff=lfs merge=lfs -text
|
| 60 |
+
llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_20000/batch_0_cfg_7.5_topk_16384.jpg filter=lfs diff=lfs merge=lfs -text
|
| 61 |
+
llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_20000/batch_1_cfg_7.5_topk_16384.jpg filter=lfs diff=lfs merge=lfs -text
|
| 62 |
+
llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_20000/batch_2_cfg_7.5_topk_16384.jpg filter=lfs diff=lfs merge=lfs -text
|
| 63 |
+
llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_20000/batch_3_cfg_7.5_topk_16384.jpg filter=lfs diff=lfs merge=lfs -text
|
| 64 |
+
llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_22000/batch_0_cfg_7.5_topk_16384.jpg filter=lfs diff=lfs merge=lfs -text
|
| 65 |
+
llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_22000/batch_1_cfg_7.5_topk_16384.jpg filter=lfs diff=lfs merge=lfs -text
|
| 66 |
+
llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_22000/batch_2_cfg_7.5_topk_16384.jpg filter=lfs diff=lfs merge=lfs -text
|
| 67 |
+
llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_22000/batch_3_cfg_7.5_topk_16384.jpg filter=lfs diff=lfs merge=lfs -text
|
| 68 |
+
llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_4000/batch_0_cfg_7.5_topk_16384.jpg filter=lfs diff=lfs merge=lfs -text
|
| 69 |
+
llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_4000/batch_1_cfg_7.5_topk_16384.jpg filter=lfs diff=lfs merge=lfs -text
|
| 70 |
+
llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_4000/batch_2_cfg_7.5_topk_16384.jpg filter=lfs diff=lfs merge=lfs -text
|
| 71 |
+
llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_4000/batch_3_cfg_7.5_topk_16384.jpg filter=lfs diff=lfs merge=lfs -text
|
| 72 |
+
llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_6000/batch_0_cfg_7.5_topk_16384.jpg filter=lfs diff=lfs merge=lfs -text
|
| 73 |
+
llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_6000/batch_1_cfg_7.5_topk_16384.jpg filter=lfs diff=lfs merge=lfs -text
|
| 74 |
+
llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_6000/batch_2_cfg_7.5_topk_16384.jpg filter=lfs diff=lfs merge=lfs -text
|
| 75 |
+
llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_6000/batch_3_cfg_7.5_topk_16384.jpg filter=lfs diff=lfs merge=lfs -text
|
| 76 |
+
llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_8000/batch_0_cfg_7.5_topk_16384.jpg filter=lfs diff=lfs merge=lfs -text
|
| 77 |
+
llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_8000/batch_1_cfg_7.5_topk_16384.jpg filter=lfs diff=lfs merge=lfs -text
|
| 78 |
+
llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_8000/batch_2_cfg_7.5_topk_16384.jpg filter=lfs diff=lfs merge=lfs -text
|
| 79 |
+
llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_8000/batch_3_cfg_7.5_topk_16384.jpg filter=lfs diff=lfs merge=lfs -text
|
llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/0022000.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5c0afa0cfb1ee30897264c085f3774c2af0ad3bf5a595510fd5d54e7b75a5fcb
|
| 3 |
+
size 6408374056
|
llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_10000/batch_0_cfg_7.5_topk_16384.jpg
ADDED
|
Git LFS Details
|
llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_10000/batch_1_cfg_7.5_topk_16384.jpg
ADDED
|
Git LFS Details
|
llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_10000/batch_2_cfg_7.5_topk_16384.jpg
ADDED
|
Git LFS Details
|
llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_10000/batch_3_cfg_7.5_topk_16384.jpg
ADDED
|
Git LFS Details
|
llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_12000/batch_0_cfg_7.5_topk_16384.jpg
ADDED
|
Git LFS Details
|
llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_12000/batch_1_cfg_7.5_topk_16384.jpg
ADDED
|
Git LFS Details
|
llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_12000/batch_2_cfg_7.5_topk_16384.jpg
ADDED
|
Git LFS Details
|
llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_12000/batch_3_cfg_7.5_topk_16384.jpg
ADDED
|
Git LFS Details
|
llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_14000/batch_0_cfg_7.5_topk_16384.jpg
ADDED
|
Git LFS Details
|
llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_14000/batch_1_cfg_7.5_topk_16384.jpg
ADDED
|
Git LFS Details
|
llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_14000/batch_2_cfg_7.5_topk_16384.jpg
ADDED
|
Git LFS Details
|
llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_14000/batch_3_cfg_7.5_topk_16384.jpg
ADDED
|
Git LFS Details
|
llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_16000/batch_0_cfg_7.5_topk_16384.jpg
ADDED
|
Git LFS Details
|
llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_16000/batch_1_cfg_7.5_topk_16384.jpg
ADDED
|
Git LFS Details
|
llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_16000/batch_2_cfg_7.5_topk_16384.jpg
ADDED
|
Git LFS Details
|
llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_16000/batch_3_cfg_7.5_topk_16384.jpg
ADDED
|
Git LFS Details
|
llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_18000/batch_0_cfg_7.5_topk_16384.jpg
ADDED
|
Git LFS Details
|
llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_18000/batch_1_cfg_7.5_topk_16384.jpg
ADDED
|
Git LFS Details
|
llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_18000/batch_2_cfg_7.5_topk_16384.jpg
ADDED
|
Git LFS Details
|
llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_18000/batch_3_cfg_7.5_topk_16384.jpg
ADDED
|
Git LFS Details
|
llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_2000/batch_0_cfg_7.5_topk_16384.jpg
ADDED
|
Git LFS Details
|
llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_2000/batch_1_cfg_7.5_topk_16384.jpg
ADDED
|
Git LFS Details
|
llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_2000/batch_2_cfg_7.5_topk_16384.jpg
ADDED
|
Git LFS Details
|
llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_2000/batch_3_cfg_7.5_topk_16384.jpg
ADDED
|
Git LFS Details
|
llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_20000/batch_0_cfg_7.5_topk_16384.jpg
ADDED
|
Git LFS Details
|
llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_20000/batch_1_cfg_7.5_topk_16384.jpg
ADDED
|
Git LFS Details
|
llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_20000/batch_2_cfg_7.5_topk_16384.jpg
ADDED
|
Git LFS Details
|
llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_20000/batch_3_cfg_7.5_topk_16384.jpg
ADDED
|
Git LFS Details
|
llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_22000/batch_0_cfg_7.5_topk_16384.jpg
ADDED
|
Git LFS Details
|
llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_22000/batch_1_cfg_7.5_topk_16384.jpg
ADDED
|
Git LFS Details
|
llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_22000/batch_2_cfg_7.5_topk_16384.jpg
ADDED
|
Git LFS Details
|
llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_22000/batch_3_cfg_7.5_topk_16384.jpg
ADDED
|
Git LFS Details
|
llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_4000/batch_0_cfg_7.5_topk_16384.jpg
ADDED
|
Git LFS Details
|
llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_4000/batch_1_cfg_7.5_topk_16384.jpg
ADDED
|
Git LFS Details
|
llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_4000/batch_2_cfg_7.5_topk_16384.jpg
ADDED
|
Git LFS Details
|
llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_4000/batch_3_cfg_7.5_topk_16384.jpg
ADDED
|
Git LFS Details
|
llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_6000/batch_0_cfg_7.5_topk_16384.jpg
ADDED
|
Git LFS Details
|
llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_6000/batch_1_cfg_7.5_topk_16384.jpg
ADDED
|
Git LFS Details
|
llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_6000/batch_2_cfg_7.5_topk_16384.jpg
ADDED
|
Git LFS Details
|
llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_6000/batch_3_cfg_7.5_topk_16384.jpg
ADDED
|
Git LFS Details
|
llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_8000/batch_0_cfg_7.5_topk_16384.jpg
ADDED
|
Git LFS Details
|
llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_8000/batch_1_cfg_7.5_topk_16384.jpg
ADDED
|
Git LFS Details
|
llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_8000/batch_2_cfg_7.5_topk_16384.jpg
ADDED
|
Git LFS Details
|
llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/checkpoints/eval_step_8000/batch_3_cfg_7.5_topk_16384.jpg
ADDED
|
Git LFS Details
|
llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_newfix_train_only_projection_i2i/014-GPT-XL/log.txt
ADDED
|
@@ -0,0 +1,1005 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
[[34m2025-03-20 19:22:49[0m] Experiment directory created at checkpoints/TWO_node_llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_noimageonly_newfix_train_all/014-GPT-XL
|
| 2 |
+
[[34m2025-03-20 19:22:49[0m] Namespace(data_path='/tmp/haozhezhao/MLLMG/jsonl_data/continueT2I_mid_flux_2M.jsonl', cloud_save_path='/tmp/haozhezhao/MLLMG/checkpoints', no_local_save=False, vq_model='VQ-16', vq_ckpt='/tmp/haozhezhao/model/llamagen_t2i/vq_ds16_t2i.pt', codebook_size=16384, codebook_embed_dim=8, gpt_model='GPT-XL', gpt_ckpt=None, gpt_type='t2i', vocab_size=16384, cls_token_num=512, dropout_p=0.1, token_dropout_p=0.1, drop_path=0.0, no_compile=False, results_dir='checkpoints/TWO_node_llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_noimageonly_newfix_train_all', dataset='ti2i', image_size=512, downsample_size=16, num_classes=1000, epochs=1, lr=0.001, weight_decay=0.05, beta1=0.9, beta2=0.95, max_grad_norm=1.0, global_batch_size=128, global_seed=0, num_workers=2, log_every=25, ckpt_every=2000, gradient_accumulation_steps=1, mixed_precision='bf16', val_data_path='/tmp/haozhezhao/MLLMG/jsonl_dir/validation_set.jsonl_mid_1k.jsonl', use_vision_tower=True, model_name_or_path='/tmp/haozhezhao/model/blip2-flan-t5-xl', image_place_holder='<image>', processor_path=None, do_eval=True, max_eval_samples=512, train_text_encoder=True, no_left_padding=False, cfg_scale=7.5, top_k=16384, temperature=0.9, top_p=1.0, eval_steps=2000, project_name='llamagen_ti2i', load_from_checkpoint='/tmp/haozhezhao/MLLMG/checkpoint/FIXed_3M_1epoch_step32000.pt', warmup=0.05, lr_decay_style='cosine', lr_decay_ratio=0.1, train_iters=500000, class_dropout_prob=0.1, with_image_only=True, image_only_rate=0.8, stage2=False, subject_driven=True, load_subject_embedding=None, reference_data_path='/tmp/haozhezhao/MLLMG/cc12m_reference.jsonl', multimodal_encoder='llava', do_recovery=False, no_replace=False, resume=False, dreambench_eval=False, find_unused_parameters=True, load_visual_encoder=False, continue_stage1=False, replace_subject=False, train_all=False, save_total_limit=1, load_language_projection='/tmp/haozhezhao/MLLMG/llava-v1.5-flant5_fixed-pretrain/mm_projector.bin', mm_vision_tower='openai/clip-vit-large-patch14', load_fixed_llamagen=True, unfreeze_output=False, i2i=True, rank=0, world_size=8, gpu=0, dist_url='env://', distributed=True, dist_backend='nccl')
|
| 3 |
+
[[34m2025-03-20 19:22:49[0m] Starting rank=0, seed=0, world_size=8.
|
| 4 |
+
[[34m2025-03-20 19:22:49[0m] text_config is None. Initializing the text config with default values (`OPTConfig`).
|
| 5 |
+
[[34m2025-03-20 19:23:56[0m] GPT Parameters: 2,310,680,832
|
| 6 |
+
[[34m2025-03-20 19:23:56[0m] num decayed parameter tensors: 356, with 2,007,303,168 parameters
|
| 7 |
+
[[34m2025-03-20 19:23:56[0m] num non-decayed parameter tensors: 124, with 197,888 parameters
|
| 8 |
+
[[34m2025-03-20 19:23:56[0m] using fused AdamW: True
|
| 9 |
+
[[34m2025-03-20 19:24:11[0m] Dataset contains 3,018,117 images
|
| 10 |
+
[[34m2025-03-20 19:24:11[0m] Train iters 23579 , warmup 1178.95, len of loader 23579
|
| 11 |
+
[[34m2025-03-20 19:24:20[0m] compiling the model... (may take several minutes)
|
| 12 |
+
[[34m2025-03-20 19:24:21[0m] freeze the vit
|
| 13 |
+
[[34m2025-03-20 19:24:21[0m] set text encoder as trainable
|
| 14 |
+
[[34m2025-03-20 19:24:21[0m] set vision model freeze
|
| 15 |
+
[[34m2025-03-20 19:24:21[0m] ***** total param is 2310680832 *****
|
| 16 |
+
[[34m2025-03-20 19:24:21[0m] ***** total trained param is 31526912 *****
|
| 17 |
+
[[34m2025-03-20 19:24:26[0m] Training for 1 epochs...
|
| 18 |
+
[[34m2025-03-20 19:24:26[0m] Beginning epoch 0...
|
| 19 |
+
[[34m2025-03-20 19:29:42[0m] (step=0000025) Train Loss: 6.5367, Train Steps/Sec: 0.08
|
| 20 |
+
[[34m2025-03-20 19:30:17[0m] (step=0000050) Train Loss: 6.4791, Train Steps/Sec: 0.71
|
| 21 |
+
[[34m2025-03-20 19:30:53[0m] (step=0000075) Train Loss: 6.4914, Train Steps/Sec: 0.71
|
| 22 |
+
[[34m2025-03-20 19:31:30[0m] (step=0000100) Train Loss: 6.4454, Train Steps/Sec: 0.67
|
| 23 |
+
[[34m2025-03-20 19:32:05[0m] (step=0000125) Train Loss: 6.4746, Train Steps/Sec: 0.71
|
| 24 |
+
[[34m2025-03-20 19:32:41[0m] (step=0000150) Train Loss: 6.4932, Train Steps/Sec: 0.70
|
| 25 |
+
[[34m2025-03-20 19:33:16[0m] (step=0000175) Train Loss: 6.4705, Train Steps/Sec: 0.71
|
| 26 |
+
[[34m2025-03-20 19:33:51[0m] (step=0000200) Train Loss: 6.4672, Train Steps/Sec: 0.71
|
| 27 |
+
[[34m2025-03-20 19:34:26[0m] (step=0000225) Train Loss: 6.4509, Train Steps/Sec: 0.71
|
| 28 |
+
[[34m2025-03-20 19:35:02[0m] (step=0000250) Train Loss: 6.4970, Train Steps/Sec: 0.71
|
| 29 |
+
[[34m2025-03-20 19:35:38[0m] (step=0000275) Train Loss: 6.4752, Train Steps/Sec: 0.68
|
| 30 |
+
[[34m2025-03-20 19:36:16[0m] (step=0000300) Train Loss: 6.4615, Train Steps/Sec: 0.66
|
| 31 |
+
[[34m2025-03-20 19:36:53[0m] (step=0000325) Train Loss: 6.4741, Train Steps/Sec: 0.69
|
| 32 |
+
[[34m2025-03-20 19:37:28[0m] (step=0000350) Train Loss: 6.4717, Train Steps/Sec: 0.71
|
| 33 |
+
[[34m2025-03-20 19:38:03[0m] (step=0000375) Train Loss: 6.4472, Train Steps/Sec: 0.71
|
| 34 |
+
[[34m2025-03-20 19:38:38[0m] (step=0000400) Train Loss: 6.4563, Train Steps/Sec: 0.71
|
| 35 |
+
[[34m2025-03-20 19:39:13[0m] (step=0000425) Train Loss: 6.4749, Train Steps/Sec: 0.71
|
| 36 |
+
[[34m2025-03-20 19:39:48[0m] (step=0000450) Train Loss: 6.4726, Train Steps/Sec: 0.71
|
| 37 |
+
[[34m2025-03-20 19:40:23[0m] (step=0000475) Train Loss: 6.4782, Train Steps/Sec: 0.71
|
| 38 |
+
[[34m2025-03-20 19:40:58[0m] (step=0000500) Train Loss: 6.4592, Train Steps/Sec: 0.71
|
| 39 |
+
[[34m2025-03-20 19:41:34[0m] (step=0000525) Train Loss: 6.4710, Train Steps/Sec: 0.71
|
| 40 |
+
[[34m2025-03-20 19:42:09[0m] (step=0000550) Train Loss: 6.4370, Train Steps/Sec: 0.71
|
| 41 |
+
[[34m2025-03-20 19:42:45[0m] (step=0000575) Train Loss: 6.4967, Train Steps/Sec: 0.69
|
| 42 |
+
[[34m2025-03-20 19:43:20[0m] (step=0000600) Train Loss: 6.4770, Train Steps/Sec: 0.71
|
| 43 |
+
[[34m2025-03-20 19:43:55[0m] (step=0000625) Train Loss: 6.4500, Train Steps/Sec: 0.71
|
| 44 |
+
[[34m2025-03-20 19:44:30[0m] (step=0000650) Train Loss: 6.4510, Train Steps/Sec: 0.71
|
| 45 |
+
[[34m2025-03-20 19:45:05[0m] (step=0000675) Train Loss: 6.4788, Train Steps/Sec: 0.71
|
| 46 |
+
[[34m2025-03-20 19:45:40[0m] (step=0000700) Train Loss: 6.4375, Train Steps/Sec: 0.71
|
| 47 |
+
[[34m2025-03-20 19:46:16[0m] (step=0000725) Train Loss: 6.4401, Train Steps/Sec: 0.71
|
| 48 |
+
[[34m2025-03-20 19:46:51[0m] (step=0000750) Train Loss: 6.4351, Train Steps/Sec: 0.71
|
| 49 |
+
[[34m2025-03-20 19:47:26[0m] (step=0000775) Train Loss: 6.4978, Train Steps/Sec: 0.71
|
| 50 |
+
[[34m2025-03-20 19:48:01[0m] (step=0000800) Train Loss: 6.4700, Train Steps/Sec: 0.71
|
| 51 |
+
[[34m2025-03-20 19:48:36[0m] (step=0000825) Train Loss: 6.4854, Train Steps/Sec: 0.71
|
| 52 |
+
[[34m2025-03-20 19:49:11[0m] (step=0000850) Train Loss: 6.4647, Train Steps/Sec: 0.71
|
| 53 |
+
[[34m2025-03-20 19:49:46[0m] (step=0000875) Train Loss: 6.4619, Train Steps/Sec: 0.71
|
| 54 |
+
[[34m2025-03-20 19:50:21[0m] (step=0000900) Train Loss: 6.4654, Train Steps/Sec: 0.71
|
| 55 |
+
[[34m2025-03-20 19:50:59[0m] (step=0000925) Train Loss: 6.4534, Train Steps/Sec: 0.67
|
| 56 |
+
[[34m2025-03-20 19:51:34[0m] (step=0000950) Train Loss: 6.4779, Train Steps/Sec: 0.71
|
| 57 |
+
[[34m2025-03-20 19:52:09[0m] (step=0000975) Train Loss: 6.4151, Train Steps/Sec: 0.71
|
| 58 |
+
[[34m2025-03-20 19:52:44[0m] (step=0001000) Train Loss: 6.4490, Train Steps/Sec: 0.71
|
| 59 |
+
[[34m2025-03-20 19:53:19[0m] (step=0001025) Train Loss: 6.5045, Train Steps/Sec: 0.71
|
| 60 |
+
[[34m2025-03-20 19:53:54[0m] (step=0001050) Train Loss: 6.4553, Train Steps/Sec: 0.71
|
| 61 |
+
[[34m2025-03-20 19:54:29[0m] (step=0001075) Train Loss: 6.4739, Train Steps/Sec: 0.71
|
| 62 |
+
[[34m2025-03-20 19:55:04[0m] (step=0001100) Train Loss: 6.4731, Train Steps/Sec: 0.71
|
| 63 |
+
[[34m2025-03-20 19:55:40[0m] (step=0001125) Train Loss: 6.4477, Train Steps/Sec: 0.71
|
| 64 |
+
[[34m2025-03-20 19:56:15[0m] (step=0001150) Train Loss: 6.4612, Train Steps/Sec: 0.71
|
| 65 |
+
[[34m2025-03-20 19:56:50[0m] (step=0001175) Train Loss: 6.4759, Train Steps/Sec: 0.71
|
| 66 |
+
[[34m2025-03-20 19:57:25[0m] (step=0001200) Train Loss: 6.4931, Train Steps/Sec: 0.71
|
| 67 |
+
[[34m2025-03-20 19:58:00[0m] (step=0001225) Train Loss: 6.4623, Train Steps/Sec: 0.71
|
| 68 |
+
[[34m2025-03-20 19:58:36[0m] (step=0001250) Train Loss: 6.4752, Train Steps/Sec: 0.71
|
| 69 |
+
[[34m2025-03-20 19:59:11[0m] (step=0001275) Train Loss: 6.4567, Train Steps/Sec: 0.71
|
| 70 |
+
[[34m2025-03-20 19:59:46[0m] (step=0001300) Train Loss: 6.4723, Train Steps/Sec: 0.71
|
| 71 |
+
[[34m2025-03-20 20:00:21[0m] (step=0001325) Train Loss: 6.4607, Train Steps/Sec: 0.71
|
| 72 |
+
[[34m2025-03-20 20:00:56[0m] (step=0001350) Train Loss: 6.4306, Train Steps/Sec: 0.71
|
| 73 |
+
[[34m2025-03-20 20:01:31[0m] (step=0001375) Train Loss: 6.4507, Train Steps/Sec: 0.71
|
| 74 |
+
[[34m2025-03-20 20:02:07[0m] (step=0001400) Train Loss: 6.4539, Train Steps/Sec: 0.71
|
| 75 |
+
[[34m2025-03-20 20:02:42[0m] (step=0001425) Train Loss: 6.4632, Train Steps/Sec: 0.71
|
| 76 |
+
[[34m2025-03-20 20:03:17[0m] (step=0001450) Train Loss: 6.4670, Train Steps/Sec: 0.71
|
| 77 |
+
[[34m2025-03-20 20:03:52[0m] (step=0001475) Train Loss: 6.4473, Train Steps/Sec: 0.71
|
| 78 |
+
[[34m2025-03-20 20:04:27[0m] (step=0001500) Train Loss: 6.4782, Train Steps/Sec: 0.71
|
| 79 |
+
[[34m2025-03-20 20:05:02[0m] (step=0001525) Train Loss: 6.4947, Train Steps/Sec: 0.71
|
| 80 |
+
[[34m2025-03-20 20:05:37[0m] (step=0001550) Train Loss: 6.4573, Train Steps/Sec: 0.71
|
| 81 |
+
[[34m2025-03-20 20:06:12[0m] (step=0001575) Train Loss: 6.4487, Train Steps/Sec: 0.71
|
| 82 |
+
[[34m2025-03-20 20:06:47[0m] (step=0001600) Train Loss: 6.4678, Train Steps/Sec: 0.71
|
| 83 |
+
[[34m2025-03-20 20:07:22[0m] (step=0001625) Train Loss: 6.4394, Train Steps/Sec: 0.71
|
| 84 |
+
[[34m2025-03-20 20:07:57[0m] (step=0001650) Train Loss: 6.4461, Train Steps/Sec: 0.71
|
| 85 |
+
[[34m2025-03-20 20:08:33[0m] (step=0001675) Train Loss: 6.4687, Train Steps/Sec: 0.71
|
| 86 |
+
[[34m2025-03-20 20:09:08[0m] (step=0001700) Train Loss: 6.4670, Train Steps/Sec: 0.71
|
| 87 |
+
[[34m2025-03-20 20:09:43[0m] (step=0001725) Train Loss: 6.4667, Train Steps/Sec: 0.71
|
| 88 |
+
[[34m2025-03-20 20:10:18[0m] (step=0001750) Train Loss: 6.4239, Train Steps/Sec: 0.71
|
| 89 |
+
[[34m2025-03-20 20:10:53[0m] (step=0001775) Train Loss: 6.4694, Train Steps/Sec: 0.71
|
| 90 |
+
[[34m2025-03-20 20:11:28[0m] (step=0001800) Train Loss: 6.4433, Train Steps/Sec: 0.71
|
| 91 |
+
[[34m2025-03-20 20:12:03[0m] (step=0001825) Train Loss: 6.4765, Train Steps/Sec: 0.71
|
| 92 |
+
[[34m2025-03-20 20:12:38[0m] (step=0001850) Train Loss: 6.4625, Train Steps/Sec: 0.71
|
| 93 |
+
[[34m2025-03-20 20:13:13[0m] (step=0001875) Train Loss: 6.4658, Train Steps/Sec: 0.71
|
| 94 |
+
[[34m2025-03-20 20:13:48[0m] (step=0001900) Train Loss: 6.4308, Train Steps/Sec: 0.71
|
| 95 |
+
[[34m2025-03-20 20:14:24[0m] (step=0001925) Train Loss: 6.4613, Train Steps/Sec: 0.71
|
| 96 |
+
[[34m2025-03-20 20:14:59[0m] (step=0001950) Train Loss: 6.4633, Train Steps/Sec: 0.71
|
| 97 |
+
[[34m2025-03-20 20:15:34[0m] (step=0001975) Train Loss: 6.4617, Train Steps/Sec: 0.71
|
| 98 |
+
[[34m2025-03-20 20:16:09[0m] (step=0002000) Train Loss: 6.4607, Train Steps/Sec: 0.71
|
| 99 |
+
[[34m2025-03-20 20:16:09[0m] text_config is None. Initializing the text config with default values (`OPTConfig`).
|
| 100 |
+
[[34m2025-03-20 20:22:12[0m] Finish Eval in 2000 steps...
|
| 101 |
+
[[34m2025-03-20 20:22:18[0m] Saved checkpoint to checkpoints/TWO_node_llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_noimageonly_newfix_train_all/014-GPT-XL/checkpoints/0002000.pt
|
| 102 |
+
[[34m2025-03-20 20:22:54[0m] (step=0002025) Train Loss: 6.4400, Train Steps/Sec: 0.06
|
| 103 |
+
[[34m2025-03-20 20:23:29[0m] (step=0002050) Train Loss: 6.4530, Train Steps/Sec: 0.71
|
| 104 |
+
[[34m2025-03-20 20:24:04[0m] (step=0002075) Train Loss: 6.4868, Train Steps/Sec: 0.71
|
| 105 |
+
[[34m2025-03-20 20:24:39[0m] (step=0002100) Train Loss: 6.4806, Train Steps/Sec: 0.71
|
| 106 |
+
[[34m2025-03-20 20:25:14[0m] (step=0002125) Train Loss: 6.4499, Train Steps/Sec: 0.71
|
| 107 |
+
[[34m2025-03-20 20:25:49[0m] (step=0002150) Train Loss: 6.4153, Train Steps/Sec: 0.71
|
| 108 |
+
[[34m2025-03-20 20:26:24[0m] (step=0002175) Train Loss: 6.4856, Train Steps/Sec: 0.71
|
| 109 |
+
[[34m2025-03-20 20:26:59[0m] (step=0002200) Train Loss: 6.4567, Train Steps/Sec: 0.71
|
| 110 |
+
[[34m2025-03-20 20:27:34[0m] (step=0002225) Train Loss: 6.4746, Train Steps/Sec: 0.71
|
| 111 |
+
[[34m2025-03-20 20:28:09[0m] (step=0002250) Train Loss: 6.4400, Train Steps/Sec: 0.71
|
| 112 |
+
[[34m2025-03-20 20:28:44[0m] (step=0002275) Train Loss: 6.4582, Train Steps/Sec: 0.71
|
| 113 |
+
[[34m2025-03-20 20:29:19[0m] (step=0002300) Train Loss: 6.4678, Train Steps/Sec: 0.71
|
| 114 |
+
[[34m2025-03-20 20:29:54[0m] (step=0002325) Train Loss: 6.4556, Train Steps/Sec: 0.71
|
| 115 |
+
[[34m2025-03-20 20:30:29[0m] (step=0002350) Train Loss: 6.4412, Train Steps/Sec: 0.71
|
| 116 |
+
[[34m2025-03-20 20:31:04[0m] (step=0002375) Train Loss: 6.4652, Train Steps/Sec: 0.71
|
| 117 |
+
[[34m2025-03-20 20:31:39[0m] (step=0002400) Train Loss: 6.4301, Train Steps/Sec: 0.71
|
| 118 |
+
[[34m2025-03-20 20:32:14[0m] (step=0002425) Train Loss: 6.4598, Train Steps/Sec: 0.71
|
| 119 |
+
[[34m2025-03-20 20:32:49[0m] (step=0002450) Train Loss: 6.4614, Train Steps/Sec: 0.71
|
| 120 |
+
[[34m2025-03-20 20:33:24[0m] (step=0002475) Train Loss: 6.4573, Train Steps/Sec: 0.71
|
| 121 |
+
[[34m2025-03-20 20:33:59[0m] (step=0002500) Train Loss: 6.4475, Train Steps/Sec: 0.71
|
| 122 |
+
[[34m2025-03-20 20:34:35[0m] (step=0002525) Train Loss: 6.4526, Train Steps/Sec: 0.71
|
| 123 |
+
[[34m2025-03-20 20:35:10[0m] (step=0002550) Train Loss: 6.4324, Train Steps/Sec: 0.71
|
| 124 |
+
[[34m2025-03-20 20:35:45[0m] (step=0002575) Train Loss: 6.4776, Train Steps/Sec: 0.71
|
| 125 |
+
[[34m2025-03-20 20:36:20[0m] (step=0002600) Train Loss: 6.4640, Train Steps/Sec: 0.71
|
| 126 |
+
[[34m2025-03-20 20:36:55[0m] (step=0002625) Train Loss: 6.4627, Train Steps/Sec: 0.71
|
| 127 |
+
[[34m2025-03-20 20:37:31[0m] (step=0002650) Train Loss: 6.4719, Train Steps/Sec: 0.69
|
| 128 |
+
[[34m2025-03-20 20:38:08[0m] (step=0002675) Train Loss: 6.4535, Train Steps/Sec: 0.68
|
| 129 |
+
[[34m2025-03-20 20:38:44[0m] (step=0002700) Train Loss: 6.4506, Train Steps/Sec: 0.69
|
| 130 |
+
[[34m2025-03-20 20:39:19[0m] (step=0002725) Train Loss: 6.4452, Train Steps/Sec: 0.71
|
| 131 |
+
[[34m2025-03-20 20:39:55[0m] (step=0002750) Train Loss: 6.4446, Train Steps/Sec: 0.71
|
| 132 |
+
[[34m2025-03-20 20:40:30[0m] (step=0002775) Train Loss: 6.3894, Train Steps/Sec: 0.71
|
| 133 |
+
[[34m2025-03-20 20:41:05[0m] (step=0002800) Train Loss: 6.4426, Train Steps/Sec: 0.71
|
| 134 |
+
[[34m2025-03-20 20:41:40[0m] (step=0002825) Train Loss: 6.4355, Train Steps/Sec: 0.71
|
| 135 |
+
[[34m2025-03-20 20:42:15[0m] (step=0002850) Train Loss: 6.4673, Train Steps/Sec: 0.71
|
| 136 |
+
[[34m2025-03-20 20:42:50[0m] (step=0002875) Train Loss: 6.4423, Train Steps/Sec: 0.71
|
| 137 |
+
[[34m2025-03-20 20:43:25[0m] (step=0002900) Train Loss: 6.4667, Train Steps/Sec: 0.71
|
| 138 |
+
[[34m2025-03-20 20:44:00[0m] (step=0002925) Train Loss: 6.4614, Train Steps/Sec: 0.71
|
| 139 |
+
[[34m2025-03-20 20:44:35[0m] (step=0002950) Train Loss: 6.4632, Train Steps/Sec: 0.71
|
| 140 |
+
[[34m2025-03-20 20:45:10[0m] (step=0002975) Train Loss: 6.4892, Train Steps/Sec: 0.71
|
| 141 |
+
[[34m2025-03-20 20:45:46[0m] (step=0003000) Train Loss: 6.4556, Train Steps/Sec: 0.71
|
| 142 |
+
[[34m2025-03-20 20:46:21[0m] (step=0003025) Train Loss: 6.4151, Train Steps/Sec: 0.71
|
| 143 |
+
[[34m2025-03-20 20:46:56[0m] (step=0003050) Train Loss: 6.4231, Train Steps/Sec: 0.71
|
| 144 |
+
[[34m2025-03-20 20:47:31[0m] (step=0003075) Train Loss: 6.4647, Train Steps/Sec: 0.71
|
| 145 |
+
[[34m2025-03-20 20:48:08[0m] (step=0003100) Train Loss: 6.4506, Train Steps/Sec: 0.67
|
| 146 |
+
[[34m2025-03-20 20:48:44[0m] (step=0003125) Train Loss: 6.4210, Train Steps/Sec: 0.71
|
| 147 |
+
[[34m2025-03-20 20:49:20[0m] (step=0003150) Train Loss: 6.4596, Train Steps/Sec: 0.69
|
| 148 |
+
[[34m2025-03-20 20:49:56[0m] (step=0003175) Train Loss: 6.4687, Train Steps/Sec: 0.69
|
| 149 |
+
[[34m2025-03-20 20:50:31[0m] (step=0003200) Train Loss: 6.4390, Train Steps/Sec: 0.71
|
| 150 |
+
[[34m2025-03-20 20:51:06[0m] (step=0003225) Train Loss: 6.4429, Train Steps/Sec: 0.71
|
| 151 |
+
[[34m2025-03-20 20:51:41[0m] (step=0003250) Train Loss: 6.4488, Train Steps/Sec: 0.71
|
| 152 |
+
[[34m2025-03-20 20:52:16[0m] (step=0003275) Train Loss: 6.4548, Train Steps/Sec: 0.71
|
| 153 |
+
[[34m2025-03-20 20:52:51[0m] (step=0003300) Train Loss: 6.4480, Train Steps/Sec: 0.71
|
| 154 |
+
[[34m2025-03-20 20:53:26[0m] (step=0003325) Train Loss: 6.4651, Train Steps/Sec: 0.71
|
| 155 |
+
[[34m2025-03-20 20:54:01[0m] (step=0003350) Train Loss: 6.4580, Train Steps/Sec: 0.71
|
| 156 |
+
[[34m2025-03-20 20:54:36[0m] (step=0003375) Train Loss: 6.4678, Train Steps/Sec: 0.71
|
| 157 |
+
[[34m2025-03-20 20:55:11[0m] (step=0003400) Train Loss: 6.4376, Train Steps/Sec: 0.71
|
| 158 |
+
[[34m2025-03-20 20:55:47[0m] (step=0003425) Train Loss: 6.4539, Train Steps/Sec: 0.71
|
| 159 |
+
[[34m2025-03-20 20:56:22[0m] (step=0003450) Train Loss: 6.4523, Train Steps/Sec: 0.71
|
| 160 |
+
[[34m2025-03-20 20:56:57[0m] (step=0003475) Train Loss: 6.4559, Train Steps/Sec: 0.71
|
| 161 |
+
[[34m2025-03-20 20:57:32[0m] (step=0003500) Train Loss: 6.4680, Train Steps/Sec: 0.71
|
| 162 |
+
[[34m2025-03-20 20:58:07[0m] (step=0003525) Train Loss: 6.4559, Train Steps/Sec: 0.71
|
| 163 |
+
[[34m2025-03-20 20:58:42[0m] (step=0003550) Train Loss: 6.4577, Train Steps/Sec: 0.71
|
| 164 |
+
[[34m2025-03-20 20:59:17[0m] (step=0003575) Train Loss: 6.4566, Train Steps/Sec: 0.71
|
| 165 |
+
[[34m2025-03-20 20:59:52[0m] (step=0003600) Train Loss: 6.4444, Train Steps/Sec: 0.71
|
| 166 |
+
[[34m2025-03-20 21:00:27[0m] (step=0003625) Train Loss: 6.4437, Train Steps/Sec: 0.71
|
| 167 |
+
[[34m2025-03-20 21:01:02[0m] (step=0003650) Train Loss: 6.4669, Train Steps/Sec: 0.71
|
| 168 |
+
[[34m2025-03-20 21:01:37[0m] (step=0003675) Train Loss: 6.4088, Train Steps/Sec: 0.71
|
| 169 |
+
[[34m2025-03-20 21:02:12[0m] (step=0003700) Train Loss: 6.4651, Train Steps/Sec: 0.71
|
| 170 |
+
[[34m2025-03-20 21:02:48[0m] (step=0003725) Train Loss: 6.4487, Train Steps/Sec: 0.71
|
| 171 |
+
[[34m2025-03-20 21:03:23[0m] (step=0003750) Train Loss: 6.4143, Train Steps/Sec: 0.71
|
| 172 |
+
[[34m2025-03-20 21:03:58[0m] (step=0003775) Train Loss: 6.4241, Train Steps/Sec: 0.71
|
| 173 |
+
[[34m2025-03-20 21:04:33[0m] (step=0003800) Train Loss: 6.4724, Train Steps/Sec: 0.71
|
| 174 |
+
[[34m2025-03-20 21:05:08[0m] (step=0003825) Train Loss: 6.4061, Train Steps/Sec: 0.71
|
| 175 |
+
[[34m2025-03-20 21:05:43[0m] (step=0003850) Train Loss: 6.4635, Train Steps/Sec: 0.71
|
| 176 |
+
[[34m2025-03-20 21:06:18[0m] (step=0003875) Train Loss: 6.4552, Train Steps/Sec: 0.71
|
| 177 |
+
[[34m2025-03-20 21:06:53[0m] (step=0003900) Train Loss: 6.4737, Train Steps/Sec: 0.71
|
| 178 |
+
[[34m2025-03-20 21:07:28[0m] (step=0003925) Train Loss: 6.4255, Train Steps/Sec: 0.71
|
| 179 |
+
[[34m2025-03-20 21:08:03[0m] (step=0003950) Train Loss: 6.4468, Train Steps/Sec: 0.71
|
| 180 |
+
[[34m2025-03-20 21:08:38[0m] (step=0003975) Train Loss: 6.4338, Train Steps/Sec: 0.71
|
| 181 |
+
[[34m2025-03-20 21:09:13[0m] (step=0004000) Train Loss: 6.4610, Train Steps/Sec: 0.71
|
| 182 |
+
[[34m2025-03-20 21:09:13[0m] text_config is None. Initializing the text config with default values (`OPTConfig`).
|
| 183 |
+
[[34m2025-03-20 21:15:15[0m] Finish Eval in 4000 steps...
|
| 184 |
+
[[34m2025-03-20 21:15:22[0m] Saved checkpoint to checkpoints/TWO_node_llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_noimageonly_newfix_train_all/014-GPT-XL/checkpoints/0004000.pt
|
| 185 |
+
[[34m2025-03-20 21:15:23[0m] Removed old checkpoint: checkpoints/TWO_node_llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_noimageonly_newfix_train_all/014-GPT-XL/checkpoints/0002000.pt
|
| 186 |
+
[[34m2025-03-20 21:15:58[0m] (step=0004025) Train Loss: 6.4496, Train Steps/Sec: 0.06
|
| 187 |
+
[[34m2025-03-20 21:16:33[0m] (step=0004050) Train Loss: 6.4568, Train Steps/Sec: 0.71
|
| 188 |
+
[[34m2025-03-20 21:17:08[0m] (step=0004075) Train Loss: 6.4453, Train Steps/Sec: 0.71
|
| 189 |
+
[[34m2025-03-20 21:17:43[0m] (step=0004100) Train Loss: 6.4399, Train Steps/Sec: 0.71
|
| 190 |
+
[[34m2025-03-20 21:18:18[0m] (step=0004125) Train Loss: 6.4662, Train Steps/Sec: 0.71
|
| 191 |
+
[[34m2025-03-20 21:18:53[0m] (step=0004150) Train Loss: 6.4290, Train Steps/Sec: 0.71
|
| 192 |
+
[[34m2025-03-20 21:19:28[0m] (step=0004175) Train Loss: 6.4176, Train Steps/Sec: 0.71
|
| 193 |
+
[[34m2025-03-20 21:20:03[0m] (step=0004200) Train Loss: 6.4536, Train Steps/Sec: 0.71
|
| 194 |
+
[[34m2025-03-20 21:20:38[0m] (step=0004225) Train Loss: 6.4471, Train Steps/Sec: 0.71
|
| 195 |
+
[[34m2025-03-20 21:21:13[0m] (step=0004250) Train Loss: 6.4603, Train Steps/Sec: 0.71
|
| 196 |
+
[[34m2025-03-20 21:21:48[0m] (step=0004275) Train Loss: 6.4566, Train Steps/Sec: 0.71
|
| 197 |
+
[[34m2025-03-20 21:22:23[0m] (step=0004300) Train Loss: 6.4498, Train Steps/Sec: 0.71
|
| 198 |
+
[[34m2025-03-20 21:22:58[0m] (step=0004325) Train Loss: 6.4612, Train Steps/Sec: 0.71
|
| 199 |
+
[[34m2025-03-20 21:23:33[0m] (step=0004350) Train Loss: 6.4301, Train Steps/Sec: 0.71
|
| 200 |
+
[[34m2025-03-20 21:24:08[0m] (step=0004375) Train Loss: 6.4330, Train Steps/Sec: 0.71
|
| 201 |
+
[[34m2025-03-20 21:24:44[0m] (step=0004400) Train Loss: 6.4556, Train Steps/Sec: 0.69
|
| 202 |
+
[[34m2025-03-20 21:25:19[0m] (step=0004425) Train Loss: 6.4435, Train Steps/Sec: 0.71
|
| 203 |
+
[[34m2025-03-20 21:25:55[0m] (step=0004450) Train Loss: 6.4322, Train Steps/Sec: 0.71
|
| 204 |
+
[[34m2025-03-20 21:26:30[0m] (step=0004475) Train Loss: 6.4370, Train Steps/Sec: 0.71
|
| 205 |
+
[[34m2025-03-20 21:27:05[0m] (step=0004500) Train Loss: 6.4242, Train Steps/Sec: 0.71
|
| 206 |
+
[[34m2025-03-20 21:27:40[0m] (step=0004525) Train Loss: 6.4530, Train Steps/Sec: 0.71
|
| 207 |
+
[[34m2025-03-20 21:28:15[0m] (step=0004550) Train Loss: 6.4453, Train Steps/Sec: 0.71
|
| 208 |
+
[[34m2025-03-20 21:28:50[0m] (step=0004575) Train Loss: 6.4271, Train Steps/Sec: 0.71
|
| 209 |
+
[[34m2025-03-20 21:29:25[0m] (step=0004600) Train Loss: 6.4563, Train Steps/Sec: 0.71
|
| 210 |
+
[[34m2025-03-20 21:30:00[0m] (step=0004625) Train Loss: 6.4248, Train Steps/Sec: 0.71
|
| 211 |
+
[[34m2025-03-20 21:30:35[0m] (step=0004650) Train Loss: 6.4322, Train Steps/Sec: 0.71
|
| 212 |
+
[[34m2025-03-20 21:31:10[0m] (step=0004675) Train Loss: 6.4544, Train Steps/Sec: 0.71
|
| 213 |
+
[[34m2025-03-20 21:31:45[0m] (step=0004700) Train Loss: 6.4524, Train Steps/Sec: 0.71
|
| 214 |
+
[[34m2025-03-20 21:32:20[0m] (step=0004725) Train Loss: 6.4633, Train Steps/Sec: 0.71
|
| 215 |
+
[[34m2025-03-20 21:32:55[0m] (step=0004750) Train Loss: 6.4623, Train Steps/Sec: 0.71
|
| 216 |
+
[[34m2025-03-20 21:33:30[0m] (step=0004775) Train Loss: 6.4103, Train Steps/Sec: 0.71
|
| 217 |
+
[[34m2025-03-20 21:34:05[0m] (step=0004800) Train Loss: 6.4513, Train Steps/Sec: 0.71
|
| 218 |
+
[[34m2025-03-20 21:34:41[0m] (step=0004825) Train Loss: 6.4261, Train Steps/Sec: 0.69
|
| 219 |
+
[[34m2025-03-20 21:35:16[0m] (step=0004850) Train Loss: 6.4622, Train Steps/Sec: 0.71
|
| 220 |
+
[[34m2025-03-20 21:35:51[0m] (step=0004875) Train Loss: 6.4293, Train Steps/Sec: 0.71
|
| 221 |
+
[[34m2025-03-20 21:36:28[0m] (step=0004900) Train Loss: 6.4654, Train Steps/Sec: 0.69
|
| 222 |
+
[[34m2025-03-20 21:37:04[0m] (step=0004925) Train Loss: 6.4551, Train Steps/Sec: 0.68
|
| 223 |
+
[[34m2025-03-20 21:37:39[0m] (step=0004950) Train Loss: 6.4406, Train Steps/Sec: 0.71
|
| 224 |
+
[[34m2025-03-20 21:38:14[0m] (step=0004975) Train Loss: 6.4247, Train Steps/Sec: 0.71
|
| 225 |
+
[[34m2025-03-20 21:38:50[0m] (step=0005000) Train Loss: 6.4201, Train Steps/Sec: 0.71
|
| 226 |
+
[[34m2025-03-20 21:39:25[0m] (step=0005025) Train Loss: 6.4269, Train Steps/Sec: 0.71
|
| 227 |
+
[[34m2025-03-20 21:40:00[0m] (step=0005050) Train Loss: 6.4321, Train Steps/Sec: 0.71
|
| 228 |
+
[[34m2025-03-20 21:40:35[0m] (step=0005075) Train Loss: 6.4306, Train Steps/Sec: 0.71
|
| 229 |
+
[[34m2025-03-20 21:41:10[0m] (step=0005100) Train Loss: 6.3922, Train Steps/Sec: 0.71
|
| 230 |
+
[[34m2025-03-20 21:41:45[0m] (step=0005125) Train Loss: 6.4273, Train Steps/Sec: 0.71
|
| 231 |
+
[[34m2025-03-20 21:42:20[0m] (step=0005150) Train Loss: 6.4445, Train Steps/Sec: 0.71
|
| 232 |
+
[[34m2025-03-20 21:42:55[0m] (step=0005175) Train Loss: 6.4266, Train Steps/Sec: 0.71
|
| 233 |
+
[[34m2025-03-20 21:43:30[0m] (step=0005200) Train Loss: 6.4186, Train Steps/Sec: 0.71
|
| 234 |
+
[[34m2025-03-20 21:44:05[0m] (step=0005225) Train Loss: 6.4267, Train Steps/Sec: 0.71
|
| 235 |
+
[[34m2025-03-20 21:44:40[0m] (step=0005250) Train Loss: 6.4370, Train Steps/Sec: 0.71
|
| 236 |
+
[[34m2025-03-20 21:45:15[0m] (step=0005275) Train Loss: 6.4609, Train Steps/Sec: 0.71
|
| 237 |
+
[[34m2025-03-20 21:45:50[0m] (step=0005300) Train Loss: 6.4411, Train Steps/Sec: 0.71
|
| 238 |
+
[[34m2025-03-20 21:46:26[0m] (step=0005325) Train Loss: 6.4380, Train Steps/Sec: 0.70
|
| 239 |
+
[[34m2025-03-20 21:47:01[0m] (step=0005350) Train Loss: 6.4442, Train Steps/Sec: 0.71
|
| 240 |
+
[[34m2025-03-20 21:47:36[0m] (step=0005375) Train Loss: 6.4004, Train Steps/Sec: 0.71
|
| 241 |
+
[[34m2025-03-20 21:48:11[0m] (step=0005400) Train Loss: 6.4014, Train Steps/Sec: 0.71
|
| 242 |
+
[[34m2025-03-20 21:48:47[0m] (step=0005425) Train Loss: 6.4412, Train Steps/Sec: 0.69
|
| 243 |
+
[[34m2025-03-20 21:49:22[0m] (step=0005450) Train Loss: 6.4229, Train Steps/Sec: 0.71
|
| 244 |
+
[[34m2025-03-20 21:49:57[0m] (step=0005475) Train Loss: 6.4590, Train Steps/Sec: 0.72
|
| 245 |
+
[[34m2025-03-20 21:50:32[0m] (step=0005500) Train Loss: 6.4389, Train Steps/Sec: 0.71
|
| 246 |
+
[[34m2025-03-20 21:51:08[0m] (step=0005525) Train Loss: 6.4199, Train Steps/Sec: 0.69
|
| 247 |
+
[[34m2025-03-20 21:51:43[0m] (step=0005550) Train Loss: 6.4435, Train Steps/Sec: 0.71
|
| 248 |
+
[[34m2025-03-20 21:52:19[0m] (step=0005575) Train Loss: 6.4235, Train Steps/Sec: 0.69
|
| 249 |
+
[[34m2025-03-20 21:52:54[0m] (step=0005600) Train Loss: 6.4272, Train Steps/Sec: 0.71
|
| 250 |
+
[[34m2025-03-20 21:53:29[0m] (step=0005625) Train Loss: 6.4050, Train Steps/Sec: 0.71
|
| 251 |
+
[[34m2025-03-20 21:54:04[0m] (step=0005650) Train Loss: 6.4400, Train Steps/Sec: 0.71
|
| 252 |
+
[[34m2025-03-20 21:54:39[0m] (step=0005675) Train Loss: 6.4548, Train Steps/Sec: 0.71
|
| 253 |
+
[[34m2025-03-20 21:55:14[0m] (step=0005700) Train Loss: 6.4660, Train Steps/Sec: 0.71
|
| 254 |
+
[[34m2025-03-20 21:55:51[0m] (step=0005725) Train Loss: 6.4438, Train Steps/Sec: 0.69
|
| 255 |
+
[[34m2025-03-20 21:56:26[0m] (step=0005750) Train Loss: 6.4537, Train Steps/Sec: 0.71
|
| 256 |
+
[[34m2025-03-20 21:57:01[0m] (step=0005775) Train Loss: 6.4174, Train Steps/Sec: 0.72
|
| 257 |
+
[[34m2025-03-20 21:57:35[0m] (step=0005800) Train Loss: 6.4310, Train Steps/Sec: 0.72
|
| 258 |
+
[[34m2025-03-20 21:58:10[0m] (step=0005825) Train Loss: 6.4228, Train Steps/Sec: 0.71
|
| 259 |
+
[[34m2025-03-20 21:58:45[0m] (step=0005850) Train Loss: 6.4421, Train Steps/Sec: 0.72
|
| 260 |
+
[[34m2025-03-20 21:59:20[0m] (step=0005875) Train Loss: 6.4129, Train Steps/Sec: 0.72
|
| 261 |
+
[[34m2025-03-20 21:59:55[0m] (step=0005900) Train Loss: 6.4568, Train Steps/Sec: 0.72
|
| 262 |
+
[[34m2025-03-20 22:00:30[0m] (step=0005925) Train Loss: 6.4281, Train Steps/Sec: 0.71
|
| 263 |
+
[[34m2025-03-20 22:01:05[0m] (step=0005950) Train Loss: 6.4194, Train Steps/Sec: 0.71
|
| 264 |
+
[[34m2025-03-20 22:01:40[0m] (step=0005975) Train Loss: 6.4256, Train Steps/Sec: 0.71
|
| 265 |
+
[[34m2025-03-20 22:02:15[0m] (step=0006000) Train Loss: 6.4127, Train Steps/Sec: 0.71
|
| 266 |
+
[[34m2025-03-20 22:02:15[0m] text_config is None. Initializing the text config with default values (`OPTConfig`).
|
| 267 |
+
[[34m2025-03-20 22:08:18[0m] Finish Eval in 6000 steps...
|
| 268 |
+
[[34m2025-03-20 22:08:25[0m] Saved checkpoint to checkpoints/TWO_node_llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_noimageonly_newfix_train_all/014-GPT-XL/checkpoints/0006000.pt
|
| 269 |
+
[[34m2025-03-20 22:08:26[0m] Removed old checkpoint: checkpoints/TWO_node_llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_noimageonly_newfix_train_all/014-GPT-XL/checkpoints/0004000.pt
|
| 270 |
+
[[34m2025-03-20 22:09:01[0m] (step=0006025) Train Loss: 6.4344, Train Steps/Sec: 0.06
|
| 271 |
+
[[34m2025-03-20 22:09:36[0m] (step=0006050) Train Loss: 6.4254, Train Steps/Sec: 0.72
|
| 272 |
+
[[34m2025-03-20 22:10:11[0m] (step=0006075) Train Loss: 6.4253, Train Steps/Sec: 0.72
|
| 273 |
+
[[34m2025-03-20 22:10:46[0m] (step=0006100) Train Loss: 6.4574, Train Steps/Sec: 0.72
|
| 274 |
+
[[34m2025-03-20 22:11:20[0m] (step=0006125) Train Loss: 6.4276, Train Steps/Sec: 0.72
|
| 275 |
+
[[34m2025-03-20 22:11:55[0m] (step=0006150) Train Loss: 6.3953, Train Steps/Sec: 0.72
|
| 276 |
+
[[34m2025-03-20 22:12:30[0m] (step=0006175) Train Loss: 6.4325, Train Steps/Sec: 0.72
|
| 277 |
+
[[34m2025-03-20 22:13:05[0m] (step=0006200) Train Loss: 6.4282, Train Steps/Sec: 0.72
|
| 278 |
+
[[34m2025-03-20 22:13:40[0m] (step=0006225) Train Loss: 6.4280, Train Steps/Sec: 0.72
|
| 279 |
+
[[34m2025-03-20 22:14:15[0m] (step=0006250) Train Loss: 6.4474, Train Steps/Sec: 0.72
|
| 280 |
+
[[34m2025-03-20 22:14:50[0m] (step=0006275) Train Loss: 6.4375, Train Steps/Sec: 0.72
|
| 281 |
+
[[34m2025-03-20 22:15:25[0m] (step=0006300) Train Loss: 6.4196, Train Steps/Sec: 0.72
|
| 282 |
+
[[34m2025-03-20 22:16:00[0m] (step=0006325) Train Loss: 6.4473, Train Steps/Sec: 0.72
|
| 283 |
+
[[34m2025-03-20 22:16:35[0m] (step=0006350) Train Loss: 6.3886, Train Steps/Sec: 0.72
|
| 284 |
+
[[34m2025-03-20 22:17:10[0m] (step=0006375) Train Loss: 6.4518, Train Steps/Sec: 0.72
|
| 285 |
+
[[34m2025-03-20 22:17:45[0m] (step=0006400) Train Loss: 6.4215, Train Steps/Sec: 0.72
|
| 286 |
+
[[34m2025-03-20 22:18:20[0m] (step=0006425) Train Loss: 6.4572, Train Steps/Sec: 0.72
|
| 287 |
+
[[34m2025-03-20 22:18:55[0m] (step=0006450) Train Loss: 6.4366, Train Steps/Sec: 0.72
|
| 288 |
+
[[34m2025-03-20 22:19:30[0m] (step=0006475) Train Loss: 6.4377, Train Steps/Sec: 0.71
|
| 289 |
+
[[34m2025-03-20 22:20:05[0m] (step=0006500) Train Loss: 6.4409, Train Steps/Sec: 0.71
|
| 290 |
+
[[34m2025-03-20 22:20:40[0m] (step=0006525) Train Loss: 6.4405, Train Steps/Sec: 0.71
|
| 291 |
+
[[34m2025-03-20 22:21:15[0m] (step=0006550) Train Loss: 6.4367, Train Steps/Sec: 0.71
|
| 292 |
+
[[34m2025-03-20 22:21:50[0m] (step=0006575) Train Loss: 6.4118, Train Steps/Sec: 0.72
|
| 293 |
+
[[34m2025-03-20 22:22:25[0m] (step=0006600) Train Loss: 6.4402, Train Steps/Sec: 0.72
|
| 294 |
+
[[34m2025-03-20 22:23:00[0m] (step=0006625) Train Loss: 6.4273, Train Steps/Sec: 0.72
|
| 295 |
+
[[34m2025-03-20 22:23:34[0m] (step=0006650) Train Loss: 6.4457, Train Steps/Sec: 0.72
|
| 296 |
+
[[34m2025-03-20 22:24:09[0m] (step=0006675) Train Loss: 6.4616, Train Steps/Sec: 0.72
|
| 297 |
+
[[34m2025-03-20 22:24:44[0m] (step=0006700) Train Loss: 6.4466, Train Steps/Sec: 0.72
|
| 298 |
+
[[34m2025-03-20 22:25:19[0m] (step=0006725) Train Loss: 6.4118, Train Steps/Sec: 0.72
|
| 299 |
+
[[34m2025-03-20 22:25:54[0m] (step=0006750) Train Loss: 6.4355, Train Steps/Sec: 0.71
|
| 300 |
+
[[34m2025-03-20 22:26:29[0m] (step=0006775) Train Loss: 6.4184, Train Steps/Sec: 0.71
|
| 301 |
+
[[34m2025-03-20 22:27:04[0m] (step=0006800) Train Loss: 6.3927, Train Steps/Sec: 0.72
|
| 302 |
+
[[34m2025-03-20 22:27:39[0m] (step=0006825) Train Loss: 6.4199, Train Steps/Sec: 0.72
|
| 303 |
+
[[34m2025-03-20 22:28:14[0m] (step=0006850) Train Loss: 6.4369, Train Steps/Sec: 0.72
|
| 304 |
+
[[34m2025-03-20 22:28:49[0m] (step=0006875) Train Loss: 6.4323, Train Steps/Sec: 0.72
|
| 305 |
+
[[34m2025-03-20 22:29:25[0m] (step=0006900) Train Loss: 6.4108, Train Steps/Sec: 0.69
|
| 306 |
+
[[34m2025-03-20 22:30:00[0m] (step=0006925) Train Loss: 6.4357, Train Steps/Sec: 0.72
|
| 307 |
+
[[34m2025-03-20 22:30:35[0m] (step=0006950) Train Loss: 6.4808, Train Steps/Sec: 0.72
|
| 308 |
+
[[34m2025-03-20 22:31:10[0m] (step=0006975) Train Loss: 6.4370, Train Steps/Sec: 0.72
|
| 309 |
+
[[34m2025-03-20 22:31:45[0m] (step=0007000) Train Loss: 6.4265, Train Steps/Sec: 0.72
|
| 310 |
+
[[34m2025-03-20 22:32:20[0m] (step=0007025) Train Loss: 6.4694, Train Steps/Sec: 0.72
|
| 311 |
+
[[34m2025-03-20 22:32:55[0m] (step=0007050) Train Loss: 6.4077, Train Steps/Sec: 0.72
|
| 312 |
+
[[34m2025-03-20 22:33:30[0m] (step=0007075) Train Loss: 6.4566, Train Steps/Sec: 0.72
|
| 313 |
+
[[34m2025-03-20 22:34:05[0m] (step=0007100) Train Loss: 6.4580, Train Steps/Sec: 0.72
|
| 314 |
+
[[34m2025-03-20 22:34:40[0m] (step=0007125) Train Loss: 6.4364, Train Steps/Sec: 0.72
|
| 315 |
+
[[34m2025-03-20 22:35:14[0m] (step=0007150) Train Loss: 6.4023, Train Steps/Sec: 0.72
|
| 316 |
+
[[34m2025-03-20 22:35:49[0m] (step=0007175) Train Loss: 6.4319, Train Steps/Sec: 0.72
|
| 317 |
+
[[34m2025-03-20 22:36:24[0m] (step=0007200) Train Loss: 6.4345, Train Steps/Sec: 0.72
|
| 318 |
+
[[34m2025-03-20 22:36:59[0m] (step=0007225) Train Loss: 6.4259, Train Steps/Sec: 0.72
|
| 319 |
+
[[34m2025-03-20 22:37:36[0m] (step=0007250) Train Loss: 6.4395, Train Steps/Sec: 0.67
|
| 320 |
+
[[34m2025-03-20 22:38:11[0m] (step=0007275) Train Loss: 6.4173, Train Steps/Sec: 0.72
|
| 321 |
+
[[34m2025-03-20 22:38:46[0m] (step=0007300) Train Loss: 6.4227, Train Steps/Sec: 0.72
|
| 322 |
+
[[34m2025-03-20 22:39:23[0m] (step=0007325) Train Loss: 6.4355, Train Steps/Sec: 0.69
|
| 323 |
+
[[34m2025-03-20 22:39:58[0m] (step=0007350) Train Loss: 6.4211, Train Steps/Sec: 0.72
|
| 324 |
+
[[34m2025-03-20 22:40:32[0m] (step=0007375) Train Loss: 6.4340, Train Steps/Sec: 0.72
|
| 325 |
+
[[34m2025-03-20 22:41:07[0m] (step=0007400) Train Loss: 6.4399, Train Steps/Sec: 0.72
|
| 326 |
+
[[34m2025-03-20 22:41:42[0m] (step=0007425) Train Loss: 6.4397, Train Steps/Sec: 0.72
|
| 327 |
+
[[34m2025-03-20 22:42:17[0m] (step=0007450) Train Loss: 6.4227, Train Steps/Sec: 0.72
|
| 328 |
+
[[34m2025-03-20 22:42:52[0m] (step=0007475) Train Loss: 6.4138, Train Steps/Sec: 0.72
|
| 329 |
+
[[34m2025-03-20 22:43:27[0m] (step=0007500) Train Loss: 6.4278, Train Steps/Sec: 0.72
|
| 330 |
+
[[34m2025-03-20 22:44:02[0m] (step=0007525) Train Loss: 6.4314, Train Steps/Sec: 0.72
|
| 331 |
+
[[34m2025-03-20 22:44:37[0m] (step=0007550) Train Loss: 6.4207, Train Steps/Sec: 0.72
|
| 332 |
+
[[34m2025-03-20 22:45:12[0m] (step=0007575) Train Loss: 6.4282, Train Steps/Sec: 0.72
|
| 333 |
+
[[34m2025-03-20 22:45:48[0m] (step=0007600) Train Loss: 6.4374, Train Steps/Sec: 0.69
|
| 334 |
+
[[34m2025-03-20 22:46:23[0m] (step=0007625) Train Loss: 6.4358, Train Steps/Sec: 0.72
|
| 335 |
+
[[34m2025-03-20 22:46:58[0m] (step=0007650) Train Loss: 6.4467, Train Steps/Sec: 0.72
|
| 336 |
+
[[34m2025-03-20 22:47:33[0m] (step=0007675) Train Loss: 6.4385, Train Steps/Sec: 0.72
|
| 337 |
+
[[34m2025-03-20 22:48:08[0m] (step=0007700) Train Loss: 6.4336, Train Steps/Sec: 0.71
|
| 338 |
+
[[34m2025-03-20 22:48:44[0m] (step=0007725) Train Loss: 6.4156, Train Steps/Sec: 0.69
|
| 339 |
+
[[34m2025-03-20 22:49:19[0m] (step=0007750) Train Loss: 6.4096, Train Steps/Sec: 0.71
|
| 340 |
+
[[34m2025-03-20 22:49:56[0m] (step=0007775) Train Loss: 6.4597, Train Steps/Sec: 0.69
|
| 341 |
+
[[34m2025-03-20 22:50:30[0m] (step=0007800) Train Loss: 6.4469, Train Steps/Sec: 0.72
|
| 342 |
+
[[34m2025-03-20 22:51:05[0m] (step=0007825) Train Loss: 6.4494, Train Steps/Sec: 0.71
|
| 343 |
+
[[34m2025-03-20 22:51:40[0m] (step=0007850) Train Loss: 6.4408, Train Steps/Sec: 0.71
|
| 344 |
+
[[34m2025-03-20 22:52:15[0m] (step=0007875) Train Loss: 6.4208, Train Steps/Sec: 0.72
|
| 345 |
+
[[34m2025-03-20 22:52:50[0m] (step=0007900) Train Loss: 6.4623, Train Steps/Sec: 0.72
|
| 346 |
+
[[34m2025-03-20 22:53:25[0m] (step=0007925) Train Loss: 6.4180, Train Steps/Sec: 0.72
|
| 347 |
+
[[34m2025-03-20 22:54:00[0m] (step=0007950) Train Loss: 6.4076, Train Steps/Sec: 0.72
|
| 348 |
+
[[34m2025-03-20 22:54:35[0m] (step=0007975) Train Loss: 6.4219, Train Steps/Sec: 0.72
|
| 349 |
+
[[34m2025-03-20 22:55:10[0m] (step=0008000) Train Loss: 6.4411, Train Steps/Sec: 0.72
|
| 350 |
+
[[34m2025-03-20 22:55:10[0m] text_config is None. Initializing the text config with default values (`OPTConfig`).
|
| 351 |
+
[[34m2025-03-20 23:01:12[0m] Finish Eval in 8000 steps...
|
| 352 |
+
[[34m2025-03-20 23:01:18[0m] Saved checkpoint to checkpoints/TWO_node_llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_noimageonly_newfix_train_all/014-GPT-XL/checkpoints/0008000.pt
|
| 353 |
+
[[34m2025-03-20 23:01:19[0m] Removed old checkpoint: checkpoints/TWO_node_llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_noimageonly_newfix_train_all/014-GPT-XL/checkpoints/0006000.pt
|
| 354 |
+
[[34m2025-03-20 23:01:54[0m] (step=0008025) Train Loss: 6.4718, Train Steps/Sec: 0.06
|
| 355 |
+
[[34m2025-03-20 23:02:29[0m] (step=0008050) Train Loss: 6.4274, Train Steps/Sec: 0.72
|
| 356 |
+
[[34m2025-03-20 23:03:04[0m] (step=0008075) Train Loss: 6.4336, Train Steps/Sec: 0.72
|
| 357 |
+
[[34m2025-03-20 23:03:39[0m] (step=0008100) Train Loss: 6.4129, Train Steps/Sec: 0.72
|
| 358 |
+
[[34m2025-03-20 23:04:14[0m] (step=0008125) Train Loss: 6.4226, Train Steps/Sec: 0.72
|
| 359 |
+
[[34m2025-03-20 23:04:49[0m] (step=0008150) Train Loss: 6.4360, Train Steps/Sec: 0.72
|
| 360 |
+
[[34m2025-03-20 23:05:24[0m] (step=0008175) Train Loss: 6.4365, Train Steps/Sec: 0.72
|
| 361 |
+
[[34m2025-03-20 23:05:59[0m] (step=0008200) Train Loss: 6.4156, Train Steps/Sec: 0.72
|
| 362 |
+
[[34m2025-03-20 23:06:34[0m] (step=0008225) Train Loss: 6.4160, Train Steps/Sec: 0.72
|
| 363 |
+
[[34m2025-03-20 23:07:09[0m] (step=0008250) Train Loss: 6.4263, Train Steps/Sec: 0.72
|
| 364 |
+
[[34m2025-03-20 23:07:43[0m] (step=0008275) Train Loss: 6.4522, Train Steps/Sec: 0.72
|
| 365 |
+
[[34m2025-03-20 23:08:19[0m] (step=0008300) Train Loss: 6.4355, Train Steps/Sec: 0.70
|
| 366 |
+
[[34m2025-03-20 23:08:55[0m] (step=0008325) Train Loss: 6.4262, Train Steps/Sec: 0.71
|
| 367 |
+
[[34m2025-03-20 23:09:29[0m] (step=0008350) Train Loss: 6.4312, Train Steps/Sec: 0.72
|
| 368 |
+
[[34m2025-03-20 23:10:04[0m] (step=0008375) Train Loss: 6.4189, Train Steps/Sec: 0.71
|
| 369 |
+
[[34m2025-03-20 23:10:39[0m] (step=0008400) Train Loss: 6.3955, Train Steps/Sec: 0.72
|
| 370 |
+
[[34m2025-03-20 23:11:14[0m] (step=0008425) Train Loss: 6.4316, Train Steps/Sec: 0.72
|
| 371 |
+
[[34m2025-03-20 23:11:49[0m] (step=0008450) Train Loss: 6.4043, Train Steps/Sec: 0.72
|
| 372 |
+
[[34m2025-03-20 23:12:24[0m] (step=0008475) Train Loss: 6.4294, Train Steps/Sec: 0.71
|
| 373 |
+
[[34m2025-03-20 23:12:59[0m] (step=0008500) Train Loss: 6.4304, Train Steps/Sec: 0.71
|
| 374 |
+
[[34m2025-03-20 23:13:34[0m] (step=0008525) Train Loss: 6.4523, Train Steps/Sec: 0.72
|
| 375 |
+
[[34m2025-03-20 23:14:09[0m] (step=0008550) Train Loss: 6.4442, Train Steps/Sec: 0.72
|
| 376 |
+
[[34m2025-03-20 23:14:44[0m] (step=0008575) Train Loss: 6.4020, Train Steps/Sec: 0.72
|
| 377 |
+
[[34m2025-03-20 23:15:19[0m] (step=0008600) Train Loss: 6.4199, Train Steps/Sec: 0.71
|
| 378 |
+
[[34m2025-03-20 23:15:54[0m] (step=0008625) Train Loss: 6.3928, Train Steps/Sec: 0.72
|
| 379 |
+
[[34m2025-03-20 23:16:29[0m] (step=0008650) Train Loss: 6.4274, Train Steps/Sec: 0.71
|
| 380 |
+
[[34m2025-03-20 23:17:04[0m] (step=0008675) Train Loss: 6.4127, Train Steps/Sec: 0.72
|
| 381 |
+
[[34m2025-03-20 23:17:39[0m] (step=0008700) Train Loss: 6.4326, Train Steps/Sec: 0.71
|
| 382 |
+
[[34m2025-03-20 23:18:14[0m] (step=0008725) Train Loss: 6.3965, Train Steps/Sec: 0.72
|
| 383 |
+
[[34m2025-03-20 23:18:49[0m] (step=0008750) Train Loss: 6.4192, Train Steps/Sec: 0.72
|
| 384 |
+
[[34m2025-03-20 23:19:24[0m] (step=0008775) Train Loss: 6.4366, Train Steps/Sec: 0.72
|
| 385 |
+
[[34m2025-03-20 23:19:59[0m] (step=0008800) Train Loss: 6.4330, Train Steps/Sec: 0.72
|
| 386 |
+
[[34m2025-03-20 23:20:34[0m] (step=0008825) Train Loss: 6.4360, Train Steps/Sec: 0.72
|
| 387 |
+
[[34m2025-03-20 23:21:09[0m] (step=0008850) Train Loss: 6.4113, Train Steps/Sec: 0.72
|
| 388 |
+
[[34m2025-03-20 23:21:44[0m] (step=0008875) Train Loss: 6.4061, Train Steps/Sec: 0.72
|
| 389 |
+
[[34m2025-03-20 23:22:19[0m] (step=0008900) Train Loss: 6.3933, Train Steps/Sec: 0.72
|
| 390 |
+
[[34m2025-03-20 23:22:54[0m] (step=0008925) Train Loss: 6.4546, Train Steps/Sec: 0.71
|
| 391 |
+
[[34m2025-03-20 23:23:29[0m] (step=0008950) Train Loss: 6.4158, Train Steps/Sec: 0.72
|
| 392 |
+
[[34m2025-03-20 23:24:03[0m] (step=0008975) Train Loss: 6.3954, Train Steps/Sec: 0.72
|
| 393 |
+
[[34m2025-03-20 23:24:40[0m] (step=0009000) Train Loss: 6.4390, Train Steps/Sec: 0.69
|
| 394 |
+
[[34m2025-03-20 23:25:15[0m] (step=0009025) Train Loss: 6.3983, Train Steps/Sec: 0.72
|
| 395 |
+
[[34m2025-03-20 23:25:50[0m] (step=0009050) Train Loss: 6.4226, Train Steps/Sec: 0.72
|
| 396 |
+
[[34m2025-03-20 23:26:24[0m] (step=0009075) Train Loss: 6.4239, Train Steps/Sec: 0.72
|
| 397 |
+
[[34m2025-03-20 23:26:59[0m] (step=0009100) Train Loss: 6.4158, Train Steps/Sec: 0.72
|
| 398 |
+
[[34m2025-03-20 23:27:34[0m] (step=0009125) Train Loss: 6.4267, Train Steps/Sec: 0.72
|
| 399 |
+
[[34m2025-03-20 23:28:09[0m] (step=0009150) Train Loss: 6.4354, Train Steps/Sec: 0.72
|
| 400 |
+
[[34m2025-03-20 23:28:44[0m] (step=0009175) Train Loss: 6.4344, Train Steps/Sec: 0.71
|
| 401 |
+
[[34m2025-03-20 23:29:19[0m] (step=0009200) Train Loss: 6.4474, Train Steps/Sec: 0.72
|
| 402 |
+
[[34m2025-03-20 23:29:54[0m] (step=0009225) Train Loss: 6.4438, Train Steps/Sec: 0.72
|
| 403 |
+
[[34m2025-03-20 23:30:29[0m] (step=0009250) Train Loss: 6.4396, Train Steps/Sec: 0.72
|
| 404 |
+
[[34m2025-03-20 23:31:04[0m] (step=0009275) Train Loss: 6.4269, Train Steps/Sec: 0.72
|
| 405 |
+
[[34m2025-03-20 23:31:39[0m] (step=0009300) Train Loss: 6.3951, Train Steps/Sec: 0.72
|
| 406 |
+
[[34m2025-03-20 23:32:15[0m] (step=0009325) Train Loss: 6.4140, Train Steps/Sec: 0.69
|
| 407 |
+
[[34m2025-03-20 23:32:50[0m] (step=0009350) Train Loss: 6.4122, Train Steps/Sec: 0.71
|
| 408 |
+
[[34m2025-03-20 23:33:25[0m] (step=0009375) Train Loss: 6.4518, Train Steps/Sec: 0.72
|
| 409 |
+
[[34m2025-03-20 23:34:00[0m] (step=0009400) Train Loss: 6.4317, Train Steps/Sec: 0.72
|
| 410 |
+
[[34m2025-03-20 23:34:35[0m] (step=0009425) Train Loss: 6.4246, Train Steps/Sec: 0.72
|
| 411 |
+
[[34m2025-03-20 23:35:10[0m] (step=0009450) Train Loss: 6.4295, Train Steps/Sec: 0.72
|
| 412 |
+
[[34m2025-03-20 23:35:45[0m] (step=0009475) Train Loss: 6.4028, Train Steps/Sec: 0.72
|
| 413 |
+
[[34m2025-03-20 23:36:20[0m] (step=0009500) Train Loss: 6.4494, Train Steps/Sec: 0.72
|
| 414 |
+
[[34m2025-03-20 23:36:56[0m] (step=0009525) Train Loss: 6.4273, Train Steps/Sec: 0.69
|
| 415 |
+
[[34m2025-03-20 23:37:31[0m] (step=0009550) Train Loss: 6.4171, Train Steps/Sec: 0.72
|
| 416 |
+
[[34m2025-03-20 23:38:06[0m] (step=0009575) Train Loss: 6.4188, Train Steps/Sec: 0.72
|
| 417 |
+
[[34m2025-03-20 23:38:41[0m] (step=0009600) Train Loss: 6.4070, Train Steps/Sec: 0.72
|
| 418 |
+
[[34m2025-03-20 23:39:16[0m] (step=0009625) Train Loss: 6.4522, Train Steps/Sec: 0.72
|
| 419 |
+
[[34m2025-03-20 23:39:51[0m] (step=0009650) Train Loss: 6.4258, Train Steps/Sec: 0.72
|
| 420 |
+
[[34m2025-03-20 23:40:26[0m] (step=0009675) Train Loss: 6.3994, Train Steps/Sec: 0.72
|
| 421 |
+
[[34m2025-03-20 23:41:02[0m] (step=0009700) Train Loss: 6.4628, Train Steps/Sec: 0.70
|
| 422 |
+
[[34m2025-03-20 23:41:38[0m] (step=0009725) Train Loss: 6.4372, Train Steps/Sec: 0.69
|
| 423 |
+
[[34m2025-03-20 23:42:13[0m] (step=0009750) Train Loss: 6.4326, Train Steps/Sec: 0.72
|
| 424 |
+
[[34m2025-03-20 23:42:48[0m] (step=0009775) Train Loss: 6.3777, Train Steps/Sec: 0.71
|
| 425 |
+
[[34m2025-03-20 23:43:23[0m] (step=0009800) Train Loss: 6.4572, Train Steps/Sec: 0.72
|
| 426 |
+
[[34m2025-03-20 23:43:58[0m] (step=0009825) Train Loss: 6.4424, Train Steps/Sec: 0.72
|
| 427 |
+
[[34m2025-03-20 23:44:33[0m] (step=0009850) Train Loss: 6.4162, Train Steps/Sec: 0.72
|
| 428 |
+
[[34m2025-03-20 23:45:08[0m] (step=0009875) Train Loss: 6.4122, Train Steps/Sec: 0.72
|
| 429 |
+
[[34m2025-03-20 23:45:43[0m] (step=0009900) Train Loss: 6.4317, Train Steps/Sec: 0.72
|
| 430 |
+
[[34m2025-03-20 23:46:18[0m] (step=0009925) Train Loss: 6.4246, Train Steps/Sec: 0.72
|
| 431 |
+
[[34m2025-03-20 23:46:52[0m] (step=0009950) Train Loss: 6.4365, Train Steps/Sec: 0.72
|
| 432 |
+
[[34m2025-03-20 23:47:27[0m] (step=0009975) Train Loss: 6.4012, Train Steps/Sec: 0.72
|
| 433 |
+
[[34m2025-03-20 23:48:02[0m] (step=0010000) Train Loss: 6.4031, Train Steps/Sec: 0.71
|
| 434 |
+
[[34m2025-03-20 23:48:02[0m] text_config is None. Initializing the text config with default values (`OPTConfig`).
|
| 435 |
+
[[34m2025-03-20 23:54:05[0m] Finish Eval in 10000 steps...
|
| 436 |
+
[[34m2025-03-20 23:54:12[0m] Saved checkpoint to checkpoints/TWO_node_llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_noimageonly_newfix_train_all/014-GPT-XL/checkpoints/0010000.pt
|
| 437 |
+
[[34m2025-03-20 23:54:12[0m] Removed old checkpoint: checkpoints/TWO_node_llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_noimageonly_newfix_train_all/014-GPT-XL/checkpoints/0008000.pt
|
| 438 |
+
[[34m2025-03-20 23:54:47[0m] (step=0010025) Train Loss: 6.4260, Train Steps/Sec: 0.06
|
| 439 |
+
[[34m2025-03-20 23:55:23[0m] (step=0010050) Train Loss: 6.4366, Train Steps/Sec: 0.70
|
| 440 |
+
[[34m2025-03-20 23:55:58[0m] (step=0010075) Train Loss: 6.4279, Train Steps/Sec: 0.72
|
| 441 |
+
[[34m2025-03-20 23:56:33[0m] (step=0010100) Train Loss: 6.4262, Train Steps/Sec: 0.71
|
| 442 |
+
[[34m2025-03-20 23:57:08[0m] (step=0010125) Train Loss: 6.4424, Train Steps/Sec: 0.72
|
| 443 |
+
[[34m2025-03-20 23:57:43[0m] (step=0010150) Train Loss: 6.4015, Train Steps/Sec: 0.72
|
| 444 |
+
[[34m2025-03-20 23:58:19[0m] (step=0010175) Train Loss: 6.4151, Train Steps/Sec: 0.69
|
| 445 |
+
[[34m2025-03-20 23:58:55[0m] (step=0010200) Train Loss: 6.4362, Train Steps/Sec: 0.70
|
| 446 |
+
[[34m2025-03-20 23:59:30[0m] (step=0010225) Train Loss: 6.4059, Train Steps/Sec: 0.72
|
| 447 |
+
[[34m2025-03-21 00:00:05[0m] (step=0010250) Train Loss: 6.4311, Train Steps/Sec: 0.72
|
| 448 |
+
[[34m2025-03-21 00:00:40[0m] (step=0010275) Train Loss: 6.4228, Train Steps/Sec: 0.72
|
| 449 |
+
[[34m2025-03-21 00:01:15[0m] (step=0010300) Train Loss: 6.4479, Train Steps/Sec: 0.72
|
| 450 |
+
[[34m2025-03-21 00:01:50[0m] (step=0010325) Train Loss: 6.3938, Train Steps/Sec: 0.72
|
| 451 |
+
[[34m2025-03-21 00:02:25[0m] (step=0010350) Train Loss: 6.4197, Train Steps/Sec: 0.72
|
| 452 |
+
[[34m2025-03-21 00:03:00[0m] (step=0010375) Train Loss: 6.4202, Train Steps/Sec: 0.72
|
| 453 |
+
[[34m2025-03-21 00:03:35[0m] (step=0010400) Train Loss: 6.4000, Train Steps/Sec: 0.72
|
| 454 |
+
[[34m2025-03-21 00:04:09[0m] (step=0010425) Train Loss: 6.3945, Train Steps/Sec: 0.72
|
| 455 |
+
[[34m2025-03-21 00:04:45[0m] (step=0010450) Train Loss: 6.4062, Train Steps/Sec: 0.71
|
| 456 |
+
[[34m2025-03-21 00:05:20[0m] (step=0010475) Train Loss: 6.4326, Train Steps/Sec: 0.72
|
| 457 |
+
[[34m2025-03-21 00:05:55[0m] (step=0010500) Train Loss: 6.4376, Train Steps/Sec: 0.71
|
| 458 |
+
[[34m2025-03-21 00:06:30[0m] (step=0010525) Train Loss: 6.4355, Train Steps/Sec: 0.71
|
| 459 |
+
[[34m2025-03-21 00:07:05[0m] (step=0010550) Train Loss: 6.4296, Train Steps/Sec: 0.71
|
| 460 |
+
[[34m2025-03-21 00:07:40[0m] (step=0010575) Train Loss: 6.3752, Train Steps/Sec: 0.71
|
| 461 |
+
[[34m2025-03-21 00:08:14[0m] (step=0010600) Train Loss: 6.4095, Train Steps/Sec: 0.72
|
| 462 |
+
[[34m2025-03-21 00:08:49[0m] (step=0010625) Train Loss: 6.4422, Train Steps/Sec: 0.72
|
| 463 |
+
[[34m2025-03-21 00:09:24[0m] (step=0010650) Train Loss: 6.4269, Train Steps/Sec: 0.72
|
| 464 |
+
[[34m2025-03-21 00:09:59[0m] (step=0010675) Train Loss: 6.4177, Train Steps/Sec: 0.72
|
| 465 |
+
[[34m2025-03-21 00:10:34[0m] (step=0010700) Train Loss: 6.4081, Train Steps/Sec: 0.72
|
| 466 |
+
[[34m2025-03-21 00:11:09[0m] (step=0010725) Train Loss: 6.3981, Train Steps/Sec: 0.72
|
| 467 |
+
[[34m2025-03-21 00:11:44[0m] (step=0010750) Train Loss: 6.4044, Train Steps/Sec: 0.72
|
| 468 |
+
[[34m2025-03-21 00:12:19[0m] (step=0010775) Train Loss: 6.4084, Train Steps/Sec: 0.71
|
| 469 |
+
[[34m2025-03-21 00:12:54[0m] (step=0010800) Train Loss: 6.4108, Train Steps/Sec: 0.71
|
| 470 |
+
[[34m2025-03-21 00:13:29[0m] (step=0010825) Train Loss: 6.4256, Train Steps/Sec: 0.72
|
| 471 |
+
[[34m2025-03-21 00:14:04[0m] (step=0010850) Train Loss: 6.4444, Train Steps/Sec: 0.72
|
| 472 |
+
[[34m2025-03-21 00:14:39[0m] (step=0010875) Train Loss: 6.4490, Train Steps/Sec: 0.71
|
| 473 |
+
[[34m2025-03-21 00:15:14[0m] (step=0010900) Train Loss: 6.4379, Train Steps/Sec: 0.72
|
| 474 |
+
[[34m2025-03-21 00:15:49[0m] (step=0010925) Train Loss: 6.4175, Train Steps/Sec: 0.72
|
| 475 |
+
[[34m2025-03-21 00:16:24[0m] (step=0010950) Train Loss: 6.4370, Train Steps/Sec: 0.72
|
| 476 |
+
[[34m2025-03-21 00:16:59[0m] (step=0010975) Train Loss: 6.4121, Train Steps/Sec: 0.72
|
| 477 |
+
[[34m2025-03-21 00:17:34[0m] (step=0011000) Train Loss: 6.4375, Train Steps/Sec: 0.72
|
| 478 |
+
[[34m2025-03-21 00:18:09[0m] (step=0011025) Train Loss: 6.4554, Train Steps/Sec: 0.72
|
| 479 |
+
[[34m2025-03-21 00:18:44[0m] (step=0011050) Train Loss: 6.4220, Train Steps/Sec: 0.72
|
| 480 |
+
[[34m2025-03-21 00:19:18[0m] (step=0011075) Train Loss: 6.4181, Train Steps/Sec: 0.72
|
| 481 |
+
[[34m2025-03-21 00:19:53[0m] (step=0011100) Train Loss: 6.4430, Train Steps/Sec: 0.72
|
| 482 |
+
[[34m2025-03-21 00:20:28[0m] (step=0011125) Train Loss: 6.4202, Train Steps/Sec: 0.72
|
| 483 |
+
[[34m2025-03-21 00:21:03[0m] (step=0011150) Train Loss: 6.4380, Train Steps/Sec: 0.72
|
| 484 |
+
[[34m2025-03-21 00:21:38[0m] (step=0011175) Train Loss: 6.4583, Train Steps/Sec: 0.72
|
| 485 |
+
[[34m2025-03-21 00:22:13[0m] (step=0011200) Train Loss: 6.3895, Train Steps/Sec: 0.72
|
| 486 |
+
[[34m2025-03-21 00:22:48[0m] (step=0011225) Train Loss: 6.4082, Train Steps/Sec: 0.72
|
| 487 |
+
[[34m2025-03-21 00:23:23[0m] (step=0011250) Train Loss: 6.4263, Train Steps/Sec: 0.72
|
| 488 |
+
[[34m2025-03-21 00:23:58[0m] (step=0011275) Train Loss: 6.4234, Train Steps/Sec: 0.72
|
| 489 |
+
[[34m2025-03-21 00:24:33[0m] (step=0011300) Train Loss: 6.4234, Train Steps/Sec: 0.72
|
| 490 |
+
[[34m2025-03-21 00:25:08[0m] (step=0011325) Train Loss: 6.4205, Train Steps/Sec: 0.72
|
| 491 |
+
[[34m2025-03-21 00:25:43[0m] (step=0011350) Train Loss: 6.4295, Train Steps/Sec: 0.72
|
| 492 |
+
[[34m2025-03-21 00:26:18[0m] (step=0011375) Train Loss: 6.4027, Train Steps/Sec: 0.72
|
| 493 |
+
[[34m2025-03-21 00:26:53[0m] (step=0011400) Train Loss: 6.4427, Train Steps/Sec: 0.72
|
| 494 |
+
[[34m2025-03-21 00:27:29[0m] (step=0011425) Train Loss: 6.4372, Train Steps/Sec: 0.69
|
| 495 |
+
[[34m2025-03-21 00:28:04[0m] (step=0011450) Train Loss: 6.4177, Train Steps/Sec: 0.72
|
| 496 |
+
[[34m2025-03-21 00:28:39[0m] (step=0011475) Train Loss: 6.3940, Train Steps/Sec: 0.72
|
| 497 |
+
[[34m2025-03-21 00:29:14[0m] (step=0011500) Train Loss: 6.4064, Train Steps/Sec: 0.72
|
| 498 |
+
[[34m2025-03-21 00:29:49[0m] (step=0011525) Train Loss: 6.4154, Train Steps/Sec: 0.72
|
| 499 |
+
[[34m2025-03-21 00:30:24[0m] (step=0011550) Train Loss: 6.4276, Train Steps/Sec: 0.72
|
| 500 |
+
[[34m2025-03-21 00:31:00[0m] (step=0011575) Train Loss: 6.4411, Train Steps/Sec: 0.69
|
| 501 |
+
[[34m2025-03-21 00:31:35[0m] (step=0011600) Train Loss: 6.4168, Train Steps/Sec: 0.72
|
| 502 |
+
[[34m2025-03-21 00:32:10[0m] (step=0011625) Train Loss: 6.4424, Train Steps/Sec: 0.72
|
| 503 |
+
[[34m2025-03-21 00:32:45[0m] (step=0011650) Train Loss: 6.3940, Train Steps/Sec: 0.72
|
| 504 |
+
[[34m2025-03-21 00:33:20[0m] (step=0011675) Train Loss: 6.4143, Train Steps/Sec: 0.72
|
| 505 |
+
[[34m2025-03-21 00:33:55[0m] (step=0011700) Train Loss: 6.4287, Train Steps/Sec: 0.72
|
| 506 |
+
[[34m2025-03-21 00:34:31[0m] (step=0011725) Train Loss: 6.4099, Train Steps/Sec: 0.69
|
| 507 |
+
[[34m2025-03-21 00:35:06[0m] (step=0011750) Train Loss: 6.4160, Train Steps/Sec: 0.72
|
| 508 |
+
[[34m2025-03-21 00:35:42[0m] (step=0011775) Train Loss: 6.4239, Train Steps/Sec: 0.69
|
| 509 |
+
[[34m2025-03-21 00:36:17[0m] (step=0011800) Train Loss: 6.4091, Train Steps/Sec: 0.72
|
| 510 |
+
[[34m2025-03-21 00:36:52[0m] (step=0011825) Train Loss: 6.4256, Train Steps/Sec: 0.72
|
| 511 |
+
[[34m2025-03-21 00:37:27[0m] (step=0011850) Train Loss: 6.4225, Train Steps/Sec: 0.72
|
| 512 |
+
[[34m2025-03-21 00:38:02[0m] (step=0011875) Train Loss: 6.4456, Train Steps/Sec: 0.72
|
| 513 |
+
[[34m2025-03-21 00:38:37[0m] (step=0011900) Train Loss: 6.4158, Train Steps/Sec: 0.72
|
| 514 |
+
[[34m2025-03-21 00:39:13[0m] (step=0011925) Train Loss: 6.3986, Train Steps/Sec: 0.69
|
| 515 |
+
[[34m2025-03-21 00:39:49[0m] (step=0011950) Train Loss: 6.4204, Train Steps/Sec: 0.69
|
| 516 |
+
[[34m2025-03-21 00:40:24[0m] (step=0011975) Train Loss: 6.4600, Train Steps/Sec: 0.72
|
| 517 |
+
[[34m2025-03-21 00:40:59[0m] (step=0012000) Train Loss: 6.3997, Train Steps/Sec: 0.72
|
| 518 |
+
[[34m2025-03-21 00:40:59[0m] text_config is None. Initializing the text config with default values (`OPTConfig`).
|
| 519 |
+
[[34m2025-03-21 00:47:01[0m] Finish Eval in 12000 steps...
|
| 520 |
+
[[34m2025-03-21 00:47:07[0m] Saved checkpoint to checkpoints/TWO_node_llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_noimageonly_newfix_train_all/014-GPT-XL/checkpoints/0012000.pt
|
| 521 |
+
[[34m2025-03-21 00:47:08[0m] Removed old checkpoint: checkpoints/TWO_node_llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_noimageonly_newfix_train_all/014-GPT-XL/checkpoints/0010000.pt
|
| 522 |
+
[[34m2025-03-21 00:47:43[0m] (step=0012025) Train Loss: 6.4527, Train Steps/Sec: 0.06
|
| 523 |
+
[[34m2025-03-21 00:48:18[0m] (step=0012050) Train Loss: 6.4047, Train Steps/Sec: 0.72
|
| 524 |
+
[[34m2025-03-21 00:48:53[0m] (step=0012075) Train Loss: 6.4092, Train Steps/Sec: 0.72
|
| 525 |
+
[[34m2025-03-21 00:49:28[0m] (step=0012100) Train Loss: 6.4124, Train Steps/Sec: 0.72
|
| 526 |
+
[[34m2025-03-21 00:50:03[0m] (step=0012125) Train Loss: 6.4431, Train Steps/Sec: 0.72
|
| 527 |
+
[[34m2025-03-21 00:50:38[0m] (step=0012150) Train Loss: 6.4172, Train Steps/Sec: 0.72
|
| 528 |
+
[[34m2025-03-21 00:51:13[0m] (step=0012175) Train Loss: 6.4271, Train Steps/Sec: 0.72
|
| 529 |
+
[[34m2025-03-21 00:51:49[0m] (step=0012200) Train Loss: 6.4311, Train Steps/Sec: 0.70
|
| 530 |
+
[[34m2025-03-21 00:52:24[0m] (step=0012225) Train Loss: 6.4038, Train Steps/Sec: 0.72
|
| 531 |
+
[[34m2025-03-21 00:52:58[0m] (step=0012250) Train Loss: 6.3975, Train Steps/Sec: 0.72
|
| 532 |
+
[[34m2025-03-21 00:53:33[0m] (step=0012275) Train Loss: 6.4112, Train Steps/Sec: 0.72
|
| 533 |
+
[[34m2025-03-21 00:54:08[0m] (step=0012300) Train Loss: 6.4272, Train Steps/Sec: 0.72
|
| 534 |
+
[[34m2025-03-21 00:54:43[0m] (step=0012325) Train Loss: 6.4207, Train Steps/Sec: 0.72
|
| 535 |
+
[[34m2025-03-21 00:55:19[0m] (step=0012350) Train Loss: 6.4475, Train Steps/Sec: 0.70
|
| 536 |
+
[[34m2025-03-21 00:55:54[0m] (step=0012375) Train Loss: 6.4283, Train Steps/Sec: 0.72
|
| 537 |
+
[[34m2025-03-21 00:56:29[0m] (step=0012400) Train Loss: 6.3989, Train Steps/Sec: 0.72
|
| 538 |
+
[[34m2025-03-21 00:57:04[0m] (step=0012425) Train Loss: 6.4149, Train Steps/Sec: 0.72
|
| 539 |
+
[[34m2025-03-21 00:57:39[0m] (step=0012450) Train Loss: 6.4022, Train Steps/Sec: 0.72
|
| 540 |
+
[[34m2025-03-21 00:58:14[0m] (step=0012475) Train Loss: 6.4146, Train Steps/Sec: 0.72
|
| 541 |
+
[[34m2025-03-21 00:58:49[0m] (step=0012500) Train Loss: 6.4397, Train Steps/Sec: 0.72
|
| 542 |
+
[[34m2025-03-21 00:59:24[0m] (step=0012525) Train Loss: 6.3778, Train Steps/Sec: 0.72
|
| 543 |
+
[[34m2025-03-21 00:59:59[0m] (step=0012550) Train Loss: 6.4386, Train Steps/Sec: 0.72
|
| 544 |
+
[[34m2025-03-21 01:00:34[0m] (step=0012575) Train Loss: 6.3805, Train Steps/Sec: 0.72
|
| 545 |
+
[[34m2025-03-21 01:01:09[0m] (step=0012600) Train Loss: 6.4210, Train Steps/Sec: 0.72
|
| 546 |
+
[[34m2025-03-21 01:01:43[0m] (step=0012625) Train Loss: 6.4042, Train Steps/Sec: 0.72
|
| 547 |
+
[[34m2025-03-21 01:02:18[0m] (step=0012650) Train Loss: 6.4037, Train Steps/Sec: 0.72
|
| 548 |
+
[[34m2025-03-21 01:02:53[0m] (step=0012675) Train Loss: 6.4223, Train Steps/Sec: 0.72
|
| 549 |
+
[[34m2025-03-21 01:03:28[0m] (step=0012700) Train Loss: 6.3889, Train Steps/Sec: 0.72
|
| 550 |
+
[[34m2025-03-21 01:04:03[0m] (step=0012725) Train Loss: 6.4150, Train Steps/Sec: 0.72
|
| 551 |
+
[[34m2025-03-21 01:04:38[0m] (step=0012750) Train Loss: 6.4073, Train Steps/Sec: 0.72
|
| 552 |
+
[[34m2025-03-21 01:05:13[0m] (step=0012775) Train Loss: 6.4256, Train Steps/Sec: 0.72
|
| 553 |
+
[[34m2025-03-21 01:05:48[0m] (step=0012800) Train Loss: 6.4097, Train Steps/Sec: 0.72
|
| 554 |
+
[[34m2025-03-21 01:06:23[0m] (step=0012825) Train Loss: 6.4153, Train Steps/Sec: 0.72
|
| 555 |
+
[[34m2025-03-21 01:06:58[0m] (step=0012850) Train Loss: 6.3949, Train Steps/Sec: 0.72
|
| 556 |
+
[[34m2025-03-21 01:07:33[0m] (step=0012875) Train Loss: 6.4377, Train Steps/Sec: 0.72
|
| 557 |
+
[[34m2025-03-21 01:08:08[0m] (step=0012900) Train Loss: 6.4257, Train Steps/Sec: 0.72
|
| 558 |
+
[[34m2025-03-21 01:08:43[0m] (step=0012925) Train Loss: 6.4156, Train Steps/Sec: 0.72
|
| 559 |
+
[[34m2025-03-21 01:09:18[0m] (step=0012950) Train Loss: 6.3821, Train Steps/Sec: 0.72
|
| 560 |
+
[[34m2025-03-21 01:09:53[0m] (step=0012975) Train Loss: 6.4387, Train Steps/Sec: 0.72
|
| 561 |
+
[[34m2025-03-21 01:10:28[0m] (step=0013000) Train Loss: 6.4018, Train Steps/Sec: 0.72
|
| 562 |
+
[[34m2025-03-21 01:11:03[0m] (step=0013025) Train Loss: 6.4352, Train Steps/Sec: 0.72
|
| 563 |
+
[[34m2025-03-21 01:11:38[0m] (step=0013050) Train Loss: 6.4087, Train Steps/Sec: 0.72
|
| 564 |
+
[[34m2025-03-21 01:12:12[0m] (step=0013075) Train Loss: 6.4049, Train Steps/Sec: 0.72
|
| 565 |
+
[[34m2025-03-21 01:12:47[0m] (step=0013100) Train Loss: 6.4125, Train Steps/Sec: 0.72
|
| 566 |
+
[[34m2025-03-21 01:13:22[0m] (step=0013125) Train Loss: 6.4248, Train Steps/Sec: 0.71
|
| 567 |
+
[[34m2025-03-21 01:13:57[0m] (step=0013150) Train Loss: 6.4104, Train Steps/Sec: 0.72
|
| 568 |
+
[[34m2025-03-21 01:14:32[0m] (step=0013175) Train Loss: 6.4220, Train Steps/Sec: 0.72
|
| 569 |
+
[[34m2025-03-21 01:15:07[0m] (step=0013200) Train Loss: 6.4068, Train Steps/Sec: 0.72
|
| 570 |
+
[[34m2025-03-21 01:15:42[0m] (step=0013225) Train Loss: 6.3936, Train Steps/Sec: 0.72
|
| 571 |
+
[[34m2025-03-21 01:16:17[0m] (step=0013250) Train Loss: 6.4138, Train Steps/Sec: 0.72
|
| 572 |
+
[[34m2025-03-21 01:16:52[0m] (step=0013275) Train Loss: 6.4003, Train Steps/Sec: 0.72
|
| 573 |
+
[[34m2025-03-21 01:17:27[0m] (step=0013300) Train Loss: 6.4214, Train Steps/Sec: 0.72
|
| 574 |
+
[[34m2025-03-21 01:18:02[0m] (step=0013325) Train Loss: 6.4274, Train Steps/Sec: 0.72
|
| 575 |
+
[[34m2025-03-21 01:18:37[0m] (step=0013350) Train Loss: 6.3881, Train Steps/Sec: 0.72
|
| 576 |
+
[[34m2025-03-21 01:19:12[0m] (step=0013375) Train Loss: 6.4484, Train Steps/Sec: 0.72
|
| 577 |
+
[[34m2025-03-21 01:19:47[0m] (step=0013400) Train Loss: 6.3996, Train Steps/Sec: 0.72
|
| 578 |
+
[[34m2025-03-21 01:20:22[0m] (step=0013425) Train Loss: 6.4103, Train Steps/Sec: 0.72
|
| 579 |
+
[[34m2025-03-21 01:20:56[0m] (step=0013450) Train Loss: 6.4189, Train Steps/Sec: 0.72
|
| 580 |
+
[[34m2025-03-21 01:21:31[0m] (step=0013475) Train Loss: 6.4467, Train Steps/Sec: 0.72
|
| 581 |
+
[[34m2025-03-21 01:22:06[0m] (step=0013500) Train Loss: 6.4088, Train Steps/Sec: 0.72
|
| 582 |
+
[[34m2025-03-21 01:22:41[0m] (step=0013525) Train Loss: 6.4400, Train Steps/Sec: 0.72
|
| 583 |
+
[[34m2025-03-21 01:23:16[0m] (step=0013550) Train Loss: 6.4119, Train Steps/Sec: 0.72
|
| 584 |
+
[[34m2025-03-21 01:23:51[0m] (step=0013575) Train Loss: 6.4174, Train Steps/Sec: 0.72
|
| 585 |
+
[[34m2025-03-21 01:24:26[0m] (step=0013600) Train Loss: 6.4185, Train Steps/Sec: 0.72
|
| 586 |
+
[[34m2025-03-21 01:25:01[0m] (step=0013625) Train Loss: 6.4157, Train Steps/Sec: 0.72
|
| 587 |
+
[[34m2025-03-21 01:25:36[0m] (step=0013650) Train Loss: 6.4242, Train Steps/Sec: 0.72
|
| 588 |
+
[[34m2025-03-21 01:26:11[0m] (step=0013675) Train Loss: 6.4308, Train Steps/Sec: 0.72
|
| 589 |
+
[[34m2025-03-21 01:26:46[0m] (step=0013700) Train Loss: 6.4183, Train Steps/Sec: 0.72
|
| 590 |
+
[[34m2025-03-21 01:27:22[0m] (step=0013725) Train Loss: 6.4363, Train Steps/Sec: 0.69
|
| 591 |
+
[[34m2025-03-21 01:27:57[0m] (step=0013750) Train Loss: 6.4227, Train Steps/Sec: 0.72
|
| 592 |
+
[[34m2025-03-21 01:28:32[0m] (step=0013775) Train Loss: 6.4476, Train Steps/Sec: 0.72
|
| 593 |
+
[[34m2025-03-21 01:29:07[0m] (step=0013800) Train Loss: 6.3768, Train Steps/Sec: 0.72
|
| 594 |
+
[[34m2025-03-21 01:29:42[0m] (step=0013825) Train Loss: 6.4080, Train Steps/Sec: 0.72
|
| 595 |
+
[[34m2025-03-21 01:30:17[0m] (step=0013850) Train Loss: 6.3899, Train Steps/Sec: 0.72
|
| 596 |
+
[[34m2025-03-21 01:30:52[0m] (step=0013875) Train Loss: 6.3891, Train Steps/Sec: 0.72
|
| 597 |
+
[[34m2025-03-21 01:31:26[0m] (step=0013900) Train Loss: 6.4219, Train Steps/Sec: 0.72
|
| 598 |
+
[[34m2025-03-21 01:32:03[0m] (step=0013925) Train Loss: 6.4217, Train Steps/Sec: 0.69
|
| 599 |
+
[[34m2025-03-21 01:32:37[0m] (step=0013950) Train Loss: 6.4133, Train Steps/Sec: 0.72
|
| 600 |
+
[[34m2025-03-21 01:33:12[0m] (step=0013975) Train Loss: 6.4125, Train Steps/Sec: 0.72
|
| 601 |
+
[[34m2025-03-21 01:33:47[0m] (step=0014000) Train Loss: 6.4182, Train Steps/Sec: 0.72
|
| 602 |
+
[[34m2025-03-21 01:33:47[0m] text_config is None. Initializing the text config with default values (`OPTConfig`).
|
| 603 |
+
[[34m2025-03-21 01:39:52[0m] Finish Eval in 14000 steps...
|
| 604 |
+
[[34m2025-03-21 01:39:58[0m] Saved checkpoint to checkpoints/TWO_node_llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_noimageonly_newfix_train_all/014-GPT-XL/checkpoints/0014000.pt
|
| 605 |
+
[[34m2025-03-21 01:39:59[0m] Removed old checkpoint: checkpoints/TWO_node_llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_noimageonly_newfix_train_all/014-GPT-XL/checkpoints/0012000.pt
|
| 606 |
+
[[34m2025-03-21 01:40:34[0m] (step=0014025) Train Loss: 6.4065, Train Steps/Sec: 0.06
|
| 607 |
+
[[34m2025-03-21 01:41:09[0m] (step=0014050) Train Loss: 6.4122, Train Steps/Sec: 0.72
|
| 608 |
+
[[34m2025-03-21 01:41:45[0m] (step=0014075) Train Loss: 6.3893, Train Steps/Sec: 0.69
|
| 609 |
+
[[34m2025-03-21 01:42:20[0m] (step=0014100) Train Loss: 6.3906, Train Steps/Sec: 0.72
|
| 610 |
+
[[34m2025-03-21 01:42:55[0m] (step=0014125) Train Loss: 6.3803, Train Steps/Sec: 0.72
|
| 611 |
+
[[34m2025-03-21 01:43:30[0m] (step=0014150) Train Loss: 6.3899, Train Steps/Sec: 0.72
|
| 612 |
+
[[34m2025-03-21 01:44:05[0m] (step=0014175) Train Loss: 6.4217, Train Steps/Sec: 0.72
|
| 613 |
+
[[34m2025-03-21 01:44:41[0m] (step=0014200) Train Loss: 6.4139, Train Steps/Sec: 0.70
|
| 614 |
+
[[34m2025-03-21 01:45:16[0m] (step=0014225) Train Loss: 6.4077, Train Steps/Sec: 0.72
|
| 615 |
+
[[34m2025-03-21 01:45:51[0m] (step=0014250) Train Loss: 6.3863, Train Steps/Sec: 0.72
|
| 616 |
+
[[34m2025-03-21 01:46:26[0m] (step=0014275) Train Loss: 6.4040, Train Steps/Sec: 0.72
|
| 617 |
+
[[34m2025-03-21 01:47:01[0m] (step=0014300) Train Loss: 6.4216, Train Steps/Sec: 0.71
|
| 618 |
+
[[34m2025-03-21 01:47:36[0m] (step=0014325) Train Loss: 6.3933, Train Steps/Sec: 0.72
|
| 619 |
+
[[34m2025-03-21 01:48:11[0m] (step=0014350) Train Loss: 6.4138, Train Steps/Sec: 0.72
|
| 620 |
+
[[34m2025-03-21 01:48:46[0m] (step=0014375) Train Loss: 6.3870, Train Steps/Sec: 0.70
|
| 621 |
+
[[34m2025-03-21 01:49:21[0m] (step=0014400) Train Loss: 6.4153, Train Steps/Sec: 0.72
|
| 622 |
+
[[34m2025-03-21 01:49:56[0m] (step=0014425) Train Loss: 6.4030, Train Steps/Sec: 0.72
|
| 623 |
+
[[34m2025-03-21 01:50:31[0m] (step=0014450) Train Loss: 6.4307, Train Steps/Sec: 0.72
|
| 624 |
+
[[34m2025-03-21 01:51:06[0m] (step=0014475) Train Loss: 6.3967, Train Steps/Sec: 0.72
|
| 625 |
+
[[34m2025-03-21 01:51:41[0m] (step=0014500) Train Loss: 6.4080, Train Steps/Sec: 0.72
|
| 626 |
+
[[34m2025-03-21 01:52:16[0m] (step=0014525) Train Loss: 6.4092, Train Steps/Sec: 0.72
|
| 627 |
+
[[34m2025-03-21 01:52:52[0m] (step=0014550) Train Loss: 6.4266, Train Steps/Sec: 0.70
|
| 628 |
+
[[34m2025-03-21 01:53:27[0m] (step=0014575) Train Loss: 6.4017, Train Steps/Sec: 0.72
|
| 629 |
+
[[34m2025-03-21 01:54:02[0m] (step=0014600) Train Loss: 6.3990, Train Steps/Sec: 0.72
|
| 630 |
+
[[34m2025-03-21 01:54:37[0m] (step=0014625) Train Loss: 6.3913, Train Steps/Sec: 0.72
|
| 631 |
+
[[34m2025-03-21 01:55:12[0m] (step=0014650) Train Loss: 6.4007, Train Steps/Sec: 0.72
|
| 632 |
+
[[34m2025-03-21 01:55:46[0m] (step=0014675) Train Loss: 6.4025, Train Steps/Sec: 0.72
|
| 633 |
+
[[34m2025-03-21 01:56:21[0m] (step=0014700) Train Loss: 6.3865, Train Steps/Sec: 0.72
|
| 634 |
+
[[34m2025-03-21 01:56:56[0m] (step=0014725) Train Loss: 6.4113, Train Steps/Sec: 0.72
|
| 635 |
+
[[34m2025-03-21 01:57:32[0m] (step=0014750) Train Loss: 6.4391, Train Steps/Sec: 0.69
|
| 636 |
+
[[34m2025-03-21 01:58:07[0m] (step=0014775) Train Loss: 6.3700, Train Steps/Sec: 0.72
|
| 637 |
+
[[34m2025-03-21 01:58:43[0m] (step=0014800) Train Loss: 6.4230, Train Steps/Sec: 0.70
|
| 638 |
+
[[34m2025-03-21 01:59:18[0m] (step=0014825) Train Loss: 6.4252, Train Steps/Sec: 0.72
|
| 639 |
+
[[34m2025-03-21 01:59:53[0m] (step=0014850) Train Loss: 6.4132, Train Steps/Sec: 0.72
|
| 640 |
+
[[34m2025-03-21 02:00:28[0m] (step=0014875) Train Loss: 6.4216, Train Steps/Sec: 0.72
|
| 641 |
+
[[34m2025-03-21 02:01:03[0m] (step=0014900) Train Loss: 6.4215, Train Steps/Sec: 0.72
|
| 642 |
+
[[34m2025-03-21 02:01:38[0m] (step=0014925) Train Loss: 6.4252, Train Steps/Sec: 0.72
|
| 643 |
+
[[34m2025-03-21 02:02:13[0m] (step=0014950) Train Loss: 6.4355, Train Steps/Sec: 0.71
|
| 644 |
+
[[34m2025-03-21 02:02:48[0m] (step=0014975) Train Loss: 6.3882, Train Steps/Sec: 0.72
|
| 645 |
+
[[34m2025-03-21 02:03:23[0m] (step=0015000) Train Loss: 6.4048, Train Steps/Sec: 0.72
|
| 646 |
+
[[34m2025-03-21 02:03:58[0m] (step=0015025) Train Loss: 6.4226, Train Steps/Sec: 0.72
|
| 647 |
+
[[34m2025-03-21 02:04:33[0m] (step=0015050) Train Loss: 6.3703, Train Steps/Sec: 0.72
|
| 648 |
+
[[34m2025-03-21 02:05:08[0m] (step=0015075) Train Loss: 6.4106, Train Steps/Sec: 0.72
|
| 649 |
+
[[34m2025-03-21 02:05:43[0m] (step=0015100) Train Loss: 6.4465, Train Steps/Sec: 0.72
|
| 650 |
+
[[34m2025-03-21 02:06:18[0m] (step=0015125) Train Loss: 6.4212, Train Steps/Sec: 0.72
|
| 651 |
+
[[34m2025-03-21 02:06:53[0m] (step=0015150) Train Loss: 6.4173, Train Steps/Sec: 0.72
|
| 652 |
+
[[34m2025-03-21 02:07:28[0m] (step=0015175) Train Loss: 6.3896, Train Steps/Sec: 0.72
|
| 653 |
+
[[34m2025-03-21 02:08:02[0m] (step=0015200) Train Loss: 6.4121, Train Steps/Sec: 0.72
|
| 654 |
+
[[34m2025-03-21 02:08:37[0m] (step=0015225) Train Loss: 6.4142, Train Steps/Sec: 0.72
|
| 655 |
+
[[34m2025-03-21 02:09:12[0m] (step=0015250) Train Loss: 6.4024, Train Steps/Sec: 0.72
|
| 656 |
+
[[34m2025-03-21 02:09:47[0m] (step=0015275) Train Loss: 6.3999, Train Steps/Sec: 0.72
|
| 657 |
+
[[34m2025-03-21 02:10:22[0m] (step=0015300) Train Loss: 6.3833, Train Steps/Sec: 0.72
|
| 658 |
+
[[34m2025-03-21 02:10:57[0m] (step=0015325) Train Loss: 6.4049, Train Steps/Sec: 0.72
|
| 659 |
+
[[34m2025-03-21 02:11:32[0m] (step=0015350) Train Loss: 6.4081, Train Steps/Sec: 0.72
|
| 660 |
+
[[34m2025-03-21 02:12:07[0m] (step=0015375) Train Loss: 6.4086, Train Steps/Sec: 0.71
|
| 661 |
+
[[34m2025-03-21 02:12:42[0m] (step=0015400) Train Loss: 6.4242, Train Steps/Sec: 0.72
|
| 662 |
+
[[34m2025-03-21 02:13:17[0m] (step=0015425) Train Loss: 6.3931, Train Steps/Sec: 0.72
|
| 663 |
+
[[34m2025-03-21 02:13:52[0m] (step=0015450) Train Loss: 6.4196, Train Steps/Sec: 0.72
|
| 664 |
+
[[34m2025-03-21 02:14:27[0m] (step=0015475) Train Loss: 6.4264, Train Steps/Sec: 0.72
|
| 665 |
+
[[34m2025-03-21 02:15:02[0m] (step=0015500) Train Loss: 6.4135, Train Steps/Sec: 0.72
|
| 666 |
+
[[34m2025-03-21 02:15:37[0m] (step=0015525) Train Loss: 6.4198, Train Steps/Sec: 0.72
|
| 667 |
+
[[34m2025-03-21 02:16:12[0m] (step=0015550) Train Loss: 6.3877, Train Steps/Sec: 0.72
|
| 668 |
+
[[34m2025-03-21 02:16:47[0m] (step=0015575) Train Loss: 6.3871, Train Steps/Sec: 0.72
|
| 669 |
+
[[34m2025-03-21 02:17:22[0m] (step=0015600) Train Loss: 6.4317, Train Steps/Sec: 0.72
|
| 670 |
+
[[34m2025-03-21 02:17:57[0m] (step=0015625) Train Loss: 6.4222, Train Steps/Sec: 0.72
|
| 671 |
+
[[34m2025-03-21 02:18:32[0m] (step=0015650) Train Loss: 6.3991, Train Steps/Sec: 0.72
|
| 672 |
+
[[34m2025-03-21 02:19:07[0m] (step=0015675) Train Loss: 6.4249, Train Steps/Sec: 0.72
|
| 673 |
+
[[34m2025-03-21 02:19:41[0m] (step=0015700) Train Loss: 6.4182, Train Steps/Sec: 0.72
|
| 674 |
+
[[34m2025-03-21 02:20:18[0m] (step=0015725) Train Loss: 6.4274, Train Steps/Sec: 0.69
|
| 675 |
+
[[34m2025-03-21 02:20:53[0m] (step=0015750) Train Loss: 6.3992, Train Steps/Sec: 0.72
|
| 676 |
+
[[34m2025-03-21 02:21:27[0m] (step=0015775) Train Loss: 6.3805, Train Steps/Sec: 0.72
|
| 677 |
+
[[34m2025-03-21 02:22:02[0m] (step=0015800) Train Loss: 6.3755, Train Steps/Sec: 0.72
|
| 678 |
+
[[34m2025-03-21 02:22:37[0m] (step=0015825) Train Loss: 6.3810, Train Steps/Sec: 0.72
|
| 679 |
+
[[34m2025-03-21 02:23:12[0m] (step=0015850) Train Loss: 6.4024, Train Steps/Sec: 0.72
|
| 680 |
+
[[34m2025-03-21 02:23:47[0m] (step=0015875) Train Loss: 6.3810, Train Steps/Sec: 0.71
|
| 681 |
+
[[34m2025-03-21 02:24:23[0m] (step=0015900) Train Loss: 6.4271, Train Steps/Sec: 0.69
|
| 682 |
+
[[34m2025-03-21 02:24:58[0m] (step=0015925) Train Loss: 6.4100, Train Steps/Sec: 0.72
|
| 683 |
+
[[34m2025-03-21 02:25:33[0m] (step=0015950) Train Loss: 6.3983, Train Steps/Sec: 0.72
|
| 684 |
+
[[34m2025-03-21 02:26:08[0m] (step=0015975) Train Loss: 6.4109, Train Steps/Sec: 0.72
|
| 685 |
+
[[34m2025-03-21 02:26:43[0m] (step=0016000) Train Loss: 6.4364, Train Steps/Sec: 0.72
|
| 686 |
+
[[34m2025-03-21 02:26:43[0m] text_config is None. Initializing the text config with default values (`OPTConfig`).
|
| 687 |
+
[[34m2025-03-21 02:32:45[0m] Finish Eval in 16000 steps...
|
| 688 |
+
[[34m2025-03-21 02:32:52[0m] Saved checkpoint to checkpoints/TWO_node_llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_noimageonly_newfix_train_all/014-GPT-XL/checkpoints/0016000.pt
|
| 689 |
+
[[34m2025-03-21 02:32:53[0m] Removed old checkpoint: checkpoints/TWO_node_llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_noimageonly_newfix_train_all/014-GPT-XL/checkpoints/0014000.pt
|
| 690 |
+
[[34m2025-03-21 02:33:28[0m] (step=0016025) Train Loss: 6.4140, Train Steps/Sec: 0.06
|
| 691 |
+
[[34m2025-03-21 02:34:03[0m] (step=0016050) Train Loss: 6.4090, Train Steps/Sec: 0.72
|
| 692 |
+
[[34m2025-03-21 02:34:38[0m] (step=0016075) Train Loss: 6.4002, Train Steps/Sec: 0.71
|
| 693 |
+
[[34m2025-03-21 02:35:14[0m] (step=0016100) Train Loss: 6.3993, Train Steps/Sec: 0.69
|
| 694 |
+
[[34m2025-03-21 02:35:49[0m] (step=0016125) Train Loss: 6.4020, Train Steps/Sec: 0.72
|
| 695 |
+
[[34m2025-03-21 02:36:25[0m] (step=0016150) Train Loss: 6.4036, Train Steps/Sec: 0.70
|
| 696 |
+
[[34m2025-03-21 02:37:00[0m] (step=0016175) Train Loss: 6.4256, Train Steps/Sec: 0.72
|
| 697 |
+
[[34m2025-03-21 02:37:35[0m] (step=0016200) Train Loss: 6.3889, Train Steps/Sec: 0.72
|
| 698 |
+
[[34m2025-03-21 02:38:10[0m] (step=0016225) Train Loss: 6.4008, Train Steps/Sec: 0.72
|
| 699 |
+
[[34m2025-03-21 02:38:44[0m] (step=0016250) Train Loss: 6.4108, Train Steps/Sec: 0.72
|
| 700 |
+
[[34m2025-03-21 02:39:19[0m] (step=0016275) Train Loss: 6.4060, Train Steps/Sec: 0.72
|
| 701 |
+
[[34m2025-03-21 02:39:54[0m] (step=0016300) Train Loss: 6.4109, Train Steps/Sec: 0.72
|
| 702 |
+
[[34m2025-03-21 02:40:29[0m] (step=0016325) Train Loss: 6.4012, Train Steps/Sec: 0.72
|
| 703 |
+
[[34m2025-03-21 02:41:04[0m] (step=0016350) Train Loss: 6.4064, Train Steps/Sec: 0.72
|
| 704 |
+
[[34m2025-03-21 02:41:39[0m] (step=0016375) Train Loss: 6.4000, Train Steps/Sec: 0.72
|
| 705 |
+
[[34m2025-03-21 02:42:14[0m] (step=0016400) Train Loss: 6.4227, Train Steps/Sec: 0.72
|
| 706 |
+
[[34m2025-03-21 02:42:49[0m] (step=0016425) Train Loss: 6.3825, Train Steps/Sec: 0.72
|
| 707 |
+
[[34m2025-03-21 02:43:24[0m] (step=0016450) Train Loss: 6.4030, Train Steps/Sec: 0.72
|
| 708 |
+
[[34m2025-03-21 02:44:00[0m] (step=0016475) Train Loss: 6.3910, Train Steps/Sec: 0.69
|
| 709 |
+
[[34m2025-03-21 02:44:35[0m] (step=0016500) Train Loss: 6.3763, Train Steps/Sec: 0.72
|
| 710 |
+
[[34m2025-03-21 02:45:10[0m] (step=0016525) Train Loss: 6.4024, Train Steps/Sec: 0.72
|
| 711 |
+
[[34m2025-03-21 02:45:46[0m] (step=0016550) Train Loss: 6.4089, Train Steps/Sec: 0.69
|
| 712 |
+
[[34m2025-03-21 02:46:21[0m] (step=0016575) Train Loss: 6.4139, Train Steps/Sec: 0.72
|
| 713 |
+
[[34m2025-03-21 02:46:56[0m] (step=0016600) Train Loss: 6.4163, Train Steps/Sec: 0.72
|
| 714 |
+
[[34m2025-03-21 02:47:31[0m] (step=0016625) Train Loss: 6.3837, Train Steps/Sec: 0.72
|
| 715 |
+
[[34m2025-03-21 02:48:06[0m] (step=0016650) Train Loss: 6.4170, Train Steps/Sec: 0.72
|
| 716 |
+
[[34m2025-03-21 02:48:41[0m] (step=0016675) Train Loss: 6.3712, Train Steps/Sec: 0.72
|
| 717 |
+
[[34m2025-03-21 02:49:16[0m] (step=0016700) Train Loss: 6.4108, Train Steps/Sec: 0.71
|
| 718 |
+
[[34m2025-03-21 02:49:51[0m] (step=0016725) Train Loss: 6.3803, Train Steps/Sec: 0.72
|
| 719 |
+
[[34m2025-03-21 02:50:26[0m] (step=0016750) Train Loss: 6.4143, Train Steps/Sec: 0.71
|
| 720 |
+
[[34m2025-03-21 02:51:01[0m] (step=0016775) Train Loss: 6.4358, Train Steps/Sec: 0.72
|
| 721 |
+
[[34m2025-03-21 02:51:36[0m] (step=0016800) Train Loss: 6.3983, Train Steps/Sec: 0.72
|
| 722 |
+
[[34m2025-03-21 02:52:10[0m] (step=0016825) Train Loss: 6.4065, Train Steps/Sec: 0.72
|
| 723 |
+
[[34m2025-03-21 02:52:45[0m] (step=0016850) Train Loss: 6.3846, Train Steps/Sec: 0.72
|
| 724 |
+
[[34m2025-03-21 02:53:21[0m] (step=0016875) Train Loss: 6.4014, Train Steps/Sec: 0.70
|
| 725 |
+
[[34m2025-03-21 02:53:56[0m] (step=0016900) Train Loss: 6.4214, Train Steps/Sec: 0.72
|
| 726 |
+
[[34m2025-03-21 02:54:31[0m] (step=0016925) Train Loss: 6.4083, Train Steps/Sec: 0.72
|
| 727 |
+
[[34m2025-03-21 02:55:06[0m] (step=0016950) Train Loss: 6.3926, Train Steps/Sec: 0.72
|
| 728 |
+
[[34m2025-03-21 02:55:41[0m] (step=0016975) Train Loss: 6.3975, Train Steps/Sec: 0.72
|
| 729 |
+
[[34m2025-03-21 02:56:17[0m] (step=0017000) Train Loss: 6.4116, Train Steps/Sec: 0.70
|
| 730 |
+
[[34m2025-03-21 02:56:52[0m] (step=0017025) Train Loss: 6.3906, Train Steps/Sec: 0.72
|
| 731 |
+
[[34m2025-03-21 02:57:27[0m] (step=0017050) Train Loss: 6.3962, Train Steps/Sec: 0.72
|
| 732 |
+
[[34m2025-03-21 02:58:02[0m] (step=0017075) Train Loss: 6.4329, Train Steps/Sec: 0.72
|
| 733 |
+
[[34m2025-03-21 02:58:37[0m] (step=0017100) Train Loss: 6.4167, Train Steps/Sec: 0.72
|
| 734 |
+
[[34m2025-03-21 02:59:12[0m] (step=0017125) Train Loss: 6.3977, Train Steps/Sec: 0.72
|
| 735 |
+
[[34m2025-03-21 02:59:46[0m] (step=0017150) Train Loss: 6.4517, Train Steps/Sec: 0.72
|
| 736 |
+
[[34m2025-03-21 03:00:21[0m] (step=0017175) Train Loss: 6.3703, Train Steps/Sec: 0.72
|
| 737 |
+
[[34m2025-03-21 03:00:56[0m] (step=0017200) Train Loss: 6.3639, Train Steps/Sec: 0.72
|
| 738 |
+
[[34m2025-03-21 03:01:31[0m] (step=0017225) Train Loss: 6.4230, Train Steps/Sec: 0.72
|
| 739 |
+
[[34m2025-03-21 03:02:06[0m] (step=0017250) Train Loss: 6.4003, Train Steps/Sec: 0.71
|
| 740 |
+
[[34m2025-03-21 03:02:41[0m] (step=0017275) Train Loss: 6.4083, Train Steps/Sec: 0.72
|
| 741 |
+
[[34m2025-03-21 03:03:16[0m] (step=0017300) Train Loss: 6.3798, Train Steps/Sec: 0.72
|
| 742 |
+
[[34m2025-03-21 03:03:51[0m] (step=0017325) Train Loss: 6.3934, Train Steps/Sec: 0.71
|
| 743 |
+
[[34m2025-03-21 03:04:26[0m] (step=0017350) Train Loss: 6.4107, Train Steps/Sec: 0.71
|
| 744 |
+
[[34m2025-03-21 03:05:01[0m] (step=0017375) Train Loss: 6.4141, Train Steps/Sec: 0.71
|
| 745 |
+
[[34m2025-03-21 03:05:36[0m] (step=0017400) Train Loss: 6.4003, Train Steps/Sec: 0.72
|
| 746 |
+
[[34m2025-03-21 03:06:11[0m] (step=0017425) Train Loss: 6.4294, Train Steps/Sec: 0.72
|
| 747 |
+
[[34m2025-03-21 03:06:46[0m] (step=0017450) Train Loss: 6.3935, Train Steps/Sec: 0.72
|
| 748 |
+
[[34m2025-03-21 03:07:21[0m] (step=0017475) Train Loss: 6.4156, Train Steps/Sec: 0.72
|
| 749 |
+
[[34m2025-03-21 03:07:56[0m] (step=0017500) Train Loss: 6.3934, Train Steps/Sec: 0.71
|
| 750 |
+
[[34m2025-03-21 03:08:31[0m] (step=0017525) Train Loss: 6.4336, Train Steps/Sec: 0.72
|
| 751 |
+
[[34m2025-03-21 03:09:06[0m] (step=0017550) Train Loss: 6.3892, Train Steps/Sec: 0.72
|
| 752 |
+
[[34m2025-03-21 03:09:41[0m] (step=0017575) Train Loss: 6.4126, Train Steps/Sec: 0.72
|
| 753 |
+
[[34m2025-03-21 03:10:16[0m] (step=0017600) Train Loss: 6.4017, Train Steps/Sec: 0.72
|
| 754 |
+
[[34m2025-03-21 03:10:50[0m] (step=0017625) Train Loss: 6.3921, Train Steps/Sec: 0.72
|
| 755 |
+
[[34m2025-03-21 03:11:25[0m] (step=0017650) Train Loss: 6.4238, Train Steps/Sec: 0.72
|
| 756 |
+
[[34m2025-03-21 03:12:00[0m] (step=0017675) Train Loss: 6.4161, Train Steps/Sec: 0.72
|
| 757 |
+
[[34m2025-03-21 03:12:35[0m] (step=0017700) Train Loss: 6.4139, Train Steps/Sec: 0.72
|
| 758 |
+
[[34m2025-03-21 03:13:11[0m] (step=0017725) Train Loss: 6.4032, Train Steps/Sec: 0.69
|
| 759 |
+
[[34m2025-03-21 03:13:46[0m] (step=0017750) Train Loss: 6.4099, Train Steps/Sec: 0.72
|
| 760 |
+
[[34m2025-03-21 03:14:21[0m] (step=0017775) Train Loss: 6.4100, Train Steps/Sec: 0.72
|
| 761 |
+
[[34m2025-03-21 03:14:56[0m] (step=0017800) Train Loss: 6.4039, Train Steps/Sec: 0.72
|
| 762 |
+
[[34m2025-03-21 03:15:31[0m] (step=0017825) Train Loss: 6.4030, Train Steps/Sec: 0.72
|
| 763 |
+
[[34m2025-03-21 03:16:06[0m] (step=0017850) Train Loss: 6.3493, Train Steps/Sec: 0.72
|
| 764 |
+
[[34m2025-03-21 03:16:41[0m] (step=0017875) Train Loss: 6.4039, Train Steps/Sec: 0.72
|
| 765 |
+
[[34m2025-03-21 03:17:17[0m] (step=0017900) Train Loss: 6.4165, Train Steps/Sec: 0.69
|
| 766 |
+
[[34m2025-03-21 03:17:52[0m] (step=0017925) Train Loss: 6.3951, Train Steps/Sec: 0.72
|
| 767 |
+
[[34m2025-03-21 03:18:27[0m] (step=0017950) Train Loss: 6.3934, Train Steps/Sec: 0.72
|
| 768 |
+
[[34m2025-03-21 03:19:02[0m] (step=0017975) Train Loss: 6.4046, Train Steps/Sec: 0.72
|
| 769 |
+
[[34m2025-03-21 03:19:37[0m] (step=0018000) Train Loss: 6.3949, Train Steps/Sec: 0.72
|
| 770 |
+
[[34m2025-03-21 03:19:37[0m] text_config is None. Initializing the text config with default values (`OPTConfig`).
|
| 771 |
+
[[34m2025-03-21 03:25:39[0m] Finish Eval in 18000 steps...
|
| 772 |
+
[[34m2025-03-21 03:25:46[0m] Saved checkpoint to checkpoints/TWO_node_llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_noimageonly_newfix_train_all/014-GPT-XL/checkpoints/0018000.pt
|
| 773 |
+
[[34m2025-03-21 03:25:46[0m] Removed old checkpoint: checkpoints/TWO_node_llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_noimageonly_newfix_train_all/014-GPT-XL/checkpoints/0016000.pt
|
| 774 |
+
[[34m2025-03-21 03:26:21[0m] (step=0018025) Train Loss: 6.3912, Train Steps/Sec: 0.06
|
| 775 |
+
[[34m2025-03-21 03:26:56[0m] (step=0018050) Train Loss: 6.4059, Train Steps/Sec: 0.71
|
| 776 |
+
[[34m2025-03-21 03:27:31[0m] (step=0018075) Train Loss: 6.3700, Train Steps/Sec: 0.72
|
| 777 |
+
[[34m2025-03-21 03:28:06[0m] (step=0018100) Train Loss: 6.4192, Train Steps/Sec: 0.72
|
| 778 |
+
[[34m2025-03-21 03:28:41[0m] (step=0018125) Train Loss: 6.3878, Train Steps/Sec: 0.72
|
| 779 |
+
[[34m2025-03-21 03:29:16[0m] (step=0018150) Train Loss: 6.4107, Train Steps/Sec: 0.72
|
| 780 |
+
[[34m2025-03-21 03:29:51[0m] (step=0018175) Train Loss: 6.4124, Train Steps/Sec: 0.72
|
| 781 |
+
[[34m2025-03-21 03:30:26[0m] (step=0018200) Train Loss: 6.4219, Train Steps/Sec: 0.72
|
| 782 |
+
[[34m2025-03-21 03:31:01[0m] (step=0018225) Train Loss: 6.4332, Train Steps/Sec: 0.72
|
| 783 |
+
[[34m2025-03-21 03:31:36[0m] (step=0018250) Train Loss: 6.4196, Train Steps/Sec: 0.72
|
| 784 |
+
[[34m2025-03-21 03:32:11[0m] (step=0018275) Train Loss: 6.3855, Train Steps/Sec: 0.72
|
| 785 |
+
[[34m2025-03-21 03:32:46[0m] (step=0018300) Train Loss: 6.4043, Train Steps/Sec: 0.72
|
| 786 |
+
[[34m2025-03-21 03:33:21[0m] (step=0018325) Train Loss: 6.4057, Train Steps/Sec: 0.72
|
| 787 |
+
[[34m2025-03-21 03:33:56[0m] (step=0018350) Train Loss: 6.3901, Train Steps/Sec: 0.72
|
| 788 |
+
[[34m2025-03-21 03:34:32[0m] (step=0018375) Train Loss: 6.4202, Train Steps/Sec: 0.69
|
| 789 |
+
[[34m2025-03-21 03:35:07[0m] (step=0018400) Train Loss: 6.3991, Train Steps/Sec: 0.72
|
| 790 |
+
[[34m2025-03-21 03:35:42[0m] (step=0018425) Train Loss: 6.4214, Train Steps/Sec: 0.71
|
| 791 |
+
[[34m2025-03-21 03:36:17[0m] (step=0018450) Train Loss: 6.4188, Train Steps/Sec: 0.71
|
| 792 |
+
[[34m2025-03-21 03:36:52[0m] (step=0018475) Train Loss: 6.4130, Train Steps/Sec: 0.71
|
| 793 |
+
[[34m2025-03-21 03:37:27[0m] (step=0018500) Train Loss: 6.4083, Train Steps/Sec: 0.72
|
| 794 |
+
[[34m2025-03-21 03:38:02[0m] (step=0018525) Train Loss: 6.4400, Train Steps/Sec: 0.72
|
| 795 |
+
[[34m2025-03-21 03:38:37[0m] (step=0018550) Train Loss: 6.3966, Train Steps/Sec: 0.72
|
| 796 |
+
[[34m2025-03-21 03:39:12[0m] (step=0018575) Train Loss: 6.3819, Train Steps/Sec: 0.72
|
| 797 |
+
[[34m2025-03-21 03:39:48[0m] (step=0018600) Train Loss: 6.4222, Train Steps/Sec: 0.69
|
| 798 |
+
[[34m2025-03-21 03:40:23[0m] (step=0018625) Train Loss: 6.4152, Train Steps/Sec: 0.72
|
| 799 |
+
[[34m2025-03-21 03:40:58[0m] (step=0018650) Train Loss: 6.3751, Train Steps/Sec: 0.72
|
| 800 |
+
[[34m2025-03-21 03:41:33[0m] (step=0018675) Train Loss: 6.4011, Train Steps/Sec: 0.72
|
| 801 |
+
[[34m2025-03-21 03:42:07[0m] (step=0018700) Train Loss: 6.3712, Train Steps/Sec: 0.72
|
| 802 |
+
[[34m2025-03-21 03:42:42[0m] (step=0018725) Train Loss: 6.3887, Train Steps/Sec: 0.72
|
| 803 |
+
[[34m2025-03-21 03:43:18[0m] (step=0018750) Train Loss: 6.3734, Train Steps/Sec: 0.70
|
| 804 |
+
[[34m2025-03-21 03:43:54[0m] (step=0018775) Train Loss: 6.3804, Train Steps/Sec: 0.70
|
| 805 |
+
[[34m2025-03-21 03:44:29[0m] (step=0018800) Train Loss: 6.4244, Train Steps/Sec: 0.72
|
| 806 |
+
[[34m2025-03-21 03:45:04[0m] (step=0018825) Train Loss: 6.4183, Train Steps/Sec: 0.72
|
| 807 |
+
[[34m2025-03-21 03:45:39[0m] (step=0018850) Train Loss: 6.3970, Train Steps/Sec: 0.72
|
| 808 |
+
[[34m2025-03-21 03:46:15[0m] (step=0018875) Train Loss: 6.3978, Train Steps/Sec: 0.70
|
| 809 |
+
[[34m2025-03-21 03:46:50[0m] (step=0018900) Train Loss: 6.4064, Train Steps/Sec: 0.72
|
| 810 |
+
[[34m2025-03-21 03:47:25[0m] (step=0018925) Train Loss: 6.4034, Train Steps/Sec: 0.71
|
| 811 |
+
[[34m2025-03-21 03:48:00[0m] (step=0018950) Train Loss: 6.4112, Train Steps/Sec: 0.72
|
| 812 |
+
[[34m2025-03-21 03:48:35[0m] (step=0018975) Train Loss: 6.3946, Train Steps/Sec: 0.72
|
| 813 |
+
[[34m2025-03-21 03:49:10[0m] (step=0019000) Train Loss: 6.3969, Train Steps/Sec: 0.72
|
| 814 |
+
[[34m2025-03-21 03:49:46[0m] (step=0019025) Train Loss: 6.4109, Train Steps/Sec: 0.69
|
| 815 |
+
[[34m2025-03-21 03:50:21[0m] (step=0019050) Train Loss: 6.4117, Train Steps/Sec: 0.72
|
| 816 |
+
[[34m2025-03-21 03:50:56[0m] (step=0019075) Train Loss: 6.4210, Train Steps/Sec: 0.72
|
| 817 |
+
[[34m2025-03-21 03:51:30[0m] (step=0019100) Train Loss: 6.3980, Train Steps/Sec: 0.72
|
| 818 |
+
[[34m2025-03-21 03:52:05[0m] (step=0019125) Train Loss: 6.4104, Train Steps/Sec: 0.72
|
| 819 |
+
[[34m2025-03-21 03:52:40[0m] (step=0019150) Train Loss: 6.4225, Train Steps/Sec: 0.72
|
| 820 |
+
[[34m2025-03-21 03:53:15[0m] (step=0019175) Train Loss: 6.4190, Train Steps/Sec: 0.72
|
| 821 |
+
[[34m2025-03-21 03:53:50[0m] (step=0019200) Train Loss: 6.3875, Train Steps/Sec: 0.72
|
| 822 |
+
[[34m2025-03-21 03:54:25[0m] (step=0019225) Train Loss: 6.3486, Train Steps/Sec: 0.72
|
| 823 |
+
[[34m2025-03-21 03:55:00[0m] (step=0019250) Train Loss: 6.4044, Train Steps/Sec: 0.72
|
| 824 |
+
[[34m2025-03-21 03:55:35[0m] (step=0019275) Train Loss: 6.3887, Train Steps/Sec: 0.72
|
| 825 |
+
[[34m2025-03-21 03:56:10[0m] (step=0019300) Train Loss: 6.3902, Train Steps/Sec: 0.72
|
| 826 |
+
[[34m2025-03-21 03:56:45[0m] (step=0019325) Train Loss: 6.3945, Train Steps/Sec: 0.72
|
| 827 |
+
[[34m2025-03-21 03:57:20[0m] (step=0019350) Train Loss: 6.3907, Train Steps/Sec: 0.72
|
| 828 |
+
[[34m2025-03-21 03:57:55[0m] (step=0019375) Train Loss: 6.3920, Train Steps/Sec: 0.72
|
| 829 |
+
[[34m2025-03-21 03:58:30[0m] (step=0019400) Train Loss: 6.3783, Train Steps/Sec: 0.72
|
| 830 |
+
[[34m2025-03-21 03:59:05[0m] (step=0019425) Train Loss: 6.4094, Train Steps/Sec: 0.72
|
| 831 |
+
[[34m2025-03-21 03:59:40[0m] (step=0019450) Train Loss: 6.3843, Train Steps/Sec: 0.72
|
| 832 |
+
[[34m2025-03-21 04:00:15[0m] (step=0019475) Train Loss: 6.3943, Train Steps/Sec: 0.72
|
| 833 |
+
[[34m2025-03-21 04:00:49[0m] (step=0019500) Train Loss: 6.3949, Train Steps/Sec: 0.72
|
| 834 |
+
[[34m2025-03-21 04:01:24[0m] (step=0019525) Train Loss: 6.3919, Train Steps/Sec: 0.72
|
| 835 |
+
[[34m2025-03-21 04:01:59[0m] (step=0019550) Train Loss: 6.4067, Train Steps/Sec: 0.72
|
| 836 |
+
[[34m2025-03-21 04:02:34[0m] (step=0019575) Train Loss: 6.4200, Train Steps/Sec: 0.72
|
| 837 |
+
[[34m2025-03-21 04:03:09[0m] (step=0019600) Train Loss: 6.4007, Train Steps/Sec: 0.72
|
| 838 |
+
[[34m2025-03-21 04:03:44[0m] (step=0019625) Train Loss: 6.3963, Train Steps/Sec: 0.72
|
| 839 |
+
[[34m2025-03-21 04:04:19[0m] (step=0019650) Train Loss: 6.4086, Train Steps/Sec: 0.72
|
| 840 |
+
[[34m2025-03-21 04:04:54[0m] (step=0019675) Train Loss: 6.4067, Train Steps/Sec: 0.72
|
| 841 |
+
[[34m2025-03-21 04:05:29[0m] (step=0019700) Train Loss: 6.3943, Train Steps/Sec: 0.72
|
| 842 |
+
[[34m2025-03-21 04:06:05[0m] (step=0019725) Train Loss: 6.3729, Train Steps/Sec: 0.69
|
| 843 |
+
[[34m2025-03-21 04:06:40[0m] (step=0019750) Train Loss: 6.4144, Train Steps/Sec: 0.72
|
| 844 |
+
[[34m2025-03-21 04:07:15[0m] (step=0019775) Train Loss: 6.3864, Train Steps/Sec: 0.72
|
| 845 |
+
[[34m2025-03-21 04:07:50[0m] (step=0019800) Train Loss: 6.4070, Train Steps/Sec: 0.72
|
| 846 |
+
[[34m2025-03-21 04:08:25[0m] (step=0019825) Train Loss: 6.3688, Train Steps/Sec: 0.72
|
| 847 |
+
[[34m2025-03-21 04:09:00[0m] (step=0019850) Train Loss: 6.3642, Train Steps/Sec: 0.72
|
| 848 |
+
[[34m2025-03-21 04:09:35[0m] (step=0019875) Train Loss: 6.3811, Train Steps/Sec: 0.72
|
| 849 |
+
[[34m2025-03-21 04:10:10[0m] (step=0019900) Train Loss: 6.4052, Train Steps/Sec: 0.72
|
| 850 |
+
[[34m2025-03-21 04:10:45[0m] (step=0019925) Train Loss: 6.3972, Train Steps/Sec: 0.72
|
| 851 |
+
[[34m2025-03-21 04:11:20[0m] (step=0019950) Train Loss: 6.3985, Train Steps/Sec: 0.71
|
| 852 |
+
[[34m2025-03-21 04:11:54[0m] (step=0019975) Train Loss: 6.4144, Train Steps/Sec: 0.71
|
| 853 |
+
[[34m2025-03-21 04:12:29[0m] (step=0020000) Train Loss: 6.3964, Train Steps/Sec: 0.72
|
| 854 |
+
[[34m2025-03-21 04:12:29[0m] text_config is None. Initializing the text config with default values (`OPTConfig`).
|
| 855 |
+
[[34m2025-03-21 04:18:32[0m] Finish Eval in 20000 steps...
|
| 856 |
+
[[34m2025-03-21 04:18:39[0m] Saved checkpoint to checkpoints/TWO_node_llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_noimageonly_newfix_train_all/014-GPT-XL/checkpoints/0020000.pt
|
| 857 |
+
[[34m2025-03-21 04:18:39[0m] Removed old checkpoint: checkpoints/TWO_node_llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_noimageonly_newfix_train_all/014-GPT-XL/checkpoints/0018000.pt
|
| 858 |
+
[[34m2025-03-21 04:19:14[0m] (step=0020025) Train Loss: 6.4165, Train Steps/Sec: 0.06
|
| 859 |
+
[[34m2025-03-21 04:19:49[0m] (step=0020050) Train Loss: 6.4194, Train Steps/Sec: 0.72
|
| 860 |
+
[[34m2025-03-21 04:20:24[0m] (step=0020075) Train Loss: 6.3818, Train Steps/Sec: 0.72
|
| 861 |
+
[[34m2025-03-21 04:20:59[0m] (step=0020100) Train Loss: 6.4276, Train Steps/Sec: 0.72
|
| 862 |
+
[[34m2025-03-21 04:21:34[0m] (step=0020125) Train Loss: 6.4217, Train Steps/Sec: 0.72
|
| 863 |
+
[[34m2025-03-21 04:22:09[0m] (step=0020150) Train Loss: 6.4100, Train Steps/Sec: 0.72
|
| 864 |
+
[[34m2025-03-21 04:22:44[0m] (step=0020175) Train Loss: 6.4028, Train Steps/Sec: 0.72
|
| 865 |
+
[[34m2025-03-21 04:23:19[0m] (step=0020200) Train Loss: 6.4108, Train Steps/Sec: 0.72
|
| 866 |
+
[[34m2025-03-21 04:23:54[0m] (step=0020225) Train Loss: 6.3864, Train Steps/Sec: 0.72
|
| 867 |
+
[[34m2025-03-21 04:24:29[0m] (step=0020250) Train Loss: 6.3886, Train Steps/Sec: 0.71
|
| 868 |
+
[[34m2025-03-21 04:25:04[0m] (step=0020275) Train Loss: 6.4142, Train Steps/Sec: 0.72
|
| 869 |
+
[[34m2025-03-21 04:25:39[0m] (step=0020300) Train Loss: 6.3951, Train Steps/Sec: 0.72
|
| 870 |
+
[[34m2025-03-21 04:26:14[0m] (step=0020325) Train Loss: 6.3855, Train Steps/Sec: 0.72
|
| 871 |
+
[[34m2025-03-21 04:26:48[0m] (step=0020350) Train Loss: 6.3803, Train Steps/Sec: 0.72
|
| 872 |
+
[[34m2025-03-21 04:27:23[0m] (step=0020375) Train Loss: 6.3810, Train Steps/Sec: 0.72
|
| 873 |
+
[[34m2025-03-21 04:27:58[0m] (step=0020400) Train Loss: 6.3824, Train Steps/Sec: 0.72
|
| 874 |
+
[[34m2025-03-21 04:28:33[0m] (step=0020425) Train Loss: 6.3963, Train Steps/Sec: 0.72
|
| 875 |
+
[[34m2025-03-21 04:29:10[0m] (step=0020450) Train Loss: 6.3914, Train Steps/Sec: 0.69
|
| 876 |
+
[[34m2025-03-21 04:29:44[0m] (step=0020475) Train Loss: 6.4009, Train Steps/Sec: 0.72
|
| 877 |
+
[[34m2025-03-21 04:30:19[0m] (step=0020500) Train Loss: 6.3977, Train Steps/Sec: 0.72
|
| 878 |
+
[[34m2025-03-21 04:30:55[0m] (step=0020525) Train Loss: 6.3947, Train Steps/Sec: 0.69
|
| 879 |
+
[[34m2025-03-21 04:31:30[0m] (step=0020550) Train Loss: 6.3958, Train Steps/Sec: 0.72
|
| 880 |
+
[[34m2025-03-21 04:32:05[0m] (step=0020575) Train Loss: 6.3645, Train Steps/Sec: 0.72
|
| 881 |
+
[[34m2025-03-21 04:32:41[0m] (step=0020600) Train Loss: 6.4031, Train Steps/Sec: 0.69
|
| 882 |
+
[[34m2025-03-21 04:33:16[0m] (step=0020625) Train Loss: 6.3919, Train Steps/Sec: 0.72
|
| 883 |
+
[[34m2025-03-21 04:33:51[0m] (step=0020650) Train Loss: 6.3619, Train Steps/Sec: 0.72
|
| 884 |
+
[[34m2025-03-21 04:34:26[0m] (step=0020675) Train Loss: 6.4173, Train Steps/Sec: 0.72
|
| 885 |
+
[[34m2025-03-21 04:35:01[0m] (step=0020700) Train Loss: 6.3527, Train Steps/Sec: 0.72
|
| 886 |
+
[[34m2025-03-21 04:35:37[0m] (step=0020725) Train Loss: 6.4168, Train Steps/Sec: 0.70
|
| 887 |
+
[[34m2025-03-21 04:36:12[0m] (step=0020750) Train Loss: 6.3854, Train Steps/Sec: 0.72
|
| 888 |
+
[[34m2025-03-21 04:36:47[0m] (step=0020775) Train Loss: 6.4020, Train Steps/Sec: 0.72
|
| 889 |
+
[[34m2025-03-21 04:37:22[0m] (step=0020800) Train Loss: 6.3876, Train Steps/Sec: 0.72
|
| 890 |
+
[[34m2025-03-21 04:37:57[0m] (step=0020825) Train Loss: 6.4004, Train Steps/Sec: 0.72
|
| 891 |
+
[[34m2025-03-21 04:38:32[0m] (step=0020850) Train Loss: 6.4154, Train Steps/Sec: 0.72
|
| 892 |
+
[[34m2025-03-21 04:39:07[0m] (step=0020875) Train Loss: 6.3917, Train Steps/Sec: 0.71
|
| 893 |
+
[[34m2025-03-21 04:39:42[0m] (step=0020900) Train Loss: 6.3794, Train Steps/Sec: 0.72
|
| 894 |
+
[[34m2025-03-21 04:40:18[0m] (step=0020925) Train Loss: 6.3892, Train Steps/Sec: 0.70
|
| 895 |
+
[[34m2025-03-21 04:40:52[0m] (step=0020950) Train Loss: 6.4117, Train Steps/Sec: 0.72
|
| 896 |
+
[[34m2025-03-21 04:41:27[0m] (step=0020975) Train Loss: 6.4204, Train Steps/Sec: 0.72
|
| 897 |
+
[[34m2025-03-21 04:42:02[0m] (step=0021000) Train Loss: 6.3726, Train Steps/Sec: 0.72
|
| 898 |
+
[[34m2025-03-21 04:42:37[0m] (step=0021025) Train Loss: 6.3634, Train Steps/Sec: 0.72
|
| 899 |
+
[[34m2025-03-21 04:43:12[0m] (step=0021050) Train Loss: 6.3828, Train Steps/Sec: 0.72
|
| 900 |
+
[[34m2025-03-21 04:43:47[0m] (step=0021075) Train Loss: 6.3750, Train Steps/Sec: 0.72
|
| 901 |
+
[[34m2025-03-21 04:44:22[0m] (step=0021100) Train Loss: 6.3752, Train Steps/Sec: 0.72
|
| 902 |
+
[[34m2025-03-21 04:44:57[0m] (step=0021125) Train Loss: 6.4041, Train Steps/Sec: 0.72
|
| 903 |
+
[[34m2025-03-21 04:45:32[0m] (step=0021150) Train Loss: 6.3967, Train Steps/Sec: 0.72
|
| 904 |
+
[[34m2025-03-21 04:46:07[0m] (step=0021175) Train Loss: 6.4078, Train Steps/Sec: 0.72
|
| 905 |
+
[[34m2025-03-21 04:46:42[0m] (step=0021200) Train Loss: 6.3958, Train Steps/Sec: 0.72
|
| 906 |
+
[[34m2025-03-21 04:47:17[0m] (step=0021225) Train Loss: 6.3923, Train Steps/Sec: 0.72
|
| 907 |
+
[[34m2025-03-21 04:47:52[0m] (step=0021250) Train Loss: 6.4356, Train Steps/Sec: 0.72
|
| 908 |
+
[[34m2025-03-21 04:48:27[0m] (step=0021275) Train Loss: 6.3805, Train Steps/Sec: 0.72
|
| 909 |
+
[[34m2025-03-21 04:49:01[0m] (step=0021300) Train Loss: 6.3991, Train Steps/Sec: 0.72
|
| 910 |
+
[[34m2025-03-21 04:49:36[0m] (step=0021325) Train Loss: 6.3986, Train Steps/Sec: 0.72
|
| 911 |
+
[[34m2025-03-21 04:50:11[0m] (step=0021350) Train Loss: 6.3888, Train Steps/Sec: 0.72
|
| 912 |
+
[[34m2025-03-21 04:50:47[0m] (step=0021375) Train Loss: 6.4120, Train Steps/Sec: 0.70
|
| 913 |
+
[[34m2025-03-21 04:51:22[0m] (step=0021400) Train Loss: 6.3959, Train Steps/Sec: 0.72
|
| 914 |
+
[[34m2025-03-21 04:51:57[0m] (step=0021425) Train Loss: 6.3914, Train Steps/Sec: 0.72
|
| 915 |
+
[[34m2025-03-21 04:52:32[0m] (step=0021450) Train Loss: 6.4115, Train Steps/Sec: 0.72
|
| 916 |
+
[[34m2025-03-21 04:53:07[0m] (step=0021475) Train Loss: 6.3913, Train Steps/Sec: 0.72
|
| 917 |
+
[[34m2025-03-21 04:53:42[0m] (step=0021500) Train Loss: 6.3491, Train Steps/Sec: 0.72
|
| 918 |
+
[[34m2025-03-21 04:54:17[0m] (step=0021525) Train Loss: 6.3882, Train Steps/Sec: 0.72
|
| 919 |
+
[[34m2025-03-21 04:54:52[0m] (step=0021550) Train Loss: 6.3860, Train Steps/Sec: 0.72
|
| 920 |
+
[[34m2025-03-21 04:55:27[0m] (step=0021575) Train Loss: 6.3636, Train Steps/Sec: 0.72
|
| 921 |
+
[[34m2025-03-21 04:56:02[0m] (step=0021600) Train Loss: 6.3732, Train Steps/Sec: 0.72
|
| 922 |
+
[[34m2025-03-21 04:56:36[0m] (step=0021625) Train Loss: 6.3762, Train Steps/Sec: 0.72
|
| 923 |
+
[[34m2025-03-21 04:57:11[0m] (step=0021650) Train Loss: 6.3944, Train Steps/Sec: 0.72
|
| 924 |
+
[[34m2025-03-21 04:57:46[0m] (step=0021675) Train Loss: 6.4159, Train Steps/Sec: 0.72
|
| 925 |
+
[[34m2025-03-21 04:58:21[0m] (step=0021700) Train Loss: 6.4051, Train Steps/Sec: 0.71
|
| 926 |
+
[[34m2025-03-21 04:58:57[0m] (step=0021725) Train Loss: 6.3964, Train Steps/Sec: 0.69
|
| 927 |
+
[[34m2025-03-21 04:59:32[0m] (step=0021750) Train Loss: 6.3787, Train Steps/Sec: 0.72
|
| 928 |
+
[[34m2025-03-21 05:00:07[0m] (step=0021775) Train Loss: 6.3998, Train Steps/Sec: 0.72
|
| 929 |
+
[[34m2025-03-21 05:00:43[0m] (step=0021800) Train Loss: 6.3657, Train Steps/Sec: 0.70
|
| 930 |
+
[[34m2025-03-21 05:01:18[0m] (step=0021825) Train Loss: 6.3779, Train Steps/Sec: 0.72
|
| 931 |
+
[[34m2025-03-21 05:01:53[0m] (step=0021850) Train Loss: 6.3952, Train Steps/Sec: 0.72
|
| 932 |
+
[[34m2025-03-21 05:02:28[0m] (step=0021875) Train Loss: 6.3746, Train Steps/Sec: 0.72
|
| 933 |
+
[[34m2025-03-21 05:03:03[0m] (step=0021900) Train Loss: 6.3982, Train Steps/Sec: 0.72
|
| 934 |
+
[[34m2025-03-21 05:03:38[0m] (step=0021925) Train Loss: 6.4067, Train Steps/Sec: 0.72
|
| 935 |
+
[[34m2025-03-21 05:04:13[0m] (step=0021950) Train Loss: 6.4048, Train Steps/Sec: 0.72
|
| 936 |
+
[[34m2025-03-21 05:04:48[0m] (step=0021975) Train Loss: 6.3832, Train Steps/Sec: 0.72
|
| 937 |
+
[[34m2025-03-21 05:05:23[0m] (step=0022000) Train Loss: 6.4023, Train Steps/Sec: 0.72
|
| 938 |
+
[[34m2025-03-21 05:05:23[0m] text_config is None. Initializing the text config with default values (`OPTConfig`).
|
| 939 |
+
[[34m2025-03-21 05:11:26[0m] Finish Eval in 22000 steps...
|
| 940 |
+
[[34m2025-03-21 05:11:33[0m] Saved checkpoint to checkpoints/TWO_node_llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_noimageonly_newfix_train_all/014-GPT-XL/checkpoints/0022000.pt
|
| 941 |
+
[[34m2025-03-21 05:11:34[0m] Removed old checkpoint: checkpoints/TWO_node_llavat5_subject_train_all_T5_subject_t2i_ti2i_120_w_flux_segment_noimageonly_newfix_train_all/014-GPT-XL/checkpoints/0020000.pt
|
| 942 |
+
[[34m2025-03-21 05:12:09[0m] (step=0022025) Train Loss: 6.3806, Train Steps/Sec: 0.06
|
| 943 |
+
[[34m2025-03-21 05:12:44[0m] (step=0022050) Train Loss: 6.3704, Train Steps/Sec: 0.71
|
| 944 |
+
[[34m2025-03-21 05:13:19[0m] (step=0022075) Train Loss: 6.4170, Train Steps/Sec: 0.72
|
| 945 |
+
[[34m2025-03-21 05:13:53[0m] (step=0022100) Train Loss: 6.3608, Train Steps/Sec: 0.72
|
| 946 |
+
[[34m2025-03-21 05:14:28[0m] (step=0022125) Train Loss: 6.4188, Train Steps/Sec: 0.72
|
| 947 |
+
[[34m2025-03-21 05:15:03[0m] (step=0022150) Train Loss: 6.3739, Train Steps/Sec: 0.72
|
| 948 |
+
[[34m2025-03-21 05:15:38[0m] (step=0022175) Train Loss: 6.3662, Train Steps/Sec: 0.72
|
| 949 |
+
[[34m2025-03-21 05:16:13[0m] (step=0022200) Train Loss: 6.3937, Train Steps/Sec: 0.72
|
| 950 |
+
[[34m2025-03-21 05:16:48[0m] (step=0022225) Train Loss: 6.3978, Train Steps/Sec: 0.72
|
| 951 |
+
[[34m2025-03-21 05:17:23[0m] (step=0022250) Train Loss: 6.3815, Train Steps/Sec: 0.72
|
| 952 |
+
[[34m2025-03-21 05:17:58[0m] (step=0022275) Train Loss: 6.3691, Train Steps/Sec: 0.72
|
| 953 |
+
[[34m2025-03-21 05:18:33[0m] (step=0022300) Train Loss: 6.3940, Train Steps/Sec: 0.71
|
| 954 |
+
[[34m2025-03-21 05:19:08[0m] (step=0022325) Train Loss: 6.4030, Train Steps/Sec: 0.72
|
| 955 |
+
[[34m2025-03-21 05:19:43[0m] (step=0022350) Train Loss: 6.3969, Train Steps/Sec: 0.72
|
| 956 |
+
[[34m2025-03-21 05:20:18[0m] (step=0022375) Train Loss: 6.3963, Train Steps/Sec: 0.72
|
| 957 |
+
[[34m2025-03-21 05:20:53[0m] (step=0022400) Train Loss: 6.3602, Train Steps/Sec: 0.72
|
| 958 |
+
[[34m2025-03-21 05:21:28[0m] (step=0022425) Train Loss: 6.3993, Train Steps/Sec: 0.72
|
| 959 |
+
[[34m2025-03-21 05:22:03[0m] (step=0022450) Train Loss: 6.3735, Train Steps/Sec: 0.71
|
| 960 |
+
[[34m2025-03-21 05:22:39[0m] (step=0022475) Train Loss: 6.3953, Train Steps/Sec: 0.69
|
| 961 |
+
[[34m2025-03-21 05:23:14[0m] (step=0022500) Train Loss: 6.4150, Train Steps/Sec: 0.72
|
| 962 |
+
[[34m2025-03-21 05:23:49[0m] (step=0022525) Train Loss: 6.3966, Train Steps/Sec: 0.72
|
| 963 |
+
[[34m2025-03-21 05:24:24[0m] (step=0022550) Train Loss: 6.3950, Train Steps/Sec: 0.72
|
| 964 |
+
[[34m2025-03-21 05:24:59[0m] (step=0022575) Train Loss: 6.3610, Train Steps/Sec: 0.72
|
| 965 |
+
[[34m2025-03-21 05:25:34[0m] (step=0022600) Train Loss: 6.3677, Train Steps/Sec: 0.72
|
| 966 |
+
[[34m2025-03-21 05:26:08[0m] (step=0022625) Train Loss: 6.3718, Train Steps/Sec: 0.72
|
| 967 |
+
[[34m2025-03-21 05:26:43[0m] (step=0022650) Train Loss: 6.3712, Train Steps/Sec: 0.72
|
| 968 |
+
[[34m2025-03-21 05:27:18[0m] (step=0022675) Train Loss: 6.3926, Train Steps/Sec: 0.71
|
| 969 |
+
[[34m2025-03-21 05:27:53[0m] (step=0022700) Train Loss: 6.3849, Train Steps/Sec: 0.72
|
| 970 |
+
[[34m2025-03-21 05:28:28[0m] (step=0022725) Train Loss: 6.3839, Train Steps/Sec: 0.72
|
| 971 |
+
[[34m2025-03-21 05:29:03[0m] (step=0022750) Train Loss: 6.3588, Train Steps/Sec: 0.72
|
| 972 |
+
[[34m2025-03-21 05:29:40[0m] (step=0022775) Train Loss: 6.3741, Train Steps/Sec: 0.69
|
| 973 |
+
[[34m2025-03-21 05:30:14[0m] (step=0022800) Train Loss: 6.3778, Train Steps/Sec: 0.72
|
| 974 |
+
[[34m2025-03-21 05:30:49[0m] (step=0022825) Train Loss: 6.4009, Train Steps/Sec: 0.72
|
| 975 |
+
[[34m2025-03-21 05:31:24[0m] (step=0022850) Train Loss: 6.3984, Train Steps/Sec: 0.72
|
| 976 |
+
[[34m2025-03-21 05:31:59[0m] (step=0022875) Train Loss: 6.4011, Train Steps/Sec: 0.71
|
| 977 |
+
[[34m2025-03-21 05:32:34[0m] (step=0022900) Train Loss: 6.3943, Train Steps/Sec: 0.71
|
| 978 |
+
[[34m2025-03-21 05:33:09[0m] (step=0022925) Train Loss: 6.4090, Train Steps/Sec: 0.72
|
| 979 |
+
[[34m2025-03-21 05:33:44[0m] (step=0022950) Train Loss: 6.3990, Train Steps/Sec: 0.72
|
| 980 |
+
[[34m2025-03-21 05:34:19[0m] (step=0022975) Train Loss: 6.3927, Train Steps/Sec: 0.72
|
| 981 |
+
[[34m2025-03-21 05:34:54[0m] (step=0023000) Train Loss: 6.3857, Train Steps/Sec: 0.72
|
| 982 |
+
[[34m2025-03-21 05:35:29[0m] (step=0023025) Train Loss: 6.4064, Train Steps/Sec: 0.72
|
| 983 |
+
[[34m2025-03-21 05:36:04[0m] (step=0023050) Train Loss: 6.4067, Train Steps/Sec: 0.72
|
| 984 |
+
[[34m2025-03-21 05:36:39[0m] (step=0023075) Train Loss: 6.3986, Train Steps/Sec: 0.72
|
| 985 |
+
[[34m2025-03-21 05:37:15[0m] (step=0023100) Train Loss: 6.3931, Train Steps/Sec: 0.69
|
| 986 |
+
[[34m2025-03-21 05:37:50[0m] (step=0023125) Train Loss: 6.3747, Train Steps/Sec: 0.72
|
| 987 |
+
[[34m2025-03-21 05:38:25[0m] (step=0023150) Train Loss: 6.3900, Train Steps/Sec: 0.72
|
| 988 |
+
[[34m2025-03-21 05:39:00[0m] (step=0023175) Train Loss: 6.3792, Train Steps/Sec: 0.72
|
| 989 |
+
[[34m2025-03-21 05:39:35[0m] (step=0023200) Train Loss: 6.3700, Train Steps/Sec: 0.72
|
| 990 |
+
[[34m2025-03-21 05:40:10[0m] (step=0023225) Train Loss: 6.3990, Train Steps/Sec: 0.72
|
| 991 |
+
[[34m2025-03-21 05:40:45[0m] (step=0023250) Train Loss: 6.3965, Train Steps/Sec: 0.72
|
| 992 |
+
[[34m2025-03-21 05:41:19[0m] (step=0023275) Train Loss: 6.4291, Train Steps/Sec: 0.72
|
| 993 |
+
[[34m2025-03-21 05:41:54[0m] (step=0023300) Train Loss: 6.3865, Train Steps/Sec: 0.72
|
| 994 |
+
[[34m2025-03-21 05:42:29[0m] (step=0023325) Train Loss: 6.3662, Train Steps/Sec: 0.72
|
| 995 |
+
[[34m2025-03-21 05:43:04[0m] (step=0023350) Train Loss: 6.3977, Train Steps/Sec: 0.72
|
| 996 |
+
[[34m2025-03-21 05:43:39[0m] (step=0023375) Train Loss: 6.3776, Train Steps/Sec: 0.72
|
| 997 |
+
[[34m2025-03-21 05:44:15[0m] (step=0023400) Train Loss: 6.3726, Train Steps/Sec: 0.70
|
| 998 |
+
[[34m2025-03-21 05:44:50[0m] (step=0023425) Train Loss: 6.4272, Train Steps/Sec: 0.72
|
| 999 |
+
[[34m2025-03-21 05:45:25[0m] (step=0023450) Train Loss: 6.3775, Train Steps/Sec: 0.72
|
| 1000 |
+
[[34m2025-03-21 05:46:01[0m] (step=0023475) Train Loss: 6.3884, Train Steps/Sec: 0.70
|
| 1001 |
+
[[34m2025-03-21 05:46:37[0m] (step=0023500) Train Loss: 6.4057, Train Steps/Sec: 0.69
|
| 1002 |
+
[[34m2025-03-21 05:47:12[0m] (step=0023525) Train Loss: 6.3665, Train Steps/Sec: 0.72
|
| 1003 |
+
[[34m2025-03-21 05:47:47[0m] (step=0023550) Train Loss: 6.3712, Train Steps/Sec: 0.72
|
| 1004 |
+
[[34m2025-03-21 05:48:22[0m] (step=0023575) Train Loss: 6.4047, Train Steps/Sec: 0.72
|
| 1005 |
+
[[34m2025-03-21 05:48:28[0m] Done!
|