Upload 6 files

Browse files

Files changed (6) hide show

maskbit/DDMD-GPUS1-bs128-glr1e-06-flr1e-06-FKL-fix_rfix_0.6-emb_pert_fix_0.1-tcfg1.5-fcfg1.0-fcfgt1.0-r_mode_arccos-r_mode_f_arccos-reduce_sum-seed3407-bf16_checkpoint-50000/config.yaml +116 -0
maskbit/DDMD-GPUS1-bs128-glr1e-06-flr1e-06-FKL-fix_rfix_0.6-emb_pert_fix_0.1-tcfg1.5-fcfg1.0-fcfgt1.0-r_mode_arccos-r_mode_f_arccos-reduce_sum-seed3407-bf16_checkpoint-50000/pytorch_model.bin +3 -0
maskbit/DiMO2-GPUS2-bs64-glr5e-07-flr5e-07-FKL-fix_rfix_0.6-cfgs1.5-1.0-1.0-non_saturating-dlr5e-07-g_w200.0-d_w1.0-dm_w1.0-g_noise_0.-0.95-plain-bf16_checkpoint-50000/config.yaml +120 -0
maskbit/DiMO2-GPUS2-bs64-glr5e-07-flr5e-07-FKL-fix_rfix_0.6-cfgs1.5-1.0-1.0-non_saturating-dlr5e-07-g_w200.0-d_w1.0-dm_w1.0-g_noise_0.-0.95-plain-bf16_checkpoint-50000/pytorch_model.bin +3 -0
maskbit/DiMO2-GPUS4-bs64-glr1e-06-flr1e-06-FKL-fix_rfix_0.6-cfgs1.5-1.0-1.0-r_modes_arccos-arccos-non_saturating-dlr1e-06-g_w25.0-d_w1.0-dm_w1.0-g_noise_continuous_0.-0.95-plain-bf16_checkpoint-50000/config.yaml +120 -0
maskbit/DiMO2-GPUS4-bs64-glr1e-06-flr1e-06-FKL-fix_rfix_0.6-cfgs1.5-1.0-1.0-r_modes_arccos-arccos-non_saturating-dlr1e-06-g_w25.0-d_w1.0-dm_w1.0-g_noise_continuous_0.-0.95-plain-bf16_checkpoint-50000/pytorch_model.bin +3 -0

maskbit/DDMD-GPUS1-bs128-glr1e-06-flr1e-06-FKL-fix_rfix_0.6-emb_pert_fix_0.1-tcfg1.5-fcfg1.0-fcfgt1.0-r_mode_arccos-r_mode_f_arccos-reduce_sum-seed3407-bf16_checkpoint-50000/config.yaml ADDED Viewed

	@@ -0,0 +1,116 @@

+name: DDMD-GPUS1-bs128-glr1e-06-flr1e-06-FKL-fix_rfix_0.6-emb_pert_fix_0.1-tcfg1.5-fcfg1.0-fcfgt1.0-r_mode_arccos-r_mode_f_arccos-reduce_sum-seed3407-bf16
+report_to: wandb
+output_dir: outputs//MaskBit_benchmark/DDMD-GPUS1-bs128-glr1e-06-flr1e-06-FKL-fix_rfix_0.6-emb_pert_fix_0.1-tcfg1.5-fcfg1.0-fcfgt1.0-r_mode_arccos-r_mode_f_arccos-reduce_sum-seed3407-bf16/2025-08-11T16-13
+pretrained_model_path: ./pretrained_maskgit/MaskGIT/MaskGIT_ImageNet_256.pth
+pretrained_vae_path: ./pretrained_maskgit/VQGAN/
+wandb_project: DiMO_GAN_MaskBit
+wandb_user: yuanzhi_zhu
+ema_cpu: false
+ema_freq: 1
+max_train_steps: 200001
+log_steps: 50
+validation_steps: 200
+validation_steps_tuple:
+- 2
+- 50
+- 200
+- 500
+metric_type: fid
+metric_steps: 2000
+metric_steps_tuple:
+- 2000
+- 5000
+scale_lr: false
+lr_warmup_steps: 500
+lr_scheduler_type: constant_with_warmup
+train_batch_size: 128
+loss_reduction: sum
+optimizer_type: adam
+adam_beta1: 0.9
+adam_beta2: 0.999
+fake_adam_beta1: 0.9
+fake_adam_beta2: 0.999
+adam_weight_decay: 0.0
+adam_epsilon: 1.0e-06
+max_grad_norm: 1.0
+gradient_accumulation_steps: 1
+gradient_checkpointing: false
+checkpointing_steps: 1000
+mixed_precision: bf16
+enable_xformers_memory_efficient_attention: false
+global_seed: 3407
+is_debug: false
+cast_models_to_dtype: false
+checkpoints_total_limit: 5
+checkpointing_steps_tuple:
+- 5000
+- 10000
+- 15000
+- 20000
+- 25000
+- 30000
+- 40000
+- 50000
+- 60000
+- 70000
+- 80000
+- 90000
+- 100000
+resume_from_checkpoint_path: ''
+no_progress_bar: true
+generator_lr: 1.0e-06
+fake_rounds: 1
+weight_factor_type: uniform
+dm_loss_weight: 1.0
+distil_loss_type: FKL
+fixed_ratio: fix_0.6
+noise_emb_perturb: fix_0.0
+top_k: 0
+top_p: 0.0
+true_cfg: 1.5
+fake_cfg_eval: 1.0
+fake_cfg_train: 1.0
+fake_lr: 1.0e-06
+fake_cfg_drop_ratio: 0.0
+gen_temp: 1.0
+true_temp: 1.0
+fake_temp: 1.0
+ignore_index: -1
+ratio_mode: arccos
+ratio_mode_fake: arccos
+temperature_fake: 1.0
+alpha_fake: 0.0
+fix_emb_layer: true
+adaptive_cfg: false
+use_discriminator: 0.0
+discriminator_lr: 1.0e-06
+g_loss_weight: 0.1
+d_loss_weight: 1.0
+gan_noise_level: continuous_0.-0.5
+noisy_as_masked_emb: true
+noisy_as_noisy_feat: false
+same_maskemb: true
+generator_loss_type: non_saturating
+use_discriminator_steps: 1000
+emb_mode: plain
+tau: 0.5
+tau_min: 0.1
+dis_min_ch: 256
+dis_f_layer: 3
+dis_emb_input: true
+dis_t_cond: true
+dis_adam_beta1: 0.0
+dis_adam_beta2: 0.999
+sched_mode: arccos
+sampling_step: 64
+mask_value: 1024
+cfg_w: 5.8
+r_temp: 10.3
+sm_temp: 1.0
+Jeffreys_beta: 0.0
+run_id: 2025-08-11T16-13
+precision: bf16
+folder_name: DDMD-GPUS1-bs128-glr1e-06-flr1e-06-FKL-fix_rfix_0.6-emb_pert_fix_0.1-tcfg1.5-fcfg1.0-fcfgt1.0-r_mode_arccos-r_mode_f_arccos-reduce_sum-seed3407-bf16/2025-08-11T16-13
+output_name: /MaskBit_benchmark
+ema_decay: 0.9999
+resolution: 256

maskbit/DDMD-GPUS1-bs128-glr1e-06-flr1e-06-FKL-fix_rfix_0.6-emb_pert_fix_0.1-tcfg1.5-fcfg1.0-fcfgt1.0-r_mode_arccos-r_mode_f_arccos-reduce_sum-seed3407-bf16_checkpoint-50000/pytorch_model.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:25ab49d06acf857f69522e6cfa8b100d1d3af180ad60af07073bb23de04a50a1
+size 1219832638

maskbit/DiMO2-GPUS2-bs64-glr5e-07-flr5e-07-FKL-fix_rfix_0.6-cfgs1.5-1.0-1.0-non_saturating-dlr5e-07-g_w200.0-d_w1.0-dm_w1.0-g_noise_0.-0.95-plain-bf16_checkpoint-50000/config.yaml ADDED Viewed

	@@ -0,0 +1,120 @@

+name: DiMO2-GPUS2-bs64-glr5e-07-flr5e-07-FKL-fix_rfix_0.6-cfgs1.5-1.0-1.0-non_saturating-dlr5e-07-g_w200.0-d_w1.0-dm_w1.0-g_noise_0.-0.95-plain-bf16
+report_to: wandb
+output_dir: outputs//MaskBit_benchmark/DiMO2-GPUS2-bs64-glr5e-07-flr5e-07-FKL-fix_rfix_0.6-cfgs1.5-1.0-1.0-non_saturating-dlr5e-07-g_w200.0-d_w1.0-dm_w1.0-g_noise_0.-0.95-plain-bf16/2025-08-25T18-34
+pretrained_model_path: ./pretrained_maskgit/MaskGIT/MaskGIT_ImageNet_256.pth
+pretrained_vae_path: ./pretrained_maskgit/VQGAN/
+load_dimo_pre_train: outputs/MaskBit_benchmark/DiMO2-GPUS4-bs64-glr1e-06-flr1e-06-FKL-fix_rfix_0.6-cfgs1.5-1.0-1.0-r_modes_arccos-arccos-non_saturating-dlr1e-06-g_w25.0-d_w1.0-dm_w1.0-g_noise_continuous_0.-0.95-plain-bf16/2025-08-17T14-45/meta_checkpoints_best_fid/ema_model/pytorch_model.bin
+wandb_project: DiMO_GAN_MaskBit
+wandb_user: yuanzhi_zhu
+ema_cpu: false
+ema_freq: 1
+ema_rampup: true
+max_train_steps: 200001
+log_steps: 50
+validation_steps: 200
+validation_steps_tuple:
+- 2
+- 50
+- 200
+- 500
+metric_type: fid
+metric_steps: 2000
+metric_steps_tuple:
+- 2000
+- 5000
+scale_lr: false
+lr_warmup_steps: 500
+lr_scheduler_type: constant_with_warmup
+train_batch_size: 64
+loss_reduction: sum
+optimizer_type: adamw
+adam_beta1: 0.9
+adam_beta2: 0.999
+fake_adam_beta1: 0.9
+fake_adam_beta2: 0.999
+adam_weight_decay: 0.01
+adam_epsilon: 1.0e-06
+max_grad_norm: 1.0
+gradient_accumulation_steps: 1
+gradient_checkpointing: false
+checkpointing_steps: 1000
+mixed_precision: bf16
+enable_xformers_memory_efficient_attention: false
+global_seed: 3407
+is_debug: false
+cast_models_to_dtype: false
+checkpoints_total_limit: 5
+checkpointing_steps_tuple:
+- 5000
+- 10000
+- 15000
+- 20000
+- 25000
+- 30000
+- 40000
+- 50000
+- 60000
+- 70000
+- 80000
+- 90000
+- 100000
+resume_from_checkpoint_path: ''
+no_progress_bar: true
+generator_lr: 5.0e-07
+fake_rounds: 1
+weight_factor_type: uniform
+dm_loss_weight: 1.0
+distil_loss_type: FKL
+fixed_ratio: fix_0.6
+noise_emb_perturb: fix_0.0
+top_k: 0
+top_p: 0.0
+true_cfg: 1.5
+fake_cfg_eval: 1.0
+fake_cfg_train: 1.0
+fake_lr: 5.0e-07
+fake_cfg_drop_ratio: 0.0
+gen_temp: 1.0
+true_temp: 1.0
+fake_temp: 1.0
+ignore_index: -1
+ratio_mode: arccos
+ratio_mode_fake: arccos
+temperature_fake: 1.0
+alpha_fake: 0.0
+fix_emb_layer: true
+cfg_schedule: constant
+emb_input: false
+use_discriminator: 1.0
+discriminator_lr: 5.0e-07
+g_loss_weight: 200.0
+d_loss_weight: 1.0
+gan_noise_level: continuous_0.-0.95
+noisy_as_masked_emb: true
+noisy_as_noisy_feat: false
+noisy_as_noisy_emb: false
+same_maskemb: true
+generator_loss_type: non_saturating
+use_discriminator_steps: 1000
+emb_mode: plain
+tau: 0.5
+tau_min: 0.1
+dis_min_ch: 256
+dis_f_layer: 4
+dis_emb_input: true
+dis_t_cond: true
+dis_adam_beta1: 0.0
+dis_adam_beta2: 0.999
+sched_mode: arccos
+sampling_step: 64
+mask_value: 1024
+cfg_w: 5.8
+r_temp: 10.3
+sm_temp: 1.0
+Jeffreys_beta: 0.0
+run_id: 2025-08-25T18-34
+precision: bf16
+folder_name: DiMO2-GPUS2-bs64-glr5e-07-flr5e-07-FKL-fix_rfix_0.6-cfgs1.5-1.0-1.0-non_saturating-dlr5e-07-g_w200.0-d_w1.0-dm_w1.0-g_noise_0.-0.95-plain-bf16/2025-08-25T18-34
+output_name: /MaskBit_benchmark
+ema_decay: 0.9999
+resolution: 256

maskbit/DiMO2-GPUS2-bs64-glr5e-07-flr5e-07-FKL-fix_rfix_0.6-cfgs1.5-1.0-1.0-non_saturating-dlr5e-07-g_w200.0-d_w1.0-dm_w1.0-g_noise_0.-0.95-plain-bf16_checkpoint-50000/pytorch_model.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b1423dfbe97093c93a23b963e599f34b202bdaef9bfb101e0955f35d1bb0d0a7
+size 1219832638

maskbit/DiMO2-GPUS4-bs64-glr1e-06-flr1e-06-FKL-fix_rfix_0.6-cfgs1.5-1.0-1.0-r_modes_arccos-arccos-non_saturating-dlr1e-06-g_w25.0-d_w1.0-dm_w1.0-g_noise_continuous_0.-0.95-plain-bf16_checkpoint-50000/config.yaml ADDED Viewed

	@@ -0,0 +1,120 @@

+name: DiMO2-GPUS4-bs64-glr1e-06-flr1e-06-FKL-fix_rfix_0.6-cfgs1.5-1.0-1.0-r_modes_arccos-arccos-non_saturating-dlr1e-06-g_w25.0-d_w1.0-dm_w1.0-g_noise_continuous_0.-0.95-plain-bf16
+report_to: wandb
+output_dir: outputs//MaskBit_benchmark/DiMO2-GPUS4-bs64-glr1e-06-flr1e-06-FKL-fix_rfix_0.6-cfgs1.5-1.0-1.0-r_modes_arccos-arccos-non_saturating-dlr1e-06-g_w25.0-d_w1.0-dm_w1.0-g_noise_continuous_0.-0.95-plain-bf16/2025-08-17T14-45
+pretrained_model_path: ./pretrained_maskgit/MaskGIT/MaskGIT_ImageNet_256.pth
+pretrained_vae_path: ./pretrained_maskgit/VQGAN/
+load_dimo_pre_train: ./outputs/MaskBit_benchmark/DDMD-GPUS1-bs128-glr1e-06-flr1e-06-FKL-fix_rfix_0.6-emb_pert_fix_0.1-tcfg1.5-fcfg1.0-fcfgt1.0-r_mode_arccos-r_mode_f_arccos-reduce_sum-seed3407-bf16/2025-08-11T16-13/_checkpoint-50000/ema_model/pytorch_model.bin
+wandb_project: DiMO_GAN_MaskBit
+wandb_user: yuanzhi_zhu
+ema_cpu: false
+ema_freq: 1
+ema_rampup: true
+max_train_steps: 200001
+log_steps: 50
+validation_steps: 200
+validation_steps_tuple:
+- 2
+- 50
+- 200
+- 500
+metric_type: fid
+metric_steps: 2000
+metric_steps_tuple:
+- 2000
+- 5000
+scale_lr: false
+lr_warmup_steps: 500
+lr_scheduler_type: constant_with_warmup
+train_batch_size: 64
+loss_reduction: sum
+optimizer_type: adam
+adam_beta1: 0.9
+adam_beta2: 0.999
+fake_adam_beta1: 0.9
+fake_adam_beta2: 0.999
+adam_weight_decay: 0.0
+adam_epsilon: 1.0e-06
+max_grad_norm: 1.0
+gradient_accumulation_steps: 1
+gradient_checkpointing: false
+checkpointing_steps: 1000
+mixed_precision: bf16
+enable_xformers_memory_efficient_attention: false
+global_seed: 3407
+is_debug: false
+cast_models_to_dtype: false
+checkpoints_total_limit: 5
+checkpointing_steps_tuple:
+- 5000
+- 10000
+- 15000
+- 20000
+- 25000
+- 30000
+- 40000
+- 50000
+- 60000
+- 70000
+- 80000
+- 90000
+- 100000
+resume_from_checkpoint_path: ''
+no_progress_bar: true
+generator_lr: 1.0e-06
+fake_rounds: 1
+weight_factor_type: uniform
+dm_loss_weight: 1.0
+distil_loss_type: FKL
+fixed_ratio: fix_0.6
+noise_emb_perturb: fix_0.0
+top_k: 0
+top_p: 0.0
+true_cfg: 1.5
+fake_cfg_eval: 1.0
+fake_cfg_train: 1.0
+fake_lr: 1.0e-06
+fake_cfg_drop_ratio: 0.0
+gen_temp: 1.0
+true_temp: 1.0
+fake_temp: 1.0
+ignore_index: -1
+ratio_mode: arccos
+ratio_mode_fake: arccos
+temperature_fake: 1.0
+alpha_fake: 0.0
+fix_emb_layer: true
+cfg_schedule: constant
+emb_input: false
+use_discriminator: 1.0
+discriminator_lr: 1.0e-06
+g_loss_weight: 25.0
+d_loss_weight: 1.0
+gan_noise_level: continuous_0.-0.95
+noisy_as_masked_emb: true
+noisy_as_noisy_feat: false
+noisy_as_noisy_emb: false
+same_maskemb: true
+generator_loss_type: non_saturating
+use_discriminator_steps: 1000
+emb_mode: plain
+tau: 0.5
+tau_min: 0.1
+dis_min_ch: 256
+dis_f_layer: 4
+dis_emb_input: true
+dis_t_cond: true
+dis_adam_beta1: 0.0
+dis_adam_beta2: 0.999
+sched_mode: arccos
+sampling_step: 64
+mask_value: 1024
+cfg_w: 5.8
+r_temp: 10.3
+sm_temp: 1.0
+Jeffreys_beta: 0.0
+run_id: 2025-08-17T14-45
+precision: bf16
+folder_name: DiMO2-GPUS4-bs64-glr1e-06-flr1e-06-FKL-fix_rfix_0.6-cfgs1.5-1.0-1.0-r_modes_arccos-arccos-non_saturating-dlr1e-06-g_w25.0-d_w1.0-dm_w1.0-g_noise_continuous_0.-0.95-plain-bf16/2025-08-17T14-45
+output_name: /MaskBit_benchmark
+ema_decay: 0.9999
+resolution: 256

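maskbit/DiMO2-GPUS4-bs64-glr1e-06-flr1e-06-FKL-fix_rfix_0.6-cfgs1.5-1.0-1.0-r_modes_arccos-arccos-non_saturating-dlr1e-06-g_w25.0-d_w1.0-dm_w1.0-g_noise_continuous_0.-0.95-plain-bf16_checkpoint-50000/pytorch_model.bin ADDED Viewed

	@@ -0,0 +1,3 @@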

+version https://git-lfs.github.com/spec/v1
+oid sha256:32351716414757c5fdc917de7c96889f253a9a4d645a33e1b2a5168af5f170f0
+size 1219832638