dzungpham committed on Feb 26

Commit

a33c4fe

verified ·

1 Parent(s): d4cf9be

DRO training phase 2 for 8000 steps

Browse files

Files changed (37) hide show

DRO-20260226-8P2/FontDiffuserDRO_training_phase_2_config.yaml +159 -0
DRO-20260226-8P2/checkpoint_step_1000/content_encoder.safetensors +3 -0
DRO-20260226-8P2/checkpoint_step_1000/fst_module.safetensors +3 -0
DRO-20260226-8P2/checkpoint_step_1000/fst_projection.safetensors +3 -0
DRO-20260226-8P2/checkpoint_step_1000/mss_encoder.safetensors +3 -0
DRO-20260226-8P2/checkpoint_step_1000/original_style_projection.safetensors +3 -0
DRO-20260226-8P2/checkpoint_step_1000/scr.safetensors +3 -0
DRO-20260226-8P2/checkpoint_step_1000/style_encoder.safetensors +3 -0
DRO-20260226-8P2/checkpoint_step_1000/training_state.pt +3 -0
DRO-20260226-8P2/checkpoint_step_1000/unet.safetensors +3 -0
DRO-20260226-8P2/checkpoint_step_504/content_encoder.safetensors +3 -0
DRO-20260226-8P2/checkpoint_step_504/fst_module.safetensors +3 -0
DRO-20260226-8P2/checkpoint_step_504/fst_projection.safetensors +3 -0
DRO-20260226-8P2/checkpoint_step_504/mss_encoder.safetensors +3 -0
DRO-20260226-8P2/checkpoint_step_504/original_style_projection.safetensors +3 -0
DRO-20260226-8P2/checkpoint_step_504/scr.safetensors +3 -0
DRO-20260226-8P2/checkpoint_step_504/style_encoder.safetensors +3 -0
DRO-20260226-8P2/checkpoint_step_504/training_state.pt +3 -0
DRO-20260226-8P2/checkpoint_step_504/unet.safetensors +3 -0
DRO-20260226-8P2/checkpoint_step_750/content_encoder.safetensors +3 -0
DRO-20260226-8P2/checkpoint_step_750/fst_module.safetensors +3 -0
DRO-20260226-8P2/checkpoint_step_750/fst_projection.safetensors +3 -0
DRO-20260226-8P2/checkpoint_step_750/mss_encoder.safetensors +3 -0
DRO-20260226-8P2/checkpoint_step_750/original_style_projection.safetensors +3 -0
DRO-20260226-8P2/checkpoint_step_750/scr.safetensors +3 -0
DRO-20260226-8P2/checkpoint_step_750/style_encoder.safetensors +3 -0
DRO-20260226-8P2/checkpoint_step_750/training_state.pt +3 -0
DRO-20260226-8P2/checkpoint_step_750/unet.safetensors +3 -0
DRO-20260226-8P2/final/content_encoder.safetensors +3 -0
DRO-20260226-8P2/final/fst_module.safetensors +3 -0
DRO-20260226-8P2/final/fst_projection.safetensors +3 -0
DRO-20260226-8P2/final/mss_encoder.safetensors +3 -0
DRO-20260226-8P2/final/original_style_projection.safetensors +3 -0
DRO-20260226-8P2/final/scr.safetensors +3 -0
DRO-20260226-8P2/final/style_encoder.safetensors +3 -0
DRO-20260226-8P2/final/training_state.pt +3 -0
DRO-20260226-8P2/final/unet.safetensors +3 -0

DRO-20260226-8P2/FontDiffuserDRO_training_phase_2_config.yaml ADDED Viewed

	@@ -0,0 +1,159 @@

+adam_beta1: 0.9
+adam_beta2: 0.999
+adam_epsilon: 1.0e-08
+adam_weight_decay: 0.01
+algorithm_type: dpmsolver++
+batch_size: 1
+beta_scheduler: scaled_linear
+channel_attn: true
+channels_last: false
+character_input: false
+characters: null
+characters_file: null
+ckpt_dir: null
+ckpt_interval: 250
+compile: true
+compute_fid: false
+consistency_loss_weight: 0.1
+content_character: null
+content_encoder_downsample_size: 3
+content_image_path: null
+content_image_size: !!python/tuple
+- 96
+- 96
+content_start_channel: 64
+controlnet: false
+correcting_x0_fn: null
+data_root: .
+dataset_split: train_original
+demo: false
+deterministic: false
+device: cuda:0
+dro_div_weight: 0.0
+dro_lpips_weight: 1.0
+dro_max_timestep_frac: 0.3
+dro_normalise_reward: false
+dro_reward_scale: 1.0
+dro_sharp_weight: 0.0
+dro_ssim_weight: 1.0
+dro_warmup_steps: 0
+dro_weight: 0.1
+drop_prob: 0.1
+enable_attention_slicing: false
+enable_style_transform: false
+enable_xformers: false
+end_line: null
+evaluate: false
+experience_name: FontDiffuserDRO_training_phase_2
+export_onnx: false
+fast_sampling: false
+feature_dim: 512
+ffn_dim: 2048
+fp16: false
+freeze_modules: ''
+frequency_filter_type: gaussian
+frequency_low_cutoff: 0.1
+frequency_mid_cutoff: 0.4
+frequency_mid_target: both
+frequency_use_mid_band: true
+fst_ckpt_path: null
+fst_feature_channels: 64,128,256,512,1024
+fst_num_queries: 220
+fst_num_scales: 5
+fst_query_dim: 256
+gradient_accumulation_steps: 2
+ground_truth_dir: null
+guidance_scale: 7.5
+guidance_type: classifier-free
+hidden_dim: 256
+identity_adaptive_max_weight: 1.0
+identity_adaptive_min_weight: 0.1
+identity_log_metrics: true
+identity_loss_type: frobenius
+identity_loss_weight: 0.1
+identity_matrix_size: null
+identity_metric_interval: 100
+identity_pair_mode: random
+identity_pooled_reduction: mean
+identity_reg_weight: 0.01
+identity_regularization: orthogonal
+identity_similarity_threshold: 0.8
+instructpix2pix: false
+learning_rate: 5.0e-05
+local_rank: 0
+log_interval: 50
+logging_dir: logs
+lr_scheduler: cosine
+lr_warmup_steps: 200
+max_grad_norm: 1.0
+max_train_steps: 1000
+method: multistep
+mixed_precision: 'no'
+mode: refinement
+model_type: noise
+mss_base_channels: 64
+mss_num_scales: 5
+nce_layers: 0,1,2,3
+num_consistency_pairs: 3
+num_heads: 8
+num_identity_pairs: 0
+num_inference_steps: 20
+num_neg: 34
+num_workers: 3
+offset_coefficient: 0.3
+onnx_export_dir: null
+onnx_opset_version: 17
+order: 2
+output_dir: outputs/FontArchitect/DRO-20260226-8P2
+perceptual_coefficient: 0.03
+phase_1: false
+phase_1_ckpt_dir: ckpt/DRO-20260225-8P2/checkpoint_step_500
+phase_2: true
+report_to: wandb
+resolution: 96
+resume_from_checkpoint: ckpt/DRO-20260225-8P2/checkpoint_step_500
+save_image: false
+save_image_dir: null
+save_interval: 10
+sc_coefficient: 0.03
+scale_lr: false
+scr_ckpt_path: ckpt/DRO-20260225-8P2/checkpoint_step_500/scr.safetensors
+scr_image_size: 96
+seed: 123
+skeleton_distance_method: hybrid
+skeleton_fusion_method: concat
+skeleton_max_distance: 12.0
+skeleton_method: medial_axis
+skeleton_output_mode: dual_channel
+skeleton_sigma: 1.5
+skip_type: time_uniform
+start_line: 1
+style_image_path: null
+style_image_size: !!python/tuple
+- 96
+- 96
+style_images: null
+style_source_same_prob: 0.5
+style_start_channel: 64
+style_transform_coefficient: 0.1
+summary: false
+t_end: null
+t_start: null
+temperature: 0.07
+train_batch_size: 4
+ttf_path: ttf/KaiXinSongA.ttf
+unet_channels: !!python/tuple
+- 64
+- 128
+- 256
+- 512
+use_adaptive_identity_loss: false
+use_dro: true
+use_frequency_decomp: true
+use_fst: true
+use_pooled_identity_loss: false
+use_skeleton_content: false
+use_wandb: true
+val_interval: 100
+wandb_project: fontdiffuser-eval
+wandb_run_name: null

DRO-20260226-8P2/checkpoint_step_1000/content_encoder.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9ee03233703578e23371127fb0cd29a6f4ee36e107972ebd23902f5dd1e0faf6
+size 4756580

DRO-20260226-8P2/checkpoint_step_1000/fst_module.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9ce801b59701fc4086a1f5c1a0957381e6d32b7d1aa67b7e1b8abf6e68604341
+size 238575652

DRO-20260226-8P2/checkpoint_step_1000/fst_projection.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:6a4e8d198cc62958f215910b4e7ddc3995364d83cb511debc6af94867bd02b89
+size 4198552

DRO-20260226-8P2/checkpoint_step_1000/mss_encoder.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:49e75571c80f882f856092c1b68c227966a51147d4248c8bde91e4cedc1f536a
+size 25261992

DRO-20260226-8P2/checkpoint_step_1000/original_style_projection.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f3e15d6d81bcad13f6ce723ba7b2b7bc75f008720f905b995857831b5796e556
+size 4198552

DRO-20260226-8P2/checkpoint_step_1000/scr.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:fbfecbf3e4485517a5d4004f99a394f21ebd318f06a2484374722cfb3d238c4a
+size 284227968

DRO-20260226-8P2/checkpoint_step_1000/style_encoder.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:718afe6904ec0c143e3c848e7216fa5f8cac6d62fa3f48201d50debbcb68783c
+size 82394556

DRO-20260226-8P2/checkpoint_step_1000/training_state.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:57eea6b1a2e751f01725101ee90d463efd31b954f54962547ff328f991ae5513
+size 1349134749

DRO-20260226-8P2/checkpoint_step_1000/unet.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:8276d3ddb5660fb56b8e1b53ccb155b306fafe7f459432ed8c369f539470d50f
+size 314927748

DRO-20260226-8P2/checkpoint_step_504/content_encoder.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:04461be19b5eaaf9e1d83fb8ef84b7a7a51ea87c8095f0d2320bb1659dfea9a9
+size 4756580

DRO-20260226-8P2/checkpoint_step_504/fst_module.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:1a8f683f69b672d8b8568f81fdf6bd8fb97d07b8c5930549e533c504836129fd
+size 238575652

DRO-20260226-8P2/checkpoint_step_504/fst_projection.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:051fec3c5ac27ee1501afb81755353bb108774158726290c1ed8d6ecf2430f3e
+size 4198552

DRO-20260226-8P2/checkpoint_step_504/mss_encoder.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e32a73972ed28d92e8a1c5a12b8b6fa5cf4180d2aba3f11b55c69382b040d1b9
+size 25261992

DRO-20260226-8P2/checkpoint_step_504/original_style_projection.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:8d5f53162ed3b9dccddfe324684b4f3596f51d5376687b5c3edb8579de6f95d3
+size 4198552

DRO-20260226-8P2/checkpoint_step_504/scr.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:720c3f5aabc331be7e584da0f3d1372be324f514f6d3eb84e5f53b3f894ec8c1
+size 284227968

DRO-20260226-8P2/checkpoint_step_504/style_encoder.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:12eafee3b242d25e6e7288d05fdb5e18cdd3880b8a77d778dee8efdb0a32868b
+size 82394556

DRO-20260226-8P2/checkpoint_step_504/training_state.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:acdf2384de8d9d49587cdccaee0a0d5202c01873ae245323d99f27a7df149f8a
+size 1349134749

DRO-20260226-8P2/checkpoint_step_504/unet.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:918533fca1607a6728205df672fb33bc1fbcb32e84446dbe301ee5c2b29f3160
+size 314927748

DRO-20260226-8P2/checkpoint_step_750/content_encoder.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a7990432ee514a92373ca9ed9f463a46ef06e45dffac0699a3f8ccbdf180fcc5
+size 4756580

DRO-20260226-8P2/checkpoint_step_750/fst_module.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9d3daeafa96c57ff05a09d764d46da8390f8b3989ad9cad31e55b1ee6749079b
+size 238575652

DRO-20260226-8P2/checkpoint_step_750/fst_projection.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7b666a5d267e3671599bf0ce3fc423e70a367a14bdbbf9339be8633e85d78313
+size 4198552

DRO-20260226-8P2/checkpoint_step_750/mss_encoder.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:835bd5bae385537eb22bbf79a5ffc8bf7c509cf0470743faf24fa547af24af14
+size 25261992

DRO-20260226-8P2/checkpoint_step_750/original_style_projection.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e5da38afa61824ed08cfeeb7d583dfe78027bb5825e18b59b32fd90e0dae9d94
+size 4198552

DRO-20260226-8P2/checkpoint_step_750/scr.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:73242967dc4debbe2539b581c62cca03231c3e52736642f2d3fbd1b1a2886b6f
+size 284227968

DRO-20260226-8P2/checkpoint_step_750/style_encoder.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:aaf3fb629ee98a43ccf0c0bb064850c9a7eb9e62efa3ac02d048321ba9f7d92b
+size 82394556

DRO-20260226-8P2/checkpoint_step_750/training_state.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:92475e240099a8cdb71a7d87f3d4cbf4ca58b7d22b73d265abc79d98c9a825ea
+size 1349134749

DRO-20260226-8P2/checkpoint_step_750/unet.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7bab830f7afe3a4cb85ab510097158b6533a0e29c14baae762cd10661940d888
+size 314927748

DRO-20260226-8P2/final/content_encoder.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9ee03233703578e23371127fb0cd29a6f4ee36e107972ebd23902f5dd1e0faf6
+size 4756580

DRO-20260226-8P2/final/fst_module.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9ce801b59701fc4086a1f5c1a0957381e6d32b7d1aa67b7e1b8abf6e68604341
+size 238575652

DRO-20260226-8P2/final/fst_projection.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:6a4e8d198cc62958f215910b4e7ddc3995364d83cb511debc6af94867bd02b89
+size 4198552

DRO-20260226-8P2/final/mss_encoder.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:49e75571c80f882f856092c1b68c227966a51147d4248c8bde91e4cedc1f536a
+size 25261992

DRO-20260226-8P2/final/original_style_projection.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f3e15d6d81bcad13f6ce723ba7b2b7bc75f008720f905b995857831b5796e556
+size 4198552

DRO-20260226-8P2/final/scr.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:fbfecbf3e4485517a5d4004f99a394f21ebd318f06a2484374722cfb3d238c4a
+size 284227968

DRO-20260226-8P2/final/style_encoder.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:718afe6904ec0c143e3c848e7216fa5f8cac6d62fa3f48201d50debbcb68783c
+size 82394556

DRO-20260226-8P2/final/training_state.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:57eea6b1a2e751f01725101ee90d463efd31b954f54962547ff328f991ae5513
+size 1349134749

DRO-20260226-8P2/final/unet.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:8276d3ddb5660fb56b8e1b53ccb155b306fafe7f459432ed8c369f539470d50f
+size 314927748