dzungpham committed on
Commit
b5c3021
·
verified ·
1 Parent(s): 3cd0d64

FST-only training for paper experiments

Browse files
Files changed (28) hide show
  1. FST-paper-experiment/FontDiffuserFST_training_phase_2_config.yaml +167 -0
  2. FST-paper-experiment/checkpoint_step_1000/content_encoder.safetensors +3 -0
  3. FST-paper-experiment/checkpoint_step_1000/fst_module.safetensors +3 -0
  4. FST-paper-experiment/checkpoint_step_1000/fst_projection.safetensors +3 -0
  5. FST-paper-experiment/checkpoint_step_1000/mss_encoder.safetensors +3 -0
  6. FST-paper-experiment/checkpoint_step_1000/original_style_projection.safetensors +3 -0
  7. FST-paper-experiment/checkpoint_step_1000/scr.safetensors +3 -0
  8. FST-paper-experiment/checkpoint_step_1000/style_encoder.safetensors +3 -0
  9. FST-paper-experiment/checkpoint_step_1000/training_state.pt +3 -0
  10. FST-paper-experiment/checkpoint_step_1000/unet.safetensors +3 -0
  11. FST-paper-experiment/checkpoint_step_250/content_encoder.safetensors +3 -0
  12. FST-paper-experiment/checkpoint_step_250/fst_module.safetensors +3 -0
  13. FST-paper-experiment/checkpoint_step_250/fst_projection.safetensors +3 -0
  14. FST-paper-experiment/checkpoint_step_250/mss_encoder.safetensors +3 -0
  15. FST-paper-experiment/checkpoint_step_250/original_style_projection.safetensors +3 -0
  16. FST-paper-experiment/checkpoint_step_250/scr.safetensors +3 -0
  17. FST-paper-experiment/checkpoint_step_250/style_encoder.safetensors +3 -0
  18. FST-paper-experiment/checkpoint_step_250/training_state.pt +3 -0
  19. FST-paper-experiment/checkpoint_step_250/unet.safetensors +3 -0
  20. FST-paper-experiment/checkpoint_step_500/content_encoder.safetensors +3 -0
  21. FST-paper-experiment/checkpoint_step_500/fst_module.safetensors +3 -0
  22. FST-paper-experiment/checkpoint_step_500/fst_projection.safetensors +3 -0
  23. FST-paper-experiment/checkpoint_step_500/mss_encoder.safetensors +3 -0
  24. FST-paper-experiment/checkpoint_step_500/original_style_projection.safetensors +3 -0
  25. FST-paper-experiment/checkpoint_step_500/scr.safetensors +3 -0
  26. FST-paper-experiment/checkpoint_step_500/style_encoder.safetensors +3 -0
  27. FST-paper-experiment/checkpoint_step_500/training_state.pt +3 -0
  28. FST-paper-experiment/checkpoint_step_500/unet.safetensors +3 -0
FST-paper-experiment/FontDiffuserFST_training_phase_2_config.yaml ADDED
@@ -0,0 +1,167 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ adam_beta1: 0.9
2
+ adam_beta2: 0.999
3
+ adam_epsilon: 1.0e-08
4
+ adam_weight_decay: 0.01
5
+ algorithm_type: dpmsolver++
6
+ batch_size: 1
7
+ beta_scheduler: scaled_linear
8
+ channel_attn: true
9
+ channels_last: false
10
+ character_input: false
11
+ characters: null
12
+ characters_file: null
13
+ ckpt_dir: null
14
+ ckpt_interval: 250
15
+ compile: false
16
+ compute_fid: false
17
+ consistency_loss_weight: 0.1
18
+ content_character: null
19
+ content_encoder_downsample_size: 3
20
+ content_image_path: null
21
+ content_image_size: !!python/tuple
22
+ - 96
23
+ - 96
24
+ content_start_channel: 64
25
+ controlnet: false
26
+ correcting_x0_fn: null
27
+ data_root: .
28
+ dataset_split: train_original
29
+ demo: false
30
+ deterministic: false
31
+ device: cuda:0
32
+ dro_div_weight: 0.0
33
+ dro_lpips_weight: 1.0
34
+ dro_max_timestep_frac: 0.3
35
+ dro_normalise_reward: false
36
+ dro_reward_scale: 1.0
37
+ dro_sharp_weight: 0.0
38
+ dro_ssim_weight: 1.0
39
+ dro_warmup_steps: 0
40
+ dro_weight: 0.1
41
+ drop_prob: 0.1
42
+ enable_attention_slicing: false
43
+ enable_style_transform: false
44
+ enable_xformers: false
45
+ end_line: null
46
+ evaluate: false
47
+ experience_name: FontDiffuserFST_training_phase_2
48
+ export_onnx: false
49
+ fast_sampling: false
50
+ feature_dim: 512
51
+ ffn_dim: 2048
52
+ fp16: false
53
+ freeze_modules: ''
54
+ frequency_filter_type: gaussian
55
+ frequency_low_cutoff: 0.1
56
+ frequency_mid_cutoff: 0.4
57
+ frequency_mid_target: both
58
+ frequency_use_mid_band: true
59
+ fst_ckpt_path: null
60
+ fst_feature_channels: 64,128,256,512,1024
61
+ fst_num_queries: 220
62
+ fst_num_scales: 5
63
+ fst_query_dim: 256
64
+ gradient_accumulation_steps: 2
65
+ ground_truth_dir: null
66
+ grpo_clip_eps: 0.2
67
+ grpo_group_size: 4
68
+ grpo_kl_coeff: 0.01
69
+ grpo_pg_weight: 0.01
70
+ grpo_reward_clip: 5.0
71
+ grpo_sample_steps: 5
72
+ grpo_warmup_steps: 1000
73
+ guidance_scale: 7.5
74
+ guidance_type: classifier-free
75
+ hidden_dim: 256
76
+ identity_adaptive_max_weight: 1.0
77
+ identity_adaptive_min_weight: 0.1
78
+ identity_log_metrics: true
79
+ identity_loss_type: frobenius
80
+ identity_loss_weight: 0.1
81
+ identity_matrix_size: null
82
+ identity_metric_interval: 100
83
+ identity_pair_mode: random
84
+ identity_pooled_reduction: mean
85
+ identity_reg_weight: 0.01
86
+ identity_regularization: orthogonal
87
+ identity_similarity_threshold: 0.8
88
+ instructpix2pix: false
89
+ learning_rate: 5.0e-05
90
+ local_rank: 0
91
+ log_interval: 50
92
+ logging_dir: logs
93
+ lr_scheduler: cosine
94
+ lr_warmup_steps: 2000
95
+ max_grad_norm: 1.0
96
+ max_train_steps: 15000
97
+ method: multistep
98
+ mixed_precision: 'no'
99
+ mode: refinement
100
+ model_type: noise
101
+ mss_base_channels: 64
102
+ mss_num_scales: 5
103
+ nce_layers: 0,1,2,3
104
+ num_consistency_pairs: 3
105
+ num_heads: 8
106
+ num_identity_pairs: 0
107
+ num_inference_steps: 20
108
+ num_neg: 34
109
+ num_workers: 3
110
+ offset_coefficient: 0.3
111
+ onnx_export_dir: null
112
+ onnx_opset_version: 17
113
+ order: 2
114
+ output_dir: outputs/FontArchitect/FST-paper-experiment
115
+ perceptual_coefficient: 0.03
116
+ phase_1: false
117
+ phase_1_ckpt_dir: ckpt/FST-paper-experiment/final
118
+ phase_2: true
119
+ report_to: wandb
120
+ resolution: 96
121
+ resume_from_checkpoint: ''
122
+ save_image: false
123
+ save_image_dir: null
124
+ save_interval: 10
125
+ sc_coefficient: 0.03
126
+ scale_lr: false
127
+ scr_ckpt_path: ckpt/FST-paper-experiments/phase2/checkpoint_step_500/scr.safetensors
128
+ scr_image_size: 96
129
+ seed: 123
130
+ skeleton_distance_method: hybrid
131
+ skeleton_fusion_method: concat
132
+ skeleton_max_distance: 12.0
133
+ skeleton_method: medial_axis
134
+ skeleton_output_mode: dual_channel
135
+ skeleton_sigma: 1.5
136
+ skip_type: time_uniform
137
+ start_line: 1
138
+ style_image_path: null
139
+ style_image_size: !!python/tuple
140
+ - 96
141
+ - 96
142
+ style_images: null
143
+ style_source_same_prob: 0.5
144
+ style_start_channel: 64
145
+ style_transform_coefficient: 0.1
146
+ summary: false
147
+ t_end: null
148
+ t_start: null
149
+ temperature: 0.07
150
+ train_batch_size: 4
151
+ ttf_path: ttf/KaiXinSongA.ttf
152
+ unet_channels: !!python/tuple
153
+ - 64
154
+ - 128
155
+ - 256
156
+ - 512
157
+ use_adaptive_identity_loss: false
158
+ use_dro: false
159
+ use_frequency_decomp: false
160
+ use_fst: true
161
+ use_grpo: false
162
+ use_pooled_identity_loss: false
163
+ use_skeleton_content: false
164
+ use_wandb: true
165
+ val_interval: 100
166
+ wandb_project: fontdiffuser-eval
167
+ wandb_run_name: null
FST-paper-experiment/checkpoint_step_1000/content_encoder.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:747907e2145a118a7ba13cde36d6eb678e4878b57552181a6ae5614b37013f98
3
+ size 4756580
FST-paper-experiment/checkpoint_step_1000/fst_module.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0548923d7a644c340a3ddacd005160db4749b1fa1e73b62bb51f49fb26d03c7a
3
+ size 238575652
FST-paper-experiment/checkpoint_step_1000/fst_projection.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6176668b642f983b5ef896aa3c5ce5f07e67c546b17a1468e38a51480898dbe5
3
+ size 4198552
FST-paper-experiment/checkpoint_step_1000/mss_encoder.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6ebe8ef08d74e01053d154912b90ff6ff1440da41dcaacbb653ff46584da665f
3
+ size 25261992
FST-paper-experiment/checkpoint_step_1000/original_style_projection.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bd13f64e9982a3b2ce31f89040a6dd9d810f19b80e333e80bb6f384af126be30
3
+ size 4198552
FST-paper-experiment/checkpoint_step_1000/scr.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6d9d4a234af4258f939d420fd4aceb7ac6b8303386ad44ac7cc6f0d69ccf94c2
3
+ size 284227968
FST-paper-experiment/checkpoint_step_1000/style_encoder.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dc5a32d87b76ecd4a8e05409c4882f9cc399fa4b79a0cb665884de094fa8e51a
3
+ size 82394556
FST-paper-experiment/checkpoint_step_1000/training_state.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:23355b821f3ff7d26dc80d8c21c38f6d887f6e32e3e35c559a3c989ff0db4f31
3
+ size 1349161117
FST-paper-experiment/checkpoint_step_1000/unet.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:41e7225a08b3704bcbf1ae76af2475d512eacc232ffb0d490c43eaa16c72dfc5
3
+ size 314927748
FST-paper-experiment/checkpoint_step_250/content_encoder.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:99e4b3c75877fd9c274e58f90962686f94fc1406a67b38dd134c5234cac605b2
3
+ size 4756580
FST-paper-experiment/checkpoint_step_250/fst_module.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eec039b77276706ec44b55f132671555d2797d089e2dc098d85b0780bfad043a
3
+ size 238575652
FST-paper-experiment/checkpoint_step_250/fst_projection.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:50f8d3fe7b9f5fb5c838757655ab3032598c33ae10cac879db84e2291e2c080f
3
+ size 4198552
FST-paper-experiment/checkpoint_step_250/mss_encoder.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5cba98dc202813956834d70de2884b590f3add70352196e4164264b475db9f19
3
+ size 25261992
FST-paper-experiment/checkpoint_step_250/original_style_projection.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6c72fa10dad557c208feda50e7ec43d8bda15db2d848c632e428924ea212abc1
3
+ size 4198552
FST-paper-experiment/checkpoint_step_250/scr.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dcba70bca1370a3d1cc9aa1d38cb65c4430be2efe2d71c61fd8d7cfa9ae021b5
3
+ size 284227968
FST-paper-experiment/checkpoint_step_250/style_encoder.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1775a42b2683f8f954c7e502c42b809962f40de7b5567c4c2c75d4b557ce3f99
3
+ size 82394556
FST-paper-experiment/checkpoint_step_250/training_state.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d5a13f32ace78a11e6f12b3859d8d595c22cd03b0f0324f8d9fdb6c2b47210be
3
+ size 1349161117
FST-paper-experiment/checkpoint_step_250/unet.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2739f053aba119820a66271c5e3a27ccaa9e4d3d29edb87cc29f8299de049567
3
+ size 314927748
FST-paper-experiment/checkpoint_step_500/content_encoder.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0822b5ff787565cf9f94ce03f470fe2c177742758eff1828ca1ff218d4b58b1e
3
+ size 4756580
FST-paper-experiment/checkpoint_step_500/fst_module.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ac9ae9b07229a69d37d0f3727e43f0da6b60a2c66d8858e9c0515f6f5c076b51
3
+ size 238575652
FST-paper-experiment/checkpoint_step_500/fst_projection.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4695237575ca12799dfb2bbd4d6540b625213f894fc222c2d64d5b9c50f06938
3
+ size 4198552
FST-paper-experiment/checkpoint_step_500/mss_encoder.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6eaf71c0e6cb967368668326a1a79664a56d293327bf16e2428167c7bcad6e66
3
+ size 25261992
FST-paper-experiment/checkpoint_step_500/original_style_projection.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dd2c21e5915abaf8bc7fe888e87928842b90844473718a92e17a346ef6ee09c1
3
+ size 4198552
FST-paper-experiment/checkpoint_step_500/scr.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3f843fd29d3d9a58a5d759ccd73fac41194e02c6e97f0795f7402fecc50ae30b
3
+ size 284227968
FST-paper-experiment/checkpoint_step_500/style_encoder.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cdaca9ab10f1efcc355acbc7e41b7a45bb6d6fff1db142f4cf647decb323035a
3
+ size 82394556
FST-paper-experiment/checkpoint_step_500/training_state.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:69392bd06c5aff1214adfcc1363aed9ef9ff7b2cf7e20a8359b0f67ba61fe63b
3
+ size 1349161117
FST-paper-experiment/checkpoint_step_500/unet.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a6f8c7bd942ace00d2f548623bba0e352608325288a5aabe4cd1a1a7edf859ae
3
+ size 314927748