dzungpham committed on
Commit
3011a43
·
verified ·
1 Parent(s): 5aa9738

FST phase 1 training with consistency loss and no identity loss; checkpoints at 500, 1000, and 1500 steps

Browse files
Files changed (33) hide show
  1. FST/FontDiffuserFST_training_phase_1_config.yaml +8 -8
  2. FST/checkpoint_step_1000/content_encoder.safetensors +3 -0
  3. FST/checkpoint_step_1000/fst_module.safetensors +3 -0
  4. FST/checkpoint_step_1000/fst_projection.safetensors +3 -0
  5. FST/checkpoint_step_1000/identity_loss_module.safetensors +3 -0
  6. FST/checkpoint_step_1000/mss_encoder.safetensors +3 -0
  7. FST/checkpoint_step_1000/original_style_projection.safetensors +3 -0
  8. FST/checkpoint_step_1000/style_encoder.safetensors +3 -0
  9. FST/checkpoint_step_1000/training_state.pth +3 -0
  10. FST/checkpoint_step_1000/unet.safetensors +3 -0
  11. FST/checkpoint_step_1500/content_encoder.safetensors +1 -1
  12. FST/checkpoint_step_1500/fst_module.safetensors +1 -1
  13. FST/checkpoint_step_1500/fst_projection.safetensors +1 -1
  14. FST/checkpoint_step_1500/mss_encoder.safetensors +1 -1
  15. FST/checkpoint_step_1500/original_style_projection.safetensors +1 -1
  16. FST/checkpoint_step_1500/style_encoder.safetensors +1 -1
  17. FST/checkpoint_step_1500/training_state.pth +1 -1
  18. FST/checkpoint_step_1500/unet.safetensors +1 -1
  19. FST/checkpoint_step_500/content_encoder.safetensors +3 -0
  20. FST/checkpoint_step_500/fst_module.safetensors +3 -0
  21. FST/checkpoint_step_500/fst_projection.safetensors +3 -0
  22. FST/checkpoint_step_500/identity_loss_module.safetensors +3 -0
  23. FST/checkpoint_step_500/mss_encoder.safetensors +3 -0
  24. FST/checkpoint_step_500/original_style_projection.safetensors +3 -0
  25. FST/checkpoint_step_500/style_encoder.safetensors +3 -0
  26. FST/checkpoint_step_500/training_state.pth +3 -0
  27. FST/checkpoint_step_500/unet.safetensors +3 -0
  28. FST/logs/FontDiffuserFST_training_phase_1/events.out.tfevents.1770113474.b645e4c54d0e.17996.0 +3 -0
  29. FST/logs/FontDiffuserFST_training_phase_1/training_config_gradient_accumulation_steps/events.out.tfevents.1770113474.b645e4c54d0e.17996.4 +3 -0
  30. FST/logs/FontDiffuserFST_training_phase_1/training_config_learning_rate/events.out.tfevents.1770113474.b645e4c54d0e.17996.1 +3 -0
  31. FST/logs/FontDiffuserFST_training_phase_1/training_config_max_train_steps/events.out.tfevents.1770113474.b645e4c54d0e.17996.3 +3 -0
  32. FST/logs/FontDiffuserFST_training_phase_1/training_config_mixed_precision/events.out.tfevents.1770113474.b645e4c54d0e.17996.5 +3 -0
  33. FST/logs/FontDiffuserFST_training_phase_1/training_config_train_batch_size/events.out.tfevents.1770113474.b645e4c54d0e.17996.2 +3 -0
FST/FontDiffuserFST_training_phase_1_config.yaml CHANGED
@@ -11,7 +11,7 @@ character_input: false
11
  characters: null
12
  characters_file: null
13
  ckpt_dir: null
14
- ckpt_interval: 1500
15
  compile: true
16
  compute_fid: false
17
  consistency_loss_weight: 0.1
@@ -69,12 +69,12 @@ learning_rate: 0.0001
69
  local_rank: -1
70
  log_interval: 50
71
  logging_dir: logs
72
- lr_scheduler: constant
73
- lr_warmup_steps: 200
74
  max_grad_norm: 1.0
75
- max_train_steps: 3000
76
  method: multistep
77
- mixed_precision: fp16
78
  mode: refinement
79
  model_type: noise
80
  mss_base_channels: 64
@@ -82,16 +82,16 @@ mss_num_scales: 5
82
  nce_layers: 0,1,2,3
83
  num_consistency_pairs: 3
84
  num_heads: 8
85
- num_identity_pairs: 3
86
  num_inference_steps: 20
87
  num_neg: 16
88
  num_workers: 1
89
- offset_coefficient: 0.5
90
  onnx_export_dir: null
91
  onnx_opset_version: 17
92
  order: 2
93
  output_dir: outputs/FontDiffuser/FST
94
- perceptual_coefficient: 0.05
95
  phase_1: true
96
  phase_1_ckpt_dir: ''
97
  phase_2: false
 
11
  characters: null
12
  characters_file: null
13
  ckpt_dir: null
14
+ ckpt_interval: 500
15
  compile: true
16
  compute_fid: false
17
  consistency_loss_weight: 0.1
 
69
  local_rank: -1
70
  log_interval: 50
71
  logging_dir: logs
72
+ lr_scheduler: linear
73
+ lr_warmup_steps: 500
74
  max_grad_norm: 1.0
75
+ max_train_steps: 2000
76
  method: multistep
77
+ mixed_precision: 'no'
78
  mode: refinement
79
  model_type: noise
80
  mss_base_channels: 64
 
82
  nce_layers: 0,1,2,3
83
  num_consistency_pairs: 3
84
  num_heads: 8
85
+ num_identity_pairs: 0
86
  num_inference_steps: 20
87
  num_neg: 16
88
  num_workers: 1
89
+ offset_coefficient: 0.3
90
  onnx_export_dir: null
91
  onnx_opset_version: 17
92
  order: 2
93
  output_dir: outputs/FontDiffuser/FST
94
+ perceptual_coefficient: 0.03
95
  phase_1: true
96
  phase_1_ckpt_dir: ''
97
  phase_2: false
FST/checkpoint_step_1000/content_encoder.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:26ebb65a0a709c1aec3825471e5120374b1c5640f7f0e83a0a3fec9955ea93ce
3
+ size 4756580
FST/checkpoint_step_1000/fst_module.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ba0214ac149ccc997b20cebe3c4f8066f42be2599d571ba350e9a1a4be788e28
3
+ size 238575652
FST/checkpoint_step_1000/fst_projection.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a44d5aa4a2b1629fffb87b1c8d5ee4e90762301ec503771c41c44ec8bfc29de1
3
+ size 4198552
FST/checkpoint_step_1000/identity_loss_module.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3ac907e1995c674cbe33c55038ccc3ee9ff880974a0e6b1f6115b29ed9bbce7b
3
+ size 193688
FST/checkpoint_step_1000/mss_encoder.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:50673172e8622866d5b31570fe2b4df116da611a771696b228284ce60b1d7030
3
+ size 25261992
FST/checkpoint_step_1000/original_style_projection.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f386b524f0bde78b71395298f022daf43a3414842c33f5d322460f91352c069a
3
+ size 4198552
FST/checkpoint_step_1000/style_encoder.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f7357dd874674dc95570e869a33cd9b09c6245a42ded762e748326dd6ef2329b
3
+ size 82394556
FST/checkpoint_step_1000/training_state.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:abc08181188e9b8e0657c51ef82caba88984a48cb1feda685df30ec7ae78a161
3
+ size 1349161373
FST/checkpoint_step_1000/unet.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f5c00771deee66b1d253d5ad5b6a48193303e00b52aebc0683c6dfeeb9237ff5
3
+ size 314927748
FST/checkpoint_step_1500/content_encoder.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:61099e3694480a1fff91aa4bb1bbc1dc966376666f5c2d17575e29ca1e6c0323
3
  size 4756580
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bcea157c70eff0a813a5f877d32209a3473c7da51485bb29afdec4a5411ff889
3
  size 4756580
FST/checkpoint_step_1500/fst_module.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:36ea783bc764b673f1eaf4baa303f49056c01106bbaae63cbd639f11e189368e
3
  size 238575652
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a73af087275073708a3ccb1262e7c7d0389a62da26c8850c4f56b947dee2a153
3
  size 238575652
FST/checkpoint_step_1500/fst_projection.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3d86f9cba4a75ada85db13770a254093e66008b4c5bbd02a60d3899d838aede9
3
  size 4198552
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:82f2bb103fb51382f4c4848daf58226e3d6debe2fd24f7eb3489b76ac4e4f2b6
3
  size 4198552
FST/checkpoint_step_1500/mss_encoder.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:25866998ebc841c69e7a321a58747c1f42e16bc3a2909aad674a56eb287eb926
3
  size 25261992
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bdce15a611e891e087fdee99b8293e4cf1aeec5fb0eb6f77fe36b054c2953131
3
  size 25261992
FST/checkpoint_step_1500/original_style_projection.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cb635fc0ce7d94fa5f0f8f5535911c176911dd3072f8a4819032c3c8456bb2ee
3
  size 4198552
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f8400bf863b954053d97d0b99754e88e0d0f24e0df6266b7f8f8d88ba9e5d09d
3
  size 4198552
FST/checkpoint_step_1500/style_encoder.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:482252ceee1e2a054a2f4cfc19880b0326409c5b508290cc403d2ff0653a63fc
3
  size 82394556
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:124f6b18f79bc42bd0cd5a5b86f5226904fb40f31fabea88ae63c8241eadcfe5
3
  size 82394556
FST/checkpoint_step_1500/training_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2034e2335188e51d7a331851cec591ffb2a37cae3566ec7f2a271650474ec32e
3
  size 1349161373
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:26a3a8195e1453b6396594bd84a83abeca1f3eb9faa42215f505397d30c1d453
3
  size 1349161373
FST/checkpoint_step_1500/unet.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ab3843aa9441306fffacb462bffbc01c5619970d34e2a95f315bf1d3bde4cb2f
3
  size 314927748
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6cb71e6bba58e7678a645966874bdee0b230ef0bf709aff85ed4d9e124431356
3
  size 314927748
FST/checkpoint_step_500/content_encoder.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c7b2947e049aacecc212cea7387db99a8870c1e0607cac6c3e604e47bfa81a24
3
+ size 4756580
FST/checkpoint_step_500/fst_module.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e472bb2df7b716f1ff1c384186799a21cc89be8b7ed93febe82f3223433e7635
3
+ size 238575652
FST/checkpoint_step_500/fst_projection.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ede81db437e817d7877f155c75106fad3b0fc75f4895e4c30a5beda49d9975f7
3
+ size 4198552
FST/checkpoint_step_500/identity_loss_module.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3ac907e1995c674cbe33c55038ccc3ee9ff880974a0e6b1f6115b29ed9bbce7b
3
+ size 193688
FST/checkpoint_step_500/mss_encoder.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5d2de586ed2a774f2c26ad9db5cdb0e9ecb7315eb404f95e4dc63915c7f0a0b3
3
+ size 25261992
FST/checkpoint_step_500/original_style_projection.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5dba2048bd189a22853a12b8752d63b5311e46cbbb7916b2052f20b2aef3a54d
3
+ size 4198552
FST/checkpoint_step_500/style_encoder.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:13d420f37446c5b8c815cc5eae0397fa1aa5fd957eab427d2b4015b9d75e235f
3
+ size 82394556
FST/checkpoint_step_500/training_state.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7394ca34be774e96a2d937294e723f4bb2d49bced90571a28792bfccbd19b5b6
3
+ size 1349161373
FST/checkpoint_step_500/unet.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c1be7bc26eb6c8dbc959d173850a45807007d6f10879f0bd5b749c1687bccb81
3
+ size 314927748
FST/logs/FontDiffuserFST_training_phase_1/events.out.tfevents.1770113474.b645e4c54d0e.17996.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c4455f15520dcdbe5f8b662184db2d46bd4e5e9d0fb3497e857aa14f069e862a
3
+ size 88
FST/logs/FontDiffuserFST_training_phase_1/training_config_gradient_accumulation_steps/events.out.tfevents.1770113474.b645e4c54d0e.17996.4 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:faa95ff3d6fad951cbc79996dbf2aeb415749e89ebe0683412e2c5db289c111c
3
+ size 139
FST/logs/FontDiffuserFST_training_phase_1/training_config_learning_rate/events.out.tfevents.1770113474.b645e4c54d0e.17996.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:985291cdbae0b1105fb521d0a42c4f490771a9481feeafdcd2073795a7c7395a
3
+ size 139
FST/logs/FontDiffuserFST_training_phase_1/training_config_max_train_steps/events.out.tfevents.1770113474.b645e4c54d0e.17996.3 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c3fb7aa66369f0c6dbc2939195f26566bf04a00839875048241c42755c784c17
3
+ size 139
FST/logs/FontDiffuserFST_training_phase_1/training_config_mixed_precision/events.out.tfevents.1770113474.b645e4c54d0e.17996.5 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:70499f78dcabda3130cecb1e773130de50e1db3535da48073990028a740418cd
3
+ size 88
FST/logs/FontDiffuserFST_training_phase_1/training_config_train_batch_size/events.out.tfevents.1770113474.b645e4c54d0e.17996.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:64096d222d6869f1f9be0c1877e152b3f0ee81a6f92bfa8705125138df84547e
3
+ size 139