FST phase 1 training checkpoints at 500, 1000 and 1500 steps, trained with consistency loss and no identity loss
Browse files
- FST/FontDiffuserFST_training_phase_1_config.yaml +8 -8
- FST/checkpoint_step_1000/content_encoder.safetensors +3 -0
- FST/checkpoint_step_1000/fst_module.safetensors +3 -0
- FST/checkpoint_step_1000/fst_projection.safetensors +3 -0
- FST/checkpoint_step_1000/identity_loss_module.safetensors +3 -0
- FST/checkpoint_step_1000/mss_encoder.safetensors +3 -0
- FST/checkpoint_step_1000/original_style_projection.safetensors +3 -0
- FST/checkpoint_step_1000/style_encoder.safetensors +3 -0
- FST/checkpoint_step_1000/training_state.pth +3 -0
- FST/checkpoint_step_1000/unet.safetensors +3 -0
- FST/checkpoint_step_1500/content_encoder.safetensors +1 -1
- FST/checkpoint_step_1500/fst_module.safetensors +1 -1
- FST/checkpoint_step_1500/fst_projection.safetensors +1 -1
- FST/checkpoint_step_1500/mss_encoder.safetensors +1 -1
- FST/checkpoint_step_1500/original_style_projection.safetensors +1 -1
- FST/checkpoint_step_1500/style_encoder.safetensors +1 -1
- FST/checkpoint_step_1500/training_state.pth +1 -1
- FST/checkpoint_step_1500/unet.safetensors +1 -1
- FST/checkpoint_step_500/content_encoder.safetensors +3 -0
- FST/checkpoint_step_500/fst_module.safetensors +3 -0
- FST/checkpoint_step_500/fst_projection.safetensors +3 -0
- FST/checkpoint_step_500/identity_loss_module.safetensors +3 -0
- FST/checkpoint_step_500/mss_encoder.safetensors +3 -0
- FST/checkpoint_step_500/original_style_projection.safetensors +3 -0
- FST/checkpoint_step_500/style_encoder.safetensors +3 -0
- FST/checkpoint_step_500/training_state.pth +3 -0
- FST/checkpoint_step_500/unet.safetensors +3 -0
- FST/logs/FontDiffuserFST_training_phase_1/events.out.tfevents.1770113474.b645e4c54d0e.17996.0 +3 -0
- FST/logs/FontDiffuserFST_training_phase_1/training_config_gradient_accumulation_steps/events.out.tfevents.1770113474.b645e4c54d0e.17996.4 +3 -0
- FST/logs/FontDiffuserFST_training_phase_1/training_config_learning_rate/events.out.tfevents.1770113474.b645e4c54d0e.17996.1 +3 -0
- FST/logs/FontDiffuserFST_training_phase_1/training_config_max_train_steps/events.out.tfevents.1770113474.b645e4c54d0e.17996.3 +3 -0
- FST/logs/FontDiffuserFST_training_phase_1/training_config_mixed_precision/events.out.tfevents.1770113474.b645e4c54d0e.17996.5 +3 -0
- FST/logs/FontDiffuserFST_training_phase_1/training_config_train_batch_size/events.out.tfevents.1770113474.b645e4c54d0e.17996.2 +3 -0
FST/FontDiffuserFST_training_phase_1_config.yaml
CHANGED
|
@@ -11,7 +11,7 @@ character_input: false
|
|
| 11 |
characters: null
|
| 12 |
characters_file: null
|
| 13 |
ckpt_dir: null
|
| 14 |
-
ckpt_interval:
|
| 15 |
compile: true
|
| 16 |
compute_fid: false
|
| 17 |
consistency_loss_weight: 0.1
|
|
@@ -69,12 +69,12 @@ learning_rate: 0.0001
|
|
| 69 |
local_rank: -1
|
| 70 |
log_interval: 50
|
| 71 |
logging_dir: logs
|
| 72 |
-
lr_scheduler:
|
| 73 |
-
lr_warmup_steps:
|
| 74 |
max_grad_norm: 1.0
|
| 75 |
-
max_train_steps:
|
| 76 |
method: multistep
|
| 77 |
-
mixed_precision:
|
| 78 |
mode: refinement
|
| 79 |
model_type: noise
|
| 80 |
mss_base_channels: 64
|
|
@@ -82,16 +82,16 @@ mss_num_scales: 5
|
|
| 82 |
nce_layers: 0,1,2,3
|
| 83 |
num_consistency_pairs: 3
|
| 84 |
num_heads: 8
|
| 85 |
-
num_identity_pairs:
|
| 86 |
num_inference_steps: 20
|
| 87 |
num_neg: 16
|
| 88 |
num_workers: 1
|
| 89 |
-
offset_coefficient: 0.
|
| 90 |
onnx_export_dir: null
|
| 91 |
onnx_opset_version: 17
|
| 92 |
order: 2
|
| 93 |
output_dir: outputs/FontDiffuser/FST
|
| 94 |
-
perceptual_coefficient: 0.
|
| 95 |
phase_1: true
|
| 96 |
phase_1_ckpt_dir: ''
|
| 97 |
phase_2: false
|
|
|
|
| 11 |
characters: null
|
| 12 |
characters_file: null
|
| 13 |
ckpt_dir: null
|
| 14 |
+
ckpt_interval: 500
|
| 15 |
compile: true
|
| 16 |
compute_fid: false
|
| 17 |
consistency_loss_weight: 0.1
|
|
|
|
| 69 |
local_rank: -1
|
| 70 |
log_interval: 50
|
| 71 |
logging_dir: logs
|
| 72 |
+
lr_scheduler: linear
|
| 73 |
+
lr_warmup_steps: 500
|
| 74 |
max_grad_norm: 1.0
|
| 75 |
+
max_train_steps: 2000
|
| 76 |
method: multistep
|
| 77 |
+
mixed_precision: 'no'
|
| 78 |
mode: refinement
|
| 79 |
model_type: noise
|
| 80 |
mss_base_channels: 64
|
|
|
|
| 82 |
nce_layers: 0,1,2,3
|
| 83 |
num_consistency_pairs: 3
|
| 84 |
num_heads: 8
|
| 85 |
+
num_identity_pairs: 0
|
| 86 |
num_inference_steps: 20
|
| 87 |
num_neg: 16
|
| 88 |
num_workers: 1
|
| 89 |
+
offset_coefficient: 0.3
|
| 90 |
onnx_export_dir: null
|
| 91 |
onnx_opset_version: 17
|
| 92 |
order: 2
|
| 93 |
output_dir: outputs/FontDiffuser/FST
|
| 94 |
+
perceptual_coefficient: 0.03
|
| 95 |
phase_1: true
|
| 96 |
phase_1_ckpt_dir: ''
|
| 97 |
phase_2: false
|
FST/checkpoint_step_1000/content_encoder.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:26ebb65a0a709c1aec3825471e5120374b1c5640f7f0e83a0a3fec9955ea93ce
|
| 3 |
+
size 4756580
|
FST/checkpoint_step_1000/fst_module.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ba0214ac149ccc997b20cebe3c4f8066f42be2599d571ba350e9a1a4be788e28
|
| 3 |
+
size 238575652
|
FST/checkpoint_step_1000/fst_projection.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a44d5aa4a2b1629fffb87b1c8d5ee4e90762301ec503771c41c44ec8bfc29de1
|
| 3 |
+
size 4198552
|
FST/checkpoint_step_1000/identity_loss_module.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3ac907e1995c674cbe33c55038ccc3ee9ff880974a0e6b1f6115b29ed9bbce7b
|
| 3 |
+
size 193688
|
FST/checkpoint_step_1000/mss_encoder.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:50673172e8622866d5b31570fe2b4df116da611a771696b228284ce60b1d7030
|
| 3 |
+
size 25261992
|
FST/checkpoint_step_1000/original_style_projection.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f386b524f0bde78b71395298f022daf43a3414842c33f5d322460f91352c069a
|
| 3 |
+
size 4198552
|
FST/checkpoint_step_1000/style_encoder.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f7357dd874674dc95570e869a33cd9b09c6245a42ded762e748326dd6ef2329b
|
| 3 |
+
size 82394556
|
FST/checkpoint_step_1000/training_state.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:abc08181188e9b8e0657c51ef82caba88984a48cb1feda685df30ec7ae78a161
|
| 3 |
+
size 1349161373
|
FST/checkpoint_step_1000/unet.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f5c00771deee66b1d253d5ad5b6a48193303e00b52aebc0683c6dfeeb9237ff5
|
| 3 |
+
size 314927748
|
FST/checkpoint_step_1500/content_encoder.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4756580
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:bcea157c70eff0a813a5f877d32209a3473c7da51485bb29afdec4a5411ff889
|
| 3 |
size 4756580
|
FST/checkpoint_step_1500/fst_module.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 238575652
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a73af087275073708a3ccb1262e7c7d0389a62da26c8850c4f56b947dee2a153
|
| 3 |
size 238575652
|
FST/checkpoint_step_1500/fst_projection.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4198552
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:82f2bb103fb51382f4c4848daf58226e3d6debe2fd24f7eb3489b76ac4e4f2b6
|
| 3 |
size 4198552
|
FST/checkpoint_step_1500/mss_encoder.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 25261992
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:bdce15a611e891e087fdee99b8293e4cf1aeec5fb0eb6f77fe36b054c2953131
|
| 3 |
size 25261992
|
FST/checkpoint_step_1500/original_style_projection.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4198552
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f8400bf863b954053d97d0b99754e88e0d0f24e0df6266b7f8f8d88ba9e5d09d
|
| 3 |
size 4198552
|
FST/checkpoint_step_1500/style_encoder.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 82394556
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:124f6b18f79bc42bd0cd5a5b86f5226904fb40f31fabea88ae63c8241eadcfe5
|
| 3 |
size 82394556
|
FST/checkpoint_step_1500/training_state.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1349161373
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:26a3a8195e1453b6396594bd84a83abeca1f3eb9faa42215f505397d30c1d453
|
| 3 |
size 1349161373
|
FST/checkpoint_step_1500/unet.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 314927748
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6cb71e6bba58e7678a645966874bdee0b230ef0bf709aff85ed4d9e124431356
|
| 3 |
size 314927748
|
FST/checkpoint_step_500/content_encoder.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c7b2947e049aacecc212cea7387db99a8870c1e0607cac6c3e604e47bfa81a24
|
| 3 |
+
size 4756580
|
FST/checkpoint_step_500/fst_module.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e472bb2df7b716f1ff1c384186799a21cc89be8b7ed93febe82f3223433e7635
|
| 3 |
+
size 238575652
|
FST/checkpoint_step_500/fst_projection.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ede81db437e817d7877f155c75106fad3b0fc75f4895e4c30a5beda49d9975f7
|
| 3 |
+
size 4198552
|
FST/checkpoint_step_500/identity_loss_module.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3ac907e1995c674cbe33c55038ccc3ee9ff880974a0e6b1f6115b29ed9bbce7b
|
| 3 |
+
size 193688
|
FST/checkpoint_step_500/mss_encoder.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5d2de586ed2a774f2c26ad9db5cdb0e9ecb7315eb404f95e4dc63915c7f0a0b3
|
| 3 |
+
size 25261992
|
FST/checkpoint_step_500/original_style_projection.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5dba2048bd189a22853a12b8752d63b5311e46cbbb7916b2052f20b2aef3a54d
|
| 3 |
+
size 4198552
|
FST/checkpoint_step_500/style_encoder.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:13d420f37446c5b8c815cc5eae0397fa1aa5fd957eab427d2b4015b9d75e235f
|
| 3 |
+
size 82394556
|
FST/checkpoint_step_500/training_state.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7394ca34be774e96a2d937294e723f4bb2d49bced90571a28792bfccbd19b5b6
|
| 3 |
+
size 1349161373
|
FST/checkpoint_step_500/unet.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c1be7bc26eb6c8dbc959d173850a45807007d6f10879f0bd5b749c1687bccb81
|
| 3 |
+
size 314927748
|
FST/logs/FontDiffuserFST_training_phase_1/events.out.tfevents.1770113474.b645e4c54d0e.17996.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c4455f15520dcdbe5f8b662184db2d46bd4e5e9d0fb3497e857aa14f069e862a
|
| 3 |
+
size 88
|
FST/logs/FontDiffuserFST_training_phase_1/training_config_gradient_accumulation_steps/events.out.tfevents.1770113474.b645e4c54d0e.17996.4
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:faa95ff3d6fad951cbc79996dbf2aeb415749e89ebe0683412e2c5db289c111c
|
| 3 |
+
size 139
|
FST/logs/FontDiffuserFST_training_phase_1/training_config_learning_rate/events.out.tfevents.1770113474.b645e4c54d0e.17996.1
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:985291cdbae0b1105fb521d0a42c4f490771a9481feeafdcd2073795a7c7395a
|
| 3 |
+
size 139
|
FST/logs/FontDiffuserFST_training_phase_1/training_config_max_train_steps/events.out.tfevents.1770113474.b645e4c54d0e.17996.3
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c3fb7aa66369f0c6dbc2939195f26566bf04a00839875048241c42755c784c17
|
| 3 |
+
size 139
|
FST/logs/FontDiffuserFST_training_phase_1/training_config_mixed_precision/events.out.tfevents.1770113474.b645e4c54d0e.17996.5
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:70499f78dcabda3130cecb1e773130de50e1db3535da48073990028a740418cd
|
| 3 |
+
size 88
|
FST/logs/FontDiffuserFST_training_phase_1/training_config_train_batch_size/events.out.tfevents.1770113474.b645e4c54d0e.17996.2
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:64096d222d6869f1f9be0c1877e152b3f0ee81a6f92bfa8705125138df84547e
|
| 3 |
+
size 139
|