dzungpham committed on Feb 3

Commit

3011a43

verified ·

1 Parent(s): 5aa9738

FST training for 500, 1000 and 1500 steps phase 1 with consistency loss, no identity loss

Browse files

Files changed (33) hide show

FST/FontDiffuserFST_training_phase_1_config.yaml +8 -8
FST/checkpoint_step_1000/content_encoder.safetensors +3 -0
FST/checkpoint_step_1000/fst_module.safetensors +3 -0
FST/checkpoint_step_1000/fst_projection.safetensors +3 -0
FST/checkpoint_step_1000/identity_loss_module.safetensors +3 -0
FST/checkpoint_step_1000/mss_encoder.safetensors +3 -0
FST/checkpoint_step_1000/original_style_projection.safetensors +3 -0
FST/checkpoint_step_1000/style_encoder.safetensors +3 -0
FST/checkpoint_step_1000/training_state.pth +3 -0
FST/checkpoint_step_1000/unet.safetensors +3 -0
FST/checkpoint_step_1500/content_encoder.safetensors +1 -1
FST/checkpoint_step_1500/fst_module.safetensors +1 -1
FST/checkpoint_step_1500/fst_projection.safetensors +1 -1
FST/checkpoint_step_1500/mss_encoder.safetensors +1 -1
FST/checkpoint_step_1500/original_style_projection.safetensors +1 -1
FST/checkpoint_step_1500/style_encoder.safetensors +1 -1
FST/checkpoint_step_1500/training_state.pth +1 -1
FST/checkpoint_step_1500/unet.safetensors +1 -1
FST/checkpoint_step_500/content_encoder.safetensors +3 -0
FST/checkpoint_step_500/fst_module.safetensors +3 -0
FST/checkpoint_step_500/fst_projection.safetensors +3 -0
FST/checkpoint_step_500/identity_loss_module.safetensors +3 -0
FST/checkpoint_step_500/mss_encoder.safetensors +3 -0
FST/checkpoint_step_500/original_style_projection.safetensors +3 -0
FST/checkpoint_step_500/style_encoder.safetensors +3 -0
FST/checkpoint_step_500/training_state.pth +3 -0
FST/checkpoint_step_500/unet.safetensors +3 -0
FST/logs/FontDiffuserFST_training_phase_1/events.out.tfevents.1770113474.b645e4c54d0e.17996.0 +3 -0
FST/logs/FontDiffuserFST_training_phase_1/training_config_gradient_accumulation_steps/events.out.tfevents.1770113474.b645e4c54d0e.17996.4 +3 -0
FST/logs/FontDiffuserFST_training_phase_1/training_config_learning_rate/events.out.tfevents.1770113474.b645e4c54d0e.17996.1 +3 -0
FST/logs/FontDiffuserFST_training_phase_1/training_config_max_train_steps/events.out.tfevents.1770113474.b645e4c54d0e.17996.3 +3 -0
FST/logs/FontDiffuserFST_training_phase_1/training_config_mixed_precision/events.out.tfevents.1770113474.b645e4c54d0e.17996.5 +3 -0
FST/logs/FontDiffuserFST_training_phase_1/training_config_train_batch_size/events.out.tfevents.1770113474.b645e4c54d0e.17996.2 +3 -0

FST/FontDiffuserFST_training_phase_1_config.yaml CHANGED Viewed

@@ -11,7 +11,7 @@ character_input: false
 characters: null
 characters_file: null
 ckpt_dir: null
-ckpt_interval: 1500
 compile: true
 compute_fid: false
 consistency_loss_weight: 0.1
@@ -69,12 +69,12 @@ learning_rate: 0.0001
 local_rank: -1
 log_interval: 50
 logging_dir: logs
-lr_scheduler: constant
-lr_warmup_steps: 200
 max_grad_norm: 1.0
-max_train_steps: 3000
 method: multistep
-mixed_precision: fp16
 mode: refinement
 model_type: noise
 mss_base_channels: 64
@@ -82,16 +82,16 @@ mss_num_scales: 5
 nce_layers: 0,1,2,3
 num_consistency_pairs: 3
 num_heads: 8
-num_identity_pairs: 3
 num_inference_steps: 20
 num_neg: 16
 num_workers: 1
-offset_coefficient: 0.5
 onnx_export_dir: null
 onnx_opset_version: 17
 order: 2
 output_dir: outputs/FontDiffuser/FST
-perceptual_coefficient: 0.05
 phase_1: true
 phase_1_ckpt_dir: ''
 phase_2: false

 characters: null
 characters_file: null
 ckpt_dir: null
+ckpt_interval: 500
 compile: true
 compute_fid: false
 consistency_loss_weight: 0.1
 local_rank: -1
 log_interval: 50
 logging_dir: logs
+lr_scheduler: linear
+lr_warmup_steps: 500
 max_grad_norm: 1.0
+max_train_steps: 2000
 method: multistep
+mixed_precision: 'no'
 mode: refinement
 model_type: noise
 mss_base_channels: 64
 nce_layers: 0,1,2,3
 num_consistency_pairs: 3
 num_heads: 8
+num_identity_pairs: 0
 num_inference_steps: 20
 num_neg: 16
 num_workers: 1
+offset_coefficient: 0.3
 onnx_export_dir: null
 onnx_opset_version: 17
 order: 2
 output_dir: outputs/FontDiffuser/FST
+perceptual_coefficient: 0.03
 phase_1: true
 phase_1_ckpt_dir: ''
 phase_2: false

FST/checkpoint_step_1000/content_encoder.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:26ebb65a0a709c1aec3825471e5120374b1c5640f7f0e83a0a3fec9955ea93ce
+size 4756580

FST/checkpoint_step_1000/fst_module.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ba0214ac149ccc997b20cebe3c4f8066f42be2599d571ba350e9a1a4be788e28
+size 238575652

FST/checkpoint_step_1000/fst_projection.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a44d5aa4a2b1629fffb87b1c8d5ee4e90762301ec503771c41c44ec8bfc29de1
+size 4198552

FST/checkpoint_step_1000/identity_loss_module.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:3ac907e1995c674cbe33c55038ccc3ee9ff880974a0e6b1f6115b29ed9bbce7b
+size 193688

FST/checkpoint_step_1000/mss_encoder.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:50673172e8622866d5b31570fe2b4df116da611a771696b228284ce60b1d7030
+size 25261992

FST/checkpoint_step_1000/original_style_projection.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f386b524f0bde78b71395298f022daf43a3414842c33f5d322460f91352c069a
+size 4198552

FST/checkpoint_step_1000/style_encoder.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f7357dd874674dc95570e869a33cd9b09c6245a42ded762e748326dd6ef2329b
+size 82394556

FST/checkpoint_step_1000/training_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:abc08181188e9b8e0657c51ef82caba88984a48cb1feda685df30ec7ae78a161
+size 1349161373

FST/checkpoint_step_1000/unet.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f5c00771deee66b1d253d5ad5b6a48193303e00b52aebc0683c6dfeeb9237ff5
+size 314927748

FST/checkpoint_step_1500/content_encoder.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:61099e3694480a1fff91aa4bb1bbc1dc966376666f5c2d17575e29ca1e6c0323
 size 4756580

 version https://git-lfs.github.com/spec/v1
+oid sha256:bcea157c70eff0a813a5f877d32209a3473c7da51485bb29afdec4a5411ff889
 size 4756580

FST/checkpoint_step_1500/fst_module.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:36ea783bc764b673f1eaf4baa303f49056c01106bbaae63cbd639f11e189368e
 size 238575652

 version https://git-lfs.github.com/spec/v1
+oid sha256:a73af087275073708a3ccb1262e7c7d0389a62da26c8850c4f56b947dee2a153
 size 238575652

FST/checkpoint_step_1500/fst_projection.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:3d86f9cba4a75ada85db13770a254093e66008b4c5bbd02a60d3899d838aede9
 size 4198552

 version https://git-lfs.github.com/spec/v1
+oid sha256:82f2bb103fb51382f4c4848daf58226e3d6debe2fd24f7eb3489b76ac4e4f2b6
 size 4198552

FST/checkpoint_step_1500/mss_encoder.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:25866998ebc841c69e7a321a58747c1f42e16bc3a2909aad674a56eb287eb926
 size 25261992

 version https://git-lfs.github.com/spec/v1
+oid sha256:bdce15a611e891e087fdee99b8293e4cf1aeec5fb0eb6f77fe36b054c2953131
 size 25261992

FST/checkpoint_step_1500/original_style_projection.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:cb635fc0ce7d94fa5f0f8f5535911c176911dd3072f8a4819032c3c8456bb2ee
 size 4198552

 version https://git-lfs.github.com/spec/v1
+oid sha256:f8400bf863b954053d97d0b99754e88e0d0f24e0df6266b7f8f8d88ba9e5d09d
 size 4198552

FST/checkpoint_step_1500/style_encoder.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:482252ceee1e2a054a2f4cfc19880b0326409c5b508290cc403d2ff0653a63fc
 size 82394556

 version https://git-lfs.github.com/spec/v1
+oid sha256:124f6b18f79bc42bd0cd5a5b86f5226904fb40f31fabea88ae63c8241eadcfe5
 size 82394556

FST/checkpoint_step_1500/training_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:2034e2335188e51d7a331851cec591ffb2a37cae3566ec7f2a271650474ec32e
 size 1349161373

 version https://git-lfs.github.com/spec/v1
+oid sha256:26a3a8195e1453b6396594bd84a83abeca1f3eb9faa42215f505397d30c1d453
 size 1349161373

FST/checkpoint_step_1500/unet.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ab3843aa9441306fffacb462bffbc01c5619970d34e2a95f315bf1d3bde4cb2f
 size 314927748

 version https://git-lfs.github.com/spec/v1
+oid sha256:6cb71e6bba58e7678a645966874bdee0b230ef0bf709aff85ed4d9e124431356
 size 314927748

FST/checkpoint_step_500/content_encoder.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c7b2947e049aacecc212cea7387db99a8870c1e0607cac6c3e604e47bfa81a24
+size 4756580

FST/checkpoint_step_500/fst_module.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e472bb2df7b716f1ff1c384186799a21cc89be8b7ed93febe82f3223433e7635
+size 238575652

FST/checkpoint_step_500/fst_projection.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ede81db437e817d7877f155c75106fad3b0fc75f4895e4c30a5beda49d9975f7
+size 4198552

FST/checkpoint_step_500/identity_loss_module.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:3ac907e1995c674cbe33c55038ccc3ee9ff880974a0e6b1f6115b29ed9bbce7b
+size 193688

FST/checkpoint_step_500/mss_encoder.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:5d2de586ed2a774f2c26ad9db5cdb0e9ecb7315eb404f95e4dc63915c7f0a0b3
+size 25261992

FST/checkpoint_step_500/original_style_projection.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:5dba2048bd189a22853a12b8752d63b5311e46cbbb7916b2052f20b2aef3a54d
+size 4198552

FST/checkpoint_step_500/style_encoder.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:13d420f37446c5b8c815cc5eae0397fa1aa5fd957eab427d2b4015b9d75e235f
+size 82394556

FST/checkpoint_step_500/training_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7394ca34be774e96a2d937294e723f4bb2d49bced90571a28792bfccbd19b5b6
+size 1349161373

FST/checkpoint_step_500/unet.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c1be7bc26eb6c8dbc959d173850a45807007d6f10879f0bd5b749c1687bccb81
+size 314927748

FST/logs/FontDiffuserFST_training_phase_1/events.out.tfevents.1770113474.b645e4c54d0e.17996.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c4455f15520dcdbe5f8b662184db2d46bd4e5e9d0fb3497e857aa14f069e862a
+size 88

FST/logs/FontDiffuserFST_training_phase_1/training_config_gradient_accumulation_steps/events.out.tfevents.1770113474.b645e4c54d0e.17996.4 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:faa95ff3d6fad951cbc79996dbf2aeb415749e89ebe0683412e2c5db289c111c
+size 139

FST/logs/FontDiffuserFST_training_phase_1/training_config_learning_rate/events.out.tfevents.1770113474.b645e4c54d0e.17996.1 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:985291cdbae0b1105fb521d0a42c4f490771a9481feeafdcd2073795a7c7395a
+size 139

FST/logs/FontDiffuserFST_training_phase_1/training_config_max_train_steps/events.out.tfevents.1770113474.b645e4c54d0e.17996.3 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c3fb7aa66369f0c6dbc2939195f26566bf04a00839875048241c42755c784c17
+size 139

FST/logs/FontDiffuserFST_training_phase_1/training_config_mixed_precision/events.out.tfevents.1770113474.b645e4c54d0e.17996.5 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:70499f78dcabda3130cecb1e773130de50e1db3535da48073990028a740418cd
+size 88

FST/logs/FontDiffuserFST_training_phase_1/training_config_train_batch_size/events.out.tfevents.1770113474.b645e4c54d0e.17996.2 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:64096d222d6869f1f9be0c1877e152b3f0ee81a6f92bfa8705125138df84547e
+size 139