Add converted safetensors and original pth weights
Browse files
- FontDiffuser_training_phase_1_config.yaml +6 -2
- FontDiffuser_training_phase_2_config.yaml +16 -6
- checkpoint_step_1/content_encoder.safetensors +3 -0
- checkpoint_step_1/scr.safetensors +3 -0
- checkpoint_step_1/style_encoder.safetensors +3 -0
- checkpoint_step_1/training_state.pt +3 -0
- checkpoint_step_1/unet.safetensors +3 -0
- checkpoint_step_1000/content_encoder.safetensors +1 -1
- checkpoint_step_1000/style_encoder.safetensors +1 -1
- checkpoint_step_1000/training_state.pt +2 -2
- checkpoint_step_1000/unet.safetensors +1 -1
- checkpoint_step_500/content_encoder.safetensors +1 -1
- checkpoint_step_500/style_encoder.safetensors +1 -1
- checkpoint_step_500/training_state.pt +2 -2
- checkpoint_step_500/unet.safetensors +1 -1
FontDiffuser_training_phase_1_config.yaml
CHANGED
|
@@ -16,12 +16,15 @@ data_root: my_dataset
|
|
| 16 |
drop_prob: 0.1
|
| 17 |
enable_style_transform: false
|
| 18 |
experience_name: FontDiffuser_training_phase_1
|
| 19 |
-
export_onnx_path:
|
| 20 |
gradient_accumulation_steps: 2
|
| 21 |
guidance_scale: 7.5
|
| 22 |
guidance_type: classifier-free
|
|
|
|
|
|
|
|
|
|
| 23 |
learning_rate: 0.0001
|
| 24 |
-
local_rank:
|
| 25 |
log_interval: 50
|
| 26 |
logging_dir: logs
|
| 27 |
lr_scheduler: cosine
|
|
@@ -66,4 +69,5 @@ unet_channels: !!python/tuple
|
|
| 66 |
- 128
|
| 67 |
- 256
|
| 68 |
- 512
|
|
|
|
| 69 |
val_interval: 100
|
|
|
|
| 16 |
drop_prob: 0.1
|
| 17 |
enable_style_transform: false
|
| 18 |
experience_name: FontDiffuser_training_phase_1
|
| 19 |
+
export_onnx_path: null
|
| 20 |
gradient_accumulation_steps: 2
|
| 21 |
guidance_scale: 7.5
|
| 22 |
guidance_type: classifier-free
|
| 23 |
+
hf_repo_id: dzungpham/font-diffusion-generated-data
|
| 24 |
+
hf_split: handwritten_original
|
| 25 |
+
hf_token: null
|
| 26 |
learning_rate: 0.0001
|
| 27 |
+
local_rank: -1
|
| 28 |
log_interval: 50
|
| 29 |
logging_dir: logs
|
| 30 |
lr_scheduler: cosine
|
|
|
|
| 69 |
- 128
|
| 70 |
- 256
|
| 71 |
- 512
|
| 72 |
+
use_hf_dataset: true
|
| 73 |
val_interval: 100
|
FontDiffuser_training_phase_2_config.yaml
CHANGED
|
@@ -5,7 +5,7 @@ adam_weight_decay: 0.01
|
|
| 5 |
algorithm_type: dpmsolver++
|
| 6 |
beta_scheduler: scaled_linear
|
| 7 |
channel_attn: true
|
| 8 |
-
ckpt_interval:
|
| 9 |
content_encoder_downsample_size: 3
|
| 10 |
content_image_size: !!python/tuple
|
| 11 |
- 96
|
|
@@ -14,10 +14,15 @@ content_start_channel: 64
|
|
| 14 |
correcting_x0_fn: null
|
| 15 |
data_root: my_dataset
|
| 16 |
drop_prob: 0.1
|
|
|
|
| 17 |
experience_name: FontDiffuser_training_phase_2
|
| 18 |
-
|
|
|
|
| 19 |
guidance_scale: 7.5
|
| 20 |
guidance_type: classifier-free
|
|
|
|
|
|
|
|
|
|
| 21 |
learning_rate: 1.0e-05
|
| 22 |
local_rank: -1
|
| 23 |
log_interval: 50
|
|
@@ -25,22 +30,26 @@ logging_dir: logs
|
|
| 25 |
lr_scheduler: constant
|
| 26 |
lr_warmup_steps: 100
|
| 27 |
max_grad_norm: 1.0
|
| 28 |
-
max_train_steps:
|
| 29 |
method: multistep
|
| 30 |
mixed_precision: 'no'
|
| 31 |
mode: refinement
|
| 32 |
model_type: noise
|
| 33 |
nce_layers: 0,1,2,3
|
| 34 |
num_inference_steps: 20
|
| 35 |
-
num_neg:
|
|
|
|
| 36 |
offset_coefficient: 0.5
|
| 37 |
order: 2
|
| 38 |
output_dir: outputs/FontDiffuser
|
| 39 |
perceptual_coefficient: 0.05
|
| 40 |
-
|
|
|
|
| 41 |
phase_2: true
|
| 42 |
report_to: wandb
|
| 43 |
resolution: 96
|
|
|
|
|
|
|
| 44 |
sc_coefficient: 0.05
|
| 45 |
scale_lr: false
|
| 46 |
scr_ckpt_path: ckpt/scr_210000.pth
|
|
@@ -54,10 +63,11 @@ style_start_channel: 64
|
|
| 54 |
t_end: null
|
| 55 |
t_start: null
|
| 56 |
temperature: 0.07
|
| 57 |
-
train_batch_size:
|
| 58 |
unet_channels: !!python/tuple
|
| 59 |
- 64
|
| 60 |
- 128
|
| 61 |
- 256
|
| 62 |
- 512
|
|
|
|
| 63 |
val_interval: 100
|
|
|
|
| 5 |
algorithm_type: dpmsolver++
|
| 6 |
beta_scheduler: scaled_linear
|
| 7 |
channel_attn: true
|
| 8 |
+
ckpt_interval: 1
|
| 9 |
content_encoder_downsample_size: 3
|
| 10 |
content_image_size: !!python/tuple
|
| 11 |
- 96
|
|
|
|
| 14 |
correcting_x0_fn: null
|
| 15 |
data_root: my_dataset
|
| 16 |
drop_prob: 0.1
|
| 17 |
+
enable_style_transform: false
|
| 18 |
experience_name: FontDiffuser_training_phase_2
|
| 19 |
+
export_onnx_path: null
|
| 20 |
+
gradient_accumulation_steps: 1
|
| 21 |
guidance_scale: 7.5
|
| 22 |
guidance_type: classifier-free
|
| 23 |
+
hf_repo_id: dzungpham/font-diffusion-generated-data
|
| 24 |
+
hf_split: handwritten_original
|
| 25 |
+
hf_token: null
|
| 26 |
learning_rate: 1.0e-05
|
| 27 |
local_rank: -1
|
| 28 |
log_interval: 50
|
|
|
|
| 30 |
lr_scheduler: constant
|
| 31 |
lr_warmup_steps: 100
|
| 32 |
max_grad_norm: 1.0
|
| 33 |
+
max_train_steps: 2
|
| 34 |
method: multistep
|
| 35 |
mixed_precision: 'no'
|
| 36 |
mode: refinement
|
| 37 |
model_type: noise
|
| 38 |
nce_layers: 0,1,2,3
|
| 39 |
num_inference_steps: 20
|
| 40 |
+
num_neg: 12
|
| 41 |
+
num_workers: 4
|
| 42 |
offset_coefficient: 0.5
|
| 43 |
order: 2
|
| 44 |
output_dir: outputs/FontDiffuser
|
| 45 |
perceptual_coefficient: 0.05
|
| 46 |
+
phase_1: false
|
| 47 |
+
phase_1_ckpt_dir: outputs/FontDiffuser/checkpoint_step_1000
|
| 48 |
phase_2: true
|
| 49 |
report_to: wandb
|
| 50 |
resolution: 96
|
| 51 |
+
resume_from_checkpoint: null
|
| 52 |
+
save_full_model: false
|
| 53 |
sc_coefficient: 0.05
|
| 54 |
scale_lr: false
|
| 55 |
scr_ckpt_path: ckpt/scr_210000.pth
|
|
|
|
| 63 |
t_end: null
|
| 64 |
t_start: null
|
| 65 |
temperature: 0.07
|
| 66 |
+
train_batch_size: 16
|
| 67 |
unet_channels: !!python/tuple
|
| 68 |
- 64
|
| 69 |
- 128
|
| 70 |
- 256
|
| 71 |
- 512
|
| 72 |
+
use_hf_dataset: true
|
| 73 |
val_interval: 100
|
checkpoint_step_1/content_encoder.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:90d470624b5cbb4300ff2a54d716adb77d06f94f0530b31da30f422d67b99798
|
| 3 |
+
size 4756580
|
checkpoint_step_1/scr.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7618bed9fb85450d0c95b57c7e874ddf725606cf9b90da6295a0c835c3332790
|
| 3 |
+
size 284227968
|
checkpoint_step_1/style_encoder.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:eeec15da854c814b48d5a5d85e3e667905e697ee5b7ec1dc43a4794b31615cb7
|
| 3 |
+
size 82394556
|
checkpoint_step_1/training_state.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9e5c434c81202c7b62c1b19bf34d041b8ba18d40156feed3431fbcda684fd297
|
| 3 |
+
size 1206964193
|
checkpoint_step_1/unet.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:41b460184de2f7239493374e09434005a0c90842f83cbda706743f2fc367aed5
|
| 3 |
+
size 314927748
|
checkpoint_step_1000/content_encoder.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4756580
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8c443fd0f0f8a31406ed436ad47c5ad79052e6ff387b647b43807aaa9d1f7d35
|
| 3 |
size 4756580
|
checkpoint_step_1000/style_encoder.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 82394556
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:722699298a1d4922e4fa2e5e86b713c328b2f37a181dad85516b00c557293331
|
| 3 |
size 82394556
|
checkpoint_step_1000/training_state.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b9d7e49e1038f80535cb9920fd36ed114f2cf1d93f1a53b9d894ae4899ce2400
|
| 3 |
+
size 1206964257
|
checkpoint_step_1000/unet.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 314927748
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:29804a197cfdce5ae634e49e7abe1e7db43da6f56d312cd2db6127f7188abfde
|
| 3 |
size 314927748
|
checkpoint_step_500/content_encoder.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4756580
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e3ef7bb5823c6614ce7983455a3e9b41d17032377ba9c0c18454f5abdc13d4ba
|
| 3 |
size 4756580
|
checkpoint_step_500/style_encoder.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 82394556
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:bd8574fdcd0cd3dbbc694c707cb3f6dd96bc6563e26bb108922a22a674405275
|
| 3 |
size 82394556
|
checkpoint_step_500/training_state.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b733b27e3d901d38344835618c38903398a2851100ea955c186ffd0ed08b69bf
|
| 3 |
+
size 1206964257
|
checkpoint_step_500/unet.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 314927748
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:000b933fe6ad05bfe85a7828f3ed3fe315c234216c3026e61b3e1ea9e22ed0eb
|
| 3 |
size 314927748
|