dzungpham committed on
Commit
8679f41
·
verified ·
1 Parent(s): 822f018

Add converted safetensors and original pth weights

Browse files
FontDiffuser_training_phase_1_config.yaml CHANGED
@@ -16,12 +16,15 @@ data_root: my_dataset
16
  drop_prob: 0.1
17
  enable_style_transform: false
18
  experience_name: FontDiffuser_training_phase_1
19
- export_onnx_path: net_arch.onnx
20
  gradient_accumulation_steps: 2
21
  guidance_scale: 7.5
22
  guidance_type: classifier-free
 
 
 
23
  learning_rate: 0.0001
24
- local_rank: 0
25
  log_interval: 50
26
  logging_dir: logs
27
  lr_scheduler: cosine
@@ -66,4 +69,5 @@ unet_channels: !!python/tuple
66
  - 128
67
  - 256
68
  - 512
 
69
  val_interval: 100
 
16
  drop_prob: 0.1
17
  enable_style_transform: false
18
  experience_name: FontDiffuser_training_phase_1
19
+ export_onnx_path: null
20
  gradient_accumulation_steps: 2
21
  guidance_scale: 7.5
22
  guidance_type: classifier-free
23
+ hf_repo_id: dzungpham/font-diffusion-generated-data
24
+ hf_split: handwritten_original
25
+ hf_token: null
26
  learning_rate: 0.0001
27
+ local_rank: -1
28
  log_interval: 50
29
  logging_dir: logs
30
  lr_scheduler: cosine
 
69
  - 128
70
  - 256
71
  - 512
72
+ use_hf_dataset: true
73
  val_interval: 100
FontDiffuser_training_phase_2_config.yaml CHANGED
@@ -5,7 +5,7 @@ adam_weight_decay: 0.01
5
  algorithm_type: dpmsolver++
6
  beta_scheduler: scaled_linear
7
  channel_attn: true
8
- ckpt_interval: 250
9
  content_encoder_downsample_size: 3
10
  content_image_size: !!python/tuple
11
  - 96
@@ -14,10 +14,15 @@ content_start_channel: 64
14
  correcting_x0_fn: null
15
  data_root: my_dataset
16
  drop_prob: 0.1
 
17
  experience_name: FontDiffuser_training_phase_2
18
- gradient_accumulation_steps: 2
 
19
  guidance_scale: 7.5
20
  guidance_type: classifier-free
 
 
 
21
  learning_rate: 1.0e-05
22
  local_rank: -1
23
  log_interval: 50
@@ -25,22 +30,26 @@ logging_dir: logs
25
  lr_scheduler: constant
26
  lr_warmup_steps: 100
27
  max_grad_norm: 1.0
28
- max_train_steps: 500
29
  method: multistep
30
  mixed_precision: 'no'
31
  mode: refinement
32
  model_type: noise
33
  nce_layers: 0,1,2,3
34
  num_inference_steps: 20
35
- num_neg: 11
 
36
  offset_coefficient: 0.5
37
  order: 2
38
  output_dir: outputs/FontDiffuser
39
  perceptual_coefficient: 0.05
40
- phase_1_ckpt_dir: ckpt
 
41
  phase_2: true
42
  report_to: wandb
43
  resolution: 96
 
 
44
  sc_coefficient: 0.05
45
  scale_lr: false
46
  scr_ckpt_path: ckpt/scr_210000.pth
@@ -54,10 +63,11 @@ style_start_channel: 64
54
  t_end: null
55
  t_start: null
56
  temperature: 0.07
57
- train_batch_size: 8
58
  unet_channels: !!python/tuple
59
  - 64
60
  - 128
61
  - 256
62
  - 512
 
63
  val_interval: 100
 
5
  algorithm_type: dpmsolver++
6
  beta_scheduler: scaled_linear
7
  channel_attn: true
8
+ ckpt_interval: 1
9
  content_encoder_downsample_size: 3
10
  content_image_size: !!python/tuple
11
  - 96
 
14
  correcting_x0_fn: null
15
  data_root: my_dataset
16
  drop_prob: 0.1
17
+ enable_style_transform: false
18
  experience_name: FontDiffuser_training_phase_2
19
+ export_onnx_path: null
20
+ gradient_accumulation_steps: 1
21
  guidance_scale: 7.5
22
  guidance_type: classifier-free
23
+ hf_repo_id: dzungpham/font-diffusion-generated-data
24
+ hf_split: handwritten_original
25
+ hf_token: null
26
  learning_rate: 1.0e-05
27
  local_rank: -1
28
  log_interval: 50
 
30
  lr_scheduler: constant
31
  lr_warmup_steps: 100
32
  max_grad_norm: 1.0
33
+ max_train_steps: 2
34
  method: multistep
35
  mixed_precision: 'no'
36
  mode: refinement
37
  model_type: noise
38
  nce_layers: 0,1,2,3
39
  num_inference_steps: 20
40
+ num_neg: 12
41
+ num_workers: 4
42
  offset_coefficient: 0.5
43
  order: 2
44
  output_dir: outputs/FontDiffuser
45
  perceptual_coefficient: 0.05
46
+ phase_1: false
47
+ phase_1_ckpt_dir: outputs/FontDiffuser/checkpoint_step_1000
48
  phase_2: true
49
  report_to: wandb
50
  resolution: 96
51
+ resume_from_checkpoint: null
52
+ save_full_model: false
53
  sc_coefficient: 0.05
54
  scale_lr: false
55
  scr_ckpt_path: ckpt/scr_210000.pth
 
63
  t_end: null
64
  t_start: null
65
  temperature: 0.07
66
+ train_batch_size: 16
67
  unet_channels: !!python/tuple
68
  - 64
69
  - 128
70
  - 256
71
  - 512
72
+ use_hf_dataset: true
73
  val_interval: 100
checkpoint_step_1/content_encoder.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:90d470624b5cbb4300ff2a54d716adb77d06f94f0530b31da30f422d67b99798
3
+ size 4756580
checkpoint_step_1/scr.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7618bed9fb85450d0c95b57c7e874ddf725606cf9b90da6295a0c835c3332790
3
+ size 284227968
checkpoint_step_1/style_encoder.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eeec15da854c814b48d5a5d85e3e667905e697ee5b7ec1dc43a4794b31615cb7
3
+ size 82394556
checkpoint_step_1/training_state.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9e5c434c81202c7b62c1b19bf34d041b8ba18d40156feed3431fbcda684fd297
3
+ size 1206964193
checkpoint_step_1/unet.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:41b460184de2f7239493374e09434005a0c90842f83cbda706743f2fc367aed5
3
+ size 314927748
checkpoint_step_1000/content_encoder.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8302106359a2f47262f83d3793a3d5a84901b051fb9ca83733e5bf05596b3bb8
3
  size 4756580
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8c443fd0f0f8a31406ed436ad47c5ad79052e6ff387b647b43807aaa9d1f7d35
3
  size 4756580
checkpoint_step_1000/style_encoder.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fd9a15d7c7463cf4c631ee05946562bb5d7451f944e69f019ba3611d1ca04e11
3
  size 82394556
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:722699298a1d4922e4fa2e5e86b713c328b2f37a181dad85516b00c557293331
3
  size 82394556
checkpoint_step_1000/training_state.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:291281b64ae387f05fc853c0ac4cd3ea30452aaf53db0bda6059cdd1c875059f
3
- size 1206964193
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b9d7e49e1038f80535cb9920fd36ed114f2cf1d93f1a53b9d894ae4899ce2400
3
+ size 1206964257
checkpoint_step_1000/unet.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9001dfa303a2b68ec78e9495e5b75345ca0dcbd541007e7b240643e308dd1e40
3
  size 314927748
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:29804a197cfdce5ae634e49e7abe1e7db43da6f56d312cd2db6127f7188abfde
3
  size 314927748
checkpoint_step_500/content_encoder.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ce108e8b264e1be106a965a86805fd47b25db7f3fdf93b4ef2ac8c05513fa28d
3
  size 4756580
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3ef7bb5823c6614ce7983455a3e9b41d17032377ba9c0c18454f5abdc13d4ba
3
  size 4756580
checkpoint_step_500/style_encoder.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e4c53dd00df78c41e1977f5f2a17d4c9e0d92cafe87a88890ae0e4f906d468c7
3
  size 82394556
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bd8574fdcd0cd3dbbc694c707cb3f6dd96bc6563e26bb108922a22a674405275
3
  size 82394556
checkpoint_step_500/training_state.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b12ad4fc475384fc57187c4ef34e2c32fb36ddeb26ce44004eda12d44a6edd8b
3
- size 1206964193
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b733b27e3d901d38344835618c38903398a2851100ea955c186ffd0ed08b69bf
3
+ size 1206964257
checkpoint_step_500/unet.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:617b2e33aa034f2853b99c870afffefb88e7057a838e234746ff6a7a379a16aa
3
  size 314927748
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:000b933fe6ad05bfe85a7828f3ed3fe315c234216c3026e61b3e1ea9e22ed0eb
3
  size 314927748