jwheo committed on
Commit
32f218c
·
verified ·
1 Parent(s): 86cbd04

Add photo100k XL configs

Browse files
configs/diffusion_photo100k_xl_stage4_condition_v3.yaml ADDED
@@ -0,0 +1,101 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ project:
2
+ name: diffusion_photo100k_xl_stage4_condition_v3_b8
3
+ output_dir: /home/jwheojjang/scratch/sr-diffusion/runs/diffusion_photo100k_xl_stage4_condition_v3_b8
4
+
5
+ logging:
6
+ wandb:
7
+ enabled: true
8
+ project: sr-diffusion
9
+ name: diffusion_photo100k_xl_stage4_condition_v3_b8
10
+ mode: online
11
+ dir: /home/jwheojjang/scratch/sr-diffusion/wandb
12
+ tags: [stage4, diffusion, condition-start, photo100k, degradation-v3-noise, xl, unet-470m, b8-accum4]
13
+ watch: false
14
+ samples:
15
+ enabled: true
16
+ split: val
17
+ fallback_split: train
18
+ count: 4
19
+ indices: [0, 1, 2, 3]
20
+ init: condition
21
+
22
+ seed: 1337
23
+
24
+ autoencoder:
25
+ config: configs/autoencoder_photo10k.yaml
26
+ checkpoint: /home/jwheojjang/scratch/sr-diffusion/runs/autoencoder_photo10k_b16_eval_online/checkpoints/best_eval_recon.pt
27
+
28
+ condition_encoder:
29
+ config: configs/latent_pretrain_photo100k_v3_noise_xl.yaml
30
+ checkpoint: /home/jwheojjang/scratch/sr-diffusion/runs/latent_pretrain_photo100k_v3_noise_xl_b64/checkpoints/best_eval_latent.pt
31
+ trainable: false
32
+
33
+ data:
34
+ manifest: /home/jwheojjang/scratch/sr-diffusion/data/manifest_photo100k.csv
35
+ split: train
36
+ hr_size: 512
37
+ scale: 4
38
+ degradation_preset: photo_v3_noise_mix
39
+ domains:
40
+ photo: 0
41
+ anime: 1
42
+ num_workers: 8
43
+
44
+ model:
45
+ type: conditional_unet
46
+ latent_channels: 16
47
+ condition_channels: 16
48
+ out_channels: 16
49
+ base_channels: 128
50
+ channel_multipliers: [1, 2, 4, 8]
51
+ num_res_blocks: 6
52
+ norm_groups: 32
53
+ num_heads: 8
54
+ attention_resolutions: [32, 16]
55
+ base_resolution: 128
56
+ num_domains: 2
57
+
58
+ diffusion:
59
+ num_train_timesteps: 1000
60
+ beta_schedule: linear
61
+ beta_start: 0.0001
62
+ beta_end: 0.02
63
+ sample_timestep: 50
64
+ train_min_timestep: 25
65
+ train_max_timestep: 125
66
+ train_init: condition
67
+
68
+ sampling:
69
+ init: condition
70
+ start_timestep: 25
71
+ steps: 32
72
+
73
+ loss:
74
+ noise_weight: 0.05
75
+ x0_weight: 1.0
76
+
77
+ train:
78
+ device: auto
79
+ dtype: bf16
80
+ batch_size: 8
81
+ max_steps: 20000
82
+ lr: 0.000005
83
+ weight_decay: 0.0
84
+ grad_accum_steps: 4
85
+ log_every: 25
86
+ save_every: 1000
87
+ sample_every: 500
88
+
89
+ eval:
90
+ enabled: true
91
+ split: val
92
+ limit: 100
93
+ batch_size: 8
94
+ num_workers: 8
95
+ every: 500
96
+ run_at_start: true
97
+ timestep: 50
98
+ init: condition
99
+ best_metric: eval/decoded_mse
100
+ best_mode: min
101
+ best_checkpoint: best_eval_condition_decoded.pt