File size: 2,167 Bytes
e1e2753
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
# Run-level and evaluation settings.
# The path segments of run_dir echo other values in this file: imagenet_512
# (resolution: 512), dc_ae_f32c32_in_1.0 (autoencoder), lr_2e-4
# (optimizer.lr: 0.0002) and fp16 (amp).
# NOTE(review): bs_1024 is presumably the global batch size; the dataset
# sections in this file set batch_size: 32 — confirm how the two relate.
run_dir: .exp/diffusion/imagenet_512/dc_ae_f32c32_in_1.0/dit_xl_1/bs_1024_lr_2e-4_fp16
seed: 0
allow_tf32: true
resolution: 512
amp: fp16
# presumably the classifier-free guidance scale — TODO confirm
cfg_scale: 1.0
evaluate_split: test
evaluate_dir_name: null
num_save_images: 64
save_all_images: false
save_images_at_all_procs: false
# The value matches the key of the `sample_class` section that follows.
evaluate_dataset: sample_class
# Options for the `sample_class` dataset; the top-level `evaluate_dataset`
# key names this section.
sample_class:
  name: sample_class
  batch_size: 32
  n_worker: 8
  train_drop_last: true
  seed: 0
  # Same class count as `dit.num_classes` and `uvit.num_classes` (1000).
  num_classes: 1000
  # presumably the number of samples generated per evaluation — TODO confirm
  num_samples: 50000
# Autoencoder selection. Its dtype (fp32) is set separately from the
# top-level `amp: fp16`.
autoencoder: dc-ae-f32c32-in-1.0
autoencoder_dtype: fp32
# presumably the scale applied to the autoencoder latents — TODO confirm
scaling_factor: 0.3189
# The value of `model` matches the `dit` section key; presumably it selects
# which model section is used — verify against the loader.
model: dit
dit:
  name: DiT
  # NOTE(review): 16 equals resolution 512 divided by 32, which lines up with
  # "f32" in the autoencoder name — presumably the latent grid size; confirm.
  input_size: 16
  patch_size: 1
  # NOTE(review): lines up with "c32" in the autoencoder name — presumably
  # the latent channel count; confirm.
  in_channels: 32
  hidden_size: 1152
  depth: 28
  num_heads: 16
  mlp_ratio: 4.0
  post_norm: false
  class_dropout_prob: 0.1
  num_classes: 1000
  learn_sigma: true
  unconditional: false
  use_checkpoint: true
  pretrained_path: null
  pretrained_source: dc-ae
  # Training and evaluation both name the GaussianDiffusion scheduler;
  # num_inference_steps is 250 here versus 30 in the `uvit` section.
  eval_scheduler: GaussianDiffusion
  num_inference_steps: 250
  train_scheduler: GaussianDiffusion
# Options for the UViT model.
# NOTE(review): `model` is set to `dit`, so this section is presumably unused
# for this run — confirm before editing or removing it.
uvit:
  name: UViT
  # NOTE(review): input_size 32 / in_channels 4 differ from the `dit` section
  # (16 / 32); presumably left at defaults — TODO confirm.
  input_size: 32
  patch_size: 2
  in_channels: 4
  hidden_size: 1152
  depth: 28
  num_heads: 16
  mlp_ratio: 4.0
  mlp_time_embed: false
  qkv_bias: false
  act_layer: gelu
  use_checkpoint: true
  class_dropout_prob: 0.1
  num_classes: 1000
  pretrained_path: null
  pretrained_source: dc-ae
  # Training and evaluation both name the DPM_Solver scheduler, with 30
  # inference steps.
  eval_scheduler: DPM_Solver
  num_inference_steps: 30
  train_scheduler: DPM_Solver
  attn_mode: null
# Evaluation metrics: both the FID and inception-score flags are enabled.
compute_fid: true
fid:
  save_path: null
  # The file name refers to the ImageNet 512 train split; presumably holds
  # precomputed reference statistics — TODO confirm.
  ref_path: assets/data/fid/imagenet_512_train.npz
compute_inception_score: true
# Empty mapping: no inception-score options are set in this file.
inception_score: {}
# The value matches the key of the `latent_imagenet` section that follows.
train_dataset: latent_imagenet
latent_imagenet:
  name: latent_imagenet
  batch_size: 32
  n_worker: 8
  train_drop_last: true
  seed: 0
  # Path segments echo the autoencoder name (dc_ae_f32c32_in_1.0) and the
  # resolution (imagenet_512).
  data_dir: assets/data/latent/dc_ae_f32c32_in_1.0/imagenet_512
# Resume, run-length and checkpoint/evaluation cadence settings.
resume: true
resume_path: null
resume_schedule: true
# num_epochs is null while max_steps is set; presumably the run length is
# governed by max_steps — TODO confirm.
num_epochs: null
max_steps: 3000000
# presumably null means no gradient clipping — TODO confirm
clip_grad: null
num_store_images: 64
# With these values, evaluate_steps is 20x save_checkpoint_steps.
save_checkpoint_steps: 1000
evaluate_steps: 20000
# Optimizer settings.
optimizer:
  name: adamw
  # 0.0002 agrees with the "lr_2e-4" segment of run_dir.
  lr: 0.0002
  warmup_lr: 0.0
  weight_decay: 0.0
  # Empty list: no keys are listed here.
  no_wd_keys: []
  betas:
  - 0.9
  - 0.999
# Learning-rate schedule: named `constant`, with 1000 warmup steps.
# NOTE(review): presumably warms up from optimizer.warmup_lr (0.0) to
# optimizer.lr — confirm against the scheduler implementation.
lr_scheduler:
  name: constant
  warmup_steps: 1000
# Logging and EMA settings.
log: true
# Both wandb fields are null in this file.
wandb_entity: null
wandb_project: null
# presumably an exponential moving average of the model weights, with
# evaluate_ema choosing to evaluate those weights — TODO confirm.
ema_decay: 0.9999
ema_warmup_steps: 2000
evaluate_ema: true