| adam_beta1: 0.9 | |
| adam_beta2: 0.999 | |
| adam_epsilon: 1.0e-08 | |
| adam_weight_decay: 0.01 | |
| algorithm_type: dpmsolver++ | |
| beta_scheduler: scaled_linear | |
| channel_attn: true | |
| ckpt_interval: 250 | |
| content_encoder_downsample_size: 3 | |
| content_image_size: !!python/tuple | |
| - 96 | |
| - 96 | |
| content_start_channel: 64 | |
| correcting_x0_fn: null | |
| data_root: my_dataset | |
| drop_prob: 0.1 | |
| experience_name: FontDiffuser_training_phase_2 | |
| gradient_accumulation_steps: 2 | |
| guidance_scale: 7.5 | |
| guidance_type: classifier-free | |
| learning_rate: 1.0e-05 | |
| local_rank: -1 | |
| log_interval: 50 | |
| logging_dir: logs | |
| lr_scheduler: constant | |
| lr_warmup_steps: 100 | |
| max_grad_norm: 1.0 | |
| max_train_steps: 500 | |
| method: multistep | |
| mixed_precision: 'no' | |
| mode: refinement | |
| model_type: noise | |
| nce_layers: 0,1,2,3 | |
| num_inference_steps: 20 | |
| num_neg: 11 | |
| offset_coefficient: 0.5 | |
| order: 2 | |
| output_dir: outputs/FontDiffuser | |
| perceptual_coefficient: 0.05 | |
| phase_1_ckpt_dir: ckpt | |
| phase_2: true | |
| report_to: wandb | |
| resolution: 96 | |
| sc_coefficient: 0.05 | |
| scale_lr: false | |
| scr_ckpt_path: ckpt/scr_210000.pth | |
| scr_image_size: 96 | |
| seed: 123 | |
| skip_type: time_uniform | |
| style_image_size: !!python/tuple | |
| - 96 | |
| - 96 | |
| style_start_channel: 64 | |
| t_end: null | |
| t_start: null | |
| temperature: 0.07 | |
| train_batch_size: 8 | |
| unet_channels: !!python/tuple | |
| - 64 | |
| - 128 | |
| - 256 | |
| - 512 | |
| val_interval: 100 | |