{ "dataset": { "batch_duplicates": 1, "cache_dataset": true, "cropping": "none", "eval_split": "test", "flipping": "left_right", "image_size": 32, "name": "object_recognition", "num_classes": 10, "tfds_name": "cifar10", "train_split": "train" }, "datasets": [ { "batch_duplicates": 1, "cache_dataset": true, "cropping": "none", "eval_split": "test", "flipping": "left_right", "image_size": 32, "name": "object_recognition", "num_classes": 10, "tfds_name": "cifar10", "train_split": "train" } ], "eval": { "batch_size": 64, "checkpoint_dir": "", "steps": 2, "tag": "eval", "write_images_to_file": true }, "model": { "arch_name": "tape", "b_scale": 1.0, "b_type": "uint8", "cond_decoupled_read": false, "cond_dim": 0, "cond_dropout": 0.0, "cond_on_latent": true, "cond_proj": true, "cond_tape_writable": false, "conditional": "class", "conv_drop_units": 0.0, "conv_kernel_size": 0, "drop_att": 0.0, "drop_path": 0.1, "drop_sc": 0.0, "drop_units": 0.1, "flip_rate": 0.0, "guidance": 0.0, "infer_iterations": 100, "infer_schedule": "cosine", "latent_dim": 512, "latent_mlp_ratio": 4, "latent_num_heads": 16, "latent_pos_encoding": "learned", "latent_slots": 128, "loss_type": "eps", "name": "image_diffusion_model", "normalize_noisy_input": false, "num_layers": "2,2,2", "patch_size": 2, "pos_encoding": "sin_cos", "pred_type": "eps", "pretrained_ckpt": "", "rw_num_heads": 8, "sampler_name": "ddpm", "self_cond": "latent", "self_cond_by_masking": true, "self_cond_rate": 0.9, "tape_dim": 256, "tape_mlp_ratio": 2, "tape_pos_encoding": "learned", "td": 0.0, "time_on_latent": true, "time_scaling": 1000, "train_schedule": "sigmoid@-3,3,0.9", "use_cls_token": false, "x0_clip": "auto", "xattn_enc_ln": false }, "model_dir": "results/cifar10", "optimization": { "beta1": 0.9, "beta2": 0.999, "ema_decay": 0.9999, "ema_name_exact_match": true, "end_lr_factor": 0.0, "eps": 1e-08, "exclude_from_weight_decay": "bias,beta,gamma", "global_clipnorm": 1.0, "learning_rate": 0.003, "learning_rate_scaling": "none", "learning_rate_schedule": "cosine@0.8", "momentum": 0.9, "optimizer": "lamb", "tail_steps": 0, "warmup_epochs": 0, "warmup_steps": 10000, "weight_decay": 0.01 }, "task": { "name": "image_generation", "weight": 1.0 }, "tasks": [ { "name": "image_generation", "weight": 1.0 } ], "train": { "batch_size": 256, "checkpoint_epochs": 40, "checkpoint_steps": 1000, "epochs": 100, "keep_checkpoint_max": 10, "label_smoothing": 0.0, "steps": 150000 } }