{
  "learning_rate": 0.0001,
  "weight_decay": 0.01,
  "betas": [0.9, 0.95],
  "grad_clip": 1.0,
  "optimizer": "adamw",
  "warmup_steps": 500,
  "total_steps": 417059,
  "max_epochs": 100,
  "lr_scheduler": "constant",
  "min_lr": 1e-06,
  "warmup_type": "linear",
  "gradient_accumulation": 8,
  "gradient_checkpointing": false,
  "compile_mode": null,
  "ema_decay": 0.9999,
  "shift": 3.0,
  "use_snr_weighting": true,
  "snr_gamma": 5.0,
  "use_huber_loss": true,
  "huber_delta": 0.1,
  "logit_normal_sampling": true,
  "logit_mean": 0.0,
  "logit_std": 1.0,
  "enable_lune": true,
  "lune_weight": 0.1,
  "lune_warmup_steps": 1000,
  "lune_dropout": 0.1,
  "lune_mode": "cosine",
  "enable_sol": true,
  "sol_weight": 0.05,
  "sol_warmup_steps": 2000,
  "sol_dropout": 0.1,
  "use_spatial_weighting": false,
  "text_dropout": 0.1,
  "checkpoint_dir": "./checkpoints",
  "save_every_steps": 1562,
  "keep_last_n_steps": 5,
  "save_every_epochs": 1,
  "keep_last_n_epochs": 3,
  "log_every": 20,
  "tensorboard_dir": "./logs",
  "sample_every": 500,
  "sample_prompts": [
    "subject, object, a red cube on a blue sphere",
    "subject, a golden retriever sitting on grass",
    "subject, object, a coffee cup next to a laptop",
    "subject, a woman with short hair smiling"
  ],
  "sample_dir": "./samples",
  "dtype": "torch.bfloat16",
  "hf_repo_id": "AbstractPhil/tiny-flux-deep",
  "upload_every_steps": 1562,
  "upload_every_epochs": 0
}