{
  "learning_rate": 0.0001,
  "weight_decay": 0.01,
  "betas": [
    0.9,
    0.95
  ],
  "grad_clip": 1.0,
  "optimizer": "adamw",
  "warmup_steps": 500,
  "total_steps": 417059,
  "max_epochs": 100,
  "lr_scheduler": "constant",
  "min_lr": 1e-06,
  "warmup_type": "linear",
  "gradient_accumulation": 8,
  "gradient_checkpointing": false,
  "compile_mode": null,
  "ema_decay": 0.9999,
  "shift": 3.0,
  "use_snr_weighting": true,
  "snr_gamma": 5.0,
  "use_huber_loss": true,
  "huber_delta": 0.1,
  "logit_normal_sampling": true,
  "logit_mean": 0.0,
  "logit_std": 1.0,
  "enable_lune": true,
  "lune_weight": 0.1,
  "lune_warmup_steps": 1000,
  "lune_dropout": 0.1,
  "lune_mode": "cosine",
  "enable_sol": true,
  "sol_weight": 0.05,
  "sol_warmup_steps": 2000,
  "sol_dropout": 0.1,
  "use_spatial_weighting": false,
  "text_dropout": 0.1,
  "checkpoint_dir": "./checkpoints",
  "save_every_steps": 1562,
  "keep_last_n_steps": 5,
  "save_every_epochs": 1,
  "keep_last_n_epochs": 3,
  "log_every": 20,
  "tensorboard_dir": "./logs",
  "sample_every": 500,
  "sample_prompts": [
    "subject, object, a red cube on a blue sphere",
    "subject, a golden retriever sitting on grass",
    "subject, object, a coffee cup next to a laptop",
    "subject, a woman with short hair smiling"
  ],
  "sample_dir": "./samples",
  "dtype": "torch.bfloat16",
  "hf_repo_id": "AbstractPhil/tiny-flux-deep",
  "upload_every_steps": 1562,
  "upload_every_epochs": 0
}