{
  "samples_dir": "/scratch/local/ssd2/jialinyu/remasker/train-AE/samples",
  "output_root": "/homes/55/jialinyu/Bohang/remasker/s3_pretrain/checkpoints",
  "run_name": "dream-ae-v1",
  "seed": 42,
  "train_batch_size": 16,
  "eval_batch_size": 8,
  "num_workers": 4,
  "max_steps": 20000,
  "eval_every": 1000,
  "save_every": 2000,
  "learning_rate": 0.0001,
  "weight_decay": 0.01,
  "max_grad_norm": 1.0,
  "lr_reduce_patience": 3,
  "early_stop_patience": 8,
  "device": "cuda:7",
  "resume": null,
  "backend": "nccl",
  "local_rank": -1,
  "d_model": 3584,
  "d_hidden_bottleneck": 256,
  "d_delta_bottleneck": 32,
  "dropout": 0.1
}