{
"seed": 42,
"debug": false,
"wandb": true,
"mask_ratio": 0.9,
"noise": 0.0,
"datamodule": {
"batch_size": 32,
"pin_memory": true,
"num_workers": 12,
"_target_": "tedbench.data.LightningStructureDataset",
"root": "./datasets/ted",
"dataset_name": "afdb_stream"
},
"trainer": {
"_target_": "pytorch_lightning.Trainer",
"accelerator": "auto",
"max_steps": 100000,
"strategy": "auto",
"devices": "auto",
"default_root_dir": "${logs.path}",
"num_sanity_val_steps": 0,
"val_check_interval": 1000,
"check_val_every_n_epoch": null,
"accumulate_grad_batches": 4,
"num_nodes": 4
},
"train": {
"optimizer": {
"_target_": "torch.optim.AdamW",
"lr": 0.0024,
"weight_decay": 0.05,
"betas": [
0.9,
0.95
]
},
"lr_scheduler": {
"_target_": "tedbench.lr_schedulers.get_cosine_schedule_with_warmup",
"warmup_steps": 5000,
"max_steps": "${eval:0.99 * ${trainer.max_steps}}",
"min_factor": 0.1
},
"ckpt_path": null,
"compile": false
},
"model": {
"_target_": "tedbench.model.miae_model",
"name": "miae_s",
"use_seq_input": false,
"masking_strategy": "fixed",
"use_inverse_folding_loss": true
},
"logs": {
"prefix": "logs/pretrain/${datamodule.dataset_name}/${seed}",
"path": "${logs.prefix}/runs/${now:%Y-%m-%d}_${now:%H-%M-%S}"
},
"mode": {},
"_model_class": "miae"
}