miae-l / config.json
dexiongc's picture
Upload folder using huggingface_hub
f793c7a verified
raw
history blame
1.47 kB
{
"seed": 42,
"debug": false,
"wandb": true,
"mask_ratio": 0.9,
"noise": 0.0,
"datamodule": {
"batch_size": 32,
"pin_memory": true,
"num_workers": 12,
"_target_": "tedbench.data.LightningStructureDataset",
"root": "./datasets/ted",
"dataset_name": "afdb_stream"
},
"trainer": {
"_target_": "pytorch_lightning.Trainer",
"accelerator": "auto",
"max_steps": 100000,
"strategy": "auto",
"devices": "auto",
"default_root_dir": "${logs.path}",
"num_sanity_val_steps": 0,
"val_check_interval": 1000,
"check_val_every_n_epoch": null,
"accumulate_grad_batches": 4,
"num_nodes": 4
},
"train": {
"optimizer": {
"_target_": "torch.optim.AdamW",
"lr": 0.0024,
"weight_decay": 0.05,
"betas": [
0.9,
0.95
]
},
"lr_scheduler": {
"_target_": "tedbench.lr_schedulers.get_cosine_schedule_with_warmup",
"warmup_steps": 5000,
"max_steps": "${eval:0.99 * ${trainer.max_steps}}",
"min_factor": 0.1
},
"ckpt_path": null,
"compile": false
},
"model": {
"_target_": "tedbench.model.miae_model",
"name": "miae_l",
"use_seq_input": false,
"masking_strategy": "fixed",
"use_inverse_folding_loss": true
},
"logs": {
"prefix": "logs/pretrain/${datamodule.dataset_name}/${seed}",
"path": "${logs.prefix}/runs/${now:%Y-%m-%d}_${now:%H-%M-%S}"
},
"mode": {},
"_model_class": "miae"
}