File size: 1,473 Bytes
9859ff5
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
{
  "seed": 42,
  "debug": false,
  "wandb": true,
  "mask_ratio": 0.9,
  "noise": 0.0,
  "datamodule": {
    "batch_size": 32,
    "pin_memory": true,
    "num_workers": 12,
    "_target_": "tedbench.data.LightningStructureDataset",
    "root": "./datasets/ted",
    "dataset_name": "afdb_stream"
  },
  "trainer": {
    "_target_": "pytorch_lightning.Trainer",
    "accelerator": "auto",
    "max_steps": 100000,
    "strategy": "auto",
    "devices": "auto",
    "default_root_dir": "${logs.path}",
    "num_sanity_val_steps": 0,
    "val_check_interval": 1000,
    "check_val_every_n_epoch": null,
    "accumulate_grad_batches": 4,
    "num_nodes": 4
  },
  "train": {
    "optimizer": {
      "_target_": "torch.optim.AdamW",
      "lr": 0.0024,
      "weight_decay": 0.05,
      "betas": [
        0.9,
        0.95
      ]
    },
    "lr_scheduler": {
      "_target_": "tedbench.lr_schedulers.get_cosine_schedule_with_warmup",
      "warmup_steps": 5000,
      "max_steps": "${eval:0.99 * ${trainer.max_steps}}",
      "min_factor": 0.1
    },
    "ckpt_path": null,
    "compile": false
  },
  "model": {
    "_target_": "tedbench.model.miae_model",
    "name": "miae_b",
    "use_seq_input": false,
    "masking_strategy": "fixed",
    "use_inverse_folding_loss": true
  },
  "logs": {
    "prefix": "logs/pretrain/${datamodule.dataset_name}/${seed}",
    "path": "${logs.prefix}/runs/${now:%Y-%m-%d}_${now:%H-%M-%S}"
  },
  "mode": {},
  "_model_class": "miae"
}