File size: 1,771 Bytes
2e93df9
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
{
  "seed": 42,
  "debug": false,
  "wandb": true,
  "pretrained_model_path": "pretrained/new/mae_large_mask0.9_dec512d2b.ckpt",
  "datamodule": {
    "batch_size": 32,
    "pin_memory": true,
    "num_workers": 12,
    "train_transform": {
      "_target_": "tedbench.data.transform.Compose",
      "transforms": [
        {
          "_target_": "tedbench.data.transform.RandomCrop",
          "size": 512
        },
        {
          "_target_": "tedbench.data.transform.RandomNoise",
          "std": 0.2,
          "mean": 0.0
        }
      ]
    },
    "_target_": "tedbench.data.TEDLightningDataset",
    "root": "./datasets/ted",
    "dataset_name": "ted"
  },
  "trainer": {
    "_target_": "pytorch_lightning.Trainer",
    "accelerator": "auto",
    "max_steps": 18300,
    "strategy": "auto",
    "devices": "auto",
    "default_root_dir": "${logs.path}",
    "num_sanity_val_steps": 0,
    "accumulate_grad_batches": 4
  },
  "train": {
    "optimizer": {
      "_target_": "torch.optim.AdamW",
      "lr": 0.0016,
      "weight_decay": 0.1,
      "betas": [
        0.9,
        0.95
      ]
    },
    "lr_scheduler": {
      "_target_": "tedbench.lr_schedulers.get_cosine_schedule_with_warmup",
      "warmup_steps": 1830,
      "max_steps": "${trainer.max_steps}"
    },
    "loss": {
      "_target_": "torch.nn.CrossEntropyLoss",
      "label_smoothing": 0.0
    },
    "llrd": 0.8,
    "ckpt_path": null
  },
  "model": {
    "_target_": "tedbench.model.miae_encoder_model",
    "name": "miae_l",
    "num_classes": 965,
    "avg_pool": false
  },
  "logs": {
    "prefix": "logs/finetune/${datamodule.dataset_name}/${seed}",
    "path": "${logs.prefix}/runs/${now:%Y-%m-%d}_${now:%H-%M-%S}"
  },
  "mode": {},
  "_model_class": "miae_classifier"
}