Bavantha11 committed on
Commit
f301af3
·
verified ·
1 Parent(s): 1f5a2a0

Upload configs/nyudv2/m2h_mx_b.yaml with huggingface_hub

Browse files
Files changed (1) hide show
  1. configs/nyudv2/m2h_mx_b.yaml +97 -0
configs/nyudv2/m2h_mx_b.yaml ADDED
@@ -0,0 +1,97 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ dataset:
2
+ name: NYUD
3
+ root: data/NYUDv2
4
+ image_size: [480, 640]
5
+ num_classes: 40
6
+ min_depth: 0.01
7
+ max_depth: 10.0
8
+ visual_min_depth: 0.01
9
+ visual_max_depth: 10.0
10
+ augment:
11
+ random_scale: [1.0, 1.2]
12
+ random_crop: true
13
+ horizontal_flip: true
14
+ color_jitter: {brightness: 0.2, contrast: 0.2, saturation: 0.2, hue: 0.2}
15
+ erase_prob: 0.0
16
+
17
+ training:
18
+ epochs: 120
19
+ batch_size: 6
20
+ eval_batch_size: 12
21
+ num_workers: 4
22
+ device: cuda
23
+ mixed_precision: true
24
+ log_interval: 50
25
+ ckpt_interval: 1
26
+ grad_clip: 1.0
27
+ output_dir: outputs/nyudv2_m2h_mx_b
28
+ ema_decay: 0.999
29
+ eval_use_ema: false
30
+ finetune: true
31
+
32
+ optimization:
33
+ lr: 5.0e-5
34
+ weight_decay: 0.02
35
+ betas: [0.9, 0.999]
36
+ warmup_epochs: 0
37
+ scheduler:
38
+ type: cosine
39
+ min_lr: 1.0e-5
40
+
41
+ tasks:
42
+ include_semseg: true
43
+ include_depth: true
44
+ include_edge: true
45
+ include_normals: true
46
+ edge_pos_weight: 1.0
47
+
48
+ loss:
49
+ weights:
50
+ semseg: 2.0
51
+ depth_si: 2.0
52
+ edge: 0.5
53
+ normals: 1.0
54
+ focal_for_edges: true
55
+ geom_consistency_weight: 0.2
56
+ consistency_depth_normals: 0.2
57
+ consistency_sem_edge: 0.25
58
+ depth_scale_weight: 0.2
59
+ depth_coarse_weight: 0.2
60
+ depth_offset_weight: 0.15
61
+ depth_bin_weight: 0.3
62
+ edge_dice_weight: 0.1
63
+ use_uncertainty_balancer: false
64
+
65
+ model:
66
+ arch: m2h_mx_b
67
+ num_classes: 40
68
+ min_depth: 0.01
69
+ max_depth: 10.0
70
+
71
+ m2h_mx:
72
+ decoder_dim: 256
73
+ num_seg_classes: 40
74
+ backbone_lr_scale: 0.2
75
+ ltc_window_size: 4
76
+ hm_d_state: 32
77
+ hm_drop_path: 0.1
78
+ gtf_extra_levels: 2
79
+ train_last_n_blocks: 4
80
+ intermediate_layer_indices: [2, 5, 8, 11]
81
+ depth_aux_weight: 0.5
82
+ num_register_tokens: 4
83
+ use_lora: true
84
+ lora_rank: 16
85
+ lora_alpha: 32.0
86
+ lora_dropout: 0.05
87
+ backbone_name: facebook/dinov3-vitb16-pretrain-lvd1689m
88
+ depth_bins: 64
89
+ aux_weights:
90
+ semseg: 0.3
91
+ depth: 0.3
92
+ edge: 0.15
93
+ normals: 0.15
94
+
95
+ validation:
96
+ interval_steps: 100
97
+ save_best_on: ["sem_mIoU", "dep_AbsRel"]