TensorBoard
karimknaebel commited on
Commit
8277efe
·
verified ·
1 Parent(s): fc49bf8

Upload folder using huggingface_hub

Browse files
scannet/semseg-ptv3_weight=distill-ptv3_scannet200+structured3d_dino-L/config.py ADDED
@@ -0,0 +1,310 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ weight = 'exp/scannet200/2025-03-01_221653/model/model_last.pth'
2
+ resume = False
3
+ evaluate = True
4
+ test_only = False
5
+ seed = 490701
6
+ save_path = 'exp/scannet/2025-03-04_165711'
7
+ wandb_project = 'semseg_scannet'
8
+ num_worker = 24
9
+ batch_size = 12
10
+ batch_size_val = None
11
+ batch_size_test = None
12
+ epoch = 80
13
+ eval_epoch = 80
14
+ clip_grad = None
15
+ sync_bn = False
16
+ enable_amp = True
17
+ empty_cache = False
18
+ empty_cache_per_epoch = False
19
+ find_unused_parameters = True
20
+ mix_prob = 0.8
21
+ param_dicts = [
22
+ dict(keyword='block', lr=6e-05),
23
+ dict(keyword='backbone', lr=0.0006)
24
+ ]
25
+ hooks = [
26
+ dict(type='CheckpointLoader'),
27
+ dict(type='IterationTimer', warmup_iter=2),
28
+ dict(type='InformationWriter'),
29
+ dict(type='SemSegEvaluator'),
30
+ dict(type='CheckpointSaver', save_freq=None),
31
+ dict(type='PreciseEvaluator', test_last=False)
32
+ ]
33
+ train = dict(type='DefaultTrainer')
34
+ test = dict(type='SemSegTester', verbose=True)
35
+ model = dict(
36
+ type='DefaultSegmentorV2',
37
+ num_classes=20,
38
+ backbone_out_channels=64,
39
+ backbone=dict(
40
+ type='PT-v3m1',
41
+ in_channels=6,
42
+ order=('z', 'z-trans', 'hilbert', 'hilbert-trans'),
43
+ stride=(2, 2, 2, 2),
44
+ enc_depths=(2, 2, 2, 6, 2),
45
+ enc_channels=(32, 64, 128, 256, 512),
46
+ enc_num_head=(2, 4, 8, 16, 32),
47
+ enc_patch_size=(1024, 1024, 1024, 1024, 1024),
48
+ dec_depths=(2, 2, 2, 2),
49
+ dec_channels=(64, 64, 128, 256),
50
+ dec_num_head=(4, 4, 8, 16),
51
+ dec_patch_size=(1024, 1024, 1024, 1024),
52
+ mlp_ratio=4,
53
+ qkv_bias=True,
54
+ qk_scale=None,
55
+ attn_drop=0.0,
56
+ proj_drop=0.0,
57
+ drop_path=0.3,
58
+ shuffle_orders=True,
59
+ pre_norm=True,
60
+ enable_rpe=False,
61
+ enable_flash=True,
62
+ upcast_attention=False,
63
+ upcast_softmax=False,
64
+ cls_mode=False,
65
+ pdnorm_bn=True,
66
+ pdnorm_ln=True,
67
+ pdnorm_decouple=True,
68
+ pdnorm_adaptive=False,
69
+ pdnorm_affine=True,
70
+ pdnorm_conditions=('ScanNet', 'S3DIS', 'Structured3D')),
71
+ criteria=[
72
+ dict(type='CrossEntropyLoss', loss_weight=1.0, ignore_index=-1),
73
+ dict(
74
+ type='LovaszLoss',
75
+ mode='multiclass',
76
+ loss_weight=1.0,
77
+ ignore_index=-1)
78
+ ])
79
+ optimizer = dict(type='AdamW', lr=0.006, weight_decay=0.05)
80
+ scheduler = dict(
81
+ type='OneCycleLR',
82
+ max_lr=[0.006, 6e-05, 0.0006],
83
+ pct_start=0.05,
84
+ anneal_strategy='cos',
85
+ div_factor=10.0,
86
+ final_div_factor=1000.0)
87
+ dataset_type = 'ScanNetDataset'
88
+ data_root = 'data/scannet'
89
+ data = dict(
90
+ num_classes=20,
91
+ ignore_index=-1,
92
+ names=[
93
+ 'wall', 'floor', 'cabinet', 'bed', 'chair', 'sofa', 'table', 'door',
94
+ 'window', 'bookshelf', 'picture', 'counter', 'desk', 'curtain',
95
+ 'refridgerator', 'shower curtain', 'toilet', 'sink', 'bathtub',
96
+ 'otherfurniture'
97
+ ],
98
+ train=dict(
99
+ type='ScanNetDataset',
100
+ split='train',
101
+ data_root='data/scannet',
102
+ transform=[
103
+ dict(type='CenterShift', apply_z=True),
104
+ dict(
105
+ type='RandomDropout',
106
+ dropout_ratio=0.2,
107
+ dropout_application_ratio=0.2),
108
+ dict(
109
+ type='RandomRotate',
110
+ angle=[-1, 1],
111
+ axis='z',
112
+ center=[0, 0, 0],
113
+ p=0.5),
114
+ dict(
115
+ type='RandomRotate',
116
+ angle=[-0.015625, 0.015625],
117
+ axis='x',
118
+ p=0.5),
119
+ dict(
120
+ type='RandomRotate',
121
+ angle=[-0.015625, 0.015625],
122
+ axis='y',
123
+ p=0.5),
124
+ dict(type='RandomScale', scale=[0.9, 1.1]),
125
+ dict(type='RandomFlip', p=0.5),
126
+ dict(type='RandomJitter', sigma=0.005, clip=0.02),
127
+ dict(
128
+ type='ElasticDistortion',
129
+ distortion_params=[[0.2, 0.4], [0.8, 1.6]]),
130
+ dict(type='ChromaticAutoContrast', p=0.2, blend_factor=None),
131
+ dict(type='ChromaticTranslation', p=0.95, ratio=0.05),
132
+ dict(type='ChromaticJitter', p=0.95, std=0.05),
133
+ dict(
134
+ type='GridSample',
135
+ grid_size=0.02,
136
+ hash_type='fnv',
137
+ mode='train',
138
+ return_grid_coord=True),
139
+ dict(type='SphereCrop', point_max=102400, mode='random'),
140
+ dict(type='CenterShift', apply_z=False),
141
+ dict(type='NormalizeColor'),
142
+ dict(type='Add', keys_dict=dict(condition='ScanNet')),
143
+ dict(type='ToTensor'),
144
+ dict(
145
+ type='Collect',
146
+ keys=('coord', 'grid_coord', 'segment', 'condition'),
147
+ feat_keys=('color', 'normal'))
148
+ ],
149
+ test_mode=False,
150
+ loop=1),
151
+ val=dict(
152
+ type='ScanNetDataset',
153
+ split='val',
154
+ data_root='data/scannet',
155
+ transform=[
156
+ dict(type='CenterShift', apply_z=True),
157
+ dict(
158
+ type='GridSample',
159
+ grid_size=0.02,
160
+ hash_type='fnv',
161
+ mode='train',
162
+ return_grid_coord=True),
163
+ dict(type='CenterShift', apply_z=False),
164
+ dict(type='NormalizeColor'),
165
+ dict(type='Add', keys_dict=dict(condition='ScanNet')),
166
+ dict(type='ToTensor'),
167
+ dict(
168
+ type='Collect',
169
+ keys=('coord', 'grid_coord', 'segment', 'condition'),
170
+ feat_keys=('color', 'normal'))
171
+ ],
172
+ test_mode=False),
173
+ test=dict(
174
+ type='ScanNetDataset',
175
+ split='val',
176
+ data_root='data/scannet',
177
+ transform=[
178
+ dict(type='CenterShift', apply_z=True),
179
+ dict(type='NormalizeColor')
180
+ ],
181
+ test_mode=True,
182
+ test_cfg=dict(
183
+ voxelize=dict(
184
+ type='GridSample',
185
+ grid_size=0.02,
186
+ hash_type='fnv',
187
+ mode='test',
188
+ keys=('coord', 'color', 'normal'),
189
+ return_grid_coord=True),
190
+ crop=None,
191
+ post_transform=[
192
+ dict(type='CenterShift', apply_z=False),
193
+ dict(type='ToTensor'),
194
+ dict(type='Add', keys_dict=dict(condition='ScanNet')),
195
+ dict(
196
+ type='Collect',
197
+ keys=('coord', 'grid_coord', 'index', 'condition'),
198
+ feat_keys=('color', 'normal'))
199
+ ],
200
+ aug_transform=[[{
201
+ 'type': 'RandomRotateTargetAngle',
202
+ 'angle': [0],
203
+ 'axis': 'z',
204
+ 'center': [0, 0, 0],
205
+ 'p': 1
206
+ }],
207
+ [{
208
+ 'type': 'RandomRotateTargetAngle',
209
+ 'angle': [0.5],
210
+ 'axis': 'z',
211
+ 'center': [0, 0, 0],
212
+ 'p': 1
213
+ }],
214
+ [{
215
+ 'type': 'RandomRotateTargetAngle',
216
+ 'angle': [1],
217
+ 'axis': 'z',
218
+ 'center': [0, 0, 0],
219
+ 'p': 1
220
+ }],
221
+ [{
222
+ 'type': 'RandomRotateTargetAngle',
223
+ 'angle': [1.5],
224
+ 'axis': 'z',
225
+ 'center': [0, 0, 0],
226
+ 'p': 1
227
+ }],
228
+ [{
229
+ 'type': 'RandomRotateTargetAngle',
230
+ 'angle': [0],
231
+ 'axis': 'z',
232
+ 'center': [0, 0, 0],
233
+ 'p': 1
234
+ }, {
235
+ 'type': 'RandomScale',
236
+ 'scale': [0.95, 0.95]
237
+ }],
238
+ [{
239
+ 'type': 'RandomRotateTargetAngle',
240
+ 'angle': [0.5],
241
+ 'axis': 'z',
242
+ 'center': [0, 0, 0],
243
+ 'p': 1
244
+ }, {
245
+ 'type': 'RandomScale',
246
+ 'scale': [0.95, 0.95]
247
+ }],
248
+ [{
249
+ 'type': 'RandomRotateTargetAngle',
250
+ 'angle': [1],
251
+ 'axis': 'z',
252
+ 'center': [0, 0, 0],
253
+ 'p': 1
254
+ }, {
255
+ 'type': 'RandomScale',
256
+ 'scale': [0.95, 0.95]
257
+ }],
258
+ [{
259
+ 'type': 'RandomRotateTargetAngle',
260
+ 'angle': [1.5],
261
+ 'axis': 'z',
262
+ 'center': [0, 0, 0],
263
+ 'p': 1
264
+ }, {
265
+ 'type': 'RandomScale',
266
+ 'scale': [0.95, 0.95]
267
+ }],
268
+ [{
269
+ 'type': 'RandomRotateTargetAngle',
270
+ 'angle': [0],
271
+ 'axis': 'z',
272
+ 'center': [0, 0, 0],
273
+ 'p': 1
274
+ }, {
275
+ 'type': 'RandomScale',
276
+ 'scale': [1.05, 1.05]
277
+ }],
278
+ [{
279
+ 'type': 'RandomRotateTargetAngle',
280
+ 'angle': [0.5],
281
+ 'axis': 'z',
282
+ 'center': [0, 0, 0],
283
+ 'p': 1
284
+ }, {
285
+ 'type': 'RandomScale',
286
+ 'scale': [1.05, 1.05]
287
+ }],
288
+ [{
289
+ 'type': 'RandomRotateTargetAngle',
290
+ 'angle': [1],
291
+ 'axis': 'z',
292
+ 'center': [0, 0, 0],
293
+ 'p': 1
294
+ }, {
295
+ 'type': 'RandomScale',
296
+ 'scale': [1.05, 1.05]
297
+ }],
298
+ [{
299
+ 'type': 'RandomRotateTargetAngle',
300
+ 'angle': [1.5],
301
+ 'axis': 'z',
302
+ 'center': [0, 0, 0],
303
+ 'p': 1
304
+ }, {
305
+ 'type': 'RandomScale',
306
+ 'scale': [1.05, 1.05]
307
+ }], [{
308
+ 'type': 'RandomFlip',
309
+ 'p': 1
310
+ }]])))
scannet/semseg-ptv3_weight=distill-ptv3_scannet200+structured3d_dino-L/events.out.tfevents.1741103921.n23g0009.hpc.itc.rwth-aachen.de ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d46598741252268954157a484206e81091acd7f43cf28f04b0ab7701b84fca72
3
+ size 786643
scannet/semseg-ptv3_weight=distill-ptv3_scannet200+structured3d_dino-L/model/model_best.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8522fc7400d5535b9b7863f55a5c9c94e7e71d7a81f5470fca3aa5584e5fb039
3
+ size 554980580
scannet/semseg-ptv3_weight=distill-ptv3_scannet200+structured3d_dino-L/model/model_last.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3ff18b4519118984e69f40caf591d9f044260d7dc7396de17c2dfce399248b5
3
+ size 554980580
scannet/semseg-ptv3_weight=distill-ptv3_scannet200+structured3d_dino-L/train.log ADDED
The diff for this file is too large to render. See raw diff