TensorBoard
karimknaebel committed on
Commit
aad5a45
·
verified ·
1 Parent(s): 933d2b9

Upload folder using huggingface_hub

Browse files
s3dis/semseg-ptv3_dino-L/config.py ADDED
@@ -0,0 +1,270 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ weight = 'exp/s3dis/2024-11-09_202340/model/model_best.pth'
2
+ resume = False
3
+ evaluate = True
4
+ test_only = False
5
+ seed = 3468541
6
+ save_path = 'exp/s3dis/2024-11-09_202340'
7
+ wandb_project = 'semseg_s3dis'
8
+ num_worker = 24
9
+ batch_size = 12
10
+ batch_size_val = None
11
+ batch_size_test = None
12
+ epoch = 3000
13
+ eval_epoch = 100
14
+ clip_grad = None
15
+ sync_bn = False
16
+ enable_amp = True
17
+ empty_cache = False
18
+ empty_cache_per_epoch = False
19
+ find_unused_parameters = False
20
+ mix_prob = 0.8
21
+ param_dicts = [dict(keyword='img_enc|block', lr=0.0006)]
22
+ hooks = [
23
+ dict(type='CheckpointLoader'),
24
+ dict(type='IterationTimer', warmup_iter=2),
25
+ dict(type='InformationWriter'),
26
+ dict(type='SemSegEvaluator'),
27
+ dict(type='CheckpointSaver', save_freq=None)
28
+ ]
29
+ train = dict(type='DefaultTrainer')
30
+ test = dict(type='SemSegTester', verbose=True)
31
+ model = dict(
32
+ type='DefaultSegmentorV2',
33
+ num_classes=13,
34
+ backbone_out_channels=64,
35
+ backbone=dict(
36
+ type='PT-v3m1-image',
37
+ in_channels=6,
38
+ order=('z', 'z-trans', 'hilbert', 'hilbert-trans'),
39
+ stride=(2, 2, 2, 2),
40
+ enc_depths=(2, 2, 2, 6, 2),
41
+ enc_channels=(32, 64, 128, 256, 512),
42
+ enc_num_head=(2, 4, 8, 16, 32),
43
+ enc_patch_size=(1024, 1024, 1024, 1024, 1024),
44
+ dec_depths=(2, 2, 2, 2),
45
+ dec_channels=(64, 64, 128, 256),
46
+ dec_num_head=(4, 4, 8, 16),
47
+ dec_patch_size=(1024, 1024, 1024, 1024),
48
+ mlp_ratio=4,
49
+ qkv_bias=True,
50
+ qk_scale=None,
51
+ init_values=None,
52
+ attn_drop=0.0,
53
+ proj_drop=0.0,
54
+ drop_path=0.3,
55
+ shuffle_orders=True,
56
+ pre_norm=True,
57
+ enable_rpe=False,
58
+ enable_flash=True,
59
+ upcast_attention=False,
60
+ upcast_softmax=False,
61
+ cls_mode=False,
62
+ pdnorm_bn=False,
63
+ pdnorm_ln=False,
64
+ pdnorm_decouple=True,
65
+ pdnorm_adaptive=False,
66
+ pdnorm_affine=True,
67
+ pdnorm_conditions=('ScanNet', 'S3DIS', 'Structured3D'),
68
+ dinov2='large'),
69
+ criteria=[
70
+ dict(type='CrossEntropyLoss', loss_weight=1.0, ignore_index=-1),
71
+ dict(
72
+ type='LovaszLoss',
73
+ mode='multiclass',
74
+ loss_weight=1.0,
75
+ ignore_index=-1)
76
+ ])
77
+ optimizer = dict(type='AdamW', lr=0.006, weight_decay=0.05)
78
+ scheduler = dict(
79
+ type='OneCycleLR',
80
+ max_lr=[0.006, 0.0006],
81
+ pct_start=0.05,
82
+ anneal_strategy='cos',
83
+ div_factor=10.0,
84
+ final_div_factor=1000.0)
85
+ dataset_type = 'S3DISDataset'
86
+ data_root = 'data/s3dis'
87
+ data = dict(
88
+ num_classes=13,
89
+ ignore_index=-1,
90
+ names=[
91
+ 'ceiling', 'floor', 'wall', 'beam', 'column', 'window', 'door',
92
+ 'table', 'chair', 'sofa', 'bookcase', 'board', 'clutter'
93
+ ],
94
+ train=dict(
95
+ type='S3DISDataset',
96
+ split=('Area_1', 'Area_2', 'Area_3', 'Area_4', 'Area_6'),
97
+ data_root='data/s3dis',
98
+ with_images=10,
99
+ transform=[
100
+ dict(type='ImageResize', size=[518, 518]),
101
+ dict(
102
+ type='ImageColorJitter',
103
+ brightness=0.4,
104
+ contrast=0.4,
105
+ saturation=0.2,
106
+ hue=0.1),
107
+ dict(type='ImageRandomHorizontalFlip'),
108
+ dict(type='ImageNormalize'),
109
+ dict(type='CenterShift', apply_z=True),
110
+ dict(
111
+ type='RandomDropout',
112
+ dropout_ratio=0.2,
113
+ dropout_application_ratio=0.2),
114
+ dict(
115
+ type='RandomRotate',
116
+ angle=[-1, 1],
117
+ axis='z',
118
+ center=[0, 0, 0],
119
+ p=0.5),
120
+ dict(
121
+ type='RandomRotate',
122
+ angle=[-0.015625, 0.015625],
123
+ axis='x',
124
+ p=0.5),
125
+ dict(
126
+ type='RandomRotate',
127
+ angle=[-0.015625, 0.015625],
128
+ axis='y',
129
+ p=0.5),
130
+ dict(type='RandomScale', scale=[0.9, 1.1]),
131
+ dict(type='RandomFlip', p=0.5),
132
+ dict(type='RandomJitter', sigma=0.005, clip=0.02),
133
+ dict(type='ChromaticAutoContrast', p=0.2, blend_factor=None),
134
+ dict(type='ChromaticTranslation', p=0.95, ratio=0.05),
135
+ dict(type='ChromaticJitter', p=0.95, std=0.05),
136
+ dict(
137
+ type='GridSample',
138
+ grid_size=0.02,
139
+ hash_type='fnv',
140
+ mode='train',
141
+ keys=('coord', 'color', 'normal', 'segment', 'image_coord',
142
+ 'image_mask'),
143
+ return_grid_coord=True),
144
+ dict(type='SphereCrop', sample_rate=0.6, mode='random'),
145
+ dict(type='SphereCrop', point_max=204800, mode='random'),
146
+ dict(type='CenterShift', apply_z=False),
147
+ dict(type='NormalizeColor'),
148
+ dict(type='ToTensor'),
149
+ dict(
150
+ type='Collect',
151
+ keys=('coord', 'grid_coord', 'segment', 'image', 'image_coord',
152
+ 'image_mask'),
153
+ feat_keys=('color', 'normal'))
154
+ ],
155
+ test_mode=False,
156
+ loop=30),
157
+ val=dict(
158
+ type='S3DISDataset',
159
+ split='Area_5',
160
+ data_root='data/s3dis',
161
+ with_images=10,
162
+ transform=[
163
+ dict(type='ImageResize', size=[518, 518]),
164
+ dict(type='ImageNormalize'),
165
+ dict(type='CenterShift', apply_z=True),
166
+ dict(
167
+ type='Copy',
168
+ keys_dict=dict(coord='origin_coord',
169
+ segment='origin_segment')),
170
+ dict(
171
+ type='GridSample',
172
+ grid_size=0.02,
173
+ hash_type='fnv',
174
+ mode='train',
175
+ keys=('coord', 'color', 'normal', 'segment', 'image_coord',
176
+ 'image_mask'),
177
+ return_grid_coord=True),
178
+ dict(type='CenterShift', apply_z=False),
179
+ dict(type='NormalizeColor'),
180
+ dict(type='ToTensor'),
181
+ dict(
182
+ type='Collect',
183
+ keys=('coord', 'grid_coord', 'origin_coord', 'segment',
184
+ 'origin_segment', 'image', 'image_coord', 'image_mask'),
185
+ offset_keys_dict=dict(
186
+ offset='coord', origin_offset='origin_coord'),
187
+ feat_keys=('color', 'normal'))
188
+ ],
189
+ test_mode=False),
190
+ test=dict(
191
+ type='S3DISDataset',
192
+ split='Area_5',
193
+ data_root='data/s3dis',
194
+ with_images=10,
195
+ transform=[
196
+ dict(type='ImageResize', size=[518, 518]),
197
+ dict(type='CenterShift', apply_z=True),
198
+ dict(type='NormalizeColor')
199
+ ],
200
+ test_mode=True,
201
+ test_cfg=dict(
202
+ voxelize=dict(
203
+ type='GridSample',
204
+ grid_size=0.02,
205
+ hash_type='fnv',
206
+ mode='test',
207
+ keys=('coord', 'color', 'normal', 'image_coord', 'image_mask'),
208
+ return_grid_coord=True),
209
+ crop=None,
210
+ post_transform=[
211
+ dict(type='ImageNormalize'),
212
+ dict(type='CenterShift', apply_z=False),
213
+ dict(type='ToTensor'),
214
+ dict(
215
+ type='Collect',
216
+ keys=('coord', 'grid_coord', 'index', 'image',
217
+ 'image_coord', 'image_mask'),
218
+ feat_keys=('color', 'normal'))
219
+ ],
220
+ aug_transform=[[{
221
+ 'type': 'RandomScale',
222
+ 'scale': [0.9, 0.9]
223
+ }], [{
224
+ 'type': 'RandomScale',
225
+ 'scale': [0.95, 0.95]
226
+ }], [{
227
+ 'type': 'RandomScale',
228
+ 'scale': [1, 1]
229
+ }], [{
230
+ 'type': 'RandomScale',
231
+ 'scale': [1.05, 1.05]
232
+ }], [{
233
+ 'type': 'RandomScale',
234
+ 'scale': [1.1, 1.1]
235
+ }],
236
+ [{
237
+ 'type': 'RandomScale',
238
+ 'scale': [0.9, 0.9]
239
+ }, {
240
+ 'type': 'RandomFlip',
241
+ 'p': 1
242
+ }],
243
+ [{
244
+ 'type': 'RandomScale',
245
+ 'scale': [0.95, 0.95]
246
+ }, {
247
+ 'type': 'RandomFlip',
248
+ 'p': 1
249
+ }],
250
+ [{
251
+ 'type': 'RandomScale',
252
+ 'scale': [1, 1]
253
+ }, {
254
+ 'type': 'RandomFlip',
255
+ 'p': 1
256
+ }],
257
+ [{
258
+ 'type': 'RandomScale',
259
+ 'scale': [1.05, 1.05]
260
+ }, {
261
+ 'type': 'RandomFlip',
262
+ 'p': 1
263
+ }],
264
+ [{
265
+ 'type': 'RandomScale',
266
+ 'scale': [1.1, 1.1]
267
+ }, {
268
+ 'type': 'RandomFlip',
269
+ 'p': 1
270
+ }]])))
s3dis/semseg-ptv3_dino-L/events.out.tfevents.1731180267.n23g0009.hpc.itc.rwth-aachen.de ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:936692c84aabfa45a3028bc73302207f24c085d11a01c34f9c918ffd2e109aa8
3
+ size 4335452
s3dis/semseg-ptv3_dino-L/events.out.tfevents.1731250478.r23g0004.hpc.itc.rwth-aachen.de ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3ca3bef5535fee3570512686cbea2788c4bbc68819eb5f54a8d055d60627893
3
+ size 703036
s3dis/semseg-ptv3_dino-L/model/model_best.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e8aa839a31b1af6cce02f76b7e1bc5c4eab60dcaef077cf92f7dcf25614784e0
3
+ size 560915120
s3dis/semseg-ptv3_dino-L/model/model_last.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:04509e20e22d1b1ee4d3038c7012cce78fad082ef96c4c818fa98ce6be5390f4
3
+ size 560920176
s3dis/semseg-ptv3_dino-L/test.log ADDED
The diff for this file is too large to render. See raw diff
 
s3dis/semseg-ptv3_dino-L/train.log ADDED
The diff for this file is too large to render. See raw diff