TensorBoard
karimknaebel committed on
Commit
a656b43
·
verified ·
1 Parent(s): 284fd14

Upload folder using huggingface_hub

Browse files
.gitattributes CHANGED
@@ -47,3 +47,4 @@ scannet200/distill-ptv3_scannet200_dino-L/train.log filter=lfs diff=lfs merge=lf
47
  scannet200/semseg-ptv3_weight=distill-ptv3_scannet200+structured3d_dino-L/train.log filter=lfs diff=lfs merge=lfs -text
48
  nuscenes/semseg-ptv3_weight=distill-ptv3_nuscenes_dino-L/test.log filter=lfs diff=lfs merge=lfs -text
49
  nuscenes/semseg-ptv3_weight=distill-ptv3_nuscenes_dino-L/train.log filter=lfs diff=lfs merge=lfs -text
 
 
47
  scannet200/semseg-ptv3_weight=distill-ptv3_scannet200+structured3d_dino-L/train.log filter=lfs diff=lfs merge=lfs -text
48
  nuscenes/semseg-ptv3_weight=distill-ptv3_nuscenes_dino-L/test.log filter=lfs diff=lfs merge=lfs -text
49
  nuscenes/semseg-ptv3_weight=distill-ptv3_nuscenes_dino-L/train.log filter=lfs diff=lfs merge=lfs -text
50
+ nuscenes/distill-ptv3_nuscenes_dino-L/train.log filter=lfs diff=lfs merge=lfs -text
nuscenes/distill-ptv3_nuscenes_dino-L/config.py ADDED
@@ -0,0 +1,249 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ weight = None
2
+ resume = False
3
+ evaluate = True
4
+ test_only = False
5
+ seed = 14047740
6
+ save_path = 'exp/nuscenes/distill-ptv3dino-Llevels=0'
7
+ wandb_project = 'pointcept_distill_nuscenes'
8
+ num_worker = 16
9
+ batch_size = 12
10
+ batch_size_val = None
11
+ batch_size_test = None
12
+ epoch = 50
13
+ eval_epoch = 50
14
+ clip_grad = None
15
+ sync_bn = False
16
+ enable_amp = True
17
+ empty_cache = False
18
+ empty_cache_per_epoch = False
19
+ find_unused_parameters = False
20
+ mix_prob = 0.8
21
+ param_dicts = [dict(keyword='^(?!.*img_enc).*block', lr=0.0002)]
22
+ hooks = [
23
+ dict(type='CheckpointLoader'),
24
+ dict(type='IterationTimer', warmup_iter=2),
25
+ dict(type='InformationWriter'),
26
+ dict(type='DistillEvaluator'),
27
+ dict(type='CheckpointSaver', save_freq=None)
28
+ ]
29
+ train = dict(type='DefaultTrainer')
30
+ test = dict()
31
+ model = dict(
32
+ type='DefaultDistiller',
33
+ backbone_out_channels=(64, 64, 128, 256, 512),
34
+ levels=(0, ),
35
+ image_feature_channels=(1024, 1024, 1024, 1024, 1024),
36
+ backbone=dict(
37
+ type='PT-v3m1-distill',
38
+ in_channels=4,
39
+ order=['z', 'z-trans', 'hilbert', 'hilbert-trans'],
40
+ stride=(2, 2, 2, 2),
41
+ enc_depths=(2, 2, 2, 6, 2),
42
+ enc_channels=(32, 64, 128, 256, 512),
43
+ enc_num_head=(2, 4, 8, 16, 32),
44
+ enc_patch_size=(1024, 1024, 1024, 1024, 1024),
45
+ dec_depths=(2, 2, 2, 2),
46
+ dec_channels=(64, 64, 128, 256),
47
+ dec_num_head=(4, 4, 8, 16),
48
+ dec_patch_size=(1024, 1024, 1024, 1024),
49
+ mlp_ratio=4,
50
+ qkv_bias=True,
51
+ qk_scale=None,
52
+ attn_drop=0.0,
53
+ proj_drop=0.0,
54
+ drop_path=0.3,
55
+ shuffle_orders=True,
56
+ pre_norm=True,
57
+ enable_rpe=False,
58
+ enable_flash=True,
59
+ upcast_attention=False,
60
+ upcast_softmax=False,
61
+ cls_mode=False,
62
+ pdnorm_bn=False,
63
+ pdnorm_ln=False,
64
+ pdnorm_decouple=True,
65
+ pdnorm_adaptive=False,
66
+ pdnorm_affine=True,
67
+ pdnorm_conditions=('nuScenes', 'SemanticKITTI', 'Waymo'),
68
+ dinov2='large'),
69
+ criteria=[dict(type='MSELoss', loss_weight=1.0)])
70
+ optimizer = dict(type='AdamW', lr=0.002, weight_decay=0.005)
71
+ scheduler = dict(
72
+ type='OneCycleLR',
73
+ max_lr=[0.002, 0.0002],
74
+ pct_start=0.04,
75
+ anneal_strategy='cos',
76
+ div_factor=10.0,
77
+ final_div_factor=100.0)
78
+ dataset_type = 'NuScenesDataset'
79
+ data_root = 'data/nuscenes'
80
+ ignore_index = -1
81
+ names = [
82
+ 'barrier', 'bicycle', 'bus', 'car', 'construction_vehicle', 'motorcycle',
83
+ 'pedestrian', 'traffic_cone', 'trailer', 'truck', 'driveable_surface',
84
+ 'other_flat', 'sidewalk', 'terrain', 'manmade', 'vegetation'
85
+ ]
86
+ data = dict(
87
+ num_classes=16,
88
+ ignore_index=-1,
89
+ names=[
90
+ 'barrier', 'bicycle', 'bus', 'car', 'construction_vehicle',
91
+ 'motorcycle', 'pedestrian', 'traffic_cone', 'trailer', 'truck',
92
+ 'driveable_surface', 'other_flat', 'sidewalk', 'terrain', 'manmade',
93
+ 'vegetation'
94
+ ],
95
+ train=dict(
96
+ type='NuScenesDataset',
97
+ split='train',
98
+ data_root='data/nuscenes',
99
+ with_images=True,
100
+ transform=[
101
+ dict(type='ImageResize', size=[378, 672]),
102
+ dict(
103
+ type='ImageColorJitter',
104
+ brightness=0.4,
105
+ contrast=0.4,
106
+ saturation=0.2,
107
+ hue=0.1),
108
+ dict(type='ImageRandomHorizontalFlip'),
109
+ dict(type='ImageNormalize'),
110
+ dict(
111
+ type='RandomRotate',
112
+ angle=[-1, 1],
113
+ axis='z',
114
+ center=[0, 0, 0],
115
+ p=0.5),
116
+ dict(type='RandomScale', scale=[0.9, 1.1]),
117
+ dict(type='RandomFlip', p=0.5),
118
+ dict(type='RandomJitter', sigma=0.005, clip=0.02),
119
+ dict(
120
+ type='GridSample',
121
+ grid_size=0.05,
122
+ hash_type='fnv',
123
+ mode='train',
124
+ keys=('coord', 'strength', 'segment', 'image_coord',
125
+ 'image_mask'),
126
+ return_grid_coord=True),
127
+ dict(type='ToTensor'),
128
+ dict(
129
+ type='Collect',
130
+ keys=('coord', 'grid_coord', 'segment', 'image', 'image_coord',
131
+ 'image_mask'),
132
+ feat_keys=('coord', 'strength'))
133
+ ],
134
+ test_mode=False,
135
+ ignore_index=-1,
136
+ loop=1),
137
+ val=dict(
138
+ type='NuScenesDataset',
139
+ split='val',
140
+ data_root='data/nuscenes',
141
+ with_images=True,
142
+ transform=[
143
+ dict(type='ImageResize', size=[378, 672]),
144
+ dict(type='ImageNormalize'),
145
+ dict(
146
+ type='GridSample',
147
+ grid_size=0.05,
148
+ hash_type='fnv',
149
+ mode='train',
150
+ keys=('coord', 'strength', 'segment', 'image_coord',
151
+ 'image_mask'),
152
+ return_grid_coord=True),
153
+ dict(type='ToTensor'),
154
+ dict(
155
+ type='Collect',
156
+ keys=('coord', 'grid_coord', 'segment', 'image', 'image_coord',
157
+ 'image_mask'),
158
+ feat_keys=('coord', 'strength'))
159
+ ],
160
+ test_mode=False,
161
+ ignore_index=-1),
162
+ test=dict(
163
+ type='NuScenesDataset',
164
+ split='val',
165
+ data_root='data/nuscenes',
166
+ with_images=True,
167
+ transform=[
168
+ dict(type='ImageResize', size=[378, 672]),
169
+ dict(type='Copy', keys_dict=dict(segment='origin_segment')),
170
+ dict(
171
+ type='GridSample',
172
+ grid_size=0.025,
173
+ hash_type='fnv',
174
+ mode='train',
175
+ keys=('coord', 'strength', 'segment', 'image_coord',
176
+ 'image_mask'),
177
+ return_inverse=True)
178
+ ],
179
+ test_mode=True,
180
+ test_cfg=dict(
181
+ voxelize=dict(
182
+ type='GridSample',
183
+ grid_size=0.05,
184
+ hash_type='fnv',
185
+ mode='test',
186
+ return_grid_coord=True,
187
+ keys=('coord', 'strength', 'image_coord', 'image_mask')),
188
+ crop=None,
189
+ post_transform=[
190
+ dict(type='ImageNormalize'),
191
+ dict(type='ToTensor'),
192
+ dict(
193
+ type='Collect',
194
+ keys=('coord', 'grid_coord', 'index', 'image',
195
+ 'image_coord', 'image_mask'),
196
+ feat_keys=('coord', 'strength'))
197
+ ],
198
+ aug_transform=[[{
199
+ 'type': 'RandomScale',
200
+ 'scale': [0.9, 0.9]
201
+ }], [{
202
+ 'type': 'RandomScale',
203
+ 'scale': [0.95, 0.95]
204
+ }], [{
205
+ 'type': 'RandomScale',
206
+ 'scale': [1, 1]
207
+ }], [{
208
+ 'type': 'RandomScale',
209
+ 'scale': [1.05, 1.05]
210
+ }], [{
211
+ 'type': 'RandomScale',
212
+ 'scale': [1.1, 1.1]
213
+ }],
214
+ [{
215
+ 'type': 'RandomScale',
216
+ 'scale': [0.9, 0.9]
217
+ }, {
218
+ 'type': 'RandomFlip',
219
+ 'p': 1
220
+ }],
221
+ [{
222
+ 'type': 'RandomScale',
223
+ 'scale': [0.95, 0.95]
224
+ }, {
225
+ 'type': 'RandomFlip',
226
+ 'p': 1
227
+ }],
228
+ [{
229
+ 'type': 'RandomScale',
230
+ 'scale': [1, 1]
231
+ }, {
232
+ 'type': 'RandomFlip',
233
+ 'p': 1
234
+ }],
235
+ [{
236
+ 'type': 'RandomScale',
237
+ 'scale': [1.05, 1.05]
238
+ }, {
239
+ 'type': 'RandomFlip',
240
+ 'p': 1
241
+ }],
242
+ [{
243
+ 'type': 'RandomScale',
244
+ 'scale': [1.1, 1.1]
245
+ }, {
246
+ 'type': 'RandomFlip',
247
+ 'p': 1
248
+ }]]),
249
+ ignore_index=-1))
nuscenes/distill-ptv3_nuscenes_dino-L/events.out.tfevents.1729984113.n23g0002.hpc.itc.rwth-aachen.de ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ecc40c1006dc0ab3c779b4ea965e14b109bd4454118221aa601950972622be65
3
+ size 18709910
nuscenes/distill-ptv3_nuscenes_dino-L/model/model_best.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bcffbc01f76d1ff6772d10c19c00edeaa4f5a5aa304b7f28ecf121650bf657a7
3
+ size 555305064
nuscenes/distill-ptv3_nuscenes_dino-L/model/model_last.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bcffbc01f76d1ff6772d10c19c00edeaa4f5a5aa304b7f28ecf121650bf657a7
3
+ size 555305064
nuscenes/distill-ptv3_nuscenes_dino-L/train.log ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c673338ccf14ecc86b0e76af9bc5c48685b527b312ccae8c4587dab2c89e72f8
3
+ size 34723713