jev-aleks committed on
Commit
7ada315
·
verified ·
1 Parent(s): ca4eef8

Upload folder using huggingface_hub

Browse files
seg-best-dino-orb-slam/checkpoint.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c18a5ce50958a99d36a62cae6a690ec41bc9368d5f2d3faaf2e139126f595b42
3
+ size 764129470
seg-best-dino-orb-slam/training_config.yaml ADDED
@@ -0,0 +1,278 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ dataset:
2
+ type: old_KITTI_360
3
+ data_path: /home/fb20user12/datasets/KITTI-360/
4
+ pose_path: /home/fb20user12/datasets/KITTI-360/data_poses
5
+ split_path: datasets/kitti_360/splits/sscbench
6
+ image_size:
7
+ - 192
8
+ - 640
9
+ data_stereo: true
10
+ data_fisheye: true
11
+ data_fc: 2
12
+ fisheye_offset:
13
+ - 10
14
+ - 11
15
+ - 12
16
+ - 13
17
+ - 14
18
+ - 15
19
+ - 16
20
+ - 17
21
+ - 18
22
+ - 19
23
+ - 20
24
+ - 21
25
+ - 22
26
+ - 23
27
+ - 24
28
+ - 25
29
+ - 26
30
+ - 27
31
+ - 28
32
+ - 29
33
+ - 30
34
+ - 31
35
+ - 32
36
+ - 33
37
+ - 34
38
+ - 35
39
+ - 36
40
+ - 37
41
+ - 38
42
+ - 39
43
+ - 40
44
+ stereo_offset:
45
+ - 0
46
+ is_preprocessed: true
47
+ fisheye_rotation: -15
48
+ data_segmentation: true
49
+ steps_per_epoch: 10328
50
+ model:
51
+ arch: BTSNet
52
+ use_code: true
53
+ prediction_mode: default
54
+ predict_dino: true
55
+ dino_dims: 64
56
+ compensate_artifacts: true
57
+ flip_augmentation: true
58
+ encoder:
59
+ type: dinov2
60
+ mode: downsample-prediction
61
+ decoder_arch: dpt
62
+ downsampler_arch: featup
63
+ encoder_arch: vit-b
64
+ version: v1
65
+ separate_gt_version: v1
66
+ encoder_freeze: false
67
+ flip_avg_gt: false
68
+ dim_reduction_arch: mlp
69
+ num_ch_enc:
70
+ - 64
71
+ - 64
72
+ - 128
73
+ - 256
74
+ intermediate_features:
75
+ - 3
76
+ - 6
77
+ - 9
78
+ decoder_out_dim: 256
79
+ dino_pca_dim: 64
80
+ image_size:
81
+ - 192
82
+ - 640
83
+ key_features: false
84
+ code:
85
+ num_freqs: 6
86
+ freq_factor: 1.5
87
+ include_input: true
88
+ decoder_heads:
89
+ - type: resnet
90
+ name: normal_head
91
+ freeze: false
92
+ args:
93
+ n_blocks: 0
94
+ d_hidden: 128
95
+ final_prediction_head: normal_head
96
+ encoding_strategy:
97
+ name: default
98
+ args: {}
99
+ eval_encoding_strategy:
100
+ name: default
101
+ args: null
102
+ loss_renderer_strategy:
103
+ name: kitti_360
104
+ args: null
105
+ eval_loss_renderer_strategy:
106
+ name: single_renderer
107
+ args:
108
+ shuffle_frames: false
109
+ all_frames: true
110
+ inv_z: true
111
+ learn_empty: false
112
+ code_mode: z
113
+ n_frames_render: 4
114
+ sample_radius_3d: 0.5
115
+ renderer:
116
+ n_coarse: 32
117
+ n_fine: 0
118
+ n_fine_depth: 0
119
+ depth_std: 1.0
120
+ sched: []
121
+ white_bkgd: false
122
+ lindisp: true
123
+ hard_alpha_cap: true
124
+ eval_batch_size: 65536
125
+ render_mode: volumetric
126
+ normalize_dino: true
127
+ training:
128
+ optimizer:
129
+ type: adam
130
+ args:
131
+ lr: 0.0005
132
+ betas:
133
+ - 0.9
134
+ - 0.999
135
+ eps: 1.0e-08
136
+ weight_decay: 0.0
137
+ amsgrad: false
138
+ loss:
139
+ - type: stego
140
+ random_weight: 0.7104435477094759
141
+ knn_weight: 0.45714663697057617
142
+ self_weight: 0.0034456931615672037
143
+ random_shift: 0.9438917725068359
144
+ knn_shift: 0.15229132706463983
145
+ self_shift: 0.5457784695246396
146
+ pointwise: false
147
+ num_epochs: 1
148
+ epoch_length: 1000
149
+ continue: false
150
+ checkpoint_every: 5000
151
+ log_every_iters: 250
152
+ ray_sampler:
153
+ z_near: 3
154
+ z_far: 80
155
+ sample_mode: image
156
+ resume_from: /home/fb20user12/code/bts-thesis-dino/out/features-paper/scenedino-kitti-360-sscbench-orb-slam/training_checkpoint_180000.pt
157
+ validation:
158
+ validation:
159
+ metrics:
160
+ - type: seg
161
+ agg_type: unsup_seg
162
+ args:
163
+ n_classes: 19
164
+ gt_classes: 19
165
+ - type: stego
166
+ agg_type: concat
167
+ subset:
168
+ type: random
169
+ args:
170
+ size: 32
171
+ save_best:
172
+ metric: stego_cluster_weighted_miou
173
+ update_model: true
174
+ dry_run: false
175
+ log_loss: false
176
+ global_step:
177
+ type: trainer iteration
178
+ events:
179
+ - type: ITERATION_COMPLETED
180
+ args:
181
+ every: 100
182
+ visualization_seg:
183
+ metrics: {}
184
+ subset:
185
+ type: range
186
+ args:
187
+ start: 300
188
+ end: 301
189
+ visualize:
190
+ input_imgs: null
191
+ dino_gt: null
192
+ batch_dino_gt: null
193
+ batch_dino_artifacts: null
194
+ segs_gt: null
195
+ segs_pred: null
196
+ batch_reconstructed_dino: null
197
+ batch_dino_features_kmeans: null
198
+ depth: null
199
+ log_loss: false
200
+ global_step:
201
+ type: trainer iteration
202
+ events:
203
+ - type: STARTED
204
+ args: null
205
+ - type: ITERATION_COMPLETED
206
+ args:
207
+ every: 100
208
+ downstream:
209
+ type: segmentation
210
+ n_classes: 19
211
+ gt_classes: 19
212
+ input_dim: 768
213
+ code_dim: 64
214
+ knn_neighbors: 4
215
+ buffer_size: 256
216
+ patch_sample_size: 576
217
+ mode: 3d
218
+ apply_crf: false
219
+ sweep:
220
+ study_name: orb_slam_sweep
221
+ storage_url: sqlite:////home/fb20user12/sweeps/optuna_study.db
222
+ direction: maximize
223
+ n_trials: 50
224
+ start_original_param: true
225
+ hparams:
226
+ - key: training.loss.0.random_weight
227
+ method: suggest_float
228
+ kwargs:
229
+ name: random_weight
230
+ low: 0.6
231
+ high: 0.8
232
+ - key: training.loss.0.knn_weight
233
+ method: suggest_float
234
+ kwargs:
235
+ name: knn_weight
236
+ low: 0.3
237
+ high: 0.5
238
+ - key: training.loss.0.self_weight
239
+ method: suggest_float
240
+ kwargs:
241
+ name: self_weight
242
+ low: 0.0
243
+ high: 0.2
244
+ - key: training.loss.0.random_shift
245
+ method: suggest_float
246
+ kwargs:
247
+ name: random_shift
248
+ low: 0.75
249
+ high: 0.95
250
+ - key: training.loss.0.knn_shift
251
+ method: suggest_float
252
+ kwargs:
253
+ name: knn_shift
254
+ low: 0.1
255
+ high: 0.3
256
+ - key: training.loss.0.self_shift
257
+ method: suggest_float
258
+ kwargs:
259
+ name: self_shift
260
+ low: 0.35
261
+ high: 0.55
262
+ training_type: downstream_training
263
+ mode: nvs
264
+ seed: 18
265
+ backend: null
266
+ nproc_per_node: null
267
+ with_amp: true
268
+ name: training
269
+ batch_size: 4
270
+ gradient_accum_factor: 1
271
+ num_workers: 6
272
+ output:
273
+ path: out/sweep-orb-slam/sweep_18
274
+ unique_id: sweep_18
275
+ original_path: out/sweep-orb-slam
276
+ original_unique_id: sweep
277
+ eval_seed: 13
278
+ cuda device name: Tesla V100-SXM3-32GB
seg-best-dino/checkpoint.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9d6d6ca7bd776f68e861639b56cc8b6ea42c8cc560e6711b2850cea1e15d6b01
3
+ size 758231104
seg-best-dino/training_config.yaml ADDED
@@ -0,0 +1,277 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ dataset:
2
+ type: old_KITTI_360
3
+ data_path: /home/fb20user12/datasets/KITTI-360/
4
+ pose_path: /home/fb20user12/datasets/KITTI-360/data_poses
5
+ split_path: datasets/kitti_360/splits/sscbench
6
+ image_size:
7
+ - 192
8
+ - 640
9
+ data_stereo: true
10
+ data_fisheye: true
11
+ data_fc: 2
12
+ fisheye_offset:
13
+ - 10
14
+ - 11
15
+ - 12
16
+ - 13
17
+ - 14
18
+ - 15
19
+ - 16
20
+ - 17
21
+ - 18
22
+ - 19
23
+ - 20
24
+ - 21
25
+ - 22
26
+ - 23
27
+ - 24
28
+ - 25
29
+ - 26
30
+ - 27
31
+ - 28
32
+ - 29
33
+ - 30
34
+ - 31
35
+ - 32
36
+ - 33
37
+ - 34
38
+ - 35
39
+ - 36
40
+ - 37
41
+ - 38
42
+ - 39
43
+ - 40
44
+ stereo_offset:
45
+ - 0
46
+ is_preprocessed: true
47
+ fisheye_rotation: -15
48
+ data_segmentation: true
49
+ steps_per_epoch: 10328
50
+ model:
51
+ arch: BTSNet
52
+ use_code: true
53
+ prediction_mode: default
54
+ predict_dino: true
55
+ dino_dims: 64
56
+ compensate_artifacts: false
57
+ flip_augmentation: true
58
+ encoder:
59
+ type: dinov2
60
+ mode: downsample-prediction
61
+ decoder_arch: dpt
62
+ downsampler_arch: featup
63
+ encoder_arch: vit-b
64
+ version: v1
65
+ separate_gt_version: v1
66
+ encoder_freeze: false
67
+ flip_avg_gt: true
68
+ dim_reduction_arch: mlp
69
+ num_ch_enc:
70
+ - 64
71
+ - 64
72
+ - 128
73
+ - 256
74
+ intermediate_features:
75
+ - 3
76
+ - 6
77
+ - 9
78
+ decoder_out_dim: 256
79
+ dino_pca_dim: 64
80
+ image_size:
81
+ - 192
82
+ - 640
83
+ key_features: false
84
+ code:
85
+ num_freqs: 6
86
+ freq_factor: 1.5
87
+ include_input: true
88
+ decoder_heads:
89
+ - type: resnet
90
+ name: normal_head
91
+ freeze: false
92
+ args:
93
+ n_blocks: 0
94
+ d_hidden: 128
95
+ final_prediction_head: normal_head
96
+ encoding_strategy:
97
+ name: default
98
+ args: {}
99
+ eval_encoding_strategy:
100
+ name: default
101
+ args: null
102
+ loss_renderer_strategy:
103
+ name: kitti_360
104
+ args: null
105
+ eval_loss_renderer_strategy:
106
+ name: single_renderer
107
+ args:
108
+ shuffle_frames: false
109
+ all_frames: true
110
+ inv_z: true
111
+ learn_empty: false
112
+ code_mode: z
113
+ n_frames_render: 4
114
+ sample_radius_3d: 0.5
115
+ renderer:
116
+ n_coarse: 32
117
+ n_fine: 0
118
+ n_fine_depth: 0
119
+ depth_std: 1.0
120
+ sched: []
121
+ white_bkgd: false
122
+ lindisp: true
123
+ hard_alpha_cap: true
124
+ eval_batch_size: 65536
125
+ render_mode: volumetric
126
+ normalize_dino: true
127
+ training:
128
+ optimizer:
129
+ type: adam
130
+ args:
131
+ lr: 0.001
132
+ betas:
133
+ - 0.9
134
+ - 0.999
135
+ eps: 1.0e-08
136
+ weight_decay: 0.0
137
+ amsgrad: false
138
+ loss:
139
+ - type: stego
140
+ random_weight: 0.6702352279261414
141
+ knn_weight: 0.4156436438453117
142
+ self_weight: 0.08146997886146659
143
+ random_shift: 0.8709334888837256
144
+ knn_shift: 0.18458300726748128
145
+ self_shift: 0.43610463774158115
146
+ pointwise: false
147
+ num_epochs: 1
148
+ epoch_length: 1000
149
+ resume_from: /home/fb20user12/code/bts-thesis-dino/out/paper-runs/kitti-base/training_checkpoint_130000.pt
150
+ continue: false
151
+ checkpoint_every: 5000
152
+ log_every_iters: 250
153
+ ray_sampler:
154
+ z_near: 3
155
+ z_far: 80
156
+ sample_mode: image
157
+ validation:
158
+ validation:
159
+ metrics:
160
+ - type: seg
161
+ agg_type: unsup_seg
162
+ args:
163
+ n_classes: 19
164
+ gt_classes: 19
165
+ - type: stego
166
+ agg_type: concat
167
+ subset:
168
+ type: random
169
+ args:
170
+ size: 32
171
+ save_best:
172
+ metric: stego_cluster_weighted_miou
173
+ update_model: true
174
+ dry_run: false
175
+ log_loss: false
176
+ global_step:
177
+ type: trainer iteration
178
+ events:
179
+ - type: ITERATION_COMPLETED
180
+ args:
181
+ every: 100
182
+ visualization_seg:
183
+ metrics: {}
184
+ subset:
185
+ type: range
186
+ args:
187
+ start: 300
188
+ end: 301
189
+ visualize:
190
+ input_imgs: null
191
+ dino_gt: null
192
+ batch_dino_gt: null
193
+ batch_dino_artifacts: null
194
+ segs_gt: null
195
+ segs_pred: null
196
+ batch_reconstructed_dino: null
197
+ batch_dino_features_kmeans: null
198
+ depth: null
199
+ log_loss: false
200
+ global_step:
201
+ type: trainer iteration
202
+ events:
203
+ - type: STARTED
204
+ args: null
205
+ - type: ITERATION_COMPLETED
206
+ args:
207
+ every: 100
208
+ downstream:
209
+ type: segmentation
210
+ n_classes: 19
211
+ gt_classes: 19
212
+ input_dim: 768
213
+ code_dim: 64
214
+ knn_neighbors: 4
215
+ buffer_size: 256
216
+ patch_sample_size: 576
217
+ mode: 3d
218
+ sweep:
219
+ study_name: sweep_pruned_offset_0
220
+ storage_url: sqlite:////home/fb20user12/sweeps/optuna_study.db
221
+ direction: maximize
222
+ n_trials: 100
223
+ start_original_param: true
224
+ hparams:
225
+ - key: training.loss.0.random_weight
226
+ method: suggest_float
227
+ kwargs:
228
+ name: random_weight
229
+ low: 0.0
230
+ high: 1.0
231
+ - key: training.loss.0.knn_weight
232
+ method: suggest_float
233
+ kwargs:
234
+ name: knn_weight
235
+ low: 0.0
236
+ high: 1.0
237
+ - key: training.loss.0.self_weight
238
+ method: suggest_float
239
+ kwargs:
240
+ name: self_weight
241
+ low: 0.0
242
+ high: 1.0
243
+ - key: training.loss.0.random_shift
244
+ method: suggest_float
245
+ kwargs:
246
+ name: random_shift
247
+ low: 0.6
248
+ high: 1.0
249
+ - key: training.loss.0.knn_shift
250
+ method: suggest_float
251
+ kwargs:
252
+ name: knn_shift
253
+ low: 0.0
254
+ high: 0.8
255
+ - key: training.loss.0.self_shift
256
+ method: suggest_float
257
+ kwargs:
258
+ name: self_shift
259
+ low: 0.0
260
+ high: 0.8
261
+ training_type: downstream_training
262
+ mode: nvs
263
+ seed: 34
264
+ backend: null
265
+ nproc_per_node: null
266
+ with_amp: true
267
+ name: training
268
+ batch_size: 4
269
+ gradient_accum_factor: 1
270
+ num_workers: 4
271
+ output:
272
+ path: out/sweep_pruned_offset_0/sweep_34
273
+ unique_id: sweep_34
274
+ original_path: out/sweep_pruned_offset_0/
275
+ original_unique_id: sweep
276
+ eval_seed: 33
277
+ cuda device name: Tesla V100-SXM3-32GB
seg-best-dinov2/checkpoint.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7754f0e8b4476eae0531d089824892b8d4bb70161f0498bf70b1467a6605e218
3
+ size 753457438
seg-best-dinov2/training_config.yaml ADDED
@@ -0,0 +1,277 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ dataset:
2
+ type: old_KITTI_360
3
+ data_path: /home/fb20user12/datasets/KITTI-360/
4
+ pose_path: /home/fb20user12/datasets/KITTI-360/data_poses
5
+ split_path: datasets/kitti_360/splits/sscbench
6
+ image_size:
7
+ - 192
8
+ - 640
9
+ data_stereo: true
10
+ data_fisheye: true
11
+ data_fc: 2
12
+ fisheye_offset:
13
+ - 10
14
+ - 11
15
+ - 12
16
+ - 13
17
+ - 14
18
+ - 15
19
+ - 16
20
+ - 17
21
+ - 18
22
+ - 19
23
+ - 20
24
+ - 21
25
+ - 22
26
+ - 23
27
+ - 24
28
+ - 25
29
+ - 26
30
+ - 27
31
+ - 28
32
+ - 29
33
+ - 30
34
+ - 31
35
+ - 32
36
+ - 33
37
+ - 34
38
+ - 35
39
+ - 36
40
+ - 37
41
+ - 38
42
+ - 39
43
+ - 40
44
+ stereo_offset:
45
+ - 0
46
+ is_preprocessed: true
47
+ fisheye_rotation: -15
48
+ data_segmentation: true
49
+ steps_per_epoch: 5164
50
+ model:
51
+ arch: BTSNet
52
+ use_code: true
53
+ prediction_mode: default
54
+ predict_dino: true
55
+ dino_dims: 64
56
+ compensate_artifacts: true
57
+ flip_augmentation: true
58
+ encoder:
59
+ type: dinov2
60
+ mode: downsample-prediction
61
+ decoder_arch: dpt
62
+ downsampler_arch: featup
63
+ encoder_arch: vit-b
64
+ version: v2
65
+ separate_gt_version: v2
66
+ encoder_freeze: false
67
+ flip_avg_gt: false
68
+ dim_reduction_arch: mlp
69
+ num_ch_enc:
70
+ - 64
71
+ - 64
72
+ - 128
73
+ - 256
74
+ intermediate_features:
75
+ - 3
76
+ - 6
77
+ - 9
78
+ decoder_out_dim: 256
79
+ dino_pca_dim: 64
80
+ image_size:
81
+ - 192
82
+ - 640
83
+ key_features: false
84
+ code:
85
+ num_freqs: 6
86
+ freq_factor: 1.5
87
+ include_input: true
88
+ decoder_heads:
89
+ - type: resnet
90
+ name: normal_head
91
+ freeze: false
92
+ args:
93
+ n_blocks: 0
94
+ d_hidden: 128
95
+ final_prediction_head: normal_head
96
+ encoding_strategy:
97
+ name: default
98
+ args: {}
99
+ eval_encoding_strategy:
100
+ name: default
101
+ args: null
102
+ loss_renderer_strategy:
103
+ name: kitti_360
104
+ args: null
105
+ eval_loss_renderer_strategy:
106
+ name: single_renderer
107
+ args:
108
+ shuffle_frames: false
109
+ all_frames: true
110
+ inv_z: true
111
+ learn_empty: false
112
+ code_mode: z
113
+ n_frames_render: 4
114
+ sample_radius_3d: 0.5
115
+ renderer:
116
+ n_coarse: 32
117
+ n_fine: 0
118
+ n_fine_depth: 0
119
+ depth_std: 1.0
120
+ sched: []
121
+ white_bkgd: false
122
+ lindisp: true
123
+ hard_alpha_cap: true
124
+ eval_batch_size: 65536
125
+ render_mode: volumetric
126
+ normalize_dino: true
127
+ training:
128
+ optimizer:
129
+ type: adam
130
+ args:
131
+ lr: 0.0005
132
+ betas:
133
+ - 0.9
134
+ - 0.999
135
+ eps: 1.0e-08
136
+ weight_decay: 0.0
137
+ amsgrad: false
138
+ loss:
139
+ - type: stego
140
+ random_weight: 0.7681858818342623
141
+ knn_weight: 0.40262895957374445
142
+ self_weight: 0.2478902214214737
143
+ random_shift: 0.8167245534406465
144
+ knn_shift: 0.11229105513980008
145
+ self_shift: 0.5397087004143353
146
+ pointwise: false
147
+ num_epochs: 1
148
+ epoch_length: 1000
149
+ resume_from: /home/fb20user12/code/bts-thesis-dino/out/paper-runs/kitti-dinov2/training_checkpoint_210000.pt
150
+ continue: false
151
+ checkpoint_every: 5000
152
+ log_every_iters: 250
153
+ ray_sampler:
154
+ z_near: 3
155
+ z_far: 80
156
+ sample_mode: image
157
+ validation:
158
+ validation:
159
+ metrics:
160
+ - type: seg
161
+ agg_type: unsup_seg
162
+ args:
163
+ n_classes: 19
164
+ gt_classes: 19
165
+ - type: stego
166
+ agg_type: concat
167
+ subset:
168
+ type: random
169
+ args:
170
+ size: 32
171
+ save_best:
172
+ metric: stego_cluster_weighted_miou
173
+ update_model: true
174
+ dry_run: false
175
+ log_loss: false
176
+ global_step:
177
+ type: trainer iteration
178
+ events:
179
+ - type: ITERATION_COMPLETED
180
+ args:
181
+ every: 100
182
+ visualization_seg:
183
+ metrics: {}
184
+ subset:
185
+ type: range
186
+ args:
187
+ start: 300
188
+ end: 301
189
+ visualize:
190
+ input_imgs: null
191
+ dino_gt: null
192
+ batch_dino_gt: null
193
+ batch_dino_artifacts: null
194
+ segs_gt: null
195
+ segs_pred: null
196
+ batch_reconstructed_dino: null
197
+ batch_dino_features_kmeans: null
198
+ depth: null
199
+ log_loss: false
200
+ global_step:
201
+ type: trainer iteration
202
+ events:
203
+ - type: STARTED
204
+ args: null
205
+ - type: ITERATION_COMPLETED
206
+ args:
207
+ every: 100
208
+ downstream:
209
+ type: segmentation
210
+ n_classes: 19
211
+ gt_classes: 19
212
+ input_dim: 768
213
+ code_dim: 64
214
+ knn_neighbors: 4
215
+ buffer_size: 256
216
+ patch_sample_size: 576
217
+ mode: 3d
218
+ sweep:
219
+ study_name: sweep_dinov2
220
+ storage_url: sqlite:////home/fb20user12/sweeps/optuna_study.db
221
+ direction: maximize
222
+ n_trials: 50
223
+ start_original_param: true
224
+ hparams:
225
+ - key: training.loss.0.random_weight
226
+ method: suggest_float
227
+ kwargs:
228
+ name: random_weight
229
+ low: 0.0
230
+ high: 1.0
231
+ - key: training.loss.0.knn_weight
232
+ method: suggest_float
233
+ kwargs:
234
+ name: knn_weight
235
+ low: 0.0
236
+ high: 1.0
237
+ - key: training.loss.0.self_weight
238
+ method: suggest_float
239
+ kwargs:
240
+ name: self_weight
241
+ low: 0.0
242
+ high: 1.0
243
+ - key: training.loss.0.random_shift
244
+ method: suggest_float
245
+ kwargs:
246
+ name: random_shift
247
+ low: 0.6
248
+ high: 1.0
249
+ - key: training.loss.0.knn_shift
250
+ method: suggest_float
251
+ kwargs:
252
+ name: knn_shift
253
+ low: 0.0
254
+ high: 0.4
255
+ - key: training.loss.0.self_shift
256
+ method: suggest_float
257
+ kwargs:
258
+ name: self_shift
259
+ low: 0.2
260
+ high: 0.6
261
+ training_type: downstream_training
262
+ mode: nvs
263
+ seed: 66
264
+ backend: null
265
+ nproc_per_node: null
266
+ with_amp: true
267
+ name: training
268
+ batch_size: 8
269
+ gradient_accum_factor: 1
270
+ num_workers: 8
271
+ output:
272
+ path: out/sweep_dinov2/sweep_66
273
+ unique_id: sweep_66
274
+ original_path: out/sweep_dinov2/
275
+ original_unique_id: sweep
276
+ eval_seed: 65
277
+ cuda device name: Tesla V100-SXM3-32GB