AndreasLH commited on
Commit
e04700e
·
verified ·
1 Parent(s): f0eb5b4

Upload model and baseline model

Browse files
Baseline_sgd/category_meta.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"thing_classes": ["pedestrian", "car", "cyclist", "van", "truck", "traffic cone", "barrier", "motorcycle", "bicycle", "bus", "trailer", "books", "bottle", "camera", "cereal box", "chair", "cup", "laptop", "shoes", "towel", "blinds", "window", "lamp", "shelves", "mirror", "sink", "cabinet", "bathtub", "door", "toilet", "desk", "box", "bookcase", "picture", "table", "counter", "bed", "night stand", "pillow", "sofa", "television", "floor mat", "curtain", "clothes", "stationery", "refrigerator", "bin", "stove", "oven", "machine"], "thing_dataset_id_to_contiguous_id": {"0": 0, "1": 1, "3": 2, "4": 3, "5": 4, "8": 5, "9": 6, "10": 7, "11": 8, "12": 9, "13": 10, "14": 11, "15": 12, "16": 13, "17": 14, "18": 15, "19": 16, "20": 17, "21": 18, "22": 19, "23": 20, "24": 21, "25": 22, "26": 23, "27": 24, "28": 25, "29": 26, "30": 27, "31": 28, "32": 29, "33": 30, "34": 31, "35": 32, "36": 33, "37": 34, "38": 35, "39": 36, "40": 37, "42": 38, "43": 39, "44": 40, "45": 41, "46": 42, "47": 43, "48": 44, "49": 45, "52": 46, "53": 47, "57": 48, "61": 49}}
Baseline_sgd/config.yaml ADDED
@@ -0,0 +1,454 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ CUDNN_BENCHMARK: false
2
+ DATALOADER:
3
+ ASPECT_RATIO_GROUPING: true
4
+ BALANCE_DATASETS: false
5
+ FILTER_EMPTY_ANNOTATIONS: true
6
+ NUM_WORKERS: 4
7
+ REPEAT_THRESHOLD: 0.1
8
+ SAMPLER_TRAIN: RepeatFactorTrainingSampler
9
+ DATASETS:
10
+ CATEGORY_NAMES:
11
+ - chair
12
+ - table
13
+ - cabinet
14
+ - car
15
+ - lamp
16
+ - books
17
+ - sofa
18
+ - pedestrian
19
+ - picture
20
+ - window
21
+ - pillow
22
+ - truck
23
+ - door
24
+ - blinds
25
+ - sink
26
+ - shelves
27
+ - television
28
+ - shoes
29
+ - cup
30
+ - bottle
31
+ - bookcase
32
+ - laptop
33
+ - desk
34
+ - cereal box
35
+ - floor mat
36
+ - traffic cone
37
+ - mirror
38
+ - barrier
39
+ - counter
40
+ - camera
41
+ - bicycle
42
+ - toilet
43
+ - bus
44
+ - bed
45
+ - refrigerator
46
+ - trailer
47
+ - box
48
+ - oven
49
+ - clothes
50
+ - van
51
+ - towel
52
+ - motorcycle
53
+ - night stand
54
+ - stove
55
+ - machine
56
+ - stationery
57
+ - bathtub
58
+ - cyclist
59
+ - curtain
60
+ - bin
61
+ IGNORE_NAMES:
62
+ - dontcare
63
+ - ignore
64
+ - void
65
+ MAX_DEPTH: 100000000.0
66
+ MIN_HEIGHT_THRES: 0.05
67
+ MODAL_2D_BOXES: false
68
+ PRECOMPUTED_PROPOSAL_TOPK_TEST: 1000
69
+ PRECOMPUTED_PROPOSAL_TOPK_TRAIN: 2000
70
+ PROPOSAL_FILES_TEST: []
71
+ PROPOSAL_FILES_TRAIN: []
72
+ TEST:
73
+ - SUNRGBD_test_mini
74
+ TRAIN:
75
+ - SUNRGBD_train_mini
76
+ - SUNRGBD_val_mini
77
+ TRUNCATION_THRES: 0.75
78
+ TRUNC_2D_BOXES: true
79
+ VISIBILITY_THRES: 0.25
80
+ GLOBAL:
81
+ HACK: 1.0
82
+ INPUT:
83
+ CROP:
84
+ ENABLED: false
85
+ SIZE:
86
+ - 0.9
87
+ - 0.9
88
+ TYPE: relative_range
89
+ FORMAT: BGR
90
+ MASK_FORMAT: polygon
91
+ MAX_SIZE_TEST: 4096
92
+ MAX_SIZE_TRAIN: 4096
93
+ MIN_SIZE_TEST: 512
94
+ MIN_SIZE_TRAIN:
95
+ - 256
96
+ - 272
97
+ - 288
98
+ - 304
99
+ - 320
100
+ - 336
101
+ - 352
102
+ - 368
103
+ - 384
104
+ - 400
105
+ - 416
106
+ - 432
107
+ - 448
108
+ - 464
109
+ - 480
110
+ - 496
111
+ - 512
112
+ - 528
113
+ - 544
114
+ - 560
115
+ - 576
116
+ - 592
117
+ - 608
118
+ - 624
119
+ - 640
120
+ MIN_SIZE_TRAIN_SAMPLING: choice
121
+ RANDOM_FLIP: horizontal
122
+ MODEL:
123
+ ANCHOR_GENERATOR:
124
+ ANGLES:
125
+ - - -90
126
+ - 0
127
+ - 90
128
+ ASPECT_RATIOS:
129
+ - - 0.5
130
+ - 1.0
131
+ - 2.0
132
+ NAME: DefaultAnchorGenerator
133
+ OFFSET: 0.0
134
+ SIZES:
135
+ - - 32
136
+ - - 64
137
+ - - 128
138
+ - - 256
139
+ - - 512
140
+ BACKBONE:
141
+ FREEZE_AT: 0
142
+ NAME: build_dla_from_vision_fpn_backbone
143
+ DEVICE: cpu
144
+ DLA:
145
+ TRICKS: false
146
+ TYPE: dla34
147
+ FPN:
148
+ FUSE_TYPE: sum
149
+ IN_FEATURES:
150
+ - p2
151
+ - p3
152
+ - p4
153
+ - p5
154
+ - p6
155
+ NORM: ''
156
+ OUT_CHANNELS: 256
157
+ KEYPOINT_ON: false
158
+ LOAD_PROPOSALS: false
159
+ MASK_ON: false
160
+ META_ARCHITECTURE: RCNN3D
161
+ PANOPTIC_FPN:
162
+ COMBINE:
163
+ ENABLED: true
164
+ INSTANCES_CONFIDENCE_THRESH: 0.5
165
+ OVERLAP_THRESH: 0.5
166
+ STUFF_AREA_LIMIT: 4096
167
+ INSTANCE_LOSS_WEIGHT: 1.0
168
+ PIXEL_MEAN:
169
+ - 103.53
170
+ - 116.28
171
+ - 123.675
172
+ PIXEL_STD:
173
+ - 57.375
174
+ - 57.12
175
+ - 58.395
176
+ PROPOSAL_GENERATOR:
177
+ MIN_SIZE: 0
178
+ NAME: RPNWithIgnore
179
+ RESNETS:
180
+ DEFORM_MODULATED: false
181
+ DEFORM_NUM_GROUPS: 1
182
+ DEFORM_ON_PER_STAGE:
183
+ - false
184
+ - false
185
+ - false
186
+ - false
187
+ DEPTH: 50
188
+ NORM: FrozenBN
189
+ NUM_GROUPS: 1
190
+ OUT_FEATURES:
191
+ - res4
192
+ RES2_OUT_CHANNELS: 256
193
+ RES5_DILATION: 1
194
+ STEM_OUT_CHANNELS: 64
195
+ STRIDE_IN_1X1: true
196
+ TORCHVISION: true
197
+ WIDTH_PER_GROUP: 64
198
+ RETINANET:
199
+ BBOX_REG_LOSS_TYPE: smooth_l1
200
+ BBOX_REG_WEIGHTS: &id002
201
+ - 1.0
202
+ - 1.0
203
+ - 1.0
204
+ - 1.0
205
+ FOCAL_LOSS_ALPHA: 0.25
206
+ FOCAL_LOSS_GAMMA: 2.0
207
+ IN_FEATURES:
208
+ - p3
209
+ - p4
210
+ - p5
211
+ - p6
212
+ - p7
213
+ IOU_LABELS:
214
+ - 0
215
+ - -1
216
+ - 1
217
+ IOU_THRESHOLDS:
218
+ - 0.4
219
+ - 0.5
220
+ NMS_THRESH_TEST: 0.5
221
+ NORM: ''
222
+ NUM_CLASSES: 80
223
+ NUM_CONVS: 4
224
+ PRIOR_PROB: 0.01
225
+ SCORE_THRESH_TEST: 0.05
226
+ SMOOTH_L1_LOSS_BETA: 0.1
227
+ TOPK_CANDIDATES_TEST: 1000
228
+ ROI_BOX_CASCADE_HEAD:
229
+ BBOX_REG_WEIGHTS:
230
+ - &id001
231
+ - 10.0
232
+ - 10.0
233
+ - 5.0
234
+ - 5.0
235
+ - - 20.0
236
+ - 20.0
237
+ - 10.0
238
+ - 10.0
239
+ - - 30.0
240
+ - 30.0
241
+ - 15.0
242
+ - 15.0
243
+ IOUS:
244
+ - 0.5
245
+ - 0.6
246
+ - 0.7
247
+ ROI_BOX_HEAD:
248
+ BBOX_REG_LOSS_TYPE: smooth_l1
249
+ BBOX_REG_LOSS_WEIGHT: 1.0
250
+ BBOX_REG_WEIGHTS: *id001
251
+ CLS_AGNOSTIC_BBOX_REG: false
252
+ CONV_DIM: 256
253
+ FC_DIM: 1024
254
+ FED_LOSS_FREQ_WEIGHT_POWER: 0.5
255
+ FED_LOSS_NUM_CLASSES: 50
256
+ NAME: FastRCNNConvFCHead
257
+ NORM: ''
258
+ NUM_CONV: 0
259
+ NUM_FC: 2
260
+ POOLER_RESOLUTION: 7
261
+ POOLER_SAMPLING_RATIO: 0
262
+ POOLER_TYPE: ROIAlignV2
263
+ SMOOTH_L1_BETA: 0.0
264
+ TRAIN_ON_PRED_BOXES: false
265
+ USE_FED_LOSS: false
266
+ USE_SIGMOID_CE: false
267
+ ROI_CUBE_HEAD:
268
+ ALLOCENTRIC_POSE: true
269
+ CHAMFER_POSE: true
270
+ CLUSTER_BINS: 1
271
+ CONV_DIM: 256
272
+ DIMS_PRIORS_ENABLED: true
273
+ DIMS_PRIORS_FUNC: exp
274
+ DIMS_PRIORS_PRECOMPUTED: false
275
+ DISENTANGLED_LOSS: true
276
+ FC_DIM: 1024
277
+ INVERSE_Z_WEIGHT: false
278
+ LOSS_W_3D: 1.0
279
+ LOSS_W_DIMS: 1.0
280
+ LOSS_W_JOINT: 1.0
281
+ LOSS_W_POSE: 1.0
282
+ LOSS_W_XY: 1.0
283
+ LOSS_W_Z: 1.0
284
+ NAME: CubeHead
285
+ NUM_CONV: 0
286
+ NUM_FC: 2
287
+ POOLER_RESOLUTION: 7
288
+ POOLER_SAMPLING_RATIO: 0
289
+ POOLER_TYPE: ROIAlignV2
290
+ POSE_TYPE: 6d
291
+ SCALE_ROI_BOXES: 0.0
292
+ SHARED_FC: true
293
+ TEST: blasss
294
+ USE_CONFIDENCE: 1.0
295
+ VIRTUAL_DEPTH: true
296
+ VIRTUAL_FOCAL: 512.0
297
+ Z_TYPE: direct
298
+ ROI_HEADS:
299
+ BATCH_SIZE_PER_IMAGE: 512
300
+ IN_FEATURES:
301
+ - p2
302
+ - p3
303
+ - p4
304
+ - p5
305
+ - p6
306
+ IOU_LABELS:
307
+ - 0
308
+ - 1
309
+ IOU_THRESHOLDS:
310
+ - 0.5
311
+ NAME: ROIHeads3D
312
+ NMS_THRESH_TEST: 0.5
313
+ NUM_CLASSES: 50
314
+ POSITIVE_FRACTION: 0.25
315
+ PROPOSAL_APPEND_GT: true
316
+ SCORE_THRESH_TEST: 0.01
317
+ ROI_KEYPOINT_HEAD:
318
+ CONV_DIMS:
319
+ - 512
320
+ - 512
321
+ - 512
322
+ - 512
323
+ - 512
324
+ - 512
325
+ - 512
326
+ - 512
327
+ LOSS_WEIGHT: 1.0
328
+ MIN_KEYPOINTS_PER_IMAGE: 1
329
+ NAME: KRCNNConvDeconvUpsampleHead
330
+ NORMALIZE_LOSS_BY_VISIBLE_KEYPOINTS: true
331
+ NUM_KEYPOINTS: 17
332
+ POOLER_RESOLUTION: 14
333
+ POOLER_SAMPLING_RATIO: 0
334
+ POOLER_TYPE: ROIAlignV2
335
+ ROI_MASK_HEAD:
336
+ CLS_AGNOSTIC_MASK: false
337
+ CONV_DIM: 256
338
+ NAME: MaskRCNNConvUpsampleHead
339
+ NORM: ''
340
+ NUM_CONV: 0
341
+ POOLER_RESOLUTION: 14
342
+ POOLER_SAMPLING_RATIO: 0
343
+ POOLER_TYPE: ROIAlignV2
344
+ RPN:
345
+ BATCH_SIZE_PER_IMAGE: 256
346
+ BBOX_REG_LOSS_TYPE: smooth_l1
347
+ BBOX_REG_LOSS_WEIGHT: 1.0
348
+ BBOX_REG_WEIGHTS: *id002
349
+ BOUNDARY_THRESH: -1
350
+ CONV_DIMS:
351
+ - -1
352
+ HEAD_NAME: StandardRPNHead
353
+ IGNORE_THRESHOLD: 0.5
354
+ IN_FEATURES:
355
+ - p2
356
+ - p3
357
+ - p4
358
+ - p5
359
+ - p6
360
+ IOU_LABELS:
361
+ - 0
362
+ - -1
363
+ - 1
364
+ IOU_THRESHOLDS:
365
+ - 0.05
366
+ - 0.05
367
+ LOSS_WEIGHT: 1.0
368
+ NMS_THRESH: 0.7
369
+ OBJECTNESS_UNCERTAINTY: IoUness
370
+ POSITIVE_FRACTION: 1.0
371
+ POST_NMS_TOPK_TEST: 1000
372
+ POST_NMS_TOPK_TRAIN: 1000
373
+ PRE_NMS_TOPK_TEST: 1000
374
+ PRE_NMS_TOPK_TRAIN: 2000
375
+ SMOOTH_L1_BETA: 0.0
376
+ SEM_SEG_HEAD:
377
+ COMMON_STRIDE: 4
378
+ CONVS_DIM: 128
379
+ IGNORE_VALUE: 255
380
+ IN_FEATURES:
381
+ - p2
382
+ - p3
383
+ - p4
384
+ - p5
385
+ LOSS_WEIGHT: 1.0
386
+ NAME: SemSegFPNHead
387
+ NORM: GN
388
+ NUM_CLASSES: 54
389
+ STABILIZE: 0.02
390
+ USE_BN: true
391
+ WEIGHTS: ''
392
+ WEIGHTS_PRETRAIN: ''
393
+ OUTPUT_DIR: output/Baseline_sgd
394
+ PLOT:
395
+ OUTPUT_DIR: ''
396
+ RECALL_SCORES: false
397
+ SEED: 12
398
+ SOLVER:
399
+ AMP:
400
+ ENABLED: false
401
+ BASE_LR: 0.0214
402
+ BASE_LR_END: 0.0
403
+ BIAS_LR_FACTOR: 1.0
404
+ CHECKPOINT_PERIOD: 5000
405
+ CLIP_GRADIENTS:
406
+ CLIP_TYPE: value
407
+ CLIP_VALUE: 1.0
408
+ ENABLED: false
409
+ NORM_TYPE: 2.0
410
+ GAMMA: 0.1
411
+ IMS_PER_BATCH: 2
412
+ LR_SCHEDULER_NAME: WarmupMultiStepLR
413
+ MAX_ITER: 100000
414
+ MOMENTUM: 0.9
415
+ NESTEROV: false
416
+ NUM_DECAYS: 3
417
+ REFERENCE_WORLD_SIZE: 0
418
+ RESCALE_INTERVAL: false
419
+ STEPS:
420
+ - 17280
421
+ - 23040
422
+ TYPE: sgd
423
+ WARMUP_FACTOR: 0.001
424
+ WARMUP_ITERS: 0
425
+ WARMUP_METHOD: linear
426
+ WEIGHT_DECAY: 0.0001
427
+ WEIGHT_DECAY_BIAS: null
428
+ WEIGHT_DECAY_NORM: 0.0
429
+ TEST:
430
+ AUG:
431
+ ENABLED: false
432
+ FLIP: true
433
+ MAX_SIZE: 4000
434
+ MIN_SIZES:
435
+ - 400
436
+ - 500
437
+ - 600
438
+ - 700
439
+ - 800
440
+ - 900
441
+ - 1000
442
+ - 1100
443
+ - 1200
444
+ DETECTIONS_PER_IMAGE: 100
445
+ EVAL_PERIOD: 7200
446
+ EXPECTED_RESULTS: []
447
+ KEYPOINT_OKS_SIGMAS: []
448
+ PRECISE_BN:
449
+ ENABLED: false
450
+ NUM_ITER: 200
451
+ TRUNCATION_THRES: 0.33333333
452
+ VISIBILITY_THRES: 0.33333333
453
+ VERSION: 2
454
+ VIS_PERIOD: 1
Baseline_sgd/last_checkpoint ADDED
@@ -0,0 +1 @@
 
 
1
+ model_final.pth
Baseline_sgd/log.txt ADDED
The diff for this file is too large to render. See raw diff
 
Baseline_sgd/metrics.json ADDED
The diff for this file is too large to render. See raw diff
 
Baseline_sgd/model_final.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a2a7d91bfc42b0aa700623efa6ef7641fa9c613c70c854fc9aec75d27ab3f630
3
+ size 383337788
weak cube r-cnn/model_final.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3864e8b2f5a7c0413a271cdb90c5ff5052660ffbe03cbc0f619e3f3977b9458d
3
+ size 383338812