sbchoi committed on
Commit
1e8a4a9
1 Parent(s): cd6c2e8

Add config from convert_rt_detr_original_pytorch_checkpoint_to_pytorch.py

Browse files
Files changed (1) hide show
  1. config.json +20 -35
config.json CHANGED
@@ -10,6 +10,26 @@
10
  ],
11
  "attention_dropout": 0.0,
12
  "auxiliary_loss": true,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
13
  "batch_norm_eps": 1e-05,
14
  "box_noise_scale": 1.0,
15
  "d_model": 256,
@@ -23,17 +43,8 @@
23
  ],
24
  "decoder_layers": 4,
25
  "decoder_n_points": 4,
26
- "depths": [
27
- 3,
28
- 4,
29
- 6,
30
- 3
31
- ],
32
  "disable_custom_kernels": true,
33
- "downsample_in_bottleneck": false,
34
- "downsample_in_first_stage": false,
35
  "dropout": 0.0,
36
- "embedding_size": 64,
37
  "encode_proj_layers": [
38
  2
39
  ],
@@ -56,14 +67,7 @@
56
  ],
57
  "focal_loss_alpha": 0.75,
58
  "focal_loss_gamma": 2.0,
59
- "hidden_act": "relu",
60
  "hidden_expansion": 0.5,
61
- "hidden_sizes": [
62
- 64,
63
- 128,
64
- 256,
65
- 512
66
- ],
67
  "id2label": {
68
  "0": "person",
69
  "1": "bicycle",
@@ -232,7 +236,6 @@
232
  },
233
  "label_noise_ratio": 0.5,
234
  "layer_norm_eps": 1e-05,
235
- "layer_type": "basic",
236
  "learn_initial_query": false,
237
  "matcher_alpha": 0.25,
238
  "matcher_bbox_cost": 5.0,
@@ -241,28 +244,10 @@
241
  "matcher_giou_cost": 2.0,
242
  "model_type": "rt_detr",
243
  "normalize_before": false,
244
- "num_channels": 3,
245
  "num_denoising": 100,
246
  "num_feature_levels": 3,
247
  "num_queries": 300,
248
- "out_features": [
249
- "stage2",
250
- "stage3",
251
- "stage4"
252
- ],
253
- "out_indices": [
254
- 2,
255
- 3,
256
- 4
257
- ],
258
  "positional_encoding_temperature": 10000,
259
- "stage_names": [
260
- "stem",
261
- "stage1",
262
- "stage2",
263
- "stage3",
264
- "stage4"
265
- ],
266
  "torch_dtype": "float32",
267
  "transformers_version": "4.42.0.dev0",
268
  "use_focal_loss": true,
 
10
  ],
11
  "attention_dropout": 0.0,
12
  "auxiliary_loss": true,
13
+ "backbone_config": {
14
+ "hidden_sizes": [
15
+ 64,
16
+ 128,
17
+ 256,
18
+ 512
19
+ ],
20
+ "layer_type": "basic",
21
+ "model_type": "rtdetr-resnet",
22
+ "out_features": [
23
+ "stage2",
24
+ "stage3",
25
+ "stage4"
26
+ ],
27
+ "out_indices": [
28
+ 2,
29
+ 3,
30
+ 4
31
+ ]
32
+ },
33
  "batch_norm_eps": 1e-05,
34
  "box_noise_scale": 1.0,
35
  "d_model": 256,
 
43
  ],
44
  "decoder_layers": 4,
45
  "decoder_n_points": 4,
 
 
 
 
 
 
46
  "disable_custom_kernels": true,
 
 
47
  "dropout": 0.0,
 
48
  "encode_proj_layers": [
49
  2
50
  ],
 
67
  ],
68
  "focal_loss_alpha": 0.75,
69
  "focal_loss_gamma": 2.0,
 
70
  "hidden_expansion": 0.5,
 
 
 
 
 
 
71
  "id2label": {
72
  "0": "person",
73
  "1": "bicycle",
 
236
  },
237
  "label_noise_ratio": 0.5,
238
  "layer_norm_eps": 1e-05,
 
239
  "learn_initial_query": false,
240
  "matcher_alpha": 0.25,
241
  "matcher_bbox_cost": 5.0,
 
244
  "matcher_giou_cost": 2.0,
245
  "model_type": "rt_detr",
246
  "normalize_before": false,
 
247
  "num_denoising": 100,
248
  "num_feature_levels": 3,
249
  "num_queries": 300,
 
 
 
 
 
 
 
 
 
 
250
  "positional_encoding_temperature": 10000,
 
 
 
 
 
 
 
251
  "torch_dtype": "float32",
252
  "transformers_version": "4.42.0.dev0",
253
  "use_focal_loss": true,