sbchoi committed on
Commit
6155b9e
1 Parent(s): a18681d

Add config from convert_rt_detr_original_pytorch_checkpoint_to_pytorch.py

Browse files
Files changed (1) hide show
  1. config.json +19 -35
config.json CHANGED
@@ -10,6 +10,25 @@
10
  ],
11
  "attention_dropout": 0.0,
12
  "auxiliary_loss": true,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
13
  "batch_norm_eps": 1e-05,
14
  "box_noise_scale": 1.0,
15
  "d_model": 256,
@@ -23,17 +42,8 @@
23
  ],
24
  "decoder_layers": 6,
25
  "decoder_n_points": 4,
26
- "depths": [
27
- 3,
28
- 4,
29
- 23,
30
- 3
31
- ],
32
  "disable_custom_kernels": true,
33
- "downsample_in_bottleneck": false,
34
- "downsample_in_first_stage": false,
35
  "dropout": 0.0,
36
- "embedding_size": 64,
37
  "encode_proj_layers": [
38
  2
39
  ],
@@ -56,14 +66,7 @@
56
  ],
57
  "focal_loss_alpha": 0.75,
58
  "focal_loss_gamma": 2.0,
59
- "hidden_act": "relu",
60
  "hidden_expansion": 1.0,
61
- "hidden_sizes": [
62
- 256,
63
- 512,
64
- 1024,
65
- 2048
66
- ],
67
  "id2label": {
68
  "0": "person",
69
  "1": "bicycle",
@@ -232,7 +235,6 @@
232
  },
233
  "label_noise_ratio": 0.5,
234
  "layer_norm_eps": 1e-05,
235
- "layer_type": "bottleneck",
236
  "learn_initial_query": false,
237
  "matcher_alpha": 0.25,
238
  "matcher_bbox_cost": 5.0,
@@ -241,28 +243,10 @@
241
  "matcher_giou_cost": 2.0,
242
  "model_type": "rt_detr",
243
  "normalize_before": false,
244
- "num_channels": 3,
245
  "num_denoising": 100,
246
  "num_feature_levels": 3,
247
  "num_queries": 300,
248
- "out_features": [
249
- "stage2",
250
- "stage3",
251
- "stage4"
252
- ],
253
- "out_indices": [
254
- 2,
255
- 3,
256
- 4
257
- ],
258
  "positional_encoding_temperature": 10000,
259
- "stage_names": [
260
- "stem",
261
- "stage1",
262
- "stage2",
263
- "stage3",
264
- "stage4"
265
- ],
266
  "torch_dtype": "float32",
267
  "transformers_version": "4.42.0.dev0",
268
  "use_focal_loss": true,
 
10
  ],
11
  "attention_dropout": 0.0,
12
  "auxiliary_loss": true,
13
+ "backbone_config": {
14
+ "depths": [
15
+ 3,
16
+ 4,
17
+ 23,
18
+ 3
19
+ ],
20
+ "model_type": "rtdetr-resnet",
21
+ "out_features": [
22
+ "stage2",
23
+ "stage3",
24
+ "stage4"
25
+ ],
26
+ "out_indices": [
27
+ 2,
28
+ 3,
29
+ 4
30
+ ]
31
+ },
32
  "batch_norm_eps": 1e-05,
33
  "box_noise_scale": 1.0,
34
  "d_model": 256,
 
42
  ],
43
  "decoder_layers": 6,
44
  "decoder_n_points": 4,
 
 
 
 
 
 
45
  "disable_custom_kernels": true,
 
 
46
  "dropout": 0.0,
 
47
  "encode_proj_layers": [
48
  2
49
  ],
 
66
  ],
67
  "focal_loss_alpha": 0.75,
68
  "focal_loss_gamma": 2.0,
 
69
  "hidden_expansion": 1.0,
 
 
 
 
 
 
70
  "id2label": {
71
  "0": "person",
72
  "1": "bicycle",
 
235
  },
236
  "label_noise_ratio": 0.5,
237
  "layer_norm_eps": 1e-05,
 
238
  "learn_initial_query": false,
239
  "matcher_alpha": 0.25,
240
  "matcher_bbox_cost": 5.0,
 
243
  "matcher_giou_cost": 2.0,
244
  "model_type": "rt_detr",
245
  "normalize_before": false,
 
246
  "num_denoising": 100,
247
  "num_feature_levels": 3,
248
  "num_queries": 300,
 
 
 
 
 
 
 
 
 
 
249
  "positional_encoding_temperature": 10000,
 
 
 
 
 
 
 
250
  "torch_dtype": "float32",
251
  "transformers_version": "4.42.0.dev0",
252
  "use_focal_loss": true,