Add config from convert_rt_detr_original_pytorch_checkpoint_to_pytorch.py
Browse files- config.json +13 -35
config.json
CHANGED
|
@@ -10,6 +10,19 @@
|
|
| 10 |
],
|
| 11 |
"attention_dropout": 0.0,
|
| 12 |
"auxiliary_loss": true,
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 13 |
"batch_norm_eps": 1e-05,
|
| 14 |
"box_noise_scale": 1.0,
|
| 15 |
"d_model": 256,
|
|
@@ -23,17 +36,8 @@
|
|
| 23 |
],
|
| 24 |
"decoder_layers": 6,
|
| 25 |
"decoder_n_points": 4,
|
| 26 |
-
"depths": [
|
| 27 |
-
3,
|
| 28 |
-
4,
|
| 29 |
-
6,
|
| 30 |
-
3
|
| 31 |
-
],
|
| 32 |
"disable_custom_kernels": true,
|
| 33 |
-
"downsample_in_bottleneck": false,
|
| 34 |
-
"downsample_in_first_stage": false,
|
| 35 |
"dropout": 0.0,
|
| 36 |
-
"embedding_size": 64,
|
| 37 |
"encode_proj_layers": [
|
| 38 |
2
|
| 39 |
],
|
|
@@ -56,14 +60,7 @@
|
|
| 56 |
],
|
| 57 |
"focal_loss_alpha": 0.75,
|
| 58 |
"focal_loss_gamma": 2.0,
|
| 59 |
-
"hidden_act": "relu",
|
| 60 |
"hidden_expansion": 1.0,
|
| 61 |
-
"hidden_sizes": [
|
| 62 |
-
256,
|
| 63 |
-
512,
|
| 64 |
-
1024,
|
| 65 |
-
2048
|
| 66 |
-
],
|
| 67 |
"id2label": {
|
| 68 |
"0": "person",
|
| 69 |
"1": "bicycle",
|
|
@@ -232,7 +229,6 @@
|
|
| 232 |
},
|
| 233 |
"label_noise_ratio": 0.5,
|
| 234 |
"layer_norm_eps": 1e-05,
|
| 235 |
-
"layer_type": "bottleneck",
|
| 236 |
"learn_initial_query": false,
|
| 237 |
"matcher_alpha": 0.25,
|
| 238 |
"matcher_bbox_cost": 5.0,
|
|
@@ -241,28 +237,10 @@
|
|
| 241 |
"matcher_giou_cost": 2.0,
|
| 242 |
"model_type": "rt_detr",
|
| 243 |
"normalize_before": false,
|
| 244 |
-
"num_channels": 3,
|
| 245 |
"num_denoising": 100,
|
| 246 |
"num_feature_levels": 3,
|
| 247 |
"num_queries": 300,
|
| 248 |
-
"out_features": [
|
| 249 |
-
"stage2",
|
| 250 |
-
"stage3",
|
| 251 |
-
"stage4"
|
| 252 |
-
],
|
| 253 |
-
"out_indices": [
|
| 254 |
-
2,
|
| 255 |
-
3,
|
| 256 |
-
4
|
| 257 |
-
],
|
| 258 |
"positional_encoding_temperature": 10000,
|
| 259 |
-
"stage_names": [
|
| 260 |
-
"stem",
|
| 261 |
-
"stage1",
|
| 262 |
-
"stage2",
|
| 263 |
-
"stage3",
|
| 264 |
-
"stage4"
|
| 265 |
-
],
|
| 266 |
"torch_dtype": "float32",
|
| 267 |
"transformers_version": "4.42.0.dev0",
|
| 268 |
"use_focal_loss": true,
|
|
|
|
| 10 |
],
|
| 11 |
"attention_dropout": 0.0,
|
| 12 |
"auxiliary_loss": true,
|
| 13 |
+
"backbone_config": {
|
| 14 |
+
"model_type": "rtdetr-resnet",
|
| 15 |
+
"out_features": [
|
| 16 |
+
"stage2",
|
| 17 |
+
"stage3",
|
| 18 |
+
"stage4"
|
| 19 |
+
],
|
| 20 |
+
"out_indices": [
|
| 21 |
+
2,
|
| 22 |
+
3,
|
| 23 |
+
4
|
| 24 |
+
]
|
| 25 |
+
},
|
| 26 |
"batch_norm_eps": 1e-05,
|
| 27 |
"box_noise_scale": 1.0,
|
| 28 |
"d_model": 256,
|
|
|
|
| 36 |
],
|
| 37 |
"decoder_layers": 6,
|
| 38 |
"decoder_n_points": 4,
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 39 |
"disable_custom_kernels": true,
|
|
|
|
|
|
|
| 40 |
"dropout": 0.0,
|
|
|
|
| 41 |
"encode_proj_layers": [
|
| 42 |
2
|
| 43 |
],
|
|
|
|
| 60 |
],
|
| 61 |
"focal_loss_alpha": 0.75,
|
| 62 |
"focal_loss_gamma": 2.0,
|
|
|
|
| 63 |
"hidden_expansion": 1.0,
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 64 |
"id2label": {
|
| 65 |
"0": "person",
|
| 66 |
"1": "bicycle",
|
|
|
|
| 229 |
},
|
| 230 |
"label_noise_ratio": 0.5,
|
| 231 |
"layer_norm_eps": 1e-05,
|
|
|
|
| 232 |
"learn_initial_query": false,
|
| 233 |
"matcher_alpha": 0.25,
|
| 234 |
"matcher_bbox_cost": 5.0,
|
|
|
|
| 237 |
"matcher_giou_cost": 2.0,
|
| 238 |
"model_type": "rt_detr",
|
| 239 |
"normalize_before": false,
|
|
|
|
| 240 |
"num_denoising": 100,
|
| 241 |
"num_feature_levels": 3,
|
| 242 |
"num_queries": 300,
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 243 |
"positional_encoding_temperature": 10000,
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 244 |
"torch_dtype": "float32",
|
| 245 |
"transformers_version": "4.42.0.dev0",
|
| 246 |
"use_focal_loss": true,
|