vladislavbro committed on
Commit
0e166cc
·
verified ·
1 Parent(s): 5446de0

Add config from convert_d_fine_original_pytorch_checkpoint_to_hf.py

Browse files
Files changed (1) hide show
  1. config.json +32 -38
config.json CHANGED
@@ -1,10 +1,8 @@
1
  {
 
2
  "activation_dropout": 0.0,
3
  "activation_function": "silu",
4
  "anchor_image_size": null,
5
- "architectures": [
6
- "DFineForObjectDetection"
7
- ],
8
  "attention_dropout": 0.0,
9
  "auxiliary_loss": true,
10
  "backbone": null,
@@ -30,51 +28,52 @@
30
  ],
31
  "stage_config": [
32
  [
 
 
33
  64,
34
- 64,
35
- 128,
36
  1,
37
  false,
38
  false,
39
  3,
40
- 6
41
  ],
42
  [
43
- 128,
44
- 128,
45
- 512,
46
- 2,
47
  true,
48
  false,
49
  3,
50
- 6
51
  ],
52
  [
53
- 512,
54
  256,
55
- 1024,
56
- 5,
 
57
  true,
58
  true,
59
  5,
60
- 6
61
  ],
62
  [
63
- 1024,
64
  512,
65
- 2048,
66
- 2,
 
67
  true,
68
  true,
69
  5,
70
- 6
71
  ]
72
  ],
73
  "stem_channels": [
74
  3,
75
- 32,
76
- 64
77
- ]
 
78
  },
79
  "backbone_kwargs": null,
80
  "batch_norm_eps": 1e-05,
@@ -84,19 +83,15 @@
84
  "decoder_attention_heads": 8,
85
  "decoder_ffn_dim": 1024,
86
  "decoder_in_channels": [
87
- 384,
88
- 384,
89
- 384
90
  ],
91
- "decoder_layers": 6,
92
  "decoder_method": "default",
93
- "decoder_n_points": [
94
- 3,
95
- 6,
96
- 3
97
- ],
98
  "decoder_offset_scale": 0.5,
99
- "depth_mult": 1.0,
100
  "disable_custom_kernels": true,
101
  "dropout": 0.0,
102
  "encode_proj_layers": [
@@ -104,12 +99,12 @@
104
  ],
105
  "encoder_activation_function": "gelu",
106
  "encoder_attention_heads": 8,
107
- "encoder_ffn_dim": 2048,
108
- "encoder_hidden_dim": 384,
109
  "encoder_in_channels": [
 
110
  512,
111
- 1024,
112
- 2048
113
  ],
114
  "encoder_layers": 1,
115
  "eos_coefficient": 0.0001,
@@ -123,7 +118,7 @@
123
  "focal_loss_alpha": 0.75,
124
  "focal_loss_gamma": 2.0,
125
  "freeze_backbone_batch_norms": true,
126
- "hidden_expansion": 1.0,
127
  "id2label": {
128
  "0": "person",
129
  "1": "bicycle",
@@ -311,7 +306,6 @@
311
  "reg_max": 32,
312
  "reg_scale": 4.0,
313
  "top_prob_values": 4,
314
- "torch_dtype": "float32",
315
  "transformers_version": "4.49.0.dev0",
316
  "use_focal_loss": true,
317
  "use_pretrained_backbone": false,
 
1
  {
2
+ "_attn_implementation_autoset": true,
3
  "activation_dropout": 0.0,
4
  "activation_function": "silu",
5
  "anchor_image_size": null,
 
 
 
6
  "attention_dropout": 0.0,
7
  "auxiliary_loss": true,
8
  "backbone": null,
 
28
  ],
29
  "stage_config": [
30
  [
31
+ 16,
32
+ 16,
33
  64,
 
 
34
  1,
35
  false,
36
  false,
37
  3,
38
+ 3
39
  ],
40
  [
41
+ 64,
42
+ 32,
43
+ 256,
44
+ 1,
45
  true,
46
  false,
47
  3,
48
+ 3
49
  ],
50
  [
 
51
  256,
52
+ 64,
53
+ 512,
54
+ 2,
55
  true,
56
  true,
57
  5,
58
+ 3
59
  ],
60
  [
 
61
  512,
62
+ 128,
63
+ 1024,
64
+ 1,
65
  true,
66
  true,
67
  5,
68
+ 3
69
  ]
70
  ],
71
  "stem_channels": [
72
  3,
73
+ 16,
74
+ 16
75
+ ],
76
+ "use_lab": true
77
  },
78
  "backbone_kwargs": null,
79
  "batch_norm_eps": 1e-05,
 
83
  "decoder_attention_heads": 8,
84
  "decoder_ffn_dim": 1024,
85
  "decoder_in_channels": [
86
+ 256,
87
+ 256,
88
+ 256
89
  ],
90
+ "decoder_layers": 3,
91
  "decoder_method": "default",
92
+ "decoder_n_points": 4,
 
 
 
 
93
  "decoder_offset_scale": 0.5,
94
+ "depth_mult": 0.34,
95
  "disable_custom_kernels": true,
96
  "dropout": 0.0,
97
  "encode_proj_layers": [
 
99
  ],
100
  "encoder_activation_function": "gelu",
101
  "encoder_attention_heads": 8,
102
+ "encoder_ffn_dim": 1024,
103
+ "encoder_hidden_dim": 256,
104
  "encoder_in_channels": [
105
+ 256,
106
  512,
107
+ 1024
 
108
  ],
109
  "encoder_layers": 1,
110
  "eos_coefficient": 0.0001,
 
118
  "focal_loss_alpha": 0.75,
119
  "focal_loss_gamma": 2.0,
120
  "freeze_backbone_batch_norms": true,
121
+ "hidden_expansion": 0.5,
122
  "id2label": {
123
  "0": "person",
124
  "1": "bicycle",
 
306
  "reg_max": 32,
307
  "reg_scale": 4.0,
308
  "top_prob_values": 4,
 
309
  "transformers_version": "4.49.0.dev0",
310
  "use_focal_loss": true,
311
  "use_pretrained_backbone": false,