vladislavbro committed on
Commit
19a1669
·
verified ·
1 Parent(s): 2b1783d

Add config from convert_d_fine_original_pytorch_checkpoint_to_hf.py

Browse files
Files changed (1) hide show
  1. config.json +37 -6
config.json CHANGED
@@ -1,15 +1,22 @@
1
  {
 
2
  "activation_dropout": 0.0,
3
  "activation_function": "silu",
4
  "anchor_image_size": null,
5
- "architectures": [
6
- "DFineForObjectDetection"
7
- ],
8
  "attention_dropout": 0.0,
9
  "auxiliary_loss": true,
10
  "backbone": null,
11
  "backbone_config": {
 
 
 
 
 
 
 
 
12
  "embedding_size": 32,
 
13
  "hidden_sizes": [
14
  128,
15
  256,
@@ -17,7 +24,8 @@
17
  1024
18
  ],
19
  "layer_type": "basic",
20
- "model_type": "d_fine_resnet",
 
21
  "out_features": [
22
  "stage2",
23
  "stage3",
@@ -28,18 +36,43 @@
28
  3,
29
  4
30
  ],
 
 
 
 
 
 
31
  "stage_in_channels": [
32
  16,
33
  64,
34
  256,
35
  512
36
  ],
 
 
 
 
 
 
 
 
 
 
 
 
37
  "stage_mid_channels": [
38
  16,
39
  32,
40
  64,
41
  128
42
  ],
 
 
 
 
 
 
 
43
  "stage_num_blocks": [
44
  1,
45
  1,
@@ -86,7 +119,6 @@
86
  ],
87
  "decoder_offset_scale": 0.5,
88
  "depth_mult": 0.34,
89
- "disable_custom_kernels": true,
90
  "dropout": 0.0,
91
  "encode_proj_layers": [
92
  2
@@ -300,7 +332,6 @@
300
  "positional_encoding_temperature": 10000,
301
  "reg_scale": 4.0,
302
  "top_prob_values": 4,
303
- "torch_dtype": "float32",
304
  "transformers_version": "4.50.0.dev0",
305
  "use_focal_loss": true,
306
  "use_pretrained_backbone": false,
 
1
  {
2
+ "_attn_implementation_autoset": true,
3
  "activation_dropout": 0.0,
4
  "activation_function": "silu",
5
  "anchor_image_size": null,
 
 
 
6
  "attention_dropout": 0.0,
7
  "auxiliary_loss": true,
8
  "backbone": null,
9
  "backbone_config": {
10
+ "depths": [
11
+ 3,
12
+ 4,
13
+ 6,
14
+ 3
15
+ ],
16
+ "downsample_in_bottleneck": false,
17
+ "downsample_in_first_stage": false,
18
  "embedding_size": 32,
19
+ "hidden_act": "relu",
20
  "hidden_sizes": [
21
  128,
22
  256,
 
24
  1024
25
  ],
26
  "layer_type": "basic",
27
+ "model_type": "hgnet_v2",
28
+ "num_channels": 3,
29
  "out_features": [
30
  "stage2",
31
  "stage3",
 
36
  3,
37
  4
38
  ],
39
+ "stage_downsample": [
40
+ false,
41
+ true,
42
+ true,
43
+ true
44
+ ],
45
  "stage_in_channels": [
46
  16,
47
  64,
48
  256,
49
  512
50
  ],
51
+ "stage_kernel_size": [
52
+ 3,
53
+ 3,
54
+ 5,
55
+ 5
56
+ ],
57
+ "stage_light_block": [
58
+ false,
59
+ false,
60
+ true,
61
+ true
62
+ ],
63
  "stage_mid_channels": [
64
  16,
65
  32,
66
  64,
67
  128
68
  ],
69
+ "stage_names": [
70
+ "stem",
71
+ "stage1",
72
+ "stage2",
73
+ "stage3",
74
+ "stage4"
75
+ ],
76
  "stage_num_blocks": [
77
  1,
78
  1,
 
119
  ],
120
  "decoder_offset_scale": 0.5,
121
  "depth_mult": 0.34,
 
122
  "dropout": 0.0,
123
  "encode_proj_layers": [
124
  2
 
332
  "positional_encoding_temperature": 10000,
333
  "reg_scale": 4.0,
334
  "top_prob_values": 4,
 
335
  "transformers_version": "4.50.0.dev0",
336
  "use_focal_loss": true,
337
  "use_pretrained_backbone": false,