dit-maskrcnn / config.json
nielsr's picture
nielsr HF staff
Upload MaskRCNNForObjectDetection
135856e
{
"_commit_hash": null,
"anchor_generator_ratios": [
0.5,
1.0,
2.0
],
"anchor_generator_scales": [
8
],
"anchor_generator_strides": [
4,
8,
16,
32,
64
],
"architectures": [
"MaskRCNNForObjectDetection"
],
"backbone_config": {
"add_fpn": true,
"attention_probs_dropout_prob": 0.0,
"auxiliary_channels": 256,
"auxiliary_concat_input": false,
"auxiliary_loss_weight": 0.4,
"auxiliary_num_convs": 1,
"drop_path_rate": 0.1,
"hidden_dropout_prob": 0.0,
"hidden_size": 768,
"intermediate_size": 3072,
"layer_scale_init_value": 0.1,
"model_type": "beit",
"num_attention_heads": 12,
"num_hidden_layers": 12,
"out_features": [
"stage4",
"stage6",
"stage8",
"stage12"
],
"out_indices": [
4,
6,
8,
12
],
"patch_size": 16,
"pool_scales": [
1,
2,
3,
6
],
"reshape_hidden_states": true,
"semantic_loss_ignore_index": 255,
"stage_names": [
"stem",
"stage1",
"stage2",
"stage3",
"stage4",
"stage5",
"stage6",
"stage7",
"stage8",
"stage9",
"stage10",
"stage11",
"stage12"
],
"use_absolute_position_embeddings": true,
"use_auxiliary_head": true,
"use_mask_token": false,
"use_mean_pooling": true,
"use_relative_position_bias": false,
"use_shared_relative_position_bias": false,
"vocab_size": 8192
},
"bbox_head_bbox_coder_target_means": [
0.0,
0.0,
0.0,
0.0
],
"bbox_head_bbox_coder_target_stds": [
0.1,
0.1,
0.2,
0.2
],
"bbox_head_fc_out_channels": 1024,
"bbox_head_in_channels": 256,
"bbox_head_num_shared_fcs": 2,
"bbox_head_reg_class_agnostic": false,
"bbox_head_reg_decoded_bbox": false,
"bbox_head_roi_feat_size": 7,
"bbox_roi_extractor_featmap_strides": [
4,
8,
16,
32
],
"bbox_roi_extractor_out_channels": 256,
"bbox_roi_extractor_roi_layer": {
"output_size": 7,
"sampling_ratio": 0,
"type": "RoIAlign"
},
"fpn_num_outputs": 5,
"fpn_out_channels": 256,
"id2label": {
"0": "LABEL_0",
"1": "LABEL_1",
"2": "LABEL_2",
"3": "LABEL_3",
"4": "LABEL_4"
},
"initializer_range": 0.02,
"label2id": {
"LABEL_0": 0,
"LABEL_1": 1,
"LABEL_2": 2,
"LABEL_3": 3,
"LABEL_4": 4
},
"mask_head_conv_out_channels": 256,
"mask_head_in_channels": 256,
"mask_head_num_convs": 4,
"mask_roi_extractor_featmap_strides": [
4,
8,
16,
32
],
"mask_roi_extractor_out_channels": 256,
"mask_roi_extractor_roi_layer": {
"output_size": 14,
"sampling_ratio": 0,
"type": "RoIAlign"
},
"model_type": "maskrcnn",
"rcnn_assigner_ignore_iof_thr": -1,
"rcnn_assigner_match_low_quality": true,
"rcnn_assigner_min_pos_iou": 0.5,
"rcnn_assigner_neg_iou_thr": 0.5,
"rcnn_assigner_pos_iou_thr": 0.5,
"rcnn_sampler_add_gt_as_proposals": true,
"rcnn_sampler_num": 512,
"rcnn_sampler_num_samples_upper_bound": -1,
"rcnn_sampler_pos_fraction": 0.25,
"rcnn_test_cfg": {
"mask_thr_binary": 0.5,
"max_per_img": 100,
"nms": {
"iou_threshold": 0.5,
"type": "nms"
},
"score_thr": 0.05
},
"rcnn_train_cfg": {
"debug": false,
"mask_size": 28,
"pos_weight": -1
},
"rpn_assigner_ignore_iof_thr": -1,
"rpn_assigner_match_low_quality": true,
"rpn_assigner_min_pos_iou": 0.3,
"rpn_assigner_neg_iou_thr": 0.3,
"rpn_assigner_pos_iou_thr": 0.7,
"rpn_bbox_coder_target_means": [
0.0,
0.0,
0.0,
0.0
],
"rpn_bbox_coder_target_stds": [
1.0,
1.0,
1.0,
1.0
],
"rpn_feat_channels": 256,
"rpn_in_channels": 256,
"rpn_loss_bbox": {
"loss_weight": 1.0,
"type": "L1Loss"
},
"rpn_loss_cls": {
"loss_weight": 1.0,
"type": "CrossEntropyLoss",
"use_sigmoid": true
},
"rpn_proposal": {
"max_per_img": 1000,
"min_bbox_size": 0,
"nms": {
"iou_threshold": 0.7,
"type": "nms"
},
"nms_pre": 2000
},
"rpn_sampler_add_gt_as_proposals": false,
"rpn_sampler_num": 256,
"rpn_sampler_num_samples_upper_bound": -1,
"rpn_sampler_pos_fraction": 0.5,
"rpn_test_cfg": {
"max_per_img": 1000,
"min_bbox_size": 0,
"nms": {
"iou_threshold": 0.7,
"type": "nms"
},
"nms_pre": 1000
},
"rpn_train_cfg": {
"allowed_border": -1,
"debug": false,
"pos_weight": -1
},
"torch_dtype": "float32",
"transformers_version": null
}