yonigozlan HF Staff committed on
Commit
3fc1c9e
·
verified ·
1 Parent(s): beece34

Upload model

Browse files
Files changed (2) hide show
  1. config.json +1 -7
  2. model.safetensors +2 -2
config.json CHANGED
@@ -2,7 +2,6 @@
2
  "architectures": [
3
  "Sam2VideoModel"
4
  ],
5
- "binarize_mask_from_pts_for_mem_enc": true,
6
  "enable_occlusion_spatial_embedding": true,
7
  "enable_temporal_pos_encoding_for_object_pointers": true,
8
  "fill_hole_area": 8,
@@ -30,9 +29,6 @@
30
  "mask_downsampler_stride": 2,
31
  "mask_downsampler_total_stride": 16,
32
  "max_object_pointers_in_encoder": 16,
33
- "memory_attention_apply_pe_at_cross_attn_keys": true,
34
- "memory_attention_apply_pe_at_cross_attn_queries": false,
35
- "memory_attention_apply_pe_at_self_attn": false,
36
  "memory_attention_downsample_rate": 1,
37
  "memory_attention_dropout": 0.1,
38
  "memory_attention_feed_forward_hidden_act": "relu",
@@ -55,7 +51,6 @@
55
  "memory_fuser_layer_scale_init_value": 1e-06,
56
  "memory_fuser_num_layers": 2,
57
  "memory_fuser_padding": 3,
58
- "memory_fuser_use_depthwise_conv": true,
59
  "model_type": "sam2",
60
  "multimask_max_pt_num": 1,
61
  "multimask_min_pt_num": 0,
@@ -64,7 +59,6 @@
64
  "non_overlap_masks": false,
65
  "non_overlap_masks_for_mem_enc": false,
66
  "num_maskmem": 7,
67
- "preserve_temporal_direction_in_object_pointers": true,
68
  "project_temporal_pos_encoding_in_object_pointers": true,
69
  "prompt_encoder_config": {
70
  "hidden_act": "gelu",
@@ -80,7 +74,7 @@
80
  "sigmoid_bias_for_mem_enc": -10.0,
81
  "sigmoid_scale_for_mem_enc": 20.0,
82
  "torch_dtype": "float32",
83
- "transformers_version": "4.55.0.dev0",
84
  "vision_config": {
85
  "backbone_channel_list": [
86
  768,
 
2
  "architectures": [
3
  "Sam2VideoModel"
4
  ],
 
5
  "enable_occlusion_spatial_embedding": true,
6
  "enable_temporal_pos_encoding_for_object_pointers": true,
7
  "fill_hole_area": 8,
 
29
  "mask_downsampler_stride": 2,
30
  "mask_downsampler_total_stride": 16,
31
  "max_object_pointers_in_encoder": 16,
 
 
 
32
  "memory_attention_downsample_rate": 1,
33
  "memory_attention_dropout": 0.1,
34
  "memory_attention_feed_forward_hidden_act": "relu",
 
51
  "memory_fuser_layer_scale_init_value": 1e-06,
52
  "memory_fuser_num_layers": 2,
53
  "memory_fuser_padding": 3,
 
54
  "model_type": "sam2",
55
  "multimask_max_pt_num": 1,
56
  "multimask_min_pt_num": 0,
 
59
  "non_overlap_masks": false,
60
  "non_overlap_masks_for_mem_enc": false,
61
  "num_maskmem": 7,
 
62
  "project_temporal_pos_encoding_in_object_pointers": true,
63
  "prompt_encoder_config": {
64
  "hidden_act": "gelu",
 
74
  "sigmoid_bias_for_mem_enc": -10.0,
75
  "sigmoid_scale_for_mem_enc": 20.0,
76
  "torch_dtype": "float32",
77
+ "transformers_version": "4.56.0.dev0",
78
  "vision_config": {
79
  "backbone_channel_list": [
80
  768,
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9c53ac6147ba7add4d91c213ee5b607331fd1cac5c4982f5cc28d3fe5caa57e1
3
- size 155908440
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8f64d3461b06b668002929bc378e57f1058fdca616c8e3d300f7e738f3456e42
3
+ size 155908128