jupyterjazz committed on
Commit
e8ce774
·
verified ·
1 Parent(s): 9ad94d9

Update config.json

Browse files
Files changed (1) hide show
  1. config.json +55 -7
config.json CHANGED
@@ -35,26 +35,74 @@
35
  "single_vector_pool_strategy": "mean",
36
  "sliding_window": 32768,
37
  "tie_word_embeddings": true,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
38
  "torch_dtype": "bfloat16",
39
  "transformers_version": "4.52.0",
40
  "use_cache": true,
41
  "use_sliding_window": false,
42
  "video_token_id": 151656,
43
  "vision_config": {
 
 
 
 
 
 
 
 
44
  "hidden_size": 1280,
 
45
  "in_chans": 3,
 
 
46
  "model_type": "qwen2_5_vl",
 
47
  "out_hidden_size": 2048,
 
 
48
  "spatial_patch_size": 14,
 
49
  "tokens_per_second": 2,
50
- "torch_dtype": "bfloat16"
 
51
  },
52
- "vision_end_token_id": 151653,
53
- "vision_start_token_id": 151652,
54
- "vision_token_id": 151654,
55
- "vocab_size": 151936,
56
- "truncate_dim": null,
57
  "task_names": ["retrieval", "text-matching", "code"],
58
  "matryoshka_dims": [128, 256, 512, 1024, 2048],
59
- "_attn_implementation": "flash_attention_2"
 
 
 
 
60
  }
 
35
  "single_vector_pool_strategy": "mean",
36
  "sliding_window": 32768,
37
  "tie_word_embeddings": true,
38
+ "text_config": {
39
+ "attention_dropout": 0.0,
40
+ "bos_token_id": 151643,
41
+ "eos_token_id": 151645,
42
+ "hidden_act": "silu",
43
+ "hidden_size": 2048,
44
+ "image_token_id": null,
45
+ "initializer_range": 0.02,
46
+ "intermediate_size": 11008,
47
+ "max_position_embeddings": 128000,
48
+ "max_window_layers": 70,
49
+ "model_type": "qwen2_5_vl_text",
50
+ "num_attention_heads": 16,
51
+ "num_hidden_layers": 36,
52
+ "num_key_value_heads": 2,
53
+ "rms_norm_eps": 1e-06,
54
+ "rope_scaling": {
55
+ "mrope_section": [
56
+ 16,
57
+ 24,
58
+ 24
59
+ ],
60
+ "rope_type": "default",
61
+ "type": "default"
62
+ },
63
+ "rope_theta": 1000000.0,
64
+ "sliding_window": null,
65
+ "tie_word_embeddings": true,
66
+ "torch_dtype": "bfloat16",
67
+ "use_cache": true,
68
+ "use_sliding_window": false,
69
+ "vocab_size": 151936
70
+ },
71
  "torch_dtype": "bfloat16",
72
  "transformers_version": "4.52.0",
73
  "use_cache": true,
74
  "use_sliding_window": false,
75
  "video_token_id": 151656,
76
  "vision_config": {
77
+ "depth": 32,
78
+ "fullatt_block_indexes": [
79
+ 7,
80
+ 15,
81
+ 23,
82
+ 31
83
+ ],
84
+ "hidden_act": "silu",
85
  "hidden_size": 1280,
86
+ "in_channels": 3,
87
  "in_chans": 3,
88
+ "initializer_range": 0.02,
89
+ "intermediate_size": 3420,
90
  "model_type": "qwen2_5_vl",
91
+ "num_heads": 16,
92
  "out_hidden_size": 2048,
93
+ "patch_size": 14,
94
+ "spatial_merge_size": 2,
95
  "spatial_patch_size": 14,
96
+ "temporal_patch_size": 2,
97
  "tokens_per_second": 2,
98
+ "torch_dtype": "bfloat16",
99
+ "window_size": 112
100
  },
 
 
 
 
 
101
  "task_names": ["retrieval", "text-matching", "code"],
102
  "matryoshka_dims": [128, 256, 512, 1024, 2048],
103
+ "_attn_implementation": "flash_attention_2",
104
+ "truncate_dim": null,
105
+ "vision_end_token_id": 151653,
106
+ "vision_start_token_id": 151652,
107
+ "vision_token_id": 151654
108
  }