danielhanchen committed on
Commit
c1447b2
·
verified ·
1 Parent(s): 23c8786

Add files using upload-large-folder tool

Browse files
Files changed (3) hide show
  1. config.json +36 -38
  2. generation_config.json +8 -3
  3. model.safetensors +2 -2
config.json CHANGED
@@ -25,68 +25,66 @@
25
  "multi_modal_projector",
26
  "merger",
27
  "modality_projection",
28
- "lm_head",
29
- "multi_modal_projector",
30
- "merger",
31
- "modality_projection",
32
- "vision_tower.vision_model.encoder.layers.23.self_attn",
33
  "language_model.model.layers.5.mlp",
 
 
 
34
  "vision_tower.vision_model.encoder.layers.26.self_attn",
35
- "language_model.model.layers.4.mlp",
36
- "language_model.model.layers.3.mlp",
37
- "vision_tower.vision_model.encoder.layers.18.self_attn",
38
  "vision_tower.vision_model.encoder.layers.19.self_attn",
39
  "vision_tower.vision_model.encoder.layers.21.self_attn",
40
- "language_model.model.layers.1.mlp",
41
- "vision_tower.vision_model.encoder.layers.17.mlp",
42
- "vision_tower.vision_model.encoder.layers.24.self_attn",
43
- "vision_tower.vision_model.encoder.layers.21.mlp",
44
- "vision_tower.vision_model.encoder.layers.19.mlp",
45
- "vision_tower.vision_model.encoder.layers.24.mlp",
46
- "vision_tower.vision_model.encoder.layers.20.self_attn",
47
- "vision_tower.vision_model.encoder.layers.22.self_attn",
48
- "vision_tower.vision_model.encoder.layers.20.mlp",
49
  "vision_tower.vision_model.encoder.layers.25.mlp",
50
- "language_model.model.layers.2.self_attn",
 
51
  "vision_tower.vision_model.encoder.layers.17.self_attn",
52
- "language_model.model.layers.0.mlp",
53
- "vision_tower.vision_model.encoder.layers.16.mlp",
54
  "vision_tower.vision_model.encoder.layers.23.mlp",
55
- "vision_tower.vision_model.encoder.layers.22.mlp",
56
- "vision_tower.vision_model.encoder.layers.13.mlp",
57
  "vision_tower.vision_model.encoder.layers.15.mlp",
 
58
  "vision_tower.vision_model.encoder.layers.18.mlp",
 
 
 
 
 
59
  "vision_tower.vision_model.encoder.layers.16.self_attn",
60
- "vision_tower.vision_model.encoder.layers.10.mlp",
61
- "vision_tower.vision_model.encoder.layers.7.mlp",
 
 
 
62
  "vision_tower.vision_model.encoder.layers.14.mlp",
63
  "vision_tower.vision_model.encoder.layers.14.self_attn",
64
- "vision_tower.vision_model.encoder.layers.9.mlp",
65
  "vision_tower.vision_model.encoder.layers.12.mlp",
66
- "vision_tower.vision_model.encoder.layers.15.self_attn",
 
 
 
67
  "vision_tower.vision_model.encoder.layers.5.mlp",
 
68
  "vision_tower.vision_model.encoder.layers.11.mlp",
69
- "vision_tower.vision_model.encoder.layers.10.self_attn",
70
  "vision_tower.vision_model.encoder.layers.8.mlp",
71
- "vision_tower.vision_model.encoder.layers.8.self_attn",
72
  "vision_tower.vision_model.encoder.layers.13.self_attn",
73
- "vision_tower.vision_model.encoder.layers.12.self_attn",
74
- "vision_tower.vision_model.encoder.layers.11.self_attn",
75
- "vision_tower.vision_model.encoder.layers.4.mlp",
76
  "vision_tower.vision_model.encoder.layers.4.self_attn",
 
77
  "vision_tower.vision_model.encoder.layers.6.mlp",
78
- "vision_tower.vision_model.encoder.layers.9.self_attn",
79
- "vision_tower.vision_model.encoder.layers.2.mlp",
80
- "vision_tower.vision_model.encoder.layers.7.self_attn",
81
  "vision_tower.vision_model.encoder.layers.1.mlp",
82
- "vision_tower.vision_model.encoder.layers.3.mlp",
 
 
83
  "vision_tower.vision_model.encoder.layers.1.self_attn",
84
- "vision_tower.vision_model.encoder.layers.5.self_attn",
85
  "vision_tower.vision_model.encoder.layers.6.self_attn",
 
 
86
  "vision_tower.vision_model.encoder.layers.3.self_attn",
87
  "vision_tower.vision_model.encoder.layers.0.self_attn",
88
- "vision_tower.vision_model.encoder.layers.2.self_attn",
89
  "vision_tower.vision_model.encoder.layers.0.mlp",
 
90
  "vision_tower.vision_model.encoder.layers.26.mlp"
91
  ],
92
  "llm_int8_threshold": 6.0,
@@ -125,7 +123,7 @@
125
  "vocab_size": 262208
126
  },
127
  "torch_dtype": "bfloat16",
128
- "transformers_version": "4.50.0.dev0",
129
  "unsloth_fixed": true,
130
  "vision_config": {
131
  "attention_dropout": 0.0,
 
25
  "multi_modal_projector",
26
  "merger",
27
  "modality_projection",
28
+ "language_model.model.layers.0.self_attn",
 
 
 
 
29
  "language_model.model.layers.5.mlp",
30
+ "language_model.model.layers.2.mlp",
31
+ "language_model.model.layers.4.self_attn",
32
+ "vision_tower.vision_model.encoder.layers.24.self_attn",
33
  "vision_tower.vision_model.encoder.layers.26.self_attn",
34
+ "vision_tower.vision_model.encoder.layers.23.self_attn",
35
+ "vision_tower.vision_model.encoder.layers.20.self_attn",
36
+ "vision_tower.vision_model.encoder.layers.25.self_attn",
37
  "vision_tower.vision_model.encoder.layers.19.self_attn",
38
  "vision_tower.vision_model.encoder.layers.21.self_attn",
 
 
 
 
 
 
 
 
 
39
  "vision_tower.vision_model.encoder.layers.25.mlp",
40
+ "vision_tower.vision_model.encoder.layers.22.self_attn",
41
+ "language_model.model.layers.3.mlp",
42
  "vision_tower.vision_model.encoder.layers.17.self_attn",
 
 
43
  "vision_tower.vision_model.encoder.layers.23.mlp",
 
 
44
  "vision_tower.vision_model.encoder.layers.15.mlp",
45
+ "vision_tower.vision_model.encoder.layers.22.mlp",
46
  "vision_tower.vision_model.encoder.layers.18.mlp",
47
+ "vision_tower.vision_model.encoder.layers.18.self_attn",
48
+ "vision_tower.vision_model.encoder.layers.21.mlp",
49
+ "vision_tower.vision_model.encoder.layers.17.mlp",
50
+ "vision_tower.vision_model.encoder.layers.15.self_attn",
51
+ "vision_tower.vision_model.encoder.layers.24.mlp",
52
  "vision_tower.vision_model.encoder.layers.16.self_attn",
53
+ "vision_tower.vision_model.encoder.layers.19.mlp",
54
+ "vision_tower.vision_model.encoder.layers.20.mlp",
55
+ "language_model.model.layers.0.mlp",
56
+ "language_model.model.layers.2.self_attn",
57
+ "vision_tower.vision_model.encoder.layers.16.mlp",
58
  "vision_tower.vision_model.encoder.layers.14.mlp",
59
  "vision_tower.vision_model.encoder.layers.14.self_attn",
 
60
  "vision_tower.vision_model.encoder.layers.12.mlp",
61
+ "vision_tower.vision_model.encoder.layers.13.mlp",
62
+ "vision_tower.vision_model.encoder.layers.10.mlp",
63
+ "vision_tower.vision_model.encoder.layers.11.self_attn",
64
+ "vision_tower.vision_model.encoder.layers.7.mlp",
65
  "vision_tower.vision_model.encoder.layers.5.mlp",
66
+ "vision_tower.vision_model.encoder.layers.9.mlp",
67
  "vision_tower.vision_model.encoder.layers.11.mlp",
 
68
  "vision_tower.vision_model.encoder.layers.8.mlp",
 
69
  "vision_tower.vision_model.encoder.layers.13.self_attn",
70
+ "vision_tower.vision_model.encoder.layers.9.self_attn",
71
+ "vision_tower.vision_model.encoder.layers.3.mlp",
72
+ "vision_tower.vision_model.encoder.layers.10.self_attn",
73
  "vision_tower.vision_model.encoder.layers.4.self_attn",
74
+ "vision_tower.vision_model.encoder.layers.4.mlp",
75
  "vision_tower.vision_model.encoder.layers.6.mlp",
 
 
 
76
  "vision_tower.vision_model.encoder.layers.1.mlp",
77
+ "vision_tower.vision_model.encoder.layers.8.self_attn",
78
+ "vision_tower.vision_model.encoder.layers.7.self_attn",
79
+ "vision_tower.vision_model.encoder.layers.12.self_attn",
80
  "vision_tower.vision_model.encoder.layers.1.self_attn",
 
81
  "vision_tower.vision_model.encoder.layers.6.self_attn",
82
+ "vision_tower.vision_model.encoder.layers.2.mlp",
83
+ "vision_tower.vision_model.encoder.layers.5.self_attn",
84
  "vision_tower.vision_model.encoder.layers.3.self_attn",
85
  "vision_tower.vision_model.encoder.layers.0.self_attn",
 
86
  "vision_tower.vision_model.encoder.layers.0.mlp",
87
+ "vision_tower.vision_model.encoder.layers.2.self_attn",
88
  "vision_tower.vision_model.encoder.layers.26.mlp"
89
  ],
90
  "llm_int8_threshold": 6.0,
 
123
  "vocab_size": 262208
124
  },
125
  "torch_dtype": "bfloat16",
126
+ "transformers_version": "4.51.0",
127
  "unsloth_fixed": true,
128
  "vision_config": {
129
  "attention_dropout": 0.0,
generation_config.json CHANGED
@@ -1,8 +1,13 @@
1
  {
2
- "_from_model_config": true,
3
  "bos_token_id": 2,
4
  "cache_implementation": "hybrid",
5
- "eos_token_id": 1,
 
 
 
 
6
  "pad_token_id": 0,
7
- "transformers_version": "4.50.0.dev0"
 
 
8
  }
 
1
  {
 
2
  "bos_token_id": 2,
3
  "cache_implementation": "hybrid",
4
+ "do_sample": true,
5
+ "eos_token_id": [
6
+ 1,
7
+ 106
8
+ ],
9
  "pad_token_id": 0,
10
+ "top_k": 64,
11
+ "top_p": 0.95,
12
+ "transformers_version": "4.51.0"
13
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b1d6b800fcac4ef0179121d62afd6fdc67b173aaebd36bf4a5cef970f3e44f31
3
- size 4437712953
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:372535c95c031316bee6050d3d4ed6f9a2f991ee391c7da4bd40b38ca13e90d0
3
+ size 4375543541