Training in progress, step 100
Browse files
- added_tokens.json +5 -0
- config.json +16 -1
- model-00001-of-00004.safetensors +1 -1
- model-00002-of-00004.safetensors +1 -1
- model-00003-of-00004.safetensors +1 -1
- model-00004-of-00004.safetensors +2 -2
- model.safetensors.index.json +10 -2
- tokenizer.json +2 -2
- tokenizer_config.json +40 -0
- training_args.bin +2 -2
added_tokens.json
CHANGED
@@ -1,4 +1,9 @@
|
|
1 |
{
|
|
|
|
|
|
|
|
|
|
|
2 |
"<|box_end|>": 151649,
|
3 |
"<|box_start|>": 151648,
|
4 |
"<|endoftext|>": 151643,
|
|
|
1 |
{
|
2 |
+
"<|LABEL_1|>": 151657,
|
3 |
+
"<|LABEL_2|>": 151658,
|
4 |
+
"<|LABEL_3|>": 151659,
|
5 |
+
"<|LABEL_4|>": 151660,
|
6 |
+
"<|LABEL_5|>": 151661,
|
7 |
"<|box_end|>": 151649,
|
8 |
"<|box_start|>": 151648,
|
9 |
"<|endoftext|>": 151643,
|
config.json
CHANGED
@@ -25,6 +25,20 @@
|
|
25 |
"LABEL_3": 3,
|
26 |
"LABEL_4": 4
|
27 |
},
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
28 |
"max_position_embeddings": 32768,
|
29 |
"max_window_layers": 28,
|
30 |
"model_type": "qwen2_vl",
|
@@ -43,10 +57,11 @@
|
|
43 |
"type": "default"
|
44 |
},
|
45 |
"rope_theta": 1000000.0,
|
|
|
46 |
"sliding_window": 32768,
|
47 |
"tie_word_embeddings": false,
|
48 |
"torch_dtype": "bfloat16",
|
49 |
-
"transformers_version": "4.
|
50 |
"use_cache": true,
|
51 |
"use_sliding_window": false,
|
52 |
"video_token_id": 151656,
|
|
|
25 |
"LABEL_3": 3,
|
26 |
"LABEL_4": 4
|
27 |
},
|
28 |
+
"label_special_token_ids": [
|
29 |
+
151657,
|
30 |
+
151658,
|
31 |
+
151659,
|
32 |
+
151660,
|
33 |
+
151661
|
34 |
+
],
|
35 |
+
"label_special_tokens": [
|
36 |
+
"<|LABEL_1|>",
|
37 |
+
"<|LABEL_2|>",
|
38 |
+
"<|LABEL_3|>",
|
39 |
+
"<|LABEL_4|>",
|
40 |
+
"<|LABEL_5|>"
|
41 |
+
],
|
42 |
"max_position_embeddings": 32768,
|
43 |
"max_window_layers": 28,
|
44 |
"model_type": "qwen2_vl",
|
|
|
57 |
"type": "default"
|
58 |
},
|
59 |
"rope_theta": 1000000.0,
|
60 |
+
"score_type": "special_token",
|
61 |
"sliding_window": 32768,
|
62 |
"tie_word_embeddings": false,
|
63 |
"torch_dtype": "bfloat16",
|
64 |
+
"transformers_version": "4.46.3",
|
65 |
"use_cache": true,
|
66 |
"use_sliding_window": false,
|
67 |
"video_token_id": 151656,
|
model-00001-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4966659944
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dc0769a4a37d7ab5d40b3c9a9e5c3d08298fd5083d1b0e3218730c5f611279ed
|
3 |
size 4966659944
|
model-00002-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4991495816
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0d60031ed2bee47b16f24ca7e6c60c182245b6515402ad9f88d3542a7fca7440
|
3 |
size 4991495816
|
model-00003-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4932751040
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:42f76df844ddd4cdd76bfb599cdc78cacbce5ca7c97643d065f4f28e51c56658
|
3 |
size 4932751040
|
model-00004-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3feeb3af5c2a69d4c78de66a374e65e6ad6da0b070241a35234f9daf1ce5f847
|
3 |
+
size 601966186
|
model.safetensors.index.json
CHANGED
@@ -341,8 +341,16 @@
|
|
341 |
"model.layers.9.self_attn.v_proj.bias": "model-00002-of-00004.safetensors",
|
342 |
"model.layers.9.self_attn.v_proj.weight": "model-00002-of-00004.safetensors",
|
343 |
"model.norm.weight": "model-00004-of-00004.safetensors",
|
344 |
-
"score.bias": "model-00004-of-00004.safetensors",
|
345 |
-
"score.weight": "model-00004-of-00004.safetensors",
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
346 |
"visual.blocks.0.attn.proj.bias": "model-00001-of-00004.safetensors",
|
347 |
"visual.blocks.0.attn.proj.weight": "model-00001-of-00004.safetensors",
|
348 |
"visual.blocks.0.attn.qkv.bias": "model-00001-of-00004.safetensors",
|
|
|
341 |
"model.layers.9.self_attn.v_proj.bias": "model-00002-of-00004.safetensors",
|
342 |
"model.layers.9.self_attn.v_proj.weight": "model-00002-of-00004.safetensors",
|
343 |
"model.norm.weight": "model-00004-of-00004.safetensors",
|
344 |
+
"score.0.bias": "model-00004-of-00004.safetensors",
|
345 |
+
"score.0.weight": "model-00004-of-00004.safetensors",
|
346 |
+
"score.1.bias": "model-00004-of-00004.safetensors",
|
347 |
+
"score.1.weight": "model-00004-of-00004.safetensors",
|
348 |
+
"score.2.bias": "model-00004-of-00004.safetensors",
|
349 |
+
"score.2.weight": "model-00004-of-00004.safetensors",
|
350 |
+
"score.3.bias": "model-00004-of-00004.safetensors",
|
351 |
+
"score.3.weight": "model-00004-of-00004.safetensors",
|
352 |
+
"score.4.bias": "model-00004-of-00004.safetensors",
|
353 |
+
"score.4.weight": "model-00004-of-00004.safetensors",
|
354 |
"visual.blocks.0.attn.proj.bias": "model-00001-of-00004.safetensors",
|
355 |
"visual.blocks.0.attn.proj.weight": "model-00001-of-00004.safetensors",
|
356 |
"visual.blocks.0.attn.qkv.bias": "model-00001-of-00004.safetensors",
|
tokenizer.json
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a918878bef3fafc48485ab78a4bb841a16d5c822bf3262a1e7ef10ad328584bd
|
3 |
+
size 11421311
|
tokenizer_config.json
CHANGED
@@ -112,6 +112,46 @@
|
|
112 |
"rstrip": false,
|
113 |
"single_word": false,
|
114 |
"special": true
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
115 |
}
|
116 |
},
|
117 |
"additional_special_tokens": [
|
|
|
112 |
"rstrip": false,
|
113 |
"single_word": false,
|
114 |
"special": true
|
115 |
+
},
|
116 |
+
"151657": {
|
117 |
+
"content": "<|LABEL_1|>",
|
118 |
+
"lstrip": false,
|
119 |
+
"normalized": false,
|
120 |
+
"rstrip": false,
|
121 |
+
"single_word": false,
|
122 |
+
"special": true
|
123 |
+
},
|
124 |
+
"151658": {
|
125 |
+
"content": "<|LABEL_2|>",
|
126 |
+
"lstrip": false,
|
127 |
+
"normalized": false,
|
128 |
+
"rstrip": false,
|
129 |
+
"single_word": false,
|
130 |
+
"special": true
|
131 |
+
},
|
132 |
+
"151659": {
|
133 |
+
"content": "<|LABEL_3|>",
|
134 |
+
"lstrip": false,
|
135 |
+
"normalized": false,
|
136 |
+
"rstrip": false,
|
137 |
+
"single_word": false,
|
138 |
+
"special": true
|
139 |
+
},
|
140 |
+
"151660": {
|
141 |
+
"content": "<|LABEL_4|>",
|
142 |
+
"lstrip": false,
|
143 |
+
"normalized": false,
|
144 |
+
"rstrip": false,
|
145 |
+
"single_word": false,
|
146 |
+
"special": true
|
147 |
+
},
|
148 |
+
"151661": {
|
149 |
+
"content": "<|LABEL_5|>",
|
150 |
+
"lstrip": false,
|
151 |
+
"normalized": false,
|
152 |
+
"rstrip": false,
|
153 |
+
"single_word": false,
|
154 |
+
"special": true
|
155 |
}
|
156 |
},
|
157 |
"additional_special_tokens": [
|
training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7f4feda9548971998b3fcb2b2b54bdcde67bbfe73f167a0e752b281de7301622
|
3 |
+
size 6712
|