agentlans committed on
Commit
7fe444e
·
verified ·
1 Parent(s): 6b562fd

Upload 9 files

Browse files
Modelfile CHANGED
@@ -2,10 +2,10 @@
2
 
3
  FROM .
4
 
5
- TEMPLATE """{{ if .System }}System: {{ .System }}<|endoftext|>
6
- {{ end }}{{ range .Messages }}{{ if eq .Role "user" }}Human: {{ .Content }}<|endoftext|>
7
- Assistant:{{ else if eq .Role "assistant" }}{{ .Content }}<|endoftext|>
8
  {{ end }}{{ end }}"""
9
 
10
- PARAMETER stop "<|endoftext|>"
11
  PARAMETER num_ctx 4096
 
2
 
3
  FROM .
4
 
5
+ TEMPLATE """{{ if .System }}System: {{ .System }}<|im_end|>
6
+ {{ end }}{{ range .Messages }}{{ if eq .Role "user" }}Human: {{ .Content }}<|im_end|>
7
+ Assistant:{{ else if eq .Role "assistant" }}{{ .Content }}<|im_end|>
8
  {{ end }}{{ end }}"""
9
 
10
+ PARAMETER stop "<|im_end|>"
11
  PARAMETER num_ctx 4096
config.json CHANGED
@@ -4,8 +4,8 @@
4
  ],
5
  "attention_bias": false,
6
  "attention_dropout": 0.0,
7
- "bos_token_id": 0,
8
- "eos_token_id": 0,
9
  "head_dim": 64,
10
  "hidden_act": "silu",
11
  "hidden_size": 576,
@@ -18,6 +18,7 @@
18
  "num_attention_heads": 9,
19
  "num_hidden_layers": 30,
20
  "num_key_value_heads": 3,
 
21
  "pretraining_tp": 1,
22
  "rms_norm_eps": 1e-05,
23
  "rope_interleaved": false,
@@ -25,6 +26,12 @@
25
  "rope_theta": 100000,
26
  "tie_word_embeddings": true,
27
  "torch_dtype": "bfloat16",
 
 
 
 
 
 
28
  "transformers_version": "4.51.3",
29
  "use_cache": true,
30
  "vocab_size": 49152
 
4
  ],
5
  "attention_bias": false,
6
  "attention_dropout": 0.0,
7
+ "bos_token_id": 1,
8
+ "eos_token_id": 2,
9
  "head_dim": 64,
10
  "hidden_act": "silu",
11
  "hidden_size": 576,
 
18
  "num_attention_heads": 9,
19
  "num_hidden_layers": 30,
20
  "num_key_value_heads": 3,
21
+ "pad_token_id": 2,
22
  "pretraining_tp": 1,
23
  "rms_norm_eps": 1e-05,
24
  "rope_interleaved": false,
 
26
  "rope_theta": 100000,
27
  "tie_word_embeddings": true,
28
  "torch_dtype": "bfloat16",
29
+ "transformers.js_config": {
30
+ "kv_cache_dtype": {
31
+ "fp16": "float16",
32
+ "q4f16": "float16"
33
+ }
34
+ },
35
  "transformers_version": "4.51.3",
36
  "use_cache": true,
37
  "vocab_size": 49152
generation_config.json CHANGED
@@ -1,6 +1,7 @@
1
  {
2
  "_from_model_config": true,
3
- "bos_token_id": 0,
4
- "eos_token_id": 0,
 
5
  "transformers_version": "4.51.3"
6
  }
 
1
  {
2
  "_from_model_config": true,
3
+ "bos_token_id": 1,
4
+ "eos_token_id": 2,
5
+ "pad_token_id": 2,
6
  "transformers_version": "4.51.3"
7
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:468c0bec4d396622ff3e0afef872a0a045fab02ce31705156bf773958bd51577
3
  size 269060552
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:363388c189ca7554fdb0ed8c98db0a39c22dc74b6298907232a6637c8b3db586
3
  size 269060552
special_tokens_map.json CHANGED
@@ -1,38 +1,29 @@
1
  {
2
  "additional_special_tokens": [
3
- "<|endoftext|>",
4
  "<|im_start|>",
5
- "<|im_end|>",
6
- "<repo_name>",
7
- "<reponame>",
8
- "<file_sep>",
9
- "<filename>",
10
- "<gh_stars>",
11
- "<issue_start>",
12
- "<issue_comment>",
13
- "<issue_closed>",
14
- "<jupyter_start>",
15
- "<jupyter_text>",
16
- "<jupyter_code>",
17
- "<jupyter_output>",
18
- "<jupyter_script>",
19
- "<empty_output>"
20
  ],
21
  "bos_token": {
22
- "content": "<|endoftext|>",
23
  "lstrip": false,
24
  "normalized": false,
25
  "rstrip": false,
26
  "single_word": false
27
  },
28
  "eos_token": {
29
- "content": "<|endoftext|>",
 
 
 
 
 
 
 
30
  "lstrip": false,
31
  "normalized": false,
32
  "rstrip": false,
33
  "single_word": false
34
  },
35
- "pad_token": "<|endoftext|>",
36
  "unk_token": {
37
  "content": "<|endoftext|>",
38
  "lstrip": false,
 
1
  {
2
  "additional_special_tokens": [
 
3
  "<|im_start|>",
4
+ "<|im_end|>"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
5
  ],
6
  "bos_token": {
7
+ "content": "<|im_start|>",
8
  "lstrip": false,
9
  "normalized": false,
10
  "rstrip": false,
11
  "single_word": false
12
  },
13
  "eos_token": {
14
+ "content": "<|im_end|>",
15
+ "lstrip": false,
16
+ "normalized": false,
17
+ "rstrip": false,
18
+ "single_word": false
19
+ },
20
+ "pad_token": {
21
+ "content": "<|im_end|>",
22
  "lstrip": false,
23
  "normalized": false,
24
  "rstrip": false,
25
  "single_word": false
26
  },
 
27
  "unk_token": {
28
  "content": "<|endoftext|>",
29
  "lstrip": false,
tokenizer_config.json CHANGED
@@ -139,31 +139,16 @@
139
  }
140
  },
141
  "additional_special_tokens": [
142
- "<|endoftext|>",
143
  "<|im_start|>",
144
- "<|im_end|>",
145
- "<repo_name>",
146
- "<reponame>",
147
- "<file_sep>",
148
- "<filename>",
149
- "<gh_stars>",
150
- "<issue_start>",
151
- "<issue_comment>",
152
- "<issue_closed>",
153
- "<jupyter_start>",
154
- "<jupyter_text>",
155
- "<jupyter_code>",
156
- "<jupyter_output>",
157
- "<jupyter_script>",
158
- "<empty_output>"
159
  ],
160
- "bos_token": "<|endoftext|>",
161
- "chat_template": "{% if messages[0]['role'] == 'system' %}{% set loop_messages = messages[1:] %}{% set system_message = messages[0]['content'] %}{% else %}{% set loop_messages = messages %}{% endif %}{% if system_message is defined %}{{ 'System: ' + system_message + '<|endoftext|>' + '\n' }}{% endif %}{% for message in loop_messages %}{% set content = message['content'] %}{% if message['role'] == 'user' %}{{ 'Human: ' + content + '<|endoftext|>' + '\nAssistant:' }}{% elif message['role'] == 'assistant' %}{{ content + '<|endoftext|>' + '\n' }}{% endif %}{% endfor %}",
162
  "clean_up_tokenization_spaces": false,
163
- "eos_token": "<|endoftext|>",
164
  "extra_special_tokens": {},
165
- "model_max_length": 8192,
166
- "pad_token": "<|endoftext|>",
167
  "padding_side": "left",
168
  "split_special_tokens": false,
169
  "tokenizer_class": "GPT2Tokenizer",
 
139
  }
140
  },
141
  "additional_special_tokens": [
 
142
  "<|im_start|>",
143
+ "<|im_end|>"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
144
  ],
145
+ "bos_token": "<|im_start|>",
146
+ "chat_template": "{% if messages[0]['role'] == 'system' %}{% set loop_messages = messages[1:] %}{% set system_message = messages[0]['content'] %}{% else %}{% set loop_messages = messages %}{% endif %}{% if system_message is defined %}{{ 'System: ' + system_message + '<|im_end|>' + '\n' }}{% endif %}{% for message in loop_messages %}{% set content = message['content'] %}{% if message['role'] == 'user' %}{{ 'Human: ' + content + '<|im_end|>' + '\nAssistant:' }}{% elif message['role'] == 'assistant' %}{{ content + '<|im_end|>' + '\n' }}{% endif %}{% endfor %}",
147
  "clean_up_tokenization_spaces": false,
148
+ "eos_token": "<|im_end|>",
149
  "extra_special_tokens": {},
150
+ "model_max_length": 2048,
151
+ "pad_token": "<|im_end|>",
152
  "padding_side": "left",
153
  "split_special_tokens": false,
154
  "tokenizer_class": "GPT2Tokenizer",