Brainkite committed on
Commit
b7189fc
·
verified ·
1 Parent(s): 2392b24

Upload tokenizer

Browse files
Files changed (2) hide show
  1. special_tokens_map.json +1 -7
  2. tokenizer_config.json +1 -1
special_tokens_map.json CHANGED
@@ -17,13 +17,7 @@
17
  "rstrip": false,
18
  "single_word": false
19
  },
20
- "eos_token": {
21
- "content": "<|im_end|>",
22
- "lstrip": false,
23
- "normalized": false,
24
- "rstrip": false,
25
- "single_word": false
26
- },
27
  "pad_token": {
28
  "content": "<|im_end|>",
29
  "lstrip": false,
 
17
  "rstrip": false,
18
  "single_word": false
19
  },
20
+ "eos_token": "<eos>",
 
 
 
 
 
 
21
  "pad_token": {
22
  "content": "<|im_end|>",
23
  "lstrip": false,
tokenizer_config.json CHANGED
@@ -216,7 +216,7 @@
216
  "bos_token": "<|im_start|>",
217
  "chat_template": "{{ bos_token }}{% if messages[0]['role'] == 'system' %}{{ raise_exception('System role not supported') }}{% endif %}{% for message in messages %}{{ '<start_of_turn>' + message['role'] + '\n' + message['content'] | trim + '<end_of_turn><eos>\n' }}{% endfor %}{% if add_generation_prompt %}{{'<start_of_turn>model\n'}}{% endif %}",
218
  "clean_up_tokenization_spaces": false,
219
- "eos_token": "<|im_end|>",
220
  "extra_special_tokens": {},
221
  "model_max_length": 8192,
222
  "pad_token": "<|im_end|>",
 
216
  "bos_token": "<|im_start|>",
217
  "chat_template": "{{ bos_token }}{% if messages[0]['role'] == 'system' %}{{ raise_exception('System role not supported') }}{% endif %}{% for message in messages %}{{ '<start_of_turn>' + message['role'] + '\n' + message['content'] | trim + '<end_of_turn><eos>\n' }}{% endfor %}{% if add_generation_prompt %}{{'<start_of_turn>model\n'}}{% endif %}",
218
  "clean_up_tokenization_spaces": false,
219
+ "eos_token": "<eos>",
220
  "extra_special_tokens": {},
221
  "model_max_length": 8192,
222
  "pad_token": "<|im_end|>",