khaimaitien committed
Commit 7230752
1 parent: 38fa1ab

Upload folder using huggingface_hub
added_tokens.json CHANGED
@@ -2,7 +2,7 @@
   "</s>": 2,
   "<s>": 1,
   "<unk>": 0,
- "<|bof|>": 32000,
+ "<|bof|>": 32002,
   "<|eof|>": 32001,
- "<|eot|>": 32002
+ "<|eot|>": 32000
  }
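The hunk above swaps the IDs of <|bof|> and <|eot|> while <|eof|> keeps 32001. A minimal sketch to sanity-check the shipped added_tokens.json directly, assuming a local checkout of this repository (the "./checkout" path below is illustrative, not part of the commit):

import json
from pathlib import Path

# Hypothetical local checkout of this repo; adjust the path to wherever the files live.
repo_dir = Path("./checkout")

with open(repo_dir / "added_tokens.json") as f:
    added = json.load(f)

# After this commit, <|eot|> and <|bof|> have swapped IDs.
assert added["<|eot|>"] == 32000
assert added["<|eof|>"] == 32001
assert added["<|bof|>"] == 32002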
config.json CHANGED
@@ -1,5 +1,5 @@
  {
- "_name_or_path": "mistralai/Mistral-7B-v0.1",
+ "_name_or_path": "/workspace/Mistral-7B-v0.1",
   "architectures": [
   "MistralForCausalLM"
   ],
@@ -14,7 +14,6 @@
   "num_attention_heads": 32,
   "num_hidden_layers": 32,
   "num_key_value_heads": 8,
- "pad_token_id": 2,
   "rms_norm_eps": 1e-05,
   "rope_theta": 10000.0,
   "sliding_window": 4096,
pytorch_model-00001-of-00002.bin CHANGED
@@ -1,3 +1,3 @@
  version https://git-lfs.github.com/spec/v1
- oid sha256:f23e8d1e200efb195517a3ef9cb3efea3f8276ead85a82a860abd792c60e1096
+ oid sha256:552ad84e3a3ec166a1ab4ab5166276ed4ba95b9c9592e5ff46c85ef7a68a0b3c
  size 9943055436
pytorch_model-00002-of-00002.bin CHANGED
@@ -1,3 +1,3 @@
  version https://git-lfs.github.com/spec/v1
- oid sha256:7d63a15594b099674cacfcbab53949209bbe973220568c9eaa5dd842e782e94a
+ oid sha256:2fe74e959b70e2732c2ed276630de2e091473ace6c47f80311e1fdd6fbb1f54a
  size 4540561439
special_tokens_map.json CHANGED
@@ -2,10 +2,12 @@
   "additional_special_tokens": [
   "<unk>",
   "<s>",
- "</s>"
+ "</s>",
+ "<|eot|>",
+ "<|eof|>",
+ "<|bof|>"
   ],
   "bos_token": "<s>",
   "eos_token": "</s>",
- "pad_token": "</s>",
   "unk_token": "<unk>"
  }
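After this change the three control tokens are listed as additional special tokens and the pad token is no longer aliased to "</s>". A sketch of how that surfaces when the tokenizer is loaded from the assumed local checkout:

from transformers import AutoTokenizer

# Hypothetical local checkout of this repo; adjust the path as needed.
tokenizer = AutoTokenizer.from_pretrained("./checkout")

# The control tokens now appear among the additional special tokens,
# and the pad token is unset rather than reusing "</s>".
print(tokenizer.additional_special_tokens)  # [..., "<|eot|>", "<|eof|>", "<|bof|>"]
print(tokenizer.pad_token)                  # None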
tokenizer_config.json CHANGED
@@ -27,45 +27,48 @@
   "special": true
   },
   "32000": {
- "content": "<|bof|>",
+ "content": "<|eot|>",
   "lstrip": true,
- "normalized": true,
+ "normalized": false,
   "rstrip": true,
   "single_word": false,
- "special": false
+ "special": true
   },
   "32001": {
   "content": "<|eof|>",
   "lstrip": true,
- "normalized": true,
+ "normalized": false,
   "rstrip": true,
   "single_word": false,
- "special": false
+ "special": true
   },
   "32002": {
- "content": "<|eot|>",
+ "content": "<|bof|>",
   "lstrip": true,
- "normalized": true,
+ "normalized": false,
   "rstrip": true,
   "single_word": false,
- "special": false
+ "special": true
   }
   },
   "additional_special_tokens": [
   "<unk>",
   "<s>",
- "</s>"
+ "</s>",
+ "<|eot|>",
+ "<|eof|>",
+ "<|bof|>"
   ],
   "bos_token": "<s>",
   "clean_up_tokenization_spaces": false,
   "eos_token": "</s>",
   "legacy": true,
   "model_max_length": 1000000000000000019884624838656,
- "pad_token": "</s>",
+ "pad_token": null,
   "sp_model_kwargs": {},
   "spaces_between_special_tokens": false,
   "tokenizer_class": "LlamaTokenizer",
- "tokenizer_file": "/root/.cache/huggingface/hub/models--mistralai--Mistral-7B-v0.1/snapshots/60e27e7bebd4aaf2edf6f4d172346bfc95e2ae40/tokenizer.json",
+ "tokenizer_file": "/workspace/Mistral-7B-v0.1/tokenizer.json",
   "unk_token": "<unk>",
   "use_default_system_prompt": true
   }
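With "special": true and "normalized": false in the updated tokenizer_config.json, each control token should be kept as a single, unsplit ID that matches the remapped added_tokens.json, and should be stripped during decoding when special tokens are skipped. A sketch of that check, again against an assumed local checkout:

from transformers import AutoTokenizer

# Hypothetical local checkout of this repo; adjust the path as needed.
tokenizer = AutoTokenizer.from_pretrained("./checkout")

# Each control token should encode to exactly one ID under the remapped layout.
for token, expected_id in [("<|eot|>", 32000), ("<|eof|>", 32001), ("<|bof|>", 32002)]:
    ids = tokenizer.encode(token, add_special_tokens=False)
    print(token, ids)  # expected: [expected_id]

# With "special": true, these IDs are dropped by skip_special_tokens when decoding.
print(repr(tokenizer.decode([32000, 32001, 32002], skip_special_tokens=True)))  # expected: ''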