KoichiYasuoka committed on
Commit
35d0ceb
1 Parent(s): 3d47df5

tokenizer improved

Browse files
Files changed (1) hide show
  1. tokenizer.json +4 -2
tokenizer.json CHANGED
@@ -110,7 +110,8 @@
110
  "pre_tokenizer": {
111
  "type": "Metaspace",
112
  "replacement": "▁",
113
- "add_prefix_space": true
 
114
  },
115
  "post_processor": {
116
  "type": "TemplateProcessing",
@@ -190,7 +191,8 @@
190
  "decoder": {
191
  "type": "Metaspace",
192
  "replacement": "▁",
193
- "add_prefix_space": true
 
194
  },
195
  "model": {
196
  "type": "Unigram",
 
110
  "pre_tokenizer": {
111
  "type": "Metaspace",
112
  "replacement": "▁",
113
+ "add_prefix_space": true,
114
+ "prepend_scheme": "always"
115
  },
116
  "post_processor": {
117
  "type": "TemplateProcessing",
 
191
  "decoder": {
192
  "type": "Metaspace",
193
  "replacement": "▁",
194
+ "add_prefix_space": true,
195
+ "prepend_scheme": "always"
196
  },
197
  "model": {
198
  "type": "Unigram",