InterwebAlchemy committed on
Commit
f1f85c8
·
verified ·
1 Parent(s): f4514e5

Update tokenizer

Browse files

Update tokenizer to use `NFC` normalization because transformers.js doesn't support `NFD`

Files changed (2) hide show
  1. special_tokens_map.json +1 -0
  2. tokenizer.json +1 -1
special_tokens_map.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {}
tokenizer.json CHANGED
@@ -41,7 +41,7 @@
41
  }
42
  ],
43
  "normalizer": {
44
- "type": "NFD"
45
  },
46
  "pre_tokenizer": {
47
  "type": "Split",
 
41
  }
42
  ],
43
  "normalizer": {
44
+ "type": "NFC"
45
  },
46
  "pre_tokenizer": {
47
  "type": "Split",