phongdtd committed on
Commit
0fc29d1
·
1 Parent(s): e57eece

add tokenizer

Browse files
Files changed (1) hide show
  1. vocab.json +1 -1
vocab.json CHANGED
@@ -1 +1 @@
1
- {"": 0, "": 1, "": 2, "d": 3, "ơ": 4, "w": 5, "s": 6, "ũ": 7, "c": 8, "é": 9, "": 10, "í": 11, "": 12, "": 13, "": 14, "": 15, "ô": 16, "ù": 17, "r": 18, "m": 19, "": 20, "â": 21, "j": 22, "": 23, "": 24, "ì": 25, "ý": 26, "": 27, "g": 28, "": 29, "": 30, "h": 31, "": 32, "": 33, "": 34, "e": 35, "à": 36, "": 37, "l": 38, "z": 39, "è": 40, "ă": 41, "": 42, "": 43, "ê": 44, "ặ": 45, "": 46, "u": 47, "ĩ": 48, "õ": 49, "b": 50, "á": 51, "": 52, "o": 53, "": 54, "": 55, "": 56, "": 57, "": 58, "": 59, "k": 60, "": 61, "": 62, "": 63, "": 64, "": 65, "p": 66, "": 67, "ã": 68, "ế": 69, "a": 70, "ó": 71, "": 72, "x": 73, "n": 74, "t": 75, "ú": 76, "f": 77, "": 78, "q": 79, "": 80, "v": 81, "": 82, "ò": 83, "": 84, "": 85, "đ": 87, "": 88, "ư": 89, "y": 90, "": 91, "i": 92, "": 93, "|": 86, "[UNK]": 94, "[PAD]": 95}
 
1
+ {"": 0, "": 1, "": 2, "": 3, "ĩ": 4, "": 5, "": 6, "m": 7, "o": 8, "": 9, "": 10, "": 11, "": 12, "y": 13, "ũ": 14, "": 15, "": 16, "s": 17, "": 18, "": 19, "": 20, "": 21, "ô": 22, "": 23, "đ": 24, "ù": 25, "b": 26, "": 27, "": 28, "l": 29, "t": 30, "j": 31, "ă": 32, "": 33, "": 34, "f": 35, "": 36, "ó": 37, "": 38, "": 39, "h": 40, "k": 41, "e": 42, "c": 43, "": 45, "v": 46, "": 47, "": 48, "": 49, "p": 50, "ơ": 51, "": 52, "z": 53, "é": 54, "": 55, "": 56, "ế": 57, "ú": 58, "": 59, "r": 60, "ý": 61, "g": 62, "õ": 63, "q": 64, "n": 65, "": 66, "í": 67, "": 68, "ã": 69, "u": 70, "è": 71, "": 72, "ì": 73, "a": 74, "w": 75, "d": 76, "ò": 77, "": 78, "": 79, "": 80, "i": 81, "ư": 82, "": 83, "á": 84, "â": 85, "à": 86, "x": 87, "": 88, "": 89, "": 90, "": 91, "": 92, "ê": 93, "|": 44, "[UNK]": 94, "[PAD]": 95}