Wietse de Vries
commited on
Commit
·
b23d41b
1
Parent(s):
61330c1
add missing char tokens to vocab (with embeddings close to [UNK])
Browse files- config.json +6 -3
- pytorch_model.bin +2 -2
- tf_model.h5 +2 -2
- vocab.txt +73 -0
config.json
CHANGED
@@ -1,5 +1,5 @@
|
|
1 |
{
|
2 |
-
"_name_or_path": "
|
3 |
"architectures": [
|
4 |
"BertForMaskedLM"
|
5 |
],
|
@@ -16,6 +16,9 @@
|
|
16 |
"num_attention_heads": 12,
|
17 |
"num_hidden_layers": 12,
|
18 |
"pad_token_id": 3,
|
|
|
|
|
19 |
"type_vocab_size": 2,
|
20 |
-
"
|
21 |
-
|
|
|
|
1 |
{
|
2 |
+
"_name_or_path": "bert-base-dutch-cased",
|
3 |
"architectures": [
|
4 |
"BertForMaskedLM"
|
5 |
],
|
|
|
16 |
"num_attention_heads": 12,
|
17 |
"num_hidden_layers": 12,
|
18 |
"pad_token_id": 3,
|
19 |
+
"position_embedding_type": "absolute",
|
20 |
+
"transformers_version": "4.5.1",
|
21 |
"type_vocab_size": 2,
|
22 |
+
"use_cache": true,
|
23 |
+
"vocab_size": 30073
|
24 |
+
}
|
pytorch_model.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5ffe408c7eea0ffee4c257c6028f8c98146967e3ac3db51dba8e2bc8a4abddf5
|
3 |
+
size 436761702
|
tf_model.h5
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:88cc47b929d21ed816d6ad8d5abea5c06ccae04a5f04f2d6b07da7d212aa18e1
|
3 |
+
size 530923844
|
vocab.txt
CHANGED
@@ -29998,3 +29998,76 @@ zóó
|
|
29998 |
##öl
|
29999 |
##ön
|
30000 |
##ör
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
29998 |
##öl
|
29999 |
##ön
|
30000 |
##ör
|
30001 |
+
##Q
|
30002 |
+
##X
|
30003 |
+
##Ç
|
30004 |
+
##Ó
|
30005 |
+
##Ô
|
30006 |
+
##Ú
|
30007 |
+
##Û
|
30008 |
+
##Ü
|
30009 |
+
##à
|
30010 |
+
##á
|
30011 |
+
##â
|
30012 |
+
##ä
|
30013 |
+
##ê
|
30014 |
+
##ì
|
30015 |
+
##í
|
30016 |
+
##î
|
30017 |
+
##ñ
|
30018 |
+
##ò
|
30019 |
+
##ô
|
30020 |
+
##ù
|
30021 |
+
##ú
|
30022 |
+
##û
|
30023 |
+
##ü
|
30024 |
+
Q
|
30025 |
+
X
|
30026 |
+
a
|
30027 |
+
c
|
30028 |
+
e
|
30029 |
+
f
|
30030 |
+
g
|
30031 |
+
h
|
30032 |
+
i
|
30033 |
+
j
|
30034 |
+
k
|
30035 |
+
l
|
30036 |
+
m
|
30037 |
+
n
|
30038 |
+
o
|
30039 |
+
p
|
30040 |
+
q
|
30041 |
+
r
|
30042 |
+
s
|
30043 |
+
t
|
30044 |
+
u
|
30045 |
+
x
|
30046 |
+
y
|
30047 |
+
Ç
|
30048 |
+
Ó
|
30049 |
+
Ô
|
30050 |
+
Ú
|
30051 |
+
Û
|
30052 |
+
Ü
|
30053 |
+
à
|
30054 |
+
á
|
30055 |
+
â
|
30056 |
+
ä
|
30057 |
+
è
|
30058 |
+
é
|
30059 |
+
ê
|
30060 |
+
ë
|
30061 |
+
ì
|
30062 |
+
í
|
30063 |
+
î
|
30064 |
+
ï
|
30065 |
+
ñ
|
30066 |
+
ò
|
30067 |
+
ó
|
30068 |
+
ô
|
30069 |
+
ö
|
30070 |
+
ù
|
30071 |
+
ú
|
30072 |
+
û
|
30073 |
+
ü
|