luissattelmayer committed on
Commit
576ffb9
·
verified ·
1 Parent(s): 075c6a6

Training in progress, epoch 1

Browse files
Files changed (3) hide show
  1. config.json +11 -11
  2. model.safetensors +2 -2
  3. tokenizer.json +2 -2
config.json CHANGED
@@ -1,16 +1,16 @@
1
  {
2
- "_name_or_path": "EuroBERT/EuroBERT-610m",
3
  "architectures": [
4
  "EuroBertForSequenceClassification"
5
  ],
6
  "attention_bias": false,
7
  "attention_dropout": 0.0,
8
  "auto_map": {
9
- "AutoConfig": "EuroBERT/EuroBERT-610m--configuration_eurobert.EuroBertConfig",
10
- "AutoModel": "EuroBERT/EuroBERT-610m--modeling_eurobert.EuroBertModel",
11
- "AutoModelForMaskedLM": "EuroBERT/EuroBERT-610m--modeling_eurobert.EuroBertForMaskedLM",
12
- "AutoModelForPreTraining": "EuroBERT/EuroBERT-610m--modeling_eurobert.EuroBertPreTrainedModel",
13
- "AutoModelForSequenceClassification": "EuroBERT/EuroBERT-610m--modeling_eurobert.EuroBertForSequenceClassification"
14
  },
15
  "bos_token": "<|begin_of_text|>",
16
  "bos_token_id": 128000,
@@ -20,13 +20,13 @@
20
  "head_dim": 64,
21
  "hidden_act": "silu",
22
  "hidden_dropout": 0.0,
23
- "hidden_size": 1152,
24
  "id2label": {
25
  "0": "0",
26
  "1": "1"
27
  },
28
  "initializer_range": 0.02,
29
- "intermediate_size": 4096,
30
  "label2id": {
31
  "0": 0,
32
  "1": 1
@@ -36,9 +36,9 @@
36
  "max_position_embeddings": 8192,
37
  "mlp_bias": false,
38
  "model_type": "eurobert",
39
- "num_attention_heads": 18,
40
- "num_hidden_layers": 26,
41
- "num_key_value_heads": 6,
42
  "pad_token": "<|end_of_text|>",
43
  "pad_token_id": 128001,
44
  "pretraining_tp": 1,
 
1
  {
2
+ "_name_or_path": "EuroBERT/EuroBERT-210m",
3
  "architectures": [
4
  "EuroBertForSequenceClassification"
5
  ],
6
  "attention_bias": false,
7
  "attention_dropout": 0.0,
8
  "auto_map": {
9
+ "AutoConfig": "EuroBERT/EuroBERT-210m--configuration_eurobert.EuroBertConfig",
10
+ "AutoModel": "EuroBERT/EuroBERT-210m--modeling_eurobert.EuroBertModel",
11
+ "AutoModelForMaskedLM": "EuroBERT/EuroBERT-210m--modeling_eurobert.EuroBertForMaskedLM",
12
+ "AutoModelForPreTraining": "EuroBERT/EuroBERT-210m--modeling_eurobert.EuroBertPreTrainedModel",
13
+ "AutoModelForSequenceClassification": "EuroBERT/EuroBERT-210m--modeling_eurobert.EuroBertForSequenceClassification"
14
  },
15
  "bos_token": "<|begin_of_text|>",
16
  "bos_token_id": 128000,
 
20
  "head_dim": 64,
21
  "hidden_act": "silu",
22
  "hidden_dropout": 0.0,
23
+ "hidden_size": 768,
24
  "id2label": {
25
  "0": "0",
26
  "1": "1"
27
  },
28
  "initializer_range": 0.02,
29
+ "intermediate_size": 3072,
30
  "label2id": {
31
  "0": 0,
32
  "1": 1
 
36
  "max_position_embeddings": 8192,
37
  "mlp_bias": false,
38
  "model_type": "eurobert",
39
+ "num_attention_heads": 12,
40
+ "num_hidden_layers": 12,
41
+ "num_key_value_heads": 12,
42
  "pad_token": "<|end_of_text|>",
43
  "pad_token_id": 128001,
44
  "pretraining_tp": 1,
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:26862fb8cc9725d04d5cdec6b8254dfa8e492c73517528570538b850b8d24483
3
- size 2436848328
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d13e4146835bb9170066397a9f57729e02ac37a74b3aa88e23a812709cafd1ad
3
+ size 849445136
tokenizer.json CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:90afafb9441b9e4eeef11d619ff14569747135aaf1e83ba12aa1c734a0177edf
3
- size 17209997
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fc2befa162f4fa90daed0d884a2db4d02c2da3f6d2172dcd44b2d15259e4fb49
3
+ size 17210081