pdjohn
/

C-EBERT-210m

Token Classification

Model card · Files and versions

pdjohn committed on Aug 3

Commit

b1cfa89

·

verified ·

1 Parent(s): d63e02b

Upload model

Files changed (2) hide show

config.json +70 -0
model.safetensors +3 -0

config.json ADDED Viewed

	@@ -0,0 +1,70 @@

+{
+  "architectures": [
+    "CausalBERTMultiTaskModel"
+  ],
+  "attention_bias": false,
+  "attention_dropout": 0.0,
+  "auto_map": {
+    "AutoConfig": "configuration_eurobert.EuroBertConfig",
+    "AutoModel": "modeling_eurobert.EuroBertModel",
+    "AutoModelForMaskedLM": "modeling_eurobert.EuroBertForMaskedLM",
+    "AutoModelForPreTraining": "modeling_eurobert.EuroBertPreTrainedModel",
+    "AutoModelForSequenceClassification": "modeling_eurobert.EuroBertForSequenceClassification",
+    "AutoModelForTokenClassification": "modeling_eurobert.EuroBertForTokenClassification"
+  },
+  "base_model_name": "EuroBERT/EuroBERT-210m",
+  "bos_token": "<|begin_of_text|>",
+  "bos_token_id": 128000,
+  "clf_pooling": "late",
+  "eos_token": "<|end_of_text|>",
+  "eos_token_id": 128001,
+  "head_dim": 64,
+  "hidden_act": "silu",
+  "hidden_dropout": 0.0,
+  "hidden_size": 768,
+  "id2label_relation": {
+    "0": "NO_RELATION",
+    "1": "CAUSE",
+    "2": "EFFECT",
+    "3": "INTERDEPENDENCY"
+  },
+  "id2label_span": {
+    "0": "O",
+    "1": "B-INDICATOR",
+    "2": "I-INDICATOR",
+    "3": "B-ENTITY",
+    "4": "I-ENTITY"
+  },
+  "initializer_range": 0.02,
+  "intermediate_size": 3072,
+  "mask_token": "<|mask|>",
+  "mask_token_id": 128002,
+  "max_position_embeddings": 8192,
+  "mlp_bias": false,
+  "model_type": "causalbert_multitask",
+  "num_attention_heads": 12,
+  "num_hidden_layers": 12,
+  "num_key_value_heads": 12,
+  "num_relation_labels": 4,
+  "num_span_labels": 5,
+  "pad_token": "<|end_of_text|>",
+  "pad_token_id": 128001,
+  "pretraining_tp": 1,
+  "relation_class_weights": null,
+  "rms_norm_eps": 1e-05,
+  "rope_scaling": null,
+  "rope_theta": 250000,
+  "span_class_weights": [
+    0.09086648603440675,
+    2.1256438250409166,
+    1.4697529981521529,
+    0.9365069591289833,
+    0.37722973164353996
+  ],
+  "tie_word_embeddings": false,
+  "torch_dtype": "bfloat16",
+  "transformers_version": "4.53.1",
+  "use_cache": false,
+  "vocab_size": 128256,
+  "vocab_size_with_special_tokens": 128256
+}

model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7ce980756462746c271fc6aa8e71b1da7efdab38434a890802ba384ca70220f6
+size 423558482