Update config.json
config.json CHANGED: +2 -4
@@ -1,6 +1,6 @@
 {
   "architectures": [
-    "
+    "NemotronForCausalLM"
   ],
   "attention_bias": false,
   "attention_dropout": 0.0,
@@ -19,13 +19,11 @@
   "num_attention_heads": 24,
   "num_hidden_layers": 32,
   "num_key_value_heads": 8,
-  "pad_token_id": 0,
   "partial_rotary_factor": 0.5,
   "rope_theta": 10000,
   "tie_word_embeddings": false,
   "torch_dtype": "bfloat16",
   "transformers_version": "4.51.3",
-  "unsloth_version": "2025.5.7",
   "use_cache": true,
   "vocab_size": 256000
-}
+}
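For context, a minimal sketch of how this config is consumed (not part of the commit): transformers' AutoConfig reads the "architectures" field, so with "NemotronForCausalLM" in place the checkpoint should resolve to the Nemotron model classes. The local path "./model-dir" below is a placeholder for a directory containing this config.json and the weights.

from transformers import AutoConfig, AutoModelForCausalLM

# AutoConfig parses config.json; the "architectures" entry determines
# which model class the checkpoint maps to.
config = AutoConfig.from_pretrained("./model-dir")  # placeholder path
print(config.architectures)  # expected: ['NemotronForCausalLM']

# AutoModelForCausalLM uses the same mapping to instantiate the model;
# torch_dtype="auto" honors the "torch_dtype": "bfloat16" entry above.
model = AutoModelForCausalLM.from_pretrained("./model-dir", torch_dtype="auto")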