Text Generation
Transformers
PyTorch
English
modernbert-decoder
ettin
decoder
orionweller committed on
Commit
b934570
·
verified ·
1 Parent(s): a0dc4ad

Add checkpoint for ext1730

Browse files
Files changed (2) hide show
  1. config.json +3 -3
  2. pytorch_model.bin +1 -1
config.json CHANGED
@@ -16,7 +16,7 @@
16
  "embedding_dropout": 0.0,
17
  "eos_token_id": 50282,
18
  "global_attn_every_n_layers": 3,
19
- "global_rope_theta": 10000.0,
20
  "gradient_checkpointing": false,
21
  "hidden_activation": "gelu",
22
  "hidden_size": 1024,
@@ -25,8 +25,8 @@
25
  "intermediate_size": 2624,
26
  "layer_norm_eps": 1e-05,
27
  "local_attention": 128,
28
- "local_rope_theta": 10000.0,
29
- "max_position_embeddings": 1024,
30
  "mlp_bias": false,
31
  "mlp_dropout": 0.0,
32
  "model_type": "modernbert-decoder",
 
16
  "embedding_dropout": 0.0,
17
  "eos_token_id": 50282,
18
  "global_attn_every_n_layers": 3,
19
+ "global_rope_theta": 160000.0,
20
  "gradient_checkpointing": false,
21
  "hidden_activation": "gelu",
22
  "hidden_size": 1024,
 
25
  "intermediate_size": 2624,
26
  "layer_norm_eps": 1e-05,
27
  "local_attention": 128,
28
+ "local_rope_theta": 160000.0,
29
+ "max_position_embeddings": 7999,
30
  "mlp_bias": false,
31
  "mlp_dropout": 0.0,
32
  "model_type": "modernbert-decoder",
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2f966813b781a4560828a6bab0d88a4e303dfb34f12ed5d5f898c6adf2e28532
3
  size 1583588094
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6907cad400221bd490cf10612bf435efbcaa8e24e0723c0725b77a1a888fca44
3
  size 1583588094