Update README.md
Browse files
README.md
CHANGED
@@ -12,10 +12,6 @@ xLSTM Trained on a shuffled wikimedia/wikipedia 20231101.en dataset (seed=42)
|
|
12 |
Model checkpoints as branches
|
13 |
|
14 |
```
|
15 |
-
num_blocks=24,
|
16 |
-
num_heads=4,
|
17 |
-
embedding_dim=768,
|
18 |
-
|
19 |
per_device_train_batch_size=32,
|
20 |
logging_steps=3650,
|
21 |
gradient_accumulation_steps=8,
|
|
|
12 |
Model checkpoints as branches
|
13 |
|
14 |
```
|
|
|
|
|
|
|
|
|
15 |
per_device_train_batch_size=32,
|
16 |
logging_steps=3650,
|
17 |
gradient_accumulation_steps=8,
|