pretrain 0
Browse files
scripts/pretrain_core_model_0.yaml
CHANGED
@@ -1,11 +1,11 @@
|
|
1 |
# The name of the model to pretrain. Choose from names in ``litgpt.config``. Mutually exclusive with
|
2 |
# ``model_config``. (type: Optional[str], default: null)
|
3 |
-
model_name: 'tangled-alpha-0.
|
4 |
|
5 |
# A ``litgpt.Config`` object to define the model architecture. Mutually exclusive with
|
6 |
# ``model_name``. (type: Optional[Config], default: null)
|
7 |
model_config:
|
8 |
-
name: 'tangled-alpha-0.
|
9 |
block_size: 131072
|
10 |
vocab_size: 131072
|
11 |
padded_vocab_size: 131072
|
|
|
1 |
# The name of the model to pretrain. Choose from names in ``litgpt.config``. Mutually exclusive with
|
2 |
# ``model_config``. (type: Optional[str], default: null)
|
3 |
+
model_name: 'tangled-alpha-0.10-core'
|
4 |
|
5 |
# A ``litgpt.Config`` object to define the model architecture. Mutually exclusive with
|
6 |
# ``model_name``. (type: Optional[Config], default: null)
|
7 |
model_config:
|
8 |
+
name: 'tangled-alpha-0.10-core'
|
9 |
block_size: 131072
|
10 |
vocab_size: 131072
|
11 |
padded_vocab_size: 131072
|