pretrain core
Browse files
scripts/pretrain_core_model_0.yaml
CHANGED
@@ -76,7 +76,7 @@ train:
   max_steps:
 
   # Limits the length of samples. Off by default (type: Optional[int], default: null)
-  max_seq_length:
+  max_seq_length: 1025
 
   # Whether to tie the embedding weights with the language modeling head weights. (type: Optional[bool], default: False)
   tie_embeddings: false