pretrain core 1
Browse files
- README.md +4 -0
- scripts/pretrain_core_model_1.yaml +1 -1
README.md
CHANGED
@@ -197,3 +197,7 @@ Tasks |Version|Filter|n-shot| Metric |
|
|
197 |
```bash
|
198 |
litgpt convert_pretrained_checkpoint ../out/pretrain-core-0/final ../out/pretrain-core-0/checkpoint
|
199 |
```
|
|
|
|
|
|
|
|
|
|
197 |
```bash
|
198 |
litgpt convert_pretrained_checkpoint ../out/pretrain-core-0/final ../out/pretrain-core-0/checkpoint
|
199 |
```
|
200 |
+
|
201 |
+
```bash
|
202 |
+
CUDA_VISIBLE_DEVICES=0 CUDA_LAUNCH_BLOCKING=0 PYTORCH_CUDA_ALLOC_CONF=expandable_segments:True litgpt pretrain --config pretrain_core_model_1.yaml
|
203 |
+
```
|
scripts/pretrain_core_model_1.yaml
CHANGED
@@ -85,7 +85,7 @@ train:
|
|
85 |
max_norm: 1.0
|
86 |
|
87 |
# (type: float, default: 4e-05)
|
88 |
-
min_lr: 1e-
|
89 |
|
90 |
# Evaluation-related arguments. See ``litgpt.args.EvalArgs`` for details
|
91 |
eval:
|
|
|
85 |
max_norm: 1.0
|
86 |
|
87 |
# (type: float, default: 4e-05)
|
88 |
+
min_lr: 1e-5
|
89 |
|
90 |
# Evaluation-related arguments. See ``litgpt.args.EvalArgs`` for details
|
91 |
eval:
|