mtasic85 committed on
Commit
72813f2
·
1 Parent(s): 9fbd906

pretrain core 1

Browse files
Files changed (2) hide show
  1. README.md +4 -0
  2. scripts/pretrain_core_model_1.yaml +1 -1
README.md CHANGED
@@ -197,3 +197,7 @@ Tasks |Version|Filter|n-shot| Metric |
197
  ```bash
198
  litgpt convert_pretrained_checkpoint ../out/pretrain-core-0/final ../out/pretrain-core-0/checkpoint
199
  ```
 
 
 
 
 
197
  ```bash
198
  litgpt convert_pretrained_checkpoint ../out/pretrain-core-0/final ../out/pretrain-core-0/checkpoint
199
  ```
200
+
201
+ ```bash
202
+ CUDA_VISIBLE_DEVICES=0 CUDA_LAUNCH_BLOCKING=0 PYTORCH_CUDA_ALLOC_CONF=expandable_segments:True litgpt pretrain --config pretrain_core_model_1.yaml
203
+ ```
scripts/pretrain_core_model_1.yaml CHANGED
@@ -85,7 +85,7 @@ train:
85
  max_norm: 1.0
86
 
87
  # (type: float, default: 4e-05)
88
- min_lr: 1e-6
89
 
90
  # Evaluation-related arguments. See ``litgpt.args.EvalArgs`` for details
91
  eval:
 
85
  max_norm: 1.0
86
 
87
  # (type: float, default: 4e-05)
88
+ min_lr: 1e-5
89
 
90
  # Evaluation-related arguments. See ``litgpt.args.EvalArgs`` for details
91
  eval: