tarabukinivan commited on
Commit
86a9c58
·
verified ·
1 Parent(s): c9c9bbd

Training in progress, step 37, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:af45f5a20c7781427e7d13de0ca4866a1cf71bade19be14ca66dbe14b1506f58
3
  size 83945296
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2c5ceccac1e41b6ab4943a237b1547f43185be9ed933d9176b9b40e074d40c0d
3
  size 83945296
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6cecc7bb05c4bb579b040038b3f705ed45416975b87e35007c8e22c6569d7a45
3
  size 168149074
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b63c60c259f42e050012676d4745e55605d17127eda745371ccef41c90351f30
3
  size 168149074
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c7034eba1ae19e0d8d26b6a7beae9c6e8303193d228a3589cb78845a2ac46c6a
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d5984d2f8f71fff6b08847d3fcb1f324914b36bd22b35d67488d6a319a5d85a5
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:24f70974ebe6e16031ce63527ce3fea95f8e56e83073513783f6d8a14f9aa0e8
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:403a4035e63034a6e33503614432aa83d524d5b8ffac47cac18a35f9606be4b7
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.11017597551644988,
5
  "eval_steps": 5,
6
- "global_step": 36,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -169,12 +169,12 @@
169
  "should_evaluate": false,
170
  "should_log": false,
171
  "should_save": true,
172
- "should_training_stop": false
173
  },
174
  "attributes": {}
175
  }
176
  },
177
- "total_flos": 1.340934079905792e+16,
178
  "train_batch_size": 2,
179
  "trial_name": null,
180
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 0.11323641928079571,
5
  "eval_steps": 5,
6
+ "global_step": 37,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
169
  "should_evaluate": false,
170
  "should_log": false,
171
  "should_save": true,
172
+ "should_training_stop": true
173
  },
174
  "attributes": {}
175
  }
176
  },
177
+ "total_flos": 1.3779253648687104e+16,
178
  "train_batch_size": 2,
179
  "trial_name": null,
180
  "trial_params": null