avsolatorio commited on
Commit
99028ad
·
verified ·
1 Parent(s): 8b3c196

Training in progress, step 10000, checkpoint

Browse files
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b01285a843120ba7ed07c3b635d0b9c12f1bd1a012476f6d6399b1ebb428f613
3
  size 567860028
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:48e8ffaebfd6ef605ed7a70d898584f2d78a8d777d3176ef4dce697bcdef898c
3
  size 567860028
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c64aa2fa830f9a105805231b81df9bad87e08045f07f00f99e8178f0ad45c467
3
  size 1135783354
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f3d35e2adfee94a3f11af486d31ba30fb618502f9c1f33b283e9c6c61b50868f
3
  size 1135783354
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d2ba8d6eeeac1e2a3c2b4bf6a1a6da24d5e75e0c7e0c4a320806088cc6a5239f
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b2ed4580c3880e0fb178fd3387bc120234bd8b0c5f80ab76ddf25a7512d7b4b3
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f8e3991895adc0982abbe1eaf294042aa9cc197b13c08fe21c235f8d50ffdc14
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b7100428e35f211c455e0edf66e71a9c6844c13e9f45aabcb2c136afe45ca3ce
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
- "best_metric": 0.039172105491161346,
3
- "best_model_checkpoint": "doc-topic-model_eval-00_train-02/checkpoint-9000",
4
- "epoch": 4.437869822485207,
5
  "eval_steps": 1000,
6
- "global_step": 9000,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -241,6 +241,32 @@
241
  "eval_samples_per_second": 304.881,
242
  "eval_steps_per_second": 19.06,
243
  "step": 9000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
244
  }
245
  ],
246
  "logging_steps": 500,
@@ -260,7 +286,7 @@
260
  "attributes": {}
261
  }
262
  },
263
- "total_flos": 203241954845196.0,
264
  "train_batch_size": 4,
265
  "trial_name": null,
266
  "trial_params": null
 
1
  {
2
+ "best_metric": 0.03805544227361679,
3
+ "best_model_checkpoint": "doc-topic-model_eval-00_train-02/checkpoint-10000",
4
+ "epoch": 4.930966469428008,
5
  "eval_steps": 1000,
6
+ "global_step": 10000,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
241
  "eval_samples_per_second": 304.881,
242
  "eval_steps_per_second": 19.06,
243
  "step": 9000
244
+ },
245
+ {
246
+ "epoch": 4.684418145956608,
247
+ "grad_norm": 0.43250563740730286,
248
+ "learning_rate": 1.0631163708086787e-05,
249
+ "loss": 0.0352,
250
+ "step": 9500
251
+ },
252
+ {
253
+ "epoch": 4.930966469428008,
254
+ "grad_norm": 0.49166053533554077,
255
+ "learning_rate": 1.0138067061143987e-05,
256
+ "loss": 0.035,
257
+ "step": 10000
258
+ },
259
+ {
260
+ "epoch": 4.930966469428008,
261
+ "eval_accuracy": 0.9873464007823461,
262
+ "eval_f1": 0.5759475634083785,
263
+ "eval_loss": 0.03805544227361679,
264
+ "eval_precision": 0.7600601729973674,
265
+ "eval_recall": 0.46363844918559305,
266
+ "eval_runtime": 26.4106,
267
+ "eval_samples_per_second": 307.074,
268
+ "eval_steps_per_second": 19.197,
269
+ "step": 10000
270
  }
271
  ],
272
  "logging_steps": 500,
 
286
  "attributes": {}
287
  }
288
  },
289
+ "total_flos": 225936279463716.0,
290
  "train_batch_size": 4,
291
  "trial_name": null,
292
  "trial_params": null