rishi70612 commited on
Commit
24cf2d0
·
verified ·
1 Parent(s): f3a126c

Training in progress, step 16800, checkpoint

Browse files
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4c882567b4587e54e73e64f89aebf7700832afcf149737b89c4ab63b4ad03f67
3
- size 14567
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3dcfcd7c355804cf8b13e6226a71391df1b5d90db51709d836250af5fd03a627
3
+ size 14503
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 3.8704487722269265,
5
  "eval_steps": 800,
6
- "global_step": 16000,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -327,6 +327,22 @@
327
  "eval_steps_per_second": 5.398,
328
  "eval_wer": 1.0,
329
  "step": 16000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
330
  }
331
  ],
332
  "logging_steps": 800,
@@ -346,7 +362,7 @@
346
  "attributes": {}
347
  }
348
  },
349
- "total_flos": 3.614468588324194e+19,
350
  "train_batch_size": 16,
351
  "trial_name": null,
352
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 4.063868392403532,
5
  "eval_steps": 800,
6
+ "global_step": 16800,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
327
  "eval_steps_per_second": 5.398,
328
  "eval_wer": 1.0,
329
  "step": 16000
330
+ },
331
+ {
332
+ "epoch": 4.063868392403532,
333
+ "grad_norm": NaN,
334
+ "learning_rate": 0.0002604114621601763,
335
+ "loss": 0.0,
336
+ "step": 16800
337
+ },
338
+ {
339
+ "epoch": 4.063868392403532,
340
+ "eval_loss": NaN,
341
+ "eval_runtime": 527.7152,
342
+ "eval_samples_per_second": 44.232,
343
+ "eval_steps_per_second": 5.529,
344
+ "eval_wer": 1.0,
345
+ "step": 16800
346
  }
347
  ],
348
  "logging_steps": 800,
 
362
  "attributes": {}
363
  }
364
  },
365
+ "total_flos": 3.7959210547118785e+19,
366
  "train_batch_size": 16,
367
  "trial_name": null,
368
  "trial_params": null