ihanif committed on
Commit
c2e2c52
·
verified ·
1 Parent(s): 44df140

Training in progress, step 2100, checkpoint

Browse files
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e99427d68f8233aa1f1c5bb73907e5d9681f9991acb722d5d8f0825832c2f791
3
  size 290403936
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:44dc2faa43ac5a3436dfa3b3bed4aa7c966e4ea4f657d4e6dfca9280a68205ed
3
  size 290403936
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f61c7abc74279095f7ed91d83ceb4ef17ae8f88cda63034464aa1242afbd199a
3
  size 574811514
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1a48debe5a827e29a4f0cc6af4177c358b9b7475853d96668a3332a6bcf5927e
3
  size 574811514
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:28c0cd479201fbb3ddf3b97d0708b8cd4b54efb5dd7439ed8dc16f0f7519ee85
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:04493c60d37ce82f60a8454f7936d5c5083c1013f2dc35a3da96b38580130f41
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ba7673f5d0f1631494ad72f8f050fc150ee4f9e1b527943111bb3dd31bbe4f29
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1d9f44034f20488b71439652353f4af422345160519981213e36f7e2d9306983
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e9a091a177a6000f85d9e8e7d6c3f964e3dfd92da03bfd940a7c2ea7974b6392
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c28781354eb93a174ad9fc8e149ed54169a6a66d39d32994acc35f88e6241d9e
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": 21.52664063484066,
3
  "best_model_checkpoint": "whisper-base-cv20-v2/checkpoint-1500",
4
- "epoch": 2.564102564102564,
5
  "eval_steps": 100,
6
- "global_step": 2000,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -767,6 +767,44 @@
767
  "eval_wer": 146.00495444430447,
768
  "eval_wer_ortho": 145.57382494602226,
769
  "step": 2000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
770
  }
771
  ],
772
  "logging_steps": 25,
@@ -786,7 +824,7 @@
786
  "attributes": {}
787
  }
788
  },
789
- "total_flos": 8.30026342858752e+18,
790
  "train_batch_size": 64,
791
  "trial_name": null,
792
  "trial_params": null
 
1
  {
2
  "best_metric": 21.52664063484066,
3
  "best_model_checkpoint": "whisper-base-cv20-v2/checkpoint-1500",
4
+ "epoch": 2.6923076923076925,
5
  "eval_steps": 100,
6
+ "global_step": 2100,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
767
  "eval_wer": 146.00495444430447,
768
  "eval_wer_ortho": 145.57382494602226,
769
  "step": 2000
770
+ },
771
+ {
772
+ "epoch": 2.5961538461538463,
773
+ "grad_norm": 4.9953694343566895,
774
+ "learning_rate": 7.573599240265908e-06,
775
+ "loss": 3.138,
776
+ "step": 2025
777
+ },
778
+ {
779
+ "epoch": 2.628205128205128,
780
+ "grad_norm": 5.183081150054932,
781
+ "learning_rate": 6.9800569800569804e-06,
782
+ "loss": 3.0988,
783
+ "step": 2050
784
+ },
785
+ {
786
+ "epoch": 2.66025641025641,
787
+ "grad_norm": 5.423998832702637,
788
+ "learning_rate": 6.386514719848054e-06,
789
+ "loss": 3.1566,
790
+ "step": 2075
791
+ },
792
+ {
793
+ "epoch": 2.6923076923076925,
794
+ "grad_norm": 5.148243427276611,
795
+ "learning_rate": 5.792972459639127e-06,
796
+ "loss": 3.0998,
797
+ "step": 2100
798
+ },
799
+ {
800
+ "epoch": 2.6923076923076925,
801
+ "eval_loss": 1.8170723915100098,
802
+ "eval_runtime": 730.5921,
803
+ "eval_samples_per_second": 3.834,
804
+ "eval_steps_per_second": 0.06,
805
+ "eval_wer": 129.82743418566568,
806
+ "eval_wer_ortho": 130.33549244311575,
807
+ "step": 2100
808
  }
809
  ],
810
  "logging_steps": 25,
 
824
  "attributes": {}
825
  }
826
  },
827
+ "total_flos": 8.71536740401152e+18,
828
  "train_batch_size": 64,
829
  "trial_name": null,
830
  "trial_params": null