ihanif commited on
Commit
21c203e
·
verified ·
1 Parent(s): 7971e59

Training in progress, step 400, checkpoint

Browse files
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7723d7c543d8111cde5b0d0c7d380625efc576826c33a65ac4f833b07aeb1078
3
  size 290403936
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2d5614aa1af231902d4d5e3d77f5f3651b101e42cb96721c66a4e36c221825bc
3
  size 290403936
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bd87fc16d56b734cfeee5cb96b5f81c2c149684d9649cfa36228e731375678b9
3
  size 574811514
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f7a91a83c5869579384befed17a65fdc01a4a1eeeb562808c9f16b986e7b270c
3
  size 574811514
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b1b89009b6eacb3b00e97174956b74b753d7bd2d21ca376db9636fe91a916011
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:71100c749c3d328813d845f0d31f26307650b3fddf848738bea5a69ec145f95d
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4c51e96bf39df0dcf05159321d889a0250569d665b8a5872f89010f1c91dbc52
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:79f86771e7e266279e59ca59b5466e514a509aded5e6a1886ec8e7d2af927a1c
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:94141d46d0db9b87a9f2673574f734412e500930d0c99d7e67d128e20b2e1714
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a2b3abdfc627eb6c58d7379b09121bd3c4b9730cfcbd091e8a4ca22eb117191b
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": 100,
3
  "best_metric": 22.84922534324222,
4
  "best_model_checkpoint": "whisper-base-synth-v2/checkpoint-100",
5
- "epoch": 0.9584664536741214,
6
  "eval_steps": 100,
7
- "global_step": 300,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -122,6 +122,44 @@
122
  "eval_wer": 93.44165931897385,
123
  "eval_wer_ortho": 96.17588440458395,
124
  "step": 300
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
125
  }
126
  ],
127
  "logging_steps": 25,
@@ -141,7 +179,7 @@
141
  "attributes": {}
142
  }
143
  },
144
- "total_flos": 1.245311926272e+18,
145
  "train_batch_size": 64,
146
  "trial_name": null,
147
  "trial_params": null
 
2
  "best_global_step": 100,
3
  "best_metric": 22.84922534324222,
4
  "best_model_checkpoint": "whisper-base-synth-v2/checkpoint-100",
5
+ "epoch": 1.2779552715654952,
6
  "eval_steps": 100,
7
+ "global_step": 400,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
122
  "eval_wer": 93.44165931897385,
123
  "eval_wer_ortho": 96.17588440458395,
124
  "step": 300
125
+ },
126
+ {
127
+ "epoch": 1.038338658146965,
128
+ "grad_norm": 3.464035749435425,
129
+ "learning_rate": 5.0958466453674125e-06,
130
+ "loss": 4.0785,
131
+ "step": 325
132
+ },
133
+ {
134
+ "epoch": 1.1182108626198084,
135
+ "grad_norm": 4.340151309967041,
136
+ "learning_rate": 5.49520766773163e-06,
137
+ "loss": 3.9435,
138
+ "step": 350
139
+ },
140
+ {
141
+ "epoch": 1.1980830670926517,
142
+ "grad_norm": 3.903965950012207,
143
+ "learning_rate": 5.894568690095847e-06,
144
+ "loss": 3.8291,
145
+ "step": 375
146
+ },
147
+ {
148
+ "epoch": 1.2779552715654952,
149
+ "grad_norm": 3.497990369796753,
150
+ "learning_rate": 6.2939297124600645e-06,
151
+ "loss": 3.7216,
152
+ "step": 400
153
+ },
154
+ {
155
+ "epoch": 1.2779552715654952,
156
+ "eval_loss": 1.0830340385437012,
157
+ "eval_runtime": 996.8493,
158
+ "eval_samples_per_second": 2.81,
159
+ "eval_steps_per_second": 0.044,
160
+ "eval_wer": 827.2872318092119,
161
+ "eval_wer_ortho": 818.5434313237004,
162
+ "step": 400
163
  }
164
  ],
165
  "logging_steps": 25,
 
179
  "attributes": {}
180
  }
181
  },
182
+ "total_flos": 1.65834038181888e+18,
183
  "train_batch_size": 64,
184
  "trial_name": null,
185
  "trial_params": null