KevinKibe commited on
Commit
e1b0c13
·
verified ·
1 Parent(s): 723b2af

Training in progress, step 5000, checkpoint

Browse files
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ffe7afe5c070fab96ca43ba7d40ffa5a5697d168401423ad6c0ad6e75a43f93b
3
  size 6710771584
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:82bc6140c804b5d3375fee96fc07573ed3f7f3bd1827010bfb2d2cba57c7527e
3
  size 6710771584
last-checkpoint/pytorch_model-00001-of-00003.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:34683cb4007c3b92110f7840142f7ce353dc35fa8c47d3906f2a8292351af604
3
  size 4986145435
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5a9e4393d35049ad958dc05a7893ce3d9fc4b21c4800a5cb9d0632332aab1743
3
  size 4986145435
last-checkpoint/pytorch_model-00002-of-00003.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7892cbbcf16ff8490e2d0a329d8594e2218d984e8584083ac3da0573e6d508dd
3
  size 4985796040
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5d05fe05ad2b03594c78064a4e20af41c072f2551802c62e8cc765ab2658740c
3
  size 4985796040
last-checkpoint/pytorch_model-00003-of-00003.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4e4147dc29ced8cfe98d7c7047558106240377827105c3d76a5ee8d8e17d7754
3
  size 3407874846
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5627e77582102da559297a40c571e3fd53fef55c7f74cf114eb83aca4b1518ce
3
  size 3407874846
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e4fbdd49ae32378de0eb7b581f65e4edbef5eb7583e3157a829c62678554ea54
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c50f902d46e1503d63201e520cf2d2a219286c093050136afe0283b841bb99b9
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:47132a874ad4fda1d1f651cb8d7cf3a21ccb1e85b7d1f0c122a2dcf69a4af0ac
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2a9b177af396170d7a7558a5fee9e05fa92b1c1bfde5ab937b9c9b2a05a9e953
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": 1.1881097555160522,
3
  "best_model_checkpoint": "../facebook/nllb-200-3.3B-finetuned/checkpoint-1000",
4
- "epoch": 4500.0,
5
  "eval_steps": 500,
6
- "global_step": 4500,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -160,6 +160,23 @@
160
  "eval_samples_per_second": 0.287,
161
  "eval_steps_per_second": 0.144,
162
  "step": 4500
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
163
  }
164
  ],
165
  "logging_steps": 500,
@@ -167,7 +184,7 @@
167
  "num_input_tokens_seen": 0,
168
  "num_train_epochs": 5000,
169
  "save_steps": 500,
170
- "total_flos": 2.8630196748288e+16,
171
  "train_batch_size": 8,
172
  "trial_name": null,
173
  "trial_params": null
 
1
  {
2
  "best_metric": 1.1881097555160522,
3
  "best_model_checkpoint": "../facebook/nllb-200-3.3B-finetuned/checkpoint-1000",
4
+ "epoch": 5000.0,
5
  "eval_steps": 500,
6
+ "global_step": 5000,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
160
  "eval_samples_per_second": 0.287,
161
  "eval_steps_per_second": 0.144,
162
  "step": 4500
163
+ },
164
+ {
165
+ "epoch": 5000.0,
166
+ "grad_norm": 0.029535507783293724,
167
+ "learning_rate": 8.882641330809627e-12,
168
+ "loss": 0.0016,
169
+ "step": 5000
170
+ },
171
+ {
172
+ "epoch": 5000.0,
173
+ "eval_gen_len": 24.5,
174
+ "eval_loss": 1.4524964094161987,
175
+ "eval_rouge": 0.0357,
176
+ "eval_runtime": 6.9555,
177
+ "eval_samples_per_second": 0.288,
178
+ "eval_steps_per_second": 0.144,
179
+ "step": 5000
180
  }
181
  ],
182
  "logging_steps": 500,
 
184
  "num_input_tokens_seen": 0,
185
  "num_train_epochs": 5000,
186
  "save_steps": 500,
187
+ "total_flos": 3.181132972032e+16,
188
  "train_batch_size": 8,
189
  "trial_name": null,
190
  "trial_params": null