Training in progress, step 4500, checkpoint
Browse files
- last-checkpoint/optimizer.pt +1 -1
- last-checkpoint/pytorch_model-00001-of-00003.bin +1 -1
- last-checkpoint/pytorch_model-00002-of-00003.bin +1 -1
- last-checkpoint/pytorch_model-00003-of-00003.bin +1 -1
- last-checkpoint/rng_state.pth +1 -1
- last-checkpoint/scheduler.pt +1 -1
- last-checkpoint/trainer_state.json +20 -3
last-checkpoint/optimizer.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 6710771584
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ffe7afe5c070fab96ca43ba7d40ffa5a5697d168401423ad6c0ad6e75a43f93b
|
3 |
size 6710771584
|
last-checkpoint/pytorch_model-00001-of-00003.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4986145435
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:34683cb4007c3b92110f7840142f7ce353dc35fa8c47d3906f2a8292351af604
|
3 |
size 4986145435
|
last-checkpoint/pytorch_model-00002-of-00003.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4985796040
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7892cbbcf16ff8490e2d0a329d8594e2218d984e8584083ac3da0573e6d508dd
|
3 |
size 4985796040
|
last-checkpoint/pytorch_model-00003-of-00003.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 3407874846
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4e4147dc29ced8cfe98d7c7047558106240377827105c3d76a5ee8d8e17d7754
|
3 |
size 3407874846
|
last-checkpoint/rng_state.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 14244
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e4fbdd49ae32378de0eb7b581f65e4edbef5eb7583e3157a829c62678554ea54
|
3 |
size 14244
|
last-checkpoint/scheduler.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1064
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:47132a874ad4fda1d1f651cb8d7cf3a21ccb1e85b7d1f0c122a2dcf69a4af0ac
|
3 |
size 1064
|
last-checkpoint/trainer_state.json
CHANGED
@@ -1,9 +1,9 @@
|
|
1 |
{
|
2 |
"best_metric": 1.1881097555160522,
|
3 |
"best_model_checkpoint": "../facebook/nllb-200-3.3B-finetuned/checkpoint-1000",
|
4 |
-
"epoch": 4000.0,
|
5 |
"eval_steps": 500,
|
6 |
-
"global_step": 4000,
|
7 |
"is_hyper_param_search": false,
|
8 |
"is_local_process_zero": true,
|
9 |
"is_world_process_zero": true,
|
@@ -143,6 +143,23 @@
|
|
143 |
"eval_samples_per_second": 0.288,
|
144 |
"eval_steps_per_second": 0.144,
|
145 |
"step": 4000
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
146 |
}
|
147 |
],
|
148 |
"logging_steps": 500,
|
@@ -150,7 +167,7 @@
|
|
150 |
"num_input_tokens_seen": 0,
|
151 |
"num_train_epochs": 5000,
|
152 |
"save_steps": 500,
|
153 |
-
"total_flos": 2.
|
154 |
"train_batch_size": 8,
|
155 |
"trial_name": null,
|
156 |
"trial_params": null
|
|
|
1 |
{
|
2 |
"best_metric": 1.1881097555160522,
|
3 |
"best_model_checkpoint": "../facebook/nllb-200-3.3B-finetuned/checkpoint-1000",
|
4 |
+
"epoch": 4500.0,
|
5 |
"eval_steps": 500,
|
6 |
+
"global_step": 4500,
|
7 |
"is_hyper_param_search": false,
|
8 |
"is_local_process_zero": true,
|
9 |
"is_world_process_zero": true,
|
|
|
143 |
"eval_samples_per_second": 0.288,
|
144 |
"eval_steps_per_second": 0.144,
|
145 |
"step": 4000
|
146 |
+
},
|
147 |
+
{
|
148 |
+
"epoch": 4500.0,
|
149 |
+
"grad_norm": 0.029812365770339966,
|
150 |
+
"learning_rate": 2.4763828125157654e-07,
|
151 |
+
"loss": 0.0016,
|
152 |
+
"step": 4500
|
153 |
+
},
|
154 |
+
{
|
155 |
+
"epoch": 4500.0,
|
156 |
+
"eval_gen_len": 24.5,
|
157 |
+
"eval_loss": 1.4486483335494995,
|
158 |
+
"eval_rouge": 0.0357,
|
159 |
+
"eval_runtime": 6.9642,
|
160 |
+
"eval_samples_per_second": 0.287,
|
161 |
+
"eval_steps_per_second": 0.144,
|
162 |
+
"step": 4500
|
163 |
}
|
164 |
],
|
165 |
"logging_steps": 500,
|
|
|
167 |
"num_input_tokens_seen": 0,
|
168 |
"num_train_epochs": 5000,
|
169 |
"save_steps": 500,
|
170 |
+
"total_flos": 2.8630196748288e+16,
|
171 |
"train_batch_size": 8,
|
172 |
"trial_name": null,
|
173 |
"trial_params": null
|