kinleyrabgay committed on
Commit
07f3c11
·
verified ·
1 Parent(s): 5969b4c

Training in progress, epoch 5, checkpoint

Browse files
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:06df666b6e9b9daf5f491d47584000ef0f15c0ff91d9d43b452f6608165d2c17
3
  size 2460354912
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fab85460a1b4afe5235adf29b80d60cc190779373e90f98a65f4d03b9ab2763e
3
  size 2460354912
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4e6f9f13f431d32355177f53dd768a76f75650f7a6e4ff3e746b73da59d4b3b1
3
  size 4921023445
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:efb3e71bd2169d1bee8c01a9ac4b53b09649a9e69287d3ec66340315dc828cd0
3
  size 4921023445
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2f213695afd639b31c091f8223418438a325ee03e1cc0db68e855dfc04f16a3c
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7f19a3c3d19ca62769269406caae709c1ade6af65b39ab8ea8cb5c868d8c6022
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0262aa68bebe82c90fa7f7f9955996a9e0ad8e1b35acbc7f8a4355aa7d949b83
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:86b6dcc7abbb19b3c426b916efb5f17e7204c57a28b1c5bdc0e214cf16444280
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3d31e1b87deb184c3fb7779fff023bc406d60a7176c80663ef83e1b93f1aa152
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b6bdc06fd50950c7d5950384b8985848c0c078212370cd8410d5b1ea7f24947e
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,10 +1,10 @@
1
  {
2
- "best_global_step": 1000,
3
- "best_metric": 63.06198866502594,
4
- "best_model_checkpoint": "nllb-600m-dz-en-checkpoints/checkpoint-1000",
5
- "epoch": 4.0,
6
  "eval_steps": 500,
7
- "global_step": 1000,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -58,6 +58,15 @@
58
  "eval_samples_per_second": 4.962,
59
  "eval_steps_per_second": 1.241,
60
  "step": 1000
 
 
 
 
 
 
 
 
 
61
  }
62
  ],
63
  "logging_steps": 500,
@@ -72,12 +81,12 @@
72
  "should_evaluate": false,
73
  "should_log": false,
74
  "should_save": true,
75
- "should_training_stop": false
76
  },
77
  "attributes": {}
78
  }
79
  },
80
- "total_flos": 2167104602112000.0,
81
  "train_batch_size": 4,
82
  "trial_name": null,
83
  "trial_params": null
 
1
  {
2
+ "best_global_step": 1250,
3
+ "best_metric": 63.12399055783562,
4
+ "best_model_checkpoint": "nllb-600m-dz-en-checkpoints/checkpoint-1250",
5
+ "epoch": 5.0,
6
  "eval_steps": 500,
7
+ "global_step": 1250,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
58
  "eval_samples_per_second": 4.962,
59
  "eval_steps_per_second": 1.241,
60
  "step": 1000
61
+ },
62
+ {
63
+ "epoch": 5.0,
64
+ "eval_bleu": 63.12399055783562,
65
+ "eval_loss": 0.10181548446416855,
66
+ "eval_runtime": 111.015,
67
+ "eval_samples_per_second": 4.504,
68
+ "eval_steps_per_second": 1.126,
69
+ "step": 1250
70
  }
71
  ],
72
  "logging_steps": 500,
 
81
  "should_evaluate": false,
82
  "should_log": false,
83
  "should_save": true,
84
+ "should_training_stop": true
85
  },
86
  "attributes": {}
87
  }
88
  },
89
+ "total_flos": 2708880752640000.0,
90
  "train_batch_size": 4,
91
  "trial_name": null,
92
  "trial_params": null