RoyJoy committed on
Commit
118420b
·
verified ·
1 Parent(s): 055277b

Training in progress, step 113, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7e2d5ccac9eb6537d0304c1d9a2664be207cec54a4ffa4f7a1d25f97df0299e7
3
  size 80013120
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:71ce0257c9975c8426eef5147f2e169f64e3821e067cd5cc5585cb8ea22f2fb1
3
  size 80013120
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4fc6ccd88e5c6b445ddb81486e1b8bb3250cd0ab8d1994a6c77c83f6e34745a6
3
  size 41119636
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8719fa79196e95545a788eed7d70f8cb9e00107d9e8d023232dd7e884b1d981b
3
  size 41119636
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a57a79985839c1144630cf23e24a752af1717970babccc404e738d94f6a44f55
3
  size 14960
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:00a877456c8253f043f7051f702060848b6888186d2898c19f50e380e8298427
3
  size 14960
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f78f02857b552b73e80fba53ae03b2fe594f4ff8718b2b7a00f9874950315d8f
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5762c92d924de856e23a69c148ad73656ab908a794479dfbc9eed45e0ea6ce92
3
  size 15024
last-checkpoint/rng_state_2.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:61d763d8dd1b3cf0dec042ca7fcbae7698d20d5c131f3d0f4d2e0fa72962640d
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cfd09b43468bc3c26380f195d7cdbd487a3947aa9fd9338df244051f1d3913d5
3
  size 15024
last-checkpoint/rng_state_3.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:553a6b90849b840223e58a50b84e206a3b835868d03a26f2274252e82e65b480
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f7bec2ec173378a661c585fde43bd276e5b164ea48e7c4439f47a4d480e85f66
3
  size 15024
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3a7a33c3c310055cbe2d20c9c9ebccba7f04bc435d5cf767eccc98d4867335d2
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8f8fe79dd2d524c3a47ebbac1a1fc359d4473e07185866008e654d72a772ea4f
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.7733333333333333,
5
  "eval_steps": 29,
6
- "global_step": 87,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -158,6 +158,41 @@
158
  "eval_samples_per_second": 38.56,
159
  "eval_steps_per_second": 4.871,
160
  "step": 87
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
161
  }
162
  ],
163
  "logging_steps": 5,
@@ -172,12 +207,12 @@
172
  "should_evaluate": false,
173
  "should_log": false,
174
  "should_save": true,
175
- "should_training_stop": false
176
  },
177
  "attributes": {}
178
  }
179
  },
180
- "total_flos": 1.78283317752234e+17,
181
  "train_batch_size": 2,
182
  "trial_name": null,
183
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 1.0044444444444445,
5
  "eval_steps": 29,
6
+ "global_step": 113,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
158
  "eval_samples_per_second": 38.56,
159
  "eval_steps_per_second": 4.871,
160
  "step": 87
161
+ },
162
+ {
163
+ "epoch": 0.8,
164
+ "grad_norm": 0.15183891355991364,
165
+ "learning_rate": 1.1806917592302762e-05,
166
+ "loss": 0.3296,
167
+ "step": 90
168
+ },
169
+ {
170
+ "epoch": 0.8444444444444444,
171
+ "grad_norm": 0.14968590438365936,
172
+ "learning_rate": 7.348083332917926e-06,
173
+ "loss": 0.3245,
174
+ "step": 95
175
+ },
176
+ {
177
+ "epoch": 0.8888888888888888,
178
+ "grad_norm": 0.16398116946220398,
179
+ "learning_rate": 3.879310116241042e-06,
180
+ "loss": 0.319,
181
+ "step": 100
182
+ },
183
+ {
184
+ "epoch": 0.9333333333333333,
185
+ "grad_norm": 0.14950266480445862,
186
+ "learning_rate": 1.4811171192794627e-06,
187
+ "loss": 0.3243,
188
+ "step": 105
189
+ },
190
+ {
191
+ "epoch": 0.9777777777777777,
192
+ "grad_norm": 0.15962573885917664,
193
+ "learning_rate": 2.0917258966953733e-07,
194
+ "loss": 0.3512,
195
+ "step": 110
196
  }
197
  ],
198
  "logging_steps": 5,
 
207
  "should_evaluate": false,
208
  "should_log": false,
209
  "should_save": true,
210
+ "should_training_stop": true
211
  },
212
  "attributes": {}
213
  }
214
  },
215
+ "total_flos": 2.3185047145362227e+17,
216
  "train_batch_size": 2,
217
  "trial_name": null,
218
  "trial_params": null