sandernotenbaert commited on
Commit
b600755
·
verified ·
1 Parent(s): 229ddf6

Training in progress, step 8000, checkpoint

Browse files
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3dc088dc7806d076db4af87fcb16f32f2f4264c49cbcac76f4cd8fba66849b21
3
  size 30214176
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:21620fd84655c4db896f34197f325633f31514594547ffd7f9568f54bdaa66d4
3
  size 30214176
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:003ec6e37af7d32937d3f1e82568738b7f475a4953701c29695e87d37bc4fb0a
3
  size 291962
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6f3eed10629fabf788491c524b6122d0728f36d0d0d91bd828d85edbb66a60e4
3
  size 291962
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:457f1b145880ffefa4ea85b3e7a404600f4cba68a993abb9fd8332c3b47d64e5
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:080ccb46d322e83cec7b5164cc9a9cfad2dd21bf055cdfb1cf5e9ed68adf2f38
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ae69b2b9c59be93f7a4a7ddc203457ae939a2e00629604613f9975492d82daa9
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:49b6ff79bc8fa80bd69ca075842b5f5ae497b21ebbcd9737cb146fba40b9d7d8
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b0ac391f4dafa2480a707714482d63d0a94b4181ff6c8b0c91815f49c7797b53
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b21570681f00b76e8eef45e6f4bee892eb4f5cd6f6499a8d0d1225429aab8516
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": 7500,
3
  "best_metric": 1.5381077527999878,
4
  "best_model_checkpoint": "./results/hierarchical_music_t5_small_finetune/checkpoint-7500",
5
- "epoch": 3.339724502574092,
6
  "eval_steps": 500,
7
- "global_step": 7500,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -1178,6 +1178,84 @@
1178
  "eval_samples_per_second": 363.652,
1179
  "eval_steps_per_second": 45.471,
1180
  "step": 7500
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1181
  }
1182
  ],
1183
  "logging_steps": 50,
@@ -1192,7 +1270,7 @@
1192
  "early_stopping_threshold": 0.0
1193
  },
1194
  "attributes": {
1195
- "early_stopping_patience_counter": 0
1196
  }
1197
  },
1198
  "TrainerControl": {
@@ -1206,7 +1284,7 @@
1206
  "attributes": {}
1207
  }
1208
  },
1209
- "total_flos": 2.936391820718899e+16,
1210
  "train_batch_size": 4,
1211
  "trial_name": null,
1212
  "trial_params": null
 
2
  "best_global_step": 7500,
3
  "best_metric": 1.5381077527999878,
4
  "best_model_checkpoint": "./results/hierarchical_music_t5_small_finetune/checkpoint-7500",
5
+ "epoch": 3.561903436760818,
6
  "eval_steps": 500,
7
+ "global_step": 8000,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
1178
  "eval_samples_per_second": 363.652,
1179
  "eval_steps_per_second": 45.471,
1180
  "step": 7500
1181
+ },
1182
+ {
1183
+ "epoch": 3.3615416724641713,
1184
+ "grad_norm": 1.4630149602890015,
1185
+ "learning_rate": 5e-05,
1186
+ "loss": 1.6543,
1187
+ "step": 7550
1188
+ },
1189
+ {
1190
+ "epoch": 3.3838040907193543,
1191
+ "grad_norm": 0.9978652596473694,
1192
+ "learning_rate": 5e-05,
1193
+ "loss": 1.6469,
1194
+ "step": 7600
1195
+ },
1196
+ {
1197
+ "epoch": 3.406066508974537,
1198
+ "grad_norm": 0.9942854046821594,
1199
+ "learning_rate": 5e-05,
1200
+ "loss": 1.6524,
1201
+ "step": 7650
1202
+ },
1203
+ {
1204
+ "epoch": 3.42832892722972,
1205
+ "grad_norm": 1.6113872528076172,
1206
+ "learning_rate": 5e-05,
1207
+ "loss": 1.6392,
1208
+ "step": 7700
1209
+ },
1210
+ {
1211
+ "epoch": 3.450591345484903,
1212
+ "grad_norm": 1.2430763244628906,
1213
+ "learning_rate": 5e-05,
1214
+ "loss": 1.6524,
1215
+ "step": 7750
1216
+ },
1217
+ {
1218
+ "epoch": 3.472853763740086,
1219
+ "grad_norm": 0.9973090887069702,
1220
+ "learning_rate": 5e-05,
1221
+ "loss": 1.6396,
1222
+ "step": 7800
1223
+ },
1224
+ {
1225
+ "epoch": 3.4951161819952694,
1226
+ "grad_norm": 1.3717776536941528,
1227
+ "learning_rate": 5e-05,
1228
+ "loss": 1.6463,
1229
+ "step": 7850
1230
+ },
1231
+ {
1232
+ "epoch": 3.5173786002504523,
1233
+ "grad_norm": 1.3711599111557007,
1234
+ "learning_rate": 5e-05,
1235
+ "loss": 1.644,
1236
+ "step": 7900
1237
+ },
1238
+ {
1239
+ "epoch": 3.5396410185056353,
1240
+ "grad_norm": 1.0126900672912598,
1241
+ "learning_rate": 5e-05,
1242
+ "loss": 1.6311,
1243
+ "step": 7950
1244
+ },
1245
+ {
1246
+ "epoch": 3.561903436760818,
1247
+ "grad_norm": 1.0467159748077393,
1248
+ "learning_rate": 5e-05,
1249
+ "loss": 1.64,
1250
+ "step": 8000
1251
+ },
1252
+ {
1253
+ "epoch": 3.561903436760818,
1254
+ "eval_loss": 1.539516806602478,
1255
+ "eval_runtime": 42.3362,
1256
+ "eval_samples_per_second": 377.242,
1257
+ "eval_steps_per_second": 47.17,
1258
+ "step": 8000
1259
  }
1260
  ],
1261
  "logging_steps": 50,
 
1270
  "early_stopping_threshold": 0.0
1271
  },
1272
  "attributes": {
1273
+ "early_stopping_patience_counter": 1
1274
  }
1275
  },
1276
  "TrainerControl": {
 
1284
  "attributes": {}
1285
  }
1286
  },
1287
+ "total_flos": 2.984631313202381e+16,
1288
  "train_batch_size": 4,
1289
  "trial_name": null,
1290
  "trial_params": null
last-checkpoint/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:98bf107852bd8fb9f94e9f610ccce3445faf6710de67a8a094330338e1efd116
3
  size 5624
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:53d05e7b884c3329c7231564fbcc24e8e12ef445dff72282ffbf7a4bf4c375f3
3
  size 5624