sandernotenbaert commited on
Commit
a76571e
·
verified ·
1 Parent(s): bd81e34

Training in progress, step 8500, checkpoint

Browse files
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:21620fd84655c4db896f34197f325633f31514594547ffd7f9568f54bdaa66d4
3
  size 30214176
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:78eeada532b08bdf3524032fcb0dd8742b5cbe44f304c2f845a2ec8ac351c803
3
  size 30214176
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6f3eed10629fabf788491c524b6122d0728f36d0d0d91bd828d85edbb66a60e4
3
  size 291962
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:48ec7b29adac8f13e97e8d0b0016dbfde03e9643c7d13a43fc298e30253e5845
3
  size 291962
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:080ccb46d322e83cec7b5164cc9a9cfad2dd21bf055cdfb1cf5e9ed68adf2f38
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:54fde25c1257c410542439f7b30010e731a773e09e44bce8d654fd46bb13b1b3
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:49b6ff79bc8fa80bd69ca075842b5f5ae497b21ebbcd9737cb146fba40b9d7d8
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:68029c1a6b8f58f4897cc068068a39570420fb36c1353d8dd13c010a143f2a88
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b21570681f00b76e8eef45e6f4bee892eb4f5cd6f6499a8d0d1225429aab8516
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b5043baea5bed98a56ee64b89f4809a10402dd6a6764f855e2bb19bcd7ba63c7
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,10 +1,10 @@
1
  {
2
- "best_global_step": 7500,
3
- "best_metric": 1.5381077527999878,
4
- "best_model_checkpoint": "./results/hierarchical_music_t5_small_finetune/checkpoint-7500",
5
- "epoch": 3.561903436760818,
6
  "eval_steps": 500,
7
- "global_step": 8000,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -1256,6 +1256,84 @@
1256
  "eval_samples_per_second": 377.242,
1257
  "eval_steps_per_second": 47.17,
1258
  "step": 8000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1259
  }
1260
  ],
1261
  "logging_steps": 50,
@@ -1270,7 +1348,7 @@
1270
  "early_stopping_threshold": 0.0
1271
  },
1272
  "attributes": {
1273
- "early_stopping_patience_counter": 1
1274
  }
1275
  },
1276
  "TrainerControl": {
@@ -1284,7 +1362,7 @@
1284
  "attributes": {}
1285
  }
1286
  },
1287
- "total_flos": 2.984631313202381e+16,
1288
  "train_batch_size": 4,
1289
  "trial_name": null,
1290
  "trial_params": null
 
1
  {
2
+ "best_global_step": 8500,
3
+ "best_metric": 1.516330361366272,
4
+ "best_model_checkpoint": "./results/hierarchical_music_t5_small_finetune/checkpoint-8500",
5
+ "epoch": 3.784527619312648,
6
  "eval_steps": 500,
7
+ "global_step": 8500,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
1256
  "eval_samples_per_second": 377.242,
1257
  "eval_steps_per_second": 47.17,
1258
  "step": 8000
1259
+ },
1260
+ {
1261
+ "epoch": 3.584165855016001,
1262
+ "grad_norm": 1.1766951084136963,
1263
+ "learning_rate": 5e-05,
1264
+ "loss": 1.6552,
1265
+ "step": 8050
1266
+ },
1267
+ {
1268
+ "epoch": 3.606428273271184,
1269
+ "grad_norm": 1.0943933725357056,
1270
+ "learning_rate": 5e-05,
1271
+ "loss": 1.6385,
1272
+ "step": 8100
1273
+ },
1274
+ {
1275
+ "epoch": 3.628690691526367,
1276
+ "grad_norm": 1.2377898693084717,
1277
+ "learning_rate": 5e-05,
1278
+ "loss": 1.6288,
1279
+ "step": 8150
1280
+ },
1281
+ {
1282
+ "epoch": 3.65095310978155,
1283
+ "grad_norm": 0.939339280128479,
1284
+ "learning_rate": 5e-05,
1285
+ "loss": 1.6357,
1286
+ "step": 8200
1287
+ },
1288
+ {
1289
+ "epoch": 3.673215528036733,
1290
+ "grad_norm": 1.0802948474884033,
1291
+ "learning_rate": 5e-05,
1292
+ "loss": 1.6367,
1293
+ "step": 8250
1294
+ },
1295
+ {
1296
+ "epoch": 3.695477946291916,
1297
+ "grad_norm": 1.089154601097107,
1298
+ "learning_rate": 5e-05,
1299
+ "loss": 1.6434,
1300
+ "step": 8300
1301
+ },
1302
+ {
1303
+ "epoch": 3.7177403645470988,
1304
+ "grad_norm": 1.095510482788086,
1305
+ "learning_rate": 5e-05,
1306
+ "loss": 1.6445,
1307
+ "step": 8350
1308
+ },
1309
+ {
1310
+ "epoch": 3.740002782802282,
1311
+ "grad_norm": 1.2433582544326782,
1312
+ "learning_rate": 5e-05,
1313
+ "loss": 1.6521,
1314
+ "step": 8400
1315
+ },
1316
+ {
1317
+ "epoch": 3.762265201057465,
1318
+ "grad_norm": 1.3547347784042358,
1319
+ "learning_rate": 5e-05,
1320
+ "loss": 1.6363,
1321
+ "step": 8450
1322
+ },
1323
+ {
1324
+ "epoch": 3.784527619312648,
1325
+ "grad_norm": 1.224070429801941,
1326
+ "learning_rate": 5e-05,
1327
+ "loss": 1.6455,
1328
+ "step": 8500
1329
+ },
1330
+ {
1331
+ "epoch": 3.784527619312648,
1332
+ "eval_loss": 1.516330361366272,
1333
+ "eval_runtime": 40.388,
1334
+ "eval_samples_per_second": 395.439,
1335
+ "eval_steps_per_second": 49.445,
1336
+ "step": 8500
1337
  }
1338
  ],
1339
  "logging_steps": 50,
 
1348
  "early_stopping_threshold": 0.0
1349
  },
1350
  "attributes": {
1351
+ "early_stopping_patience_counter": 0
1352
  }
1353
  },
1354
  "TrainerControl": {
 
1362
  "attributes": {}
1363
  }
1364
  },
1365
+ "total_flos": 3.033090820902912e+16,
1366
  "train_batch_size": 4,
1367
  "trial_name": null,
1368
  "trial_params": null
last-checkpoint/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:53d05e7b884c3329c7231564fbcc24e8e12ef445dff72282ffbf7a4bf4c375f3
3
  size 5624
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:241913eb458c3cd7f38f1105f1ffa37291ed4c7e03a3c94d3d6822f55195b546
3
  size 5624