sandernotenbaert commited on
Commit
98ae865
·
verified ·
1 Parent(s): 15d4b40

Training in progress, step 6500, checkpoint

Browse files
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e0ba7be4e1197b6ebae5a1fb0d6ae29bbafd16d90726437a2da8408d73641f03
3
  size 30214176
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:66f0bf969e7c4f10819387c514099288befb4d6a92b18fedb97919efb7838146
3
  size 30214176
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2bebcf4136f2e6e53dd975d0ec5899e311738161c26efd5f1866b8fbda4dd14d
3
  size 291962
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:50326021a12350d0fd340fb39b69dcb99c4d9d7625607f1ea78848e8533735ef
3
  size 291962
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:788c6b064d884311e214b6335a80e7fe5e75085f966367611657f1664cf160c2
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2aba6f3b60d25e9d80bfa48704513608d3c51338a99fc68164f2cda5539a2e88
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:09a2836138899bf244344610cf1cfa7f6c9e6417ce66d8196cf2ef6125f38e4e
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0b18b3eda07668461b2815107443aa6a6c68056a4e1c0be8b74117cc02ff9391
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e81fbcc85fe8453ce60c9a14a7fd7bb3512bae9747d397407e0552c8567a7c1e
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2167d86470a0af7e2c7e124cb3b9e089d70c4424875cd5dabb7a3f9dabe21d16
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,10 +1,10 @@
1
  {
2
- "best_global_step": 4500,
3
- "best_metric": 1.5784235000610352,
4
- "best_model_checkpoint": "./results/hierarchical_music_t5_small_finetune/checkpoint-4500",
5
- "epoch": 2.6714345345763184,
6
  "eval_steps": 500,
7
- "global_step": 6000,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -944,6 +944,84 @@
944
  "eval_samples_per_second": 389.821,
945
  "eval_steps_per_second": 48.743,
946
  "step": 6000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
947
  }
948
  ],
949
  "logging_steps": 50,
@@ -958,7 +1036,7 @@
958
  "early_stopping_threshold": 0.0
959
  },
960
  "attributes": {
961
- "early_stopping_patience_counter": 3
962
  }
963
  },
964
  "TrainerControl": {
@@ -967,12 +1045,12 @@
967
  "should_evaluate": false,
968
  "should_log": false,
969
  "should_save": true,
970
- "should_training_stop": true
971
  },
972
  "attributes": {}
973
  }
974
  },
975
- "total_flos": 2.7676743726557184e+16,
976
  "train_batch_size": 4,
977
  "trial_name": null,
978
  "trial_params": null
 
1
  {
2
+ "best_global_step": 6500,
3
+ "best_metric": 1.5628445148468018,
4
+ "best_model_checkpoint": "./results/hierarchical_music_t5_small_finetune/checkpoint-6500",
5
+ "epoch": 2.894058717128148,
6
  "eval_steps": 500,
7
+ "global_step": 6500,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
944
  "eval_samples_per_second": 389.821,
945
  "eval_steps_per_second": 48.743,
946
  "step": 6000
947
+ },
948
+ {
949
+ "epoch": 2.6936969528315013,
950
+ "grad_norm": 1.070421814918518,
951
+ "learning_rate": 5e-05,
952
+ "loss": 1.6947,
953
+ "step": 6050
954
+ },
955
+ {
956
+ "epoch": 2.7159593710866843,
957
+ "grad_norm": 0.9952645301818848,
958
+ "learning_rate": 5e-05,
959
+ "loss": 1.6907,
960
+ "step": 6100
961
+ },
962
+ {
963
+ "epoch": 2.738221789341867,
964
+ "grad_norm": 1.2595455646514893,
965
+ "learning_rate": 5e-05,
966
+ "loss": 1.6954,
967
+ "step": 6150
968
+ },
969
+ {
970
+ "epoch": 2.76048420759705,
971
+ "grad_norm": 0.9722006916999817,
972
+ "learning_rate": 5e-05,
973
+ "loss": 1.6832,
974
+ "step": 6200
975
+ },
976
+ {
977
+ "epoch": 2.782746625852233,
978
+ "grad_norm": 1.2001519203186035,
979
+ "learning_rate": 5e-05,
980
+ "loss": 1.6832,
981
+ "step": 6250
982
+ },
983
+ {
984
+ "epoch": 2.805009044107416,
985
+ "grad_norm": 1.316867709159851,
986
+ "learning_rate": 5e-05,
987
+ "loss": 1.6873,
988
+ "step": 6300
989
+ },
990
+ {
991
+ "epoch": 2.8272714623625994,
992
+ "grad_norm": 1.2271651029586792,
993
+ "learning_rate": 5e-05,
994
+ "loss": 1.6865,
995
+ "step": 6350
996
+ },
997
+ {
998
+ "epoch": 2.8495338806177823,
999
+ "grad_norm": 1.2443265914916992,
1000
+ "learning_rate": 5e-05,
1001
+ "loss": 1.6779,
1002
+ "step": 6400
1003
+ },
1004
+ {
1005
+ "epoch": 2.8717962988729653,
1006
+ "grad_norm": 1.1751494407653809,
1007
+ "learning_rate": 5e-05,
1008
+ "loss": 1.666,
1009
+ "step": 6450
1010
+ },
1011
+ {
1012
+ "epoch": 2.894058717128148,
1013
+ "grad_norm": 0.9704211950302124,
1014
+ "learning_rate": 5e-05,
1015
+ "loss": 1.6628,
1016
+ "step": 6500
1017
+ },
1018
+ {
1019
+ "epoch": 2.894058717128148,
1020
+ "eval_loss": 1.5628445148468018,
1021
+ "eval_runtime": 41.0455,
1022
+ "eval_samples_per_second": 389.105,
1023
+ "eval_steps_per_second": 48.653,
1024
+ "step": 6500
1025
  }
1026
  ],
1027
  "logging_steps": 50,
 
1036
  "early_stopping_threshold": 0.0
1037
  },
1038
  "attributes": {
1039
+ "early_stopping_patience_counter": 0
1040
  }
1041
  },
1042
  "TrainerControl": {
 
1045
  "should_evaluate": false,
1046
  "should_log": false,
1047
  "should_save": true,
1048
+ "should_training_stop": false
1049
  },
1050
  "attributes": {}
1051
  }
1052
  },
1053
+ "total_flos": 2.8160444868950016e+16,
1054
  "train_batch_size": 4,
1055
  "trial_name": null,
1056
  "trial_params": null
last-checkpoint/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:02aa50af5025c9f0ca029c8bf84c80140d605447e8fbdf2b3d4a1f55708551a3
3
  size 5624
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:98bf107852bd8fb9f94e9f610ccce3445faf6710de67a8a094330338e1efd116
3
  size 5624