sandernotenbaert committed on
Commit
9cf370a
·
verified ·
1 Parent(s): a5ed0c4

Training in progress, step 11000, checkpoint

Browse files
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:860eca3961053936b241a5a2d4fa22d5d55c591199aaa9b78de4fdc667354710
3
  size 30214176
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fdb6e98797334d8dad686390c3a871babad8123963611e212956f6662bc5a8e1
3
  size 30214176
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0908b4e68e646f4581a0026b2c4fa54184efb4bcbd7553998a1c4a4c12cd731e
3
  size 291962
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e49f34f35179e3613b976ab84b875c3b7727044e3d2f20224c5caf29eec11c3a
3
  size 291962
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:79f81c651a86e496a8a0683bb40cfa7b5abd415344f225e4b6cf5b7f3bf0d148
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f0e87d0594583c91449bed8c9b57cd31ad9ac1a2ab308d4940cbd5e7a3fa296b
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d094517def3bab9b1b376a801fd8dd8681180f5ccdb5bd9fd6776c1cd25c2968
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4d966dee3ea83ae9edc170643edbeead55aecfa7f6d46f849824e98b9ee7cee7
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cd17e6a2456b591e82434cf85c6c3687643ac9b76a0a0c080b341aa852e38872
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:18a6e60ee80e57778e5fd78a1d8c91d6a0cd4ce7b1800f1645350ad02d55ca76
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,10 +1,10 @@
1
  {
2
- "best_global_step": 10000,
3
- "best_metric": 1.5091972351074219,
4
- "best_model_checkpoint": "./results/hierarchical_music_t5_small_finetune/checkpoint-10000",
5
- "epoch": 4.6754417698622515,
6
  "eval_steps": 500,
7
- "global_step": 10500,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -1646,6 +1646,84 @@
1646
  "eval_samples_per_second": 394.461,
1647
  "eval_steps_per_second": 49.323,
1648
  "step": 10500
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1649
  }
1650
  ],
1651
  "logging_steps": 50,
@@ -1660,7 +1738,7 @@
1660
  "early_stopping_threshold": 0.0
1661
  },
1662
  "attributes": {
1663
- "early_stopping_patience_counter": 1
1664
  }
1665
  },
1666
  "TrainerControl": {
@@ -1674,7 +1752,7 @@
1674
  "attributes": {}
1675
  }
1676
  },
1677
- "total_flos": 4.37287432012032e+16,
1678
  "train_batch_size": 4,
1679
  "trial_name": null,
1680
  "trial_params": null
 
1
  {
2
+ "best_global_step": 11000,
3
+ "best_metric": 1.5041238069534302,
4
+ "best_model_checkpoint": "./results/hierarchical_music_t5_small_finetune/checkpoint-11000",
5
+ "epoch": 4.898065952414081,
6
  "eval_steps": 500,
7
+ "global_step": 11000,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
1646
  "eval_samples_per_second": 394.461,
1647
  "eval_steps_per_second": 49.323,
1648
  "step": 10500
1649
+ },
1650
+ {
1651
+ "epoch": 4.697704188117434,
1652
+ "grad_norm": 1.236370325088501,
1653
+ "learning_rate": 5e-05,
1654
+ "loss": 1.5426,
1655
+ "step": 10550
1656
+ },
1657
+ {
1658
+ "epoch": 4.719966606372617,
1659
+ "grad_norm": 1.1259009838104248,
1660
+ "learning_rate": 5e-05,
1661
+ "loss": 1.5701,
1662
+ "step": 10600
1663
+ },
1664
+ {
1665
+ "epoch": 4.7422290246278,
1666
+ "grad_norm": 1.0653769969940186,
1667
+ "learning_rate": 5e-05,
1668
+ "loss": 1.5543,
1669
+ "step": 10650
1670
+ },
1671
+ {
1672
+ "epoch": 4.764491442882983,
1673
+ "grad_norm": 1.1116371154785156,
1674
+ "learning_rate": 5e-05,
1675
+ "loss": 1.557,
1676
+ "step": 10700
1677
+ },
1678
+ {
1679
+ "epoch": 4.786753861138166,
1680
+ "grad_norm": 1.0332480669021606,
1681
+ "learning_rate": 5e-05,
1682
+ "loss": 1.5513,
1683
+ "step": 10750
1684
+ },
1685
+ {
1686
+ "epoch": 4.809016279393349,
1687
+ "grad_norm": 1.1142674684524536,
1688
+ "learning_rate": 5e-05,
1689
+ "loss": 1.5448,
1690
+ "step": 10800
1691
+ },
1692
+ {
1693
+ "epoch": 4.831278697648532,
1694
+ "grad_norm": 1.0316691398620605,
1695
+ "learning_rate": 5e-05,
1696
+ "loss": 1.5456,
1697
+ "step": 10850
1698
+ },
1699
+ {
1700
+ "epoch": 4.853541115903715,
1701
+ "grad_norm": 0.987628161907196,
1702
+ "learning_rate": 5e-05,
1703
+ "loss": 1.5535,
1704
+ "step": 10900
1705
+ },
1706
+ {
1707
+ "epoch": 4.875803534158898,
1708
+ "grad_norm": 1.125772476196289,
1709
+ "learning_rate": 5e-05,
1710
+ "loss": 1.5583,
1711
+ "step": 10950
1712
+ },
1713
+ {
1714
+ "epoch": 4.898065952414081,
1715
+ "grad_norm": 0.9541718363761902,
1716
+ "learning_rate": 5e-05,
1717
+ "loss": 1.5584,
1718
+ "step": 11000
1719
+ },
1720
+ {
1721
+ "epoch": 4.898065952414081,
1722
+ "eval_loss": 1.5041238069534302,
1723
+ "eval_runtime": 40.2547,
1724
+ "eval_samples_per_second": 396.749,
1725
+ "eval_steps_per_second": 49.609,
1726
+ "step": 11000
1727
  }
1728
  ],
1729
  "logging_steps": 50,
 
1738
  "early_stopping_threshold": 0.0
1739
  },
1740
  "attributes": {
1741
+ "early_stopping_patience_counter": 0
1742
  }
1743
  },
1744
  "TrainerControl": {
 
1752
  "attributes": {}
1753
  }
1754
  },
1755
+ "total_flos": 4.530938070076723e+16,
1756
  "train_batch_size": 4,
1757
  "trial_name": null,
1758
  "trial_params": null