reinhardh commited on
Commit
7e18dac
·
verified ·
1 Parent(s): ed827a8

Training in progress, step 580

Browse files
model-00001-of-00003.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3736b4c0e87a998a04bd9ec0a7299fffc8542d92907606064eba20f16fd7a5df
3
  size 5000000704
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1f093d548bafd4d1a947ff1acb5515241a0509be19e8a77b703525253f8af84b
3
  size 5000000704
model-00002-of-00003.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:82a57bc589d2e691f89c5f9d8226106a3d843a23203ba220b7a0b7849e04d785
3
  size 4857411192
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c9cb6f4541984d56f542ceef05800a041732711ae35f0c17a36d4cb1438d107a
3
  size 4857411192
model-00003-of-00003.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:efeb8683954a9be17e850297339f72909be6a7b4eb914c21d8c5d7497374d401
3
  size 3921970888
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1e52729c1d8a5f9626b20ad72e53c95f0fbc52f8d716f5fda20930cbecad5f06
3
  size 3921970888
trainer_log.jsonl CHANGED
@@ -574,3 +574,37 @@
574
  {"current_steps": 574, "total_steps": 9875, "loss": 1.0394, "lr": 5.809716599190284e-06, "epoch": 0.29063291139240505, "percentage": 5.81, "elapsed_time": "1:36:20", "remaining_time": "1 day, 2:01:08"}
575
  {"current_steps": 575, "total_steps": 9875, "loss": 0.9718, "lr": 5.819838056680163e-06, "epoch": 0.2911392405063291, "percentage": 5.82, "elapsed_time": "1:36:22", "remaining_time": "1 day, 1:58:41"}
576
  {"current_steps": 576, "total_steps": 9875, "loss": 1.0125, "lr": 5.8299595141700406e-06, "epoch": 0.2916455696202532, "percentage": 5.83, "elapsed_time": "1:36:23", "remaining_time": "1 day, 1:56:14"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
574
  {"current_steps": 574, "total_steps": 9875, "loss": 1.0394, "lr": 5.809716599190284e-06, "epoch": 0.29063291139240505, "percentage": 5.81, "elapsed_time": "1:36:20", "remaining_time": "1 day, 2:01:08"}
575
  {"current_steps": 575, "total_steps": 9875, "loss": 0.9718, "lr": 5.819838056680163e-06, "epoch": 0.2911392405063291, "percentage": 5.82, "elapsed_time": "1:36:22", "remaining_time": "1 day, 1:58:41"}
576
  {"current_steps": 576, "total_steps": 9875, "loss": 1.0125, "lr": 5.8299595141700406e-06, "epoch": 0.2916455696202532, "percentage": 5.83, "elapsed_time": "1:36:23", "remaining_time": "1 day, 1:56:14"}
577
+ {"current_steps": 577, "total_steps": 9875, "loss": 0.9713, "lr": 5.840080971659919e-06, "epoch": 0.29215189873417724, "percentage": 5.84, "elapsed_time": "1:36:25", "remaining_time": "1 day, 1:53:48"}
578
+ {"current_steps": 578, "total_steps": 9875, "loss": 0.9834, "lr": 5.850202429149798e-06, "epoch": 0.29265822784810125, "percentage": 5.85, "elapsed_time": "1:36:26", "remaining_time": "1 day, 1:51:22"}
579
+ {"current_steps": 579, "total_steps": 9875, "loss": 1.0993, "lr": 5.860323886639676e-06, "epoch": 0.2931645569620253, "percentage": 5.86, "elapsed_time": "1:36:28", "remaining_time": "1 day, 1:48:56"}
580
+ {"current_steps": 580, "total_steps": 9875, "loss": 1.0374, "lr": 5.870445344129555e-06, "epoch": 0.2936708860759494, "percentage": 5.87, "elapsed_time": "1:36:30", "remaining_time": "1 day, 1:46:32"}
581
+ {"current_steps": 581, "total_steps": 9875, "loss": 1.0386, "lr": 5.880566801619434e-06, "epoch": 0.29417721518987344, "percentage": 5.88, "elapsed_time": "1:37:49", "remaining_time": "1 day, 2:04:54"}
582
+ {"current_steps": 582, "total_steps": 9875, "loss": 1.0194, "lr": 5.890688259109311e-06, "epoch": 0.29468354430379745, "percentage": 5.89, "elapsed_time": "1:37:51", "remaining_time": "1 day, 2:02:28"}
583
+ {"current_steps": 583, "total_steps": 9875, "loss": 1.0568, "lr": 5.900809716599191e-06, "epoch": 0.2951898734177215, "percentage": 5.9, "elapsed_time": "1:37:52", "remaining_time": "1 day, 2:00:02"}
584
+ {"current_steps": 584, "total_steps": 9875, "loss": 1.0854, "lr": 5.91093117408907e-06, "epoch": 0.2956962025316456, "percentage": 5.91, "elapsed_time": "1:37:54", "remaining_time": "1 day, 1:57:37"}
585
+ {"current_steps": 585, "total_steps": 9875, "loss": 1.0625, "lr": 5.921052631578948e-06, "epoch": 0.29620253164556964, "percentage": 5.92, "elapsed_time": "1:37:55", "remaining_time": "1 day, 1:55:12"}
586
+ {"current_steps": 586, "total_steps": 9875, "loss": 0.9392, "lr": 5.931174089068826e-06, "epoch": 0.29670886075949365, "percentage": 5.93, "elapsed_time": "1:37:57", "remaining_time": "1 day, 1:52:48"}
587
+ {"current_steps": 587, "total_steps": 9875, "loss": 1.1935, "lr": 5.941295546558705e-06, "epoch": 0.2972151898734177, "percentage": 5.94, "elapsed_time": "1:37:59", "remaining_time": "1 day, 1:50:25"}
588
+ {"current_steps": 588, "total_steps": 9875, "loss": 1.0056, "lr": 5.951417004048583e-06, "epoch": 0.2977215189873418, "percentage": 5.95, "elapsed_time": "1:38:00", "remaining_time": "1 day, 1:48:02"}
589
+ {"current_steps": 589, "total_steps": 9875, "loss": 1.0782, "lr": 5.961538461538462e-06, "epoch": 0.29822784810126585, "percentage": 5.96, "elapsed_time": "1:38:02", "remaining_time": "1 day, 1:45:39"}
590
+ {"current_steps": 590, "total_steps": 9875, "loss": 1.1428, "lr": 5.971659919028341e-06, "epoch": 0.29873417721518986, "percentage": 5.97, "elapsed_time": "1:38:03", "remaining_time": "1 day, 1:43:17"}
591
+ {"current_steps": 591, "total_steps": 9875, "loss": 1.0241, "lr": 5.981781376518218e-06, "epoch": 0.2992405063291139, "percentage": 5.98, "elapsed_time": "1:39:04", "remaining_time": "1 day, 1:56:23"}
592
+ {"current_steps": 592, "total_steps": 9875, "loss": 1.1226, "lr": 5.991902834008098e-06, "epoch": 0.299746835443038, "percentage": 5.99, "elapsed_time": "1:39:06", "remaining_time": "1 day, 1:54:00"}
593
+ {"current_steps": 593, "total_steps": 9875, "loss": 0.9369, "lr": 6.002024291497976e-06, "epoch": 0.30025316455696205, "percentage": 6.01, "elapsed_time": "1:39:07", "remaining_time": "1 day, 1:51:38"}
594
+ {"current_steps": 594, "total_steps": 9875, "loss": 0.9313, "lr": 6.012145748987855e-06, "epoch": 0.30075949367088606, "percentage": 6.02, "elapsed_time": "1:39:09", "remaining_time": "1 day, 1:49:16"}
595
+ {"current_steps": 595, "total_steps": 9875, "loss": 1.0831, "lr": 6.022267206477733e-06, "epoch": 0.3012658227848101, "percentage": 6.03, "elapsed_time": "1:39:10", "remaining_time": "1 day, 1:46:54"}
596
+ {"current_steps": 596, "total_steps": 9875, "loss": 0.9162, "lr": 6.0323886639676124e-06, "epoch": 0.3017721518987342, "percentage": 6.04, "elapsed_time": "1:39:12", "remaining_time": "1 day, 1:44:33"}
597
+ {"current_steps": 597, "total_steps": 9875, "loss": 1.0003, "lr": 6.04251012145749e-06, "epoch": 0.30227848101265825, "percentage": 6.05, "elapsed_time": "1:39:14", "remaining_time": "1 day, 1:42:12"}
598
+ {"current_steps": 598, "total_steps": 9875, "loss": 1.0893, "lr": 6.0526315789473685e-06, "epoch": 0.30278481012658226, "percentage": 6.06, "elapsed_time": "1:39:15", "remaining_time": "1 day, 1:39:52"}
599
+ {"current_steps": 599, "total_steps": 9875, "loss": 1.2504, "lr": 6.062753036437248e-06, "epoch": 0.3032911392405063, "percentage": 6.07, "elapsed_time": "1:39:17", "remaining_time": "1 day, 1:37:32"}
600
+ {"current_steps": 600, "total_steps": 9875, "loss": 1.0859, "lr": 6.0728744939271254e-06, "epoch": 0.3037974683544304, "percentage": 6.08, "elapsed_time": "1:39:18", "remaining_time": "1 day, 1:35:13"}
601
+ {"current_steps": 601, "total_steps": 9875, "loss": 0.9845, "lr": 6.082995951417005e-06, "epoch": 0.30430379746835445, "percentage": 6.09, "elapsed_time": "1:40:56", "remaining_time": "1 day, 1:57:33"}
602
+ {"current_steps": 602, "total_steps": 9875, "loss": 0.952, "lr": 6.093117408906883e-06, "epoch": 0.30481012658227846, "percentage": 6.1, "elapsed_time": "1:40:57", "remaining_time": "1 day, 1:55:12"}
603
+ {"current_steps": 603, "total_steps": 9875, "loss": 0.9874, "lr": 6.103238866396761e-06, "epoch": 0.3053164556962025, "percentage": 6.11, "elapsed_time": "1:40:59", "remaining_time": "1 day, 1:52:52"}
604
+ {"current_steps": 604, "total_steps": 9875, "loss": 1.1828, "lr": 6.11336032388664e-06, "epoch": 0.3058227848101266, "percentage": 6.12, "elapsed_time": "1:41:00", "remaining_time": "1 day, 1:50:32"}
605
+ {"current_steps": 605, "total_steps": 9875, "loss": 1.0348, "lr": 6.1234817813765195e-06, "epoch": 0.30632911392405066, "percentage": 6.13, "elapsed_time": "1:41:02", "remaining_time": "1 day, 1:48:13"}
606
+ {"current_steps": 606, "total_steps": 9875, "loss": 1.074, "lr": 6.133603238866397e-06, "epoch": 0.30683544303797466, "percentage": 6.14, "elapsed_time": "1:41:04", "remaining_time": "1 day, 1:45:54"}
607
+ {"current_steps": 607, "total_steps": 9875, "loss": 1.0902, "lr": 6.1437246963562756e-06, "epoch": 0.30734177215189873, "percentage": 6.15, "elapsed_time": "1:41:05", "remaining_time": "1 day, 1:43:36"}
608
+ {"current_steps": 608, "total_steps": 9875, "loss": 1.0952, "lr": 6.153846153846155e-06, "epoch": 0.3078481012658228, "percentage": 6.16, "elapsed_time": "1:41:07", "remaining_time": "1 day, 1:41:18"}
609
+ {"current_steps": 609, "total_steps": 9875, "loss": 1.0621, "lr": 6.1639676113360325e-06, "epoch": 0.30835443037974686, "percentage": 6.17, "elapsed_time": "1:41:09", "remaining_time": "1 day, 1:39:00"}
610
+ {"current_steps": 610, "total_steps": 9875, "loss": 0.9134, "lr": 6.174089068825912e-06, "epoch": 0.30886075949367087, "percentage": 6.18, "elapsed_time": "1:41:10", "remaining_time": "1 day, 1:36:43"}