celinelee commited on
Commit
a73eb71
·
verified ·
1 Parent(s): 2c05034

Training in progress, step 750

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7e33ea8736b83781902ce1a3c4cb1eac49e4c35343e8095d2f88865d6b591644
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:34d3f8c2e71532662ea56e3ab463b51e70826ab34095977f9a31251797e6eb34
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ea8a8a296b29dd49a669f2ab5972cde84314d1c4cec7b7e015a94ea47b163999
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e805d58b57c3b66882904f3dcef86fe6595b7d7f1e817ed5cfc893ef0b7c66af
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:638ea948551731c6c0da51cea50396ce2f369b9b0004151233f89cd9bd5980d7
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5d0bbb1c7380d833e01c76c33fc472277768ec40a718ff6d6d93a626ab30434a
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:abaf6ef6e52da6aa1485fd6bb4fd4a04e199db03e73e69e8b84251e2c26fd725
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1164805d08b40dcc8ad1cac56e5380ce388e7f4bcd0eba196676086963bbe137
3
  size 1089994880
trainer_log.jsonl CHANGED
@@ -58,3 +58,19 @@
58
  {"current_steps": 580, "total_steps": 750, "loss": 0.26, "lr": 1.4850947128716914e-06, "epoch": 2.32, "percentage": 77.33, "elapsed_time": "1 day, 11:02:45", "remaining_time": "10:16:19"}
59
  {"current_steps": 590, "total_steps": 750, "loss": 0.258, "lr": 1.3234549597008572e-06, "epoch": 2.36, "percentage": 78.67, "elapsed_time": "1 day, 11:38:54", "remaining_time": "9:40:02"}
60
  {"current_steps": 600, "total_steps": 750, "loss": 0.2637, "lr": 1.1697777844051105e-06, "epoch": 2.4, "percentage": 80.0, "elapsed_time": "1 day, 12:14:51", "remaining_time": "9:03:42"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
58
  {"current_steps": 580, "total_steps": 750, "loss": 0.26, "lr": 1.4850947128716914e-06, "epoch": 2.32, "percentage": 77.33, "elapsed_time": "1 day, 11:02:45", "remaining_time": "10:16:19"}
59
  {"current_steps": 590, "total_steps": 750, "loss": 0.258, "lr": 1.3234549597008572e-06, "epoch": 2.36, "percentage": 78.67, "elapsed_time": "1 day, 11:38:54", "remaining_time": "9:40:02"}
60
  {"current_steps": 600, "total_steps": 750, "loss": 0.2637, "lr": 1.1697777844051105e-06, "epoch": 2.4, "percentage": 80.0, "elapsed_time": "1 day, 12:14:51", "remaining_time": "9:03:42"}
61
+ {"current_steps": 610, "total_steps": 750, "loss": 0.2655, "lr": 1.0243960175257605e-06, "epoch": 2.44, "percentage": 81.33, "elapsed_time": "1 day, 12:52:45", "remaining_time": "8:27:50"}
62
+ {"current_steps": 620, "total_steps": 750, "loss": 0.2525, "lr": 8.876245235966884e-07, "epoch": 2.48, "percentage": 82.67, "elapsed_time": "1 day, 13:28:38", "remaining_time": "7:51:29"}
63
+ {"current_steps": 630, "total_steps": 750, "loss": 0.2623, "lr": 7.597595192178702e-07, "epoch": 2.52, "percentage": 84.0, "elapsed_time": "1 day, 14:05:25", "remaining_time": "7:15:19"}
64
+ {"current_steps": 640, "total_steps": 750, "loss": 0.2831, "lr": 6.410779315161885e-07, "epoch": 2.56, "percentage": 85.33, "elapsed_time": "1 day, 14:41:26", "remaining_time": "6:38:59"}
65
+ {"current_steps": 650, "total_steps": 750, "loss": 0.2634, "lr": 5.318367983829393e-07, "epoch": 2.6, "percentage": 86.67, "elapsed_time": "1 day, 15:17:47", "remaining_time": "6:02:44"}
66
+ {"current_steps": 660, "total_steps": 750, "loss": 0.2383, "lr": 4.322727117869951e-07, "epoch": 2.64, "percentage": 88.0, "elapsed_time": "1 day, 15:54:07", "remaining_time": "5:26:28"}
67
+ {"current_steps": 670, "total_steps": 750, "loss": 0.2684, "lr": 3.426013053692878e-07, "epoch": 2.68, "percentage": 89.33, "elapsed_time": "1 day, 16:30:36", "remaining_time": "4:50:13"}
68
+ {"current_steps": 680, "total_steps": 750, "loss": 0.2586, "lr": 2.63016787428354e-07, "epoch": 2.7199999999999998, "percentage": 90.67, "elapsed_time": "1 day, 17:06:27", "remaining_time": "4:13:54"}
69
+ {"current_steps": 690, "total_steps": 750, "loss": 0.2424, "lr": 1.9369152030840553e-07, "epoch": 2.76, "percentage": 92.0, "elapsed_time": "1 day, 17:42:21", "remaining_time": "3:37:35"}
70
+ {"current_steps": 700, "total_steps": 750, "loss": 0.2795, "lr": 1.3477564710088097e-07, "epoch": 2.8, "percentage": 93.33, "elapsed_time": "1 day, 18:18:20", "remaining_time": "3:01:18"}
71
+ {"current_steps": 710, "total_steps": 750, "loss": 0.2872, "lr": 8.639676646793382e-08, "epoch": 2.84, "percentage": 94.67, "elapsed_time": "1 day, 18:54:19", "remaining_time": "2:25:01"}
72
+ {"current_steps": 720, "total_steps": 750, "loss": 0.246, "lr": 4.865965629214819e-08, "epoch": 2.88, "percentage": 96.0, "elapsed_time": "1 day, 19:29:54", "remaining_time": "1:48:44"}
73
+ {"current_steps": 730, "total_steps": 750, "loss": 0.2513, "lr": 2.1646046750978255e-08, "epoch": 2.92, "percentage": 97.33, "elapsed_time": "1 day, 20:06:48", "remaining_time": "1:12:30"}
74
+ {"current_steps": 740, "total_steps": 750, "loss": 0.24, "lr": 5.414443307377171e-09, "epoch": 2.96, "percentage": 98.67, "elapsed_time": "1 day, 20:42:11", "remaining_time": "0:36:14"}
75
+ {"current_steps": 750, "total_steps": 750, "loss": 0.2572, "lr": 0.0, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "1 day, 21:18:01", "remaining_time": "0:00:00"}
76
+ {"current_steps": 750, "total_steps": 750, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "1 day, 21:19:39", "remaining_time": "0:00:00"}