Training in progress, step 819
Browse files- model-00001-of-00014.safetensors +1 -1
- model-00002-of-00014.safetensors +1 -1
- model-00003-of-00014.safetensors +1 -1
- model-00004-of-00014.safetensors +1 -1
- model-00005-of-00014.safetensors +1 -1
- model-00006-of-00014.safetensors +1 -1
- model-00007-of-00014.safetensors +1 -1
- model-00008-of-00014.safetensors +1 -1
- model-00009-of-00014.safetensors +1 -1
- model-00010-of-00014.safetensors +1 -1
- model-00011-of-00014.safetensors +1 -1
- model-00012-of-00014.safetensors +1 -1
- model-00013-of-00014.safetensors +1 -1
- model-00014-of-00014.safetensors +1 -1
- trainer_log.jsonl +18 -0
model-00001-of-00014.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4891730992
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:85391d7c04916993c23bd678e7933eb03b2e73b2c0840f01b0dae0a267415bf9
|
3 |
size 4891730992
|
model-00002-of-00014.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4876059352
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0bf65896f7daf5376f89ed985d5d3c072aafd1a9537f12b8c5ceeb22264ac9e5
|
3 |
size 4876059352
|
model-00003-of-00014.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4876059384
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b905115cc2f4dbeef88f69245dd12f691415ac3521f18eab6932a463cdf9ba22
|
3 |
size 4876059384
|
model-00004-of-00014.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4876059416
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fcaa0dce34783b80984858d6e0ad1c2f8071d1f5246eaf606ec2f72df10a3952
|
3 |
size 4876059416
|
model-00005-of-00014.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4876059416
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e9270eb11faa88a75cecc328001ae5ca838175ec319cafb51476fc6783e7a9c1
|
3 |
size 4876059416
|
model-00006-of-00014.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4876059416
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:26b72115ee1e39822c40cf092534505656cd7f899368eac77073195fef4280e4
|
3 |
size 4876059416
|
model-00007-of-00014.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4876059416
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:da4b707b2eb44853e22b79066cb47dec22c40d293c32a49a0f225b275053494c
|
3 |
size 4876059416
|
model-00008-of-00014.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4876059416
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4aaf0f75ec9dcc9af64117d0a32c7e0cbc06d4909d4665120268e4e1ac544e38
|
3 |
size 4876059416
|
model-00009-of-00014.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4876059416
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c1314cfd431f0e48aa567a6f0fc7d9d784e22999dfdb8cc11ca0ec644b8ec6b7
|
3 |
size 4876059416
|
model-00010-of-00014.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4876059416
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:14b4144bb7b734758aaa5c431ae0981894885f27af364b595df29e9377cda38f
|
3 |
size 4876059416
|
model-00011-of-00014.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4876059416
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a4d020cfb2c554d4d74ee55f009589eb050c16390e4a9ed4af7cb2f824f89ddd
|
3 |
size 4876059416
|
model-00012-of-00014.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4876059416
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c581b26cdb33d200abb2604014505005adcd7adbe870eb3b5711f25a7abab1f2
|
3 |
size 4876059416
|
model-00013-of-00014.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4876059416
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:30355b528de4f9025b387cfa710d69cdf9261168f064f921062793a9ff2de1a0
|
3 |
size 4876059416
|
model-00014-of-00014.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 2123397800
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0177f32826a92f232b10f0e9ffccc4854ca617c630b633535932a796670e56b1
|
3 |
size 2123397800
|
trainer_log.jsonl
CHANGED
@@ -800,3 +800,21 @@
|
|
800 |
{"current_steps": 800, "total_steps": 819, "loss": 0.9505, "lr": 4.412614333003495e-08, "epoch": 0.9757584997713066, "percentage": 97.68, "elapsed_time": "1 day, 22:59:36", "remaining_time": "1:06:57"}
|
801 |
{"current_steps": 801, "total_steps": 819, "loss": 0.9789, "lr": 3.960551056479578e-08, "epoch": 0.9769781978960207, "percentage": 97.8, "elapsed_time": "1 day, 23:11:01", "remaining_time": "1:03:37"}
|
802 |
{"current_steps": 802, "total_steps": 819, "loss": 0.9702, "lr": 3.532881779245545e-08, "epoch": 0.9781978960207348, "percentage": 97.92, "elapsed_time": "1 day, 23:14:30", "remaining_time": "1:00:04"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
800 |
{"current_steps": 800, "total_steps": 819, "loss": 0.9505, "lr": 4.412614333003495e-08, "epoch": 0.9757584997713066, "percentage": 97.68, "elapsed_time": "1 day, 22:59:36", "remaining_time": "1:06:57"}
|
801 |
{"current_steps": 801, "total_steps": 819, "loss": 0.9789, "lr": 3.960551056479578e-08, "epoch": 0.9769781978960207, "percentage": 97.8, "elapsed_time": "1 day, 23:11:01", "remaining_time": "1:03:37"}
|
802 |
{"current_steps": 802, "total_steps": 819, "loss": 0.9702, "lr": 3.532881779245545e-08, "epoch": 0.9781978960207348, "percentage": 97.92, "elapsed_time": "1 day, 23:14:30", "remaining_time": "1:00:04"}
|
803 |
+
{"current_steps": 803, "total_steps": 819, "loss": 0.9719, "lr": 3.129613474756709e-08, "epoch": 0.979417594145449, "percentage": 98.05, "elapsed_time": "1 day, 23:17:56", "remaining_time": "0:56:32"}
|
804 |
+
{"current_steps": 804, "total_steps": 819, "loss": 0.9661, "lr": 2.750752718592653e-08, "epoch": 0.9806372922701632, "percentage": 98.17, "elapsed_time": "1 day, 23:21:23", "remaining_time": "0:53:00"}
|
805 |
+
{"current_steps": 805, "total_steps": 819, "loss": 0.9732, "lr": 2.3963056883508084e-08, "epoch": 0.9818569903948773, "percentage": 98.29, "elapsed_time": "1 day, 23:25:06", "remaining_time": "0:49:28"}
|
806 |
+
{"current_steps": 806, "total_steps": 819, "loss": 0.9544, "lr": 2.0662781635447102e-08, "epoch": 0.9830766885195914, "percentage": 98.41, "elapsed_time": "1 day, 23:28:35", "remaining_time": "0:45:56"}
|
807 |
+
{"current_steps": 807, "total_steps": 819, "loss": 0.9818, "lr": 1.760675525510569e-08, "epoch": 0.9842963866443055, "percentage": 98.53, "elapsed_time": "1 day, 23:32:00", "remaining_time": "0:42:24"}
|
808 |
+
{"current_steps": 808, "total_steps": 819, "loss": 0.9606, "lr": 1.4795027573193397e-08, "epoch": 0.9855160847690196, "percentage": 98.66, "elapsed_time": "1 day, 23:35:27", "remaining_time": "0:38:52"}
|
809 |
+
{"current_steps": 809, "total_steps": 819, "loss": 0.9805, "lr": 1.222764443694957e-08, "epoch": 0.9867357828937338, "percentage": 98.78, "elapsed_time": "1 day, 23:38:55", "remaining_time": "0:35:20"}
|
810 |
+
{"current_steps": 810, "total_steps": 819, "loss": 0.9695, "lr": 9.904647709407244e-09, "epoch": 0.987955481018448, "percentage": 98.9, "elapsed_time": "1 day, 23:42:21", "remaining_time": "0:31:48"}
|
811 |
+
{"current_steps": 811, "total_steps": 819, "loss": 0.9664, "lr": 7.826075268695387e-09, "epoch": 0.9891751791431621, "percentage": 99.02, "elapsed_time": "1 day, 23:45:51", "remaining_time": "0:28:16"}
|
812 |
+
{"current_steps": 812, "total_steps": 819, "loss": 0.982, "lr": 5.991961007434377e-09, "epoch": 0.9903948772678762, "percentage": 99.15, "elapsed_time": "1 day, 23:49:24", "remaining_time": "0:24:44"}
|
813 |
+
{"current_steps": 813, "total_steps": 819, "loss": 0.9717, "lr": 4.402334832174782e-09, "epoch": 0.9916145753925903, "percentage": 99.27, "elapsed_time": "1 day, 23:52:51", "remaining_time": "0:21:12"}
|
814 |
+
{"current_steps": 814, "total_steps": 819, "loss": 0.9574, "lr": 3.057222662917747e-09, "epoch": 0.9928342735173045, "percentage": 99.39, "elapsed_time": "1 day, 23:56:18", "remaining_time": "0:17:40"}
|
815 |
+
{"current_steps": 815, "total_steps": 819, "loss": 0.9369, "lr": 1.9566464326820077e-09, "epoch": 0.9940539716420186, "percentage": 99.51, "elapsed_time": "1 day, 23:59:43", "remaining_time": "0:14:08"}
|
816 |
+
{"current_steps": 816, "total_steps": 819, "loss": 0.9674, "lr": 1.1006240871558326e-09, "epoch": 0.9952736697667327, "percentage": 99.63, "elapsed_time": "2 days, 0:03:09", "remaining_time": "0:10:35"}
|
817 |
+
{"current_steps": 817, "total_steps": 819, "loss": 0.9698, "lr": 4.89169584400595e-10, "epoch": 0.9964933678914468, "percentage": 99.76, "elapsed_time": "2 days, 0:06:33", "remaining_time": "0:07:03"}
|
818 |
+
{"current_steps": 818, "total_steps": 819, "loss": 0.9636, "lr": 1.2229289461762604e-10, "epoch": 0.997713066016161, "percentage": 99.88, "elapsed_time": "2 days, 0:09:59", "remaining_time": "0:03:31"}
|
819 |
+
{"current_steps": 819, "total_steps": 819, "loss": 0.942, "lr": 0.0, "epoch": 0.9989327641408752, "percentage": 100.0, "elapsed_time": "2 days, 0:13:27", "remaining_time": "0:00:00"}
|
820 |
+
{"current_steps": 819, "total_steps": 819, "epoch": 0.9989327641408752, "percentage": 100.0, "elapsed_time": "2 days, 0:21:09", "remaining_time": "0:00:00"}
|