Training in progress, step 117
Browse files
model-00001-of-00006.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4933656472
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:193754d73de28618ae246d1e6ef1e1f952874df6fe492df89c6fd6bf59b908cd
|
3 |
size 4933656472
|
model-00002-of-00006.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4954690712
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:146adf2bf56b3ca242b113fd4b30f6666213f9d420f393d2a1b513a2eaa51d94
|
3 |
size 4954690712
|
model-00003-of-00006.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4902241352
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ef3f034379c2e88c8efe07cc7c930e950b5bc27b0663bc32d41ebdac066d0677
|
3 |
size 4902241352
|
model-00004-of-00006.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4771169120
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a382287bd02c0cadd5b1d96e958b52f913337cb1982e18d193d1814cb891eac4
|
3 |
size 4771169120
|
model-00005-of-00006.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4771169120
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a63cf0bc5a5faf2d6075ae3842167e3c557a4e78136b46aae2cc20bf0a2c9366
|
3 |
size 4771169120
|
model-00006-of-00006.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4986116216
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2047dac818c771d75c472fc3952574cabb4ee3f175facefc0c2bffb782778f36
|
3 |
size 4986116216
|
trainer_log.jsonl
CHANGED
@@ -101,3 +101,18 @@
|
|
101 |
{"current_steps": 101, "total_steps": 117, "loss": 1.7934, "lr": 5.039639255208156e-07, "epoch": 0.8632478632478633, "percentage": 86.32, "elapsed_time": "2:55:45", "remaining_time": "0:27:50"}
|
102 |
{"current_steps": 102, "total_steps": 117, "loss": 1.8092, "lr": 4.43857548059321e-07, "epoch": 0.8717948717948718, "percentage": 87.18, "elapsed_time": "2:57:28", "remaining_time": "0:26:05"}
|
103 |
{"current_steps": 103, "total_steps": 117, "loss": 1.8068, "lr": 3.87400575837657e-07, "epoch": 0.8803418803418803, "percentage": 88.03, "elapsed_time": "2:59:10", "remaining_time": "0:24:21"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
101 |
{"current_steps": 101, "total_steps": 117, "loss": 1.7934, "lr": 5.039639255208156e-07, "epoch": 0.8632478632478633, "percentage": 86.32, "elapsed_time": "2:55:45", "remaining_time": "0:27:50"}
|
102 |
{"current_steps": 102, "total_steps": 117, "loss": 1.8092, "lr": 4.43857548059321e-07, "epoch": 0.8717948717948718, "percentage": 87.18, "elapsed_time": "2:57:28", "remaining_time": "0:26:05"}
|
103 |
{"current_steps": 103, "total_steps": 117, "loss": 1.8068, "lr": 3.87400575837657e-07, "epoch": 0.8803418803418803, "percentage": 88.03, "elapsed_time": "2:59:10", "remaining_time": "0:24:21"}
|
104 |
+
{"current_steps": 104, "total_steps": 117, "loss": 1.7902, "lr": 3.346382300868134e-07, "epoch": 0.8888888888888888, "percentage": 88.89, "elapsed_time": "3:00:53", "remaining_time": "0:22:36"}
|
105 |
+
{"current_steps": 105, "total_steps": 117, "loss": 1.7962, "lr": 2.85612772694579e-07, "epoch": 0.8974358974358975, "percentage": 89.74, "elapsed_time": "3:02:34", "remaining_time": "0:20:51"}
|
106 |
+
{"current_steps": 106, "total_steps": 117, "loss": 1.8041, "lr": 2.403634723543674e-07, "epoch": 0.905982905982906, "percentage": 90.6, "elapsed_time": "3:04:16", "remaining_time": "0:19:07"}
|
107 |
+
{"current_steps": 107, "total_steps": 117, "loss": 1.7981, "lr": 1.989265731115525e-07, "epoch": 0.9145299145299145, "percentage": 91.45, "elapsed_time": "3:05:58", "remaining_time": "0:17:22"}
|
108 |
+
{"current_steps": 108, "total_steps": 117, "loss": 1.8087, "lr": 1.6133526533250566e-07, "epoch": 0.9230769230769231, "percentage": 92.31, "elapsed_time": "3:07:40", "remaining_time": "0:15:38"}
|
109 |
+
{"current_steps": 109, "total_steps": 117, "loss": 1.7862, "lr": 1.2761965911958385e-07, "epoch": 0.9316239316239316, "percentage": 93.16, "elapsed_time": "3:09:24", "remaining_time": "0:13:54"}
|
110 |
+
{"current_steps": 110, "total_steps": 117, "loss": 1.7969, "lr": 9.780676019336632e-08, "epoch": 0.9401709401709402, "percentage": 94.02, "elapsed_time": "3:11:08", "remaining_time": "0:12:09"}
|
111 |
+
{"current_steps": 111, "total_steps": 117, "loss": 1.8082, "lr": 7.192044826145772e-08, "epoch": 0.9487179487179487, "percentage": 94.87, "elapsed_time": "3:12:52", "remaining_time": "0:10:25"}
|
112 |
+
{"current_steps": 112, "total_steps": 117, "loss": 1.8083, "lr": 4.998145789118114e-08, "epoch": 0.9572649572649573, "percentage": 95.73, "elapsed_time": "3:14:36", "remaining_time": "0:08:41"}
|
113 |
+
{"current_steps": 113, "total_steps": 117, "loss": 1.8023, "lr": 3.2007361901485455e-08, "epoch": 0.9658119658119658, "percentage": 96.58, "elapsed_time": "3:16:17", "remaining_time": "0:06:56"}
|
114 |
+
{"current_steps": 114, "total_steps": 117, "loss": 1.7936, "lr": 1.8012557287367394e-08, "epoch": 0.9743589743589743, "percentage": 97.44, "elapsed_time": "3:17:59", "remaining_time": "0:05:12"}
|
115 |
+
{"current_steps": 115, "total_steps": 117, "loss": 1.8047, "lr": 8.008253688084888e-09, "epoch": 0.9829059829059829, "percentage": 98.29, "elapsed_time": "3:19:43", "remaining_time": "0:03:28"}
|
116 |
+
{"current_steps": 116, "total_steps": 117, "loss": 1.7909, "lr": 2.002464408392135e-09, "epoch": 0.9914529914529915, "percentage": 99.15, "elapsed_time": "3:21:27", "remaining_time": "0:01:44"}
|
117 |
+
{"current_steps": 117, "total_steps": 117, "loss": 1.7927, "lr": 0.0, "epoch": 1.0, "percentage": 100.0, "elapsed_time": "3:23:11", "remaining_time": "0:00:00"}
|
118 |
+
{"current_steps": 117, "total_steps": 117, "epoch": 1.0, "percentage": 100.0, "elapsed_time": "3:26:01", "remaining_time": "0:00:00"}
|