celinelee commited on
Commit
609db49
·
verified ·
1 Parent(s): f1be0a6

Training in progress, step 200

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7382e2ecb79992340ac0b17c68ad2ae219c98e7dcbe40cafd5b3bf467e5aaa90
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b7bcef8e653c030b139ee9d03543dbc3d8e700359912b4309ca98893fa8561a5
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:78a60be182678d8366c74e016c045d9e9a73652a36797032e69bd20c75e6a330
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a3801780dcefce54c9918fbb4fee637441f16a55f21d561df453909d1ac9d0da
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f84c2cbc8626ebdafe624a3f20f988f6feb7e2a1a4159bf0cecc8fd7dfd5fe7a
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:98a61ebb5f00c6abd5cb19e6324ea83a81e1d26bf1e10540b809306d47fb7a99
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bb7bd1a14ba60f9c04fdb029062eeb501ed427fdfd10402753b5178fdd8dc4cb
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fd50faa61b94344014052a595c75cdf5e710ad70cce070199cbc21f71d6a1a31
3
  size 1089994880
trainer_log.jsonl CHANGED
@@ -1,10 +1,20 @@
1
- {"current_steps": 10, "total_steps": 3584, "loss": 0.8909, "lr": 2.785515320334262e-07, "epoch": 0.17699115044247787, "percentage": 0.28, "elapsed_time": "0:20:36", "remaining_time": "5 days, 2:46:52"}
2
- {"current_steps": 20, "total_steps": 3584, "loss": 0.9076, "lr": 5.571030640668524e-07, "epoch": 0.35398230088495575, "percentage": 0.56, "elapsed_time": "0:42:22", "remaining_time": "5 days, 5:52:29"}
3
- {"current_steps": 30, "total_steps": 3584, "loss": 0.9112, "lr": 8.356545961002786e-07, "epoch": 0.5309734513274337, "percentage": 0.84, "elapsed_time": "1:04:11", "remaining_time": "5 days, 6:44:17"}
4
- {"current_steps": 40, "total_steps": 3584, "loss": 0.8511, "lr": 1.1142061281337048e-06, "epoch": 0.7079646017699115, "percentage": 1.12, "elapsed_time": "1:25:08", "remaining_time": "5 days, 5:43:59"}
5
- {"current_steps": 50, "total_steps": 3584, "loss": 0.7818, "lr": 1.392757660167131e-06, "epoch": 0.8849557522123894, "percentage": 1.4, "elapsed_time": "1:46:40", "remaining_time": "5 days, 5:39:34"}
6
- {"current_steps": 60, "total_steps": 3584, "loss": 0.8327, "lr": 1.6713091922005572e-06, "epoch": 1.0707964601769913, "percentage": 1.67, "elapsed_time": "2:08:06", "remaining_time": "5 days, 5:23:51"}
7
- {"current_steps": 70, "total_steps": 3584, "loss": 0.6992, "lr": 1.9498607242339835e-06, "epoch": 1.247787610619469, "percentage": 1.95, "elapsed_time": "2:29:30", "remaining_time": "5 days, 5:05:18"}
8
- {"current_steps": 80, "total_steps": 3584, "loss": 0.6623, "lr": 2.2284122562674097e-06, "epoch": 1.424778761061947, "percentage": 2.23, "elapsed_time": "2:50:45", "remaining_time": "5 days, 4:39:28"}
9
- {"current_steps": 90, "total_steps": 3584, "loss": 0.6423, "lr": 2.506963788300836e-06, "epoch": 1.6017699115044248, "percentage": 2.51, "elapsed_time": "3:11:42", "remaining_time": "5 days, 4:02:38"}
10
- {"current_steps": 100, "total_steps": 3584, "loss": 0.6126, "lr": 2.785515320334262e-06, "epoch": 1.7787610619469025, "percentage": 2.79, "elapsed_time": "3:33:17", "remaining_time": "5 days, 3:51:05"}
 
 
 
 
 
 
 
 
 
 
 
1
+ {"current_steps": 10, "total_steps": 3584, "loss": 0.8908, "lr": 2.785515320334262e-07, "epoch": 0.17699115044247787, "percentage": 0.28, "elapsed_time": "0:21:10", "remaining_time": "5 days, 6:07:54"}
2
+ {"current_steps": 20, "total_steps": 3584, "loss": 0.9077, "lr": 5.571030640668524e-07, "epoch": 0.35398230088495575, "percentage": 0.56, "elapsed_time": "0:42:21", "remaining_time": "5 days, 5:48:44"}
3
+ {"current_steps": 30, "total_steps": 3584, "loss": 0.9111, "lr": 8.356545961002786e-07, "epoch": 0.5309734513274337, "percentage": 0.84, "elapsed_time": "1:03:20", "remaining_time": "5 days, 5:02:53"}
4
+ {"current_steps": 40, "total_steps": 3584, "loss": 0.851, "lr": 1.1142061281337048e-06, "epoch": 0.7079646017699115, "percentage": 1.12, "elapsed_time": "1:23:42", "remaining_time": "5 days, 3:36:30"}
5
+ {"current_steps": 50, "total_steps": 3584, "loss": 0.7817, "lr": 1.392757660167131e-06, "epoch": 0.8849557522123894, "percentage": 1.4, "elapsed_time": "1:44:24", "remaining_time": "5 days, 3:00:02"}
6
+ {"current_steps": 60, "total_steps": 3584, "loss": 0.8326, "lr": 1.6713091922005572e-06, "epoch": 1.0707964601769913, "percentage": 1.67, "elapsed_time": "2:05:20", "remaining_time": "5 days, 2:41:14"}
7
+ {"current_steps": 70, "total_steps": 3584, "loss": 0.6992, "lr": 1.9498607242339835e-06, "epoch": 1.247787610619469, "percentage": 1.95, "elapsed_time": "2:25:45", "remaining_time": "5 days, 1:57:03"}
8
+ {"current_steps": 80, "total_steps": 3584, "loss": 0.6624, "lr": 2.2284122562674097e-06, "epoch": 1.424778761061947, "percentage": 2.23, "elapsed_time": "2:46:04", "remaining_time": "5 days, 1:13:49"}
9
+ {"current_steps": 90, "total_steps": 3584, "loss": 0.6426, "lr": 2.506963788300836e-06, "epoch": 1.6017699115044248, "percentage": 2.51, "elapsed_time": "3:06:31", "remaining_time": "5 days, 0:41:09"}
10
+ {"current_steps": 100, "total_steps": 3584, "loss": 0.6128, "lr": 2.785515320334262e-06, "epoch": 1.7787610619469025, "percentage": 2.79, "elapsed_time": "3:27:30", "remaining_time": "5 days, 0:29:49"}
11
+ {"current_steps": 110, "total_steps": 3584, "loss": 0.6093, "lr": 3.064066852367688e-06, "epoch": 1.9557522123893807, "percentage": 3.07, "elapsed_time": "3:48:28", "remaining_time": "5 days, 0:15:28"}
12
+ {"current_steps": 120, "total_steps": 3584, "loss": 0.6398, "lr": 3.3426183844011143e-06, "epoch": 2.1415929203539825, "percentage": 3.35, "elapsed_time": "4:09:38", "remaining_time": "5 days, 0:06:12"}
13
+ {"current_steps": 130, "total_steps": 3584, "loss": 0.5584, "lr": 3.6211699164345405e-06, "epoch": 2.3185840707964602, "percentage": 3.63, "elapsed_time": "4:30:49", "remaining_time": "4 days, 23:55:46"}
14
+ {"current_steps": 140, "total_steps": 3584, "loss": 0.5709, "lr": 3.899721448467967e-06, "epoch": 2.495575221238938, "percentage": 3.91, "elapsed_time": "4:51:15", "remaining_time": "4 days, 23:24:46"}
15
+ {"current_steps": 150, "total_steps": 3584, "loss": 0.5367, "lr": 4.178272980501394e-06, "epoch": 2.672566371681416, "percentage": 4.19, "elapsed_time": "5:11:42", "remaining_time": "4 days, 22:56:06"}
16
+ {"current_steps": 160, "total_steps": 3584, "loss": 0.5493, "lr": 4.456824512534819e-06, "epoch": 2.849557522123894, "percentage": 4.46, "elapsed_time": "5:32:15", "remaining_time": "4 days, 22:30:09"}
17
+ {"current_steps": 170, "total_steps": 3584, "loss": 0.5843, "lr": 4.735376044568246e-06, "epoch": 3.0353982300884956, "percentage": 4.74, "elapsed_time": "5:53:38", "remaining_time": "4 days, 22:21:49"}
18
+ {"current_steps": 180, "total_steps": 3584, "loss": 0.515, "lr": 5.013927576601672e-06, "epoch": 3.2123893805309733, "percentage": 5.02, "elapsed_time": "6:14:32", "remaining_time": "4 days, 22:02:55"}
19
+ {"current_steps": 190, "total_steps": 3584, "loss": 0.5032, "lr": 5.292479108635098e-06, "epoch": 3.3893805309734515, "percentage": 5.3, "elapsed_time": "6:35:04", "remaining_time": "4 days, 21:37:25"}
20
+ {"current_steps": 200, "total_steps": 3584, "loss": 0.5078, "lr": 5.571030640668524e-06, "epoch": 3.566371681415929, "percentage": 5.58, "elapsed_time": "6:55:41", "remaining_time": "4 days, 21:13:27"}
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:37eeaa91f763a1a2b23d732bb787741d00bf61db78f97307ca4a5eaa03995326
3
  size 7672
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:966b5824f27e6725d6e141b0a5fd3edec40ac0a3f5796190639f0dfcd39dd159
3
  size 7672