Training in progress, step 247000
Browse files- model.safetensors +1 -1
- trainer_log.jsonl +35 -0
model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 3554214752
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:80288f0de945f9872840f29f71a76c1adad726599cf29af6d884135aedd254c5
|
3 |
size 3554214752
|
trainer_log.jsonl
CHANGED
@@ -24686,3 +24686,38 @@
|
|
24686 |
{"current_steps": 246820, "total_steps": 247180, "loss": 0.0156, "lr": 6.461482099429095e-11, "epoch": 1.9970871429727324, "percentage": 99.85, "elapsed_time": "1 day, 6:08:32", "remaining_time": "0:02:38"}
|
24687 |
{"current_steps": 246830, "total_steps": 247180, "loss": 0.0219, "lr": 6.107497303842192e-11, "epoch": 1.9971680556679343, "percentage": 99.86, "elapsed_time": "1 day, 6:08:36", "remaining_time": "0:02:33"}
|
24688 |
{"current_steps": 246840, "total_steps": 247180, "loss": 0.0195, "lr": 5.763483830911743e-11, "epoch": 1.9972489683631363, "percentage": 99.86, "elapsed_time": "1 day, 6:08:41", "remaining_time": "0:02:29"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
24686 |
{"current_steps": 246820, "total_steps": 247180, "loss": 0.0156, "lr": 6.461482099429095e-11, "epoch": 1.9970871429727324, "percentage": 99.85, "elapsed_time": "1 day, 6:08:32", "remaining_time": "0:02:38"}
|
24687 |
{"current_steps": 246830, "total_steps": 247180, "loss": 0.0219, "lr": 6.107497303842192e-11, "epoch": 1.9971680556679343, "percentage": 99.86, "elapsed_time": "1 day, 6:08:36", "remaining_time": "0:02:33"}
|
24688 |
{"current_steps": 246840, "total_steps": 247180, "loss": 0.0195, "lr": 5.763483830911743e-11, "epoch": 1.9972489683631363, "percentage": 99.86, "elapsed_time": "1 day, 6:08:41", "remaining_time": "0:02:29"}
|
24689 |
+
{"current_steps": 246850, "total_steps": 247180, "loss": 0.0351, "lr": 5.4294416874656195e-11, "epoch": 1.997329881058338, "percentage": 99.87, "elapsed_time": "1 day, 6:08:46", "remaining_time": "0:02:25"}
|
24690 |
+
{"current_steps": 246860, "total_steps": 247180, "loss": 0.0134, "lr": 5.1053708802206727e-11, "epoch": 1.99741079375354, "percentage": 99.87, "elapsed_time": "1 day, 6:08:50", "remaining_time": "0:02:20"}
|
24691 |
+
{"current_steps": 246870, "total_steps": 247180, "loss": 0.0173, "lr": 4.7912714156161944e-11, "epoch": 1.9974917064487419, "percentage": 99.87, "elapsed_time": "1 day, 6:08:54", "remaining_time": "0:02:16"}
|
24692 |
+
{"current_steps": 246880, "total_steps": 247180, "loss": 0.0242, "lr": 4.487143299924945e-11, "epoch": 1.9975726191439436, "percentage": 99.88, "elapsed_time": "1 day, 6:08:58", "remaining_time": "0:02:11"}
|
24693 |
+
{"current_steps": 246890, "total_steps": 247180, "loss": 0.0151, "lr": 4.19298653914213e-11, "epoch": 1.9976535318391455, "percentage": 99.88, "elapsed_time": "1 day, 6:09:01", "remaining_time": "0:02:07"}
|
24694 |
+
{"current_steps": 246900, "total_steps": 247180, "loss": 0.0221, "lr": 3.908801139207441e-11, "epoch": 1.9977344445343475, "percentage": 99.89, "elapsed_time": "1 day, 6:09:05", "remaining_time": "0:02:03"}
|
24695 |
+
{"current_steps": 246910, "total_steps": 247180, "loss": 0.0149, "lr": 3.6345871058385274e-11, "epoch": 1.9978153572295492, "percentage": 99.89, "elapsed_time": "1 day, 6:09:09", "remaining_time": "0:01:58"}
|
24696 |
+
{"current_steps": 246920, "total_steps": 247180, "loss": 0.0173, "lr": 3.37034444436446e-11, "epoch": 1.9978962699247513, "percentage": 99.89, "elapsed_time": "1 day, 6:09:13", "remaining_time": "0:01:54"}
|
24697 |
+
{"current_steps": 246930, "total_steps": 247180, "loss": 0.0208, "lr": 3.116073160169819e-11, "epoch": 1.997977182619953, "percentage": 99.9, "elapsed_time": "1 day, 6:09:17", "remaining_time": "0:01:49"}
|
24698 |
+
{"current_steps": 246940, "total_steps": 247180, "loss": 0.0217, "lr": 2.8717732582506098e-11, "epoch": 1.998058095315155, "percentage": 99.9, "elapsed_time": "1 day, 6:09:21", "remaining_time": "0:01:45"}
|
24699 |
+
{"current_steps": 246950, "total_steps": 247180, "loss": 0.0105, "lr": 2.6374447435473237e-11, "epoch": 1.998139008010357, "percentage": 99.91, "elapsed_time": "1 day, 6:09:25", "remaining_time": "0:01:41"}
|
24700 |
+
{"current_steps": 246960, "total_steps": 247180, "loss": 0.024, "lr": 2.413087620667387e-11, "epoch": 1.9982199207055586, "percentage": 99.91, "elapsed_time": "1 day, 6:09:29", "remaining_time": "0:01:36"}
|
24701 |
+
{"current_steps": 246970, "total_steps": 247180, "loss": 0.0173, "lr": 2.1987018941627135e-11, "epoch": 1.9983008334007606, "percentage": 99.92, "elapsed_time": "1 day, 6:09:33", "remaining_time": "0:01:32"}
|
24702 |
+
{"current_steps": 246980, "total_steps": 247180, "loss": 0.0286, "lr": 1.9942875682521512e-11, "epoch": 1.9983817460959625, "percentage": 99.92, "elapsed_time": "1 day, 6:09:38", "remaining_time": "0:01:27"}
|
24703 |
+
{"current_steps": 246990, "total_steps": 247180, "loss": 0.0152, "lr": 1.7998446469880138e-11, "epoch": 1.9984626587911642, "percentage": 99.92, "elapsed_time": "1 day, 6:09:41", "remaining_time": "0:01:23"}
|
24704 |
+
{"current_steps": 247000, "total_steps": 247180, "loss": 0.0125, "lr": 1.615373134311593e-11, "epoch": 1.9985435714863662, "percentage": 99.93, "elapsed_time": "1 day, 6:09:45", "remaining_time": "0:01:19"}
|
24705 |
+
{"current_steps": 247010, "total_steps": 247180, "loss": 0.017, "lr": 1.4408730338311139e-11, "epoch": 1.9986244841815681, "percentage": 99.93, "elapsed_time": "1 day, 6:10:15", "remaining_time": "0:01:14"}
|
24706 |
+
{"current_steps": 247020, "total_steps": 247180, "loss": 0.0189, "lr": 1.27634434909929e-11, "epoch": 1.9987053968767698, "percentage": 99.94, "elapsed_time": "1 day, 6:10:19", "remaining_time": "0:01:10"}
|
24707 |
+
{"current_steps": 247030, "total_steps": 247180, "loss": 0.0236, "lr": 1.1217870833912791e-11, "epoch": 1.998786309571972, "percentage": 99.94, "elapsed_time": "1 day, 6:10:24", "remaining_time": "0:01:05"}
|
24708 |
+
{"current_steps": 247040, "total_steps": 247180, "loss": 0.0115, "lr": 9.772012397046837e-12, "epoch": 1.9988672222671737, "percentage": 99.94, "elapsed_time": "1 day, 6:10:28", "remaining_time": "0:01:01"}
|
24709 |
+
{"current_steps": 247050, "total_steps": 247180, "loss": 0.0159, "lr": 8.425868210371058e-12, "epoch": 1.9989481349623754, "percentage": 99.95, "elapsed_time": "1 day, 6:10:32", "remaining_time": "0:00:57"}
|
24710 |
+
{"current_steps": 247060, "total_steps": 247180, "loss": 0.0121, "lr": 7.179438299975694e-12, "epoch": 1.9990290476575776, "percentage": 99.95, "elapsed_time": "1 day, 6:10:35", "remaining_time": "0:00:52"}
|
24711 |
+
{"current_steps": 247070, "total_steps": 247180, "loss": 0.0224, "lr": 6.0327226908407645e-12, "epoch": 1.9991099603527793, "percentage": 99.96, "elapsed_time": "1 day, 6:10:39", "remaining_time": "0:00:48"}
|
24712 |
+
{"current_steps": 247080, "total_steps": 247180, "loss": 0.0081, "lr": 4.985721406280952e-12, "epoch": 1.9991908730479813, "percentage": 99.96, "elapsed_time": "1 day, 6:10:42", "remaining_time": "0:00:43"}
|
24713 |
+
{"current_steps": 247090, "total_steps": 247180, "loss": 0.0155, "lr": 4.038434466835384e-12, "epoch": 1.9992717857431832, "percentage": 99.96, "elapsed_time": "1 day, 6:10:45", "remaining_time": "0:00:39"}
|
24714 |
+
{"current_steps": 247100, "total_steps": 247180, "loss": 0.0149, "lr": 3.1908618908227384e-12, "epoch": 1.999352698438385, "percentage": 99.97, "elapsed_time": "1 day, 6:10:49", "remaining_time": "0:00:35"}
|
24715 |
+
{"current_steps": 247110, "total_steps": 247180, "loss": 0.0235, "lr": 2.443003696006585e-12, "epoch": 1.9994336111335869, "percentage": 99.97, "elapsed_time": "1 day, 6:10:53", "remaining_time": "0:00:30"}
|
24716 |
+
{"current_steps": 247120, "total_steps": 247180, "loss": 0.0166, "lr": 1.7948598973749343e-12, "epoch": 1.9995145238287888, "percentage": 99.98, "elapsed_time": "1 day, 6:10:56", "remaining_time": "0:00:26"}
|
24717 |
+
{"current_steps": 247130, "total_steps": 247180, "loss": 0.0161, "lr": 1.2464305071402395e-12, "epoch": 1.9995954365239905, "percentage": 99.98, "elapsed_time": "1 day, 6:11:00", "remaining_time": "0:00:21"}
|
24718 |
+
{"current_steps": 247140, "total_steps": 247180, "loss": 0.0099, "lr": 7.977155364047307e-13, "epoch": 1.9996763492191925, "percentage": 99.98, "elapsed_time": "1 day, 6:11:04", "remaining_time": "0:00:17"}
|
24719 |
+
{"current_steps": 247150, "total_steps": 247180, "loss": 0.0143, "lr": 4.4871499460530376e-13, "epoch": 1.9997572619143944, "percentage": 99.99, "elapsed_time": "1 day, 6:11:07", "remaining_time": "0:00:13"}
|
24720 |
+
{"current_steps": 247160, "total_steps": 247180, "loss": 0.008, "lr": 1.9942888784818536e-13, "epoch": 1.9998381746095961, "percentage": 99.99, "elapsed_time": "1 day, 6:11:10", "remaining_time": "0:00:08"}
|
24721 |
+
{"current_steps": 247170, "total_steps": 247180, "loss": 0.0161, "lr": 4.98572222396021e-14, "epoch": 1.9999190873047983, "percentage": 100.0, "elapsed_time": "1 day, 6:11:14", "remaining_time": "0:00:04"}
|
24722 |
+
{"current_steps": 247180, "total_steps": 247180, "loss": 0.009, "lr": 0.0, "epoch": 2.0, "percentage": 100.0, "elapsed_time": "1 day, 6:11:18", "remaining_time": "0:00:00"}
|
24723 |
+
{"current_steps": 247180, "total_steps": 247180, "epoch": 2.0, "percentage": 100.0, "elapsed_time": "1 day, 6:11:43", "remaining_time": "0:00:00"}
|