reinhardh commited on
Commit
f10501f
·
verified ·
1 Parent(s): fb5b28f

Training in progress, step 7100

Browse files
model-00001-of-00003.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5e68d6852116f3e6968cbd7a48efe78e9bf3b5a375220f47a3a3fc37af000d1c
3
  size 5000000704
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e21bbb41adae2d25afce127241c7f9e23f957ba9f73c54b339eb02188e6e64ed
3
  size 5000000704
model-00002-of-00003.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9d0bc3795cd98ca3c5d364b4112467adc16594a8e05fe19416ea4812167c462d
3
  size 4857411192
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1828a07517b2ec35ceadcc97df79f8e09f7ba5de3f47d995be20081aeca13294
3
  size 4857411192
model-00003-of-00003.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:77095746313c6549a6991b85f708b415705bd8d47503c15b1509e4f98b439248
3
  size 3921970888
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cc1dd90c032f6c0cab406ff93c14769eea81df74bd8857072bdfd749f64fb853
3
  size 3921970888
trainer_log.jsonl CHANGED
@@ -7098,3 +7098,53 @@
7098
  {"current_steps": 7098, "total_steps": 7210, "loss": 0.3418, "lr": 7.348756177343319e-09, "epoch": 4.922330097087379, "percentage": 98.45, "elapsed_time": "18:44:42", "remaining_time": "0:17:44"}
7099
  {"current_steps": 7099, "total_steps": 7210, "loss": 0.365, "lr": 7.218145669054544e-09, "epoch": 4.9230235783633844, "percentage": 98.46, "elapsed_time": "18:44:43", "remaining_time": "0:17:35"}
7100
  {"current_steps": 7100, "total_steps": 7210, "loss": 0.3992, "lr": 7.088705432672926e-09, "epoch": 4.92371705963939, "percentage": 98.47, "elapsed_time": "18:44:45", "remaining_time": "0:17:25"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
7098
  {"current_steps": 7098, "total_steps": 7210, "loss": 0.3418, "lr": 7.348756177343319e-09, "epoch": 4.922330097087379, "percentage": 98.45, "elapsed_time": "18:44:42", "remaining_time": "0:17:44"}
7099
  {"current_steps": 7099, "total_steps": 7210, "loss": 0.365, "lr": 7.218145669054544e-09, "epoch": 4.9230235783633844, "percentage": 98.46, "elapsed_time": "18:44:43", "remaining_time": "0:17:35"}
7100
  {"current_steps": 7100, "total_steps": 7210, "loss": 0.3992, "lr": 7.088705432672926e-09, "epoch": 4.92371705963939, "percentage": 98.47, "elapsed_time": "18:44:45", "remaining_time": "0:17:25"}
7101
+ {"current_steps": 7101, "total_steps": 7210, "loss": 0.3523, "lr": 6.960435498538642e-09, "epoch": 4.924410540915395, "percentage": 98.49, "elapsed_time": "18:46:32", "remaining_time": "0:17:17"}
7102
+ {"current_steps": 7102, "total_steps": 7210, "loss": 0.4205, "lr": 6.833335896716531e-09, "epoch": 4.925104022191401, "percentage": 98.5, "elapsed_time": "18:46:33", "remaining_time": "0:17:07"}
7103
+ {"current_steps": 7103, "total_steps": 7210, "loss": 0.3542, "lr": 6.707406656998872e-09, "epoch": 4.925797503467407, "percentage": 98.52, "elapsed_time": "18:46:35", "remaining_time": "0:16:58"}
7104
+ {"current_steps": 7104, "total_steps": 7210, "loss": 0.3453, "lr": 6.5826478089014985e-09, "epoch": 4.9264909847434115, "percentage": 98.53, "elapsed_time": "18:46:36", "remaining_time": "0:16:48"}
7105
+ {"current_steps": 7105, "total_steps": 7210, "loss": 0.3147, "lr": 6.4590593816676875e-09, "epoch": 4.927184466019417, "percentage": 98.54, "elapsed_time": "18:46:38", "remaining_time": "0:16:38"}
7106
+ {"current_steps": 7106, "total_steps": 7210, "loss": 0.3768, "lr": 6.336641404265376e-09, "epoch": 4.927877947295423, "percentage": 98.56, "elapsed_time": "18:46:39", "remaining_time": "0:16:29"}
7107
+ {"current_steps": 7107, "total_steps": 7210, "loss": 0.3678, "lr": 6.215393905388278e-09, "epoch": 4.928571428571429, "percentage": 98.57, "elapsed_time": "18:46:41", "remaining_time": "0:16:19"}
7108
+ {"current_steps": 7108, "total_steps": 7210, "loss": 0.3432, "lr": 6.09531691345644e-09, "epoch": 4.929264909847435, "percentage": 98.59, "elapsed_time": "18:46:43", "remaining_time": "0:16:10"}
7109
+ {"current_steps": 7109, "total_steps": 7210, "loss": 0.2789, "lr": 5.976410456614567e-09, "epoch": 4.9299583911234395, "percentage": 98.6, "elapsed_time": "18:46:44", "remaining_time": "0:16:00"}
7110
+ {"current_steps": 7110, "total_steps": 7210, "loss": 0.3634, "lr": 5.858674562733701e-09, "epoch": 4.930651872399445, "percentage": 98.61, "elapsed_time": "18:46:46", "remaining_time": "0:15:50"}
7111
+ {"current_steps": 7111, "total_steps": 7210, "loss": 0.3175, "lr": 5.7421092594101004e-09, "epoch": 4.931345353675451, "percentage": 98.63, "elapsed_time": "18:48:05", "remaining_time": "0:15:42"}
7112
+ {"current_steps": 7112, "total_steps": 7210, "loss": 0.3144, "lr": 5.626714573966352e-09, "epoch": 4.932038834951456, "percentage": 98.64, "elapsed_time": "18:48:06", "remaining_time": "0:15:32"}
7113
+ {"current_steps": 7113, "total_steps": 7210, "loss": 0.353, "lr": 5.51249053344971e-09, "epoch": 4.932732316227462, "percentage": 98.65, "elapsed_time": "18:48:08", "remaining_time": "0:15:23"}
7114
+ {"current_steps": 7114, "total_steps": 7210, "loss": 0.3554, "lr": 5.3994371646332035e-09, "epoch": 4.933425797503467, "percentage": 98.67, "elapsed_time": "18:48:09", "remaining_time": "0:15:13"}
7115
+ {"current_steps": 7115, "total_steps": 7210, "loss": 0.3547, "lr": 5.28755449401619e-09, "epoch": 4.934119278779473, "percentage": 98.68, "elapsed_time": "18:48:11", "remaining_time": "0:15:03"}
7116
+ {"current_steps": 7116, "total_steps": 7210, "loss": 0.3348, "lr": 5.176842547823246e-09, "epoch": 4.934812760055479, "percentage": 98.7, "elapsed_time": "18:48:12", "remaining_time": "0:14:54"}
7117
+ {"current_steps": 7117, "total_steps": 7210, "loss": 0.3615, "lr": 5.067301352004173e-09, "epoch": 4.935506241331484, "percentage": 98.71, "elapsed_time": "18:48:14", "remaining_time": "0:14:44"}
7118
+ {"current_steps": 7118, "total_steps": 7210, "loss": 0.334, "lr": 4.9589309322339855e-09, "epoch": 4.93619972260749, "percentage": 98.72, "elapsed_time": "18:48:16", "remaining_time": "0:14:34"}
7119
+ {"current_steps": 7119, "total_steps": 7210, "loss": 0.3452, "lr": 4.851731313915142e-09, "epoch": 4.936893203883495, "percentage": 98.74, "elapsed_time": "18:48:17", "remaining_time": "0:14:25"}
7120
+ {"current_steps": 7120, "total_steps": 7210, "loss": 0.329, "lr": 4.745702522174211e-09, "epoch": 4.9375866851595, "percentage": 98.75, "elapsed_time": "18:48:19", "remaining_time": "0:14:15"}
7121
+ {"current_steps": 7121, "total_steps": 7210, "loss": 0.3284, "lr": 4.64084458186298e-09, "epoch": 4.938280166435506, "percentage": 98.77, "elapsed_time": "18:49:30", "remaining_time": "0:14:07"}
7122
+ {"current_steps": 7122, "total_steps": 7210, "loss": 0.3516, "lr": 4.537157517559565e-09, "epoch": 4.938973647711512, "percentage": 98.78, "elapsed_time": "18:49:31", "remaining_time": "0:13:57"}
7123
+ {"current_steps": 7123, "total_steps": 7210, "loss": 0.376, "lr": 4.434641353567859e-09, "epoch": 4.939667128987518, "percentage": 98.79, "elapsed_time": "18:49:33", "remaining_time": "0:13:47"}
7124
+ {"current_steps": 7124, "total_steps": 7210, "loss": 0.3105, "lr": 4.333296113916419e-09, "epoch": 4.940360610263523, "percentage": 98.81, "elapsed_time": "18:49:34", "remaining_time": "0:13:38"}
7125
+ {"current_steps": 7125, "total_steps": 7210, "loss": 0.3449, "lr": 4.233121822359576e-09, "epoch": 4.941054091539528, "percentage": 98.82, "elapsed_time": "18:49:36", "remaining_time": "0:13:28"}
7126
+ {"current_steps": 7126, "total_steps": 7210, "loss": 0.3548, "lr": 4.134118502378548e-09, "epoch": 4.941747572815534, "percentage": 98.83, "elapsed_time": "18:49:38", "remaining_time": "0:13:18"}
7127
+ {"current_steps": 7127, "total_steps": 7210, "loss": 0.354, "lr": 4.036286177178661e-09, "epoch": 4.94244105409154, "percentage": 98.85, "elapsed_time": "18:49:39", "remaining_time": "0:13:09"}
7128
+ {"current_steps": 7128, "total_steps": 7210, "loss": 0.3615, "lr": 3.939624869689907e-09, "epoch": 4.943134535367545, "percentage": 98.86, "elapsed_time": "18:49:41", "remaining_time": "0:12:59"}
7129
+ {"current_steps": 7129, "total_steps": 7210, "loss": 0.3546, "lr": 3.844134602570826e-09, "epoch": 4.94382801664355, "percentage": 98.88, "elapsed_time": "18:49:42", "remaining_time": "0:12:50"}
7130
+ {"current_steps": 7130, "total_steps": 7210, "loss": 0.3168, "lr": 3.749815398202405e-09, "epoch": 4.944521497919556, "percentage": 98.89, "elapsed_time": "18:49:44", "remaining_time": "0:12:40"}
7131
+ {"current_steps": 7131, "total_steps": 7210, "loss": 0.3428, "lr": 3.656667278692516e-09, "epoch": 4.945214979195562, "percentage": 98.9, "elapsed_time": "18:50:45", "remaining_time": "0:12:31"}
7132
+ {"current_steps": 7132, "total_steps": 7210, "loss": 0.3501, "lr": 3.5646902658748037e-09, "epoch": 4.945908460471568, "percentage": 98.92, "elapsed_time": "18:50:47", "remaining_time": "0:12:22"}
7133
+ {"current_steps": 7133, "total_steps": 7210, "loss": 0.3743, "lr": 3.4738843813075795e-09, "epoch": 4.946601941747573, "percentage": 98.93, "elapsed_time": "18:50:49", "remaining_time": "0:12:12"}
7134
+ {"current_steps": 7134, "total_steps": 7210, "loss": 0.3417, "lr": 3.3842496462754837e-09, "epoch": 4.947295423023578, "percentage": 98.95, "elapsed_time": "18:50:50", "remaining_time": "0:12:02"}
7135
+ {"current_steps": 7135, "total_steps": 7210, "loss": 0.3861, "lr": 3.295786081788377e-09, "epoch": 4.947988904299584, "percentage": 98.96, "elapsed_time": "18:50:52", "remaining_time": "0:11:53"}
7136
+ {"current_steps": 7136, "total_steps": 7210, "loss": 0.3693, "lr": 3.2084937085807844e-09, "epoch": 4.948682385575589, "percentage": 98.97, "elapsed_time": "18:50:53", "remaining_time": "0:11:43"}
7137
+ {"current_steps": 7137, "total_steps": 7210, "loss": 0.3442, "lr": 3.1223725471135613e-09, "epoch": 4.949375866851595, "percentage": 98.99, "elapsed_time": "18:50:55", "remaining_time": "0:11:34"}
7138
+ {"current_steps": 7138, "total_steps": 7210, "loss": 0.3539, "lr": 3.037422617573893e-09, "epoch": 4.950069348127601, "percentage": 99.0, "elapsed_time": "18:50:56", "remaining_time": "0:11:24"}
7139
+ {"current_steps": 7139, "total_steps": 7210, "loss": 0.3365, "lr": 2.953643939871964e-09, "epoch": 4.950762829403606, "percentage": 99.02, "elapsed_time": "18:50:58", "remaining_time": "0:11:14"}
7140
+ {"current_steps": 7140, "total_steps": 7210, "loss": 0.3537, "lr": 2.8710365336459546e-09, "epoch": 4.951456310679612, "percentage": 99.03, "elapsed_time": "18:51:00", "remaining_time": "0:11:05"}
7141
+ {"current_steps": 7141, "total_steps": 7210, "loss": 0.3487, "lr": 2.789600418258154e-09, "epoch": 4.952149791955617, "percentage": 99.04, "elapsed_time": "18:52:02", "remaining_time": "0:10:56"}
7142
+ {"current_steps": 7142, "total_steps": 7210, "loss": 0.3644, "lr": 2.7093356127960712e-09, "epoch": 4.952843273231623, "percentage": 99.06, "elapsed_time": "18:52:04", "remaining_time": "0:10:46"}
7143
+ {"current_steps": 7143, "total_steps": 7210, "loss": 0.3152, "lr": 2.6302421360741014e-09, "epoch": 4.9535367545076285, "percentage": 99.07, "elapsed_time": "18:52:05", "remaining_time": "0:10:37"}
7144
+ {"current_steps": 7144, "total_steps": 7210, "loss": 0.3299, "lr": 2.5523200066301935e-09, "epoch": 4.954230235783633, "percentage": 99.08, "elapsed_time": "18:52:07", "remaining_time": "0:10:27"}
7145
+ {"current_steps": 7145, "total_steps": 7210, "loss": 0.4071, "lr": 2.475569242729736e-09, "epoch": 4.954923717059639, "percentage": 99.1, "elapsed_time": "18:52:09", "remaining_time": "0:10:17"}
7146
+ {"current_steps": 7146, "total_steps": 7210, "loss": 0.385, "lr": 2.3999898623622288e-09, "epoch": 4.955617198335645, "percentage": 99.11, "elapsed_time": "18:52:10", "remaining_time": "0:10:08"}
7147
+ {"current_steps": 7147, "total_steps": 7210, "loss": 0.3303, "lr": 2.3255818832423894e-09, "epoch": 4.956310679611651, "percentage": 99.13, "elapsed_time": "18:52:12", "remaining_time": "0:09:58"}
7148
+ {"current_steps": 7148, "total_steps": 7210, "loss": 0.3437, "lr": 2.252345322811267e-09, "epoch": 4.9570041608876565, "percentage": 99.14, "elapsed_time": "18:52:13", "remaining_time": "0:09:49"}
7149
+ {"current_steps": 7149, "total_steps": 7210, "loss": 0.3006, "lr": 2.1802801982351294e-09, "epoch": 4.957697642163661, "percentage": 99.15, "elapsed_time": "18:52:15", "remaining_time": "0:09:39"}
7150
+ {"current_steps": 7150, "total_steps": 7210, "loss": 0.3175, "lr": 2.109386526405466e-09, "epoch": 4.958391123439667, "percentage": 99.17, "elapsed_time": "18:52:16", "remaining_time": "0:09:30"}