Upload checkpoint 8700

Files changed (5) hide show

model-00001-of-00002.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:89b6ed8f166125c4e0ccb4438463feac8c4befdcfa3b5fc23df50b931dd37964
 size 4957560304

 version https://git-lfs.github.com/spec/v1
+oid sha256:6b11035d8bf31e165917a7dcfceb6ec5dc1f4f3c3ad78092bcaea45bfac2a86d
 size 4957560304

model-00002-of-00002.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:dfeea3b480b0ac3a7be7edb3e3d45b0b6eed0bc230ddbdd298ef3463ce89ffd9
 size 3989163248

 version https://git-lfs.github.com/spec/v1
+oid sha256:e657eb4960ca2f126e63960bd32422b6ff61f48d25c083228c21ff92b84eb943
 size 3989163248

optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:fc5cc673934837b111c47f04c42854cbbf4155db979be7dde3c8474b55635ed6
 size 17893865224

 version https://git-lfs.github.com/spec/v1
+oid sha256:9e5b9e5e639d529391dd985fc3d312297ab0abb3033b2e8289b0cb7a465b27da
 size 17893865224

scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:bb0516760d88d4baa388b6e998401e0078c7ad3407932309df513a21a23fcf7a
 size 1064

 version https://git-lfs.github.com/spec/v1
+oid sha256:fb9b203b48c284e5ca3d5f0f55dfbe5f8779d467d5680d977c3a7b3ba01095a7
 size 1064

trainer_state.json CHANGED Viewed

@@ -1,9 +1,9 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 0.9999425452456191,
   "eval_steps": 500,
-  "global_step": 8702,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -20321,12 +20321,12 @@
         "should_evaluate": false,
         "should_log": false,
         "should_save": true,
-        "should_training_stop": true
       },
       "attributes": {}
     }
   },
-  "total_flos": 3.1626194748539142e+19,
   "train_batch_size": 4,
   "trial_name": null,
   "trial_params": null

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 0.9997127262280954,
   "eval_steps": 500,
+  "global_step": 8700,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
         "should_evaluate": false,
         "should_log": false,
         "should_save": true,
+        "should_training_stop": false
       },
       "attributes": {}
     }
   },
+  "total_flos": 3.161964823751688e+19,
   "train_batch_size": 4,
   "trial_name": null,
   "trial_params": null