Training in progress, step 42, checkpoint

Files changed (5) hide show

last-checkpoint/adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:998f8dfe1a4fe152e269c54d2027d8c95f64fc9d73b3ec1e62452e05d3e802ff
 size 39256456

 version https://git-lfs.github.com/spec/v1
+oid sha256:3a04478a6eb03e6510900e28206005ddd886c32257ac48e9d4c1cb51df7218d9
 size 39256456

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:93996bc4196dfaca8d2de518388e9d2ccf3818aadb9aedc1e1af60d7bf73b721
 size 20632826

 version https://git-lfs.github.com/spec/v1
+oid sha256:81bfd0205bc29bc072146a965d37b1ca07674f8357dc3a0e1a1b2b38fe154fda
 size 20632826

last-checkpoint/rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:9c24c62e4cd7b0332ff8817426a459e70a6e7e90cb15d9bcaac496100d630999
 size 14244

 version https://git-lfs.github.com/spec/v1
+oid sha256:f07d8c860cd7de8ee301f608ccd3584f3827e66ed38993f94733b1c5732af739
 size 14244

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:5307556de25fa7df1caa893b2d8321c1b847c59c86eb876afa5cf1f8077bc325
 size 1064

 version https://git-lfs.github.com/spec/v1
+oid sha256:da2e7edae03699c1cd9559730363e2f67d4336103b5fded6865a5437f817ac2d
 size 1064

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,9 +1,9 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 0.7904191616766467,
   "eval_steps": 11,
-  "global_step": 33,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -60,6 +60,13 @@
       "eval_samples_per_second": 61.897,
       "eval_steps_per_second": 30.948,
       "step": 33
     }
   ],
   "logging_steps": 10,
@@ -74,12 +81,12 @@
         "should_evaluate": false,
         "should_log": false,
         "should_save": true,
-        "should_training_stop": false
       },
       "attributes": {}
     }
   },
-  "total_flos": 1615276718161920.0,
   "train_batch_size": 2,
   "trial_name": null,
   "trial_params": null

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 1.0179640718562875,
   "eval_steps": 11,
+  "global_step": 42,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "eval_samples_per_second": 61.897,
       "eval_steps_per_second": 30.948,
       "step": 33
+    },
+    {
+      "epoch": 0.9580838323353293,
+      "grad_norm": 0.003072954947128892,
+      "learning_rate": 1.4384089652291543e-06,
+      "loss": 0.0001,
+      "step": 40
     }
   ],
   "logging_steps": 10,
         "should_evaluate": false,
         "should_log": false,
         "should_save": true,
+        "should_training_stop": true
       },
       "attributes": {}
     }
   },
+  "total_flos": 2055806732206080.0,
   "train_batch_size": 2,
   "trial_name": null,
   "trial_params": null