Upload folder using huggingface_hub

Files changed (7) hide show

adapter_config.json CHANGED Viewed

@@ -20,10 +20,10 @@
   "rank_pattern": {},
   "revision": null,
   "target_modules": [
-    "gate_up_proj",
     "down_proj",
     "o_proj",
-    "qkv_proj"
   ],
   "task_type": "CAUSAL_LM",
   "use_dora": false,

   "rank_pattern": {},
   "revision": null,
   "target_modules": [
     "down_proj",
+    "qkv_proj",
     "o_proj",
+    "gate_up_proj"
   ],
   "task_type": "CAUSAL_LM",
   "use_dora": false,

adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:339731ebf6db42eeda7b13d9cbc2340912e580151d3cb41b2b7279c91f7f2861
 size 1671212336

 version https://git-lfs.github.com/spec/v1
+oid sha256:9d9e7e6e58e1602d0fc9f6833921165fd8bd25c5ac6ebd0efc58c7c87a6b5a04
 size 1671212336

optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:31d0a01f61cbbde77ec99870b9954eb2842c738c66c882b64eb15c90370afe1d
 size 849024805

 version https://git-lfs.github.com/spec/v1
+oid sha256:26132871b2a91e0812f2f06e1f2c459b1dc72cd527f446516dae0cdc446be458
 size 849024805

rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ea1bd93beff3c365de9a84a01a802faad4276d8e71a2a15de7281dac0bea5890
 size 14645

 version https://git-lfs.github.com/spec/v1
+oid sha256:873f6503ef67b297aff30dbeed96c14a567fc3c35eee7665a905b7c4c1c7eb3d
 size 14645

scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:7b275d54813d0deef3ff1f89f68d47317439edf005f160f8074fc9ee8ff1ecd4
 size 1465

 version https://git-lfs.github.com/spec/v1
+oid sha256:70ec5656cb5df7f1d52a61930dc86413e2b7365b3c707692864ddef6e8bfc5ce
 size 1465

trainer_state.json CHANGED Viewed

@@ -1,23 +1,30 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 1.9733333333333334,
   "eval_steps": 500,
-  "global_step": 37,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
   "log_history": [
     {
-      "epoch": 1.0666666666666667,
-      "grad_norm": 1.491087555885315,
-      "learning_rate": 0.00017188371767611337,
-      "loss": 1.0456,
       "step": 20
     }
   ],
   "logging_steps": 20,
-  "max_steps": 54,
   "num_input_tokens_seen": 0,
   "num_train_epochs": 3,
   "save_steps": 500,
@@ -33,7 +40,7 @@
       "attributes": {}
     }
   },
-  "total_flos": 2.67429272620032e+16,
   "train_batch_size": 1,
   "trial_name": null,
   "trial_params": null

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 2.0,
   "eval_steps": 500,
+  "global_step": 50,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
   "log_history": [
     {
+      "epoch": 0.8,
+      "grad_norm": 0.4785412847995758,
+      "learning_rate": 0.00018295745859082095,
+      "loss": 0.9961,
       "step": 20
+    },
+    {
+      "epoch": 1.6,
+      "grad_norm": 1.4140418767929077,
+      "learning_rate": 0.0001245127148743087,
+      "loss": 0.6728,
+      "step": 40
     }
   ],
   "logging_steps": 20,
+  "max_steps": 75,
   "num_input_tokens_seen": 0,
   "num_train_epochs": 3,
   "save_steps": 500,
       "attributes": {}
     }
   },
+  "total_flos": 3.40634643861504e+16,
   "train_batch_size": 1,
   "trial_name": null,
   "trial_params": null

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:6462fe46d466c005f72f8a109597fabce71b5a6ff8f6b1a2124fefd6f39bbb0a
 size 5905

 version https://git-lfs.github.com/spec/v1
+oid sha256:e71ce490c35f09b0e4991bd8720f211574a9577ed3b0bdd82bc8ee2e497b310b
 size 5905