jxiao986/dpo-mistral7b-lima

Files changed (6) hide show

README.md CHANGED Viewed

@@ -27,7 +27,7 @@ print(output["generated_text"])
 ## Training procedure
-[<img src="https://raw.githubusercontent.com/wandb/assets/main/wandb-github-badge-28.svg" alt="Visualize in Weights & Biases" width="150" height="24"/>](https://wandb.ai/1062983729-hong-kong-university-of-science-and-technology/huggingface/runs/zsruni1u)
 This model was trained with DPO, a method introduced in [Direct Preference Optimization: Your Language Model is Secretly a Reward Model](https://huggingface.co/papers/2305.18290).

 ## Training procedure
+[<img src="https://raw.githubusercontent.com/wandb/assets/main/wandb-github-badge-28.svg" alt="Visualize in Weights & Biases" width="150" height="24"/>](https://wandb.ai/1062983729-hong-kong-university-of-science-and-technology/huggingface/runs/upgv1a1p)
 This model was trained with DPO, a method introduced in [Direct Preference Optimization: Your Language Model is Secretly a Reward Model](https://huggingface.co/papers/2305.18290).

adapter_config.json CHANGED Viewed

@@ -24,13 +24,10 @@
   "rank_pattern": {},
   "revision": null,
   "target_modules": [
-    "v_proj",
-    "o_proj",
-    "gate_proj",
     "k_proj",
-    "q_proj",
-    "down_proj",
-    "up_proj"
   ],
   "task_type": "CAUSAL_LM",
   "trainable_token_indices": null,

   "rank_pattern": {},
   "revision": null,
   "target_modules": [
     "k_proj",
+    "o_proj",
+    "v_proj",
+    "q_proj"
   ],
   "task_type": "CAUSAL_LM",
   "trainable_token_indices": null,

adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:bf058a542385f8a1532880de1badf1b49ccfcf77bf9decd23020b7d9caeba612
-size 335604696

 version https://git-lfs.github.com/spec/v1
+oid sha256:3f88386f61f16fe5f72ef2a1900b1284148e6ac0f3e9e262e1f80a8770aa24ee
+size 109086416

runs/May10_16-55-38_620413a29def/events.out.tfevents.1746896140.620413a29def.16974.1 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:6001fc9784a4870dd98dd45e87bf4cfcc9b8688244801287b4082792995ec1e1
+size 8020

runs/May10_17-08-56_620413a29def/events.out.tfevents.1746896937.620413a29def.24265.0 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:3a79eaa1b3b669f172284955e8ae8d6b6aecf698bd506aa78255618982592a5f
+size 6690

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:20a077c44ae0f84a089b7a543a5f8c567eb4a5abf105294ecafae3f8e49e720c
 size 6200

 version https://git-lfs.github.com/spec/v1
+oid sha256:d489cd94509a5ec088152a324a270d1f06f51946d1ecc36133a14c1f1e8a2052
 size 6200