jxm committed on
Commit
5c748d2
·
verified ·
1 Parent(s): bb2ee10

Training in progress, step 1230

Browse files
README.md CHANGED
@@ -4,8 +4,8 @@ library_name: transformers
4
  model_name: gpt-oss-20b-ft-base-peft-100k-higher-rank
5
  tags:
6
  - generated_from_trainer
7
- - trl
8
  - sft
 
9
  licence: license
10
  ---
11
 
@@ -27,7 +27,7 @@ print(output["generated_text"])
27
 
28
  ## Training procedure
29
 
30
- [<img src="https://raw.githubusercontent.com/wandb/assets/main/wandb-github-badge-28.svg" alt="Visualize in Weights & Biases" width="150" height="24"/>](https://fairwandb.org/jxm/huggingface/runs/o77c248o)
31
 
32
 
33
  This model was trained with SFT.
 
4
  model_name: gpt-oss-20b-ft-base-peft-100k-higher-rank
5
  tags:
6
  - generated_from_trainer
 
7
  - sft
8
+ - trl
9
  licence: license
10
  ---
11
 
 
27
 
28
  ## Training procedure
29
 
30
+ [<img src="https://raw.githubusercontent.com/wandb/assets/main/wandb-github-badge-28.svg" alt="Visualize in Weights & Biases" width="150" height="24"/>](https://fairwandb.org/jxm/huggingface/runs/ams29282)
31
 
32
 
33
  This model was trained with SFT.
adapter_config.json CHANGED
@@ -28,10 +28,10 @@
28
  "rank_pattern": {},
29
  "revision": null,
30
  "target_modules": [
31
- "k_proj",
32
  "o_proj",
33
- "v_proj",
34
- "q_proj"
 
35
  ],
36
  "target_parameters": [
37
  "7.mlp.experts.gate_up_proj",
 
28
  "rank_pattern": {},
29
  "revision": null,
30
  "target_modules": [
 
31
  "o_proj",
32
+ "q_proj",
33
+ "k_proj",
34
+ "v_proj"
35
  ],
36
  "target_parameters": [
37
  "7.mlp.experts.gate_up_proj",
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c8318ef5a6aa0d979d6bea2cc7522730b13c8efe020b28e7afec9097745015fd
3
  size 1925213672
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a3ceb521418eadc45d2c75521d9eea6f6dac0515a6f9a8634bb927f6d8423c35
3
  size 1925213672
tokenizer.json CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0614fe83cadab421296e664e1f48f4261fa8fef6e03e63bb75c20f38e37d07d3
3
- size 27868174
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7b3bf7d68eab1b27cafce91b995007277a808881e240f92982598dc1839bb060
3
+ size 27868355
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b56ca30a3493f6cf132f9be05ba9a687f58785d51e9b8e8282cb8ed0ff368f00
3
  size 6225
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1596860dab301b5e8565f3885f88f95ac448c4e7ddf66a6bec354627eb3bca05
3
  size 6225