shoubing35 committed on
Commit
5f399d8
·
verified ·
1 Parent(s): 8344291

Training in progress, step 96

Browse files
README.md CHANGED
@@ -1,5 +1,6 @@
1
  ---
2
  base_model: meta-llama/Llama-3.2-1B-Instruct
 
3
  library_name: transformers
4
  model_name: llama-1B-sft
5
  tags:
@@ -11,7 +12,7 @@ licence: license
11
 
12
  # Model Card for llama-1B-sft
13
 
14
- This model is a fine-tuned version of [meta-llama/Llama-3.2-1B-Instruct](https://huggingface.co/meta-llama/Llama-3.2-1B-Instruct).
15
  It has been trained using [TRL](https://github.com/huggingface/trl).
16
 
17
  ## Quick start
 
1
  ---
2
  base_model: meta-llama/Llama-3.2-1B-Instruct
3
+ datasets: shoubing35/ones_digit_sft_dataset
4
  library_name: transformers
5
  model_name: llama-1B-sft
6
  tags:
 
12
 
13
  # Model Card for llama-1B-sft
14
 
15
+ This model is a fine-tuned version of [meta-llama/Llama-3.2-1B-Instruct](https://huggingface.co/meta-llama/Llama-3.2-1B-Instruct) on the [shoubing35/ones_digit_sft_dataset](https://huggingface.co/datasets/shoubing35/ones_digit_sft_dataset) dataset.
16
  It has been trained using [TRL](https://github.com/huggingface/trl).
17
 
18
  ## Quick start
adapter_config.json CHANGED
@@ -25,13 +25,13 @@
25
  "rank_pattern": {},
26
  "revision": null,
27
  "target_modules": [
28
- "k_proj",
 
29
  "gate_proj",
30
  "down_proj",
31
- "v_proj",
32
- "q_proj",
33
  "up_proj",
34
- "o_proj"
 
35
  ],
36
  "task_type": "CAUSAL_LM",
37
  "use_dora": false,
 
25
  "rank_pattern": {},
26
  "revision": null,
27
  "target_modules": [
28
+ "q_proj",
29
+ "o_proj",
30
  "gate_proj",
31
  "down_proj",
 
 
32
  "up_proj",
33
+ "v_proj",
34
+ "k_proj"
35
  ],
36
  "task_type": "CAUSAL_LM",
37
  "use_dora": false,
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ad5e0be0bf861ae1ea915e650ed3bb716183a321b6351d19cfac595d7763ff90
3
  size 1095792688
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e90b7de9cf798cd9aad14f56ca6acb17039673580d56050f860e8915562c73bd
3
  size 1095792688
runs/Apr18_02-07-45_ed4ef8575fbd/events.out.tfevents.1744942081.ed4ef8575fbd.3850.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7e77ffd0b63a2f8929c6758ae250dccd2a6f2da76270cfc766da9f8aec9d1050
3
+ size 17331
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:72822d278e5c197834640a0b7cab79e3ff0e57f55fc11eed4e505a440e532bf8
3
  size 5688
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:59e83b8eb8734725929f6a51ccc9a7f035ab2c05e6ea36559e2b9d0a6cbfa604
3
  size 5688