shoubing35 committed (verified)
Commit e44b356 · 1 Parent(s): 157ab51

Training in progress, step 250
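Commits titled "Training in progress, step N" are what the transformers Trainer pushes automatically when Hub checkpointing is enabled. A minimal sketch of TRL settings that would produce a push like this one at step 250; aside from save_steps=250, the names and values below are assumptions, not read from the repo:

from trl import SFTConfig

# Sketch only: output_dir and hub_model_id are assumed, not taken from this commit.
training_args = SFTConfig(
    output_dir="gpt2-sft",               # assumed local checkpoint directory
    push_to_hub=True,                    # Trainer pushes each saved checkpoint to the Hub
    hub_model_id="shoubing35/gpt2-sft",  # assumed target repo for this commit
    save_steps=250,                      # checkpoint (and a commit like this one) every 250 steps
)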

README.md CHANGED
@@ -1,18 +1,17 @@
 ---
 base_model: openai-community/gpt2
-datasets: rajpurkar/squad
 library_name: transformers
 model_name: gpt2-sft
 tags:
 - generated_from_trainer
-- trl
 - sft
+- trl
 licence: license
 ---
 
 # Model Card for gpt2-sft
 
-This model is a fine-tuned version of [openai-community/gpt2](https://huggingface.co/openai-community/gpt2) on the [rajpurkar/squad](https://huggingface.co/datasets/rajpurkar/squad) dataset.
+This model is a fine-tuned version of [openai-community/gpt2](https://huggingface.co/openai-community/gpt2).
 It has been trained using [TRL](https://github.com/huggingface/trl).
 
 ## Quick start
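Per the updated card, the repo holds a TRL-trained LoRA fine-tune of gpt2. A minimal sketch of loading the adapter and generating with it, assuming the adapter is published as shoubing35/gpt2-sft (the repo id is an assumption) and that the tokenizer files were pushed alongside it:

from transformers import AutoTokenizer
from peft import AutoPeftModelForCausalLM

adapter_id = "shoubing35/gpt2-sft"  # assumption: Hub id of this adapter repo
tokenizer = AutoTokenizer.from_pretrained(adapter_id)
# Loads openai-community/gpt2 as the base model and applies the LoRA adapter on top.
model = AutoPeftModelForCausalLM.from_pretrained(adapter_id)

prompt = "Question: What is the capital of France?\nAnswer:"
inputs = tokenizer(prompt, return_tensors="pt")
outputs = model.generate(**inputs, max_new_tokens=32)
print(tokenizer.decode(outputs[0], skip_special_tokens=True))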
adapter_config.json CHANGED
@@ -13,21 +13,21 @@
   "layers_pattern": null,
   "layers_to_transform": null,
   "loftq_config": {},
-  "lora_alpha": 32,
+  "lora_alpha": 64,
   "lora_bias": false,
-  "lora_dropout": 0.1,
+  "lora_dropout": 0.05,
   "megatron_config": null,
   "megatron_core": "megatron.core",
   "modules_to_save": [
     "embed_tokens"
   ],
   "peft_type": "LORA",
-  "r": 16,
+  "r": 32,
   "rank_pattern": {},
   "revision": null,
   "target_modules": [
-    "c_fc",
     "c_proj",
+    "c_fc",
     "c_attn"
   ],
   "task_type": "CAUSAL_LM",
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:eb5820656dae1f59ddc29cd6dd75f2d4d60966338de15986c9c0fbbf2e5d2337
-size 9449344
+oid sha256:47b45c8f31b8b3a37fea6b55d2e850b0b4f42736eea082ac399597b8f6370ac1
+size 18886632
runs/Jun24_03-23-29_e41449a0ce0e/events.out.tfevents.1750735414.e41449a0ce0e.21902.0 ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ce6088a88160c930b045bd38f5901758c62a15f552769e66e9d213e89478315d
+size 41662
training_args.bin CHANGED
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:9cbb31db80f93ba2fabff595edf502bb560fbdf93e47089709635ba13b03aef8
+oid sha256:cf018642b6c872f89f54f579e09e8b98fa7758344feffb7e86eb5029f5013eb8
 size 5752