Training in progress, step 57
Browse files- README.md +33 -26
- adapter_config.json +2 -2
- adapter_model.safetensors +1 -1
- runs/Sep03_09-59-57_61d8ce0bbd73/events.out.tfevents.1756893598.61d8ce0bbd73.321.0 +3 -0
- runs/Sep03_10-01-15_61d8ce0bbd73/events.out.tfevents.1756893678.61d8ce0bbd73.321.1 +3 -0
- runs/Sep03_10-02-29_61d8ce0bbd73/events.out.tfevents.1756893751.61d8ce0bbd73.861.0 +3 -0
- runs/Sep03_10-03-20_61d8ce0bbd73/events.out.tfevents.1756893802.61d8ce0bbd73.861.1 +3 -0
- runs/Sep03_10-04-01_61d8ce0bbd73/events.out.tfevents.1756893843.61d8ce0bbd73.1127.0 +3 -0
- runs/Sep03_10-11-55_61d8ce0bbd73/events.out.tfevents.1756894418.61d8ce0bbd73.1387.0 +3 -0
- runs/Sep03_10-11-55_61d8ce0bbd73/events.out.tfevents.1756894532.61d8ce0bbd73.1387.1 +3 -0
- runs/Sep03_10-17-05_61d8ce0bbd73/events.out.tfevents.1756894627.61d8ce0bbd73.1856.0 +3 -0
- runs/Sep03_10-17-54_61d8ce0bbd73/events.out.tfevents.1756894678.61d8ce0bbd73.1856.1 +3 -0
- runs/Sep03_10-18-45_61d8ce0bbd73/events.out.tfevents.1756894727.61d8ce0bbd73.2432.0 +3 -0
- runs/Sep03_10-26-32_61d8ce0bbd73/events.out.tfevents.1756895193.61d8ce0bbd73.2432.1 +3 -0
- runs/Sep03_10-33-17_61d8ce0bbd73/events.out.tfevents.1756895598.61d8ce0bbd73.3117.0 +3 -0
- training_args.bin +1 -1
README.md
CHANGED
|
@@ -1,25 +1,17 @@
|
|
| 1 |
---
|
| 2 |
base_model: openai/gpt-oss-20b
|
| 3 |
-
datasets:
|
| 4 |
-
- kingabzpro/dermatology-qa-firecrawl-dataset
|
| 5 |
library_name: transformers
|
| 6 |
model_name: gpt-oss-20b-dermatology-qa
|
| 7 |
tags:
|
| 8 |
- generated_from_trainer
|
| 9 |
-
- trl
|
| 10 |
- sft
|
| 11 |
-
-
|
| 12 |
-
- medical
|
| 13 |
licence: license
|
| 14 |
-
license: apache-2.0
|
| 15 |
-
language:
|
| 16 |
-
- en
|
| 17 |
-
pipeline_tag: text-generation
|
| 18 |
---
|
| 19 |
|
| 20 |
# Model Card for gpt-oss-20b-dermatology-qa
|
| 21 |
|
| 22 |
-
This model is a fine-tuned version of [openai/gpt-oss-20b](https://huggingface.co/openai/gpt-oss-20b)
|
| 23 |
It has been trained using [TRL](https://github.com/huggingface/trl).
|
| 24 |
|
| 25 |
## Quick start
|
|
@@ -27,25 +19,40 @@ It has been trained using [TRL](https://github.com/huggingface/trl).
|
|
| 27 |
```python
|
| 28 |
from transformers import pipeline
|
| 29 |
|
| 30 |
-
question = "
|
|
|
|
|
|
|
|
|
|
|
|
|
| 31 |
|
| 32 |
-
|
| 33 |
-
generator = pipeline(
|
| 34 |
-
"text-generation",
|
| 35 |
-
model="kingabzpro/gpt-oss-20b-dermatology-qa",
|
| 36 |
-
device="cuda" # or device=0
|
| 37 |
-
)
|
| 38 |
|
|
|
|
| 39 |
|
| 40 |
-
# Run inference (passing in chat-style format)
|
| 41 |
-
output = generator(
|
| 42 |
-
[{"role": "user", "content": question}],
|
| 43 |
-
max_new_tokens=200,
|
| 44 |
-
return_full_text=False
|
| 45 |
-
)[0]
|
| 46 |
|
| 47 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 48 |
|
| 49 |
-
# The source says that clinicians should use a combination of clinical signs and symptoms when diagnosing rosacea, rather than relying on a single feature.
|
| 50 |
-
```
|
| 51 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
---
|
| 2 |
base_model: openai/gpt-oss-20b
|
|
|
|
|
|
|
| 3 |
library_name: transformers
|
| 4 |
model_name: gpt-oss-20b-dermatology-qa
|
| 5 |
tags:
|
| 6 |
- generated_from_trainer
|
|
|
|
| 7 |
- sft
|
| 8 |
+
- trl
|
|
|
|
| 9 |
licence: license
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10 |
---
|
| 11 |
|
| 12 |
# Model Card for gpt-oss-20b-dermatology-qa
|
| 13 |
|
| 14 |
+
This model is a fine-tuned version of [openai/gpt-oss-20b](https://huggingface.co/openai/gpt-oss-20b).
|
| 15 |
It has been trained using [TRL](https://github.com/huggingface/trl).
|
| 16 |
|
| 17 |
## Quick start
|
|
|
|
| 19 |
```python
|
| 20 |
from transformers import pipeline
|
| 21 |
|
| 22 |
+
question = "If you had a time machine, but could only go to the past or the future once and never return, which would you choose and why?"
|
| 23 |
+
generator = pipeline("text-generation", model="kingabzpro/gpt-oss-20b-dermatology-qa", device="cuda")
|
| 24 |
+
output = generator([{"role": "user", "content": question}], max_new_tokens=128, return_full_text=False)[0]
|
| 25 |
+
print(output["generated_text"])
|
| 26 |
+
```
|
| 27 |
|
| 28 |
+
## Training procedure
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 29 |
|
| 30 |
+
|
| 31 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 32 |
|
| 33 |
+
This model was trained with SFT.
|
| 34 |
+
|
| 35 |
+
### Framework versions
|
| 36 |
+
|
| 37 |
+
- TRL: 0.22.1
|
| 38 |
+
- Transformers: 4.55.4
|
| 39 |
+
- Pytorch: 2.8.0.dev20250319+cu128
|
| 40 |
+
- Datasets: 4.0.0
|
| 41 |
+
- Tokenizers: 0.21.4
|
| 42 |
+
|
| 43 |
+
## Citations
|
| 44 |
+
|
| 45 |
|
|
|
|
|
|
|
| 46 |
|
| 47 |
+
Cite TRL as:
|
| 48 |
+
|
| 49 |
+
```bibtex
|
| 50 |
+
@misc{vonwerra2022trl,
|
| 51 |
+
title = {{TRL: Transformer Reinforcement Learning}},
|
| 52 |
+
author = {Leandro von Werra and Younes Belkada and Lewis Tunstall and Edward Beeching and Tristan Thrush and Nathan Lambert and Shengyi Huang and Kashif Rasul and Quentin Gallou{\'e}dec},
|
| 53 |
+
year = 2020,
|
| 54 |
+
journal = {GitHub repository},
|
| 55 |
+
publisher = {GitHub},
|
| 56 |
+
howpublished = {\url{https://github.com/huggingface/trl}}
|
| 57 |
+
}
|
| 58 |
+
```
|
adapter_config.json
CHANGED
|
@@ -28,10 +28,10 @@
|
|
| 28 |
"rank_pattern": {},
|
| 29 |
"revision": null,
|
| 30 |
"target_modules": [
|
|
|
|
| 31 |
"q_proj",
|
| 32 |
-
"v_proj",
|
| 33 |
"o_proj",
|
| 34 |
-
"
|
| 35 |
],
|
| 36 |
"target_parameters": [
|
| 37 |
"7.mlp.experts.gate_up_proj",
|
|
|
|
| 28 |
"rank_pattern": {},
|
| 29 |
"revision": null,
|
| 30 |
"target_modules": [
|
| 31 |
+
"k_proj",
|
| 32 |
"q_proj",
|
|
|
|
| 33 |
"o_proj",
|
| 34 |
+
"v_proj"
|
| 35 |
],
|
| 36 |
"target_parameters": [
|
| 37 |
"7.mlp.experts.gate_up_proj",
|
adapter_model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 60189176
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b0d9138da1714e204f2ad4ebcc8d8519ab4e85b7096299a12bd96c8b34f64abd
|
| 3 |
size 60189176
|
runs/Sep03_09-59-57_61d8ce0bbd73/events.out.tfevents.1756893598.61d8ce0bbd73.321.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e7a8af51b682bc0b8f8bea3881f863eaf40b4169e2df14b9086e0b5e8b9b7d88
|
| 3 |
+
size 6494
|
runs/Sep03_10-01-15_61d8ce0bbd73/events.out.tfevents.1756893678.61d8ce0bbd73.321.1
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:66120d3af39f438c59f7488b67ef4fbab0257a800b6298a56fb37638a966c46d
|
| 3 |
+
size 6493
|
runs/Sep03_10-02-29_61d8ce0bbd73/events.out.tfevents.1756893751.61d8ce0bbd73.861.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6e38fa4ebfae282e00c2ecd8c611b90fa643204a08cb197936cd65adfa49d30e
|
| 3 |
+
size 6493
|
runs/Sep03_10-03-20_61d8ce0bbd73/events.out.tfevents.1756893802.61d8ce0bbd73.861.1
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fd2441a752b1cca01b3b12f09207151a79d40b693d6427333ffda9961776274f
|
| 3 |
+
size 6494
|
runs/Sep03_10-04-01_61d8ce0bbd73/events.out.tfevents.1756893843.61d8ce0bbd73.1127.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:623c3b00a8b13436073d67bd6559891f69da345711326322ddb6075c580ec3d9
|
| 3 |
+
size 6494
|
runs/Sep03_10-11-55_61d8ce0bbd73/events.out.tfevents.1756894418.61d8ce0bbd73.1387.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3ae3c924043441369e0d32654be986e5b14e355880d5f4435b0fe46b60e246da
|
| 3 |
+
size 6494
|
runs/Sep03_10-11-55_61d8ce0bbd73/events.out.tfevents.1756894532.61d8ce0bbd73.1387.1
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c516e8a1b32925c2c7e19a4d7e5470661f8df8c761d85251e9f53ea979985d45
|
| 3 |
+
size 6494
|
runs/Sep03_10-17-05_61d8ce0bbd73/events.out.tfevents.1756894627.61d8ce0bbd73.1856.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3697b0640edc4b0e05c48a1de044de9edc5dd57f8016a8a3ad8dd34038fb2f7e
|
| 3 |
+
size 6494
|
runs/Sep03_10-17-54_61d8ce0bbd73/events.out.tfevents.1756894678.61d8ce0bbd73.1856.1
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:760be4a96178a0030d827cdb852536210681bbf45eb8f7f774254e8e510e082d
|
| 3 |
+
size 6494
|
runs/Sep03_10-18-45_61d8ce0bbd73/events.out.tfevents.1756894727.61d8ce0bbd73.2432.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7c0dd2027b1de5dd789edc1b7c50dea9155a3b2f8edbb19062cd598d395ec85e
|
| 3 |
+
size 6494
|
runs/Sep03_10-26-32_61d8ce0bbd73/events.out.tfevents.1756895193.61d8ce0bbd73.2432.1
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a43e4197583a728237c866d45b02cfa5a2057229f7bcf2910b0341f589d0463a
|
| 3 |
+
size 6493
|
runs/Sep03_10-33-17_61d8ce0bbd73/events.out.tfevents.1756895598.61d8ce0bbd73.3117.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:47574b3c6522c1505cdcb32e66b7a982bd5aa55174761c078b2e2a61eb5c3a39
|
| 3 |
+
size 10990
|
training_args.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 6161
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:11adc9de4fb4f041b65e1f4c7ce061b9c334f015eb48dc8e24888faf14e0d75b
|
| 3 |
size 6161
|