diff --git a/.gitattributes b/.gitattributes index a6344aac8c09253b3b630fb776ae94478aa0275b..22da66ea10b5742cf5028edbed6bf8b22fe3fc82 100644 --- a/.gitattributes +++ b/.gitattributes @@ -33,3 +33,7 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text *.zip filter=lfs diff=lfs merge=lfs -text *.zst filter=lfs diff=lfs merge=lfs -text *tfevents* filter=lfs diff=lfs merge=lfs -text +*.json filter=lfs diff=lfs merge=lfs -text +*..jinja filter=lfs diff=lfs merge=lfs -text +*.jinja filter=lfs diff=lfs merge=lfs -text +*.txt filter=lfs diff=lfs merge=lfs -text diff --git a/.gitignore b/.gitignore new file mode 100644 index 0000000000000000000000000000000000000000..6642fd2cab6c45b755e7cfc78563c41e9a1f14ba --- /dev/null +++ b/.gitignore @@ -0,0 +1,5 @@ +runs +*.ipynb +utils +__pycache__ +*.py diff --git a/README.md b/README.md new file mode 100644 index 0000000000000000000000000000000000000000..2c8051bd18e2f7bb2b230fdf7ab410cc1a8077c8 --- /dev/null +++ b/README.md @@ -0,0 +1,52 @@ +--- +license: mit +task_categories: +- text-classification +language: +- fr +tags: +- text-classification +- toxicity +- hate-speech +- content-moderation +- chain-of-thought +- curriculum-learning +- nlp +- french-dataset +- classification +pretty_name: ToxiFrench +datasets: +- Naela00/ToxiFrenchFinetuning +base_model: +- Qwen/Qwen3-4B +--- + +# ToxiFrench Model + +This repository contains the **ToxiFrench** model, a **French language model** fine-tuned for **toxic comment classification**. It is based on the [**Qwen/Qwen3-4B**](https://huggingface.co/Qwen/Qwen3-4B) architecture and is designed to detect and classify toxic comments in French text. + +We performed a series of experiments to evaluate the model's performance under different fine-tuning configurations, focusing on the impact of **data selection strategies** and **Chain-of-Thought (CoT)** annotations. 
+ +## Finetuning notations + +Each experiment follows a naming scheme like: **(r/o)(e/d)(a/b)(s/m/l)** +Where: + +- `r` = random order, `o` = ordered (curriculum) +- `e` = equal toxic/non-toxic, `d` = real-world imbalance +- `a` = with CoT finetuning, `b` = without CoT +- `s` = small (100), `m` = medium (1000), `l` = large (all) + +> e.g. `rdal` is the model trained on the natural distribution of toxicity (`d`), in an arbitrary order (`r`), with CoT annotations (`a`), and on the whole dataset (`l`). + +If a label like `<cot-step>` is present in the checkpoint name, it indicates that the CoT that was used during training did not include this specific reasoning step. + +## Citation + +``` +@misc{toxifrench2025, +title={ToxiFrench}, +author={Delaval Axel}, +year={2025}, +} +``` \ No newline at end of file diff --git a/output_odal_Qwen3-4B_-/checkpoint-420/README.md b/output_odal_Qwen3-4B_-/checkpoint-420/README.md new file mode 100644 index 0000000000000000000000000000000000000000..8a9591cde2bc956137b9f7d13e4fe8be718b6a61 --- /dev/null +++ b/output_odal_Qwen3-4B_-/checkpoint-420/README.md @@ -0,0 +1,202 @@ +--- +base_model: Qwen/Qwen3-4B +library_name: peft +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + 
+## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). 
+ +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] +### Framework versions + +- PEFT 0.15.2 \ No newline at end of file diff --git a/output_odal_Qwen3-4B_-/checkpoint-420/adapter_config.json b/output_odal_Qwen3-4B_-/checkpoint-420/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..be253dec68498dcbfdb5ee8017ebd9f58db38f48 --- /dev/null +++ b/output_odal_Qwen3-4B_-/checkpoint-420/adapter_config.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7230bbb1d85421684376a57f17cb053f867a001c5ca3ff30f574021e3e3c167 +size 828 diff --git a/output_odal_Qwen3-4B_-/checkpoint-420/adapter_model.safetensors b/output_odal_Qwen3-4B_-/checkpoint-420/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7dff035cfef683187ab13cd728266b27648a5624 --- /dev/null +++ b/output_odal_Qwen3-4B_-/checkpoint-420/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a220a58078aa7dbeedaece01045895702dc1f4341e6eb68eb372147c69363b1 +size 1579102000 diff --git a/output_odal_Qwen3-4B_-/checkpoint-420/added_tokens.json 
b/output_odal_Qwen3-4B_-/checkpoint-420/added_tokens.json new file mode 100644 index 0000000000000000000000000000000000000000..2b76afd7cb1e665182c309e62849419f75306b75 --- /dev/null +++ b/output_odal_Qwen3-4B_-/checkpoint-420/added_tokens.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0284b582e14987fbd3d5a2cb2bd139084371ed9acbae488829a1c900833c680 +size 707 diff --git a/output_odal_Qwen3-4B_-/checkpoint-420/chat_template.jinja b/output_odal_Qwen3-4B_-/checkpoint-420/chat_template.jinja new file mode 100644 index 0000000000000000000000000000000000000000..d85ff3045a68273657a9f871cdb9938c940b110b --- /dev/null +++ b/output_odal_Qwen3-4B_-/checkpoint-420/chat_template.jinja @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a55ee1b1660128b7098723e0abcd92caa0788061051c62d51cbe87d9cf1974d8 +size 4168 diff --git a/output_odal_Qwen3-4B_-/checkpoint-420/global_step417/mp_rank_00_model_states.pt b/output_odal_Qwen3-4B_-/checkpoint-420/global_step417/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e04882e6f2e7bbc8e20307d26e326813e1358738 --- /dev/null +++ b/output_odal_Qwen3-4B_-/checkpoint-420/global_step417/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3fb11f9b7ee3aed9731967a002a28af3f236f98a4518f832085713aa935c238 +size 861285289 diff --git a/output_odal_Qwen3-4B_-/checkpoint-420/global_step417/zero_pp_rank_0_mp_rank_00_optim_states.pt b/output_odal_Qwen3-4B_-/checkpoint-420/global_step417/zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fecc3c7b2ed35942bf1804a53f6061ad66d2a984 --- /dev/null +++ b/output_odal_Qwen3-4B_-/checkpoint-420/global_step417/zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08ecc800d2de12d403727fce406819aa8759a2d327e157b34d6c8d2ede2f9e75 +size 77884216 diff --git 
a/output_odal_Qwen3-4B_-/checkpoint-420/global_step417/zero_pp_rank_1_mp_rank_00_optim_states.pt b/output_odal_Qwen3-4B_-/checkpoint-420/global_step417/zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7b311d4dea71ea6257dcc246914be279a25cd4b4 --- /dev/null +++ b/output_odal_Qwen3-4B_-/checkpoint-420/global_step417/zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e243d774fb8843c0a02feeee03e3cc25352a2de0ba0f907b01121a83571dbe4 +size 77884344 diff --git a/output_odal_Qwen3-4B_-/checkpoint-420/latest b/output_odal_Qwen3-4B_-/checkpoint-420/latest new file mode 100644 index 0000000000000000000000000000000000000000..744a911850c46e288735556662eb3c3fd3a8069e --- /dev/null +++ b/output_odal_Qwen3-4B_-/checkpoint-420/latest @@ -0,0 +1 @@ +global_step417 \ No newline at end of file diff --git a/output_odal_Qwen3-4B_-/checkpoint-420/merges.txt b/output_odal_Qwen3-4B_-/checkpoint-420/merges.txt new file mode 100644 index 0000000000000000000000000000000000000000..80c1a19fae38f8f4c9ab32cc9d4e145c241147e6 --- /dev/null +++ b/output_odal_Qwen3-4B_-/checkpoint-420/merges.txt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8831e4f1a044471340f7c0a83d7bd71306a5b867e95fd870f74d0c5308a904d5 +size 1671853 diff --git a/output_odal_Qwen3-4B_-/checkpoint-420/rng_state_0.pth b/output_odal_Qwen3-4B_-/checkpoint-420/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..efd7000d81494efd9615bc8778fe458e6479de73 --- /dev/null +++ b/output_odal_Qwen3-4B_-/checkpoint-420/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64120fecc819570fdb1d5359518c94d15c1bc479ba296968352e83038a4c9806 +size 14917 diff --git a/output_odal_Qwen3-4B_-/checkpoint-420/rng_state_1.pth b/output_odal_Qwen3-4B_-/checkpoint-420/rng_state_1.pth new file mode 100644 index 
0000000000000000000000000000000000000000..a33e9316a2de7cacfcd0c065a265b170753c1056 --- /dev/null +++ b/output_odal_Qwen3-4B_-/checkpoint-420/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ba0dc98ec5329a2b43a51e909701a70a2c4641578ad65d679147f68b4736f49 +size 14917 diff --git a/output_odal_Qwen3-4B_-/checkpoint-420/special_tokens_map.json b/output_odal_Qwen3-4B_-/checkpoint-420/special_tokens_map.json new file mode 100644 index 0000000000000000000000000000000000000000..ee3f6af3ba18b7d721f02bdf3fbca2814b7eda35 --- /dev/null +++ b/output_odal_Qwen3-4B_-/checkpoint-420/special_tokens_map.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76862e765266b85aa9459767e33cbaf13970f327a0e88d1c65846c2ddd3a1ecd +size 613 diff --git a/output_odal_Qwen3-4B_-/checkpoint-420/tokenizer.json b/output_odal_Qwen3-4B_-/checkpoint-420/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..cd71f61a15a522601badb3dc960d800d9cb3766c --- /dev/null +++ b/output_odal_Qwen3-4B_-/checkpoint-420/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aeb13307a71acd8fe81861d94ad54ab689df773318809eed3cbe794b4492dae4 +size 11422654 diff --git a/output_odal_Qwen3-4B_-/checkpoint-420/tokenizer_config.json b/output_odal_Qwen3-4B_-/checkpoint-420/tokenizer_config.json new file mode 100644 index 0000000000000000000000000000000000000000..0d8ad241b789c1419579e4b54e31b0befbad9882 --- /dev/null +++ b/output_odal_Qwen3-4B_-/checkpoint-420/tokenizer_config.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:443bfa629eb16387a12edbf92a76f6a6f10b2af3b53d87ba1550adfcf45f7fa0 +size 5404 diff --git a/output_odal_Qwen3-4B_-/checkpoint-420/trainer_state.json b/output_odal_Qwen3-4B_-/checkpoint-420/trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..ec6aab1a06fce6b031f477f43bc10d17a829ebf1 --- /dev/null +++ 
b/output_odal_Qwen3-4B_-/checkpoint-420/trainer_state.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7edf6e7b712340e695675a44c607e6b28efccb857b15c2f5e66703c80219d157 +size 12181 diff --git a/output_odal_Qwen3-4B_-/checkpoint-420/training_args.bin b/output_odal_Qwen3-4B_-/checkpoint-420/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..8e4cae759b1a71b73c7998972c9abc7b50ff8b9f --- /dev/null +++ b/output_odal_Qwen3-4B_-/checkpoint-420/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a27bfb6651c77744bd50f9d980f357ec5e3e1a52718e7cd7cbf37b8716ffd1a0 +size 7889 diff --git a/output_odal_Qwen3-4B_-/checkpoint-420/vocab.json b/output_odal_Qwen3-4B_-/checkpoint-420/vocab.json new file mode 100644 index 0000000000000000000000000000000000000000..6c49fc63bcb109de13abe49e58f85a4cdba7b679 --- /dev/null +++ b/output_odal_Qwen3-4B_-/checkpoint-420/vocab.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca10d7e9fb3ed18575dd1e277a2579c16d108e32f27439684afa0e10b1440910 +size 2776833 diff --git a/output_odal_Qwen3-4B_-/checkpoint-540/README.md b/output_odal_Qwen3-4B_-/checkpoint-540/README.md new file mode 100644 index 0000000000000000000000000000000000000000..8a9591cde2bc956137b9f7d13e4fe8be718b6a61 --- /dev/null +++ b/output_odal_Qwen3-4B_-/checkpoint-540/README.md @@ -0,0 +1,202 @@ +--- +base_model: Qwen/Qwen3-4B +library_name: peft +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More 
Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). 
+ +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] +### Framework versions + +- PEFT 0.15.2 \ No newline at end of file diff --git a/output_odal_Qwen3-4B_-/checkpoint-540/adapter_config.json b/output_odal_Qwen3-4B_-/checkpoint-540/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..be253dec68498dcbfdb5ee8017ebd9f58db38f48 --- /dev/null +++ b/output_odal_Qwen3-4B_-/checkpoint-540/adapter_config.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7230bbb1d85421684376a57f17cb053f867a001c5ca3ff30f574021e3e3c167 +size 828 diff --git a/output_odal_Qwen3-4B_-/checkpoint-540/adapter_model.safetensors b/output_odal_Qwen3-4B_-/checkpoint-540/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..42d12920ab2100b63ee306b46971e6b5ac4c2d6a --- /dev/null +++ b/output_odal_Qwen3-4B_-/checkpoint-540/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c471f33c6fc5d1b0487803f39021414584e6964957f7dcb91fdb3d4da087e4a +size 1579102000 diff --git a/output_odal_Qwen3-4B_-/checkpoint-540/added_tokens.json 
b/output_odal_Qwen3-4B_-/checkpoint-540/added_tokens.json new file mode 100644 index 0000000000000000000000000000000000000000..2b76afd7cb1e665182c309e62849419f75306b75 --- /dev/null +++ b/output_odal_Qwen3-4B_-/checkpoint-540/added_tokens.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0284b582e14987fbd3d5a2cb2bd139084371ed9acbae488829a1c900833c680 +size 707 diff --git a/output_odal_Qwen3-4B_-/checkpoint-540/chat_template.jinja b/output_odal_Qwen3-4B_-/checkpoint-540/chat_template.jinja new file mode 100644 index 0000000000000000000000000000000000000000..d85ff3045a68273657a9f871cdb9938c940b110b --- /dev/null +++ b/output_odal_Qwen3-4B_-/checkpoint-540/chat_template.jinja @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a55ee1b1660128b7098723e0abcd92caa0788061051c62d51cbe87d9cf1974d8 +size 4168 diff --git a/output_odal_Qwen3-4B_-/checkpoint-540/global_step537/mp_rank_00_model_states.pt b/output_odal_Qwen3-4B_-/checkpoint-540/global_step537/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca52b3abb2e207a1c409494ede34271167031113 --- /dev/null +++ b/output_odal_Qwen3-4B_-/checkpoint-540/global_step537/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13b33c193c2b7d902bb1ae931585374f558951cc8f5b1f09751d7e4f11efee8b +size 861285289 diff --git a/output_odal_Qwen3-4B_-/checkpoint-540/global_step537/zero_pp_rank_0_mp_rank_00_optim_states.pt b/output_odal_Qwen3-4B_-/checkpoint-540/global_step537/zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6cce3f723536b4fe2fff9898975abeee5a6dfaa4 --- /dev/null +++ b/output_odal_Qwen3-4B_-/checkpoint-540/global_step537/zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:204b03392e17cccf47207ab9b7349f85e22381962ecc6d97cfccfe2d0d4d6aef +size 77884216 diff --git 
a/output_odal_Qwen3-4B_-/checkpoint-540/global_step537/zero_pp_rank_1_mp_rank_00_optim_states.pt b/output_odal_Qwen3-4B_-/checkpoint-540/global_step537/zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..60206c3f8ed451bea561fabc907c8f3cd539a086 --- /dev/null +++ b/output_odal_Qwen3-4B_-/checkpoint-540/global_step537/zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10c42677818f4adf001cbf6c00c7b76b8d896d4a9cb17ef3016b2d207d60befe +size 77884344 diff --git a/output_odal_Qwen3-4B_-/checkpoint-540/latest b/output_odal_Qwen3-4B_-/checkpoint-540/latest new file mode 100644 index 0000000000000000000000000000000000000000..57b7e8212ad3c9da2b37172bdd0e1e5a8a199ff7 --- /dev/null +++ b/output_odal_Qwen3-4B_-/checkpoint-540/latest @@ -0,0 +1 @@ +global_step537 \ No newline at end of file diff --git a/output_odal_Qwen3-4B_-/checkpoint-540/merges.txt b/output_odal_Qwen3-4B_-/checkpoint-540/merges.txt new file mode 100644 index 0000000000000000000000000000000000000000..80c1a19fae38f8f4c9ab32cc9d4e145c241147e6 --- /dev/null +++ b/output_odal_Qwen3-4B_-/checkpoint-540/merges.txt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8831e4f1a044471340f7c0a83d7bd71306a5b867e95fd870f74d0c5308a904d5 +size 1671853 diff --git a/output_odal_Qwen3-4B_-/checkpoint-540/rng_state_0.pth b/output_odal_Qwen3-4B_-/checkpoint-540/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..dee58b4fa19ce06e7c0cfd31405132092a4adf01 --- /dev/null +++ b/output_odal_Qwen3-4B_-/checkpoint-540/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:efc3b787ee0ff48b74e4adb7f937bf74a2a5d3e1b0b23c24d989611139cd39a8 +size 14917 diff --git a/output_odal_Qwen3-4B_-/checkpoint-540/rng_state_1.pth b/output_odal_Qwen3-4B_-/checkpoint-540/rng_state_1.pth new file mode 100644 index 
0000000000000000000000000000000000000000..5651ee09c53f084099f95baff97fc2ba8306b343 --- /dev/null +++ b/output_odal_Qwen3-4B_-/checkpoint-540/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab9aa2a52ba9cac6bf490c27ae75cc2de3c5f6ea1426cba772af0e6552d96aaa +size 14917 diff --git a/output_odal_Qwen3-4B_-/checkpoint-540/special_tokens_map.json b/output_odal_Qwen3-4B_-/checkpoint-540/special_tokens_map.json new file mode 100644 index 0000000000000000000000000000000000000000..ee3f6af3ba18b7d721f02bdf3fbca2814b7eda35 --- /dev/null +++ b/output_odal_Qwen3-4B_-/checkpoint-540/special_tokens_map.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76862e765266b85aa9459767e33cbaf13970f327a0e88d1c65846c2ddd3a1ecd +size 613 diff --git a/output_odal_Qwen3-4B_-/checkpoint-540/tokenizer.json b/output_odal_Qwen3-4B_-/checkpoint-540/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..cd71f61a15a522601badb3dc960d800d9cb3766c --- /dev/null +++ b/output_odal_Qwen3-4B_-/checkpoint-540/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aeb13307a71acd8fe81861d94ad54ab689df773318809eed3cbe794b4492dae4 +size 11422654 diff --git a/output_odal_Qwen3-4B_-/checkpoint-540/tokenizer_config.json b/output_odal_Qwen3-4B_-/checkpoint-540/tokenizer_config.json new file mode 100644 index 0000000000000000000000000000000000000000..0d8ad241b789c1419579e4b54e31b0befbad9882 --- /dev/null +++ b/output_odal_Qwen3-4B_-/checkpoint-540/tokenizer_config.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:443bfa629eb16387a12edbf92a76f6a6f10b2af3b53d87ba1550adfcf45f7fa0 +size 5404 diff --git a/output_odal_Qwen3-4B_-/checkpoint-540/trainer_state.json b/output_odal_Qwen3-4B_-/checkpoint-540/trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..dbf3b55ebc03a5545aa2ed87b90b4752d98d225e --- /dev/null +++ 
b/output_odal_Qwen3-4B_-/checkpoint-540/trainer_state.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01345551b3a74614e68a28d05230f65c1885f628069ad92d27efbc75568fafd3 +size 15288 diff --git a/output_odal_Qwen3-4B_-/checkpoint-540/training_args.bin b/output_odal_Qwen3-4B_-/checkpoint-540/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..8e4cae759b1a71b73c7998972c9abc7b50ff8b9f --- /dev/null +++ b/output_odal_Qwen3-4B_-/checkpoint-540/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a27bfb6651c77744bd50f9d980f357ec5e3e1a52718e7cd7cbf37b8716ffd1a0 +size 7889 diff --git a/output_odal_Qwen3-4B_-/checkpoint-540/vocab.json b/output_odal_Qwen3-4B_-/checkpoint-540/vocab.json new file mode 100644 index 0000000000000000000000000000000000000000..6c49fc63bcb109de13abe49e58f85a4cdba7b679 --- /dev/null +++ b/output_odal_Qwen3-4B_-/checkpoint-540/vocab.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca10d7e9fb3ed18575dd1e277a2579c16d108e32f27439684afa0e10b1440910 +size 2776833 diff --git a/output_odal_Qwen3-4B_-/checkpoint-548/README.md b/output_odal_Qwen3-4B_-/checkpoint-548/README.md new file mode 100644 index 0000000000000000000000000000000000000000..8a9591cde2bc956137b9f7d13e4fe8be718b6a61 --- /dev/null +++ b/output_odal_Qwen3-4B_-/checkpoint-548/README.md @@ -0,0 +1,202 @@ +--- +base_model: Qwen/Qwen3-4B +library_name: peft +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More 
Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). 
+ +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] +### Framework versions + +- PEFT 0.15.2 \ No newline at end of file diff --git a/output_odal_Qwen3-4B_-/checkpoint-548/adapter_config.json b/output_odal_Qwen3-4B_-/checkpoint-548/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..be253dec68498dcbfdb5ee8017ebd9f58db38f48 --- /dev/null +++ b/output_odal_Qwen3-4B_-/checkpoint-548/adapter_config.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7230bbb1d85421684376a57f17cb053f867a001c5ca3ff30f574021e3e3c167 +size 828 diff --git a/output_odal_Qwen3-4B_-/checkpoint-548/adapter_model.safetensors b/output_odal_Qwen3-4B_-/checkpoint-548/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2949a097beec7ba8aca29b37e655cc530e3d6c67 --- /dev/null +++ b/output_odal_Qwen3-4B_-/checkpoint-548/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:26893ada07476813e552f5b735e06edccb0cd089b10d53d94551e2d2500e1e97 +size 1579102000 diff --git a/output_odal_Qwen3-4B_-/checkpoint-548/added_tokens.json 
b/output_odal_Qwen3-4B_-/checkpoint-548/added_tokens.json new file mode 100644 index 0000000000000000000000000000000000000000..2b76afd7cb1e665182c309e62849419f75306b75 --- /dev/null +++ b/output_odal_Qwen3-4B_-/checkpoint-548/added_tokens.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0284b582e14987fbd3d5a2cb2bd139084371ed9acbae488829a1c900833c680 +size 707 diff --git a/output_odal_Qwen3-4B_-/checkpoint-548/chat_template.jinja b/output_odal_Qwen3-4B_-/checkpoint-548/chat_template.jinja new file mode 100644 index 0000000000000000000000000000000000000000..d85ff3045a68273657a9f871cdb9938c940b110b --- /dev/null +++ b/output_odal_Qwen3-4B_-/checkpoint-548/chat_template.jinja @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a55ee1b1660128b7098723e0abcd92caa0788061051c62d51cbe87d9cf1974d8 +size 4168 diff --git a/output_odal_Qwen3-4B_-/checkpoint-548/global_step544/mp_rank_00_model_states.pt b/output_odal_Qwen3-4B_-/checkpoint-548/global_step544/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7b4f3e2c1df07f23dc5627003d5725479cc2d41f --- /dev/null +++ b/output_odal_Qwen3-4B_-/checkpoint-548/global_step544/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a1c3516b4a07c885d519f0cc8a1565eb7b7ba12a68e505ef91ca0c1c7de3051 +size 861285289 diff --git a/output_odal_Qwen3-4B_-/checkpoint-548/global_step544/zero_pp_rank_0_mp_rank_00_optim_states.pt b/output_odal_Qwen3-4B_-/checkpoint-548/global_step544/zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e56ca1bdf669f63b6b92aff588effb08c4c207e6 --- /dev/null +++ b/output_odal_Qwen3-4B_-/checkpoint-548/global_step544/zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:867cffbbad20a1e9bff6de7622f9decd1c4c67297eb52c36c79d0979836295b6 +size 77884216 diff --git 
a/output_odal_Qwen3-4B_-/checkpoint-548/global_step544/zero_pp_rank_1_mp_rank_00_optim_states.pt b/output_odal_Qwen3-4B_-/checkpoint-548/global_step544/zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..598fc516629dea5eef4b24d52d1b97f06beab24c --- /dev/null +++ b/output_odal_Qwen3-4B_-/checkpoint-548/global_step544/zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13c1d9114cd659bdf29f4fd0586888c9f537af1932aa28489a994545fb0747f9 +size 77884344 diff --git a/output_odal_Qwen3-4B_-/checkpoint-548/latest b/output_odal_Qwen3-4B_-/checkpoint-548/latest new file mode 100644 index 0000000000000000000000000000000000000000..606df2a525126f7e381b691c76048c61744888b9 --- /dev/null +++ b/output_odal_Qwen3-4B_-/checkpoint-548/latest @@ -0,0 +1 @@ +global_step544 \ No newline at end of file diff --git a/output_odal_Qwen3-4B_-/checkpoint-548/merges.txt b/output_odal_Qwen3-4B_-/checkpoint-548/merges.txt new file mode 100644 index 0000000000000000000000000000000000000000..80c1a19fae38f8f4c9ab32cc9d4e145c241147e6 --- /dev/null +++ b/output_odal_Qwen3-4B_-/checkpoint-548/merges.txt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8831e4f1a044471340f7c0a83d7bd71306a5b867e95fd870f74d0c5308a904d5 +size 1671853 diff --git a/output_odal_Qwen3-4B_-/checkpoint-548/rng_state_0.pth b/output_odal_Qwen3-4B_-/checkpoint-548/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..5508ce29aeb03fc30b337bbbbdeb7f2757b7341e --- /dev/null +++ b/output_odal_Qwen3-4B_-/checkpoint-548/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b7e02beb04282fa93748a1dd67ed95925f835cc32b9c3072cb8deb9f80998f9 +size 14917 diff --git a/output_odal_Qwen3-4B_-/checkpoint-548/rng_state_1.pth b/output_odal_Qwen3-4B_-/checkpoint-548/rng_state_1.pth new file mode 100644 index 
0000000000000000000000000000000000000000..596b99c6425c85dcbee56a0419d7fbc6905105bd --- /dev/null +++ b/output_odal_Qwen3-4B_-/checkpoint-548/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d09f0823075e37e6957d135b46bb4963f36bc5c28c69980181c8abe4649b55d2 +size 14917 diff --git a/output_odal_Qwen3-4B_-/checkpoint-548/special_tokens_map.json b/output_odal_Qwen3-4B_-/checkpoint-548/special_tokens_map.json new file mode 100644 index 0000000000000000000000000000000000000000..ee3f6af3ba18b7d721f02bdf3fbca2814b7eda35 --- /dev/null +++ b/output_odal_Qwen3-4B_-/checkpoint-548/special_tokens_map.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76862e765266b85aa9459767e33cbaf13970f327a0e88d1c65846c2ddd3a1ecd +size 613 diff --git a/output_odal_Qwen3-4B_-/checkpoint-548/tokenizer.json b/output_odal_Qwen3-4B_-/checkpoint-548/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..cd71f61a15a522601badb3dc960d800d9cb3766c --- /dev/null +++ b/output_odal_Qwen3-4B_-/checkpoint-548/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aeb13307a71acd8fe81861d94ad54ab689df773318809eed3cbe794b4492dae4 +size 11422654 diff --git a/output_odal_Qwen3-4B_-/checkpoint-548/tokenizer_config.json b/output_odal_Qwen3-4B_-/checkpoint-548/tokenizer_config.json new file mode 100644 index 0000000000000000000000000000000000000000..0d8ad241b789c1419579e4b54e31b0befbad9882 --- /dev/null +++ b/output_odal_Qwen3-4B_-/checkpoint-548/tokenizer_config.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:443bfa629eb16387a12edbf92a76f6a6f10b2af3b53d87ba1550adfcf45f7fa0 +size 5404 diff --git a/output_odal_Qwen3-4B_-/checkpoint-548/trainer_state.json b/output_odal_Qwen3-4B_-/checkpoint-548/trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..afc5664a77a8f0edbe852fe36d45cc0042d87363 --- /dev/null +++ 
b/output_odal_Qwen3-4B_-/checkpoint-548/trainer_state.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ef02a773b67e56bbc465a64f7f0b65163e1392e18ce9dd4b0f9e05646771fbd +size 15273 diff --git a/output_odal_Qwen3-4B_-/checkpoint-548/training_args.bin b/output_odal_Qwen3-4B_-/checkpoint-548/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..8e4cae759b1a71b73c7998972c9abc7b50ff8b9f --- /dev/null +++ b/output_odal_Qwen3-4B_-/checkpoint-548/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a27bfb6651c77744bd50f9d980f357ec5e3e1a52718e7cd7cbf37b8716ffd1a0 +size 7889 diff --git a/output_odal_Qwen3-4B_-/checkpoint-548/vocab.json b/output_odal_Qwen3-4B_-/checkpoint-548/vocab.json new file mode 100644 index 0000000000000000000000000000000000000000..6c49fc63bcb109de13abe49e58f85a4cdba7b679 --- /dev/null +++ b/output_odal_Qwen3-4B_-/checkpoint-548/vocab.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca10d7e9fb3ed18575dd1e277a2579c16d108e32f27439684afa0e10b1440910 +size 2776833 diff --git a/output_odal_Qwen3-4B_-/final_adapters/README.md b/output_odal_Qwen3-4B_-/final_adapters/README.md new file mode 100644 index 0000000000000000000000000000000000000000..8a9591cde2bc956137b9f7d13e4fe8be718b6a61 --- /dev/null +++ b/output_odal_Qwen3-4B_-/final_adapters/README.md @@ -0,0 +1,202 @@ +--- +base_model: Qwen/Qwen3-4B +library_name: peft +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More 
Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). 
+ +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] +### Framework versions + +- PEFT 0.15.2 \ No newline at end of file diff --git a/output_odal_Qwen3-4B_-/final_adapters/adapter_config.json b/output_odal_Qwen3-4B_-/final_adapters/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..be253dec68498dcbfdb5ee8017ebd9f58db38f48 --- /dev/null +++ b/output_odal_Qwen3-4B_-/final_adapters/adapter_config.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7230bbb1d85421684376a57f17cb053f867a001c5ca3ff30f574021e3e3c167 +size 828 diff --git a/output_odal_Qwen3-4B_-/final_adapters/adapter_model.safetensors b/output_odal_Qwen3-4B_-/final_adapters/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7dff035cfef683187ab13cd728266b27648a5624 --- /dev/null +++ b/output_odal_Qwen3-4B_-/final_adapters/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a220a58078aa7dbeedaece01045895702dc1f4341e6eb68eb372147c69363b1 +size 1579102000 diff --git a/output_odal_Qwen3-4B_-/final_adapters/added_tokens.json 
b/output_odal_Qwen3-4B_-/final_adapters/added_tokens.json new file mode 100644 index 0000000000000000000000000000000000000000..2b76afd7cb1e665182c309e62849419f75306b75 --- /dev/null +++ b/output_odal_Qwen3-4B_-/final_adapters/added_tokens.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0284b582e14987fbd3d5a2cb2bd139084371ed9acbae488829a1c900833c680 +size 707 diff --git a/output_odal_Qwen3-4B_-/final_adapters/chat_template.jinja b/output_odal_Qwen3-4B_-/final_adapters/chat_template.jinja new file mode 100644 index 0000000000000000000000000000000000000000..d85ff3045a68273657a9f871cdb9938c940b110b --- /dev/null +++ b/output_odal_Qwen3-4B_-/final_adapters/chat_template.jinja @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a55ee1b1660128b7098723e0abcd92caa0788061051c62d51cbe87d9cf1974d8 +size 4168 diff --git a/output_odal_Qwen3-4B_-/final_adapters/merges.txt b/output_odal_Qwen3-4B_-/final_adapters/merges.txt new file mode 100644 index 0000000000000000000000000000000000000000..80c1a19fae38f8f4c9ab32cc9d4e145c241147e6 --- /dev/null +++ b/output_odal_Qwen3-4B_-/final_adapters/merges.txt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8831e4f1a044471340f7c0a83d7bd71306a5b867e95fd870f74d0c5308a904d5 +size 1671853 diff --git a/output_odal_Qwen3-4B_-/final_adapters/special_tokens_map.json b/output_odal_Qwen3-4B_-/final_adapters/special_tokens_map.json new file mode 100644 index 0000000000000000000000000000000000000000..ee3f6af3ba18b7d721f02bdf3fbca2814b7eda35 --- /dev/null +++ b/output_odal_Qwen3-4B_-/final_adapters/special_tokens_map.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76862e765266b85aa9459767e33cbaf13970f327a0e88d1c65846c2ddd3a1ecd +size 613 diff --git a/output_odal_Qwen3-4B_-/final_adapters/tokenizer.json b/output_odal_Qwen3-4B_-/final_adapters/tokenizer.json new file mode 100644 index 
0000000000000000000000000000000000000000..cd71f61a15a522601badb3dc960d800d9cb3766c --- /dev/null +++ b/output_odal_Qwen3-4B_-/final_adapters/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aeb13307a71acd8fe81861d94ad54ab689df773318809eed3cbe794b4492dae4 +size 11422654 diff --git a/output_odal_Qwen3-4B_-/final_adapters/tokenizer_config.json b/output_odal_Qwen3-4B_-/final_adapters/tokenizer_config.json new file mode 100644 index 0000000000000000000000000000000000000000..0d8ad241b789c1419579e4b54e31b0befbad9882 --- /dev/null +++ b/output_odal_Qwen3-4B_-/final_adapters/tokenizer_config.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:443bfa629eb16387a12edbf92a76f6a6f10b2af3b53d87ba1550adfcf45f7fa0 +size 5404 diff --git a/output_odal_Qwen3-4B_-/final_adapters/training_args.bin b/output_odal_Qwen3-4B_-/final_adapters/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..8e4cae759b1a71b73c7998972c9abc7b50ff8b9f --- /dev/null +++ b/output_odal_Qwen3-4B_-/final_adapters/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a27bfb6651c77744bd50f9d980f357ec5e3e1a52718e7cd7cbf37b8716ffd1a0 +size 7889 diff --git a/output_odal_Qwen3-4B_-/final_adapters/vocab.json b/output_odal_Qwen3-4B_-/final_adapters/vocab.json new file mode 100644 index 0000000000000000000000000000000000000000..6c49fc63bcb109de13abe49e58f85a4cdba7b679 --- /dev/null +++ b/output_odal_Qwen3-4B_-/final_adapters/vocab.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca10d7e9fb3ed18575dd1e277a2579c16d108e32f27439684afa0e10b1440910 +size 2776833 diff --git a/output_oeal_Qwen3-4B_-/checkpoint-600/README.md b/output_oeal_Qwen3-4B_-/checkpoint-600/README.md new file mode 100644 index 0000000000000000000000000000000000000000..8a9591cde2bc956137b9f7d13e4fe8be718b6a61 --- /dev/null +++ b/output_oeal_Qwen3-4B_-/checkpoint-600/README.md @@ -0,0 +1,202 @@ +--- 
+base_model: Qwen/Qwen3-4B +library_name: peft +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. 
+ +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] +### Framework versions + +- PEFT 0.15.2 \ No newline at end of file diff --git a/output_oeal_Qwen3-4B_-/checkpoint-600/adapter_config.json b/output_oeal_Qwen3-4B_-/checkpoint-600/adapter_config.json new file 
mode 100644 index 0000000000000000000000000000000000000000..cd249f2932b8f8b3c4a8cd8984ec276952c599b8 --- /dev/null +++ b/output_oeal_Qwen3-4B_-/checkpoint-600/adapter_config.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:15769b4da00c79f0e2677ff72e6e8ae172b3155e62b376e58a93c8952efb6995 +size 828 diff --git a/output_oeal_Qwen3-4B_-/checkpoint-600/adapter_model.safetensors b/output_oeal_Qwen3-4B_-/checkpoint-600/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6d5bc7dcd4aa1c7cb99c97149e7f78a4e108c2b9 --- /dev/null +++ b/output_oeal_Qwen3-4B_-/checkpoint-600/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e56fe94c129a90a2cce427c5a16d0c7a8a3dcb5dd33db50a0a4da7ae9f7b392 +size 1579102000 diff --git a/output_oeal_Qwen3-4B_-/checkpoint-600/added_tokens.json b/output_oeal_Qwen3-4B_-/checkpoint-600/added_tokens.json new file mode 100644 index 0000000000000000000000000000000000000000..2b76afd7cb1e665182c309e62849419f75306b75 --- /dev/null +++ b/output_oeal_Qwen3-4B_-/checkpoint-600/added_tokens.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0284b582e14987fbd3d5a2cb2bd139084371ed9acbae488829a1c900833c680 +size 707 diff --git a/output_oeal_Qwen3-4B_-/checkpoint-600/chat_template.jinja b/output_oeal_Qwen3-4B_-/checkpoint-600/chat_template.jinja new file mode 100644 index 0000000000000000000000000000000000000000..d85ff3045a68273657a9f871cdb9938c940b110b --- /dev/null +++ b/output_oeal_Qwen3-4B_-/checkpoint-600/chat_template.jinja @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a55ee1b1660128b7098723e0abcd92caa0788061051c62d51cbe87d9cf1974d8 +size 4168 diff --git a/output_oeal_Qwen3-4B_-/checkpoint-600/global_step598/mp_rank_00_model_states.pt b/output_oeal_Qwen3-4B_-/checkpoint-600/global_step598/mp_rank_00_model_states.pt new file mode 100644 index 
0000000000000000000000000000000000000000..5d995e0372057203167379d42e1a3daab3b751a7 --- /dev/null +++ b/output_oeal_Qwen3-4B_-/checkpoint-600/global_step598/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae1390bd0c5adb4508d3c6d79fbc1b1ced1fec86355db6e0e041ec7c494321c2 +size 861285289 diff --git a/output_oeal_Qwen3-4B_-/checkpoint-600/global_step598/zero_pp_rank_0_mp_rank_00_optim_states.pt b/output_oeal_Qwen3-4B_-/checkpoint-600/global_step598/zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..394edad0dc87a646636323a9c8346e11c29682b2 --- /dev/null +++ b/output_oeal_Qwen3-4B_-/checkpoint-600/global_step598/zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:766446e3e181e416fafe2ce7b72f9a198e297cb4c16bce846bc77fa3b34e5a64 +size 77884216 diff --git a/output_oeal_Qwen3-4B_-/checkpoint-600/global_step598/zero_pp_rank_1_mp_rank_00_optim_states.pt b/output_oeal_Qwen3-4B_-/checkpoint-600/global_step598/zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..20e0ec762f31ad2ac1e4dfb804dc7d16cce9884d --- /dev/null +++ b/output_oeal_Qwen3-4B_-/checkpoint-600/global_step598/zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0521582f76826e13cd387f41808bc76398e001100005cf16e813f4ea94fceaa3 +size 77884344 diff --git a/output_oeal_Qwen3-4B_-/checkpoint-600/latest b/output_oeal_Qwen3-4B_-/checkpoint-600/latest new file mode 100644 index 0000000000000000000000000000000000000000..8a87fdc3e8d4d236bfa15c87e3acae6c027d8460 --- /dev/null +++ b/output_oeal_Qwen3-4B_-/checkpoint-600/latest @@ -0,0 +1 @@ +global_step598 \ No newline at end of file diff --git a/output_oeal_Qwen3-4B_-/checkpoint-600/merges.txt b/output_oeal_Qwen3-4B_-/checkpoint-600/merges.txt new file mode 100644 index 
0000000000000000000000000000000000000000..80c1a19fae38f8f4c9ab32cc9d4e145c241147e6 --- /dev/null +++ b/output_oeal_Qwen3-4B_-/checkpoint-600/merges.txt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8831e4f1a044471340f7c0a83d7bd71306a5b867e95fd870f74d0c5308a904d5 +size 1671853 diff --git a/output_oeal_Qwen3-4B_-/checkpoint-600/rng_state_0.pth b/output_oeal_Qwen3-4B_-/checkpoint-600/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..d7eff0c6f8bbdccfdc6598329e45f13796e054a3 --- /dev/null +++ b/output_oeal_Qwen3-4B_-/checkpoint-600/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:233b2beced6e46147e0d535df7bc94f047fc8d7a5b3828b381e1077e8f5af631 +size 14917 diff --git a/output_oeal_Qwen3-4B_-/checkpoint-600/rng_state_1.pth b/output_oeal_Qwen3-4B_-/checkpoint-600/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..e728608c4aa596f9c27f17e87e5a2c0dc51dcfef --- /dev/null +++ b/output_oeal_Qwen3-4B_-/checkpoint-600/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:105643a0823f635ae4241293ce5ef99154425d151fa6cccca68105b0514afe8e +size 14917 diff --git a/output_oeal_Qwen3-4B_-/checkpoint-600/special_tokens_map.json b/output_oeal_Qwen3-4B_-/checkpoint-600/special_tokens_map.json new file mode 100644 index 0000000000000000000000000000000000000000..ee3f6af3ba18b7d721f02bdf3fbca2814b7eda35 --- /dev/null +++ b/output_oeal_Qwen3-4B_-/checkpoint-600/special_tokens_map.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76862e765266b85aa9459767e33cbaf13970f327a0e88d1c65846c2ddd3a1ecd +size 613 diff --git a/output_oeal_Qwen3-4B_-/checkpoint-600/tokenizer.json b/output_oeal_Qwen3-4B_-/checkpoint-600/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..38dda57c0535c5ded5ad9b8a5b8c4e4a89aba355 --- /dev/null +++ b/output_oeal_Qwen3-4B_-/checkpoint-600/tokenizer.json @@ 
-0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:abfbf1d13376ad75c980dc37b59f5030a8eac0ced7b8fef55166f88a7c9cac34 +size 11422922 diff --git a/output_oeal_Qwen3-4B_-/checkpoint-600/tokenizer_config.json b/output_oeal_Qwen3-4B_-/checkpoint-600/tokenizer_config.json new file mode 100644 index 0000000000000000000000000000000000000000..0d8ad241b789c1419579e4b54e31b0befbad9882 --- /dev/null +++ b/output_oeal_Qwen3-4B_-/checkpoint-600/tokenizer_config.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:443bfa629eb16387a12edbf92a76f6a6f10b2af3b53d87ba1550adfcf45f7fa0 +size 5404 diff --git a/output_oeal_Qwen3-4B_-/checkpoint-600/trainer_state.json b/output_oeal_Qwen3-4B_-/checkpoint-600/trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..d6762f439a816a01e58b795420316b017ad3cb67 --- /dev/null +++ b/output_oeal_Qwen3-4B_-/checkpoint-600/trainer_state.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ab9184fef1f179e65d79c352fd52ae7bdaec8e57010e8d814c3c2dcfb0365ec +size 16728 diff --git a/output_oeal_Qwen3-4B_-/checkpoint-600/training_args.bin b/output_oeal_Qwen3-4B_-/checkpoint-600/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..970918e1fdea383f7bbb41f529e5a496c104d052 --- /dev/null +++ b/output_oeal_Qwen3-4B_-/checkpoint-600/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9564a20f74071dd6173ca96b7e99f3be3226a0e2e863768a3896c383c6d2b1d8 +size 7889 diff --git a/output_oeal_Qwen3-4B_-/checkpoint-600/vocab.json b/output_oeal_Qwen3-4B_-/checkpoint-600/vocab.json new file mode 100644 index 0000000000000000000000000000000000000000..6c49fc63bcb109de13abe49e58f85a4cdba7b679 --- /dev/null +++ b/output_oeal_Qwen3-4B_-/checkpoint-600/vocab.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca10d7e9fb3ed18575dd1e277a2579c16d108e32f27439684afa0e10b1440910 +size 2776833 diff 
--git a/output_oeal_Qwen3-4B_-/checkpoint-825/README.md b/output_oeal_Qwen3-4B_-/checkpoint-825/README.md new file mode 100644 index 0000000000000000000000000000000000000000..8a9591cde2bc956137b9f7d13e4fe8be718b6a61 --- /dev/null +++ b/output_oeal_Qwen3-4B_-/checkpoint-825/README.md @@ -0,0 +1,202 @@ +--- +base_model: Qwen/Qwen3-4B +library_name: peft +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. 
+ +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] +### Framework versions + +- PEFT 0.15.2 \ No newline at end of file diff --git a/output_oeal_Qwen3-4B_-/checkpoint-825/adapter_config.json b/output_oeal_Qwen3-4B_-/checkpoint-825/adapter_config.json new file 
mode 100644 index 0000000000000000000000000000000000000000..98d21361e8add1621cb60814b662f410dfd8a4d2 --- /dev/null +++ b/output_oeal_Qwen3-4B_-/checkpoint-825/adapter_config.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53183f3f05d47d7c6bb299d56ed6ce9b4c94ef4829073161a1bc1cf936c1da95 +size 828 diff --git a/output_oeal_Qwen3-4B_-/checkpoint-825/adapter_model.safetensors b/output_oeal_Qwen3-4B_-/checkpoint-825/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..139edc6486bbf92d6c8a7fe0f3eb9e7bad9f22ee --- /dev/null +++ b/output_oeal_Qwen3-4B_-/checkpoint-825/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09fb0fba50e3d1b869029cb3479b989a794f19d2cab4c0f5adeff4db2a45332f +size 1579102000 diff --git a/output_oeal_Qwen3-4B_-/checkpoint-825/added_tokens.json b/output_oeal_Qwen3-4B_-/checkpoint-825/added_tokens.json new file mode 100644 index 0000000000000000000000000000000000000000..2b76afd7cb1e665182c309e62849419f75306b75 --- /dev/null +++ b/output_oeal_Qwen3-4B_-/checkpoint-825/added_tokens.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0284b582e14987fbd3d5a2cb2bd139084371ed9acbae488829a1c900833c680 +size 707 diff --git a/output_oeal_Qwen3-4B_-/checkpoint-825/chat_template.jinja b/output_oeal_Qwen3-4B_-/checkpoint-825/chat_template.jinja new file mode 100644 index 0000000000000000000000000000000000000000..d85ff3045a68273657a9f871cdb9938c940b110b --- /dev/null +++ b/output_oeal_Qwen3-4B_-/checkpoint-825/chat_template.jinja @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a55ee1b1660128b7098723e0abcd92caa0788061051c62d51cbe87d9cf1974d8 +size 4168 diff --git a/output_oeal_Qwen3-4B_-/checkpoint-825/global_step823/mp_rank_00_model_states.pt b/output_oeal_Qwen3-4B_-/checkpoint-825/global_step823/mp_rank_00_model_states.pt new file mode 100644 index 
0000000000000000000000000000000000000000..89378c740d958b31d7c06ba23e53444b38b730e0 --- /dev/null +++ b/output_oeal_Qwen3-4B_-/checkpoint-825/global_step823/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d569f7008849597dc03b209932701a12d72c37e6551985cf62235c78bbad3d6 +size 861285289 diff --git a/output_oeal_Qwen3-4B_-/checkpoint-825/global_step823/zero_pp_rank_0_mp_rank_00_optim_states.pt b/output_oeal_Qwen3-4B_-/checkpoint-825/global_step823/zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..384256e066bd4c5be074b4f632d96efe536821d2 --- /dev/null +++ b/output_oeal_Qwen3-4B_-/checkpoint-825/global_step823/zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08f118621f501dda771721e6663a92ff1e2517a009bb88a5dfd851c27eebff9e +size 77884216 diff --git a/output_oeal_Qwen3-4B_-/checkpoint-825/global_step823/zero_pp_rank_1_mp_rank_00_optim_states.pt b/output_oeal_Qwen3-4B_-/checkpoint-825/global_step823/zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c7f5075f6fbec0bfb96e16e0b6042f441fc843fe --- /dev/null +++ b/output_oeal_Qwen3-4B_-/checkpoint-825/global_step823/zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:36fb106d4a44efbe4dcaf3dc0b27227e7c1efc0aa59d85f6d0ecf0ecab84d52f +size 77884344 diff --git a/output_oeal_Qwen3-4B_-/checkpoint-825/latest b/output_oeal_Qwen3-4B_-/checkpoint-825/latest new file mode 100644 index 0000000000000000000000000000000000000000..4880e0a8911d24e8ce61af5ad62ac0d0852b45c8 --- /dev/null +++ b/output_oeal_Qwen3-4B_-/checkpoint-825/latest @@ -0,0 +1 @@ +global_step823 \ No newline at end of file diff --git a/output_oeal_Qwen3-4B_-/checkpoint-825/merges.txt b/output_oeal_Qwen3-4B_-/checkpoint-825/merges.txt new file mode 100644 index 
0000000000000000000000000000000000000000..80c1a19fae38f8f4c9ab32cc9d4e145c241147e6 --- /dev/null +++ b/output_oeal_Qwen3-4B_-/checkpoint-825/merges.txt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8831e4f1a044471340f7c0a83d7bd71306a5b867e95fd870f74d0c5308a904d5 +size 1671853 diff --git a/output_oeal_Qwen3-4B_-/checkpoint-825/rng_state_0.pth b/output_oeal_Qwen3-4B_-/checkpoint-825/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..f68e915e4c28b709e57a9fe5c3ffeb4cb4bd3280 --- /dev/null +++ b/output_oeal_Qwen3-4B_-/checkpoint-825/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:87160020f4c1dbed7fa165014564075920bf49d7bc5d07a8e663424fa0b17936 +size 14917 diff --git a/output_oeal_Qwen3-4B_-/checkpoint-825/rng_state_1.pth b/output_oeal_Qwen3-4B_-/checkpoint-825/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..009475b11f208037e428b8b86c5e407c89e5e5bc --- /dev/null +++ b/output_oeal_Qwen3-4B_-/checkpoint-825/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf86cbfd1e20cd659804a794b27ce82a92404ae158674bcd150593de2b21abcd +size 14917 diff --git a/output_oeal_Qwen3-4B_-/checkpoint-825/special_tokens_map.json b/output_oeal_Qwen3-4B_-/checkpoint-825/special_tokens_map.json new file mode 100644 index 0000000000000000000000000000000000000000..ee3f6af3ba18b7d721f02bdf3fbca2814b7eda35 --- /dev/null +++ b/output_oeal_Qwen3-4B_-/checkpoint-825/special_tokens_map.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76862e765266b85aa9459767e33cbaf13970f327a0e88d1c65846c2ddd3a1ecd +size 613 diff --git a/output_oeal_Qwen3-4B_-/checkpoint-825/tokenizer.json b/output_oeal_Qwen3-4B_-/checkpoint-825/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..cd71f61a15a522601badb3dc960d800d9cb3766c --- /dev/null +++ b/output_oeal_Qwen3-4B_-/checkpoint-825/tokenizer.json @@ 
-0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aeb13307a71acd8fe81861d94ad54ab689df773318809eed3cbe794b4492dae4 +size 11422654 diff --git a/output_oeal_Qwen3-4B_-/checkpoint-825/tokenizer_config.json b/output_oeal_Qwen3-4B_-/checkpoint-825/tokenizer_config.json new file mode 100644 index 0000000000000000000000000000000000000000..5c0cfc2d0ad23392bd84cad162c5d524f389f509 --- /dev/null +++ b/output_oeal_Qwen3-4B_-/checkpoint-825/tokenizer_config.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:502723b70f4fd98e2ee7aa681501d73ed0cbebd40fa8bc6f0585a61c3a14e156 +size 5597 diff --git a/output_oeal_Qwen3-4B_-/checkpoint-825/trainer_state.json b/output_oeal_Qwen3-4B_-/checkpoint-825/trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..cd56f1f47d1b0dcc3b76ad3aba6723d96c85c00e --- /dev/null +++ b/output_oeal_Qwen3-4B_-/checkpoint-825/trainer_state.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b4bee8c0e4928eca438126314e1d6b6ac59ae76af59306562dba18fe25eae43 +size 22791 diff --git a/output_oeal_Qwen3-4B_-/checkpoint-825/training_args.bin b/output_oeal_Qwen3-4B_-/checkpoint-825/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..81339de916798b4ef4b905c04e809179077a2b7f --- /dev/null +++ b/output_oeal_Qwen3-4B_-/checkpoint-825/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:263e593ff833cdb3879ed2c66f1b6798a8a3dab179baf33a5a099571420a3e92 +size 7889 diff --git a/output_oeal_Qwen3-4B_-/checkpoint-825/vocab.json b/output_oeal_Qwen3-4B_-/checkpoint-825/vocab.json new file mode 100644 index 0000000000000000000000000000000000000000..6c49fc63bcb109de13abe49e58f85a4cdba7b679 --- /dev/null +++ b/output_oeal_Qwen3-4B_-/checkpoint-825/vocab.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca10d7e9fb3ed18575dd1e277a2579c16d108e32f27439684afa0e10b1440910 +size 2776833 diff 
--git a/output_oeal_Qwen3-4B_-/checkpoint-840/README.md b/output_oeal_Qwen3-4B_-/checkpoint-840/README.md new file mode 100644 index 0000000000000000000000000000000000000000..8a9591cde2bc956137b9f7d13e4fe8be718b6a61 --- /dev/null +++ b/output_oeal_Qwen3-4B_-/checkpoint-840/README.md @@ -0,0 +1,202 @@ +--- +base_model: Qwen/Qwen3-4B +library_name: peft +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. 
+ +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] +### Framework versions + +- PEFT 0.15.2 \ No newline at end of file diff --git a/output_oeal_Qwen3-4B_-/checkpoint-840/adapter_config.json b/output_oeal_Qwen3-4B_-/checkpoint-840/adapter_config.json new file 
mode 100644 index 0000000000000000000000000000000000000000..98d21361e8add1621cb60814b662f410dfd8a4d2 --- /dev/null +++ b/output_oeal_Qwen3-4B_-/checkpoint-840/adapter_config.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53183f3f05d47d7c6bb299d56ed6ce9b4c94ef4829073161a1bc1cf936c1da95 +size 828 diff --git a/output_oeal_Qwen3-4B_-/checkpoint-840/adapter_model.safetensors b/output_oeal_Qwen3-4B_-/checkpoint-840/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..1204c5768876e33bf496a41838e4614c23deff1d --- /dev/null +++ b/output_oeal_Qwen3-4B_-/checkpoint-840/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06cc428aa29ad6e5c35f133fec2799f3162f7be95ad94bf020285defaf16de6c +size 1579102000 diff --git a/output_oeal_Qwen3-4B_-/checkpoint-840/added_tokens.json b/output_oeal_Qwen3-4B_-/checkpoint-840/added_tokens.json new file mode 100644 index 0000000000000000000000000000000000000000..2b76afd7cb1e665182c309e62849419f75306b75 --- /dev/null +++ b/output_oeal_Qwen3-4B_-/checkpoint-840/added_tokens.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0284b582e14987fbd3d5a2cb2bd139084371ed9acbae488829a1c900833c680 +size 707 diff --git a/output_oeal_Qwen3-4B_-/checkpoint-840/chat_template.jinja b/output_oeal_Qwen3-4B_-/checkpoint-840/chat_template.jinja new file mode 100644 index 0000000000000000000000000000000000000000..d85ff3045a68273657a9f871cdb9938c940b110b --- /dev/null +++ b/output_oeal_Qwen3-4B_-/checkpoint-840/chat_template.jinja @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a55ee1b1660128b7098723e0abcd92caa0788061051c62d51cbe87d9cf1974d8 +size 4168 diff --git a/output_oeal_Qwen3-4B_-/checkpoint-840/global_step838/mp_rank_00_model_states.pt b/output_oeal_Qwen3-4B_-/checkpoint-840/global_step838/mp_rank_00_model_states.pt new file mode 100644 index 
0000000000000000000000000000000000000000..24117b61d12dac13ed3467a595fe7bfa7efc8643 --- /dev/null +++ b/output_oeal_Qwen3-4B_-/checkpoint-840/global_step838/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2d05bdd61b8ce7d0ea6706776bc830d52d2d1dfc135643280a8b250f33a787f +size 861285289 diff --git a/output_oeal_Qwen3-4B_-/checkpoint-840/global_step838/zero_pp_rank_0_mp_rank_00_optim_states.pt b/output_oeal_Qwen3-4B_-/checkpoint-840/global_step838/zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..40c41cbc0134ed0073c1ae0f1200c4e00106e72b --- /dev/null +++ b/output_oeal_Qwen3-4B_-/checkpoint-840/global_step838/zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:511cef357aaf4f5d07e8a9a2c1eab87c72e96bb28ea270aed55355fb23d25813 +size 77884216 diff --git a/output_oeal_Qwen3-4B_-/checkpoint-840/global_step838/zero_pp_rank_1_mp_rank_00_optim_states.pt b/output_oeal_Qwen3-4B_-/checkpoint-840/global_step838/zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5ba8c51c6c266722dafde19d22b5380b03f011bc --- /dev/null +++ b/output_oeal_Qwen3-4B_-/checkpoint-840/global_step838/zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9010d88f858aff08d23ae7d2da6611e4137d3197787cf2ab193a1f1111ec3665 +size 77884344 diff --git a/output_oeal_Qwen3-4B_-/checkpoint-840/latest b/output_oeal_Qwen3-4B_-/checkpoint-840/latest new file mode 100644 index 0000000000000000000000000000000000000000..41738f7ff34a06ce41314b74a369fd5d63688df6 --- /dev/null +++ b/output_oeal_Qwen3-4B_-/checkpoint-840/latest @@ -0,0 +1 @@ +global_step838 \ No newline at end of file diff --git a/output_oeal_Qwen3-4B_-/checkpoint-840/merges.txt b/output_oeal_Qwen3-4B_-/checkpoint-840/merges.txt new file mode 100644 index 
0000000000000000000000000000000000000000..80c1a19fae38f8f4c9ab32cc9d4e145c241147e6 --- /dev/null +++ b/output_oeal_Qwen3-4B_-/checkpoint-840/merges.txt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8831e4f1a044471340f7c0a83d7bd71306a5b867e95fd870f74d0c5308a904d5 +size 1671853 diff --git a/output_oeal_Qwen3-4B_-/checkpoint-840/rng_state_0.pth b/output_oeal_Qwen3-4B_-/checkpoint-840/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..acc34e1d98e4531e65a425085fd6f02bcdc6a204 --- /dev/null +++ b/output_oeal_Qwen3-4B_-/checkpoint-840/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2288e819c5246f0c8635ae7375bc66d882b5714670d20fed009ba12ff8413eec +size 14917 diff --git a/output_oeal_Qwen3-4B_-/checkpoint-840/rng_state_1.pth b/output_oeal_Qwen3-4B_-/checkpoint-840/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..6c1b5fc2bacae8476930ccca8125fc9211c48301 --- /dev/null +++ b/output_oeal_Qwen3-4B_-/checkpoint-840/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8fce1ab03d1a63e1761778ca884c91a2a9012dae3aff9623d239766a1e9d0cb +size 14917 diff --git a/output_oeal_Qwen3-4B_-/checkpoint-840/special_tokens_map.json b/output_oeal_Qwen3-4B_-/checkpoint-840/special_tokens_map.json new file mode 100644 index 0000000000000000000000000000000000000000..ee3f6af3ba18b7d721f02bdf3fbca2814b7eda35 --- /dev/null +++ b/output_oeal_Qwen3-4B_-/checkpoint-840/special_tokens_map.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76862e765266b85aa9459767e33cbaf13970f327a0e88d1c65846c2ddd3a1ecd +size 613 diff --git a/output_oeal_Qwen3-4B_-/checkpoint-840/tokenizer.json b/output_oeal_Qwen3-4B_-/checkpoint-840/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..cd71f61a15a522601badb3dc960d800d9cb3766c --- /dev/null +++ b/output_oeal_Qwen3-4B_-/checkpoint-840/tokenizer.json @@ 
-0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aeb13307a71acd8fe81861d94ad54ab689df773318809eed3cbe794b4492dae4 +size 11422654 diff --git a/output_oeal_Qwen3-4B_-/checkpoint-840/tokenizer_config.json b/output_oeal_Qwen3-4B_-/checkpoint-840/tokenizer_config.json new file mode 100644 index 0000000000000000000000000000000000000000..5c0cfc2d0ad23392bd84cad162c5d524f389f509 --- /dev/null +++ b/output_oeal_Qwen3-4B_-/checkpoint-840/tokenizer_config.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:502723b70f4fd98e2ee7aa681501d73ed0cbebd40fa8bc6f0585a61c3a14e156 +size 5597 diff --git a/output_oeal_Qwen3-4B_-/checkpoint-840/trainer_state.json b/output_oeal_Qwen3-4B_-/checkpoint-840/trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..d166d6b712630cda24443cb97f568c0dab8a7e86 --- /dev/null +++ b/output_oeal_Qwen3-4B_-/checkpoint-840/trainer_state.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf29a3bed241a97ead465b098f4faf6ae0fe5d20c9ca1b7f79e7c15387158006 +size 23180 diff --git a/output_oeal_Qwen3-4B_-/checkpoint-840/training_args.bin b/output_oeal_Qwen3-4B_-/checkpoint-840/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..81339de916798b4ef4b905c04e809179077a2b7f --- /dev/null +++ b/output_oeal_Qwen3-4B_-/checkpoint-840/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:263e593ff833cdb3879ed2c66f1b6798a8a3dab179baf33a5a099571420a3e92 +size 7889 diff --git a/output_oeal_Qwen3-4B_-/checkpoint-840/vocab.json b/output_oeal_Qwen3-4B_-/checkpoint-840/vocab.json new file mode 100644 index 0000000000000000000000000000000000000000..6c49fc63bcb109de13abe49e58f85a4cdba7b679 --- /dev/null +++ b/output_oeal_Qwen3-4B_-/checkpoint-840/vocab.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca10d7e9fb3ed18575dd1e277a2579c16d108e32f27439684afa0e10b1440910 +size 2776833 diff 
--git a/output_oeal_Qwen3-4B_-/final_adapters/README.md b/output_oeal_Qwen3-4B_-/final_adapters/README.md new file mode 100644 index 0000000000000000000000000000000000000000..8a9591cde2bc956137b9f7d13e4fe8be718b6a61 --- /dev/null +++ b/output_oeal_Qwen3-4B_-/final_adapters/README.md @@ -0,0 +1,202 @@ +--- +base_model: Qwen/Qwen3-4B +library_name: peft +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. 
+ +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] +### Framework versions + +- PEFT 0.15.2 \ No newline at end of file diff --git a/output_oeal_Qwen3-4B_-/final_adapters/adapter_config.json b/output_oeal_Qwen3-4B_-/final_adapters/adapter_config.json new file 
mode 100644 index 0000000000000000000000000000000000000000..cd249f2932b8f8b3c4a8cd8984ec276952c599b8 --- /dev/null +++ b/output_oeal_Qwen3-4B_-/final_adapters/adapter_config.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:15769b4da00c79f0e2677ff72e6e8ae172b3155e62b376e58a93c8952efb6995 +size 828 diff --git a/output_oeal_Qwen3-4B_-/final_adapters/adapter_model.safetensors b/output_oeal_Qwen3-4B_-/final_adapters/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6d5bc7dcd4aa1c7cb99c97149e7f78a4e108c2b9 --- /dev/null +++ b/output_oeal_Qwen3-4B_-/final_adapters/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e56fe94c129a90a2cce427c5a16d0c7a8a3dcb5dd33db50a0a4da7ae9f7b392 +size 1579102000 diff --git a/output_oeal_Qwen3-4B_-/final_adapters/added_tokens.json b/output_oeal_Qwen3-4B_-/final_adapters/added_tokens.json new file mode 100644 index 0000000000000000000000000000000000000000..2b76afd7cb1e665182c309e62849419f75306b75 --- /dev/null +++ b/output_oeal_Qwen3-4B_-/final_adapters/added_tokens.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0284b582e14987fbd3d5a2cb2bd139084371ed9acbae488829a1c900833c680 +size 707 diff --git a/output_oeal_Qwen3-4B_-/final_adapters/chat_template.jinja b/output_oeal_Qwen3-4B_-/final_adapters/chat_template.jinja new file mode 100644 index 0000000000000000000000000000000000000000..d85ff3045a68273657a9f871cdb9938c940b110b --- /dev/null +++ b/output_oeal_Qwen3-4B_-/final_adapters/chat_template.jinja @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a55ee1b1660128b7098723e0abcd92caa0788061051c62d51cbe87d9cf1974d8 +size 4168 diff --git a/output_oeal_Qwen3-4B_-/final_adapters/global_step598/mp_rank_00_model_states.pt b/output_oeal_Qwen3-4B_-/final_adapters/global_step598/mp_rank_00_model_states.pt new file mode 100644 index 
0000000000000000000000000000000000000000..5d995e0372057203167379d42e1a3daab3b751a7 --- /dev/null +++ b/output_oeal_Qwen3-4B_-/final_adapters/global_step598/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae1390bd0c5adb4508d3c6d79fbc1b1ced1fec86355db6e0e041ec7c494321c2 +size 861285289 diff --git a/output_oeal_Qwen3-4B_-/final_adapters/global_step598/zero_pp_rank_0_mp_rank_00_optim_states.pt b/output_oeal_Qwen3-4B_-/final_adapters/global_step598/zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..394edad0dc87a646636323a9c8346e11c29682b2 --- /dev/null +++ b/output_oeal_Qwen3-4B_-/final_adapters/global_step598/zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:766446e3e181e416fafe2ce7b72f9a198e297cb4c16bce846bc77fa3b34e5a64 +size 77884216 diff --git a/output_oeal_Qwen3-4B_-/final_adapters/global_step598/zero_pp_rank_1_mp_rank_00_optim_states.pt b/output_oeal_Qwen3-4B_-/final_adapters/global_step598/zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..20e0ec762f31ad2ac1e4dfb804dc7d16cce9884d --- /dev/null +++ b/output_oeal_Qwen3-4B_-/final_adapters/global_step598/zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0521582f76826e13cd387f41808bc76398e001100005cf16e813f4ea94fceaa3 +size 77884344 diff --git a/output_oeal_Qwen3-4B_-/final_adapters/latest b/output_oeal_Qwen3-4B_-/final_adapters/latest new file mode 100644 index 0000000000000000000000000000000000000000..8a87fdc3e8d4d236bfa15c87e3acae6c027d8460 --- /dev/null +++ b/output_oeal_Qwen3-4B_-/final_adapters/latest @@ -0,0 +1 @@ +global_step598 \ No newline at end of file diff --git a/output_oeal_Qwen3-4B_-/final_adapters/merges.txt b/output_oeal_Qwen3-4B_-/final_adapters/merges.txt new file mode 100644 index 
0000000000000000000000000000000000000000..80c1a19fae38f8f4c9ab32cc9d4e145c241147e6 --- /dev/null +++ b/output_oeal_Qwen3-4B_-/final_adapters/merges.txt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8831e4f1a044471340f7c0a83d7bd71306a5b867e95fd870f74d0c5308a904d5 +size 1671853 diff --git a/output_oeal_Qwen3-4B_-/final_adapters/rng_state_0.pth b/output_oeal_Qwen3-4B_-/final_adapters/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..d7eff0c6f8bbdccfdc6598329e45f13796e054a3 --- /dev/null +++ b/output_oeal_Qwen3-4B_-/final_adapters/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:233b2beced6e46147e0d535df7bc94f047fc8d7a5b3828b381e1077e8f5af631 +size 14917 diff --git a/output_oeal_Qwen3-4B_-/final_adapters/rng_state_1.pth b/output_oeal_Qwen3-4B_-/final_adapters/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..e728608c4aa596f9c27f17e87e5a2c0dc51dcfef --- /dev/null +++ b/output_oeal_Qwen3-4B_-/final_adapters/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:105643a0823f635ae4241293ce5ef99154425d151fa6cccca68105b0514afe8e +size 14917 diff --git a/output_oeal_Qwen3-4B_-/final_adapters/special_tokens_map.json b/output_oeal_Qwen3-4B_-/final_adapters/special_tokens_map.json new file mode 100644 index 0000000000000000000000000000000000000000..ee3f6af3ba18b7d721f02bdf3fbca2814b7eda35 --- /dev/null +++ b/output_oeal_Qwen3-4B_-/final_adapters/special_tokens_map.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76862e765266b85aa9459767e33cbaf13970f327a0e88d1c65846c2ddd3a1ecd +size 613 diff --git a/output_oeal_Qwen3-4B_-/final_adapters/tokenizer.json b/output_oeal_Qwen3-4B_-/final_adapters/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..38dda57c0535c5ded5ad9b8a5b8c4e4a89aba355 --- /dev/null +++ b/output_oeal_Qwen3-4B_-/final_adapters/tokenizer.json @@ 
-0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:abfbf1d13376ad75c980dc37b59f5030a8eac0ced7b8fef55166f88a7c9cac34 +size 11422922 diff --git a/output_oeal_Qwen3-4B_-/final_adapters/tokenizer_config.json b/output_oeal_Qwen3-4B_-/final_adapters/tokenizer_config.json new file mode 100644 index 0000000000000000000000000000000000000000..0d8ad241b789c1419579e4b54e31b0befbad9882 --- /dev/null +++ b/output_oeal_Qwen3-4B_-/final_adapters/tokenizer_config.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:443bfa629eb16387a12edbf92a76f6a6f10b2af3b53d87ba1550adfcf45f7fa0 +size 5404 diff --git a/output_oeal_Qwen3-4B_-/final_adapters/trainer_state.json b/output_oeal_Qwen3-4B_-/final_adapters/trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..d6762f439a816a01e58b795420316b017ad3cb67 --- /dev/null +++ b/output_oeal_Qwen3-4B_-/final_adapters/trainer_state.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ab9184fef1f179e65d79c352fd52ae7bdaec8e57010e8d814c3c2dcfb0365ec +size 16728 diff --git a/output_oeal_Qwen3-4B_-/final_adapters/training_args.bin b/output_oeal_Qwen3-4B_-/final_adapters/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..970918e1fdea383f7bbb41f529e5a496c104d052 --- /dev/null +++ b/output_oeal_Qwen3-4B_-/final_adapters/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9564a20f74071dd6173ca96b7e99f3be3226a0e2e863768a3896c383c6d2b1d8 +size 7889 diff --git a/output_oeal_Qwen3-4B_-/final_adapters/vocab.json b/output_oeal_Qwen3-4B_-/final_adapters/vocab.json new file mode 100644 index 0000000000000000000000000000000000000000..6c49fc63bcb109de13abe49e58f85a4cdba7b679 --- /dev/null +++ b/output_oeal_Qwen3-4B_-/final_adapters/vocab.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca10d7e9fb3ed18575dd1e277a2579c16d108e32f27439684afa0e10b1440910 +size 2776833 diff 
--git a/output_rdal_Qwen3-4B_-/checkpoint-300/README.md b/output_rdal_Qwen3-4B_-/checkpoint-300/README.md new file mode 100644 index 0000000000000000000000000000000000000000..8a9591cde2bc956137b9f7d13e4fe8be718b6a61 --- /dev/null +++ b/output_rdal_Qwen3-4B_-/checkpoint-300/README.md @@ -0,0 +1,202 @@ +--- +base_model: Qwen/Qwen3-4B +library_name: peft +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. 
+ +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] +### Framework versions + +- PEFT 0.15.2 \ No newline at end of file diff --git a/output_rdal_Qwen3-4B_-/checkpoint-300/adapter_config.json b/output_rdal_Qwen3-4B_-/checkpoint-300/adapter_config.json new file 
mode 100644 index 0000000000000000000000000000000000000000..3b1a1bc8092d9144e19f34860219fc41770d9df7 --- /dev/null +++ b/output_rdal_Qwen3-4B_-/checkpoint-300/adapter_config.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:268ce1b414ef5c505b6c1f46312767afe7ac9d0817b48b3cc4d7351749e2c2cb +size 828 diff --git a/output_rdal_Qwen3-4B_-/checkpoint-300/adapter_model.safetensors b/output_rdal_Qwen3-4B_-/checkpoint-300/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e0431276e820dc85e12117970c576d128b0247ee --- /dev/null +++ b/output_rdal_Qwen3-4B_-/checkpoint-300/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd2aa90f44e9311177737da6ea384dd5286e0e91b5af4cdc9d8ee79241c84f3f +size 1579102000 diff --git a/output_rdal_Qwen3-4B_-/checkpoint-300/added_tokens.json b/output_rdal_Qwen3-4B_-/checkpoint-300/added_tokens.json new file mode 100644 index 0000000000000000000000000000000000000000..2b76afd7cb1e665182c309e62849419f75306b75 --- /dev/null +++ b/output_rdal_Qwen3-4B_-/checkpoint-300/added_tokens.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0284b582e14987fbd3d5a2cb2bd139084371ed9acbae488829a1c900833c680 +size 707 diff --git a/output_rdal_Qwen3-4B_-/checkpoint-300/chat_template.jinja b/output_rdal_Qwen3-4B_-/checkpoint-300/chat_template.jinja new file mode 100644 index 0000000000000000000000000000000000000000..d85ff3045a68273657a9f871cdb9938c940b110b --- /dev/null +++ b/output_rdal_Qwen3-4B_-/checkpoint-300/chat_template.jinja @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a55ee1b1660128b7098723e0abcd92caa0788061051c62d51cbe87d9cf1974d8 +size 4168 diff --git a/output_rdal_Qwen3-4B_-/checkpoint-300/global_step298/mp_rank_00_model_states.pt b/output_rdal_Qwen3-4B_-/checkpoint-300/global_step298/mp_rank_00_model_states.pt new file mode 100644 index 
0000000000000000000000000000000000000000..15254c94fa8c3cd14173cee135cece651d2a4bd8 --- /dev/null +++ b/output_rdal_Qwen3-4B_-/checkpoint-300/global_step298/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:640d8397d5802d781d8099ad2ff8cb3f71d343195ab2910757bd795559b08c08 +size 861285289 diff --git a/output_rdal_Qwen3-4B_-/checkpoint-300/global_step298/zero_pp_rank_0_mp_rank_00_optim_states.pt b/output_rdal_Qwen3-4B_-/checkpoint-300/global_step298/zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b3d58af8fb9fc280b97195204a6bd511c79f6a4f --- /dev/null +++ b/output_rdal_Qwen3-4B_-/checkpoint-300/global_step298/zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de090478d1d511229197cb66a84996730866ab2d6916b2579557f24c90304e51 +size 77884216 diff --git a/output_rdal_Qwen3-4B_-/checkpoint-300/global_step298/zero_pp_rank_1_mp_rank_00_optim_states.pt b/output_rdal_Qwen3-4B_-/checkpoint-300/global_step298/zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..26d940c706bdc0538910d0f729d77723cf323f60 --- /dev/null +++ b/output_rdal_Qwen3-4B_-/checkpoint-300/global_step298/zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab4dcdb6bfe17d6cd5fe15f233f18e70c3954231554a12cd840fb9b130c6f3d2 +size 77884344 diff --git a/output_rdal_Qwen3-4B_-/checkpoint-300/latest b/output_rdal_Qwen3-4B_-/checkpoint-300/latest new file mode 100644 index 0000000000000000000000000000000000000000..27248697cbe0d21f725e081d68ed5d99a77d5e94 --- /dev/null +++ b/output_rdal_Qwen3-4B_-/checkpoint-300/latest @@ -0,0 +1 @@ +global_step298 \ No newline at end of file diff --git a/output_rdal_Qwen3-4B_-/checkpoint-300/merges.txt b/output_rdal_Qwen3-4B_-/checkpoint-300/merges.txt new file mode 100644 index 
0000000000000000000000000000000000000000..80c1a19fae38f8f4c9ab32cc9d4e145c241147e6 --- /dev/null +++ b/output_rdal_Qwen3-4B_-/checkpoint-300/merges.txt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8831e4f1a044471340f7c0a83d7bd71306a5b867e95fd870f74d0c5308a904d5 +size 1671853 diff --git a/output_rdal_Qwen3-4B_-/checkpoint-300/rng_state_0.pth b/output_rdal_Qwen3-4B_-/checkpoint-300/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..8e76935635f7c13e1c6ae1620f267c867f9ebff9 --- /dev/null +++ b/output_rdal_Qwen3-4B_-/checkpoint-300/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3038e9bed18fdd32d650c90838d12e2726f789b6eda2c23851bc90010b311cab +size 14917 diff --git a/output_rdal_Qwen3-4B_-/checkpoint-300/rng_state_1.pth b/output_rdal_Qwen3-4B_-/checkpoint-300/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..3f25c8b6506b6e6af2e74c5e2a87d09ca649ddb1 --- /dev/null +++ b/output_rdal_Qwen3-4B_-/checkpoint-300/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a43bb3cdc52456c2ca4c5f1116e59350228d5e68f22462819e3d600e8eba627 +size 14917 diff --git a/output_rdal_Qwen3-4B_-/checkpoint-300/special_tokens_map.json b/output_rdal_Qwen3-4B_-/checkpoint-300/special_tokens_map.json new file mode 100644 index 0000000000000000000000000000000000000000..ee3f6af3ba18b7d721f02bdf3fbca2814b7eda35 --- /dev/null +++ b/output_rdal_Qwen3-4B_-/checkpoint-300/special_tokens_map.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76862e765266b85aa9459767e33cbaf13970f327a0e88d1c65846c2ddd3a1ecd +size 613 diff --git a/output_rdal_Qwen3-4B_-/checkpoint-300/tokenizer.json b/output_rdal_Qwen3-4B_-/checkpoint-300/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..cd71f61a15a522601badb3dc960d800d9cb3766c --- /dev/null +++ b/output_rdal_Qwen3-4B_-/checkpoint-300/tokenizer.json @@ 
-0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aeb13307a71acd8fe81861d94ad54ab689df773318809eed3cbe794b4492dae4 +size 11422654 diff --git a/output_rdal_Qwen3-4B_-/checkpoint-300/tokenizer_config.json b/output_rdal_Qwen3-4B_-/checkpoint-300/tokenizer_config.json new file mode 100644 index 0000000000000000000000000000000000000000..0d8ad241b789c1419579e4b54e31b0befbad9882 --- /dev/null +++ b/output_rdal_Qwen3-4B_-/checkpoint-300/tokenizer_config.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:443bfa629eb16387a12edbf92a76f6a6f10b2af3b53d87ba1550adfcf45f7fa0 +size 5404 diff --git a/output_rdal_Qwen3-4B_-/checkpoint-300/trainer_state.json b/output_rdal_Qwen3-4B_-/checkpoint-300/trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..355d26080eef9c863d0fd84b186093e94d8ce6a0 --- /dev/null +++ b/output_rdal_Qwen3-4B_-/checkpoint-300/trainer_state.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4216379db2bd143b2d283e1f852816f8350ef17c9c2aa78d9b10e1e3505e5f61 +size 8965 diff --git a/output_rdal_Qwen3-4B_-/checkpoint-300/training_args.bin b/output_rdal_Qwen3-4B_-/checkpoint-300/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..b7afdb141adad72b781a9154c76e1bacafc146e9 --- /dev/null +++ b/output_rdal_Qwen3-4B_-/checkpoint-300/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0586b3dd15eb1b60e40c5650b3c7344d1abdd741de8e4b60484753137df60d5f +size 7889 diff --git a/output_rdal_Qwen3-4B_-/checkpoint-300/vocab.json b/output_rdal_Qwen3-4B_-/checkpoint-300/vocab.json new file mode 100644 index 0000000000000000000000000000000000000000..6c49fc63bcb109de13abe49e58f85a4cdba7b679 --- /dev/null +++ b/output_rdal_Qwen3-4B_-/checkpoint-300/vocab.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca10d7e9fb3ed18575dd1e277a2579c16d108e32f27439684afa0e10b1440910 +size 2776833 diff 
--git a/output_rdal_Qwen3-4B_-/checkpoint-540/README.md b/output_rdal_Qwen3-4B_-/checkpoint-540/README.md new file mode 100644 index 0000000000000000000000000000000000000000..8a9591cde2bc956137b9f7d13e4fe8be718b6a61 --- /dev/null +++ b/output_rdal_Qwen3-4B_-/checkpoint-540/README.md @@ -0,0 +1,202 @@ +--- +base_model: Qwen/Qwen3-4B +library_name: peft +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. 
+ +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] +### Framework versions + +- PEFT 0.15.2 \ No newline at end of file diff --git a/output_rdal_Qwen3-4B_-/checkpoint-540/adapter_config.json b/output_rdal_Qwen3-4B_-/checkpoint-540/adapter_config.json new file 
mode 100644 index 0000000000000000000000000000000000000000..3b1a1bc8092d9144e19f34860219fc41770d9df7 --- /dev/null +++ b/output_rdal_Qwen3-4B_-/checkpoint-540/adapter_config.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:268ce1b414ef5c505b6c1f46312767afe7ac9d0817b48b3cc4d7351749e2c2cb +size 828 diff --git a/output_rdal_Qwen3-4B_-/checkpoint-540/adapter_model.safetensors b/output_rdal_Qwen3-4B_-/checkpoint-540/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d387fc0cd9266f1d1693e9b4da492f8c88ba7b43 --- /dev/null +++ b/output_rdal_Qwen3-4B_-/checkpoint-540/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b768b323fd43c2255849761a70906699d375f5e1c887077951c78054dbfe380 +size 1579102000 diff --git a/output_rdal_Qwen3-4B_-/checkpoint-540/added_tokens.json b/output_rdal_Qwen3-4B_-/checkpoint-540/added_tokens.json new file mode 100644 index 0000000000000000000000000000000000000000..2b76afd7cb1e665182c309e62849419f75306b75 --- /dev/null +++ b/output_rdal_Qwen3-4B_-/checkpoint-540/added_tokens.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0284b582e14987fbd3d5a2cb2bd139084371ed9acbae488829a1c900833c680 +size 707 diff --git a/output_rdal_Qwen3-4B_-/checkpoint-540/chat_template.jinja b/output_rdal_Qwen3-4B_-/checkpoint-540/chat_template.jinja new file mode 100644 index 0000000000000000000000000000000000000000..d85ff3045a68273657a9f871cdb9938c940b110b --- /dev/null +++ b/output_rdal_Qwen3-4B_-/checkpoint-540/chat_template.jinja @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a55ee1b1660128b7098723e0abcd92caa0788061051c62d51cbe87d9cf1974d8 +size 4168 diff --git a/output_rdal_Qwen3-4B_-/checkpoint-540/global_step537/mp_rank_00_model_states.pt b/output_rdal_Qwen3-4B_-/checkpoint-540/global_step537/mp_rank_00_model_states.pt new file mode 100644 index 
0000000000000000000000000000000000000000..43594d4d26c1ac3df681702c840f622ea61e9f1b --- /dev/null +++ b/output_rdal_Qwen3-4B_-/checkpoint-540/global_step537/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:616e326cccf62a3017a40a2f46fc75d733bee7fd8316015699343d1b2a562d59 +size 861285289 diff --git a/output_rdal_Qwen3-4B_-/checkpoint-540/global_step537/zero_pp_rank_0_mp_rank_00_optim_states.pt b/output_rdal_Qwen3-4B_-/checkpoint-540/global_step537/zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5e54496267e2c181be547cf59a347b10ed1f30b6 --- /dev/null +++ b/output_rdal_Qwen3-4B_-/checkpoint-540/global_step537/zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11b3723e0e3bb145bc8d91af5e4f1e87a8e7f3c50dee8ff6e28cb0c9063e738c +size 77884216 diff --git a/output_rdal_Qwen3-4B_-/checkpoint-540/global_step537/zero_pp_rank_1_mp_rank_00_optim_states.pt b/output_rdal_Qwen3-4B_-/checkpoint-540/global_step537/zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..75d354c5bedc825bb6ab5ae9c0ad3aec9c12fcbe --- /dev/null +++ b/output_rdal_Qwen3-4B_-/checkpoint-540/global_step537/zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:00ebbb967ce5856cb5d8859ad96d9d399c9df332255684112b9985232fd4da96 +size 77884344 diff --git a/output_rdal_Qwen3-4B_-/checkpoint-540/latest b/output_rdal_Qwen3-4B_-/checkpoint-540/latest new file mode 100644 index 0000000000000000000000000000000000000000..57b7e8212ad3c9da2b37172bdd0e1e5a8a199ff7 --- /dev/null +++ b/output_rdal_Qwen3-4B_-/checkpoint-540/latest @@ -0,0 +1 @@ +global_step537 \ No newline at end of file diff --git a/output_rdal_Qwen3-4B_-/checkpoint-540/merges.txt b/output_rdal_Qwen3-4B_-/checkpoint-540/merges.txt new file mode 100644 index 
0000000000000000000000000000000000000000..80c1a19fae38f8f4c9ab32cc9d4e145c241147e6 --- /dev/null +++ b/output_rdal_Qwen3-4B_-/checkpoint-540/merges.txt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8831e4f1a044471340f7c0a83d7bd71306a5b867e95fd870f74d0c5308a904d5 +size 1671853 diff --git a/output_rdal_Qwen3-4B_-/checkpoint-540/rng_state_0.pth b/output_rdal_Qwen3-4B_-/checkpoint-540/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..68c0a4d5a8129381a9fefb4207e77bcc87abfe19 --- /dev/null +++ b/output_rdal_Qwen3-4B_-/checkpoint-540/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:659293fa5e4b828cc6cf89a4373315daf07e79b76a934c31171169a4b800c6a2 +size 14917 diff --git a/output_rdal_Qwen3-4B_-/checkpoint-540/rng_state_1.pth b/output_rdal_Qwen3-4B_-/checkpoint-540/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..482c0953711549b3d51115d48734c5a63c7c2a93 --- /dev/null +++ b/output_rdal_Qwen3-4B_-/checkpoint-540/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2c29488174705a083fcd31d57cbdbb7d3f7529f31a4f7dee39d08c66b249110 +size 14917 diff --git a/output_rdal_Qwen3-4B_-/checkpoint-540/special_tokens_map.json b/output_rdal_Qwen3-4B_-/checkpoint-540/special_tokens_map.json new file mode 100644 index 0000000000000000000000000000000000000000..ee3f6af3ba18b7d721f02bdf3fbca2814b7eda35 --- /dev/null +++ b/output_rdal_Qwen3-4B_-/checkpoint-540/special_tokens_map.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76862e765266b85aa9459767e33cbaf13970f327a0e88d1c65846c2ddd3a1ecd +size 613 diff --git a/output_rdal_Qwen3-4B_-/checkpoint-540/tokenizer.json b/output_rdal_Qwen3-4B_-/checkpoint-540/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..cd71f61a15a522601badb3dc960d800d9cb3766c --- /dev/null +++ b/output_rdal_Qwen3-4B_-/checkpoint-540/tokenizer.json @@ 
-0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aeb13307a71acd8fe81861d94ad54ab689df773318809eed3cbe794b4492dae4 +size 11422654 diff --git a/output_rdal_Qwen3-4B_-/checkpoint-540/tokenizer_config.json b/output_rdal_Qwen3-4B_-/checkpoint-540/tokenizer_config.json new file mode 100644 index 0000000000000000000000000000000000000000..0d8ad241b789c1419579e4b54e31b0befbad9882 --- /dev/null +++ b/output_rdal_Qwen3-4B_-/checkpoint-540/tokenizer_config.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:443bfa629eb16387a12edbf92a76f6a6f10b2af3b53d87ba1550adfcf45f7fa0 +size 5404 diff --git a/output_rdal_Qwen3-4B_-/checkpoint-540/trainer_state.json b/output_rdal_Qwen3-4B_-/checkpoint-540/trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..d2feeb46f4d1f6dc67511fe5d01e6cb8de3c7b0b --- /dev/null +++ b/output_rdal_Qwen3-4B_-/checkpoint-540/trainer_state.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6684830e04611c0599dca2b535edbe313aaadd86f352b72f2c02d505ef6190c6 +size 15280 diff --git a/output_rdal_Qwen3-4B_-/checkpoint-540/training_args.bin b/output_rdal_Qwen3-4B_-/checkpoint-540/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..b7afdb141adad72b781a9154c76e1bacafc146e9 --- /dev/null +++ b/output_rdal_Qwen3-4B_-/checkpoint-540/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0586b3dd15eb1b60e40c5650b3c7344d1abdd741de8e4b60484753137df60d5f +size 7889 diff --git a/output_rdal_Qwen3-4B_-/checkpoint-540/vocab.json b/output_rdal_Qwen3-4B_-/checkpoint-540/vocab.json new file mode 100644 index 0000000000000000000000000000000000000000..6c49fc63bcb109de13abe49e58f85a4cdba7b679 --- /dev/null +++ b/output_rdal_Qwen3-4B_-/checkpoint-540/vocab.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca10d7e9fb3ed18575dd1e277a2579c16d108e32f27439684afa0e10b1440910 +size 2776833 diff 
--git a/output_rdal_Qwen3-4B_-/checkpoint-548/README.md b/output_rdal_Qwen3-4B_-/checkpoint-548/README.md new file mode 100644 index 0000000000000000000000000000000000000000..8a9591cde2bc956137b9f7d13e4fe8be718b6a61 --- /dev/null +++ b/output_rdal_Qwen3-4B_-/checkpoint-548/README.md @@ -0,0 +1,202 @@ +--- +base_model: Qwen/Qwen3-4B +library_name: peft +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. 
+ +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] +### Framework versions + +- PEFT 0.15.2 \ No newline at end of file diff --git a/output_rdal_Qwen3-4B_-/checkpoint-548/adapter_config.json b/output_rdal_Qwen3-4B_-/checkpoint-548/adapter_config.json new file 
mode 100644 index 0000000000000000000000000000000000000000..3b1a1bc8092d9144e19f34860219fc41770d9df7 --- /dev/null +++ b/output_rdal_Qwen3-4B_-/checkpoint-548/adapter_config.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:268ce1b414ef5c505b6c1f46312767afe7ac9d0817b48b3cc4d7351749e2c2cb +size 828 diff --git a/output_rdal_Qwen3-4B_-/checkpoint-548/adapter_model.safetensors b/output_rdal_Qwen3-4B_-/checkpoint-548/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3e83476507e400e0d1f8f195f85592e6281dcab7 --- /dev/null +++ b/output_rdal_Qwen3-4B_-/checkpoint-548/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7c31796cda897269e30fa58d41caea464933543da7b48e75dc76043eaeecffa +size 1579102000 diff --git a/output_rdal_Qwen3-4B_-/checkpoint-548/added_tokens.json b/output_rdal_Qwen3-4B_-/checkpoint-548/added_tokens.json new file mode 100644 index 0000000000000000000000000000000000000000..2b76afd7cb1e665182c309e62849419f75306b75 --- /dev/null +++ b/output_rdal_Qwen3-4B_-/checkpoint-548/added_tokens.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0284b582e14987fbd3d5a2cb2bd139084371ed9acbae488829a1c900833c680 +size 707 diff --git a/output_rdal_Qwen3-4B_-/checkpoint-548/chat_template.jinja b/output_rdal_Qwen3-4B_-/checkpoint-548/chat_template.jinja new file mode 100644 index 0000000000000000000000000000000000000000..d85ff3045a68273657a9f871cdb9938c940b110b --- /dev/null +++ b/output_rdal_Qwen3-4B_-/checkpoint-548/chat_template.jinja @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a55ee1b1660128b7098723e0abcd92caa0788061051c62d51cbe87d9cf1974d8 +size 4168 diff --git a/output_rdal_Qwen3-4B_-/checkpoint-548/global_step544/mp_rank_00_model_states.pt b/output_rdal_Qwen3-4B_-/checkpoint-548/global_step544/mp_rank_00_model_states.pt new file mode 100644 index 
0000000000000000000000000000000000000000..9284381d7b0c4f88b60c0c8116a29b4cc079ae07 --- /dev/null +++ b/output_rdal_Qwen3-4B_-/checkpoint-548/global_step544/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd6ed2a396599aadfc097aab24a4101d5cfba74642314714606f10a473e05ee3 +size 861285289 diff --git a/output_rdal_Qwen3-4B_-/checkpoint-548/global_step544/zero_pp_rank_0_mp_rank_00_optim_states.pt b/output_rdal_Qwen3-4B_-/checkpoint-548/global_step544/zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..def52e5ce5babfdf3a0a8131944deafccbcbb2cb --- /dev/null +++ b/output_rdal_Qwen3-4B_-/checkpoint-548/global_step544/zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aebf85761b059dcbaa36ebb4399e865e1369e6c07da5a0257e9159e7d8db498d +size 77884216 diff --git a/output_rdal_Qwen3-4B_-/checkpoint-548/global_step544/zero_pp_rank_1_mp_rank_00_optim_states.pt b/output_rdal_Qwen3-4B_-/checkpoint-548/global_step544/zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..de9d4fa3f0611fbac1e67122d9336bb41e0eb92f --- /dev/null +++ b/output_rdal_Qwen3-4B_-/checkpoint-548/global_step544/zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6bceab559938952352c94fa86d544569c7745d2deec53393f2dabb81a92c967f +size 77884344 diff --git a/output_rdal_Qwen3-4B_-/checkpoint-548/latest b/output_rdal_Qwen3-4B_-/checkpoint-548/latest new file mode 100644 index 0000000000000000000000000000000000000000..606df2a525126f7e381b691c76048c61744888b9 --- /dev/null +++ b/output_rdal_Qwen3-4B_-/checkpoint-548/latest @@ -0,0 +1 @@ +global_step544 \ No newline at end of file diff --git a/output_rdal_Qwen3-4B_-/checkpoint-548/merges.txt b/output_rdal_Qwen3-4B_-/checkpoint-548/merges.txt new file mode 100644 index 
0000000000000000000000000000000000000000..80c1a19fae38f8f4c9ab32cc9d4e145c241147e6 --- /dev/null +++ b/output_rdal_Qwen3-4B_-/checkpoint-548/merges.txt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8831e4f1a044471340f7c0a83d7bd71306a5b867e95fd870f74d0c5308a904d5 +size 1671853 diff --git a/output_rdal_Qwen3-4B_-/checkpoint-548/rng_state_0.pth b/output_rdal_Qwen3-4B_-/checkpoint-548/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..c7c0b259a7f5e4572901d8d6d7e6b74badff83c5 --- /dev/null +++ b/output_rdal_Qwen3-4B_-/checkpoint-548/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8925eda3d5437078c6162f5cff456242b5b2edca750d730dcf9bc012c9afef4 +size 14917 diff --git a/output_rdal_Qwen3-4B_-/checkpoint-548/rng_state_1.pth b/output_rdal_Qwen3-4B_-/checkpoint-548/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..ea734464a02a243d9108069ff1750196a9ea73e1 --- /dev/null +++ b/output_rdal_Qwen3-4B_-/checkpoint-548/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92f128cc70dbf7ddd7165be72af0c37eadb23f07f4815cb4360cf5c07d44e127 +size 14917 diff --git a/output_rdal_Qwen3-4B_-/checkpoint-548/special_tokens_map.json b/output_rdal_Qwen3-4B_-/checkpoint-548/special_tokens_map.json new file mode 100644 index 0000000000000000000000000000000000000000..ee3f6af3ba18b7d721f02bdf3fbca2814b7eda35 --- /dev/null +++ b/output_rdal_Qwen3-4B_-/checkpoint-548/special_tokens_map.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76862e765266b85aa9459767e33cbaf13970f327a0e88d1c65846c2ddd3a1ecd +size 613 diff --git a/output_rdal_Qwen3-4B_-/checkpoint-548/tokenizer.json b/output_rdal_Qwen3-4B_-/checkpoint-548/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..cd71f61a15a522601badb3dc960d800d9cb3766c --- /dev/null +++ b/output_rdal_Qwen3-4B_-/checkpoint-548/tokenizer.json @@ 
-0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aeb13307a71acd8fe81861d94ad54ab689df773318809eed3cbe794b4492dae4 +size 11422654 diff --git a/output_rdal_Qwen3-4B_-/checkpoint-548/tokenizer_config.json b/output_rdal_Qwen3-4B_-/checkpoint-548/tokenizer_config.json new file mode 100644 index 0000000000000000000000000000000000000000..0d8ad241b789c1419579e4b54e31b0befbad9882 --- /dev/null +++ b/output_rdal_Qwen3-4B_-/checkpoint-548/tokenizer_config.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:443bfa629eb16387a12edbf92a76f6a6f10b2af3b53d87ba1550adfcf45f7fa0 +size 5404 diff --git a/output_rdal_Qwen3-4B_-/checkpoint-548/trainer_state.json b/output_rdal_Qwen3-4B_-/checkpoint-548/trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..a57e2cac51470bfb947870ff21e7131a77d83e45 --- /dev/null +++ b/output_rdal_Qwen3-4B_-/checkpoint-548/trainer_state.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d872afec138642a53c2adc154cb3043cc5231e196ccd9637daf2371a38b9807c +size 15264 diff --git a/output_rdal_Qwen3-4B_-/checkpoint-548/training_args.bin b/output_rdal_Qwen3-4B_-/checkpoint-548/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..b7afdb141adad72b781a9154c76e1bacafc146e9 --- /dev/null +++ b/output_rdal_Qwen3-4B_-/checkpoint-548/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0586b3dd15eb1b60e40c5650b3c7344d1abdd741de8e4b60484753137df60d5f +size 7889 diff --git a/output_rdal_Qwen3-4B_-/checkpoint-548/vocab.json b/output_rdal_Qwen3-4B_-/checkpoint-548/vocab.json new file mode 100644 index 0000000000000000000000000000000000000000..6c49fc63bcb109de13abe49e58f85a4cdba7b679 --- /dev/null +++ b/output_rdal_Qwen3-4B_-/checkpoint-548/vocab.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca10d7e9fb3ed18575dd1e277a2579c16d108e32f27439684afa0e10b1440910 +size 2776833 diff 
--git a/output_rdal_Qwen3-4B_-/final_adapters/README.md b/output_rdal_Qwen3-4B_-/final_adapters/README.md new file mode 100644 index 0000000000000000000000000000000000000000..8a9591cde2bc956137b9f7d13e4fe8be718b6a61 --- /dev/null +++ b/output_rdal_Qwen3-4B_-/final_adapters/README.md @@ -0,0 +1,202 @@ +--- +base_model: Qwen/Qwen3-4B +library_name: peft +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. 
+ +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] +### Framework versions + +- PEFT 0.15.2 \ No newline at end of file diff --git a/output_rdal_Qwen3-4B_-/final_adapters/adapter_config.json b/output_rdal_Qwen3-4B_-/final_adapters/adapter_config.json new file 
mode 100644 index 0000000000000000000000000000000000000000..3b1a1bc8092d9144e19f34860219fc41770d9df7 --- /dev/null +++ b/output_rdal_Qwen3-4B_-/final_adapters/adapter_config.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:268ce1b414ef5c505b6c1f46312767afe7ac9d0817b48b3cc4d7351749e2c2cb +size 828 diff --git a/output_rdal_Qwen3-4B_-/final_adapters/adapter_model.safetensors b/output_rdal_Qwen3-4B_-/final_adapters/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e0431276e820dc85e12117970c576d128b0247ee --- /dev/null +++ b/output_rdal_Qwen3-4B_-/final_adapters/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd2aa90f44e9311177737da6ea384dd5286e0e91b5af4cdc9d8ee79241c84f3f +size 1579102000 diff --git a/output_rdal_Qwen3-4B_-/final_adapters/added_tokens.json b/output_rdal_Qwen3-4B_-/final_adapters/added_tokens.json new file mode 100644 index 0000000000000000000000000000000000000000..2b76afd7cb1e665182c309e62849419f75306b75 --- /dev/null +++ b/output_rdal_Qwen3-4B_-/final_adapters/added_tokens.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0284b582e14987fbd3d5a2cb2bd139084371ed9acbae488829a1c900833c680 +size 707 diff --git a/output_rdal_Qwen3-4B_-/final_adapters/chat_template.jinja b/output_rdal_Qwen3-4B_-/final_adapters/chat_template.jinja new file mode 100644 index 0000000000000000000000000000000000000000..d85ff3045a68273657a9f871cdb9938c940b110b --- /dev/null +++ b/output_rdal_Qwen3-4B_-/final_adapters/chat_template.jinja @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a55ee1b1660128b7098723e0abcd92caa0788061051c62d51cbe87d9cf1974d8 +size 4168 diff --git a/output_rdal_Qwen3-4B_-/final_adapters/merges.txt b/output_rdal_Qwen3-4B_-/final_adapters/merges.txt new file mode 100644 index 0000000000000000000000000000000000000000..80c1a19fae38f8f4c9ab32cc9d4e145c241147e6 --- /dev/null +++ 
b/output_rdal_Qwen3-4B_-/final_adapters/merges.txt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8831e4f1a044471340f7c0a83d7bd71306a5b867e95fd870f74d0c5308a904d5 +size 1671853 diff --git a/output_rdal_Qwen3-4B_-/final_adapters/special_tokens_map.json b/output_rdal_Qwen3-4B_-/final_adapters/special_tokens_map.json new file mode 100644 index 0000000000000000000000000000000000000000..ee3f6af3ba18b7d721f02bdf3fbca2814b7eda35 --- /dev/null +++ b/output_rdal_Qwen3-4B_-/final_adapters/special_tokens_map.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76862e765266b85aa9459767e33cbaf13970f327a0e88d1c65846c2ddd3a1ecd +size 613 diff --git a/output_rdal_Qwen3-4B_-/final_adapters/tokenizer.json b/output_rdal_Qwen3-4B_-/final_adapters/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..cd71f61a15a522601badb3dc960d800d9cb3766c --- /dev/null +++ b/output_rdal_Qwen3-4B_-/final_adapters/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aeb13307a71acd8fe81861d94ad54ab689df773318809eed3cbe794b4492dae4 +size 11422654 diff --git a/output_rdal_Qwen3-4B_-/final_adapters/tokenizer_config.json b/output_rdal_Qwen3-4B_-/final_adapters/tokenizer_config.json new file mode 100644 index 0000000000000000000000000000000000000000..0d8ad241b789c1419579e4b54e31b0befbad9882 --- /dev/null +++ b/output_rdal_Qwen3-4B_-/final_adapters/tokenizer_config.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:443bfa629eb16387a12edbf92a76f6a6f10b2af3b53d87ba1550adfcf45f7fa0 +size 5404 diff --git a/output_rdal_Qwen3-4B_-/final_adapters/training_args.bin b/output_rdal_Qwen3-4B_-/final_adapters/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..b7afdb141adad72b781a9154c76e1bacafc146e9 --- /dev/null +++ b/output_rdal_Qwen3-4B_-/final_adapters/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:0586b3dd15eb1b60e40c5650b3c7344d1abdd741de8e4b60484753137df60d5f +size 7889 diff --git a/output_rdal_Qwen3-4B_-/final_adapters/vocab.json b/output_rdal_Qwen3-4B_-/final_adapters/vocab.json new file mode 100644 index 0000000000000000000000000000000000000000..6c49fc63bcb109de13abe49e58f85a4cdba7b679 --- /dev/null +++ b/output_rdal_Qwen3-4B_-/final_adapters/vocab.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca10d7e9fb3ed18575dd1e277a2579c16d108e32f27439684afa0e10b1440910 +size 2776833 diff --git a/output_real_Qwen3-4B_-/checkpoint-1095/README.md b/output_real_Qwen3-4B_-/checkpoint-1095/README.md new file mode 100644 index 0000000000000000000000000000000000000000..8a9591cde2bc956137b9f7d13e4fe8be718b6a61 --- /dev/null +++ b/output_real_Qwen3-4B_-/checkpoint-1095/README.md @@ -0,0 +1,202 @@ +--- +base_model: Qwen/Qwen3-4B +library_name: peft +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. 
+ +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). 
+ +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] +### Framework versions + +- PEFT 0.15.2 \ No newline at end of file diff --git a/output_real_Qwen3-4B_-/checkpoint-1095/adapter_config.json b/output_real_Qwen3-4B_-/checkpoint-1095/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..4d572b96b2c3584e44e8f5ccdaca9c34f63e5a67 --- /dev/null +++ b/output_real_Qwen3-4B_-/checkpoint-1095/adapter_config.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60211157f9d0e1f4b6c558d6c492c22492b3b7be840f92778705e07232158147 +size 828 diff --git a/output_real_Qwen3-4B_-/checkpoint-1095/adapter_model.safetensors b/output_real_Qwen3-4B_-/checkpoint-1095/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6469db454d1ca1b41a24acdf03ca507db955cdb8 --- /dev/null +++ b/output_real_Qwen3-4B_-/checkpoint-1095/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53c7ac233a263a6c255ec62d8fd5d8a1daffc7aeb652b19f9265ea0b739f69aa +size 1579102000 diff --git a/output_real_Qwen3-4B_-/checkpoint-1095/added_tokens.json 
b/output_real_Qwen3-4B_-/checkpoint-1095/added_tokens.json new file mode 100644 index 0000000000000000000000000000000000000000..2b76afd7cb1e665182c309e62849419f75306b75 --- /dev/null +++ b/output_real_Qwen3-4B_-/checkpoint-1095/added_tokens.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0284b582e14987fbd3d5a2cb2bd139084371ed9acbae488829a1c900833c680 +size 707 diff --git a/output_real_Qwen3-4B_-/checkpoint-1095/chat_template.jinja b/output_real_Qwen3-4B_-/checkpoint-1095/chat_template.jinja new file mode 100644 index 0000000000000000000000000000000000000000..d85ff3045a68273657a9f871cdb9938c940b110b --- /dev/null +++ b/output_real_Qwen3-4B_-/checkpoint-1095/chat_template.jinja @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a55ee1b1660128b7098723e0abcd92caa0788061051c62d51cbe87d9cf1974d8 +size 4168 diff --git a/output_real_Qwen3-4B_-/checkpoint-1095/global_step1091/mp_rank_00_model_states.pt b/output_real_Qwen3-4B_-/checkpoint-1095/global_step1091/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..38476232405fed80ee3688bcf783dc4a5d072eae --- /dev/null +++ b/output_real_Qwen3-4B_-/checkpoint-1095/global_step1091/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07009dde73f951dcdce9a73dc63ea7e327f0931d7dbfb7adc520480f02f361bb +size 861285289 diff --git a/output_real_Qwen3-4B_-/checkpoint-1095/global_step1091/zero_pp_rank_0_mp_rank_00_optim_states.pt b/output_real_Qwen3-4B_-/checkpoint-1095/global_step1091/zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b977a52d3ed66fd5d7300f6ad61a5639213b4aa8 --- /dev/null +++ b/output_real_Qwen3-4B_-/checkpoint-1095/global_step1091/zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:303846b00fca62b6e8a90ddbd09696c79dfc7f960d81cd7ae82a5bbc07589a9c +size 77884216 diff 
--git a/output_real_Qwen3-4B_-/checkpoint-1095/global_step1091/zero_pp_rank_1_mp_rank_00_optim_states.pt b/output_real_Qwen3-4B_-/checkpoint-1095/global_step1091/zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..24437020d40c73f6c523f373f8ffd655d1f11cb8 --- /dev/null +++ b/output_real_Qwen3-4B_-/checkpoint-1095/global_step1091/zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:721617a91a1e035f4299b9b7d91f3362e89f417503620f778275859c30e58b95 +size 77884344 diff --git a/output_real_Qwen3-4B_-/checkpoint-1095/latest b/output_real_Qwen3-4B_-/checkpoint-1095/latest new file mode 100644 index 0000000000000000000000000000000000000000..ca24631ebe50acdd3d6887c1b72ccc71dbd6fe43 --- /dev/null +++ b/output_real_Qwen3-4B_-/checkpoint-1095/latest @@ -0,0 +1 @@ +global_step1091 \ No newline at end of file diff --git a/output_real_Qwen3-4B_-/checkpoint-1095/merges.txt b/output_real_Qwen3-4B_-/checkpoint-1095/merges.txt new file mode 100644 index 0000000000000000000000000000000000000000..80c1a19fae38f8f4c9ab32cc9d4e145c241147e6 --- /dev/null +++ b/output_real_Qwen3-4B_-/checkpoint-1095/merges.txt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8831e4f1a044471340f7c0a83d7bd71306a5b867e95fd870f74d0c5308a904d5 +size 1671853 diff --git a/output_real_Qwen3-4B_-/checkpoint-1095/rng_state_0.pth b/output_real_Qwen3-4B_-/checkpoint-1095/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..ad0179b574a445a30325535b96db08b5de6137ac --- /dev/null +++ b/output_real_Qwen3-4B_-/checkpoint-1095/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:414e79a3671663d435732b7e4f6ce41e6fa237770cb73e95f822886664e77384 +size 14917 diff --git a/output_real_Qwen3-4B_-/checkpoint-1095/rng_state_1.pth b/output_real_Qwen3-4B_-/checkpoint-1095/rng_state_1.pth new file mode 100644 index 
0000000000000000000000000000000000000000..e368c066ece74f65c79f8ca97c11f135d4660961 --- /dev/null +++ b/output_real_Qwen3-4B_-/checkpoint-1095/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:edb97dd638fcad9ab1f11b6ae6d5f7508112d64a4332f3f5cce9dadf69c434a9 +size 14917 diff --git a/output_real_Qwen3-4B_-/checkpoint-1095/special_tokens_map.json b/output_real_Qwen3-4B_-/checkpoint-1095/special_tokens_map.json new file mode 100644 index 0000000000000000000000000000000000000000..ee3f6af3ba18b7d721f02bdf3fbca2814b7eda35 --- /dev/null +++ b/output_real_Qwen3-4B_-/checkpoint-1095/special_tokens_map.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76862e765266b85aa9459767e33cbaf13970f327a0e88d1c65846c2ddd3a1ecd +size 613 diff --git a/output_real_Qwen3-4B_-/checkpoint-1095/tokenizer.json b/output_real_Qwen3-4B_-/checkpoint-1095/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..cd71f61a15a522601badb3dc960d800d9cb3766c --- /dev/null +++ b/output_real_Qwen3-4B_-/checkpoint-1095/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aeb13307a71acd8fe81861d94ad54ab689df773318809eed3cbe794b4492dae4 +size 11422654 diff --git a/output_real_Qwen3-4B_-/checkpoint-1095/tokenizer_config.json b/output_real_Qwen3-4B_-/checkpoint-1095/tokenizer_config.json new file mode 100644 index 0000000000000000000000000000000000000000..5c0cfc2d0ad23392bd84cad162c5d524f389f509 --- /dev/null +++ b/output_real_Qwen3-4B_-/checkpoint-1095/tokenizer_config.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:502723b70f4fd98e2ee7aa681501d73ed0cbebd40fa8bc6f0585a61c3a14e156 +size 5597 diff --git a/output_real_Qwen3-4B_-/checkpoint-1095/trainer_state.json b/output_real_Qwen3-4B_-/checkpoint-1095/trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..2048163d1436ea0603e0edb71b17e3e142a02ab2 --- /dev/null +++ 
b/output_real_Qwen3-4B_-/checkpoint-1095/trainer_state.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e91653c1d5e5d36e0fd429b50762e308b1cf9951abeac7248c63916feed68f3 +size 29767 diff --git a/output_real_Qwen3-4B_-/checkpoint-1095/training_args.bin b/output_real_Qwen3-4B_-/checkpoint-1095/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..0016dbc8c99357d1a3177558b3ce141136ea4c80 --- /dev/null +++ b/output_real_Qwen3-4B_-/checkpoint-1095/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:344362c00cd71936c4828a55897fe77cd516512a502116f243d4e6cdd38d6a20 +size 7889 diff --git a/output_real_Qwen3-4B_-/checkpoint-1095/vocab.json b/output_real_Qwen3-4B_-/checkpoint-1095/vocab.json new file mode 100644 index 0000000000000000000000000000000000000000..6c49fc63bcb109de13abe49e58f85a4cdba7b679 --- /dev/null +++ b/output_real_Qwen3-4B_-/checkpoint-1095/vocab.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca10d7e9fb3ed18575dd1e277a2579c16d108e32f27439684afa0e10b1440910 +size 2776833 diff --git a/output_real_Qwen3-4B_-/checkpoint-1110/README.md b/output_real_Qwen3-4B_-/checkpoint-1110/README.md new file mode 100644 index 0000000000000000000000000000000000000000..8a9591cde2bc956137b9f7d13e4fe8be718b6a61 --- /dev/null +++ b/output_real_Qwen3-4B_-/checkpoint-1110/README.md @@ -0,0 +1,202 @@ +--- +base_model: Qwen/Qwen3-4B +library_name: peft +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** 
[More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). 
+ +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] +### Framework versions + +- PEFT 0.15.2 \ No newline at end of file diff --git a/output_real_Qwen3-4B_-/checkpoint-1110/adapter_config.json b/output_real_Qwen3-4B_-/checkpoint-1110/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..4d572b96b2c3584e44e8f5ccdaca9c34f63e5a67 --- /dev/null +++ b/output_real_Qwen3-4B_-/checkpoint-1110/adapter_config.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60211157f9d0e1f4b6c558d6c492c22492b3b7be840f92778705e07232158147 +size 828 diff --git a/output_real_Qwen3-4B_-/checkpoint-1110/adapter_model.safetensors b/output_real_Qwen3-4B_-/checkpoint-1110/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9327ceefcaea3b8be1c7900ae5ea237203793d5a --- /dev/null +++ b/output_real_Qwen3-4B_-/checkpoint-1110/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:464bb16b7f938c8e957f79aa9b496af203062632ed471242a544b9428e4c1604 +size 1579102000 diff --git a/output_real_Qwen3-4B_-/checkpoint-1110/added_tokens.json 
b/output_real_Qwen3-4B_-/checkpoint-1110/added_tokens.json new file mode 100644 index 0000000000000000000000000000000000000000..2b76afd7cb1e665182c309e62849419f75306b75 --- /dev/null +++ b/output_real_Qwen3-4B_-/checkpoint-1110/added_tokens.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0284b582e14987fbd3d5a2cb2bd139084371ed9acbae488829a1c900833c680 +size 707 diff --git a/output_real_Qwen3-4B_-/checkpoint-1110/chat_template.jinja b/output_real_Qwen3-4B_-/checkpoint-1110/chat_template.jinja new file mode 100644 index 0000000000000000000000000000000000000000..d85ff3045a68273657a9f871cdb9938c940b110b --- /dev/null +++ b/output_real_Qwen3-4B_-/checkpoint-1110/chat_template.jinja @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a55ee1b1660128b7098723e0abcd92caa0788061051c62d51cbe87d9cf1974d8 +size 4168 diff --git a/output_real_Qwen3-4B_-/checkpoint-1110/global_step1106/mp_rank_00_model_states.pt b/output_real_Qwen3-4B_-/checkpoint-1110/global_step1106/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1372380d6a4da8cd56441972848fd78479f3b955 --- /dev/null +++ b/output_real_Qwen3-4B_-/checkpoint-1110/global_step1106/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9cc85e5b3a541e9025b10ec2e28f2acbada62b73c8d3b229d77c7326e018ac26 +size 861285289 diff --git a/output_real_Qwen3-4B_-/checkpoint-1110/global_step1106/zero_pp_rank_0_mp_rank_00_optim_states.pt b/output_real_Qwen3-4B_-/checkpoint-1110/global_step1106/zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7178dd7fbd084bc4ae929dc1fe6c391fcfbdcfd5 --- /dev/null +++ b/output_real_Qwen3-4B_-/checkpoint-1110/global_step1106/zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3cb5d669956a66df7d64b4e821561b07b84f6b6aacd993da8edd1c0e84f01f14 +size 77884216 diff 
--git a/output_real_Qwen3-4B_-/checkpoint-1110/global_step1106/zero_pp_rank_1_mp_rank_00_optim_states.pt b/output_real_Qwen3-4B_-/checkpoint-1110/global_step1106/zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..758b105419aa14c8a7d0fcd07f69736669aea3b0 --- /dev/null +++ b/output_real_Qwen3-4B_-/checkpoint-1110/global_step1106/zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:263a0950d82cca8ea881ed85814d570548a0211c07073320a035bdb1544b606e +size 77884344 diff --git a/output_real_Qwen3-4B_-/checkpoint-1110/latest b/output_real_Qwen3-4B_-/checkpoint-1110/latest new file mode 100644 index 0000000000000000000000000000000000000000..af060b2f59d50c40d81478b91fc0e0c92cb86b97 --- /dev/null +++ b/output_real_Qwen3-4B_-/checkpoint-1110/latest @@ -0,0 +1 @@ +global_step1106 \ No newline at end of file diff --git a/output_real_Qwen3-4B_-/checkpoint-1110/merges.txt b/output_real_Qwen3-4B_-/checkpoint-1110/merges.txt new file mode 100644 index 0000000000000000000000000000000000000000..80c1a19fae38f8f4c9ab32cc9d4e145c241147e6 --- /dev/null +++ b/output_real_Qwen3-4B_-/checkpoint-1110/merges.txt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8831e4f1a044471340f7c0a83d7bd71306a5b867e95fd870f74d0c5308a904d5 +size 1671853 diff --git a/output_real_Qwen3-4B_-/checkpoint-1110/rng_state_0.pth b/output_real_Qwen3-4B_-/checkpoint-1110/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..f3ad9b1c315fea491f25ca15b4fd8222d0a8eeaf --- /dev/null +++ b/output_real_Qwen3-4B_-/checkpoint-1110/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:794adec03ec1b60646f79e221f7b60163d01f42f262900728a3e446e9674e35b +size 14917 diff --git a/output_real_Qwen3-4B_-/checkpoint-1110/rng_state_1.pth b/output_real_Qwen3-4B_-/checkpoint-1110/rng_state_1.pth new file mode 100644 index 
0000000000000000000000000000000000000000..46e095238b5afe08455df5583608552bf94b33f1 --- /dev/null +++ b/output_real_Qwen3-4B_-/checkpoint-1110/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:591e7d7c0e4346d51c68dedc84d998acb1df7a88fb2620ff787bc260bf88db40 +size 14917 diff --git a/output_real_Qwen3-4B_-/checkpoint-1110/special_tokens_map.json b/output_real_Qwen3-4B_-/checkpoint-1110/special_tokens_map.json new file mode 100644 index 0000000000000000000000000000000000000000..ee3f6af3ba18b7d721f02bdf3fbca2814b7eda35 --- /dev/null +++ b/output_real_Qwen3-4B_-/checkpoint-1110/special_tokens_map.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76862e765266b85aa9459767e33cbaf13970f327a0e88d1c65846c2ddd3a1ecd +size 613 diff --git a/output_real_Qwen3-4B_-/checkpoint-1110/tokenizer.json b/output_real_Qwen3-4B_-/checkpoint-1110/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..cd71f61a15a522601badb3dc960d800d9cb3766c --- /dev/null +++ b/output_real_Qwen3-4B_-/checkpoint-1110/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aeb13307a71acd8fe81861d94ad54ab689df773318809eed3cbe794b4492dae4 +size 11422654 diff --git a/output_real_Qwen3-4B_-/checkpoint-1110/tokenizer_config.json b/output_real_Qwen3-4B_-/checkpoint-1110/tokenizer_config.json new file mode 100644 index 0000000000000000000000000000000000000000..5c0cfc2d0ad23392bd84cad162c5d524f389f509 --- /dev/null +++ b/output_real_Qwen3-4B_-/checkpoint-1110/tokenizer_config.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:502723b70f4fd98e2ee7aa681501d73ed0cbebd40fa8bc6f0585a61c3a14e156 +size 5597 diff --git a/output_real_Qwen3-4B_-/checkpoint-1110/trainer_state.json b/output_real_Qwen3-4B_-/checkpoint-1110/trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..19076bec40d54099a81a9fd2bd5d04278124c7b5 --- /dev/null +++ 
b/output_real_Qwen3-4B_-/checkpoint-1110/trainer_state.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da5619efc12458d95bde75d33f7814101c6a30c6bab946b07d65dcbc6ecc813c +size 30157 diff --git a/output_real_Qwen3-4B_-/checkpoint-1110/training_args.bin b/output_real_Qwen3-4B_-/checkpoint-1110/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..0016dbc8c99357d1a3177558b3ce141136ea4c80 --- /dev/null +++ b/output_real_Qwen3-4B_-/checkpoint-1110/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:344362c00cd71936c4828a55897fe77cd516512a502116f243d4e6cdd38d6a20 +size 7889 diff --git a/output_real_Qwen3-4B_-/checkpoint-1110/vocab.json b/output_real_Qwen3-4B_-/checkpoint-1110/vocab.json new file mode 100644 index 0000000000000000000000000000000000000000..6c49fc63bcb109de13abe49e58f85a4cdba7b679 --- /dev/null +++ b/output_real_Qwen3-4B_-/checkpoint-1110/vocab.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca10d7e9fb3ed18575dd1e277a2579c16d108e32f27439684afa0e10b1440910 +size 2776833 diff --git a/output_real_Qwen3-4B_-/checkpoint-915/README.md b/output_real_Qwen3-4B_-/checkpoint-915/README.md new file mode 100644 index 0000000000000000000000000000000000000000..8a9591cde2bc956137b9f7d13e4fe8be718b6a61 --- /dev/null +++ b/output_real_Qwen3-4B_-/checkpoint-915/README.md @@ -0,0 +1,202 @@ +--- +base_model: Qwen/Qwen3-4B +library_name: peft +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More 
Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). 
+ +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] +### Framework versions + +- PEFT 0.15.2 \ No newline at end of file diff --git a/output_real_Qwen3-4B_-/checkpoint-915/adapter_config.json b/output_real_Qwen3-4B_-/checkpoint-915/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..4d572b96b2c3584e44e8f5ccdaca9c34f63e5a67 --- /dev/null +++ b/output_real_Qwen3-4B_-/checkpoint-915/adapter_config.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60211157f9d0e1f4b6c558d6c492c22492b3b7be840f92778705e07232158147 +size 828 diff --git a/output_real_Qwen3-4B_-/checkpoint-915/adapter_model.safetensors b/output_real_Qwen3-4B_-/checkpoint-915/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d8aa5122b3a1fce069627d0532cba5df80503a63 --- /dev/null +++ b/output_real_Qwen3-4B_-/checkpoint-915/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c35aebc5a80bdb30788d9ddd6f4c75b51ad71baec6802f7b777240e0aea4ec3e +size 1579102000 diff --git a/output_real_Qwen3-4B_-/checkpoint-915/added_tokens.json 
b/output_real_Qwen3-4B_-/checkpoint-915/added_tokens.json new file mode 100644 index 0000000000000000000000000000000000000000..2b76afd7cb1e665182c309e62849419f75306b75 --- /dev/null +++ b/output_real_Qwen3-4B_-/checkpoint-915/added_tokens.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0284b582e14987fbd3d5a2cb2bd139084371ed9acbae488829a1c900833c680 +size 707 diff --git a/output_real_Qwen3-4B_-/checkpoint-915/chat_template.jinja b/output_real_Qwen3-4B_-/checkpoint-915/chat_template.jinja new file mode 100644 index 0000000000000000000000000000000000000000..d85ff3045a68273657a9f871cdb9938c940b110b --- /dev/null +++ b/output_real_Qwen3-4B_-/checkpoint-915/chat_template.jinja @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a55ee1b1660128b7098723e0abcd92caa0788061051c62d51cbe87d9cf1974d8 +size 4168 diff --git a/output_real_Qwen3-4B_-/checkpoint-915/global_step912/mp_rank_00_model_states.pt b/output_real_Qwen3-4B_-/checkpoint-915/global_step912/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..886209bcf5afcef45735cb2c299a7ebcf1d71610 --- /dev/null +++ b/output_real_Qwen3-4B_-/checkpoint-915/global_step912/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bbb053ecf39b418319c89124f95c945f2e189bbb2c20f4d5507ab7fe16783eec +size 861285289 diff --git a/output_real_Qwen3-4B_-/checkpoint-915/global_step912/zero_pp_rank_0_mp_rank_00_optim_states.pt b/output_real_Qwen3-4B_-/checkpoint-915/global_step912/zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c0cae81c682a12a7d1538b59a04e20a1e8fa42bb --- /dev/null +++ b/output_real_Qwen3-4B_-/checkpoint-915/global_step912/zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b9fe5b649c74b1192809fdec3cc6cfbc2923ef17346f6c90ccef43d8fc883c0 +size 77884216 diff --git 
a/output_real_Qwen3-4B_-/checkpoint-915/global_step912/zero_pp_rank_1_mp_rank_00_optim_states.pt b/output_real_Qwen3-4B_-/checkpoint-915/global_step912/zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..555c83118127db1b0c658fbcf96097e7841dc004 --- /dev/null +++ b/output_real_Qwen3-4B_-/checkpoint-915/global_step912/zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:42604aafd02835293829e079f3adf5d7bb788fdb0f7e6aa8a94f27441ac66598 +size 77884344 diff --git a/output_real_Qwen3-4B_-/checkpoint-915/latest b/output_real_Qwen3-4B_-/checkpoint-915/latest new file mode 100644 index 0000000000000000000000000000000000000000..4afd592634f97e88eb5ee1e76d3bc17c633ec221 --- /dev/null +++ b/output_real_Qwen3-4B_-/checkpoint-915/latest @@ -0,0 +1 @@ +global_step912 \ No newline at end of file diff --git a/output_real_Qwen3-4B_-/checkpoint-915/merges.txt b/output_real_Qwen3-4B_-/checkpoint-915/merges.txt new file mode 100644 index 0000000000000000000000000000000000000000..80c1a19fae38f8f4c9ab32cc9d4e145c241147e6 --- /dev/null +++ b/output_real_Qwen3-4B_-/checkpoint-915/merges.txt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8831e4f1a044471340f7c0a83d7bd71306a5b867e95fd870f74d0c5308a904d5 +size 1671853 diff --git a/output_real_Qwen3-4B_-/checkpoint-915/rng_state_0.pth b/output_real_Qwen3-4B_-/checkpoint-915/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..246a8ba2df47d0428386c9cb6fe481b85ef0fbd2 --- /dev/null +++ b/output_real_Qwen3-4B_-/checkpoint-915/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:944814b8416a775767c2d5554eaf498fcb3b9eabc9421bc5e539229bc02e6d42 +size 14917 diff --git a/output_real_Qwen3-4B_-/checkpoint-915/rng_state_1.pth b/output_real_Qwen3-4B_-/checkpoint-915/rng_state_1.pth new file mode 100644 index 
0000000000000000000000000000000000000000..3d492dacb2c39fb597482331b4f6f4ba3cb23919 --- /dev/null +++ b/output_real_Qwen3-4B_-/checkpoint-915/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a0c933bfefb8f95545100b963dd1d5f3ecc7579953faaba48a0129afcdc4285 +size 14917 diff --git a/output_real_Qwen3-4B_-/checkpoint-915/special_tokens_map.json b/output_real_Qwen3-4B_-/checkpoint-915/special_tokens_map.json new file mode 100644 index 0000000000000000000000000000000000000000..ee3f6af3ba18b7d721f02bdf3fbca2814b7eda35 --- /dev/null +++ b/output_real_Qwen3-4B_-/checkpoint-915/special_tokens_map.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76862e765266b85aa9459767e33cbaf13970f327a0e88d1c65846c2ddd3a1ecd +size 613 diff --git a/output_real_Qwen3-4B_-/checkpoint-915/tokenizer.json b/output_real_Qwen3-4B_-/checkpoint-915/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..cd71f61a15a522601badb3dc960d800d9cb3766c --- /dev/null +++ b/output_real_Qwen3-4B_-/checkpoint-915/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aeb13307a71acd8fe81861d94ad54ab689df773318809eed3cbe794b4492dae4 +size 11422654 diff --git a/output_real_Qwen3-4B_-/checkpoint-915/tokenizer_config.json b/output_real_Qwen3-4B_-/checkpoint-915/tokenizer_config.json new file mode 100644 index 0000000000000000000000000000000000000000..5c0cfc2d0ad23392bd84cad162c5d524f389f509 --- /dev/null +++ b/output_real_Qwen3-4B_-/checkpoint-915/tokenizer_config.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:502723b70f4fd98e2ee7aa681501d73ed0cbebd40fa8bc6f0585a61c3a14e156 +size 5597 diff --git a/output_real_Qwen3-4B_-/checkpoint-915/trainer_state.json b/output_real_Qwen3-4B_-/checkpoint-915/trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..29951e60ff18ed21be11b76a1d60093ff08f1739 --- /dev/null +++ 
b/output_real_Qwen3-4B_-/checkpoint-915/trainer_state.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f572793c8560574d45448b7f4f12887274286c86ec3a258bd374982e1226435 +size 24979 diff --git a/output_real_Qwen3-4B_-/checkpoint-915/training_args.bin b/output_real_Qwen3-4B_-/checkpoint-915/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..0016dbc8c99357d1a3177558b3ce141136ea4c80 --- /dev/null +++ b/output_real_Qwen3-4B_-/checkpoint-915/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:344362c00cd71936c4828a55897fe77cd516512a502116f243d4e6cdd38d6a20 +size 7889 diff --git a/output_real_Qwen3-4B_-/checkpoint-915/vocab.json b/output_real_Qwen3-4B_-/checkpoint-915/vocab.json new file mode 100644 index 0000000000000000000000000000000000000000..6c49fc63bcb109de13abe49e58f85a4cdba7b679 --- /dev/null +++ b/output_real_Qwen3-4B_-/checkpoint-915/vocab.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca10d7e9fb3ed18575dd1e277a2579c16d108e32f27439684afa0e10b1440910 +size 2776833 diff --git a/output_real_Qwen3-4B_-/final_adapters/README.md b/output_real_Qwen3-4B_-/final_adapters/README.md new file mode 100644 index 0000000000000000000000000000000000000000..8a9591cde2bc956137b9f7d13e4fe8be718b6a61 --- /dev/null +++ b/output_real_Qwen3-4B_-/final_adapters/README.md @@ -0,0 +1,202 @@ +--- +base_model: Qwen/Qwen3-4B +library_name: peft +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More 
Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). 
+ +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] +### Framework versions + +- PEFT 0.15.2 \ No newline at end of file diff --git a/output_real_Qwen3-4B_-/final_adapters/adapter_config.json b/output_real_Qwen3-4B_-/final_adapters/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..4d572b96b2c3584e44e8f5ccdaca9c34f63e5a67 --- /dev/null +++ b/output_real_Qwen3-4B_-/final_adapters/adapter_config.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60211157f9d0e1f4b6c558d6c492c22492b3b7be840f92778705e07232158147 +size 828 diff --git a/output_real_Qwen3-4B_-/final_adapters/adapter_model.safetensors b/output_real_Qwen3-4B_-/final_adapters/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d8aa5122b3a1fce069627d0532cba5df80503a63 --- /dev/null +++ b/output_real_Qwen3-4B_-/final_adapters/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c35aebc5a80bdb30788d9ddd6f4c75b51ad71baec6802f7b777240e0aea4ec3e +size 1579102000 diff --git a/output_real_Qwen3-4B_-/final_adapters/added_tokens.json 
b/output_real_Qwen3-4B_-/final_adapters/added_tokens.json new file mode 100644 index 0000000000000000000000000000000000000000..2b76afd7cb1e665182c309e62849419f75306b75 --- /dev/null +++ b/output_real_Qwen3-4B_-/final_adapters/added_tokens.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0284b582e14987fbd3d5a2cb2bd139084371ed9acbae488829a1c900833c680 +size 707 diff --git a/output_real_Qwen3-4B_-/final_adapters/chat_template.jinja b/output_real_Qwen3-4B_-/final_adapters/chat_template.jinja new file mode 100644 index 0000000000000000000000000000000000000000..d85ff3045a68273657a9f871cdb9938c940b110b --- /dev/null +++ b/output_real_Qwen3-4B_-/final_adapters/chat_template.jinja @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a55ee1b1660128b7098723e0abcd92caa0788061051c62d51cbe87d9cf1974d8 +size 4168 diff --git a/output_real_Qwen3-4B_-/final_adapters/global_step912/mp_rank_00_model_states.pt b/output_real_Qwen3-4B_-/final_adapters/global_step912/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..886209bcf5afcef45735cb2c299a7ebcf1d71610 --- /dev/null +++ b/output_real_Qwen3-4B_-/final_adapters/global_step912/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bbb053ecf39b418319c89124f95c945f2e189bbb2c20f4d5507ab7fe16783eec +size 861285289 diff --git a/output_real_Qwen3-4B_-/final_adapters/global_step912/zero_pp_rank_0_mp_rank_00_optim_states.pt b/output_real_Qwen3-4B_-/final_adapters/global_step912/zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c0cae81c682a12a7d1538b59a04e20a1e8fa42bb --- /dev/null +++ b/output_real_Qwen3-4B_-/final_adapters/global_step912/zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b9fe5b649c74b1192809fdec3cc6cfbc2923ef17346f6c90ccef43d8fc883c0 +size 77884216 diff --git 
a/output_real_Qwen3-4B_-/final_adapters/global_step912/zero_pp_rank_1_mp_rank_00_optim_states.pt b/output_real_Qwen3-4B_-/final_adapters/global_step912/zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..555c83118127db1b0c658fbcf96097e7841dc004 --- /dev/null +++ b/output_real_Qwen3-4B_-/final_adapters/global_step912/zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:42604aafd02835293829e079f3adf5d7bb788fdb0f7e6aa8a94f27441ac66598 +size 77884344 diff --git a/output_real_Qwen3-4B_-/final_adapters/latest b/output_real_Qwen3-4B_-/final_adapters/latest new file mode 100644 index 0000000000000000000000000000000000000000..4afd592634f97e88eb5ee1e76d3bc17c633ec221 --- /dev/null +++ b/output_real_Qwen3-4B_-/final_adapters/latest @@ -0,0 +1 @@ +global_step912 \ No newline at end of file diff --git a/output_real_Qwen3-4B_-/final_adapters/merges.txt b/output_real_Qwen3-4B_-/final_adapters/merges.txt new file mode 100644 index 0000000000000000000000000000000000000000..80c1a19fae38f8f4c9ab32cc9d4e145c241147e6 --- /dev/null +++ b/output_real_Qwen3-4B_-/final_adapters/merges.txt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8831e4f1a044471340f7c0a83d7bd71306a5b867e95fd870f74d0c5308a904d5 +size 1671853 diff --git a/output_real_Qwen3-4B_-/final_adapters/rng_state_0.pth b/output_real_Qwen3-4B_-/final_adapters/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..246a8ba2df47d0428386c9cb6fe481b85ef0fbd2 --- /dev/null +++ b/output_real_Qwen3-4B_-/final_adapters/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:944814b8416a775767c2d5554eaf498fcb3b9eabc9421bc5e539229bc02e6d42 +size 14917 diff --git a/output_real_Qwen3-4B_-/final_adapters/rng_state_1.pth b/output_real_Qwen3-4B_-/final_adapters/rng_state_1.pth new file mode 100644 index 
0000000000000000000000000000000000000000..3d492dacb2c39fb597482331b4f6f4ba3cb23919 --- /dev/null +++ b/output_real_Qwen3-4B_-/final_adapters/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a0c933bfefb8f95545100b963dd1d5f3ecc7579953faaba48a0129afcdc4285 +size 14917 diff --git a/output_real_Qwen3-4B_-/final_adapters/special_tokens_map.json b/output_real_Qwen3-4B_-/final_adapters/special_tokens_map.json new file mode 100644 index 0000000000000000000000000000000000000000..ee3f6af3ba18b7d721f02bdf3fbca2814b7eda35 --- /dev/null +++ b/output_real_Qwen3-4B_-/final_adapters/special_tokens_map.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76862e765266b85aa9459767e33cbaf13970f327a0e88d1c65846c2ddd3a1ecd +size 613 diff --git a/output_real_Qwen3-4B_-/final_adapters/tokenizer.json b/output_real_Qwen3-4B_-/final_adapters/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..cd71f61a15a522601badb3dc960d800d9cb3766c --- /dev/null +++ b/output_real_Qwen3-4B_-/final_adapters/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aeb13307a71acd8fe81861d94ad54ab689df773318809eed3cbe794b4492dae4 +size 11422654 diff --git a/output_real_Qwen3-4B_-/final_adapters/tokenizer_config.json b/output_real_Qwen3-4B_-/final_adapters/tokenizer_config.json new file mode 100644 index 0000000000000000000000000000000000000000..5c0cfc2d0ad23392bd84cad162c5d524f389f509 --- /dev/null +++ b/output_real_Qwen3-4B_-/final_adapters/tokenizer_config.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:502723b70f4fd98e2ee7aa681501d73ed0cbebd40fa8bc6f0585a61c3a14e156 +size 5597 diff --git a/output_real_Qwen3-4B_-/final_adapters/trainer_state.json b/output_real_Qwen3-4B_-/final_adapters/trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..29951e60ff18ed21be11b76a1d60093ff08f1739 --- /dev/null +++ 
b/output_real_Qwen3-4B_-/final_adapters/trainer_state.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f572793c8560574d45448b7f4f12887274286c86ec3a258bd374982e1226435 +size 24979 diff --git a/output_real_Qwen3-4B_-/final_adapters/training_args.bin b/output_real_Qwen3-4B_-/final_adapters/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..0016dbc8c99357d1a3177558b3ce141136ea4c80 --- /dev/null +++ b/output_real_Qwen3-4B_-/final_adapters/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:344362c00cd71936c4828a55897fe77cd516512a502116f243d4e6cdd38d6a20 +size 7889 diff --git a/output_real_Qwen3-4B_-/final_adapters/vocab.json b/output_real_Qwen3-4B_-/final_adapters/vocab.json new file mode 100644 index 0000000000000000000000000000000000000000..6c49fc63bcb109de13abe49e58f85a4cdba7b679 --- /dev/null +++ b/output_real_Qwen3-4B_-/final_adapters/vocab.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca10d7e9fb3ed18575dd1e277a2579c16d108e32f27439684afa0e10b1440910 +size 2776833 diff --git a/output_rebl_Qwen3-4B_-/checkpoint-1035/README.md b/output_rebl_Qwen3-4B_-/checkpoint-1035/README.md new file mode 100644 index 0000000000000000000000000000000000000000..8a9591cde2bc956137b9f7d13e4fe8be718b6a61 --- /dev/null +++ b/output_rebl_Qwen3-4B_-/checkpoint-1035/README.md @@ -0,0 +1,202 @@ +--- +base_model: Qwen/Qwen3-4B +library_name: peft +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More 
Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). 
+ +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] +### Framework versions + +- PEFT 0.15.2 \ No newline at end of file diff --git a/output_rebl_Qwen3-4B_-/checkpoint-1035/adapter_config.json b/output_rebl_Qwen3-4B_-/checkpoint-1035/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..b7b5283e0a45eae761ecf7499b7d7e4dd8f8f10b --- /dev/null +++ b/output_rebl_Qwen3-4B_-/checkpoint-1035/adapter_config.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d184256a3ccb78e67ec3d01340569d527e9539de90a81532bdad51f881de2535 +size 828 diff --git a/output_rebl_Qwen3-4B_-/checkpoint-1035/adapter_model.safetensors b/output_rebl_Qwen3-4B_-/checkpoint-1035/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c99f9f723f5c92e88515c1d5272b2d8ee77d04c5 --- /dev/null +++ b/output_rebl_Qwen3-4B_-/checkpoint-1035/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d647b8296808701d549976fa684148dc3eba78efdc456ca8dd1aa587304ca79 +size 1579102000 diff --git a/output_rebl_Qwen3-4B_-/checkpoint-1035/added_tokens.json 
b/output_rebl_Qwen3-4B_-/checkpoint-1035/added_tokens.json new file mode 100644 index 0000000000000000000000000000000000000000..2b76afd7cb1e665182c309e62849419f75306b75 --- /dev/null +++ b/output_rebl_Qwen3-4B_-/checkpoint-1035/added_tokens.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0284b582e14987fbd3d5a2cb2bd139084371ed9acbae488829a1c900833c680 +size 707 diff --git a/output_rebl_Qwen3-4B_-/checkpoint-1035/chat_template.jinja b/output_rebl_Qwen3-4B_-/checkpoint-1035/chat_template.jinja new file mode 100644 index 0000000000000000000000000000000000000000..d85ff3045a68273657a9f871cdb9938c940b110b --- /dev/null +++ b/output_rebl_Qwen3-4B_-/checkpoint-1035/chat_template.jinja @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a55ee1b1660128b7098723e0abcd92caa0788061051c62d51cbe87d9cf1974d8 +size 4168 diff --git a/output_rebl_Qwen3-4B_-/checkpoint-1035/global_step1032/mp_rank_00_model_states.pt b/output_rebl_Qwen3-4B_-/checkpoint-1035/global_step1032/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6362e02b3b332134da9041b3eb2e7021fecee003 --- /dev/null +++ b/output_rebl_Qwen3-4B_-/checkpoint-1035/global_step1032/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe78e739e8bf9f3958e74a30c7d5cedd237c9ea380c5c9ac4ce9d9c1e522b37f +size 861285289 diff --git a/output_rebl_Qwen3-4B_-/checkpoint-1035/global_step1032/zero_pp_rank_0_mp_rank_00_optim_states.pt b/output_rebl_Qwen3-4B_-/checkpoint-1035/global_step1032/zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..15eccb36e753727208b47f8f198a6988ed9512e6 --- /dev/null +++ b/output_rebl_Qwen3-4B_-/checkpoint-1035/global_step1032/zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2334be832381d737d941775c795ea7d8955cc56c47c2c9eccb97b031fab0b9b4 +size 77884216 diff 
--git a/output_rebl_Qwen3-4B_-/checkpoint-1035/global_step1032/zero_pp_rank_1_mp_rank_00_optim_states.pt b/output_rebl_Qwen3-4B_-/checkpoint-1035/global_step1032/zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..66b499370717d0d262cd65f5c929ac68c0e266a0 --- /dev/null +++ b/output_rebl_Qwen3-4B_-/checkpoint-1035/global_step1032/zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:248848e440cf6e24a839c7fd606f5516fe2809168ffd86ceeceab81d5c40dfb3 +size 77884344 diff --git a/output_rebl_Qwen3-4B_-/checkpoint-1035/latest b/output_rebl_Qwen3-4B_-/checkpoint-1035/latest new file mode 100644 index 0000000000000000000000000000000000000000..3538f99680e03e3fad14811c9d3200f12088d2c6 --- /dev/null +++ b/output_rebl_Qwen3-4B_-/checkpoint-1035/latest @@ -0,0 +1 @@ +global_step1032 \ No newline at end of file diff --git a/output_rebl_Qwen3-4B_-/checkpoint-1035/merges.txt b/output_rebl_Qwen3-4B_-/checkpoint-1035/merges.txt new file mode 100644 index 0000000000000000000000000000000000000000..80c1a19fae38f8f4c9ab32cc9d4e145c241147e6 --- /dev/null +++ b/output_rebl_Qwen3-4B_-/checkpoint-1035/merges.txt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8831e4f1a044471340f7c0a83d7bd71306a5b867e95fd870f74d0c5308a904d5 +size 1671853 diff --git a/output_rebl_Qwen3-4B_-/checkpoint-1035/rng_state_0.pth b/output_rebl_Qwen3-4B_-/checkpoint-1035/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..3c4236def5058e1efb6d71067990c10d44dbd42a --- /dev/null +++ b/output_rebl_Qwen3-4B_-/checkpoint-1035/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:876bf0fbe24bcb8506396ee76938d3a592dbe9f9b16c3de1438f17c923d1e8c7 +size 14917 diff --git a/output_rebl_Qwen3-4B_-/checkpoint-1035/rng_state_1.pth b/output_rebl_Qwen3-4B_-/checkpoint-1035/rng_state_1.pth new file mode 100644 index 
0000000000000000000000000000000000000000..1312b612db59cfdfc0ac0abfa8ff151db836dbb0 --- /dev/null +++ b/output_rebl_Qwen3-4B_-/checkpoint-1035/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:590ef6934ae2b8a56ad089ee4dd7b36cc24dc03812deecd58355d8bddfeaf719 +size 14917 diff --git a/output_rebl_Qwen3-4B_-/checkpoint-1035/special_tokens_map.json b/output_rebl_Qwen3-4B_-/checkpoint-1035/special_tokens_map.json new file mode 100644 index 0000000000000000000000000000000000000000..ee3f6af3ba18b7d721f02bdf3fbca2814b7eda35 --- /dev/null +++ b/output_rebl_Qwen3-4B_-/checkpoint-1035/special_tokens_map.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76862e765266b85aa9459767e33cbaf13970f327a0e88d1c65846c2ddd3a1ecd +size 613 diff --git a/output_rebl_Qwen3-4B_-/checkpoint-1035/tokenizer.json b/output_rebl_Qwen3-4B_-/checkpoint-1035/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..cd71f61a15a522601badb3dc960d800d9cb3766c --- /dev/null +++ b/output_rebl_Qwen3-4B_-/checkpoint-1035/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aeb13307a71acd8fe81861d94ad54ab689df773318809eed3cbe794b4492dae4 +size 11422654 diff --git a/output_rebl_Qwen3-4B_-/checkpoint-1035/tokenizer_config.json b/output_rebl_Qwen3-4B_-/checkpoint-1035/tokenizer_config.json new file mode 100644 index 0000000000000000000000000000000000000000..0d8ad241b789c1419579e4b54e31b0befbad9882 --- /dev/null +++ b/output_rebl_Qwen3-4B_-/checkpoint-1035/tokenizer_config.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:443bfa629eb16387a12edbf92a76f6a6f10b2af3b53d87ba1550adfcf45f7fa0 +size 5404 diff --git a/output_rebl_Qwen3-4B_-/checkpoint-1035/trainer_state.json b/output_rebl_Qwen3-4B_-/checkpoint-1035/trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..2cd937a48eaf6f0cefc0d1ba4109f8ba5d14ac65 --- /dev/null +++ 
b/output_rebl_Qwen3-4B_-/checkpoint-1035/trainer_state.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:564ffd60e1f2c750b71ca211c56f0c90b71b559cbe640835014488a4e0207208 +size 27999 diff --git a/output_rebl_Qwen3-4B_-/checkpoint-1035/training_args.bin b/output_rebl_Qwen3-4B_-/checkpoint-1035/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..18fe4e7ff998c19517bc692d9827aaa0ba935a08 --- /dev/null +++ b/output_rebl_Qwen3-4B_-/checkpoint-1035/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34a8ae223a9be91f945faad6045997f8a35870054555f96eb02fccba0cd4f86a +size 7889 diff --git a/output_rebl_Qwen3-4B_-/checkpoint-1035/vocab.json b/output_rebl_Qwen3-4B_-/checkpoint-1035/vocab.json new file mode 100644 index 0000000000000000000000000000000000000000..6c49fc63bcb109de13abe49e58f85a4cdba7b679 --- /dev/null +++ b/output_rebl_Qwen3-4B_-/checkpoint-1035/vocab.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca10d7e9fb3ed18575dd1e277a2579c16d108e32f27439684afa0e10b1440910 +size 2776833 diff --git a/output_rebl_Qwen3-4B_-/checkpoint-1048/README.md b/output_rebl_Qwen3-4B_-/checkpoint-1048/README.md new file mode 100644 index 0000000000000000000000000000000000000000..8a9591cde2bc956137b9f7d13e4fe8be718b6a61 --- /dev/null +++ b/output_rebl_Qwen3-4B_-/checkpoint-1048/README.md @@ -0,0 +1,202 @@ +--- +base_model: Qwen/Qwen3-4B +library_name: peft +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** 
[More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). 
+ +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] +### Framework versions + +- PEFT 0.15.2 \ No newline at end of file diff --git a/output_rebl_Qwen3-4B_-/checkpoint-1048/adapter_config.json b/output_rebl_Qwen3-4B_-/checkpoint-1048/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..b7b5283e0a45eae761ecf7499b7d7e4dd8f8f10b --- /dev/null +++ b/output_rebl_Qwen3-4B_-/checkpoint-1048/adapter_config.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d184256a3ccb78e67ec3d01340569d527e9539de90a81532bdad51f881de2535 +size 828 diff --git a/output_rebl_Qwen3-4B_-/checkpoint-1048/adapter_model.safetensors b/output_rebl_Qwen3-4B_-/checkpoint-1048/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7a20aed6aa651555e8a90ae63e8e9f80dda81f17 --- /dev/null +++ b/output_rebl_Qwen3-4B_-/checkpoint-1048/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5c783ab89caa80dfdf7dea43c5a199de2c4acab7347ede72abaef30316c4273 +size 1579102000 diff --git a/output_rebl_Qwen3-4B_-/checkpoint-1048/added_tokens.json 
b/output_rebl_Qwen3-4B_-/checkpoint-1048/added_tokens.json new file mode 100644 index 0000000000000000000000000000000000000000..2b76afd7cb1e665182c309e62849419f75306b75 --- /dev/null +++ b/output_rebl_Qwen3-4B_-/checkpoint-1048/added_tokens.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0284b582e14987fbd3d5a2cb2bd139084371ed9acbae488829a1c900833c680 +size 707 diff --git a/output_rebl_Qwen3-4B_-/checkpoint-1048/chat_template.jinja b/output_rebl_Qwen3-4B_-/checkpoint-1048/chat_template.jinja new file mode 100644 index 0000000000000000000000000000000000000000..d85ff3045a68273657a9f871cdb9938c940b110b --- /dev/null +++ b/output_rebl_Qwen3-4B_-/checkpoint-1048/chat_template.jinja @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a55ee1b1660128b7098723e0abcd92caa0788061051c62d51cbe87d9cf1974d8 +size 4168 diff --git a/output_rebl_Qwen3-4B_-/checkpoint-1048/global_step1044/mp_rank_00_model_states.pt b/output_rebl_Qwen3-4B_-/checkpoint-1048/global_step1044/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bbaba3f7de5a4e67eb64c1e98c5cb7e6f3c91cf7 --- /dev/null +++ b/output_rebl_Qwen3-4B_-/checkpoint-1048/global_step1044/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd2e71a447787ee55d58d2311a1dc78976a45abed630db44172bc8340540c5d7 +size 861285289 diff --git a/output_rebl_Qwen3-4B_-/checkpoint-1048/global_step1044/zero_pp_rank_0_mp_rank_00_optim_states.pt b/output_rebl_Qwen3-4B_-/checkpoint-1048/global_step1044/zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8c44e09fe676a3fc15b09233159bd9ab5f98473f --- /dev/null +++ b/output_rebl_Qwen3-4B_-/checkpoint-1048/global_step1044/zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24a5f838f005f6377c1b2abe762849c2f1dd8cec99c13ba7916e3915710cdc07 +size 77884216 diff 
--git a/output_rebl_Qwen3-4B_-/checkpoint-1048/global_step1044/zero_pp_rank_1_mp_rank_00_optim_states.pt b/output_rebl_Qwen3-4B_-/checkpoint-1048/global_step1044/zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f3b276096f0060869e8c62a40bf635e45d636c96 --- /dev/null +++ b/output_rebl_Qwen3-4B_-/checkpoint-1048/global_step1044/zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6fffdb1c7954dbf544aa1f47483edf8e69a610f8ac7d5518ee113db85f764157 +size 77884344 diff --git a/output_rebl_Qwen3-4B_-/checkpoint-1048/latest b/output_rebl_Qwen3-4B_-/checkpoint-1048/latest new file mode 100644 index 0000000000000000000000000000000000000000..8366bde0d0ef46840ff7aa246ce10c00aa687a4f --- /dev/null +++ b/output_rebl_Qwen3-4B_-/checkpoint-1048/latest @@ -0,0 +1 @@ +global_step1044 \ No newline at end of file diff --git a/output_rebl_Qwen3-4B_-/checkpoint-1048/merges.txt b/output_rebl_Qwen3-4B_-/checkpoint-1048/merges.txt new file mode 100644 index 0000000000000000000000000000000000000000..80c1a19fae38f8f4c9ab32cc9d4e145c241147e6 --- /dev/null +++ b/output_rebl_Qwen3-4B_-/checkpoint-1048/merges.txt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8831e4f1a044471340f7c0a83d7bd71306a5b867e95fd870f74d0c5308a904d5 +size 1671853 diff --git a/output_rebl_Qwen3-4B_-/checkpoint-1048/rng_state_0.pth b/output_rebl_Qwen3-4B_-/checkpoint-1048/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..aa118eee87ca87233f24e825029f9a24b6821f54 --- /dev/null +++ b/output_rebl_Qwen3-4B_-/checkpoint-1048/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3db4c2f80214125b304f49690bfe031506e958bb4b1a0939dd03ce3f71475d22 +size 14917 diff --git a/output_rebl_Qwen3-4B_-/checkpoint-1048/rng_state_1.pth b/output_rebl_Qwen3-4B_-/checkpoint-1048/rng_state_1.pth new file mode 100644 index 
0000000000000000000000000000000000000000..25f6eb4eb1c1ae000d91480f1e1cdeb3cde4995e --- /dev/null +++ b/output_rebl_Qwen3-4B_-/checkpoint-1048/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:87e3e54ba094194e2a96483bac1fe434e826538a0d5d07b07f209b50f68c2bc9 +size 14917 diff --git a/output_rebl_Qwen3-4B_-/checkpoint-1048/special_tokens_map.json b/output_rebl_Qwen3-4B_-/checkpoint-1048/special_tokens_map.json new file mode 100644 index 0000000000000000000000000000000000000000..ee3f6af3ba18b7d721f02bdf3fbca2814b7eda35 --- /dev/null +++ b/output_rebl_Qwen3-4B_-/checkpoint-1048/special_tokens_map.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76862e765266b85aa9459767e33cbaf13970f327a0e88d1c65846c2ddd3a1ecd +size 613 diff --git a/output_rebl_Qwen3-4B_-/checkpoint-1048/tokenizer.json b/output_rebl_Qwen3-4B_-/checkpoint-1048/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..cd71f61a15a522601badb3dc960d800d9cb3766c --- /dev/null +++ b/output_rebl_Qwen3-4B_-/checkpoint-1048/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aeb13307a71acd8fe81861d94ad54ab689df773318809eed3cbe794b4492dae4 +size 11422654 diff --git a/output_rebl_Qwen3-4B_-/checkpoint-1048/tokenizer_config.json b/output_rebl_Qwen3-4B_-/checkpoint-1048/tokenizer_config.json new file mode 100644 index 0000000000000000000000000000000000000000..0d8ad241b789c1419579e4b54e31b0befbad9882 --- /dev/null +++ b/output_rebl_Qwen3-4B_-/checkpoint-1048/tokenizer_config.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:443bfa629eb16387a12edbf92a76f6a6f10b2af3b53d87ba1550adfcf45f7fa0 +size 5404 diff --git a/output_rebl_Qwen3-4B_-/checkpoint-1048/trainer_state.json b/output_rebl_Qwen3-4B_-/checkpoint-1048/trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..2f65cc01bd998ef0c8da13dd85667f3326be8e33 --- /dev/null +++ 
b/output_rebl_Qwen3-4B_-/checkpoint-1048/trainer_state.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e365120b416d34e6fc0e5d5efa90a372c23d1bbd5e1771807418a81fd9b1fbc +size 27983 diff --git a/output_rebl_Qwen3-4B_-/checkpoint-1048/training_args.bin b/output_rebl_Qwen3-4B_-/checkpoint-1048/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..18fe4e7ff998c19517bc692d9827aaa0ba935a08 --- /dev/null +++ b/output_rebl_Qwen3-4B_-/checkpoint-1048/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34a8ae223a9be91f945faad6045997f8a35870054555f96eb02fccba0cd4f86a +size 7889 diff --git a/output_rebl_Qwen3-4B_-/checkpoint-1048/vocab.json b/output_rebl_Qwen3-4B_-/checkpoint-1048/vocab.json new file mode 100644 index 0000000000000000000000000000000000000000..6c49fc63bcb109de13abe49e58f85a4cdba7b679 --- /dev/null +++ b/output_rebl_Qwen3-4B_-/checkpoint-1048/vocab.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca10d7e9fb3ed18575dd1e277a2579c16d108e32f27439684afa0e10b1440910 +size 2776833 diff --git a/output_rebl_Qwen3-4B_-/checkpoint-600/README.md b/output_rebl_Qwen3-4B_-/checkpoint-600/README.md new file mode 100644 index 0000000000000000000000000000000000000000..8a9591cde2bc956137b9f7d13e4fe8be718b6a61 --- /dev/null +++ b/output_rebl_Qwen3-4B_-/checkpoint-600/README.md @@ -0,0 +1,202 @@ +--- +base_model: Qwen/Qwen3-4B +library_name: peft +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More 
Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). 
+ +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] +### Framework versions + +- PEFT 0.15.2 \ No newline at end of file diff --git a/output_rebl_Qwen3-4B_-/checkpoint-600/adapter_config.json b/output_rebl_Qwen3-4B_-/checkpoint-600/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..b7b5283e0a45eae761ecf7499b7d7e4dd8f8f10b --- /dev/null +++ b/output_rebl_Qwen3-4B_-/checkpoint-600/adapter_config.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d184256a3ccb78e67ec3d01340569d527e9539de90a81532bdad51f881de2535 +size 828 diff --git a/output_rebl_Qwen3-4B_-/checkpoint-600/adapter_model.safetensors b/output_rebl_Qwen3-4B_-/checkpoint-600/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..bbd4b89e8d8f3ff27fa9552be188c3246a157133 --- /dev/null +++ b/output_rebl_Qwen3-4B_-/checkpoint-600/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ae45d20e708f57e03e68a15392e4cb668ed5476039899b1f6b932f27446ffa3 +size 1579102000 diff --git a/output_rebl_Qwen3-4B_-/checkpoint-600/added_tokens.json 
b/output_rebl_Qwen3-4B_-/checkpoint-600/added_tokens.json new file mode 100644 index 0000000000000000000000000000000000000000..2b76afd7cb1e665182c309e62849419f75306b75 --- /dev/null +++ b/output_rebl_Qwen3-4B_-/checkpoint-600/added_tokens.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0284b582e14987fbd3d5a2cb2bd139084371ed9acbae488829a1c900833c680 +size 707 diff --git a/output_rebl_Qwen3-4B_-/checkpoint-600/chat_template.jinja b/output_rebl_Qwen3-4B_-/checkpoint-600/chat_template.jinja new file mode 100644 index 0000000000000000000000000000000000000000..d85ff3045a68273657a9f871cdb9938c940b110b --- /dev/null +++ b/output_rebl_Qwen3-4B_-/checkpoint-600/chat_template.jinja @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a55ee1b1660128b7098723e0abcd92caa0788061051c62d51cbe87d9cf1974d8 +size 4168 diff --git a/output_rebl_Qwen3-4B_-/checkpoint-600/global_step598/mp_rank_00_model_states.pt b/output_rebl_Qwen3-4B_-/checkpoint-600/global_step598/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cdba7fc26376e73d0aee190e2dcdc0b49cb4d644 --- /dev/null +++ b/output_rebl_Qwen3-4B_-/checkpoint-600/global_step598/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93d025b029701ae8b965bdfe0fac84f4e090059b48bd263dc246d0dd1434fd3b +size 861285289 diff --git a/output_rebl_Qwen3-4B_-/checkpoint-600/global_step598/zero_pp_rank_0_mp_rank_00_optim_states.pt b/output_rebl_Qwen3-4B_-/checkpoint-600/global_step598/zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4474ed03fe9e63ac1ce289c1a36eee3185fcfaf6 --- /dev/null +++ b/output_rebl_Qwen3-4B_-/checkpoint-600/global_step598/zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b11ea28101c9bc3d1d6fa487d2bf32a97bcbe741b4c70d07fb30cea107a76e12 +size 77884216 diff --git 
a/output_rebl_Qwen3-4B_-/checkpoint-600/global_step598/zero_pp_rank_1_mp_rank_00_optim_states.pt b/output_rebl_Qwen3-4B_-/checkpoint-600/global_step598/zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6fd77d73430ed12ba850838e80b62c14d1767b61 --- /dev/null +++ b/output_rebl_Qwen3-4B_-/checkpoint-600/global_step598/zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27e9767a2e4144e3720702c344c97d657b12342f1b30f189d68eb7ae746bf625 +size 77884344 diff --git a/output_rebl_Qwen3-4B_-/checkpoint-600/latest b/output_rebl_Qwen3-4B_-/checkpoint-600/latest new file mode 100644 index 0000000000000000000000000000000000000000..8a87fdc3e8d4d236bfa15c87e3acae6c027d8460 --- /dev/null +++ b/output_rebl_Qwen3-4B_-/checkpoint-600/latest @@ -0,0 +1 @@ +global_step598 \ No newline at end of file diff --git a/output_rebl_Qwen3-4B_-/checkpoint-600/merges.txt b/output_rebl_Qwen3-4B_-/checkpoint-600/merges.txt new file mode 100644 index 0000000000000000000000000000000000000000..80c1a19fae38f8f4c9ab32cc9d4e145c241147e6 --- /dev/null +++ b/output_rebl_Qwen3-4B_-/checkpoint-600/merges.txt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8831e4f1a044471340f7c0a83d7bd71306a5b867e95fd870f74d0c5308a904d5 +size 1671853 diff --git a/output_rebl_Qwen3-4B_-/checkpoint-600/rng_state_0.pth b/output_rebl_Qwen3-4B_-/checkpoint-600/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..6ff5067e8b4bc450582e1de3ff927bdf0377fbe5 --- /dev/null +++ b/output_rebl_Qwen3-4B_-/checkpoint-600/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ece0abc7d34d1ee03c932f7b5e479bf879e95f92fc9145f523eccc0bb971fd27 +size 14917 diff --git a/output_rebl_Qwen3-4B_-/checkpoint-600/rng_state_1.pth b/output_rebl_Qwen3-4B_-/checkpoint-600/rng_state_1.pth new file mode 100644 index 
0000000000000000000000000000000000000000..dcd47e6236c8bfb05b5fc5f581871db0d2e29cab --- /dev/null +++ b/output_rebl_Qwen3-4B_-/checkpoint-600/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71b8cbba5464b76fa408b0607e24d63d94f22a289c6b69eb3afd9470827eb5d9 +size 14917 diff --git a/output_rebl_Qwen3-4B_-/checkpoint-600/special_tokens_map.json b/output_rebl_Qwen3-4B_-/checkpoint-600/special_tokens_map.json new file mode 100644 index 0000000000000000000000000000000000000000..ee3f6af3ba18b7d721f02bdf3fbca2814b7eda35 --- /dev/null +++ b/output_rebl_Qwen3-4B_-/checkpoint-600/special_tokens_map.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76862e765266b85aa9459767e33cbaf13970f327a0e88d1c65846c2ddd3a1ecd +size 613 diff --git a/output_rebl_Qwen3-4B_-/checkpoint-600/tokenizer.json b/output_rebl_Qwen3-4B_-/checkpoint-600/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..cd71f61a15a522601badb3dc960d800d9cb3766c --- /dev/null +++ b/output_rebl_Qwen3-4B_-/checkpoint-600/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aeb13307a71acd8fe81861d94ad54ab689df773318809eed3cbe794b4492dae4 +size 11422654 diff --git a/output_rebl_Qwen3-4B_-/checkpoint-600/tokenizer_config.json b/output_rebl_Qwen3-4B_-/checkpoint-600/tokenizer_config.json new file mode 100644 index 0000000000000000000000000000000000000000..0d8ad241b789c1419579e4b54e31b0befbad9882 --- /dev/null +++ b/output_rebl_Qwen3-4B_-/checkpoint-600/tokenizer_config.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:443bfa629eb16387a12edbf92a76f6a6f10b2af3b53d87ba1550adfcf45f7fa0 +size 5404 diff --git a/output_rebl_Qwen3-4B_-/checkpoint-600/trainer_state.json b/output_rebl_Qwen3-4B_-/checkpoint-600/trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..7449b0116dc15d8022733d17c2b298ef7fede4dc --- /dev/null +++ 
b/output_rebl_Qwen3-4B_-/checkpoint-600/trainer_state.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea7707b696281d347f128bec1ce355a05a4637fff8c7384f28433e8ecfbad576 +size 16649 diff --git a/output_rebl_Qwen3-4B_-/checkpoint-600/training_args.bin b/output_rebl_Qwen3-4B_-/checkpoint-600/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..18fe4e7ff998c19517bc692d9827aaa0ba935a08 --- /dev/null +++ b/output_rebl_Qwen3-4B_-/checkpoint-600/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34a8ae223a9be91f945faad6045997f8a35870054555f96eb02fccba0cd4f86a +size 7889 diff --git a/output_rebl_Qwen3-4B_-/checkpoint-600/vocab.json b/output_rebl_Qwen3-4B_-/checkpoint-600/vocab.json new file mode 100644 index 0000000000000000000000000000000000000000..6c49fc63bcb109de13abe49e58f85a4cdba7b679 --- /dev/null +++ b/output_rebl_Qwen3-4B_-/checkpoint-600/vocab.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca10d7e9fb3ed18575dd1e277a2579c16d108e32f27439684afa0e10b1440910 +size 2776833 diff --git a/output_rebl_Qwen3-4B_-/final_adapters/README.md b/output_rebl_Qwen3-4B_-/final_adapters/README.md new file mode 100644 index 0000000000000000000000000000000000000000..8a9591cde2bc956137b9f7d13e4fe8be718b6a61 --- /dev/null +++ b/output_rebl_Qwen3-4B_-/final_adapters/README.md @@ -0,0 +1,202 @@ +--- +base_model: Qwen/Qwen3-4B +library_name: peft +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More 
Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). 
+ +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] +### Framework versions + +- PEFT 0.15.2 \ No newline at end of file diff --git a/output_rebl_Qwen3-4B_-/final_adapters/adapter_config.json b/output_rebl_Qwen3-4B_-/final_adapters/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..b7b5283e0a45eae761ecf7499b7d7e4dd8f8f10b --- /dev/null +++ b/output_rebl_Qwen3-4B_-/final_adapters/adapter_config.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d184256a3ccb78e67ec3d01340569d527e9539de90a81532bdad51f881de2535 +size 828 diff --git a/output_rebl_Qwen3-4B_-/final_adapters/adapter_model.safetensors b/output_rebl_Qwen3-4B_-/final_adapters/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..bbd4b89e8d8f3ff27fa9552be188c3246a157133 --- /dev/null +++ b/output_rebl_Qwen3-4B_-/final_adapters/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ae45d20e708f57e03e68a15392e4cb668ed5476039899b1f6b932f27446ffa3 +size 1579102000 diff --git a/output_rebl_Qwen3-4B_-/final_adapters/added_tokens.json 
b/output_rebl_Qwen3-4B_-/final_adapters/added_tokens.json new file mode 100644 index 0000000000000000000000000000000000000000..2b76afd7cb1e665182c309e62849419f75306b75 --- /dev/null +++ b/output_rebl_Qwen3-4B_-/final_adapters/added_tokens.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0284b582e14987fbd3d5a2cb2bd139084371ed9acbae488829a1c900833c680 +size 707 diff --git a/output_rebl_Qwen3-4B_-/final_adapters/chat_template.jinja b/output_rebl_Qwen3-4B_-/final_adapters/chat_template.jinja new file mode 100644 index 0000000000000000000000000000000000000000..d85ff3045a68273657a9f871cdb9938c940b110b --- /dev/null +++ b/output_rebl_Qwen3-4B_-/final_adapters/chat_template.jinja @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a55ee1b1660128b7098723e0abcd92caa0788061051c62d51cbe87d9cf1974d8 +size 4168 diff --git a/output_rebl_Qwen3-4B_-/final_adapters/merges.txt b/output_rebl_Qwen3-4B_-/final_adapters/merges.txt new file mode 100644 index 0000000000000000000000000000000000000000..80c1a19fae38f8f4c9ab32cc9d4e145c241147e6 --- /dev/null +++ b/output_rebl_Qwen3-4B_-/final_adapters/merges.txt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8831e4f1a044471340f7c0a83d7bd71306a5b867e95fd870f74d0c5308a904d5 +size 1671853 diff --git a/output_rebl_Qwen3-4B_-/final_adapters/special_tokens_map.json b/output_rebl_Qwen3-4B_-/final_adapters/special_tokens_map.json new file mode 100644 index 0000000000000000000000000000000000000000..ee3f6af3ba18b7d721f02bdf3fbca2814b7eda35 --- /dev/null +++ b/output_rebl_Qwen3-4B_-/final_adapters/special_tokens_map.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76862e765266b85aa9459767e33cbaf13970f327a0e88d1c65846c2ddd3a1ecd +size 613 diff --git a/output_rebl_Qwen3-4B_-/final_adapters/tokenizer.json b/output_rebl_Qwen3-4B_-/final_adapters/tokenizer.json new file mode 100644 index 
0000000000000000000000000000000000000000..cd71f61a15a522601badb3dc960d800d9cb3766c --- /dev/null +++ b/output_rebl_Qwen3-4B_-/final_adapters/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aeb13307a71acd8fe81861d94ad54ab689df773318809eed3cbe794b4492dae4 +size 11422654 diff --git a/output_rebl_Qwen3-4B_-/final_adapters/tokenizer_config.json b/output_rebl_Qwen3-4B_-/final_adapters/tokenizer_config.json new file mode 100644 index 0000000000000000000000000000000000000000..0d8ad241b789c1419579e4b54e31b0befbad9882 --- /dev/null +++ b/output_rebl_Qwen3-4B_-/final_adapters/tokenizer_config.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:443bfa629eb16387a12edbf92a76f6a6f10b2af3b53d87ba1550adfcf45f7fa0 +size 5404 diff --git a/output_rebl_Qwen3-4B_-/final_adapters/training_args.bin b/output_rebl_Qwen3-4B_-/final_adapters/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..18fe4e7ff998c19517bc692d9827aaa0ba935a08 --- /dev/null +++ b/output_rebl_Qwen3-4B_-/final_adapters/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34a8ae223a9be91f945faad6045997f8a35870054555f96eb02fccba0cd4f86a +size 7889 diff --git a/output_rebl_Qwen3-4B_-/final_adapters/vocab.json b/output_rebl_Qwen3-4B_-/final_adapters/vocab.json new file mode 100644 index 0000000000000000000000000000000000000000..6c49fc63bcb109de13abe49e58f85a4cdba7b679 --- /dev/null +++ b/output_rebl_Qwen3-4B_-/final_adapters/vocab.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca10d7e9fb3ed18575dd1e277a2579c16d108e32f27439684afa0e10b1440910 +size 2776833