Spaces:
Paused
Paused
Commit
·
4a4b568
1
Parent(s):
c3fb598
Amended quickstart.py for better memory allocation
Browse files
- app.py +0 -1
- quickstart.py +2 -0
app.py
CHANGED
@@ -2,7 +2,6 @@ import os
|
|
2 |
import gradio as gr
|
3 |
|
4 |
api_key = os.getenv("HF_TOKEN")
|
5 |
-
os.environ["PYTORCH_CUDA_ALLOC_CONF"] = "expandable_segments:True"
|
6 |
def start_training():
|
7 |
os.system("python quickstart.py --model_name_or_path Qwen/Qwen3-0.6B --train_data_dir trl-lib/Capybara --api_key HF_TOKEN" )
|
8 |
return "Evaluation completed!"
|
|
|
2 |
import gradio as gr
|
3 |
|
4 |
api_key = os.getenv("HF_TOKEN")
|
|
|
5 |
def start_training():
|
6 |
os.system("python quickstart.py --model_name_or_path Qwen/Qwen3-0.6B --train_data_dir trl-lib/Capybara --api_key HF_TOKEN" )
|
7 |
return "Evaluation completed!"
|
quickstart.py
CHANGED
@@ -1,7 +1,9 @@
|
|
|
|
1 |
from trl import SFTTrainer
|
2 |
from datasets import load_dataset
|
3 |
|
4 |
dataset = load_dataset("trl-lib/Capybara", split="train")
|
|
|
5 |
|
6 |
trainer = SFTTrainer(
|
7 |
model="Qwen/Qwen3-0.6B",
|
|
|
1 |
+
import os
|
2 |
from trl import SFTTrainer
|
3 |
from datasets import load_dataset
|
4 |
|
5 |
dataset = load_dataset("trl-lib/Capybara", split="train")
|
6 |
+
os.environ["PYTORCH_CUDA_ALLOC_CONF"] = "expandable_segments:True"
|
7 |
|
8 |
trainer = SFTTrainer(
|
9 |
model="Qwen/Qwen3-0.6B",
|