Spaces:
Running
on
Zero
Running
on
Zero
Update app.py
Browse files
app.py
CHANGED
@@ -1,5 +1,3 @@
|
|
1 |
-
# LoRA Inference Gradio Space Demo
|
2 |
-
|
3 |
import spaces
|
4 |
import gradio as gr
|
5 |
from peft import PeftModel
|
@@ -22,6 +20,7 @@ model = PeftModel.from_pretrained(
|
|
22 |
# Load the tokenizer
|
23 |
tokenizer = AutoTokenizer.from_pretrained("unsloth/qwen2.5-3b-instruct-unsloth-bnb-4bit")
|
24 |
|
|
|
25 |
def generate_response(prompt):
|
26 |
reasoning_prompt = (
|
27 |
"Answer the following question and explain your reasoning step by step.\n"
|
|
|
|
|
|
|
1 |
import spaces
|
2 |
import gradio as gr
|
3 |
from peft import PeftModel
|
|
|
20 |
# Load the tokenizer
|
21 |
tokenizer = AutoTokenizer.from_pretrained("unsloth/qwen2.5-3b-instruct-unsloth-bnb-4bit")
|
22 |
|
23 |
+
@spaces.GPU
|
24 |
def generate_response(prompt):
|
25 |
reasoning_prompt = (
|
26 |
"Answer the following question and explain your reasoning step by step.\n"
|