Spaces:
Running
Running
Update app.py
Browse files
app.py
CHANGED
@@ -115,7 +115,7 @@ def generate_response(user_query, enable_thinking=False):
|
|
115 |
model_inputs = tokenizer([text], return_tensors="pt").to(model.device)
|
116 |
generated_ids = model.generate(
|
117 |
**model_inputs,
|
118 |
-
max_new_tokens=
|
119 |
temperature=0.6,
|
120 |
top_p=0.95,
|
121 |
repetition_penalty=1.0, # Set to 1.0 to avoid overhead
|
|
|
115 |
model_inputs = tokenizer([text], return_tensors="pt").to(model.device)
|
116 |
generated_ids = model.generate(
|
117 |
**model_inputs,
|
118 |
+
max_new_tokens=100, # Reduced for faster generation
|
119 |
temperature=0.6,
|
120 |
top_p=0.95,
|
121 |
repetition_penalty=1.0, # Set to 1.0 to avoid overhead
|