AnilNiraula committed on
Commit
b8b4293
·
verified ·
1 Parent(s): 804eca3

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +1 -1
app.py CHANGED
@@ -115,7 +115,7 @@ def generate_response(user_query, enable_thinking=False):
115
  model_inputs = tokenizer([text], return_tensors="pt").to(model.device)
116
  generated_ids = model.generate(
117
  **model_inputs,
118
- max_new_tokens=50, # Reduced for faster generation
119
  temperature=0.6,
120
  top_p=0.95,
121
  repetition_penalty=1.0, # Set to 1.0 to avoid overhead
 
115
  model_inputs = tokenizer([text], return_tensors="pt").to(model.device)
116
  generated_ids = model.generate(
117
  **model_inputs,
118
+ max_new_tokens=100, # Raised from 50 to allow longer responses (slower generation)
119
  temperature=0.6,
120
  top_p=0.95,
121
  repetition_penalty=1.0, # Set to 1.0 to avoid overhead