AnilNiraula committed on
Commit
8568b7c
·
verified ·
1 Parent(s): 063ed37

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +1 -1
app.py CHANGED
@@ -200,7 +200,7 @@ try:
200
  logger.info(f"Loading model {model_name}")
201
  model = AutoModelForCausalLM.from_pretrained(
202
  model_name,
203
- torch_dtype=torch.float16,
204
  low_cpu_mem_usage=True
205
  )
206
  # Quantize the model for faster CPU inference
 
200
  logger.info(f"Loading model {model_name}")
201
  model = AutoModelForCausalLM.from_pretrained(
202
  model_name,
203
+ torch_dtype=torch.float32, # Changed to float32 to avoid Half/Float mismatch
204
  low_cpu_mem_usage=True
205
  )
206
  # Quantize the model for faster CPU inference