Spaces:
Running
Running
Update app.py
Browse files
app.py
CHANGED
|
@@ -200,7 +200,7 @@ try:
|
|
| 200 |
logger.info(f"Loading model {model_name}")
|
| 201 |
model = AutoModelForCausalLM.from_pretrained(
|
| 202 |
model_name,
|
| 203 |
-
torch_dtype=torch.float16,
|
| 204 |
low_cpu_mem_usage=True
|
| 205 |
)
|
| 206 |
# Quantize the model for faster CPU inference
|
|
|
|
| 200 |
logger.info(f"Loading model {model_name}")
|
| 201 |
model = AutoModelForCausalLM.from_pretrained(
|
| 202 |
model_name,
|
| 203 |
+
torch_dtype=torch.float32, # Changed to float32 to avoid Half/Float mismatch
|
| 204 |
low_cpu_mem_usage=True
|
| 205 |
)
|
| 206 |
# Quantize the model for faster CPU inference
|