Toadoum committed on
Commit
c3a97cb
·
verified ·
1 Parent(s): de54455

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +2 -1
app.py CHANGED
@@ -41,7 +41,8 @@ tokenizer = AutoTokenizer.from_pretrained(MODEL_REPO)
41
 
42
  # Load model with appropriate dtype and device
43
  model_kwargs = {"torch_dtype": torch.float16} if device == "cuda" else {}
44
- model = AutoModelForSeq2SeqLM.from_pretrained(MODEL_REPO, **model_kwargs).to(device)
 
45
  print(f"Model loaded on: {model.device}")
46
 
47
  # Ensure a pad token to avoid generate() quirks
 
41
 
42
  # Load model with appropriate dtype and device
43
  model_kwargs = {"torch_dtype": torch.float16} if device == "cuda" else {}
44
+ model = AutoModelForSeq2SeqLM.from_pretrained(MODEL_REPO, **model_kwargs)
45
+ model = model.to(device) # Move model to device after full loading
46
  print(f"Model loaded on: {model.device}")
47
 
48
  # Ensure a pad token to avoid generate() quirks