Spaces: Paused
Update src/model_loader.py
Browse files
- src/model_loader.py +1 -1
src/model_loader.py
CHANGED
@@ -15,6 +15,6 @@ def load_model():
|
|
15 |
bnb_4bit_quant_type="nf4",
|
16 |
bnb_4bit_compute_dtype=torch.bfloat16
|
17 |
)
|
18 |
-
cached_model = AutoModelForCausalLM.from_pretrained(MODEL_NAME
|
19 |
cached_tokenizer = AutoTokenizer.from_pretrained(MODEL_NAME)
|
20 |
return cached_model, cached_tokenizer
|
|
|
15 |
bnb_4bit_quant_type="nf4",
|
16 |
bnb_4bit_compute_dtype=torch.bfloat16
|
17 |
)
|
18 |
+
cached_model = AutoModelForCausalLM.from_pretrained(MODEL_NAME, quantization_config=bnb_config) #
|
19 |
cached_tokenizer = AutoTokenizer.from_pretrained(MODEL_NAME)
|
20 |
return cached_model, cached_tokenizer
|