Yadukrishnan committed on
Commit
9b175f9
·
verified ·
1 Parent(s): 8eed7bd

Update src/model_loader.py

Browse files
Files changed (1) hide show
  1. src/model_loader.py +1 -1
src/model_loader.py CHANGED
@@ -15,6 +15,6 @@ def load_model():
15
  bnb_4bit_quant_type="nf4",
16
  bnb_4bit_compute_dtype=torch.bfloat16
17
  )
18
- cached_model = AutoModelForCausalLM.from_pretrained(MODEL_NAME) #, quantization_config=bnb_config
19
  cached_tokenizer = AutoTokenizer.from_pretrained(MODEL_NAME)
20
  return cached_model, cached_tokenizer
 
15
  bnb_4bit_quant_type="nf4",
16
  bnb_4bit_compute_dtype=torch.bfloat16
17
  )
18
+ cached_model = AutoModelForCausalLM.from_pretrained(MODEL_NAME, quantization_config=bnb_config) #
19
  cached_tokenizer = AutoTokenizer.from_pretrained(MODEL_NAME)
20
  return cached_model, cached_tokenizer