Moreza009 committed on
Commit
019c20a
·
1 Parent(s): ccfca8d
Files changed (1) hide show
  1. app.py +4 -3
app.py CHANGED
@@ -7,10 +7,11 @@ For more information on `huggingface_hub` Inference API support, please check th
7
  # Load model directly
8
  from transformers import AutoTokenizer, AutoModelForCausalLM
9
 
10
- tokenizer = AutoTokenizer.from_pretrained("Moreza009/aya23-8b-double-quantized")
11
- model = AutoModelForCausalLM.from_pretrained("Moreza009/aya23-8b-double-quantized",device_map="auto")
12
-
13
 
 
 
14
  def respond(
15
  message,
16
  max_new_tokens=4000,
 
7
  # Load model directly
8
  from transformers import AutoTokenizer, AutoModelForCausalLM
9
 
10
+ model_id = "MaziyarPanahi/Mistral-7B-Instruct-Aya-101-GGUF"
11
+ filename = "Mistral-7B-Instruct-Aya-101.Q8_0.gguf"
 
12
 
13
+ tokenizer = AutoTokenizer.from_pretrained(model_id, gguf_file=filename)
14
+ model = AutoModelForCausalLM.from_pretrained(model_id, gguf_file=filename)
15
  def respond(
16
  message,
17
  max_new_tokens=4000,