shawno committed on
Commit
789bc12
·
verified ·
1 Parent(s): be79686

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +1 -1
app.py CHANGED
@@ -15,7 +15,7 @@ try:
15
  print("Loading MiniCPM-V-2_6-gguf model...")
16
  llm = Llama.from_pretrained(
17
  repo_id="openbmb/MiniCPM-V-2_6-gguf",
18
- filename="ggml-model-Q3_K_M.gguf",
19
  n_ctx=4096,
20
  n_threads=os.cpu_count(),
21
  n_batch=512, # Increased batch size for prompt processing
 
15
  print("Loading MiniCPM-V-2_6-gguf model...")
16
  llm = Llama.from_pretrained(
17
  repo_id="openbmb/MiniCPM-V-2_6-gguf",
18
+ filename="ggml-model-Q4_K_M.gguf",
19
  n_ctx=4096,
20
  n_threads=os.cpu_count(),
21
  n_batch=512, # Increased batch size for prompt processing