Commit
·
90f5d7c
1
Parent(s):
5d8cca4
Download model to /tmp to avoid permission error
Browse files
app.py
CHANGED
@@ -1,21 +1,26 @@
|
|
1 |
-
import os, gradio as gr
|
2 |
from llama_cpp import Llama
|
3 |
|
4 |
MODEL_URL = (
|
5 |
"https://huggingface.co/fdtn-ai/Foundation-Sec-8B-Q4_K_M-GGUF/"
|
6 |
"resolve/main/foundation-sec-8b-q4_k_m.gguf"
|
7 |
)
|
8 |
-
MODEL_PATH = "foundation-sec-8b-q4_k_m.gguf"
|
9 |
|
10 |
-
#
|
|
|
|
|
|
|
|
|
11 |
if not os.path.exists(MODEL_PATH):
|
12 |
-
|
13 |
with requests.get(MODEL_URL, stream=True) as r:
|
14 |
r.raise_for_status()
|
15 |
with open(MODEL_PATH, "wb") as f:
|
16 |
for chunk in r.iter_content(chunk_size=8192):
|
17 |
f.write(chunk)
|
|
|
18 |
|
|
|
19 |
llm = Llama(model_path=MODEL_PATH, n_ctx=4096, verbose=False)
|
20 |
|
21 |
def chat_fn(message, history):
|
|
|
1 |
+
"""Bootstrap for app.py: fetch the GGUF model into a writable cache
directory (once) and load it with llama-cpp.

Runs at import time; module-level side effects: may create
<tmpdir>/foundation-sec-8b-q4_k_m.gguf and binds the global `llm`.
"""
import os, gradio as gr, requests, tempfile
from llama_cpp import Llama

MODEL_URL = (
    "https://huggingface.co/fdtn-ai/Foundation-Sec-8B-Q4_K_M-GGUF/"
    "resolve/main/foundation-sec-8b-q4_k_m.gguf"
)

# Writable directory.  tempfile.gettempdir() returns "/tmp" on the target
# platform but also honors TMPDIR, and puts the previously-unused
# `tempfile` import to work instead of hard-coding the path.
CACHE_DIR = tempfile.gettempdir()
MODEL_PATH = os.path.join(CACHE_DIR, "foundation-sec-8b-q4_k_m.gguf")

# Download only once.  Stream into a ".part" file and rename when complete:
# an interrupted download therefore never leaves a partial file at
# MODEL_PATH that the os.path.exists() check would mistake for a full model.
if not os.path.exists(MODEL_PATH):
    print("Downloading model … (~4.9 GB)")
    part_path = MODEL_PATH + ".part"
    # timeout guards against a hung connection; stream=True avoids
    # buffering ~5 GB in memory.
    with requests.get(MODEL_URL, stream=True, timeout=60) as r:
        r.raise_for_status()
        with open(part_path, "wb") as f:
            for chunk in r.iter_content(chunk_size=8192):
                f.write(chunk)
    os.replace(part_path, MODEL_PATH)  # atomic rename on POSIX
    print("Download finished.")

# Load model (CPU, 4096-token context, quiet llama.cpp logging).
llm = Llama(model_path=MODEL_PATH, n_ctx=4096, verbose=False)
|
25 |
|
26 |
def chat_fn(message, history):
|