llama-cpp-agent

Paused

pabloce committed on May 25, 2024

Commit

6e7a7b9

verified ·

1 Parent(s): ddf5fad

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -1,12 +1,14 @@
 import spaces
 import json
 import subprocess
 import gradio as gr
 from huggingface_hub import hf_hub_download
-subprocess.run('pip install llama-cpp-python==0.2.75 --extra-index-url https://abetlen.github.io/llama-cpp-python/whl/cu124', shell=True)
-subprocess.run('pip install llama-cpp-agent==0.2.10', shell=True)
 hf_hub_download(
     repo_id="bartowski/Meta-Llama-3-70B-Instruct-GGUF",
     filename="Meta-Llama-3-70B-Instruct-Q3_K_M.gguf",
@@ -62,12 +64,6 @@ def respond(
     repeat_penalty,
     model,
 ):
-    from llama_cpp import Llama
-    from llama_cpp_agent import LlamaCppAgent
-    from llama_cpp_agent.providers import LlamaCppPythonProvider
-    from llama_cpp_agent.chat_history import BasicChatHistory
-    from llama_cpp_agent.chat_history.messages import Roles
     chat_template = get_messages_formatter_type(model)
     llm = Llama(

 import spaces
 import json
 import subprocess
+from llama_cpp import Llama
+from llama_cpp_agent import LlamaCppAgent
+from llama_cpp_agent.providers import LlamaCppPythonProvider
+from llama_cpp_agent.chat_history import BasicChatHistory
+from llama_cpp_agent.chat_history.messages import Roles
 import gradio as gr
 from huggingface_hub import hf_hub_download
 hf_hub_download(
     repo_id="bartowski/Meta-Llama-3-70B-Instruct-GGUF",
     filename="Meta-Llama-3-70B-Instruct-Q3_K_M.gguf",
     repeat_penalty,
     model,
 ):
     chat_template = get_messages_formatter_type(model)
     llm = Llama(