pabloce committed on
Commit 8034baa · verified · 1 Parent(s): 22ca4ed

Update app.py

Files changed (1)
  1. app.py +16 -17
app.py CHANGED
@@ -30,11 +30,11 @@ hf_hub_download(
     filename="Mistral-7B-Instruct-v0.3-Q6_K.gguf",
     local_dir="./models"
 )
-hf_hub_download(
-    repo_id="bartowski/Meta-Llama-3-8B-Instruct-GGUF",
-    filename="Meta-Llama-3-8B-Instruct-Q6_K.gguf",
-    local_dir="./models"
-)
+# hf_hub_download(
+#     repo_id="bartowski/Meta-Llama-3-8B-Instruct-GGUF",
+#     filename="Meta-Llama-3-8B-Instruct-Q6_K.gguf",
+#     local_dir="./models"
+# )
 
 css = """
 .message-row {
@@ -54,6 +54,9 @@ css = """
 }
 """
 
+# <span style="display: inline-flex; align-items: center; border-radius: 0.375rem; background-color: rgba(79, 70, 229, 0.1); padding: 0.1rem 0.75rem; font-size: 0.75rem; font-weight: 500; color: #60a5fa; margin-top: 2.5px;">
+#     Meta Llama 3 8B Instruct
+# </span>
 PLACEHOLDER = """
 <div class="message-bubble-border" style="display:flex; max-width: 600px; border-width: 1px; border-radius: 8px; box-shadow: 0 4px 6px rgba(0, 0, 0, 0.1); backdrop-filter: blur(10px);">
     <figure style="margin: 0;">
@@ -67,9 +70,6 @@ PLACEHOLDER = """
             <span style="display: inline-flex; align-items: center; border-radius: 0.375rem; background-color: rgba(229, 70, 77, 0.1); padding: 0.1rem 0.75rem; font-size: 0.75rem; font-weight: 500; color: #f88181; margin-bottom: 2.5px;">
                 Mistral 7B Instruct v0.3
             </span>
-            <span style="display: inline-flex; align-items: center; border-radius: 0.375rem; background-color: rgba(79, 70, 229, 0.1); padding: 0.1rem 0.75rem; font-size: 0.75rem; font-weight: 500; color: #60a5fa; margin-top: 2.5px;">
-                Meta Llama 3 8B Instruct
-            </span>
         </div>
         <div style="display: flex; justify-content: flex-end; align-items: center;">
             <a href="https://discord.gg/sRMvWKrh" target="_blank" rel="noreferrer" style="padding: .5rem;">
@@ -122,7 +122,6 @@ def write_message_to_user():
 def respond(
     message,
     history: list[tuple[str, str]],
-    model,
     system_message,
     max_tokens,
     temperature,
@@ -132,7 +131,7 @@ def respond(
 ):
     chat_template = get_messages_formatter_type(model)
     llm = Llama(
-        model_path=f"models/{model}",
+        model_path=f"models/{model_selected}",
         flash_attn=True,
         n_threads=40,
         n_gpu_layers=81,
@@ -230,13 +229,13 @@ def respond(
 demo = gr.ChatInterface(
     respond,
     additional_inputs=[
-        gr.Dropdown([
-            'Mistral-7B-Instruct-v0.3-Q6_K.gguf',
-            'Meta-Llama-3-8B-Instruct-Q6_K.gguf'
-        ],
-        value="Mistral-7B-Instruct-v0.3-Q6_K.gguf",
-        label="Model"
-        ),
+        # gr.Dropdown([
+        #     'Mistral-7B-Instruct-v0.3-Q6_K.gguf',
+        #     'Meta-Llama-3-8B-Instruct-Q6_K.gguf'
+        # ],
+        # value="Mistral-7B-Instruct-v0.3-Q6_K.gguf",
+        # label="Model"
+        # ),
         gr.Textbox(value=web_search_system_prompt, label="System message"),
         gr.Slider(minimum=1, maximum=4096, value=2048, step=1, label="Max tokens"),
         gr.Slider(minimum=0.1, maximum=1.0, value=0.45, step=0.1, label="Temperature"),
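
Note on the resulting code: after this commit, respond() no longer takes a model argument and the model Dropdown is commented out, yet the function body still references model (in get_messages_formatter_type) and the new name model_selected (in model_path). Below is a minimal sketch, assuming the rest of app.py is unchanged, of one way to make both names resolve with a single hard-coded model. The module-level constant, the load_llm() wrapper, and the llama_cpp import are illustrative assumptions, not part of the diff.

from llama_cpp import Llama  # assumed import; the Space constructs Llama(...) inside respond()

# Hypothetical module-level pin: only the Mistral GGUF is still downloaded after this commit.
model_selected = "Mistral-7B-Instruct-v0.3-Q6_K.gguf"
model = model_selected  # keeps get_messages_formatter_type(model) working without the dropped argument

def load_llm():
    # Hypothetical wrapper mirroring the Llama(...) call inside respond(),
    # now pointing at the single hard-coded model file.
    return Llama(
        model_path=f"models/{model_selected}",
        flash_attn=True,
        n_threads=40,
        n_gpu_layers=81,
    )

Whether the commit intended the rename to model_selected or simply left it half-finished is not clear from this diff alone; the sketch only shows that one pinned filename is enough once the dropdown is gone.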