Gary committed on
Commit
aed0189
·
1 Parent(s): cca58a9

Reduce tokens and change model

Browse files
Files changed (2) hide show
  1. app.py +2 -2
  2. indexer.py +1 -1
app.py CHANGED
@@ -34,7 +34,7 @@ def answer_question(query):
34
  docs = load_raw_dataset()
35
  rag = CustomRAG(
36
  create_vector_database(docs, "all-MiniLM-L6-v2"),
37
- get_llm("FreedomIntelligence/HuatuoGPT-o1-7B"),
38
  get_prompt_template(),
39
  )
40
  response, _ = rag.run(query)
@@ -52,7 +52,7 @@ demo = gr.Interface(
52
  ),
53
  ],
54
  outputs="text",
55
- title="Medical Assistant – Powered by AI & RAG",
56
  description=(
57
  "Get helpful insights based on your described symptoms. "
58
  "This assistant uses medical reference data to provide informative responses. "
 
34
  docs = load_raw_dataset()
35
  rag = CustomRAG(
36
  create_vector_database(docs, "all-MiniLM-L6-v2"),
37
+ get_llm("mistralai/Mistral-7B-Instruct-v0.1"),
38
  get_prompt_template(),
39
  )
40
  response, _ = rag.run(query)
 
52
  ),
53
  ],
54
  outputs="text",
55
+ title="Medical Assistant – RAG",
56
  description=(
57
  "Get helpful insights based on your described symptoms. "
58
  "This assistant uses medical reference data to provide informative responses. "
indexer.py CHANGED
@@ -42,7 +42,7 @@ def get_llm(model_name):
42
  "text-generation",
43
  model=model,
44
  tokenizer=tokenizer,
45
- max_new_tokens=512,
46
  temperature=0.7,
47
  do_sample=True,
48
  )
 
42
  "text-generation",
43
  model=model,
44
  tokenizer=tokenizer,
45
+ max_new_tokens=300,
46
  temperature=0.7,
47
  do_sample=True,
48
  )