localsavageai committed
Commit b0c410e · verified · 1 Parent(s): 900c5e5

Upload 2 files

Files changed (2)
  1. app.py +209 -0
  2. requirements.txt +11 -0
app.py ADDED
@@ -0,0 +1,209 @@
+ import os
+ import logging
+ import numpy as np
+ from typing import List, Optional, Tuple
+ import torch
+ import gradio as gr
+ import spaces
+ from sentence_transformers import SentenceTransformer
+ from langchain_community.vectorstores import FAISS
+ from langchain.embeddings.base import Embeddings
+ from gradio_client import Client
+ import requests
+ from tqdm import tqdm
+
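+ # Note: numpy and requests are not used directly in this module but are kept,
+ # since requirements.txt lists them explicitly.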
+ # Configuration
+ DATA_FILE = "data-mtc.txt"
+ DATABASE_DIR = "semantic_memory"
+ QWEN_API_URL = "Qwen/Qwen2.5-Max-Demo"  # Gradio API for Qwen2.5 chat
+ CHUNK_SIZE = 800
+ TOP_K_RESULTS = 150
+ SIMILARITY_THRESHOLD = 0.4
+
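+ # Note: with the default index built by FAISS.from_texts, the scores returned
+ # by similarity_search_with_score are L2 distances, so lower means more
+ # similar; SIMILARITY_THRESHOLD is therefore an upper bound on distance,
+ # not a cosine-similarity floor.
+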
+ BASE_SYSTEM_PROMPT = """
+ Répondez en français selon ces règles :
+
+ 1. Utilisez EXCLUSIVEMENT le contexte fourni
+ 2. Structurez la réponse en :
+    - Définition principale
+    - Caractéristiques clés (3 points maximum)
+    - Relations avec d'autres concepts
+ 3. Si aucune information pertinente, indiquez-le clairement
+
+ Contexte :
+ {context}
+ """
+
+ # Configure logging
+ logging.basicConfig(
+     level=logging.INFO,
+     format='%(asctime)s - %(levelname)s - %(message)s',
+     handlers=[
+         logging.FileHandler("mtc_chat.log"),
+         logging.StreamHandler()
+     ]
+ )
+
+ class LocalEmbeddings(Embeddings):
+     """Local sentence-transformers embeddings"""
+     def __init__(self, model):
+         self.model = model
+
+     def embed_documents(self, texts: List[str]) -> List[List[float]]:
+         embeddings = []
+         for text in tqdm(texts, desc="Creating embeddings"):
+             embeddings.append(self.model.encode(text).tolist())
+         return embeddings
+
+     def embed_query(self, text: str) -> List[float]:
+         return self.model.encode(text).tolist()
+
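+ # Note: SentenceTransformer.encode also accepts a list of texts and batches
+ # them internally, which is usually faster; the per-text loop above trades
+ # speed for a tqdm progress bar.
+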
+ def split_text_into_chunks(text: str) -> List[str]:
+     """Split text into consecutive chunks, breaking at sentence boundaries where possible"""
+     chunks = []
+     start = 0
+     text_length = len(text)
+
+     while start < text_length:
+         end = min(start + CHUNK_SIZE, text_length)
+         chunk = text[start:end]
+
+         # Find the last complete punctuation mark in this window
+         last_punct = max(
+             chunk.rfind('.'),
+             chunk.rfind('!'),
+             chunk.rfind('?'),
+             chunk.rfind('\n\n')
+         )
+
+         # Only cut at punctuation if that keeps the chunk at least half-size;
+         # otherwise a period near the window start would produce tiny fragments
+         if last_punct > CHUNK_SIZE // 2:
+             end = start + last_punct + 1
+
+         stripped = text[start:end].strip()
+         if stripped:
+             chunks.append(stripped)
+         start = end if end > start else start + CHUNK_SIZE
+
+     return chunks
+
+ def initialize_vector_store(embeddings: Embeddings) -> FAISS:
+     """Initialize FAISS vector store"""
+     if os.path.exists(DATABASE_DIR):
+         try:
+             logging.info("Loading existing database...")
+             return FAISS.load_local(
+                 DATABASE_DIR,
+                 embeddings,
+                 allow_dangerous_deserialization=True
+             )
+         except Exception as e:
+             logging.error(f"FAISS load error: {str(e)}")
+             raise
+
+     logging.info("Creating new vector database...")
+     if not os.path.exists(DATA_FILE):
+         raise FileNotFoundError(f"{DATA_FILE} not found")
+
+     try:
+         with open(DATA_FILE, "r", encoding="utf-8") as f:
+             text = f.read()
+
+         chunks = split_text_into_chunks(text)
+         if not chunks:
+             raise ValueError("No valid chunks generated")
+
+         logging.info(f"Creating {len(chunks)} chunks...")
+         vector_store = FAISS.from_texts(chunks, embeddings)
+         vector_store.save_local(DATABASE_DIR)
+         logging.info("Vector store initialized successfully")
+         return vector_store
+
+     except Exception as e:
+         logging.error(f"Initialization failed: {str(e)}")
+         raise
+
+ def generate_response(user_input: str, vector_store: FAISS) -> Optional[str]:
+     """Generate response using Qwen API"""
+     try:
+         # Contextual search
+         docs_scores = vector_store.similarity_search_with_score(
+             user_input,
+             k=TOP_K_RESULTS * 3
+         )
+
+         # Filter results
+         filtered_docs = [
+             (doc, score) for doc, score in docs_scores
+             if score < SIMILARITY_THRESHOLD
+         ]
+         filtered_docs.sort(key=lambda x: x[1])
+
+         if not filtered_docs:
+             return "Aucune correspondance trouvée. Essayez des termes plus spécifiques."
+
+         best_docs = [doc for doc, _ in filtered_docs[:TOP_K_RESULTS]]
+
+         # Build context
+         context = "\n".join(
+             f"=== Source {i+1} ===\n{doc.page_content}\n"
+             for i, doc in enumerate(best_docs)
+         )
+
+         # Call Qwen API
+         client = Client(QWEN_API_URL, verbose=False)
+         response = client.predict(
+             query=user_input,
+             history=[],
+             system=BASE_SYSTEM_PROMPT.format(context=context),
+             api_name="/model_chat"
+         )
+
+         # Extract response
+         if isinstance(response, tuple) and len(response) >= 2:
+             chat_history = response[1]
+             if chat_history and len(chat_history[-1]) >= 2:
+                 return chat_history[-1][1]
+
+         return "Réponse indisponible - Veuillez reformuler votre question."
+
+     except Exception as e:
+         logging.error(f"Generation error: {str(e)}", exc_info=True)
+         return None
+
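+ # Note: the extraction above assumes the remote /model_chat endpoint returns
+ # a tuple whose second element is the chat history as (user, assistant) pairs;
+ # if the Space changes its API shape, the French fallback message is returned
+ # instead of raising.
+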
+ # Initialize models and vector store
+ device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
+ model = SentenceTransformer("cnmoro/snowflake-arctic-embed-m-v2.0-cpu", device=device, trust_remote_code=True)
+ embeddings = LocalEmbeddings(model)
+ vector_store = initialize_vector_store(embeddings)
+
+ # Gradio interface
+ @spaces.GPU
+ def embed(document: str):
+     return model.encode(document).tolist()
+
+ def chat_response(message: str, history: List[Tuple[str, str]]):
+     response = generate_response(message, vector_store)
+     response = response or "Erreur de génération - Veuillez réessayer."
+     # Clear the textbox and append the new exchange, matching the
+     # [msg, chatbot] outputs wired to msg.submit below
+     return "", history + [(message, response)]
+
+ with gr.Blocks() as app:
+     gr.Markdown("# MTC Knowledge Assistant")
+
+     with gr.Tab("Embeddings"):
+         gr.Markdown("## Text Embedding Demo")
+         text_input = gr.Textbox(label="Enter text to embed")
+         output = gr.JSON(label="Embedding Vector")
+         text_input.submit(embed, inputs=text_input, outputs=output)
+
+     with gr.Tab("MTC Chat"):
+         gr.Markdown("## Posez vos questions sur la médecine traditionnelle chinoise")
+         chatbot = gr.Chatbot(height=500)
+         msg = gr.Textbox(label="Votre question")
+         clear = gr.ClearButton([msg, chatbot])
+
+         msg.submit(
+             chat_response,
+             inputs=[msg, chatbot],
+             outputs=[msg, chatbot],
+             queue=True
+         )
+
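+ # For reference, a deployed Space can be queried with gradio_client, e.g.
+ # (hypothetical Space id; Gradio names the endpoint after the function):
+ #   from gradio_client import Client
+ #   c = Client("localsavageai/SPACE_NAME")
+ #   vec = c.predict("texte à encoder", api_name="/embed")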
+ if __name__ == "__main__":
+     app.launch(server_name="0.0.0.0", server_port=7860)
requirements.txt ADDED
@@ -0,0 +1,11 @@
+ gradio>=5.23.2
+ sentence-transformers
+ torch
+ langchain
+ langchain-community
+ faiss-cpu
+ gradio-client
+ tqdm
+ requests
+ numpy
+ einops==0.7.0