Sheshank Joshi committed on
Commit 541377c · 1 Parent(s): 59e0000

latest changes

Files changed (4):
  1. agent.py +398 -4
  2. app.py +6 -3
  3. basic_tools.py +164 -0
  4. system_prompt.txt +17 -0
agent.py CHANGED
@@ -1,9 +1,403 @@
+from langchain_huggingface import ChatHuggingFace, HuggingFaceEndpoint, HuggingFaceEmbeddings
+from langchain.tools.retriever import create_retriever_tool
+from langchain_core.tools import BaseTool
+from langgraph.graph import START, StateGraph, MessagesState, END
+from langchain_core.messages import SystemMessage, HumanMessage, AIMessage
+from langchain_core.vectorstores import VectorStore
+from langchain_core.language_models import BaseChatModel
+from langgraph.prebuilt import tools_condition
+from langgraph.prebuilt import ToolNode
+from langchain_community.vectorstores import FAISS
+from langchain_core.documents import Document
+from langchain_groq import ChatGroq
+from basic_tools import *
+from typing import List
+from datetime import datetime, timedelta
+import heapq
+
+# Embeddings and the FAISS store that back the retriever.
+embeddings = HuggingFaceEmbeddings(
+    model_name="sentence-transformers/all-mpnet-base-v2")  # dim=768
+# FAISS.from_texts() cannot infer the embedding dimension from an empty list,
+# so seed the index with a single placeholder text.
+vector_store: FAISS = FAISS.from_texts(
+    texts=["placeholder"],
+    embedding=embeddings)
+
+
+# Load the system prompt from the file.
+with open("system_prompt.txt", "r", encoding="utf-8") as f:
+    system_prompt = f.read()
+
+
+# System message
+sys_msg = SystemMessage(content=system_prompt)
+
+
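+# If seeding with a placeholder is undesirable, an empty FAISS index can be
+# constructed directly instead (a sketch, assuming the faiss package that
+# langchain_community wraps):
+#   import faiss
+#   from langchain_community.docstore.in_memory import InMemoryDocstore
+#   index = faiss.IndexFlatL2(768)  # all-mpnet-base-v2 embedding dimension
+#   vector_store = FAISS(embedding_function=embeddings, index=index,
+#                        docstore=InMemoryDocstore(), index_to_docstore_id={})
+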
 class BasicAgent:
+    tools: List[BaseTool] = [multiply,
+                             add,
+                             subtract,
+                             divide,
+                             modulus,
+                             wiki_search,
+                             web_search,
+                             arxiv_search,
+                             requests_get,
+                             requests_post]
+
-    def __init__(self):
+    def __init__(self, embeddings: HuggingFaceEmbeddings, vector_store: VectorStore, llm: BaseChatModel):
+        self.embedding_model = embeddings
+        self.vector_store = vector_store
+        ret = self.vector_store.as_retriever()
+        # Most providers require tool names to match ^[a-zA-Z0-9_-]+$, so avoid spaces.
+        self.retriever = create_retriever_tool(
+            retriever=ret,
+            name="question_search",
+            description="A tool to retrieve similar questions from a vector store."
+        )
+        self.llm = llm.bind_tools(self.tools)
+        self.graph = self.build_graph()
         print("BasicAgent initialized.")

     def __call__(self, question: str) -> str:
         print(f"Agent received question (first 50 chars): {question[:50]}...")
-        fixed_answer = "This is a default answer."
-        print(f"Agent returning fixed answer: {fixed_answer}")
-        return fixed_answer
+
+        # Search for similar content to enhance context
+        similar_docs = self.vector_store.similarity_search(question, k=3)
+
+        # Create enhanced context with relevant past information
+        enhanced_context = question
+        if similar_docs:
+            context_additions = []
+            for doc in similar_docs:
+                # Extract relevant information from similar documents
+                content = doc.page_content
+                if "Question:" in content and "Final answer:" in content:
+                    q = content.split("Question:")[1].split("Final answer:")[0].strip()
+                    a = content.split("Final answer:")[1].split("Timestamp:", 1)[0].strip()
+                    # Only reuse it if it is not exactly the same question
+                    if question.lower() != q.lower():
+                        context_additions.append(f"Related Q: {q}\nRelated A: {a}")
+
+            if context_additions:
+                enhanced_context = (
+                    "I'll answer your question, but first consider this relevant information:\n\n" +
+                    "\n\n".join(context_additions) +
+                    "\n\nNow answering your original question: " + question
+                )
+
+        # Process with the graph
+        input_messages = [HumanMessage(content=enhanced_context)]
+        result = self.graph.invoke({"messages": input_messages})
+        answer = result["messages"][-1].content
+
+        # Store this Q&A pair for future reference
+        self._cache_result(question, answer)
+
+        print(f"Agent returning answer (first 50 chars): {answer[:50]}...")
+        return answer
+
+    def _cache_result(self, question: str, answer: str) -> None:
+        """Cache the question and answer in the vector store."""
+        timestamp = datetime.now().isoformat()
+        content = f"Question: {question}\nFinal answer: {answer}\nTimestamp: {timestamp}"
+
+        # Create document with metadata
+        doc = Document(
+            page_content=content,
+            metadata={
+                "question": question,
+                "timestamp": timestamp,
+                "type": "qa_pair"
+            }
+        )
+
+        # Add to vector store
+        self.vector_store.add_documents([doc])
+        print("Cached new Q&A in vector store")
+
+    def build_graph(self):
+        """Build the graph with context enhancement."""
+
+        def context_enhanced_generation(state: MessagesState):
+            """Node that enhances the prompt with relevant retrieved context."""
+            query = str(state["messages"][-1].content)
+
+            # Retrieve relevant information
+            similar_docs = self.vector_store.similarity_search(query, k=3)
+
+            # Extract relevant context
+            context = ""
+            if similar_docs:
+                context_pieces = []
+                for doc in similar_docs:
+                    content = doc.page_content
+                    # Extract the relevant parts
+                    if "Question:" in content:
+                        context_pieces.append(content)
+
+                if context_pieces:
+                    context = "Relevant context:\n\n" + "\n\n".join(context_pieces) + "\n\n"
+
+            # Create enhanced messages
+            enhanced_messages = state["messages"].copy()
+            if context:
+                # Append context to the system message if one exists, otherwise insert one
+                system_message_found = False
+                for i, msg in enumerate(enhanced_messages):
+                    if isinstance(msg, SystemMessage):
+                        enhanced_messages[i] = SystemMessage(content=f"{msg.content}\n\n{context}")
+                        system_message_found = True
+                        break
+
+                if not system_message_found:
+                    enhanced_messages.insert(0, SystemMessage(content=context))
+
+            # Process with LLM
+            response = self.llm.invoke(enhanced_messages)
+
+            return {"messages": state["messages"] + [response]}
+
+        # Tool handling node
+        tool_node = ToolNode(self.tools)
+
+        # Build graph with tool handling
+        builder = StateGraph(MessagesState)
+        builder.add_node("context_enhanced_generation", context_enhanced_generation)
+        builder.add_node("tools", tool_node)
+
+        # Connect nodes. tools_condition returns "tools" when the last message
+        # carries tool calls and END otherwise, so the path map must key on
+        # those two values (a None key would never match).
+        builder.set_entry_point("context_enhanced_generation")
+        builder.add_conditional_edges(
+            "context_enhanced_generation",
+            tools_condition,
+            {
+                "tools": "tools",
+                END: END
+            }
+        )
+        builder.add_edge("tools", "context_enhanced_generation")
+
+        return builder.compile()
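+    # Note: the compiled graph alternates context_enhanced_generation and
+    # tools until the LLM replies without tool calls, then routes to END.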
+
+    @staticmethod
+    def get_llm(provider: str = "groq") -> BaseChatModel:
+        # Assumes the relevant API keys are already present in the environment
+        # (e.g. GROQ_API_KEY or OPENAI_API_KEY).
+        if provider == "groq":
+            # Groq models: https://console.groq.com/docs/models
+            # alternatives: qwen-qwq-32b, gemma2-9b-it
+            llm = ChatGroq(model="qwen-qwq-32b", temperature=0)
+        elif provider == "huggingface":
+            # TODO: point this at a valid Hugging Face endpoint
+            llm = ChatHuggingFace(
+                llm=HuggingFaceEndpoint(
+                    model="Meta-DeepLearning/llama-2-7b-chat-hf",
+                    temperature=0,
+                ),
+            )
+        elif provider == "openai_local":
+            from langchain_openai import ChatOpenAI
+            llm = ChatOpenAI(
+                base_url="http://localhost:11432/v1",  # local LM Studio-style endpoint
+                api_key="not-used",  # required by the interface but ignored locally
+                model="mistral-nemo-instruct-2407",
+                temperature=0.2
+            )
+        elif provider == "openai":
+            from langchain_openai import ChatOpenAI
+            llm = ChatOpenAI(
+                model="gpt-4o",
+                temperature=0.2,
+            )
+        else:
+            raise ValueError(
+                "Invalid provider. Choose 'groq', 'huggingface', 'openai_local' or 'openai'.")
+        return llm
+
+    def manage_memory(self, max_documents: int = 1000, max_age_days: int = 30) -> None:
+        """
+        Manage memory by pruning old or less useful entries from the vector store.
+
+        This implementation works with various vector store types, not just FAISS.
+
+        Args:
+            max_documents: Maximum number of documents to keep
+            max_age_days: Remove documents older than this many days
+        """
+        print("Starting memory management...")
+
+        # Get all documents from the vector store
+        try:
+            # For vector stores that expose a get_all_documents method
+            if hasattr(self.vector_store, "get_all_documents"):
+                all_docs = self.vector_store.get_all_documents()
+                all_ids = [doc.metadata.get("id", i) for i, doc in enumerate(all_docs)]
+            # For FAISS and similar implementations
+            elif hasattr(self.vector_store, "docstore") and hasattr(self.vector_store, "index_to_docstore_id"):
+                # Access the docstore in a more robust way
+                if hasattr(self.vector_store.docstore, "docstore"):
+                    all_ids = list(self.vector_store.index_to_docstore_id.values())
+                    all_docs = []
+                    for doc_id in all_ids:
+                        doc = self.vector_store.docstore.search(doc_id)
+                        if doc:
+                            all_docs.append(doc)
+                else:
+                    # Fallback for newer FAISS implementations
+                    try:
+                        all_docs = []
+                        all_ids = []
+                        # Walk every index position
+                        for i in range(self.vector_store.index.ntotal):
+                            # Map index position to document ID
+                            if i in self.vector_store.index_to_docstore_id:
+                                doc_id = self.vector_store.index_to_docstore_id[i]
+                                doc = self.vector_store.docstore.search(doc_id)
+                                if doc:
+                                    all_docs.append(doc)
+                                    all_ids.append(doc_id)
+                    except Exception as e:
+                        print(f"Error accessing FAISS documents: {e}")
+                        all_docs = []
+                        all_ids = []
+            else:
+                print("Warning: Vector store doesn't expose required attributes for memory management")
+                return
+        except Exception as e:
+            print(f"Error accessing vector store documents: {e}")
+            return
+
+        if not all_docs:
+            print("No documents found in vector store")
+            return
+
+        print(f"Retrieved {len(all_docs)} documents for scoring")
+
+        # Score each document based on recency and other factors
+        scored_docs = []
+        cutoff_date = datetime.now() - timedelta(days=max_age_days)
+
+        for i, doc in enumerate(all_docs):
+            doc_id = all_ids[i] if i < len(all_ids) else i
+
+            # Extract timestamp from content or metadata
+            timestamp = None
+            if hasattr(doc, "metadata") and doc.metadata and "timestamp" in doc.metadata:
+                try:
+                    timestamp = datetime.fromisoformat(doc.metadata["timestamp"])
+                except (ValueError, TypeError):
+                    pass
+
+            # If no timestamp in metadata, try to extract it from the content
+            if not timestamp and hasattr(doc, "page_content") and "Timestamp:" in doc.page_content:
+                try:
+                    timestamp_str = doc.page_content.split("Timestamp:")[-1].strip().split('\n')[0]
+                    timestamp = datetime.fromisoformat(timestamp_str)
+                except (ValueError, TypeError):
+                    timestamp = datetime.now() - timedelta(days=max_age_days + 1)
+
+            # If still no timestamp, treat the document as expired
+            if not timestamp:
+                timestamp = datetime.now() - timedelta(days=max_age_days + 1)
+
+            # Calculate age score in [0, 1] (newer is better)
+            age_factor = max(0.0, min(1.0, (timestamp - cutoff_date).total_seconds() /
+                                      (datetime.now() - cutoff_date).total_seconds()))
+
+            # Calculate importance score - could be based on various factors
+            importance_factor = 1.0
+            # If the document has been accessed often, increase importance
+            if hasattr(doc, "metadata") and doc.metadata and "access_count" in doc.metadata:
+                importance_factor += min(1.0, doc.metadata["access_count"] / 10)
+
+            # Combined score (higher = more valuable to keep)
+            total_score = (0.7 * age_factor) + (0.3 * importance_factor)
+
+            # Push onto the priority queue (negated score for max-heap behavior)
+            heapq.heappush(scored_docs, (-total_score, i, doc))
+
+        # Select the top-scoring documents to keep
+        docs_to_keep = []
+        for _ in range(min(max_documents, len(scored_docs))):
+            if scored_docs:
+                _, _, doc = heapq.heappop(scored_docs)
+                docs_to_keep.append(doc)
+
+        # Only rebuild if we're actually pruning some documents
+        if len(docs_to_keep) < len(all_docs):
+            print(f"Memory management: Keeping {len(docs_to_keep)} documents out of {len(all_docs)}")
+
+            # Create a new vector store of the same type as the current one
+            vector_store_type = type(self.vector_store)
+
+            # Different approaches based on vector store type
+            if hasattr(vector_store_type, "from_documents"):
+                # Most langchain vector stores support this method
+                new_vector_store = vector_store_type.from_documents(
+                    docs_to_keep,
+                    embedding=self.embedding_model
+                )
+                self.vector_store = new_vector_store
+                print(f"Vector store rebuilt with {len(docs_to_keep)} documents")
+
+            elif hasattr(vector_store_type, "from_texts"):
+                # For vector stores that use from_texts
+                texts = [doc.page_content for doc in docs_to_keep]
+                metadatas = [doc.metadata if hasattr(doc, "metadata") else {} for doc in docs_to_keep]
+
+                new_vector_store = vector_store_type.from_texts(
+                    texts=texts,
+                    embedding=self.embedding_model,
+                    metadatas=metadatas
+                )
+                self.vector_store = new_vector_store
+                print(f"Vector store rebuilt with {len(docs_to_keep)} documents")
+
+            else:
+                print("Warning: Could not determine how to rebuild the vector store")
+                print(f"Vector store type: {vector_store_type.__name__}")
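+
+    # Note: rebuilding via from_documents/from_texts re-embeds every kept
+    # document, so each pruning pass costs O(n) embedding calls.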
+
+    def capture_tool_result(self, tool_name: str, tool_input: str, tool_output: str) -> None:
+        """
+        Capture knowledge gained from tool usage for future reference.
+
+        Args:
+            tool_name: Name of the tool used
+            tool_input: Input/query sent to the tool
+            tool_output: Result returned by the tool
+        """
+        # Format the content
+        timestamp = datetime.now().isoformat()
+        content = (
+            f"Tool Knowledge\n"
+            f"Tool: {tool_name}\n"
+            f"Query: {tool_input}\n"
+            f"Result: {tool_output}\n"
+            f"Timestamp: {timestamp}"
+        )
+
+        # Create document with metadata
+        doc = Document(
+            page_content=content,
+            metadata={
+                "type": "tool_knowledge",
+                "tool": tool_name,
+                "timestamp": timestamp,
+                "query": tool_input
+            }
+        )
+
+        # Add to vector store
+        self.vector_store.add_documents([doc])
+        print(f"Captured knowledge from tool '{tool_name}' in vector store")
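
A minimal usage sketch (not part of the commit; assumes GROQ_API_KEY is set and reuses the module-level embeddings and vector_store):

    from agent import BasicAgent, embeddings, vector_store

    llm = BasicAgent.get_llm("groq")
    agent = BasicAgent(embeddings, vector_store, llm)
    # Per the system prompt, the reply should end with "FINAL ANSWER: 144".
    print(agent("What is 12 * 12?"))
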
app.py CHANGED
@@ -3,7 +3,7 @@ import gradio as gr
 import requests
 import inspect
 import pandas as pd
-from agent import BasicAgent
+from agent import BasicAgent, embeddings, vector_store
 from dotenv import load_dotenv
 import os

@@ -17,7 +17,7 @@ DEFAULT_API_URL = "https://agents-course-unit4-scoring.hf.space"
 # ----- THIS IS WHERE YOU CAN BUILD WHAT YOU WANT ------


-def run_and_submit_all( profile: gr.OAuthProfile | None):
+def run_and_submit_all(profile: gr.OAuthProfile | None):
     """
     Fetches all questions, runs the BasicAgent on them, submits all answers,
     and displays the results.
@@ -38,7 +38,10 @@ def run_and_submit_all(profile: gr.OAuthProfile | None):

     # 1. Instantiate Agent ( modify this part to create your agent)
     try:
-        agent = BasicAgent()
+        # llm = BasicAgent.get_llm("groq")
+        llm = BasicAgent.get_llm("openai_local")
+        agent = BasicAgent(embeddings, vector_store, llm)
+        print("Agent instantiated successfully.")
     except Exception as e:
         print(f"Error instantiating agent: {e}")
         return f"Error initializing agent: {e}", None
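
A possible refinement (not in this commit) is selecting the provider from an environment variable instead of hard-coding it; a sketch, with LLM_PROVIDER as a hypothetical variable name:

    import os

    provider = os.getenv("LLM_PROVIDER", "openai_local")  # hypothetical env var
    llm = BasicAgent.get_llm(provider)
    agent = BasicAgent(embeddings, vector_store, llm)
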
basic_tools.py ADDED
@@ -0,0 +1,164 @@
+import os
+from dotenv import load_dotenv
+from langgraph.graph import START, StateGraph, MessagesState
+from langgraph.prebuilt import tools_condition
+from langgraph.prebuilt import ToolNode
+# from langchain_google_genai import ChatGoogleGenerativeAI
+# from langchain_groq import ChatGroq
+from langchain_huggingface import ChatHuggingFace, HuggingFaceEndpoint, HuggingFaceEmbeddings
+from langchain_community.tools.tavily_search import TavilySearchResults
+from langchain_community.document_loaders import WikipediaLoader
+from langchain_community.document_loaders import ArxivLoader
+from langchain_community.vectorstores import SupabaseVectorStore
+from langchain_core.messages import SystemMessage, HumanMessage
+from langchain_core.tools import tool
+from langchain.tools.retriever import create_retriever_tool
+from langchain_community.utilities.requests import TextRequestsWrapper
+
+# from supabase.client import Client, create_client
+# from langchain.tools.requests.toolkit import RequestsToolkit  # alternative: the full RequestsToolkit
+from langchain_community.tools import RequestsPostTool, RequestsGetTool
+
+load_dotenv()
+requests_wrapper = TextRequestsWrapper()
+
+
+@tool
+def multiply(a: int, b: int) -> int:
+    """Multiply two numbers.
+
+    Args:
+        a: first int
+        b: second int
+    """
+    return a * b
+
+
+@tool
+def add(a: int, b: int) -> int:
+    """Add two numbers.
+
+    Args:
+        a: first int
+        b: second int
+    """
+    return a + b
+
+
+@tool
+def subtract(a: int, b: int) -> int:
+    """Subtract two numbers.
+
+    Args:
+        a: first int
+        b: second int
+    """
+    return a - b
+
+
+@tool
+def divide(a: int, b: int) -> float:
+    """Divide two numbers.
+
+    Args:
+        a: first int
+        b: second int
+    """
+    if b == 0:
+        raise ValueError("Cannot divide by zero.")
+    return a / b
+
+
+@tool
+def modulus(a: int, b: int) -> int:
+    """Get the modulus of two numbers.
+
+    Args:
+        a: first int
+        b: second int
+    """
+    return a % b
+
+
+@tool
+def wiki_search(query: str) -> str:
+    """Search Wikipedia for a query and return a maximum of 2 results.
+
+    Args:
+        query: The search query."""
+    search_docs = WikipediaLoader(query=query, load_max_docs=2).load()
+    formatted_search_docs = "\n\n---\n\n".join(
+        [
+            f'<Document source="{doc.metadata["source"]}" page="{doc.metadata.get("page", "")}">\n{doc.page_content}\n</Document>'
+            for doc in search_docs
+        ])
+    return formatted_search_docs
+
+
+@tool
+def web_search(query: str) -> str:
+    """Search Tavily for a query and return a maximum of 3 results.
+
+    Args:
+        query: The search query."""
+    # TavilySearchResults returns a list of dicts with "url" and "content"
+    # keys, not Document objects, so index into them directly.
+    search_results = TavilySearchResults(max_results=3).invoke(input=query)
+    formatted_search_docs = "\n\n---\n\n".join(
+        [
+            f'<Document source="{res["url"]}">\n{res["content"]}\n</Document>'
+            for res in search_results
+        ])
+    return formatted_search_docs
+
+
+@tool
+def arxiv_search(query: str) -> str:
+    """Search Arxiv for a query and return a maximum of 3 results.
+
+    Args:
+        query: The search query."""
+    search_docs = ArxivLoader(query=query, load_max_docs=3).load()
+    # ArxivLoader metadata keys vary by version (e.g. "Title", "Published"),
+    # so read "source" defensively.
+    formatted_search_docs = "\n\n---\n\n".join(
+        [
+            f'<Document source="{doc.metadata.get("source", doc.metadata.get("Title", ""))}" page="{doc.metadata.get("page", "")}">\n{doc.page_content[:1000]}\n</Document>'
+            for doc in search_docs
+        ])
+    return formatted_search_docs
+
+
+# A hand-rolled GET wrapper, kept for reference; superseded by the prebuilt
+# tool below.
+# @tool
+# def requests_get(url: str, params: dict = {}) -> str:
+#     """Perform an HTTP GET request using LangChain's requests tooling.
+#
+#     Args:
+#         url: The URL to send the GET request to.
+#         params: Optional dictionary of query parameters.
+#
+#     Returns:
+#         The response content as text.
+#     """
+#     toolkit = RequestsGetTool(requests_wrapper=requests_wrapper)
+#     response = toolkit.run(url, params=params)
+#     return response.text
+
+# Prebuilt request tools; recent langchain_community versions require an
+# explicit opt-in because these tools can reach arbitrary URLs.
+requests_get = RequestsGetTool(requests_wrapper=requests_wrapper,
+                               allow_dangerous_requests=True)
+requests_post = RequestsPostTool(requests_wrapper=requests_wrapper,
+                                 allow_dangerous_requests=True)
+
+# A hand-rolled POST wrapper, kept for reference; superseded by the prebuilt
+# tool above.
+# @tool
+# def requests_post(url: str, data: dict = {}, json: dict = {}, headers: dict = {}) -> str:
+#     """Perform an HTTP POST request using LangChain's requests tooling.
+#
+#     Args:
+#         url: The URL to send the POST request to.
+#         data: Optional dictionary of form data.
+#         json: Optional dictionary to send as JSON.
+#         headers: Optional dictionary of HTTP headers.
+#
+#     Returns:
+#         The response content as text.
+#     """
+#     toolkit = RequestsPostTool(requests_wrapper=requests_wrapper)
+#     response = toolkit.run(url, data=data, json=json, headers=headers)
+#     return response.text
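
A quick invocation sketch (not part of the commit; LangChain @tool objects are called via .invoke with a dict of arguments, and Tavily needs TAVILY_API_KEY in the environment):

    from basic_tools import multiply, wiki_search

    print(multiply.invoke({"a": 6, "b": 7}))  # 42
    print(wiki_search.invoke({"query": "Alan Turing"})[:200])
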
system_prompt.txt ADDED
@@ -0,0 +1,17 @@
+You are a helpful assistant tasked with answering questions using a set of tools.
+
+Your final answer must strictly follow this format:
+FINAL ANSWER: [ANSWER]
+
+Only write the answer in that exact format. Do not explain anything. Do not include any other text.
+
+If you are provided with a similar question and its final answer, and the current question is **exactly the same**, then simply return the same final answer without using any tools.
+
+Only use tools if the current question is different from the similar one.
+
+Examples:
+- FINAL ANSWER: FunkMonk
+- FINAL ANSWER: Paris
+- FINAL ANSWER: 128
+
+If you do not follow this format exactly, your response will be considered incorrect.
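
Since graders typically match this format mechanically, a small parser helps downstream; a sketch (hypothetical helper, not in the commit):

    import re

    def parse_final_answer(text: str) -> str | None:
        # Return the text after the last "FINAL ANSWER:" marker, if any.
        matches = re.findall(r"FINAL ANSWER:\s*(.+)", text)
        return matches[-1].strip() if matches else None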