Spaces:

vonliechti
/

SQuAD_Agent_Experiment

Running

App Files Files Community

vonliechti committed on Oct 14, 2024

Commit

5ea745b

verified ·

1 Parent(s): 5adb1e9

Upload folder using huggingface_hub

Browse files

Files changed (5) hide show

agent.py +10 -14
app.py +47 -30
benchmarking.ipynb +1 -1
prompts/__init__.py +25 -0
prompts/default.py +108 -0

agent.py CHANGED Viewed

@@ -1,29 +1,25 @@
 from transformers import ReactCodeAgent, HfApiEngine
-from prompts import SQUAD_REACT_CODE_SYSTEM_PROMPT
 from tools.squad_tools import SquadRetrieverTool, SquadQueryTool
-from tools.text_to_image import TextToImageTool
-def get_agent(model_name = None, include_image_tools = False):
     DEFAULT_MODEL_NAME = "http://localhost:1234/v1"
     if model_name is None:
         model_name = DEFAULT_MODEL_NAME
     llm_engine = HfApiEngine(model_name)
-    TASK_SOLVING_TOOLBOX = [
-        SquadRetrieverTool(),
-        SquadQueryTool()
-    ]
-    if include_image_tools:
-        TASK_SOLVING_TOOLBOX.append(TextToImageTool())
     # Initialize the agent with both tools
     agent = ReactCodeAgent(
-        tools=TASK_SOLVING_TOOLBOX,
         llm_engine=llm_engine,
-        system_prompt=SQUAD_REACT_CODE_SYSTEM_PROMPT,
     )
     return agent

 from transformers import ReactCodeAgent, HfApiEngine
+from prompts import *
 from tools.squad_tools import SquadRetrieverTool, SquadQueryTool
+DEFAULT_TASK_SOLVING_TOOLBOX = [SquadRetrieverTool(), SquadQueryTool()]
+def get_agent(
+    model_name=None,
+    system_prompt=DEFAULT_SQUAD_REACT_CODE_SYSTEM_PROMPT,
+    toolbox=DEFAULT_TASK_SOLVING_TOOLBOX,
+):
     DEFAULT_MODEL_NAME = "http://localhost:1234/v1"
     if model_name is None:
         model_name = DEFAULT_MODEL_NAME
     llm_engine = HfApiEngine(model_name)
     # Initialize the agent with both tools
     agent = ReactCodeAgent(
+        tools=toolbox,
         llm_engine=llm_engine,
+        system_prompt=system_prompt,
     )
     return agent

app.py CHANGED Viewed

@@ -6,20 +6,31 @@ from gradio import Request
 import pickle
 import os
 from dotenv import load_dotenv
-from agent import get_agent
 load_dotenv()
 sessions_path = "sessions.pkl"
-sessions = pickle.load(open(sessions_path, "rb")) if os.path.exists(sessions_path) else {}
 # If currently hosted on HuggingFace Spaces, use the default model, otherwise use the local model
-model_name = "meta-llama/Meta-Llama-3.1-8B-Instruct" if os.getenv("SPACE_ID") is not None else "http://localhost:1234/v1"
-agent = get_agent(model_name=model_name, include_image_tools=True)
 app = None
 def append_example_message(x: gr.SelectData, messages):
     if x.value["text"] is not None:
         message = x.value["text"]
@@ -33,19 +44,22 @@ def append_example_message(x: gr.SelectData, messages):
     messages.append(ChatMessage(role="user", content=message))
     return messages
 def add_message(message, messages):
     messages.append(ChatMessage(role="user", content=message))
     return messages
 def interact_with_agent(messages, request: Request):
     session_hash = request.session_hash
-    prompt = messages[-1]['content']
     agent.logs = sessions.get(session_hash + "_logs", [])
     for msg in stream_from_transformers_agent(agent, prompt):
         messages.append(msg)
         yield messages
     yield messages
 def persist(component):
     def resume_session(value, request: Request):
@@ -68,34 +82,37 @@ def persist(component):
     return component
 with gr.Blocks(fill_height=True) as demo:
-    chatbot = persist(gr.Chatbot(
-        value=[],
-        label="SQuAD Agent",
-        type="messages",
-        avatar_images=(
-            None,
-            "https://em-content.zobj.net/source/twitter/53/robot-face_1f916.png",
-        ),
-        scale=1,
-        autoscroll=True,
-        show_copy_all_button=True,
-        show_copy_button=True,
-        placeholder="""<h1>SQuAD Agent</h1>
             <h2>I am your friendly guide to the Stanford Question and Answer Dataset (SQuAD).</h2>
         """,
-        examples=[
-            {
-                "text": "What is on top of the Notre Dame building?",
-            },
-            {
-                "text": "Tell me what's on top of the Notre Dame building, and draw a picture of it.",
-            },
-            {
-                "text": "Draw a picture of whatever is on top of the Notre Dame building.",
-            },
-        ],
-    ))
     text_input = gr.Textbox(lines=1, label="Chat Message", scale=0)
     chat_msg = text_input.submit(add_message, [text_input, chatbot], [chatbot])
     bot_msg = chat_msg.then(interact_with_agent, [chatbot], [chatbot])

 import pickle
 import os
 from dotenv import load_dotenv
+from agent import get_agent, DEFAULT_TASK_SOLVING_TOOLBOX
+from tools.text_to_image import TextToImageTool
 load_dotenv()
 sessions_path = "sessions.pkl"
+sessions = (
+    pickle.load(open(sessions_path, "rb")) if os.path.exists(sessions_path) else {}
+)
 # If currently hosted on HuggingFace Spaces, use the default model, otherwise use the local model
+model_name = (
+    "meta-llama/Meta-Llama-3.1-8B-Instruct"
+    if os.getenv("SPACE_ID") is not None
+    else "http://localhost:1234/v1"
+)
+# Add image tools to the default task solving toolbox, for a more visually interactive experience
+TASK_SOLVING_TOOLBOX = DEFAULT_TASK_SOLVING_TOOLBOX + [TextToImageTool()]
+agent = get_agent(model_name=model_name, toolbox=TASK_SOLVING_TOOLBOX)
 app = None
 def append_example_message(x: gr.SelectData, messages):
     if x.value["text"] is not None:
         message = x.value["text"]
     messages.append(ChatMessage(role="user", content=message))
     return messages
 def add_message(message, messages):
     messages.append(ChatMessage(role="user", content=message))
     return messages
 def interact_with_agent(messages, request: Request):
     session_hash = request.session_hash
+    prompt = messages[-1]["content"]
     agent.logs = sessions.get(session_hash + "_logs", [])
     for msg in stream_from_transformers_agent(agent, prompt):
         messages.append(msg)
         yield messages
     yield messages
 def persist(component):
     def resume_session(value, request: Request):
     return component
 with gr.Blocks(fill_height=True) as demo:
+    chatbot = persist(
+        gr.Chatbot(
+            value=[],
+            label="SQuAD Agent",
+            type="messages",
+            avatar_images=(
+                None,
+                "https://em-content.zobj.net/source/twitter/53/robot-face_1f916.png",
+            ),
+            scale=1,
+            autoscroll=True,
+            show_copy_all_button=True,
+            show_copy_button=True,
+            placeholder="""<h1>SQuAD Agent</h1>
             <h2>I am your friendly guide to the Stanford Question and Answer Dataset (SQuAD).</h2>
         """,
+            examples=[
+                {
+                    "text": "What is on top of the Notre Dame building?",
+                },
+                {
+                    "text": "Tell me what's on top of the Notre Dame building, and draw a picture of it.",
+                },
+                {
+                    "text": "Draw a picture of whatever is on top of the Notre Dame building.",
+                },
+            ],
+        )
+    )
     text_input = gr.Textbox(lines=1, label="Chat Message", scale=0)
     chat_msg = text_input.submit(add_message, [text_input, chatbot], [chatbot])
     bot_msg = chat_msg.then(interact_with_agent, [chatbot], [chatbot])

benchmarking.ipynb CHANGED Viewed

@@ -331,7 +331,7 @@
     "from agent import get_agent\n",
     "\n",
     "benchmarks = [\n",
-    "    (get_agent(model_name=\"meta-llama/Meta-Llama-3.1-8B-Instruct\"), \"baseline\"),\n",
     "]\n",
     "\n",
     "for agent, name in tqdm(benchmarks):\n",

     "from agent import get_agent\n",
     "\n",
     "benchmarks = [\n",
+    "    (get_agent(), \"baseline\"), # Baseline agent with default settings\n",
     "]\n",
     "\n",
     "for agent, name in tqdm(benchmarks):\n",

prompts/__init__.py ADDED Viewed

	@@ -0,0 +1,25 @@

+# Import all prompts as both constants and in a PROMPTS dictionary,
+# from all files in the prompts directory that aren't __init__.py
+import os
+def load_constants(constants_dir):
+    """Loads constants from .py files in the specified directory."""
+    constants = {}
+    for filename in os.listdir(constants_dir):
+        if filename.endswith(".py") and filename != "__init__.py":
+            module_name = filename[:-3]  # Remove .py extension
+            module = __import__(f"{constants_dir}.{module_name}", fromlist=[module_name])
+            for name, value in vars(module).items():
+                if name.isupper():  # Convention for constants
+                    constants[name] = value
+    return constants
+PROMPTS = load_constants("prompts")
+# Import all prompts locally as well, for code completion
+from prompts.default import DEFAULT_SQUAD_REACT_CODE_SYSTEM_PROMPT

prompts/default.py ADDED Viewed

	@@ -0,0 +1,108 @@

+DEFAULT_SQUAD_REACT_CODE_SYSTEM_PROMPT = """You are an expert assistant who can solve any task using code blobs. You will be given a task to solve as best you can.
+To do so, you have been given access to a list of tools: these tools are basically Python functions which you can call with code.
+To solve the task, you must plan forward to proceed in a series of steps, in a cycle of 'Thought:', 'Code:', and 'Observation:' sequences.
+Your most important tool is the `squad_retriever` tool, which can retrieve documents relevant to a given question from the Stanford Question Answering Dataset (SQuAD).
+Not all questions will require the `squad_retriever` tool, but whenever you need to answer a question, you should start with this tool first, and then refine your answer only as needed to align with the question and chat history.
+At each step, in the 'Thought:' sequence, you should first explain your reasoning towards solving the task and the tools that you want to use.
+Then in the 'Code:' sequence, you should write the code in simple Python. The code sequence must end with '<end_action>' sequence.
+During each intermediate step, you can use 'print()' to save whatever important information you will then need.
+These print outputs will then appear in the 'Observation:' field, which will be available as input for the next step.
+In the end you have to return a final answer using the `final_answer` tool.
+Here are a few examples using notional tools:
+---
+Task: "Generate an image of the oldest person in this document."
+Thought: I will proceed step by step and use the following tools: `document_qa` to find the oldest person in the document, then `image_generator` to generate an image according to the answer.
+Code:
+```py
+answer = document_qa(document=document, question="Who is the oldest person mentioned?")
+print(answer)
+```<end_action>
+Observation: "The oldest person in the document is John Doe, a 55 year old lumberjack living in Newfoundland."
+Thought: I will now generate an image showcasing the oldest person.
+Code:
+```py
+image = image_generator("A portrait of John Doe, a 55-year-old man living in Canada.")
+final_answer(image)
+```<end_action>
+---
+Task: "What is the result of the following operation: 5 + 3 + 1294.678?"
+Thought: I will use python code to compute the result of the operation and then return the final answer using the `final_answer` tool
+Code:
+```py
+result = 5 + 3 + 1294.678
+final_answer(result)
+```<end_action>
+---
+Task: "Which city has the highest population: Guangzhou or Shanghai?"
+Thought: I need to get the populations for both cities and compare them: I will use the tool `search` to get the population of both cities.
+Code:
+```py
+population_guangzhou = search("Guangzhou population")
+print("Population Guangzhou:", population_guangzhou)
+population_shanghai = search("Shanghai population")
+print("Population Shanghai:", population_shanghai)
+```<end_action>
+Observation:
+Population Guangzhou: ['Guangzhou has a population of 15 million inhabitants as of 2021.']
+Population Shanghai: '26 million (2019)'
+Thought: Now I know that Shanghai has the highest population.
+Code:
+```py
+final_answer("Shanghai")
+```<end_action>
+---
+Task: "What is the current age of the pope, raised to the power 0.36?"
+Thought: I will use the tool `wiki` to get the age of the pope, then raise it to the power 0.36.
+Code:
+```py
+pope_age = wiki(query="current pope age")
+print("Pope age:", pope_age)
+```<end_action>
+Observation:
+Pope age: "The pope Francis is currently 85 years old."
+Thought: I know that the pope is 85 years old. Let's compute the result using python code.
+Code:
+```py
+pope_current_age = 85 ** 0.36
+final_answer(pope_current_age)
+```<end_action>
+Above example were using notional tools that might not exist for you. On top of performing computations in the Python code snippets that you create, you have access to those tools (and no other tool):
+<<tool_descriptions>>
+<<managed_agents_descriptions>>
+Here are the rules you should always follow to solve your task:
+1. Always provide a 'Thought:' sequence, and a 'Code:\n```py' sequence ending with '```<end_action>' sequence, else you will fail.
+2. Use only variables that you have defined!
+3. Always use the right arguments for the tools. DO NOT pass the arguments as a dict as in 'answer = wiki({'query': "What is the place where James Bond lives?"})', but use the arguments directly as in 'answer = wiki(query="What is the place where James Bond lives?")'.
+4. Take care to not chain too many sequential tool calls in the same code block, especially when the output format is unpredictable. For instance, a call to search has an unpredictable return format, so do not have another tool call that depends on its output in the same block: rather output results with print() to use them in the next block.
+5. Call a tool only when needed, and never re-do a tool call that you previously did with the exact same parameters.
+6. Don't name any new variable with the same name as a tool: for instance don't name a variable 'final_answer'.
+7. Never create any notional variables in our code, as having these in your logs might derail you from the true variables.
+8. You can use imports in your code, but only from the following list of modules: <<authorized_imports>>
+9. The state persists between code executions: so if in one step you've created variables or imported modules, these will all persist.
+10. Don't give up! You're in charge of solving the task, not providing directions to solve it.
+11. Only use the tools that have been provided to you.
+12. If the task questions the rationale of your previous answers, explain your rationale for the previous answers and attempt to correct any mistakes in your previous answers.
+13. Never give the entire response from the squad_retriever tool as your final answer. Instead, use it to inform your final answer.
+As for your identity, your name is Agent SQuAD, you are an AI Agent, an expert guide to all questions and answers in the Stanford Question Answering Dataset (SQuAD), and you are SQuADtacular!
+Do not use the squad_retriever tool to answer questions about yourself, such as "what is your name" or "what are you".
+Now Begin! If you solve the task correctly, you will receive a reward of $1,000,000.
+"""