unit-four-final-project

Sleeping

App Files Community

gperdrizet committed on Jun 27

Commit

10c462d

verified ·

1 Parent(s): 060a8f4

Downgraded to smolagents 1.18.0 and switched back to single codeagent - scored 20% on GAIA benchmark.

Browse files

Files changed (4) hide show

app.py +1 -2
configuration.py +2 -2
functions/agent.py +15 -37
requirements.txt +1 -1

app.py CHANGED Viewed

@@ -94,7 +94,7 @@ def run_and_submit_all(profile: gr.OAuthProfile | None):
         try:
             submitted_answer = agent.run(
-                question_text
             )
             answers_payload.append({"task_id": task_id, "submitted_answer": submitted_answer})
@@ -209,7 +209,6 @@ with gr.Blocks() as demo:
     run_button = gr.Button("Run Evaluation & Submit All Answers")
     status_output = gr.Textbox(label="Run Status / Submission Result", lines=5, interactive=False)
-    # Removed max_rows=10 from DataFrame constructor
     results_table = gr.DataFrame(label="Questions and Agent Answers", wrap=True)
     run_button.click( # pylint: disable=E1101

         try:
             submitted_answer = agent.run(
+                INSTRUCTIONS + '\n' + question_text
             )
             answers_payload.append({"task_id": task_id, "submitted_answer": submitted_answer})
     run_button = gr.Button("Run Evaluation & Submit All Answers")
     status_output = gr.Textbox(label="Run Status / Submission Result", lines=5, interactive=False)
     results_table = gr.DataFrame(label="Questions and Agent Answers", wrap=True)
     run_button.click( # pylint: disable=E1101

configuration.py CHANGED Viewed

@@ -6,12 +6,12 @@ Contains API URLs and agent instructions used throughout the application.
 # pylint: disable=line-too-long
 # Which questions to answer
-QUESTIONS = [1]
 # GAIA benchmark scoring API
 DEFAULT_API_URL = 'https://agents-course-unit4-scoring.hf.space'
 # Additional instructions for agent. See here: https://huggingface.co/spaces/gaia-benchmark/leaderboard
 INSTRUCTIONS = """
-You are a general AI assistant. I will ask you a question. Your final answer should be a number OR as few words as possible OR a comma separated list of numbers and/or strings. If you are asked for a number, don't use comma to write your number neither use units such as $ or percent sign unless specified otherwise. If you are asked for a string, don't use articles, neither abbreviations (e.g. for cities), and write the digits in plain text unless specified otherwise. If you are asked for a comma separated list, apply the above rules depending of whether the element to be put in the list is a number or a string.
 """

 # pylint: disable=line-too-long
 # Which questions to answer
+QUESTIONS = [1,3,5,8,9,11,13,17,18,20]
 # GAIA benchmark scoring API
 DEFAULT_API_URL = 'https://agents-course-unit4-scoring.hf.space'
 # Additional instructions for agent. See here: https://huggingface.co/spaces/gaia-benchmark/leaderboard
 INSTRUCTIONS = """
+You are a general AI assistant. I will ask you a question. Your final answer should be a number OR as few words as possible OR a comma separated list of numbers and/or strings. If you are asked for a number, don't use comma to write your number neither use units such as $ or percent sign unless specified otherwise. If you are asked for a string, don't use articles, neither abbreviations (e.g. for cities), and write the digits in plain text unless specified otherwise. If you are asked for a comma separated list, apply the above rules depending of whether the element to be put in the list is a number or a string. Submit the final answer via the final_answer tool.
 """

functions/agent.py CHANGED Viewed

@@ -1,7 +1,7 @@
 '''Agent definition for GAIA question answering system.'''
 # Imports for agent creation
-from smolagents import CodeAgent, ToolCallingAgent, InferenceClientModel, VisitWebpageTool
 from functions.tools import (
     google_search,
     wikipedia_search,
@@ -12,50 +12,28 @@ def create_agent():
     '''Creates agent for GAIA question answering system.'''
     model = InferenceClientModel(
-        "Qwen/Qwen2.5-Coder-32B-Instruct", provider="together"
     )
-    web_agent_tools = [
         google_search,
         VisitWebpageTool()
     ]
-    web_agent = CodeAgent(
         model=model,
-        tools=web_agent_tools,
-        name="web_agent",
-        description="Browses the web to find information",
         verbosity_level=1,
-        max_steps=10,
-    )
-    wikipedia_agent_tools = [
-        wikipedia_search,
-        get_wikipedia_page
-    ]
-    wikipedia_agent = CodeAgent(
-        model=model,
-        tools=wikipedia_agent_tools,
-        additional_authorized_imports=['bs4.*'],
-        name="wikipedia_agent",
-        description="Search Wikipedia and retrieve pages",
-        verbosity_level=1,
-        max_steps=10
-    )
-    manager_agent = CodeAgent(
-        model=model,
-        tools=[],
-        additional_authorized_imports=['bs4.*'],
-        name="manager_agent",
-        description="Manages the workflow of other agents",
-        managed_agents=[web_agent, wikipedia_agent],
-        planning_interval=1,
-        verbosity_level=2,
-        max_steps=15,
     )
-    manager_agent.visualize()
-    return manager_agent

 '''Agent definition for GAIA question answering system.'''
 # Imports for agent creation
+from smolagents import CodeAgent, InferenceClientModel, VisitWebpageTool
 from functions.tools import (
     google_search,
     wikipedia_search,
     '''Creates agent for GAIA question answering system.'''
     model = InferenceClientModel(
+        "Qwen/Qwen2.5-Coder-32B-Instruct",
+        provider="hf-inference",
+        max_tokens=8096
     )
+    tools = [
+        wikipedia_search,
+        get_wikipedia_page,
         google_search,
         VisitWebpageTool()
     ]
+    agent = CodeAgent(
         model=model,
+        tools=tools,
+        additional_authorized_imports=['bs4.*', 'json'],
+        name="GAIA_agent",
         verbosity_level=1,
+        max_steps=20,
+        planning_interval=5,
+        description="GAIA agent for question answering"
     )
+    return agent

requirements.txt CHANGED Viewed

@@ -5,6 +5,6 @@ gradio[oauth]
 markdownify
 mwparserfromhell
 requests
-smolagents
 tinycss2
 wikipedia-api

 markdownify
 mwparserfromhell
 requests
+smolagents==1.13.0
 tinycss2
 wikipedia-api