Switched to a single agent powered by GPT-4.1 and added a step-wait function to avoid hitting the OpenAI API rate limit.
Files changed:
- configuration.py +30 -4
- functions/agent.py +66 -116
- functions/agent_helper_functions.py +142 -0
- functions/tool_helper_functions.py +286 -3
- functions/tools.py +3 -264
- results.csv +4 -4
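
The rate-limit fix described in the commit message works by registering a callback that smolagents invokes after every agent step. The real implementation is in functions/agent_helper_functions.py below; the following is only a minimal, hypothetical sketch of the pattern, assuming the smolagents callback signature used throughout this commit (callback receives the memory step and the agent):

# Sketch only: a per-step pause registered via step_callbacks.
import time

STEP_WAIT = 60  # seconds to pause after each step (the value this commit uses)

def step_wait(memory_step, agent):
    # Sleeping between steps caps the request rate at roughly one
    # model call per STEP_WAIT seconds for the main agent loop.
    time.sleep(STEP_WAIT)

# Registered when building the agent, e.g. CodeAgent(..., step_callbacks=[step_wait])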
configuration.py
CHANGED
@@ -1,8 +1,7 @@
-"""
-Configuration constants for the GAIA agent project.
-Contains API URLs and agent instructions used throughout the application.
-"""
+"""Configuration constants for the GAIA agent project."""
+
+from smolagents import OpenAIServerModel, InferenceClientModel
 
 # pylint: disable=line-too-long
 
 # Which questions to answer
@@ -15,3 +14,30 @@ DEFAULT_API_URL = 'https://agents-course-unit4-scoring.hf.space'
 INSTRUCTIONS = """
 You are a general AI assistant. I will ask you a question. Your final answer should be a number OR as few words as possible OR a comma separated list of numbers and/or strings. If you are asked for a number, don't use comma to write your number neither use units such as $ or percent sign unless specified otherwise. If you are asked for a string, don't use articles, neither abbreviations (e.g. for cities), and write the digits in plain text unless specified otherwise. If you are asked for a comma separated list, apply the above rules depending of whether the element to be put in the list is a number or a string. Submit the final answer via the final_answer tool.
 """
+
+# Agent model definitions
+MANAGER_MODEL = InferenceClientModel(
+    "deepseek-ai/DeepSeek-V3",
+    provider="together",
+    max_tokens=64000
+)
+
+WORKER_MODEL = InferenceClientModel(
+    "deepseek-ai/DeepSeek-V3",
+    provider="together",
+    max_tokens=64000
+)
+
+CHECK_MODEL = InferenceClientModel(
+    "deepseek-ai/DeepSeek-V3",
+    provider="together",
+    max_tokens=64000
+)
+
+MODEL = OpenAIServerModel(
+    model_id="gpt-4.1",
+    max_tokens=8000
+)
+
+TOKEN_LIMITER = 5000
+STEP_WAIT = 60
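
For orientation, a smolagents model object like MODEL is called directly with a list of chat messages and returns a message whose text is in .content (the same pattern check_reasoning() uses further down with CHECK_MODEL). A small hedged sketch, assuming OPENAI_API_KEY is set in the environment for OpenAIServerModel:

# Hypothetical usage sketch of the MODEL constant defined above.
from configuration import MODEL

messages = [
    {'role': 'user', 'content': [{'type': 'text', 'text': 'Reply with the word ready.'}]}
]

# The model object is callable; the reply text is on .content
print(MODEL(messages).content)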
functions/agent.py
CHANGED
@@ -1,141 +1,91 @@
 '''Agent definition for GAIA question answering system.'''
 
 # Standard library
-import os
-import json
 import logging
 
-from openai import OpenAI
-
 # Imports for agent creation
-from smolagents import CodeAgent,
+from smolagents import CodeAgent, VisitWebpageTool
+
 from functions.tools import (
     google_search,
     wikipedia_search,
-    get_wikipedia_page
+    get_wikipedia_page,
+    libretext_book_search,
+    get_libretext_book
 )
 
+from functions.agent_helper_functions import step_memory_cap, step_wait
+from configuration import MODEL
+
 # Get logger for this module
 logger = logging.getLogger(__name__)
 
 def create_agent():
     '''Creates agent for GAIA question answering system.'''
 
+    # web_agent = CodeAgent(
+    #     model=WORKER_MODEL,
+    #     tools=[google_search, VisitWebpageTool()],
+    #     additional_authorized_imports=['bs4.*', 'json'],
+    #     step_callbacks=[step_memory_cap],
+    #     name="web_agent",
+    #     verbosity_level=5,
+    #     max_steps=10,
+    #     planning_interval=5,
+    #     description="Web search agent for general queries and retrieving web pages as HTML",
+    # )
+
+    # wikipedia_agent = CodeAgent(
+    #     model=WORKER_MODEL,
+    #     tools=[wikipedia_search, get_wikipedia_page],
+    #     additional_authorized_imports=['bs4.*', 'json'],
+    #     step_callbacks=[step_memory_cap],
+    #     name="wikipedia_agent",
+    #     verbosity_level=5,
+    #     max_steps=10,
+    #     planning_interval=5,
+    #     description="Wikipedia agent to search and retrieve Wikipedia pages as HTML",
+    # )
+
+    # libretext_agent = CodeAgent(
+    #     model=WORKER_MODEL,
+    #     tools=[libretext_book_search, get_libretext_book],
+    #     additional_authorized_imports=['bs4.*', 'json'],
+    #     step_callbacks=[step_memory_cap],
+    #     name="libretext_agent",
+    #     verbosity_level=5,
+    #     max_steps=10,
+    #     planning_interval=5,
+    #     description="LibreText agent to search and retrieve content from academic textbooks books",
+    # )
+
+    # manager_agent = CodeAgent(
+    #     model=MANAGER_MODEL,
+    #     tools=[],
+    #     managed_agents=[web_agent, wikipedia_agent, libretext_agent],
+    #     additional_authorized_imports=['bs4.*', 'json'],
+    #     planning_interval=2,
+    #     verbosity_level=2,
+    #     final_answer_checks=[check_reasoning],
+    #     max_steps=20,
+    # )
 
     agent = CodeAgent(
-        model=
-        tools=
+        model=MODEL,
+        tools=[
+            google_search,
+            VisitWebpageTool(),
+            wikipedia_search,
+            get_wikipedia_page,
+            libretext_book_search,
+            get_libretext_book
+        ],
         additional_authorized_imports=['bs4.*', 'json'],
-        step_callbacks=[step_memory_cap],
+        step_callbacks=[step_memory_cap, step_wait],
         name="GAIA_agent",
         verbosity_level=5,
-        max_steps=
-        planning_interval=
-        description="GAIA agent for question answering"
+        max_steps=20,
+        planning_interval=5
     )
 
     return agent
-
-def step_memory_cap(memory_step: ActionStep, agent: CodeAgent) -> None:
-def summarize_old_messages(messages: dict) -> dict:

(The bodies of these two module-level helpers were deleted from this file; they reappear, lightly revised, in functions/agent_helper_functions.py below, with the hard-coded 50000-token threshold replaced by the TOKEN_LIMITER constant.)
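
A likely way the rest of the app drives this agent, sketched for context rather than taken from this diff (agent.run() is the standard smolagents entry point; the question text is a placeholder):

# Hypothetical driver sketch: build the agent and answer one GAIA question.
from functions.agent import create_agent

agent = create_agent()
answer = agent.run('Example GAIA question goes here')  # placeholder task text
print(answer)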
functions/agent_helper_functions.py
ADDED
@@ -0,0 +1,142 @@

'''Helper functions for the agent(s) in the GAIA question answering system.'''

import os
import time
import json
import logging
from openai import OpenAI
from smolagents import CodeAgent, ActionStep, MessageRole
from configuration import CHECK_MODEL, TOKEN_LIMITER, STEP_WAIT

# Get logger for this module
logger = logging.getLogger(__name__)


def check_reasoning(final_answer:str, agent_memory):
    """Checks the reasoning and plot of the agent's final answer."""

    prompt = (
        f"Here is a user-given task and the agent steps: {agent_memory.get_succinct_steps()}. " +
        "Please check that the reasoning process and answer are correct. " +
        "Do they correctly answer the given task? " +
        "First list reasons why yes/no, then write your final decision: " +
        "PASS in caps lock if it is satisfactory, FAIL if it is not. " +
        f"Final answer: {str(final_answer)}"
    )

    messages = [
        {
            "role": "user",
            "content": [
                {
                    "type": "text",
                    "text": prompt,
                }
            ],
        }
    ]

    output = CHECK_MODEL(messages).content
    print("Feedback: ", output)

    if "FAIL" in output:
        raise Exception(output) # pylint:disable=broad-exception-raised

    return True


def step_memory_cap(memory_step: ActionStep, agent: CodeAgent) -> None:
    '''Removes old steps from agent memory to keep context length under control.'''

    task_step = agent.memory.steps[0]
    planning_step = agent.memory.steps[1]
    latest_step = agent.memory.steps[-1]

    if len(agent.memory.steps) > 2:
        agent.memory.steps = [task_step, planning_step, latest_step]

    logger.info('Agent memory has %d steps', len(agent.memory.steps))
    logger.info('Latest step is step %d', memory_step.step_number)
    logger.info('Contains: %s messages', len(agent.memory.steps[-1].model_input_messages))
    logger.info('Token usage: %s', agent.memory.steps[-1].token_usage.total_tokens)

    for message in agent.memory.steps[-1].model_input_messages:
        logger.debug(' Role: %s: %s', message['role'], message['content'][:100])

    token_usage = agent.memory.steps[-1].token_usage.total_tokens

    if token_usage > TOKEN_LIMITER:
        logger.info('Token usage is %d, summarizing old messages', token_usage)

        summary = summarize_old_messages(
            agent.memory.steps[-1].model_input_messages[1:]
        )

        if summary is not None:

            new_messages = [agent.memory.steps[-1].model_input_messages[0]]
            new_messages.append({
                'role': MessageRole.USER,
                'content': [{
                    'type': 'text',
                    'text': f'Here is a summary of your investigation so far: {summary}'
                }]
            })
            agent.memory.steps = [agent.memory.steps[0]]
            agent.memory.steps[0].model_input_messages = new_messages

            for message in agent.memory.steps[0].model_input_messages:
                logger.debug(' Role: %s: %s', message['role'], message['content'][:100])


def summarize_old_messages(messages: dict) -> dict:
    '''Summarizes old messages to keep context length under control.'''

    client = OpenAI(api_key=os.environ['MODAL_API_KEY'])

    client.base_url = (
        'https://gperdrizet--vllm-openai-compatible-summarization-serve.modal.run/v1'
    )

    # Default to first avalible model
    model = client.models.list().data[0]
    model_id = model.id

    messages = [
        {
            'role': 'system',
            'content': ('Summarize the following interaction between an AI agent and a user.' +
                        f'Return the summary formatted as text, not as JSON: {json.dumps(messages)}')
        }
    ]

    completion_args = {
        'model': model_id,
        'messages': messages,
    }

    try:
        response = client.chat.completions.create(**completion_args)

    except Exception as e: # pylint: disable=broad-exception-caught
        response = None
        logger.error('Error during Modal API call: %s', e)

    if response is not None:
        summary = response.choices[0].message.content

    else:
        summary = None

    return summary


def step_wait(memory_step: ActionStep, agent: CodeAgent) -> None:
    '''Waits for a while to prevent hitting API rate limits.'''

    logger.info('Waiting for %d seconds to prevent hitting API rate limits', STEP_WAIT)
    logger.info('Current step is %d', memory_step.step_number)
    logger.info('Current agent has %d steps', len(agent.memory.steps))

    time.sleep(STEP_WAIT)

    return True
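
check_reasoning() is not wired into the single agent in this commit, but the commented-out manager_agent in functions/agent.py shows the intended hookup via final_answer_checks. A hedged sketch of that wiring, reusing the same parameter name from the commented-out code:

# Sketch only: register check_reasoning as a final-answer check, so a FAIL
# verdict raises and forces the agent to keep working.
from smolagents import CodeAgent
from functions.agent_helper_functions import check_reasoning
from configuration import MODEL

checked_agent = CodeAgent(
    model=MODEL,
    tools=[],
    final_answer_checks=[check_reasoning],
)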
functions/tool_helper_functions.py
CHANGED
@@ -1,9 +1,11 @@
 '''Helper functions for GAIA question answering agent tools.'''
 
+import requests
 import time
 import logging
-import
+import bleach
 from bs4 import BeautifulSoup
+from bleach.css_sanitizer import CSSSanitizer
 
 # Get logger for this module
 logger = logging.getLogger(__name__)
@@ -52,10 +54,12 @@ def libretext_book_parser(url: str) -> dict:
         chapter_count = 0
 
         for listing in chapter_listings:
+
             # Extract the link element
             link = listing.find('a', class_='mt-sortable-listing-link')
 
             if link:
+
                 # Extract title from the span with class 'mt-sortable-listing-title'
                 title_span = link.find('span', class_='mt-sortable-listing-title')
                 title = title_span.get_text(strip=True) if title_span else ''
@@ -69,11 +73,13 @@ def libretext_book_parser(url: str) -> dict:
                 # Clean up description - remove the title prefix if it appears
                 if description and title and description.startswith(title):
                     description = description[len(title):].strip()
+
                     if description.startswith(':'):
                         description = description[1:].strip()
 
                 # Only add meaningful chapters (skip empty titles or very short ones)
                 if title and len(title) > 2:
+
                     parsed_chapters[chapter_count] = {
                         'title': title,
                         'url': chapter_url,
@@ -85,14 +91,17 @@ def libretext_book_parser(url: str) -> dict:
                     chapter_count += 1
 
         logger.info('Successfully extracted %d chapters from book', len(parsed_chapters))
+
        return parsed_chapters
 
    except requests.exceptions.RequestException as e:
        logger.error('Request error while fetching book page: %s', str(e))
+
        return {'error': f'Request error: {str(e)}'}
 
    except Exception as e: # pylint:disable=broad-exception-caught
        logger.error('Unexpected error in book parser: %s', str(e))
+
        return {'error': f'Unexpected error: {str(e)}'}
@@ -233,40 +242,52 @@ def save_libretext_book_as_markdown(book_data: dict, filename: str = None, sourc
 
        # Table of contents
        chapters = book_data.get('chapters', {})
+
        if chapters:
            markdown_content.append("## Table of Contents\n")
+
            for chapter_title in chapters.keys():
+
                # Create anchor link for the chapter
-                anchor = chapter_title.lower().replace(
+                anchor = chapter_title.lower().replace(
+                    ' ',
+                    '-'
+                ).replace(':', '').replace('(', '').replace(')', '')
+
                markdown_content.append(f"- [{chapter_title}](#{anchor})\n")
            markdown_content.append("\n---\n\n")
 
        # Chapter content
        for chapter_title, chapter_data in chapters.items():
+
            # Chapter heading
            markdown_content.append(f"## {chapter_title}\n\n")
 
            sections = chapter_data.get('sections', {})
 
            if not sections:
+
                markdown_content.append("*No sections found for this chapter.*\n\n")
                continue
 
            # Section content
            for section_title, section_data in sections.items():
+
                # Section heading
                markdown_content.append(f"### {section_title}\n\n")
 
                # Section URL
                section_url = section_data.get('Section url', '')
+
                if section_url:
                    markdown_content.append(f"**URL:** [{section_url}]({section_url})\n\n")
 
                # Section summary
                section_summary = section_data.get('Section summary', '')
+
                if section_summary:
                    markdown_content.append(f"{section_summary}\n\n")
-
+
                    markdown_content.append("*No summary available.*\n\n")
 
                markdown_content.append("---\n\n")
@@ -277,9 +298,271 @@ def save_libretext_book_as_markdown(book_data: dict, filename: str = None, sourc
 
        success_msg = f"Successfully saved LibreTexts book as markdown file: {filename}"
        logger.info(success_msg)
+
        return success_msg
 
    except Exception as e: # pylint:disable=broad-exception-caught
        error_msg = f"Error saving markdown file: {str(e)}"
        logger.error(error_msg)
+
        return error_msg

The remainder of this hunk adds the WikipediaFetcher class, moved here from functions/tools.py:

class WikipediaFetcher:
    """Gets and cleans up Wikipedia pages."""

    def fetch(self, page_name):
        """
        Passed a Wikipedia page's URL fragment, like
        'Edward_Montagu,_1st_Earl_of_Sandwich', this will fetch the page's
        main contents, tidy the HTML, strip out any elements we don't want
        and return the final HTML string.

        Returns a dict with two elements:
        'success' is either True or, if we couldn't fetch the page, False.
        'content' is the HTML if success==True, or else an error message.
        """
        result = self._get_html(page_name)

        if result["success"]:
            result["content"] = self._tidy_html(result["content"])

        return result

    def _get_html(self, page_name):
        """
        Passed the name of a Wikipedia page (eg, 'Samuel_Pepys'), it fetches
        the HTML content (not the entire HTML page) and returns it.

        Returns a dict with two elements:
        'success' is either True or, if we couldn't fetch the page, False.
        'content' is the HTML if success==True, or else an error message.
        """
        error_message = ""

        url = f"https://en.wikipedia.org/wiki/{page_name}"

        try:
            response = requests.get(url, params={"action": "render"}, timeout=5)
        except requests.exceptions.ConnectionError:
            error_message = "Can't connect to domain."
        except requests.exceptions.Timeout:
            error_message = "Connection timed out."
        except requests.exceptions.TooManyRedirects:
            error_message = "Too many redirects."

        try:
            response.raise_for_status()
        except requests.exceptions.HTTPError:
            # 4xx or 5xx errors:
            error_message = f"HTTP Error: {response.status_code}"
        except NameError:
            if error_message == "":
                error_message = "Something unusual went wrong."

        if error_message:
            return {"success": False, "content": error_message}
        else:
            return {"success": True, "content": response.text}

    def _tidy_html(self, html):
        """
        Passed the raw Wikipedia HTML, this returns valid HTML, with all
        disallowed elements stripped out.
        """
        html = self._bleach_html(html)
        html = self._strip_html(html)
        return html

    def _bleach_html(self, html):
        """
        Ensures we have valid HTML; no unclosed or mis-nested tags.
        Removes any tags and attributes we don't want to let through.
        Doesn't remove the contents of any disallowed tags.

        Pass it an HTML string, it'll return the bleached HTML string.
        """

        # Pretty much most elements, but no forms or audio/video.
        allowed_tags = {
            "a", "abbr", "acronym", "address", "area", "article", "b",
            "blockquote", "br", "caption", "cite", "code", "col", "colgroup",
            "dd", "del", "dfn", "div", "dl", "dt", "em", "figcaption",
            "figure", "footer", "h1", "h2", "h3", "h4", "h5", "h6", "header",
            "hgroup", "hr", "i", "img", "ins", "kbd", "li", "map", "nav",
            "ol", "p", "pre", "q", "s", "samp", "section", "small", "span",
            "strong", "sub", "sup", "table", "tbody", "td", "tfoot", "th",
            "thead", "time", "tr", "ul", "var",
            # We allow script and style here, so we can close/un-mis-nest
            # its tags, but then it's removed completely in _strip_html():
            "script", "style",
        }

        # These attributes will not be removed from any of the allowed tags.
        allowed_attributes = {
            "*": ["class", "id"],
            "a": ["href", "title"],
            "abbr": ["title"],
            "acronym": ["title"],
            "img": ["alt", "src", "srcset"],
            # Ugh. Don't know why this page doesn't use .tright like others
            # http://127.0.0.1:8000/encyclopedia/5040/
            "table": ["align"],
            "td": ["colspan", "rowspan", "style"],
            "th": ["colspan", "rowspan", "scope"],
        }

        # These CSS properties are allowed within style attributes
        # Added for the family tree on /encyclopedia/5825/
        # Hopefully doesn't make anything else too hideous.
        allowed_css_properties = [
            "background", "border", "border-bottom", "border-collapse",
            "border-left", "border-radius", "border-right", "border-spacing",
            "border-top", "height", "padding", "text-align", "width",
        ]

        css_sanitizer = CSSSanitizer(allowed_css_properties=allowed_css_properties)

        a = bleach.clean(
            html,
            tags=allowed_tags,
            attributes=allowed_attributes,
            css_sanitizer=css_sanitizer,
            strip=True,
        )

        return a

    def _strip_html(self, html):
        """
        Takes out any tags, and their contents, that we don't want at all.
        And adds custom classes to existing tags (so we can apply CSS styles
        without having to multiply our CSS).

        Pass it an HTML string, it returns the stripped HTML string.
        """

        # CSS selectors. Strip these and their contents.
        selectors = [
            "div.hatnote",
            "div.navbar.mini",  # Will also match div.mini.navbar
            # Bottom of https://en.wikipedia.org/wiki/Charles_II_of_England :
            "div.topicon",
            "a.mw-headline-anchor",
            "script",
            "style",
        ]

        # Strip any element that has one of these classes.
        classes = [
            # "This article may be expanded with text translated from..."
            # https://en.wikipedia.org/wiki/Afonso_VI_of_Portugal
            "ambox-notice",
            "magnify",
            # eg audio on https://en.wikipedia.org/wiki/Bagpipes
            "mediaContainer",
            "navbox",
            "noprint",
        ]

        # Any element has a class matching a key, it will have the classes
        # in the value added.
        add_classes = {
            # Give these tables standard Bootstrap styles.
            "infobox": ["table", "table-bordered"],
            "ambox": ["table", "table-bordered"],
            "wikitable": ["table", "table-bordered"],
        }

        soup = BeautifulSoup(html, "lxml")

        for selector in selectors:
            _ = [tag.decompose() for tag in soup.select(selector)]

        for clss in classes:
            _ = [tag.decompose() for tag in soup.find_all(attrs={"class": clss})]

        for clss, new_classes in add_classes.items():
            for tag in soup.find_all(attrs={"class": clss}):
                tag["class"] = tag.get("class", []) + new_classes

        # Depending on the HTML parser BeautifulSoup used, soup may have
        # surrounding <html><body></body></html> or just <body></body> tags.
        if soup.body:
            soup = soup.body
        elif soup.html:
            soup = soup.html.body

        # Put the content back into a string.
        html = "".join(str(tag) for tag in soup.contents)

        return html
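
For reference, the class is used standalone like this, a small sketch that follows its own docstrings ('Samuel_Pepys' is simply the example page name those docstrings mention):

# Usage sketch for WikipediaFetcher, based on its documented return shape.
from functions.tool_helper_functions import WikipediaFetcher

fetcher = WikipediaFetcher()
result = fetcher.fetch('Samuel_Pepys')  # {'success': bool, 'content': HTML or error message}

if result['success']:
    print(result['content'][:200])  # first 200 characters of the cleaned HTML
else:
    print('Fetch failed:', result['content'])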
functions/tools.py
CHANGED
@@ -2,9 +2,7 @@
 
 import time
 import logging
-import bleach
 import requests
-from bleach.css_sanitizer import CSSSanitizer
 from smolagents import tool
 from googlesearch import search
 from bs4 import BeautifulSoup
@@ -17,7 +15,8 @@ from selenium.common.exceptions import TimeoutException, WebDriverException
 from functions.tool_helper_functions import (
     libretext_book_parser,
     libretext_chapter_parser,
-    save_libretext_book_as_markdown
+    save_libretext_book_as_markdown,
+    WikipediaFetcher
 )
 
 # Get logger for this module
@@ -119,7 +118,7 @@ def get_wikipedia_page(query: str) -> str:
     content = content.split(
         '<div class="mw-heading mw-heading2"><h2 id="Further_reading">Further reading</h2></div>'
     )[0]
-
+
     content = content.split(
         '<div class="mw-heading mw-heading2"><h2 id="References">References</h2></div>'
     )[0]
@@ -127,266 +126,6 @@ def get_wikipedia_page(query: str) -> str:
     return content
 
 
-class WikipediaFetcher:
-    """Gets and cleans up Wikipedia pages."""

(The rest of the WikipediaFetcher class body, identical to the version added to functions/tool_helper_functions.py above, is deleted from this file.)

 
 @tool
 def libretext_book_search(query: str) -> dict:
     """
results.csv
CHANGED
@@ -2,14 +2,14 @@ Task ID,Question,Submitted Answer
 8e867cd7-cff9-4e6c-867a-ff5ddc2550be,How many studio albums were published by Mercedes Sosa between 2000 and 2009 (included)? You can use the latest 2022 version of english wikipedia.,3
 2d83110e-a098-4ebb-9987-066c06fa42d0,".rewsna eht sa ""tfel"" drow eht fo etisoppo eht etirw ,ecnetnes siht dnatsrednu uoy fI",right
 4fc2f1ae-8625-45b5-ab34-ad4433bc21f8,Who nominated the only Featured Article on English Wikipedia about a dinosaur that was promoted in November 2016?,FunkMonk
-cabe07ed-9eca-40ea-8ead-410ef5e83f91,What is the surname of the equine veterinarian mentioned in 1.E Exercises from the chemistry materials licensed by Marisa Alviar-Agnew & Henry Agnew under the CK-12 license in LibreText's Introductory Chemistry materials as compiled 08/21/2023?,
+cabe07ed-9eca-40ea-8ead-410ef5e83f91,What is the surname of the equine veterinarian mentioned in 1.E Exercises from the chemistry materials licensed by Marisa Alviar-Agnew & Henry Agnew under the CK-12 license in LibreText's Introductory Chemistry materials as compiled 08/21/2023?,No equine veterinarian mentioned in 1.E Exercises
 3cef3a44-215e-4aed-8e3b-b1e3f08063b7,"I'm making a grocery list for my mom, but she's a professor of botany and she's a real stickler when it comes to categorizing things. I need to add different foods to different categories on the grocery list, but if I make a mistake, she won't buy anything inserted in the wrong category. Here's the list I have so far:
 
 milk, eggs, flour, whole bean coffee, Oreos, sweet potatoes, fresh basil, plums, green beans, rice, corn, bell pepper, whole allspice, acorns, broccoli, celery, zucchini, lettuce, peanuts
 
-I need to make headings for the fruits and vegetables. Could you please create a list of just the vegetables from my list? If you could do that, then I can figure out how to categorize the rest of the list into the appropriate categories. But remember that my mom is a real stickler, so make sure that no botanical fruits end up on the vegetable list, or she won't get them when she's at the store. Please alphabetize the list of vegetables, and place each item in a comma separated list.","broccoli, celery, green beans, lettuce, sweet potatoes, zucchini"
+I need to make headings for the fruits and vegetables. Could you please create a list of just the vegetables from my list? If you could do that, then I can figure out how to categorize the rest of the list into the appropriate categories. But remember that my mom is a real stickler, so make sure that no botanical fruits end up on the vegetable list, or she won't get them when she's at the store. Please alphabetize the list of vegetables, and place each item in a comma separated list.","bell pepper, broccoli, celery, corn, green beans, lettuce, sweet potatoes, zucchini"
 305ac316-eef6-4446-960a-92d80d542f82,Who did the actor who played Ray in the Polish-language version of Everybody Loves Raymond play in Magda M.? Give only the first name.,Wojciech
-3f57289b-8c60-48be-bd80-01f8099ca449,How many at bats did the Yankee with the most walks in the 1977 regular season have that same season?,
+3f57289b-8c60-48be-bd80-01f8099ca449,How many at bats did the Yankee with the most walks in the 1977 regular season have that same season?,525
 cf106601-ab4f-4af9-b045-5295fe67b37d,"What country had the least number of athletes at the 1928 Summer Olympics? If there's a tie for a number of athletes, return the first in alphabetical order. Give the IOC country code as your answer.",CUB
 a0c07678-e491-4bbc-8f0b-07405144218f,"Who are the pitchers with the number before and after Taishō Tamai's number as of July 2023? Give them to me in the form Pitcher Before, Pitcher After, use their last names only, in Roman characters.","Yamasaki, Uehara"
-5a0c1adf-205e-4841-a666-7c3ef95def9d,What is the first name of the only Malko Competition recipient from the 20th Century (after 1977) whose nationality on record is a country that no longer exists?,Claus Peter
+5a0c1adf-205e-4841-a666-7c3ef95def9d,What is the first name of the only Malko Competition recipient from the 20th Century (after 1977) whose nationality on record is a country that no longer exists?,Claus Peter Flor