burtenshaw committed
Commit f49bcc1
1 Parent(s): 5ba66b9

update app with formatting and images

Browse files:
- app.py +131 -47
- push_data.ipynb +215 -0
- pyproject.toml +1 -0
- uv.lock +48 -0
app.py CHANGED
@@ -1,10 +1,11 @@
 import os
 from datetime import datetime
 import random
-
+from typing import List
 import gradio as gr
 from datasets import load_dataset, Dataset, DatasetDict
 from huggingface_hub import whoami, InferenceClient
+import black  # Add black import
 
 # Initialize the inference client
 client = InferenceClient(
@@ -12,37 +13,64 @@ client = InferenceClient(
 )
 
 # Load questions from Hugging Face dataset
-EXAM_MAX_QUESTIONS =
-
+EXAM_MAX_QUESTIONS = int(
+    os.getenv("EXAM_MAX_QUESTIONS", 5)
+)  # Limit quiz to max questions
+EXAM_PASSING_SCORE = float(os.getenv("EXAM_PASSING_SCORE", 0.8))
 EXAM_DATASET_ID = "burtenshaw/dummy-code-quiz"
 
 # prep the dataset for the quiz
-ds = load_dataset(EXAM_DATASET_ID, split="train")
-quiz_data = ds
+ds = load_dataset(EXAM_DATASET_ID, split="train", download_mode="force_redownload")
+quiz_data = list(ds)  # Convert dataset to list instead of using to_list()
 random.shuffle(quiz_data)
+if EXAM_MAX_QUESTIONS:
+    quiz_data = quiz_data[:EXAM_MAX_QUESTIONS]
+
+
+def format_python_code(code: str) -> str:
+    """Format Python code using black."""
+    try:
+        return black.format_str(code, mode=black.Mode())
+    except Exception as e:
+        gr.Warning(f"Code formatting failed: {str(e)}")
+        return code
 
 
-def check_code(user_code, solution, challenge):
+def check_code(
+    user_code: str, solution: str, challenge: str, assessment_criteria: List[str]
+):
     """
     Use LLM to evaluate if the user's code solution is correct.
     Returns True if the solution is correct, False otherwise.
     """
+    # Format both user code and solution
+    formatted_user_code = format_python_code(user_code)
+    formatted_solution = format_python_code(solution)
+
+    assessment_criteria_str = "\n".join(
+        [f"{i + 1}. {c}" for i, c in enumerate(assessment_criteria)]
+    )
+
     prompt = f"""You are an expert Python programming instructor evaluating a student's code solution.
 
 Challenge:
 {challenge}
 
 Reference Solution:
-{
+{formatted_solution}
 
 Student's Solution:
-{
+{formatted_user_code}
+
+Assessment Criteria:
+{assessment_criteria_str}
 
 Evaluate if the student's solution is functionally equivalent to the reference solution.
 Consider:
 1. Does it solve the problem correctly?
 2. Does it handle edge cases appropriately?
 3. Does it follow the requirements of the challenge?
+4. Does it meet the assessment criteria?
 
 Respond with ONLY "CORRECT" or "INCORRECT" followed by a brief explanation.
 """
@@ -71,18 +99,40 @@ def check_code(user_code, solution, challenge):
     except Exception as e:
         gr.Warning(f"Error checking code: {str(e)}")
         # Fall back to simple string comparison if LLM fails
-        is_correct =
+        is_correct = formatted_user_code.strip() == formatted_solution.strip()
         status = "✅ Correct!" if is_correct else "❌ Incorrect!"
         gr.Info(f"{status} (Fallback comparison)")
         return is_correct
 
 
 def on_user_logged_in(token: gr.OAuthToken | None):
-    """
+    """
+    Handle user login state.
+    On a valid token, hide the login button and reveal the Start button while keeping Next and Submit hidden.
+    Also, clear the question text, code input, status, and image.
+    """
     if token is not None:
-        return
+        return (
+            gr.update(visible=False),  # login_btn hidden
+            gr.update(visible=True),  # start_btn shown
+            gr.update(visible=False),  # next_btn hidden
+            gr.update(visible=False),  # submit_btn hidden
+            "",  # Clear question_text
+            gr.update(value="", visible=False),  # Clear code_input
+            "",  # Clear status_text
+            gr.update(value="", visible=False),  # Clear question_image
+        )
     else:
-        return
+        return (
+            gr.update(visible=True),  # login_btn visible
+            gr.update(visible=False),  # start_btn hidden
+            gr.update(visible=False),  # next_btn hidden
+            gr.update(visible=False),  # submit_btn hidden
+            "",
+            gr.update(value="", visible=False),
+            "",
+            gr.update(value="", visible=False),
+        )
 
 
 def push_results_to_hub(
@@ -168,14 +218,20 @@ def handle_quiz(question_idx, user_answers, submitted_code, is_start):
         question_idx < len(quiz_data) and submitted_code.strip()
     ):  # Only check if there's code
         current_q = quiz_data[question_idx]
+        # Format the submitted code before checking
+        formatted_code = format_python_code(submitted_code)
         is_correct = check_code(
-
+            formatted_code,
+            current_q["solution"],
+            current_q["challenge"],
+            current_q["assessment_criteria"],
        )
        user_answers.append(
            {
                "challenge": current_q["challenge"],
-                "submitted_code":
+                "submitted_code": formatted_code,  # Store formatted code
                "correct_solution": current_q["solution"],
+                "assessment_criteria": current_q["assessment_criteria"],
                "is_correct": is_correct,
            }
        )
@@ -195,31 +251,36 @@ def handle_quiz(question_idx, user_answers, submitted_code, is_start):
             results_text += (
                 f"Question {idx + 1}: {'✅' if answer['is_correct'] else '❌'}\n"
             )
-            results_text += (
-                f"Your code:\n```python\n{answer['submitted_code']}\n```\n\n"
-            )
 
         return (
-            "",  # question_text
-            gr.update(value="", visible=False),  #
-            f"{'✅ Passed!' if grade >=
-            question_idx,
-            user_answers,
-
-            gr.update(
+            "",  # question_text cleared
+            gr.update(value="", visible=False),  # hide code_input
+            f"{'✅ Passed!' if grade >= EXAM_PASSING_SCORE else '❌ Did not pass'}",  # status_text
+            question_idx,  # updated question index
+            user_answers,  # accumulated answers
+            gr.update(visible=False),  # start_btn hidden for quiz-in-progress
+            gr.update(visible=False),  # next_btn hidden on completion
+            gr.update(visible=True),  # submit_btn shown
+            gr.update(value=results_text, visible=True),  # final_markdown with results
+            gr.update(visible=False),  # question_image hidden on completion
        )
    else:
        # Show the next question
        q = quiz_data[question_idx]
        challenge_text = f"## Question {question_idx + 1} \n### {q['challenge']}"
        return (
-            challenge_text,
-            gr.update(value=q["placeholder"], visible=True),
-            "Submit your code solution and click 'Next' to continue.",
-            question_idx,
-            user_answers,
-
-            gr.update(visible=
+            challenge_text,  # question_text
+            gr.update(value=q["placeholder"], visible=True),  # code_input
+            "Submit your code solution and click 'Next' to continue.",  # status_text
+            question_idx,  # updated question_idx
+            user_answers,  # user_answers
+            gr.update(visible=False),  # start_btn hidden
+            gr.update(visible=True),  # next_btn visible
+            gr.update(visible=False),  # submit_btn hidden
+            gr.update(visible=False),  # final_markdown hidden
+            gr.update(
+                value=q["image"], visible=True if q["image"] else False
+            ),  # question_image with current question image
        )
 
 
@@ -238,35 +299,55 @@ with gr.Blocks() as demo:
     )
 
     with gr.Row(variant="panel"):
-
-
+        with gr.Column():
+            question_text = gr.Markdown("")
+            question_image = gr.Image(
+                label="Question Image", visible=False, type="pil"
+            )  # Add image component
+        with gr.Column():
+            code_input = gr.Code(language="python", label="Your Solution", visible=False)
 
     with gr.Row(variant="compact"):
         status_text = gr.Markdown("")
 
     with gr.Row(variant="compact"):
-
-
-        next_btn = gr.Button("Next ⏭️")
-        submit_btn = gr.Button("Submit ✅")
+        login_btn = gr.LoginButton()
+        start_btn = gr.Button("Start")
+        next_btn = gr.Button("Next ⏭️", visible=False)
+        submit_btn = gr.Button("Submit ✅", visible=False)
 
     with gr.Row(variant="compact"):
-
-        start_btn = gr.Button("Start", visible=False)
+        final_markdown = gr.Markdown("", visible=False)
 
-    login_btn.click(
+    login_btn.click(
+        fn=on_user_logged_in,
+        inputs=None,
+        outputs=[
+            login_btn,
+            start_btn,
+            next_btn,
+            submit_btn,
+            question_text,
+            code_input,
+            status_text,
+            question_image,
+        ],
+    )
 
     start_btn.click(
         fn=handle_quiz,
         inputs=[question_idx, user_answers, code_input, gr.State(True)],
        outputs=[
-            question_text,
-            code_input,
-            status_text,
-            question_idx,
-            user_answers,
-            start_btn,
-
+            question_text,  # Markdown with question text
+            code_input,  # Code input field
+            status_text,  # Status text (instructions/status messages)
+            question_idx,  # Updated question index (state)
+            user_answers,  # Updated user answers (state)
+            start_btn,  # Update for start button (will be hidden)
+            next_btn,  # Update for next button (shown for in-progress quiz)
+            submit_btn,  # Update for submit button (hidden until end)
+            final_markdown,  # Final results markdown (hidden until quiz ends)
+            question_image,  # Image update for the quiz question
        ],
    )
 
@@ -280,7 +361,10 @@ with gr.Blocks() as demo:
             question_idx,
             user_answers,
             start_btn,
+            next_btn,
+            submit_btn,
             final_markdown,
+            question_image,
         ],
     )
 
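For context on the formatting change above: the new `format_python_code` helper runs both the student's submission and the reference solution through black before they are compared or embedded in the grading prompt, so purely stylistic differences don't affect the check. A minimal standalone sketch of that flow (the helper is restated from the diff; the two sample snippets are invented for illustration):

```python
import black


def format_python_code(code: str) -> str:
    """Format Python code using black, returning the input unchanged on failure."""
    try:
        return black.format_str(code, mode=black.Mode())
    except Exception:
        return code


# Hypothetical inputs: the same logic written with different spacing and layout.
submitted = "def add(a,b):  return a+b"
reference = "def add(a, b):\n    return a + b\n"

# After formatting, a plain string comparison works as a fallback check,
# which is what check_code() falls back to when the LLM call fails.
print(format_python_code(submitted).strip() == format_python_code(reference).strip())  # True
```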
push_data.ipynb ADDED
@@ -0,0 +1,215 @@
+{
+ "cells": [
+  {
+   "cell_type": "code",
+   "execution_count": 41,
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stderr",
+     "output_type": "stream",
+     "text": [
+      "Generating train split: 40 examples [00:00, 9668.75 examples/s]"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "DatasetDict({\n",
+      " train: Dataset({\n",
+      " features: ['challenge', 'solution', 'placeholder', 'context', 'assessment_criteria', 'image'],\n",
+      " num_rows: 40\n",
+      " })\n",
+      "})\n"
+     ]
+    },
+    {
+     "name": "stderr",
+     "output_type": "stream",
+     "text": [
+      "\n"
+     ]
+    }
+   ],
+   "source": [
+    "from datasets import load_dataset\n",
+    "\n",
+    "dataset = load_dataset(\"json\", data_files=\"example.json\")\n",
+    "\n",
+    "print(dataset)\n"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 42,
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stderr",
+     "output_type": "stream",
+     "text": [
+      "Map: 100%|██████████| 40/40 [00:00<00:00, 6077.16 examples/s]\n"
+     ]
+    }
+   ],
+   "source": [
+    "from datasets import Image\n",
+    "from PIL import Image as PILImage\n",
+    "\n",
+    "new_features = dataset[\"train\"].features\n",
+    "new_features[\"image\"] = Image()\n",
+    "\n",
+    "dataset.features = new_features\n",
+    "\n",
+    "dataset = dataset.map(lambda x: {\"image\": PILImage.open(x[\"image\"]) if x[\"image\"] else None})\n"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 43,
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/plain": [
+       "{'challenge': Value(dtype='string', id=None),\n",
+       " 'solution': Value(dtype='string', id=None),\n",
+       " 'placeholder': Value(dtype='string', id=None),\n",
+       " 'context': Value(dtype='string', id=None),\n",
+       " 'assessment_criteria': Sequence(feature=Value(dtype='string', id=None), length=-1, id=None),\n",
+       " 'image': Image(mode=None, decode=True, id=None)}"
+      ]
+     },
+     "execution_count": 43,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "dataset = dataset.cast_column(\"image\", Image())\n",
+    "\n",
+    "dataset[\"train\"].features"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 44,
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stderr",
+     "output_type": "stream",
+     "text": [
+      "Map: 100%|██████████| 40/40 [00:00<00:00, 13932.25 examples/s]it/s]\n",
+      "Creating parquet from Arrow format: 100%|██████████| 1/1 [00:00<00:00, 1119.68ba/s]\n",
+      "Uploading the dataset shards: 100%|██████████| 1/1 [00:01<00:00, 1.36s/it]\n"
+     ]
+    },
+    {
+     "data": {
+      "text/plain": [
+       "CommitInfo(commit_url='https://huggingface.co/datasets/burtenshaw/dummy-code-quiz/commit/9fdc884bb54602cce29639e76a7cabedf79811f8', commit_message='Upload dataset', commit_description='', oid='9fdc884bb54602cce29639e76a7cabedf79811f8', pr_url=None, repo_url=RepoUrl('https://huggingface.co/datasets/burtenshaw/dummy-code-quiz', endpoint='https://huggingface.co', repo_type='dataset', repo_id='burtenshaw/dummy-code-quiz'), pr_revision=None, pr_num=None)"
+      ]
+     },
+     "execution_count": 44,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "dataset.push_to_hub(\"burtenshaw/dummy-code-quiz\", private=False)\n"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 15,
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/plain": [
+       "'/Users/ben/code/code_assignment_app/images/1.png'"
+      ]
+     },
+     "execution_count": 15,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "dataset[\"train\"][0][\"image\"]"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 3,
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stderr",
+     "output_type": "stream",
+     "text": [
+      "Generating burtenshaw split: 100%|██████████| 1/1 [00:00<00:00, 262.13 examples/s]\n"
+     ]
+    }
+   ],
+   "source": [
+    "response_ds = load_dataset(\"agents-course/dummy-code-quiz_responses\")"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 4,
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/plain": [
+       "DatasetDict({\n",
+       " burtenshaw: Dataset({\n",
+       " features: ['username', 'datetime', 'grade', 'challenge', 'submitted_code', 'correct_solution', 'is_correct'],\n",
+       " num_rows: 1\n",
+       " })\n",
+       "})"
+      ]
+     },
+     "execution_count": 4,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "response_ds"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": []
+  }
+ ],
+ "metadata": {
+  "kernelspec": {
+   "display_name": ".venv",
+   "language": "python",
+   "name": "python3"
+  },
+  "language_info": {
+   "codemirror_mode": {
+    "name": "ipython",
+    "version": 3
+   },
+   "file_extension": ".py",
+   "mimetype": "text/x-python",
+   "name": "python",
+   "nbconvert_exporter": "python",
+   "pygments_lexer": "ipython3",
+   "version": "3.11.10"
+  }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 2
+}
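The notebook above builds the quiz dataset from a local `example.json`, attaches the question screenshots by turning the `image` path column into a `datasets` Image feature, and pushes the result to the Hub. A condensed sketch of that flow, assuming the same `example.json` layout where each row's `image` field holds a local file path or null:

```python
from datasets import load_dataset, Image

# Load the raw quiz rows from JSON (challenge, solution, placeholder, context,
# assessment_criteria, and an image file path).
dataset = load_dataset("json", data_files="example.json")

# Casting the path column to the Image feature makes `datasets` decode the files,
# so the pixels travel with the rest of the data when the dataset is pushed.
dataset = dataset.cast_column("image", Image())

# Push to a dataset repo on the Hub (repo id shown as a placeholder here).
# dataset.push_to_hub("<username>/dummy-code-quiz", private=False)
```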
pyproject.toml CHANGED
@@ -5,6 +5,7 @@ description = "Add your description here"
 readme = "README.md"
 requires-python = ">=3.11"
 dependencies = [
+    "black>=25.1.0",
     "datasets>=3.2.0",
     "gradio[oauth]>=5.13.2",
     "huggingface-hub>=0.28.0",
uv.lock CHANGED
@@ -200,6 +200,34 @@ wheels = [
     { url = "https://files.pythonhosted.org/packages/e8/6a/e83a6c04f8c6014c33d97c135782a55370cf60513f8d9f99f1279c7f9c13/Authlib-1.4.1-py2.py3-none-any.whl", hash = "sha256:edc29c3f6a3e72cd9e9f45fff67fc663a2c364022eb0371c003f22d5405915c1", size = 225610 },
 ]
 
+[[package]]
+name = "black"
+version = "25.1.0"
+source = { registry = "https://pypi.org/simple" }
+dependencies = [
+    { name = "click" },
+    { name = "mypy-extensions" },
+    { name = "packaging" },
+    { name = "pathspec" },
+    { name = "platformdirs" },
+]
+sdist = { url = "https://files.pythonhosted.org/packages/94/49/26a7b0f3f35da4b5a65f081943b7bcd22d7002f5f0fb8098ec1ff21cb6ef/black-25.1.0.tar.gz", hash = "sha256:33496d5cd1222ad73391352b4ae8da15253c5de89b93a80b3e2c8d9a19ec2666", size = 649449 }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/7e/4f/87f596aca05c3ce5b94b8663dbfe242a12843caaa82dd3f85f1ffdc3f177/black-25.1.0-cp311-cp311-macosx_10_9_x86_64.whl", hash = "sha256:a39337598244de4bae26475f77dda852ea00a93bd4c728e09eacd827ec929df0", size = 1614372 },
+    { url = "https://files.pythonhosted.org/packages/e7/d0/2c34c36190b741c59c901e56ab7f6e54dad8df05a6272a9747ecef7c6036/black-25.1.0-cp311-cp311-macosx_11_0_arm64.whl", hash = "sha256:96c1c7cd856bba8e20094e36e0f948718dc688dba4a9d78c3adde52b9e6c2299", size = 1442865 },
+    { url = "https://files.pythonhosted.org/packages/21/d4/7518c72262468430ead45cf22bd86c883a6448b9eb43672765d69a8f1248/black-25.1.0-cp311-cp311-manylinux_2_17_x86_64.manylinux2014_x86_64.manylinux_2_28_x86_64.whl", hash = "sha256:bce2e264d59c91e52d8000d507eb20a9aca4a778731a08cfff7e5ac4a4bb7096", size = 1749699 },
+    { url = "https://files.pythonhosted.org/packages/58/db/4f5beb989b547f79096e035c4981ceb36ac2b552d0ac5f2620e941501c99/black-25.1.0-cp311-cp311-win_amd64.whl", hash = "sha256:172b1dbff09f86ce6f4eb8edf9dede08b1fce58ba194c87d7a4f1a5aa2f5b3c2", size = 1428028 },
+    { url = "https://files.pythonhosted.org/packages/83/71/3fe4741df7adf015ad8dfa082dd36c94ca86bb21f25608eb247b4afb15b2/black-25.1.0-cp312-cp312-macosx_10_13_x86_64.whl", hash = "sha256:4b60580e829091e6f9238c848ea6750efed72140b91b048770b64e74fe04908b", size = 1650988 },
+    { url = "https://files.pythonhosted.org/packages/13/f3/89aac8a83d73937ccd39bbe8fc6ac8860c11cfa0af5b1c96d081facac844/black-25.1.0-cp312-cp312-macosx_11_0_arm64.whl", hash = "sha256:1e2978f6df243b155ef5fa7e558a43037c3079093ed5d10fd84c43900f2d8ecc", size = 1453985 },
+    { url = "https://files.pythonhosted.org/packages/6f/22/b99efca33f1f3a1d2552c714b1e1b5ae92efac6c43e790ad539a163d1754/black-25.1.0-cp312-cp312-manylinux_2_17_x86_64.manylinux2014_x86_64.manylinux_2_28_x86_64.whl", hash = "sha256:3b48735872ec535027d979e8dcb20bf4f70b5ac75a8ea99f127c106a7d7aba9f", size = 1783816 },
+    { url = "https://files.pythonhosted.org/packages/18/7e/a27c3ad3822b6f2e0e00d63d58ff6299a99a5b3aee69fa77cd4b0076b261/black-25.1.0-cp312-cp312-win_amd64.whl", hash = "sha256:ea0213189960bda9cf99be5b8c8ce66bb054af5e9e861249cd23471bd7b0b3ba", size = 1440860 },
+    { url = "https://files.pythonhosted.org/packages/98/87/0edf98916640efa5d0696e1abb0a8357b52e69e82322628f25bf14d263d1/black-25.1.0-cp313-cp313-macosx_10_13_x86_64.whl", hash = "sha256:8f0b18a02996a836cc9c9c78e5babec10930862827b1b724ddfe98ccf2f2fe4f", size = 1650673 },
+    { url = "https://files.pythonhosted.org/packages/52/e5/f7bf17207cf87fa6e9b676576749c6b6ed0d70f179a3d812c997870291c3/black-25.1.0-cp313-cp313-macosx_11_0_arm64.whl", hash = "sha256:afebb7098bfbc70037a053b91ae8437c3857482d3a690fefc03e9ff7aa9a5fd3", size = 1453190 },
+    { url = "https://files.pythonhosted.org/packages/e3/ee/adda3d46d4a9120772fae6de454c8495603c37c4c3b9c60f25b1ab6401fe/black-25.1.0-cp313-cp313-manylinux_2_17_x86_64.manylinux2014_x86_64.manylinux_2_28_x86_64.whl", hash = "sha256:030b9759066a4ee5e5aca28c3c77f9c64789cdd4de8ac1df642c40b708be6171", size = 1782926 },
+    { url = "https://files.pythonhosted.org/packages/cc/64/94eb5f45dcb997d2082f097a3944cfc7fe87e071907f677e80788a2d7b7a/black-25.1.0-cp313-cp313-win_amd64.whl", hash = "sha256:a22f402b410566e2d1c950708c77ebf5ebd5d0d88a6a2e87c86d9fb48afa0d18", size = 1442613 },
+    { url = "https://files.pythonhosted.org/packages/09/71/54e999902aed72baf26bca0d50781b01838251a462612966e9fc4891eadd/black-25.1.0-py3-none-any.whl", hash = "sha256:95e8176dae143ba9097f351d174fdaf0ccd29efb414b362ae3fd72bf0f710717", size = 207646 },
+]
+
 [[package]]
 name = "certifi"
 version = "2024.12.14"
@@ -319,6 +347,7 @@ name = "code-assignment-app"
 version = "0.1.0"
 source = { virtual = "." }
 dependencies = [
+    { name = "black" },
     { name = "datasets" },
     { name = "gradio", extra = ["oauth"] },
     { name = "huggingface-hub" },
@@ -327,6 +356,7 @@ dependencies = [
 
 [package.metadata]
 requires-dist = [
+    { name = "black", specifier = ">=25.1.0" },
     { name = "datasets", specifier = ">=3.2.0" },
     { name = "gradio", extras = ["oauth"], specifier = ">=5.13.2" },
     { name = "huggingface-hub", specifier = ">=0.28.0" },
@@ -922,6 +952,15 @@ wheels = [
     { url = "https://files.pythonhosted.org/packages/da/d9/f7f9379981e39b8c2511c9e0326d212accacb82f12fbfdc1aa2ce2a7b2b6/multiprocess-0.70.16-py39-none-any.whl", hash = "sha256:a0bafd3ae1b732eac64be2e72038231c1ba97724b60b09400d68f229fcc2fbf3", size = 133351 },
 ]
 
+[[package]]
+name = "mypy-extensions"
+version = "1.0.0"
+source = { registry = "https://pypi.org/simple" }
+sdist = { url = "https://files.pythonhosted.org/packages/98/a4/1ab47638b92648243faf97a5aeb6ea83059cc3624972ab6b8d2316078d3f/mypy_extensions-1.0.0.tar.gz", hash = "sha256:75dbf8955dc00442a438fc4d0666508a9a97b6bd41aa2f0ffe9d2f2725af0782", size = 4433 }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/2a/e2/5d3f6ada4297caebe1a2add3b126fe800c96f56dbe5d1988a2cbe0b267aa/mypy_extensions-1.0.0-py3-none-any.whl", hash = "sha256:4392f6c0eb8a5668a69e23d168ffa70f0be9ccfd32b5cc2d26a34ae5b844552d", size = 4695 },
+]
+
 [[package]]
 name = "nest-asyncio"
 version = "1.6.0"
@@ -1085,6 +1124,15 @@ wheels = [
     { url = "https://files.pythonhosted.org/packages/c6/ac/dac4a63f978e4dcb3c6d3a78c4d8e0192a113d288502a1216950c41b1027/parso-0.8.4-py2.py3-none-any.whl", hash = "sha256:a418670a20291dacd2dddc80c377c5c3791378ee1e8d12bffc35420643d43f18", size = 103650 },
 ]
 
+[[package]]
+name = "pathspec"
+version = "0.12.1"
+source = { registry = "https://pypi.org/simple" }
+sdist = { url = "https://files.pythonhosted.org/packages/ca/bc/f35b8446f4531a7cb215605d100cd88b7ac6f44ab3fc94870c120ab3adbf/pathspec-0.12.1.tar.gz", hash = "sha256:a482d51503a1ab33b1c67a6c3813a26953dbdc71c31dacaef9a838c4e29f5712", size = 51043 }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/cc/20/ff623b09d963f88bfde16306a54e12ee5ea43e9b597108672ff3a408aad6/pathspec-0.12.1-py3-none-any.whl", hash = "sha256:a0d503e138a4c123b27490a4f7beda6a01c6f288df0e4a8b79c7eb0dc7b4cc08", size = 31191 },
+]
+
 [[package]]
 name = "pexpect"
 version = "4.9.0"