IPA-Transcription-EN

Running

App Files Files Community

arunasrivastava commited on Dec 5, 2024

Commit

3b95ded

1 Parent(s): eaaacf5

changed coloring on frontend

Browse files

Files changed (2) hide show

__pycache__/app.cpython-310.pyc +0 -0
app.py +90 -242

__pycache__/app.cpython-310.pyc ADDED Viewed

Binary file (2.6 kB). View file

app.py CHANGED Viewed

@@ -1,281 +1,129 @@
 import gradio as gr
 import pandas as pd
-import json
 from pathlib import Path
 from datetime import datetime, timezone
-import uuid
 LAST_UPDATED = "Dec 4th 2024"
-QUEUE_DIR = Path("/Users/arunasrivastava/Koel/IPA-Leaderboard/IPA-Transcription-EN-queue/queue")
-APP_DIR = Path("./")
-# Modified column names for phonemic transcription metrics
-column_names = {
-    "MODEL": "Model",
-    "AVG_PER": "Average PER ⬇️",
-    "AVG_PWED": "Average PWED ⬇️",
-    "GITHUB_URL": "GitHub",
-    "DATE": "Submission Date"
-}
-def load_json_file(file_path: Path, default=None):
-    """Safely load a JSON file or return default if file doesn't exist"""
-    if default is None:
-        default = []
-    if not file_path.exists():
-        return default
-    try:
-        with open(file_path, 'r') as f:
-            return json.load(f)
-    except json.JSONDecodeError:
-        return default
-def save_json_file(file_path: Path, data):
-    """Safely save data to a JSON file"""
-    file_path.parent.mkdir(parents=True, exist_ok=True)
-    with open(file_path, 'w') as f:
-        json.dump(data, f, indent=2, ensure_ascii=False)
 def load_leaderboard_data():
-    """Load and parse leaderboard data"""
-    leaderboard_path = QUEUE_DIR / "leaderboard.json"
-    data = load_json_file(leaderboard_path)
-    return pd.DataFrame(data) if data else pd.DataFrame()
 def format_leaderboard_df(df):
-    """Format leaderboard dataframe for display"""
     if df.empty:
         return df
-    # Select and rename only the columns we want to display
     display_df = pd.DataFrame({
-        "MODEL": df["model"],
-        "AVG_PER": df["average_per"],
-        "AVG_PWED": df["average_pwed"],
-        "GITHUB_URL": df["github_url"],
-        "DATE": pd.to_datetime(df["submission_date"]).dt.strftime("%Y-%m-%d")
     })
-    # Format numeric columns
-    display_df["AVG_PER"] = display_df["AVG_PER"].apply(lambda x: f"{x:.4f}")
-    display_df["AVG_PWED"] = display_df["AVG_PWED"].apply(lambda x: f"{x:.4f}")
-    # Make GitHub URLs clickable
-    display_df["GITHUB_URL"] = display_df["GITHUB_URL"].apply(
-        lambda x: f'<a href="{x}" target="_blank">Repository</a>' if x else "N/A"
-    )
-    # Sort by PER (ascending)
-    display_df.sort_values(by="AVG_PER", inplace=True)
-    return display_df
-def request_evaluation(model_name, submission_name, github_url, subset="test", max_samples=None):
-    """Submit new evaluation request"""
     if not model_name or not submission_name:
-        return gr.Markdown("⚠️ Please provide both model name and submission name.")
     try:
-        # Ensure queue directory exists
-        QUEUE_DIR.mkdir(parents=True, exist_ok=True)
-        # Load existing tasks
-        tasks_file = QUEUE_DIR / "tasks.json"
-        tasks = load_json_file(tasks_file)
-        # Create new task
-        new_task = {
-            "id": str(uuid.uuid4()),
-            "transcription_model": model_name,
-            "subset": subset,
-            "max_samples": max_samples,
-            "submission_name": submission_name,
-            "github_url": github_url or "",
-            "status": "queued",
-            "submitted_at": datetime.now(timezone.utc).isoformat()
-        }
-        # Add new task to existing tasks
-        tasks.append(new_task)
-        # Save updated tasks
-        save_json_file(tasks_file, tasks)
-        return gr.Markdown("✅ Evaluation request submitted successfully! Your results will appear on the leaderboard once processing is complete.")
-    except Exception as e:
-        return gr.Markdown(f"❌ Error submitting request: {str(e)}")
-def load_results_for_model(model_name):
-    """Load detailed results for a specific model"""
-    results_path = QUEUE_DIR / "results.json"
-    results = load_json_file(results_path)
-    # Filter results for the specific model
-    model_results = [r for r in results if r["model"] == model_name]
-    if not model_results:
-        return None
-    # Get the most recent result
-    latest_result = max(model_results, key=lambda x: x["timestamp"])
-    return latest_result
 def create_html_table(df):
-    """Create HTML table with dark theme styling"""
-    if df.empty:
-        return "<p>No data available</p>"
-    html = """
-    <style>
-    table {
-        width: 100%;
-        border-collapse: collapse;
-        color: white;
-        background-color: #1a1a1a;
-    }
-    th, td {
-        padding: 8px;
-        text-align: left;
-        border: 1px solid #333;
-    }
-    th {
-        background-color: #2a2a2a;
-        color: white;
     }
-    tr:nth-child(even) {
-        background-color: #252525;
     }
-    tr:hover {
-        background-color: #303030;
     }
-    a {
-        color: #6ea8fe;
-        text-decoration: none;
     }
-    a:hover {
-        text-decoration: underline;
     }
-    </style>
-    <table>
-    <thead>
-        <tr>
-    """
-    # Add headers
-    for header in column_names.values():
-        html += f"<th>{header}</th>"
-    html += "</tr></thead><tbody>"
-    # Add rows
-    for _, row in df.iterrows():
-        html += "<tr>"
-        for col in df.columns:
-            if col == "GITHUB_URL":
-                html += f"<td>{row[col]}</td>"  # URL is already formatted as HTML
-            else:
-                html += f"<td>{row[col]}</td>"
-        html += "</tr>"
-    html += "</tbody></table>"
-    return html
-# Create Gradio interface
-with gr.Blocks() as demo:
     gr.Markdown("# 🎯 Phonemic Transcription Model Evaluation Leaderboard")
-    gr.Markdown("""
-        Compare the performance of different phonemic transcription models on speech-to-IPA transcription tasks for English.
-        **Metrics:**
-        - **PER (Phoneme Error Rate)**: Measures the edit distance between predicted and ground truth phonemes (lower is better)
-        - **PWED (Phoneme Weighted Edit Distance)**: Measures a weighted difference in phonemes using phonemic features (lower is better)
-        **Datasets:**
-        - **[TIMIT](https://www.kaggle.com/datasets/mfekadu/darpa-timit-acousticphonetic-continuous-speech)**: A phonemic transcription dataset for English speech recognition
-        To learn more about the evaluation metrics, check out our blog post [here](https://huggingface.co/spaces/evaluate-metric/wer).
-    """)
-    with gr.Tabs() as tabs:
         with gr.TabItem("🏆 Leaderboard"):
-            leaderboard_df = load_leaderboard_data()
-            formatted_df = format_leaderboard_df(leaderboard_df)
-            leaderboard_table = gr.HTML(
-                value=create_html_table(formatted_df)
-            )
-            refresh_btn = gr.Button("🔄 Refresh Leaderboard")
             refresh_btn.click(
-                lambda: gr.HTML(value=create_html_table(format_leaderboard_df(load_leaderboard_data())))
             )
-        with gr.TabItem("📝 Submit Model"):
-            with gr.Column():
-                model_input = gr.Textbox(
-                    label="Model Name",
-                    placeholder="facebook/wav2vec2-lv-60-espeak-cv-ft",
-                    info="Enter the Hugging Face model ID"
-                )
-                submission_name = gr.Textbox(
-                    label="Submission Name",
-                    placeholder="My Awesome Model v1.0",
-                    info="Give your submission a descriptive name"
-                )
-                github_url = gr.Textbox(
-                    label="GitHub Repository URL (optional)",
-                    placeholder="https://github.com/username/repo",
-                    info="Link to your model's code repository"
-                )
-                submit_btn = gr.Button("🚀 Submit for Evaluation")
-                result_text = gr.Markdown()
-                def submit_and_clear(model_name, submission_name, github_url):
-                    result = request_evaluation(model_name, submission_name, github_url)
-                    # If submission was successful, clear the form
-                    if "✅" in result.value:
-                        return {
-                            model_input: "",
-                            submission_name: "",
-                            github_url: "",
-                            result_text: result
-                        }
-                    # If there was an error, keep the form data and show error
-                    return {
-                        model_input: model_name,
-                        submission_name: submission_name,
-                        github_url: github_url,
-                        result_text: result
-                    }
-                submit_btn.click(
-                    submit_and_clear,
-                    inputs=[model_input, submission_name, github_url],
-                    outputs=[model_input, submission_name, github_url, result_text]
-                )
-        with gr.TabItem("ℹ️ Detailed Results"):
-            model_selector = gr.Textbox(
-                label="Enter Model Name to View Details",
-                placeholder="facebook/wav2vec2-lv-60-espeak-cv-ft"
-            )
-            view_btn = gr.Button("View Results")
-            results_json = gr.JSON(label="Detailed Results")
-            def show_model_results(model_name):
-                results = load_results_for_model(model_name)
-                return results or {"error": "No results found for this model"}
-            view_btn.click(
-                show_model_results,
-                inputs=[model_selector],
-                outputs=[results_json]
             )
-    gr.Markdown(f"Last updated: {LAST_UPDATED}")
 if __name__ == "__main__":
     demo.launch()

 import gradio as gr
 import pandas as pd
+import requests
 from pathlib import Path
 from datetime import datetime, timezone
+import time
+import logging
+logging.basicConfig(level=logging.INFO)
+BACKEND_URL = "http://127.0.0.1:8000"
 LAST_UPDATED = "Dec 4th 2024"
 def load_leaderboard_data():
+    try:
+        response = requests.get(f"{BACKEND_URL}/leaderboard")
+        response.raise_for_status()
+        return pd.DataFrame(response.json())
+    except requests.RequestException as e:
+        logging.error(f"Error loading leaderboard: {e}")
+        return pd.DataFrame()
 def format_leaderboard_df(df):
     if df.empty:
         return df
     display_df = pd.DataFrame({
+        "Model": df["model"],
+        "Average PER ⬇️": df["average_per"].apply(lambda x: f"{x:.4f}"),
+        "Average PWED ⬇️": df["average_pwed"].apply(lambda x: f"{x:.4f}"),
+        "GitHub": df["github_url"].apply(lambda x: f'<a href="{x}" target="_blank">Repository</a>' if x else "N/A"),
+        "Submission Date": pd.to_datetime(df["submission_date"]).dt.strftime("%Y-%m-%d")
     })
+    return display_df.sort_values("Average PER ⬇️")
+def submit_evaluation(model_name, submission_name, github_url):
     if not model_name or not submission_name:
+        return "⚠️ Please provide both model name and submission name."
+    request_data = {
+        "transcription_model": model_name,
+        "subset": "test",
+        "submission_name": submission_name,
+        "github_url": github_url if github_url else None
+    }
     try:
+        response = requests.post(f"{BACKEND_URL}/evaluate", json=request_data)
+        response.raise_for_status()
+        task_id = response.json()["task_id"]
+        return f"✅ Evaluation submitted successfully! Task ID: {task_id}"
+    except requests.RequestException as e:
+        return f"❌ Error: {str(e)}"
+def check_task_status(task_id):
+    if not task_id:
+        return "Please enter a task ID"
+    try:
+        response = requests.get(f"{BACKEND_URL}/tasks/{task_id}")
+        response.raise_for_status()
+        return response.json()
+    except requests.RequestException as e:
+        return f"Error checking status: {str(e)}"
 def create_html_table(df):
+    return df.to_html(escape=False, index=False, classes="styled-table")
+with gr.Blocks(css="""
+    .styled-table {
+        width: 100%;
+        border-collapse: collapse;
+        margin: 25px 0;
+        font-size: 0.9em;
+        font-family: sans-serif;
+        box-shadow: 0 0 20px rgba(0, 0, 0, 0.15);
     }
+    .styled-table thead tr {
+        background-color: #009879;
+        color: #ffffff;
+        text-align: left;
     }
+    .styled-table th,
+    .styled-table td {
+        padding: 12px 15px;
     }
+    .styled-table tbody tr {
+        border-bottom: 1px solid #dddddd;
     }
+    .styled-table tbody tr:nth-of-type(even) {
+        background-color: #000000;
     }
+""") as demo:
     gr.Markdown("# 🎯 Phonemic Transcription Model Evaluation Leaderboard")
+    with gr.Tabs():
         with gr.TabItem("🏆 Leaderboard"):
+            leaderboard_html = gr.HTML(create_html_table(format_leaderboard_df(load_leaderboard_data())))
+            refresh_btn = gr.Button("🔄 Refresh")
             refresh_btn.click(
+                lambda: create_html_table(format_leaderboard_df(load_leaderboard_data())),
+                outputs=leaderboard_html
             )
+        with gr.TabItem("📝 Submit Model"):
+            model_name = gr.Textbox(label="Model Name", placeholder="facebook/wav2vec2-lv-60-espeak-cv-ft")
+            submission_name = gr.Textbox(label="Submission Name", placeholder="My Model v1.0")
+            github_url = gr.Textbox(label="GitHub URL (optional)", placeholder="https://github.com/username/repo")
+            submit_btn = gr.Button("Submit")
+            result = gr.Textbox(label="Submission Status")
+            submit_btn.click(
+                submit_evaluation,
+                inputs=[model_name, submission_name, github_url],
+                outputs=result
+            )
+        with gr.TabItem("📊 Task Status"):
+            task_id = gr.Textbox(label="Task ID")
+            status_btn = gr.Button("Check Status")
+            status_output = gr.JSON(label="Status")
+            status_btn.click(
+                check_task_status,
+                inputs=task_id,
+                outputs=status_output
             )
 if __name__ == "__main__":
     demo.launch()