Spaces:

galileo-ai
/

agent-leaderboard

Running on CPU Upgrade

App Files Files Community

Pratik Bhavsar committed on Jul 16

Commit

fe3dcd7

1 Parent(s): 267bc29

improved filter

Browse files

Files changed (1) hide show

tabs/leaderboard_v2.py +61 -23

tabs/leaderboard_v2.py CHANGED Viewed

@@ -76,6 +76,30 @@ def get_type_badge(model_type):
     """
 def get_score_bar(score):
     """Generate HTML for score bar with gradient styling"""
     width = score * 100
@@ -226,6 +250,7 @@ def create_leaderboard_v2_tab():
                         <th style="width: 80px;">Rank</th>
                         <th>Model</th>
                         <th style="width: 120px;">Type</th>
                         <th>Vendor</th>
                         <th style="width: 200px;">Avg Action Completion</th>
                         <th style="width: 200px;">Avg Tool Selection Quality</th>
@@ -245,6 +270,7 @@ def create_leaderboard_v2_tab():
                     <td>{get_rank_badge(rank)}</td>
                     <td class="model-name">{row['Model']}</td>
                     <td>{get_type_badge(row['Model Type'])}</td>
                     <td>{row['Vendor']}</td>
             """
@@ -404,7 +430,7 @@ def create_leaderboard_v2_tab():
         if reasoning_filter != "All":
             if reasoning_filter == "Reasoning":
                 filtered_df = filtered_df[filtered_df['Output Type'] == 'Reasoning']
-            elif reasoning_filter == "Non-Reasoning":
                 filtered_df = filtered_df[filtered_df['Output Type'] == 'Normal']
         # Map display name to actual column name using shared mapping
@@ -667,25 +693,37 @@ def create_leaderboard_v2_tab():
     }
     /* Column-specific widths */
-    .dataframe th:nth-child(1), /* Model */
-    .dataframe td:nth-child(1) {
         min-width: 200px !important;
         max-width: 250px !important;
     }
-    .dataframe th:nth-child(2), /* Vendor */
-    .dataframe td:nth-child(2) {
         min-width: 100px !important;
         max-width: 120px !important;
     }
     /* Numeric columns - smaller width */
-    .dataframe th:nth-child(3), .dataframe th:nth-child(4),
-    .dataframe th:nth-child(5), .dataframe th:nth-child(6),
-    .dataframe th:nth-child(7),
-    .dataframe td:nth-child(3), .dataframe td:nth-child(4),
-    .dataframe td:nth-child(5), .dataframe td:nth-child(6),
-    .dataframe td:nth-child(7) {
         min-width: 80px !important;
         max-width: 100px !important;
         text-align: center !important;
@@ -705,14 +743,14 @@ def create_leaderboard_v2_tab():
     }
     /* Model names - keep consistent color on hover */
-    .dataframe td:first-child {
         font-weight: 500 !important;
         color: var(--accent-primary) !important;
         transition: all 0.2s ease !important;
     }
     /* Keep model name color consistent to emphasize row highlight */
-    .dataframe tr:hover td:first-child {
         color: var(--accent-secondary) !important;
     }
@@ -768,10 +806,10 @@ def create_leaderboard_v2_tab():
     /* Responsive design for smaller screens */
     @media (max-width: 1200px) {
-        .dataframe th:nth-child(8), /* Access column */
-        .dataframe td:nth-child(8),
-        .dataframe th:nth-child(9), /* Type column */
-        .dataframe td:nth-child(9) {
             display: none !important;
         }
     }
@@ -787,8 +825,8 @@ def create_leaderboard_v2_tab():
             padding: 8px 4px !important;
         }
-        .dataframe th:nth-child(1),
-        .dataframe td:nth-child(1) {
             min-width: 150px !important;
             max-width: 200px !important;
         }
@@ -1918,7 +1956,7 @@ def create_leaderboard_v2_tab():
         with gr.Column(scale=1):
             reasoning_filter = gr.Radio(
-                choices=["All", "Reasoning", "Non-Reasoning"],
                 value="All",
                 label="🧠 Output Type",
                 elem_classes=["compact-radio"]
@@ -2171,7 +2209,7 @@ def create_leaderboard_v2_tab():
         if reasoning_filter != "All":
             if reasoning_filter == "Reasoning":
                 filtered_df = filtered_df[filtered_df['Output Type'] == 'Reasoning']
-            elif reasoning_filter == "Non-Reasoning":
                 filtered_df = filtered_df[filtered_df['Output Type'] == 'Normal']
         # Map display name to actual column name using shared mapping
@@ -2252,7 +2290,7 @@ def create_leaderboard_v2_tab():
         if reasoning_filter != "All":
             if reasoning_filter == "Reasoning":
                 filtered_df = filtered_df[filtered_df['Output Type'] == 'Reasoning']
-            elif reasoning_filter == "Non-Reasoning":
                 filtered_df = filtered_df[filtered_df['Output Type'] == 'Normal']
         # Map display name to actual column name using shared mapping
@@ -2560,7 +2598,7 @@ def create_leaderboard_v2_tab():
         if reasoning_filter != "All":
             if reasoning_filter == "Reasoning":
                 filtered_df = filtered_df[filtered_df['Output Type'] == 'Reasoning']
-            elif reasoning_filter == "Non-Reasoning":
                 filtered_df = filtered_df[filtered_df['Output Type'] == 'Normal']
         return filtered_df

     """
+def get_output_type_badge(output_type):
+    """Generate HTML for output type badge"""
+    if output_type == "Reasoning":
+        bg_color = "#9333ea"  # Purple for reasoning
+    else:
+        bg_color = "#6b7280"  # Gray for normal
+    return f"""
+        <div style="
+            display: inline-flex;
+            align-items: center;
+            gap: 4px;
+            padding: 4px 8px;
+            background: {bg_color};
+            color: white;
+            border-radius: 4px;
+            font-size: 0.85em;
+            font-weight: 500;
+        ">
+            {output_type}
+        </div>
+    """
 def get_score_bar(score):
     """Generate HTML for score bar with gradient styling"""
     width = score * 100
                         <th style="width: 80px;">Rank</th>
                         <th>Model</th>
                         <th style="width: 120px;">Type</th>
+                        <th style="width: 120px;">Output Type</th>
                         <th>Vendor</th>
                         <th style="width: 200px;">Avg Action Completion</th>
                         <th style="width: 200px;">Avg Tool Selection Quality</th>
                     <td>{get_rank_badge(rank)}</td>
                     <td class="model-name">{row['Model']}</td>
                     <td>{get_type_badge(row['Model Type'])}</td>
+                    <td>{get_output_type_badge(row.get('Output Type', 'Normal'))}</td>
                     <td>{row['Vendor']}</td>
             """
         if reasoning_filter != "All":
             if reasoning_filter == "Reasoning":
                 filtered_df = filtered_df[filtered_df['Output Type'] == 'Reasoning']
+            elif reasoning_filter == "Normal":
                 filtered_df = filtered_df[filtered_df['Output Type'] == 'Normal']
         # Map display name to actual column name using shared mapping
     }
     /* Column-specific widths */
+    .dataframe th:nth-child(2), /* Model */
+    .dataframe td:nth-child(2) {
         min-width: 200px !important;
         max-width: 250px !important;
     }
+    .dataframe th:nth-child(3), /* Model Type */
+    .dataframe td:nth-child(3) {
+        min-width: 100px !important;
+        max-width: 120px !important;
+    }
+    .dataframe th:nth-child(4), /* Output Type */
+    .dataframe td:nth-child(4) {
+        min-width: 100px !important;
+        max-width: 120px !important;
+    }
+    .dataframe th:nth-child(5), /* Vendor */
+    .dataframe td:nth-child(5) {
         min-width: 100px !important;
         max-width: 120px !important;
     }
     /* Numeric columns - smaller width */
+    .dataframe th:nth-child(6), .dataframe th:nth-child(7),
+    .dataframe th:nth-child(8), .dataframe th:nth-child(9),
+    .dataframe th:nth-child(10),
+    .dataframe td:nth-child(6), .dataframe td:nth-child(7),
+    .dataframe td:nth-child(8), .dataframe td:nth-child(9),
+    .dataframe td:nth-child(10) {
         min-width: 80px !important;
         max-width: 100px !important;
         text-align: center !important;
     }
     /* Model names - keep consistent color on hover */
+    .dataframe td:nth-child(2) {
         font-weight: 500 !important;
         color: var(--accent-primary) !important;
         transition: all 0.2s ease !important;
     }
     /* Keep model name color consistent to emphasize row highlight */
+    .dataframe tr:hover td:nth-child(2) {
         color: var(--accent-secondary) !important;
     }
     /* Responsive design for smaller screens */
     @media (max-width: 1200px) {
+        .dataframe th:nth-child(9), /* Vendor column */
+        .dataframe td:nth-child(9),
+        .dataframe th:nth-child(10), /* Last columns */
+        .dataframe td:nth-child(10) {
             display: none !important;
         }
     }
             padding: 8px 4px !important;
         }
+        .dataframe th:nth-child(2),
+        .dataframe td:nth-child(2) {
             min-width: 150px !important;
             max-width: 200px !important;
         }
         with gr.Column(scale=1):
             reasoning_filter = gr.Radio(
+                choices=["All", "Reasoning", "Normal"],
                 value="All",
                 label="🧠 Output Type",
                 elem_classes=["compact-radio"]
         if reasoning_filter != "All":
             if reasoning_filter == "Reasoning":
                 filtered_df = filtered_df[filtered_df['Output Type'] == 'Reasoning']
+            elif reasoning_filter == "Normal":
                 filtered_df = filtered_df[filtered_df['Output Type'] == 'Normal']
         # Map display name to actual column name using shared mapping
         if reasoning_filter != "All":
             if reasoning_filter == "Reasoning":
                 filtered_df = filtered_df[filtered_df['Output Type'] == 'Reasoning']
+            elif reasoning_filter == "Normal":
                 filtered_df = filtered_df[filtered_df['Output Type'] == 'Normal']
         # Map display name to actual column name using shared mapping
         if reasoning_filter != "All":
             if reasoning_filter == "Reasoning":
                 filtered_df = filtered_df[filtered_df['Output Type'] == 'Reasoning']
+            elif reasoning_filter == "Normal":
                 filtered_df = filtered_df[filtered_df['Output Type'] == 'Normal']
         return filtered_df