Steveeeeeeen HF Staff committed on
Commit
f8333bb
·
1 Parent(s): 2736f1e

fix csv loading

Browse files
Files changed (1) hide show
  1. app.py +23 -45
app.py CHANGED
@@ -232,55 +232,33 @@ multilingual_df = create_multilingual_dataframe()
232
  def create_longform_dataframe():
233
  """Create longform dataframe from CSV data"""
234
  if longform_csv_path is None or not longform_csv_path.exists():
235
- print("Longform CSV not found, creating sample data")
236
- # Fallback to sample data if CSV not available
237
- longform_data = []
238
- sample_models = [
239
- {"model": "openai/whisper-large-v3", "earnings21": 8.2, "mustc": 12.4, "rtfx": 2.1},
240
- {"model": "openai/whisper-large-v2", "earnings21": 9.1, "mustc": 13.8, "rtfx": 1.8},
241
- {"model": "nvidia/canary-1b", "earnings21": 7.5, "mustc": 11.2, "rtfx": 3.2},
242
- {"model": "microsoft/speecht5_asr", "earnings21": 15.3, "mustc": 18.7, "rtfx": 1.4},
243
- ]
244
-
245
- for model_data in sample_models:
246
- row = {
247
- "Model": make_clickable_model(model_data["model"]),
248
- "Average WER ⬇️": round((model_data["earnings21"] + model_data["mustc"]) / 2, 2),
249
- "RTFx ⬆️️": model_data["rtfx"] if model_data["rtfx"] > 0 else "NA",
250
- "Earnings21": model_data["earnings21"],
251
- "MustC": model_data["mustc"]
252
- }
253
- longform_data.append(row)
254
 
255
- longform_df = pd.DataFrame(longform_data)
256
- else:
257
- # Load from CSV
258
- longform_raw_df = pd.read_csv(longform_csv_path)
259
- longform_data = []
260
 
261
- for _, row_data in longform_raw_df.iterrows():
262
- model_name = row_data['model']
263
-
264
- # Get values from CSV, similar to other tabs
265
- earnings21_wer = row_data.get('earnings21_wer', -1)
266
- mustc_wer = row_data.get('mustc_wer', -1)
267
- rtfx_value = row_data.get('rtfx', 0)
268
-
269
- # Calculate average WER from available datasets
270
- available_wers = [w for w in [earnings21_wer, mustc_wer] if w != -1 and w > 0]
271
- avg_wer = round(np.mean(available_wers), 2) if available_wers else 0.0
272
-
273
- row = {
274
- "Model": make_clickable_model(model_name),
275
- "Average WER ⬇️": avg_wer,
276
- "RTFx ⬆️️": rtfx_value if rtfx_value > 0 else "NA",
277
- "Earnings21": earnings21_wer if earnings21_wer != -1 else "NA",
278
- "MustC": mustc_wer if mustc_wer != -1 else "NA"
279
- }
280
- longform_data.append(row)
281
 
282
- longform_df = pd.DataFrame(longform_data)
 
 
 
 
 
 
283
 
 
284
  longform_df = longform_df.sort_values(by='Average WER ⬇️')
285
  return longform_df
286
 
 
232
  def create_longform_dataframe():
233
  """Create longform dataframe from CSV data"""
234
  if longform_csv_path is None or not longform_csv_path.exists():
235
+ raise Exception(f"Longform CSV file {longform_csv_path} does not exist locally")
236
+
237
+ # Load from CSV
238
+ longform_raw_df = pd.read_csv(longform_csv_path)
239
+ longform_data = []
240
+
241
+ for _, row_data in longform_raw_df.iterrows():
242
+ model_name = row_data['model']
 
 
 
 
 
 
 
 
 
 
 
243
 
244
+ # Get values from CSV, similar to other tabs
245
+ earnings21_wer = row_data.get('earnings21_wer', -1)
246
+ mustc_wer = row_data.get('mustc_wer', -1)
247
+ rtfx_value = row_data.get('rtfx', 0)
 
248
 
249
+ # Calculate average WER from available datasets
250
+ available_wers = [w for w in [earnings21_wer, mustc_wer] if w != -1 and w > 0]
251
+ avg_wer = round(np.mean(available_wers), 2) if available_wers else 0.0
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
252
 
253
+ row = {
254
+ "Model": make_clickable_model(model_name),
255
+ "Average WER ⬇️": avg_wer,
256
+ "RTFx ⬆️️": rtfx_value if rtfx_value > 0 else "NA",
257
+ "Earnings21": earnings21_wer if earnings21_wer != -1 else "NA",
258
+ }
259
+ longform_data.append(row)
260
 
261
+ longform_df = pd.DataFrame(longform_data)
262
  longform_df = longform_df.sort_values(by='Average WER ⬇️')
263
  return longform_df
264