Spaces:

CIIRC-NLP
/

czechbench_leaderboard

Runtime error

Clémentine committed on Jul 17, 2023

Commit

97b27da

1 Parent(s): 256c5d3

Small fix: we do not want to display models evaluated with the old MMLU version alongside models evaluated with the new MMLU version. However, since the version is displayed in the results, we keep the files.

Files changed (1) hide show

src/auto_leaderboard/load_results.py CHANGED Viewed

@@ -55,6 +55,10 @@ class EvalResult:
 def parse_eval_result(json_filepath: str) -> Tuple[str, list[dict]]:
     with open(json_filepath) as fp:
         data = json.load(fp)
     config = data["config"]
     model = config.get("model_name", None)

 def parse_eval_result(json_filepath: str) -> Tuple[str, list[dict]]:
     with open(json_filepath) as fp:
         data = json.load(fp)
+    for mmlu_k in ["harness|hendrycksTest-abstract_algebra|5", "hendrycksTest-abstract_algebra"]:
+        if mmlu_k in data["versions"] and data["versions"][mmlu_k] == 0:
+            return None, [] # we skip models with the wrong version
     config = data["config"]
     model = config.get("model_name", None)