Clémentine
		
	commited on
		
		
					Commit 
							
							·
						
						97b27da
	
1
								Parent(s):
							
							256c5d3
								
Small fix - we do not want to display models where the MMLU is old with models where the MMLU is new - however, since version is displayed in the results, we keep the files
Browse files
    	
        src/auto_leaderboard/load_results.py
    CHANGED
    
    | @@ -55,6 +55,10 @@ class EvalResult: | |
| 55 | 
             
            def parse_eval_result(json_filepath: str) -> Tuple[str, list[dict]]:
         | 
| 56 | 
             
                with open(json_filepath) as fp:
         | 
| 57 | 
             
                    data = json.load(fp)
         | 
|  | |
|  | |
|  | |
|  | |
| 58 |  | 
| 59 | 
             
                config = data["config"]
         | 
| 60 | 
             
                model = config.get("model_name", None)
         | 
|  | |
| 55 | 
             
            def parse_eval_result(json_filepath: str) -> Tuple[str, list[dict]]:
         | 
| 56 | 
             
                with open(json_filepath) as fp:
         | 
| 57 | 
             
                    data = json.load(fp)
         | 
| 58 | 
            +
                
         | 
| 59 | 
            +
                for mmlu_k in ["harness|hendrycksTest-abstract_algebra|5", "hendrycksTest-abstract_algebra"]:
         | 
| 60 | 
            +
                    if mmlu_k in data["versions"] and data["versions"][mmlu_k] == 0:
         | 
| 61 | 
            +
                        return None, [] # we skip models with the wrong version 
         | 
| 62 |  | 
| 63 | 
             
                config = data["config"]
         | 
| 64 | 
             
                model = config.get("model_name", None)
         | 
