Open-LLM-results-pr

Runtime error

App Files Community

Weyaxi committed on Jan 12, 2024

Commit

250d5a2

verified ·

1 Parent(s): 52101ad

delete dataset short name

Browse files

Files changed (1) hide show

app.py +2 -8

app.py CHANGED Viewed

@@ -48,7 +48,6 @@ def get_task_summary(results):
       "ARC":
           {"dataset_type":"ai2_arc",
           "dataset_name":"AI2 Reasoning Challenge (25-Shot)",
-          "dataset_short_name": "ARC (25-shot)",
           "metric_type":"acc_norm",
           "metric_value":results["ARC"],
           "dataset_config":"ARC-Challenge",
@@ -60,7 +59,6 @@ def get_task_summary(results):
       "HellaSwag":
           {"dataset_type":"hellaswag",
           "dataset_name":"HellaSwag (10-Shot)",
-          "dataset_short_name": "HellaSwag (10-shot)",
           "metric_type":"acc_norm",
           "metric_value":results["HellaSwag"],
           "dataset_config":None,
@@ -73,7 +71,6 @@ def get_task_summary(results):
       {
           "dataset_type":"cais/mmlu",
           "dataset_name":"MMLU (5-Shot)",
-          "dataset_short_name": "MMLU (5-Shot)",
           "metric_type":"acc",
           "metric_value":results["MMLU"],
           "dataset_config":"all",
@@ -86,7 +83,6 @@ def get_task_summary(results):
       {
           "dataset_type":"truthful_qa",
           "dataset_name":"TruthfulQA (0-shot)",
-          "dataset_short_name": "TruthfulQA (0-shot)",
           "metric_type":"mc2",
           "metric_value":results["TruthfulQA"],
           "dataset_config":"multiple_choice",
@@ -99,7 +95,6 @@ def get_task_summary(results):
       {
           "dataset_type":"winogrande",
           "dataset_name":"Winogrande (5-shot)",
-          "dataset_short_name": "Winogrande (5-shot)",
           "metric_type":"acc",
           "metric_value":results["Winogrande"],
           "dataset_config":"winogrande_xl",
@@ -111,7 +106,6 @@ def get_task_summary(results):
       {
           "dataset_type":"gsm8k",
           "dataset_name":"GSM8k (5-shot)",
-          "dataset_short_name": "GSM8k (5-shot)",
           "metric_type":"acc",
           "metric_value":results["GSM8K"],
           "dataset_config":"main",
@@ -204,9 +198,9 @@ The leaderboard's backend mainly runs on the [Hugging Face Hub API](https://hugg
 ## 🤝 Acknowledgements
-- Special thanks to Clémentine Fourrier (clefourrier) for her help and contributions to the code.
-- Special thanks to [Lucain Pouget (Wauplin)](https://huggingface.co/docs/huggingface_hub/v0.5.1/en/package_reference/hf_api) for assisting with the [Hugging Face Hub API](https://huggingface.co/docs/huggingface_hub/v0.5.1/en/package_reference/hf_api).
 """
 demo = gr.Interface(title=gradio_title, description=gradio_desc, fn=commit, inputs=["text", "text"], outputs="text")

       "ARC":
           {"dataset_type":"ai2_arc",
           "dataset_name":"AI2 Reasoning Challenge (25-Shot)",
           "metric_type":"acc_norm",
           "metric_value":results["ARC"],
           "dataset_config":"ARC-Challenge",
       "HellaSwag":
           {"dataset_type":"hellaswag",
           "dataset_name":"HellaSwag (10-Shot)",
           "metric_type":"acc_norm",
           "metric_value":results["HellaSwag"],
           "dataset_config":None,
       {
           "dataset_type":"cais/mmlu",
           "dataset_name":"MMLU (5-Shot)",
           "metric_type":"acc",
           "metric_value":results["MMLU"],
           "dataset_config":"all",
       {
           "dataset_type":"truthful_qa",
           "dataset_name":"TruthfulQA (0-shot)",
           "metric_type":"mc2",
           "metric_value":results["TruthfulQA"],
           "dataset_config":"multiple_choice",
       {
           "dataset_type":"winogrande",
           "dataset_name":"Winogrande (5-shot)",
           "metric_type":"acc",
           "metric_value":results["Winogrande"],
           "dataset_config":"winogrande_xl",
       {
           "dataset_type":"gsm8k",
           "dataset_name":"GSM8k (5-shot)",
           "metric_type":"acc",
           "metric_value":results["GSM8K"],
           "dataset_config":"main",
 ## 🤝 Acknowledgements
+- Special thanks to [Clémentine Fourrier (clefourrier)](https://huggingface.co/clefourrier) for her help and contributions to the code.
+- Special thanks to [Lucain Pouget (Wauplin)](https://huggingface.co/Wauplin) for assisting with the [Hugging Face Hub API](https://huggingface.co/docs/huggingface_hub/v0.5.1/en/package_reference/hf_api).
 """
 demo = gr.Interface(title=gradio_title, description=gradio_desc, fn=commit, inputs=["text", "text"], outputs="text")