Fix some format bugs
Browse files- contamination_report.csv +8 -8
contamination_report.csv
CHANGED
|
@@ -484,7 +484,7 @@ wmt/wmt16;en-ro;GPT-3;model;;;21.0;data-based;https://arxiv.org/abs/2005.14165;1
|
|
| 484 |
wmt/wmt16;ro-en;GPT-3;model;;;21.0;data-based;https://arxiv.org/abs/2005.14165;13
|
| 485 |
facebook/anli;test_r1;GPT-3;model;;;20.0;data-based;https://arxiv.org/abs/2005.14165;13
|
| 486 |
facebook/anli;test_r2;GPT-3;model;;;18.0;data-based;https://arxiv.org/abs/2005.14165;13
|
| 487 |
-
mandarjoshi/trivia_qa
|
| 488 |
facebook/anli;test_r3;GPT-3;model;;;16.0;data-based;https://arxiv.org/abs/2005.14165;13
|
| 489 |
wmt/wmt16;fr-en;GPT-3;model;;;14.0;data-based;https://arxiv.org/abs/2005.14165;13
|
| 490 |
wmt/wmt16;en-fr;GPT-3;model;;;14.0;data-based;https://arxiv.org/abs/2005.14165;13
|
|
@@ -521,7 +521,7 @@ ibragim-bad/arc_challenge;;PaLM;model;;;24.7;data-based;https://arxiv.org/abs/22
|
|
| 521 |
winograd_wsc;;GLaM;model;;67.3;;data-based;https://arxiv.org/abs/2112.06905;13
|
| 522 |
winogrande;;GLaM;model;;;0.3;data-based;https://arxiv.org/abs/2112.06905;13
|
| 523 |
super_glue;wic;GLaM;model;;8.2;;data-based;https://arxiv.org/abs/2112.06905;13
|
| 524 |
-
super_glue;wsc;GLaM;model;;57.5
|
| 525 |
mandarjoshi/trivia_qa;;GLaM;model;;18.8;;data-based;https://arxiv.org/abs/2112.06905;13
|
| 526 |
story_cloze;;GLaM;model;;100.0;;data-based;https://arxiv.org/abs/2112.06905;13
|
| 527 |
rajpurkar/squad_v2;;GLaM;model;;94.6;;data-based;https://arxiv.org/abs/2112.06905;13
|
|
@@ -550,7 +550,7 @@ winogrande;;FLAN;model;;;0.2;data-based;https://arxiv.org/abs/2109.01652;13
|
|
| 550 |
mandarjoshi/trivia_qa;;FLAN;model;;22.8;;data-based;https://arxiv.org/abs/2109.01652;13
|
| 551 |
story_cloze;;FLAN;model;;0.4;;data-based;https://arxiv.org/abs/2109.01652;13
|
| 552 |
rajpurkar/squad_v2;;FLAN;model;;99.1;;data-based;https://arxiv.org/abs/2109.01652;13
|
| 553 |
-
wmt/wmt16;ro-en
|
| 554 |
super_glue;record;FLAN;model;;68.0;;data-based;https://arxiv.org/abs/2109.01652;13
|
| 555 |
super_glue;rte;FLAN;model;;33.9;;data-based;https://arxiv.org/abs/2109.01652;13
|
| 556 |
piqa;;FLAN;model;;51.3;;data-based;https://arxiv.org/abs/2109.01652;13
|
|
@@ -558,11 +558,11 @@ allenai/openbookqa;;FLAN;model;;15.0;;data-based;https://arxiv.org/abs/2109.0165
|
|
| 558 |
natural_questions;;FLAN;model;;3.2;;data-based;https://arxiv.org/abs/2109.01652;13
|
| 559 |
super_glue;multirc;FLAN;model;;59.3;;data-based;https://arxiv.org/abs/2109.01652;13
|
| 560 |
Rowan/hellaswag;;FLAN;model;;34.5;;data-based;https://arxiv.org/abs/2109.01652;13
|
| 561 |
-
wmt/wmt16;fr-en
|
| 562 |
-
wmt/wmt16;en-ro
|
| 563 |
-
wmt/wmt16;en-fr
|
| 564 |
-
wmt/wmt16;en-de
|
| 565 |
-
wmt/wmt16;de-en
|
| 566 |
ucinlp/drop;;FLAN;model;;99.4;;data-based;https://arxiv.org/abs/2109.01652;13
|
| 567 |
super_glue;copa;FLAN;model;;9.0;;data-based;https://arxiv.org/abs/2109.01652;13
|
| 568 |
super_glue;cb;FLAN;model;;5.4;;data-based;https://arxiv.org/abs/2109.01652;13
|
|
|
|
| 484 |
wmt/wmt16;ro-en;GPT-3;model;;;21.0;data-based;https://arxiv.org/abs/2005.14165;13
|
| 485 |
facebook/anli;test_r1;GPT-3;model;;;20.0;data-based;https://arxiv.org/abs/2005.14165;13
|
| 486 |
facebook/anli;test_r2;GPT-3;model;;;18.0;data-based;https://arxiv.org/abs/2005.14165;13
|
| 487 |
+
mandarjoshi/trivia_qa;;GPT-3;model;;17.0;;data-based;https://arxiv.org/abs/2005.14165;13
|
| 488 |
facebook/anli;test_r3;GPT-3;model;;;16.0;data-based;https://arxiv.org/abs/2005.14165;13
|
| 489 |
wmt/wmt16;fr-en;GPT-3;model;;;14.0;data-based;https://arxiv.org/abs/2005.14165;13
|
| 490 |
wmt/wmt16;en-fr;GPT-3;model;;;14.0;data-based;https://arxiv.org/abs/2005.14165;13
|
|
|
|
| 521 |
winograd_wsc;;GLaM;model;;67.3;;data-based;https://arxiv.org/abs/2112.06905;13
|
| 522 |
winogrande;;GLaM;model;;;0.3;data-based;https://arxiv.org/abs/2112.06905;13
|
| 523 |
super_glue;wic;GLaM;model;;8.2;;data-based;https://arxiv.org/abs/2112.06905;13
|
| 524 |
+
super_glue;wsc;GLaM;model;;57.5;;data-based;https://arxiv.org/abs/2112.06905;13
|
| 525 |
mandarjoshi/trivia_qa;;GLaM;model;;18.8;;data-based;https://arxiv.org/abs/2112.06905;13
|
| 526 |
story_cloze;;GLaM;model;;100.0;;data-based;https://arxiv.org/abs/2112.06905;13
|
| 527 |
rajpurkar/squad_v2;;GLaM;model;;94.6;;data-based;https://arxiv.org/abs/2112.06905;13
|
|
|
|
| 550 |
mandarjoshi/trivia_qa;;FLAN;model;;22.8;;data-based;https://arxiv.org/abs/2109.01652;13
|
| 551 |
story_cloze;;FLAN;model;;0.4;;data-based;https://arxiv.org/abs/2109.01652;13
|
| 552 |
rajpurkar/squad_v2;;FLAN;model;;99.1;;data-based;https://arxiv.org/abs/2109.01652;13
|
| 553 |
+
wmt/wmt16;ro-en;FLAN;model;;;12.4;data-based;https://arxiv.org/abs/2109.01652;13
|
| 554 |
super_glue;record;FLAN;model;;68.0;;data-based;https://arxiv.org/abs/2109.01652;13
|
| 555 |
super_glue;rte;FLAN;model;;33.9;;data-based;https://arxiv.org/abs/2109.01652;13
|
| 556 |
piqa;;FLAN;model;;51.3;;data-based;https://arxiv.org/abs/2109.01652;13
|
|
|
|
| 558 |
natural_questions;;FLAN;model;;3.2;;data-based;https://arxiv.org/abs/2109.01652;13
|
| 559 |
super_glue;multirc;FLAN;model;;59.3;;data-based;https://arxiv.org/abs/2109.01652;13
|
| 560 |
Rowan/hellaswag;;FLAN;model;;34.5;;data-based;https://arxiv.org/abs/2109.01652;13
|
| 561 |
+
wmt/wmt16;fr-en;FLAN;model;;;25.3;data-based;https://arxiv.org/abs/2109.01652;13
|
| 562 |
+
wmt/wmt16;en-ro;FLAN;model;;;12.4;data-based;https://arxiv.org/abs/2109.01652;13
|
| 563 |
+
wmt/wmt16;en-fr;FLAN;model;;;25.3;data-based;https://arxiv.org/abs/2109.01652;13
|
| 564 |
+
wmt/wmt16;en-de;FLAN;model;;;14.3;data-based;https://arxiv.org/abs/2109.01652;13
|
| 565 |
+
wmt/wmt16;de-en;FLAN;model;;;14.3;data-based;https://arxiv.org/abs/2109.01652;13
|
| 566 |
ucinlp/drop;;FLAN;model;;99.4;;data-based;https://arxiv.org/abs/2109.01652;13
|
| 567 |
super_glue;copa;FLAN;model;;9.0;;data-based;https://arxiv.org/abs/2109.01652;13
|
| 568 |
super_glue;cb;FLAN;model;;5.4;;data-based;https://arxiv.org/abs/2109.01652;13
|