Fix some format bugs
Browse files- contamination_report.csv +8 -8
contamination_report.csv
CHANGED
@@ -484,7 +484,7 @@ wmt/wmt16;en-ro;GPT-3;model;;;21.0;data-based;https://arxiv.org/abs/2005.14165;1
|
|
484 |
wmt/wmt16;ro-en;GPT-3;model;;;21.0;data-based;https://arxiv.org/abs/2005.14165;13
|
485 |
facebook/anli;test_r1;GPT-3;model;;;20.0;data-based;https://arxiv.org/abs/2005.14165;13
|
486 |
facebook/anli;test_r2;GPT-3;model;;;18.0;data-based;https://arxiv.org/abs/2005.14165;13
|
487 |
-
mandarjoshi/trivia_qa
|
488 |
facebook/anli;test_r3;GPT-3;model;;;16.0;data-based;https://arxiv.org/abs/2005.14165;13
|
489 |
wmt/wmt16;fr-en;GPT-3;model;;;14.0;data-based;https://arxiv.org/abs/2005.14165;13
|
490 |
wmt/wmt16;en-fr;GPT-3;model;;;14.0;data-based;https://arxiv.org/abs/2005.14165;13
|
@@ -521,7 +521,7 @@ ibragim-bad/arc_challenge;;PaLM;model;;;24.7;data-based;https://arxiv.org/abs/22
|
|
521 |
winograd_wsc;;GLaM;model;;67.3;;data-based;https://arxiv.org/abs/2112.06905;13
|
522 |
winogrande;;GLaM;model;;;0.3;data-based;https://arxiv.org/abs/2112.06905;13
|
523 |
super_glue;wic;GLaM;model;;8.2;;data-based;https://arxiv.org/abs/2112.06905;13
|
524 |
-
super_glue;wsc;GLaM;model;;57.5
|
525 |
mandarjoshi/trivia_qa;;GLaM;model;;18.8;;data-based;https://arxiv.org/abs/2112.06905;13
|
526 |
story_cloze;;GLaM;model;;100.0;;data-based;https://arxiv.org/abs/2112.06905;13
|
527 |
rajpurkar/squad_v2;;GLaM;model;;94.6;;data-based;https://arxiv.org/abs/2112.06905;13
|
@@ -550,7 +550,7 @@ winogrande;;FLAN;model;;;0.2;data-based;https://arxiv.org/abs/2109.01652;13
|
|
550 |
mandarjoshi/trivia_qa;;FLAN;model;;22.8;;data-based;https://arxiv.org/abs/2109.01652;13
|
551 |
story_cloze;;FLAN;model;;0.4;;data-based;https://arxiv.org/abs/2109.01652;13
|
552 |
rajpurkar/squad_v2;;FLAN;model;;99.1;;data-based;https://arxiv.org/abs/2109.01652;13
|
553 |
-
wmt/wmt16;ro-en
|
554 |
super_glue;record;FLAN;model;;68.0;;data-based;https://arxiv.org/abs/2109.01652;13
|
555 |
super_glue;rte;FLAN;model;;33.9;;data-based;https://arxiv.org/abs/2109.01652;13
|
556 |
piqa;;FLAN;model;;51.3;;data-based;https://arxiv.org/abs/2109.01652;13
|
@@ -558,11 +558,11 @@ allenai/openbookqa;;FLAN;model;;15.0;;data-based;https://arxiv.org/abs/2109.0165
|
|
558 |
natural_questions;;FLAN;model;;3.2;;data-based;https://arxiv.org/abs/2109.01652;13
|
559 |
super_glue;multirc;FLAN;model;;59.3;;data-based;https://arxiv.org/abs/2109.01652;13
|
560 |
Rowan/hellaswag;;FLAN;model;;34.5;;data-based;https://arxiv.org/abs/2109.01652;13
|
561 |
-
wmt/wmt16;fr-en
|
562 |
-
wmt/wmt16;en-ro
|
563 |
-
wmt/wmt16;en-fr
|
564 |
-
wmt/wmt16;en-de
|
565 |
-
wmt/wmt16;de-en
|
566 |
ucinlp/drop;;FLAN;model;;99.4;;data-based;https://arxiv.org/abs/2109.01652;13
|
567 |
super_glue;copa;FLAN;model;;9.0;;data-based;https://arxiv.org/abs/2109.01652;13
|
568 |
super_glue;cb;FLAN;model;;5.4;;data-based;https://arxiv.org/abs/2109.01652;13
|
|
|
484 |
wmt/wmt16;ro-en;GPT-3;model;;;21.0;data-based;https://arxiv.org/abs/2005.14165;13
|
485 |
facebook/anli;test_r1;GPT-3;model;;;20.0;data-based;https://arxiv.org/abs/2005.14165;13
|
486 |
facebook/anli;test_r2;GPT-3;model;;;18.0;data-based;https://arxiv.org/abs/2005.14165;13
|
487 |
+
mandarjoshi/trivia_qa;;GPT-3;model;;17.0;;data-based;https://arxiv.org/abs/2005.14165;13
|
488 |
facebook/anli;test_r3;GPT-3;model;;;16.0;data-based;https://arxiv.org/abs/2005.14165;13
|
489 |
wmt/wmt16;fr-en;GPT-3;model;;;14.0;data-based;https://arxiv.org/abs/2005.14165;13
|
490 |
wmt/wmt16;en-fr;GPT-3;model;;;14.0;data-based;https://arxiv.org/abs/2005.14165;13
|
|
|
521 |
winograd_wsc;;GLaM;model;;67.3;;data-based;https://arxiv.org/abs/2112.06905;13
|
522 |
winogrande;;GLaM;model;;;0.3;data-based;https://arxiv.org/abs/2112.06905;13
|
523 |
super_glue;wic;GLaM;model;;8.2;;data-based;https://arxiv.org/abs/2112.06905;13
|
524 |
+
super_glue;wsc;GLaM;model;;57.5;;data-based;https://arxiv.org/abs/2112.06905;13
|
525 |
mandarjoshi/trivia_qa;;GLaM;model;;18.8;;data-based;https://arxiv.org/abs/2112.06905;13
|
526 |
story_cloze;;GLaM;model;;100.0;;data-based;https://arxiv.org/abs/2112.06905;13
|
527 |
rajpurkar/squad_v2;;GLaM;model;;94.6;;data-based;https://arxiv.org/abs/2112.06905;13
|
|
|
550 |
mandarjoshi/trivia_qa;;FLAN;model;;22.8;;data-based;https://arxiv.org/abs/2109.01652;13
|
551 |
story_cloze;;FLAN;model;;0.4;;data-based;https://arxiv.org/abs/2109.01652;13
|
552 |
rajpurkar/squad_v2;;FLAN;model;;99.1;;data-based;https://arxiv.org/abs/2109.01652;13
|
553 |
+
wmt/wmt16;ro-en;FLAN;model;;;12.4;data-based;https://arxiv.org/abs/2109.01652;13
|
554 |
super_glue;record;FLAN;model;;68.0;;data-based;https://arxiv.org/abs/2109.01652;13
|
555 |
super_glue;rte;FLAN;model;;33.9;;data-based;https://arxiv.org/abs/2109.01652;13
|
556 |
piqa;;FLAN;model;;51.3;;data-based;https://arxiv.org/abs/2109.01652;13
|
|
|
558 |
natural_questions;;FLAN;model;;3.2;;data-based;https://arxiv.org/abs/2109.01652;13
|
559 |
super_glue;multirc;FLAN;model;;59.3;;data-based;https://arxiv.org/abs/2109.01652;13
|
560 |
Rowan/hellaswag;;FLAN;model;;34.5;;data-based;https://arxiv.org/abs/2109.01652;13
|
561 |
+
wmt/wmt16;fr-en;FLAN;model;;;25.3;data-based;https://arxiv.org/abs/2109.01652;13
|
562 |
+
wmt/wmt16;en-ro;FLAN;model;;;12.4;data-based;https://arxiv.org/abs/2109.01652;13
|
563 |
+
wmt/wmt16;en-fr;FLAN;model;;;25.3;data-based;https://arxiv.org/abs/2109.01652;13
|
564 |
+
wmt/wmt16;en-de;FLAN;model;;;14.3;data-based;https://arxiv.org/abs/2109.01652;13
|
565 |
+
wmt/wmt16;de-en;FLAN;model;;;14.3;data-based;https://arxiv.org/abs/2109.01652;13
|
566 |
ucinlp/drop;;FLAN;model;;99.4;;data-based;https://arxiv.org/abs/2109.01652;13
|
567 |
super_glue;copa;FLAN;model;;9.0;;data-based;https://arxiv.org/abs/2109.01652;13
|
568 |
super_glue;cb;FLAN;model;;5.4;;data-based;https://arxiv.org/abs/2109.01652;13
|