Update contamination_report.csv
Browse files- contamination_report.csv +109 -109
contamination_report.csv
CHANGED
|
@@ -463,112 +463,112 @@ bigbio/mednli;;GPT-3.5;model;0.0;0.0;0.0;model-based;https://arxiv.org/pdf/2308.
|
|
| 463 |
RadNLI;;GPT-4;model;0.0;0.0;0.0;model-based;https://arxiv.org/pdf/2308.08493;8
|
| 464 |
RadNLI;;GPT-3.5;model;0.0;0.0;0.0;model-based;https://arxiv.org/pdf/2308.08493;8
|
| 465 |
|
| 466 |
-
quac;;GPT-3;model;;99.0;;data-based;https://arxiv.org/abs/2005.14165;
|
| 467 |
-
rajpurkar/squad_v2;;GPT-3;model;;94.0;;data-based;https://arxiv.org/abs/2005.14165;
|
| 468 |
-
ucinlp/drop;;GPT-3;model;;93.0;;data-based;https://arxiv.org/abs/2005.14165;
|
| 469 |
-
Symbol Insertion;;GPT-3;model;;86.0;;data-based;https://arxiv.org/abs/2005.14165;
|
| 470 |
-
stanfordnlp/coqa;;GPT-3;model;;64.0;;data-based;https://arxiv.org/abs/2005.14165;
|
| 471 |
-
super_glue;record;GPT-3;model;;61.0;;data-based;https://arxiv.org/abs/2005.14165;
|
| 472 |
-
winograd_wsc;;GPT-3;model;;;60.0;data-based;https://arxiv.org/abs/2005.14165;
|
| 473 |
-
super_glue;boolq;GPT-3;model;;60.0;;data-based;https://arxiv.org/abs/2005.14165;
|
| 474 |
-
super_glue;multirc;GPT-3;model;;59.0;;data-based;https://arxiv.org/abs/2005.14165;
|
| 475 |
-
race;high;GPT-3;model;;;45.0;data-based;https://arxiv.org/abs/2005.14165;
|
| 476 |
-
cimec/lambada;;GPT-3;model;;;43.0;data-based;https://arxiv.org/abs/2005.14165;
|
| 477 |
-
super_glue;wsc;GPT-3;model;;40.0;;data-based;https://arxiv.org/abs/2005.14165;
|
| 478 |
-
piqa;;GPT-3;model;;29.0;;data-based;https://arxiv.org/abs/2005.14165;
|
| 479 |
-
wmt/wmt16;en-de;GPT-3;model;;;25.0;data-based;https://arxiv.org/abs/2005.14165;
|
| 480 |
-
wmt/wmt16;de-en;GPT-3;model;;;25.0;data-based;https://arxiv.org/abs/2005.14165;
|
| 481 |
-
race;middle;GPT-3;model;;;25.0;data-based;https://arxiv.org/abs/2005.14165;
|
| 482 |
-
rmanluo/RoG-webqsp;;GPT-3;model;;;21.0;data-based;https://arxiv.org/abs/2005.14165;
|
| 483 |
-
wmt/wmt16;en-ro;GPT-3;model;;;21.0;data-based;https://arxiv.org/abs/2005.14165;
|
| 484 |
-
wmt/wmt16;ro-en;GPT-3;model;;;21.0;data-based;https://arxiv.org/abs/2005.14165;
|
| 485 |
-
facebook/anli;test_r1;GPT-3;model;;;20.0;data-based;https://arxiv.org/abs/2005.14165;
|
| 486 |
-
facebook/anli;test_r2;GPT-3;model;;;18.0;data-based;https://arxiv.org/abs/2005.14165;
|
| 487 |
-
mandarjoshi/trivia_qa;GPT-3;model;;17.0;;data-based;https://arxiv.org/abs/2005.14165;
|
| 488 |
-
facebook/anli;test_r3;GPT-3;model;;;16.0;data-based;https://arxiv.org/abs/2005.14165;
|
| 489 |
-
wmt/wmt16;fr-en;GPT-3;model;;;14.0;data-based;https://arxiv.org/abs/2005.14165;
|
| 490 |
-
wmt/wmt16;en-fr;GPT-3;model;;;14.0;data-based;https://arxiv.org/abs/2005.14165;
|
| 491 |
-
super_glue;rte;GPT-3;model;;8.0;;data-based;https://arxiv.org/abs/2005.14165;
|
| 492 |
-
super_glue;wic;GPT-3;model;;8.0;;data-based;https://arxiv.org/abs/2005.14165;
|
| 493 |
-
super_glue;cb;GPT-3;model;;7.0;;data-based;https://arxiv.org/abs/2005.14165;
|
| 494 |
-
Reversed Words;;GPT-3;model;;7.0;;data-based;https://arxiv.org/abs/2005.14165;
|
| 495 |
-
Anagrams 2;;GPT-3;model;;7.0;;data-based;https://arxiv.org/abs/2005.14165;
|
| 496 |
-
allenai/openbookqa;;GPT-3;model;;;6.0;data-based;https://arxiv.org/abs/2005.14165;
|
| 497 |
-
ibragim-bad/arc_easy;;GPT-3;model;;;4.0;data-based;https://arxiv.org/abs/2005.14165;
|
| 498 |
-
Anagrams 1;;GPT-3;model;;3.0;;data-based;https://arxiv.org/abs/2005.14165;
|
| 499 |
-
ibragim-bad/arc_challenge;;GPT-3;model;;;3.0;data-based;https://arxiv.org/abs/2005.14165;
|
| 500 |
-
super_glue;copa;GPT-3;model;;3.0;;data-based;https://arxiv.org/abs/2005.14165;
|
| 501 |
-
Rowan/hellaswag;;GPT-3;model;;2.0;;data-based;https://arxiv.org/abs/2005.14165;
|
| 502 |
-
natural_questions;;GPT-3;model;;;1.0;data-based;https://arxiv.org/abs/2005.14165;
|
| 503 |
-
Cycled Letters;;GPT-3;model;;1.0;;data-based;https://arxiv.org/abs/2005.14165;
|
| 504 |
-
SAT Analogies;;GPT-3;model;;1.0;;data-based;https://arxiv.org/abs/2005.14165;
|
| 505 |
-
|
| 506 |
-
EdinburghNLP/xsum;;PaLM 2;model;;;42.0;data-based;https://arxiv.org/abs/2305.10403;
|
| 507 |
-
csebuetnlp/xlsum;;PaLM 2;model;;;46.9;data-based;https://arxiv.org/abs/2305.10403;
|
| 508 |
-
wiki_lingua;;PaLM 2;model;;;9.0;data-based;https://arxiv.org/abs/2305.10403;
|
| 509 |
-
|
| 510 |
-
winograd_wsc;;PaLM;model;;;38.5;data-based;https://arxiv.org/abs/2204.02311;
|
| 511 |
-
rmanluo/RoG-webqsp;;PaLM;model;;;26.7;data-based;https://arxiv.org/abs/2204.02311;
|
| 512 |
-
super_glue;wsc;PaLM;model;;;36.8;data-based;https://arxiv.org/abs/2204.02311;
|
| 513 |
-
mandarjoshi/trivia_qa;;PaLM;model;;19.9;;data-based;https://arxiv.org/abs/2204.02311;
|
| 514 |
-
rajpurkar/squad_v2;;PaLM;model;;85.2;;data-based;https://arxiv.org/abs/2204.02311;
|
| 515 |
-
super_glue;record;PaLM;model;;43.4;;data-based;https://arxiv.org/abs/2204.02311;
|
| 516 |
-
cimec/lambada;;PaLM;model;;;29.3;data-based;https://arxiv.org/abs/2204.02311;
|
| 517 |
-
super_glue;cb;PaLM;model;;48.2;;data-based;https://arxiv.org/abs/2204.02311;
|
| 518 |
-
ibragim-bad/arc_easy;;PaLM;model;;;30.4;data-based;https://arxiv.org/abs/2204.02311;
|
| 519 |
-
ibragim-bad/arc_challenge;;PaLM;model;;;24.7;data-based;https://arxiv.org/abs/2204.02311;
|
| 520 |
-
|
| 521 |
-
winograd_wsc;;GLaM;model;;67.3;;data-based;https://arxiv.org/abs/2112.06905;
|
| 522 |
-
winogrande;;GLaM;model;;;0.3;data-based;https://arxiv.org/abs/2112.06905;
|
| 523 |
-
super_glue;wic;GLaM;model;;8.2;;data-based;https://arxiv.org/abs/2112.06905;
|
| 524 |
-
super_glue;wsc;GLaM;model;;57.5;data-based;https://arxiv.org/abs/2112.06905;
|
| 525 |
-
mandarjoshi/trivia_qa;;GLaM;model;;18.8;;data-based;https://arxiv.org/abs/2112.06905;
|
| 526 |
-
story_cloze;;GLaM;model;;100.0;;data-based;https://arxiv.org/abs/2112.06905;
|
| 527 |
-
rajpurkar/squad_v2;;GLaM;model;;94.6;;data-based;https://arxiv.org/abs/2112.06905;
|
| 528 |
-
super_glue;record;GLaM;model;;98.6;;data-based;https://arxiv.org/abs/2112.06905;
|
| 529 |
-
super_glue;rte;GLaM;model;;54.9;;data-based;https://arxiv.org/abs/2112.06905;
|
| 530 |
-
race;middle;GLaM;model;;58.4;;data-based;https://arxiv.org/abs/2112.06905;
|
| 531 |
-
race;high;GLaM;model;;74.0;;data-based;https://arxiv.org/abs/2112.06905;
|
| 532 |
-
quac;;GLaM;model;;99.9;;data-based;https://arxiv.org/abs/2112.06905;
|
| 533 |
-
piqa;;GLaM;model;;49.8;;data-based;https://arxiv.org/abs/2112.06905;
|
| 534 |
-
allenai/openbookqa;;GLaM;model;;20.0;;data-based;https://arxiv.org/abs/2112.06905;
|
| 535 |
-
natural_questions;;GLaM;model;;3.9;;data-based;https://arxiv.org/abs/2112.06905;
|
| 536 |
-
super_glue;multirc;GLaM;model;;68.8;;data-based;https://arxiv.org/abs/2112.06905;
|
| 537 |
-
cimec/lambada;;GLaM;model;;;21.8;data-based;https://arxiv.org/abs/2112.06905;
|
| 538 |
-
Rowan/hellaswag;;GLaM;model;;19.8;;data-based;https://arxiv.org/abs/2112.06905;
|
| 539 |
-
stanfordnlp/coqa;;GLaM;model;;;75.0;data-based;https://arxiv.org/abs/2112.06905;
|
| 540 |
-
super_glue;copa;GLaM;model;;3.0;;data-based;https://arxiv.org/abs/2112.06905;
|
| 541 |
-
super_glue;cb;GLaM;model;;26.8;;data-based;https://arxiv.org/abs/2112.06905;
|
| 542 |
-
super_glue;boolq;GLaM;model;;92.1;;data-based;https://arxiv.org/abs/2112.06905;
|
| 543 |
-
ibragim-bad/arc_easy;;GLaM;model;;32.5;;data-based;https://arxiv.org/abs/2112.06905;
|
| 544 |
-
ibragim-bad/arc_challenge;;GLaM;model;;31.8;;data-based;https://arxiv.org/abs/2112.06905;
|
| 545 |
-
facebook/anli;dev_r3;GLaM;model;;40.7;;data-based;https://arxiv.org/abs/2112.06905;
|
| 546 |
-
facebook/anli;dev_r2;GLaM;model;;96.8;;data-based;https://arxiv.org/abs/2112.06905;
|
| 547 |
-
facebook/anli;dev_r1;GLaM;model;;96.2;;data-based;https://arxiv.org/abs/2112.06905;
|
| 548 |
-
|
| 549 |
-
winogrande;;FLAN;model;;;0.2;data-based;https://arxiv.org/abs/2109.01652;
|
| 550 |
-
mandarjoshi/trivia_qa;;FLAN;model;;22.8;;data-based;https://arxiv.org/abs/2109.01652;
|
| 551 |
-
story_cloze;;FLAN;model;;0.4;;data-based;https://arxiv.org/abs/2109.01652;
|
| 552 |
-
rajpurkar/squad_v2;;FLAN;model;;99.1;;data-based;https://arxiv.org/abs/2109.01652;
|
| 553 |
-
wmt/wmt16;ro-en;;FLAN;model;;;12.4;data-based;https://arxiv.org/abs/2109.01652;
|
| 554 |
-
super_glue;record;FLAN;model;;68.0;;data-based;https://arxiv.org/abs/2109.01652;
|
| 555 |
-
super_glue;rte;FLAN;model;;33.9;;data-based;https://arxiv.org/abs/2109.01652;
|
| 556 |
-
piqa;;FLAN;model;;51.3;;data-based;https://arxiv.org/abs/2109.01652;
|
| 557 |
-
allenai/openbookqa;;FLAN;model;;15.0;;data-based;https://arxiv.org/abs/2109.01652;
|
| 558 |
-
natural_questions;;FLAN;model;;3.2;;data-based;https://arxiv.org/abs/2109.01652;
|
| 559 |
-
super_glue;multirc;FLAN;model;;59.3;;data-based;https://arxiv.org/abs/2109.01652;
|
| 560 |
-
Rowan/hellaswag;;FLAN;model;;34.5;;data-based;https://arxiv.org/abs/2109.01652;
|
| 561 |
-
wmt/wmt16;fr-en;;FLAN;model;;;25.3;data-based;https://arxiv.org/abs/2109.01652;
|
| 562 |
-
wmt/wmt16;en-ro;;FLAN;model;;;12.4;data-based;https://arxiv.org/abs/2109.01652;
|
| 563 |
-
wmt/wmt16;en-fr;;FLAN;model;;;25.3;data-based;https://arxiv.org/abs/2109.01652;
|
| 564 |
-
wmt/wmt16;en-de;;FLAN;model;;;14.3;data-based;https://arxiv.org/abs/2109.01652;
|
| 565 |
-
wmt/wmt16;de-en;;FLAN;model;;;14.3;data-based;https://arxiv.org/abs/2109.01652;
|
| 566 |
-
ucinlp/drop;;FLAN;model;;99.4;;data-based;https://arxiv.org/abs/2109.01652;
|
| 567 |
-
super_glue;copa;FLAN;model;;9.0;;data-based;https://arxiv.org/abs/2109.01652;
|
| 568 |
-
super_glue;cb;FLAN;model;;5.4;;data-based;https://arxiv.org/abs/2109.01652;
|
| 569 |
-
super_glue;boolq;FLAN;model;;23.1;;data-based;https://arxiv.org/abs/2109.01652;
|
| 570 |
-
ibragim-bad/arc_easy;;FLAN;model;;20.2;;data-based;https://arxiv.org/abs/2109.01652;
|
| 571 |
-
ibragim-bad/arc_challenge;;FLAN;model;;15.6;;data-based;https://arxiv.org/abs/2109.01652;
|
| 572 |
-
facebook/anli;dev_r3;FLAN;model;;40.2;;data-based;https://arxiv.org/abs/2109.01652;
|
| 573 |
-
facebook/anli;dev_r2;FLAN;model;;97.9;;data-based;https://arxiv.org/abs/2109.01652;
|
| 574 |
-
facebook/anli;dev_r1;FLAN;model;;98.6;;data-based;https://arxiv.org/abs/2109.01652;
|
|
|
|
| 463 |
RadNLI;;GPT-4;model;0.0;0.0;0.0;model-based;https://arxiv.org/pdf/2308.08493;8
|
| 464 |
RadNLI;;GPT-3.5;model;0.0;0.0;0.0;model-based;https://arxiv.org/pdf/2308.08493;8
|
| 465 |
|
| 466 |
+
quac;;GPT-3;model;;99.0;;data-based;https://arxiv.org/abs/2005.14165;13
|
| 467 |
+
rajpurkar/squad_v2;;GPT-3;model;;94.0;;data-based;https://arxiv.org/abs/2005.14165;13
|
| 468 |
+
ucinlp/drop;;GPT-3;model;;93.0;;data-based;https://arxiv.org/abs/2005.14165;13
|
| 469 |
+
Symbol Insertion;;GPT-3;model;;86.0;;data-based;https://arxiv.org/abs/2005.14165;13
|
| 470 |
+
stanfordnlp/coqa;;GPT-3;model;;64.0;;data-based;https://arxiv.org/abs/2005.14165;13
|
| 471 |
+
super_glue;record;GPT-3;model;;61.0;;data-based;https://arxiv.org/abs/2005.14165;13
|
| 472 |
+
winograd_wsc;;GPT-3;model;;;60.0;data-based;https://arxiv.org/abs/2005.14165;13
|
| 473 |
+
super_glue;boolq;GPT-3;model;;60.0;;data-based;https://arxiv.org/abs/2005.14165;13
|
| 474 |
+
super_glue;multirc;GPT-3;model;;59.0;;data-based;https://arxiv.org/abs/2005.14165;13
|
| 475 |
+
race;high;GPT-3;model;;;45.0;data-based;https://arxiv.org/abs/2005.14165;13
|
| 476 |
+
cimec/lambada;;GPT-3;model;;;43.0;data-based;https://arxiv.org/abs/2005.14165;13
|
| 477 |
+
super_glue;wsc;GPT-3;model;;40.0;;data-based;https://arxiv.org/abs/2005.14165;13
|
| 478 |
+
piqa;;GPT-3;model;;29.0;;data-based;https://arxiv.org/abs/2005.14165;13
|
| 479 |
+
wmt/wmt16;en-de;GPT-3;model;;;25.0;data-based;https://arxiv.org/abs/2005.14165;13
|
| 480 |
+
wmt/wmt16;de-en;GPT-3;model;;;25.0;data-based;https://arxiv.org/abs/2005.14165;13
|
| 481 |
+
race;middle;GPT-3;model;;;25.0;data-based;https://arxiv.org/abs/2005.14165;13
|
| 482 |
+
rmanluo/RoG-webqsp;;GPT-3;model;;;21.0;data-based;https://arxiv.org/abs/2005.14165;13
|
| 483 |
+
wmt/wmt16;en-ro;GPT-3;model;;;21.0;data-based;https://arxiv.org/abs/2005.14165;13
|
| 484 |
+
wmt/wmt16;ro-en;GPT-3;model;;;21.0;data-based;https://arxiv.org/abs/2005.14165;13
|
| 485 |
+
facebook/anli;test_r1;GPT-3;model;;;20.0;data-based;https://arxiv.org/abs/2005.14165;13
|
| 486 |
+
facebook/anli;test_r2;GPT-3;model;;;18.0;data-based;https://arxiv.org/abs/2005.14165;13
|
| 487 |
+
mandarjoshi/trivia_qa;;GPT-3;model;;17.0;;data-based;https://arxiv.org/abs/2005.14165;13
|
| 488 |
+
facebook/anli;test_r3;GPT-3;model;;;16.0;data-based;https://arxiv.org/abs/2005.14165;13
|
| 489 |
+
wmt/wmt16;fr-en;GPT-3;model;;;14.0;data-based;https://arxiv.org/abs/2005.14165;13
|
| 490 |
+
wmt/wmt16;en-fr;GPT-3;model;;;14.0;data-based;https://arxiv.org/abs/2005.14165;13
|
| 491 |
+
super_glue;rte;GPT-3;model;;8.0;;data-based;https://arxiv.org/abs/2005.14165;13
|
| 492 |
+
super_glue;wic;GPT-3;model;;8.0;;data-based;https://arxiv.org/abs/2005.14165;13
|
| 493 |
+
super_glue;cb;GPT-3;model;;7.0;;data-based;https://arxiv.org/abs/2005.14165;13
|
| 494 |
+
Reversed Words;;GPT-3;model;;7.0;;data-based;https://arxiv.org/abs/2005.14165;13
|
| 495 |
+
Anagrams 2;;GPT-3;model;;7.0;;data-based;https://arxiv.org/abs/2005.14165;13
|
| 496 |
+
allenai/openbookqa;;GPT-3;model;;;6.0;data-based;https://arxiv.org/abs/2005.14165;13
|
| 497 |
+
ibragim-bad/arc_easy;;GPT-3;model;;;4.0;data-based;https://arxiv.org/abs/2005.14165;13
|
| 498 |
+
Anagrams 1;;GPT-3;model;;3.0;;data-based;https://arxiv.org/abs/2005.14165;13
|
| 499 |
+
ibragim-bad/arc_challenge;;GPT-3;model;;;3.0;data-based;https://arxiv.org/abs/2005.14165;13
|
| 500 |
+
super_glue;copa;GPT-3;model;;3.0;;data-based;https://arxiv.org/abs/2005.14165;13
|
| 501 |
+
Rowan/hellaswag;;GPT-3;model;;2.0;;data-based;https://arxiv.org/abs/2005.14165;13
|
| 502 |
+
natural_questions;;GPT-3;model;;;1.0;data-based;https://arxiv.org/abs/2005.14165;13
|
| 503 |
+
Cycled Letters;;GPT-3;model;;1.0;;data-based;https://arxiv.org/abs/2005.14165;13
|
| 504 |
+
SAT Analogies;;GPT-3;model;;1.0;;data-based;https://arxiv.org/abs/2005.14165;13
|
| 505 |
+
|
| 506 |
+
EdinburghNLP/xsum;;PaLM 2;model;;;42.0;data-based;https://arxiv.org/abs/2305.10403;13
|
| 507 |
+
csebuetnlp/xlsum;;PaLM 2;model;;;46.9;data-based;https://arxiv.org/abs/2305.10403;13
|
| 508 |
+
wiki_lingua;;PaLM 2;model;;;9.0;data-based;https://arxiv.org/abs/2305.10403;13
|
| 509 |
+
|
| 510 |
+
winograd_wsc;;PaLM;model;;;38.5;data-based;https://arxiv.org/abs/2204.02311;13
|
| 511 |
+
rmanluo/RoG-webqsp;;PaLM;model;;;26.7;data-based;https://arxiv.org/abs/2204.02311;13
|
| 512 |
+
super_glue;wsc;PaLM;model;;;36.8;data-based;https://arxiv.org/abs/2204.02311;13
|
| 513 |
+
mandarjoshi/trivia_qa;;PaLM;model;;19.9;;data-based;https://arxiv.org/abs/2204.02311;13
|
| 514 |
+
rajpurkar/squad_v2;;PaLM;model;;85.2;;data-based;https://arxiv.org/abs/2204.02311;13
|
| 515 |
+
super_glue;record;PaLM;model;;43.4;;data-based;https://arxiv.org/abs/2204.02311;13
|
| 516 |
+
cimec/lambada;;PaLM;model;;;29.3;data-based;https://arxiv.org/abs/2204.02311;13
|
| 517 |
+
super_glue;cb;PaLM;model;;48.2;;data-based;https://arxiv.org/abs/2204.02311;13
|
| 518 |
+
ibragim-bad/arc_easy;;PaLM;model;;;30.4;data-based;https://arxiv.org/abs/2204.02311;13
|
| 519 |
+
ibragim-bad/arc_challenge;;PaLM;model;;;24.7;data-based;https://arxiv.org/abs/2204.02311;13
|
| 520 |
+
|
| 521 |
+
winograd_wsc;;GLaM;model;;67.3;;data-based;https://arxiv.org/abs/2112.06905;13
|
| 522 |
+
winogrande;;GLaM;model;;;0.3;data-based;https://arxiv.org/abs/2112.06905;13
|
| 523 |
+
super_glue;wic;GLaM;model;;8.2;;data-based;https://arxiv.org/abs/2112.06905;13
|
| 524 |
+
super_glue;wsc;GLaM;model;;57.5;;data-based;https://arxiv.org/abs/2112.06905;13
|
| 525 |
+
mandarjoshi/trivia_qa;;GLaM;model;;18.8;;data-based;https://arxiv.org/abs/2112.06905;13
|
| 526 |
+
story_cloze;;GLaM;model;;100.0;;data-based;https://arxiv.org/abs/2112.06905;13
|
| 527 |
+
rajpurkar/squad_v2;;GLaM;model;;94.6;;data-based;https://arxiv.org/abs/2112.06905;13
|
| 528 |
+
super_glue;record;GLaM;model;;98.6;;data-based;https://arxiv.org/abs/2112.06905;13
|
| 529 |
+
super_glue;rte;GLaM;model;;54.9;;data-based;https://arxiv.org/abs/2112.06905;13
|
| 530 |
+
race;middle;GLaM;model;;58.4;;data-based;https://arxiv.org/abs/2112.06905;13
|
| 531 |
+
race;high;GLaM;model;;74.0;;data-based;https://arxiv.org/abs/2112.06905;13
|
| 532 |
+
quac;;GLaM;model;;99.9;;data-based;https://arxiv.org/abs/2112.06905;13
|
| 533 |
+
piqa;;GLaM;model;;49.8;;data-based;https://arxiv.org/abs/2112.06905;13
|
| 534 |
+
allenai/openbookqa;;GLaM;model;;20.0;;data-based;https://arxiv.org/abs/2112.06905;13
|
| 535 |
+
natural_questions;;GLaM;model;;3.9;;data-based;https://arxiv.org/abs/2112.06905;13
|
| 536 |
+
super_glue;multirc;GLaM;model;;68.8;;data-based;https://arxiv.org/abs/2112.06905;13
|
| 537 |
+
cimec/lambada;;GLaM;model;;;21.8;data-based;https://arxiv.org/abs/2112.06905;13
|
| 538 |
+
Rowan/hellaswag;;GLaM;model;;19.8;;data-based;https://arxiv.org/abs/2112.06905;13
|
| 539 |
+
stanfordnlp/coqa;;GLaM;model;;;75.0;data-based;https://arxiv.org/abs/2112.06905;13
|
| 540 |
+
super_glue;copa;GLaM;model;;3.0;;data-based;https://arxiv.org/abs/2112.06905;13
|
| 541 |
+
super_glue;cb;GLaM;model;;26.8;;data-based;https://arxiv.org/abs/2112.06905;13
|
| 542 |
+
super_glue;boolq;GLaM;model;;92.1;;data-based;https://arxiv.org/abs/2112.06905;13
|
| 543 |
+
ibragim-bad/arc_easy;;GLaM;model;;32.5;;data-based;https://arxiv.org/abs/2112.06905;13
|
| 544 |
+
ibragim-bad/arc_challenge;;GLaM;model;;31.8;;data-based;https://arxiv.org/abs/2112.06905;13
|
| 545 |
+
facebook/anli;dev_r3;GLaM;model;;40.7;;data-based;https://arxiv.org/abs/2112.06905;13
|
| 546 |
+
facebook/anli;dev_r2;GLaM;model;;96.8;;data-based;https://arxiv.org/abs/2112.06905;13
|
| 547 |
+
facebook/anli;dev_r1;GLaM;model;;96.2;;data-based;https://arxiv.org/abs/2112.06905;13
|
| 548 |
+
|
| 549 |
+
winogrande;;FLAN;model;;;0.2;data-based;https://arxiv.org/abs/2109.01652;13
|
| 550 |
+
mandarjoshi/trivia_qa;;FLAN;model;;22.8;;data-based;https://arxiv.org/abs/2109.01652;13
|
| 551 |
+
story_cloze;;FLAN;model;;0.4;;data-based;https://arxiv.org/abs/2109.01652;13
|
| 552 |
+
rajpurkar/squad_v2;;FLAN;model;;99.1;;data-based;https://arxiv.org/abs/2109.01652;13
|
| 553 |
+
wmt/wmt16;ro-en;FLAN;model;;;12.4;data-based;https://arxiv.org/abs/2109.01652;13
|
| 554 |
+
super_glue;record;FLAN;model;;68.0;;data-based;https://arxiv.org/abs/2109.01652;13
|
| 555 |
+
super_glue;rte;FLAN;model;;33.9;;data-based;https://arxiv.org/abs/2109.01652;13
|
| 556 |
+
piqa;;FLAN;model;;51.3;;data-based;https://arxiv.org/abs/2109.01652;13
|
| 557 |
+
allenai/openbookqa;;FLAN;model;;15.0;;data-based;https://arxiv.org/abs/2109.01652;13
|
| 558 |
+
natural_questions;;FLAN;model;;3.2;;data-based;https://arxiv.org/abs/2109.01652;13
|
| 559 |
+
super_glue;multirc;FLAN;model;;59.3;;data-based;https://arxiv.org/abs/2109.01652;13
|
| 560 |
+
Rowan/hellaswag;;FLAN;model;;34.5;;data-based;https://arxiv.org/abs/2109.01652;13
|
| 561 |
+
wmt/wmt16;fr-en;FLAN;model;;;25.3;data-based;https://arxiv.org/abs/2109.01652;13
|
| 562 |
+
wmt/wmt16;en-ro;FLAN;model;;;12.4;data-based;https://arxiv.org/abs/2109.01652;13
|
| 563 |
+
wmt/wmt16;en-fr;FLAN;model;;;25.3;data-based;https://arxiv.org/abs/2109.01652;13
|
| 564 |
+
wmt/wmt16;en-de;FLAN;model;;;14.3;data-based;https://arxiv.org/abs/2109.01652;13
|
| 565 |
+
wmt/wmt16;de-en;FLAN;model;;;14.3;data-based;https://arxiv.org/abs/2109.01652;13
|
| 566 |
+
ucinlp/drop;;FLAN;model;;99.4;;data-based;https://arxiv.org/abs/2109.01652;13
|
| 567 |
+
super_glue;copa;FLAN;model;;9.0;;data-based;https://arxiv.org/abs/2109.01652;13
|
| 568 |
+
super_glue;cb;FLAN;model;;5.4;;data-based;https://arxiv.org/abs/2109.01652;13
|
| 569 |
+
super_glue;boolq;FLAN;model;;23.1;;data-based;https://arxiv.org/abs/2109.01652;13
|
| 570 |
+
ibragim-bad/arc_easy;;FLAN;model;;20.2;;data-based;https://arxiv.org/abs/2109.01652;13
|
| 571 |
+
ibragim-bad/arc_challenge;;FLAN;model;;15.6;;data-based;https://arxiv.org/abs/2109.01652;13
|
| 572 |
+
facebook/anli;dev_r3;FLAN;model;;40.2;;data-based;https://arxiv.org/abs/2109.01652;13
|
| 573 |
+
facebook/anli;dev_r2;FLAN;model;;97.9;;data-based;https://arxiv.org/abs/2109.01652;13
|
| 574 |
+
facebook/anli;dev_r1;FLAN;model;;98.6;;data-based;https://arxiv.org/abs/2109.01652;13
|