AmeyaPrabhu committed on
Commit
0f5ff26
•
1 Parent(s): 6febb26

Update contamination_report.csv

Browse files
Files changed (1) hide show
  1. contamination_report.csv +109 -109
contamination_report.csv CHANGED
@@ -463,112 +463,112 @@ bigbio/mednli;;GPT-3.5;model;0.0;0.0;0.0;model-based;https://arxiv.org/pdf/2308.
463
  RadNLI;;GPT-4;model;0.0;0.0;0.0;model-based;https://arxiv.org/pdf/2308.08493;8
464
  RadNLI;;GPT-3.5;model;0.0;0.0;0.0;model-based;https://arxiv.org/pdf/2308.08493;8
465
 
466
- quac;;GPT-3;model;;99.0;;data-based;https://arxiv.org/abs/2005.14165;
467
- rajpurkar/squad_v2;;GPT-3;model;;94.0;;data-based;https://arxiv.org/abs/2005.14165;
468
- ucinlp/drop;;GPT-3;model;;93.0;;data-based;https://arxiv.org/abs/2005.14165;
469
- Symbol Insertion;;GPT-3;model;;86.0;;data-based;https://arxiv.org/abs/2005.14165;
470
- stanfordnlp/coqa;;GPT-3;model;;64.0;;data-based;https://arxiv.org/abs/2005.14165;
471
- super_glue;record;GPT-3;model;;61.0;;data-based;https://arxiv.org/abs/2005.14165;
472
- winograd_wsc;;GPT-3;model;;;60.0;data-based;https://arxiv.org/abs/2005.14165;
473
- super_glue;boolq;GPT-3;model;;60.0;;data-based;https://arxiv.org/abs/2005.14165;
474
- super_glue;multirc;GPT-3;model;;59.0;;data-based;https://arxiv.org/abs/2005.14165;
475
- race;high;GPT-3;model;;;45.0;data-based;https://arxiv.org/abs/2005.14165;
476
- cimec/lambada;;GPT-3;model;;;43.0;data-based;https://arxiv.org/abs/2005.14165;
477
- super_glue;wsc;GPT-3;model;;40.0;;data-based;https://arxiv.org/abs/2005.14165;
478
- piqa;;GPT-3;model;;29.0;;data-based;https://arxiv.org/abs/2005.14165;
479
- wmt/wmt16;en-de;GPT-3;model;;;25.0;data-based;https://arxiv.org/abs/2005.14165;
480
- wmt/wmt16;de-en;GPT-3;model;;;25.0;data-based;https://arxiv.org/abs/2005.14165;
481
- race;middle;GPT-3;model;;;25.0;data-based;https://arxiv.org/abs/2005.14165;
482
- rmanluo/RoG-webqsp;;GPT-3;model;;;21.0;data-based;https://arxiv.org/abs/2005.14165;
483
- wmt/wmt16;en-ro;GPT-3;model;;;21.0;data-based;https://arxiv.org/abs/2005.14165;
484
- wmt/wmt16;ro-en;GPT-3;model;;;21.0;data-based;https://arxiv.org/abs/2005.14165;
485
- facebook/anli;test_r1;GPT-3;model;;;20.0;data-based;https://arxiv.org/abs/2005.14165;
486
- facebook/anli;test_r2;GPT-3;model;;;18.0;data-based;https://arxiv.org/abs/2005.14165;
487
- mandarjoshi/trivia_qa;GPT-3;model;;17.0;;data-based;https://arxiv.org/abs/2005.14165;
488
- facebook/anli;test_r3;GPT-3;model;;;16.0;data-based;https://arxiv.org/abs/2005.14165;
489
- wmt/wmt16;fr-en;GPT-3;model;;;14.0;data-based;https://arxiv.org/abs/2005.14165;
490
- wmt/wmt16;en-fr;GPT-3;model;;;14.0;data-based;https://arxiv.org/abs/2005.14165;
491
- super_glue;rte;GPT-3;model;;8.0;;data-based;https://arxiv.org/abs/2005.14165;
492
- super_glue;wic;GPT-3;model;;8.0;;data-based;https://arxiv.org/abs/2005.14165;
493
- super_glue;cb;GPT-3;model;;7.0;;data-based;https://arxiv.org/abs/2005.14165;
494
- Reversed Words;;GPT-3;model;;7.0;;data-based;https://arxiv.org/abs/2005.14165;
495
- Anagrams 2;;GPT-3;model;;7.0;;data-based;https://arxiv.org/abs/2005.14165;
496
- allenai/openbookqa;;GPT-3;model;;;6.0;data-based;https://arxiv.org/abs/2005.14165;
497
- ibragim-bad/arc_easy;;GPT-3;model;;;4.0;data-based;https://arxiv.org/abs/2005.14165;
498
- Anagrams 1;;GPT-3;model;;3.0;;data-based;https://arxiv.org/abs/2005.14165;
499
- ibragim-bad/arc_challenge;;GPT-3;model;;;3.0;data-based;https://arxiv.org/abs/2005.14165;
500
- super_glue;copa;GPT-3;model;;3.0;;data-based;https://arxiv.org/abs/2005.14165;
501
- Rowan/hellaswag;;GPT-3;model;;2.0;;data-based;https://arxiv.org/abs/2005.14165;
502
- natural_questions;;GPT-3;model;;;1.0;data-based;https://arxiv.org/abs/2005.14165;
503
- Cycled Letters;;GPT-3;model;;1.0;;data-based;https://arxiv.org/abs/2005.14165;
504
- SAT Analogies;;GPT-3;model;;1.0;;data-based;https://arxiv.org/abs/2005.14165;
505
-
506
- EdinburghNLP/xsum;;PaLM 2;model;;;42.0;data-based;https://arxiv.org/abs/2305.10403;
507
- csebuetnlp/xlsum;;PaLM 2;model;;;46.9;data-based;https://arxiv.org/abs/2305.10403;
508
- wiki_lingua;;PaLM 2;model;;;9.0;data-based;https://arxiv.org/abs/2305.10403;
509
-
510
- winograd_wsc;;PaLM;model;;;38.5;data-based;https://arxiv.org/abs/2204.02311;
511
- rmanluo/RoG-webqsp;;PaLM;model;;;26.7;data-based;https://arxiv.org/abs/2204.02311;
512
- super_glue;wsc;PaLM;model;;;36.8;data-based;https://arxiv.org/abs/2204.02311;
513
- mandarjoshi/trivia_qa;;PaLM;model;;19.9;;data-based;https://arxiv.org/abs/2204.02311;
514
- rajpurkar/squad_v2;;PaLM;model;;85.2;;data-based;https://arxiv.org/abs/2204.02311;
515
- super_glue;record;PaLM;model;;43.4;;data-based;https://arxiv.org/abs/2204.02311;
516
- cimec/lambada;;PaLM;model;;;29.3;data-based;https://arxiv.org/abs/2204.02311;
517
- super_glue;cb;PaLM;model;;48.2;;data-based;https://arxiv.org/abs/2204.02311;
518
- ibragim-bad/arc_easy;;PaLM;model;;;30.4;data-based;https://arxiv.org/abs/2204.02311;
519
- ibragim-bad/arc_challenge;;PaLM;model;;;24.7;data-based;https://arxiv.org/abs/2204.02311;
520
-
521
- winograd_wsc;;GLaM;model;;67.3;;data-based;https://arxiv.org/abs/2112.06905;
522
- winogrande;;GLaM;model;;;0.3;data-based;https://arxiv.org/abs/2112.06905;
523
- super_glue;wic;GLaM;model;;8.2;;data-based;https://arxiv.org/abs/2112.06905;
524
- super_glue;wsc;GLaM;model;;57.5;data-based;https://arxiv.org/abs/2112.06905;
525
- mandarjoshi/trivia_qa;;GLaM;model;;18.8;;data-based;https://arxiv.org/abs/2112.06905;
526
- story_cloze;;GLaM;model;;100.0;;data-based;https://arxiv.org/abs/2112.06905;
527
- rajpurkar/squad_v2;;GLaM;model;;94.6;;data-based;https://arxiv.org/abs/2112.06905;
528
- super_glue;record;GLaM;model;;98.6;;data-based;https://arxiv.org/abs/2112.06905;
529
- super_glue;rte;GLaM;model;;54.9;;data-based;https://arxiv.org/abs/2112.06905;
530
- race;middle;GLaM;model;;58.4;;data-based;https://arxiv.org/abs/2112.06905;
531
- race;high;GLaM;model;;74.0;;data-based;https://arxiv.org/abs/2112.06905;
532
- quac;;GLaM;model;;99.9;;data-based;https://arxiv.org/abs/2112.06905;
533
- piqa;;GLaM;model;;49.8;;data-based;https://arxiv.org/abs/2112.06905;
534
- allenai/openbookqa;;GLaM;model;;20.0;;data-based;https://arxiv.org/abs/2112.06905;
535
- natural_questions;;GLaM;model;;3.9;;data-based;https://arxiv.org/abs/2112.06905;
536
- super_glue;multirc;GLaM;model;;68.8;;data-based;https://arxiv.org/abs/2112.06905;
537
- cimec/lambada;;GLaM;model;;;21.8;data-based;https://arxiv.org/abs/2112.06905;
538
- Rowan/hellaswag;;GLaM;model;;19.8;;data-based;https://arxiv.org/abs/2112.06905;
539
- stanfordnlp/coqa;;GLaM;model;;;75.0;data-based;https://arxiv.org/abs/2112.06905;
540
- super_glue;copa;GLaM;model;;3.0;;data-based;https://arxiv.org/abs/2112.06905;
541
- super_glue;cb;GLaM;model;;26.8;;data-based;https://arxiv.org/abs/2112.06905;
542
- super_glue;boolq;GLaM;model;;92.1;;data-based;https://arxiv.org/abs/2112.06905;
543
- ibragim-bad/arc_easy;;GLaM;model;;32.5;;data-based;https://arxiv.org/abs/2112.06905;
544
- ibragim-bad/arc_challenge;;GLaM;model;;31.8;;data-based;https://arxiv.org/abs/2112.06905;
545
- facebook/anli;dev_r3;GLaM;model;;40.7;;data-based;https://arxiv.org/abs/2112.06905;
546
- facebook/anli;dev_r2;GLaM;model;;96.8;;data-based;https://arxiv.org/abs/2112.06905;
547
- facebook/anli;dev_r1;GLaM;model;;96.2;;data-based;https://arxiv.org/abs/2112.06905;
548
-
549
- winogrande;;FLAN;model;;;0.2;data-based;https://arxiv.org/abs/2109.01652;
550
- mandarjoshi/trivia_qa;;FLAN;model;;22.8;;data-based;https://arxiv.org/abs/2109.01652;
551
- story_cloze;;FLAN;model;;0.4;;data-based;https://arxiv.org/abs/2109.01652;
552
- rajpurkar/squad_v2;;FLAN;model;;99.1;;data-based;https://arxiv.org/abs/2109.01652;
553
- wmt/wmt16;ro-en;;FLAN;model;;;12.4;data-based;https://arxiv.org/abs/2109.01652;
554
- super_glue;record;FLAN;model;;68.0;;data-based;https://arxiv.org/abs/2109.01652;
555
- super_glue;rte;FLAN;model;;33.9;;data-based;https://arxiv.org/abs/2109.01652;
556
- piqa;;FLAN;model;;51.3;;data-based;https://arxiv.org/abs/2109.01652;
557
- allenai/openbookqa;;FLAN;model;;15.0;;data-based;https://arxiv.org/abs/2109.01652;
558
- natural_questions;;FLAN;model;;3.2;;data-based;https://arxiv.org/abs/2109.01652;
559
- super_glue;multirc;FLAN;model;;59.3;;data-based;https://arxiv.org/abs/2109.01652;
560
- Rowan/hellaswag;;FLAN;model;;34.5;;data-based;https://arxiv.org/abs/2109.01652;
561
- wmt/wmt16;fr-en;;FLAN;model;;;25.3;data-based;https://arxiv.org/abs/2109.01652;
562
- wmt/wmt16;en-ro;;FLAN;model;;;12.4;data-based;https://arxiv.org/abs/2109.01652;
563
- wmt/wmt16;en-fr;;FLAN;model;;;25.3;data-based;https://arxiv.org/abs/2109.01652;
564
- wmt/wmt16;en-de;;FLAN;model;;;14.3;data-based;https://arxiv.org/abs/2109.01652;
565
- wmt/wmt16;de-en;;FLAN;model;;;14.3;data-based;https://arxiv.org/abs/2109.01652;
566
- ucinlp/drop;;FLAN;model;;99.4;;data-based;https://arxiv.org/abs/2109.01652;
567
- super_glue;copa;FLAN;model;;9.0;;data-based;https://arxiv.org/abs/2109.01652;
568
- super_glue;cb;FLAN;model;;5.4;;data-based;https://arxiv.org/abs/2109.01652;
569
- super_glue;boolq;FLAN;model;;23.1;;data-based;https://arxiv.org/abs/2109.01652;
570
- ibragim-bad/arc_easy;;FLAN;model;;20.2;;data-based;https://arxiv.org/abs/2109.01652;
571
- ibragim-bad/arc_challenge;;FLAN;model;;15.6;;data-based;https://arxiv.org/abs/2109.01652;
572
- facebook/anli;dev_r3;FLAN;model;;40.2;;data-based;https://arxiv.org/abs/2109.01652;
573
- facebook/anli;dev_r2;FLAN;model;;97.9;;data-based;https://arxiv.org/abs/2109.01652;
574
- facebook/anli;dev_r1;FLAN;model;;98.6;;data-based;https://arxiv.org/abs/2109.01652;
 
463
  RadNLI;;GPT-4;model;0.0;0.0;0.0;model-based;https://arxiv.org/pdf/2308.08493;8
464
  RadNLI;;GPT-3.5;model;0.0;0.0;0.0;model-based;https://arxiv.org/pdf/2308.08493;8
465
 
466
+ quac;;GPT-3;model;;99.0;;data-based;https://arxiv.org/abs/2005.14165;13
467
+ rajpurkar/squad_v2;;GPT-3;model;;94.0;;data-based;https://arxiv.org/abs/2005.14165;13
468
+ ucinlp/drop;;GPT-3;model;;93.0;;data-based;https://arxiv.org/abs/2005.14165;13
469
+ Symbol Insertion;;GPT-3;model;;86.0;;data-based;https://arxiv.org/abs/2005.14165;13
470
+ stanfordnlp/coqa;;GPT-3;model;;64.0;;data-based;https://arxiv.org/abs/2005.14165;13
471
+ super_glue;record;GPT-3;model;;61.0;;data-based;https://arxiv.org/abs/2005.14165;13
472
+ winograd_wsc;;GPT-3;model;;;60.0;data-based;https://arxiv.org/abs/2005.14165;13
473
+ super_glue;boolq;GPT-3;model;;60.0;;data-based;https://arxiv.org/abs/2005.14165;13
474
+ super_glue;multirc;GPT-3;model;;59.0;;data-based;https://arxiv.org/abs/2005.14165;13
475
+ race;high;GPT-3;model;;;45.0;data-based;https://arxiv.org/abs/2005.14165;13
476
+ cimec/lambada;;GPT-3;model;;;43.0;data-based;https://arxiv.org/abs/2005.14165;13
477
+ super_glue;wsc;GPT-3;model;;40.0;;data-based;https://arxiv.org/abs/2005.14165;13
478
+ piqa;;GPT-3;model;;29.0;;data-based;https://arxiv.org/abs/2005.14165;13
479
+ wmt/wmt16;en-de;GPT-3;model;;;25.0;data-based;https://arxiv.org/abs/2005.14165;13
480
+ wmt/wmt16;de-en;GPT-3;model;;;25.0;data-based;https://arxiv.org/abs/2005.14165;13
481
+ race;middle;GPT-3;model;;;25.0;data-based;https://arxiv.org/abs/2005.14165;13
482
+ rmanluo/RoG-webqsp;;GPT-3;model;;;21.0;data-based;https://arxiv.org/abs/2005.14165;13
483
+ wmt/wmt16;en-ro;GPT-3;model;;;21.0;data-based;https://arxiv.org/abs/2005.14165;13
484
+ wmt/wmt16;ro-en;GPT-3;model;;;21.0;data-based;https://arxiv.org/abs/2005.14165;13
485
+ facebook/anli;test_r1;GPT-3;model;;;20.0;data-based;https://arxiv.org/abs/2005.14165;13
486
+ facebook/anli;test_r2;GPT-3;model;;;18.0;data-based;https://arxiv.org/abs/2005.14165;13
487
+ mandarjoshi/trivia_qa;;GPT-3;model;;17.0;;data-based;https://arxiv.org/abs/2005.14165;13
488
+ facebook/anli;test_r3;GPT-3;model;;;16.0;data-based;https://arxiv.org/abs/2005.14165;13
489
+ wmt/wmt16;fr-en;GPT-3;model;;;14.0;data-based;https://arxiv.org/abs/2005.14165;13
490
+ wmt/wmt16;en-fr;GPT-3;model;;;14.0;data-based;https://arxiv.org/abs/2005.14165;13
491
+ super_glue;rte;GPT-3;model;;8.0;;data-based;https://arxiv.org/abs/2005.14165;13
492
+ super_glue;wic;GPT-3;model;;8.0;;data-based;https://arxiv.org/abs/2005.14165;13
493
+ super_glue;cb;GPT-3;model;;7.0;;data-based;https://arxiv.org/abs/2005.14165;13
494
+ Reversed Words;;GPT-3;model;;7.0;;data-based;https://arxiv.org/abs/2005.14165;13
495
+ Anagrams 2;;GPT-3;model;;7.0;;data-based;https://arxiv.org/abs/2005.14165;13
496
+ allenai/openbookqa;;GPT-3;model;;;6.0;data-based;https://arxiv.org/abs/2005.14165;13
497
+ ibragim-bad/arc_easy;;GPT-3;model;;;4.0;data-based;https://arxiv.org/abs/2005.14165;13
498
+ Anagrams 1;;GPT-3;model;;3.0;;data-based;https://arxiv.org/abs/2005.14165;13
499
+ ibragim-bad/arc_challenge;;GPT-3;model;;;3.0;data-based;https://arxiv.org/abs/2005.14165;13
500
+ super_glue;copa;GPT-3;model;;3.0;;data-based;https://arxiv.org/abs/2005.14165;13
501
+ Rowan/hellaswag;;GPT-3;model;;2.0;;data-based;https://arxiv.org/abs/2005.14165;13
502
+ natural_questions;;GPT-3;model;;;1.0;data-based;https://arxiv.org/abs/2005.14165;13
503
+ Cycled Letters;;GPT-3;model;;1.0;;data-based;https://arxiv.org/abs/2005.14165;13
504
+ SAT Analogies;;GPT-3;model;;1.0;;data-based;https://arxiv.org/abs/2005.14165;13
505
+
506
+ EdinburghNLP/xsum;;PaLM 2;model;;;42.0;data-based;https://arxiv.org/abs/2305.10403;13
507
+ csebuetnlp/xlsum;;PaLM 2;model;;;46.9;data-based;https://arxiv.org/abs/2305.10403;13
508
+ wiki_lingua;;PaLM 2;model;;;9.0;data-based;https://arxiv.org/abs/2305.10403;13
509
+
510
+ winograd_wsc;;PaLM;model;;;38.5;data-based;https://arxiv.org/abs/2204.02311;13
511
+ rmanluo/RoG-webqsp;;PaLM;model;;;26.7;data-based;https://arxiv.org/abs/2204.02311;13
512
+ super_glue;wsc;PaLM;model;;;36.8;data-based;https://arxiv.org/abs/2204.02311;13
513
+ mandarjoshi/trivia_qa;;PaLM;model;;19.9;;data-based;https://arxiv.org/abs/2204.02311;13
514
+ rajpurkar/squad_v2;;PaLM;model;;85.2;;data-based;https://arxiv.org/abs/2204.02311;13
515
+ super_glue;record;PaLM;model;;43.4;;data-based;https://arxiv.org/abs/2204.02311;13
516
+ cimec/lambada;;PaLM;model;;;29.3;data-based;https://arxiv.org/abs/2204.02311;13
517
+ super_glue;cb;PaLM;model;;48.2;;data-based;https://arxiv.org/abs/2204.02311;13
518
+ ibragim-bad/arc_easy;;PaLM;model;;;30.4;data-based;https://arxiv.org/abs/2204.02311;13
519
+ ibragim-bad/arc_challenge;;PaLM;model;;;24.7;data-based;https://arxiv.org/abs/2204.02311;13
520
+
521
+ winograd_wsc;;GLaM;model;;67.3;;data-based;https://arxiv.org/abs/2112.06905;13
522
+ winogrande;;GLaM;model;;;0.3;data-based;https://arxiv.org/abs/2112.06905;13
523
+ super_glue;wic;GLaM;model;;8.2;;data-based;https://arxiv.org/abs/2112.06905;13
524
+ super_glue;wsc;GLaM;model;;57.5;;data-based;https://arxiv.org/abs/2112.06905;13
525
+ mandarjoshi/trivia_qa;;GLaM;model;;18.8;;data-based;https://arxiv.org/abs/2112.06905;13
526
+ story_cloze;;GLaM;model;;100.0;;data-based;https://arxiv.org/abs/2112.06905;13
527
+ rajpurkar/squad_v2;;GLaM;model;;94.6;;data-based;https://arxiv.org/abs/2112.06905;13
528
+ super_glue;record;GLaM;model;;98.6;;data-based;https://arxiv.org/abs/2112.06905;13
529
+ super_glue;rte;GLaM;model;;54.9;;data-based;https://arxiv.org/abs/2112.06905;13
530
+ race;middle;GLaM;model;;58.4;;data-based;https://arxiv.org/abs/2112.06905;13
531
+ race;high;GLaM;model;;74.0;;data-based;https://arxiv.org/abs/2112.06905;13
532
+ quac;;GLaM;model;;99.9;;data-based;https://arxiv.org/abs/2112.06905;13
533
+ piqa;;GLaM;model;;49.8;;data-based;https://arxiv.org/abs/2112.06905;13
534
+ allenai/openbookqa;;GLaM;model;;20.0;;data-based;https://arxiv.org/abs/2112.06905;13
535
+ natural_questions;;GLaM;model;;3.9;;data-based;https://arxiv.org/abs/2112.06905;13
536
+ super_glue;multirc;GLaM;model;;68.8;;data-based;https://arxiv.org/abs/2112.06905;13
537
+ cimec/lambada;;GLaM;model;;;21.8;data-based;https://arxiv.org/abs/2112.06905;13
538
+ Rowan/hellaswag;;GLaM;model;;19.8;;data-based;https://arxiv.org/abs/2112.06905;13
539
+ stanfordnlp/coqa;;GLaM;model;;;75.0;data-based;https://arxiv.org/abs/2112.06905;13
540
+ super_glue;copa;GLaM;model;;3.0;;data-based;https://arxiv.org/abs/2112.06905;13
541
+ super_glue;cb;GLaM;model;;26.8;;data-based;https://arxiv.org/abs/2112.06905;13
542
+ super_glue;boolq;GLaM;model;;92.1;;data-based;https://arxiv.org/abs/2112.06905;13
543
+ ibragim-bad/arc_easy;;GLaM;model;;32.5;;data-based;https://arxiv.org/abs/2112.06905;13
544
+ ibragim-bad/arc_challenge;;GLaM;model;;31.8;;data-based;https://arxiv.org/abs/2112.06905;13
545
+ facebook/anli;dev_r3;GLaM;model;;40.7;;data-based;https://arxiv.org/abs/2112.06905;13
546
+ facebook/anli;dev_r2;GLaM;model;;96.8;;data-based;https://arxiv.org/abs/2112.06905;13
547
+ facebook/anli;dev_r1;GLaM;model;;96.2;;data-based;https://arxiv.org/abs/2112.06905;13
548
+
549
+ winogrande;;FLAN;model;;;0.2;data-based;https://arxiv.org/abs/2109.01652;13
550
+ mandarjoshi/trivia_qa;;FLAN;model;;22.8;;data-based;https://arxiv.org/abs/2109.01652;13
551
+ story_cloze;;FLAN;model;;0.4;;data-based;https://arxiv.org/abs/2109.01652;13
552
+ rajpurkar/squad_v2;;FLAN;model;;99.1;;data-based;https://arxiv.org/abs/2109.01652;13
553
+ wmt/wmt16;ro-en;FLAN;model;;;12.4;data-based;https://arxiv.org/abs/2109.01652;13
554
+ super_glue;record;FLAN;model;;68.0;;data-based;https://arxiv.org/abs/2109.01652;13
555
+ super_glue;rte;FLAN;model;;33.9;;data-based;https://arxiv.org/abs/2109.01652;13
556
+ piqa;;FLAN;model;;51.3;;data-based;https://arxiv.org/abs/2109.01652;13
557
+ allenai/openbookqa;;FLAN;model;;15.0;;data-based;https://arxiv.org/abs/2109.01652;13
558
+ natural_questions;;FLAN;model;;3.2;;data-based;https://arxiv.org/abs/2109.01652;13
559
+ super_glue;multirc;FLAN;model;;59.3;;data-based;https://arxiv.org/abs/2109.01652;13
560
+ Rowan/hellaswag;;FLAN;model;;34.5;;data-based;https://arxiv.org/abs/2109.01652;13
561
+ wmt/wmt16;fr-en;FLAN;model;;;25.3;data-based;https://arxiv.org/abs/2109.01652;13
562
+ wmt/wmt16;en-ro;FLAN;model;;;12.4;data-based;https://arxiv.org/abs/2109.01652;13
563
+ wmt/wmt16;en-fr;FLAN;model;;;25.3;data-based;https://arxiv.org/abs/2109.01652;13
564
+ wmt/wmt16;en-de;FLAN;model;;;14.3;data-based;https://arxiv.org/abs/2109.01652;13
565
+ wmt/wmt16;de-en;FLAN;model;;;14.3;data-based;https://arxiv.org/abs/2109.01652;13
566
+ ucinlp/drop;;FLAN;model;;99.4;;data-based;https://arxiv.org/abs/2109.01652;13
567
+ super_glue;copa;FLAN;model;;9.0;;data-based;https://arxiv.org/abs/2109.01652;13
568
+ super_glue;cb;FLAN;model;;5.4;;data-based;https://arxiv.org/abs/2109.01652;13
569
+ super_glue;boolq;FLAN;model;;23.1;;data-based;https://arxiv.org/abs/2109.01652;13
570
+ ibragim-bad/arc_easy;;FLAN;model;;20.2;;data-based;https://arxiv.org/abs/2109.01652;13
571
+ ibragim-bad/arc_challenge;;FLAN;model;;15.6;;data-based;https://arxiv.org/abs/2109.01652;13
572
+ facebook/anli;dev_r3;FLAN;model;;40.2;;data-based;https://arxiv.org/abs/2109.01652;13
573
+ facebook/anli;dev_r2;FLAN;model;;97.9;;data-based;https://arxiv.org/abs/2109.01652;13
574
+ facebook/anli;dev_r1;FLAN;model;;98.6;;data-based;https://arxiv.org/abs/2109.01652;13