sileod
/

deberta-v3-large-tasksource-nli

@@ -218,7 +218,6 @@
     4,
     2,
     8,
-    2,
     4,
     2,
     2,
@@ -229,35 +228,36 @@
     3,
     3,
     20,
     174,
     2,
     2,
     2,
     2,
     2,
-    41,
-    51,
-    3,
     2,
     3,
-    18,
-    17,
     3,
     2,
-    16,
     2,
     2,
-    8,
     2,
     2,
-    7,
-    4,
-    7,
     3,
     42,
     3,
     12,
-    11,
     100,
     13,
     100,
@@ -287,29 +287,29 @@
     28,
     3,
     6,
-    5,
     7,
     3,
-    6,
     4,
     2,
     20,
-    6,
     2,
     2,
     2,
     2,
     2,
     7,
     2,
     2,
     3,
     4,
-    9,
     2,
-    4,
     3,
-    13,
     2,
     2,
     2,
@@ -487,7 +487,11 @@
     1,
     2,
     3,
     3,
     2,
     3,
     3,
@@ -605,106 +609,106 @@
     "model-written-evals",
     "truthful_qa/multiple_choice",
     "fig-qa",
-    "bigbench/logical_sequence",
-    "bigbench/snarks",
-    "bigbench/general_knowledge",
-    "bigbench/moral_permissibility",
-    "bigbench/figure_of_speech_detection",
-    "bigbench/abstract_narrative_understanding",
-    "bigbench/anachronisms",
-    "bigbench/vitaminc_fact_verification",
-    "bigbench/authorship_verification",
     "bigbench/penguins_in_a_table",
-    "bigbench/play_dialog_same_or_different",
-    "bigbench/physical_intuition",
-    "bigbench/empirical_judgments",
-    "bigbench/checkmate_in_one",
-    "bigbench/metaphor_understanding",
-    "bigbench/cs_algorithms",
-    "bigbench/dyck_languages",
     "bigbench/dark_humor_detection",
     "bigbench/fantasy_reasoning",
     "bigbench/odd_one_out",
     "bigbench/epistemic_reasoning",
-    "bigbench/identify_odd_metaphor",
-    "bigbench/discourse_marker_prediction",
     "bigbench/question_selection",
     "bigbench/geometric_shapes",
-    "bigbench/date_understanding",
-    "bigbench/disambiguation_qa",
-    "bigbench/strategyqa",
-    "bigbench/color",
     "bigbench/elementary_math_qa",
-    "bigbench/mathematical_induction",
-    "bigbench/strange_stories",
-    "bigbench/logical_args",
-    "bigbench/cifar10_classification",
-    "bigbench/evaluating_information_essentiality",
     "bigbench/novel_concepts",
-    "bigbench/hyperbaton",
-    "bigbench/fact_checker",
-    "bigbench/sentence_ambiguity",
-    "bigbench/social_iqa",
-    "bigbench/identify_math_theorems",
-    "bigbench/cause_and_effect",
     "bigbench/misconceptions",
-    "bigbench/causal_judgment",
-    "bigbench/international_phonetic_alphabet_nli",
-    "bigbench/implicit_relations",
     "bigbench/salient_translation_error_detection",
     "bigbench/logical_deduction",
-    "bigbench/known_unknowns",
-    "bigbench/arithmetic",
-    "bigbench/sports_understanding",
-    "bigbench/navigate",
-    "bigbench/irony_identification",
     "bigbench/hindu_knowledge",
-    "bigbench/mnist_ascii",
-    "bigbench/social_support",
-    "bigbench/presuppositions_as_nli",
-    "bigbench/tracking_shuffled_objects",
-    "bigbench/winowhy",
-    "bigbench/formal_fallacies_syllogisms_negation",
-    "bigbench/emoji_movie",
-    "bigbench/code_line_description",
-    "bigbench/logical_fallacy_detection",
-    "bigbench/intent_recognition",
-    "bigbench/bbq_lite_json",
-    "bigbench/metaphor_boolean",
-    "bigbench/analytic_entailment",
     "bigbench/unit_interpretation",
     "bigbench/analogical_similarity",
-    "bigbench/symbol_interpretation",
-    "bigbench/contextual_parametric_knowledge_conflicts",
-    "bigbench/conceptual_combinations",
-    "bigbench/temporal_sequences",
-    "bigbench/english_proverbs",
-    "bigbench/gre_reading_comprehension",
-    "bigbench/suicide_risk",
-    "bigbench/emojis_emotion_prediction",
-    "bigbench/phrase_relatedness",
     "bigbench/understanding_fables",
-    "bigbench/riddle_sense",
-    "bigbench/ruin_names",
-    "bigbench/physics",
-    "bigbench/reasoning_about_colored_objects",
     "bigbench/timedial",
-    "bigbench/hhh_alignment",
-    "bigbench/nonsense_words_grammar",
-    "bigbench/crass_ai",
-    "bigbench/undo_permutation",
-    "bigbench/simple_ethical_questions",
-    "bigbench/movie_recommendation",
-    "bigbench/crash_blossom",
-    "bigbench/entailed_polarity",
-    "bigbench/goal_step_wikihow",
-    "bigbench/key_value_maps",
-    "bigbench/real_or_fake_text",
-    "bigbench/human_organs_senses",
-    "bigbench/logic_grid_puzzle",
-    "bigbench/implicatures",
-    "bigbench/similarities_abstraction",
-    "bigbench/movie_dialog_same_or_different",
     "cos_e/v1.0",
     "cosmos_qa",
     "dream",
@@ -743,7 +747,6 @@
     "rumoureval_2019/RumourEval2019",
     "ethos/binary",
     "ethos/multilabel",
-    "tweet_eval/hate",
     "tweet_eval/emotion",
     "tweet_eval/irony",
     "tweet_eval/offensive",
@@ -754,35 +757,36 @@
     "tweet_eval/stance_feminist",
     "tweet_eval/stance_hillary",
     "tweet_eval/emoji",
     "discovery/discovery",
-    "pragmeval/squinky-formality",
     "pragmeval/emobank-valence",
     "pragmeval/emobank-dominance",
     "pragmeval/squinky-implicature",
     "pragmeval/squinky-informativeness",
-    "pragmeval/switchboard",
     "pragmeval/mrda",
     "pragmeval/verifiability",
-    "pragmeval/emobank-arousal",
-    "pragmeval/emergent",
-    "pragmeval/stac",
-    "pragmeval/gum",
     "pragmeval/persuasiveness-claimtype",
     "pragmeval/persuasiveness-eloquence",
-    "pragmeval/pdtb",
-    "pragmeval/persuasiveness-relevance",
-    "pragmeval/sarcasm",
     "pragmeval/persuasiveness-premisetype",
-    "pragmeval/persuasiveness-strength",
     "pragmeval/persuasiveness-specificity",
-    "silicone/dyda_e",
-    "silicone/dyda_da",
-    "silicone/meld_e",
-    "silicone/meld_s",
-    "silicone/oasis",
     "silicone/sem",
     "silicone/maptask",
-    "silicone/iemocap",
     "lex_glue/eurlex",
     "lex_glue/scotus",
     "lex_glue/ledgar",
@@ -812,29 +816,29 @@
     "go_emotions/simplified",
     "scicite",
     "liar",
-    "lexical_relation_classification/CogALexV",
     "lexical_relation_classification/EVALution",
     "lexical_relation_classification/ROOT09",
-    "lexical_relation_classification/BLESS",
     "lexical_relation_classification/K&H+N",
     "linguisticprobing/bigram_shift",
     "linguisticprobing/top_constituents",
-    "linguisticprobing/sentence_length",
     "linguisticprobing/subj_number",
-    "linguisticprobing/obj_number",
-    "linguisticprobing/past_present",
     "linguisticprobing/odd_man_out",
     "linguisticprobing/coordination_inversion",
     "linguisticprobing/tree_depth",
     "crowdflower/tweet_global_warming",
-    "crowdflower/political-media-audience",
-    "crowdflower/economic-news",
-    "crowdflower/sentiment_nuclear_power",
     "crowdflower/political-media-message",
     "crowdflower/political-media-bias",
-    "crowdflower/corporate-messaging",
     "crowdflower/airline-sentiment",
-    "crowdflower/text_emotion",
     "ethics/commonsense",
     "ethics/deontology",
     "ethics/justice",
@@ -899,8 +903,8 @@
     "scruples",
     "wouldyourather",
     "attempto-nli",
-    "defeasible-nli/atomic",
     "defeasible-nli/snli",
     "help-nli",
     "nli-veridicality-transitivity",
     "natural-language-satisfiability",
@@ -923,8 +927,8 @@
     "redefine-math",
     "puzzte",
     "implicatures",
-    "race/high",
     "race/middle",
     "race-c",
     "spartqa-yn",
     "spartqa-mchoice",
@@ -950,10 +954,10 @@
     "oasst1_dense_flat/helpfulness",
     "PARARULE-Plus",
     "mindgames",
-    "universal_dependencies/en_ewt/deprel",
     "universal_dependencies/en_gum/deprel",
-    "universal_dependencies/en_lines/deprel",
     "universal_dependencies/en_partut/deprel",
     "ambient",
     "path-naturalness-prediction",
     "civil_comments/toxicity",
@@ -1012,7 +1016,11 @@
     "lsat_qa/all",
     "apt",
     "twitter-financial-news-sentiment",
     "SpaceNLI",
     "babi_nli",
     "gen_debiased_nli",
     "imppres/presupposition",

     4,
     2,
     8,
     4,
     2,
     2,
     3,
     3,
     20,
+    2,
     174,
     2,
+    41,
     2,
     2,
     2,
     2,
     2,
+    51,
     3,
+    16,
     3,
     2,
+    8,
+    17,
+    18,
     2,
     2,
     2,
     2,
+    3,
+    11,
     3,
     42,
     3,
+    7,
     12,
+    7,
+    4,
     100,
     13,
     100,
     28,
     3,
     6,
+    6,
     7,
     3,
+    5,
     4,
     2,
     20,
     2,
     2,
     2,
     2,
     2,
+    6,
     7,
     2,
+    13,
+    9,
     2,
     3,
     4,
     2,
     3,
+    4,
     2,
     2,
     2,
     1,
     2,
     3,
+    2,
     3,
+    3,
+    2,
+    2,
     2,
     3,
     3,
     "model-written-evals",
     "truthful_qa/multiple_choice",
     "fig-qa",
+    "bigbench/mathematical_induction",
     "bigbench/penguins_in_a_table",
+    "bigbench/strategyqa",
     "bigbench/dark_humor_detection",
+    "bigbench/social_support",
+    "bigbench/crass_ai",
+    "bigbench/real_or_fake_text",
+    "bigbench/symbol_interpretation",
+    "bigbench/tracking_shuffled_objects",
     "bigbench/fantasy_reasoning",
+    "bigbench/cause_and_effect",
+    "bigbench/dyck_languages",
+    "bigbench/known_unknowns",
     "bigbench/odd_one_out",
+    "bigbench/cs_algorithms",
+    "bigbench/crash_blossom",
+    "bigbench/nonsense_words_grammar",
+    "bigbench/snarks",
+    "bigbench/cifar10_classification",
+    "bigbench/emojis_emotion_prediction",
+    "bigbench/contextual_parametric_knowledge_conflicts",
+    "bigbench/checkmate_in_one",
+    "bigbench/metaphor_understanding",
+    "bigbench/evaluating_information_essentiality",
+    "bigbench/international_phonetic_alphabet_nli",
+    "bigbench/temporal_sequences",
+    "bigbench/authorship_verification",
+    "bigbench/logical_fallacy_detection",
+    "bigbench/anachronisms",
+    "bigbench/fact_checker",
+    "bigbench/analytic_entailment",
+    "bigbench/english_proverbs",
+    "bigbench/strange_stories",
+    "bigbench/identify_math_theorems",
+    "bigbench/conceptual_combinations",
+    "bigbench/mnist_ascii",
+    "bigbench/goal_step_wikihow",
     "bigbench/epistemic_reasoning",
+    "bigbench/implicatures",
     "bigbench/question_selection",
+    "bigbench/suicide_risk",
+    "bigbench/reasoning_about_colored_objects",
+    "bigbench/riddle_sense",
+    "bigbench/formal_fallacies_syllogisms_negation",
+    "bigbench/entailed_polarity",
+    "bigbench/winowhy",
+    "bigbench/movie_recommendation",
+    "bigbench/empirical_judgments",
     "bigbench/geometric_shapes",
+    "bigbench/moral_permissibility",
+    "bigbench/presuppositions_as_nli",
+    "bigbench/social_iqa",
+    "bigbench/undo_permutation",
+    "bigbench/intent_recognition",
+    "bigbench/phrase_relatedness",
+    "bigbench/similarities_abstraction",
     "bigbench/elementary_math_qa",
     "bigbench/novel_concepts",
+    "bigbench/play_dialog_same_or_different",
+    "bigbench/key_value_maps",
+    "bigbench/figure_of_speech_detection",
+    "bigbench/metaphor_boolean",
+    "bigbench/date_understanding",
+    "bigbench/simple_ethical_questions",
+    "bigbench/emoji_movie",
+    "bigbench/ruin_names",
+    "bigbench/abstract_narrative_understanding",
+    "bigbench/physics",
     "bigbench/misconceptions",
+    "bigbench/movie_dialog_same_or_different",
+    "bigbench/identify_odd_metaphor",
+    "bigbench/navigate",
     "bigbench/salient_translation_error_detection",
+    "bigbench/causal_judgment",
+    "bigbench/code_line_description",
+    "bigbench/gre_reading_comprehension",
     "bigbench/logical_deduction",
     "bigbench/hindu_knowledge",
+    "bigbench/physical_intuition",
+    "bigbench/color",
     "bigbench/unit_interpretation",
+    "bigbench/bbq_lite_json",
+    "bigbench/logic_grid_puzzle",
+    "bigbench/hhh_alignment",
     "bigbench/analogical_similarity",
+    "bigbench/implicit_relations",
+    "bigbench/vitaminc_fact_verification",
+    "bigbench/human_organs_senses",
+    "bigbench/arithmetic",
+    "bigbench/discourse_marker_prediction",
+    "bigbench/general_knowledge",
+    "bigbench/hyperbaton",
+    "bigbench/logical_sequence",
+    "bigbench/disambiguation_qa",
+    "bigbench/sentence_ambiguity",
+    "bigbench/irony_identification",
+    "bigbench/sports_understanding",
     "bigbench/understanding_fables",
+    "bigbench/logical_args",
     "bigbench/timedial",
     "cos_e/v1.0",
     "cosmos_qa",
     "dream",
     "rumoureval_2019/RumourEval2019",
     "ethos/binary",
     "ethos/multilabel",
     "tweet_eval/emotion",
     "tweet_eval/irony",
     "tweet_eval/offensive",
     "tweet_eval/stance_feminist",
     "tweet_eval/stance_hillary",
     "tweet_eval/emoji",
+    "tweet_eval/hate",
     "discovery/discovery",
     "pragmeval/emobank-valence",
+    "pragmeval/switchboard",
     "pragmeval/emobank-dominance",
+    "pragmeval/emobank-arousal",
+    "pragmeval/squinky-formality",
     "pragmeval/squinky-implicature",
     "pragmeval/squinky-informativeness",
     "pragmeval/mrda",
     "pragmeval/verifiability",
+    "pragmeval/pdtb",
     "pragmeval/persuasiveness-claimtype",
     "pragmeval/persuasiveness-eloquence",
     "pragmeval/persuasiveness-premisetype",
+    "pragmeval/gum",
+    "pragmeval/stac",
     "pragmeval/persuasiveness-specificity",
+    "pragmeval/persuasiveness-strength",
+    "pragmeval/sarcasm",
+    "pragmeval/persuasiveness-relevance",
+    "pragmeval/emergent",
+    "silicone/iemocap",
     "silicone/sem",
+    "silicone/oasis",
+    "silicone/meld_s",
+    "silicone/meld_e",
     "silicone/maptask",
+    "silicone/dyda_e",
+    "silicone/dyda_da",
     "lex_glue/eurlex",
     "lex_glue/scotus",
     "lex_glue/ledgar",
     "go_emotions/simplified",
     "scicite",
     "liar",
+    "lexical_relation_classification/BLESS",
     "lexical_relation_classification/EVALution",
     "lexical_relation_classification/ROOT09",
+    "lexical_relation_classification/CogALexV",
     "lexical_relation_classification/K&H+N",
     "linguisticprobing/bigram_shift",
     "linguisticprobing/top_constituents",
     "linguisticprobing/subj_number",
     "linguisticprobing/odd_man_out",
     "linguisticprobing/coordination_inversion",
+    "linguisticprobing/obj_number",
+    "linguisticprobing/past_present",
+    "linguisticprobing/sentence_length",
     "linguisticprobing/tree_depth",
     "crowdflower/tweet_global_warming",
+    "crowdflower/text_emotion",
     "crowdflower/political-media-message",
     "crowdflower/political-media-bias",
     "crowdflower/airline-sentiment",
+    "crowdflower/sentiment_nuclear_power",
+    "crowdflower/political-media-audience",
+    "crowdflower/economic-news",
+    "crowdflower/corporate-messaging",
     "ethics/commonsense",
     "ethics/deontology",
     "ethics/justice",
     "scruples",
     "wouldyourather",
     "attempto-nli",
     "defeasible-nli/snli",
+    "defeasible-nli/atomic",
     "help-nli",
     "nli-veridicality-transitivity",
     "natural-language-satisfiability",
     "redefine-math",
     "puzzte",
     "implicatures",
     "race/middle",
+    "race/high",
     "race-c",
     "spartqa-yn",
     "spartqa-mchoice",
     "oasst1_dense_flat/helpfulness",
     "PARARULE-Plus",
     "mindgames",
     "universal_dependencies/en_gum/deprel",
+    "universal_dependencies/en_ewt/deprel",
     "universal_dependencies/en_partut/deprel",
+    "universal_dependencies/en_lines/deprel",
     "ambient",
     "path-naturalness-prediction",
     "civil_comments/toxicity",
     "lsat_qa/all",
     "apt",
     "twitter-financial-news-sentiment",
+    "icl-symbol-tuning-instruct",
     "SpaceNLI",
+    "propsegment/nli",
+    "HatemojiBuild",
+    "regset",
     "babi_nli",
     "gen_debiased_nli",
     "imppres/presupposition",

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:cc7a150f04b55cf0740b9ab332e6adf1634b23f7bf5aab69d8f3d0c5c87e0efd
 size 1740400377

 version https://git-lfs.github.com/spec/v1
+oid sha256:40e81d769bb3606dbffbdddf48cd39cf5945e30bcad841cb100e70cf4258a756
 size 1740400377