sileod
/

deberta-v3-large-tasksource-nli

@@ -1,5 +1,5 @@
 {
-  "_name_or_path": "mt-428-30000",
   "architectures": [
     "DebertaV2ForSequenceClassification"
   ],
@@ -243,46 +243,46 @@
     4,
     2,
     8,
-    20,
-    4,
-    2,
-    2,
     3,
-    2,
     3,
     3,
     3,
     3,
     3,
     174,
-    2,
     3,
     2,
     2,
     2,
     2,
-    41,
-    51,
     2,
-    8,
     2,
-    16,
     18,
     2,
     2,
-    17,
     2,
-    3,
     2,
     3,
-    12,
     42,
     3,
     7,
-    11,
     7,
     4,
-    3,
     100,
     13,
     100,
@@ -313,33 +313,33 @@
     28,
     3,
     6,
-    7,
     6,
     5,
-    3,
     4,
     2,
     2,
-    6,
     2,
     7,
     2,
     2,
     2,
-    20,
-    4,
     2,
     3,
     4,
     3,
     2,
-    2,
     9,
     13,
     2,
     2,
     2,
     2,
     4,
     1,
     2,
@@ -430,6 +430,27 @@
     1,
     4,
     1,
     2,
     1,
     1
@@ -496,9 +517,9 @@
     "recast/recast_factuality",
     "recast/recast_puns",
     "recast/recast_kg_relations",
-    "recast/recast_sentiment",
     "recast/recast_megaveridicality",
     "recast/recast_verbcorner",
     "probability_words_nli/usnli",
     "probability_words_nli/reasoning_2hop",
     "probability_words_nli/reasoning_1hop",
@@ -533,29 +554,29 @@
     "gen_debiased_nli/mnli_z_aug",
     "gen_debiased_nli/mnli_seq_z",
     "add_one_rte",
-    "imppres/presupposition_change_of_state/presupposition",
-    "imppres/presupposition_all_n_presupposition/presupposition",
-    "imppres/presupposition_question_presupposition/presupposition",
-    "imppres/presupposition_possessed_definites_uniqueness/presupposition",
-    "imppres/presupposition_possessed_definites_existence/presupposition",
     "imppres/presupposition_only_presupposition/presupposition",
     "imppres/presupposition_cleft_uniqueness/presupposition",
-    "imppres/presupposition_cleft_existence/presupposition",
     "imppres/presupposition_both_presupposition/presupposition",
-    "imppres/implicature_quantifiers/prag",
     "imppres/implicature_numerals_2_3/prag",
-    "imppres/implicature_modals/prag",
-    "imppres/implicature_numerals_10_100/prag",
-    "imppres/implicature_gradable_adjective/prag",
     "imppres/implicature_connectives/prag",
     "imppres/implicature_gradable_verb/prag",
-    "imppres/implicature_quantifiers/log",
-    "imppres/implicature_numerals_2_3/log",
-    "imppres/implicature_numerals_10_100/log",
-    "imppres/implicature_modals/log",
     "imppres/implicature_gradable_verb/log",
-    "imppres/implicature_gradable_adjective/log",
     "imppres/implicature_connectives/log",
     "glue_diagnostics/diagnostics",
     "hlgd",
     "paws/labeled_final",
@@ -569,106 +590,106 @@
     "model-written-evals",
     "truthful_qa/multiple_choice",
     "fig-qa",
-    "bigbench/bbq_lite_json",
-    "bigbench/social_support",
-    "bigbench/irony_identification",
-    "bigbench/snarks",
-    "bigbench/presuppositions_as_nli",
-    "bigbench/logical_fallacy_detection",
-    "bigbench/mathematical_induction",
-    "bigbench/timedial",
     "bigbench/logical_args",
-    "bigbench/causal_judgment",
-    "bigbench/authorship_verification",
-    "bigbench/discourse_marker_prediction",
-    "bigbench/identify_odd_metaphor",
-    "bigbench/mnist_ascii",
-    "bigbench/empirical_judgments",
-    "bigbench/human_organs_senses",
-    "bigbench/phrase_relatedness",
-    "bigbench/similarities_abstraction",
-    "bigbench/elementary_math_qa",
-    "bigbench/general_knowledge",
-    "bigbench/odd_one_out",
-    "bigbench/physical_intuition",
-    "bigbench/english_proverbs",
-    "bigbench/key_value_maps",
-    "bigbench/fact_checker",
-    "bigbench/real_or_fake_text",
-    "bigbench/movie_recommendation",
-    "bigbench/implicit_relations",
-    "bigbench/cause_and_effect",
-    "bigbench/crass_ai",
-    "bigbench/emoji_movie",
-    "bigbench/formal_fallacies_syllogisms_negation",
-    "bigbench/cs_algorithms",
-    "bigbench/salient_translation_error_detection",
-    "bigbench/metaphor_understanding",
-    "bigbench/play_dialog_same_or_different",
     "bigbench/sports_understanding",
-    "bigbench/understanding_fables",
-    "bigbench/nonsense_words_grammar",
-    "bigbench/misconceptions",
-    "bigbench/moral_permissibility",
     "bigbench/color",
-    "bigbench/metaphor_boolean",
-    "bigbench/hyperbaton",
     "bigbench/arithmetic",
-    "bigbench/reasoning_about_colored_objects",
-    "bigbench/social_iqa",
-    "bigbench/symbol_interpretation",
-    "bigbench/crash_blossom",
-    "bigbench/undo_permutation",
-    "bigbench/implicatures",
-    "bigbench/question_selection",
-    "bigbench/code_line_description",
     "bigbench/dark_humor_detection",
-    "bigbench/disambiguation_qa",
-    "bigbench/contextual_parametric_knowledge_conflicts",
-    "bigbench/entailed_polarity",
-    "bigbench/ruin_names",
     "bigbench/international_phonetic_alphabet_nli",
     "bigbench/conceptual_combinations",
-    "bigbench/strange_stories",
     "bigbench/evaluating_information_essentiality",
-    "bigbench/fantasy_reasoning",
     "bigbench/physics",
-    "bigbench/sentence_ambiguity",
-    "bigbench/intent_recognition",
-    "bigbench/checkmate_in_one",
-    "bigbench/analogical_similarity",
-    "bigbench/identify_math_theorems",
-    "bigbench/movie_dialog_same_or_different",
     "bigbench/unit_interpretation",
-    "bigbench/logical_deduction",
-    "bigbench/abstract_narrative_understanding",
-    "bigbench/strategyqa",
-    "bigbench/penguins_in_a_table",
-    "bigbench/goal_step_wikihow",
-    "bigbench/hhh_alignment",
-    "bigbench/date_understanding",
-    "bigbench/cifar10_classification",
-    "bigbench/riddle_sense",
-    "bigbench/logic_grid_puzzle",
     "bigbench/suicide_risk",
     "bigbench/hindu_knowledge",
-    "bigbench/navigate",
-    "bigbench/temporal_sequences",
-    "bigbench/anachronisms",
-    "bigbench/geometric_shapes",
-    "bigbench/figure_of_speech_detection",
-    "bigbench/tracking_shuffled_objects",
     "bigbench/epistemic_reasoning",
     "bigbench/simple_ethical_questions",
     "bigbench/dyck_languages",
-    "bigbench/analytic_entailment",
-    "bigbench/winowhy",
-    "bigbench/gre_reading_comprehension",
-    "bigbench/logical_sequence",
-    "bigbench/emojis_emotion_prediction",
-    "bigbench/novel_concepts",
     "bigbench/vitaminc_fact_verification",
-    "bigbench/known_unknowns",
     "cos_e/v1.0",
     "cosmos_qa",
     "dream",
@@ -689,8 +710,8 @@
     "art",
     "winogrande/winogrande_xl",
     "codah/codah",
-    "ai2_arc/ARC-Easy/challenge",
     "ai2_arc/ARC-Challenge/challenge",
     "definite_pronoun_resolution",
     "swag",
     "math_qa",
@@ -707,46 +728,46 @@
     "rumoureval_2019/RumourEval2019",
     "ethos/binary",
     "ethos/multilabel",
-    "tweet_eval/emoji",
-    "tweet_eval/emotion",
-    "tweet_eval/hate",
     "tweet_eval/offensive",
     "tweet_eval/sentiment",
-    "tweet_eval/irony",
-    "tweet_eval/stance_atheism",
-    "tweet_eval/stance_climate",
     "tweet_eval/stance_hillary",
-    "tweet_eval/stance_feminist",
     "tweet_eval/stance_abortion",
     "discovery/discovery",
-    "pragmeval/squinky-informativeness",
     "pragmeval/verifiability",
-    "pragmeval/squinky-formality",
-    "pragmeval/squinky-implicature",
-    "pragmeval/emobank-dominance",
-    "pragmeval/emobank-arousal",
-    "pragmeval/switchboard",
     "pragmeval/mrda",
     "pragmeval/emobank-valence",
-    "pragmeval/persuasiveness-premisetype",
-    "pragmeval/persuasiveness-relevance",
-    "pragmeval/pdtb",
     "pragmeval/stac",
     "pragmeval/persuasiveness-strength",
-    "pragmeval/sarcasm",
-    "pragmeval/gum",
     "pragmeval/persuasiveness-eloquence",
     "pragmeval/persuasiveness-claimtype",
-    "pragmeval/persuasiveness-specificity",
     "pragmeval/emergent",
-    "silicone/maptask",
     "silicone/oasis",
     "silicone/meld_s",
     "silicone/meld_e",
-    "silicone/iemocap",
     "silicone/dyda_e",
     "silicone/dyda_da",
-    "silicone/sem",
     "lex_glue/eurlex",
     "lex_glue/scotus",
     "lex_glue/ledgar",
@@ -777,29 +798,29 @@
     "go_emotions/simplified",
     "scicite",
     "liar",
-    "lexical_relation_classification/EVALution",
     "lexical_relation_classification/BLESS",
     "lexical_relation_classification/CogALexV",
-    "lexical_relation_classification/ROOT09",
     "lexical_relation_classification/K&H+N",
     "linguisticprobing/bigram_shift",
     "linguisticprobing/odd_man_out",
-    "linguisticprobing/sentence_length",
     "linguisticprobing/coordination_inversion",
     "linguisticprobing/tree_depth",
-    "linguisticprobing/subj_number",
-    "linguisticprobing/obj_number",
     "linguisticprobing/past_present",
-    "linguisticprobing/top_constituents",
-    "crowdflower/sentiment_nuclear_power",
-    "crowdflower/tweet_global_warming",
-    "crowdflower/airline-sentiment",
-    "crowdflower/corporate-messaging",
-    "crowdflower/economic-news",
-    "crowdflower/political-media-bias",
     "crowdflower/political-media-audience",
     "crowdflower/political-media-message",
     "crowdflower/text_emotion",
     "ethics/commonsense",
     "ethics/deontology",
     "ethics/justice",
@@ -894,12 +915,33 @@
     "redefine-math",
     "puzzte",
     "implicatures",
     "babi_nli",
     "blimp-2",
     "mmlu-4"
   ],
   "torch_dtype": "float32",
-  "transformers_version": "4.25.1",
   "type_vocab_size": 0,
   "vocab_size": 128100
 }

 {
+  "_name_or_path": "microsoft/deberta-v3-large",
   "architectures": [
     "DebertaV2ForSequenceClassification"
   ],
     4,
     2,
     8,
     3,
     3,
+    2,
+    2,
     3,
     3,
+    20,
+    4,
     3,
+    2,
     3,
     174,
     3,
+    51,
+    41,
     2,
     2,
     2,
     2,
     2,
     2,
     18,
     2,
     2,
     2,
+    8,
     2,
     3,
+    16,
+    17,
+    3,
+    2,
     42,
     3,
     7,
+    12,
+    3,
     7,
     4,
+    11,
     100,
     13,
     100,
     28,
     3,
     6,
     6,
     5,
+    7,
     4,
+    3,
+    6,
     2,
     2,
     2,
+    20,
     7,
     2,
     2,
     2,
     2,
     3,
     4,
     3,
     2,
+    4,
     9,
     13,
     2,
     2,
     2,
     2,
+    2,
     4,
     1,
     2,
     1,
     4,
     1,
+    1,
+    1,
+    1,
+    3,
+    1,
+    3,
+    1,
+    2,
+    2,
+    1,
+    2,
+    3,
+    3,
+    2,
+    1,
+    3,
+    1,
+    1,
+    3,
+    1,
+    3,
     2,
     1,
     1
     "recast/recast_factuality",
     "recast/recast_puns",
     "recast/recast_kg_relations",
     "recast/recast_megaveridicality",
     "recast/recast_verbcorner",
+    "recast/recast_sentiment",
     "probability_words_nli/usnli",
     "probability_words_nli/reasoning_2hop",
     "probability_words_nli/reasoning_1hop",
     "gen_debiased_nli/mnli_z_aug",
     "gen_debiased_nli/mnli_seq_z",
     "add_one_rte",
     "imppres/presupposition_only_presupposition/presupposition",
+    "imppres/presupposition_question_presupposition/presupposition",
     "imppres/presupposition_cleft_uniqueness/presupposition",
     "imppres/presupposition_both_presupposition/presupposition",
+    "imppres/presupposition_all_n_presupposition/presupposition",
+    "imppres/presupposition_change_of_state/presupposition",
+    "imppres/presupposition_possessed_definites_existence/presupposition",
+    "imppres/presupposition_possessed_definites_uniqueness/presupposition",
+    "imppres/presupposition_cleft_existence/presupposition",
     "imppres/implicature_numerals_2_3/prag",
     "imppres/implicature_connectives/prag",
+    "imppres/implicature_gradable_adjective/prag",
     "imppres/implicature_gradable_verb/prag",
+    "imppres/implicature_modals/prag",
+    "imppres/implicature_numerals_10_100/prag",
+    "imppres/implicature_quantifiers/prag",
     "imppres/implicature_gradable_verb/log",
+    "imppres/implicature_modals/log",
+    "imppres/implicature_numerals_10_100/log",
+    "imppres/implicature_numerals_2_3/log",
+    "imppres/implicature_quantifiers/log",
     "imppres/implicature_connectives/log",
+    "imppres/implicature_gradable_adjective/log",
     "glue_diagnostics/diagnostics",
     "hlgd",
     "paws/labeled_final",
     "model-written-evals",
     "truthful_qa/multiple_choice",
     "fig-qa",
+    "bigbench/entailed_polarity",
     "bigbench/logical_args",
     "bigbench/sports_understanding",
     "bigbench/color",
+    "bigbench/goal_step_wikihow",
+    "bigbench/fantasy_reasoning",
+    "bigbench/navigate",
+    "bigbench/known_unknowns",
+    "bigbench/real_or_fake_text",
+    "bigbench/novel_concepts",
+    "bigbench/logical_sequence",
+    "bigbench/crass_ai",
+    "bigbench/identify_odd_metaphor",
     "bigbench/arithmetic",
+    "bigbench/elementary_math_qa",
+    "bigbench/cifar10_classification",
+    "bigbench/riddle_sense",
+    "bigbench/salient_translation_error_detection",
+    "bigbench/tracking_shuffled_objects",
     "bigbench/dark_humor_detection",
+    "bigbench/mathematical_induction",
+    "bigbench/implicit_relations",
+    "bigbench/logic_grid_puzzle",
+    "bigbench/analytic_entailment",
+    "bigbench/temporal_sequences",
+    "bigbench/question_selection",
+    "bigbench/odd_one_out",
     "bigbench/international_phonetic_alphabet_nli",
+    "bigbench/nonsense_words_grammar",
+    "bigbench/play_dialog_same_or_different",
+    "bigbench/winowhy",
+    "bigbench/causal_judgment",
+    "bigbench/disambiguation_qa",
     "bigbench/conceptual_combinations",
     "bigbench/evaluating_information_essentiality",
+    "bigbench/code_line_description",
     "bigbench/physics",
+    "bigbench/moral_permissibility",
+    "bigbench/ruin_names",
+    "bigbench/misconceptions",
+    "bigbench/general_knowledge",
+    "bigbench/phrase_relatedness",
     "bigbench/unit_interpretation",
+    "bigbench/contextual_parametric_knowledge_conflicts",
+    "bigbench/fact_checker",
+    "bigbench/identify_math_theorems",
+    "bigbench/logical_fallacy_detection",
     "bigbench/suicide_risk",
+    "bigbench/cause_and_effect",
+    "bigbench/timedial",
+    "bigbench/key_value_maps",
+    "bigbench/irony_identification",
+    "bigbench/emojis_emotion_prediction",
+    "bigbench/reasoning_about_colored_objects",
     "bigbench/hindu_knowledge",
+    "bigbench/authorship_verification",
+    "bigbench/human_organs_senses",
+    "bigbench/mnist_ascii",
     "bigbench/epistemic_reasoning",
+    "bigbench/metaphor_boolean",
+    "bigbench/strategyqa",
+    "bigbench/intent_recognition",
+    "bigbench/metaphor_understanding",
+    "bigbench/movie_recommendation",
+    "bigbench/sentence_ambiguity",
+    "bigbench/hhh_alignment",
+    "bigbench/emoji_movie",
+    "bigbench/geometric_shapes",
+    "bigbench/social_iqa",
+    "bigbench/abstract_narrative_understanding",
+    "bigbench/penguins_in_a_table",
+    "bigbench/anachronisms",
+    "bigbench/formal_fallacies_syllogisms_negation",
+    "bigbench/strange_stories",
+    "bigbench/cs_algorithms",
+    "bigbench/physical_intuition",
     "bigbench/simple_ethical_questions",
+    "bigbench/similarities_abstraction",
+    "bigbench/symbol_interpretation",
+    "bigbench/bbq_lite_json",
+    "bigbench/movie_dialog_same_or_different",
     "bigbench/dyck_languages",
+    "bigbench/analogical_similarity",
+    "bigbench/logical_deduction",
+    "bigbench/snarks",
+    "bigbench/social_support",
+    "bigbench/empirical_judgments",
+    "bigbench/date_understanding",
+    "bigbench/presuppositions_as_nli",
+    "bigbench/implicatures",
     "bigbench/vitaminc_fact_verification",
+    "bigbench/checkmate_in_one",
+    "bigbench/gre_reading_comprehension",
+    "bigbench/undo_permutation",
+    "bigbench/english_proverbs",
+    "bigbench/discourse_marker_prediction",
+    "bigbench/understanding_fables",
+    "bigbench/figure_of_speech_detection",
+    "bigbench/hyperbaton",
+    "bigbench/crash_blossom",
     "cos_e/v1.0",
     "cosmos_qa",
     "dream",
     "art",
     "winogrande/winogrande_xl",
     "codah/codah",
     "ai2_arc/ARC-Challenge/challenge",
+    "ai2_arc/ARC-Easy/challenge",
     "definite_pronoun_resolution",
     "swag",
     "math_qa",
     "rumoureval_2019/RumourEval2019",
     "ethos/binary",
     "ethos/multilabel",
+    "tweet_eval/stance_feminist",
+    "tweet_eval/stance_climate",
+    "tweet_eval/irony",
     "tweet_eval/offensive",
     "tweet_eval/sentiment",
     "tweet_eval/stance_hillary",
+    "tweet_eval/emoji",
+    "tweet_eval/emotion",
+    "tweet_eval/stance_atheism",
+    "tweet_eval/hate",
     "tweet_eval/stance_abortion",
     "discovery/discovery",
     "pragmeval/verifiability",
     "pragmeval/mrda",
+    "pragmeval/switchboard",
+    "pragmeval/emobank-arousal",
+    "pragmeval/emobank-dominance",
+    "pragmeval/squinky-informativeness",
+    "pragmeval/squinky-implicature",
+    "pragmeval/squinky-formality",
     "pragmeval/emobank-valence",
     "pragmeval/stac",
     "pragmeval/persuasiveness-strength",
+    "pragmeval/persuasiveness-specificity",
+    "pragmeval/persuasiveness-relevance",
+    "pragmeval/persuasiveness-premisetype",
     "pragmeval/persuasiveness-eloquence",
     "pragmeval/persuasiveness-claimtype",
+    "pragmeval/pdtb",
+    "pragmeval/gum",
     "pragmeval/emergent",
+    "pragmeval/sarcasm",
     "silicone/oasis",
     "silicone/meld_s",
     "silicone/meld_e",
+    "silicone/maptask",
+    "silicone/sem",
     "silicone/dyda_e",
     "silicone/dyda_da",
+    "silicone/iemocap",
     "lex_glue/eurlex",
     "lex_glue/scotus",
     "lex_glue/ledgar",
     "go_emotions/simplified",
     "scicite",
     "liar",
     "lexical_relation_classification/BLESS",
     "lexical_relation_classification/CogALexV",
+    "lexical_relation_classification/EVALution",
     "lexical_relation_classification/K&H+N",
+    "lexical_relation_classification/ROOT09",
+    "linguisticprobing/sentence_length",
     "linguisticprobing/bigram_shift",
     "linguisticprobing/odd_man_out",
     "linguisticprobing/coordination_inversion",
+    "linguisticprobing/top_constituents",
     "linguisticprobing/tree_depth",
     "linguisticprobing/past_present",
+    "linguisticprobing/obj_number",
+    "linguisticprobing/subj_number",
     "crowdflower/political-media-audience",
+    "crowdflower/economic-news",
+    "crowdflower/corporate-messaging",
+    "crowdflower/airline-sentiment",
+    "crowdflower/tweet_global_warming",
+    "crowdflower/sentiment_nuclear_power",
     "crowdflower/political-media-message",
     "crowdflower/text_emotion",
+    "crowdflower/political-media-bias",
     "ethics/commonsense",
     "ethics/deontology",
     "ethics/justice",
     "redefine-math",
     "puzzte",
     "implicatures",
+    "race/high",
+    "race/middle",
+    "race-c",
+    "spartqa-yn",
+    "spartqa-mchoice",
+    "temporal-nli",
+    "riddle_sense",
+    "clcd-english",
+    "twentyquestions",
+    "reclor",
+    "counterfactually-augmented-imdb",
+    "counterfactually-augmented-snli",
+    "cnli",
+    "boolq-natural-perturbations",
+    "acceptability-prediction",
+    "equate",
+    "ScienceQA_text_only",
+    "ekar_english",
+    "implicit-hate-stg1",
+    "chaos-mnli-ambiguity",
+    "headline_cause/en_simple",
     "babi_nli",
     "blimp-2",
     "mmlu-4"
   ],
   "torch_dtype": "float32",
+  "transformers_version": "4.26.0",
   "type_vocab_size": 0,
   "vocab_size": 128100
 }

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:2554d7be5da63af6c231f28f619fbdc205cd77c5a13a403d2479d75879720e00
-size 1740394873

 version https://git-lfs.github.com/spec/v1
+oid sha256:706433291e04d0a5099445cda6c065dc027c17490f6e29b6375f5cb2e930c24c
+size 1740400377