tasksource
/

deberta-base-long-nli

@@ -1,6 +1,4 @@
 ---
-library_name: transformers
-pipeline_tag: zero-shot-classification
 datasets:
 - nyu-mll/glue
 - aps/super_glue
@@ -289,6 +287,8 @@ datasets:
 - tasksource/wice
 - Dzeniks/hover
 - tasksource/tasksource_dpo_pairs
 ---
 # Model Card for Model ID

 ---
 datasets:
 - nyu-mll/glue
 - aps/super_glue
 - tasksource/wice
 - Dzeniks/hover
 - tasksource/tasksource_dpo_pairs
+library_name: transformers
+pipeline_tag: zero-shot-classification
 ---
 # Model Card for Model ID

config.json CHANGED Viewed

@@ -27,9 +27,9 @@
     2,
     2,
     3,
-    6,
     2,
     2,
     2,
     2,
     2,
@@ -213,46 +213,46 @@
     4,
     2,
     8,
     2,
     2,
     2,
-    4,
     3,
-    20,
     3,
     3,
     3,
     3,
     3,
     174,
     41,
     51,
     2,
-    3,
     2,
     2,
     2,
     2,
     2,
-    3,
     16,
-    17,
     2,
     8,
     2,
-    3,
-    2,
     2,
     18,
     2,
     3,
     7,
     12,
-    4,
     7,
     42,
     3,
-    11,
     100,
     13,
     100,
@@ -282,29 +282,29 @@
     28,
     3,
     6,
-    6,
-    5,
     7,
-    4,
     3,
     6,
-    20,
-    2,
-    7,
     2,
     2,
     2,
     2,
     2,
-    3,
     2,
     13,
     2,
-    4,
-    9,
     4,
     3,
     2,
     2,
     2,
     2,
@@ -440,7 +440,6 @@
     2,
     2,
     2,
-    2,
     4,
     2,
     24,
@@ -530,6 +529,7 @@
     2,
     1,
     2,
     3,
     3,
     3,
@@ -592,18 +592,18 @@
     "scitail/snli_format",
     "hans",
     "WANLI",
-    "recast/recast_kg_relations",
-    "recast/recast_sentiment",
     "recast/recast_puns",
     "recast/recast_verbnet",
     "recast/recast_verbcorner",
-    "recast/recast_factuality",
-    "recast/recast_megaveridicality",
     "recast/recast_ner",
     "probability_words_nli/reasoning_1hop",
-    "probability_words_nli/reasoning_2hop",
     "probability_words_nli/usnli",
-    "nan-nli/joey234--nan-nli",
     "nli_fever",
     "breaking_nli",
     "conj_nli",
@@ -626,13 +626,13 @@
     "robust_nli_is_sd",
     "robust_nli_li_ts",
     "add_one_rte",
-    "imppres/implicature_numerals_10_100/log",
     "imppres/implicature_modals/log",
-    "imppres/implicature_gradable_verb/log",
     "imppres/implicature_connectives/log",
-    "imppres/implicature_gradable_adjective/log",
     "imppres/implicature_numerals_2_3/log",
-    "imppres/implicature_quantifiers/log",
     "hlgd",
     "paws/labeled_final",
     "paws/labeled_swap",
@@ -640,106 +640,106 @@
     "model-written-evals",
     "truthful_qa/multiple_choice",
     "fig-qa",
     "bigbench/known_unknowns",
-    "bigbench/formal_fallacies_syllogisms_negation",
-    "bigbench/presuppositions_as_nli",
     "bigbench/metaphor_understanding",
-    "bigbench/cause_and_effect",
-    "bigbench/simple_ethical_questions",
-    "bigbench/color",
-    "bigbench/similarities_abstraction",
-    "bigbench/misconceptions",
     "bigbench/english_proverbs",
-    "bigbench/sports_understanding",
-    "bigbench/metaphor_boolean",
-    "bigbench/logical_fallacy_detection",
-    "bigbench/logic_grid_puzzle",
-    "bigbench/empirical_judgments",
-    "bigbench/mnist_ascii",
-    "bigbench/entailed_polarity",
-    "bigbench/elementary_math_qa",
-    "bigbench/gre_reading_comprehension",
     "bigbench/social_iqa",
-    "bigbench/figure_of_speech_detection",
     "bigbench/timedial",
-    "bigbench/moral_permissibility",
-    "bigbench/evaluating_information_essentiality",
-    "bigbench/implicit_relations",
     "bigbench/real_or_fake_text",
-    "bigbench/hyperbaton",
-    "bigbench/odd_one_out",
-    "bigbench/play_dialog_same_or_different",
-    "bigbench/vitaminc_fact_verification",
-    "bigbench/goal_step_wikihow",
-    "bigbench/unit_interpretation",
-    "bigbench/physics",
-    "bigbench/code_line_description",
-    "bigbench/phrase_relatedness",
-    "bigbench/general_knowledge",
     "bigbench/identify_odd_metaphor",
-    "bigbench/key_value_maps",
-    "bigbench/sentence_ambiguity",
-    "bigbench/disambiguation_qa",
-    "bigbench/movie_dialog_same_or_different",
-    "bigbench/discourse_marker_prediction",
-    "bigbench/social_support",
     "bigbench/anachronisms",
-    "bigbench/undo_permutation",
-    "bigbench/irony_identification",
-    "bigbench/nonsense_words_grammar",
     "bigbench/logical_sequence",
-    "bigbench/reasoning_about_colored_objects",
-    "bigbench/causal_judgment",
-    "bigbench/geometric_shapes",
-    "bigbench/logical_deduction",
     "bigbench/question_selection",
-    "bigbench/hhh_alignment",
-    "bigbench/analytic_entailment",
-    "bigbench/riddle_sense",
-    "bigbench/movie_recommendation",
-    "bigbench/penguins_in_a_table",
-    "bigbench/intent_recognition",
-    "bigbench/conceptual_combinations",
-    "bigbench/cs_algorithms",
     "bigbench/temporal_sequences",
-    "bigbench/salient_translation_error_detection",
-    "bigbench/abstract_narrative_understanding",
-    "bigbench/authorship_verification",
-    "bigbench/winowhy",
-    "bigbench/strategyqa",
-    "bigbench/implicatures",
-    "bigbench/snarks",
-    "bigbench/human_organs_senses",
-    "bigbench/arithmetic",
-    "bigbench/tracking_shuffled_objects",
     "bigbench/date_understanding",
-    "bigbench/understanding_fables",
-    "bigbench/checkmate_in_one",
-    "bigbench/cifar10_classification",
-    "bigbench/navigate",
-    "bigbench/ruin_names",
-    "bigbench/bbq_lite_json",
-    "bigbench/suicide_risk",
-    "bigbench/dyck_languages",
-    "bigbench/emoji_movie",
     "bigbench/contextual_parametric_knowledge_conflicts",
-    "bigbench/novel_concepts",
-    "bigbench/fantasy_reasoning",
-    "bigbench/mathematical_induction",
-    "bigbench/emojis_emotion_prediction",
-    "bigbench/symbol_interpretation",
-    "bigbench/strange_stories",
     "bigbench/identify_math_theorems",
     "bigbench/dark_humor_detection",
-    "bigbench/crass_ai",
-    "bigbench/international_phonetic_alphabet_nli",
-    "bigbench/logical_args",
-    "bigbench/epistemic_reasoning",
     "bigbench/hindu_knowledge",
-    "bigbench/physical_intuition",
-    "bigbench/crash_blossom",
-    "bigbench/analogical_similarity",
-    "bigbench/fact_checker",
     "cos_e/v1.0",
     "cosmos_qa",
     "dream",
@@ -773,51 +773,51 @@
     "toxic_conversations",
     "TuringBench",
     "trec",
-    "vitaminc/tals--vitaminc",
     "hope_edi/english",
     "rumoureval_2019/RumourEval2019",
     "ethos/binary",
     "ethos/multilabel",
-    "tweet_eval/irony",
     "tweet_eval/offensive",
-    "tweet_eval/hate",
     "tweet_eval/emotion",
     "tweet_eval/sentiment",
-    "tweet_eval/emoji",
     "tweet_eval/stance_abortion",
     "tweet_eval/stance_atheism",
     "tweet_eval/stance_climate",
     "tweet_eval/stance_feminist",
     "tweet_eval/stance_hillary",
     "discovery/discovery",
     "pragmeval/switchboard",
     "pragmeval/mrda",
     "pragmeval/squinky-informativeness",
-    "pragmeval/verifiability",
     "pragmeval/squinky-implicature",
-    "pragmeval/squinky-formality",
-    "pragmeval/emobank-valence",
-    "pragmeval/emobank-dominance",
     "pragmeval/emobank-arousal",
-    "pragmeval/emergent",
     "pragmeval/pdtb",
-    "pragmeval/gum",
-    "pragmeval/persuasiveness-eloquence",
-    "pragmeval/persuasiveness-premisetype",
-    "pragmeval/persuasiveness-relevance",
     "pragmeval/persuasiveness-claimtype",
-    "pragmeval/sarcasm",
     "pragmeval/persuasiveness-strength",
     "pragmeval/stac",
     "pragmeval/persuasiveness-specificity",
     "silicone/sem",
     "silicone/meld_e",
     "silicone/maptask",
-    "silicone/dyda_da",
     "silicone/dyda_e",
     "silicone/oasis",
     "silicone/meld_s",
-    "silicone/iemocap",
     "lex_glue/eurlex",
     "lex_glue/scotus",
     "lex_glue/ledgar",
@@ -847,29 +847,29 @@
     "go_emotions/simplified",
     "scicite",
     "liar",
-    "lexical_relation_classification/BLESS",
-    "lexical_relation_classification/CogALexV",
     "lexical_relation_classification/EVALution",
-    "lexical_relation_classification/K&H+N",
     "lexical_relation_classification/ROOT09",
     "linguisticprobing/sentence_length",
     "linguisticprobing/top_constituents",
-    "linguisticprobing/coordination_inversion",
     "linguisticprobing/tree_depth",
-    "linguisticprobing/subj_number",
-    "linguisticprobing/obj_number",
-    "linguisticprobing/past_present",
-    "linguisticprobing/bigram_shift",
     "linguisticprobing/odd_man_out",
-    "crowdflower/economic-news",
-    "crowdflower/political-media-bias",
     "crowdflower/text_emotion",
     "crowdflower/political-media-audience",
-    "crowdflower/sentiment_nuclear_power",
-    "crowdflower/political-media-message",
     "crowdflower/corporate-messaging",
     "crowdflower/airline-sentiment",
     "crowdflower/tweet_global_warming",
     "ethics/commonsense",
     "ethics/deontology",
     "ethics/justice",
@@ -891,13 +891,13 @@
     "phrase_similarity",
     "scientific-exaggeration-detection",
     "quarel",
-    "fever-evidence-related/mwong--fever-related",
     "numer_sense",
     "dynasent/dynabench.dynasent.r1.all/r1",
     "dynasent/dynabench.dynasent.r2.all/r2",
     "Sarcasm_News_Headline",
     "sem_eval_2010_task_8",
-    "auditor_review/demo-org--auditor_review",
     "medmcqa",
     "Dynasent_Disagreement",
     "Politeness_Disagreement",
@@ -1005,7 +1005,6 @@
     "subjectivity",
     "MOH",
     "VUAC",
-    "TroFi",
     "sharc_modified/mod",
     "conceptrules_v2",
     "disrpt/eng.dep.scidtb.rels",
@@ -1042,9 +1041,9 @@
     "stepgame",
     "nlgraph",
     "oasst2_pairwise_rlhf_reward",
-    "hh-rlhf/helpful-base",
-    "hh-rlhf/helpful-rejection-sampled",
     "hh-rlhf/helpful-online",
     "hh-rlhf/harmless-base",
     "ruletaker",
     "PARARULE-Plus",
@@ -1058,8 +1057,8 @@
     "lsat-ar",
     "lsat-rc",
     "biosift-nli",
-    "brainteasers/WP",
     "brainteasers/SP",
     "persuasion",
     "AmbigNQ-clarifying-question",
     "SIGA-nli",
@@ -1094,6 +1093,7 @@
     "wice",
     "hover",
     "tasksource_dpo_pairs",
     "babi_nli",
     "gen_debiased_nli",
     "imppres/presupposition",
@@ -1101,7 +1101,7 @@
     "blimp-2"
   ],
   "torch_dtype": "float32",
-  "transformers_version": "4.41.2",
   "type_vocab_size": 0,
   "vocab_size": 128100
 }

     2,
     2,
     3,
     2,
     2,
+    6,
     2,
     2,
     2,
     4,
     2,
     8,
+    20,
     2,
+    4,
     2,
     2,
     3,
     3,
     3,
     3,
     3,
     3,
     174,
+    2,
     41,
+    3,
     51,
     2,
     2,
     2,
     2,
     2,
     2,
     16,
+    3,
     2,
     8,
     2,
     2,
     18,
     2,
+    17,
+    3,
     3,
     7,
+    11,
     12,
     7,
+    4,
     42,
     3,
     100,
     13,
     100,
     28,
     3,
     6,
     7,
     3,
+    4,
+    5,
     6,
     2,
     2,
     2,
+    6,
+    20,
+    7,
     2,
     2,
     2,
+    9,
     13,
     2,
+    3,
     4,
     3,
     2,
+    4,
+    2,
     2,
     2,
     2,
     2,
     2,
     2,
     4,
     2,
     24,
     2,
     1,
     2,
+    2,
     3,
     3,
     3,
     "scitail/snli_format",
     "hans",
     "WANLI",
     "recast/recast_puns",
+    "recast/recast_factuality",
+    "recast/recast_kg_relations",
     "recast/recast_verbnet",
     "recast/recast_verbcorner",
     "recast/recast_ner",
+    "recast/recast_megaveridicality",
+    "recast/recast_sentiment",
     "probability_words_nli/reasoning_1hop",
     "probability_words_nli/usnli",
+    "probability_words_nli/reasoning_2hop",
+    "nan-nli",
     "nli_fever",
     "breaking_nli",
     "conj_nli",
     "robust_nli_is_sd",
     "robust_nli_li_ts",
     "add_one_rte",
+    "imppres/implicature_gradable_adjective/log",
     "imppres/implicature_modals/log",
+    "imppres/implicature_numerals_10_100/log",
+    "imppres/implicature_quantifiers/log",
     "imppres/implicature_connectives/log",
+    "imppres/implicature_gradable_verb/log",
     "imppres/implicature_numerals_2_3/log",
     "hlgd",
     "paws/labeled_final",
     "paws/labeled_swap",
     "model-written-evals",
     "truthful_qa/multiple_choice",
     "fig-qa",
+    "bigbench/discourse_marker_prediction",
+    "bigbench/gre_reading_comprehension",
+    "bigbench/simple_ethical_questions",
     "bigbench/known_unknowns",
+    "bigbench/fact_checker",
+    "bigbench/phrase_relatedness",
+    "bigbench/irony_identification",
+    "bigbench/crash_blossom",
+    "bigbench/physical_intuition",
+    "bigbench/analytic_entailment",
+    "bigbench/play_dialog_same_or_different",
+    "bigbench/metaphor_boolean",
+    "bigbench/undo_permutation",
+    "bigbench/disambiguation_qa",
     "bigbench/metaphor_understanding",
+    "bigbench/nonsense_words_grammar",
+    "bigbench/logical_deduction",
+    "bigbench/sentence_ambiguity",
+    "bigbench/key_value_maps",
+    "bigbench/checkmate_in_one",
+    "bigbench/code_line_description",
+    "bigbench/crass_ai",
+    "bigbench/movie_dialog_same_or_different",
+    "bigbench/strategyqa",
+    "bigbench/hhh_alignment",
     "bigbench/english_proverbs",
+    "bigbench/cs_algorithms",
+    "bigbench/formal_fallacies_syllogisms_negation",
+    "bigbench/conceptual_combinations",
+    "bigbench/geometric_shapes",
+    "bigbench/tracking_shuffled_objects",
+    "bigbench/arithmetic",
+    "bigbench/misconceptions",
+    "bigbench/odd_one_out",
+    "bigbench/international_phonetic_alphabet_nli",
     "bigbench/social_iqa",
+    "bigbench/logical_fallacy_detection",
+    "bigbench/hyperbaton",
+    "bigbench/novel_concepts",
+    "bigbench/similarities_abstraction",
     "bigbench/timedial",
+    "bigbench/salient_translation_error_detection",
+    "bigbench/cifar10_classification",
+    "bigbench/winowhy",
+    "bigbench/mathematical_induction",
     "bigbench/real_or_fake_text",
+    "bigbench/epistemic_reasoning",
+    "bigbench/riddle_sense",
     "bigbench/identify_odd_metaphor",
+    "bigbench/human_organs_senses",
+    "bigbench/emojis_emotion_prediction",
+    "bigbench/logical_args",
     "bigbench/anachronisms",
+    "bigbench/bbq_lite_json",
+    "bigbench/general_knowledge",
     "bigbench/logical_sequence",
+    "bigbench/navigate",
+    "bigbench/analogical_similarity",
+    "bigbench/authorship_verification",
+    "bigbench/elementary_math_qa",
+    "bigbench/goal_step_wikihow",
+    "bigbench/empirical_judgments",
     "bigbench/question_selection",
     "bigbench/temporal_sequences",
+    "bigbench/mnist_ascii",
+    "bigbench/color",
     "bigbench/date_understanding",
+    "bigbench/figure_of_speech_detection",
     "bigbench/contextual_parametric_knowledge_conflicts",
+    "bigbench/ruin_names",
+    "bigbench/abstract_narrative_understanding",
+    "bigbench/physics",
+    "bigbench/understanding_fables",
     "bigbench/identify_math_theorems",
+    "bigbench/penguins_in_a_table",
+    "bigbench/vitaminc_fact_verification",
+    "bigbench/social_support",
+    "bigbench/strange_stories",
     "bigbench/dark_humor_detection",
+    "bigbench/fantasy_reasoning",
+    "bigbench/logic_grid_puzzle",
+    "bigbench/emoji_movie",
+    "bigbench/moral_permissibility",
+    "bigbench/symbol_interpretation",
+    "bigbench/presuppositions_as_nli",
+    "bigbench/dyck_languages",
+    "bigbench/implicatures",
+    "bigbench/suicide_risk",
+    "bigbench/unit_interpretation",
+    "bigbench/intent_recognition",
+    "bigbench/movie_recommendation",
+    "bigbench/snarks",
+    "bigbench/evaluating_information_essentiality",
+    "bigbench/sports_understanding",
+    "bigbench/entailed_polarity",
+    "bigbench/causal_judgment",
+    "bigbench/cause_and_effect",
+    "bigbench/implicit_relations",
+    "bigbench/reasoning_about_colored_objects",
     "bigbench/hindu_knowledge",
     "cos_e/v1.0",
     "cosmos_qa",
     "dream",
     "toxic_conversations",
     "TuringBench",
     "trec",
+    "vitaminc",
     "hope_edi/english",
     "rumoureval_2019/RumourEval2019",
     "ethos/binary",
     "ethos/multilabel",
+    "tweet_eval/emoji",
     "tweet_eval/offensive",
     "tweet_eval/emotion",
+    "tweet_eval/hate",
+    "tweet_eval/irony",
     "tweet_eval/sentiment",
     "tweet_eval/stance_abortion",
     "tweet_eval/stance_atheism",
     "tweet_eval/stance_climate",
     "tweet_eval/stance_feminist",
     "tweet_eval/stance_hillary",
     "discovery/discovery",
+    "pragmeval/squinky-formality",
     "pragmeval/switchboard",
+    "pragmeval/verifiability",
     "pragmeval/mrda",
     "pragmeval/squinky-informativeness",
     "pragmeval/squinky-implicature",
     "pragmeval/emobank-arousal",
+    "pragmeval/emobank-dominance",
+    "pragmeval/emobank-valence",
+    "pragmeval/sarcasm",
     "pragmeval/pdtb",
     "pragmeval/persuasiveness-claimtype",
+    "pragmeval/persuasiveness-relevance",
+    "pragmeval/persuasiveness-premisetype",
+    "pragmeval/persuasiveness-eloquence",
     "pragmeval/persuasiveness-strength",
     "pragmeval/stac",
     "pragmeval/persuasiveness-specificity",
+    "pragmeval/gum",
+    "pragmeval/emergent",
     "silicone/sem",
     "silicone/meld_e",
+    "silicone/iemocap",
     "silicone/maptask",
     "silicone/dyda_e",
+    "silicone/dyda_da",
     "silicone/oasis",
     "silicone/meld_s",
     "lex_glue/eurlex",
     "lex_glue/scotus",
     "lex_glue/ledgar",
     "go_emotions/simplified",
     "scicite",
     "liar",
     "lexical_relation_classification/EVALution",
     "lexical_relation_classification/ROOT09",
+    "lexical_relation_classification/K&H+N",
+    "lexical_relation_classification/CogALexV",
+    "lexical_relation_classification/BLESS",
+    "linguisticprobing/subj_number",
+    "linguisticprobing/past_present",
+    "linguisticprobing/obj_number",
     "linguisticprobing/sentence_length",
     "linguisticprobing/top_constituents",
     "linguisticprobing/tree_depth",
+    "linguisticprobing/coordination_inversion",
     "linguisticprobing/odd_man_out",
+    "linguisticprobing/bigram_shift",
+    "crowdflower/political-media-message",
     "crowdflower/text_emotion",
     "crowdflower/political-media-audience",
+    "crowdflower/economic-news",
     "crowdflower/corporate-messaging",
     "crowdflower/airline-sentiment",
     "crowdflower/tweet_global_warming",
+    "crowdflower/sentiment_nuclear_power",
+    "crowdflower/political-media-bias",
     "ethics/commonsense",
     "ethics/deontology",
     "ethics/justice",
     "phrase_similarity",
     "scientific-exaggeration-detection",
     "quarel",
+    "fever-evidence-related",
     "numer_sense",
     "dynasent/dynabench.dynasent.r1.all/r1",
     "dynasent/dynabench.dynasent.r2.all/r2",
     "Sarcasm_News_Headline",
     "sem_eval_2010_task_8",
+    "auditor_review",
     "medmcqa",
     "Dynasent_Disagreement",
     "Politeness_Disagreement",
     "subjectivity",
     "MOH",
     "VUAC",
     "sharc_modified/mod",
     "conceptrules_v2",
     "disrpt/eng.dep.scidtb.rels",
     "stepgame",
     "nlgraph",
     "oasst2_pairwise_rlhf_reward",
     "hh-rlhf/helpful-online",
+    "hh-rlhf/helpful-rejection-sampled",
+    "hh-rlhf/helpful-base",
     "hh-rlhf/harmless-base",
     "ruletaker",
     "PARARULE-Plus",
     "lsat-ar",
     "lsat-rc",
     "biosift-nli",
     "brainteasers/SP",
+    "brainteasers/WP",
     "persuasion",
     "AmbigNQ-clarifying-question",
     "SIGA-nli",
     "wice",
     "hover",
     "tasksource_dpo_pairs",
+    "seahorse_summarization_evaluation",
     "babi_nli",
     "gen_debiased_nli",
     "imppres/presupposition",
     "blimp-2"
   ],
   "torch_dtype": "float32",
+  "transformers_version": "4.42.3",
   "type_vocab_size": 0,
   "vocab_size": 128100
 }

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:9ae1e040afa694928b43261010315a2ccbe630744935c65fba2eb308d2daa26e
 size 737722356

 version https://git-lfs.github.com/spec/v1
+oid sha256:71cace06873870322ffa93e4005999961cef6d6b08263b01aad832ded23d94ae
 size 737722356