sileod commited on
Commit
24fb659
1 Parent(s): a3c9b94

Upload DebertaV2ForSequenceClassification

Browse files
Files changed (2) hide show
  1. config.json +148 -146
  2. pytorch_model.bin +1 -1
config.json CHANGED
@@ -29,10 +29,10 @@
29
  3,
30
  2,
31
  2,
32
- 6,
33
  2,
34
  2,
35
  2,
 
36
  2,
37
  2,
38
  2,
@@ -219,45 +219,45 @@
219
  2,
220
  8,
221
  2,
222
- 3,
 
223
  2,
224
  3,
225
  3,
226
- 2,
227
  3,
228
  3,
229
  3,
230
  20,
231
- 4,
232
  174,
233
  2,
234
  2,
235
  2,
236
  2,
237
  2,
238
- 2,
239
  41,
240
  51,
241
  3,
 
242
  3,
243
- 16,
244
  17,
245
- 8,
246
  2,
 
247
  2,
248
  2,
 
249
  2,
250
  2,
251
- 18,
252
- 3,
253
  4,
254
  7,
255
  3,
 
256
  3,
257
- 7,
258
  12,
259
  11,
260
- 42,
261
  100,
262
  13,
263
  100,
@@ -287,29 +287,29 @@
287
  28,
288
  3,
289
  6,
290
- 6,
291
  7,
292
- 4,
293
  3,
294
- 5,
295
- 2,
296
- 2,
297
  2,
298
- 7,
299
  20,
300
  6,
301
  2,
302
  2,
303
  2,
304
- 4,
305
  2,
306
- 13,
307
- 9,
 
308
  2,
309
  3,
310
  4,
311
- 3,
312
  2,
 
 
 
313
  2,
314
  2,
315
  2,
@@ -488,6 +488,7 @@
488
  2,
489
  3,
490
  2,
 
491
  2,
492
  3,
493
  3,
@@ -552,17 +553,17 @@
552
  "scitail/snli_format",
553
  "hans",
554
  "WANLI",
555
- "recast/recast_megaveridicality",
556
  "recast/recast_ner",
557
- "recast/recast_kg_relations",
558
- "recast/recast_puns",
559
- "recast/recast_factuality",
560
  "recast/recast_verbnet",
 
 
561
  "recast/recast_verbcorner",
562
- "recast/recast_sentiment",
 
563
  "probability_words_nli/reasoning_2hop",
564
  "probability_words_nli/reasoning_1hop",
565
- "probability_words_nli/usnli",
566
  "nan-nli/joey234--nan-nli",
567
  "nli_fever",
568
  "breaking_nli",
@@ -586,13 +587,13 @@
586
  "robust_nli_is_sd",
587
  "robust_nli_li_ts",
588
  "add_one_rte",
589
- "imppres/implicature_modals/log",
590
- "imppres/implicature_connectives/log",
591
  "imppres/implicature_quantifiers/log",
592
- "imppres/implicature_gradable_adjective/log",
593
  "imppres/implicature_numerals_2_3/log",
594
  "imppres/implicature_numerals_10_100/log",
595
- "imppres/implicature_gradable_verb/log",
 
596
  "glue_diagnostics/diagnostics",
597
  "hlgd",
598
  "paws/labeled_final",
@@ -605,106 +606,106 @@
605
  "model-written-evals",
606
  "truthful_qa/multiple_choice",
607
  "fig-qa",
608
- "bigbench/goal_step_wikihow",
609
- "bigbench/implicit_relations",
 
 
610
  "bigbench/geometric_shapes",
611
- "bigbench/identify_math_theorems",
 
 
612
  "bigbench/logical_args",
613
- "bigbench/contextual_parametric_knowledge_conflicts",
614
- "bigbench/logical_sequence",
615
- "bigbench/undo_permutation",
616
- "bigbench/fantasy_reasoning",
617
- "bigbench/ruin_names",
618
- "bigbench/logic_grid_puzzle",
619
  "bigbench/similarities_abstraction",
 
620
  "bigbench/misconceptions",
621
- "bigbench/anachronisms",
622
- "bigbench/crash_blossom",
623
- "bigbench/conceptual_combinations",
624
- "bigbench/dark_humor_detection",
625
- "bigbench/real_or_fake_text",
626
- "bigbench/fact_checker",
627
- "bigbench/empirical_judgments",
628
- "bigbench/hindu_knowledge",
629
- "bigbench/discourse_marker_prediction",
630
- "bigbench/elementary_math_qa",
631
- "bigbench/checkmate_in_one",
632
  "bigbench/understanding_fables",
 
 
633
  "bigbench/emojis_emotion_prediction",
634
- "bigbench/suicide_risk",
635
- "bigbench/physical_intuition",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
636
  "bigbench/epistemic_reasoning",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
637
  "bigbench/mathematical_induction",
 
 
 
 
 
 
 
 
638
  "bigbench/hhh_alignment",
639
- "bigbench/human_organs_senses",
 
 
 
 
 
 
 
 
640
  "bigbench/novel_concepts",
641
  "bigbench/authorship_verification",
642
- "bigbench/reasoning_about_colored_objects",
643
  "bigbench/physics",
644
- "bigbench/winowhy",
645
- "bigbench/question_selection",
646
- "bigbench/english_proverbs",
647
- "bigbench/odd_one_out",
648
- "bigbench/cause_and_effect",
649
- "bigbench/disambiguation_qa",
650
- "bigbench/phrase_relatedness",
651
  "bigbench/snarks",
 
 
652
  "bigbench/arithmetic",
653
- "bigbench/causal_judgment",
654
- "bigbench/general_knowledge",
655
- "bigbench/play_dialog_same_or_different",
656
- "bigbench/evaluating_information_essentiality",
657
- "bigbench/hyperbaton",
658
- "bigbench/timedial",
659
- "bigbench/color",
660
- "bigbench/logical_deduction",
661
- "bigbench/social_iqa",
662
- "bigbench/nonsense_words_grammar",
663
- "bigbench/code_line_description",
664
- "bigbench/vitaminc_fact_verification",
665
- "bigbench/intent_recognition",
666
  "bigbench/cs_algorithms",
667
- "bigbench/riddle_sense",
668
- "bigbench/logical_fallacy_detection",
669
- "bigbench/metaphor_understanding",
670
- "bigbench/analytic_entailment",
671
- "bigbench/presuppositions_as_nli",
672
- "bigbench/international_phonetic_alphabet_nli",
673
  "bigbench/movie_dialog_same_or_different",
 
 
 
674
  "bigbench/strange_stories",
675
- "bigbench/figure_of_speech_detection",
676
- "bigbench/movie_recommendation",
677
- "bigbench/metaphor_boolean",
678
- "bigbench/entailed_polarity",
679
- "bigbench/analogical_similarity",
680
  "bigbench/dyck_languages",
681
- "bigbench/implicatures",
682
- "bigbench/navigate",
683
- "bigbench/temporal_sequences",
684
- "bigbench/moral_permissibility",
685
- "bigbench/irony_identification",
686
- "bigbench/formal_fallacies_syllogisms_negation",
687
- "bigbench/bbq_lite_json",
688
- "bigbench/unit_interpretation",
689
- "bigbench/mnist_ascii",
690
- "bigbench/known_unknowns",
691
- "bigbench/gre_reading_comprehension",
692
- "bigbench/sports_understanding",
693
- "bigbench/identify_odd_metaphor",
694
- "bigbench/simple_ethical_questions",
695
- "bigbench/sentence_ambiguity",
696
- "bigbench/key_value_maps",
697
- "bigbench/penguins_in_a_table",
698
- "bigbench/date_understanding",
699
- "bigbench/emoji_movie",
700
  "bigbench/salient_translation_error_detection",
701
- "bigbench/cifar10_classification",
702
- "bigbench/social_support",
703
- "bigbench/abstract_narrative_understanding",
704
- "bigbench/strategyqa",
705
- "bigbench/symbol_interpretation",
706
- "bigbench/tracking_shuffled_objects",
707
- "bigbench/crass_ai",
708
  "cos_e/v1.0",
709
  "cosmos_qa",
710
  "dream",
@@ -744,45 +745,45 @@
744
  "ethos/binary",
745
  "ethos/multilabel",
746
  "tweet_eval/hate",
747
- "tweet_eval/stance_climate",
748
  "tweet_eval/irony",
749
- "tweet_eval/stance_abortion",
750
- "tweet_eval/sentiment",
751
  "tweet_eval/offensive",
752
- "tweet_eval/stance_feminist",
 
753
  "tweet_eval/stance_atheism",
 
 
754
  "tweet_eval/stance_hillary",
755
  "tweet_eval/emoji",
756
- "tweet_eval/emotion",
757
  "discovery/discovery",
758
- "pragmeval/emobank-dominance",
759
- "pragmeval/emobank-arousal",
760
- "pragmeval/emobank-valence",
761
  "pragmeval/squinky-formality",
 
 
762
  "pragmeval/squinky-implicature",
763
  "pragmeval/squinky-informativeness",
764
  "pragmeval/switchboard",
765
  "pragmeval/mrda",
766
  "pragmeval/verifiability",
 
767
  "pragmeval/emergent",
768
- "pragmeval/pdtb",
769
  "pragmeval/gum",
770
- "pragmeval/persuasiveness-premisetype",
771
  "pragmeval/persuasiveness-eloquence",
 
772
  "pragmeval/persuasiveness-relevance",
773
- "pragmeval/persuasiveness-specificity",
774
- "pragmeval/persuasiveness-strength",
775
  "pragmeval/sarcasm",
776
- "pragmeval/stac",
777
- "pragmeval/persuasiveness-claimtype",
778
- "silicone/dyda_da",
779
  "silicone/dyda_e",
780
- "silicone/sem",
781
- "silicone/meld_s",
782
  "silicone/meld_e",
 
 
 
783
  "silicone/maptask",
784
  "silicone/iemocap",
785
- "silicone/oasis",
786
  "lex_glue/eurlex",
787
  "lex_glue/scotus",
788
  "lex_glue/ledgar",
@@ -812,29 +813,29 @@
812
  "go_emotions/simplified",
813
  "scicite",
814
  "liar",
815
- "lexical_relation_classification/BLESS",
816
  "lexical_relation_classification/EVALution",
817
- "lexical_relation_classification/K&H+N",
818
  "lexical_relation_classification/ROOT09",
819
- "lexical_relation_classification/CogALexV",
 
820
  "linguisticprobing/bigram_shift",
821
- "linguisticprobing/odd_man_out",
822
- "linguisticprobing/coordination_inversion",
823
- "linguisticprobing/tree_depth",
824
  "linguisticprobing/top_constituents",
825
  "linguisticprobing/sentence_length",
826
- "linguisticprobing/past_present",
827
- "linguisticprobing/obj_number",
828
  "linguisticprobing/subj_number",
829
- "crowdflower/sentiment_nuclear_power",
830
- "crowdflower/political-media-bias",
831
- "crowdflower/text_emotion",
832
- "crowdflower/political-media-message",
 
 
833
  "crowdflower/political-media-audience",
834
  "crowdflower/economic-news",
 
 
 
835
  "crowdflower/corporate-messaging",
836
  "crowdflower/airline-sentiment",
837
- "crowdflower/tweet_global_warming",
838
  "ethics/commonsense",
839
  "ethics/deontology",
840
  "ethics/justice",
@@ -950,10 +951,10 @@
950
  "oasst1_dense_flat/helpfulness",
951
  "PARARULE-Plus",
952
  "mindgames",
953
- "universal_dependencies/en_partut/deprel",
954
- "universal_dependencies/en_lines/deprel",
955
- "universal_dependencies/en_gum/deprel",
956
  "universal_dependencies/en_ewt/deprel",
 
 
 
957
  "ambient",
958
  "path-naturalness-prediction",
959
  "civil_comments/toxicity",
@@ -1013,6 +1014,7 @@
1013
  "apt",
1014
  "twitter-financial-news-sentiment",
1015
  "icl-symbol-tuning-instruct",
 
1016
  "babi_nli",
1017
  "gen_debiased_nli",
1018
  "imppres/presupposition",
 
29
  3,
30
  2,
31
  2,
 
32
  2,
33
  2,
34
  2,
35
+ 6,
36
  2,
37
  2,
38
  2,
 
219
  2,
220
  8,
221
  2,
222
+ 4,
223
+ 2,
224
  2,
225
  3,
226
  3,
227
+ 3,
228
  3,
229
  3,
230
  3,
231
  20,
 
232
  174,
233
  2,
234
  2,
235
  2,
236
  2,
237
  2,
 
238
  41,
239
  51,
240
  3,
241
+ 2,
242
  3,
243
+ 18,
244
  17,
245
+ 3,
246
  2,
247
+ 16,
248
  2,
249
  2,
250
+ 8,
251
  2,
252
  2,
253
+ 7,
 
254
  4,
255
  7,
256
  3,
257
+ 42,
258
  3,
 
259
  12,
260
  11,
 
261
  100,
262
  13,
263
  100,
 
287
  28,
288
  3,
289
  6,
290
+ 5,
291
  7,
 
292
  3,
293
+ 6,
294
+ 4,
 
295
  2,
 
296
  20,
297
  6,
298
  2,
299
  2,
300
  2,
 
301
  2,
302
+ 2,
303
+ 7,
304
+ 2,
305
  2,
306
  3,
307
  4,
308
+ 9,
309
  2,
310
+ 4,
311
+ 3,
312
+ 13,
313
  2,
314
  2,
315
  2,
 
488
  2,
489
  3,
490
  2,
491
+ 3,
492
  2,
493
  3,
494
  3,
 
553
  "scitail/snli_format",
554
  "hans",
555
  "WANLI",
 
556
  "recast/recast_ner",
557
+ "recast/recast_sentiment",
558
+ "recast/recast_megaveridicality",
 
559
  "recast/recast_verbnet",
560
+ "recast/recast_puns",
561
+ "recast/recast_kg_relations",
562
  "recast/recast_verbcorner",
563
+ "recast/recast_factuality",
564
+ "probability_words_nli/usnli",
565
  "probability_words_nli/reasoning_2hop",
566
  "probability_words_nli/reasoning_1hop",
 
567
  "nan-nli/joey234--nan-nli",
568
  "nli_fever",
569
  "breaking_nli",
 
587
  "robust_nli_is_sd",
588
  "robust_nli_li_ts",
589
  "add_one_rte",
590
+ "imppres/implicature_gradable_verb/log",
 
591
  "imppres/implicature_quantifiers/log",
592
+ "imppres/implicature_connectives/log",
593
  "imppres/implicature_numerals_2_3/log",
594
  "imppres/implicature_numerals_10_100/log",
595
+ "imppres/implicature_gradable_adjective/log",
596
+ "imppres/implicature_modals/log",
597
  "glue_diagnostics/diagnostics",
598
  "hlgd",
599
  "paws/labeled_final",
 
606
  "model-written-evals",
607
  "truthful_qa/multiple_choice",
608
  "fig-qa",
609
+ "bigbench/sports_understanding",
610
+ "bigbench/analytic_entailment",
611
+ "bigbench/presuppositions_as_nli",
612
+ "bigbench/logic_grid_puzzle",
613
  "bigbench/geometric_shapes",
614
+ "bigbench/metaphor_understanding",
615
+ "bigbench/movie_recommendation",
616
+ "bigbench/gre_reading_comprehension",
617
  "bigbench/logical_args",
 
 
 
 
 
 
618
  "bigbench/similarities_abstraction",
619
+ "bigbench/nonsense_words_grammar",
620
  "bigbench/misconceptions",
621
+ "bigbench/winowhy",
 
 
 
 
 
 
 
 
 
 
622
  "bigbench/understanding_fables",
623
+ "bigbench/logical_sequence",
624
+ "bigbench/hyperbaton",
625
  "bigbench/emojis_emotion_prediction",
626
+ "bigbench/discourse_marker_prediction",
627
+ "bigbench/cause_and_effect",
628
+ "bigbench/crass_ai",
629
+ "bigbench/real_or_fake_text",
630
+ "bigbench/date_understanding",
631
+ "bigbench/analogical_similarity",
632
+ "bigbench/crash_blossom",
633
+ "bigbench/undo_permutation",
634
+ "bigbench/english_proverbs",
635
+ "bigbench/logical_fallacy_detection",
636
+ "bigbench/question_selection",
637
+ "bigbench/human_organs_senses",
638
+ "bigbench/cifar10_classification",
639
+ "bigbench/social_iqa",
640
+ "bigbench/abstract_narrative_understanding",
641
+ "bigbench/emoji_movie",
642
+ "bigbench/sentence_ambiguity",
643
+ "bigbench/elementary_math_qa",
644
  "bigbench/epistemic_reasoning",
645
+ "bigbench/metaphor_boolean",
646
+ "bigbench/tracking_shuffled_objects",
647
+ "bigbench/physical_intuition",
648
+ "bigbench/key_value_maps",
649
+ "bigbench/penguins_in_a_table",
650
+ "bigbench/formal_fallacies_syllogisms_negation",
651
+ "bigbench/riddle_sense",
652
+ "bigbench/logical_deduction",
653
+ "bigbench/entailed_polarity",
654
+ "bigbench/ruin_names",
655
+ "bigbench/timedial",
656
+ "bigbench/fantasy_reasoning",
657
+ "bigbench/causal_judgment",
658
+ "bigbench/social_support",
659
+ "bigbench/disambiguation_qa",
660
+ "bigbench/hindu_knowledge",
661
+ "bigbench/play_dialog_same_or_different",
662
+ "bigbench/intent_recognition",
663
+ "bigbench/code_line_description",
664
+ "bigbench/implicit_relations",
665
+ "bigbench/checkmate_in_one",
666
+ "bigbench/dark_humor_detection",
667
  "bigbench/mathematical_induction",
668
+ "bigbench/identify_odd_metaphor",
669
+ "bigbench/implicatures",
670
+ "bigbench/irony_identification",
671
+ "bigbench/phrase_relatedness",
672
+ "bigbench/figure_of_speech_detection",
673
+ "bigbench/empirical_judgments",
674
+ "bigbench/identify_math_theorems",
675
+ "bigbench/evaluating_information_essentiality",
676
  "bigbench/hhh_alignment",
677
+ "bigbench/reasoning_about_colored_objects",
678
+ "bigbench/goal_step_wikihow",
679
+ "bigbench/odd_one_out",
680
+ "bigbench/strategyqa",
681
+ "bigbench/international_phonetic_alphabet_nli",
682
+ "bigbench/known_unknowns",
683
+ "bigbench/anachronisms",
684
+ "bigbench/bbq_lite_json",
685
+ "bigbench/mnist_ascii",
686
  "bigbench/novel_concepts",
687
  "bigbench/authorship_verification",
 
688
  "bigbench/physics",
689
+ "bigbench/vitaminc_fact_verification",
690
+ "bigbench/general_knowledge",
691
+ "bigbench/simple_ethical_questions",
 
 
 
 
692
  "bigbench/snarks",
693
+ "bigbench/symbol_interpretation",
694
+ "bigbench/moral_permissibility",
695
  "bigbench/arithmetic",
696
+ "bigbench/navigate",
 
 
 
 
 
 
 
 
 
 
 
 
697
  "bigbench/cs_algorithms",
698
+ "bigbench/temporal_sequences",
699
+ "bigbench/unit_interpretation",
 
 
 
 
700
  "bigbench/movie_dialog_same_or_different",
701
+ "bigbench/fact_checker",
702
+ "bigbench/suicide_risk",
703
+ "bigbench/conceptual_combinations",
704
  "bigbench/strange_stories",
 
 
 
 
 
705
  "bigbench/dyck_languages",
706
+ "bigbench/contextual_parametric_knowledge_conflicts",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
707
  "bigbench/salient_translation_error_detection",
708
+ "bigbench/color",
 
 
 
 
 
 
709
  "cos_e/v1.0",
710
  "cosmos_qa",
711
  "dream",
 
745
  "ethos/binary",
746
  "ethos/multilabel",
747
  "tweet_eval/hate",
748
+ "tweet_eval/emotion",
749
  "tweet_eval/irony",
 
 
750
  "tweet_eval/offensive",
751
+ "tweet_eval/sentiment",
752
+ "tweet_eval/stance_abortion",
753
  "tweet_eval/stance_atheism",
754
+ "tweet_eval/stance_climate",
755
+ "tweet_eval/stance_feminist",
756
  "tweet_eval/stance_hillary",
757
  "tweet_eval/emoji",
 
758
  "discovery/discovery",
 
 
 
759
  "pragmeval/squinky-formality",
760
+ "pragmeval/emobank-valence",
761
+ "pragmeval/emobank-dominance",
762
  "pragmeval/squinky-implicature",
763
  "pragmeval/squinky-informativeness",
764
  "pragmeval/switchboard",
765
  "pragmeval/mrda",
766
  "pragmeval/verifiability",
767
+ "pragmeval/emobank-arousal",
768
  "pragmeval/emergent",
769
+ "pragmeval/stac",
770
  "pragmeval/gum",
771
+ "pragmeval/persuasiveness-claimtype",
772
  "pragmeval/persuasiveness-eloquence",
773
+ "pragmeval/pdtb",
774
  "pragmeval/persuasiveness-relevance",
 
 
775
  "pragmeval/sarcasm",
776
+ "pragmeval/persuasiveness-premisetype",
777
+ "pragmeval/persuasiveness-strength",
778
+ "pragmeval/persuasiveness-specificity",
779
  "silicone/dyda_e",
780
+ "silicone/dyda_da",
 
781
  "silicone/meld_e",
782
+ "silicone/meld_s",
783
+ "silicone/oasis",
784
+ "silicone/sem",
785
  "silicone/maptask",
786
  "silicone/iemocap",
 
787
  "lex_glue/eurlex",
788
  "lex_glue/scotus",
789
  "lex_glue/ledgar",
 
813
  "go_emotions/simplified",
814
  "scicite",
815
  "liar",
816
+ "lexical_relation_classification/CogALexV",
817
  "lexical_relation_classification/EVALution",
 
818
  "lexical_relation_classification/ROOT09",
819
+ "lexical_relation_classification/BLESS",
820
+ "lexical_relation_classification/K&H+N",
821
  "linguisticprobing/bigram_shift",
 
 
 
822
  "linguisticprobing/top_constituents",
823
  "linguisticprobing/sentence_length",
 
 
824
  "linguisticprobing/subj_number",
825
+ "linguisticprobing/obj_number",
826
+ "linguisticprobing/past_present",
827
+ "linguisticprobing/odd_man_out",
828
+ "linguisticprobing/coordination_inversion",
829
+ "linguisticprobing/tree_depth",
830
+ "crowdflower/tweet_global_warming",
831
  "crowdflower/political-media-audience",
832
  "crowdflower/economic-news",
833
+ "crowdflower/sentiment_nuclear_power",
834
+ "crowdflower/political-media-message",
835
+ "crowdflower/political-media-bias",
836
  "crowdflower/corporate-messaging",
837
  "crowdflower/airline-sentiment",
838
+ "crowdflower/text_emotion",
839
  "ethics/commonsense",
840
  "ethics/deontology",
841
  "ethics/justice",
 
951
  "oasst1_dense_flat/helpfulness",
952
  "PARARULE-Plus",
953
  "mindgames",
 
 
 
954
  "universal_dependencies/en_ewt/deprel",
955
+ "universal_dependencies/en_gum/deprel",
956
+ "universal_dependencies/en_lines/deprel",
957
+ "universal_dependencies/en_partut/deprel",
958
  "ambient",
959
  "path-naturalness-prediction",
960
  "civil_comments/toxicity",
 
1014
  "apt",
1015
  "twitter-financial-news-sentiment",
1016
  "icl-symbol-tuning-instruct",
1017
+ "SpaceNLI",
1018
  "babi_nli",
1019
  "gen_debiased_nli",
1020
  "imppres/presupposition",
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9c39256062a5ebaf64e0edc840e07bd439c73477cccbb21a59aab118457f5b79
3
  size 737771833
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0a8ff4deb3e99417c600710373a7e73f249ffedade58091d7cae55b372c61743
3
  size 737771833