sileod commited on
Commit
a379150
1 Parent(s): 77c7bbc

Upload DebertaV2ForSequenceClassification

Browse files
Files changed (2) hide show
  1. config.json +151 -145
  2. pytorch_model.bin +1 -1
config.json CHANGED
@@ -28,11 +28,11 @@
28
  2,
29
  3,
30
  2,
 
31
  2,
32
  2,
33
  2,
34
  2,
35
- 6,
36
  2,
37
  2,
38
  2,
@@ -218,38 +218,38 @@
218
  4,
219
  2,
220
  8,
221
- 4,
222
- 2,
223
- 2,
224
- 3,
225
- 3,
226
  3,
227
  3,
228
  3,
229
  3,
230
  20,
 
231
  2,
232
- 174,
233
  2,
234
- 41,
235
  2,
 
 
 
236
  2,
237
  2,
238
  2,
239
  2,
 
 
240
  51,
241
  3,
242
- 16,
243
- 3,
244
  2,
245
- 8,
246
  17,
247
  18,
248
  2,
 
 
249
  2,
250
  2,
251
  2,
252
  3,
 
253
  11,
254
  3,
255
  42,
@@ -287,30 +287,30 @@
287
  28,
288
  3,
289
  6,
 
 
290
  6,
291
- 7,
292
  3,
293
- 5,
294
- 4,
295
  2,
296
  20,
297
  2,
298
  2,
 
299
  2,
 
300
  2,
301
  2,
302
- 6,
303
- 7,
304
  2,
305
  13,
306
- 9,
307
- 2,
308
  3,
309
  4,
310
- 2,
311
  3,
 
312
  4,
313
  2,
 
 
314
  2,
315
  2,
316
  2,
@@ -491,6 +491,9 @@
491
  3,
492
  2,
493
  2,
 
 
 
494
  2,
495
  3,
496
  3,
@@ -555,16 +558,16 @@
555
  "scitail/snli_format",
556
  "hans",
557
  "WANLI",
558
- "recast/recast_ner",
 
 
559
  "recast/recast_sentiment",
560
- "recast/recast_megaveridicality",
561
  "recast/recast_verbnet",
562
- "recast/recast_puns",
563
- "recast/recast_kg_relations",
564
  "recast/recast_verbcorner",
565
- "recast/recast_factuality",
566
- "probability_words_nli/usnli",
567
  "probability_words_nli/reasoning_2hop",
 
568
  "probability_words_nli/reasoning_1hop",
569
  "nan-nli/joey234--nan-nli",
570
  "nli_fever",
@@ -589,13 +592,13 @@
589
  "robust_nli_is_sd",
590
  "robust_nli_li_ts",
591
  "add_one_rte",
 
 
592
  "imppres/implicature_gradable_verb/log",
593
- "imppres/implicature_quantifiers/log",
594
  "imppres/implicature_connectives/log",
595
- "imppres/implicature_numerals_2_3/log",
596
  "imppres/implicature_numerals_10_100/log",
597
- "imppres/implicature_gradable_adjective/log",
598
- "imppres/implicature_modals/log",
599
  "glue_diagnostics/diagnostics",
600
  "hlgd",
601
  "paws/labeled_final",
@@ -608,106 +611,106 @@
608
  "model-written-evals",
609
  "truthful_qa/multiple_choice",
610
  "fig-qa",
611
- "bigbench/navigate",
612
- "bigbench/logical_args",
613
- "bigbench/implicatures",
614
- "bigbench/nonsense_words_grammar",
615
- "bigbench/tracking_shuffled_objects",
616
- "bigbench/simple_ethical_questions",
617
- "bigbench/metaphor_understanding",
618
- "bigbench/novel_concepts",
619
- "bigbench/emoji_movie",
620
- "bigbench/social_iqa",
621
- "bigbench/social_support",
622
- "bigbench/crash_blossom",
623
- "bigbench/empirical_judgments",
624
- "bigbench/english_proverbs",
625
- "bigbench/mnist_ascii",
626
- "bigbench/emojis_emotion_prediction",
627
- "bigbench/hhh_alignment",
628
- "bigbench/hyperbaton",
629
- "bigbench/intent_recognition",
630
- "bigbench/odd_one_out",
631
  "bigbench/analytic_entailment",
632
- "bigbench/mathematical_induction",
633
- "bigbench/cifar10_classification",
634
- "bigbench/logical_fallacy_detection",
635
- "bigbench/logical_deduction",
636
- "bigbench/question_selection",
637
- "bigbench/formal_fallacies_syllogisms_negation",
638
- "bigbench/identify_odd_metaphor",
639
- "bigbench/logic_grid_puzzle",
640
- "bigbench/reasoning_about_colored_objects",
641
  "bigbench/riddle_sense",
642
- "bigbench/bbq_lite_json",
643
- "bigbench/similarities_abstraction",
644
- "bigbench/logical_sequence",
 
 
 
 
 
 
 
 
645
  "bigbench/undo_permutation",
646
- "bigbench/misconceptions",
647
- "bigbench/movie_recommendation",
648
- "bigbench/anachronisms",
649
- "bigbench/symbol_interpretation",
650
- "bigbench/snarks",
651
  "bigbench/key_value_maps",
652
- "bigbench/goal_step_wikihow",
 
 
653
  "bigbench/vitaminc_fact_verification",
 
654
  "bigbench/known_unknowns",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
655
  "bigbench/cs_algorithms",
656
- "bigbench/arithmetic",
657
- "bigbench/epistemic_reasoning",
658
- "bigbench/color",
659
  "bigbench/phrase_relatedness",
660
- "bigbench/gre_reading_comprehension",
661
- "bigbench/date_understanding",
662
- "bigbench/metaphor_boolean",
663
- "bigbench/strategyqa",
664
- "bigbench/understanding_fables",
665
- "bigbench/causal_judgment",
666
- "bigbench/play_dialog_same_or_different",
667
  "bigbench/conceptual_combinations",
668
- "bigbench/sports_understanding",
669
- "bigbench/dyck_languages",
670
- "bigbench/salient_translation_error_detection",
671
- "bigbench/sentence_ambiguity",
 
 
 
 
 
 
 
 
672
  "bigbench/entailed_polarity",
673
- "bigbench/timedial",
674
- "bigbench/ruin_names",
675
- "bigbench/physical_intuition",
 
 
 
 
 
 
 
 
676
  "bigbench/winowhy",
 
 
 
 
 
677
  "bigbench/evaluating_information_essentiality",
678
- "bigbench/dark_humor_detection",
679
- "bigbench/moral_permissibility",
680
- "bigbench/code_line_description",
681
- "bigbench/temporal_sequences",
682
- "bigbench/figure_of_speech_detection",
683
  "bigbench/fantasy_reasoning",
684
- "bigbench/fact_checker",
685
- "bigbench/geometric_shapes",
686
- "bigbench/international_phonetic_alphabet_nli",
687
- "bigbench/authorship_verification",
688
- "bigbench/human_organs_senses",
689
  "bigbench/irony_identification",
690
- "bigbench/presuppositions_as_nli",
691
- "bigbench/physics",
 
 
 
 
 
 
 
 
692
  "bigbench/general_knowledge",
693
- "bigbench/identify_math_theorems",
694
- "bigbench/penguins_in_a_table",
695
- "bigbench/hindu_knowledge",
696
- "bigbench/checkmate_in_one",
697
- "bigbench/unit_interpretation",
698
- "bigbench/real_or_fake_text",
699
- "bigbench/suicide_risk",
700
- "bigbench/implicit_relations",
701
- "bigbench/abstract_narrative_understanding",
702
  "bigbench/strange_stories",
703
- "bigbench/cause_and_effect",
 
 
 
 
704
  "bigbench/disambiguation_qa",
705
- "bigbench/movie_dialog_same_or_different",
706
- "bigbench/elementary_math_qa",
707
- "bigbench/contextual_parametric_knowledge_conflicts",
708
- "bigbench/crass_ai",
709
- "bigbench/analogical_similarity",
710
- "bigbench/discourse_marker_prediction",
711
  "cos_e/v1.0",
712
  "cosmos_qa",
713
  "dream",
@@ -746,38 +749,38 @@
746
  "rumoureval_2019/RumourEval2019",
747
  "ethos/binary",
748
  "ethos/multilabel",
749
- "tweet_eval/emotion",
750
- "tweet_eval/irony",
751
- "tweet_eval/offensive",
752
- "tweet_eval/sentiment",
753
- "tweet_eval/stance_abortion",
754
- "tweet_eval/stance_atheism",
755
- "tweet_eval/stance_climate",
756
- "tweet_eval/stance_feminist",
757
  "tweet_eval/stance_hillary",
 
 
 
758
  "tweet_eval/emoji",
 
 
 
759
  "tweet_eval/hate",
 
 
760
  "discovery/discovery",
761
- "pragmeval/emobank-valence",
762
- "pragmeval/switchboard",
763
- "pragmeval/emobank-dominance",
764
- "pragmeval/emobank-arousal",
765
  "pragmeval/squinky-formality",
766
  "pragmeval/squinky-implicature",
 
767
  "pragmeval/squinky-informativeness",
 
 
768
  "pragmeval/mrda",
769
  "pragmeval/verifiability",
770
- "pragmeval/pdtb",
771
- "pragmeval/persuasiveness-claimtype",
772
- "pragmeval/persuasiveness-eloquence",
773
- "pragmeval/persuasiveness-premisetype",
774
  "pragmeval/gum",
775
  "pragmeval/stac",
 
 
 
776
  "pragmeval/persuasiveness-specificity",
777
  "pragmeval/persuasiveness-strength",
778
  "pragmeval/sarcasm",
779
- "pragmeval/persuasiveness-relevance",
780
- "pragmeval/emergent",
781
  "silicone/iemocap",
782
  "silicone/sem",
783
  "silicone/oasis",
@@ -815,29 +818,29 @@
815
  "go_emotions/simplified",
816
  "scicite",
817
  "liar",
 
 
818
  "lexical_relation_classification/BLESS",
819
- "lexical_relation_classification/EVALution",
820
  "lexical_relation_classification/ROOT09",
821
- "lexical_relation_classification/CogALexV",
822
- "lexical_relation_classification/K&H+N",
823
  "linguisticprobing/bigram_shift",
824
  "linguisticprobing/top_constituents",
825
  "linguisticprobing/subj_number",
826
  "linguisticprobing/odd_man_out",
827
- "linguisticprobing/coordination_inversion",
828
- "linguisticprobing/obj_number",
829
  "linguisticprobing/past_present",
830
  "linguisticprobing/sentence_length",
831
- "linguisticprobing/tree_depth",
832
- "crowdflower/tweet_global_warming",
833
- "crowdflower/text_emotion",
834
- "crowdflower/political-media-message",
835
- "crowdflower/political-media-bias",
836
- "crowdflower/airline-sentiment",
837
- "crowdflower/sentiment_nuclear_power",
838
  "crowdflower/political-media-audience",
 
839
  "crowdflower/economic-news",
840
  "crowdflower/corporate-messaging",
 
 
 
 
 
841
  "ethics/commonsense",
842
  "ethics/deontology",
843
  "ethics/justice",
@@ -901,8 +904,8 @@
901
  "scruples",
902
  "wouldyourather",
903
  "attempto-nli",
904
- "defeasible-nli/snli",
905
  "defeasible-nli/atomic",
 
906
  "help-nli",
907
  "nli-veridicality-transitivity",
908
  "natural-language-satisfiability",
@@ -952,10 +955,10 @@
952
  "oasst1_dense_flat/helpfulness",
953
  "PARARULE-Plus",
954
  "mindgames",
955
- "universal_dependencies/en_gum/deprel",
956
  "universal_dependencies/en_ewt/deprel",
957
- "universal_dependencies/en_partut/deprel",
958
  "universal_dependencies/en_lines/deprel",
 
 
959
  "ambient",
960
  "path-naturalness-prediction",
961
  "civil_comments/toxicity",
@@ -1019,6 +1022,9 @@
1019
  "propsegment/nli",
1020
  "HatemojiBuild",
1021
  "regset",
 
 
 
1022
  "babi_nli",
1023
  "gen_debiased_nli",
1024
  "imppres/presupposition",
 
28
  2,
29
  3,
30
  2,
31
+ 6,
32
  2,
33
  2,
34
  2,
35
  2,
 
36
  2,
37
  2,
38
  2,
 
218
  4,
219
  2,
220
  8,
 
 
 
 
 
221
  3,
222
  3,
223
  3,
224
  3,
225
  20,
226
+ 3,
227
  2,
 
228
  2,
 
229
  2,
230
+ 4,
231
+ 3,
232
+ 174,
233
  2,
234
  2,
235
  2,
236
  2,
237
+ 2,
238
+ 41,
239
  51,
240
  3,
 
 
241
  2,
242
+ 3,
243
  17,
244
  18,
245
  2,
246
+ 8,
247
+ 2,
248
  2,
249
  2,
250
  2,
251
  3,
252
+ 16,
253
  11,
254
  3,
255
  42,
 
287
  28,
288
  3,
289
  6,
290
+ 4,
291
+ 5,
292
  6,
 
293
  3,
294
+ 7,
 
295
  2,
296
  20,
297
  2,
298
  2,
299
+ 7,
300
  2,
301
+ 6,
302
  2,
303
  2,
 
 
304
  2,
305
  13,
 
 
306
  3,
307
  4,
 
308
  3,
309
+ 2,
310
  4,
311
  2,
312
+ 9,
313
+ 2,
314
  2,
315
  2,
316
  2,
 
491
  3,
492
  2,
493
  2,
494
+ 4,
495
+ 1,
496
+ 17,
497
  2,
498
  3,
499
  3,
 
558
  "scitail/snli_format",
559
  "hans",
560
  "WANLI",
561
+ "recast/recast_factuality",
562
+ "recast/recast_kg_relations",
563
+ "recast/recast_puns",
564
  "recast/recast_sentiment",
 
565
  "recast/recast_verbnet",
566
+ "recast/recast_ner",
 
567
  "recast/recast_verbcorner",
568
+ "recast/recast_megaveridicality",
 
569
  "probability_words_nli/reasoning_2hop",
570
+ "probability_words_nli/usnli",
571
  "probability_words_nli/reasoning_1hop",
572
  "nan-nli/joey234--nan-nli",
573
  "nli_fever",
 
592
  "robust_nli_is_sd",
593
  "robust_nli_li_ts",
594
  "add_one_rte",
595
+ "imppres/implicature_numerals_2_3/log",
596
+ "imppres/implicature_modals/log",
597
  "imppres/implicature_gradable_verb/log",
598
+ "imppres/implicature_gradable_adjective/log",
599
  "imppres/implicature_connectives/log",
 
600
  "imppres/implicature_numerals_10_100/log",
601
+ "imppres/implicature_quantifiers/log",
 
602
  "glue_diagnostics/diagnostics",
603
  "hlgd",
604
  "paws/labeled_final",
 
611
  "model-written-evals",
612
  "truthful_qa/multiple_choice",
613
  "fig-qa",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
614
  "bigbench/analytic_entailment",
615
+ "bigbench/figure_of_speech_detection",
 
 
 
 
 
 
 
 
616
  "bigbench/riddle_sense",
617
+ "bigbench/physical_intuition",
618
+ "bigbench/metaphor_boolean",
619
+ "bigbench/epistemic_reasoning",
620
+ "bigbench/dark_humor_detection",
621
+ "bigbench/international_phonetic_alphabet_nli",
622
+ "bigbench/arithmetic",
623
+ "bigbench/cifar10_classification",
624
+ "bigbench/hhh_alignment",
625
+ "bigbench/strategyqa",
626
+ "bigbench/play_dialog_same_or_different",
627
+ "bigbench/odd_one_out",
628
  "bigbench/undo_permutation",
 
 
 
 
 
629
  "bigbench/key_value_maps",
630
+ "bigbench/empirical_judgments",
631
+ "bigbench/question_selection",
632
+ "bigbench/date_understanding",
633
  "bigbench/vitaminc_fact_verification",
634
+ "bigbench/cause_and_effect",
635
  "bigbench/known_unknowns",
636
+ "bigbench/causal_judgment",
637
+ "bigbench/nonsense_words_grammar",
638
+ "bigbench/movie_dialog_same_or_different",
639
+ "bigbench/unit_interpretation",
640
+ "bigbench/abstract_narrative_understanding",
641
+ "bigbench/dyck_languages",
642
+ "bigbench/elementary_math_qa",
643
+ "bigbench/identify_math_theorems",
644
+ "bigbench/misconceptions",
645
+ "bigbench/crash_blossom",
646
+ "bigbench/novel_concepts",
647
+ "bigbench/social_iqa",
648
+ "bigbench/hindu_knowledge",
649
+ "bigbench/anachronisms",
650
  "bigbench/cs_algorithms",
651
+ "bigbench/ruin_names",
 
 
652
  "bigbench/phrase_relatedness",
653
+ "bigbench/crass_ai",
 
 
 
 
 
 
654
  "bigbench/conceptual_combinations",
655
+ "bigbench/discourse_marker_prediction",
656
+ "bigbench/logic_grid_puzzle",
657
+ "bigbench/navigate",
658
+ "bigbench/emoji_movie",
659
+ "bigbench/implicit_relations",
660
+ "bigbench/presuppositions_as_nli",
661
+ "bigbench/code_line_description",
662
+ "bigbench/color",
663
+ "bigbench/gre_reading_comprehension",
664
+ "bigbench/physics",
665
+ "bigbench/symbol_interpretation",
666
+ "bigbench/tracking_shuffled_objects",
667
  "bigbench/entailed_polarity",
668
+ "bigbench/mathematical_induction",
669
+ "bigbench/metaphor_understanding",
670
+ "bigbench/movie_recommendation",
671
+ "bigbench/simple_ethical_questions",
672
+ "bigbench/hyperbaton",
673
+ "bigbench/english_proverbs",
674
+ "bigbench/similarities_abstraction",
675
+ "bigbench/emojis_emotion_prediction",
676
+ "bigbench/temporal_sequences",
677
+ "bigbench/human_organs_senses",
678
+ "bigbench/penguins_in_a_table",
679
  "bigbench/winowhy",
680
+ "bigbench/authorship_verification",
681
+ "bigbench/sentence_ambiguity",
682
+ "bigbench/mnist_ascii",
683
+ "bigbench/identify_odd_metaphor",
684
+ "bigbench/geometric_shapes",
685
  "bigbench/evaluating_information_essentiality",
686
+ "bigbench/timedial",
687
+ "bigbench/salient_translation_error_detection",
688
+ "bigbench/suicide_risk",
 
 
689
  "bigbench/fantasy_reasoning",
690
+ "bigbench/implicatures",
691
+ "bigbench/logical_sequence",
 
 
 
692
  "bigbench/irony_identification",
693
+ "bigbench/formal_fallacies_syllogisms_negation",
694
+ "bigbench/understanding_fables",
695
+ "bigbench/logical_args",
696
+ "bigbench/analogical_similarity",
697
+ "bigbench/social_support",
698
+ "bigbench/logical_fallacy_detection",
699
+ "bigbench/bbq_lite_json",
700
+ "bigbench/reasoning_about_colored_objects",
701
+ "bigbench/intent_recognition",
702
+ "bigbench/contextual_parametric_knowledge_conflicts",
703
  "bigbench/general_knowledge",
 
 
 
 
 
 
 
 
 
704
  "bigbench/strange_stories",
705
+ "bigbench/sports_understanding",
706
+ "bigbench/checkmate_in_one",
707
+ "bigbench/moral_permissibility",
708
+ "bigbench/goal_step_wikihow",
709
+ "bigbench/snarks",
710
  "bigbench/disambiguation_qa",
711
+ "bigbench/real_or_fake_text",
712
+ "bigbench/logical_deduction",
713
+ "bigbench/fact_checker",
 
 
 
714
  "cos_e/v1.0",
715
  "cosmos_qa",
716
  "dream",
 
749
  "rumoureval_2019/RumourEval2019",
750
  "ethos/binary",
751
  "ethos/multilabel",
 
 
 
 
 
 
 
 
752
  "tweet_eval/stance_hillary",
753
+ "tweet_eval/stance_feminist",
754
+ "tweet_eval/stance_climate",
755
+ "tweet_eval/stance_atheism",
756
  "tweet_eval/emoji",
757
+ "tweet_eval/sentiment",
758
+ "tweet_eval/offensive",
759
+ "tweet_eval/irony",
760
  "tweet_eval/hate",
761
+ "tweet_eval/emotion",
762
+ "tweet_eval/stance_abortion",
763
  "discovery/discovery",
 
 
 
 
764
  "pragmeval/squinky-formality",
765
  "pragmeval/squinky-implicature",
766
+ "pragmeval/emobank-dominance",
767
  "pragmeval/squinky-informativeness",
768
+ "pragmeval/emobank-arousal",
769
+ "pragmeval/switchboard",
770
  "pragmeval/mrda",
771
  "pragmeval/verifiability",
772
+ "pragmeval/emobank-valence",
773
+ "pragmeval/emergent",
 
 
774
  "pragmeval/gum",
775
  "pragmeval/stac",
776
+ "pragmeval/persuasiveness-eloquence",
777
+ "pragmeval/persuasiveness-premisetype",
778
+ "pragmeval/persuasiveness-relevance",
779
  "pragmeval/persuasiveness-specificity",
780
  "pragmeval/persuasiveness-strength",
781
  "pragmeval/sarcasm",
782
+ "pragmeval/persuasiveness-claimtype",
783
+ "pragmeval/pdtb",
784
  "silicone/iemocap",
785
  "silicone/sem",
786
  "silicone/oasis",
 
818
  "go_emotions/simplified",
819
  "scicite",
820
  "liar",
821
+ "lexical_relation_classification/K&H+N",
822
+ "lexical_relation_classification/CogALexV",
823
  "lexical_relation_classification/BLESS",
 
824
  "lexical_relation_classification/ROOT09",
825
+ "lexical_relation_classification/EVALution",
 
826
  "linguisticprobing/bigram_shift",
827
  "linguisticprobing/top_constituents",
828
  "linguisticprobing/subj_number",
829
  "linguisticprobing/odd_man_out",
830
+ "linguisticprobing/tree_depth",
 
831
  "linguisticprobing/past_present",
832
  "linguisticprobing/sentence_length",
833
+ "linguisticprobing/obj_number",
834
+ "linguisticprobing/coordination_inversion",
 
 
 
 
 
835
  "crowdflower/political-media-audience",
836
+ "crowdflower/text_emotion",
837
  "crowdflower/economic-news",
838
  "crowdflower/corporate-messaging",
839
+ "crowdflower/airline-sentiment",
840
+ "crowdflower/tweet_global_warming",
841
+ "crowdflower/sentiment_nuclear_power",
842
+ "crowdflower/political-media-bias",
843
+ "crowdflower/political-media-message",
844
  "ethics/commonsense",
845
  "ethics/deontology",
846
  "ethics/justice",
 
904
  "scruples",
905
  "wouldyourather",
906
  "attempto-nli",
 
907
  "defeasible-nli/atomic",
908
+ "defeasible-nli/snli",
909
  "help-nli",
910
  "nli-veridicality-transitivity",
911
  "natural-language-satisfiability",
 
955
  "oasst1_dense_flat/helpfulness",
956
  "PARARULE-Plus",
957
  "mindgames",
 
958
  "universal_dependencies/en_ewt/deprel",
 
959
  "universal_dependencies/en_lines/deprel",
960
+ "universal_dependencies/en_partut/deprel",
961
+ "universal_dependencies/en_gum/deprel",
962
  "ambient",
963
  "path-naturalness-prediction",
964
  "civil_comments/toxicity",
 
1022
  "propsegment/nli",
1023
  "HatemojiBuild",
1024
  "regset",
1025
+ "esci",
1026
+ "chatbot_arena_conversations",
1027
+ "dnd_style_intents",
1028
  "babi_nli",
1029
  "gen_debiased_nli",
1030
  "imppres/presupposition",
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ab88a8f05db76ac64228169372c5ee6b8dde4f2ec01359411d03b5fd2bc386ba
3
  size 737771833
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2e28518532d77001e5030110c5761ec75499fc5fad1a7e81045c7ce0ba0a86e3
3
  size 737771833