{
"_name_or_path": "microsoft/mdeberta-v3-base",
"architectures": [
"DebertaV2ForSequenceClassification"
],
"attention_probs_dropout_prob": 0.1,
"classifiers_size": [
3,
3,
3,
3,
3,
3,
3,
3,
3,
3,
3,
3,
3,
3,
3,
3,
3,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
2,
2,
2,
2,
2,
2,
2,
15,
31,
12,
31,
11,
2,
2,
3,
5,
6,
3,
3,
3,
3,
3,
3,
3,
3,
3,
2,
2,
2,
2,
6,
6,
6,
69,
2,
1,
8,
10,
2,
2,
5,
2,
2,
2,
2,
1,
1,
1,
20,
235,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
9,
17,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
18,
1
],
"hidden_act": "gelu",
"hidden_dropout_prob": 0.1,
"hidden_size": 768,
"id2label": {
"0": "entailment",
"1": "neutral",
"2": "contradiction"
},
"initializer_range": 0.02,
"intermediate_size": 3072,
"label2id": {
"contradiction": 2,
"entailment": 0,
"neutral": 1
},
"layer_norm_eps": 1e-07,
"max_position_embeddings": 512,
"max_relative_positions": -1,
"model_type": "deberta-v2",
"norm_rel_ebd": "layer_norm",
"num_attention_heads": 12,
"num_hidden_layers": 12,
"pad_token_id": 0,
"pooler_dropout": 0,
"pooler_hidden_act": "gelu",
"pooler_hidden_size": 768,
"pos_att_type": [
"p2c",
"c2p"
],
"position_biased_input": false,
"position_buckets": 256,
"relative_attention": true,
"share_att_key": true,
"tasks": [
"xnli/es",
"xnli/ar",
"xnli/bg",
"xnli/de",
"xnli/el",
"xnli/en",
"xnli/fr",
"xnli/hi",
"xnli/ru",
"xnli/sw",
"xnli/th",
"xnli/tr",
"xnli/ur",
"xnli/vi",
"xnli/zh",
"americas_nli/all_languages",
"multilingual-NLI-26lang-2mil7",
"stsb_multi_mt/zh",
"stsb_multi_mt/pt",
"stsb_multi_mt/pl",
"stsb_multi_mt/nl",
"stsb_multi_mt/it",
"stsb_multi_mt/fr",
"stsb_multi_mt/es",
"stsb_multi_mt/de",
"stsb_multi_mt/en",
"stsb_multi_mt/ru",
"paws-x/ko",
"paws-x/zh",
"paws-x/fr",
"paws-x/es",
"paws-x/de",
"paws-x/en",
"paws-x/ja",
"miam/ilisten",
"miam/vm2",
"miam/maptask",
"miam/loria",
"miam/dihana",
"x-stance/fr",
"x-stance/de",
"multilingual-sentiments/all",
"universal-joy",
"amazon_reviews_multi/all_languages",
"tweet_sentiment_multilingual/all",
"tweet_sentiment_multilingual/spanish",
"tweet_sentiment_multilingual/portuguese",
"tweet_sentiment_multilingual/italian",
"tweet_sentiment_multilingual/arabic",
"tweet_sentiment_multilingual/german",
"tweet_sentiment_multilingual/french",
"tweet_sentiment_multilingual/english",
"tweet_sentiment_multilingual/hindi",
"offenseval_2020/da",
"offenseval_2020/gr",
"offenseval_2020/tr",
"offenseval_2020/ar",
"offenseval_dravidian/tamil",
"offenseval_dravidian/malayalam",
"offenseval_dravidian/kannada",
"MLMA_hate_speech",
"xglue/qam",
"xsum_factuality",
"x-fact",
"xglue/nc",
"xglue/qadsm",
"xglue/qam",
"xglue/wpr",
"xlwic/xlwic_de_de",
"xlwic/xlwic_fr_fr",
"xlwic/xlwic_en_ko",
"xlwic/xlwic_it_it",
"oasst1_dense_flat/quality",
"oasst1_dense_flat/toxicity",
"oasst1_dense_flat/helpfulness",
"language-identification",
"wili_2018",
"exams/multilingual",
"xcsr/X-CODAH-en",
"xcsr/X-CSQA-ur",
"xcsr/X-CSQA-sw",
"xcsr/X-CSQA-hi",
"xcsr/X-CSQA-vi",
"xcsr/X-CSQA-ar",
"xcsr/X-CSQA-ru",
"xcsr/X-CSQA-jap",
"xcsr/X-CSQA-nl",
"xcsr/X-CODAH-zh",
"xcsr/X-CSQA-it",
"xcsr/X-CSQA-fr",
"xcsr/X-CSQA-es",
"xcsr/X-CSQA-de",
"xcsr/X-CSQA-zh",
"xcsr/X-CSQA-en",
"xcsr/X-CSQA-pl",
"xcsr/X-CODAH-de",
"xcsr/X-CSQA-pt",
"xcsr/X-CODAH-fr",
"xcsr/X-CODAH-es",
"xcsr/X-CODAH-ur",
"xcsr/X-CODAH-sw",
"xcsr/X-CODAH-hi",
"xcsr/X-CODAH-ar",
"xcsr/X-CODAH-vi",
"xcsr/X-CODAH-pt",
"xcsr/X-CODAH-pl",
"xcsr/X-CODAH-nl",
"xcsr/X-CODAH-jap",
"xcsr/X-CODAH-it",
"xcsr/X-CODAH-ru",
"xcopa/ta",
"xcopa/vi",
"xcopa/tr",
"xcopa/th",
"xcopa/zh",
"xcopa/et",
"xcopa/qu",
"xcopa/id",
"xcopa/it",
"xcopa/ht",
"xcopa/translation-et",
"xcopa/sw",
"xcopa/translation-ht",
"xcopa/translation-th",
"xcopa/translation-id",
"xcopa/translation-sw",
"xcopa/translation-zh",
"xcopa/translation-ta",
"xcopa/translation-tr",
"xcopa/translation-vi",
"xcopa/translation-it",
"xstory_cloze/id",
"xstory_cloze/hi",
"xstory_cloze/ar",
"xstory_cloze/es",
"xstory_cloze/en",
"xstory_cloze/ru",
"xstory_cloze/te",
"xstory_cloze/sw",
"xstory_cloze/zh",
"xstory_cloze/eu",
"xstory_cloze/my",
"hh-rlhf",
"xglue/ner",
"xglue/pos",
"universal_dependencies/ja_gsd/pos",
"universal_dependencies/fr_pud/pos",
"universal_dependencies/fr_partut/pos",
"universal_dependencies/fr_gsd/pos",
"universal_dependencies/fr_ftb/pos",
"universal_dependencies/fr_fqb/pos",
"universal_dependencies/fi_tdt/pos",
"universal_dependencies/fi_pud/pos",
"universal_dependencies/fi_ood/pos",
"universal_dependencies/fi_ftb/pos",
"universal_dependencies/fo_oft/pos",
"universal_dependencies/fo_farpahc/pos",
"universal_dependencies/et_ewt/pos",
"universal_dependencies/et_edt/pos",
"universal_dependencies/myv_jr/pos",
"universal_dependencies/en_pud/pos",
"universal_dependencies/en_pronouns/pos",
"universal_dependencies/en_partut/pos",
"universal_dependencies/fr_sequoia/pos",
"universal_dependencies/fr_spoken/pos",
"universal_dependencies/gl_ctg/pos",
"universal_dependencies/gl_treegal/pos",
"universal_dependencies/it_postwita/pos",
"universal_dependencies/it_partut/pos",
"universal_dependencies/it_isdt/pos",
"universal_dependencies/ga_idt/pos",
"universal_dependencies/id_pud/pos",
"universal_dependencies/id_gsd/pos",
"universal_dependencies/id_csui/pos",
"universal_dependencies/is_pud/pos",
"universal_dependencies/is_icepahc/pos",
"universal_dependencies/en_lines/pos",
"universal_dependencies/hu_szeged/pos",
"universal_dependencies/hi_hdtb/pos",
"universal_dependencies/qhe_hiencs/pos",
"universal_dependencies/he_htb/pos",
"universal_dependencies/el_gdt/pos",
"universal_dependencies/got_proiel/pos",
"universal_dependencies/de_pud/pos",
"universal_dependencies/de_lit/pos",
"universal_dependencies/de_hdt/pos",
"universal_dependencies/de_gsd/pos",
"universal_dependencies/hi_pud/pos",
"universal_dependencies/en_gumreddit/pos",
"universal_dependencies/en_ewt/pos",
"universal_dependencies/it_pud/pos",
"universal_dependencies/bho_bhtb/pos",
"universal_dependencies/be_hse/pos",
"universal_dependencies/eu_bdt/pos",
"universal_dependencies/bm_crb/pos",
"universal_dependencies/aii_as/pos",
"universal_dependencies/hy_armtdp/pos",
"universal_dependencies/ar_pud/pos",
"universal_dependencies/ar_padt/pos",
"universal_dependencies/br_keb/pos",
"universal_dependencies/ar_nyuad/pos",
"universal_dependencies/grc_proiel/pos",
"universal_dependencies/grc_perseus/pos",
"universal_dependencies/am_att/pos",
"universal_dependencies/sq_tsa/pos",
"universal_dependencies/aqz_tudet/pos",
"universal_dependencies/akk_riao/pos",
"universal_dependencies/akk_pisandub/pos",
"universal_dependencies/af_afribooms/pos",
"universal_dependencies/apu_ufpa/pos",
"universal_dependencies/bg_btb/pos",
"universal_dependencies/bxr_bdt/pos",
"universal_dependencies/yue_hk/pos",
"universal_dependencies/en_esl/pos",
"universal_dependencies/nl_lassysmall/pos",
"universal_dependencies/nl_alpino/pos",
"universal_dependencies/da_ddt/pos",
"universal_dependencies/cs_pud/pos",
"universal_dependencies/cs_pdt/pos",
"universal_dependencies/cs_fictree/pos",
"universal_dependencies/cs_cltt/pos",
"universal_dependencies/cs_cac/pos",
"universal_dependencies/hr_set/pos",
"universal_dependencies/cop_scriptorium/pos",
"universal_dependencies/lzh_kyoto/pos",
"universal_dependencies/ckt_hse/pos",
"universal_dependencies/zh_pud/pos",
"universal_dependencies/zh_hk/pos",
"universal_dependencies/zh_gsdsimp/pos",
"universal_dependencies/zh_gsd/pos",
"universal_dependencies/zh_cfl/pos",
"universal_dependencies/ca_ancora/pos",
"universal_dependencies/en_gum/pos",
"universal_dependencies/ja_bccwj/pos",
"universal_dependencies/it_twittiro/pos",
"universal_dependencies/wo_wtb/pos",
"universal_dependencies/gun_thomas/pos",
"universal_dependencies/mdf_jr/pos",
"universal_dependencies/myu_tudet/pos",
"universal_dependencies/pcm_nsc/pos",
"universal_dependencies/nyq_aha/pos",
"universal_dependencies/sme_giella/pos",
"universal_dependencies/no_bokmaal/pos",
"universal_dependencies/no_nynorsk/pos",
"universal_dependencies/no_nynorsklia/pos",
"universal_dependencies/cu_proiel/pos",
"universal_dependencies/fro_srcmf/pos",
"universal_dependencies/orv_rnc/pos",
"universal_dependencies/orv_torot/pos",
"universal_dependencies/otk_tonqq/pos",
"universal_dependencies/fa_perdt/pos",
"universal_dependencies/fa_seraji/pos",
"universal_dependencies/pl_lfg/pos",
"universal_dependencies/pl_pdb/pos",
"universal_dependencies/pl_pud/pos",
"universal_dependencies/gun_dooley/pos",
"universal_dependencies/mr_ufal/pos",
"universal_dependencies/it_vit/pos",
"universal_dependencies/mt_mudt/pos",
"universal_dependencies/ja_modern/pos",
"universal_dependencies/ja_pud/pos",
"universal_dependencies/krl_kkpp/pos",
"universal_dependencies/kk_ktb/pos",
"universal_dependencies/kfm_aha/pos",
"universal_dependencies/koi_uh/pos",
"universal_dependencies/kpv_ikdp/pos",
"universal_dependencies/kpv_lattice/pos",
"universal_dependencies/ko_gsd/pos",
"universal_dependencies/pt_bosque/pos",
"universal_dependencies/ko_kaist/pos",
"universal_dependencies/kmr_mg/pos",
"universal_dependencies/la_ittb/pos",
"universal_dependencies/la_llct/pos",
"universal_dependencies/la_perseus/pos",
"universal_dependencies/la_proiel/pos",
"universal_dependencies/lv_lvtb/pos",
"universal_dependencies/lt_alksnis/pos",
"universal_dependencies/lt_hse/pos",
"universal_dependencies/olo_kkpp/pos",
"universal_dependencies/ko_pud/pos",
"universal_dependencies/yo_ytb/pos",
"universal_dependencies/pt_gsd/pos",
"universal_dependencies/ro_nonstandard/pos",
"universal_dependencies/tl_trg/pos",
"universal_dependencies/tl_ugnayan/pos",
"universal_dependencies/ta_mwtt/pos",
"universal_dependencies/ta_ttb/pos",
"universal_dependencies/te_mtg/pos",
"universal_dependencies/th_pud/pos",
"universal_dependencies/tpn_tudet/pos",
"universal_dependencies/qtd_sagt/pos",
"universal_dependencies/tr_boun/pos",
"universal_dependencies/tr_gb/pos",
"universal_dependencies/tr_imst/pos",
"universal_dependencies/tr_pud/pos",
"universal_dependencies/uk_iu/pos",
"universal_dependencies/hsb_ufal/pos",
"universal_dependencies/ur_udtb/pos",
"universal_dependencies/ug_udt/pos",
"universal_dependencies/vi_vtb/pos",
"universal_dependencies/wbp_ufal/pos",
"universal_dependencies/cy_ccg/pos",
"universal_dependencies/gsw_uzh/pos",
"universal_dependencies/pt_pud/pos",
"universal_dependencies/sv_talbanken/pos",
"universal_dependencies/sv_lines/pos",
"universal_dependencies/ro_rrt/pos",
"universal_dependencies/ro_simonero/pos",
"universal_dependencies/ru_gsd/pos",
"universal_dependencies/ru_pud/pos",
"universal_dependencies/ru_syntagrus/pos",
"universal_dependencies/ru_taiga/pos",
"universal_dependencies/sa_ufal/pos",
"universal_dependencies/sa_vedic/pos",
"universal_dependencies/gd_arcosg/pos",
"universal_dependencies/sv_pud/pos",
"universal_dependencies/sr_set/pos",
"universal_dependencies/sk_snk/pos",
"universal_dependencies/sl_ssj/pos",
"universal_dependencies/sl_sst/pos",
"universal_dependencies/soj_aha/pos",
"universal_dependencies/ajp_madar/pos",
"universal_dependencies/es_ancora/pos",
"universal_dependencies/es_gsd/pos",
"universal_dependencies/es_pud/pos",
"universal_dependencies/swl_sslc/pos",
"universal_dependencies/sms_giellagas/pos",
"universal_dependencies/gv_cadhan/pos",
"oasst1_pairwise_rlhf_reward"
],
"torch_dtype": "float32",
"transformers_version": "4.26.1",
"type_vocab_size": 0,
"vocab_size": 251000
}