sileod's picture
Upload DebertaV2ForSequenceClassification
bd9453d
raw
history blame
5.52 kB
{
"_name_or_path": "microsoft/mdeberta-v3-base",
"architectures": [
"DebertaV2ForSequenceClassification"
],
"attention_probs_dropout_prob": 0.1,
"classifiers_size": [
3,
3,
3,
3,
3,
3,
3,
3,
3,
3,
3,
3,
3,
3,
3,
3,
3,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
2,
2,
2,
2,
2,
2,
2,
11,
15,
31,
12,
31,
2,
2,
3,
5,
6,
3,
3,
3,
3,
3,
3,
3,
3,
3,
2,
2,
2,
2,
6,
6,
6,
69,
2,
1,
8,
10,
2,
2,
5,
2,
2,
2,
2,
1,
1,
1,
20,
235,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
9,
17
],
"hidden_act": "gelu",
"hidden_dropout_prob": 0.1,
"hidden_size": 768,
"id2label": {
"0": "entailment",
"1": "neutral",
"2": "contradiction"
},
"initializer_range": 0.02,
"intermediate_size": 3072,
"label2id": {
"contradiction": 2,
"entailment": 0,
"neutral": 1
},
"layer_norm_eps": 1e-07,
"max_position_embeddings": 512,
"max_relative_positions": -1,
"model_type": "deberta-v2",
"norm_rel_ebd": "layer_norm",
"num_attention_heads": 12,
"num_hidden_layers": 12,
"pad_token_id": 0,
"pooler_dropout": 0,
"pooler_hidden_act": "gelu",
"pooler_hidden_size": 768,
"pos_att_type": [
"p2c",
"c2p"
],
"position_biased_input": false,
"position_buckets": 256,
"relative_attention": true,
"share_att_key": true,
"tasks": [
"xnli/ur",
"xnli/ar",
"xnli/bg",
"xnli/de",
"xnli/el",
"xnli/zh",
"xnli/vi",
"xnli/tr",
"xnli/th",
"xnli/sw",
"xnli/en",
"xnli/ru",
"xnli/es",
"xnli/fr",
"xnli/hi",
"americas_nli/all_languages",
"multilingual-NLI-26lang-2mil7",
"stsb_multi_mt/pl",
"stsb_multi_mt/it",
"stsb_multi_mt/fr",
"stsb_multi_mt/nl",
"stsb_multi_mt/es",
"stsb_multi_mt/de",
"stsb_multi_mt/en",
"stsb_multi_mt/pt",
"stsb_multi_mt/ru",
"stsb_multi_mt/zh",
"paws-x/zh",
"paws-x/ko",
"paws-x/fr",
"paws-x/es",
"paws-x/de",
"paws-x/en",
"paws-x/ja",
"miam/dihana",
"miam/ilisten",
"miam/loria",
"miam/maptask",
"miam/vm2",
"x-stance/de",
"x-stance/fr",
"multilingual-sentiments/all",
"universal-joy",
"amazon_reviews_multi/all_languages",
"tweet_sentiment_multilingual/all",
"tweet_sentiment_multilingual/portuguese",
"tweet_sentiment_multilingual/italian",
"tweet_sentiment_multilingual/spanish",
"tweet_sentiment_multilingual/german",
"tweet_sentiment_multilingual/french",
"tweet_sentiment_multilingual/english",
"tweet_sentiment_multilingual/arabic",
"tweet_sentiment_multilingual/hindi",
"offenseval_2020/tr",
"offenseval_2020/ar",
"offenseval_2020/da",
"offenseval_2020/gr",
"offenseval_dravidian/tamil",
"offenseval_dravidian/malayalam",
"offenseval_dravidian/kannada",
"MLMA_hate_speech",
"xglue/qam",
"xsum_factuality",
"x-fact",
"xglue/nc",
"xglue/qadsm",
"xglue/qam",
"xglue/wpr",
"xlwic/xlwic_en_ko",
"xlwic/xlwic_fr_fr",
"xlwic/xlwic_it_it",
"xlwic/xlwic_de_de",
"oasst1_dense_flat/quality",
"oasst1_dense_flat/toxicity",
"oasst1_dense_flat/helpfulness",
"language-identification",
"wili_2018",
"exams/multilingual",
"xcsr/X-CSQA-es",
"xcsr/X-CSQA-en",
"xcsr/X-CODAH-ur",
"xcsr/X-CODAH-sw",
"xcsr/X-CODAH-hi",
"xcsr/X-CODAH-vi",
"xcsr/X-CODAH-ar",
"xcsr/X-CODAH-ru",
"xcsr/X-CODAH-pt",
"xcsr/X-CODAH-pl",
"xcsr/X-CODAH-nl",
"xcsr/X-CODAH-jap",
"xcsr/X-CODAH-it",
"xcsr/X-CODAH-fr",
"xcsr/X-CODAH-es",
"xcsr/X-CODAH-de",
"xcsr/X-CODAH-zh",
"xcsr/X-CODAH-en",
"xcsr/X-CSQA-ur",
"xcsr/X-CSQA-sw",
"xcsr/X-CSQA-zh",
"xcsr/X-CSQA-vi",
"xcsr/X-CSQA-ar",
"xcsr/X-CSQA-ru",
"xcsr/X-CSQA-pt",
"xcsr/X-CSQA-pl",
"xcsr/X-CSQA-nl",
"xcsr/X-CSQA-jap",
"xcsr/X-CSQA-it",
"xcsr/X-CSQA-fr",
"xcsr/X-CSQA-de",
"xcsr/X-CSQA-hi",
"xcopa/translation-th",
"xcopa/sw",
"xcopa/et",
"xcopa/ht",
"xcopa/it",
"xcopa/id",
"xcopa/qu",
"xcopa/translation-vi",
"xcopa/zh",
"xcopa/ta",
"xcopa/th",
"xcopa/vi",
"xcopa/tr",
"xcopa/translation-ht",
"xcopa/translation-it",
"xcopa/translation-id",
"xcopa/translation-sw",
"xcopa/translation-zh",
"xcopa/translation-ta",
"xcopa/translation-tr",
"xcopa/translation-et",
"xstory_cloze/ar",
"xstory_cloze/te",
"xstory_cloze/sw",
"xstory_cloze/id",
"xstory_cloze/hi",
"xstory_cloze/es",
"xstory_cloze/my",
"xstory_cloze/ru",
"xstory_cloze/en",
"xstory_cloze/eu",
"xstory_cloze/zh",
"hh-rlhf",
"xglue/ner",
"xglue/pos"
],
"torch_dtype": "float32",
"transformers_version": "4.26.1",
"type_vocab_size": 0,
"vocab_size": 251000
}