{ "architectures": [ "XLMRobertaForTokenClassification" ], "attention_probs_dropout_prob": 0.1, "bos_token_id": 0, "classifier_dropout": null, "eos_token_id": 2, "hidden_act": "gelu", "hidden_dropout_prob": 0.1, "hidden_size": 768, "id2label": { "0": "ADJ", "1": "ADJ+PART", "2": "ADP", "3": "ADV", "4": "ADV+PART", "5": "AUX", "6": "AUX+PART", "7": "B-ADJ", "8": "B-ADJ+PART", "9": "B-ADP", "10": "B-ADP+ADP", "11": "B-ADV", "12": "B-AUX", "13": "B-AUX+PART", "14": "B-AUX+PART+VERB", "15": "B-CCONJ", "16": "B-DET", "17": "B-INTJ", "18": "B-NOUN", "19": "B-NOUN+PART", "20": "B-NUM", "21": "B-PART", "22": "B-PRON", "23": "B-PRON+AUX", "24": "B-PROPN", "25": "B-PROPN+PART", "26": "B-PUNCT", "27": "B-SCONJ", "28": "B-SYM", "29": "B-VERB", "30": "B-VERB+ADV", "31": "B-VERB+PART", "32": "B-X", "33": "CCONJ", "34": "DET", "35": "I-ADJ", "36": "I-ADJ+PART", "37": "I-ADP", "38": "I-ADP+ADP", "39": "I-ADV", "40": "I-AUX", "41": "I-AUX+PART", "42": "I-AUX+PART+VERB", "43": "I-CCONJ", "44": "I-DET", "45": "I-INTJ", "46": "I-NOUN", "47": "I-NOUN+PART", "48": "I-NUM", "49": "I-PART", "50": "I-PRON", "51": "I-PRON+AUX", "52": "I-PROPN", "53": "I-PROPN+PART", "54": "I-PUNCT", "55": "I-SCONJ", "56": "I-SYM", "57": "I-VERB", "58": "I-VERB+ADV", "59": "I-VERB+PART", "60": "I-X", "61": "INTJ", "62": "NOUN", "63": "NOUN+ADP", "64": "NOUN+PART", "65": "NUM", "66": "PART", "67": "PRON", "68": "PRON+AUX", "69": "PRON+VERB", "70": "PROPN", "71": "PUNCT", "72": "SCONJ", "73": "SYM", "74": "VERB", "75": "VERB+PART", "76": "X" }, "initializer_range": 0.02, "intermediate_size": 3072, "label2id": { "ADJ": 0, "ADJ+PART": 1, "ADP": 2, "ADV": 3, "ADV+PART": 4, "AUX": 5, "AUX+PART": 6, "B-ADJ": 7, "B-ADJ+PART": 8, "B-ADP": 9, "B-ADP+ADP": 10, "B-ADV": 11, "B-AUX": 12, "B-AUX+PART": 13, "B-AUX+PART+VERB": 14, "B-CCONJ": 15, "B-DET": 16, "B-INTJ": 17, "B-NOUN": 18, "B-NOUN+PART": 19, "B-NUM": 20, "B-PART": 21, "B-PRON": 22, "B-PRON+AUX": 23, "B-PROPN": 24, "B-PROPN+PART": 25, "B-PUNCT": 26, "B-SCONJ": 27, "B-SYM": 28, "B-VERB": 29, "B-VERB+ADV": 30, "B-VERB+PART": 31, "B-X": 32, "CCONJ": 33, "DET": 34, "I-ADJ": 35, "I-ADJ+PART": 36, "I-ADP": 37, "I-ADP+ADP": 38, "I-ADV": 39, "I-AUX": 40, "I-AUX+PART": 41, "I-AUX+PART+VERB": 42, "I-CCONJ": 43, "I-DET": 44, "I-INTJ": 45, "I-NOUN": 46, "I-NOUN+PART": 47, "I-NUM": 48, "I-PART": 49, "I-PRON": 50, "I-PRON+AUX": 51, "I-PROPN": 52, "I-PROPN+PART": 53, "I-PUNCT": 54, "I-SCONJ": 55, "I-SYM": 56, "I-VERB": 57, "I-VERB+ADV": 58, "I-VERB+PART": 59, "I-X": 60, "INTJ": 61, "NOUN": 62, "NOUN+ADP": 63, "NOUN+PART": 64, "NUM": 65, "PART": 66, "PRON": 67, "PRON+AUX": 68, "PRON+VERB": 69, "PROPN": 70, "PUNCT": 71, "SCONJ": 72, "SYM": 73, "VERB": 74, "VERB+PART": 75, "X": 76 }, "layer_norm_eps": 1e-05, "max_position_embeddings": 514, "model_type": "xlm-roberta", "num_attention_heads": 12, "num_hidden_layers": 12, "output_past": true, "pad_token_id": 1, "position_embedding_type": "absolute", "task_specific_params": { "upos_multiword": { "ADJ+PART": { "elses": [ "else", "s" ], "others": [ "other", "s" ] }, "ADP+ADP": { "OUTTA": [ "OUT", "TA" ] }, "ADV+PART": { "into": [ "in", "to" ] }, "AUX+PART": { "Aren't": [ "Are", "n't" ], "CANNOT": [ "CAN", "NOT" ], "CANT": [ "CA", "NT" ], "Can't": [ "Ca", "n't" ], "DON'T": [ "DO", "N'T" ], "Don't": [ "Do", "n't" ], "Dont": [ "Do", "nt" ], "WASN'T": [ "WAS", "N'T" ], "ain't": [ "ai", "n't" ], "aint": [ "ai", "nt" ], "aren't": [ "are", "n't" ], "arent": [ "are", "nt" ], "can't": [ "ca", "n't" ], "cannot": [ "can", "not" ], "cant": [ "ca", "nt" ], "can\u2019t": [ "ca", "n\u2019t" ], "couldn't": [ "could", "n't" ], "couldnt": [ "could", "nt" ], "didn't": [ "did", "n't" ], "didnt": [ "did", "nt" ], "didn\u2019t": [ "did", "n\u2019t" ], "doesn't": [ "does", "n't" ], "doesnt": [ "does", "nt" ], "don't": [ "do", "n't" ], "dont": [ "do", "nt" ], "don\u2019t": [ "do", "n\u2019t" ], "haven't": [ "have", "n't" ], "havn't": [ "hav", "n't" ], "isn't": [ "is", "n't" ], "wasent": [ "wase", "nt" ], "wasn't": [ "was", "n't" ], "won't": [ "wo", "n't" ], "wont": [ "wo", "nt" ], "won\u2019t": [ "wo", "n\u2019t" ], "wouldn't": [ "would", "n't" ], "wouldnt": [ "would", "nt" ] }, "AUX+PART+VERB": { "dunno": [ "du", "n", "no" ] }, "NOUN+ADP": { "sorta": [ "sort", "a" ] }, "NOUN+PART": { "DAUGHTERS": [ "DAUGHTER", "S" ], "Kids": [ "Kid", "s" ], "Smokers": [ "Smoker", "s" ], "Travelers": [ "Traveler", "s" ], "animals": [ "animal", "s" ], "bakers": [ "baker", "s" ], "beginners": [ "beginner", "s" ], "bettas": [ "betta", "s" ], "boys": [ "boy", "s" ], "friends": [ "friend", "s" ], "grandmas": [ "grandma", "s" ], "humans": [ "human", "s" ], "manufacturers": [ "manufacturer", "s" ], "owners": [ "owner", "s" ], "scammers": [ "scammer", "s" ], "teams": [ "team", "s" ], "visitors": [ "visitor", "s" ], "workers": [ "worker", "s" ] }, "PRON+AUX": { "ITS": [ "IT", "S" ], "Im": [ "I", "m" ], "Your": [ "You", "r" ], "id": [ "i", "d" ], "im": [ "i", "m" ], "its": [ "it", "s" ], "their": [ "thei", "r" ], "there": [ "the", "re" ], "ur": [ "u", "r" ], "your": [ "you", "r" ], "youre": [ "you", "re" ] }, "PRON+VERB": { "im": [ "i", "m" ], "its": [ "it", "s" ] }, "PROPN+PART": { "Friscos": [ "Frisco", "s" ], "Mortons": [ "Morton", "s" ] }, "VERB+ADV": { "c'mon": [ "c'm", "on" ] }, "VERB+PART": { "Gotta": [ "Got", "ta" ], "aren't": [ "are", "n't" ], "doesn't": [ "does", "n't" ], "doesnt": [ "does", "nt" ], "don't": [ "do", "n't" ], "gonna": [ "gon", "na" ], "gotta": [ "got", "ta" ], "isn't": [ "is", "n't" ], "wana": [ "wan", "a" ], "wasn't": [ "was", "n't" ] } } }, "tokenizer_class": "XLMRobertaTokenizerFast", "torch_dtype": "float32", "transformers_version": "4.11.3", "type_vocab_size": 1, "use_cache": true, "vocab_size": 250002 }