{
  "_name_or_path": "dsfsi/zabantu-ven-120m",
  "architectures": [
    "XLMRobertaForTokenClassification"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "B-ADJ",
    "1": "B-ADP",
    "2": "B-ADV",
    "3": "B-AUX",
    "4": "B-CCONJ",
    "5": "B-DET",
    "6": "B-INTJ",
    "7": "B-NOUN",
    "8": "B-NUM",
    "9": "B-PART",
    "10": "B-PREP",
    "11": "B-PRON",
    "12": "B-PROPN",
    "13": "B-PUNCT",
    "14": "B-SCONJ",
    "15": "B-SYM",
    "16": "B-VERB",
    "17": "I-ADJ",
    "18": "I-ADV",
    "19": "I-NOUN",
    "20": "I-PREP",
    "21": "I-VERB",
    "22": "OUT"
  },
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "label2id": {
    "B-ADJ": 0,
    "B-ADP": 1,
    "B-ADV": 2,
    "B-AUX": 3,
    "B-CCONJ": 4,
    "B-DET": 5,
    "B-INTJ": 6,
    "B-NOUN": 7,
    "B-NUM": 8,
    "B-PART": 9,
    "B-PREP": 10,
    "B-PRON": 11,
    "B-PROPN": 12,
    "B-PUNCT": 13,
    "B-SCONJ": 14,
    "B-SYM": 15,
    "B-VERB": 16,
    "I-ADJ": 17,
    "I-ADV": 18,
    "I-NOUN": 19,
    "I-PREP": 20,
    "I-VERB": 21,
    "OUT": 22
  },
  "layer_norm_eps": 1e-05,
  "max_length": 512,
  "max_position_embeddings": 514,
  "model_type": "xlm-roberta",
  "num_attention_heads": 6,
  "num_hidden_layers": 8,
  "output_past": true,
  "pad_token_id": 1,
  "position_embedding_type": "absolute",
  "torch_dtype": "float32",
  "transformers_version": "4.41.2",
  "type_vocab_size": 1,
  "use_cache": true,
  "vocab_size": 85002
}