ner-document-context / config.json
jamarticus's picture
YurtsAI/ner-document-context
4ababee verified
raw
history blame
19.7 kB
{
"architectures": [
"SpanMarkerModel"
],
"encoder": {
"_name_or_path": "roberta-large",
"add_cross_attention": false,
"architectures": [
"RobertaForMaskedLM"
],
"attention_probs_dropout_prob": 0.1,
"bad_words_ids": null,
"begin_suppress_tokens": null,
"bos_token_id": 0,
"chunk_size_feed_forward": 0,
"classifier_dropout": null,
"cross_attention_hidden_size": null,
"decoder_start_token_id": null,
"diversity_penalty": 0.0,
"do_sample": false,
"early_stopping": false,
"encoder_no_repeat_ngram_size": 0,
"eos_token_id": 2,
"exponential_decay_length_penalty": null,
"finetuning_task": null,
"forced_bos_token_id": null,
"forced_eos_token_id": null,
"hidden_act": "gelu",
"hidden_dropout_prob": 0.1,
"hidden_size": 1024,
"id2label": {
"0": "O",
"1": "B-GENERAL__organization-showorganization",
"2": "I-GENERAL__organization-showorganization",
"3": "B-GENERAL__product-airplane",
"4": "I-GENERAL__product-airplane",
"5": "B-GENERAL__art-film",
"6": "I-GENERAL__art-film",
"7": "B-GENERAL__building-theater",
"8": "I-GENERAL__building-theater",
"9": "B-GENERAL__art-other",
"10": "I-GENERAL__art-other",
"11": "B-GENERAL__other-disease",
"12": "I-GENERAL__other-disease",
"13": "B-GENERAL__person-artist/author",
"14": "I-GENERAL__person-artist/author",
"15": "B-GENERAL__other-biologything",
"16": "I-GENERAL__other-biologything",
"17": "B-GENERAL__organization-media/newspaper",
"18": "I-GENERAL__organization-media/newspaper",
"19": "B-GENERAL__product-food",
"20": "I-GENERAL__product-food",
"21": "B-GENERAL__building-hotel",
"22": "I-GENERAL__building-hotel",
"23": "B-GENERAL__other-chemicalthing",
"24": "I-GENERAL__other-chemicalthing",
"25": "B-GENERAL__organization-other",
"26": "I-GENERAL__organization-other",
"27": "B-GENERAL__organization-religion",
"28": "I-GENERAL__organization-religion",
"29": "B-GENERAL__building-sportsfacility",
"30": "I-GENERAL__building-sportsfacility",
"31": "B-GENERAL__person-other",
"32": "I-GENERAL__person-other",
"33": "B-GENERAL__building-hospital",
"34": "I-GENERAL__building-hospital",
"35": "B-GENERAL__product-weapon",
"36": "I-GENERAL__product-weapon",
"37": "B-GENERAL__person-politician",
"38": "I-GENERAL__person-politician",
"39": "B-GENERAL__product-software",
"40": "I-GENERAL__product-software",
"41": "B-GENERAL__person-scholar",
"42": "I-GENERAL__person-scholar",
"43": "B-DATETIME__relative",
"44": "I-DATETIME__relative",
"45": "B-GENERAL__other-law",
"46": "I-GENERAL__other-law",
"47": "B-GENERAL__event-other",
"48": "I-GENERAL__event-other",
"49": "B-GENERAL__location-bodiesofwater",
"50": "I-GENERAL__location-bodiesofwater",
"51": "B-GENERAL__organization-government/governmentagency",
"52": "I-GENERAL__organization-government/governmentagency",
"53": "B-DATETIME__range",
"54": "I-DATETIME__range",
"55": "B-GENERAL__product-ship",
"56": "I-GENERAL__product-ship",
"57": "B-GENERAL__other-livingthing",
"58": "I-GENERAL__other-livingthing",
"59": "B-GENERAL__product-car",
"60": "I-GENERAL__product-car",
"61": "B-GENERAL__product-game",
"62": "I-GENERAL__product-game",
"63": "B-DATETIME__authored",
"64": "I-DATETIME__authored",
"65": "B-GENERAL__building-other",
"66": "I-GENERAL__building-other",
"67": "B-GENERAL__other-language",
"68": "I-GENERAL__other-language",
"69": "B-GENERAL__other-astronomything",
"70": "I-GENERAL__other-astronomything",
"71": "B-GENERAL__building-library",
"72": "I-GENERAL__building-library",
"73": "B-GENERAL__product-train",
"74": "I-GENERAL__product-train",
"75": "B-GENERAL__location-other",
"76": "I-GENERAL__location-other",
"77": "B-GENERAL__building-airport",
"78": "I-GENERAL__building-airport",
"79": "B-GENERAL__other-god",
"80": "I-GENERAL__other-god",
"81": "B-GENERAL__art-painting",
"82": "I-GENERAL__art-painting",
"83": "B-GENERAL__other-educationaldegree",
"84": "I-GENERAL__other-educationaldegree",
"85": "B-GENERAL__art-music",
"86": "I-GENERAL__art-music",
"87": "B-GENERAL__art-writtenart",
"88": "I-GENERAL__art-writtenart",
"89": "B-GENERAL__building-restaurant",
"90": "I-GENERAL__building-restaurant",
"91": "B-GENERAL__art-broadcastprogram",
"92": "I-GENERAL__art-broadcastprogram",
"93": "B-GENERAL__location-island",
"94": "I-GENERAL__location-island",
"95": "B-DATETIME__absolute",
"96": "I-DATETIME__absolute",
"97": "B-GENERAL__organization-sportsteam",
"98": "I-GENERAL__organization-sportsteam",
"99": "B-GENERAL__event-attack/battle/war/militaryconflict",
"100": "I-GENERAL__event-attack/battle/war/militaryconflict",
"101": "B-GENERAL__product-other",
"102": "I-GENERAL__product-other",
"103": "B-GENERAL__other-award",
"104": "I-GENERAL__other-award",
"105": "B-GENERAL__location-GPE",
"106": "I-GENERAL__location-GPE",
"107": "B-GENERAL__person-soldier",
"108": "I-GENERAL__person-soldier",
"109": "B-GENERAL__location-mountain",
"110": "I-GENERAL__location-mountain",
"111": "B-GENERAL__event-sportsevent",
"112": "I-GENERAL__event-sportsevent",
"113": "B-GENERAL__location-road/railway/highway/transit",
"114": "I-GENERAL__location-road/railway/highway/transit",
"115": "B-GENERAL__other-medical",
"116": "I-GENERAL__other-medical",
"117": "B-GENERAL__organization-education",
"118": "I-GENERAL__organization-education",
"119": "B-GENERAL__organization-company",
"120": "I-GENERAL__organization-company",
"121": "B-GENERAL__other-currency",
"122": "I-GENERAL__other-currency",
"123": "B-GENERAL__location-park",
"124": "I-GENERAL__location-park"
},
"initializer_range": 0.02,
"intermediate_size": 4096,
"is_decoder": false,
"is_encoder_decoder": false,
"label2id": {
"B-DATETIME__absolute": 95,
"B-DATETIME__authored": 63,
"B-DATETIME__range": 53,
"B-DATETIME__relative": 43,
"B-GENERAL__art-broadcastprogram": 91,
"B-GENERAL__art-film": 5,
"B-GENERAL__art-music": 85,
"B-GENERAL__art-other": 9,
"B-GENERAL__art-painting": 81,
"B-GENERAL__art-writtenart": 87,
"B-GENERAL__building-airport": 77,
"B-GENERAL__building-hospital": 33,
"B-GENERAL__building-hotel": 21,
"B-GENERAL__building-library": 71,
"B-GENERAL__building-other": 65,
"B-GENERAL__building-restaurant": 89,
"B-GENERAL__building-sportsfacility": 29,
"B-GENERAL__building-theater": 7,
"B-GENERAL__event-attack/battle/war/militaryconflict": 99,
"B-GENERAL__event-other": 47,
"B-GENERAL__event-sportsevent": 111,
"B-GENERAL__location-GPE": 105,
"B-GENERAL__location-bodiesofwater": 49,
"B-GENERAL__location-island": 93,
"B-GENERAL__location-mountain": 109,
"B-GENERAL__location-other": 75,
"B-GENERAL__location-park": 123,
"B-GENERAL__location-road/railway/highway/transit": 113,
"B-GENERAL__organization-company": 119,
"B-GENERAL__organization-education": 117,
"B-GENERAL__organization-government/governmentagency": 51,
"B-GENERAL__organization-media/newspaper": 17,
"B-GENERAL__organization-other": 25,
"B-GENERAL__organization-religion": 27,
"B-GENERAL__organization-showorganization": 1,
"B-GENERAL__organization-sportsteam": 97,
"B-GENERAL__other-astronomything": 69,
"B-GENERAL__other-award": 103,
"B-GENERAL__other-biologything": 15,
"B-GENERAL__other-chemicalthing": 23,
"B-GENERAL__other-currency": 121,
"B-GENERAL__other-disease": 11,
"B-GENERAL__other-educationaldegree": 83,
"B-GENERAL__other-god": 79,
"B-GENERAL__other-language": 67,
"B-GENERAL__other-law": 45,
"B-GENERAL__other-livingthing": 57,
"B-GENERAL__other-medical": 115,
"B-GENERAL__person-artist/author": 13,
"B-GENERAL__person-other": 31,
"B-GENERAL__person-politician": 37,
"B-GENERAL__person-scholar": 41,
"B-GENERAL__person-soldier": 107,
"B-GENERAL__product-airplane": 3,
"B-GENERAL__product-car": 59,
"B-GENERAL__product-food": 19,
"B-GENERAL__product-game": 61,
"B-GENERAL__product-other": 101,
"B-GENERAL__product-ship": 55,
"B-GENERAL__product-software": 39,
"B-GENERAL__product-train": 73,
"B-GENERAL__product-weapon": 35,
"I-DATETIME__absolute": 96,
"I-DATETIME__authored": 64,
"I-DATETIME__range": 54,
"I-DATETIME__relative": 44,
"I-GENERAL__art-broadcastprogram": 92,
"I-GENERAL__art-film": 6,
"I-GENERAL__art-music": 86,
"I-GENERAL__art-other": 10,
"I-GENERAL__art-painting": 82,
"I-GENERAL__art-writtenart": 88,
"I-GENERAL__building-airport": 78,
"I-GENERAL__building-hospital": 34,
"I-GENERAL__building-hotel": 22,
"I-GENERAL__building-library": 72,
"I-GENERAL__building-other": 66,
"I-GENERAL__building-restaurant": 90,
"I-GENERAL__building-sportsfacility": 30,
"I-GENERAL__building-theater": 8,
"I-GENERAL__event-attack/battle/war/militaryconflict": 100,
"I-GENERAL__event-other": 48,
"I-GENERAL__event-sportsevent": 112,
"I-GENERAL__location-GPE": 106,
"I-GENERAL__location-bodiesofwater": 50,
"I-GENERAL__location-island": 94,
"I-GENERAL__location-mountain": 110,
"I-GENERAL__location-other": 76,
"I-GENERAL__location-park": 124,
"I-GENERAL__location-road/railway/highway/transit": 114,
"I-GENERAL__organization-company": 120,
"I-GENERAL__organization-education": 118,
"I-GENERAL__organization-government/governmentagency": 52,
"I-GENERAL__organization-media/newspaper": 18,
"I-GENERAL__organization-other": 26,
"I-GENERAL__organization-religion": 28,
"I-GENERAL__organization-showorganization": 2,
"I-GENERAL__organization-sportsteam": 98,
"I-GENERAL__other-astronomything": 70,
"I-GENERAL__other-award": 104,
"I-GENERAL__other-biologything": 16,
"I-GENERAL__other-chemicalthing": 24,
"I-GENERAL__other-currency": 122,
"I-GENERAL__other-disease": 12,
"I-GENERAL__other-educationaldegree": 84,
"I-GENERAL__other-god": 80,
"I-GENERAL__other-language": 68,
"I-GENERAL__other-law": 46,
"I-GENERAL__other-livingthing": 58,
"I-GENERAL__other-medical": 116,
"I-GENERAL__person-artist/author": 14,
"I-GENERAL__person-other": 32,
"I-GENERAL__person-politician": 38,
"I-GENERAL__person-scholar": 42,
"I-GENERAL__person-soldier": 108,
"I-GENERAL__product-airplane": 4,
"I-GENERAL__product-car": 60,
"I-GENERAL__product-food": 20,
"I-GENERAL__product-game": 62,
"I-GENERAL__product-other": 102,
"I-GENERAL__product-ship": 56,
"I-GENERAL__product-software": 40,
"I-GENERAL__product-train": 74,
"I-GENERAL__product-weapon": 36,
"O": 0
},
"layer_norm_eps": 1e-05,
"length_penalty": 1.0,
"max_length": 20,
"max_position_embeddings": 514,
"min_length": 0,
"model_type": "roberta",
"no_repeat_ngram_size": 0,
"num_attention_heads": 16,
"num_beam_groups": 1,
"num_beams": 1,
"num_hidden_layers": 24,
"num_return_sequences": 1,
"output_attentions": false,
"output_hidden_states": false,
"output_scores": false,
"pad_token_id": 1,
"position_embedding_type": "absolute",
"prefix": null,
"problem_type": null,
"pruned_heads": {},
"remove_invalid_values": false,
"repetition_penalty": 1.0,
"return_dict": true,
"return_dict_in_generate": false,
"sep_token_id": null,
"suppress_tokens": null,
"task_specific_params": null,
"temperature": 1.0,
"tf_legacy_loss": false,
"tie_encoder_decoder": false,
"tie_word_embeddings": true,
"tokenizer_class": null,
"top_k": 50,
"top_p": 1.0,
"torch_dtype": null,
"torchscript": false,
"transformers_version": "4.42.1",
"type_vocab_size": 1,
"typical_p": 1.0,
"use_bfloat16": false,
"use_cache": true,
"vocab_size": 50272
},
"entity_max_length": 11,
"id2label": {
"0": "O",
"1": "DATETIME__absolute",
"2": "DATETIME__authored",
"3": "DATETIME__range",
"4": "DATETIME__relative",
"5": "GENERAL__art-broadcastprogram",
"6": "GENERAL__art-film",
"7": "GENERAL__art-music",
"8": "GENERAL__art-other",
"9": "GENERAL__art-painting",
"10": "GENERAL__art-writtenart",
"11": "GENERAL__building-airport",
"12": "GENERAL__building-hospital",
"13": "GENERAL__building-hotel",
"14": "GENERAL__building-library",
"15": "GENERAL__building-other",
"16": "GENERAL__building-restaurant",
"17": "GENERAL__building-sportsfacility",
"18": "GENERAL__building-theater",
"19": "GENERAL__event-attack/battle/war/militaryconflict",
"20": "GENERAL__event-other",
"21": "GENERAL__event-sportsevent",
"22": "GENERAL__location-GPE",
"23": "GENERAL__location-bodiesofwater",
"24": "GENERAL__location-island",
"25": "GENERAL__location-mountain",
"26": "GENERAL__location-other",
"27": "GENERAL__location-park",
"28": "GENERAL__location-road/railway/highway/transit",
"29": "GENERAL__organization-company",
"30": "GENERAL__organization-education",
"31": "GENERAL__organization-government/governmentagency",
"32": "GENERAL__organization-media/newspaper",
"33": "GENERAL__organization-other",
"34": "GENERAL__organization-religion",
"35": "GENERAL__organization-showorganization",
"36": "GENERAL__organization-sportsteam",
"37": "GENERAL__other-astronomything",
"38": "GENERAL__other-award",
"39": "GENERAL__other-biologything",
"40": "GENERAL__other-chemicalthing",
"41": "GENERAL__other-currency",
"42": "GENERAL__other-disease",
"43": "GENERAL__other-educationaldegree",
"44": "GENERAL__other-god",
"45": "GENERAL__other-language",
"46": "GENERAL__other-law",
"47": "GENERAL__other-livingthing",
"48": "GENERAL__other-medical",
"49": "GENERAL__person-artist/author",
"50": "GENERAL__person-other",
"51": "GENERAL__person-politician",
"52": "GENERAL__person-scholar",
"53": "GENERAL__person-soldier",
"54": "GENERAL__product-airplane",
"55": "GENERAL__product-car",
"56": "GENERAL__product-food",
"57": "GENERAL__product-game",
"58": "GENERAL__product-other",
"59": "GENERAL__product-ship",
"60": "GENERAL__product-software",
"61": "GENERAL__product-train",
"62": "GENERAL__product-weapon"
},
"id2reduced_id": {
"0": 0,
"1": 35,
"2": 35,
"3": 54,
"4": 54,
"5": 6,
"6": 6,
"7": 18,
"8": 18,
"9": 8,
"10": 8,
"11": 42,
"12": 42,
"13": 49,
"14": 49,
"15": 39,
"16": 39,
"17": 32,
"18": 32,
"19": 56,
"20": 56,
"21": 13,
"22": 13,
"23": 40,
"24": 40,
"25": 33,
"26": 33,
"27": 34,
"28": 34,
"29": 17,
"30": 17,
"31": 50,
"32": 50,
"33": 12,
"34": 12,
"35": 62,
"36": 62,
"37": 51,
"38": 51,
"39": 60,
"40": 60,
"41": 52,
"42": 52,
"43": 4,
"44": 4,
"45": 46,
"46": 46,
"47": 20,
"48": 20,
"49": 23,
"50": 23,
"51": 31,
"52": 31,
"53": 3,
"54": 3,
"55": 59,
"56": 59,
"57": 47,
"58": 47,
"59": 55,
"60": 55,
"61": 57,
"62": 57,
"63": 2,
"64": 2,
"65": 15,
"66": 15,
"67": 45,
"68": 45,
"69": 37,
"70": 37,
"71": 14,
"72": 14,
"73": 61,
"74": 61,
"75": 26,
"76": 26,
"77": 11,
"78": 11,
"79": 44,
"80": 44,
"81": 9,
"82": 9,
"83": 43,
"84": 43,
"85": 7,
"86": 7,
"87": 10,
"88": 10,
"89": 16,
"90": 16,
"91": 5,
"92": 5,
"93": 24,
"94": 24,
"95": 1,
"96": 1,
"97": 36,
"98": 36,
"99": 19,
"100": 19,
"101": 58,
"102": 58,
"103": 38,
"104": 38,
"105": 22,
"106": 22,
"107": 53,
"108": 53,
"109": 25,
"110": 25,
"111": 21,
"112": 21,
"113": 28,
"114": 28,
"115": 48,
"116": 48,
"117": 30,
"118": 30,
"119": 29,
"120": 29,
"121": 41,
"122": 41,
"123": 27,
"124": 27
},
"label2id": {
"DATETIME__absolute": 1,
"DATETIME__authored": 2,
"DATETIME__range": 3,
"DATETIME__relative": 4,
"GENERAL__art-broadcastprogram": 5,
"GENERAL__art-film": 6,
"GENERAL__art-music": 7,
"GENERAL__art-other": 8,
"GENERAL__art-painting": 9,
"GENERAL__art-writtenart": 10,
"GENERAL__building-airport": 11,
"GENERAL__building-hospital": 12,
"GENERAL__building-hotel": 13,
"GENERAL__building-library": 14,
"GENERAL__building-other": 15,
"GENERAL__building-restaurant": 16,
"GENERAL__building-sportsfacility": 17,
"GENERAL__building-theater": 18,
"GENERAL__event-attack/battle/war/militaryconflict": 19,
"GENERAL__event-other": 20,
"GENERAL__event-sportsevent": 21,
"GENERAL__location-GPE": 22,
"GENERAL__location-bodiesofwater": 23,
"GENERAL__location-island": 24,
"GENERAL__location-mountain": 25,
"GENERAL__location-other": 26,
"GENERAL__location-park": 27,
"GENERAL__location-road/railway/highway/transit": 28,
"GENERAL__organization-company": 29,
"GENERAL__organization-education": 30,
"GENERAL__organization-government/governmentagency": 31,
"GENERAL__organization-media/newspaper": 32,
"GENERAL__organization-other": 33,
"GENERAL__organization-religion": 34,
"GENERAL__organization-showorganization": 35,
"GENERAL__organization-sportsteam": 36,
"GENERAL__other-astronomything": 37,
"GENERAL__other-award": 38,
"GENERAL__other-biologything": 39,
"GENERAL__other-chemicalthing": 40,
"GENERAL__other-currency": 41,
"GENERAL__other-disease": 42,
"GENERAL__other-educationaldegree": 43,
"GENERAL__other-god": 44,
"GENERAL__other-language": 45,
"GENERAL__other-law": 46,
"GENERAL__other-livingthing": 47,
"GENERAL__other-medical": 48,
"GENERAL__person-artist/author": 49,
"GENERAL__person-other": 50,
"GENERAL__person-politician": 51,
"GENERAL__person-scholar": 52,
"GENERAL__person-soldier": 53,
"GENERAL__product-airplane": 54,
"GENERAL__product-car": 55,
"GENERAL__product-food": 56,
"GENERAL__product-game": 57,
"GENERAL__product-other": 58,
"GENERAL__product-ship": 59,
"GENERAL__product-software": 60,
"GENERAL__product-train": 61,
"GENERAL__product-weapon": 62,
"O": 0
},
"marker_max_length": 128,
"max_next_context": 3,
"max_prev_context": 3,
"model_max_length": 256,
"model_max_length_default": 512,
"model_type": "span-marker",
"span_marker_version": "1.5.0",
"torch_dtype": "float32",
"trained_with_document_context": true,
"transformers_version": "4.42.1",
"vocab_size": 50272
}