{
"_name_or_path": "google/owlvit-base-patch32",
"architectures": [
"OwlViTForObjectDetection"
],
"id2label": {
"0": 6,
"1": 7,
"10": 16,
"11": 17,
"12": 18,
"13": 19,
"14": 20,
"15": 21,
"16": 22,
"17": 23,
"18": 24,
"19": 25,
"2": 8,
"20": 26,
"21": 27,
"22": 28,
"23": 29,
"24": 30,
"25": 31,
"26": 32,
"27": 33,
"28": 34,
"29": 35,
"3": 9,
"30": 36,
"31": 37,
"32": 38,
"33": 40,
"34": 41,
"35": 42,
"36": 43,
"37": 44,
"38": 45,
"39": 46,
"4": 10,
"40": 47,
"41": 48,
"5": 11,
"6": 12,
"7": 13,
"8": 14,
"9": 15
},
"initializer_factor": 1.0,
"label2id": {
"6": "0",
"7": "1",
"8": "2",
"9": "3",
"10": "4",
"11": "5",
"12": "6",
"13": "7",
"14": "8",
"15": "9",
"16": "10",
"17": "11",
"18": "12",
"19": "13",
"20": "14",
"21": "15",
"22": "16",
"23": "17",
"24": "18",
"25": "19",
"26": "20",
"27": "21",
"28": "22",
"29": "23",
"30": "24",
"31": "25",
"32": "26",
"33": "27",
"34": "28",
"35": "29",
"36": "30",
"37": "31",
"38": "32",
"40": "33",
"41": "34",
"42": "35",
"43": "36",
"44": "37",
"45": "38",
"46": "39",
"47": "40",
"48": "41"
},
"logit_scale_init_value": 2.6592,
"model_type": "owlvit",
"projection_dim": 512,
"text_config": {
"bos_token_id": 0,
"dropout": 0.0,
"eos_token_id": 2,
"max_length": 16,
"model_type": "owlvit_text_model",
"pad_token_id": 1
},
"text_config_dict": null,
"torch_dtype": "float32",
"transformers_version": "4.38.2",
"vision_config": {
"dropout": 0.0,
"model_type": "owlvit_vision_model"
},
"vision_config_dict": null
}