{
  "version": "1.0",
  "truncation": null,
  "padding": null,
  "added_tokens": [
    {
      "id": 0,
      "content": "[UNK]",
      "single_word": false,
      "lstrip": false,
      "rstrip": false,
      "normalized": false,
      "special": true
    },
    {
      "id": 1,
      "content": "[CLS]",
      "single_word": false,
      "lstrip": false,
      "rstrip": false,
      "normalized": false,
      "special": true
    },
    {
      "id": 2,
      "content": "[SEP]",
      "single_word": false,
      "lstrip": false,
      "rstrip": false,
      "normalized": false,
      "special": true
    },
    {
      "id": 3,
      "content": "[PAD]",
      "single_word": false,
      "lstrip": false,
      "rstrip": false,
      "normalized": false,
      "special": true
    },
    {
      "id": 4,
      "content": "[MASK]",
      "single_word": false,
      "lstrip": false,
      "rstrip": false,
      "normalized": false,
      "special": true
    }
  ],
  "normalizer": null,
  "pre_tokenizer": {
    "type": "WhitespaceSplit"
  },
  "post_processor": {
    "type": "TemplateProcessing",
    "single": [
      {
        "SpecialToken": {
          "id": "[CLS]",
          "type_id": 0
        }
      },
      {
        "Sequence": {
          "id": "A",
          "type_id": 0
        }
      },
      {
        "SpecialToken": {
          "id": "[SEP]",
          "type_id": 0
        }
      }
    ],
    "pair": [
      {
        "Sequence": {
          "id": "A",
          "type_id": 0
        }
      },
      {
        "Sequence": {
          "id": "B",
          "type_id": 1
        }
      }
    ],
    "special_tokens": {
      "[CLS]": {
        "id": "[CLS]",
        "ids": [
          1
        ],
        "tokens": [
          "[CLS]"
        ]
      },
      "[SEP]": {
        "id": "[SEP]",
        "ids": [
          2
        ],
        "tokens": [
          "[SEP]"
        ]
      }
    }
  },
  "decoder": null,
  "model": {
    "type": "WordLevel",
    "vocab": {
      "[UNK]": 0,
      "[CLS]": 1,
      "[SEP]": 2,
      "[PAD]": 3,
      "[MASK]": 4,
      "[=Branch1]": 5,
      "[Branch1]": 6,
      "[=C]": 7,
      "[Ring1]": 8,
      "[N]": 9,
      "[=O]": 10,
      "[O]": 11,
      "[Ring2]": 12,
      "[=N]": 13,
      "[C@H1]": 14,
      "[C@@H1]": 15,
      "[Branch2]": 16,
      "[F]": 17,
      "[S]": 18,
      "[=Branch2]": 19,
      "[#Branch1]": 20,
      "[NH1+1]": 21,
      "[=Ring1]": 22,
      "[Cl]": 23,
      "[#Branch2]": 24,
      "[NH1]": 25,
      "[NH2+1]": 26,
      "[#C]": 27,
      "[Br]": 28,
      "[#N]": 29,
      "[/C]": 30,
      "[C]": 31,
      "[P]": 32,
      "[C@@]": 33,
      "[C@]": 34,
      "[O-1]": 35,
      "[NH3+1]": 36,
      "[N-1]": 37,
      "[\\C]": 38,
      "[=NH1+1]": 39,
      "[=S]": 40,
      "[I]": 41,
      "[/N]": 42,
      "[\\-Ring1]": 43,
      "[/S]": 44,
      "[/-Ring1]": 45,
      "[/Cl]": 46,
      "[\\N]": 47,
      "[\\Cl]": 48,
      "[=NH2+1]": 49,
      "[/NH1+1]": 50,
      "[/O]": 51,
      "[H]": 52,
      "[Si]": 53,
      "[\\O]": 54,
      "[=Ring2]": 55,
      "[\\-Ring2]": 56,
      "[N+1]": 57,
      "[\\S]": 58,
      "[S-1]": 59,
      "[/-Ring2]": 60,
      "[/C@@H1]": 61,
      "[/C@H1]": 62,
      "[\\C@@H1]": 63,
      "[S@]": 64,
      "[=N+1]": 65,
      "[S@@]": 66,
      "[\\C@H1]": 67,
      "[/NH1]": 68,
      "[B]": 69,
      "[/F]": 70,
      "[CH1]": 71,
      "[CH0]": 72,
      "[\\O-1]": 73,
      "[/O-1]": 74,
      "[\\F]": 75,
      "[/Br]": 76,
      "[/C@]": 77,
      "[\\NH1]": 78,
      "[\\C@]": 79,
      "[\\NH1+1]": 80,
      "[P@@]": 81,
      "[/C@@]": 82,
      "[P@]": 83,
      "[\\Br]": 84,
      "[\\C@@]": 85,
      "[/I]": 86,
      "[S+1]": 87,
      "[N@+1]": 88,
      "[N@@+1]": 89,
      "[/N+1]": 90,
      "[CH2]": 91,
      "[Sn]": 92,
      "[OH0]": 93,
      "[\\I]": 94,
      "[/NH2+1]": 95,
      "[\\N+1]": 96,
      "[=S+1]": 97,
      "[\\NH2+1]": 98,
      "[/OH0]": 99,
      "[=S@]": 100,
      "[=S@@]": 101,
      "[=P]": 102,
      "[P+1]": 103,
      "[/H]": 104,
      "[/P]": 105,
      "[/NH3+1]": 106,
      "[\\H]": 107,
      "[B-1]": 108,
      "[S@@+1]": 109,
      "[\\P]": 110,
      "[C+1]": 111,
      "[S@+1]": 112,
      "[=O+1]": 113,
      "[/Si]": 114,
      "[\\NH3+1]": 115,
      "[N@]": 116,
      "[NH0]": 117,
      "[\\OH0]": 118,
      "[C-1]": 119,
      "[/S@]": 120,
      "[/S@@]": 121,
      "[Si@@]": 122,
      "[P@@H1]": 123,
      "[\\Si]": 124,
      "[/Sn]": 125,
      "[CH1-1]": 126,
      "[Si@]": 127,
      "[/N-1]": 128,
      "[N@@]": 129,
      "[=NH0]": 130,
      "[BH3-1]": 131,
      "[IH2]": 132,
      "[\\B]": 133,
      "[/B]": 134,
      "[Sn@]": 135,
      "[P@+1]": 136,
      "[P@@+1]": 137,
      "[/S+1]": 138,
      "[Sn@@]": 139,
      "[=B]": 140,
      "[=IH2]": 141,
      "[BH1-1]": 142,
      "[P@H1]": 143,
      "[#N+1]": 144,
      "[=P@@]": 145,
      "[=P@]": 146,
      "[O+1]": 147,
      "[SnH2+1]": 148,
      "[SnH4+2]": 149,
      "[/CH0]": 150,
      "[=17O]": 151,
      "[=CH0]": 152,
      "[SnH1]": 153,
      "[\\N-1]": 154,
      "[\\S@]": 155,
      "[P@@H1+1]": 156,
      "[B@-1]": 157,
      "[B@@-1]": 158,
      "[I+1]": 159,
      "[Sn+1]": 160,
      "[Sn+2]": 161,
      "[Br+1]": 162,
      "[\\P@@]": 163,
      "[\\P@]": 164,
      "[\\Sn]": 165,
      "[#S]": 166,
      "[/CH1]": 167,
      "[/NH0]": 168,
      "[17O]": 169,
      "[18OH1]": 170,
      "[=Si]": 171,
      "[BH2-1]": 172,
      "[S@@-1]": 173,
      "[S@@H1]": 174,
      "[Sn+3]": 175,
      "[SnH2]": 176,
      "[SnH6+3]": 177,
      "[\\C-1]": 178,
      "[\\NH0]": 179,
      "[\\S+1]": 180,
      "[#P]": 181,
      "[/CH2]": 182,
      "[/O+1]": 183,
      "[/P@@]": 184,
      "[/P@]": 185,
      "[/Si@@]": 186,
      "[/Si@]": 187,
      "[S@H1]": 188,
      "[SH3]": 189,
      "[SiH2]": 190,
      "[SiH3]": 191,
      "[\\C+1]": 192,
      "[\\S@@]": 193
    },
    "unk_token": "[UNK]"
  }
}