{ "version": "1.0", "truncation": null, "padding": null, "added_tokens": [ { "id": 0, "content": "[UNK]", "single_word": false, "lstrip": false, "rstrip": false, "normalized": false, "special": true }, { "id": 1, "content": "[CLS]", "single_word": false, "lstrip": false, "rstrip": false, "normalized": false, "special": true }, { "id": 2, "content": "[SEP]", "single_word": false, "lstrip": false, "rstrip": false, "normalized": false, "special": true }, { "id": 3, "content": "[PAD]", "single_word": false, "lstrip": false, "rstrip": false, "normalized": false, "special": true }, { "id": 4, "content": "[MASK]", "single_word": false, "lstrip": false, "rstrip": false, "normalized": false, "special": true } ], "normalizer": null, "pre_tokenizer": { "type": "WhitespaceSplit" }, "post_processor": { "type": "TemplateProcessing", "single": [ { "SpecialToken": { "id": "[CLS]", "type_id": 0 } }, { "Sequence": { "id": "A", "type_id": 0 } }, { "SpecialToken": { "id": "[SEP]", "type_id": 0 } } ], "pair": [ { "Sequence": { "id": "A", "type_id": 0 } }, { "Sequence": { "id": "B", "type_id": 1 } } ], "special_tokens": { "[CLS]": { "id": "[CLS]", "ids": [ 1 ], "tokens": [ "[CLS]" ] }, "[SEP]": { "id": "[SEP]", "ids": [ 2 ], "tokens": [ "[SEP]" ] } } }, "decoder": null, "model": { "type": "WordLevel", "vocab": { "[UNK]": 0, "[CLS]": 1, "[SEP]": 2, "[PAD]": 3, "[MASK]": 4, "[17O]": 5, "[/S@@]": 6, "[/N]": 7, "[B@-1]": 8, "[18OH1]": 9, "[-/Ring2]": 10, "[=17O]": 11, "[/Br]": 12, "[C@]": 13, "[N@]": 14, "[Branch1]": 15, "[=Si]": 16, "[=Branch2]": 17, "[Cl].[Cl-1]": 18, "[/C]": 19, "[S].[Cl-1]": 20, "[SH1]": 21, "[Sn@]": 22, "[#S]": 23, "[NH1+1]": 24, "[#Branch1]": 25, "[#Branch1].[Cl-1]": 26, "[BH2-1]": 27, "[/NH1+1]": 28, "[=P@]": 29, "[I]": 30, "[/S+1]": 31, "[S-1]": 32, "[=S@+1]": 33, "[NH0]": 34, "[SnH1]": 35, "[F]": 36, "[BH1-1]": 37, "[=Ring2]": 38, "[CH1]": 39, "[=Ring1]": 40, "[/S@]": 41, "[N@+1]": 42, "[Sn+2]": 43, "[Sn+3]": 44, "[#N+1]": 45, "[/F]": 46, "[Si]": 47, "[/O]": 48, "[Sn]": 49, "[P]": 50, "[Ring2]": 51, "[#Branch2].[Cl-1]": 52, "[=P@@]": 53, "[PH1+1]": 54, "[/Cl]": 55, "[C@@]": 56, "[Sn@@]": 57, "[=S@]": 58, "[=S]": 59, "[C@H1]": 60, "[Ring2].[Cl-1]": 61, "[O-1].[Cl-1]": 62, "[N-1]": 63, "[S@@H1]": 64, "[/O-1]": 65, "[/NH1]": 66, "[/C@@H1]": 67, "[B-1]": 68, "[OH0]": 69, "[Ring1]": 70, "[=O+1]": 71, "[O+1]": 72, "[=S@@+1]": 73, "[=S+1]": 74, "[/I]": 75, "[Si@@]": 76, "[=C]": 77, "[P+1]": 78, "[I].[Cl-1]": 79, "[Branch1].[Cl-1]": 80, "[P@@]": 81, "[Branch1].[C]": 82, "[Br+1]": 83, "[=B]": 84, "[CH1-1]": 85, "[Sn+1]": 86, "[Si-1]": 87, "[/N+1]": 88, "[N+1]": 89, "[CH2]": 90, "[SiH2]": 91, "[/Sn]": 92, "[=PH1]": 93, "[=P+1]": 94, "[S@@]": 95, "[/C@H1]": 96, "[N@@+1]": 97, "[=S@@]": 98, "[/NH2+1]": 99, "[=N+1]": 100, "[=C].[Cl-1]": 101, "[=NH2+1]": 102, "[=SH1]": 103, "[/Si]": 104, "[#N]": 105, "[=N]": 106, "[/OH0]": 107, "[S]": 108, "[Branch2].[Cl-1]": 109, "[N@H1+1]": 110, "[NH2+1]": 111, "[Br]": 112, "[O-1]": 113, "[=Branch1]": 114, "[CH0]": 115, "[=Se]": 116, "[#Branch2]": 117, "[#C]": 118, "[=Branch1].[Cl-1]": 119, "[S@]": 120, "[SiH1]": 121, "[SiH3]": 122, "[#C].[Cl-1]": 123, "[#C-1]": 124, "[S+1]": 125, "[Cl]": 126, "[#N].[Cl-1]": 127, "[/C@@]": 128, "[B@@-1]": 129, "[F].[Cl-1]": 130, "[Br].[Cl-1]": 131, "[=Branch2].[Cl-1]": 132, "[=P]": 133, "[C].[Cl-1]": 134, "[/B]": 135, "[PH1]": 136, "[C-1]": 137, "[Si@@H1]": 138, "[/P]": 139, "[=O].[Cl-1]": 140, "[O].[Cl-1]": 141, "[N@@]": 142, "[P].[Cl-1]": 143, "[S@+1]": 144, "[Branch2]": 145, "[I+1]": 146, "[-/Ring1]": 147, "[/S]": 148, "[P@]": 149, "[P@@+1]": 150, "[=Sn]": 151, "[NH3+1]": 152, "[=N-1]": 153, "[=NH1+1]": 154, "[NH1]": 155, "[Si@]": 156, "[N@@H1+1]": 157, "[N]": 158, "[Ring1].[Cl-1]": 159, "[BH3-1]": 160, "[B]": 161, "[/C@]": 162, "[C]": 163, "[Si@H1]": 164, "[O]": 165, "[=NH0]": 166, "[P@+1]": 167, "[=N].[Cl-1]": 168, "[/N-1]": 169, "[S@@+1]": 170, "[=O]": 171, "[C@@H1]": 172 }, "unk_token": "[UNK]" } }