NisargRhino committed on
Commit
4dfd039
1 Parent(s): 2876e91

Upload 7 files

Browse files
model_drug_classification/.gitattributes ADDED
@@ -0,0 +1 @@
 
 
1
+ *.safetensors filter=lfs diff=lfs merge=lfs -text
model_drug_classification/config.json ADDED
@@ -0,0 +1,28 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "seyonec/ChemBERTa-zinc-base-v1",
3
+ "architectures": [
4
+ "RobertaForMaskedLM"
5
+ ],
6
+ "attention_probs_dropout_prob": 0.1,
7
+ "bos_token_id": 0,
8
+ "classifier_dropout": null,
9
+ "eos_token_id": 2,
10
+ "hidden_act": "gelu",
11
+ "hidden_dropout_prob": 0.1,
12
+ "hidden_size": 768,
13
+ "initializer_range": 0.02,
14
+ "intermediate_size": 3072,
15
+ "layer_norm_eps": 1e-05,
16
+ "max_position_embeddings": 514,
17
+ "model_type": "roberta",
18
+ "num_attention_heads": 12,
19
+ "num_hidden_layers": 6,
20
+ "output_past": true,
21
+ "pad_token_id": 1,
22
+ "position_embedding_type": "absolute",
23
+ "torch_dtype": "float32",
24
+ "transformers_version": "4.45.2",
25
+ "type_vocab_size": 1,
26
+ "use_cache": true,
27
+ "vocab_size": 767
28
+ }
model_drug_classification/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d811fa78203fb2280611ed8ce713d6a5965ca596ba9618451f597fae4436b201
3
+ size 134
tokenizer_drug_classification/merges.txt ADDED
@@ -0,0 +1,507 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ #version: 0.2
2
+ c c
3
+ C C
4
+ ( =
5
+ cc c
6
+ ] (
7
+ @ @
8
+ C c
9
+ N C
10
+ cc ccc
11
+ n c
12
+ CC C
13
+ ) [
14
+ N H
15
+ + ]
16
+ C O
17
+ cc cc
18
+ N c
19
+ C l
20
+ O C
21
+ CC N
22
+ ) (
23
+ CO c
24
+ ( -
25
+ ( [
26
+ CC CC
27
+ C N
28
+ ) (=
29
+ - ]
30
+ CC O
31
+ n H
32
+ n n
33
+ -] )
34
+ + ](
35
+ CC c
36
+ ) =
37
+ s c
38
+ C S
39
+ n cc
40
+ B r
41
+ C NC
42
+ n nc
43
+ N Cc
44
+ o c
45
+ 1 2
46
+ CC CCC
47
+ +] (=
48
+ CO C
49
+ C n
50
+ 2 1
51
+ CCC N
52
+ c n
53
+ O c
54
+ CC OC
55
+ +] [
56
+ CCO CC
57
+ c nc
58
+ CC S
59
+ ]( [
60
+ CCO c
61
+ ccc s
62
+ ccc nc
63
+ N CC
64
+ O CC
65
+ ( /
66
+ CCC O
67
+ @ ]
68
+ CS c
69
+ ccc o
70
+ @@ ]
71
+ c nn
72
+ CC n
73
+ CC NC
74
+ 3 2
75
+ cccc n
76
+ 2 3
77
+ n o
78
+ +] )
79
+ n oc
80
+ ) /
81
+ c sc
82
+ c s
83
+ cc ncc
84
+ ccc n
85
+ CC Cc
86
+ S c
87
+ S CC
88
+ cc nc
89
+ S C
90
+ O Cc
91
+ cc sc
92
+ cc n
93
+ N NC
94
+ O CO
95
+ @ ](
96
+ nc nc
97
+ N S
98
+ N CCc
99
+ @@ ](
100
+ C Nc
101
+ O CCO
102
+ = [
103
+ n cccc
104
+ c ncc
105
+ N N
106
+ CCCC CC
107
+ N CCC
108
+ o n
109
+ +]( [
110
+ CC CCN
111
+ CCC NC
112
+ nc n
113
+ -] )[
114
+ ncc s
115
+ +] =
116
+ CS C
117
+ CCC n
118
+ s ccc
119
+ S Cc
120
+ CCS c
121
+ cnc n
122
+ ( \
123
+ CO CC
124
+ 3 4
125
+ nn nn
126
+ n ccc
127
+ CO Cc
128
+ cc oc
129
+ )( [
130
+ ncc n
131
+ CCC Oc
132
+ n cccn
133
+ cc nn
134
+ CN S
135
+ @@] (=
136
+ CCS C
137
+ 4 3
138
+ CO CCN
139
+ F c
140
+ CCS CC
141
+ CCC S
142
+ cncc n
143
+ -]) =
144
+ / [
145
+ @] (=
146
+ c oc
147
+ c nnc
148
+ CS CC
149
+ nn n
150
+ N Nc
151
+ nn nc
152
+ N CCN
153
+ nnc n
154
+ +] )[
155
+ CCCC O
156
+ nc nn
157
+ CC l
158
+ CC Nc
159
+ Cl c
160
+ CS Cc
161
+ O CCCO
162
+ cnn n
163
+ NCC NC
164
+ o ccc
165
+ o nc
166
+ CCN S
167
+ O CCC
168
+ )= [
169
+ CCC OC
170
+ CCCC NC
171
+ CO CCn
172
+ ncc nc
173
+ F C
174
+ CCCC CCC
175
+ cs cc
176
+ 1 3
177
+ N O
178
+ cn ccc
179
+ (\ [
180
+ O CCN
181
+ n s
182
+ n sc
183
+ CO CCNC
184
+ N CCOc
185
+ CCCC n
186
+ csc n
187
+ NCC n
188
+ NCCC n
189
+ +] )(
190
+ NCC Cc
191
+ CCCC c
192
+ cc on
193
+ sc nc
194
+ CCC Nc
195
+ nc sc
196
+ N n
197
+ N CCCN
198
+ no nc
199
+ Br c
200
+ N CCS
201
+ S CCC
202
+ CO CCO
203
+ nnc s
204
+ CN Cc
205
+ s cc
206
+ s ccn
207
+ N CCCC
208
+ (= [
209
+ CO CCOc
210
+ 3 1
211
+ oc nc
212
+ ns nc
213
+ O CCc
214
+ CCO Cc
215
+ O S
216
+ nc oc
217
+ cnc nc
218
+ CO CCC
219
+ NCC Nc
220
+ CCC l
221
+ nn sc
222
+ CS CCS
223
+ CO CCCNC
224
+ S CCc
225
+ c o
226
+ CCCC S
227
+ OCC NC
228
+ N CCO
229
+ CCC Sc
230
+ +] \
231
+ -]) /
232
+ CS CN
233
+ CCCC Oc
234
+ \ [
235
+ CCCCC N
236
+ CO CCCN
237
+ CS CCO
238
+ ) -
239
+ O CCOc
240
+ ccc nn
241
+ CO N
242
+ CCO CCN
243
+ N CCCO
244
+ S CCN
245
+ +] /
246
+ CCC SCC
247
+ OCC n
248
+ cs nn
249
+ @ ]([
250
+ C Br
251
+ 4 5
252
+ cc no
253
+ O CCCC
254
+ ]( /
255
+ )( /
256
+ CS CCC
257
+ s nc
258
+ @@ ]([
259
+ CO CCc
260
+ O N
261
+ CCC SC
262
+ 2 4
263
+ +] )([
264
+ O COC
265
+ ccnc n
266
+ N CCSc
267
+ CCC OCC
268
+ CCN CC
269
+ nn cc
270
+ CCCCC NC
271
+ (/ [
272
+ 5 4
273
+ nc on
274
+ CO CCCC
275
+ N CCOC
276
+ CCCC OC
277
+ CS CCN
278
+ ncc o
279
+ CCS Cc
280
+ nnc o
281
+ CO NC
282
+ s nnc
283
+ CO CCOC
284
+ 4 2
285
+ nc ncc
286
+ CCN Cc
287
+ N CCOCC
288
+ N NS
289
+ O CCCN
290
+ N OCc
291
+ OCC Cc
292
+ ) \
293
+ N CCCCn
294
+ O CCCNC
295
+ S CCOc
296
+ CCC F
297
+ CCCN S
298
+ OCC Nc
299
+ CCCC l
300
+ CCO CCO
301
+ NCCC OC
302
+ O CCS
303
+ S CCS
304
+ o cc
305
+ CN CCc
306
+ CCCCC n
307
+ CO CCCn
308
+ CN CC
309
+ CCO CCCNC
310
+ NCCC NC
311
+ Cl C
312
+ -] )(
313
+ -]) =[
314
+ O CCOC
315
+ cn oc
316
+ cnc s
317
+ NC N
318
+ CCCC Sc
319
+ CN n
320
+ CCO CCC
321
+ NCCC Sc
322
+ S CCO
323
+ CCCC Nc
324
+ CCO NC
325
+ N OC
326
+ CO CO
327
+ CN N
328
+ CN CCN
329
+ -] [
330
+ CCOCC NC
331
+ NCCC S
332
+ NCCC Oc
333
+ N CCCCC
334
+ O CCSc
335
+ ] /
336
+ OC n
337
+ CS CCNC
338
+ N OCC
339
+ O CCCn
340
+ cc s
341
+ +] =[
342
+ OC N
343
+ (- [
344
+ CCO CCCC
345
+ CCCCC O
346
+ CCOCC S
347
+ CCOCC n
348
+ CCS CCC
349
+ COCC Nc
350
+ NCCN S
351
+ S CCCS
352
+ s n
353
+ cc nnc
354
+ CC Br
355
+ CO CCOCC
356
+ CO CCSc
357
+ Cl Cc
358
+ CCCC Cc
359
+ -] /
360
+ CS CCCNC
361
+ cnc o
362
+ cnn s
363
+ )/ [
364
+ COCCN S
365
+ O CCCOc
366
+ ] [
367
+ CO CCCOc
368
+ CS CCCN
369
+ NCC CCN
370
+ CO CCS
371
+ CO CCCNc
372
+ CCO CCOc
373
+ CCCCC S
374
+ N CCSC
375
+ O P
376
+ S CCCC
377
+ CO n
378
+ CO CCCOC
379
+ CCCC OCC
380
+ CCCC CCNC
381
+ CS CCc
382
+ CS CCn
383
+ Br Cc
384
+ NCCCN S
385
+ 3 5
386
+ S CCn
387
+ o ncc
388
+ CO P
389
+ Cl CC
390
+ -] =[
391
+ CCO P
392
+ CS CCCCNC
393
+ cn sn
394
+ OCCO CCOCCO
395
+ NCCC Nc
396
+ OCCC l
397
+ OCCC Sc
398
+ C I
399
+ N CCCCCC
400
+ N CCSCC
401
+ N CCOCc
402
+ O CCCCC
403
+ O CCNS
404
+ O CCSCc
405
+ S CN
406
+ S Cn
407
+ S CCNC
408
+ S CCCOc
409
+ c onc
410
+ CO COc
411
+ CCCC CCCCCCC
412
+ CCO CCOC
413
+ CCOCC Cc
414
+ OCC CCN
415
+ CCCO Cc
416
+ NCCC OCC
417
+ ns cc
418
+ NCCCC l
419
+ NCCCC Oc
420
+ 4 1
421
+ C H
422
+ N SC
423
+ O H
424
+ O n
425
+ O CCOCC
426
+ O CCSCC
427
+ O CCCS
428
+ S N
429
+ S CCCc
430
+ ]( /[
431
+ CCC SCc
432
+ CO S
433
+ CO CCCCC
434
+ CCCC CCCC
435
+ CCCC CCO
436
+ CCCC CCS
437
+ CN CCC
438
+ -] )([
439
+ CCO CCCN
440
+ CCO CCCNc
441
+ CCO CCOCc
442
+ +]( -
443
+ CS CCOc
444
+ CS CCSC
445
+ CCCN CC
446
+ cn sc
447
+ CCOCC Nc
448
+ CCS S
449
+ CCS CCOC
450
+ OCC F
451
+ OCC Br
452
+ NCCS Cc
453
+ ( #
454
+ - [
455
+ 3 12
456
+ F CCC
457
+ I C
458
+ I c
459
+ N Oc
460
+ O NC
461
+ O CCSC
462
+ O CCCCn
463
+ O CCOCCS
464
+ S H
465
+ S CCOC
466
+ S CCCO
467
+ S CCSc
468
+ s sc
469
+ s snc
470
+ CCC Br
471
+ CCC NCc
472
+ CO CCCCN
473
+ CO CCCS
474
+ CO CCSCc
475
+ CO CCOCCNC
476
+ Cl CCCSc
477
+ CCCC CCN
478
+ CCCC SC
479
+ CCCC OCc
480
+ CCO CCOCC
481
+ CCO CCCn
482
+ nn ccc
483
+ -]) \
484
+ +]( /
485
+ +]( /[
486
+ CS CCCC
487
+ CS CCOC
488
+ CS CCCNc
489
+ Br CC
490
+ Br CCC
491
+ 12 3
492
+ CCCCC OC
493
+ CCCCC Oc
494
+ CCCCC Sc
495
+ CCOCC Sc
496
+ CCS CCOc
497
+ NN N
498
+ NCCC SC
499
+ CCCCN S
500
+ COCCN Cc
501
+ OCCC Nc
502
+ OCCC SC
503
+ NO CCc
504
+ COCCO CCN
505
+ NCCO CCO
506
+ CCOCCO CCOCC
507
+ OCCOCCOCCO CCO
tokenizer_drug_classification/special_tokens_map.json ADDED
@@ -0,0 +1,51 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token": {
3
+ "content": "<s>",
4
+ "lstrip": false,
5
+ "normalized": true,
6
+ "rstrip": false,
7
+ "single_word": false
8
+ },
9
+ "cls_token": {
10
+ "content": "<s>",
11
+ "lstrip": false,
12
+ "normalized": true,
13
+ "rstrip": false,
14
+ "single_word": false
15
+ },
16
+ "eos_token": {
17
+ "content": "</s>",
18
+ "lstrip": false,
19
+ "normalized": true,
20
+ "rstrip": false,
21
+ "single_word": false
22
+ },
23
+ "mask_token": {
24
+ "content": "<mask>",
25
+ "lstrip": true,
26
+ "normalized": false,
27
+ "rstrip": false,
28
+ "single_word": false
29
+ },
30
+ "pad_token": {
31
+ "content": "<pad>",
32
+ "lstrip": false,
33
+ "normalized": true,
34
+ "rstrip": false,
35
+ "single_word": false
36
+ },
37
+ "sep_token": {
38
+ "content": "</s>",
39
+ "lstrip": false,
40
+ "normalized": true,
41
+ "rstrip": false,
42
+ "single_word": false
43
+ },
44
+ "unk_token": {
45
+ "content": "<unk>",
46
+ "lstrip": false,
47
+ "normalized": true,
48
+ "rstrip": false,
49
+ "single_word": false
50
+ }
51
+ }
tokenizer_drug_classification/tokenizer_config.json ADDED
@@ -0,0 +1,57 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "add_prefix_space": false,
3
+ "added_tokens_decoder": {
4
+ "0": {
5
+ "content": "<s>",
6
+ "lstrip": false,
7
+ "normalized": true,
8
+ "rstrip": false,
9
+ "single_word": false,
10
+ "special": true
11
+ },
12
+ "1": {
13
+ "content": "<pad>",
14
+ "lstrip": false,
15
+ "normalized": true,
16
+ "rstrip": false,
17
+ "single_word": false,
18
+ "special": true
19
+ },
20
+ "2": {
21
+ "content": "</s>",
22
+ "lstrip": false,
23
+ "normalized": true,
24
+ "rstrip": false,
25
+ "single_word": false,
26
+ "special": true
27
+ },
28
+ "3": {
29
+ "content": "<unk>",
30
+ "lstrip": false,
31
+ "normalized": true,
32
+ "rstrip": false,
33
+ "single_word": false,
34
+ "special": true
35
+ },
36
+ "4": {
37
+ "content": "<mask>",
38
+ "lstrip": true,
39
+ "normalized": false,
40
+ "rstrip": false,
41
+ "single_word": false,
42
+ "special": true
43
+ }
44
+ },
45
+ "bos_token": "<s>",
46
+ "clean_up_tokenization_spaces": false,
47
+ "cls_token": "<s>",
48
+ "eos_token": "</s>",
49
+ "errors": "replace",
50
+ "mask_token": "<mask>",
51
+ "max_len": 512,
52
+ "model_max_length": 512,
53
+ "pad_token": "<pad>",
54
+ "sep_token": "</s>",
55
+ "tokenizer_class": "RobertaTokenizer",
56
+ "unk_token": "<unk>"
57
+ }
tokenizer_drug_classification/vocab.json ADDED
@@ -0,0 +1,769 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "!": 5,
3
+ "\"": 6,
4
+ "#": 7,
5
+ "$": 8,
6
+ "%": 9,
7
+ "&": 10,
8
+ "'": 11,
9
+ "(": 12,
10
+ "(#": 712,
11
+ "(-": 283,
12
+ "(-[": 602,
13
+ "(/": 324,
14
+ "(/[": 530,
15
+ "(=": 263,
16
+ "(=[": 467,
17
+ "([": 284,
18
+ "(\\": 381,
19
+ "(\\[": 438,
20
+ ")": 13,
21
+ ")(": 281,
22
+ ")(/": 514,
23
+ ")(=": 287,
24
+ ")([": 388,
25
+ ")-": 497,
26
+ ")/": 339,
27
+ ")/[": 622,
28
+ ")=": 295,
29
+ ")=[": 427,
30
+ ")[": 272,
31
+ ")\\": 551,
32
+ "*": 14,
33
+ "+": 15,
34
+ "+]": 274,
35
+ "+](": 293,
36
+ "+](-": 701,
37
+ "+](/": 743,
38
+ "+](/[": 744,
39
+ "+](=": 306,
40
+ "+]([": 368,
41
+ "+])": 337,
42
+ "+])(": 448,
43
+ "+])([": 522,
44
+ "+])[": 413,
45
+ "+]/": 504,
46
+ "+]=": 374,
47
+ "+]=[": 600,
48
+ "+][": 314,
49
+ "+]\\": 489,
50
+ ",": 16,
51
+ "-": 17,
52
+ "-[": 713,
53
+ "-]": 288,
54
+ "-])": 292,
55
+ "-])(": 571,
56
+ "-])([": 697,
57
+ "-])/": 490,
58
+ "-])=": 402,
59
+ "-])=[": 572,
60
+ "-])[": 372,
61
+ "-])\\": 742,
62
+ "-]/": 618,
63
+ "-]=[": 649,
64
+ "-][": 588,
65
+ ".": 18,
66
+ "/": 19,
67
+ "/[": 403,
68
+ "0": 20,
69
+ "1": 21,
70
+ "12": 304,
71
+ "123": 750,
72
+ "13": 435,
73
+ "2": 22,
74
+ "21": 309,
75
+ "23": 335,
76
+ "24": 521,
77
+ "3": 23,
78
+ "31": 469,
79
+ "312": 714,
80
+ "32": 333,
81
+ "34": 383,
82
+ "35": 644,
83
+ "4": 24,
84
+ "41": 679,
85
+ "42": 543,
86
+ "43": 396,
87
+ "45": 510,
88
+ "5": 25,
89
+ "54": 531,
90
+ "6": 26,
91
+ "7": 27,
92
+ "8": 28,
93
+ "9": 29,
94
+ ":": 30,
95
+ ";": 31,
96
+ "<": 32,
97
+ "</s>": 2,
98
+ "<mask>": 4,
99
+ "<pad>": 1,
100
+ "<s>": 0,
101
+ "<unk>": 3,
102
+ "=": 33,
103
+ "=[": 361,
104
+ ">": 34,
105
+ "?": 35,
106
+ "@": 36,
107
+ "@@": 266,
108
+ "@@]": 329,
109
+ "@@](": 358,
110
+ "@@](=": 394,
111
+ "@@]([": 517,
112
+ "@]": 326,
113
+ "@](": 354,
114
+ "@](=": 404,
115
+ "@]([": 508,
116
+ "A": 37,
117
+ "B": 38,
118
+ "Br": 299,
119
+ "BrCC": 748,
120
+ "BrCCC": 749,
121
+ "BrCc": 642,
122
+ "Brc": 458,
123
+ "C": 39,
124
+ "CBr": 509,
125
+ "CC": 262,
126
+ "CCBr": 613,
127
+ "CCC": 271,
128
+ "CCCBr": 729,
129
+ "CCCC": 285,
130
+ "CCCCC": 305,
131
+ "CCCCCC": 365,
132
+ "CCCCCCC": 433,
133
+ "CCCCCCCC": 693,
134
+ "CCCCCCCCCCC": 670,
135
+ "CCCCCCN": 736,
136
+ "CCCCCCNC": 639,
137
+ "CCCCCCO": 694,
138
+ "CCCCCCS": 695,
139
+ "CCCCCN": 494,
140
+ "CCCCCNC": 529,
141
+ "CCCCCO": 604,
142
+ "CCCCCOC": 751,
143
+ "CCCCCOc": 752,
144
+ "CCCCCS": 632,
145
+ "CCCCCSc": 753,
146
+ "CCCCCc": 617,
147
+ "CCCCCn": 565,
148
+ "CCCCN": 369,
149
+ "CCCCNC": 429,
150
+ "CCCCNS": 758,
151
+ "CCCCNc": 582,
152
+ "CCCCO": 414,
153
+ "CCCCOC": 535,
154
+ "CCCCOCC": 638,
155
+ "CCCCOCc": 738,
156
+ "CCCCOc": 492,
157
+ "CCCCS": 485,
158
+ "CCCCSC": 737,
159
+ "CCCCSc": 577,
160
+ "CCCCc": 450,
161
+ "CCCCl": 558,
162
+ "CCCCn": 444,
163
+ "CCCF": 555,
164
+ "CCCN": 310,
165
+ "CCCNC": 370,
166
+ "CCCNCC": 704,
167
+ "CCCNCc": 730,
168
+ "CCCNS": 556,
169
+ "CCCNc": 453,
170
+ "CCCO": 325,
171
+ "CCCOC": 428,
172
+ "CCCOCC": 526,
173
+ "CCCOCc": 674,
174
+ "CCCOc": 390,
175
+ "CCCS": 400,
176
+ "CCCSC": 520,
177
+ "CCCSCC": 505,
178
+ "CCCSCc": 690,
179
+ "CCCSc": 488,
180
+ "CCCc": 344,
181
+ "CCCl": 479,
182
+ "CCCn": 376,
183
+ "CCN": 280,
184
+ "CCNC": 332,
185
+ "CCNCC": 527,
186
+ "CCNCc": 545,
187
+ "CCNS": 425,
188
+ "CCNc": 417,
189
+ "CCO": 289,
190
+ "CCOC": 313,
191
+ "CCOCC": 315,
192
+ "CCOCCC": 579,
193
+ "CCOCCCC": 603,
194
+ "CCOCCCN": 698,
195
+ "CCOCCCNC": 568,
196
+ "CCOCCCNc": 699,
197
+ "CCOCCCc": 672,
198
+ "CCOCCCn": 740,
199
+ "CCOCCN": 501,
200
+ "CCOCCNC": 589,
201
+ "CCOCCNc": 706,
202
+ "CCOCCO": 559,
203
+ "CCOCCOC": 671,
204
+ "CCOCCOCC": 739,
205
+ "CCOCCOCCOCC": 765,
206
+ "CCOCCOCc": 700,
207
+ "CCOCCOc": 631,
208
+ "CCOCCS": 605,
209
+ "CCOCCSc": 754,
210
+ "CCOCCn": 606,
211
+ "CCOCc": 473,
212
+ "CCONC": 583,
213
+ "CCOP": 650,
214
+ "CCOc": 319,
215
+ "CCS": 317,
216
+ "CCSC": 395,
217
+ "CCSCC": 399,
218
+ "CCSCCC": 607,
219
+ "CCSCCOC": 708,
220
+ "CCSCCOc": 755,
221
+ "CCSCc": 538,
222
+ "CCSS": 707,
223
+ "CCSc": 379,
224
+ "CCc": 294,
225
+ "CCl": 416,
226
+ "CCn": 331,
227
+ "CH": 680,
228
+ "CI": 657,
229
+ "CN": 286,
230
+ "CNC": 300,
231
+ "CNCC": 567,
232
+ "CNCCC": 696,
233
+ "CNCCN": 587,
234
+ "CNCCc": 564,
235
+ "CNCc": 463,
236
+ "CNN": 586,
237
+ "CNS": 393,
238
+ "CNc": 359,
239
+ "CNn": 578,
240
+ "CO": 275,
241
+ "COC": 307,
242
+ "COCC": 382,
243
+ "COCCC": 477,
244
+ "COCCCC": 533,
245
+ "COCCCCC": 692,
246
+ "COCCCCN": 731,
247
+ "COCCCN": 495,
248
+ "COCCCNC": 482,
249
+ "COCCCNc": 630,
250
+ "COCCCOC": 637,
251
+ "COCCCOc": 626,
252
+ "COCCCS": 732,
253
+ "COCCCn": 566,
254
+ "COCCN": 397,
255
+ "COCCNC": 442,
256
+ "COCCNCc": 759,
257
+ "COCCNS": 623,
258
+ "COCCNc": 608,
259
+ "COCCO": 461,
260
+ "COCCOC": 542,
261
+ "COCCOCC": 614,
262
+ "COCCOCCN": 763,
263
+ "COCCOCCNC": 734,
264
+ "COCCOc": 468,
265
+ "COCCS": 629,
266
+ "COCCSCc": 733,
267
+ "COCCSc": 615,
268
+ "COCCc": 518,
269
+ "COCCn": 430,
270
+ "COCO": 585,
271
+ "COCOc": 669,
272
+ "COCc": 386,
273
+ "CON": 500,
274
+ "CONC": 540,
275
+ "COP": 647,
276
+ "COS": 691,
277
+ "COc": 282,
278
+ "COn": 636,
279
+ "CS": 297,
280
+ "CSC": 375,
281
+ "CSCC": 407,
282
+ "CSCCC": 515,
283
+ "CSCCCC": 745,
284
+ "CSCCCCNC": 651,
285
+ "CSCCCN": 627,
286
+ "CSCCCNC": 619,
287
+ "CSCCCNc": 747,
288
+ "CSCCN": 536,
289
+ "CSCCNC": 596,
290
+ "CSCCO": 496,
291
+ "CSCCOC": 746,
292
+ "CSCCOc": 702,
293
+ "CSCCS": 481,
294
+ "CSCCSC": 703,
295
+ "CSCCc": 640,
296
+ "CSCCn": 641,
297
+ "CSCN": 491,
298
+ "CSCc": 419,
299
+ "CSc": 327,
300
+ "Cc": 267,
301
+ "Cl": 278,
302
+ "ClC": 570,
303
+ "ClCC": 648,
304
+ "ClCCCSc": 735,
305
+ "ClCc": 616,
306
+ "Clc": 418,
307
+ "Cn": 308,
308
+ "D": 40,
309
+ "E": 41,
310
+ "F": 42,
311
+ "FC": 432,
312
+ "FCCC": 715,
313
+ "Fc": 398,
314
+ "G": 43,
315
+ "H": 44,
316
+ "I": 45,
317
+ "IC": 716,
318
+ "Ic": 717,
319
+ "J": 46,
320
+ "K": 47,
321
+ "L": 48,
322
+ "M": 49,
323
+ "N": 50,
324
+ "NC": 268,
325
+ "NCC": 322,
326
+ "NCCC": 366,
327
+ "NCCCC": 466,
328
+ "NCCCCC": 592,
329
+ "NCCCCCC": 658,
330
+ "NCCCCN": 628,
331
+ "NCCCCOc": 678,
332
+ "NCCCCl": 677,
333
+ "NCCCCn": 552,
334
+ "NCCCN": 456,
335
+ "NCCCNC": 569,
336
+ "NCCCNS": 643,
337
+ "NCCCNc": 654,
338
+ "NCCCO": 502,
339
+ "NCCCOC": 560,
340
+ "NCCCOCC": 675,
341
+ "NCCCOc": 591,
342
+ "NCCCS": 590,
343
+ "NCCCSC": 757,
344
+ "NCCCSc": 580,
345
+ "NCCCc": 449,
346
+ "NCCCn": 447,
347
+ "NCCN": 411,
348
+ "NCCNC": 422,
349
+ "NCCNS": 609,
350
+ "NCCNc": 478,
351
+ "NCCO": 487,
352
+ "NCCOC": 534,
353
+ "NCCOCC": 546,
354
+ "NCCOCCO": 764,
355
+ "NCCOCc": 660,
356
+ "NCCOc": 443,
357
+ "NCCS": 459,
358
+ "NCCSC": 633,
359
+ "NCCSCC": 659,
360
+ "NCCSCc": 711,
361
+ "NCCSc": 525,
362
+ "NCCc": 357,
363
+ "NCCn": 446,
364
+ "NCN": 576,
365
+ "NCc": 302,
366
+ "NH": 273,
367
+ "NN": 364,
368
+ "NNC": 352,
369
+ "NNN": 756,
370
+ "NNS": 547,
371
+ "NNc": 409,
372
+ "NO": 436,
373
+ "NOC": 584,
374
+ "NOCC": 597,
375
+ "NOCCc": 762,
376
+ "NOCc": 549,
377
+ "NOc": 718,
378
+ "NS": 356,
379
+ "NSC": 681,
380
+ "Nc": 277,
381
+ "Nn": 455,
382
+ "O": 51,
383
+ "OC": 279,
384
+ "OCC": 323,
385
+ "OCCBr": 710,
386
+ "OCCC": 426,
387
+ "OCCCC": 512,
388
+ "OCCCCC": 661,
389
+ "OCCCCN": 673,
390
+ "OCCCCn": 721,
391
+ "OCCCN": 548,
392
+ "OCCCNC": 553,
393
+ "OCCCNc": 760,
394
+ "OCCCO": 420,
395
+ "OCCCOc": 624,
396
+ "OCCCS": 686,
397
+ "OCCCSC": 761,
398
+ "OCCCSc": 656,
399
+ "OCCCc": 550,
400
+ "OCCCl": 655,
401
+ "OCCCn": 598,
402
+ "OCCF": 709,
403
+ "OCCN": 439,
404
+ "OCCNC": 486,
405
+ "OCCNS": 662,
406
+ "OCCNc": 557,
407
+ "OCCO": 360,
408
+ "OCCOC": 573,
409
+ "OCCOCC": 684,
410
+ "OCCOCCOCCO": 653,
411
+ "OCCOCCOCCOCCO": 766,
412
+ "OCCOCCS": 722,
413
+ "OCCOc": 498,
414
+ "OCCS": 561,
415
+ "OCCSC": 720,
416
+ "OCCSCC": 685,
417
+ "OCCSCc": 663,
418
+ "OCCSc": 593,
419
+ "OCCc": 472,
420
+ "OCCn": 506,
421
+ "OCN": 601,
422
+ "OCO": 353,
423
+ "OCOC": 523,
424
+ "OCc": 349,
425
+ "OCn": 595,
426
+ "OH": 682,
427
+ "ON": 519,
428
+ "ONC": 719,
429
+ "OP": 634,
430
+ "OS": 474,
431
+ "Oc": 312,
432
+ "On": 683,
433
+ "P": 52,
434
+ "Q": 53,
435
+ "R": 54,
436
+ "S": 55,
437
+ "SC": 348,
438
+ "SCC": 346,
439
+ "SCCC": 460,
440
+ "SCCCC": 635,
441
+ "SCCCO": 725,
442
+ "SCCCOc": 667,
443
+ "SCCCS": 610,
444
+ "SCCCc": 688,
445
+ "SCCN": 503,
446
+ "SCCNC": 666,
447
+ "SCCO": 581,
448
+ "SCCOC": 724,
449
+ "SCCOc": 554,
450
+ "SCCS": 562,
451
+ "SCCSc": 726,
452
+ "SCCc": 483,
453
+ "SCCn": 645,
454
+ "SCN": 664,
455
+ "SCc": 378,
456
+ "SCn": 665,
457
+ "SH": 723,
458
+ "SN": 687,
459
+ "Sc": 345,
460
+ "T": 56,
461
+ "U": 57,
462
+ "V": 58,
463
+ "W": 59,
464
+ "X": 60,
465
+ "Y": 61,
466
+ "Z": 62,
467
+ "[": 63,
468
+ "\\": 64,
469
+ "\\[": 493,
470
+ "]": 65,
471
+ "](": 265,
472
+ "](/": 513,
473
+ "](/[": 689,
474
+ "]([": 318,
475
+ "]/": 594,
476
+ "][": 625,
477
+ "^": 66,
478
+ "_": 67,
479
+ "`": 68,
480
+ "a": 69,
481
+ "b": 70,
482
+ "c": 71,
483
+ "cc": 261,
484
+ "ccc": 264,
485
+ "cccc": 276,
486
+ "ccccc": 269,
487
+ "ccccn": 334,
488
+ "cccn": 343,
489
+ "cccnc": 321,
490
+ "cccnn": 499,
491
+ "ccco": 328,
492
+ "cccs": 320,
493
+ "ccn": 351,
494
+ "ccnc": 347,
495
+ "ccncc": 342,
496
+ "ccncn": 524,
497
+ "ccnn": 392,
498
+ "ccnnc": 612,
499
+ "ccno": 511,
500
+ "ccoc": 387,
501
+ "ccon": 451,
502
+ "ccs": 599,
503
+ "ccsc": 350,
504
+ "cn": 311,
505
+ "cnc": 316,
506
+ "cncc": 363,
507
+ "cnccc": 437,
508
+ "cnccn": 401,
509
+ "cncn": 380,
510
+ "cncnc": 476,
511
+ "cnco": 620,
512
+ "cncs": 575,
513
+ "cnn": 330,
514
+ "cnnc": 406,
515
+ "cnnn": 421,
516
+ "cnns": 621,
517
+ "cnoc": 574,
518
+ "cnsc": 705,
519
+ "cnsn": 652,
520
+ "co": 484,
521
+ "coc": 405,
522
+ "conc": 668,
523
+ "cs": 341,
524
+ "csc": 340,
525
+ "cscc": 434,
526
+ "cscn": 445,
527
+ "csnn": 507,
528
+ "d": 72,
529
+ "e": 73,
530
+ "f": 74,
531
+ "g": 75,
532
+ "h": 76,
533
+ "i": 77,
534
+ "j": 78,
535
+ "k": 79,
536
+ "l": 80,
537
+ "m": 81,
538
+ "n": 82,
539
+ "nH": 290,
540
+ "nc": 270,
541
+ "ncc": 298,
542
+ "nccc": 385,
543
+ "ncccc": 362,
544
+ "ncccn": 391,
545
+ "nccn": 389,
546
+ "nccnc": 431,
547
+ "ncco": 537,
548
+ "nccs": 373,
549
+ "ncn": 371,
550
+ "ncnc": 355,
551
+ "ncncc": 544,
552
+ "ncnn": 415,
553
+ "ncoc": 475,
554
+ "ncon": 532,
555
+ "ncsc": 454,
556
+ "nn": 291,
557
+ "nnc": 301,
558
+ "nncc": 528,
559
+ "nnccc": 741,
560
+ "nncn": 412,
561
+ "nnco": 539,
562
+ "nncs": 462,
563
+ "nnn": 408,
564
+ "nnnc": 410,
565
+ "nnnn": 384,
566
+ "nnsc": 480,
567
+ "no": 336,
568
+ "noc": 338,
569
+ "nonc": 457,
570
+ "ns": 440,
571
+ "nsc": 441,
572
+ "nscc": 676,
573
+ "nsnc": 471,
574
+ "o": 83,
575
+ "oc": 303,
576
+ "occ": 563,
577
+ "occc": 423,
578
+ "ocnc": 470,
579
+ "on": 367,
580
+ "onc": 424,
581
+ "oncc": 646,
582
+ "p": 84,
583
+ "q": 85,
584
+ "r": 86,
585
+ "s": 87,
586
+ "sc": 296,
587
+ "scc": 464,
588
+ "sccc": 377,
589
+ "sccn": 465,
590
+ "scnc": 452,
591
+ "sn": 611,
592
+ "snc": 516,
593
+ "snnc": 541,
594
+ "ssc": 727,
595
+ "ssnc": 728,
596
+ "t": 88,
597
+ "u": 89,
598
+ "v": 90,
599
+ "w": 91,
600
+ "x": 92,
601
+ "y": 93,
602
+ "z": 94,
603
+ "{": 95,
604
+ "|": 96,
605
+ "}": 97,
606
+ "~": 98,
607
+ "¡": 99,
608
+ "¢": 100,
609
+ "£": 101,
610
+ "¤": 102,
611
+ "¥": 103,
612
+ "¦": 104,
613
+ "§": 105,
614
+ "¨": 106,
615
+ "©": 107,
616
+ "ª": 108,
617
+ "«": 109,
618
+ "¬": 110,
619
+ "®": 111,
620
+ "¯": 112,
621
+ "°": 113,
622
+ "±": 114,
623
+ "²": 115,
624
+ "³": 116,
625
+ "´": 117,
626
+ "µ": 118,
627
+ "¶": 119,
628
+ "·": 120,
629
+ "¸": 121,
630
+ "¹": 122,
631
+ "º": 123,
632
+ "»": 124,
633
+ "¼": 125,
634
+ "½": 126,
635
+ "¾": 127,
636
+ "¿": 128,
637
+ "À": 129,
638
+ "Á": 130,
639
+ "Â": 131,
640
+ "Ã": 132,
641
+ "Ä": 133,
642
+ "Å": 134,
643
+ "Æ": 135,
644
+ "Ç": 136,
645
+ "È": 137,
646
+ "É": 138,
647
+ "Ê": 139,
648
+ "Ë": 140,
649
+ "Ì": 141,
650
+ "Í": 142,
651
+ "Î": 143,
652
+ "Ï": 144,
653
+ "Ð": 145,
654
+ "Ñ": 146,
655
+ "Ò": 147,
656
+ "Ó": 148,
657
+ "Ô": 149,
658
+ "Õ": 150,
659
+ "Ö": 151,
660
+ "×": 152,
661
+ "Ø": 153,
662
+ "Ù": 154,
663
+ "Ú": 155,
664
+ "Û": 156,
665
+ "Ü": 157,
666
+ "Ý": 158,
667
+ "Þ": 159,
668
+ "ß": 160,
669
+ "à": 161,
670
+ "á": 162,
671
+ "â": 163,
672
+ "ã": 164,
673
+ "ä": 165,
674
+ "å": 166,
675
+ "æ": 167,
676
+ "ç": 168,
677
+ "è": 169,
678
+ "é": 170,
679
+ "ê": 171,
680
+ "ë": 172,
681
+ "ì": 173,
682
+ "í": 174,
683
+ "î": 175,
684
+ "ï": 176,
685
+ "ð": 177,
686
+ "ñ": 178,
687
+ "ò": 179,
688
+ "ó": 180,
689
+ "ô": 181,
690
+ "õ": 182,
691
+ "ö": 183,
692
+ "÷": 184,
693
+ "ø": 185,
694
+ "ù": 186,
695
+ "ú": 187,
696
+ "û": 188,
697
+ "ü": 189,
698
+ "ý": 190,
699
+ "þ": 191,
700
+ "ÿ": 192,
701
+ "Ā": 193,
702
+ "ā": 194,
703
+ "Ă": 195,
704
+ "ă": 196,
705
+ "Ą": 197,
706
+ "ą": 198,
707
+ "Ć": 199,
708
+ "ć": 200,
709
+ "Ĉ": 201,
710
+ "ĉ": 202,
711
+ "Ċ": 203,
712
+ "ċ": 204,
713
+ "Č": 205,
714
+ "č": 206,
715
+ "Ď": 207,
716
+ "ď": 208,
717
+ "Đ": 209,
718
+ "đ": 210,
719
+ "Ē": 211,
720
+ "ē": 212,
721
+ "Ĕ": 213,
722
+ "ĕ": 214,
723
+ "Ė": 215,
724
+ "ė": 216,
725
+ "Ę": 217,
726
+ "ę": 218,
727
+ "Ě": 219,
728
+ "ě": 220,
729
+ "Ĝ": 221,
730
+ "ĝ": 222,
731
+ "Ğ": 223,
732
+ "ğ": 224,
733
+ "Ġ": 225,
734
+ "ġ": 226,
735
+ "Ģ": 227,
736
+ "ģ": 228,
737
+ "Ĥ": 229,
738
+ "ĥ": 230,
739
+ "Ħ": 231,
740
+ "ħ": 232,
741
+ "Ĩ": 233,
742
+ "ĩ": 234,
743
+ "Ī": 235,
744
+ "ī": 236,
745
+ "Ĭ": 237,
746
+ "ĭ": 238,
747
+ "Į": 239,
748
+ "į": 240,
749
+ "İ": 241,
750
+ "ı": 242,
751
+ "Ĳ": 243,
752
+ "ĳ": 244,
753
+ "Ĵ": 245,
754
+ "ĵ": 246,
755
+ "Ķ": 247,
756
+ "ķ": 248,
757
+ "ĸ": 249,
758
+ "Ĺ": 250,
759
+ "ĺ": 251,
760
+ "Ļ": 252,
761
+ "ļ": 253,
762
+ "Ľ": 254,
763
+ "ľ": 255,
764
+ "Ŀ": 256,
765
+ "ŀ": 257,
766
+ "Ł": 258,
767
+ "ł": 259,
768
+ "Ń": 260
769
+ }