Eric2333 committed on
Commit
7f284e6
1 Parent(s): 810eba4

Delete tokenizer_bpe_1024

Browse files
tokenizer_bpe_1024/merges.txt DELETED
@@ -1,768 +0,0 @@
1
- #version: 0.2
2
- G G
3
- A A
4
- G C
5
- U U
6
- A C
7
- G U
8
- A U
9
- C C
10
- G AA
11
- C U
12
- G A
13
- A GC
14
- GG U
15
- GG C
16
- G AC
17
- G UU
18
- G AU
19
- A GG
20
- AA U
21
- A UU
22
- C GG
23
- C GC
24
- A GU
25
- AC U
26
- C UU
27
- CC U
28
- GC U
29
- C AA
30
- C AC
31
- GG GG
32
- GU AA
33
- GG AA
34
- A GA
35
- UU U
36
- GG GC
37
- AU GC
38
- GU GC
39
- AC GG
40
- GU C
41
- AGC U
42
- GAC U
43
- GA GG
44
- A GAU
45
- A GAA
46
- AU C
47
- GA GC
48
- AA CU
49
- AA GC
50
- GA GU
51
- A GUU
52
- GAA U
53
- A GGC
54
- C GU
55
- GAA AGC
56
- GG CU
57
- A GGU
58
- GG CC
59
- AAU AC
60
- C AGC
61
- AUU U
62
- C AU
63
- AA UU
64
- GG GU
65
- GA UU
66
- GG UU
67
- CU GC
68
- GA GGC
69
- GG AC
70
- GU GU
71
- AU CC
72
- CGC U
73
- AA AC
74
- GGU GAA
75
- CC C
76
- GG AU
77
- GUU U
78
- GU GAA
79
- GAA GGC
80
- GC GC
81
- GU CC
82
- CGG CU
83
- GC AC
84
- CUU U
85
- AA CAC
86
- AA C
87
- C AGU
88
- AA GUC
89
- GU AGC
90
- CC UU
91
- C GGU
92
- AA AA
93
- GA GAC
94
- GGAA UU
95
- GU CU
96
- CC GC
97
- GAA GAA
98
- AGC AGU
99
- A GAC
100
- AC CU
101
- GAC GCU
102
- A GACU
103
- AC GU
104
- GGGC GUAA
105
- UU UU
106
- CC CU
107
- C AGG
108
- AU CU
109
- GU GGGG
110
- CC AC
111
- GGU AA
112
- GGC GAAGGC
113
- GG AGG
114
- GGC UU
115
- CCU ACGG
116
- GA GAGG
117
- CGC GU
118
- GGUGAA AUGC
119
- GG AGC
120
- GG GAA
121
- GGC GGC
122
- GAA CGCU
123
- AC UU
124
- GU GA
125
- AAU AUU
126
- C GAU
127
- GAC GGU
128
- CC CC
129
- GAGGC AGCAGU
130
- AUGC AAGUC
131
- AU AA
132
- GC UU
133
- GUGC CAGC
134
- C GGC
135
- AAU GGGC
136
- CGC GGU
137
- GC CU
138
- C AUU
139
- AC CC
140
- CU CU
141
- CGGCU AACU
142
- GUGGGG AGC
143
- GG GAU
144
- GAACGCU GGCGGC
145
- CCUACGG GAGGCAGCAGU
146
- AC AC
147
- C ACU
148
- GA GGU
149
- GUU GUAA
150
- GAU GC
151
- GUAGC GGUGAAAUGC
152
- C GAA
153
- GG AAU
154
- AA GU
155
- AU AC
156
- CC AGC
157
- GGU CU
158
- GUGCCAGC AGC
159
- AU GU
160
- GAAAGC GUGGGGAGC
161
- UU CGG
162
- CAA GGC
163
- AAGC GUU
164
- AGC UU
165
- GAA CGG
166
- AAAC AGG
167
- CUU CGG
168
- C AAU
169
- AA CGC
170
- AA CC
171
- C GAC
172
- AC GGU
173
- GA GGAA
174
- GUGA GUAA
175
- GGC GG
176
- GUGCCAGCAGC CGCGGU
177
- GG CCU
178
- ACU GC
179
- GU AGGC
180
- GG GCU
181
- CUU UU
182
- CC GU
183
- AA AGG
184
- AACAC AUGCAAGUC
185
- GU AGAU
186
- AU AU
187
- AGACU CCUACGGGAGGCAGCAGU
188
- GG GACU
189
- GG GUU
190
- GU AGA
191
- GAA GC
192
- GGGG AAUAUU
193
- C AUGC
194
- UU GC
195
- GG UUU
196
- GG AUU
197
- GG GGU
198
- ACU GGGCGUAA
199
- CCU GC
200
- AGAA U
201
- AGCU AGUU
202
- CU GAC
203
- GG AUUU
204
- CGG AAUU
205
- C GUU
206
- GA GAA
207
- CU GU
208
- GAGC GUU
209
- AUU AGAU
210
- GAAAGCGUGGGGAGC AAACAGG
211
- CCU GGU
212
- ACU GACGCU
213
- AGA GU
214
- CU CC
215
- AU GAU
216
- GAC GAU
217
- AC C
218
- GGCC UUCGG
219
- AA AU
220
- GC AU
221
- AA CUU
222
- GAA AC
223
- GAACGCUGGCGGC GUGC
224
- AGG GUGC
225
- CU GAU
226
- AAUAC CGC
227
- CAC ACU
228
- AGG AA
229
- AC UUU
230
- CGG AU
231
- GGAA CU
232
- GAC GC
233
- ACGG CCC
234
- AUU UU
235
- CU CAA
236
- GGCGG ACGG
237
- AGG AGG
238
- CU GUU
239
- GG ACU
240
- GA GAU
241
- AA CCU
242
- GG AGU
243
- GGGG GAU
244
- GGCCUUCGG GUUGUAA
245
- GA GUU
246
- GC AA
247
- AU CGG
248
- AGUU U
249
- CAGU GGCGAAGGC
250
- GU AGU
251
- GAC CU
252
- GU AGG
253
- AC CAAGGC
254
- AA GUU
255
- GU CGG
256
- GAUGC AGC
257
- GU GAGU
258
- C AUC
259
- GAU GAA
260
- AGG CCU
261
- GC AAGC
262
- C GAGU
263
- GUGAGUAA CAC
264
- GGUCU GAGAGG
265
- CGGAAUU ACUGGGCGUAA
266
- CAA GC
267
- CGGCUAACU CC
268
- GGC GC
269
- AAUGGGC GAAAGC
270
- AU GAC
271
- U ACGU
272
- CC CGG
273
- AA ACU
274
- GAA AUGC
275
- AU GAA
276
- CGCGU GAGU
277
- GGGACU GAGAC
278
- CU AAUAC
279
- GA GCU
280
- AU CAA
281
- U AC
282
- CU C
283
- AUUAGAU AC
284
- ACGGU CC
285
- AAU GC
286
- ACGU G
287
- GGGU AGC
288
- AGA GC
289
- AC GC
290
- CGG CCAC
291
- GGCU AACU
292
- AUU GGGCGUAA
293
- AGA UU
294
- AC CGC
295
- GG GAC
296
- GAA ACU
297
- CGGU GGCGAAGGC
298
- AGG UU
299
- C GAGC
300
- GUGCCAGCAGCCGCGGU AAUAC
301
- GU GAU
302
- GU AGGU
303
- AU AUU
304
- AUU AGCUAGUU
305
- AA AGC
306
- GGC GAACGG
307
- GUU UU
308
- AGAA UU
309
- AA GAA
310
- GU AC
311
- CC UUU
312
- GAA CAGG
313
- AGCU GGUCUGAGAGG
314
- GGAACU GAGAC
315
- UU AACACAUGCAAGUC
316
- GG GUUU
317
- AAUGGGC GCAAGC
318
- GUAGCGGUGAAAUGC GUAGAU
319
- GAU ACU
320
- AGG CU
321
- CC AU
322
- GGU GC
323
- ACGGCCC AGACUCCUACGGGAGGCAGCAGU
324
- CC CAC
325
- AGU C
326
- AGGAGG AACAC
327
- AC CAA
328
- GAA CGC
329
- GU CAA
330
- CAGC CACACU
331
- GUAA CU
332
- GAGGC GC
333
- CGG CCU
334
- AAGC AC
335
- GG GGC
336
- CCC GGU
337
- GGGGAAUAUU GCAC
338
- CGC GUGU
339
- CU GAA
340
- GGAACUGAGAC ACGGUCC
341
- AAU GGGG
342
- GUU GGU
343
- GC CC
344
- GGUGAA AUU
345
- AAU ACGG
346
- GA UUU
347
- AGAA GAA
348
- GGGC UU
349
- AU CCU
350
- GAA AGU
351
- AC CUU
352
- GU GAAAGC
353
- GC AGGC
354
- GU AU
355
- GU CAC
356
- GU GGU
357
- GAC GAACGCUGGCGGCGUGC
358
- GU GAC
359
- AU CAC
360
- GGCU CAA
361
- CGGAAUUACUGGGCGUAA AGC
362
- GCU CAA
363
- GG GA
364
- GUGAA AUCC
365
- AC AUU
366
- AU CUU
367
- AGG GAAU
368
- AA AUU
369
- C AGAA
370
- CUGAU CCAGC
371
- AGAU AUC
372
- GUU GC
373
- AUC GUAA
374
- GG GGUAA
375
- GGAAUU CCUGGU
376
- GGAA AC
377
- GUAGA GAU
378
- AA AAU
379
- CC CUU
380
- GAC ACU
381
- GACGGU ACCU
382
- C GUAA
383
- GU GGC
384
- GCU GAA
385
- GG GUAA
386
- C GAAU
387
- GUU GUU
388
- GCU GC
389
- GG GAAU
390
- CU GAGAGG
391
- AGA GGU
392
- GA GA
393
- CGGCUAACUCC GUGCCAGCAGCCGCGGU
394
- AUCC GGAUUU
395
- GCGC GUAGGC
396
- CC AA
397
- AC AA
398
- AAUU UU
399
- CC CAA
400
- GAGGC AC
401
- GUGAGUAACAC GU
402
- AAGCGUU GUCC
403
- GAA C
404
- CAC CAGUGGCGAAGGC
405
- AGA GG
406
- GU GCU
407
- CGG AAU
408
- AC AGG
409
- GGU CUUCGG
410
- CAC CU
411
- AU AGAU
412
- C AGUU
413
- GAGG AGC
414
- CGG AA
415
- GAUU GC
416
- AGGCCU AACACAUGCAAGUC
417
- CC GGU
418
- CC CGC
419
- GCU CGU
420
- CAC GGCUAACU
421
- AU GGU
422
- AUU GAACGCUGGCGGC
423
- GGGGAAUAUU GGAC
424
- UU CU
425
- UU GCU
426
- ACU CU
427
- AU AGC
428
- GAGG AAUAUU
429
- AAGC AU
430
- GG AUC
431
- AGG GAAGAA
432
- AGAAGAA GCAC
433
- GCU AAUACCGC
434
- AC GGGC
435
- GGGACUGAGAC ACGGCCCAGACUCCUACGGGAGGCAGCAGU
436
- C A
437
- CGC AA
438
- GUAGCGGUGAAAUGC GC
439
- AC GAU
440
- GG GAUU
441
- AGCUU GUUGGU
442
- AAU CU
443
- CGC GUGC
444
- CAUGC CGCGUGU
445
- GU CUU
446
- GGUGAAAUU CGU
447
- GUGAGU AAU
448
- GA GGUAA
449
- GGAACUGAGACACGGUCC AGACUCCUACGGGAGGCAGCAGU
450
- CU GAUGCAGC
451
- AAU AA
452
- CC CCU
453
- GAA AGCU
454
- AACGC CGCGUGAGU
455
- GGAGG AACAC
456
- AGG GAU
457
- AGAU AUU
458
- CC GGGG
459
- AGC AC
460
- CGGCUAACU AC
461
- GGCUU ACCAAGGC
462
- CAAGGC GACGAU
463
- GGGUUU AAAGG
464
- CU GGU
465
- C AGA
466
- GU CGC
467
- CGGCUAACU ACGUG
468
- GAAU AA
469
- GUAGA GGUGAAAUUCGU
470
- GC CUU
471
- GAC UU
472
- CCU AGU
473
- AA ACGG
474
- GA GUGC
475
- GUU CU
476
- CGGCUAACUCCGUGCCAGCAGCCGCGGU AAUACGG
477
- GGU GGGG
478
- CCC AGU
479
- CGGCCAC ACU
480
- AGG GAA
481
- AGG GGAGC
482
- AACU GACGCU
483
- GGGUAGC CGGCCU
484
- CUUU GAACGC
485
- GGGG AU
486
- AUC AAU
487
- GUGAA UUGC
488
- AA CGU
489
- AGGGAAU CUU
490
- UACGU AGG
491
- AGAUAUC AGGAGGAACAC
492
- GAGGAAUAUU GGU
493
- AGU CC
494
- CU AU
495
- AGC AU
496
- GGGCU CAA
497
- AGG GC
498
- GGAA ACU
499
- AA CAA
500
- C AGGU
501
- AC GUU
502
- AA UUU
503
- AGA UUU
504
- AAUGGGCGAAAGC CUGAC
505
- AU CGC
506
- GAAAGC GU
507
- AC AAU
508
- AGG GG
509
- GA GUAA
510
- GAGGU GC
511
- AAU CGGAAUUACUGGGCGUAAAGC
512
- CGG UU
513
- GAGCGUU GUCC
514
- GAU GAAGAA
515
- GC AGC
516
- GA GAGU
517
- GACGAACGCUGGCGGCGUGC UUAACACAUGCAAGUC
518
- GU CCU
519
- GAAAUGC GAU
520
- AGCUAGUU GGU
521
- GAC GUU
522
- GAA UU
523
- GACU GC
524
- GCU GCAU
525
- AGA GGAA
526
- AU ACU
527
- AUC AGCUUGUUGGU
528
- GAU CU
529
- CGG AUU
530
- AAU CUU
531
- GGAAUU CC
532
- CUAAUAC AUGCAAGUC
533
- GUU AA
534
- C AGCU
535
- CGAC CUGAGAGG
536
- GCUGAA CUU
537
- GAAGAA GGCCUUCGGGUUGUAA
538
- GAUUGC GAAGGC
539
- CC CGU
540
- GG GAGC
541
- GU AAU
542
- GACGGU AC
543
- GAC GGGUAGCCGGCCU
544
- AGC GC
545
- GCUCGU AGGC
546
- GGCC UU
547
- CC GAA
548
- GUGAA GAA
549
- GGAAUU CCCGGU
550
- CC AGU
551
- AUU GUAA
552
- CGGCU AACUU
553
- CAA UU
554
- GGAAUU AUUGGGCGUAA
555
- GAAAGCGUGGGGAGC GAACAGG
556
- CC GG
557
- CC CAU
558
- C GAGG
559
- AGG AC
560
- AA AGU
561
- CC GAU
562
- CAC CAA
563
- AGC CACGGCUAACU
564
- UUU CU
565
- GGC GGU
566
- GGAAU GC
567
- GAAAC CCU
568
- AA GUCC
569
- C GUGC
570
- GAAAGCGUGGGGAGCAAACAGG AUUAGAUAC
571
- AGCUGGUCUGAGAGG AUGAU
572
- AGA GGGG
573
- AU GGUU
574
- C GAUU
575
- AUUAGCUAGUU GGU
576
- AUGC CU
577
- AGA GUGC
578
- GAA AA
579
- GAU GAACGCUGGCGGCGUGC
580
- GGU AAC
581
- AC GAC
582
- GUC AUU
583
- AAUAC CGGAU
584
- GUGU AGGC
585
- GA GGGG
586
- AU AAU
587
- CGCGU GAGG
588
- AGCU CGU
589
- A G
590
- CACU GGGCGUAA
591
- ACU GGGU
592
- GAAU CAUC
593
- CUU GC
594
- CAA CU
595
- C AGGC
596
- AAGC GGAGG
597
- AGG GCGCGUAGGC
598
- AAGCGUU GUU
599
- GGAA CUGC
600
- CC AUU
601
- AC CAU
602
- AA GUCU
603
- AUCCGGAUUU AUU
604
- CGAU GGCGAAGGC
605
- AC ACU
606
- GG GAGG
607
- GUGAGUAA CGCGU
608
- GAAU CUUUGAACGC
609
- CCUU UU
610
- C AGAU
611
- AGU GAA
612
- GG AGAA
613
- AACU CUGUU
614
- GGCGGACGG GUGAGUAAU
615
- GUAGAGGUGAAAUUCGU AGAUAUU
616
- AC CGG
617
- GAGAC GC
618
- GU AUU
619
- AAGCAU AUCAAU
620
- CCUGC CCUU
621
- AU GCU
622
- AGU AAU
623
- AGG GAC
624
- AUCAGCUUGUUGGU GGGGU
625
- AGU AA
626
- CCAGC CAA
627
- AGAAU AAGCAC
628
- CUCU GGGC
629
- AUC AGGU
630
- CCU AU
631
- GAU AAU
632
- AC CAC
633
- GG AUCC
634
- CGACCUGAGAGG GUGAU
635
- CGC CU
636
- C GA
637
- AC AU
638
- CUU CU
639
- GG AGA
640
- AA GCU
641
- GGAAUUCCUGGU GUAGCGGUGAAAUGCGC
642
- AGC GAAAUGCGAU
643
- GAU GUU
644
- AAACGG G
645
- AA GAC
646
- AGC ACUUU
647
- AAUGGGG GAAACCCU
648
- GU GUU
649
- AAU GGAC
650
- GGGAU AA
651
- GAC GGCCUUCGGGUUGUAA
652
- C AUUU
653
- GGU AUU
654
- C GACU
655
- GACGCU GAGGCGC
656
- AGGC UU
657
- AGCU AAUACCGC
658
- GGU CC
659
- GGGAA CUGC
660
- GUC GUAA
661
- GAA GGGG
662
- GUGU AGC
663
- AU GUU
664
- AAGCAUAUCAAU AAGCGGAGG
665
- AGC GGCGGACGG
666
- UACGU AGGGUGC
667
- GAA CU
668
- CC AGG
669
- AGU GC
670
- CCU AC
671
- GGC GAAAGC
672
- GCU CU
673
- CAC UU
674
- GGU CUU
675
- AUU GC
676
- CAUU GGGCGUAA
677
- CC CUGC
678
- GCU AGC
679
- GUU GCU
680
- AGA GAU
681
- GUC GUC
682
- CGC UU
683
- AAUGGGCGCAAGC CUGAUCCAGC
684
- GAA CC
685
- GUGAAUUGC AGAAUU
686
- GGCGAACGG GUGAGUAACAC
687
- GAAAGCU AGGGGAGC
688
- GAAUCAUC GAAUCUUUGAACGC
689
- ACU GGAA
690
- AA CGG
691
- CUAAUACAUGCAAGUC GAGC
692
- AGCUU GCU
693
- AUUAGAU ACCC
694
- GGAGC AACGCCGCGUGAGU
695
- AAUGGGCGCAAGC CUGAUGCAGC
696
- GUGAAAUCC CC
697
- AA GGU
698
- CGC GC
699
- GGUU UU
700
- GGGUUUAAAGG GUGC
701
- CGGCCAC AUU
702
- GGAA GCCU
703
- GU ACAC
704
- GGUCUUCGG AUCGUAA
705
- AUUGAACGCUGGCGGC AGGCCUAACACAUGCAAGUC
706
- GACGGGUAGCCGGCCU GAGAGG
707
- AUU CU
708
- GAA AGG
709
- CCUU CGG
710
- GG AGCU
711
- CUU GAGU
712
- CGG AGCU
713
- GAC UUU
714
- GUGCCAGC CGC
715
- GC AGU
716
- AGUU GGU
717
- AAGCAUAUCAAUAAGCGGAGG A
718
- GAAAGC CAGG
719
- GGUAA GGUAAC
720
- GG GUUGUAA
721
- ACCC GCUGAACUU
722
- ACAUU GCGC
723
- GGGG AGU
724
- AUC AGC
725
- ACUU CUUUU
726
- AGCU CU
727
- U ACGG
728
- GUAGCGGUGAAAUGC UU
729
- AA GGC
730
- CCU CU
731
- AUCAA ACAGG
732
- AGCUGGUCUGAGAGGAUGAU CAGCCACACU
733
- AU GGGG
734
- GA GAGC
735
- GGUGAAAUGC GUAGAU
736
- GA GGGC
737
- GGC AGC
738
- GU GAGG
739
- AUCGG GAGGAA
740
- AGA GCUCGUAGGC
741
- GGGG AAUUUU
742
- CAU CU
743
- GAU CCAGC
744
- GAA CGGC
745
- GGAAUU CCUAGU
746
- C GUC
747
- GGCC CU
748
- GAU GAU
749
- AUAA GACU
750
- GGCU CACU
751
- GGGG GAC
752
- AAU CUGC
753
- GAA CAC
754
- AACU GC
755
- AAUAC CC
756
- GGACU CGC
757
- CAUGCCGCGUGU GUGAAGAA
758
- GUU AC
759
- AAUU C
760
- GGC AC
761
- ACCAAGGC GACGAU
762
- CUCAA CCU
763
- CGGCUAACUCCGUGCCAGCAGCCGCGGUAAUACGG AGG
764
- AGA GAA
765
- CAA AA
766
- AAGCGUU AUCC
767
- GAACGG AAAGG
768
- GGUU UUCGG
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
tokenizer_bpe_1024/special_tokens_map.json DELETED
@@ -1,5 +0,0 @@
1
- {
2
- "bos_token": "<|endoftext|>",
3
- "eos_token": "<|endoftext|>",
4
- "unk_token": "<|endoftext|>"
5
- }
 
 
 
 
 
 
tokenizer_bpe_1024/tokenizer.json DELETED
@@ -1,1839 +0,0 @@
1
- {
2
- "version": "1.0",
3
- "truncation": null,
4
- "padding": null,
5
- "added_tokens": [
6
- {
7
- "id": 0,
8
- "content": "<|endoftext|>",
9
- "single_word": false,
10
- "lstrip": false,
11
- "rstrip": false,
12
- "normalized": true,
13
- "special": true
14
- }
15
- ],
16
- "normalizer": null,
17
- "pre_tokenizer": {
18
- "type": "ByteLevel",
19
- "add_prefix_space": false,
20
- "trim_offsets": true,
21
- "use_regex": true
22
- },
23
- "post_processor": {
24
- "type": "ByteLevel",
25
- "add_prefix_space": true,
26
- "trim_offsets": false,
27
- "use_regex": true
28
- },
29
- "decoder": {
30
- "type": "ByteLevel",
31
- "add_prefix_space": true,
32
- "trim_offsets": true,
33
- "use_regex": true
34
- },
35
- "model": {
36
- "type": "BPE",
37
- "dropout": null,
38
- "unk_token": null,
39
- "continuing_subword_prefix": "",
40
- "end_of_word_suffix": "",
41
- "fuse_unk": false,
42
- "byte_fallback": false,
43
- "vocab": {
44
- "<|endoftext|>": 0,
45
- "!": 1,
46
- "\"": 2,
47
- "#": 3,
48
- "$": 4,
49
- "%": 5,
50
- "&": 6,
51
- "'": 7,
52
- "(": 8,
53
- ")": 9,
54
- "*": 10,
55
- "+": 11,
56
- ",": 12,
57
- "-": 13,
58
- ".": 14,
59
- "/": 15,
60
- "0": 16,
61
- "1": 17,
62
- "2": 18,
63
- "3": 19,
64
- "4": 20,
65
- "5": 21,
66
- "6": 22,
67
- "7": 23,
68
- "8": 24,
69
- "9": 25,
70
- ":": 26,
71
- ";": 27,
72
- "<": 28,
73
- "=": 29,
74
- ">": 30,
75
- "?": 31,
76
- "@": 32,
77
- "A": 33,
78
- "B": 34,
79
- "C": 35,
80
- "D": 36,
81
- "E": 37,
82
- "F": 38,
83
- "G": 39,
84
- "H": 40,
85
- "I": 41,
86
- "J": 42,
87
- "K": 43,
88
- "L": 44,
89
- "M": 45,
90
- "N": 46,
91
- "O": 47,
92
- "P": 48,
93
- "Q": 49,
94
- "R": 50,
95
- "S": 51,
96
- "T": 52,
97
- "U": 53,
98
- "V": 54,
99
- "W": 55,
100
- "X": 56,
101
- "Y": 57,
102
- "Z": 58,
103
- "[": 59,
104
- "\\": 60,
105
- "]": 61,
106
- "^": 62,
107
- "_": 63,
108
- "`": 64,
109
- "a": 65,
110
- "b": 66,
111
- "c": 67,
112
- "d": 68,
113
- "e": 69,
114
- "f": 70,
115
- "g": 71,
116
- "h": 72,
117
- "i": 73,
118
- "j": 74,
119
- "k": 75,
120
- "l": 76,
121
- "m": 77,
122
- "n": 78,
123
- "o": 79,
124
- "p": 80,
125
- "q": 81,
126
- "r": 82,
127
- "s": 83,
128
- "t": 84,
129
- "u": 85,
130
- "v": 86,
131
- "w": 87,
132
- "x": 88,
133
- "y": 89,
134
- "z": 90,
135
- "{": 91,
136
- "|": 92,
137
- "}": 93,
138
- "~": 94,
139
- "¡": 95,
140
- "¢": 96,
141
- "£": 97,
142
- "¤": 98,
143
- "¥": 99,
144
- "¦": 100,
145
- "§": 101,
146
- "¨": 102,
147
- "©": 103,
148
- "ª": 104,
149
- "«": 105,
150
- "¬": 106,
151
- "®": 107,
152
- "¯": 108,
153
- "°": 109,
154
- "±": 110,
155
- "²": 111,
156
- "³": 112,
157
- "´": 113,
158
- "µ": 114,
159
- "¶": 115,
160
- "·": 116,
161
- "¸": 117,
162
- "¹": 118,
163
- "º": 119,
164
- "»": 120,
165
- "¼": 121,
166
- "½": 122,
167
- "¾": 123,
168
- "¿": 124,
169
- "À": 125,
170
- "Á": 126,
171
- "Â": 127,
172
- "Ã": 128,
173
- "Ä": 129,
174
- "Å": 130,
175
- "Æ": 131,
176
- "Ç": 132,
177
- "È": 133,
178
- "É": 134,
179
- "Ê": 135,
180
- "Ë": 136,
181
- "Ì": 137,
182
- "Í": 138,
183
- "Î": 139,
184
- "Ï": 140,
185
- "Ð": 141,
186
- "Ñ": 142,
187
- "Ò": 143,
188
- "Ó": 144,
189
- "Ô": 145,
190
- "Õ": 146,
191
- "Ö": 147,
192
- "×": 148,
193
- "Ø": 149,
194
- "Ù": 150,
195
- "Ú": 151,
196
- "Û": 152,
197
- "Ü": 153,
198
- "Ý": 154,
199
- "Þ": 155,
200
- "ß": 156,
201
- "à": 157,
202
- "á": 158,
203
- "â": 159,
204
- "ã": 160,
205
- "ä": 161,
206
- "å": 162,
207
- "æ": 163,
208
- "ç": 164,
209
- "è": 165,
210
- "é": 166,
211
- "ê": 167,
212
- "ë": 168,
213
- "ì": 169,
214
- "í": 170,
215
- "î": 171,
216
- "ï": 172,
217
- "ð": 173,
218
- "ñ": 174,
219
- "ò": 175,
220
- "ó": 176,
221
- "ô": 177,
222
- "õ": 178,
223
- "ö": 179,
224
- "÷": 180,
225
- "ø": 181,
226
- "ù": 182,
227
- "ú": 183,
228
- "û": 184,
229
- "ü": 185,
230
- "ý": 186,
231
- "þ": 187,
232
- "ÿ": 188,
233
- "Ā": 189,
234
- "ā": 190,
235
- "Ă": 191,
236
- "ă": 192,
237
- "Ą": 193,
238
- "ą": 194,
239
- "Ć": 195,
240
- "ć": 196,
241
- "Ĉ": 197,
242
- "ĉ": 198,
243
- "Ċ": 199,
244
- "ċ": 200,
245
- "Č": 201,
246
- "č": 202,
247
- "Ď": 203,
248
- "ď": 204,
249
- "Đ": 205,
250
- "đ": 206,
251
- "Ē": 207,
252
- "ē": 208,
253
- "Ĕ": 209,
254
- "ĕ": 210,
255
- "Ė": 211,
256
- "ė": 212,
257
- "Ę": 213,
258
- "ę": 214,
259
- "Ě": 215,
260
- "ě": 216,
261
- "Ĝ": 217,
262
- "ĝ": 218,
263
- "Ğ": 219,
264
- "ğ": 220,
265
- "Ġ": 221,
266
- "ġ": 222,
267
- "Ģ": 223,
268
- "ģ": 224,
269
- "Ĥ": 225,
270
- "ĥ": 226,
271
- "Ħ": 227,
272
- "ħ": 228,
273
- "Ĩ": 229,
274
- "ĩ": 230,
275
- "Ī": 231,
276
- "ī": 232,
277
- "Ĭ": 233,
278
- "ĭ": 234,
279
- "Į": 235,
280
- "į": 236,
281
- "İ": 237,
282
- "ı": 238,
283
- "Ĳ": 239,
284
- "ĳ": 240,
285
- "Ĵ": 241,
286
- "ĵ": 242,
287
- "Ķ": 243,
288
- "ķ": 244,
289
- "ĸ": 245,
290
- "Ĺ": 246,
291
- "ĺ": 247,
292
- "Ļ": 248,
293
- "ļ": 249,
294
- "Ľ": 250,
295
- "ľ": 251,
296
- "Ŀ": 252,
297
- "ŀ": 253,
298
- "Ł": 254,
299
- "ł": 255,
300
- "Ń": 256,
301
- "GG": 257,
302
- "AA": 258,
303
- "GC": 259,
304
- "UU": 260,
305
- "AC": 261,
306
- "GU": 262,
307
- "AU": 263,
308
- "CC": 264,
309
- "GAA": 265,
310
- "CU": 266,
311
- "GA": 267,
312
- "AGC": 268,
313
- "GGU": 269,
314
- "GGC": 270,
315
- "GAC": 271,
316
- "GUU": 272,
317
- "GAU": 273,
318
- "AGG": 274,
319
- "AAU": 275,
320
- "AUU": 276,
321
- "CGG": 277,
322
- "CGC": 278,
323
- "AGU": 279,
324
- "ACU": 280,
325
- "CUU": 281,
326
- "CCU": 282,
327
- "GCU": 283,
328
- "CAA": 284,
329
- "CAC": 285,
330
- "GGGG": 286,
331
- "GUAA": 287,
332
- "GGAA": 288,
333
- "AGA": 289,
334
- "UUU": 290,
335
- "GGGC": 291,
336
- "AUGC": 292,
337
- "GUGC": 293,
338
- "ACGG": 294,
339
- "GUC": 295,
340
- "AGCU": 296,
341
- "GACU": 297,
342
- "GAGG": 298,
343
- "AGAU": 299,
344
- "AGAA": 300,
345
- "AUC": 301,
346
- "GAGC": 302,
347
- "AACU": 303,
348
- "AAGC": 304,
349
- "GAGU": 305,
350
- "AGUU": 306,
351
- "GAAU": 307,
352
- "AGGC": 308,
353
- "CGU": 309,
354
- "GAAAGC": 310,
355
- "GGCU": 311,
356
- "AGGU": 312,
357
- "GGCC": 313,
358
- "AAUAC": 314,
359
- "CAGC": 315,
360
- "AUUU": 316,
361
- "CAU": 317,
362
- "AAUU": 318,
363
- "GGGU": 319,
364
- "GAUU": 320,
365
- "GGUU": 321,
366
- "CUGC": 322,
367
- "GAGGC": 323,
368
- "GGAC": 324,
369
- "GUGU": 325,
370
- "AUCC": 326,
371
- "CGCU": 327,
372
- "AAAC": 328,
373
- "GGUGAA": 329,
374
- "CCC": 330,
375
- "GGAU": 331,
376
- "GUUU": 332,
377
- "GUGAA": 333,
378
- "GAAGGC": 334,
379
- "GCGC": 335,
380
- "GUCC": 336,
381
- "CGGCU": 337,
382
- "GCAC": 338,
383
- "CUUU": 339,
384
- "AACAC": 340,
385
- "AAC": 341,
386
- "CAGU": 342,
387
- "AAGUC": 343,
388
- "GUAGC": 344,
389
- "CCUU": 345,
390
- "CGGU": 346,
391
- "AAAA": 347,
392
- "GAGAC": 348,
393
- "GGAAUU": 349,
394
- "GUCU": 350,
395
- "CCGC": 351,
396
- "GAAGAA": 352,
397
- "AGCAGU": 353,
398
- "AGAC": 354,
399
- "ACCU": 355,
400
- "GACGCU": 356,
401
- "AGACU": 357,
402
- "ACGU": 358,
403
- "GGGCGUAA": 359,
404
- "UUUU": 360,
405
- "CCCU": 361,
406
- "CAGG": 362,
407
- "AUCU": 363,
408
- "GUGGGG": 364,
409
- "CCAC": 365,
410
- "GGUAA": 366,
411
- "GGCGAAGGC": 367,
412
- "GGAGG": 368,
413
- "GGCUU": 369,
414
- "CCUACGG": 370,
415
- "GAGAGG": 371,
416
- "CGCGU": 372,
417
- "GGUGAAAUGC": 373,
418
- "GGAGC": 374,
419
- "GGGAA": 375,
420
- "GGCGGC": 376,
421
- "GAACGCU": 377,
422
- "ACUU": 378,
423
- "GUGA": 379,
424
- "AAUAUU": 380,
425
- "CGAU": 381,
426
- "GACGGU": 382,
427
- "CCCC": 383,
428
- "GAGGCAGCAGU": 384,
429
- "AUGCAAGUC": 385,
430
- "AUAA": 386,
431
- "GCUU": 387,
432
- "GUGCCAGC": 388,
433
- "CGGC": 389,
434
- "AAUGGGC": 390,
435
- "CGCGGU": 391,
436
- "GCCU": 392,
437
- "CAUU": 393,
438
- "ACCC": 394,
439
- "CUCU": 395,
440
- "CGGCUAACU": 396,
441
- "GUGGGGAGC": 397,
442
- "GGGAU": 398,
443
- "GAACGCUGGCGGC": 399,
444
- "CCUACGGGAGGCAGCAGU": 400,
445
- "ACAC": 401,
446
- "CACU": 402,
447
- "GAGGU": 403,
448
- "GUUGUAA": 404,
449
- "GAUGC": 405,
450
- "GUAGCGGUGAAAUGC": 406,
451
- "CGAA": 407,
452
- "GGAAU": 408,
453
- "AAGU": 409,
454
- "AUAC": 410,
455
- "CCAGC": 411,
456
- "GGUCU": 412,
457
- "GUGCCAGCAGC": 413,
458
- "AUGU": 414,
459
- "GAAAGCGUGGGGAGC": 415,
460
- "UUCGG": 416,
461
- "CAAGGC": 417,
462
- "AAGCGUU": 418,
463
- "AGCUU": 419,
464
- "GAACGG": 420,
465
- "AAACAGG": 421,
466
- "CUUCGG": 422,
467
- "CAAU": 423,
468
- "AACGC": 424,
469
- "AACC": 425,
470
- "CGAC": 426,
471
- "ACGGU": 427,
472
- "GAGGAA": 428,
473
- "GUGAGUAA": 429,
474
- "GGCGG": 430,
475
- "GUGCCAGCAGCCGCGGU": 431,
476
- "GGCCU": 432,
477
- "ACUGC": 433,
478
- "GUAGGC": 434,
479
- "GGGCU": 435,
480
- "CUUUU": 436,
481
- "CCGU": 437,
482
- "AAAGG": 438,
483
- "AACACAUGCAAGUC": 439,
484
- "GUAGAU": 440,
485
- "AUAU": 441,
486
- "AGACUCCUACGGGAGGCAGCAGU": 442,
487
- "GGGACU": 443,
488
- "GGGUU": 444,
489
- "GUAGA": 445,
490
- "GAAGC": 446,
491
- "GGGGAAUAUU": 447,
492
- "CAUGC": 448,
493
- "UUGC": 449,
494
- "GGUUU": 450,
495
- "GGAUU": 451,
496
- "GGGGU": 452,
497
- "ACUGGGCGUAA": 453,
498
- "CCUGC": 454,
499
- "AGAAU": 455,
500
- "AGCUAGUU": 456,
501
- "CUGAC": 457,
502
- "GGAUUU": 458,
503
- "CGGAAUU": 459,
504
- "CGUU": 460,
505
- "GAGAA": 461,
506
- "CUGU": 462,
507
- "GAGCGUU": 463,
508
- "AUUAGAU": 464,
509
- "GAAAGCGUGGGGAGCAAACAGG": 465,
510
- "CCUGGU": 466,
511
- "ACUGACGCU": 467,
512
- "AGAGU": 468,
513
- "CUCC": 469,
514
- "AUGAU": 470,
515
- "GACGAU": 471,
516
- "ACC": 472,
517
- "GGCCUUCGG": 473,
518
- "AAAU": 474,
519
- "GCAU": 475,
520
- "AACUU": 476,
521
- "GAAAC": 477,
522
- "GAACGCUGGCGGCGUGC": 478,
523
- "AGGGUGC": 479,
524
- "CUGAU": 480,
525
- "AAUACCGC": 481,
526
- "CACACU": 482,
527
- "AGGAA": 483,
528
- "ACUUU": 484,
529
- "CGGAU": 485,
530
- "GGAACU": 486,
531
- "GACGC": 487,
532
- "ACGGCCC": 488,
533
- "AUUUU": 489,
534
- "CUCAA": 490,
535
- "GGCGGACGG": 491,
536
- "AGGAGG": 492,
537
- "CUGUU": 493,
538
- "GGACU": 494,
539
- "GAGAU": 495,
540
- "AACCU": 496,
541
- "GGAGU": 497,
542
- "GGGGGAU": 498,
543
- "GGCCUUCGGGUUGUAA": 499,
544
- "GAGUU": 500,
545
- "GCAA": 501,
546
- "AUCGG": 502,
547
- "AGUUU": 503,
548
- "CAGUGGCGAAGGC": 504,
549
- "GUAGU": 505,
550
- "GACCU": 506,
551
- "GUAGG": 507,
552
- "ACCAAGGC": 508,
553
- "AAGUU": 509,
554
- "GUCGG": 510,
555
- "GAUGCAGC": 511,
556
- "GUGAGU": 512,
557
- "CAUC": 513,
558
- "GAUGAA": 514,
559
- "AGGCCU": 515,
560
- "GCAAGC": 516,
561
- "CGAGU": 517,
562
- "GUGAGUAACAC": 518,
563
- "GGUCUGAGAGG": 519,
564
- "CGGAAUUACUGGGCGUAA": 520,
565
- "CAAGC": 521,
566
- "CGGCUAACUCC": 522,
567
- "GGCGC": 523,
568
- "AAUGGGCGAAAGC": 524,
569
- "AUGAC": 525,
570
- "UACGU": 526,
571
- "CCCGG": 527,
572
- "AAACU": 528,
573
- "GAAAUGC": 529,
574
- "AUGAA": 530,
575
- "CGCGUGAGU": 531,
576
- "GGGACUGAGAC": 532,
577
- "CUAAUAC": 533,
578
- "GAGCU": 534,
579
- "AUCAA": 535,
580
- "UAC": 536,
581
- "CUC": 537,
582
- "AUUAGAUAC": 538,
583
- "ACGGUCC": 539,
584
- "AAUGC": 540,
585
- "ACGUG": 541,
586
- "GGGUAGC": 542,
587
- "AGAGC": 543,
588
- "ACGC": 544,
589
- "CGGCCAC": 545,
590
- "GGCUAACU": 546,
591
- "AUUGGGCGUAA": 547,
592
- "AGAUU": 548,
593
- "ACCGC": 549,
594
- "GGGAC": 550,
595
- "GAAACU": 551,
596
- "CGGUGGCGAAGGC": 552,
597
- "AGGUU": 553,
598
- "CGAGC": 554,
599
- "GUGCCAGCAGCCGCGGUAAUAC": 555,
600
- "GUGAU": 556,
601
- "GUAGGU": 557,
602
- "AUAUU": 558,
603
- "AUUAGCUAGUU": 559,
604
- "AAAGC": 560,
605
- "GGCGAACGG": 561,
606
- "GUUUU": 562,
607
- "AGAAUU": 563,
608
- "AAGAA": 564,
609
- "GUAC": 565,
610
- "CCUUU": 566,
611
- "GAACAGG": 567,
612
- "AGCUGGUCUGAGAGG": 568,
613
- "GGAACUGAGAC": 569,
614
- "UUAACACAUGCAAGUC": 570,
615
- "GGGUUU": 571,
616
- "AAUGGGCGCAAGC": 572,
617
- "GUAGCGGUGAAAUGCGUAGAU": 573,
618
- "GAUACU": 574,
619
- "AGGCU": 575,
620
- "CCAU": 576,
621
- "GGUGC": 577,
622
- "ACGGCCCAGACUCCUACGGGAGGCAGCAGU": 578,
623
- "CCCAC": 579,
624
- "AGUC": 580,
625
- "AGGAGGAACAC": 581,
626
- "ACCAA": 582,
627
- "GAACGC": 583,
628
- "GUCAA": 584,
629
- "CAGCCACACU": 585,
630
- "GUAACU": 586,
631
- "GAGGCGC": 587,
632
- "CGGCCU": 588,
633
- "AAGCAC": 589,
634
- "GGGGC": 590,
635
- "CCCGGU": 591,
636
- "GGGGAAUAUUGCAC": 592,
637
- "CGCGUGU": 593,
638
- "CUGAA": 594,
639
- "GGAACUGAGACACGGUCC": 595,
640
- "AAUGGGG": 596,
641
- "GUUGGU": 597,
642
- "GCCC": 598,
643
- "GGUGAAAUU": 599,
644
- "AAUACGG": 600,
645
- "GAUUU": 601,
646
- "AGAAGAA": 602,
647
- "GGGCUU": 603,
648
- "AUCCU": 604,
649
- "GAAAGU": 605,
650
- "ACCUU": 606,
651
- "GUGAAAGC": 607,
652
- "GCAGGC": 608,
653
- "GUAU": 609,
654
- "GUCAC": 610,
655
- "GUGGU": 611,
656
- "GACGAACGCUGGCGGCGUGC": 612,
657
- "GUGAC": 613,
658
- "AUCAC": 614,
659
- "GGCUCAA": 615,
660
- "CGGAAUUACUGGGCGUAAAGC": 616,
661
- "GCUCAA": 617,
662
- "GGGA": 618,
663
- "GUGAAAUCC": 619,
664
- "ACAUU": 620,
665
- "AUCUU": 621,
666
- "AGGGAAU": 622,
667
- "AAAUU": 623,
668
- "CAGAA": 624,
669
- "CUGAUCCAGC": 625,
670
- "AGAUAUC": 626,
671
- "GUUGC": 627,
672
- "AUCGUAA": 628,
673
- "GGGGUAA": 629,
674
- "GGAAUUCCUGGU": 630,
675
- "GGAAAC": 631,
676
- "GUAGAGAU": 632,
677
- "AAAAU": 633,
678
- "CCCUU": 634,
679
- "GACACU": 635,
680
- "GACGGUACCU": 636,
681
- "CGUAA": 637,
682
- "GUGGC": 638,
683
- "GCUGAA": 639,
684
- "GGGUAA": 640,
685
- "CGAAU": 641,
686
- "GUUGUU": 642,
687
- "GCUGC": 643,
688
- "GGGAAU": 644,
689
- "CUGAGAGG": 645,
690
- "AGAGGU": 646,
691
- "GAGA": 647,
692
- "CGGCUAACUCCGUGCCAGCAGCCGCGGU": 648,
693
- "AUCCGGAUUU": 649,
694
- "GCGCGUAGGC": 650,
695
- "CCAA": 651,
696
- "ACAA": 652,
697
- "AAUUUU": 653,
698
- "CCCAA": 654,
699
- "GAGGCAC": 655,
700
- "GUGAGUAACACGU": 656,
701
- "AAGCGUUGUCC": 657,
702
- "GAAC": 658,
703
- "CACCAGUGGCGAAGGC": 659,
704
- "AGAGG": 660,
705
- "GUGCU": 661,
706
- "CGGAAU": 662,
707
- "ACAGG": 663,
708
- "GGUCUUCGG": 664,
709
- "CACCU": 665,
710
- "AUAGAU": 666,
711
- "CAGUU": 667,
712
- "GAGGAGC": 668,
713
- "CGGAA": 669,
714
- "GAUUGC": 670,
715
- "AGGCCUAACACAUGCAAGUC": 671,
716
- "CCGGU": 672,
717
- "CCCGC": 673,
718
- "GCUCGU": 674,
719
- "CACGGCUAACU": 675,
720
- "AUGGU": 676,
721
- "AUUGAACGCUGGCGGC": 677,
722
- "GGGGAAUAUUGGAC": 678,
723
- "UUCU": 679,
724
- "UUGCU": 680,
725
- "ACUCU": 681,
726
- "AUAGC": 682,
727
- "GAGGAAUAUU": 683,
728
- "AAGCAU": 684,
729
- "GGAUC": 685,
730
- "AGGGAAGAA": 686,
731
- "AGAAGAAGCAC": 687,
732
- "GCUAAUACCGC": 688,
733
- "ACGGGC": 689,
734
- "GGGACUGAGACACGGCCCAGACUCCUACGGGAGGCAGCAGU": 690,
735
- "CA": 691,
736
- "CGCAA": 692,
737
- "GUAGCGGUGAAAUGCGC": 693,
738
- "ACGAU": 694,
739
- "GGGAUU": 695,
740
- "AGCUUGUUGGU": 696,
741
- "AAUCU": 697,
742
- "CGCGUGC": 698,
743
- "CAUGCCGCGUGU": 699,
744
- "GUCUU": 700,
745
- "GGUGAAAUUCGU": 701,
746
- "GUGAGUAAU": 702,
747
- "GAGGUAA": 703,
748
- "GGAACUGAGACACGGUCCAGACUCCUACGGGAGGCAGCAGU": 704,
749
- "CUGAUGCAGC": 705,
750
- "AAUAA": 706,
751
- "CCCCU": 707,
752
- "GAAAGCU": 708,
753
- "AACGCCGCGUGAGU": 709,
754
- "GGAGGAACAC": 710,
755
- "AGGGAU": 711,
756
- "AGAUAUU": 712,
757
- "CCGGGG": 713,
758
- "AGCAC": 714,
759
- "CGGCUAACUAC": 715,
760
- "GGCUUACCAAGGC": 716,
761
- "CAAGGCGACGAU": 717,
762
- "GGGUUUAAAGG": 718,
763
- "CUGGU": 719,
764
- "CAGA": 720,
765
- "GUCGC": 721,
766
- "CGGCUAACUACGUG": 722,
767
- "GAAUAA": 723,
768
- "GUAGAGGUGAAAUUCGU": 724,
769
- "GCCUU": 725,
770
- "GACUU": 726,
771
- "CCUAGU": 727,
772
- "AAACGG": 728,
773
- "GAGUGC": 729,
774
- "GUUCU": 730,
775
- "CGGCUAACUCCGUGCCAGCAGCCGCGGUAAUACGG": 731,
776
- "GGUGGGG": 732,
777
- "CCCAGU": 733,
778
- "CGGCCACACU": 734,
779
- "AGGGAA": 735,
780
- "AGGGGAGC": 736,
781
- "AACUGACGCU": 737,
782
- "GGGUAGCCGGCCU": 738,
783
- "CUUUGAACGC": 739,
784
- "GGGGAU": 740,
785
- "AUCAAU": 741,
786
- "GUGAAUUGC": 742,
787
- "AACGU": 743,
788
- "AGGGAAUCUU": 744,
789
- "UACGUAGG": 745,
790
- "AGAUAUCAGGAGGAACAC": 746,
791
- "GAGGAAUAUUGGU": 747,
792
- "AGUCC": 748,
793
- "CUAU": 749,
794
- "AGCAU": 750,
795
- "GGGCUCAA": 751,
796
- "AGGGC": 752,
797
- "GGAAACU": 753,
798
- "AACAA": 754,
799
- "CAGGU": 755,
800
- "ACGUU": 756,
801
- "AAUUU": 757,
802
- "AGAUUU": 758,
803
- "AAUGGGCGAAAGCCUGAC": 759,
804
- "AUCGC": 760,
805
- "GAAAGCGU": 761,
806
- "ACAAU": 762,
807
- "AGGGG": 763,
808
- "GAGUAA": 764,
809
- "GAGGUGC": 765,
810
- "AAUCGGAAUUACUGGGCGUAAAGC": 766,
811
- "CGGUU": 767,
812
- "GAGCGUUGUCC": 768,
813
- "GAUGAAGAA": 769,
814
- "GCAGC": 770,
815
- "GAGAGU": 771,
816
- "GACGAACGCUGGCGGCGUGCUUAACACAUGCAAGUC": 772,
817
- "GUCCU": 773,
818
- "GAAAUGCGAU": 774,
819
- "AGCUAGUUGGU": 775,
820
- "GACGUU": 776,
821
- "GAAUU": 777,
822
- "GACUGC": 778,
823
- "GCUGCAU": 779,
824
- "AGAGGAA": 780,
825
- "AUACU": 781,
826
- "AUCAGCUUGUUGGU": 782,
827
- "GAUCU": 783,
828
- "CGGAUU": 784,
829
- "AAUCUU": 785,
830
- "GGAAUUCC": 786,
831
- "CUAAUACAUGCAAGUC": 787,
832
- "GUUAA": 788,
833
- "CAGCU": 789,
834
- "CGACCUGAGAGG": 790,
835
- "GCUGAACUU": 791,
836
- "GAAGAAGGCCUUCGGGUUGUAA": 792,
837
- "GAUUGCGAAGGC": 793,
838
- "CCCGU": 794,
839
- "GGGAGC": 795,
840
- "GUAAU": 796,
841
- "GACGGUAC": 797,
842
- "GACGGGUAGCCGGCCU": 798,
843
- "AGCGC": 799,
844
- "GCUCGUAGGC": 800,
845
- "GGCCUU": 801,
846
- "CCGAA": 802,
847
- "GUGAAGAA": 803,
848
- "GGAAUUCCCGGU": 804,
849
- "CCAGU": 805,
850
- "AUUGUAA": 806,
851
- "CGGCUAACUU": 807,
852
- "CAAUU": 808,
853
- "GGAAUUAUUGGGCGUAA": 809,
854
- "GAAAGCGUGGGGAGCGAACAGG": 810,
855
- "CCGG": 811,
856
- "CCCAU": 812,
857
- "CGAGG": 813,
858
- "AGGAC": 814,
859
- "AAAGU": 815,
860
- "CCGAU": 816,
861
- "CACCAA": 817,
862
- "AGCCACGGCUAACU": 818,
863
- "UUUCU": 819,
864
- "GGCGGU": 820,
865
- "GGAAUGC": 821,
866
- "GAAACCCU": 822,
867
- "AAGUCC": 823,
868
- "CGUGC": 824,
869
- "GAAAGCGUGGGGAGCAAACAGGAUUAGAUAC": 825,
870
- "AGCUGGUCUGAGAGGAUGAU": 826,
871
- "AGAGGGG": 827,
872
- "AUGGUU": 828,
873
- "CGAUU": 829,
874
- "AUUAGCUAGUUGGU": 830,
875
- "AUGCCU": 831,
876
- "AGAGUGC": 832,
877
- "GAAAA": 833,
878
- "GAUGAACGCUGGCGGCGUGC": 834,
879
- "GGUAAC": 835,
880
- "ACGAC": 836,
881
- "GUCAUU": 837,
882
- "AAUACCGGAU": 838,
883
- "GUGUAGGC": 839,
884
- "GAGGGG": 840,
885
- "AUAAU": 841,
886
- "CGCGUGAGG": 842,
887
- "AGCUCGU": 843,
888
- "AG": 844,
889
- "CACUGGGCGUAA": 845,
890
- "ACUGGGU": 846,
891
- "GAAUCAUC": 847,
892
- "CUUGC": 848,
893
- "CAACU": 849,
894
- "CAGGC": 850,
895
- "AAGCGGAGG": 851,
896
- "AGGGCGCGUAGGC": 852,
897
- "AAGCGUUGUU": 853,
898
- "GGAACUGC": 854,
899
- "CCAUU": 855,
900
- "ACCAU": 856,
901
- "AAGUCU": 857,
902
- "AUCCGGAUUUAUU": 858,
903
- "CGAUGGCGAAGGC": 859,
904
- "ACACU": 860,
905
- "GGGAGG": 861,
906
- "GUGAGUAACGCGU": 862,
907
- "GAAUCUUUGAACGC": 863,
908
- "CCUUUU": 864,
909
- "CAGAU": 865,
910
- "AGUGAA": 866,
911
- "GGAGAA": 867,
912
- "AACUCUGUU": 868,
913
- "GGCGGACGGGUGAGUAAU": 869,
914
- "GUAGAGGUGAAAUUCGUAGAUAUU": 870,
915
- "ACCGG": 871,
916
- "GAGACGC": 872,
917
- "GUAUU": 873,
918
- "AAGCAUAUCAAU": 874,
919
- "CCUGCCCUU": 875,
920
- "AUGCU": 876,
921
- "AGUAAU": 877,
922
- "AGGGAC": 878,
923
- "AUCAGCUUGUUGGUGGGGU": 879,
924
- "AGUAA": 880,
925
- "CCAGCCAA": 881,
926
- "AGAAUAAGCAC": 882,
927
- "CUCUGGGC": 883,
928
- "AUCAGGU": 884,
929
- "CCUAU": 885,
930
- "GAUAAU": 886,
931
- "ACCAC": 887,
932
- "GGAUCC": 888,
933
- "CGACCUGAGAGGGUGAU": 889,
934
- "CGCCU": 890,
935
- "CGA": 891,
936
- "ACAU": 892,
937
- "CUUCU": 893,
938
- "GGAGA": 894,
939
- "AAGCU": 895,
940
- "GGAAUUCCUGGUGUAGCGGUGAAAUGCGC": 896,
941
- "AGCGAAAUGCGAU": 897,
942
- "GAUGUU": 898,
943
- "AAACGGG": 899,
944
- "AAGAC": 900,
945
- "AGCACUUU": 901,
946
- "AAUGGGGGAAACCCU": 902,
947
- "GUGUU": 903,
948
- "AAUGGAC": 904,
949
- "GGGAUAA": 905,
950
- "GACGGCCUUCGGGUUGUAA": 906,
951
- "CAUUU": 907,
952
- "GGUAUU": 908,
953
- "CGACU": 909,
954
- "GACGCUGAGGCGC": 910,
955
- "AGGCUU": 911,
956
- "AGCUAAUACCGC": 912,
957
- "GGUCC": 913,
958
- "GGGAACUGC": 914,
959
- "GUCGUAA": 915,
960
- "GAAGGGG": 916,
961
- "GUGUAGC": 917,
962
- "AUGUU": 918,
963
- "AAGCAUAUCAAUAAGCGGAGG": 919,
964
- "AGCGGCGGACGG": 920,
965
- "UACGUAGGGUGC": 921,
966
- "GAACU": 922,
967
- "CCAGG": 923,
968
- "AGUGC": 924,
969
- "CCUAC": 925,
970
- "GGCGAAAGC": 926,
971
- "GCUCU": 927,
972
- "CACUU": 928,
973
- "GGUCUU": 929,
974
- "AUUGC": 930,
975
- "CAUUGGGCGUAA": 931,
976
- "CCCUGC": 932,
977
- "GCUAGC": 933,
978
- "GUUGCU": 934,
979
- "AGAGAU": 935,
980
- "GUCGUC": 936,
981
- "CGCUU": 937,
982
- "AAUGGGCGCAAGCCUGAUCCAGC": 938,
983
- "GAACC": 939,
984
- "GUGAAUUGCAGAAUU": 940,
985
- "GGCGAACGGGUGAGUAACAC": 941,
986
- "GAAAGCUAGGGGAGC": 942,
987
- "GAAUCAUCGAAUCUUUGAACGC": 943,
988
- "ACUGGAA": 944,
989
- "AACGG": 945,
990
- "CUAAUACAUGCAAGUCGAGC": 946,
991
- "AGCUUGCU": 947,
992
- "AUUAGAUACCC": 948,
993
- "GGAGCAACGCCGCGUGAGU": 949,
994
- "AAUGGGCGCAAGCCUGAUGCAGC": 950,
995
- "GUGAAAUCCCC": 951,
996
- "AAGGU": 952,
997
- "CGCGC": 953,
998
- "GGUUUU": 954,
999
- "GGGUUUAAAGGGUGC": 955,
1000
- "CGGCCACAUU": 956,
1001
- "GGAAGCCU": 957,
1002
- "GUACAC": 958,
1003
- "GGUCUUCGGAUCGUAA": 959,
1004
- "AUUGAACGCUGGCGGCAGGCCUAACACAUGCAAGUC": 960,
1005
- "GACGGGUAGCCGGCCUGAGAGG": 961,
1006
- "AUUCU": 962,
1007
- "GAAAGG": 963,
1008
- "CCUUCGG": 964,
1009
- "GGAGCU": 965,
1010
- "CUUGAGU": 966,
1011
- "CGGAGCU": 967,
1012
- "GACUUU": 968,
1013
- "GUGCCAGCCGC": 969,
1014
- "GCAGU": 970,
1015
- "AGUUGGU": 971,
1016
- "AAGCAUAUCAAUAAGCGGAGGA": 972,
1017
- "GAAAGCCAGG": 973,
1018
- "GGUAAGGUAAC": 974,
1019
- "GGGUUGUAA": 975,
1020
- "ACCCGCUGAACUU": 976,
1021
- "ACAUUGCGC": 977,
1022
- "GGGGAGU": 978,
1023
- "AUCAGC": 979,
1024
- "ACUUCUUUU": 980,
1025
- "AGCUCU": 981,
1026
- "UACGG": 982,
1027
- "GUAGCGGUGAAAUGCUU": 983,
1028
- "AAGGC": 984,
1029
- "CCUCU": 985,
1030
- "AUCAAACAGG": 986,
1031
- "AGCUGGUCUGAGAGGAUGAUCAGCCACACU": 987,
1032
- "AUGGGG": 988,
1033
- "GAGAGC": 989,
1034
- "GGUGAAAUGCGUAGAU": 990,
1035
- "GAGGGC": 991,
1036
- "GGCAGC": 992,
1037
- "GUGAGG": 993,
1038
- "AUCGGGAGGAA": 994,
1039
- "AGAGCUCGUAGGC": 995,
1040
- "GGGGAAUUUU": 996,
1041
- "CAUCU": 997,
1042
- "GAUCCAGC": 998,
1043
- "GAACGGC": 999,
1044
- "GGAAUUCCUAGU": 1000,
1045
- "CGUC": 1001,
1046
- "GGCCCU": 1002,
1047
- "GAUGAU": 1003,
1048
- "AUAAGACU": 1004,
1049
- "GGCUCACU": 1005,
1050
- "GGGGGAC": 1006,
1051
- "AAUCUGC": 1007,
1052
- "GAACAC": 1008,
1053
- "AACUGC": 1009,
1054
- "AAUACCC": 1010,
1055
- "GGACUCGC": 1011,
1056
- "CAUGCCGCGUGUGUGAAGAA": 1012,
1057
- "GUUAC": 1013,
1058
- "AAUUC": 1014,
1059
- "GGCAC": 1015,
1060
- "ACCAAGGCGACGAU": 1016,
1061
- "CUCAACCU": 1017,
1062
- "CGGCUAACUCCGUGCCAGCAGCCGCGGUAAUACGGAGG": 1018,
1063
- "AGAGAA": 1019,
1064
- "CAAAA": 1020,
1065
- "AAGCGUUAUCC": 1021,
1066
- "GAACGGAAAGG": 1022,
1067
- "GGUUUUCGG": 1023
1068
- },
1069
- "merges": [
1070
- "G G",
1071
- "A A",
1072
- "G C",
1073
- "U U",
1074
- "A C",
1075
- "G U",
1076
- "A U",
1077
- "C C",
1078
- "G AA",
1079
- "C U",
1080
- "G A",
1081
- "A GC",
1082
- "GG U",
1083
- "GG C",
1084
- "G AC",
1085
- "G UU",
1086
- "G AU",
1087
- "A GG",
1088
- "AA U",
1089
- "A UU",
1090
- "C GG",
1091
- "C GC",
1092
- "A GU",
1093
- "AC U",
1094
- "C UU",
1095
- "CC U",
1096
- "GC U",
1097
- "C AA",
1098
- "C AC",
1099
- "GG GG",
1100
- "GU AA",
1101
- "GG AA",
1102
- "A GA",
1103
- "UU U",
1104
- "GG GC",
1105
- "AU GC",
1106
- "GU GC",
1107
- "AC GG",
1108
- "GU C",
1109
- "AGC U",
1110
- "GAC U",
1111
- "GA GG",
1112
- "A GAU",
1113
- "A GAA",
1114
- "AU C",
1115
- "GA GC",
1116
- "AA CU",
1117
- "AA GC",
1118
- "GA GU",
1119
- "A GUU",
1120
- "GAA U",
1121
- "A GGC",
1122
- "C GU",
1123
- "GAA AGC",
1124
- "GG CU",
1125
- "A GGU",
1126
- "GG CC",
1127
- "AAU AC",
1128
- "C AGC",
1129
- "AUU U",
1130
- "C AU",
1131
- "AA UU",
1132
- "GG GU",
1133
- "GA UU",
1134
- "GG UU",
1135
- "CU GC",
1136
- "GA GGC",
1137
- "GG AC",
1138
- "GU GU",
1139
- "AU CC",
1140
- "CGC U",
1141
- "AA AC",
1142
- "GGU GAA",
1143
- "CC C",
1144
- "GG AU",
1145
- "GUU U",
1146
- "GU GAA",
1147
- "GAA GGC",
1148
- "GC GC",
1149
- "GU CC",
1150
- "CGG CU",
1151
- "GC AC",
1152
- "CUU U",
1153
- "AA CAC",
1154
- "AA C",
1155
- "C AGU",
1156
- "AA GUC",
1157
- "GU AGC",
1158
- "CC UU",
1159
- "C GGU",
1160
- "AA AA",
1161
- "GA GAC",
1162
- "GGAA UU",
1163
- "GU CU",
1164
- "CC GC",
1165
- "GAA GAA",
1166
- "AGC AGU",
1167
- "A GAC",
1168
- "AC CU",
1169
- "GAC GCU",
1170
- "A GACU",
1171
- "AC GU",
1172
- "GGGC GUAA",
1173
- "UU UU",
1174
- "CC CU",
1175
- "C AGG",
1176
- "AU CU",
1177
- "GU GGGG",
1178
- "CC AC",
1179
- "GGU AA",
1180
- "GGC GAAGGC",
1181
- "GG AGG",
1182
- "GGC UU",
1183
- "CCU ACGG",
1184
- "GA GAGG",
1185
- "CGC GU",
1186
- "GGUGAA AUGC",
1187
- "GG AGC",
1188
- "GG GAA",
1189
- "GGC GGC",
1190
- "GAA CGCU",
1191
- "AC UU",
1192
- "GU GA",
1193
- "AAU AUU",
1194
- "C GAU",
1195
- "GAC GGU",
1196
- "CC CC",
1197
- "GAGGC AGCAGU",
1198
- "AUGC AAGUC",
1199
- "AU AA",
1200
- "GC UU",
1201
- "GUGC CAGC",
1202
- "C GGC",
1203
- "AAU GGGC",
1204
- "CGC GGU",
1205
- "GC CU",
1206
- "C AUU",
1207
- "AC CC",
1208
- "CU CU",
1209
- "CGGCU AACU",
1210
- "GUGGGG AGC",
1211
- "GG GAU",
1212
- "GAACGCU GGCGGC",
1213
- "CCUACGG GAGGCAGCAGU",
1214
- "AC AC",
1215
- "C ACU",
1216
- "GA GGU",
1217
- "GUU GUAA",
1218
- "GAU GC",
1219
- "GUAGC GGUGAAAUGC",
1220
- "C GAA",
1221
- "GG AAU",
1222
- "AA GU",
1223
- "AU AC",
1224
- "CC AGC",
1225
- "GGU CU",
1226
- "GUGCCAGC AGC",
1227
- "AU GU",
1228
- "GAAAGC GUGGGGAGC",
1229
- "UU CGG",
1230
- "CAA GGC",
1231
- "AAGC GUU",
1232
- "AGC UU",
1233
- "GAA CGG",
1234
- "AAAC AGG",
1235
- "CUU CGG",
1236
- "C AAU",
1237
- "AA CGC",
1238
- "AA CC",
1239
- "C GAC",
1240
- "AC GGU",
1241
- "GA GGAA",
1242
- "GUGA GUAA",
1243
- "GGC GG",
1244
- "GUGCCAGCAGC CGCGGU",
1245
- "GG CCU",
1246
- "ACU GC",
1247
- "GU AGGC",
1248
- "GG GCU",
1249
- "CUU UU",
1250
- "CC GU",
1251
- "AA AGG",
1252
- "AACAC AUGCAAGUC",
1253
- "GU AGAU",
1254
- "AU AU",
1255
- "AGACU CCUACGGGAGGCAGCAGU",
1256
- "GG GACU",
1257
- "GG GUU",
1258
- "GU AGA",
1259
- "GAA GC",
1260
- "GGGG AAUAUU",
1261
- "C AUGC",
1262
- "UU GC",
1263
- "GG UUU",
1264
- "GG AUU",
1265
- "GG GGU",
1266
- "ACU GGGCGUAA",
1267
- "CCU GC",
1268
- "AGAA U",
1269
- "AGCU AGUU",
1270
- "CU GAC",
1271
- "GG AUUU",
1272
- "CGG AAUU",
1273
- "C GUU",
1274
- "GA GAA",
1275
- "CU GU",
1276
- "GAGC GUU",
1277
- "AUU AGAU",
1278
- "GAAAGCGUGGGGAGC AAACAGG",
1279
- "CCU GGU",
1280
- "ACU GACGCU",
1281
- "AGA GU",
1282
- "CU CC",
1283
- "AU GAU",
1284
- "GAC GAU",
1285
- "AC C",
1286
- "GGCC UUCGG",
1287
- "AA AU",
1288
- "GC AU",
1289
- "AA CUU",
1290
- "GAA AC",
1291
- "GAACGCUGGCGGC GUGC",
1292
- "AGG GUGC",
1293
- "CU GAU",
1294
- "AAUAC CGC",
1295
- "CAC ACU",
1296
- "AGG AA",
1297
- "AC UUU",
1298
- "CGG AU",
1299
- "GGAA CU",
1300
- "GAC GC",
1301
- "ACGG CCC",
1302
- "AUU UU",
1303
- "CU CAA",
1304
- "GGCGG ACGG",
1305
- "AGG AGG",
1306
- "CU GUU",
1307
- "GG ACU",
1308
- "GA GAU",
1309
- "AA CCU",
1310
- "GG AGU",
1311
- "GGGG GAU",
1312
- "GGCCUUCGG GUUGUAA",
1313
- "GA GUU",
1314
- "GC AA",
1315
- "AU CGG",
1316
- "AGUU U",
1317
- "CAGU GGCGAAGGC",
1318
- "GU AGU",
1319
- "GAC CU",
1320
- "GU AGG",
1321
- "AC CAAGGC",
1322
- "AA GUU",
1323
- "GU CGG",
1324
- "GAUGC AGC",
1325
- "GU GAGU",
1326
- "C AUC",
1327
- "GAU GAA",
1328
- "AGG CCU",
1329
- "GC AAGC",
1330
- "C GAGU",
1331
- "GUGAGUAA CAC",
1332
- "GGUCU GAGAGG",
1333
- "CGGAAUU ACUGGGCGUAA",
1334
- "CAA GC",
1335
- "CGGCUAACU CC",
1336
- "GGC GC",
1337
- "AAUGGGC GAAAGC",
1338
- "AU GAC",
1339
- "U ACGU",
1340
- "CC CGG",
1341
- "AA ACU",
1342
- "GAA AUGC",
1343
- "AU GAA",
1344
- "CGCGU GAGU",
1345
- "GGGACU GAGAC",
1346
- "CU AAUAC",
1347
- "GA GCU",
1348
- "AU CAA",
1349
- "U AC",
1350
- "CU C",
1351
- "AUUAGAU AC",
1352
- "ACGGU CC",
1353
- "AAU GC",
1354
- "ACGU G",
1355
- "GGGU AGC",
1356
- "AGA GC",
1357
- "AC GC",
1358
- "CGG CCAC",
1359
- "GGCU AACU",
1360
- "AUU GGGCGUAA",
1361
- "AGA UU",
1362
- "AC CGC",
1363
- "GG GAC",
1364
- "GAA ACU",
1365
- "CGGU GGCGAAGGC",
1366
- "AGG UU",
1367
- "C GAGC",
1368
- "GUGCCAGCAGCCGCGGU AAUAC",
1369
- "GU GAU",
1370
- "GU AGGU",
1371
- "AU AUU",
1372
- "AUU AGCUAGUU",
1373
- "AA AGC",
1374
- "GGC GAACGG",
1375
- "GUU UU",
1376
- "AGAA UU",
1377
- "AA GAA",
1378
- "GU AC",
1379
- "CC UUU",
1380
- "GAA CAGG",
1381
- "AGCU GGUCUGAGAGG",
1382
- "GGAACU GAGAC",
1383
- "UU AACACAUGCAAGUC",
1384
- "GG GUUU",
1385
- "AAUGGGC GCAAGC",
1386
- "GUAGCGGUGAAAUGC GUAGAU",
1387
- "GAU ACU",
1388
- "AGG CU",
1389
- "CC AU",
1390
- "GGU GC",
1391
- "ACGGCCC AGACUCCUACGGGAGGCAGCAGU",
1392
- "CC CAC",
1393
- "AGU C",
1394
- "AGGAGG AACAC",
1395
- "AC CAA",
1396
- "GAA CGC",
1397
- "GU CAA",
1398
- "CAGC CACACU",
1399
- "GUAA CU",
1400
- "GAGGC GC",
1401
- "CGG CCU",
1402
- "AAGC AC",
1403
- "GG GGC",
1404
- "CCC GGU",
1405
- "GGGGAAUAUU GCAC",
1406
- "CGC GUGU",
1407
- "CU GAA",
1408
- "GGAACUGAGAC ACGGUCC",
1409
- "AAU GGGG",
1410
- "GUU GGU",
1411
- "GC CC",
1412
- "GGUGAA AUU",
1413
- "AAU ACGG",
1414
- "GA UUU",
1415
- "AGAA GAA",
1416
- "GGGC UU",
1417
- "AU CCU",
1418
- "GAA AGU",
1419
- "AC CUU",
1420
- "GU GAAAGC",
1421
- "GC AGGC",
1422
- "GU AU",
1423
- "GU CAC",
1424
- "GU GGU",
1425
- "GAC GAACGCUGGCGGCGUGC",
1426
- "GU GAC",
1427
- "AU CAC",
1428
- "GGCU CAA",
1429
- "CGGAAUUACUGGGCGUAA AGC",
1430
- "GCU CAA",
1431
- "GG GA",
1432
- "GUGAA AUCC",
1433
- "AC AUU",
1434
- "AU CUU",
1435
- "AGG GAAU",
1436
- "AA AUU",
1437
- "C AGAA",
1438
- "CUGAU CCAGC",
1439
- "AGAU AUC",
1440
- "GUU GC",
1441
- "AUC GUAA",
1442
- "GG GGUAA",
1443
- "GGAAUU CCUGGU",
1444
- "GGAA AC",
1445
- "GUAGA GAU",
1446
- "AA AAU",
1447
- "CC CUU",
1448
- "GAC ACU",
1449
- "GACGGU ACCU",
1450
- "C GUAA",
1451
- "GU GGC",
1452
- "GCU GAA",
1453
- "GG GUAA",
1454
- "C GAAU",
1455
- "GUU GUU",
1456
- "GCU GC",
1457
- "GG GAAU",
1458
- "CU GAGAGG",
1459
- "AGA GGU",
1460
- "GA GA",
1461
- "CGGCUAACUCC GUGCCAGCAGCCGCGGU",
1462
- "AUCC GGAUUU",
1463
- "GCGC GUAGGC",
1464
- "CC AA",
1465
- "AC AA",
1466
- "AAUU UU",
1467
- "CC CAA",
1468
- "GAGGC AC",
1469
- "GUGAGUAACAC GU",
1470
- "AAGCGUU GUCC",
1471
- "GAA C",
1472
- "CAC CAGUGGCGAAGGC",
1473
- "AGA GG",
1474
- "GU GCU",
1475
- "CGG AAU",
1476
- "AC AGG",
1477
- "GGU CUUCGG",
1478
- "CAC CU",
1479
- "AU AGAU",
1480
- "C AGUU",
1481
- "GAGG AGC",
1482
- "CGG AA",
1483
- "GAUU GC",
1484
- "AGGCCU AACACAUGCAAGUC",
1485
- "CC GGU",
1486
- "CC CGC",
1487
- "GCU CGU",
1488
- "CAC GGCUAACU",
1489
- "AU GGU",
1490
- "AUU GAACGCUGGCGGC",
1491
- "GGGGAAUAUU GGAC",
1492
- "UU CU",
1493
- "UU GCU",
1494
- "ACU CU",
1495
- "AU AGC",
1496
- "GAGG AAUAUU",
1497
- "AAGC AU",
1498
- "GG AUC",
1499
- "AGG GAAGAA",
1500
- "AGAAGAA GCAC",
1501
- "GCU AAUACCGC",
1502
- "AC GGGC",
1503
- "GGGACUGAGAC ACGGCCCAGACUCCUACGGGAGGCAGCAGU",
1504
- "C A",
1505
- "CGC AA",
1506
- "GUAGCGGUGAAAUGC GC",
1507
- "AC GAU",
1508
- "GG GAUU",
1509
- "AGCUU GUUGGU",
1510
- "AAU CU",
1511
- "CGC GUGC",
1512
- "CAUGC CGCGUGU",
1513
- "GU CUU",
1514
- "GGUGAAAUU CGU",
1515
- "GUGAGU AAU",
1516
- "GA GGUAA",
1517
- "GGAACUGAGACACGGUCC AGACUCCUACGGGAGGCAGCAGU",
1518
- "CU GAUGCAGC",
1519
- "AAU AA",
1520
- "CC CCU",
1521
- "GAA AGCU",
1522
- "AACGC CGCGUGAGU",
1523
- "GGAGG AACAC",
1524
- "AGG GAU",
1525
- "AGAU AUU",
1526
- "CC GGGG",
1527
- "AGC AC",
1528
- "CGGCUAACU AC",
1529
- "GGCUU ACCAAGGC",
1530
- "CAAGGC GACGAU",
1531
- "GGGUUU AAAGG",
1532
- "CU GGU",
1533
- "C AGA",
1534
- "GU CGC",
1535
- "CGGCUAACU ACGUG",
1536
- "GAAU AA",
1537
- "GUAGA GGUGAAAUUCGU",
1538
- "GC CUU",
1539
- "GAC UU",
1540
- "CCU AGU",
1541
- "AA ACGG",
1542
- "GA GUGC",
1543
- "GUU CU",
1544
- "CGGCUAACUCCGUGCCAGCAGCCGCGGU AAUACGG",
1545
- "GGU GGGG",
1546
- "CCC AGU",
1547
- "CGGCCAC ACU",
1548
- "AGG GAA",
1549
- "AGG GGAGC",
1550
- "AACU GACGCU",
1551
- "GGGUAGC CGGCCU",
1552
- "CUUU GAACGC",
1553
- "GGGG AU",
1554
- "AUC AAU",
1555
- "GUGAA UUGC",
1556
- "AA CGU",
1557
- "AGGGAAU CUU",
1558
- "UACGU AGG",
1559
- "AGAUAUC AGGAGGAACAC",
1560
- "GAGGAAUAUU GGU",
1561
- "AGU CC",
1562
- "CU AU",
1563
- "AGC AU",
1564
- "GGGCU CAA",
1565
- "AGG GC",
1566
- "GGAA ACU",
1567
- "AA CAA",
1568
- "C AGGU",
1569
- "AC GUU",
1570
- "AA UUU",
1571
- "AGA UUU",
1572
- "AAUGGGCGAAAGC CUGAC",
1573
- "AU CGC",
1574
- "GAAAGC GU",
1575
- "AC AAU",
1576
- "AGG GG",
1577
- "GA GUAA",
1578
- "GAGGU GC",
1579
- "AAU CGGAAUUACUGGGCGUAAAGC",
1580
- "CGG UU",
1581
- "GAGCGUU GUCC",
1582
- "GAU GAAGAA",
1583
- "GC AGC",
1584
- "GA GAGU",
1585
- "GACGAACGCUGGCGGCGUGC UUAACACAUGCAAGUC",
1586
- "GU CCU",
1587
- "GAAAUGC GAU",
1588
- "AGCUAGUU GGU",
1589
- "GAC GUU",
1590
- "GAA UU",
1591
- "GACU GC",
1592
- "GCU GCAU",
1593
- "AGA GGAA",
1594
- "AU ACU",
1595
- "AUC AGCUUGUUGGU",
1596
- "GAU CU",
1597
- "CGG AUU",
1598
- "AAU CUU",
1599
- "GGAAUU CC",
1600
- "CUAAUAC AUGCAAGUC",
1601
- "GUU AA",
1602
- "C AGCU",
1603
- "CGAC CUGAGAGG",
1604
- "GCUGAA CUU",
1605
- "GAAGAA GGCCUUCGGGUUGUAA",
1606
- "GAUUGC GAAGGC",
1607
- "CC CGU",
1608
- "GG GAGC",
1609
- "GU AAU",
1610
- "GACGGU AC",
1611
- "GAC GGGUAGCCGGCCU",
1612
- "AGC GC",
1613
- "GCUCGU AGGC",
1614
- "GGCC UU",
1615
- "CC GAA",
1616
- "GUGAA GAA",
1617
- "GGAAUU CCCGGU",
1618
- "CC AGU",
1619
- "AUU GUAA",
1620
- "CGGCU AACUU",
1621
- "CAA UU",
1622
- "GGAAUU AUUGGGCGUAA",
1623
- "GAAAGCGUGGGGAGC GAACAGG",
1624
- "CC GG",
1625
- "CC CAU",
1626
- "C GAGG",
1627
- "AGG AC",
1628
- "AA AGU",
1629
- "CC GAU",
1630
- "CAC CAA",
1631
- "AGC CACGGCUAACU",
1632
- "UUU CU",
1633
- "GGC GGU",
1634
- "GGAAU GC",
1635
- "GAAAC CCU",
1636
- "AA GUCC",
1637
- "C GUGC",
1638
- "GAAAGCGUGGGGAGCAAACAGG AUUAGAUAC",
1639
- "AGCUGGUCUGAGAGG AUGAU",
1640
- "AGA GGGG",
1641
- "AU GGUU",
1642
- "C GAUU",
1643
- "AUUAGCUAGUU GGU",
1644
- "AUGC CU",
1645
- "AGA GUGC",
1646
- "GAA AA",
1647
- "GAU GAACGCUGGCGGCGUGC",
1648
- "GGU AAC",
1649
- "AC GAC",
1650
- "GUC AUU",
1651
- "AAUAC CGGAU",
1652
- "GUGU AGGC",
1653
- "GA GGGG",
1654
- "AU AAU",
1655
- "CGCGU GAGG",
1656
- "AGCU CGU",
1657
- "A G",
1658
- "CACU GGGCGUAA",
1659
- "ACU GGGU",
1660
- "GAAU CAUC",
1661
- "CUU GC",
1662
- "CAA CU",
1663
- "C AGGC",
1664
- "AAGC GGAGG",
1665
- "AGG GCGCGUAGGC",
1666
- "AAGCGUU GUU",
1667
- "GGAA CUGC",
1668
- "CC AUU",
1669
- "AC CAU",
1670
- "AA GUCU",
1671
- "AUCCGGAUUU AUU",
1672
- "CGAU GGCGAAGGC",
1673
- "AC ACU",
1674
- "GG GAGG",
1675
- "GUGAGUAA CGCGU",
1676
- "GAAU CUUUGAACGC",
1677
- "CCUU UU",
1678
- "C AGAU",
1679
- "AGU GAA",
1680
- "GG AGAA",
1681
- "AACU CUGUU",
1682
- "GGCGGACGG GUGAGUAAU",
1683
- "GUAGAGGUGAAAUUCGU AGAUAUU",
1684
- "AC CGG",
1685
- "GAGAC GC",
1686
- "GU AUU",
1687
- "AAGCAU AUCAAU",
1688
- "CCUGC CCUU",
1689
- "AU GCU",
1690
- "AGU AAU",
1691
- "AGG GAC",
1692
- "AUCAGCUUGUUGGU GGGGU",
1693
- "AGU AA",
1694
- "CCAGC CAA",
1695
- "AGAAU AAGCAC",
1696
- "CUCU GGGC",
1697
- "AUC AGGU",
1698
- "CCU AU",
1699
- "GAU AAU",
1700
- "AC CAC",
1701
- "GG AUCC",
1702
- "CGACCUGAGAGG GUGAU",
1703
- "CGC CU",
1704
- "C GA",
1705
- "AC AU",
1706
- "CUU CU",
1707
- "GG AGA",
1708
- "AA GCU",
1709
- "GGAAUUCCUGGU GUAGCGGUGAAAUGCGC",
1710
- "AGC GAAAUGCGAU",
1711
- "GAU GUU",
1712
- "AAACGG G",
1713
- "AA GAC",
1714
- "AGC ACUUU",
1715
- "AAUGGGG GAAACCCU",
1716
- "GU GUU",
1717
- "AAU GGAC",
1718
- "GGGAU AA",
1719
- "GAC GGCCUUCGGGUUGUAA",
1720
- "C AUUU",
1721
- "GGU AUU",
1722
- "C GACU",
1723
- "GACGCU GAGGCGC",
1724
- "AGGC UU",
1725
- "AGCU AAUACCGC",
1726
- "GGU CC",
1727
- "GGGAA CUGC",
1728
- "GUC GUAA",
1729
- "GAA GGGG",
1730
- "GUGU AGC",
1731
- "AU GUU",
1732
- "AAGCAUAUCAAU AAGCGGAGG",
1733
- "AGC GGCGGACGG",
1734
- "UACGU AGGGUGC",
1735
- "GAA CU",
1736
- "CC AGG",
1737
- "AGU GC",
1738
- "CCU AC",
1739
- "GGC GAAAGC",
1740
- "GCU CU",
1741
- "CAC UU",
1742
- "GGU CUU",
1743
- "AUU GC",
1744
- "CAUU GGGCGUAA",
1745
- "CC CUGC",
1746
- "GCU AGC",
1747
- "GUU GCU",
1748
- "AGA GAU",
1749
- "GUC GUC",
1750
- "CGC UU",
1751
- "AAUGGGCGCAAGC CUGAUCCAGC",
1752
- "GAA CC",
1753
- "GUGAAUUGC AGAAUU",
1754
- "GGCGAACGG GUGAGUAACAC",
1755
- "GAAAGCU AGGGGAGC",
1756
- "GAAUCAUC GAAUCUUUGAACGC",
1757
- "ACU GGAA",
1758
- "AA CGG",
1759
- "CUAAUACAUGCAAGUC GAGC",
1760
- "AGCUU GCU",
1761
- "AUUAGAU ACCC",
1762
- "GGAGC AACGCCGCGUGAGU",
1763
- "AAUGGGCGCAAGC CUGAUGCAGC",
1764
- "GUGAAAUCC CC",
1765
- "AA GGU",
1766
- "CGC GC",
1767
- "GGUU UU",
1768
- "GGGUUUAAAGG GUGC",
1769
- "CGGCCAC AUU",
1770
- "GGAA GCCU",
1771
- "GU ACAC",
1772
- "GGUCUUCGG AUCGUAA",
1773
- "AUUGAACGCUGGCGGC AGGCCUAACACAUGCAAGUC",
1774
- "GACGGGUAGCCGGCCU GAGAGG",
1775
- "AUU CU",
1776
- "GAA AGG",
1777
- "CCUU CGG",
1778
- "GG AGCU",
1779
- "CUU GAGU",
1780
- "CGG AGCU",
1781
- "GAC UUU",
1782
- "GUGCCAGC CGC",
1783
- "GC AGU",
1784
- "AGUU GGU",
1785
- "AAGCAUAUCAAUAAGCGGAGG A",
1786
- "GAAAGC CAGG",
1787
- "GGUAA GGUAAC",
1788
- "GG GUUGUAA",
1789
- "ACCC GCUGAACUU",
1790
- "ACAUU GCGC",
1791
- "GGGG AGU",
1792
- "AUC AGC",
1793
- "ACUU CUUUU",
1794
- "AGCU CU",
1795
- "U ACGG",
1796
- "GUAGCGGUGAAAUGC UU",
1797
- "AA GGC",
1798
- "CCU CU",
1799
- "AUCAA ACAGG",
1800
- "AGCUGGUCUGAGAGGAUGAU CAGCCACACU",
1801
- "AU GGGG",
1802
- "GA GAGC",
1803
- "GGUGAAAUGC GUAGAU",
1804
- "GA GGGC",
1805
- "GGC AGC",
1806
- "GU GAGG",
1807
- "AUCGG GAGGAA",
1808
- "AGA GCUCGUAGGC",
1809
- "GGGG AAUUUU",
1810
- "CAU CU",
1811
- "GAU CCAGC",
1812
- "GAA CGGC",
1813
- "GGAAUU CCUAGU",
1814
- "C GUC",
1815
- "GGCC CU",
1816
- "GAU GAU",
1817
- "AUAA GACU",
1818
- "GGCU CACU",
1819
- "GGGG GAC",
1820
- "AAU CUGC",
1821
- "GAA CAC",
1822
- "AACU GC",
1823
- "AAUAC CC",
1824
- "GGACU CGC",
1825
- "CAUGCCGCGUGU GUGAAGAA",
1826
- "GUU AC",
1827
- "AAUU C",
1828
- "GGC AC",
1829
- "ACCAAGGC GACGAU",
1830
- "CUCAA CCU",
1831
- "CGGCUAACUCCGUGCCAGCAGCCGCGGUAAUACGG AGG",
1832
- "AGA GAA",
1833
- "CAA AA",
1834
- "AAGCGUU AUCC",
1835
- "GAACGG AAAGG",
1836
- "GGUU UUCGG"
1837
- ]
1838
- }
1839
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
tokenizer_bpe_1024/tokenizer_config.json DELETED
@@ -1,19 +0,0 @@
1
- {
2
- "add_prefix_space": false,
3
- "added_tokens_decoder": {
4
- "0": {
5
- "content": "<|endoftext|>",
6
- "lstrip": false,
7
- "normalized": true,
8
- "rstrip": false,
9
- "single_word": false,
10
- "special": true
11
- }
12
- },
13
- "bos_token": "<|endoftext|>",
14
- "clean_up_tokenization_spaces": true,
15
- "eos_token": "<|endoftext|>",
16
- "model_max_length": 1024,
17
- "tokenizer_class": "GPT2Tokenizer",
18
- "unk_token": "<|endoftext|>"
19
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
tokenizer_bpe_1024/vocab.json DELETED
@@ -1 +0,0 @@
1
- {"<|endoftext|>":0,"!":1,"\"":2,"#":3,"$":4,"%":5,"&":6,"'":7,"(":8,")":9,"*":10,"+":11,",":12,"-":13,".":14,"/":15,"0":16,"1":17,"2":18,"3":19,"4":20,"5":21,"6":22,"7":23,"8":24,"9":25,":":26,";":27,"<":28,"=":29,">":30,"?":31,"@":32,"A":33,"B":34,"C":35,"D":36,"E":37,"F":38,"G":39,"H":40,"I":41,"J":42,"K":43,"L":44,"M":45,"N":46,"O":47,"P":48,"Q":49,"R":50,"S":51,"T":52,"U":53,"V":54,"W":55,"X":56,"Y":57,"Z":58,"[":59,"\\":60,"]":61,"^":62,"_":63,"`":64,"a":65,"b":66,"c":67,"d":68,"e":69,"f":70,"g":71,"h":72,"i":73,"j":74,"k":75,"l":76,"m":77,"n":78,"o":79,"p":80,"q":81,"r":82,"s":83,"t":84,"u":85,"v":86,"w":87,"x":88,"y":89,"z":90,"{":91,"|":92,"}":93,"~":94,"¡":95,"¢":96,"£":97,"¤":98,"¥":99,"¦":100,"§":101,"¨":102,"©":103,"ª":104,"«":105,"¬":106,"®":107,"¯":108,"°":109,"±":110,"²":111,"³":112,"´":113,"µ":114,"¶":115,"·":116,"¸":117,"¹":118,"º":119,"»":120,"¼":121,"½":122,"¾":123,"¿":124,"À":125,"Á":126,"Â":127,"Ã":128,"Ä":129,"Å":130,"Æ":131,"Ç":132,"È":133,"É":134,"Ê":135,"Ë":136,"Ì":137,"Í":138,"Î":139,"Ï":140,"Ð":141,"Ñ":142,"Ò":143,"Ó":144,"Ô":145,"Õ":146,"Ö":147,"×":148,"Ø":149,"Ù":150,"Ú":151,"Û":152,"Ü":153,"Ý":154,"Þ":155,"ß":156,"à":157,"á":158,"â":159,"ã":160,"ä":161,"å":162,"æ":163,"ç":164,"è":165,"é":166,"ê":167,"ë":168,"ì":169,"í":170,"î":171,"ï":172,"ð":173,"ñ":174,"ò":175,"ó":176,"ô":177,"õ":178,"ö":179,"÷":180,"ø":181,"ù":182,"ú":183,"û":184,"ü":185,"ý":186,"þ":187,"ÿ":188,"Ā":189,"ā":190,"Ă":191,"ă":192,"Ą":193,"ą":194,"Ć":195,"ć":196,"Ĉ":197,"ĉ":198,"Ċ":199,"ċ":200,"Č":201,"č":202,"Ď":203,"ď":204,"Đ":205,"đ":206,"Ē":207,"ē":208,"Ĕ":209,"ĕ":210,"Ė":211,"ė":212,"Ę":213,"ę":214,"Ě":215,"ě":216,"Ĝ":217,"ĝ":218,"Ğ":219,"ğ":220,"Ġ":221,"ġ":222,"Ģ":223,"ģ":224,"Ĥ":225,"ĥ":226,"Ħ":227,"ħ":228,"Ĩ":229,"ĩ":230,"Ī":231,"ī":232,"Ĭ":233,"ĭ":234,"Į":235,"į":236,"İ":237,"ı":238,"IJ":239,"ij":240,"Ĵ":241,"ĵ":242,"Ķ":243,"ķ":244,"ĸ":245,"Ĺ":246,"ĺ":247,"Ļ":248,"ļ":249,"Ľ":250,"ľ":251,"Ŀ":252,"ŀ":253,"Ł":254,"ł":255,"Ń":256,"GG":257,"AA":258,"GC":259,"UU":260
,"AC":261,"GU":262,"AU":263,"CC":264,"GAA":265,"CU":266,"GA":267,"AGC":268,"GGU":269,"GGC":270,"GAC":271,"GUU":272,"GAU":273,"AGG":274,"AAU":275,"AUU":276,"CGG":277,"CGC":278,"AGU":279,"ACU":280,"CUU":281,"CCU":282,"GCU":283,"CAA":284,"CAC":285,"GGGG":286,"GUAA":287,"GGAA":288,"AGA":289,"UUU":290,"GGGC":291,"AUGC":292,"GUGC":293,"ACGG":294,"GUC":295,"AGCU":296,"GACU":297,"GAGG":298,"AGAU":299,"AGAA":300,"AUC":301,"GAGC":302,"AACU":303,"AAGC":304,"GAGU":305,"AGUU":306,"GAAU":307,"AGGC":308,"CGU":309,"GAAAGC":310,"GGCU":311,"AGGU":312,"GGCC":313,"AAUAC":314,"CAGC":315,"AUUU":316,"CAU":317,"AAUU":318,"GGGU":319,"GAUU":320,"GGUU":321,"CUGC":322,"GAGGC":323,"GGAC":324,"GUGU":325,"AUCC":326,"CGCU":327,"AAAC":328,"GGUGAA":329,"CCC":330,"GGAU":331,"GUUU":332,"GUGAA":333,"GAAGGC":334,"GCGC":335,"GUCC":336,"CGGCU":337,"GCAC":338,"CUUU":339,"AACAC":340,"AAC":341,"CAGU":342,"AAGUC":343,"GUAGC":344,"CCUU":345,"CGGU":346,"AAAA":347,"GAGAC":348,"GGAAUU":349,"GUCU":350,"CCGC":351,"GAAGAA":352,"AGCAGU":353,"AGAC":354,"ACCU":355,"GACGCU":356,"AGACU":357,"ACGU":358,"GGGCGUAA":359,"UUUU":360,"CCCU":361,"CAGG":362,"AUCU":363,"GUGGGG":364,"CCAC":365,"GGUAA":366,"GGCGAAGGC":367,"GGAGG":368,"GGCUU":369,"CCUACGG":370,"GAGAGG":371,"CGCGU":372,"GGUGAAAUGC":373,"GGAGC":374,"GGGAA":375,"GGCGGC":376,"GAACGCU":377,"ACUU":378,"GUGA":379,"AAUAUU":380,"CGAU":381,"GACGGU":382,"CCCC":383,"GAGGCAGCAGU":384,"AUGCAAGUC":385,"AUAA":386,"GCUU":387,"GUGCCAGC":388,"CGGC":389,"AAUGGGC":390,"CGCGGU":391,"GCCU":392,"CAUU":393,"ACCC":394,"CUCU":395,"CGGCUAACU":396,"GUGGGGAGC":397,"GGGAU":398,"GAACGCUGGCGGC":399,"CCUACGGGAGGCAGCAGU":400,"ACAC":401,"CACU":402,"GAGGU":403,"GUUGUAA":404,"GAUGC":405,"GUAGCGGUGAAAUGC":406,"CGAA":407,"GGAAU":408,"AAGU":409,"AUAC":410,"CCAGC":411,"GGUCU":412,"GUGCCAGCAGC":413,"AUGU":414,"GAAAGCGUGGGGAGC":415,"UUCGG":416,"CAAGGC":417,"AAGCGUU":418,"AGCUU":419,"GAACGG":420,"AAACAGG":421,"CUUCGG":422,"CAAU":423,"AACGC":424,"AACC":425,"CGAC":426,"ACGGU":427,"GAGGAA":428,"GUGAGUAA":429,"GGCG
G":430,"GUGCCAGCAGCCGCGGU":431,"GGCCU":432,"ACUGC":433,"GUAGGC":434,"GGGCU":435,"CUUUU":436,"CCGU":437,"AAAGG":438,"AACACAUGCAAGUC":439,"GUAGAU":440,"AUAU":441,"AGACUCCUACGGGAGGCAGCAGU":442,"GGGACU":443,"GGGUU":444,"GUAGA":445,"GAAGC":446,"GGGGAAUAUU":447,"CAUGC":448,"UUGC":449,"GGUUU":450,"GGAUU":451,"GGGGU":452,"ACUGGGCGUAA":453,"CCUGC":454,"AGAAU":455,"AGCUAGUU":456,"CUGAC":457,"GGAUUU":458,"CGGAAUU":459,"CGUU":460,"GAGAA":461,"CUGU":462,"GAGCGUU":463,"AUUAGAU":464,"GAAAGCGUGGGGAGCAAACAGG":465,"CCUGGU":466,"ACUGACGCU":467,"AGAGU":468,"CUCC":469,"AUGAU":470,"GACGAU":471,"ACC":472,"GGCCUUCGG":473,"AAAU":474,"GCAU":475,"AACUU":476,"GAAAC":477,"GAACGCUGGCGGCGUGC":478,"AGGGUGC":479,"CUGAU":480,"AAUACCGC":481,"CACACU":482,"AGGAA":483,"ACUUU":484,"CGGAU":485,"GGAACU":486,"GACGC":487,"ACGGCCC":488,"AUUUU":489,"CUCAA":490,"GGCGGACGG":491,"AGGAGG":492,"CUGUU":493,"GGACU":494,"GAGAU":495,"AACCU":496,"GGAGU":497,"GGGGGAU":498,"GGCCUUCGGGUUGUAA":499,"GAGUU":500,"GCAA":501,"AUCGG":502,"AGUUU":503,"CAGUGGCGAAGGC":504,"GUAGU":505,"GACCU":506,"GUAGG":507,"ACCAAGGC":508,"AAGUU":509,"GUCGG":510,"GAUGCAGC":511,"GUGAGU":512,"CAUC":513,"GAUGAA":514,"AGGCCU":515,"GCAAGC":516,"CGAGU":517,"GUGAGUAACAC":518,"GGUCUGAGAGG":519,"CGGAAUUACUGGGCGUAA":520,"CAAGC":521,"CGGCUAACUCC":522,"GGCGC":523,"AAUGGGCGAAAGC":524,"AUGAC":525,"UACGU":526,"CCCGG":527,"AAACU":528,"GAAAUGC":529,"AUGAA":530,"CGCGUGAGU":531,"GGGACUGAGAC":532,"CUAAUAC":533,"GAGCU":534,"AUCAA":535,"UAC":536,"CUC":537,"AUUAGAUAC":538,"ACGGUCC":539,"AAUGC":540,"ACGUG":541,"GGGUAGC":542,"AGAGC":543,"ACGC":544,"CGGCCAC":545,"GGCUAACU":546,"AUUGGGCGUAA":547,"AGAUU":548,"ACCGC":549,"GGGAC":550,"GAAACU":551,"CGGUGGCGAAGGC":552,"AGGUU":553,"CGAGC":554,"GUGCCAGCAGCCGCGGUAAUAC":555,"GUGAU":556,"GUAGGU":557,"AUAUU":558,"AUUAGCUAGUU":559,"AAAGC":560,"GGCGAACGG":561,"GUUUU":562,"AGAAUU":563,"AAGAA":564,"GUAC":565,"CCUUU":566,"GAACAGG":567,"AGCUGGUCUGAGAGG":568,"GGAACUGAGAC":569,"UUAACACAUGCAAGUC":570,"GGGUUU":571,"AAUGGGCGCAAGC":572,"GUAGCGGUGAA
AUGCGUAGAU":573,"GAUACU":574,"AGGCU":575,"CCAU":576,"GGUGC":577,"ACGGCCCAGACUCCUACGGGAGGCAGCAGU":578,"CCCAC":579,"AGUC":580,"AGGAGGAACAC":581,"ACCAA":582,"GAACGC":583,"GUCAA":584,"CAGCCACACU":585,"GUAACU":586,"GAGGCGC":587,"CGGCCU":588,"AAGCAC":589,"GGGGC":590,"CCCGGU":591,"GGGGAAUAUUGCAC":592,"CGCGUGU":593,"CUGAA":594,"GGAACUGAGACACGGUCC":595,"AAUGGGG":596,"GUUGGU":597,"GCCC":598,"GGUGAAAUU":599,"AAUACGG":600,"GAUUU":601,"AGAAGAA":602,"GGGCUU":603,"AUCCU":604,"GAAAGU":605,"ACCUU":606,"GUGAAAGC":607,"GCAGGC":608,"GUAU":609,"GUCAC":610,"GUGGU":611,"GACGAACGCUGGCGGCGUGC":612,"GUGAC":613,"AUCAC":614,"GGCUCAA":615,"CGGAAUUACUGGGCGUAAAGC":616,"GCUCAA":617,"GGGA":618,"GUGAAAUCC":619,"ACAUU":620,"AUCUU":621,"AGGGAAU":622,"AAAUU":623,"CAGAA":624,"CUGAUCCAGC":625,"AGAUAUC":626,"GUUGC":627,"AUCGUAA":628,"GGGGUAA":629,"GGAAUUCCUGGU":630,"GGAAAC":631,"GUAGAGAU":632,"AAAAU":633,"CCCUU":634,"GACACU":635,"GACGGUACCU":636,"CGUAA":637,"GUGGC":638,"GCUGAA":639,"GGGUAA":640,"CGAAU":641,"GUUGUU":642,"GCUGC":643,"GGGAAU":644,"CUGAGAGG":645,"AGAGGU":646,"GAGA":647,"CGGCUAACUCCGUGCCAGCAGCCGCGGU":648,"AUCCGGAUUU":649,"GCGCGUAGGC":650,"CCAA":651,"ACAA":652,"AAUUUU":653,"CCCAA":654,"GAGGCAC":655,"GUGAGUAACACGU":656,"AAGCGUUGUCC":657,"GAAC":658,"CACCAGUGGCGAAGGC":659,"AGAGG":660,"GUGCU":661,"CGGAAU":662,"ACAGG":663,"GGUCUUCGG":664,"CACCU":665,"AUAGAU":666,"CAGUU":667,"GAGGAGC":668,"CGGAA":669,"GAUUGC":670,"AGGCCUAACACAUGCAAGUC":671,"CCGGU":672,"CCCGC":673,"GCUCGU":674,"CACGGCUAACU":675,"AUGGU":676,"AUUGAACGCUGGCGGC":677,"GGGGAAUAUUGGAC":678,"UUCU":679,"UUGCU":680,"ACUCU":681,"AUAGC":682,"GAGGAAUAUU":683,"AAGCAU":684,"GGAUC":685,"AGGGAAGAA":686,"AGAAGAAGCAC":687,"GCUAAUACCGC":688,"ACGGGC":689,"GGGACUGAGACACGGCCCAGACUCCUACGGGAGGCAGCAGU":690,"CA":691,"CGCAA":692,"GUAGCGGUGAAAUGCGC":693,"ACGAU":694,"GGGAUU":695,"AGCUUGUUGGU":696,"AAUCU":697,"CGCGUGC":698,"CAUGCCGCGUGU":699,"GUCUU":700,"GGUGAAAUUCGU":701,"GUGAGUAAU":702,"GAGGUAA":703,"GGAACUGAGACACGGUCCAGACUCCUACGGGAGGCAGCAGU":704,"CUGAUGCAGC":705
,"AAUAA":706,"CCCCU":707,"GAAAGCU":708,"AACGCCGCGUGAGU":709,"GGAGGAACAC":710,"AGGGAU":711,"AGAUAUU":712,"CCGGGG":713,"AGCAC":714,"CGGCUAACUAC":715,"GGCUUACCAAGGC":716,"CAAGGCGACGAU":717,"GGGUUUAAAGG":718,"CUGGU":719,"CAGA":720,"GUCGC":721,"CGGCUAACUACGUG":722,"GAAUAA":723,"GUAGAGGUGAAAUUCGU":724,"GCCUU":725,"GACUU":726,"CCUAGU":727,"AAACGG":728,"GAGUGC":729,"GUUCU":730,"CGGCUAACUCCGUGCCAGCAGCCGCGGUAAUACGG":731,"GGUGGGG":732,"CCCAGU":733,"CGGCCACACU":734,"AGGGAA":735,"AGGGGAGC":736,"AACUGACGCU":737,"GGGUAGCCGGCCU":738,"CUUUGAACGC":739,"GGGGAU":740,"AUCAAU":741,"GUGAAUUGC":742,"AACGU":743,"AGGGAAUCUU":744,"UACGUAGG":745,"AGAUAUCAGGAGGAACAC":746,"GAGGAAUAUUGGU":747,"AGUCC":748,"CUAU":749,"AGCAU":750,"GGGCUCAA":751,"AGGGC":752,"GGAAACU":753,"AACAA":754,"CAGGU":755,"ACGUU":756,"AAUUU":757,"AGAUUU":758,"AAUGGGCGAAAGCCUGAC":759,"AUCGC":760,"GAAAGCGU":761,"ACAAU":762,"AGGGG":763,"GAGUAA":764,"GAGGUGC":765,"AAUCGGAAUUACUGGGCGUAAAGC":766,"CGGUU":767,"GAGCGUUGUCC":768,"GAUGAAGAA":769,"GCAGC":770,"GAGAGU":771,"GACGAACGCUGGCGGCGUGCUUAACACAUGCAAGUC":772,"GUCCU":773,"GAAAUGCGAU":774,"AGCUAGUUGGU":775,"GACGUU":776,"GAAUU":777,"GACUGC":778,"GCUGCAU":779,"AGAGGAA":780,"AUACU":781,"AUCAGCUUGUUGGU":782,"GAUCU":783,"CGGAUU":784,"AAUCUU":785,"GGAAUUCC":786,"CUAAUACAUGCAAGUC":787,"GUUAA":788,"CAGCU":789,"CGACCUGAGAGG":790,"GCUGAACUU":791,"GAAGAAGGCCUUCGGGUUGUAA":792,"GAUUGCGAAGGC":793,"CCCGU":794,"GGGAGC":795,"GUAAU":796,"GACGGUAC":797,"GACGGGUAGCCGGCCU":798,"AGCGC":799,"GCUCGUAGGC":800,"GGCCUU":801,"CCGAA":802,"GUGAAGAA":803,"GGAAUUCCCGGU":804,"CCAGU":805,"AUUGUAA":806,"CGGCUAACUU":807,"CAAUU":808,"GGAAUUAUUGGGCGUAA":809,"GAAAGCGUGGGGAGCGAACAGG":810,"CCGG":811,"CCCAU":812,"CGAGG":813,"AGGAC":814,"AAAGU":815,"CCGAU":816,"CACCAA":817,"AGCCACGGCUAACU":818,"UUUCU":819,"GGCGGU":820,"GGAAUGC":821,"GAAACCCU":822,"AAGUCC":823,"CGUGC":824,"GAAAGCGUGGGGAGCAAACAGGAUUAGAUAC":825,"AGCUGGUCUGAGAGGAUGAU":826,"AGAGGGG":827,"AUGGUU":828,"CGAUU":829,"AUUAGCUAGUUGGU":830,"AUGCCU":831,"AGAGUGC":832,"GAAAA":
833,"GAUGAACGCUGGCGGCGUGC":834,"GGUAAC":835,"ACGAC":836,"GUCAUU":837,"AAUACCGGAU":838,"GUGUAGGC":839,"GAGGGG":840,"AUAAU":841,"CGCGUGAGG":842,"AGCUCGU":843,"AG":844,"CACUGGGCGUAA":845,"ACUGGGU":846,"GAAUCAUC":847,"CUUGC":848,"CAACU":849,"CAGGC":850,"AAGCGGAGG":851,"AGGGCGCGUAGGC":852,"AAGCGUUGUU":853,"GGAACUGC":854,"CCAUU":855,"ACCAU":856,"AAGUCU":857,"AUCCGGAUUUAUU":858,"CGAUGGCGAAGGC":859,"ACACU":860,"GGGAGG":861,"GUGAGUAACGCGU":862,"GAAUCUUUGAACGC":863,"CCUUUU":864,"CAGAU":865,"AGUGAA":866,"GGAGAA":867,"AACUCUGUU":868,"GGCGGACGGGUGAGUAAU":869,"GUAGAGGUGAAAUUCGUAGAUAUU":870,"ACCGG":871,"GAGACGC":872,"GUAUU":873,"AAGCAUAUCAAU":874,"CCUGCCCUU":875,"AUGCU":876,"AGUAAU":877,"AGGGAC":878,"AUCAGCUUGUUGGUGGGGU":879,"AGUAA":880,"CCAGCCAA":881,"AGAAUAAGCAC":882,"CUCUGGGC":883,"AUCAGGU":884,"CCUAU":885,"GAUAAU":886,"ACCAC":887,"GGAUCC":888,"CGACCUGAGAGGGUGAU":889,"CGCCU":890,"CGA":891,"ACAU":892,"CUUCU":893,"GGAGA":894,"AAGCU":895,"GGAAUUCCUGGUGUAGCGGUGAAAUGCGC":896,"AGCGAAAUGCGAU":897,"GAUGUU":898,"AAACGGG":899,"AAGAC":900,"AGCACUUU":901,"AAUGGGGGAAACCCU":902,"GUGUU":903,"AAUGGAC":904,"GGGAUAA":905,"GACGGCCUUCGGGUUGUAA":906,"CAUUU":907,"GGUAUU":908,"CGACU":909,"GACGCUGAGGCGC":910,"AGGCUU":911,"AGCUAAUACCGC":912,"GGUCC":913,"GGGAACUGC":914,"GUCGUAA":915,"GAAGGGG":916,"GUGUAGC":917,"AUGUU":918,"AAGCAUAUCAAUAAGCGGAGG":919,"AGCGGCGGACGG":920,"UACGUAGGGUGC":921,"GAACU":922,"CCAGG":923,"AGUGC":924,"CCUAC":925,"GGCGAAAGC":926,"GCUCU":927,"CACUU":928,"GGUCUU":929,"AUUGC":930,"CAUUGGGCGUAA":931,"CCCUGC":932,"GCUAGC":933,"GUUGCU":934,"AGAGAU":935,"GUCGUC":936,"CGCUU":937,"AAUGGGCGCAAGCCUGAUCCAGC":938,"GAACC":939,"GUGAAUUGCAGAAUU":940,"GGCGAACGGGUGAGUAACAC":941,"GAAAGCUAGGGGAGC":942,"GAAUCAUCGAAUCUUUGAACGC":943,"ACUGGAA":944,"AACGG":945,"CUAAUACAUGCAAGUCGAGC":946,"AGCUUGCU":947,"AUUAGAUACCC":948,"GGAGCAACGCCGCGUGAGU":949,"AAUGGGCGCAAGCCUGAUGCAGC":950,"GUGAAAUCCCC":951,"AAGGU":952,"CGCGC":953,"GGUUUU":954,"GGGUUUAAAGGGUGC":955,"CGGCCACAUU":956,"GGAAGCCU":957,"GUACAC":958,"GGUCUUCGGAUC
GUAA":959,"AUUGAACGCUGGCGGCAGGCCUAACACAUGCAAGUC":960,"GACGGGUAGCCGGCCUGAGAGG":961,"AUUCU":962,"GAAAGG":963,"CCUUCGG":964,"GGAGCU":965,"CUUGAGU":966,"CGGAGCU":967,"GACUUU":968,"GUGCCAGCCGC":969,"GCAGU":970,"AGUUGGU":971,"AAGCAUAUCAAUAAGCGGAGGA":972,"GAAAGCCAGG":973,"GGUAAGGUAAC":974,"GGGUUGUAA":975,"ACCCGCUGAACUU":976,"ACAUUGCGC":977,"GGGGAGU":978,"AUCAGC":979,"ACUUCUUUU":980,"AGCUCU":981,"UACGG":982,"GUAGCGGUGAAAUGCUU":983,"AAGGC":984,"CCUCU":985,"AUCAAACAGG":986,"AGCUGGUCUGAGAGGAUGAUCAGCCACACU":987,"AUGGGG":988,"GAGAGC":989,"GGUGAAAUGCGUAGAU":990,"GAGGGC":991,"GGCAGC":992,"GUGAGG":993,"AUCGGGAGGAA":994,"AGAGCUCGUAGGC":995,"GGGGAAUUUU":996,"CAUCU":997,"GAUCCAGC":998,"GAACGGC":999,"GGAAUUCCUAGU":1000,"CGUC":1001,"GGCCCU":1002,"GAUGAU":1003,"AUAAGACU":1004,"GGCUCACU":1005,"GGGGGAC":1006,"AAUCUGC":1007,"GAACAC":1008,"AACUGC":1009,"AAUACCC":1010,"GGACUCGC":1011,"CAUGCCGCGUGUGUGAAGAA":1012,"GUUAC":1013,"AAUUC":1014,"GGCAC":1015,"ACCAAGGCGACGAU":1016,"CUCAACCU":1017,"CGGCUAACUCCGUGCCAGCAGCCGCGGUAAUACGGAGG":1018,"AGAGAA":1019,"CAAAA":1020,"AAGCGUUAUCC":1021,"GAACGGAAAGG":1022,"GGUUUUCGG":1023}