nguyenvulebinh commited on
Commit
70db2e9
1 Parent(s): 457abe7

Upload tokenizer

Browse files
sentencepiece.bpe.model ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:770b004b92422d30e82ab9200908eb1d763c3da1eff427b2e3959a1374fe49aa
3
+ size 253482
special_tokens_map.json ADDED
@@ -0,0 +1,30 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token": {
3
+ "content": "<s>",
4
+ "lstrip": false,
5
+ "normalized": false,
6
+ "rstrip": false,
7
+ "single_word": false
8
+ },
9
+ "eos_token": {
10
+ "content": "</s>",
11
+ "lstrip": false,
12
+ "normalized": false,
13
+ "rstrip": false,
14
+ "single_word": false
15
+ },
16
+ "pad_token": {
17
+ "content": "<pad>",
18
+ "lstrip": false,
19
+ "normalized": false,
20
+ "rstrip": false,
21
+ "single_word": false
22
+ },
23
+ "unk_token": {
24
+ "content": "<unk>",
25
+ "lstrip": false,
26
+ "normalized": false,
27
+ "rstrip": false,
28
+ "single_word": false
29
+ }
30
+ }
tokenizer_config.json ADDED
@@ -0,0 +1,49 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "added_tokens_decoder": {
3
+ "0": {
4
+ "content": "<s>",
5
+ "lstrip": false,
6
+ "normalized": false,
7
+ "rstrip": false,
8
+ "single_word": false,
9
+ "special": true
10
+ },
11
+ "1": {
12
+ "content": "<pad>",
13
+ "lstrip": false,
14
+ "normalized": false,
15
+ "rstrip": false,
16
+ "single_word": false,
17
+ "special": true
18
+ },
19
+ "2": {
20
+ "content": "</s>",
21
+ "lstrip": false,
22
+ "normalized": false,
23
+ "rstrip": false,
24
+ "single_word": false,
25
+ "special": true
26
+ },
27
+ "3": {
28
+ "content": "<unk>",
29
+ "lstrip": false,
30
+ "normalized": false,
31
+ "rstrip": false,
32
+ "single_word": false,
33
+ "special": true
34
+ }
35
+ },
36
+ "additional_special_tokens": [],
37
+ "bos_token": "<s>",
38
+ "clean_up_tokenization_spaces": true,
39
+ "do_lower_case": false,
40
+ "do_upper_case": false,
41
+ "eos_token": "</s>",
42
+ "lang_codes": null,
43
+ "model_max_length": 1000000000000000019884624838656,
44
+ "pad_token": "<pad>",
45
+ "sp_model_kwargs": {},
46
+ "tgt_lang": null,
47
+ "tokenizer_class": "Speech2TextTokenizer",
48
+ "unk_token": "<unk>"
49
+ }
vocab.json ADDED
@@ -0,0 +1,1002 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "<s>": 0,
3
+ "<pad>": 1,
4
+ "</s>": 2,
5
+ "<unk>": 3,
6
+ "s": 4,
7
+ "\u2581the": 5,
8
+ "\u2581to": 6,
9
+ "\u2581and": 7,
10
+ "\u2581a": 8,
11
+ "t": 9,
12
+ "\u2581i": 10,
13
+ "'": 11,
14
+ "\u2581of": 12,
15
+ "\u2581that": 13,
16
+ "\u2581in": 14,
17
+ "ing": 15,
18
+ "\u2581we": 16,
19
+ "\u2581you": 17,
20
+ "\u2581it": 18,
21
+ "d": 19,
22
+ "n": 20,
23
+ "ed": 21,
24
+ "m": 22,
25
+ "\u2581is": 23,
26
+ "y": 24,
27
+ "p": 25,
28
+ "r": 26,
29
+ "e": 27,
30
+ "er": 28,
31
+ "re": 29,
32
+ "\u2581for": 30,
33
+ "c": 31,
34
+ "\u2581so": 32,
35
+ "\u2581this": 33,
36
+ "\u2581was": 34,
37
+ "i": 35,
38
+ "b": 36,
39
+ "\u2581they": 37,
40
+ "u": 38,
41
+ "l": 39,
42
+ "\u2581be": 40,
43
+ "al": 41,
44
+ "\u2581have": 42,
45
+ "\u2581are": 43,
46
+ "ly": 44,
47
+ "\u2581with": 45,
48
+ "\u2581what": 46,
49
+ "\u2581on": 47,
50
+ "a": 48,
51
+ "\u2581my": 49,
52
+ "\u2581but": 50,
53
+ "\u2581": 51,
54
+ "g": 52,
55
+ "\u2581s": 53,
56
+ "o": 54,
57
+ "\u2581do": 55,
58
+ "\u2581me": 56,
59
+ "\u2581re": 57,
60
+ "in": 58,
61
+ "\u2581can": 59,
62
+ "\u2581not": 60,
63
+ "\u2581about": 61,
64
+ "ve": 62,
65
+ "ar": 63,
66
+ "\u2581he": 64,
67
+ "le": 65,
68
+ "\u2581all": 66,
69
+ "or": 67,
70
+ "f": 68,
71
+ "\u2581people": 69,
72
+ "\u2581our": 70,
73
+ "\u2581at": 71,
74
+ "ll": 72,
75
+ "\u2581c": 73,
76
+ "\u2581or": 74,
77
+ "\u2581as": 75,
78
+ "ra": 76,
79
+ "v": 77,
80
+ "\u2581de": 78,
81
+ "\u2581there": 79,
82
+ "\u2581like": 80,
83
+ "\u2581one": 81,
84
+ "it": 82,
85
+ "ic": 83,
86
+ "\u2581an": 84,
87
+ "\u2581when": 85,
88
+ "\u2581if": 86,
89
+ "\u2581p": 87,
90
+ "th": 88,
91
+ "ent": 89,
92
+ "\u2581f": 90,
93
+ "\u2581your": 91,
94
+ "ce": 92,
95
+ "\u2581from": 93,
96
+ "\u2581just": 94,
97
+ "\u2581because": 95,
98
+ "w": 96,
99
+ "\u2581how": 97,
100
+ "es": 98,
101
+ "\u2581us": 99,
102
+ "\u2581know": 100,
103
+ "ch": 101,
104
+ "te": 102,
105
+ "\u2581t": 103,
106
+ "\u2581had": 104,
107
+ "ri": 105,
108
+ "\u2581up": 106,
109
+ "on": 107,
110
+ "\u2581out": 108,
111
+ "\u2581who": 109,
112
+ "\u2581time": 110,
113
+ "\u2581their": 111,
114
+ "k": 112,
115
+ "ur": 113,
116
+ "\u2581more": 114,
117
+ "\u2581e": 115,
118
+ "ion": 116,
119
+ "\u2581go": 117,
120
+ "\u2581no": 118,
121
+ "ation": 119,
122
+ "an": 120,
123
+ "\u2581would": 121,
124
+ "ter": 122,
125
+ "\u2581by": 123,
126
+ "h": 124,
127
+ "en": 125,
128
+ "\u2581see": 126,
129
+ "il": 127,
130
+ "\u2581these": 128,
131
+ "\u2581think": 129,
132
+ "\u2581were": 130,
133
+ "\u2581now": 131,
134
+ "\u2581them": 132,
135
+ "\u2581pa": 133,
136
+ "\u2581get": 134,
137
+ "ity": 135,
138
+ "\u2581going": 136,
139
+ "\u2581ba": 137,
140
+ "ge": 138,
141
+ "ate": 139,
142
+ "\u2581con": 140,
143
+ "\u2581very": 141,
144
+ "\u2581co": 142,
145
+ "ive": 143,
146
+ "\u2581really": 144,
147
+ "\u2581se": 145,
148
+ "\u2581w": 146,
149
+ "\u2581don": 147,
150
+ "\u2581way": 148,
151
+ "nd": 149,
152
+ "\u2581she": 150,
153
+ "\u2581ex": 151,
154
+ "\u2581will": 152,
155
+ "ck": 153,
156
+ "ro": 154,
157
+ "tion": 155,
158
+ "\u2581other": 156,
159
+ "\u2581want": 157,
160
+ "\u2581make": 158,
161
+ "\u2581some": 159,
162
+ "ment": 160,
163
+ "\u2581com": 161,
164
+ "\u2581could": 162,
165
+ "\u2581world": 163,
166
+ "\u2581work": 164,
167
+ "ers": 165,
168
+ "\u2581need": 166,
169
+ "\u2581say": 167,
170
+ "\u2581st": 168,
171
+ "se": 169,
172
+ "la": 170,
173
+ "x": 171,
174
+ "\u2581life": 172,
175
+ "\u2581ma": 173,
176
+ "ist": 174,
177
+ "\u2581has": 175,
178
+ "\u2581which": 176,
179
+ "\u2581into": 177,
180
+ "\u2581where": 178,
181
+ "ir": 179,
182
+ "lo": 180,
183
+ "\u2581those": 181,
184
+ "\u2581b": 182,
185
+ "\u2581things": 183,
186
+ "\u2581po": 184,
187
+ "\u2581been": 185,
188
+ "\u2581even": 186,
189
+ "ol": 187,
190
+ "\u2581something": 188,
191
+ "pe": 189,
192
+ "\u2581g": 190,
193
+ "ne": 191,
194
+ "\u2581said": 192,
195
+ "\u2581ra": 193,
196
+ "\u2581her": 194,
197
+ "\u2581years": 195,
198
+ "\u2581take": 196,
199
+ "\u2581day": 197,
200
+ "\u2581mo": 198,
201
+ "\u2581right": 199,
202
+ "\u2581new": 200,
203
+ "\u2581un": 201,
204
+ "\u2581actually": 202,
205
+ "as": 203,
206
+ "ad": 204,
207
+ "id": 205,
208
+ "\u2581look": 206,
209
+ "z": 207,
210
+ "\u2581over": 208,
211
+ "\u2581well": 209,
212
+ "0": 210,
213
+ "\u2581pro": 211,
214
+ "\u2581su": 212,
215
+ "\u2581back": 213,
216
+ "\u2581then": 214,
217
+ "\u2581mi": 215,
218
+ "ci": 216,
219
+ "co": 217,
220
+ "\u2581di": 218,
221
+ "\u2581here": 219,
222
+ "\u2581lo": 220,
223
+ "\u2581than": 221,
224
+ "\u2581o": 222,
225
+ "\u2581first": 223,
226
+ "om": 224,
227
+ "\u2581bo": 225,
228
+ "\u2581ho": 226,
229
+ "ow": 227,
230
+ "ma": 228,
231
+ "me": 229,
232
+ "\u2581most": 230,
233
+ "\u2581also": 231,
234
+ "ide": 232,
235
+ "ies": 233,
236
+ "\u2581fa": 234,
237
+ "ance": 235,
238
+ "\u2581his": 236,
239
+ "\u2581change": 237,
240
+ "tic": 238,
241
+ "vi": 239,
242
+ "at": 240,
243
+ "\u2581mean": 241,
244
+ "\u2581come": 242,
245
+ "\u2581much": 243,
246
+ "\u2581any": 244,
247
+ "able": 245,
248
+ "\u2581la": 246,
249
+ "\u2581only": 247,
250
+ "\u2581many": 248,
251
+ "\u2581dis": 249,
252
+ "us": 250,
253
+ "ut": 251,
254
+ "\u2581ch": 252,
255
+ "ant": 253,
256
+ "age": 254,
257
+ "\u2581why": 255,
258
+ "\u2581every": 256,
259
+ "ng": 257,
260
+ "\u2581happen": 258,
261
+ "ize": 259,
262
+ "\u2581good": 260,
263
+ "\u2581ro": 261,
264
+ "\u2581sp": 262,
265
+ "\u2581thing": 263,
266
+ "\u2581live": 264,
267
+ "\u2581two": 265,
268
+ "ti": 266,
269
+ "\u2581real": 267,
270
+ "ight": 268,
271
+ "\u2581being": 269,
272
+ "\u2581tell": 270,
273
+ "\u2581part": 271,
274
+ "\u2581pre": 272,
275
+ "ful": 273,
276
+ "\u2581lot": 274,
277
+ "ac": 275,
278
+ "\u2581feel": 276,
279
+ "\u2581got": 277,
280
+ "\u2581learn": 278,
281
+ "\u2581did": 279,
282
+ "de": 280,
283
+ "um": 281,
284
+ "\u2581ca": 282,
285
+ "\u2581let": 283,
286
+ "mo": 284,
287
+ "\u2581bu": 285,
288
+ "les": 286,
289
+ "\u2581sh": 287,
290
+ "\u2581ha": 288,
291
+ "ok": 289,
292
+ "ally": 290,
293
+ "\u2581dr": 291,
294
+ "\u2581k": 292,
295
+ "el": 293,
296
+ "est": 294,
297
+ "\u2581te": 295,
298
+ "ure": 296,
299
+ "\u25811": 297,
300
+ "\u2581through": 298,
301
+ "ke": 299,
302
+ "\u2581little": 300,
303
+ "\u2581different": 301,
304
+ "ry": 302,
305
+ "is": 303,
306
+ "\u2581gr": 304,
307
+ "\u2581li": 305,
308
+ "\u2581help": 306,
309
+ "\u2581kind": 307,
310
+ "\u2581give": 308,
311
+ "po": 309,
312
+ "\u2581vi": 310,
313
+ "ul": 311,
314
+ "\u2581talk": 312,
315
+ "\u2581fe": 313,
316
+ "ical": 314,
317
+ "\u2581around": 315,
318
+ "\u2581same": 316,
319
+ "\u2581human": 317,
320
+ "un": 318,
321
+ "\u2581own": 319,
322
+ "ted": 320,
323
+ "lu": 321,
324
+ "\u2581person": 322,
325
+ "\u2581ph": 323,
326
+ "ru": 324,
327
+ "ig": 325,
328
+ "\u2581idea": 326,
329
+ "one": 327,
330
+ "\u2581d": 328,
331
+ "\u2581use": 329,
332
+ "ated": 330,
333
+ "\u2581didn": 331,
334
+ "\u2581br": 332,
335
+ "\u2581school": 333,
336
+ "\u2581find": 334,
337
+ "\u2581problem": 335,
338
+ "\u2581start": 336,
339
+ "\u2581love": 337,
340
+ "\u2581today": 338,
341
+ "\u2581year": 339,
342
+ "ard": 340,
343
+ "\u2581down": 341,
344
+ "\u2581after": 342,
345
+ "ia": 343,
346
+ "5": 344,
347
+ "ap": 345,
348
+ "ous": 346,
349
+ "ine": 347,
350
+ "\u2581question": 348,
351
+ "\u2581fi": 349,
352
+ "\u2581man": 350,
353
+ "\u2581sa": 351,
354
+ "\u2581ne": 352,
355
+ "\u2581great": 353,
356
+ "\u2581ru": 354,
357
+ "\u2581never": 355,
358
+ "\u2581le": 356,
359
+ "ish": 357,
360
+ "\u2581ga": 358,
361
+ "he": 359,
362
+ "\u2581should": 360,
363
+ "\u2581car": 361,
364
+ "\u2581doing": 362,
365
+ "\u2581put": 363,
366
+ "\u2581thought": 364,
367
+ "\u2581long": 365,
368
+ "\u2581fact": 366,
369
+ "ca": 367,
370
+ "tor": 368,
371
+ "ence": 369,
372
+ "\u2581show": 370,
373
+ "\u2581sta": 371,
374
+ "rr": 372,
375
+ "\u2581place": 373,
376
+ "ian": 374,
377
+ "\u2581big": 375,
378
+ "\u2581en": 376,
379
+ "\u2581act": 377,
380
+ "\u2581understand": 378,
381
+ "\u2581him": 379,
382
+ "ness": 380,
383
+ "\u2581cr": 381,
384
+ "\u2581important": 382,
385
+ "am": 383,
386
+ "\u2581might": 384,
387
+ "\u2581off": 385,
388
+ "ta": 386,
389
+ "\u2581da": 387,
390
+ "\u2581ta": 388,
391
+ "bo": 389,
392
+ "}": 390,
393
+ "\u2581{": 391,
394
+ "\u2581bi": 392,
395
+ "\u2581hu": 393,
396
+ "\u2581end": 394,
397
+ "\u2581better": 395,
398
+ "ec": 396,
399
+ "\u2581em": 397,
400
+ "\u2581women": 398,
401
+ "di": 399,
402
+ "\u2581before": 400,
403
+ "\u2581started": 401,
404
+ "ld": 402,
405
+ "\u2581story": 403,
406
+ "ating": 404,
407
+ "\u2581brain": 405,
408
+ "\u2581ask": 406,
409
+ "\u2581system": 407,
410
+ "\u2581j": 408,
411
+ "op": 409,
412
+ "\u2581power": 410,
413
+ "\u2581able": 411,
414
+ "ag": 412,
415
+ "\u2581high": 413,
416
+ "pa": 414,
417
+ "\u2581old": 415,
418
+ "ition": 416,
419
+ "ving": 417,
420
+ "\u2581made": 418,
421
+ "\u2581qu": 419,
422
+ "\u2581came": 420,
423
+ "ary": 421,
424
+ "\u2581ri": 422,
425
+ "\u2581home": 423,
426
+ "\u2581wi": 424,
427
+ "\u2581three": 425,
428
+ "ick": 426,
429
+ "for": 427,
430
+ "\u2581app": 428,
431
+ "\u2581friend": 429,
432
+ "\u2581create": 430,
433
+ "\u2581called": 431,
434
+ "\u2581still": 432,
435
+ "\u2581believe": 433,
436
+ "\u2581found": 434,
437
+ "ha": 435,
438
+ "\u2581na": 436,
439
+ "\u2581hi": 437,
440
+ "ative": 438,
441
+ "\u2581care": 439,
442
+ "\u2581play": 440,
443
+ "\u2581health": 441,
444
+ "\u2581experience": 442,
445
+ "lic": 443,
446
+ "\u2581maybe": 444,
447
+ "\u2581turn": 445,
448
+ "\u2581am": 446,
449
+ "\u2581hand": 447,
450
+ "\u2581went": 448,
451
+ "\u2581children": 449,
452
+ "\u2581men": 450,
453
+ "\u2581word": 451,
454
+ "ound": 452,
455
+ "ph": 453,
456
+ "\u2581together": 454,
457
+ "\u2581become": 455,
458
+ "na": 456,
459
+ "\u2581next": 457,
460
+ "\u2581mar": 458,
461
+ "ie": 459,
462
+ "\u2581tri": 460,
463
+ "\u2581each": 461,
464
+ "\u2581thank": 462,
465
+ "\u2581another": 463,
466
+ "\u2581point": 464,
467
+ "ward": 465,
468
+ "\u2581mon": 466,
469
+ "no": 467,
470
+ "\u2581does": 468,
471
+ "\u2581teach": 469,
472
+ "ities": 470,
473
+ "\u2581always": 471,
474
+ "\u2581build": 472,
475
+ "\u2581last": 473,
476
+ "\u2581th": 474,
477
+ "\u2581ever": 475,
478
+ "ious": 476,
479
+ "sh": 477,
480
+ "oo": 478,
481
+ "\u2581mind": 479,
482
+ "\u2581too": 480,
483
+ "\u2581move": 481,
484
+ "\u2581hard": 482,
485
+ "\u2581bit": 483,
486
+ "\u2581state": 484,
487
+ "ff": 485,
488
+ "\u2581call": 486,
489
+ "\u2581read": 487,
490
+ "\u2581interest": 488,
491
+ "\u2581wanted": 489,
492
+ "\u2581few": 490,
493
+ "\u2581example": 491,
494
+ "\u2581op": 492,
495
+ "ise": 493,
496
+ "\u2581job": 494,
497
+ "\u25812": 495,
498
+ "line": 496,
499
+ "\u2581again": 497,
500
+ "\u2581may": 498,
501
+ "\u2581va": 499,
502
+ "lg": 500,
503
+ "\u258120": 501,
504
+ "\u2581grow": 502,
505
+ "8": 503,
506
+ "ee": 504,
507
+ "\u258110": 505,
508
+ "\u2581jo": 506,
509
+ "tri": 507,
510
+ "ain": 508,
511
+ "\u2581everything": 509,
512
+ "lie": 510,
513
+ "\u2581moment": 511,
514
+ "\u2581less": 512,
515
+ "\u2581myself": 513,
516
+ "\u2581food": 514,
517
+ "\u2581social": 515,
518
+ "\u2581away": 516,
519
+ "\u2581doesn": 517,
520
+ "\u2581family": 518,
521
+ "\u2581under": 519,
522
+ "\u2581develop": 520,
523
+ "\u2581kids": 521,
524
+ "\u2581course": 522,
525
+ "\u2581student": 523,
526
+ "\u2581between": 524,
527
+ "\u2581face": 525,
528
+ "\u2581money": 526,
529
+ "port": 527,
530
+ "\u2581second": 528,
531
+ "\u2581art": 529,
532
+ "\u2581share": 530,
533
+ "\u2581gu": 531,
534
+ "\u2581number": 532,
535
+ "1": 533,
536
+ "\u2581trans": 534,
537
+ "7": 535,
538
+ "\u2581per": 536,
539
+ "\u2581someone": 537,
540
+ "\u2581enough": 538,
541
+ "6": 539,
542
+ "\u2581thinking": 540,
543
+ "\u2581ago": 541,
544
+ "\u2581che": 542,
545
+ "\u2581plan": 543,
546
+ "\u2581try": 544,
547
+ "\u2581far": 545,
548
+ "ism": 546,
549
+ "\u2581told": 547,
550
+ "\u2581lead": 548,
551
+ "\u2581pe": 549,
552
+ "\u2581trying": 550,
553
+ "\u2581working": 551,
554
+ "\u2581young": 552,
555
+ "ten": 553,
556
+ "\u2581ve": 554,
557
+ "\u2581reason": 555,
558
+ "\u2581matter": 556,
559
+ "\u2581best": 557,
560
+ "\u2581remember": 558,
561
+ "\u2581research": 559,
562
+ "\u2581used": 560,
563
+ "\u2581gene": 561,
564
+ "\u2581future": 562,
565
+ "\u2581open": 563,
566
+ "\u2581cu": 564,
567
+ "9": 565,
568
+ "\u2581done": 566,
569
+ "\u2581class": 567,
570
+ "\u2581country": 568,
571
+ "cul": 569,
572
+ "\u2581talking": 570,
573
+ "\u2581stop": 571,
574
+ "\u2581without": 572,
575
+ "\u2581group": 573,
576
+ "\u2581connect": 574,
577
+ "\u2581hope": 575,
578
+ "\u2581walk": 576,
579
+ "\u2581mu": 577,
580
+ "\u2581keep": 578,
581
+ "\u2581small": 579,
582
+ "\u2581million": 580,
583
+ "\u2581girl": 581,
584
+ "\u2581week": 582,
585
+ "\u2581language": 583,
586
+ "\u2581space": 584,
587
+ "\u2581technology": 585,
588
+ "ak": 586,
589
+ "\u2581war": 587,
590
+ "\u2581water": 588,
591
+ "\u2581sense": 589,
592
+ "\u2581community": 590,
593
+ "\u2581child": 591,
594
+ "que": 592,
595
+ "\u2581answer": 593,
596
+ "\u2581book": 594,
597
+ "\u2581often": 595,
598
+ "\u2581making": 596,
599
+ "\u2581free": 597,
600
+ "\u2581having": 598,
601
+ "\u2581looking": 599,
602
+ "\u2581while": 600,
603
+ "ible": 601,
604
+ "\u2581body": 602,
605
+ "\u2581speak": 603,
606
+ "\u2581whole": 604,
607
+ "\u2581else": 605,
608
+ "\u2581getting": 606,
609
+ "\u2581process": 607,
610
+ "land": 608,
611
+ "\u2581four": 609,
612
+ "ability": 610,
613
+ "\u2581allow": 611,
614
+ "\u2581bring": 612,
615
+ "\u2581probably": 613,
616
+ "\u2581ju": 614,
617
+ "\u2581anything": 615,
618
+ "over": 616,
619
+ "2": 617,
620
+ "\u2581add": 618,
621
+ "\u2581cha": 619,
622
+ "j": 620,
623
+ "\u2581ni": 621,
624
+ "\u2581imagine": 622,
625
+ "\u2581stand": 623,
626
+ "\u2581ski": 624,
627
+ "\u2581data": 625,
628
+ "\u2581design": 626,
629
+ "\u2581information": 627,
630
+ "\u2581percent": 628,
631
+ "\u2581name": 629,
632
+ "\u2581such": 630,
633
+ "\u2581science": 631,
634
+ "\u2581sure": 632,
635
+ "000": 633,
636
+ "\u2581self": 634,
637
+ "\u2581knew": 635,
638
+ "\u2581asked": 636,
639
+ "\u2581business": 637,
640
+ "\u2581room": 638,
641
+ "\u2581five": 639,
642
+ "\u2581stories": 640,
643
+ "\u2581living": 641,
644
+ "ught": 642,
645
+ "\u2581listen": 643,
646
+ "\u2581cell": 644,
647
+ "\u2581fun": 645,
648
+ "\u2581society": 646,
649
+ "\u2581study": 647,
650
+ "\u2581guy": 648,
651
+ "\u2581felt": 649,
652
+ "\u2581case": 650,
653
+ "\u2581education": 651,
654
+ "\u2581everyone": 652,
655
+ "\u2581mother": 653,
656
+ "\u2581yourself": 654,
657
+ "\u2581dream": 655,
658
+ "\u25814": 656,
659
+ "\u258119": 657,
660
+ "\u2581already": 658,
661
+ "\u2581project": 659,
662
+ "\u2581both": 660,
663
+ "\u2581light": 661,
664
+ "\u2581music": 662,
665
+ "\u2581begin": 663,
666
+ "\u2581yet": 664,
667
+ "\u2581challenge": 665,
668
+ "\u2581treat": 666,
669
+ "\u2581energy": 667,
670
+ "\u2581effect": 668,
671
+ "\u2581term": 669,
672
+ "\u2581wrong": 670,
673
+ "\u2581ten": 671,
674
+ "\u2581head": 672,
675
+ "\u2581whether": 673,
676
+ "\u2581ourselves": 674,
677
+ "q": 675,
678
+ "\u2581sort": 676,
679
+ "\u25813": 677,
680
+ "\u2581product": 678,
681
+ "\u2581pretty": 679,
682
+ "\u2581close": 680,
683
+ "\u2581program": 681,
684
+ "\u2581woman": 682,
685
+ "\u2581quite": 683,
686
+ "\u2581wonder": 684,
687
+ "\u2581large": 685,
688
+ "\u2581instead": 686,
689
+ "\u2581night": 687,
690
+ "\u2581sometimes": 688,
691
+ "\u2581minute": 689,
692
+ "\u2581true": 690,
693
+ "\u2581eye": 691,
694
+ "\u2581parents": 692,
695
+ "\u2581single": 693,
696
+ "\u2581saw": 694,
697
+ "4": 695,
698
+ "\u2581step": 696,
699
+ "\u2581sound": 697,
700
+ "\u2581lu": 698,
701
+ "\u2581nothing": 699,
702
+ "ship": 700,
703
+ "\u2581control": 701,
704
+ "\u2581nu": 702,
705
+ "\u2581left": 703,
706
+ "\u2581later": 704,
707
+ "\u2581government": 705,
708
+ "\u2581public": 706,
709
+ "\u2581watch": 707,
710
+ "\u2581environment": 708,
711
+ "\u2581simple": 709,
712
+ "\u2581support": 710,
713
+ "\u2581order": 711,
714
+ "\u2581issue": 712,
715
+ "\u2581value": 713,
716
+ "\u2581success": 714,
717
+ "\u2581full": 715,
718
+ "\u2581american": 716,
719
+ "\u2581law": 717,
720
+ "\u2581level": 718,
721
+ "\u2581house": 719,
722
+ "\u2581deep": 720,
723
+ "\u2581disease": 721,
724
+ "\u2581yes": 722,
725
+ "\u2581across": 723,
726
+ "\u2581test": 724,
727
+ "\u2581du": 725,
728
+ "\u2581possible": 726,
729
+ "\u2581eat": 727,
730
+ "\u2581almost": 728,
731
+ "\u2581rest": 729,
732
+ "\u2581half": 730,
733
+ "\u2581cancer": 731,
734
+ "\u2581culture": 732,
735
+ "\u2581emotion": 733,
736
+ "\u2581fail": 734,
737
+ "\u2581animal": 735,
738
+ "\u2581vo": 736,
739
+ "\u2581until": 737,
740
+ "\u2581though": 738,
741
+ "\u2581certain": 739,
742
+ "\u2581past": 740,
743
+ "\u2581relationship": 741,
744
+ "\u2581earth": 742,
745
+ "\u2581amazing": 743,
746
+ "\u2581became": 744,
747
+ "\u2581team": 745,
748
+ "\u2581meet": 746,
749
+ "\u2581decision": 747,
750
+ "way": 748,
751
+ "\u2581game": 749,
752
+ "\u2581individual": 750,
753
+ "\u2581train": 751,
754
+ "\u2581focus": 752,
755
+ "\u2581somebody": 753,
756
+ "\u2581difference": 754,
757
+ "\u2581everybody": 755,
758
+ "\u2581since": 756,
759
+ "\u2581choice": 757,
760
+ "\u2581patient": 758,
761
+ "\u2581history": 759,
762
+ "\u2581taking": 760,
763
+ "\u2581result": 761,
764
+ "\u2581conversation": 762,
765
+ "\u2581doctor": 763,
766
+ "\u2581computer": 764,
767
+ "\u2581discover": 765,
768
+ "\u2581countries": 766,
769
+ "\u258130": 767,
770
+ "\u2581global": 768,
771
+ "\u2581impact": 769,
772
+ "\u2581difficult": 770,
773
+ "\u2581particular": 771,
774
+ "\u2581figure": 772,
775
+ "\u2581spend": 773,
776
+ "\u2581break": 774,
777
+ "\u2581stuff": 775,
778
+ "\u2581leave": 776,
779
+ "\u2581planet": 777,
780
+ "\u2581follow": 778,
781
+ "\u2581model": 779,
782
+ "\u2581expect": 780,
783
+ "\u2581sign": 781,
784
+ "\u2581thousand": 782,
785
+ "\u2581direct": 783,
786
+ "\u2581entire": 784,
787
+ "\u2581elect": 785,
788
+ "\u2581themselves": 786,
789
+ "\u2581cause": 787,
790
+ "\u2581africa": 788,
791
+ "\u2581risk": 789,
792
+ "\u2581must": 790,
793
+ "\u2581against": 791,
794
+ "\u2581couple": 792,
795
+ "\u2581hours": 793,
796
+ "\u2581happy": 794,
797
+ "\u258150": 795,
798
+ "\u2581company": 796,
799
+ "\u2581six": 797,
800
+ "\u2581wait": 798,
801
+ "\u2581write": 799,
802
+ "\u2581behavior": 800,
803
+ "\u2581safe": 801,
804
+ "\u2581voice": 802,
805
+ "3": 803,
806
+ "\u2581exactly": 804,
807
+ "\u2581beautiful": 805,
808
+ "\u2581black": 806,
809
+ "\u2581death": 807,
810
+ "\u2581200": 808,
811
+ "\u2581grand": 809,
812
+ "\u2581organ": 810,
813
+ "\u2581during": 811,
814
+ "\u2581media": 812,
815
+ "\u2581invest": 813,
816
+ "\u2581picture": 814,
817
+ "\u2581front": 815,
818
+ "\u2581clear": 816,
819
+ "\u2581drug": 817,
820
+ "\u2581kill": 818,
821
+ "\u2581organization": 819,
822
+ "\u2581present": 820,
823
+ "\u2581access": 821,
824
+ "\u2581piece": 822,
825
+ "\u2581easy": 823,
826
+ "\u2581generation": 824,
827
+ "ology": 825,
828
+ "\u2581common": 826,
829
+ "qua": 827,
830
+ "\u2581strong": 828,
831
+ "ological": 829,
832
+ "\u2581consider": 830,
833
+ "\u2581nature": 831,
834
+ "\u2581father": 832,
835
+ "\u2581hundred": 833,
836
+ "\u2581college": 834,
837
+ "\u2581protect": 835,
838
+ "\u2581behind": 836,
839
+ "\u2581view": 837,
840
+ "\u2581third": 838,
841
+ "\u2581type": 839,
842
+ "\u2581natural": 840,
843
+ "\u2581outside": 841,
844
+ "\u2581rather": 842,
845
+ "\u2581opportunity": 843,
846
+ "\u2581market": 844,
847
+ "\u2581internet": 845,
848
+ "\u2581least": 846,
849
+ "\u2581billion": 847,
850
+ "\u2581local": 848,
851
+ "\u2581simply": 849,
852
+ "\u2581solution": 850,
853
+ "\u2581perfect": 851,
854
+ "\u2581super": 852,
855
+ "\u2581scientist": 853,
856
+ "\u2581early": 854,
857
+ "\u2581united": 855,
858
+ "\u2581economic": 856,
859
+ "\u2581dollars": 857,
860
+ "\u2581image": 858,
861
+ "\u2581physical": 859,
862
+ "hood": 860,
863
+ "\u2581truth": 861,
864
+ "\u2581cannot": 862,
865
+ "\u2581situation": 863,
866
+ "\u2581whatever": 864,
867
+ "\u2581along": 865,
868
+ "\u2581produce": 866,
869
+ "\u2581practice": 867,
870
+ "\u2581street": 868,
871
+ "\u2581normal": 869,
872
+ "\u2581positive": 870,
873
+ "\u2581collect": 871,
874
+ "ograph": 872,
875
+ "\u2581major": 873,
876
+ "\u2581attention": 874,
877
+ "\u2581knowledge": 875,
878
+ "\u2581middle": 876,
879
+ "\u2581stress": 877,
880
+ "\u2581finally": 878,
881
+ "\u2581short": 879,
882
+ "\u2581america": 880,
883
+ "\u2581field": 881,
884
+ "\u2581morning": 882,
885
+ "\u2581key": 883,
886
+ "\u2581continue": 884,
887
+ "\u2581university": 885,
888
+ "\u2581companies": 886,
889
+ "\u2581trust": 887,
890
+ "\u2581perform": 888,
891
+ "\u2581medical": 889,
892
+ "\u2581provide": 890,
893
+ "\u2581perhaps": 891,
894
+ "\u2581experiment": 892,
895
+ "\u2581service": 893,
896
+ "\u2581resource": 894,
897
+ "\u2581amount": 895,
898
+ "\u2581okay": 896,
899
+ "\u2581potential": 897,
900
+ "\u2581machine": 898,
901
+ "\u2581born": 899,
902
+ "\u2581political": 900,
903
+ "\u2581gender": 901,
904
+ "\u2581began": 902,
905
+ "\u2581population": 903,
906
+ "\u2581accept": 904,
907
+ "\u2581video": 905,
908
+ "\u2581count": 906,
909
+ "\u2581giving": 907,
910
+ "\u2581travel": 908,
911
+ "\u2581micro": 909,
912
+ "\u2581special": 910,
913
+ "\u2581object": 911,
914
+ "\u2581color": 912,
915
+ "\u2581either": 913,
916
+ "\u2581office": 914,
917
+ "\u2581smart": 915,
918
+ "\u2581explain": 916,
919
+ "\u2581approach": 917,
920
+ "\u2581sitting": 918,
921
+ "\u2581message": 919,
922
+ "\u2581affect": 920,
923
+ "\u2581involve": 921,
924
+ "\u2581prison": 922,
925
+ "\u2581engage": 923,
926
+ "\u2581engineer": 924,
927
+ "\u2581white": 925,
928
+ "\u2581europe": 926,
929
+ "ization": 927,
930
+ "\u2581worth": 928,
931
+ "\u2581interact": 929,
932
+ "\u2581adult": 930,
933
+ "\u2581sexual": 931,
934
+ "\u2581itself": 932,
935
+ "\u2581communities": 933,
936
+ "\u2581yeah": 934,
937
+ "\u2581hospital": 935,
938
+ "\u2581choose": 936,
939
+ "\u2581dark": 937,
940
+ "\u2581limit": 938,
941
+ "\u2581complex": 939,
942
+ "\u2581network": 940,
943
+ "\u2581equal": 941,
944
+ "\u2581multi": 942,
945
+ "\u2581sudden": 943,
946
+ "\u2581especially": 944,
947
+ "\u2581suffer": 945,
948
+ "\u2581audience": 946,
949
+ "\u2581aware": 947,
950
+ "\u2581blood": 948,
951
+ "\u2581material": 949,
952
+ "\u2581obvious": 950,
953
+ "\u2581transform": 951,
954
+ "\u2581push": 952,
955
+ "\u2581journey": 953,
956
+ "\u2581increase": 954,
957
+ "\u2581benefit": 955,
958
+ "\u2581sleep": 956,
959
+ "\u2581breath": 957,
960
+ "\u2581require": 958,
961
+ "\u2581measure": 959,
962
+ "\u2581changing": 960,
963
+ "\u2581decade": 961,
964
+ "\u2581perspective": 962,
965
+ "\u2581york": 963,
966
+ "\u2581achieve": 964,
967
+ "\u2581species": 965,
968
+ "\u2581ocean": 966,
969
+ "\u2581industry": 967,
970
+ "\u2581recognize": 968,
971
+ "\u2581character": 969,
972
+ "\u2581brought": 970,
973
+ "\u2581similar": 971,
974
+ "ified": 972,
975
+ "\u2581tradition": 973,
976
+ "\u2581sustain": 974,
977
+ "\u2581current": 975,
978
+ "\u2581daughter": 976,
979
+ "\u2581represent": 977,
980
+ "\u2581function": 978,
981
+ "\u2581century": 979,
982
+ "\u2581express": 980,
983
+ "\u2581laugh": 981,
984
+ "\u2581extreme": 982,
985
+ "\u2581specific": 983,
986
+ "\u2581families": 984,
987
+ "ologist": 985,
988
+ "\u2581climate": 986,
989
+ "\u2581universe": 987,
990
+ "\u2581concept": 988,
991
+ "\u2581please": 989,
992
+ "\u2581response": 990,
993
+ "\u2581inspire": 991,
994
+ "\u2581strange": 992,
995
+ "\u2581negative": 993,
996
+ "\u2581agree": 994,
997
+ "\u2581crazy": 995,
998
+ "\u2581respect": 996,
999
+ "\u2581economy": 997,
1000
+ "\u2581writing": 998,
1001
+ "{": 999
1002
+ }