vladislavbro commited on
Commit
2c83c2c
·
verified ·
1 Parent(s): 9872cc6

Upload tokenizer.json

Browse files
Files changed (1) hide show
  1. tokenizer.json +1462 -0
tokenizer.json ADDED
@@ -0,0 +1,1462 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "version": "1.0",
3
+ "truncation": null,
4
+ "padding": null,
5
+ "added_tokens": [
6
+ {
7
+ "id": 0,
8
+ "special": true,
9
+ "content": "[STOP]",
10
+ "single_word": false,
11
+ "lstrip": false,
12
+ "rstrip": false,
13
+ "normalized": false
14
+ },
15
+ {
16
+ "id": 1,
17
+ "special": true,
18
+ "content": "[UNK]",
19
+ "single_word": false,
20
+ "lstrip": false,
21
+ "rstrip": false,
22
+ "normalized": false
23
+ },
24
+ {
25
+ "id": 2,
26
+ "special": true,
27
+ "content": "[SPACE]",
28
+ "single_word": false,
29
+ "lstrip": false,
30
+ "rstrip": false,
31
+ "normalized": false
32
+ },
33
+ {
34
+ "id": 255,
35
+ "special": true,
36
+ "content": "[START]",
37
+ "single_word": false,
38
+ "lstrip": false,
39
+ "rstrip": false,
40
+ "normalized": false
41
+ },
42
+ {
43
+ "id": 604,
44
+ "content": "[UH]",
45
+ "single_word": false,
46
+ "lstrip": false,
47
+ "rstrip": false,
48
+ "normalized": false,
49
+ "special": true
50
+ },
51
+ {
52
+ "id": 605,
53
+ "content": "[UM]",
54
+ "single_word": false,
55
+ "lstrip": false,
56
+ "rstrip": false,
57
+ "normalized": false,
58
+ "special": true
59
+ },
60
+ {
61
+ "id": 606,
62
+ "content": "[giggle]",
63
+ "single_word": false,
64
+ "lstrip": false,
65
+ "rstrip": false,
66
+ "normalized": false,
67
+ "special": true
68
+ },
69
+ {
70
+ "id": 607,
71
+ "content": "[laughter]",
72
+ "single_word": false,
73
+ "lstrip": false,
74
+ "rstrip": false,
75
+ "normalized": false,
76
+ "special": true
77
+ },
78
+ {
79
+ "id": 608,
80
+ "content": "[guffaw]",
81
+ "single_word": false,
82
+ "lstrip": false,
83
+ "rstrip": false,
84
+ "normalized": false,
85
+ "special": true
86
+ },
87
+ {
88
+ "id": 609,
89
+ "content": "[inhale]",
90
+ "single_word": false,
91
+ "lstrip": false,
92
+ "rstrip": false,
93
+ "normalized": false,
94
+ "special": true
95
+ },
96
+ {
97
+ "id": 610,
98
+ "content": "[exhale]",
99
+ "single_word": false,
100
+ "lstrip": false,
101
+ "rstrip": false,
102
+ "normalized": false,
103
+ "special": true
104
+ },
105
+ {
106
+ "id": 611,
107
+ "content": "[sigh]",
108
+ "single_word": false,
109
+ "lstrip": false,
110
+ "rstrip": false,
111
+ "normalized": false,
112
+ "special": true
113
+ },
114
+ {
115
+ "id": 612,
116
+ "content": "[cry]",
117
+ "single_word": false,
118
+ "lstrip": false,
119
+ "rstrip": false,
120
+ "normalized": false,
121
+ "special": true
122
+ },
123
+ {
124
+ "id": 613,
125
+ "content": "[bark]",
126
+ "single_word": false,
127
+ "lstrip": false,
128
+ "rstrip": false,
129
+ "normalized": false,
130
+ "special": true
131
+ },
132
+ {
133
+ "id": 614,
134
+ "content": "[howl]",
135
+ "single_word": false,
136
+ "lstrip": false,
137
+ "rstrip": false,
138
+ "normalized": false,
139
+ "special": true
140
+ },
141
+ {
142
+ "id": 615,
143
+ "content": "[meow]",
144
+ "single_word": false,
145
+ "lstrip": false,
146
+ "rstrip": false,
147
+ "normalized": false,
148
+ "special": true
149
+ },
150
+ {
151
+ "id": 616,
152
+ "content": "[singing]",
153
+ "single_word": false,
154
+ "lstrip": false,
155
+ "rstrip": false,
156
+ "normalized": false,
157
+ "special": true
158
+ },
159
+ {
160
+ "id": 617,
161
+ "content": "[music]",
162
+ "single_word": false,
163
+ "lstrip": false,
164
+ "rstrip": false,
165
+ "normalized": false,
166
+ "special": true
167
+ },
168
+ {
169
+ "id": 618,
170
+ "content": "[whistle]",
171
+ "single_word": false,
172
+ "lstrip": false,
173
+ "rstrip": false,
174
+ "normalized": false,
175
+ "special": true
176
+ },
177
+ {
178
+ "id": 619,
179
+ "content": "[humming]",
180
+ "single_word": false,
181
+ "lstrip": false,
182
+ "rstrip": false,
183
+ "normalized": false,
184
+ "special": true
185
+ },
186
+ {
187
+ "id": 620,
188
+ "content": "[gasp]",
189
+ "single_word": false,
190
+ "lstrip": false,
191
+ "rstrip": false,
192
+ "normalized": false,
193
+ "special": true
194
+ },
195
+ {
196
+ "id": 621,
197
+ "content": "[groan]",
198
+ "single_word": false,
199
+ "lstrip": false,
200
+ "rstrip": false,
201
+ "normalized": false,
202
+ "special": true
203
+ },
204
+ {
205
+ "id": 622,
206
+ "content": "[whisper]",
207
+ "single_word": false,
208
+ "lstrip": false,
209
+ "rstrip": false,
210
+ "normalized": false,
211
+ "special": true
212
+ },
213
+ {
214
+ "id": 623,
215
+ "content": "[mumble]",
216
+ "single_word": false,
217
+ "lstrip": false,
218
+ "rstrip": false,
219
+ "normalized": false,
220
+ "special": true
221
+ },
222
+ {
223
+ "id": 624,
224
+ "content": "[sniff]",
225
+ "single_word": false,
226
+ "lstrip": false,
227
+ "rstrip": false,
228
+ "normalized": false,
229
+ "special": true
230
+ },
231
+ {
232
+ "id": 625,
233
+ "content": "[sneeze]",
234
+ "single_word": false,
235
+ "lstrip": false,
236
+ "rstrip": false,
237
+ "normalized": false,
238
+ "special": true
239
+ },
240
+ {
241
+ "id": 626,
242
+ "content": "[cough]",
243
+ "single_word": false,
244
+ "lstrip": false,
245
+ "rstrip": false,
246
+ "normalized": false,
247
+ "special": true
248
+ },
249
+ {
250
+ "id": 627,
251
+ "content": "[snore]",
252
+ "single_word": false,
253
+ "lstrip": false,
254
+ "rstrip": false,
255
+ "normalized": false,
256
+ "special": true
257
+ },
258
+ {
259
+ "id": 628,
260
+ "content": "[chew]",
261
+ "single_word": false,
262
+ "lstrip": false,
263
+ "rstrip": false,
264
+ "normalized": false,
265
+ "special": true
266
+ },
267
+ {
268
+ "id": 629,
269
+ "content": "[sip]",
270
+ "single_word": false,
271
+ "lstrip": false,
272
+ "rstrip": false,
273
+ "normalized": false,
274
+ "special": true
275
+ },
276
+ {
277
+ "id": 630,
278
+ "content": "[clear_throat]",
279
+ "single_word": false,
280
+ "lstrip": false,
281
+ "rstrip": false,
282
+ "normalized": false,
283
+ "special": true
284
+ },
285
+ {
286
+ "id": 631,
287
+ "content": "[kiss]",
288
+ "single_word": false,
289
+ "lstrip": false,
290
+ "rstrip": false,
291
+ "normalized": false,
292
+ "special": true
293
+ },
294
+ {
295
+ "id": 632,
296
+ "content": "[shhh]",
297
+ "single_word": false,
298
+ "lstrip": false,
299
+ "rstrip": false,
300
+ "normalized": false,
301
+ "special": true
302
+ },
303
+ {
304
+ "id": 633,
305
+ "content": "[gibberish]",
306
+ "single_word": false,
307
+ "lstrip": false,
308
+ "rstrip": false,
309
+ "normalized": false,
310
+ "special": true
311
+ },
312
+ {
313
+ "id": 634,
314
+ "content": "[fr]",
315
+ "single_word": false,
316
+ "lstrip": false,
317
+ "rstrip": false,
318
+ "normalized": false,
319
+ "special": true
320
+ },
321
+ {
322
+ "id": 635,
323
+ "content": "[es]",
324
+ "single_word": false,
325
+ "lstrip": false,
326
+ "rstrip": false,
327
+ "normalized": false,
328
+ "special": true
329
+ },
330
+ {
331
+ "id": 636,
332
+ "content": "[de]",
333
+ "single_word": false,
334
+ "lstrip": false,
335
+ "rstrip": false,
336
+ "normalized": false,
337
+ "special": true
338
+ },
339
+ {
340
+ "id": 637,
341
+ "content": "[it]",
342
+ "single_word": false,
343
+ "lstrip": false,
344
+ "rstrip": false,
345
+ "normalized": false,
346
+ "special": true
347
+ },
348
+ {
349
+ "id": 638,
350
+ "content": "[ipa]",
351
+ "single_word": false,
352
+ "lstrip": false,
353
+ "rstrip": false,
354
+ "normalized": false,
355
+ "special": true
356
+ },
357
+ {
358
+ "id": 639,
359
+ "content": "[end_of_label]",
360
+ "single_word": false,
361
+ "lstrip": false,
362
+ "rstrip": false,
363
+ "normalized": false,
364
+ "special": true
365
+ },
366
+ {
367
+ "id": 695,
368
+ "content": "[PLACEHOLDER55]",
369
+ "single_word": false,
370
+ "lstrip": false,
371
+ "rstrip": false,
372
+ "normalized": false,
373
+ "special": true
374
+ },
375
+ {
376
+ "id": 696,
377
+ "content": "[PLACEHOLDER56]",
378
+ "single_word": false,
379
+ "lstrip": false,
380
+ "rstrip": false,
381
+ "normalized": false,
382
+ "special": true
383
+ },
384
+ {
385
+ "id": 697,
386
+ "content": "[PLACEHOLDER57]",
387
+ "single_word": false,
388
+ "lstrip": false,
389
+ "rstrip": false,
390
+ "normalized": false,
391
+ "special": true
392
+ },
393
+ {
394
+ "id": 698,
395
+ "content": "[PLACEHOLDER58]",
396
+ "single_word": false,
397
+ "lstrip": false,
398
+ "rstrip": false,
399
+ "normalized": false,
400
+ "special": true
401
+ },
402
+ {
403
+ "id": 699,
404
+ "content": "[PLACEHOLDER59]",
405
+ "single_word": false,
406
+ "lstrip": false,
407
+ "rstrip": false,
408
+ "normalized": false,
409
+ "special": true
410
+ },
411
+ {
412
+ "id": 700,
413
+ "content": "[PLACEHOLDER60]",
414
+ "single_word": false,
415
+ "lstrip": false,
416
+ "rstrip": false,
417
+ "normalized": false,
418
+ "special": true
419
+ },
420
+ {
421
+ "id": 701,
422
+ "content": "[PLACEHOLDER61]",
423
+ "single_word": false,
424
+ "lstrip": false,
425
+ "rstrip": false,
426
+ "normalized": false,
427
+ "special": true
428
+ },
429
+ {
430
+ "id": 702,
431
+ "content": "[PLACEHOLDER62]",
432
+ "single_word": false,
433
+ "lstrip": false,
434
+ "rstrip": false,
435
+ "normalized": false,
436
+ "special": true
437
+ },
438
+ {
439
+ "id": 703,
440
+ "content": "[PLACEHOLDER63]",
441
+ "single_word": false,
442
+ "lstrip": false,
443
+ "rstrip": false,
444
+ "normalized": false,
445
+ "special": true
446
+ }
447
+ ],
448
+ "normalizer": null,
449
+ "pre_tokenizer": {
450
+ "type": "Whitespace"
451
+ },
452
+ "post_processor": {
453
+ "type": "TemplateProcessing",
454
+ "single": [
455
+ { "SpecialToken": { "id": "BOS", "type_id": 0 } },
456
+ { "Sequence": { "id": "A", "type_id": 0 } },
457
+ { "SpecialToken": { "id": "EOS", "type_id": 0 } }
458
+ ],
459
+ "pair": [
460
+ { "SpecialToken": { "id": "BOS", "type_id": 0 } },
461
+ { "Sequence": { "id": "A", "type_id": 0 } },
462
+ { "SpecialToken": { "id": "EOS", "type_id": 0 } },
463
+ { "SpecialToken": { "id": "BOS", "type_id": 1 } },
464
+ { "Sequence": { "id": "B", "type_id": 1 } },
465
+ { "SpecialToken": { "id": "EOS", "type_id": 1 } }
466
+ ],
467
+ "special_tokens": {
468
+ "BOS": {
469
+ "id": "BOS",
470
+ "ids": [255],
471
+ "tokens": ["<s>"]
472
+ },
473
+ "EOS": {
474
+ "id": "EOS",
475
+ "ids": [0],
476
+ "tokens": ["</s>"]
477
+ }
478
+ }
479
+ },
480
+ "decoder": null,
481
+ "model": {
482
+ "type": "BPE",
483
+ "dropout": null,
484
+ "unk_token": "[UNK]",
485
+ "continuing_subword_prefix": null,
486
+ "end_of_word_suffix": null,
487
+ "fuse_unk": false,
488
+ "vocab": {
489
+ "[STOP]": 0,
490
+ "[UNK]": 1,
491
+ "[SPACE]": 2,
492
+ "!": 3,
493
+ "'": 4,
494
+ "(": 5,
495
+ ")": 6,
496
+ ",": 7,
497
+ "-": 8,
498
+ ".": 9,
499
+ "/": 10,
500
+ ":": 11,
501
+ ";": 12,
502
+ "?": 13,
503
+ "a": 14,
504
+ "b": 15,
505
+ "c": 16,
506
+ "d": 17,
507
+ "e": 18,
508
+ "f": 19,
509
+ "g": 20,
510
+ "h": 21,
511
+ "i": 22,
512
+ "j": 23,
513
+ "k": 24,
514
+ "l": 25,
515
+ "m": 26,
516
+ "n": 27,
517
+ "o": 28,
518
+ "p": 29,
519
+ "q": 30,
520
+ "r": 31,
521
+ "s": 32,
522
+ "t": 33,
523
+ "u": 34,
524
+ "v": 35,
525
+ "w": 36,
526
+ "x": 37,
527
+ "y": 38,
528
+ "z": 39,
529
+ "th": 40,
530
+ "in": 41,
531
+ "the": 42,
532
+ "an": 43,
533
+ "er": 44,
534
+ "ou": 45,
535
+ "re": 46,
536
+ "on": 47,
537
+ "at": 48,
538
+ "ed": 49,
539
+ "en": 50,
540
+ "to": 51,
541
+ "ing": 52,
542
+ "and": 53,
543
+ "is": 54,
544
+ "as": 55,
545
+ "al": 56,
546
+ "or": 57,
547
+ "of": 58,
548
+ "ar": 59,
549
+ "it": 60,
550
+ "es": 61,
551
+ "he": 62,
552
+ "st": 63,
553
+ "le": 64,
554
+ "om": 65,
555
+ "se": 66,
556
+ "be": 67,
557
+ "ad": 68,
558
+ "ow": 69,
559
+ "ly": 70,
560
+ "ch": 71,
561
+ "wh": 72,
562
+ "that": 73,
563
+ "you": 74,
564
+ "li": 75,
565
+ "ve": 76,
566
+ "ac": 77,
567
+ "ti": 78,
568
+ "ld": 79,
569
+ "me": 80,
570
+ "was": 81,
571
+ "gh": 82,
572
+ "id": 83,
573
+ "ll": 84,
574
+ "wi": 85,
575
+ "ent": 86,
576
+ "for": 87,
577
+ "ay": 88,
578
+ "ro": 89,
579
+ "ver": 90,
580
+ "ic": 91,
581
+ "her": 92,
582
+ "ke": 93,
583
+ "his": 94,
584
+ "no": 95,
585
+ "ut": 96,
586
+ "un": 97,
587
+ "ir": 98,
588
+ "lo": 99,
589
+ "we": 100,
590
+ "ri": 101,
591
+ "ha": 102,
592
+ "with": 103,
593
+ "ght": 104,
594
+ "out": 105,
595
+ "im": 106,
596
+ "ion": 107,
597
+ "all": 108,
598
+ "ab": 109,
599
+ "one": 110,
600
+ "ne": 111,
601
+ "ge": 112,
602
+ "ould": 113,
603
+ "ter": 114,
604
+ "mo": 115,
605
+ "had": 116,
606
+ "ce": 117,
607
+ "she": 118,
608
+ "go": 119,
609
+ "sh": 120,
610
+ "ur": 121,
611
+ "am": 122,
612
+ "so": 123,
613
+ "pe": 124,
614
+ "my": 125,
615
+ "de": 126,
616
+ "are": 127,
617
+ "but": 128,
618
+ "ome": 129,
619
+ "fr": 130,
620
+ "ther": 131,
621
+ "fe": 132,
622
+ "su": 133,
623
+ "do": 134,
624
+ "con": 135,
625
+ "te": 136,
626
+ "ain": 137,
627
+ "ere": 138,
628
+ "po": 139,
629
+ "if": 140,
630
+ "they": 141,
631
+ "us": 142,
632
+ "ag": 143,
633
+ "tr": 144,
634
+ "now": 145,
635
+ "oun": 146,
636
+ "this": 147,
637
+ "have": 148,
638
+ "not": 149,
639
+ "sa": 150,
640
+ "il": 151,
641
+ "up": 152,
642
+ "thing": 153,
643
+ "from": 154,
644
+ "ap": 155,
645
+ "him": 156,
646
+ "ack": 157,
647
+ "ation": 158,
648
+ "ant": 159,
649
+ "our": 160,
650
+ "op": 161,
651
+ "like": 162,
652
+ "ust": 163,
653
+ "ess": 164,
654
+ "bo": 165,
655
+ "ok": 166,
656
+ "ul": 167,
657
+ "ind": 168,
658
+ "ex": 169,
659
+ "com": 170,
660
+ "some": 171,
661
+ "there": 172,
662
+ "ers": 173,
663
+ "co": 174,
664
+ "res": 175,
665
+ "man": 176,
666
+ "ard": 177,
667
+ "pl": 178,
668
+ "wor": 179,
669
+ "way": 180,
670
+ "tion": 181,
671
+ "fo": 182,
672
+ "ca": 183,
673
+ "were": 184,
674
+ "by": 185,
675
+ "ate": 186,
676
+ "pro": 187,
677
+ "ted": 188,
678
+ "ound": 189,
679
+ "own": 190,
680
+ "would": 191,
681
+ "ts": 192,
682
+ "what": 193,
683
+ "qu": 194,
684
+ "ally": 195,
685
+ "ight": 196,
686
+ "ck": 197,
687
+ "gr": 198,
688
+ "when": 199,
689
+ "ven": 200,
690
+ "can": 201,
691
+ "ough": 202,
692
+ "ine": 203,
693
+ "end": 204,
694
+ "per": 205,
695
+ "ous": 206,
696
+ "od": 207,
697
+ "ide": 208,
698
+ "know": 209,
699
+ "ty": 210,
700
+ "very": 211,
701
+ "si": 212,
702
+ "ak": 213,
703
+ "who": 214,
704
+ "about": 215,
705
+ "ill": 216,
706
+ "them": 217,
707
+ "est": 218,
708
+ "red": 219,
709
+ "ye": 220,
710
+ "could": 221,
711
+ "ong": 222,
712
+ "your": 223,
713
+ "their": 224,
714
+ "em": 225,
715
+ "just": 226,
716
+ "other": 227,
717
+ "into": 228,
718
+ "any": 229,
719
+ "whi": 230,
720
+ "um": 231,
721
+ "tw": 232,
722
+ "ast": 233,
723
+ "der": 234,
724
+ "did": 235,
725
+ "ie": 236,
726
+ "been": 237,
727
+ "ace": 238,
728
+ "ink": 239,
729
+ "ity": 240,
730
+ "back": 241,
731
+ "ting": 242,
732
+ "br": 243,
733
+ "more": 244,
734
+ "ake": 245,
735
+ "pp": 246,
736
+ "then": 247,
737
+ "sp": 248,
738
+ "el": 249,
739
+ "use": 250,
740
+ "bl": 251,
741
+ "said": 252,
742
+ "over": 253,
743
+ "get": 254,
744
+ "[START]": 255,
745
+ "\"": 256,
746
+ "#": 257,
747
+ "$": 258,
748
+ "%": 259,
749
+ "&": 260,
750
+ "*": 261,
751
+ "+": 262,
752
+ "0": 263,
753
+ "1": 264,
754
+ "2": 265,
755
+ "3": 266,
756
+ "4": 267,
757
+ "5": 268,
758
+ "6": 269,
759
+ "7": 270,
760
+ "8": 271,
761
+ "9": 272,
762
+ "<": 273,
763
+ "=": 274,
764
+ ">": 275,
765
+ "@": 276,
766
+ "A": 277,
767
+ "B": 278,
768
+ "C": 279,
769
+ "D": 280,
770
+ "E": 281,
771
+ "F": 282,
772
+ "G": 283,
773
+ "H": 284,
774
+ "I": 285,
775
+ "J": 286,
776
+ "K": 287,
777
+ "L": 288,
778
+ "M": 289,
779
+ "N": 290,
780
+ "O": 291,
781
+ "P": 292,
782
+ "Q": 293,
783
+ "R": 294,
784
+ "S": 295,
785
+ "T": 296,
786
+ "U": 297,
787
+ "V": 298,
788
+ "W": 299,
789
+ "X": 300,
790
+ "Y": 301,
791
+ "Z": 302,
792
+ "[": 303,
793
+ "\\": 304,
794
+ "]": 305,
795
+ "^": 306,
796
+ "_": 307,
797
+ "`": 308,
798
+ "{": 309,
799
+ "|": 310,
800
+ "}": 311,
801
+ "~": 312,
802
+ "‐": 313,
803
+ "‑": 314,
804
+ "‒": 315,
805
+ "–": 316,
806
+ "—": 317,
807
+ "―": 318,
808
+ "‖": 319,
809
+ "‗": 320,
810
+ "‘": 321,
811
+ "’": 322,
812
+ "‚": 323,
813
+ "‛": 324,
814
+ "“": 325,
815
+ "”": 326,
816
+ "„": 327,
817
+ "‟": 328,
818
+ " ": 329,
819
+ "¡": 330,
820
+ "¢": 331,
821
+ "£": 332,
822
+ "¤": 333,
823
+ "¥": 334,
824
+ "¦": 335,
825
+ "§": 336,
826
+ "¨": 337,
827
+ "©": 338,
828
+ "ª": 339,
829
+ "«": 340,
830
+ "¬": 341,
831
+ "­": 342,
832
+ "®": 343,
833
+ "¯": 344,
834
+ "°": 345,
835
+ "±": 346,
836
+ "²": 347,
837
+ "³": 348,
838
+ "´": 349,
839
+ "µ": 350,
840
+ "¶": 351,
841
+ "·": 352,
842
+ "¸": 353,
843
+ "¹": 354,
844
+ "º": 355,
845
+ "»": 356,
846
+ "¼": 357,
847
+ "½": 358,
848
+ "¾": 359,
849
+ "¿": 360,
850
+ "À": 361,
851
+ "Á": 362,
852
+ "Â": 363,
853
+ "Ã": 364,
854
+ "Ä": 365,
855
+ "Å": 366,
856
+ "Æ": 367,
857
+ "Ç": 368,
858
+ "È": 369,
859
+ "É": 370,
860
+ "Ê": 371,
861
+ "Ë": 372,
862
+ "Ì": 373,
863
+ "Í": 374,
864
+ "Î": 375,
865
+ "Ï": 376,
866
+ "Ð": 377,
867
+ "Ñ": 378,
868
+ "Ò": 379,
869
+ "Ó": 380,
870
+ "Ô": 381,
871
+ "Õ": 382,
872
+ "Ö": 383,
873
+ "×": 384,
874
+ "Ø": 385,
875
+ "Ù": 386,
876
+ "Ú": 387,
877
+ "Û": 388,
878
+ "Ü": 389,
879
+ "Ý": 390,
880
+ "Þ": 391,
881
+ "ß": 392,
882
+ "à": 393,
883
+ "á": 394,
884
+ "â": 395,
885
+ "ã": 396,
886
+ "ä": 397,
887
+ "å": 398,
888
+ "æ": 399,
889
+ "ç": 400,
890
+ "è": 401,
891
+ "é": 402,
892
+ "ê": 403,
893
+ "ë": 404,
894
+ "ì": 405,
895
+ "í": 406,
896
+ "î": 407,
897
+ "ï": 408,
898
+ "ð": 409,
899
+ "ñ": 410,
900
+ "ò": 411,
901
+ "ó": 412,
902
+ "ô": 413,
903
+ "õ": 414,
904
+ "ö": 415,
905
+ "÷": 416,
906
+ "ø": 417,
907
+ "ù": 418,
908
+ "ú": 419,
909
+ "û": 420,
910
+ "ü": 421,
911
+ "ý": 422,
912
+ "þ": 423,
913
+ "ÿ": 424,
914
+ "ɐ": 425,
915
+ "ɑ": 426,
916
+ "ɒ": 427,
917
+ "ɓ": 428,
918
+ "ɔ": 429,
919
+ "ɕ": 430,
920
+ "ɖ": 431,
921
+ "ɗ": 432,
922
+ "ɘ": 433,
923
+ "ə": 434,
924
+ "ɚ": 435,
925
+ "ɛ": 436,
926
+ "ɜ": 437,
927
+ "ɝ": 438,
928
+ "ɞ": 439,
929
+ "ɟ": 440,
930
+ "ɠ": 441,
931
+ "ɡ": 442,
932
+ "ɢ": 443,
933
+ "ɣ": 444,
934
+ "ɤ": 445,
935
+ "ɥ": 446,
936
+ "ɦ": 447,
937
+ "ɧ": 448,
938
+ "ɨ": 449,
939
+ "ɩ": 450,
940
+ "ɪ": 451,
941
+ "ɫ": 452,
942
+ "ɬ": 453,
943
+ "ɭ": 454,
944
+ "ɮ": 455,
945
+ "ɯ": 456,
946
+ "ɰ": 457,
947
+ "ɱ": 458,
948
+ "ɲ": 459,
949
+ "ɳ": 460,
950
+ "ɴ": 461,
951
+ "ɵ": 462,
952
+ "ɶ": 463,
953
+ "ɷ": 464,
954
+ "ɸ": 465,
955
+ "ɹ": 466,
956
+ "ɺ": 467,
957
+ "ɻ": 468,
958
+ "ɼ": 469,
959
+ "ɽ": 470,
960
+ "ɾ": 471,
961
+ "ɿ": 472,
962
+ "ʀ": 473,
963
+ "ʁ": 474,
964
+ "ʂ": 475,
965
+ "ʃ": 476,
966
+ "ʄ": 477,
967
+ "ʅ": 478,
968
+ "ʆ": 479,
969
+ "ʇ": 480,
970
+ "ʈ": 481,
971
+ "ʉ": 482,
972
+ "ʊ": 483,
973
+ "ʋ": 484,
974
+ "ʌ": 485,
975
+ "ʍ": 486,
976
+ "ʎ": 487,
977
+ "ʏ": 488,
978
+ "ʐ": 489,
979
+ "ʑ": 490,
980
+ "ʒ": 491,
981
+ "ʓ": 492,
982
+ "ʔ": 493,
983
+ "ʕ": 494,
984
+ "ʖ": 495,
985
+ "ʗ": 496,
986
+ "ʘ": 497,
987
+ "ʙ": 498,
988
+ "ʚ": 499,
989
+ "ʛ": 500,
990
+ "ʜ": 501,
991
+ "ʝ": 502,
992
+ "ʞ": 503,
993
+ "ʟ": 504,
994
+ "ʠ": 505,
995
+ "ʡ": 506,
996
+ "ʢ": 507,
997
+ "ʣ": 508,
998
+ "ʤ": 509,
999
+ "ʥ": 510,
1000
+ "ʦ": 511,
1001
+ "ʧ": 512,
1002
+ "ʨ": 513,
1003
+ "ʩ": 514,
1004
+ "ʪ": 515,
1005
+ "ʫ": 516,
1006
+ "ʬ": 517,
1007
+ "ʭ": 518,
1008
+ "ʮ": 519,
1009
+ "ʯ": 520,
1010
+ "ʰ": 521,
1011
+ "ʱ": 522,
1012
+ "ʲ": 523,
1013
+ "ʳ": 524,
1014
+ "ʴ": 525,
1015
+ "ʵ": 526,
1016
+ "ʶ": 527,
1017
+ "ʷ": 528,
1018
+ "ʸ": 529,
1019
+ "ʹ": 530,
1020
+ "ʺ": 531,
1021
+ "ʻ": 532,
1022
+ "ʼ": 533,
1023
+ "ʽ": 534,
1024
+ "ʾ": 535,
1025
+ "ʿ": 536,
1026
+ "ˀ": 537,
1027
+ "ˁ": 538,
1028
+ "˂": 539,
1029
+ "˃": 540,
1030
+ "˄": 541,
1031
+ "˅": 542,
1032
+ "ˆ": 543,
1033
+ "ˇ": 544,
1034
+ "ˈ": 545,
1035
+ "ˉ": 546,
1036
+ "ˊ": 547,
1037
+ "ˋ": 548,
1038
+ "ˌ": 549,
1039
+ "ˍ": 550,
1040
+ "ˎ": 551,
1041
+ "ˏ": 552,
1042
+ "ː": 553,
1043
+ "ˑ": 554,
1044
+ "˒": 555,
1045
+ "˓": 556,
1046
+ "˔": 557,
1047
+ "˕": 558,
1048
+ "˖": 559,
1049
+ "˗": 560,
1050
+ "˘": 561,
1051
+ "˙": 562,
1052
+ "˚": 563,
1053
+ "˛": 564,
1054
+ "˜": 565,
1055
+ "˝": 566,
1056
+ "˞": 567,
1057
+ "˟": 568,
1058
+ "ˠ": 569,
1059
+ "ˡ": 570,
1060
+ "ˢ": 571,
1061
+ "ˣ": 572,
1062
+ "ˤ": 573,
1063
+ "˥": 574,
1064
+ "˦": 575,
1065
+ "˧": 576,
1066
+ "˨": 577,
1067
+ "˩": 578,
1068
+ "˪": 579,
1069
+ "˫": 580,
1070
+ "ˬ": 581,
1071
+ "˭": 582,
1072
+ "ˮ": 583,
1073
+ "˯": 584,
1074
+ "˰": 585,
1075
+ "˱": 586,
1076
+ "˲": 587,
1077
+ "˳": 588,
1078
+ "˴": 589,
1079
+ "˵": 590,
1080
+ "˶": 591,
1081
+ "˷": 592,
1082
+ "˸": 593,
1083
+ "˹": 594,
1084
+ "˺": 595,
1085
+ "˻": 596,
1086
+ "˼": 597,
1087
+ "˽": 598,
1088
+ "˾": 599,
1089
+ "˿": 600,
1090
+ "ā": 601,
1091
+ "ō": 602,
1092
+ "…": 603,
1093
+ "[UH]": 604,
1094
+ "[UM]": 605,
1095
+ "[giggle]": 606,
1096
+ "[laughter]": 607,
1097
+ "[guffaw]": 608,
1098
+ "[inhale]": 609,
1099
+ "[exhale]": 610,
1100
+ "[sigh]": 611,
1101
+ "[cry]": 612,
1102
+ "[bark]": 613,
1103
+ "[howl]": 614,
1104
+ "[meow]": 615,
1105
+ "[singing]": 616,
1106
+ "[music]": 617,
1107
+ "[whistle]": 618,
1108
+ "[humming]": 619,
1109
+ "[gasp]": 620,
1110
+ "[groan]": 621,
1111
+ "[whisper]": 622,
1112
+ "[mumble]": 623,
1113
+ "[sniff]": 624,
1114
+ "[sneeze]": 625,
1115
+ "[cough]": 626,
1116
+ "[snore]": 627,
1117
+ "[chew]": 628,
1118
+ "[sip]": 629,
1119
+ "[clear_throat]": 630,
1120
+ "[kiss]": 631,
1121
+ "[shhh]": 632,
1122
+ "[gibberish]": 633,
1123
+ "[fr]": 634,
1124
+ "[es]": 635,
1125
+ "[de]": 636,
1126
+ "[it]": 637,
1127
+ "[ipa]": 638,
1128
+ "[end_of_label]": 639,
1129
+ "ŋ": 640,
1130
+ "ᵻ": 641,
1131
+ "θ": 642,
1132
+ "̩": 643,
1133
+ "\u0303": 644,
1134
+ "ɑː": 645,
1135
+ "iː": 646,
1136
+ "uː": 647,
1137
+ "ɜː": 648,
1138
+ "ɔː": 649,
1139
+ "oː": 650,
1140
+ "eɪ": 651,
1141
+ "oʊ": 652,
1142
+ "aɪ": 653,
1143
+ "aʊ": 654,
1144
+ "ɔɪ": 655,
1145
+ "dʒ": 656,
1146
+ "tʃ": 657,
1147
+ "ɪŋ": 658,
1148
+ "ᵻd": 659,
1149
+ "ˈiː": 660,
1150
+ "ˌiː": 661,
1151
+ "ˈɪ": 662,
1152
+ "ˌɪ": 663,
1153
+ "ˈeɪ": 664,
1154
+ "ˌeɪ": 665,
1155
+ "ˈɛ": 666,
1156
+ "ˌɛ": 667,
1157
+ "ˈæ": 668,
1158
+ "ˌæ": 669,
1159
+ "ˈɑː": 670,
1160
+ "ˌɑː": 671,
1161
+ "ˈɔː": 672,
1162
+ "ˌɔː": 673,
1163
+ "oːɹ": 674,
1164
+ "ˈoːɹ": 675,
1165
+ "ˌoːɹ": 676,
1166
+ "ˈoʊ": 677,
1167
+ "ˌoʊ": 678,
1168
+ "ˈʊ": 679,
1169
+ "ˌʊ": 680,
1170
+ "ˈuː": 681,
1171
+ "ˌuː": 682,
1172
+ "ˈɜː": 683,
1173
+ "ˌɜː": 684,
1174
+ "ˈʌ": 685,
1175
+ "ˌʌ": 686,
1176
+ "ˈaɪ": 687,
1177
+ "ˌaɪ": 688,
1178
+ "ˈaʊ": 689,
1179
+ "ˌaʊ": 690,
1180
+ "ˈɔɪ": 691,
1181
+ "ˌɔɪ": 692,
1182
+ "ˈɚ": 693,
1183
+ "ˌɐ": 694,
1184
+ "[PLACEHOLDER55]": 695,
1185
+ "[PLACEHOLDER56]": 696,
1186
+ "[PLACEHOLDER57]": 697,
1187
+ "[PLACEHOLDER58]": 698,
1188
+ "[PLACEHOLDER59]": 699,
1189
+ "[PLACEHOLDER60]": 700,
1190
+ "[PLACEHOLDER61]": 701,
1191
+ "[PLACEHOLDER62]": 702,
1192
+ "[PLACEHOLDER63]": 703
1193
+ },
1194
+ "merges": [
1195
+ "t h",
1196
+ "i n",
1197
+ "th e",
1198
+ "a n",
1199
+ "e r",
1200
+ "o u",
1201
+ "r e",
1202
+ "o n",
1203
+ "a t",
1204
+ "e d",
1205
+ "e n",
1206
+ "t o",
1207
+ "in g",
1208
+ "an d",
1209
+ "i s",
1210
+ "a s",
1211
+ "a l",
1212
+ "o r",
1213
+ "o f",
1214
+ "a r",
1215
+ "i t",
1216
+ "e s",
1217
+ "h e",
1218
+ "s t",
1219
+ "l e",
1220
+ "o m",
1221
+ "s e",
1222
+ "b e",
1223
+ "a d",
1224
+ "o w",
1225
+ "l y",
1226
+ "c h",
1227
+ "w h",
1228
+ "th at",
1229
+ "y ou",
1230
+ "l i",
1231
+ "v e",
1232
+ "a c",
1233
+ "t i",
1234
+ "l d",
1235
+ "m e",
1236
+ "w as",
1237
+ "g h",
1238
+ "i d",
1239
+ "l l",
1240
+ "w i",
1241
+ "en t",
1242
+ "f or",
1243
+ "a y",
1244
+ "r o",
1245
+ "v er",
1246
+ "i c",
1247
+ "h er",
1248
+ "k e",
1249
+ "h is",
1250
+ "n o",
1251
+ "u t",
1252
+ "u n",
1253
+ "i r",
1254
+ "l o",
1255
+ "w e",
1256
+ "r i",
1257
+ "h a",
1258
+ "wi th",
1259
+ "gh t",
1260
+ "ou t",
1261
+ "i m",
1262
+ "i on",
1263
+ "al l",
1264
+ "a b",
1265
+ "on e",
1266
+ "n e",
1267
+ "g e",
1268
+ "ou ld",
1269
+ "t er",
1270
+ "m o",
1271
+ "h ad",
1272
+ "c e",
1273
+ "s he",
1274
+ "g o",
1275
+ "s h",
1276
+ "u r",
1277
+ "a m",
1278
+ "s o",
1279
+ "p e",
1280
+ "m y",
1281
+ "d e",
1282
+ "a re",
1283
+ "b ut",
1284
+ "om e",
1285
+ "f r",
1286
+ "the r",
1287
+ "f e",
1288
+ "s u",
1289
+ "d o",
1290
+ "c on",
1291
+ "t e",
1292
+ "a in",
1293
+ "er e",
1294
+ "p o",
1295
+ "i f",
1296
+ "the y",
1297
+ "u s",
1298
+ "a g",
1299
+ "t r",
1300
+ "n ow",
1301
+ "ou n",
1302
+ "th is",
1303
+ "ha ve",
1304
+ "no t",
1305
+ "s a",
1306
+ "i l",
1307
+ "u p",
1308
+ "th ing",
1309
+ "fr om",
1310
+ "a p",
1311
+ "h im",
1312
+ "ac k",
1313
+ "at ion",
1314
+ "an t",
1315
+ "ou r",
1316
+ "o p",
1317
+ "li ke",
1318
+ "u st",
1319
+ "es s",
1320
+ "b o",
1321
+ "o k",
1322
+ "u l",
1323
+ "in d",
1324
+ "e x",
1325
+ "c om",
1326
+ "s ome",
1327
+ "the re",
1328
+ "er s",
1329
+ "c o",
1330
+ "re s",
1331
+ "m an",
1332
+ "ar d",
1333
+ "p l",
1334
+ "w or",
1335
+ "w ay",
1336
+ "ti on",
1337
+ "f o",
1338
+ "c a",
1339
+ "w ere",
1340
+ "b y",
1341
+ "at e",
1342
+ "p ro",
1343
+ "t ed",
1344
+ "oun d",
1345
+ "ow n",
1346
+ "w ould",
1347
+ "t s",
1348
+ "wh at",
1349
+ "q u",
1350
+ "al ly",
1351
+ "i ght",
1352
+ "c k",
1353
+ "g r",
1354
+ "wh en",
1355
+ "v en",
1356
+ "c an",
1357
+ "ou gh",
1358
+ "in e",
1359
+ "en d",
1360
+ "p er",
1361
+ "ou s",
1362
+ "o d",
1363
+ "id e",
1364
+ "k now",
1365
+ "t y",
1366
+ "ver y",
1367
+ "s i",
1368
+ "a k",
1369
+ "wh o",
1370
+ "ab out",
1371
+ "i ll",
1372
+ "the m",
1373
+ "es t",
1374
+ "re d",
1375
+ "y e",
1376
+ "c ould",
1377
+ "on g",
1378
+ "you r",
1379
+ "the ir",
1380
+ "e m",
1381
+ "j ust",
1382
+ "o ther",
1383
+ "in to",
1384
+ "an y",
1385
+ "wh i",
1386
+ "u m",
1387
+ "t w",
1388
+ "as t",
1389
+ "d er",
1390
+ "d id",
1391
+ "i e",
1392
+ "be en",
1393
+ "ac e",
1394
+ "in k",
1395
+ "it y",
1396
+ "b ack",
1397
+ "t ing",
1398
+ "b r",
1399
+ "mo re",
1400
+ "a ke",
1401
+ "p p",
1402
+ "the n",
1403
+ "s p",
1404
+ "e l",
1405
+ "u se",
1406
+ "b l",
1407
+ "sa id",
1408
+ "o ver",
1409
+ "ge t",
1410
+ "ɑ ː",
1411
+ "i ː",
1412
+ "u ː",
1413
+ "ɜ ː",
1414
+ "ɔ ː",
1415
+ "o ː",
1416
+ "e ɪ",
1417
+ "o ʊ",
1418
+ "a ɪ",
1419
+ "a ʊ",
1420
+ "ɔ ɪ",
1421
+ "d ʒ",
1422
+ "t ʃ",
1423
+ "ɪ ŋ",
1424
+ "ᵻ d",
1425
+ "ˈ iː",
1426
+ "ˌ iː",
1427
+ "ˈ ɪ",
1428
+ "ˌ ɪ",
1429
+ "ˈ eɪ",
1430
+ "ˌ eɪ",
1431
+ "ˈ ɛ",
1432
+ "ˌ ɛ",
1433
+ "ˈ æ",
1434
+ "ˌ æ",
1435
+ "ˈ ɑː",
1436
+ "ˌ ɑː",
1437
+ "ˈ ɔː",
1438
+ "ˌ ɔː",
1439
+ "oː ɹ",
1440
+ "ˈ oːɹ",
1441
+ "ˌ oːɹ",
1442
+ "ˈ oʊ",
1443
+ "ˌ oʊ",
1444
+ "ˈ ʊ",
1445
+ "ˌ ʊ",
1446
+ "ˈ uː",
1447
+ "ˌ uː",
1448
+ "ˈ ɜː",
1449
+ "ˌ ɜː",
1450
+ "ˈ ʌ",
1451
+ "ˌ ʌ",
1452
+ "ˈ aɪ",
1453
+ "ˌ aɪ",
1454
+ "ˈ aʊ",
1455
+ "ˌ aʊ",
1456
+ "ˈ ɔɪ",
1457
+ "ˌ ɔɪ",
1458
+ "ˈ ɚ",
1459
+ "ˌ ɐ"
1460
+ ]
1461
+ }
1462
+ }