hf-transformers-bot commited on
Commit
7aeebda
·
1 Parent(s): 09fcaeb

Upload tiny models for Owlv2Model

Browse files
config.json ADDED
@@ -0,0 +1,34 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "architectures": [
3
+ "Owlv2Model"
4
+ ],
5
+ "bos_token_id": 1,
6
+ "eos_token_id": 2,
7
+ "initializer_factor": 1.0,
8
+ "logit_scale_init_value": 2.6592,
9
+ "model_type": "owlv2",
10
+ "pad_token_id": 0,
11
+ "projection_dim": 64,
12
+ "text_config": {
13
+ "attention_dropout": 0.1,
14
+ "dropout": 0.1,
15
+ "hidden_size": 64,
16
+ "intermediate_size": 37,
17
+ "model_type": "owlv2_text_model",
18
+ "num_attention_heads": 4,
19
+ "vocab_size": 1024
20
+ },
21
+ "torch_dtype": "float32",
22
+ "transformers_version": "4.36.0.dev0",
23
+ "vision_config": {
24
+ "attention_dropout": 0.1,
25
+ "dropout": 0.1,
26
+ "hidden_size": 32,
27
+ "image_size": 32,
28
+ "intermediate_size": 37,
29
+ "model_type": "owlv2_vision_model",
30
+ "num_attention_heads": 4,
31
+ "num_hidden_layers": 2,
32
+ "patch_size": 2
33
+ }
34
+ }
merges.txt ADDED
@@ -0,0 +1,727 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ #version: 0.2
2
+ t h
3
+ th e</w>
4
+ i n
5
+ a n
6
+ e d</w>
7
+ e r
8
+ r e
9
+ a r
10
+ t i
11
+ o n
12
+ e n
13
+ o f</w>
14
+ o r
15
+ an d</w>
16
+ e r</w>
17
+ o n</w>
18
+ i n</w>
19
+ in g</w>
20
+ s t
21
+ r o
22
+ a l
23
+ i t
24
+ t o</w>
25
+ a s</w>
26
+ a t
27
+ e s</w>
28
+ o u
29
+ h i
30
+ a c
31
+ s i
32
+ a t</w>
33
+ r i
34
+ a l</w>
35
+ e l
36
+ a n</w>
37
+ a m
38
+ o r</w>
39
+ s t</w>
40
+ l i
41
+ u r
42
+ e c
43
+ o m
44
+ d i
45
+ w as</w>
46
+ l y</w>
47
+ e n</w>
48
+ e a
49
+ c h
50
+ u n
51
+ ti on</w>
52
+ l a
53
+ i s</w>
54
+ f i
55
+ o l
56
+ d e
57
+ - @</w>
58
+ @ -@</w>
59
+ r a
60
+ v i
61
+ l e</w>
62
+ l o
63
+ s h
64
+ e m
65
+ b e
66
+ th at</w>
67
+ ' s</w>
68
+ c on
69
+ m a
70
+ f or</w>
71
+ h a
72
+ s u
73
+ b y</w>
74
+ it h</w>
75
+ v e</w>
76
+ w ith</w>
77
+ s e</w>
78
+ c h</w>
79
+ th e
80
+ en t
81
+ p o
82
+ c e</w>
83
+ i l
84
+ s e
85
+ en t</w>
86
+ l e
87
+ c om
88
+ s p
89
+ er e</w>
90
+ p ro
91
+ n o
92
+ b u
93
+ w h
94
+ i t</w>
95
+ t h</w>
96
+ v er
97
+ n e
98
+ c a
99
+ i s
100
+ f or
101
+ a g
102
+ er s</w>
103
+ m o
104
+ g h
105
+ f ro
106
+ t ed</w>
107
+ fro m</w>
108
+ ti on
109
+ o p
110
+ hi s</w>
111
+ a d
112
+ a b
113
+ i c
114
+ h e</w>
115
+ ou n
116
+ a s
117
+ t s</w>
118
+ s c
119
+ d e</w>
120
+ o w
121
+ e x
122
+ w hi
123
+ r u
124
+ t er</w>
125
+ a p
126
+ d s</w>
127
+ w ere</w>
128
+ p re
129
+ d u
130
+ g u
131
+ p ar
132
+ i r
133
+ b o
134
+ th er</w>
135
+ q u
136
+ l u
137
+ t er
138
+ t w
139
+ e s
140
+ re c
141
+ p er
142
+ t a
143
+ at e</w>
144
+ v er</w>
145
+ at ed</w>
146
+ d ing</w>
147
+ it y</w>
148
+ m an
149
+ e ar
150
+ s ed</w>
151
+ d ed</w>
152
+ a u
153
+ al l</w>
154
+ am e</w>
155
+ c i
156
+ on e</w>
157
+ in g
158
+ ar e</w>
159
+ a f
160
+ i r</w>
161
+ a tion</w>
162
+ â Ģ
163
+ ha d</w>
164
+ t r
165
+ u l
166
+ l d</w>
167
+ whi ch</w>
168
+ w a
169
+ i m
170
+ l ea
171
+ b e</w>
172
+ t o
173
+ ti m
174
+ fi r
175
+ w or
176
+ on g</w>
177
+ p or
178
+ m ar
179
+ m e
180
+ al ly</w>
181
+ s o</w>
182
+ ou t</w>
183
+ tion s</w>
184
+ it s</w>
185
+ g h</w>
186
+ g e</w>
187
+ b er</w>
188
+ f e
189
+ p u
190
+ s er
191
+ d er
192
+ p l
193
+ s s</w>
194
+ in e</w>
195
+ in c
196
+ m i
197
+ gh t</w>
198
+ g o
199
+ th is</w>
200
+ t ur
201
+ d a
202
+ ro u
203
+ bu t</w>
204
+ u m
205
+ s on</w>
206
+ w e
207
+ v ed</w>
208
+ si on</w>
209
+ k e</w>
210
+ p la
211
+ the ir</w>
212
+ i es</w>
213
+ fir st</w>
214
+ s a
215
+ o c
216
+ at t
217
+ o f
218
+ p e
219
+ no t</w>
220
+ g i
221
+ n a
222
+ ar y</w>
223
+ m u
224
+ l ed</w>
225
+ âĢ ĵ</w>
226
+ h er</w>
227
+ r an
228
+ c o
229
+ the y</w>
230
+ d er</w>
231
+ al i
232
+ al so</w>
233
+ or e</w>
234
+ e p
235
+ ou ld</w>
236
+ af ter</w>
237
+ s hi
238
+ u s</w>
239
+ e t</w>
240
+ ti c
241
+ st or
242
+ w i
243
+ e v
244
+ o ther</w>
245
+ s h</w>
246
+ t ing</w>
247
+ ar d</w>
248
+ t e
249
+ tw o</w>
250
+ n i
251
+ ha ve</w>
252
+ ou r
253
+ com m
254
+ t e</w>
255
+ ac k</w>
256
+ o o
257
+ f in
258
+ s ec
259
+ ent s</w>
260
+ h as</w>
261
+ com p
262
+ b ec
263
+ k s</w>
264
+ con t
265
+ l and</w>
266
+ be en</w>
267
+ en ce</w>
268
+ k ing</w>
269
+ e l</w>
270
+ ag e</w>
271
+ lo w
272
+ m in
273
+ . @</w>
274
+ @ .@</w>
275
+ om e</w>
276
+ m ent</w>
277
+ ch ar
278
+ g e
279
+ at er</w>
280
+ n or
281
+ h o
282
+ ou s</w>
283
+ wh o</w>
284
+ ea r</w>
285
+ sp ec
286
+ c ol
287
+ el y</w>
288
+ t y</w>
289
+ j o
290
+ ur ing</w>
291
+ du c
292
+ b ri
293
+ st r
294
+ c an
295
+ or i
296
+ t ra
297
+ p a
298
+ sh e</w>
299
+ d o
300
+ ti ve</w>
301
+ m on
302
+ ne w</w>
303
+ r it
304
+ tim e</w>
305
+ on s</w>
306
+ s o
307
+ m an</w>
308
+ d ec
309
+ c ent
310
+ l an
311
+ p i
312
+ ou r</w>
313
+ in ter
314
+ f er
315
+ g ra
316
+ g re
317
+ re s</w>
318
+ inc lu
319
+ m il
320
+ d uring</w>
321
+ ow n</w>
322
+ pre s
323
+ j u
324
+ n ed</w>
325
+ el l</w>
326
+ , @</w>
327
+ @ ,@</w>
328
+ it e</w>
329
+ g en
330
+ wh en</w>
331
+ si g
332
+ b i
333
+ re n
334
+ f a
335
+ g a
336
+ pla y
337
+ en g
338
+ tion al</w>
339
+ oun d</w>
340
+ th ou
341
+ m ore</w>
342
+ re e</w>
343
+ em ber</w>
344
+ e i
345
+ s ou
346
+ s ur
347
+ s ti
348
+ c ar
349
+ for m
350
+ l ar
351
+ s es</w>
352
+ t en
353
+ in to</w>
354
+ t u
355
+ c es</w>
356
+ mo st</w>
357
+ k ed</w>
358
+ wa y</w>
359
+ c re
360
+ c oun
361
+ u p</w>
362
+ l es</w>
363
+ ac e</w>
364
+ al s</w>
365
+ k e
366
+ w ould</w>
367
+ an t</w>
368
+ b er
369
+ f u
370
+ it ed</w>
371
+ p ri
372
+ whi le</w>
373
+ o ver</w>
374
+ ing s</w>
375
+ r e</w>
376
+ fi l
377
+ s y
378
+ e st
379
+ ab le</w>
380
+ w n</w>
381
+ s ea
382
+ ac h
383
+ s ing</w>
384
+ in s</w>
385
+ ti c</w>
386
+ i d</w>
387
+ on ly</w>
388
+ at es</w>
389
+ t ri
390
+ v ing</w>
391
+ b a
392
+ v el
393
+ an ce</w>
394
+ st a
395
+ er n</w>
396
+ f ol
397
+ e en</w>
398
+ in ed</w>
399
+ st ru
400
+ un i
401
+ g ame</w>
402
+ la r</w>
403
+ s el
404
+ b li
405
+ u sed</w>
406
+ n ing</w>
407
+ p s</w>
408
+ ti es</w>
409
+ k no
410
+ c or
411
+ f t</w>
412
+ rec or
413
+ b le</w>
414
+ vi e
415
+ y s</w>
416
+ w il
417
+ ic al</w>
418
+ ap p
419
+ t ro
420
+ th ree</w>
421
+ c la
422
+ ol d</w>
423
+ sh ed</w>
424
+ h ea
425
+ ab out</w>
426
+ w rit
427
+ th an</w>
428
+ st e
429
+ l ater</w>
430
+ ar i
431
+ d y</w>
432
+ pu bli
433
+ lo c
434
+ ag a
435
+ th rou
436
+ s si
437
+ en d</w>
438
+ ma y</w>
439
+ an g
440
+ ac h</w>
441
+ v es</w>
442
+ o g
443
+ hi m</w>
444
+ be tw
445
+ thou gh</w>
446
+ betw een</w>
447
+ u m</w>
448
+ st ar
449
+ sc ri
450
+ re a
451
+ on d</w>
452
+ shi p</w>
453
+ o k</w>
454
+ h el
455
+ s ong</w>
456
+ c hi
457
+ ca p
458
+ e ver</w>
459
+ da y</w>
460
+ c ri
461
+ s ome</w>
462
+ b ro
463
+ n o</w>
464
+ th ere</w>
465
+ an s</w>
466
+ al l
467
+ n um
468
+ r ed</w>
469
+ ear s</w>
470
+ st s</w>
471
+ an y</w>
472
+ w ar
473
+ p h
474
+ p p
475
+ g in
476
+ stru c
477
+ am er
478
+ pro duc
479
+ s ch
480
+ c es
481
+ ur e</w>
482
+ at ing</w>
483
+ em p
484
+ t or
485
+ sea son</w>
486
+ for e</w>
487
+ i c</w>
488
+ c ity</w>
489
+ g ro
490
+ fol low
491
+ su b
492
+ b el
493
+ y ear</w>
494
+ c an</w>
495
+ s in
496
+ wh ere</w>
497
+ an d
498
+ ma de</w>
499
+ re lea
500
+ s m
501
+ b l
502
+ t en</w>
503
+ wi th
504
+ s on
505
+ man y</w>
506
+ a re
507
+ e d
508
+ h ow
509
+ amer ic
510
+ ur y</w>
511
+ st u
512
+ mu si
513
+ c u
514
+ n am
515
+ em ent</w>
516
+ su ch</w>
517
+ al bu
518
+ bu il
519
+ be fore</w>
520
+ e f
521
+ ar m
522
+ t on</w>
523
+ the m</w>
524
+ c al
525
+ b ar
526
+ d es</w>
527
+ m at
528
+ gen er
529
+ o d</w>
530
+ ser ies</w>
531
+ c er
532
+ sh o
533
+ en ti
534
+ h er
535
+ o ver
536
+ an n
537
+ w ell</w>
538
+ wor ld</w>
539
+ g an</w>
540
+ e st</w>
541
+ sec ond</w>
542
+ t ers</w>
543
+ si de</w>
544
+ tr an
545
+ l ine</w>
546
+ tur e</w>
547
+ por t</w>
548
+ be ing</w>
549
+ y ears</w>
550
+ bo th</w>
551
+ in di
552
+ the se</w>
553
+ na tional</w>
554
+ hi stor
555
+ f e</w>
556
+ v o
557
+ st ed</w>
558
+ an i
559
+ b as
560
+ po in
561
+ s ing
562
+ fil m</w>
563
+ p en
564
+ su p
565
+ m is
566
+ c ro
567
+ st ri
568
+ l in
569
+ t re
570
+ wa r</w>
571
+ how ever</w>
572
+ y ing</w>
573
+ l ing</w>
574
+ y p
575
+ ec ted</w>
576
+ di rec
577
+ vi sion</w>
578
+ albu m</w>
579
+ th en</w>
580
+ l l</w>
581
+ se ver
582
+ throu gh</w>
583
+ kno wn</w>
584
+ b or
585
+ c ul
586
+ c lu
587
+ st er</w>
588
+ sou th</w>
589
+ r y</w>
590
+ ec t</w>
591
+ lo w</w>
592
+ p r
593
+ s k
594
+ is o
595
+ nor th</w>
596
+ par t</w>
597
+ f ac
598
+ t ly</w>
599
+ per i
600
+ e u
601
+ b att
602
+ st ate</w>
603
+ c ed</w>
604
+ con si
605
+ in f
606
+ po li
607
+ ol og
608
+ ear ly</w>
609
+ po si
610
+ am es</w>
611
+ w in
612
+ de vel
613
+ o b
614
+ v e
615
+ v en</w>
616
+ op er
617
+ g er
618
+ of fi
619
+ char ac
620
+ m s</w>
621
+ hi gh
622
+ a d</w>
623
+ th o
624
+ sever al</w>
625
+ d re
626
+ de scri
627
+ al e</w>
628
+ num ber</w>
629
+ a ir
630
+ inclu ding</w>
631
+ in st</w>
632
+ aga inst</w>
633
+ l s</w>
634
+ su l
635
+ ep iso
636
+ c am
637
+ di f
638
+ so ci
639
+ bec ame</w>
640
+ li ke</w>
641
+ t el
642
+ f our</w>
643
+ âĢ Ķ</w>
644
+ h ou
645
+ jo h
646
+ un ited</w>
647
+ in v
648
+ un der</w>
649
+ no v
650
+ ti v
651
+ su c
652
+ a tions</w>
653
+ ac k
654
+ t or</w>
655
+ r on
656
+ un d</w>
657
+ w s</w>
658
+ f o
659
+ g r
660
+ devel op
661
+ al though</w>
662
+ cont in
663
+ we st</w>
664
+ ori gin
665
+ musi c</w>
666
+ or s</w>
667
+ d on</w>
668
+ cent ury</w>
669
+ w ard</w>
670
+ wor k</w>
671
+ m e</w>
672
+ am i
673
+ ch a
674
+ ver y</w>
675
+ h ar
676
+ di s
677
+ z ed</w>
678
+ d o</w>
679
+ g s</w>
680
+ t ow
681
+ s ol
682
+ follow ing</w>
683
+ li on</w>
684
+ re ma
685
+ n s</w>
686
+ ti sh</w>
687
+ ch ur
688
+ s om
689
+ m p
690
+ t le</w>
691
+ go ver
692
+ d el
693
+ comp le
694
+ c ur
695
+ u se</w>
696
+ b ack</w>
697
+ h u
698
+ st ern</w>
699
+ be gan</w>
700
+ fi el
701
+ au se</w>
702
+ d ra
703
+ p as
704
+ b il
705
+ ca tion</w>
706
+ d ent</w>
707
+ b ed</w>
708
+ bec ause</w>
709
+ an t
710
+ ea m</w>
711
+ p hi
712
+ y o
713
+ contin u
714
+ ta in</w>
715
+ tr y</w>
716
+ f re
717
+ pe op
718
+ cal led</w>
719
+ f ound</w>
720
+ episo de</w>
721
+ de sig
722
+ m or
723
+ se t</w>
724
+ le y</w>
725
+ ea st</w>
726
+ tr ac
727
+ c ra
model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6b37b44d58a9b69bca2b27bd9d1f37fa878c2983d9c190b434e490e6a10bf4b6
3
+ size 1450428
preprocessor_config.json ADDED
@@ -0,0 +1,21 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "crop_size": 32,
3
+ "do_normalize": true,
4
+ "do_pad": true,
5
+ "do_rescale": true,
6
+ "do_resize": true,
7
+ "image_mean": [
8
+ 0.48145466,
9
+ 0.4578275,
10
+ 0.40821073
11
+ ],
12
+ "image_processor_type": "Owlv2ImageProcessor",
13
+ "image_std": [
14
+ 0.26862954,
15
+ 0.26130258,
16
+ 0.27577711
17
+ ],
18
+ "resample": 2,
19
+ "rescale_factor": 0.00392156862745098,
20
+ "size": 32
21
+ }
special_tokens_map.json ADDED
@@ -0,0 +1,30 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token": {
3
+ "content": "<|startoftext|>",
4
+ "lstrip": false,
5
+ "normalized": true,
6
+ "rstrip": false,
7
+ "single_word": false
8
+ },
9
+ "eos_token": {
10
+ "content": "<|endoftext|>",
11
+ "lstrip": false,
12
+ "normalized": false,
13
+ "rstrip": false,
14
+ "single_word": false
15
+ },
16
+ "pad_token": {
17
+ "content": "!",
18
+ "lstrip": false,
19
+ "normalized": false,
20
+ "rstrip": false,
21
+ "single_word": false
22
+ },
23
+ "unk_token": {
24
+ "content": "<|endoftext|>",
25
+ "lstrip": false,
26
+ "normalized": false,
27
+ "rstrip": false,
28
+ "single_word": false
29
+ }
30
+ }
tokenizer.json ADDED
@@ -0,0 +1,1853 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "version": "1.0",
3
+ "truncation": null,
4
+ "padding": null,
5
+ "added_tokens": [
6
+ {
7
+ "id": 0,
8
+ "content": "!",
9
+ "single_word": false,
10
+ "lstrip": false,
11
+ "rstrip": false,
12
+ "normalized": false,
13
+ "special": true
14
+ },
15
+ {
16
+ "id": 1,
17
+ "content": "<|startoftext|>",
18
+ "single_word": false,
19
+ "lstrip": false,
20
+ "rstrip": false,
21
+ "normalized": true,
22
+ "special": true
23
+ },
24
+ {
25
+ "id": 2,
26
+ "content": "<|endoftext|>",
27
+ "single_word": false,
28
+ "lstrip": false,
29
+ "rstrip": false,
30
+ "normalized": false,
31
+ "special": true
32
+ }
33
+ ],
34
+ "normalizer": {
35
+ "type": "Sequence",
36
+ "normalizers": [
37
+ {
38
+ "type": "NFC"
39
+ },
40
+ {
41
+ "type": "Replace",
42
+ "pattern": {
43
+ "Regex": "\\s+"
44
+ },
45
+ "content": " "
46
+ },
47
+ {
48
+ "type": "Lowercase"
49
+ }
50
+ ]
51
+ },
52
+ "pre_tokenizer": {
53
+ "type": "Sequence",
54
+ "pretokenizers": [
55
+ {
56
+ "type": "Split",
57
+ "pattern": {
58
+ "Regex": "'s|'t|'re|'ve|'m|'ll|'d|[\\p{L}]+|[\\p{N}]|[^\\s\\p{L}\\p{N}]+"
59
+ },
60
+ "behavior": "Removed",
61
+ "invert": true
62
+ },
63
+ {
64
+ "type": "ByteLevel",
65
+ "add_prefix_space": false,
66
+ "trim_offsets": true,
67
+ "use_regex": true
68
+ }
69
+ ]
70
+ },
71
+ "post_processor": {
72
+ "type": "RobertaProcessing",
73
+ "sep": [
74
+ "<|endoftext|>",
75
+ 2
76
+ ],
77
+ "cls": [
78
+ "<|startoftext|>",
79
+ 1
80
+ ],
81
+ "trim_offsets": false,
82
+ "add_prefix_space": false
83
+ },
84
+ "decoder": {
85
+ "type": "ByteLevel",
86
+ "add_prefix_space": true,
87
+ "trim_offsets": true,
88
+ "use_regex": true
89
+ },
90
+ "model": {
91
+ "type": "BPE",
92
+ "dropout": null,
93
+ "unk_token": "<|endoftext|>",
94
+ "continuing_subword_prefix": "",
95
+ "end_of_word_suffix": "</w>",
96
+ "fuse_unk": false,
97
+ "byte_fallback": false,
98
+ "vocab": {
99
+ "!": 0,
100
+ "<|startoftext|>": 1,
101
+ "<|endoftext|>": 2,
102
+ "\"": 3,
103
+ "#": 4,
104
+ "$": 5,
105
+ "%": 6,
106
+ "&": 7,
107
+ "'": 8,
108
+ "(": 9,
109
+ ")": 10,
110
+ "*": 11,
111
+ "+": 12,
112
+ ",": 13,
113
+ "-": 14,
114
+ ".": 15,
115
+ "/": 16,
116
+ "0": 17,
117
+ "1": 18,
118
+ "2": 19,
119
+ "3": 20,
120
+ "4": 21,
121
+ "5": 22,
122
+ "6": 23,
123
+ "7": 24,
124
+ "8": 25,
125
+ "9": 26,
126
+ ":": 27,
127
+ ";": 28,
128
+ "<": 29,
129
+ "=": 30,
130
+ ">": 31,
131
+ "?": 32,
132
+ "@": 33,
133
+ "[": 34,
134
+ "\\": 35,
135
+ "]": 36,
136
+ "^": 37,
137
+ "_": 38,
138
+ "`": 39,
139
+ "a": 40,
140
+ "b": 41,
141
+ "c": 42,
142
+ "d": 43,
143
+ "e": 44,
144
+ "f": 45,
145
+ "g": 46,
146
+ "h": 47,
147
+ "i": 48,
148
+ "j": 49,
149
+ "k": 50,
150
+ "l": 51,
151
+ "m": 52,
152
+ "n": 53,
153
+ "o": 54,
154
+ "p": 55,
155
+ "q": 56,
156
+ "r": 57,
157
+ "s": 58,
158
+ "t": 59,
159
+ "u": 60,
160
+ "v": 61,
161
+ "w": 62,
162
+ "x": 63,
163
+ "y": 64,
164
+ "z": 65,
165
+ "|": 66,
166
+ "}": 67,
167
+ "~": 68,
168
+ "¡": 69,
169
+ "¢": 70,
170
+ "£": 71,
171
+ "¤": 72,
172
+ "¥": 73,
173
+ "¦": 74,
174
+ "§": 75,
175
+ "¨": 76,
176
+ "©": 77,
177
+ "ª": 78,
178
+ "«": 79,
179
+ "¬": 80,
180
+ "®": 81,
181
+ "¯": 82,
182
+ "°": 83,
183
+ "±": 84,
184
+ "²": 85,
185
+ "³": 86,
186
+ "´": 87,
187
+ "µ": 88,
188
+ "¶": 89,
189
+ "·": 90,
190
+ "¸": 91,
191
+ "¹": 92,
192
+ "º": 93,
193
+ "»": 94,
194
+ "¼": 95,
195
+ "½": 96,
196
+ "¾": 97,
197
+ "¿": 98,
198
+ "Â": 99,
199
+ "Ã": 100,
200
+ "Ä": 101,
201
+ "Å": 102,
202
+ "Æ": 103,
203
+ "Ç": 104,
204
+ "È": 105,
205
+ "É": 106,
206
+ "Ê": 107,
207
+ "Ë": 108,
208
+ "Ì": 109,
209
+ "Í": 110,
210
+ "Î": 111,
211
+ "Ï": 112,
212
+ "Ð": 113,
213
+ "Ñ": 114,
214
+ "Ö": 115,
215
+ "×": 116,
216
+ "Ø": 117,
217
+ "Ù": 118,
218
+ "Ü": 119,
219
+ "à": 120,
220
+ "á": 121,
221
+ "â": 122,
222
+ "ã": 123,
223
+ "ä": 124,
224
+ "å": 125,
225
+ "æ": 126,
226
+ "ç": 127,
227
+ "è": 128,
228
+ "é": 129,
229
+ "ë": 130,
230
+ "ì": 131,
231
+ "ï": 132,
232
+ "Ģ": 133,
233
+ "ģ": 134,
234
+ "Ĥ": 135,
235
+ "ĥ": 136,
236
+ "Ħ": 137,
237
+ "ħ": 138,
238
+ "Ĩ": 139,
239
+ "ĩ": 140,
240
+ "Ī": 141,
241
+ "ī": 142,
242
+ "Ĭ": 143,
243
+ "ĭ": 144,
244
+ "Į": 145,
245
+ "į": 146,
246
+ "İ": 147,
247
+ "ı": 148,
248
+ "IJ": 149,
249
+ "ij": 150,
250
+ "Ĵ": 151,
251
+ "ĵ": 152,
252
+ "Ķ": 153,
253
+ "ķ": 154,
254
+ "ĸ": 155,
255
+ "Ĺ": 156,
256
+ "ĺ": 157,
257
+ "Ļ": 158,
258
+ "ļ": 159,
259
+ "Ľ": 160,
260
+ "ľ": 161,
261
+ "Ŀ": 162,
262
+ "ŀ": 163,
263
+ "Ł": 164,
264
+ "ł": 165,
265
+ "Ń": 166,
266
+ "e</w>": 167,
267
+ "s</w>": 168,
268
+ "f</w>": 169,
269
+ "d</w>": 170,
270
+ "r</w>": 171,
271
+ "n</w>": 172,
272
+ "l</w>": 173,
273
+ "y</w>": 174,
274
+ "a</w>": 175,
275
+ "c</w>": 176,
276
+ "i</w>": 177,
277
+ "k</w>": 178,
278
+ "g</w>": 179,
279
+ "t</w>": 180,
280
+ "m</w>": 181,
281
+ "p</w>": 182,
282
+ "h</w>": 183,
283
+ "x</w>": 184,
284
+ "ĵ</w>": 185,
285
+ "Ľ</w>": 186,
286
+ "u</w>": 187,
287
+ "o</w>": 188,
288
+ "¡</w>": 189,
289
+ "v</w>": 190,
290
+ "b</w>": 191,
291
+ "z</w>": 192,
292
+ "w</w>": 193,
293
+ "¸</w>": 194,
294
+ "ĩ</w>": 195,
295
+ "ĸ</w>": 196,
296
+ "Ħ</w>": 197,
297
+ "Ĭ</w>": 198,
298
+ "ĺ</w>": 199,
299
+ "©</w>": 200,
300
+ "į</w>": 201,
301
+ "Ĩ</w>": 202,
302
+ "¥</w>": 203,
303
+ ":</w>": 204,
304
+ "Ŀ</w>": 205,
305
+ "ŀ</w>": 206,
306
+ "§</w>": 207,
307
+ "j</w>": 208,
308
+ "¼</w>": 209,
309
+ "£</w>": 210,
310
+ "¹</w>": 211,
311
+ "*</w>": 212,
312
+ "µ</w>": 213,
313
+ "ģ</w>": 214,
314
+ "¢</w>": 215,
315
+ "ķ</w>": 216,
316
+ "q</w>": 217,
317
+ "³</w>": 218,
318
+ "ij</w>": 219,
319
+ "«</w>": 220,
320
+ "ħ</w>": 221,
321
+ "ī</w>": 222,
322
+ "Ķ</w>": 223,
323
+ "¤</w>": 224,
324
+ "²</w>": 225,
325
+ "Ļ</w>": 226,
326
+ "Ĵ</w>": 227,
327
+ "#</w>": 228,
328
+ "Į</w>": 229,
329
+ "ı</w>": 230,
330
+ "Ń</w>": 231,
331
+ "-</w>": 232,
332
+ "ĥ</w>": 233,
333
+ "½</w>": 234,
334
+ "Ĥ</w>": 235,
335
+ ".</w>": 236,
336
+ "¶</w>": 237,
337
+ "¨</w>": 238,
338
+ "®</w>": 239,
339
+ "¦</w>": 240,
340
+ "ĭ</w>": 241,
341
+ "&</w>": 242,
342
+ "Ī</w>": 243,
343
+ "Ģ</w>": 244,
344
+ "±</w>": 245,
345
+ "1</w>": 246,
346
+ "ľ</w>": 247,
347
+ "¯</w>": 248,
348
+ "¿</w>": 249,
349
+ "Ł</w>": 250,
350
+ "8</w>": 251,
351
+ "ł</w>": 252,
352
+ "5</w>": 253,
353
+ "º</w>": 254,
354
+ "IJ</w>": 255,
355
+ "°</w>": 256,
356
+ "»</w>": 257,
357
+ "ª</w>": 258,
358
+ "¾</w>": 259,
359
+ "|</w>": 260,
360
+ "·</w>": 261,
361
+ "<</w>": 262,
362
+ "Ĺ</w>": 263,
363
+ "%</w>": 264,
364
+ "`</w>": 265,
365
+ "]</w>": 266,
366
+ "´</w>": 267,
367
+ "2</w>": 268,
368
+ "@</w>": 269,
369
+ "[</w>": 270,
370
+ "0</w>": 271,
371
+ "¬</w>": 272,
372
+ "3</w>": 273,
373
+ "$</w>": 274,
374
+ ";</w>": 275,
375
+ "6</w>": 276,
376
+ "9</w>": 277,
377
+ "^</w>": 278,
378
+ "İ</w>": 279,
379
+ "~</w>": 280,
380
+ "=</w>": 281,
381
+ "\"</w>": 282,
382
+ "!</w>": 283,
383
+ "></w>": 284,
384
+ "}</w>": 285,
385
+ ",</w>": 286,
386
+ "'</w>": 287,
387
+ "+</w>": 288,
388
+ "(</w>": 289,
389
+ "ļ</w>": 290,
390
+ "?</w>": 291,
391
+ "/</w>": 292,
392
+ "_</w>": 293,
393
+ "4</w>": 294,
394
+ ")</w>": 295,
395
+ "\\</w>": 296,
396
+ "7</w>": 297,
397
+ "th": 298,
398
+ "the</w>": 299,
399
+ "in": 300,
400
+ "an": 301,
401
+ "ed</w>": 302,
402
+ "er": 303,
403
+ "re": 304,
404
+ "ar": 305,
405
+ "ti": 306,
406
+ "on": 307,
407
+ "en": 308,
408
+ "of</w>": 309,
409
+ "or": 310,
410
+ "and</w>": 311,
411
+ "er</w>": 312,
412
+ "on</w>": 313,
413
+ "in</w>": 314,
414
+ "ing</w>": 315,
415
+ "st": 316,
416
+ "ro": 317,
417
+ "al": 318,
418
+ "it": 319,
419
+ "to</w>": 320,
420
+ "as</w>": 321,
421
+ "at": 322,
422
+ "es</w>": 323,
423
+ "ou": 324,
424
+ "hi": 325,
425
+ "ac": 326,
426
+ "si": 327,
427
+ "at</w>": 328,
428
+ "ri": 329,
429
+ "al</w>": 330,
430
+ "el": 331,
431
+ "an</w>": 332,
432
+ "am": 333,
433
+ "or</w>": 334,
434
+ "st</w>": 335,
435
+ "li": 336,
436
+ "ur": 337,
437
+ "ec": 338,
438
+ "om": 339,
439
+ "di": 340,
440
+ "was</w>": 341,
441
+ "ly</w>": 342,
442
+ "en</w>": 343,
443
+ "ea": 344,
444
+ "ch": 345,
445
+ "un": 346,
446
+ "tion</w>": 347,
447
+ "la": 348,
448
+ "is</w>": 349,
449
+ "fi": 350,
450
+ "ol": 351,
451
+ "de": 352,
452
+ "-@</w>": 353,
453
+ "@-@</w>": 354,
454
+ "ra": 355,
455
+ "vi": 356,
456
+ "le</w>": 357,
457
+ "lo": 358,
458
+ "sh": 359,
459
+ "em": 360,
460
+ "be": 361,
461
+ "that</w>": 362,
462
+ "'s</w>": 363,
463
+ "con": 364,
464
+ "ma": 365,
465
+ "for</w>": 366,
466
+ "ha": 367,
467
+ "su": 368,
468
+ "by</w>": 369,
469
+ "ith</w>": 370,
470
+ "ve</w>": 371,
471
+ "with</w>": 372,
472
+ "se</w>": 373,
473
+ "ch</w>": 374,
474
+ "the": 375,
475
+ "ent": 376,
476
+ "po": 377,
477
+ "ce</w>": 378,
478
+ "il": 379,
479
+ "se": 380,
480
+ "ent</w>": 381,
481
+ "le": 382,
482
+ "com": 383,
483
+ "sp": 384,
484
+ "ere</w>": 385,
485
+ "pro": 386,
486
+ "no": 387,
487
+ "bu": 388,
488
+ "wh": 389,
489
+ "it</w>": 390,
490
+ "th</w>": 391,
491
+ "ver": 392,
492
+ "ne": 393,
493
+ "ca": 394,
494
+ "is": 395,
495
+ "for": 396,
496
+ "ag": 397,
497
+ "ers</w>": 398,
498
+ "mo": 399,
499
+ "gh": 400,
500
+ "fro": 401,
501
+ "ted</w>": 402,
502
+ "from</w>": 403,
503
+ "tion": 404,
504
+ "op": 405,
505
+ "his</w>": 406,
506
+ "ad": 407,
507
+ "ab": 408,
508
+ "ic": 409,
509
+ "he</w>": 410,
510
+ "oun": 411,
511
+ "as": 412,
512
+ "ts</w>": 413,
513
+ "sc": 414,
514
+ "de</w>": 415,
515
+ "ow": 416,
516
+ "ex": 417,
517
+ "whi": 418,
518
+ "ru": 419,
519
+ "ter</w>": 420,
520
+ "ap": 421,
521
+ "ds</w>": 422,
522
+ "were</w>": 423,
523
+ "pre": 424,
524
+ "du": 425,
525
+ "gu": 426,
526
+ "par": 427,
527
+ "ir": 428,
528
+ "bo": 429,
529
+ "ther</w>": 430,
530
+ "qu": 431,
531
+ "lu": 432,
532
+ "ter": 433,
533
+ "tw": 434,
534
+ "es": 435,
535
+ "rec": 436,
536
+ "per": 437,
537
+ "ta": 438,
538
+ "ate</w>": 439,
539
+ "ver</w>": 440,
540
+ "ated</w>": 441,
541
+ "ding</w>": 442,
542
+ "ity</w>": 443,
543
+ "man": 444,
544
+ "ear": 445,
545
+ "sed</w>": 446,
546
+ "ded</w>": 447,
547
+ "au": 448,
548
+ "all</w>": 449,
549
+ "ame</w>": 450,
550
+ "ci": 451,
551
+ "one</w>": 452,
552
+ "ing": 453,
553
+ "are</w>": 454,
554
+ "af": 455,
555
+ "ir</w>": 456,
556
+ "ation</w>": 457,
557
+ "âĢ": 458,
558
+ "had</w>": 459,
559
+ "tr": 460,
560
+ "ul": 461,
561
+ "ld</w>": 462,
562
+ "which</w>": 463,
563
+ "wa": 464,
564
+ "im": 465,
565
+ "lea": 466,
566
+ "be</w>": 467,
567
+ "to": 468,
568
+ "tim": 469,
569
+ "fir": 470,
570
+ "wor": 471,
571
+ "ong</w>": 472,
572
+ "por": 473,
573
+ "mar": 474,
574
+ "me": 475,
575
+ "ally</w>": 476,
576
+ "so</w>": 477,
577
+ "out</w>": 478,
578
+ "tions</w>": 479,
579
+ "its</w>": 480,
580
+ "gh</w>": 481,
581
+ "ge</w>": 482,
582
+ "ber</w>": 483,
583
+ "fe": 484,
584
+ "pu": 485,
585
+ "ser": 486,
586
+ "der": 487,
587
+ "pl": 488,
588
+ "ss</w>": 489,
589
+ "ine</w>": 490,
590
+ "inc": 491,
591
+ "mi": 492,
592
+ "ght</w>": 493,
593
+ "go": 494,
594
+ "this</w>": 495,
595
+ "tur": 496,
596
+ "da": 497,
597
+ "rou": 498,
598
+ "but</w>": 499,
599
+ "um": 500,
600
+ "son</w>": 501,
601
+ "we": 502,
602
+ "ved</w>": 503,
603
+ "sion</w>": 504,
604
+ "ke</w>": 505,
605
+ "pla": 506,
606
+ "their</w>": 507,
607
+ "ies</w>": 508,
608
+ "first</w>": 509,
609
+ "sa": 510,
610
+ "oc": 511,
611
+ "att": 512,
612
+ "of": 513,
613
+ "pe": 514,
614
+ "not</w>": 515,
615
+ "gi": 516,
616
+ "na": 517,
617
+ "ary</w>": 518,
618
+ "mu": 519,
619
+ "led</w>": 520,
620
+ "âĢĵ</w>": 521,
621
+ "her</w>": 522,
622
+ "ran": 523,
623
+ "co": 524,
624
+ "they</w>": 525,
625
+ "der</w>": 526,
626
+ "ali": 527,
627
+ "also</w>": 528,
628
+ "ore</w>": 529,
629
+ "ep": 530,
630
+ "ould</w>": 531,
631
+ "after</w>": 532,
632
+ "shi": 533,
633
+ "us</w>": 534,
634
+ "et</w>": 535,
635
+ "tic": 536,
636
+ "stor": 537,
637
+ "wi": 538,
638
+ "ev": 539,
639
+ "other</w>": 540,
640
+ "sh</w>": 541,
641
+ "ting</w>": 542,
642
+ "ard</w>": 543,
643
+ "te": 544,
644
+ "two</w>": 545,
645
+ "ni": 546,
646
+ "have</w>": 547,
647
+ "our": 548,
648
+ "comm": 549,
649
+ "te</w>": 550,
650
+ "ack</w>": 551,
651
+ "oo": 552,
652
+ "fin": 553,
653
+ "sec": 554,
654
+ "ents</w>": 555,
655
+ "has</w>": 556,
656
+ "comp": 557,
657
+ "bec": 558,
658
+ "ks</w>": 559,
659
+ "cont": 560,
660
+ "land</w>": 561,
661
+ "been</w>": 562,
662
+ "ence</w>": 563,
663
+ "king</w>": 564,
664
+ "el</w>": 565,
665
+ "age</w>": 566,
666
+ "low": 567,
667
+ "min": 568,
668
+ ".@</w>": 569,
669
+ "@.@</w>": 570,
670
+ "ome</w>": 571,
671
+ "ment</w>": 572,
672
+ "char": 573,
673
+ "ge": 574,
674
+ "ater</w>": 575,
675
+ "nor": 576,
676
+ "ho": 577,
677
+ "ous</w>": 578,
678
+ "who</w>": 579,
679
+ "ear</w>": 580,
680
+ "spec": 581,
681
+ "col": 582,
682
+ "ely</w>": 583,
683
+ "ty</w>": 584,
684
+ "jo": 585,
685
+ "uring</w>": 586,
686
+ "duc": 587,
687
+ "bri": 588,
688
+ "str": 589,
689
+ "can": 590,
690
+ "ori": 591,
691
+ "tra": 592,
692
+ "pa": 593,
693
+ "she</w>": 594,
694
+ "do": 595,
695
+ "tive</w>": 596,
696
+ "mon": 597,
697
+ "new</w>": 598,
698
+ "rit": 599,
699
+ "time</w>": 600,
700
+ "ons</w>": 601,
701
+ "so": 602,
702
+ "man</w>": 603,
703
+ "dec": 604,
704
+ "cent": 605,
705
+ "lan": 606,
706
+ "pi": 607,
707
+ "our</w>": 608,
708
+ "inter": 609,
709
+ "fer": 610,
710
+ "gra": 611,
711
+ "gre": 612,
712
+ "res</w>": 613,
713
+ "inclu": 614,
714
+ "mil": 615,
715
+ "during</w>": 616,
716
+ "own</w>": 617,
717
+ "pres": 618,
718
+ "ju": 619,
719
+ "ned</w>": 620,
720
+ "ell</w>": 621,
721
+ ",@</w>": 622,
722
+ "@,@</w>": 623,
723
+ "ite</w>": 624,
724
+ "gen": 625,
725
+ "when</w>": 626,
726
+ "sig": 627,
727
+ "bi": 628,
728
+ "ren": 629,
729
+ "fa": 630,
730
+ "ga": 631,
731
+ "play": 632,
732
+ "eng": 633,
733
+ "tional</w>": 634,
734
+ "ound</w>": 635,
735
+ "thou": 636,
736
+ "more</w>": 637,
737
+ "ree</w>": 638,
738
+ "ember</w>": 639,
739
+ "ei": 640,
740
+ "sou": 641,
741
+ "sur": 642,
742
+ "sti": 643,
743
+ "car": 644,
744
+ "form": 645,
745
+ "lar": 646,
746
+ "ses</w>": 647,
747
+ "ten": 648,
748
+ "into</w>": 649,
749
+ "tu": 650,
750
+ "ces</w>": 651,
751
+ "most</w>": 652,
752
+ "ked</w>": 653,
753
+ "way</w>": 654,
754
+ "cre": 655,
755
+ "coun": 656,
756
+ "up</w>": 657,
757
+ "les</w>": 658,
758
+ "ace</w>": 659,
759
+ "als</w>": 660,
760
+ "ke": 661,
761
+ "would</w>": 662,
762
+ "ant</w>": 663,
763
+ "ber": 664,
764
+ "fu": 665,
765
+ "ited</w>": 666,
766
+ "pri": 667,
767
+ "while</w>": 668,
768
+ "over</w>": 669,
769
+ "ings</w>": 670,
770
+ "re</w>": 671,
771
+ "fil": 672,
772
+ "sy": 673,
773
+ "est": 674,
774
+ "able</w>": 675,
775
+ "wn</w>": 676,
776
+ "sea": 677,
777
+ "ach": 678,
778
+ "sing</w>": 679,
779
+ "ins</w>": 680,
780
+ "tic</w>": 681,
781
+ "id</w>": 682,
782
+ "only</w>": 683,
783
+ "ates</w>": 684,
784
+ "tri": 685,
785
+ "ving</w>": 686,
786
+ "ba": 687,
787
+ "vel": 688,
788
+ "ance</w>": 689,
789
+ "sta": 690,
790
+ "ern</w>": 691,
791
+ "fol": 692,
792
+ "een</w>": 693,
793
+ "ined</w>": 694,
794
+ "stru": 695,
795
+ "uni": 696,
796
+ "game</w>": 697,
797
+ "lar</w>": 698,
798
+ "sel": 699,
799
+ "bli": 700,
800
+ "used</w>": 701,
801
+ "ning</w>": 702,
802
+ "ps</w>": 703,
803
+ "ties</w>": 704,
804
+ "kno": 705,
805
+ "cor": 706,
806
+ "ft</w>": 707,
807
+ "recor": 708,
808
+ "ble</w>": 709,
809
+ "vie": 710,
810
+ "ys</w>": 711,
811
+ "wil": 712,
812
+ "ical</w>": 713,
813
+ "app": 714,
814
+ "tro": 715,
815
+ "three</w>": 716,
816
+ "cla": 717,
817
+ "old</w>": 718,
818
+ "shed</w>": 719,
819
+ "hea": 720,
820
+ "about</w>": 721,
821
+ "writ": 722,
822
+ "than</w>": 723,
823
+ "ste": 724,
824
+ "later</w>": 725,
825
+ "ari": 726,
826
+ "dy</w>": 727,
827
+ "publi": 728,
828
+ "loc": 729,
829
+ "aga": 730,
830
+ "throu": 731,
831
+ "ssi": 732,
832
+ "end</w>": 733,
833
+ "may</w>": 734,
834
+ "ang": 735,
835
+ "ach</w>": 736,
836
+ "ves</w>": 737,
837
+ "og": 738,
838
+ "him</w>": 739,
839
+ "betw": 740,
840
+ "though</w>": 741,
841
+ "between</w>": 742,
842
+ "um</w>": 743,
843
+ "star": 744,
844
+ "scri": 745,
845
+ "rea": 746,
846
+ "ond</w>": 747,
847
+ "ship</w>": 748,
848
+ "ok</w>": 749,
849
+ "hel": 750,
850
+ "song</w>": 751,
851
+ "chi": 752,
852
+ "cap": 753,
853
+ "ever</w>": 754,
854
+ "day</w>": 755,
855
+ "cri": 756,
856
+ "some</w>": 757,
857
+ "bro": 758,
858
+ "no</w>": 759,
859
+ "there</w>": 760,
860
+ "ans</w>": 761,
861
+ "all": 762,
862
+ "num": 763,
863
+ "red</w>": 764,
864
+ "ears</w>": 765,
865
+ "sts</w>": 766,
866
+ "any</w>": 767,
867
+ "war": 768,
868
+ "ph": 769,
869
+ "pp": 770,
870
+ "gin": 771,
871
+ "struc": 772,
872
+ "amer": 773,
873
+ "produc": 774,
874
+ "sch": 775,
875
+ "ces": 776,
876
+ "ure</w>": 777,
877
+ "ating</w>": 778,
878
+ "emp": 779,
879
+ "tor": 780,
880
+ "season</w>": 781,
881
+ "fore</w>": 782,
882
+ "ic</w>": 783,
883
+ "city</w>": 784,
884
+ "gro": 785,
885
+ "follow": 786,
886
+ "sub": 787,
887
+ "bel": 788,
888
+ "year</w>": 789,
889
+ "can</w>": 790,
890
+ "sin": 791,
891
+ "where</w>": 792,
892
+ "and": 793,
893
+ "made</w>": 794,
894
+ "relea": 795,
895
+ "sm": 796,
896
+ "bl": 797,
897
+ "ten</w>": 798,
898
+ "with": 799,
899
+ "son": 800,
900
+ "many</w>": 801,
901
+ "are": 802,
902
+ "ed": 803,
903
+ "how": 804,
904
+ "americ": 805,
905
+ "ury</w>": 806,
906
+ "stu": 807,
907
+ "musi": 808,
908
+ "cu": 809,
909
+ "nam": 810,
910
+ "ement</w>": 811,
911
+ "such</w>": 812,
912
+ "albu": 813,
913
+ "buil": 814,
914
+ "before</w>": 815,
915
+ "ef": 816,
916
+ "arm": 817,
917
+ "ton</w>": 818,
918
+ "them</w>": 819,
919
+ "cal": 820,
920
+ "bar": 821,
921
+ "des</w>": 822,
922
+ "mat": 823,
923
+ "gener": 824,
924
+ "od</w>": 825,
925
+ "series</w>": 826,
926
+ "cer": 827,
927
+ "sho": 828,
928
+ "enti": 829,
929
+ "her": 830,
930
+ "over": 831,
931
+ "ann": 832,
932
+ "well</w>": 833,
933
+ "world</w>": 834,
934
+ "gan</w>": 835,
935
+ "est</w>": 836,
936
+ "second</w>": 837,
937
+ "ters</w>": 838,
938
+ "side</w>": 839,
939
+ "tran": 840,
940
+ "line</w>": 841,
941
+ "ture</w>": 842,
942
+ "port</w>": 843,
943
+ "being</w>": 844,
944
+ "years</w>": 845,
945
+ "both</w>": 846,
946
+ "indi": 847,
947
+ "these</w>": 848,
948
+ "national</w>": 849,
949
+ "histor": 850,
950
+ "fe</w>": 851,
951
+ "vo": 852,
952
+ "sted</w>": 853,
953
+ "ani": 854,
954
+ "bas": 855,
955
+ "poin": 856,
956
+ "sing": 857,
957
+ "film</w>": 858,
958
+ "pen": 859,
959
+ "sup": 860,
960
+ "mis": 861,
961
+ "cro": 862,
962
+ "stri": 863,
963
+ "lin": 864,
964
+ "tre": 865,
965
+ "war</w>": 866,
966
+ "however</w>": 867,
967
+ "ying</w>": 868,
968
+ "ling</w>": 869,
969
+ "yp": 870,
970
+ "ected</w>": 871,
971
+ "direc": 872,
972
+ "vision</w>": 873,
973
+ "album</w>": 874,
974
+ "then</w>": 875,
975
+ "ll</w>": 876,
976
+ "sever": 877,
977
+ "through</w>": 878,
978
+ "known</w>": 879,
979
+ "bor": 880,
980
+ "cul": 881,
981
+ "clu": 882,
982
+ "ster</w>": 883,
983
+ "south</w>": 884,
984
+ "ry</w>": 885,
985
+ "ect</w>": 886,
986
+ "low</w>": 887,
987
+ "pr": 888,
988
+ "sk": 889,
989
+ "iso": 890,
990
+ "north</w>": 891,
991
+ "part</w>": 892,
992
+ "fac": 893,
993
+ "tly</w>": 894,
994
+ "peri": 895,
995
+ "eu": 896,
996
+ "batt": 897,
997
+ "state</w>": 898,
998
+ "ced</w>": 899,
999
+ "consi": 900,
1000
+ "inf": 901,
1001
+ "poli": 902,
1002
+ "olog": 903,
1003
+ "early</w>": 904,
1004
+ "posi": 905,
1005
+ "ames</w>": 906,
1006
+ "win": 907,
1007
+ "devel": 908,
1008
+ "ob": 909,
1009
+ "ve": 910,
1010
+ "ven</w>": 911,
1011
+ "oper": 912,
1012
+ "ger": 913,
1013
+ "offi": 914,
1014
+ "charac": 915,
1015
+ "ms</w>": 916,
1016
+ "high": 917,
1017
+ "ad</w>": 918,
1018
+ "tho": 919,
1019
+ "several</w>": 920,
1020
+ "dre": 921,
1021
+ "descri": 922,
1022
+ "ale</w>": 923,
1023
+ "number</w>": 924,
1024
+ "air": 925,
1025
+ "including</w>": 926,
1026
+ "inst</w>": 927,
1027
+ "against</w>": 928,
1028
+ "ls</w>": 929,
1029
+ "sul": 930,
1030
+ "episo": 931,
1031
+ "cam": 932,
1032
+ "dif": 933,
1033
+ "soci": 934,
1034
+ "became</w>": 935,
1035
+ "like</w>": 936,
1036
+ "tel": 937,
1037
+ "four</w>": 938,
1038
+ "âĢĶ</w>": 939,
1039
+ "hou": 940,
1040
+ "joh": 941,
1041
+ "united</w>": 942,
1042
+ "inv": 943,
1043
+ "under</w>": 944,
1044
+ "nov": 945,
1045
+ "tiv": 946,
1046
+ "suc": 947,
1047
+ "ations</w>": 948,
1048
+ "ack": 949,
1049
+ "tor</w>": 950,
1050
+ "ron": 951,
1051
+ "und</w>": 952,
1052
+ "ws</w>": 953,
1053
+ "fo": 954,
1054
+ "gr": 955,
1055
+ "develop": 956,
1056
+ "although</w>": 957,
1057
+ "contin": 958,
1058
+ "west</w>": 959,
1059
+ "origin": 960,
1060
+ "music</w>": 961,
1061
+ "ors</w>": 962,
1062
+ "don</w>": 963,
1063
+ "century</w>": 964,
1064
+ "ward</w>": 965,
1065
+ "work</w>": 966,
1066
+ "me</w>": 967,
1067
+ "ami": 968,
1068
+ "cha": 969,
1069
+ "very</w>": 970,
1070
+ "har": 971,
1071
+ "dis": 972,
1072
+ "zed</w>": 973,
1073
+ "do</w>": 974,
1074
+ "gs</w>": 975,
1075
+ "tow": 976,
1076
+ "sol": 977,
1077
+ "following</w>": 978,
1078
+ "lion</w>": 979,
1079
+ "rema": 980,
1080
+ "ns</w>": 981,
1081
+ "tish</w>": 982,
1082
+ "chur": 983,
1083
+ "som": 984,
1084
+ "mp": 985,
1085
+ "tle</w>": 986,
1086
+ "gover": 987,
1087
+ "del": 988,
1088
+ "comple": 989,
1089
+ "cur": 990,
1090
+ "use</w>": 991,
1091
+ "back</w>": 992,
1092
+ "hu": 993,
1093
+ "stern</w>": 994,
1094
+ "began</w>": 995,
1095
+ "fiel": 996,
1096
+ "ause</w>": 997,
1097
+ "dra": 998,
1098
+ "pas": 999,
1099
+ "bil": 1000,
1100
+ "cation</w>": 1001,
1101
+ "dent</w>": 1002,
1102
+ "bed</w>": 1003,
1103
+ "because</w>": 1004,
1104
+ "ant": 1005,
1105
+ "eam</w>": 1006,
1106
+ "phi": 1007,
1107
+ "yo": 1008,
1108
+ "continu": 1009,
1109
+ "tain</w>": 1010,
1110
+ "try</w>": 1011,
1111
+ "fre": 1012,
1112
+ "peop": 1013,
1113
+ "called</w>": 1014,
1114
+ "found</w>": 1015,
1115
+ "episode</w>": 1016,
1116
+ "desig": 1017,
1117
+ "mor": 1018,
1118
+ "set</w>": 1019,
1119
+ "ley</w>": 1020,
1120
+ "east</w>": 1021,
1121
+ "trac": 1022,
1122
+ "cra": 1023
1123
+ },
1124
+ "merges": [
1125
+ "t h",
1126
+ "th e</w>",
1127
+ "i n",
1128
+ "a n",
1129
+ "e d</w>",
1130
+ "e r",
1131
+ "r e",
1132
+ "a r",
1133
+ "t i",
1134
+ "o n",
1135
+ "e n",
1136
+ "o f</w>",
1137
+ "o r",
1138
+ "an d</w>",
1139
+ "e r</w>",
1140
+ "o n</w>",
1141
+ "i n</w>",
1142
+ "in g</w>",
1143
+ "s t",
1144
+ "r o",
1145
+ "a l",
1146
+ "i t",
1147
+ "t o</w>",
1148
+ "a s</w>",
1149
+ "a t",
1150
+ "e s</w>",
1151
+ "o u",
1152
+ "h i",
1153
+ "a c",
1154
+ "s i",
1155
+ "a t</w>",
1156
+ "r i",
1157
+ "a l</w>",
1158
+ "e l",
1159
+ "a n</w>",
1160
+ "a m",
1161
+ "o r</w>",
1162
+ "s t</w>",
1163
+ "l i",
1164
+ "u r",
1165
+ "e c",
1166
+ "o m",
1167
+ "d i",
1168
+ "w as</w>",
1169
+ "l y</w>",
1170
+ "e n</w>",
1171
+ "e a",
1172
+ "c h",
1173
+ "u n",
1174
+ "ti on</w>",
1175
+ "l a",
1176
+ "i s</w>",
1177
+ "f i",
1178
+ "o l",
1179
+ "d e",
1180
+ "- @</w>",
1181
+ "@ -@</w>",
1182
+ "r a",
1183
+ "v i",
1184
+ "l e</w>",
1185
+ "l o",
1186
+ "s h",
1187
+ "e m",
1188
+ "b e",
1189
+ "th at</w>",
1190
+ "' s</w>",
1191
+ "c on",
1192
+ "m a",
1193
+ "f or</w>",
1194
+ "h a",
1195
+ "s u",
1196
+ "b y</w>",
1197
+ "it h</w>",
1198
+ "v e</w>",
1199
+ "w ith</w>",
1200
+ "s e</w>",
1201
+ "c h</w>",
1202
+ "th e",
1203
+ "en t",
1204
+ "p o",
1205
+ "c e</w>",
1206
+ "i l",
1207
+ "s e",
1208
+ "en t</w>",
1209
+ "l e",
1210
+ "c om",
1211
+ "s p",
1212
+ "er e</w>",
1213
+ "p ro",
1214
+ "n o",
1215
+ "b u",
1216
+ "w h",
1217
+ "i t</w>",
1218
+ "t h</w>",
1219
+ "v er",
1220
+ "n e",
1221
+ "c a",
1222
+ "i s",
1223
+ "f or",
1224
+ "a g",
1225
+ "er s</w>",
1226
+ "m o",
1227
+ "g h",
1228
+ "f ro",
1229
+ "t ed</w>",
1230
+ "fro m</w>",
1231
+ "ti on",
1232
+ "o p",
1233
+ "hi s</w>",
1234
+ "a d",
1235
+ "a b",
1236
+ "i c",
1237
+ "h e</w>",
1238
+ "ou n",
1239
+ "a s",
1240
+ "t s</w>",
1241
+ "s c",
1242
+ "d e</w>",
1243
+ "o w",
1244
+ "e x",
1245
+ "w hi",
1246
+ "r u",
1247
+ "t er</w>",
1248
+ "a p",
1249
+ "d s</w>",
1250
+ "w ere</w>",
1251
+ "p re",
1252
+ "d u",
1253
+ "g u",
1254
+ "p ar",
1255
+ "i r",
1256
+ "b o",
1257
+ "th er</w>",
1258
+ "q u",
1259
+ "l u",
1260
+ "t er",
1261
+ "t w",
1262
+ "e s",
1263
+ "re c",
1264
+ "p er",
1265
+ "t a",
1266
+ "at e</w>",
1267
+ "v er</w>",
1268
+ "at ed</w>",
1269
+ "d ing</w>",
1270
+ "it y</w>",
1271
+ "m an",
1272
+ "e ar",
1273
+ "s ed</w>",
1274
+ "d ed</w>",
1275
+ "a u",
1276
+ "al l</w>",
1277
+ "am e</w>",
1278
+ "c i",
1279
+ "on e</w>",
1280
+ "in g",
1281
+ "ar e</w>",
1282
+ "a f",
1283
+ "i r</w>",
1284
+ "a tion</w>",
1285
+ "â Ģ",
1286
+ "ha d</w>",
1287
+ "t r",
1288
+ "u l",
1289
+ "l d</w>",
1290
+ "whi ch</w>",
1291
+ "w a",
1292
+ "i m",
1293
+ "l ea",
1294
+ "b e</w>",
1295
+ "t o",
1296
+ "ti m",
1297
+ "fi r",
1298
+ "w or",
1299
+ "on g</w>",
1300
+ "p or",
1301
+ "m ar",
1302
+ "m e",
1303
+ "al ly</w>",
1304
+ "s o</w>",
1305
+ "ou t</w>",
1306
+ "tion s</w>",
1307
+ "it s</w>",
1308
+ "g h</w>",
1309
+ "g e</w>",
1310
+ "b er</w>",
1311
+ "f e",
1312
+ "p u",
1313
+ "s er",
1314
+ "d er",
1315
+ "p l",
1316
+ "s s</w>",
1317
+ "in e</w>",
1318
+ "in c",
1319
+ "m i",
1320
+ "gh t</w>",
1321
+ "g o",
1322
+ "th is</w>",
1323
+ "t ur",
1324
+ "d a",
1325
+ "ro u",
1326
+ "bu t</w>",
1327
+ "u m",
1328
+ "s on</w>",
1329
+ "w e",
1330
+ "v ed</w>",
1331
+ "si on</w>",
1332
+ "k e</w>",
1333
+ "p la",
1334
+ "the ir</w>",
1335
+ "i es</w>",
1336
+ "fir st</w>",
1337
+ "s a",
1338
+ "o c",
1339
+ "at t",
1340
+ "o f",
1341
+ "p e",
1342
+ "no t</w>",
1343
+ "g i",
1344
+ "n a",
1345
+ "ar y</w>",
1346
+ "m u",
1347
+ "l ed</w>",
1348
+ "âĢ ĵ</w>",
1349
+ "h er</w>",
1350
+ "r an",
1351
+ "c o",
1352
+ "the y</w>",
1353
+ "d er</w>",
1354
+ "al i",
1355
+ "al so</w>",
1356
+ "or e</w>",
1357
+ "e p",
1358
+ "ou ld</w>",
1359
+ "af ter</w>",
1360
+ "s hi",
1361
+ "u s</w>",
1362
+ "e t</w>",
1363
+ "ti c",
1364
+ "st or",
1365
+ "w i",
1366
+ "e v",
1367
+ "o ther</w>",
1368
+ "s h</w>",
1369
+ "t ing</w>",
1370
+ "ar d</w>",
1371
+ "t e",
1372
+ "tw o</w>",
1373
+ "n i",
1374
+ "ha ve</w>",
1375
+ "ou r",
1376
+ "com m",
1377
+ "t e</w>",
1378
+ "ac k</w>",
1379
+ "o o",
1380
+ "f in",
1381
+ "s ec",
1382
+ "ent s</w>",
1383
+ "h as</w>",
1384
+ "com p",
1385
+ "b ec",
1386
+ "k s</w>",
1387
+ "con t",
1388
+ "l and</w>",
1389
+ "be en</w>",
1390
+ "en ce</w>",
1391
+ "k ing</w>",
1392
+ "e l</w>",
1393
+ "ag e</w>",
1394
+ "lo w",
1395
+ "m in",
1396
+ ". @</w>",
1397
+ "@ .@</w>",
1398
+ "om e</w>",
1399
+ "m ent</w>",
1400
+ "ch ar",
1401
+ "g e",
1402
+ "at er</w>",
1403
+ "n or",
1404
+ "h o",
1405
+ "ou s</w>",
1406
+ "wh o</w>",
1407
+ "ea r</w>",
1408
+ "sp ec",
1409
+ "c ol",
1410
+ "el y</w>",
1411
+ "t y</w>",
1412
+ "j o",
1413
+ "ur ing</w>",
1414
+ "du c",
1415
+ "b ri",
1416
+ "st r",
1417
+ "c an",
1418
+ "or i",
1419
+ "t ra",
1420
+ "p a",
1421
+ "sh e</w>",
1422
+ "d o",
1423
+ "ti ve</w>",
1424
+ "m on",
1425
+ "ne w</w>",
1426
+ "r it",
1427
+ "tim e</w>",
1428
+ "on s</w>",
1429
+ "s o",
1430
+ "m an</w>",
1431
+ "d ec",
1432
+ "c ent",
1433
+ "l an",
1434
+ "p i",
1435
+ "ou r</w>",
1436
+ "in ter",
1437
+ "f er",
1438
+ "g ra",
1439
+ "g re",
1440
+ "re s</w>",
1441
+ "inc lu",
1442
+ "m il",
1443
+ "d uring</w>",
1444
+ "ow n</w>",
1445
+ "pre s",
1446
+ "j u",
1447
+ "n ed</w>",
1448
+ "el l</w>",
1449
+ ", @</w>",
1450
+ "@ ,@</w>",
1451
+ "it e</w>",
1452
+ "g en",
1453
+ "wh en</w>",
1454
+ "si g",
1455
+ "b i",
1456
+ "re n",
1457
+ "f a",
1458
+ "g a",
1459
+ "pla y",
1460
+ "en g",
1461
+ "tion al</w>",
1462
+ "oun d</w>",
1463
+ "th ou",
1464
+ "m ore</w>",
1465
+ "re e</w>",
1466
+ "em ber</w>",
1467
+ "e i",
1468
+ "s ou",
1469
+ "s ur",
1470
+ "s ti",
1471
+ "c ar",
1472
+ "for m",
1473
+ "l ar",
1474
+ "s es</w>",
1475
+ "t en",
1476
+ "in to</w>",
1477
+ "t u",
1478
+ "c es</w>",
1479
+ "mo st</w>",
1480
+ "k ed</w>",
1481
+ "wa y</w>",
1482
+ "c re",
1483
+ "c oun",
1484
+ "u p</w>",
1485
+ "l es</w>",
1486
+ "ac e</w>",
1487
+ "al s</w>",
1488
+ "k e",
1489
+ "w ould</w>",
1490
+ "an t</w>",
1491
+ "b er",
1492
+ "f u",
1493
+ "it ed</w>",
1494
+ "p ri",
1495
+ "whi le</w>",
1496
+ "o ver</w>",
1497
+ "ing s</w>",
1498
+ "r e</w>",
1499
+ "fi l",
1500
+ "s y",
1501
+ "e st",
1502
+ "ab le</w>",
1503
+ "w n</w>",
1504
+ "s ea",
1505
+ "ac h",
1506
+ "s ing</w>",
1507
+ "in s</w>",
1508
+ "ti c</w>",
1509
+ "i d</w>",
1510
+ "on ly</w>",
1511
+ "at es</w>",
1512
+ "t ri",
1513
+ "v ing</w>",
1514
+ "b a",
1515
+ "v el",
1516
+ "an ce</w>",
1517
+ "st a",
1518
+ "er n</w>",
1519
+ "f ol",
1520
+ "e en</w>",
1521
+ "in ed</w>",
1522
+ "st ru",
1523
+ "un i",
1524
+ "g ame</w>",
1525
+ "la r</w>",
1526
+ "s el",
1527
+ "b li",
1528
+ "u sed</w>",
1529
+ "n ing</w>",
1530
+ "p s</w>",
1531
+ "ti es</w>",
1532
+ "k no",
1533
+ "c or",
1534
+ "f t</w>",
1535
+ "rec or",
1536
+ "b le</w>",
1537
+ "vi e",
1538
+ "y s</w>",
1539
+ "w il",
1540
+ "ic al</w>",
1541
+ "ap p",
1542
+ "t ro",
1543
+ "th ree</w>",
1544
+ "c la",
1545
+ "ol d</w>",
1546
+ "sh ed</w>",
1547
+ "h ea",
1548
+ "ab out</w>",
1549
+ "w rit",
1550
+ "th an</w>",
1551
+ "st e",
1552
+ "l ater</w>",
1553
+ "ar i",
1554
+ "d y</w>",
1555
+ "pu bli",
1556
+ "lo c",
1557
+ "ag a",
1558
+ "th rou",
1559
+ "s si",
1560
+ "en d</w>",
1561
+ "ma y</w>",
1562
+ "an g",
1563
+ "ac h</w>",
1564
+ "v es</w>",
1565
+ "o g",
1566
+ "hi m</w>",
1567
+ "be tw",
1568
+ "thou gh</w>",
1569
+ "betw een</w>",
1570
+ "u m</w>",
1571
+ "st ar",
1572
+ "sc ri",
1573
+ "re a",
1574
+ "on d</w>",
1575
+ "shi p</w>",
1576
+ "o k</w>",
1577
+ "h el",
1578
+ "s ong</w>",
1579
+ "c hi",
1580
+ "ca p",
1581
+ "e ver</w>",
1582
+ "da y</w>",
1583
+ "c ri",
1584
+ "s ome</w>",
1585
+ "b ro",
1586
+ "n o</w>",
1587
+ "th ere</w>",
1588
+ "an s</w>",
1589
+ "al l",
1590
+ "n um",
1591
+ "r ed</w>",
1592
+ "ear s</w>",
1593
+ "st s</w>",
1594
+ "an y</w>",
1595
+ "w ar",
1596
+ "p h",
1597
+ "p p",
1598
+ "g in",
1599
+ "stru c",
1600
+ "am er",
1601
+ "pro duc",
1602
+ "s ch",
1603
+ "c es",
1604
+ "ur e</w>",
1605
+ "at ing</w>",
1606
+ "em p",
1607
+ "t or",
1608
+ "sea son</w>",
1609
+ "for e</w>",
1610
+ "i c</w>",
1611
+ "c ity</w>",
1612
+ "g ro",
1613
+ "fol low",
1614
+ "su b",
1615
+ "b el",
1616
+ "y ear</w>",
1617
+ "c an</w>",
1618
+ "s in",
1619
+ "wh ere</w>",
1620
+ "an d",
1621
+ "ma de</w>",
1622
+ "re lea",
1623
+ "s m",
1624
+ "b l",
1625
+ "t en</w>",
1626
+ "wi th",
1627
+ "s on",
1628
+ "man y</w>",
1629
+ "a re",
1630
+ "e d",
1631
+ "h ow",
1632
+ "amer ic",
1633
+ "ur y</w>",
1634
+ "st u",
1635
+ "mu si",
1636
+ "c u",
1637
+ "n am",
1638
+ "em ent</w>",
1639
+ "su ch</w>",
1640
+ "al bu",
1641
+ "bu il",
1642
+ "be fore</w>",
1643
+ "e f",
1644
+ "ar m",
1645
+ "t on</w>",
1646
+ "the m</w>",
1647
+ "c al",
1648
+ "b ar",
1649
+ "d es</w>",
1650
+ "m at",
1651
+ "gen er",
1652
+ "o d</w>",
1653
+ "ser ies</w>",
1654
+ "c er",
1655
+ "sh o",
1656
+ "en ti",
1657
+ "h er",
1658
+ "o ver",
1659
+ "an n",
1660
+ "w ell</w>",
1661
+ "wor ld</w>",
1662
+ "g an</w>",
1663
+ "e st</w>",
1664
+ "sec ond</w>",
1665
+ "t ers</w>",
1666
+ "si de</w>",
1667
+ "tr an",
1668
+ "l ine</w>",
1669
+ "tur e</w>",
1670
+ "por t</w>",
1671
+ "be ing</w>",
1672
+ "y ears</w>",
1673
+ "bo th</w>",
1674
+ "in di",
1675
+ "the se</w>",
1676
+ "na tional</w>",
1677
+ "hi stor",
1678
+ "f e</w>",
1679
+ "v o",
1680
+ "st ed</w>",
1681
+ "an i",
1682
+ "b as",
1683
+ "po in",
1684
+ "s ing",
1685
+ "fil m</w>",
1686
+ "p en",
1687
+ "su p",
1688
+ "m is",
1689
+ "c ro",
1690
+ "st ri",
1691
+ "l in",
1692
+ "t re",
1693
+ "wa r</w>",
1694
+ "how ever</w>",
1695
+ "y ing</w>",
1696
+ "l ing</w>",
1697
+ "y p",
1698
+ "ec ted</w>",
1699
+ "di rec",
1700
+ "vi sion</w>",
1701
+ "albu m</w>",
1702
+ "th en</w>",
1703
+ "l l</w>",
1704
+ "se ver",
1705
+ "throu gh</w>",
1706
+ "kno wn</w>",
1707
+ "b or",
1708
+ "c ul",
1709
+ "c lu",
1710
+ "st er</w>",
1711
+ "sou th</w>",
1712
+ "r y</w>",
1713
+ "ec t</w>",
1714
+ "lo w</w>",
1715
+ "p r",
1716
+ "s k",
1717
+ "is o",
1718
+ "nor th</w>",
1719
+ "par t</w>",
1720
+ "f ac",
1721
+ "t ly</w>",
1722
+ "per i",
1723
+ "e u",
1724
+ "b att",
1725
+ "st ate</w>",
1726
+ "c ed</w>",
1727
+ "con si",
1728
+ "in f",
1729
+ "po li",
1730
+ "ol og",
1731
+ "ear ly</w>",
1732
+ "po si",
1733
+ "am es</w>",
1734
+ "w in",
1735
+ "de vel",
1736
+ "o b",
1737
+ "v e",
1738
+ "v en</w>",
1739
+ "op er",
1740
+ "g er",
1741
+ "of fi",
1742
+ "char ac",
1743
+ "m s</w>",
1744
+ "hi gh",
1745
+ "a d</w>",
1746
+ "th o",
1747
+ "sever al</w>",
1748
+ "d re",
1749
+ "de scri",
1750
+ "al e</w>",
1751
+ "num ber</w>",
1752
+ "a ir",
1753
+ "inclu ding</w>",
1754
+ "in st</w>",
1755
+ "aga inst</w>",
1756
+ "l s</w>",
1757
+ "su l",
1758
+ "ep iso",
1759
+ "c am",
1760
+ "di f",
1761
+ "so ci",
1762
+ "bec ame</w>",
1763
+ "li ke</w>",
1764
+ "t el",
1765
+ "f our</w>",
1766
+ "âĢ Ķ</w>",
1767
+ "h ou",
1768
+ "jo h",
1769
+ "un ited</w>",
1770
+ "in v",
1771
+ "un der</w>",
1772
+ "no v",
1773
+ "ti v",
1774
+ "su c",
1775
+ "a tions</w>",
1776
+ "ac k",
1777
+ "t or</w>",
1778
+ "r on",
1779
+ "un d</w>",
1780
+ "w s</w>",
1781
+ "f o",
1782
+ "g r",
1783
+ "devel op",
1784
+ "al though</w>",
1785
+ "cont in",
1786
+ "we st</w>",
1787
+ "ori gin",
1788
+ "musi c</w>",
1789
+ "or s</w>",
1790
+ "d on</w>",
1791
+ "cent ury</w>",
1792
+ "w ard</w>",
1793
+ "wor k</w>",
1794
+ "m e</w>",
1795
+ "am i",
1796
+ "ch a",
1797
+ "ver y</w>",
1798
+ "h ar",
1799
+ "di s",
1800
+ "z ed</w>",
1801
+ "d o</w>",
1802
+ "g s</w>",
1803
+ "t ow",
1804
+ "s ol",
1805
+ "follow ing</w>",
1806
+ "li on</w>",
1807
+ "re ma",
1808
+ "n s</w>",
1809
+ "ti sh</w>",
1810
+ "ch ur",
1811
+ "s om",
1812
+ "m p",
1813
+ "t le</w>",
1814
+ "go ver",
1815
+ "d el",
1816
+ "comp le",
1817
+ "c ur",
1818
+ "u se</w>",
1819
+ "b ack</w>",
1820
+ "h u",
1821
+ "st ern</w>",
1822
+ "be gan</w>",
1823
+ "fi el",
1824
+ "au se</w>",
1825
+ "d ra",
1826
+ "p as",
1827
+ "b il",
1828
+ "ca tion</w>",
1829
+ "d ent</w>",
1830
+ "b ed</w>",
1831
+ "bec ause</w>",
1832
+ "an t",
1833
+ "ea m</w>",
1834
+ "p hi",
1835
+ "y o",
1836
+ "contin u",
1837
+ "ta in</w>",
1838
+ "tr y</w>",
1839
+ "f re",
1840
+ "pe op",
1841
+ "cal led</w>",
1842
+ "f ound</w>",
1843
+ "episo de</w>",
1844
+ "de sig",
1845
+ "m or",
1846
+ "se t</w>",
1847
+ "le y</w>",
1848
+ "ea st</w>",
1849
+ "tr ac",
1850
+ "c ra"
1851
+ ]
1852
+ }
1853
+ }
tokenizer_config.json ADDED
@@ -0,0 +1,40 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "add_prefix_space": false,
3
+ "added_tokens_decoder": {
4
+ "0": {
5
+ "content": "!",
6
+ "lstrip": false,
7
+ "normalized": false,
8
+ "rstrip": false,
9
+ "single_word": false,
10
+ "special": true
11
+ },
12
+ "1": {
13
+ "content": "<|startoftext|>",
14
+ "lstrip": false,
15
+ "normalized": true,
16
+ "rstrip": false,
17
+ "single_word": false,
18
+ "special": true
19
+ },
20
+ "2": {
21
+ "content": "<|endoftext|>",
22
+ "lstrip": false,
23
+ "normalized": false,
24
+ "rstrip": false,
25
+ "single_word": false,
26
+ "special": true
27
+ }
28
+ },
29
+ "additional_special_tokens": [],
30
+ "bos_token": "<|startoftext|>",
31
+ "clean_up_tokenization_spaces": true,
32
+ "do_lower_case": true,
33
+ "eos_token": "<|endoftext|>",
34
+ "errors": "replace",
35
+ "model_max_length": 16,
36
+ "pad_token": "!",
37
+ "processor_class": "Owlv2Processor",
38
+ "tokenizer_class": "CLIPTokenizer",
39
+ "unk_token": "<|endoftext|>"
40
+ }
vocab.json ADDED
@@ -0,0 +1,1026 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "!": 0,
3
+ "!</w>": 283,
4
+ "\"": 3,
5
+ "\"</w>": 282,
6
+ "#": 4,
7
+ "#</w>": 228,
8
+ "$": 5,
9
+ "$</w>": 274,
10
+ "%": 6,
11
+ "%</w>": 264,
12
+ "&": 7,
13
+ "&</w>": 242,
14
+ "'": 8,
15
+ "'</w>": 287,
16
+ "'s</w>": 363,
17
+ "(": 9,
18
+ "(</w>": 289,
19
+ ")": 10,
20
+ ")</w>": 295,
21
+ "*": 11,
22
+ "*</w>": 212,
23
+ "+": 12,
24
+ "+</w>": 288,
25
+ ",": 13,
26
+ ",</w>": 286,
27
+ ",@</w>": 622,
28
+ "-": 14,
29
+ "-</w>": 232,
30
+ "-@</w>": 353,
31
+ ".": 15,
32
+ ".</w>": 236,
33
+ ".@</w>": 569,
34
+ "/": 16,
35
+ "/</w>": 292,
36
+ "0": 17,
37
+ "0</w>": 271,
38
+ "1": 18,
39
+ "1</w>": 246,
40
+ "2": 19,
41
+ "2</w>": 268,
42
+ "3": 20,
43
+ "3</w>": 273,
44
+ "4": 21,
45
+ "4</w>": 294,
46
+ "5": 22,
47
+ "5</w>": 253,
48
+ "6": 23,
49
+ "6</w>": 276,
50
+ "7": 24,
51
+ "7</w>": 297,
52
+ "8": 25,
53
+ "8</w>": 251,
54
+ "9": 26,
55
+ "9</w>": 277,
56
+ ":": 27,
57
+ ":</w>": 204,
58
+ ";": 28,
59
+ ";</w>": 275,
60
+ "<": 29,
61
+ "<</w>": 262,
62
+ "<|endoftext|>": 2,
63
+ "<|startoftext|>": 1,
64
+ "=": 30,
65
+ "=</w>": 281,
66
+ ">": 31,
67
+ "></w>": 284,
68
+ "?": 32,
69
+ "?</w>": 291,
70
+ "@": 33,
71
+ "@,@</w>": 623,
72
+ "@-@</w>": 354,
73
+ "@.@</w>": 570,
74
+ "@</w>": 269,
75
+ "[": 34,
76
+ "[</w>": 270,
77
+ "\\": 35,
78
+ "\\</w>": 296,
79
+ "]": 36,
80
+ "]</w>": 266,
81
+ "^": 37,
82
+ "^</w>": 278,
83
+ "_": 38,
84
+ "_</w>": 293,
85
+ "`": 39,
86
+ "`</w>": 265,
87
+ "a": 40,
88
+ "a</w>": 175,
89
+ "ab": 408,
90
+ "able</w>": 675,
91
+ "about</w>": 721,
92
+ "ac": 326,
93
+ "ace</w>": 659,
94
+ "ach": 678,
95
+ "ach</w>": 736,
96
+ "ack": 949,
97
+ "ack</w>": 551,
98
+ "ad": 407,
99
+ "ad</w>": 918,
100
+ "af": 455,
101
+ "after</w>": 532,
102
+ "ag": 397,
103
+ "aga": 730,
104
+ "against</w>": 928,
105
+ "age</w>": 566,
106
+ "air": 925,
107
+ "al": 318,
108
+ "al</w>": 330,
109
+ "albu": 813,
110
+ "album</w>": 874,
111
+ "ale</w>": 923,
112
+ "ali": 527,
113
+ "all": 762,
114
+ "all</w>": 449,
115
+ "ally</w>": 476,
116
+ "als</w>": 660,
117
+ "also</w>": 528,
118
+ "although</w>": 957,
119
+ "am": 333,
120
+ "ame</w>": 450,
121
+ "amer": 773,
122
+ "americ": 805,
123
+ "ames</w>": 906,
124
+ "ami": 968,
125
+ "an": 301,
126
+ "an</w>": 332,
127
+ "ance</w>": 689,
128
+ "and": 793,
129
+ "and</w>": 311,
130
+ "ang": 735,
131
+ "ani": 854,
132
+ "ann": 832,
133
+ "ans</w>": 761,
134
+ "ant": 1005,
135
+ "ant</w>": 663,
136
+ "any</w>": 767,
137
+ "ap": 421,
138
+ "app": 714,
139
+ "ar": 305,
140
+ "ard</w>": 543,
141
+ "are": 802,
142
+ "are</w>": 454,
143
+ "ari": 726,
144
+ "arm": 817,
145
+ "ary</w>": 518,
146
+ "as": 412,
147
+ "as</w>": 321,
148
+ "at": 322,
149
+ "at</w>": 328,
150
+ "ate</w>": 439,
151
+ "ated</w>": 441,
152
+ "ater</w>": 575,
153
+ "ates</w>": 684,
154
+ "ating</w>": 778,
155
+ "ation</w>": 457,
156
+ "ations</w>": 948,
157
+ "att": 512,
158
+ "au": 448,
159
+ "ause</w>": 997,
160
+ "b": 41,
161
+ "b</w>": 191,
162
+ "ba": 687,
163
+ "back</w>": 992,
164
+ "bar": 821,
165
+ "bas": 855,
166
+ "batt": 897,
167
+ "be": 361,
168
+ "be</w>": 467,
169
+ "bec": 558,
170
+ "became</w>": 935,
171
+ "because</w>": 1004,
172
+ "bed</w>": 1003,
173
+ "been</w>": 562,
174
+ "before</w>": 815,
175
+ "began</w>": 995,
176
+ "being</w>": 844,
177
+ "bel": 788,
178
+ "ber": 664,
179
+ "ber</w>": 483,
180
+ "betw": 740,
181
+ "between</w>": 742,
182
+ "bi": 628,
183
+ "bil": 1000,
184
+ "bl": 797,
185
+ "ble</w>": 709,
186
+ "bli": 700,
187
+ "bo": 429,
188
+ "bor": 880,
189
+ "both</w>": 846,
190
+ "bri": 588,
191
+ "bro": 758,
192
+ "bu": 388,
193
+ "buil": 814,
194
+ "but</w>": 499,
195
+ "by</w>": 369,
196
+ "c": 42,
197
+ "c</w>": 176,
198
+ "ca": 394,
199
+ "cal": 820,
200
+ "called</w>": 1014,
201
+ "cam": 932,
202
+ "can": 590,
203
+ "can</w>": 790,
204
+ "cap": 753,
205
+ "car": 644,
206
+ "cation</w>": 1001,
207
+ "ce</w>": 378,
208
+ "ced</w>": 899,
209
+ "cent": 605,
210
+ "century</w>": 964,
211
+ "cer": 827,
212
+ "ces": 776,
213
+ "ces</w>": 651,
214
+ "ch": 345,
215
+ "ch</w>": 374,
216
+ "cha": 969,
217
+ "char": 573,
218
+ "charac": 915,
219
+ "chi": 752,
220
+ "chur": 983,
221
+ "ci": 451,
222
+ "city</w>": 784,
223
+ "cla": 717,
224
+ "clu": 882,
225
+ "co": 524,
226
+ "col": 582,
227
+ "com": 383,
228
+ "comm": 549,
229
+ "comp": 557,
230
+ "comple": 989,
231
+ "con": 364,
232
+ "consi": 900,
233
+ "cont": 560,
234
+ "contin": 958,
235
+ "continu": 1009,
236
+ "cor": 706,
237
+ "coun": 656,
238
+ "cra": 1023,
239
+ "cre": 655,
240
+ "cri": 756,
241
+ "cro": 862,
242
+ "cu": 809,
243
+ "cul": 881,
244
+ "cur": 990,
245
+ "d": 43,
246
+ "d</w>": 170,
247
+ "da": 497,
248
+ "day</w>": 755,
249
+ "de": 352,
250
+ "de</w>": 415,
251
+ "dec": 604,
252
+ "ded</w>": 447,
253
+ "del": 988,
254
+ "dent</w>": 1002,
255
+ "der": 487,
256
+ "der</w>": 526,
257
+ "des</w>": 822,
258
+ "descri": 922,
259
+ "desig": 1017,
260
+ "devel": 908,
261
+ "develop": 956,
262
+ "di": 340,
263
+ "dif": 933,
264
+ "ding</w>": 442,
265
+ "direc": 872,
266
+ "dis": 972,
267
+ "do": 595,
268
+ "do</w>": 974,
269
+ "don</w>": 963,
270
+ "dra": 998,
271
+ "dre": 921,
272
+ "ds</w>": 422,
273
+ "du": 425,
274
+ "duc": 587,
275
+ "during</w>": 616,
276
+ "dy</w>": 727,
277
+ "e": 44,
278
+ "e</w>": 167,
279
+ "ea": 344,
280
+ "eam</w>": 1006,
281
+ "ear": 445,
282
+ "ear</w>": 580,
283
+ "early</w>": 904,
284
+ "ears</w>": 765,
285
+ "east</w>": 1021,
286
+ "ec": 338,
287
+ "ect</w>": 886,
288
+ "ected</w>": 871,
289
+ "ed": 803,
290
+ "ed</w>": 302,
291
+ "een</w>": 693,
292
+ "ef": 816,
293
+ "ei": 640,
294
+ "el": 331,
295
+ "el</w>": 565,
296
+ "ell</w>": 621,
297
+ "ely</w>": 583,
298
+ "em": 360,
299
+ "ember</w>": 639,
300
+ "ement</w>": 811,
301
+ "emp": 779,
302
+ "en": 308,
303
+ "en</w>": 343,
304
+ "ence</w>": 563,
305
+ "end</w>": 733,
306
+ "eng": 633,
307
+ "ent": 376,
308
+ "ent</w>": 381,
309
+ "enti": 829,
310
+ "ents</w>": 555,
311
+ "ep": 530,
312
+ "episo": 931,
313
+ "episode</w>": 1016,
314
+ "er": 303,
315
+ "er</w>": 312,
316
+ "ere</w>": 385,
317
+ "ern</w>": 691,
318
+ "ers</w>": 398,
319
+ "es": 435,
320
+ "es</w>": 323,
321
+ "est": 674,
322
+ "est</w>": 836,
323
+ "et</w>": 535,
324
+ "eu": 896,
325
+ "ev": 539,
326
+ "ever</w>": 754,
327
+ "ex": 417,
328
+ "f": 45,
329
+ "f</w>": 169,
330
+ "fa": 630,
331
+ "fac": 893,
332
+ "fe": 484,
333
+ "fe</w>": 851,
334
+ "fer": 610,
335
+ "fi": 350,
336
+ "fiel": 996,
337
+ "fil": 672,
338
+ "film</w>": 858,
339
+ "fin": 553,
340
+ "fir": 470,
341
+ "first</w>": 509,
342
+ "fo": 954,
343
+ "fol": 692,
344
+ "follow": 786,
345
+ "following</w>": 978,
346
+ "for": 396,
347
+ "for</w>": 366,
348
+ "fore</w>": 782,
349
+ "form": 645,
350
+ "found</w>": 1015,
351
+ "four</w>": 938,
352
+ "fre": 1012,
353
+ "fro": 401,
354
+ "from</w>": 403,
355
+ "ft</w>": 707,
356
+ "fu": 665,
357
+ "g": 46,
358
+ "g</w>": 179,
359
+ "ga": 631,
360
+ "game</w>": 697,
361
+ "gan</w>": 835,
362
+ "ge": 574,
363
+ "ge</w>": 482,
364
+ "gen": 625,
365
+ "gener": 824,
366
+ "ger": 913,
367
+ "gh": 400,
368
+ "gh</w>": 481,
369
+ "ght</w>": 493,
370
+ "gi": 516,
371
+ "gin": 771,
372
+ "go": 494,
373
+ "gover": 987,
374
+ "gr": 955,
375
+ "gra": 611,
376
+ "gre": 612,
377
+ "gro": 785,
378
+ "gs</w>": 975,
379
+ "gu": 426,
380
+ "h": 47,
381
+ "h</w>": 183,
382
+ "ha": 367,
383
+ "had</w>": 459,
384
+ "har": 971,
385
+ "has</w>": 556,
386
+ "have</w>": 547,
387
+ "he</w>": 410,
388
+ "hea": 720,
389
+ "hel": 750,
390
+ "her": 830,
391
+ "her</w>": 522,
392
+ "hi": 325,
393
+ "high": 917,
394
+ "him</w>": 739,
395
+ "his</w>": 406,
396
+ "histor": 850,
397
+ "ho": 577,
398
+ "hou": 940,
399
+ "how": 804,
400
+ "however</w>": 867,
401
+ "hu": 993,
402
+ "i": 48,
403
+ "i</w>": 177,
404
+ "ic": 409,
405
+ "ic</w>": 783,
406
+ "ical</w>": 713,
407
+ "id</w>": 682,
408
+ "ies</w>": 508,
409
+ "il": 379,
410
+ "im": 465,
411
+ "in": 300,
412
+ "in</w>": 314,
413
+ "inc": 491,
414
+ "inclu": 614,
415
+ "including</w>": 926,
416
+ "indi": 847,
417
+ "ine</w>": 490,
418
+ "ined</w>": 694,
419
+ "inf": 901,
420
+ "ing": 453,
421
+ "ing</w>": 315,
422
+ "ings</w>": 670,
423
+ "ins</w>": 680,
424
+ "inst</w>": 927,
425
+ "inter": 609,
426
+ "into</w>": 649,
427
+ "inv": 943,
428
+ "ir": 428,
429
+ "ir</w>": 456,
430
+ "is": 395,
431
+ "is</w>": 349,
432
+ "iso": 890,
433
+ "it": 319,
434
+ "it</w>": 390,
435
+ "ite</w>": 624,
436
+ "ited</w>": 666,
437
+ "ith</w>": 370,
438
+ "its</w>": 480,
439
+ "ity</w>": 443,
440
+ "j": 49,
441
+ "j</w>": 208,
442
+ "jo": 585,
443
+ "joh": 941,
444
+ "ju": 619,
445
+ "k": 50,
446
+ "k</w>": 178,
447
+ "ke": 661,
448
+ "ke</w>": 505,
449
+ "ked</w>": 653,
450
+ "king</w>": 564,
451
+ "kno": 705,
452
+ "known</w>": 879,
453
+ "ks</w>": 559,
454
+ "l": 51,
455
+ "l</w>": 173,
456
+ "la": 348,
457
+ "lan": 606,
458
+ "land</w>": 561,
459
+ "lar": 646,
460
+ "lar</w>": 698,
461
+ "later</w>": 725,
462
+ "ld</w>": 462,
463
+ "le": 382,
464
+ "le</w>": 357,
465
+ "lea": 466,
466
+ "led</w>": 520,
467
+ "les</w>": 658,
468
+ "ley</w>": 1020,
469
+ "li": 336,
470
+ "like</w>": 936,
471
+ "lin": 864,
472
+ "line</w>": 841,
473
+ "ling</w>": 869,
474
+ "lion</w>": 979,
475
+ "ll</w>": 876,
476
+ "lo": 358,
477
+ "loc": 729,
478
+ "low": 567,
479
+ "low</w>": 887,
480
+ "ls</w>": 929,
481
+ "lu": 432,
482
+ "ly</w>": 342,
483
+ "m": 52,
484
+ "m</w>": 181,
485
+ "ma": 365,
486
+ "made</w>": 794,
487
+ "man": 444,
488
+ "man</w>": 603,
489
+ "many</w>": 801,
490
+ "mar": 474,
491
+ "mat": 823,
492
+ "may</w>": 734,
493
+ "me": 475,
494
+ "me</w>": 967,
495
+ "ment</w>": 572,
496
+ "mi": 492,
497
+ "mil": 615,
498
+ "min": 568,
499
+ "mis": 861,
500
+ "mo": 399,
501
+ "mon": 597,
502
+ "mor": 1018,
503
+ "more</w>": 637,
504
+ "most</w>": 652,
505
+ "mp": 985,
506
+ "ms</w>": 916,
507
+ "mu": 519,
508
+ "musi": 808,
509
+ "music</w>": 961,
510
+ "n": 53,
511
+ "n</w>": 172,
512
+ "na": 517,
513
+ "nam": 810,
514
+ "national</w>": 849,
515
+ "ne": 393,
516
+ "ned</w>": 620,
517
+ "new</w>": 598,
518
+ "ni": 546,
519
+ "ning</w>": 702,
520
+ "no": 387,
521
+ "no</w>": 759,
522
+ "nor": 576,
523
+ "north</w>": 891,
524
+ "not</w>": 515,
525
+ "nov": 945,
526
+ "ns</w>": 981,
527
+ "num": 763,
528
+ "number</w>": 924,
529
+ "o": 54,
530
+ "o</w>": 188,
531
+ "ob": 909,
532
+ "oc": 511,
533
+ "od</w>": 825,
534
+ "of": 513,
535
+ "of</w>": 309,
536
+ "offi": 914,
537
+ "og": 738,
538
+ "ok</w>": 749,
539
+ "ol": 351,
540
+ "old</w>": 718,
541
+ "olog": 903,
542
+ "om": 339,
543
+ "ome</w>": 571,
544
+ "on": 307,
545
+ "on</w>": 313,
546
+ "ond</w>": 747,
547
+ "one</w>": 452,
548
+ "ong</w>": 472,
549
+ "only</w>": 683,
550
+ "ons</w>": 601,
551
+ "oo": 552,
552
+ "op": 405,
553
+ "oper": 912,
554
+ "or": 310,
555
+ "or</w>": 334,
556
+ "ore</w>": 529,
557
+ "ori": 591,
558
+ "origin": 960,
559
+ "ors</w>": 962,
560
+ "other</w>": 540,
561
+ "ou": 324,
562
+ "ould</w>": 531,
563
+ "oun": 411,
564
+ "ound</w>": 635,
565
+ "our": 548,
566
+ "our</w>": 608,
567
+ "ous</w>": 578,
568
+ "out</w>": 478,
569
+ "over": 831,
570
+ "over</w>": 669,
571
+ "ow": 416,
572
+ "own</w>": 617,
573
+ "p": 55,
574
+ "p</w>": 182,
575
+ "pa": 593,
576
+ "par": 427,
577
+ "part</w>": 892,
578
+ "pas": 999,
579
+ "pe": 514,
580
+ "pen": 859,
581
+ "peop": 1013,
582
+ "per": 437,
583
+ "peri": 895,
584
+ "ph": 769,
585
+ "phi": 1007,
586
+ "pi": 607,
587
+ "pl": 488,
588
+ "pla": 506,
589
+ "play": 632,
590
+ "po": 377,
591
+ "poin": 856,
592
+ "poli": 902,
593
+ "por": 473,
594
+ "port</w>": 843,
595
+ "posi": 905,
596
+ "pp": 770,
597
+ "pr": 888,
598
+ "pre": 424,
599
+ "pres": 618,
600
+ "pri": 667,
601
+ "pro": 386,
602
+ "produc": 774,
603
+ "ps</w>": 703,
604
+ "pu": 485,
605
+ "publi": 728,
606
+ "q": 56,
607
+ "q</w>": 217,
608
+ "qu": 431,
609
+ "r": 57,
610
+ "r</w>": 171,
611
+ "ra": 355,
612
+ "ran": 523,
613
+ "re": 304,
614
+ "re</w>": 671,
615
+ "rea": 746,
616
+ "rec": 436,
617
+ "recor": 708,
618
+ "red</w>": 764,
619
+ "ree</w>": 638,
620
+ "relea": 795,
621
+ "rema": 980,
622
+ "ren": 629,
623
+ "res</w>": 613,
624
+ "ri": 329,
625
+ "rit": 599,
626
+ "ro": 317,
627
+ "ron": 951,
628
+ "rou": 498,
629
+ "ru": 419,
630
+ "ry</w>": 885,
631
+ "s": 58,
632
+ "s</w>": 168,
633
+ "sa": 510,
634
+ "sc": 414,
635
+ "sch": 775,
636
+ "scri": 745,
637
+ "se": 380,
638
+ "se</w>": 373,
639
+ "sea": 677,
640
+ "season</w>": 781,
641
+ "sec": 554,
642
+ "second</w>": 837,
643
+ "sed</w>": 446,
644
+ "sel": 699,
645
+ "ser": 486,
646
+ "series</w>": 826,
647
+ "ses</w>": 647,
648
+ "set</w>": 1019,
649
+ "sever": 877,
650
+ "several</w>": 920,
651
+ "sh": 359,
652
+ "sh</w>": 541,
653
+ "she</w>": 594,
654
+ "shed</w>": 719,
655
+ "shi": 533,
656
+ "ship</w>": 748,
657
+ "sho": 828,
658
+ "si": 327,
659
+ "side</w>": 839,
660
+ "sig": 627,
661
+ "sin": 791,
662
+ "sing": 857,
663
+ "sing</w>": 679,
664
+ "sion</w>": 504,
665
+ "sk": 889,
666
+ "sm": 796,
667
+ "so": 602,
668
+ "so</w>": 477,
669
+ "soci": 934,
670
+ "sol": 977,
671
+ "som": 984,
672
+ "some</w>": 757,
673
+ "son": 800,
674
+ "son</w>": 501,
675
+ "song</w>": 751,
676
+ "sou": 641,
677
+ "south</w>": 884,
678
+ "sp": 384,
679
+ "spec": 581,
680
+ "ss</w>": 489,
681
+ "ssi": 732,
682
+ "st": 316,
683
+ "st</w>": 335,
684
+ "sta": 690,
685
+ "star": 744,
686
+ "state</w>": 898,
687
+ "ste": 724,
688
+ "sted</w>": 853,
689
+ "ster</w>": 883,
690
+ "stern</w>": 994,
691
+ "sti": 643,
692
+ "stor": 537,
693
+ "str": 589,
694
+ "stri": 863,
695
+ "stru": 695,
696
+ "struc": 772,
697
+ "sts</w>": 766,
698
+ "stu": 807,
699
+ "su": 368,
700
+ "sub": 787,
701
+ "suc": 947,
702
+ "such</w>": 812,
703
+ "sul": 930,
704
+ "sup": 860,
705
+ "sur": 642,
706
+ "sy": 673,
707
+ "t": 59,
708
+ "t</w>": 180,
709
+ "ta": 438,
710
+ "tain</w>": 1010,
711
+ "te": 544,
712
+ "te</w>": 550,
713
+ "ted</w>": 402,
714
+ "tel": 937,
715
+ "ten": 648,
716
+ "ten</w>": 798,
717
+ "ter": 433,
718
+ "ter</w>": 420,
719
+ "ters</w>": 838,
720
+ "th": 298,
721
+ "th</w>": 391,
722
+ "than</w>": 723,
723
+ "that</w>": 362,
724
+ "the": 375,
725
+ "the</w>": 299,
726
+ "their</w>": 507,
727
+ "them</w>": 819,
728
+ "then</w>": 875,
729
+ "ther</w>": 430,
730
+ "there</w>": 760,
731
+ "these</w>": 848,
732
+ "they</w>": 525,
733
+ "this</w>": 495,
734
+ "tho": 919,
735
+ "thou": 636,
736
+ "though</w>": 741,
737
+ "three</w>": 716,
738
+ "throu": 731,
739
+ "through</w>": 878,
740
+ "ti": 306,
741
+ "tic": 536,
742
+ "tic</w>": 681,
743
+ "ties</w>": 704,
744
+ "tim": 469,
745
+ "time</w>": 600,
746
+ "ting</w>": 542,
747
+ "tion": 404,
748
+ "tion</w>": 347,
749
+ "tional</w>": 634,
750
+ "tions</w>": 479,
751
+ "tish</w>": 982,
752
+ "tiv": 946,
753
+ "tive</w>": 596,
754
+ "tle</w>": 986,
755
+ "tly</w>": 894,
756
+ "to": 468,
757
+ "to</w>": 320,
758
+ "ton</w>": 818,
759
+ "tor": 780,
760
+ "tor</w>": 950,
761
+ "tow": 976,
762
+ "tr": 460,
763
+ "tra": 592,
764
+ "trac": 1022,
765
+ "tran": 840,
766
+ "tre": 865,
767
+ "tri": 685,
768
+ "tro": 715,
769
+ "try</w>": 1011,
770
+ "ts</w>": 413,
771
+ "tu": 650,
772
+ "tur": 496,
773
+ "ture</w>": 842,
774
+ "tw": 434,
775
+ "two</w>": 545,
776
+ "ty</w>": 584,
777
+ "u": 60,
778
+ "u</w>": 187,
779
+ "ul": 461,
780
+ "um": 500,
781
+ "um</w>": 743,
782
+ "un": 346,
783
+ "und</w>": 952,
784
+ "under</w>": 944,
785
+ "uni": 696,
786
+ "united</w>": 942,
787
+ "up</w>": 657,
788
+ "ur": 337,
789
+ "ure</w>": 777,
790
+ "uring</w>": 586,
791
+ "ury</w>": 806,
792
+ "us</w>": 534,
793
+ "use</w>": 991,
794
+ "used</w>": 701,
795
+ "v": 61,
796
+ "v</w>": 190,
797
+ "ve": 910,
798
+ "ve</w>": 371,
799
+ "ved</w>": 503,
800
+ "vel": 688,
801
+ "ven</w>": 911,
802
+ "ver": 392,
803
+ "ver</w>": 440,
804
+ "very</w>": 970,
805
+ "ves</w>": 737,
806
+ "vi": 356,
807
+ "vie": 710,
808
+ "ving</w>": 686,
809
+ "vision</w>": 873,
810
+ "vo": 852,
811
+ "w": 62,
812
+ "w</w>": 193,
813
+ "wa": 464,
814
+ "war": 768,
815
+ "war</w>": 866,
816
+ "ward</w>": 965,
817
+ "was</w>": 341,
818
+ "way</w>": 654,
819
+ "we": 502,
820
+ "well</w>": 833,
821
+ "were</w>": 423,
822
+ "west</w>": 959,
823
+ "wh": 389,
824
+ "when</w>": 626,
825
+ "where</w>": 792,
826
+ "whi": 418,
827
+ "which</w>": 463,
828
+ "while</w>": 668,
829
+ "who</w>": 579,
830
+ "wi": 538,
831
+ "wil": 712,
832
+ "win": 907,
833
+ "with": 799,
834
+ "with</w>": 372,
835
+ "wn</w>": 676,
836
+ "wor": 471,
837
+ "work</w>": 966,
838
+ "world</w>": 834,
839
+ "would</w>": 662,
840
+ "writ": 722,
841
+ "ws</w>": 953,
842
+ "x": 63,
843
+ "x</w>": 184,
844
+ "y": 64,
845
+ "y</w>": 174,
846
+ "year</w>": 789,
847
+ "years</w>": 845,
848
+ "ying</w>": 868,
849
+ "yo": 1008,
850
+ "yp": 870,
851
+ "ys</w>": 711,
852
+ "z": 65,
853
+ "z</w>": 192,
854
+ "zed</w>": 973,
855
+ "|": 66,
856
+ "|</w>": 260,
857
+ "}": 67,
858
+ "}</w>": 285,
859
+ "~": 68,
860
+ "~</w>": 280,
861
+ "¡": 69,
862
+ "¡</w>": 189,
863
+ "¢": 70,
864
+ "¢</w>": 215,
865
+ "£": 71,
866
+ "£</w>": 210,
867
+ "¤": 72,
868
+ "¤</w>": 224,
869
+ "¥": 73,
870
+ "¥</w>": 203,
871
+ "¦": 74,
872
+ "¦</w>": 240,
873
+ "§": 75,
874
+ "§</w>": 207,
875
+ "¨": 76,
876
+ "¨</w>": 238,
877
+ "©": 77,
878
+ "©</w>": 200,
879
+ "ª": 78,
880
+ "ª</w>": 258,
881
+ "«": 79,
882
+ "«</w>": 220,
883
+ "¬": 80,
884
+ "¬</w>": 272,
885
+ "®": 81,
886
+ "®</w>": 239,
887
+ "¯": 82,
888
+ "¯</w>": 248,
889
+ "°": 83,
890
+ "°</w>": 256,
891
+ "±": 84,
892
+ "±</w>": 245,
893
+ "²": 85,
894
+ "²</w>": 225,
895
+ "³": 86,
896
+ "³</w>": 218,
897
+ "´": 87,
898
+ "´</w>": 267,
899
+ "µ": 88,
900
+ "µ</w>": 213,
901
+ "¶": 89,
902
+ "¶</w>": 237,
903
+ "·": 90,
904
+ "·</w>": 261,
905
+ "¸": 91,
906
+ "¸</w>": 194,
907
+ "¹": 92,
908
+ "¹</w>": 211,
909
+ "º": 93,
910
+ "º</w>": 254,
911
+ "»": 94,
912
+ "»</w>": 257,
913
+ "¼": 95,
914
+ "¼</w>": 209,
915
+ "½": 96,
916
+ "½</w>": 234,
917
+ "¾": 97,
918
+ "¾</w>": 259,
919
+ "¿": 98,
920
+ "¿</w>": 249,
921
+ "Â": 99,
922
+ "Ã": 100,
923
+ "Ä": 101,
924
+ "Å": 102,
925
+ "Æ": 103,
926
+ "Ç": 104,
927
+ "È": 105,
928
+ "É": 106,
929
+ "Ê": 107,
930
+ "Ë": 108,
931
+ "Ì": 109,
932
+ "Í": 110,
933
+ "Î": 111,
934
+ "Ï": 112,
935
+ "Ð": 113,
936
+ "Ñ": 114,
937
+ "Ö": 115,
938
+ "×": 116,
939
+ "Ø": 117,
940
+ "Ù": 118,
941
+ "Ü": 119,
942
+ "à": 120,
943
+ "á": 121,
944
+ "â": 122,
945
+ "âĢ": 458,
946
+ "âĢĵ</w>": 521,
947
+ "âĢĶ</w>": 939,
948
+ "ã": 123,
949
+ "ä": 124,
950
+ "å": 125,
951
+ "æ": 126,
952
+ "ç": 127,
953
+ "è": 128,
954
+ "é": 129,
955
+ "ë": 130,
956
+ "ì": 131,
957
+ "ï": 132,
958
+ "Ģ": 133,
959
+ "Ģ</w>": 244,
960
+ "ģ": 134,
961
+ "ģ</w>": 214,
962
+ "Ĥ": 135,
963
+ "Ĥ</w>": 235,
964
+ "ĥ": 136,
965
+ "ĥ</w>": 233,
966
+ "Ħ": 137,
967
+ "Ħ</w>": 197,
968
+ "ħ": 138,
969
+ "ħ</w>": 221,
970
+ "Ĩ": 139,
971
+ "Ĩ</w>": 202,
972
+ "ĩ": 140,
973
+ "ĩ</w>": 195,
974
+ "Ī": 141,
975
+ "Ī</w>": 243,
976
+ "ī": 142,
977
+ "ī</w>": 222,
978
+ "Ĭ": 143,
979
+ "Ĭ</w>": 198,
980
+ "ĭ": 144,
981
+ "ĭ</w>": 241,
982
+ "Į": 145,
983
+ "Į</w>": 229,
984
+ "į": 146,
985
+ "į</w>": 201,
986
+ "İ": 147,
987
+ "İ</w>": 279,
988
+ "ı": 148,
989
+ "ı</w>": 230,
990
+ "IJ": 149,
991
+ "IJ</w>": 255,
992
+ "ij": 150,
993
+ "ij</w>": 219,
994
+ "Ĵ": 151,
995
+ "Ĵ</w>": 227,
996
+ "ĵ": 152,
997
+ "ĵ</w>": 185,
998
+ "Ķ": 153,
999
+ "Ķ</w>": 223,
1000
+ "ķ": 154,
1001
+ "ķ</w>": 216,
1002
+ "ĸ": 155,
1003
+ "ĸ</w>": 196,
1004
+ "Ĺ": 156,
1005
+ "Ĺ</w>": 263,
1006
+ "ĺ": 157,
1007
+ "ĺ</w>": 199,
1008
+ "Ļ": 158,
1009
+ "Ļ</w>": 226,
1010
+ "ļ": 159,
1011
+ "ļ</w>": 290,
1012
+ "Ľ": 160,
1013
+ "Ľ</w>": 186,
1014
+ "ľ": 161,
1015
+ "ľ</w>": 247,
1016
+ "Ŀ": 162,
1017
+ "Ŀ</w>": 205,
1018
+ "ŀ": 163,
1019
+ "ŀ</w>": 206,
1020
+ "Ł": 164,
1021
+ "Ł</w>": 250,
1022
+ "ł": 165,
1023
+ "ł</w>": 252,
1024
+ "Ń": 166,
1025
+ "Ń</w>": 231
1026
+ }