davidberenstein1957 committed on
Commit
c60290e
·
verified ·
1 Parent(s): 149e620

Add files using upload-large-folder tool

Browse files
README.md ADDED
@@ -0,0 +1,113 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ library_name: diffusers
3
+ tags:
4
+ - pruna-ai
5
+ ---
6
+
7
+ # Model Card for PrunaAI/tiny-stable-diffusion-pipe-smashed
8
+
9
+ This model was created using the [pruna](https://github.com/PrunaAI/pruna) library. Pruna is a model optimization framework built for developers, enabling you to deliver more efficient models with minimal implementation overhead.
10
+
11
+ ## Usage
12
+
13
+ First things first, you need to install the pruna library:
14
+
15
+ ```bash
16
+ pip install pruna
17
+ ```
18
+
19
+ You can then load this model using the following code:
20
+
21
+ ```python
22
+ from pruna import PrunaModel
23
+
24
+ loaded_model = PrunaModel.from_hub("PrunaAI/tiny-stable-diffusion-pipe-smashed")
25
+ ```
26
+
27
+ After loading the model, you can use the inference methods of the original model.
28
+
29
+ ## Smash Configuration
30
+
31
+ The compression configuration of the model is stored in the `smash_config.json` file.
32
+
33
+ ```json
34
+ {
35
+ "batcher": null,
36
+ "cacher": "deepcache",
37
+ "compiler": null,
38
+ "pruner": null,
39
+ "quantizer": null,
40
+ "deepcache_interval": 2,
41
+ "max_batch_size": 1,
42
+ "device": "cpu",
43
+ "save_fns": [],
44
+ "load_fns": [
45
+ "diffusers"
46
+ ],
47
+ "reapply_after_load": {
48
+ "pruner": null,
49
+ "quantizer": null,
50
+ "cacher": "deepcache",
51
+ "compiler": null,
52
+ "batcher": null
53
+ }
54
+ }
55
+ ```
56
+
57
+ ## Model Configuration
58
+
59
+ The configuration of the model is stored in the `config.json` file.
60
+
61
+ ```json
62
+ {
63
+ "model_index": {
64
+ "_class_name": "StableDiffusionPipeline",
65
+ "_diffusers_version": "0.33.1",
66
+ "_name_or_path": "/Users/davidberenstein/.cache/huggingface/hub/models--PrunaAI--tiny-stable-diffusion-pipe-smashed/snapshots/d2b38aca393c0e7a05566b66dc2f264d47bfef65",
67
+ "feature_extractor": [
68
+ "transformers",
69
+ "CLIPImageProcessor"
70
+ ],
71
+ "image_encoder": [
72
+ null,
73
+ null
74
+ ],
75
+ "requires_safety_checker": true,
76
+ "safety_checker": [
77
+ "stable_diffusion",
78
+ "StableDiffusionSafetyChecker"
79
+ ],
80
+ "scheduler": [
81
+ "diffusers",
82
+ "DDIMScheduler"
83
+ ],
84
+ "text_encoder": [
85
+ "transformers",
86
+ "CLIPTextModel"
87
+ ],
88
+ "tokenizer": [
89
+ "transformers",
90
+ "CLIPTokenizer"
91
+ ],
92
+ "unet": [
93
+ "diffusers",
94
+ "UNet2DConditionModel"
95
+ ],
96
+ "vae": [
97
+ "diffusers",
98
+ "AutoencoderKL"
99
+ ]
100
+ },
101
+ "dtype_info": {
102
+ "dtype": "float32"
103
+ }
104
+ }
105
+ ```
106
+
107
+ ## 🌍 Join the Pruna AI community!
108
+
109
+ [![Twitter](https://img.shields.io/twitter/follow/PrunaAI?style=social)](https://twitter.com/PrunaAI)
110
+ [![GitHub](https://img.shields.io/github/followers/PrunaAI?label=Follow%20%40PrunaAI&style=social)](https://github.com/PrunaAI)
111
+ [![LinkedIn](https://img.shields.io/badge/LinkedIn-Connect-blue)](https://www.linkedin.com/company/93832878/)
112
+ [![Discord](https://img.shields.io/badge/Discord-Join%20Us-blue?style=social&logo=discord)](https://discord.com/invite/rskEr4BZJx)
113
+ [![Reddit](https://img.shields.io/reddit/subreddit-subscribers/PrunaAI?style=social)](https://www.reddit.com/r/PrunaAI/)
dtype_info.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"dtype": "float32"}
feature_extractor/preprocessor_config.json ADDED
@@ -0,0 +1,27 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "crop_size": {
3
+ "height": 224,
4
+ "width": 224
5
+ },
6
+ "do_center_crop": true,
7
+ "do_convert_rgb": true,
8
+ "do_normalize": true,
9
+ "do_rescale": true,
10
+ "do_resize": true,
11
+ "image_mean": [
12
+ 0.48145466,
13
+ 0.4578275,
14
+ 0.40821073
15
+ ],
16
+ "image_processor_type": "CLIPImageProcessor",
17
+ "image_std": [
18
+ 0.26862954,
19
+ 0.26130258,
20
+ 0.27577711
21
+ ],
22
+ "resample": 3,
23
+ "rescale_factor": 0.00392156862745098,
24
+ "size": {
25
+ "shortest_edge": 224
26
+ }
27
+ }
model_index.json ADDED
@@ -0,0 +1,38 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_class_name": "StableDiffusionPipeline",
3
+ "_diffusers_version": "0.33.1",
4
+ "_name_or_path": "/Users/davidberenstein/.cache/huggingface/hub/models--PrunaAI--tiny-stable-diffusion-pipe-smashed/snapshots/d2b38aca393c0e7a05566b66dc2f264d47bfef65",
5
+ "feature_extractor": [
6
+ "transformers",
7
+ "CLIPImageProcessor"
8
+ ],
9
+ "image_encoder": [
10
+ null,
11
+ null
12
+ ],
13
+ "requires_safety_checker": true,
14
+ "safety_checker": [
15
+ "stable_diffusion",
16
+ "StableDiffusionSafetyChecker"
17
+ ],
18
+ "scheduler": [
19
+ "diffusers",
20
+ "DDIMScheduler"
21
+ ],
22
+ "text_encoder": [
23
+ "transformers",
24
+ "CLIPTextModel"
25
+ ],
26
+ "tokenizer": [
27
+ "transformers",
28
+ "CLIPTokenizer"
29
+ ],
30
+ "unet": [
31
+ "diffusers",
32
+ "UNet2DConditionModel"
33
+ ],
34
+ "vae": [
35
+ "diffusers",
36
+ "AutoencoderKL"
37
+ ]
38
+ }
safety_checker/config.json ADDED
@@ -0,0 +1,52 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "architectures": [
3
+ "StableDiffusionSafetyChecker"
4
+ ],
5
+ "initializer_factor": 1.0,
6
+ "logit_scale_init_value": 2.6592,
7
+ "model_type": "clip",
8
+ "projection_dim": 64,
9
+ "text_config": {
10
+ "attention_dropout": 0.1,
11
+ "bos_token_id": 0,
12
+ "dropout": 0.1,
13
+ "eos_token_id": 2,
14
+ "gradient_checkpointing": false,
15
+ "hidden_act": "quick_gelu",
16
+ "hidden_size": 32,
17
+ "initializer_factor": 1.0,
18
+ "initializer_range": 0.02,
19
+ "intermediate_size": 37,
20
+ "layer_norm_eps": 1e-05,
21
+ "max_position_embeddings": 512,
22
+ "model_type": "clip_text_model",
23
+ "num_attention_heads": 4,
24
+ "num_hidden_layers": 5,
25
+ "projection_dim": 512,
26
+ "torch_dtype": "float32",
27
+ "vocab_size": 99
28
+ },
29
+ "torch_dtype": "float32",
30
+ "transformers_version": "4.51.3",
31
+ "vision_config": {
32
+ "_attn_implementation_autoset": true,
33
+ "attention_dropout": 0.1,
34
+ "dropout": 0.1,
35
+ "gradient_checkpointing": false,
36
+ "hidden_act": "quick_gelu",
37
+ "hidden_size": 32,
38
+ "image_size": 30,
39
+ "initializer_factor": 1.0,
40
+ "initializer_range": 0.02,
41
+ "intermediate_size": 37,
42
+ "layer_norm_eps": 1e-05,
43
+ "model_type": "clip_vision_model",
44
+ "num_attention_heads": 4,
45
+ "num_channels": 3,
46
+ "num_hidden_layers": 5,
47
+ "patch_size": 2,
48
+ "projection_dim": 512,
49
+ "torch_dtype": "float32"
50
+ },
51
+ "vocab_size": 1000
52
+ }
safety_checker/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cd553c930718d5a2076729702298824d3ddc8a4fd4128158fccb3382d270cd8f
3
+ size 191516
scheduler/scheduler_config.json ADDED
@@ -0,0 +1,19 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_class_name": "DDIMScheduler",
3
+ "_diffusers_version": "0.33.1",
4
+ "beta_end": 0.012,
5
+ "beta_schedule": "scaled_linear",
6
+ "beta_start": 0.00085,
7
+ "clip_sample": false,
8
+ "clip_sample_range": 1.0,
9
+ "dynamic_thresholding_ratio": 0.995,
10
+ "num_train_timesteps": 1000,
11
+ "prediction_type": "epsilon",
12
+ "rescale_betas_zero_snr": false,
13
+ "sample_max_value": 1.0,
14
+ "set_alpha_to_one": true,
15
+ "steps_offset": 1,
16
+ "thresholding": false,
17
+ "timestep_spacing": "leading",
18
+ "trained_betas": null
19
+ }
smash_config.json ADDED
@@ -0,0 +1,21 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "batcher": null,
3
+ "cacher": "deepcache",
4
+ "compiler": null,
5
+ "pruner": null,
6
+ "quantizer": null,
7
+ "deepcache_interval": 2,
8
+ "max_batch_size": 1,
9
+ "device": "cpu",
10
+ "save_fns": [],
11
+ "load_fns": [
12
+ "diffusers"
13
+ ],
14
+ "reapply_after_load": {
15
+ "pruner": null,
16
+ "quantizer": null,
17
+ "cacher": "deepcache",
18
+ "compiler": null,
19
+ "batcher": null
20
+ }
21
+ }
text_encoder/config.json ADDED
@@ -0,0 +1,24 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "architectures": [
3
+ "CLIPTextModel"
4
+ ],
5
+ "attention_dropout": 0.0,
6
+ "bos_token_id": 0,
7
+ "dropout": 0.0,
8
+ "eos_token_id": 2,
9
+ "hidden_act": "quick_gelu",
10
+ "hidden_size": 32,
11
+ "initializer_factor": 1.0,
12
+ "initializer_range": 0.02,
13
+ "intermediate_size": 37,
14
+ "layer_norm_eps": 1e-05,
15
+ "max_position_embeddings": 77,
16
+ "model_type": "clip_text_model",
17
+ "num_attention_heads": 4,
18
+ "num_hidden_layers": 5,
19
+ "pad_token_id": 1,
20
+ "projection_dim": 512,
21
+ "torch_dtype": "float32",
22
+ "transformers_version": "4.51.3",
23
+ "vocab_size": 1000
24
+ }
text_encoder/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:103860291b96610a23d9dda96f6a3c4e6c6dd67e5984a0d5e7c8e62769ac6412
3
+ size 283212
tokenizer/merges.txt ADDED
@@ -0,0 +1,647 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ #version: 0.2
2
+ Ġ t
3
+ Ġt h
4
+ Ġ a
5
+ Ġth e</w>
6
+ i n
7
+ Ġ o
8
+ Ġ ,</w>
9
+ Ġ s
10
+ e d</w>
11
+ Ġ w
12
+ e r
13
+ Ġ .</w>
14
+ Ġ i
15
+ r e
16
+ Ġ c
17
+ n d</w>
18
+ Ġ f
19
+ Ġ b
20
+ a t
21
+ Ġo f</w>
22
+ e r</w>
23
+ e n
24
+ a r
25
+ o r
26
+ i t
27
+ Ġ p
28
+ Ġ h
29
+ Ġa nd</w>
30
+ o n
31
+ in g</w>
32
+ a n
33
+ r o
34
+ Ġ m
35
+ Ġ d
36
+ e s</w>
37
+ Ġi n</w>
38
+ o n</w>
39
+ Ġt o</w>
40
+ o u
41
+ i s
42
+ Ġ a</w>
43
+ i c
44
+ Ġ T
45
+ a l
46
+ Ġ l
47
+ Ġ =</w>
48
+ Ġ re
49
+ Ġ "</w>
50
+ e s
51
+ Ġ S
52
+ a s</w>
53
+ a l</w>
54
+ i l
55
+ e l
56
+ i on</w>
57
+ Ġ A
58
+ Ġ C
59
+ Ġ 1
60
+ Ġ Ċ</w>
61
+ u r
62
+ ĠT h
63
+ Ġ n
64
+ a s
65
+ Ġ @
66
+ e c
67
+ o m
68
+ a c
69
+ Ġ e
70
+ Ġw as</w>
71
+ Ġ M
72
+ o r</w>
73
+ a n</w>
74
+ a m
75
+ e n</w>
76
+ o l
77
+ Ġ in
78
+ Ġ g
79
+ Ġ '</w>
80
+ Ġ B
81
+ l y</w>
82
+ a t</w>
83
+ i v
84
+ t s</w>
85
+ ĠTh e</w>
86
+ u s
87
+ - @</w>
88
+ Ġ@ -@</w>
89
+ i s</w>
90
+ Ġ I
91
+ Ġw h
92
+ i g
93
+ Ġ H
94
+ Ġs t
95
+ o s
96
+ u n
97
+ t h
98
+ Ġ P
99
+ Ġw it
100
+ Ġth at</w>
101
+ i r
102
+ Ġa s</w>
103
+ e m
104
+ Ġo n</w>
105
+ r a
106
+ Ġf or</w>
107
+ Ġ R
108
+ e t
109
+ o w
110
+ Ġ 2
111
+ i d
112
+ Ġ D
113
+ l e</w>
114
+ Ġwit h</w>
115
+ l a
116
+ en t</w>
117
+ i m
118
+ Ġ F
119
+ e a
120
+ i on
121
+ Ġb y</w>
122
+ Ġ )</w>
123
+ Ġ (</w>
124
+ Ġa l
125
+ Ġc on
126
+ en t
127
+ Ġ W
128
+ Ġi s</w>
129
+ er e</w>
130
+ Ġ G
131
+ Ġ N
132
+ Ġ L
133
+ Ġh a
134
+ er s</w>
135
+ r i
136
+ t h</w>
137
+ t ed</w>
138
+ u c
139
+ Ġ J
140
+ Ġ1 9
141
+ e v
142
+ u l
143
+ Ġ v
144
+ c e</w>
145
+ at ion</w>
146
+ ro m</w>
147
+ Ġb e
148
+ Ġ E
149
+ i n</w>
150
+ Ġth e
151
+ Ġf rom</w>
152
+ Ġ O
153
+ t er</w>
154
+ Ġp ro
155
+ Ġa r
156
+ a d
157
+ Ġc om
158
+ i c</w>
159
+ a g
160
+ Ġh is</w>
161
+ Ġs h
162
+ Ġa t</w>
163
+ o v
164
+ i es</w>
165
+ o o
166
+ p p
167
+ s t
168
+ c h
169
+ Ġ r
170
+ Ġ2 0
171
+ a y</w>
172
+ i f
173
+ Ġw ere</w>
174
+ Ġc h
175
+ u t</w>
176
+ s t</w>
177
+ u t
178
+ d s</w>
179
+ o p
180
+ u m
181
+ Ġi t</w>
182
+ o c
183
+ t er
184
+ l e
185
+ ig h
186
+ u d
187
+ Ġe x
188
+ ion s</w>
189
+ at e</w>
190
+ it y</w>
191
+ at ed</w>
192
+ Ġ un
193
+ e p
194
+ q u
195
+ Ġn o
196
+ Ġ K
197
+ iv e</w>
198
+ is t
199
+ Ġo n
200
+ am e</w>
201
+ ou n
202
+ i r</w>
203
+ a b
204
+ Ġ â
205
+ in g
206
+ Ġh e</w>
207
+ l d</w>
208
+ u g
209
+ ic h</w>
210
+ Ġa n</w>
211
+ e d
212
+ Ġ k
213
+ Ġâ Ģ
214
+ Ġha d</w>
215
+ v e</w>
216
+ a in
217
+ Ġs e
218
+ t ion</w>
219
+ or e</w>
220
+ re s
221
+ Ġwh ich</w>
222
+ ĠI n</w>
223
+ o d
224
+ th er</w>
225
+ a k
226
+ Ġs p
227
+ a r</w>
228
+ Ġ y
229
+ ĠC h
230
+ on g</w>
231
+ Ġa c
232
+ es t</w>
233
+ Ġ U
234
+ a p
235
+ f f
236
+ al ly</w>
237
+ r it
238
+ ĠS t
239
+ u b
240
+ g e</w>
241
+ b er</w>
242
+ e t</w>
243
+ Ġb e</w>
244
+ e ar
245
+ Ġre c
246
+ er s
247
+ Ġf ir
248
+ o t
249
+ Ġar e</w>
250
+ Ġa n
251
+ c h</w>
252
+ o g
253
+ i a</w>
254
+ es t
255
+ in e</w>
256
+ il l
257
+ an d
258
+ e l</w>
259
+ ar y</w>
260
+ e w</w>
261
+ i d</w>
262
+ Ġf or
263
+ Ġ ;</w>
264
+ Ġcom p
265
+ Ġ V
266
+ Ġin c
267
+ t r
268
+ Ġ20 0
269
+ Ġthe ir</w>
270
+ u s</w>
271
+ Ġb ut</w>
272
+ r an
273
+ ic al</w>
274
+ Ġfir st</w>
275
+ Ġd e
276
+ Ġin t
277
+ Ġ ro
278
+ s o</w>
279
+ ĠâĢ ĵ</w>
280
+ Ġno t</w>
281
+ d ing</w>
282
+ f ter</w>
283
+ ur e</w>
284
+ Ġp ar
285
+ Ġ :</w>
286
+ i an</w>
287
+ Ġt w
288
+ ou ld</w>
289
+ Ġal so</w>
290
+ Ġi ts</w>
291
+ Ġw or
292
+ u m</w>
293
+ Ġo r</w>
294
+ os t</w>
295
+ 0 0</w>
296
+ ou r
297
+ ar d</w>
298
+ Ġre s
299
+ m p
300
+ u e</w>
301
+ Ġa b
302
+ is h</w>
303
+ Ġcon t
304
+ Ġa d
305
+ ow n</w>
306
+ al l</w>
307
+ ou g
308
+ Ġh er</w>
309
+ as t</w>
310
+ Ġ en
311
+ om e</w>
312
+ al l
313
+ d ed</w>
314
+ o w</w>
315
+ Ġha ve</w>
316
+ Ġ us
317
+ ea r</w>
318
+ ac k</w>
319
+ d uc
320
+ i al</w>
321
+ s s
322
+ en ts</w>
323
+ a in</w>
324
+ t ing</w>
325
+ Ġon e</w>
326
+ es s
327
+ Ġh as</w>
328
+ igh t</w>
329
+ a v
330
+ Ġe v
331
+ ou t</w>
332
+ a y
333
+ en ce</w>
334
+ Ġbe en</w>
335
+ e w
336
+ Ġtw o</w>
337
+ Ġc l
338
+ d er</w>
339
+ im e</w>
340
+ k s</w>
341
+ es s</w>
342
+ is h
343
+ . @</w>
344
+ Ġ@ .@</w>
345
+ Ġp la
346
+ Ġp l
347
+ Ġo r
348
+ u p</w>
349
+ m ent</w>
350
+ ur ing</w>
351
+ ol l
352
+ ĠI n
353
+ Ġth is</w>
354
+ Ġb ec
355
+ Ġcom m
356
+ Ġd is
357
+ at er</w>
358
+ ag e</w>
359
+ Ġa pp
360
+ ou s</w>
361
+ e y</w>
362
+ i l</w>
363
+ p er
364
+ ĠA l
365
+ ion al</w>
366
+ l ud
367
+ el y</w>
368
+ t t
369
+ il e</w>
370
+ i z
371
+ Ġ j
372
+ Ġwh o</w>
373
+ Ġa g
374
+ i b
375
+ Ġthe y</w>
376
+ f or
377
+ Ġo v
378
+ at h
379
+ e g
380
+ Ġs c
381
+ i p
382
+ Ġ20 1
383
+ Ġ 3
384
+ Ġp er
385
+ or y</w>
386
+ Ġd es
387
+ id e</w>
388
+ Ġs er
389
+ s e</w>
390
+ ĠH e</w>
391
+ la nd</w>
392
+ at ions</w>
393
+ r ic
394
+ i t</w>
395
+ re s</w>
396
+ er ed</w>
397
+ Ġp re
398
+ ĠS h
399
+ an ce</w>
400
+ or t</w>
401
+ an t</w>
402
+ , @</w>
403
+ Ġ@ ,@</w>
404
+ el l</w>
405
+ Ġ Y
406
+ n ed</w>
407
+ el l
408
+ it e</w>
409
+ Ġinc lud
410
+ Ġre p
411
+ Ġa fter</w>
412
+ Ġs uc
413
+ re e</w>
414
+ an y</w>
415
+ i m</w>
416
+ or t
417
+ Ġ1 8
418
+ Ġs u
419
+ ad e</w>
420
+ ou r</w>
421
+ ĠU n
422
+ ĠI t</w>
423
+ i k
424
+ ĠM ar
425
+ em ber</w>
426
+ Ġ 1</w>
427
+ e en</w>
428
+ a nd</w>
429
+ Ġs ec
430
+ ic e</w>
431
+ Ġt ime</w>
432
+ ĠA n
433
+ Ġint o</w>
434
+ Ġf in
435
+ Ġo ther</w>
436
+ Ġa tt
437
+ il l</w>
438
+ re n
439
+ ac h
440
+ as s
441
+ er al</w>
442
+ es e</w>
443
+ s h
444
+ al s</w>
445
+ it ion</w>
446
+ oug h</w>
447
+ l es</w>
448
+ am p
449
+ Ġw ould</w>
450
+ Ġm ore</w>
451
+ ro ug
452
+ ri b
453
+ er y</w>
454
+ ac e</w>
455
+ Ġ A</w>
456
+ Ġpla y
457
+ it ed</w>
458
+ k ed</w>
459
+ is t</w>
460
+ i ed</w>
461
+ Ġ 2</w>
462
+ as ed</w>
463
+ ing s</w>
464
+ an g
465
+ a m</w>
466
+ i p</w>
467
+ Ġb o
468
+ ab le</w>
469
+ t y</w>
470
+ Ġch ar
471
+ Ġc ent
472
+ et w
473
+ at es</w>
474
+ ro p
475
+ Ġ I</w>
476
+ u nd</w>
477
+ ĠA m
478
+ c es</w>
479
+ o in
480
+ Ġin ter
481
+ u p
482
+ c t
483
+ on e</w>
484
+ Ġt ra
485
+ an t
486
+ ec t
487
+ Ġal l</w>
488
+ e f
489
+ Ġcon s
490
+ ub l
491
+ n ing</w>
492
+ an s</w>
493
+ Ġf e
494
+ us t</w>
495
+ Ġ 0
496
+ Ġre m
497
+ as e</w>
498
+ on g
499
+ Ġwh en</w>
500
+ e b
501
+ ĠW h
502
+ Ġe ar
503
+ ev er</w>
504
+ Ġov er</w>
505
+ Ġk n
506
+ a us
507
+ Ġp os
508
+ a d</w>
509
+ er m
510
+ Ġsh e</w>
511
+ Ġ ra
512
+ Ġd uring</w>
513
+ as on</w>
514
+ v i
515
+ Ġex p
516
+ Ġl ea
517
+ Ġ el
518
+ Ġ 4
519
+ Ġon ly</w>
520
+ o nd</w>
521
+ Ġd ec
522
+ Ġac c
523
+ Ġo ff
524
+ is s
525
+ Ġf l
526
+ ĠE n
527
+ o t</w>
528
+ en s
529
+ os e</w>
530
+ ak e</w>
531
+ o m</w>
532
+ Ġs ev
533
+ ac h</w>
534
+ etw een</w>
535
+ er n
536
+ Ġ 3</w>
537
+ Ġp r
538
+ Ġg ro
539
+ r uc
540
+ Ġd i
541
+ Ġ19 9
542
+ ĠA r
543
+ Ġg ame</w>
544
+ Ġh im</w>
545
+ oo k</w>
546
+ Ġ up</w>
547
+ Ġab out</w>
548
+ Ġre l
549
+ for m
550
+ Ġth ree</w>
551
+ at t
552
+ ĠC om
553
+ Ġs a
554
+ ear s</w>
555
+ Ġ 5
556
+ r y</w>
557
+ Ġi mp
558
+ Ġm ost</w>
559
+ f er
560
+ Ġp res
561
+ Ġf il
562
+ Ġb etween</w>
563
+ Ġbe g
564
+ p h
565
+ or s</w>
566
+ Ġth an</w>
567
+ Ġrec or
568
+ o b
569
+ er ic
570
+ at ing</w>
571
+ Ġth roug
572
+ k ing</w>
573
+ Ġo ut</w>
574
+ Ġn um
575
+ oo d</w>
576
+ oll ow
577
+ ac t
578
+ u il
579
+ Ġc re
580
+ ol og
581
+ at ional</w>
582
+ Ġpro duc
583
+ Ġwh ile</w>
584
+ Ġl ater</w>
585
+ Ġw rit
586
+ e x
587
+ Ġst ar
588
+ Ġsp ec
589
+ e e
590
+ ish ed</w>
591
+ Ġre g
592
+ is ion</w>
593
+ ou th</w>
594
+ Ġre le
595
+ Ġa ss
596
+ Ġse ason</w>
597
+ Ġm ade</w>
598
+ il y</w>
599
+ r u
600
+ o y
601
+ t ur
602
+ t e</w>
603
+ Ġ qu
604
+ Ġm ov
605
+ ur y</w>
606
+ ĠAm eric
607
+ em ent</w>
608
+ c c
609
+ ou nd</w>
610
+ Ġl ar
611
+ Ġfor m
612
+ ec t</w>
613
+ Ġde f
614
+ Ġm us
615
+ ĠP ar
616
+ Ġm e
617
+ Ġs ub
618
+ w ay</w>
619
+ o p</w>
620
+ o h
621
+ el d</w>
622
+ i e</w>
623
+ em p
624
+ am es</w>
625
+ er n</w>
626
+ Ġn or
627
+ iv ed</w>
628
+ ev el
629
+ Ġsuc h</w>
630
+ ar ds</w>
631
+ Ġin d
632
+ ik e</w>
633
+ Ġg en
634
+ er t
635
+ Ġy ear</w>
636
+ Ġus ed</w>
637
+ Ġn ew</w>
638
+ Ġ 5</w>
639
+ Ġal b
640
+ s p
641
+ y p
642
+ Ġwit h
643
+ Ġwh ere</w>
644
+ ic s</w>
645
+ ĠTh is</w>
646
+ Ġthe m</w>
647
+ w n</w>
tokenizer/special_tokens_map.json ADDED
@@ -0,0 +1,30 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token": {
3
+ "content": "<|startoftext|>",
4
+ "lstrip": false,
5
+ "normalized": true,
6
+ "rstrip": false,
7
+ "single_word": false
8
+ },
9
+ "eos_token": {
10
+ "content": "<|endoftext|>",
11
+ "lstrip": false,
12
+ "normalized": true,
13
+ "rstrip": false,
14
+ "single_word": false
15
+ },
16
+ "pad_token": {
17
+ "content": "<|endoftext|>",
18
+ "lstrip": false,
19
+ "normalized": true,
20
+ "rstrip": false,
21
+ "single_word": false
22
+ },
23
+ "unk_token": {
24
+ "content": "<|endoftext|>",
25
+ "lstrip": false,
26
+ "normalized": true,
27
+ "rstrip": false,
28
+ "single_word": false
29
+ }
30
+ }
tokenizer/tokenizer.json ADDED
@@ -0,0 +1,3679 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "version": "1.0",
3
+ "truncation": null,
4
+ "padding": null,
5
+ "added_tokens": [
6
+ {
7
+ "id": 0,
8
+ "content": "<|startoftext|>",
9
+ "single_word": false,
10
+ "lstrip": false,
11
+ "rstrip": false,
12
+ "normalized": true,
13
+ "special": true
14
+ },
15
+ {
16
+ "id": 1,
17
+ "content": "<|endoftext|>",
18
+ "single_word": false,
19
+ "lstrip": false,
20
+ "rstrip": false,
21
+ "normalized": true,
22
+ "special": true
23
+ }
24
+ ],
25
+ "normalizer": {
26
+ "type": "Sequence",
27
+ "normalizers": [
28
+ {
29
+ "type": "NFC"
30
+ },
31
+ {
32
+ "type": "Replace",
33
+ "pattern": {
34
+ "Regex": "\\s+"
35
+ },
36
+ "content": " "
37
+ },
38
+ {
39
+ "type": "Lowercase"
40
+ }
41
+ ]
42
+ },
43
+ "pre_tokenizer": {
44
+ "type": "Sequence",
45
+ "pretokenizers": [
46
+ {
47
+ "type": "Split",
48
+ "pattern": {
49
+ "Regex": "'s|'t|'re|'ve|'m|'ll|'d|[\\p{L}]+|[\\p{N}]|[^\\s\\p{L}\\p{N}]+"
50
+ },
51
+ "behavior": "Removed",
52
+ "invert": true
53
+ },
54
+ {
55
+ "type": "ByteLevel",
56
+ "add_prefix_space": false,
57
+ "trim_offsets": true,
58
+ "use_regex": true
59
+ }
60
+ ]
61
+ },
62
+ "post_processor": {
63
+ "type": "RobertaProcessing",
64
+ "sep": [
65
+ "<|endoftext|>",
66
+ 1
67
+ ],
68
+ "cls": [
69
+ "<|startoftext|>",
70
+ 0
71
+ ],
72
+ "trim_offsets": false,
73
+ "add_prefix_space": false
74
+ },
75
+ "decoder": {
76
+ "type": "ByteLevel",
77
+ "add_prefix_space": true,
78
+ "trim_offsets": true,
79
+ "use_regex": true
80
+ },
81
+ "model": {
82
+ "type": "BPE",
83
+ "dropout": null,
84
+ "unk_token": "<|endoftext|>",
85
+ "continuing_subword_prefix": "",
86
+ "end_of_word_suffix": "</w>",
87
+ "fuse_unk": false,
88
+ "byte_fallback": false,
89
+ "ignore_merges": false,
90
+ "vocab": {
91
+ "<|startoftext|>": 0,
92
+ "<|endoftext|>": 1,
93
+ "!": 2,
94
+ "\"": 3,
95
+ "#": 4,
96
+ "$": 5,
97
+ "%": 6,
98
+ "&": 7,
99
+ "'": 8,
100
+ "(": 9,
101
+ ")": 10,
102
+ "*": 11,
103
+ "+": 12,
104
+ ",": 13,
105
+ "-": 14,
106
+ ".": 15,
107
+ "/": 16,
108
+ "0": 17,
109
+ "1": 18,
110
+ "2": 19,
111
+ "3": 20,
112
+ "4": 21,
113
+ "5": 22,
114
+ "6": 23,
115
+ "7": 24,
116
+ "8": 25,
117
+ "9": 26,
118
+ ":": 27,
119
+ ";": 28,
120
+ "<": 29,
121
+ "=": 30,
122
+ ">": 31,
123
+ "?": 32,
124
+ "@": 33,
125
+ "A": 34,
126
+ "B": 35,
127
+ "C": 36,
128
+ "D": 37,
129
+ "E": 38,
130
+ "F": 39,
131
+ "G": 40,
132
+ "H": 41,
133
+ "I": 42,
134
+ "J": 43,
135
+ "K": 44,
136
+ "L": 45,
137
+ "M": 46,
138
+ "N": 47,
139
+ "O": 48,
140
+ "P": 49,
141
+ "Q": 50,
142
+ "R": 51,
143
+ "S": 52,
144
+ "T": 53,
145
+ "U": 54,
146
+ "V": 55,
147
+ "W": 56,
148
+ "X": 57,
149
+ "Y": 58,
150
+ "Z": 59,
151
+ "[": 60,
152
+ "\\": 61,
153
+ "]": 62,
154
+ "^": 63,
155
+ "_": 64,
156
+ "`": 65,
157
+ "a": 66,
158
+ "b": 67,
159
+ "c": 68,
160
+ "d": 69,
161
+ "e": 70,
162
+ "f": 71,
163
+ "g": 72,
164
+ "h": 73,
165
+ "i": 74,
166
+ "j": 75,
167
+ "k": 76,
168
+ "l": 77,
169
+ "m": 78,
170
+ "n": 79,
171
+ "o": 80,
172
+ "p": 81,
173
+ "q": 82,
174
+ "r": 83,
175
+ "s": 84,
176
+ "t": 85,
177
+ "u": 86,
178
+ "v": 87,
179
+ "w": 88,
180
+ "x": 89,
181
+ "y": 90,
182
+ "z": 91,
183
+ "|": 92,
184
+ "}": 93,
185
+ "~": 94,
186
+ "¡": 95,
187
+ "¢": 96,
188
+ "£": 97,
189
+ "¤": 98,
190
+ "¥": 99,
191
+ "¦": 100,
192
+ "§": 101,
193
+ "¨": 102,
194
+ "©": 103,
195
+ "ª": 104,
196
+ "«": 105,
197
+ "¬": 106,
198
+ "®": 107,
199
+ "¯": 108,
200
+ "°": 109,
201
+ "±": 110,
202
+ "²": 111,
203
+ "³": 112,
204
+ "´": 113,
205
+ "µ": 114,
206
+ "¶": 115,
207
+ "·": 116,
208
+ "¸": 117,
209
+ "¹": 118,
210
+ "º": 119,
211
+ "»": 120,
212
+ "¼": 121,
213
+ "½": 122,
214
+ "¾": 123,
215
+ "¿": 124,
216
+ "Â": 125,
217
+ "Ã": 126,
218
+ "Ä": 127,
219
+ "Å": 128,
220
+ "Æ": 129,
221
+ "Ç": 130,
222
+ "È": 131,
223
+ "É": 132,
224
+ "Ê": 133,
225
+ "Ë": 134,
226
+ "Ì": 135,
227
+ "Í": 136,
228
+ "Î": 137,
229
+ "Ï": 138,
230
+ "Ð": 139,
231
+ "Ñ": 140,
232
+ "Ö": 141,
233
+ "×": 142,
234
+ "Ø": 143,
235
+ "Ù": 144,
236
+ "Ü": 145,
237
+ "à": 146,
238
+ "á": 147,
239
+ "â": 148,
240
+ "ã": 149,
241
+ "ä": 150,
242
+ "å": 151,
243
+ "æ": 152,
244
+ "ç": 153,
245
+ "è": 154,
246
+ "é": 155,
247
+ "ë": 156,
248
+ "ì": 157,
249
+ "ï": 158,
250
+ "Ċ": 159,
251
+ "Ġ": 160,
252
+ "Ģ": 161,
253
+ "ģ": 162,
254
+ "Ĥ": 163,
255
+ "ĥ": 164,
256
+ "Ħ": 165,
257
+ "ħ": 166,
258
+ "Ĩ": 167,
259
+ "ĩ": 168,
260
+ "Ī": 169,
261
+ "ī": 170,
262
+ "Ĭ": 171,
263
+ "ĭ": 172,
264
+ "Į": 173,
265
+ "į": 174,
266
+ "İ": 175,
267
+ "ı": 176,
268
+ "IJ": 177,
269
+ "ij": 178,
270
+ "Ĵ": 179,
271
+ "ĵ": 180,
272
+ "Ķ": 181,
273
+ "ķ": 182,
274
+ "ĸ": 183,
275
+ "Ĺ": 184,
276
+ "ĺ": 185,
277
+ "Ļ": 186,
278
+ "ļ": 187,
279
+ "Ľ": 188,
280
+ "ľ": 189,
281
+ "Ŀ": 190,
282
+ "ŀ": 191,
283
+ "Ł": 192,
284
+ "ł": 193,
285
+ "Ń": 194,
286
+ "e</w>": 195,
287
+ "d</w>": 196,
288
+ "a</w>": 197,
289
+ "o</w>": 198,
290
+ "n</w>": 199,
291
+ "±</w>": 200,
292
+ "l</w>": 201,
293
+ "m</w>": 202,
294
+ "h</w>": 203,
295
+ "r</w>": 204,
296
+ "i</w>": 205,
297
+ "s</w>": 206,
298
+ "Z</w>": 207,
299
+ "t</w>": 208,
300
+ "f</w>": 209,
301
+ "k</w>": 210,
302
+ "y</w>": 211,
303
+ "b</w>": 212,
304
+ "F</w>": 213,
305
+ "g</w>": 214,
306
+ "7</w>": 215,
307
+ "0</w>": 216,
308
+ "p</w>": 217,
309
+ "L</w>": 218,
310
+ "H</w>": 219,
311
+ "¡</w>": 220,
312
+ "Ī</w>": 221,
313
+ "1</w>": 222,
314
+ "Ģ</w>": 223,
315
+ "c</w>": 224,
316
+ "ĩ</w>": 225,
317
+ "6</w>": 226,
318
+ "A</w>": 227,
319
+ "z</w>": 228,
320
+ "u</w>": 229,
321
+ "S</w>": 230,
322
+ "2</w>": 231,
323
+ "v</w>": 232,
324
+ "4</w>": 233,
325
+ "M</w>": 234,
326
+ "T</w>": 235,
327
+ "8</w>": 236,
328
+ "I</w>": 237,
329
+ "N</w>": 238,
330
+ "C</w>": 239,
331
+ "5</w>": 240,
332
+ "¹</w>": 241,
333
+ "9</w>": 242,
334
+ "3</w>": 243,
335
+ "ī</w>": 244,
336
+ "P</w>": 245,
337
+ "E</w>": 246,
338
+ "»</w>": 247,
339
+ "V</w>": 248,
340
+ "İ</w>": 249,
341
+ "w</w>": 250,
342
+ "J</w>": 251,
343
+ "ł</w>": 252,
344
+ ".</w>": 253,
345
+ "K</w>": 254,
346
+ "D</w>": 255,
347
+ "Ķ</w>": 256,
348
+ "¸</w>": 257,
349
+ "B</w>": 258,
350
+ "©</w>": 259,
351
+ "º</w>": 260,
352
+ "µ</w>": 261,
353
+ "Ĥ</w>": 262,
354
+ "X</w>": 263,
355
+ "R</w>": 264,
356
+ "O</w>": 265,
357
+ "«</w>": 266,
358
+ "Ļ</w>": 267,
359
+ "U</w>": 268,
360
+ "x</w>": 269,
361
+ "[</w>": 270,
362
+ "¿</w>": 271,
363
+ "³</w>": 272,
364
+ "ģ</w>": 273,
365
+ "W</w>": 274,
366
+ "§</w>": 275,
367
+ "-</w>": 276,
368
+ "ĸ</w>": 277,
369
+ "Ħ</w>": 278,
370
+ ",</w>": 279,
371
+ "q</w>": 280,
372
+ "ħ</w>": 281,
373
+ "¨</w>": 282,
374
+ "G</w>": 283,
375
+ "²</w>": 284,
376
+ "ĺ</w>": 285,
377
+ "ª</w>": 286,
378
+ "¯</w>": 287,
379
+ "j</w>": 288,
380
+ "]</w>": 289,
381
+ "ļ</w>": 290,
382
+ "Ŀ</w>": 291,
383
+ "¤</w>": 292,
384
+ "ŀ</w>": 293,
385
+ "½</w>": 294,
386
+ "IJ</w>": 295,
387
+ "'</w>": 296,
388
+ "Ń</w>": 297,
389
+ "°</w>": 298,
390
+ "ľ</w>": 299,
391
+ "></w>": 300,
392
+ "¶</w>": 301,
393
+ "į</w>": 302,
394
+ "¦</w>": 303,
395
+ "|</w>": 304,
396
+ "¼</w>": 305,
397
+ "¢</w>": 306,
398
+ "´</w>": 307,
399
+ "Ĩ</w>": 308,
400
+ "Q</w>": 309,
401
+ "Y</w>": 310,
402
+ "Ľ</w>": 311,
403
+ "ĵ</w>": 312,
404
+ "ij</w>": 313,
405
+ "ķ</w>": 314,
406
+ "Ĭ</w>": 315,
407
+ "¾</w>": 316,
408
+ ";</w>": 317,
409
+ "(</w>": 318,
410
+ "¬</w>": 319,
411
+ "@</w>": 320,
412
+ "ĭ</w>": 321,
413
+ "Ĺ</w>": 322,
414
+ "£</w>": 323,
415
+ "Į</w>": 324,
416
+ "#</w>": 325,
417
+ "·</w>": 326,
418
+ "*</w>": 327,
419
+ "Ĵ</w>": 328,
420
+ "®</w>": 329,
421
+ ")</w>": 330,
422
+ "^</w>": 331,
423
+ "ı</w>": 332,
424
+ "Ġ</w>": 333,
425
+ "_</w>": 334,
426
+ "Ł</w>": 335,
427
+ "}</w>": 336,
428
+ "ĥ</w>": 337,
429
+ "\\</w>": 338,
430
+ "¥</w>": 339,
431
+ "<</w>": 340,
432
+ "+</w>": 341,
433
+ "=</w>": 342,
434
+ "~</w>": 343,
435
+ "\"</w>": 344,
436
+ "!</w>": 345,
437
+ "?</w>": 346,
438
+ "`</w>": 347,
439
+ "$</w>": 348,
440
+ "Ċ</w>": 349,
441
+ "/</w>": 350,
442
+ "%</w>": 351,
443
+ "&</w>": 352,
444
+ ":</w>": 353,
445
+ "Ġt": 354,
446
+ "Ġth": 355,
447
+ "Ġa": 356,
448
+ "Ġthe</w>": 357,
449
+ "in": 358,
450
+ "Ġo": 359,
451
+ "Ġ,</w>": 360,
452
+ "Ġs": 361,
453
+ "ed</w>": 362,
454
+ "Ġw": 363,
455
+ "er": 364,
456
+ "Ġ.</w>": 365,
457
+ "Ġi": 366,
458
+ "re": 367,
459
+ "Ġc": 368,
460
+ "nd</w>": 369,
461
+ "Ġf": 370,
462
+ "Ġb": 371,
463
+ "at": 372,
464
+ "Ġof</w>": 373,
465
+ "er</w>": 374,
466
+ "en": 375,
467
+ "ar": 376,
468
+ "or": 377,
469
+ "it": 378,
470
+ "Ġp": 379,
471
+ "Ġh": 380,
472
+ "Ġand</w>": 381,
473
+ "on": 382,
474
+ "ing</w>": 383,
475
+ "an": 384,
476
+ "ro": 385,
477
+ "Ġm": 386,
478
+ "Ġd": 387,
479
+ "es</w>": 388,
480
+ "Ġin</w>": 389,
481
+ "on</w>": 390,
482
+ "Ġto</w>": 391,
483
+ "ou": 392,
484
+ "is": 393,
485
+ "Ġa</w>": 394,
486
+ "ic": 395,
487
+ "ĠT": 396,
488
+ "al": 397,
489
+ "Ġl": 398,
490
+ "Ġ=</w>": 399,
491
+ "Ġre": 400,
492
+ "Ġ\"</w>": 401,
493
+ "es": 402,
494
+ "ĠS": 403,
495
+ "as</w>": 404,
496
+ "al</w>": 405,
497
+ "il": 406,
498
+ "el": 407,
499
+ "ion</w>": 408,
500
+ "ĠA": 409,
501
+ "ĠC": 410,
502
+ "Ġ1": 411,
503
+ "ĠĊ</w>": 412,
504
+ "ur": 413,
505
+ "ĠTh": 414,
506
+ "Ġn": 415,
507
+ "as": 416,
508
+ "Ġ@": 417,
509
+ "ec": 418,
510
+ "om": 419,
511
+ "ac": 420,
512
+ "Ġe": 421,
513
+ "Ġwas</w>": 422,
514
+ "ĠM": 423,
515
+ "or</w>": 424,
516
+ "an</w>": 425,
517
+ "am": 426,
518
+ "en</w>": 427,
519
+ "ol": 428,
520
+ "Ġin": 429,
521
+ "Ġg": 430,
522
+ "Ġ'</w>": 431,
523
+ "ĠB": 432,
524
+ "ly</w>": 433,
525
+ "at</w>": 434,
526
+ "iv": 435,
527
+ "ts</w>": 436,
528
+ "ĠThe</w>": 437,
529
+ "us": 438,
530
+ "-@</w>": 439,
531
+ "Ġ@-@</w>": 440,
532
+ "is</w>": 441,
533
+ "ĠI": 442,
534
+ "Ġwh": 443,
535
+ "ig": 444,
536
+ "ĠH": 445,
537
+ "Ġst": 446,
538
+ "os": 447,
539
+ "un": 448,
540
+ "th": 449,
541
+ "ĠP": 450,
542
+ "Ġwit": 451,
543
+ "Ġthat</w>": 452,
544
+ "ir": 453,
545
+ "Ġas</w>": 454,
546
+ "em": 455,
547
+ "Ġon</w>": 456,
548
+ "ra": 457,
549
+ "Ġfor</w>": 458,
550
+ "ĠR": 459,
551
+ "et": 460,
552
+ "ow": 461,
553
+ "Ġ2": 462,
554
+ "id": 463,
555
+ "ĠD": 464,
556
+ "le</w>": 465,
557
+ "Ġwith</w>": 466,
558
+ "la": 467,
559
+ "ent</w>": 468,
560
+ "im": 469,
561
+ "ĠF": 470,
562
+ "ea": 471,
563
+ "ion": 472,
564
+ "Ġby</w>": 473,
565
+ "Ġ)</w>": 474,
566
+ "Ġ(</w>": 475,
567
+ "Ġal": 476,
568
+ "Ġcon": 477,
569
+ "ent": 478,
570
+ "ĠW": 479,
571
+ "Ġis</w>": 480,
572
+ "ere</w>": 481,
573
+ "ĠG": 482,
574
+ "ĠN": 483,
575
+ "ĠL": 484,
576
+ "Ġha": 485,
577
+ "ers</w>": 486,
578
+ "ri": 487,
579
+ "th</w>": 488,
580
+ "ted</w>": 489,
581
+ "uc": 490,
582
+ "ĠJ": 491,
583
+ "Ġ19": 492,
584
+ "ev": 493,
585
+ "ul": 494,
586
+ "Ġv": 495,
587
+ "ce</w>": 496,
588
+ "ation</w>": 497,
589
+ "rom</w>": 498,
590
+ "Ġbe": 499,
591
+ "ĠE": 500,
592
+ "in</w>": 501,
593
+ "Ġthe": 502,
594
+ "Ġfrom</w>": 503,
595
+ "ĠO": 504,
596
+ "ter</w>": 505,
597
+ "Ġpro": 506,
598
+ "Ġar": 507,
599
+ "ad": 508,
600
+ "Ġcom": 509,
601
+ "ic</w>": 510,
602
+ "ag": 511,
603
+ "Ġhis</w>": 512,
604
+ "Ġsh": 513,
605
+ "Ġat</w>": 514,
606
+ "ov": 515,
607
+ "ies</w>": 516,
608
+ "oo": 517,
609
+ "pp": 518,
610
+ "st": 519,
611
+ "ch": 520,
612
+ "Ġr": 521,
613
+ "Ġ20": 522,
614
+ "ay</w>": 523,
615
+ "if": 524,
616
+ "Ġwere</w>": 525,
617
+ "Ġch": 526,
618
+ "ut</w>": 527,
619
+ "st</w>": 528,
620
+ "ut": 529,
621
+ "ds</w>": 530,
622
+ "op": 531,
623
+ "um": 532,
624
+ "Ġit</w>": 533,
625
+ "oc": 534,
626
+ "ter": 535,
627
+ "le": 536,
628
+ "igh": 537,
629
+ "ud": 538,
630
+ "Ġex": 539,
631
+ "ions</w>": 540,
632
+ "ate</w>": 541,
633
+ "ity</w>": 542,
634
+ "ated</w>": 543,
635
+ "Ġun": 544,
636
+ "ep": 545,
637
+ "qu": 546,
638
+ "Ġno": 547,
639
+ "ĠK": 548,
640
+ "ive</w>": 549,
641
+ "ist": 550,
642
+ "Ġon": 551,
643
+ "ame</w>": 552,
644
+ "oun": 553,
645
+ "ir</w>": 554,
646
+ "ab": 555,
647
+ "Ġâ": 556,
648
+ "ing": 557,
649
+ "Ġhe</w>": 558,
650
+ "ld</w>": 559,
651
+ "ug": 560,
652
+ "ich</w>": 561,
653
+ "Ġan</w>": 562,
654
+ "ed": 563,
655
+ "Ġk": 564,
656
+ "ĠâĢ": 565,
657
+ "Ġhad</w>": 566,
658
+ "ve</w>": 567,
659
+ "ain": 568,
660
+ "Ġse": 569,
661
+ "tion</w>": 570,
662
+ "ore</w>": 571,
663
+ "res": 572,
664
+ "Ġwhich</w>": 573,
665
+ "ĠIn</w>": 574,
666
+ "od": 575,
667
+ "ther</w>": 576,
668
+ "ak": 577,
669
+ "Ġsp": 578,
670
+ "ar</w>": 579,
671
+ "Ġy": 580,
672
+ "ĠCh": 581,
673
+ "ong</w>": 582,
674
+ "Ġac": 583,
675
+ "est</w>": 584,
676
+ "ĠU": 585,
677
+ "ap": 586,
678
+ "ff": 587,
679
+ "ally</w>": 588,
680
+ "rit": 589,
681
+ "ĠSt": 590,
682
+ "ub": 591,
683
+ "ge</w>": 592,
684
+ "ber</w>": 593,
685
+ "et</w>": 594,
686
+ "Ġbe</w>": 595,
687
+ "ear": 596,
688
+ "Ġrec": 597,
689
+ "ers": 598,
690
+ "Ġfir": 599,
691
+ "ot": 600,
692
+ "Ġare</w>": 601,
693
+ "Ġan": 602,
694
+ "ch</w>": 603,
695
+ "og": 604,
696
+ "ia</w>": 605,
697
+ "est": 606,
698
+ "ine</w>": 607,
699
+ "ill": 608,
700
+ "and": 609,
701
+ "el</w>": 610,
702
+ "ary</w>": 611,
703
+ "ew</w>": 612,
704
+ "id</w>": 613,
705
+ "Ġfor": 614,
706
+ "Ġ;</w>": 615,
707
+ "Ġcomp": 616,
708
+ "ĠV": 617,
709
+ "Ġinc": 618,
710
+ "tr": 619,
711
+ "Ġ200": 620,
712
+ "Ġtheir</w>": 621,
713
+ "us</w>": 622,
714
+ "Ġbut</w>": 623,
715
+ "ran": 624,
716
+ "ical</w>": 625,
717
+ "Ġfirst</w>": 626,
718
+ "Ġde": 627,
719
+ "Ġint": 628,
720
+ "Ġro": 629,
721
+ "so</w>": 630,
722
+ "ĠâĢĵ</w>": 631,
723
+ "Ġnot</w>": 632,
724
+ "ding</w>": 633,
725
+ "fter</w>": 634,
726
+ "ure</w>": 635,
727
+ "Ġpar": 636,
728
+ "Ġ:</w>": 637,
729
+ "ian</w>": 638,
730
+ "Ġtw": 639,
731
+ "ould</w>": 640,
732
+ "Ġalso</w>": 641,
733
+ "Ġits</w>": 642,
734
+ "Ġwor": 643,
735
+ "um</w>": 644,
736
+ "Ġor</w>": 645,
737
+ "ost</w>": 646,
738
+ "00</w>": 647,
739
+ "our": 648,
740
+ "ard</w>": 649,
741
+ "Ġres": 650,
742
+ "mp": 651,
743
+ "ue</w>": 652,
744
+ "Ġab": 653,
745
+ "ish</w>": 654,
746
+ "Ġcont": 655,
747
+ "Ġad": 656,
748
+ "own</w>": 657,
749
+ "all</w>": 658,
750
+ "oug": 659,
751
+ "Ġher</w>": 660,
752
+ "ast</w>": 661,
753
+ "Ġen": 662,
754
+ "ome</w>": 663,
755
+ "all": 664,
756
+ "ded</w>": 665,
757
+ "ow</w>": 666,
758
+ "Ġhave</w>": 667,
759
+ "Ġus": 668,
760
+ "ear</w>": 669,
761
+ "ack</w>": 670,
762
+ "duc": 671,
763
+ "ial</w>": 672,
764
+ "ss": 673,
765
+ "ents</w>": 674,
766
+ "ain</w>": 675,
767
+ "ting</w>": 676,
768
+ "Ġone</w>": 677,
769
+ "ess": 678,
770
+ "Ġhas</w>": 679,
771
+ "ight</w>": 680,
772
+ "av": 681,
773
+ "Ġev": 682,
774
+ "out</w>": 683,
775
+ "ay": 684,
776
+ "ence</w>": 685,
777
+ "Ġbeen</w>": 686,
778
+ "ew": 687,
779
+ "Ġtwo</w>": 688,
780
+ "Ġcl": 689,
781
+ "der</w>": 690,
782
+ "ime</w>": 691,
783
+ "ks</w>": 692,
784
+ "ess</w>": 693,
785
+ "ish": 694,
786
+ ".@</w>": 695,
787
+ "Ġ@.@</w>": 696,
788
+ "Ġpla": 697,
789
+ "Ġpl": 698,
790
+ "Ġor": 699,
791
+ "up</w>": 700,
792
+ "ment</w>": 701,
793
+ "uring</w>": 702,
794
+ "oll": 703,
795
+ "ĠIn": 704,
796
+ "Ġthis</w>": 705,
797
+ "Ġbec": 706,
798
+ "Ġcomm": 707,
799
+ "Ġdis": 708,
800
+ "ater</w>": 709,
801
+ "age</w>": 710,
802
+ "Ġapp": 711,
803
+ "ous</w>": 712,
804
+ "ey</w>": 713,
805
+ "il</w>": 714,
806
+ "per": 715,
807
+ "ĠAl": 716,
808
+ "ional</w>": 717,
809
+ "lud": 718,
810
+ "ely</w>": 719,
811
+ "tt": 720,
812
+ "ile</w>": 721,
813
+ "iz": 722,
814
+ "Ġj": 723,
815
+ "Ġwho</w>": 724,
816
+ "Ġag": 725,
817
+ "ib": 726,
818
+ "Ġthey</w>": 727,
819
+ "for": 728,
820
+ "Ġov": 729,
821
+ "ath": 730,
822
+ "eg": 731,
823
+ "Ġsc": 732,
824
+ "ip": 733,
825
+ "Ġ201": 734,
826
+ "Ġ3": 735,
827
+ "Ġper": 736,
828
+ "ory</w>": 737,
829
+ "Ġdes": 738,
830
+ "ide</w>": 739,
831
+ "Ġser": 740,
832
+ "se</w>": 741,
833
+ "ĠHe</w>": 742,
834
+ "land</w>": 743,
835
+ "ations</w>": 744,
836
+ "ric": 745,
837
+ "it</w>": 746,
838
+ "res</w>": 747,
839
+ "ered</w>": 748,
840
+ "Ġpre": 749,
841
+ "ĠSh": 750,
842
+ "ance</w>": 751,
843
+ "ort</w>": 752,
844
+ "ant</w>": 753,
845
+ ",@</w>": 754,
846
+ "Ġ@,@</w>": 755,
847
+ "ell</w>": 756,
848
+ "ĠY": 757,
849
+ "ned</w>": 758,
850
+ "ell": 759,
851
+ "ite</w>": 760,
852
+ "Ġinclud": 761,
853
+ "Ġrep": 762,
854
+ "Ġafter</w>": 763,
855
+ "Ġsuc": 764,
856
+ "ree</w>": 765,
857
+ "any</w>": 766,
858
+ "im</w>": 767,
859
+ "ort": 768,
860
+ "Ġ18": 769,
861
+ "Ġsu": 770,
862
+ "ade</w>": 771,
863
+ "our</w>": 772,
864
+ "ĠUn": 773,
865
+ "ĠIt</w>": 774,
866
+ "ik": 775,
867
+ "ĠMar": 776,
868
+ "ember</w>": 777,
869
+ "Ġ1</w>": 778,
870
+ "een</w>": 779,
871
+ "and</w>": 780,
872
+ "Ġsec": 781,
873
+ "ice</w>": 782,
874
+ "Ġtime</w>": 783,
875
+ "ĠAn": 784,
876
+ "Ġinto</w>": 785,
877
+ "Ġfin": 786,
878
+ "Ġother</w>": 787,
879
+ "Ġatt": 788,
880
+ "ill</w>": 789,
881
+ "ren": 790,
882
+ "ach": 791,
883
+ "ass": 792,
884
+ "eral</w>": 793,
885
+ "ese</w>": 794,
886
+ "sh": 795,
887
+ "als</w>": 796,
888
+ "ition</w>": 797,
889
+ "ough</w>": 798,
890
+ "les</w>": 799,
891
+ "amp": 800,
892
+ "Ġwould</w>": 801,
893
+ "Ġmore</w>": 802,
894
+ "roug": 803,
895
+ "rib": 804,
896
+ "ery</w>": 805,
897
+ "ace</w>": 806,
898
+ "ĠA</w>": 807,
899
+ "Ġplay": 808,
900
+ "ited</w>": 809,
901
+ "ked</w>": 810,
902
+ "ist</w>": 811,
903
+ "ied</w>": 812,
904
+ "Ġ2</w>": 813,
905
+ "ased</w>": 814,
906
+ "ings</w>": 815,
907
+ "ang": 816,
908
+ "am</w>": 817,
909
+ "ip</w>": 818,
910
+ "Ġbo": 819,
911
+ "able</w>": 820,
912
+ "ty</w>": 821,
913
+ "Ġchar": 822,
914
+ "Ġcent": 823,
915
+ "etw": 824,
916
+ "ates</w>": 825,
917
+ "rop": 826,
918
+ "ĠI</w>": 827,
919
+ "und</w>": 828,
920
+ "ĠAm": 829,
921
+ "ces</w>": 830,
922
+ "oin": 831,
923
+ "Ġinter": 832,
924
+ "up": 833,
925
+ "ct": 834,
926
+ "one</w>": 835,
927
+ "Ġtra": 836,
928
+ "ant": 837,
929
+ "ect": 838,
930
+ "Ġall</w>": 839,
931
+ "ef": 840,
932
+ "Ġcons": 841,
933
+ "ubl": 842,
934
+ "ning</w>": 843,
935
+ "ans</w>": 844,
936
+ "Ġfe": 845,
937
+ "ust</w>": 846,
938
+ "Ġ0": 847,
939
+ "Ġrem": 848,
940
+ "ase</w>": 849,
941
+ "ong": 850,
942
+ "Ġwhen</w>": 851,
943
+ "eb": 852,
944
+ "ĠWh": 853,
945
+ "Ġear": 854,
946
+ "ever</w>": 855,
947
+ "Ġover</w>": 856,
948
+ "Ġkn": 857,
949
+ "aus": 858,
950
+ "Ġpos": 859,
951
+ "ad</w>": 860,
952
+ "erm": 861,
953
+ "Ġshe</w>": 862,
954
+ "Ġra": 863,
955
+ "Ġduring</w>": 864,
956
+ "ason</w>": 865,
957
+ "vi": 866,
958
+ "Ġexp": 867,
959
+ "Ġlea": 868,
960
+ "Ġel": 869,
961
+ "Ġ4": 870,
962
+ "Ġonly</w>": 871,
963
+ "ond</w>": 872,
964
+ "Ġdec": 873,
965
+ "Ġacc": 874,
966
+ "Ġoff": 875,
967
+ "iss": 876,
968
+ "Ġfl": 877,
969
+ "ĠEn": 878,
970
+ "ot</w>": 879,
971
+ "ens": 880,
972
+ "ose</w>": 881,
973
+ "ake</w>": 882,
974
+ "om</w>": 883,
975
+ "Ġsev": 884,
976
+ "ach</w>": 885,
977
+ "etween</w>": 886,
978
+ "ern": 887,
979
+ "Ġ3</w>": 888,
980
+ "Ġpr": 889,
981
+ "Ġgro": 890,
982
+ "ruc": 891,
983
+ "Ġdi": 892,
984
+ "Ġ199": 893,
985
+ "ĠAr": 894,
986
+ "Ġgame</w>": 895,
987
+ "Ġhim</w>": 896,
988
+ "ook</w>": 897,
989
+ "Ġup</w>": 898,
990
+ "Ġabout</w>": 899,
991
+ "Ġrel": 900,
992
+ "form": 901,
993
+ "Ġthree</w>": 902,
994
+ "att": 903,
995
+ "ĠCom": 904,
996
+ "Ġsa": 905,
997
+ "ears</w>": 906,
998
+ "Ġ5": 907,
999
+ "ry</w>": 908,
1000
+ "Ġimp": 909,
1001
+ "Ġmost</w>": 910,
1002
+ "fer": 911,
1003
+ "Ġpres": 912,
1004
+ "Ġfil": 913,
1005
+ "Ġbetween</w>": 914,
1006
+ "Ġbeg": 915,
1007
+ "ph": 916,
1008
+ "ors</w>": 917,
1009
+ "Ġthan</w>": 918,
1010
+ "Ġrecor": 919,
1011
+ "ob": 920,
1012
+ "eric": 921,
1013
+ "ating</w>": 922,
1014
+ "Ġthroug": 923,
1015
+ "king</w>": 924,
1016
+ "Ġout</w>": 925,
1017
+ "Ġnum": 926,
1018
+ "ood</w>": 927,
1019
+ "ollow": 928,
1020
+ "act": 929,
1021
+ "uil": 930,
1022
+ "Ġcre": 931,
1023
+ "olog": 932,
1024
+ "ational</w>": 933,
1025
+ "Ġproduc": 934,
1026
+ "Ġwhile</w>": 935,
1027
+ "Ġlater</w>": 936,
1028
+ "Ġwrit": 937,
1029
+ "ex": 938,
1030
+ "Ġstar": 939,
1031
+ "Ġspec": 940,
1032
+ "ee": 941,
1033
+ "ished</w>": 942,
1034
+ "Ġreg": 943,
1035
+ "ision</w>": 944,
1036
+ "outh</w>": 945,
1037
+ "Ġrele": 946,
1038
+ "Ġass": 947,
1039
+ "Ġseason</w>": 948,
1040
+ "Ġmade</w>": 949,
1041
+ "ily</w>": 950,
1042
+ "ru": 951,
1043
+ "oy": 952,
1044
+ "tur": 953,
1045
+ "te</w>": 954,
1046
+ "Ġqu": 955,
1047
+ "Ġmov": 956,
1048
+ "ury</w>": 957,
1049
+ "ĠAmeric": 958,
1050
+ "ement</w>": 959,
1051
+ "cc": 960,
1052
+ "ound</w>": 961,
1053
+ "Ġlar": 962,
1054
+ "Ġform": 963,
1055
+ "ect</w>": 964,
1056
+ "Ġdef": 965,
1057
+ "Ġmus": 966,
1058
+ "ĠPar": 967,
1059
+ "Ġme": 968,
1060
+ "Ġsub": 969,
1061
+ "way</w>": 970,
1062
+ "op</w>": 971,
1063
+ "oh": 972,
1064
+ "eld</w>": 973,
1065
+ "ie</w>": 974,
1066
+ "emp": 975,
1067
+ "ames</w>": 976,
1068
+ "ern</w>": 977,
1069
+ "Ġnor": 978,
1070
+ "ived</w>": 979,
1071
+ "evel": 980,
1072
+ "Ġsuch</w>": 981,
1073
+ "ards</w>": 982,
1074
+ "Ġind": 983,
1075
+ "ike</w>": 984,
1076
+ "Ġgen": 985,
1077
+ "ert": 986,
1078
+ "Ġyear</w>": 987,
1079
+ "Ġused</w>": 988,
1080
+ "Ġnew</w>": 989,
1081
+ "Ġ5</w>": 990,
1082
+ "Ġalb": 991,
1083
+ "sp": 992,
1084
+ "yp": 993,
1085
+ "Ġwith": 994,
1086
+ "Ġwhere</w>": 995,
1087
+ "ics</w>": 996,
1088
+ "ĠThis</w>": 997,
1089
+ "Ġthem</w>": 998,
1090
+ "wn</w>": 999
1091
+ },
1092
+ "merges": [
1093
+ [
1094
+ "Ġ",
1095
+ "t"
1096
+ ],
1097
+ [
1098
+ "Ġt",
1099
+ "h"
1100
+ ],
1101
+ [
1102
+ "Ġ",
1103
+ "a"
1104
+ ],
1105
+ [
1106
+ "Ġth",
1107
+ "e</w>"
1108
+ ],
1109
+ [
1110
+ "i",
1111
+ "n"
1112
+ ],
1113
+ [
1114
+ "Ġ",
1115
+ "o"
1116
+ ],
1117
+ [
1118
+ "Ġ",
1119
+ ",</w>"
1120
+ ],
1121
+ [
1122
+ "Ġ",
1123
+ "s"
1124
+ ],
1125
+ [
1126
+ "e",
1127
+ "d</w>"
1128
+ ],
1129
+ [
1130
+ "Ġ",
1131
+ "w"
1132
+ ],
1133
+ [
1134
+ "e",
1135
+ "r"
1136
+ ],
1137
+ [
1138
+ "Ġ",
1139
+ ".</w>"
1140
+ ],
1141
+ [
1142
+ "Ġ",
1143
+ "i"
1144
+ ],
1145
+ [
1146
+ "r",
1147
+ "e"
1148
+ ],
1149
+ [
1150
+ "Ġ",
1151
+ "c"
1152
+ ],
1153
+ [
1154
+ "n",
1155
+ "d</w>"
1156
+ ],
1157
+ [
1158
+ "Ġ",
1159
+ "f"
1160
+ ],
1161
+ [
1162
+ "Ġ",
1163
+ "b"
1164
+ ],
1165
+ [
1166
+ "a",
1167
+ "t"
1168
+ ],
1169
+ [
1170
+ "Ġo",
1171
+ "f</w>"
1172
+ ],
1173
+ [
1174
+ "e",
1175
+ "r</w>"
1176
+ ],
1177
+ [
1178
+ "e",
1179
+ "n"
1180
+ ],
1181
+ [
1182
+ "a",
1183
+ "r"
1184
+ ],
1185
+ [
1186
+ "o",
1187
+ "r"
1188
+ ],
1189
+ [
1190
+ "i",
1191
+ "t"
1192
+ ],
1193
+ [
1194
+ "Ġ",
1195
+ "p"
1196
+ ],
1197
+ [
1198
+ "Ġ",
1199
+ "h"
1200
+ ],
1201
+ [
1202
+ "Ġa",
1203
+ "nd</w>"
1204
+ ],
1205
+ [
1206
+ "o",
1207
+ "n"
1208
+ ],
1209
+ [
1210
+ "in",
1211
+ "g</w>"
1212
+ ],
1213
+ [
1214
+ "a",
1215
+ "n"
1216
+ ],
1217
+ [
1218
+ "r",
1219
+ "o"
1220
+ ],
1221
+ [
1222
+ "Ġ",
1223
+ "m"
1224
+ ],
1225
+ [
1226
+ "Ġ",
1227
+ "d"
1228
+ ],
1229
+ [
1230
+ "e",
1231
+ "s</w>"
1232
+ ],
1233
+ [
1234
+ "Ġi",
1235
+ "n</w>"
1236
+ ],
1237
+ [
1238
+ "o",
1239
+ "n</w>"
1240
+ ],
1241
+ [
1242
+ "Ġt",
1243
+ "o</w>"
1244
+ ],
1245
+ [
1246
+ "o",
1247
+ "u"
1248
+ ],
1249
+ [
1250
+ "i",
1251
+ "s"
1252
+ ],
1253
+ [
1254
+ "Ġ",
1255
+ "a</w>"
1256
+ ],
1257
+ [
1258
+ "i",
1259
+ "c"
1260
+ ],
1261
+ [
1262
+ "Ġ",
1263
+ "T"
1264
+ ],
1265
+ [
1266
+ "a",
1267
+ "l"
1268
+ ],
1269
+ [
1270
+ "Ġ",
1271
+ "l"
1272
+ ],
1273
+ [
1274
+ "Ġ",
1275
+ "=</w>"
1276
+ ],
1277
+ [
1278
+ "Ġ",
1279
+ "re"
1280
+ ],
1281
+ [
1282
+ "Ġ",
1283
+ "\"</w>"
1284
+ ],
1285
+ [
1286
+ "e",
1287
+ "s"
1288
+ ],
1289
+ [
1290
+ "Ġ",
1291
+ "S"
1292
+ ],
1293
+ [
1294
+ "a",
1295
+ "s</w>"
1296
+ ],
1297
+ [
1298
+ "a",
1299
+ "l</w>"
1300
+ ],
1301
+ [
1302
+ "i",
1303
+ "l"
1304
+ ],
1305
+ [
1306
+ "e",
1307
+ "l"
1308
+ ],
1309
+ [
1310
+ "i",
1311
+ "on</w>"
1312
+ ],
1313
+ [
1314
+ "Ġ",
1315
+ "A"
1316
+ ],
1317
+ [
1318
+ "Ġ",
1319
+ "C"
1320
+ ],
1321
+ [
1322
+ "Ġ",
1323
+ "1"
1324
+ ],
1325
+ [
1326
+ "Ġ",
1327
+ "Ċ</w>"
1328
+ ],
1329
+ [
1330
+ "u",
1331
+ "r"
1332
+ ],
1333
+ [
1334
+ "ĠT",
1335
+ "h"
1336
+ ],
1337
+ [
1338
+ "Ġ",
1339
+ "n"
1340
+ ],
1341
+ [
1342
+ "a",
1343
+ "s"
1344
+ ],
1345
+ [
1346
+ "Ġ",
1347
+ "@"
1348
+ ],
1349
+ [
1350
+ "e",
1351
+ "c"
1352
+ ],
1353
+ [
1354
+ "o",
1355
+ "m"
1356
+ ],
1357
+ [
1358
+ "a",
1359
+ "c"
1360
+ ],
1361
+ [
1362
+ "Ġ",
1363
+ "e"
1364
+ ],
1365
+ [
1366
+ "Ġw",
1367
+ "as</w>"
1368
+ ],
1369
+ [
1370
+ "Ġ",
1371
+ "M"
1372
+ ],
1373
+ [
1374
+ "o",
1375
+ "r</w>"
1376
+ ],
1377
+ [
1378
+ "a",
1379
+ "n</w>"
1380
+ ],
1381
+ [
1382
+ "a",
1383
+ "m"
1384
+ ],
1385
+ [
1386
+ "e",
1387
+ "n</w>"
1388
+ ],
1389
+ [
1390
+ "o",
1391
+ "l"
1392
+ ],
1393
+ [
1394
+ "Ġ",
1395
+ "in"
1396
+ ],
1397
+ [
1398
+ "Ġ",
1399
+ "g"
1400
+ ],
1401
+ [
1402
+ "Ġ",
1403
+ "'</w>"
1404
+ ],
1405
+ [
1406
+ "Ġ",
1407
+ "B"
1408
+ ],
1409
+ [
1410
+ "l",
1411
+ "y</w>"
1412
+ ],
1413
+ [
1414
+ "a",
1415
+ "t</w>"
1416
+ ],
1417
+ [
1418
+ "i",
1419
+ "v"
1420
+ ],
1421
+ [
1422
+ "t",
1423
+ "s</w>"
1424
+ ],
1425
+ [
1426
+ "ĠTh",
1427
+ "e</w>"
1428
+ ],
1429
+ [
1430
+ "u",
1431
+ "s"
1432
+ ],
1433
+ [
1434
+ "-",
1435
+ "@</w>"
1436
+ ],
1437
+ [
1438
+ "Ġ@",
1439
+ "-@</w>"
1440
+ ],
1441
+ [
1442
+ "i",
1443
+ "s</w>"
1444
+ ],
1445
+ [
1446
+ "Ġ",
1447
+ "I"
1448
+ ],
1449
+ [
1450
+ "Ġw",
1451
+ "h"
1452
+ ],
1453
+ [
1454
+ "i",
1455
+ "g"
1456
+ ],
1457
+ [
1458
+ "Ġ",
1459
+ "H"
1460
+ ],
1461
+ [
1462
+ "Ġs",
1463
+ "t"
1464
+ ],
1465
+ [
1466
+ "o",
1467
+ "s"
1468
+ ],
1469
+ [
1470
+ "u",
1471
+ "n"
1472
+ ],
1473
+ [
1474
+ "t",
1475
+ "h"
1476
+ ],
1477
+ [
1478
+ "Ġ",
1479
+ "P"
1480
+ ],
1481
+ [
1482
+ "Ġw",
1483
+ "it"
1484
+ ],
1485
+ [
1486
+ "Ġth",
1487
+ "at</w>"
1488
+ ],
1489
+ [
1490
+ "i",
1491
+ "r"
1492
+ ],
1493
+ [
1494
+ "Ġa",
1495
+ "s</w>"
1496
+ ],
1497
+ [
1498
+ "e",
1499
+ "m"
1500
+ ],
1501
+ [
1502
+ "Ġo",
1503
+ "n</w>"
1504
+ ],
1505
+ [
1506
+ "r",
1507
+ "a"
1508
+ ],
1509
+ [
1510
+ "Ġf",
1511
+ "or</w>"
1512
+ ],
1513
+ [
1514
+ "Ġ",
1515
+ "R"
1516
+ ],
1517
+ [
1518
+ "e",
1519
+ "t"
1520
+ ],
1521
+ [
1522
+ "o",
1523
+ "w"
1524
+ ],
1525
+ [
1526
+ "Ġ",
1527
+ "2"
1528
+ ],
1529
+ [
1530
+ "i",
1531
+ "d"
1532
+ ],
1533
+ [
1534
+ "Ġ",
1535
+ "D"
1536
+ ],
1537
+ [
1538
+ "l",
1539
+ "e</w>"
1540
+ ],
1541
+ [
1542
+ "Ġwit",
1543
+ "h</w>"
1544
+ ],
1545
+ [
1546
+ "l",
1547
+ "a"
1548
+ ],
1549
+ [
1550
+ "en",
1551
+ "t</w>"
1552
+ ],
1553
+ [
1554
+ "i",
1555
+ "m"
1556
+ ],
1557
+ [
1558
+ "Ġ",
1559
+ "F"
1560
+ ],
1561
+ [
1562
+ "e",
1563
+ "a"
1564
+ ],
1565
+ [
1566
+ "i",
1567
+ "on"
1568
+ ],
1569
+ [
1570
+ "Ġb",
1571
+ "y</w>"
1572
+ ],
1573
+ [
1574
+ "Ġ",
1575
+ ")</w>"
1576
+ ],
1577
+ [
1578
+ "Ġ",
1579
+ "(</w>"
1580
+ ],
1581
+ [
1582
+ "Ġa",
1583
+ "l"
1584
+ ],
1585
+ [
1586
+ "Ġc",
1587
+ "on"
1588
+ ],
1589
+ [
1590
+ "en",
1591
+ "t"
1592
+ ],
1593
+ [
1594
+ "Ġ",
1595
+ "W"
1596
+ ],
1597
+ [
1598
+ "Ġi",
1599
+ "s</w>"
1600
+ ],
1601
+ [
1602
+ "er",
1603
+ "e</w>"
1604
+ ],
1605
+ [
1606
+ "Ġ",
1607
+ "G"
1608
+ ],
1609
+ [
1610
+ "Ġ",
1611
+ "N"
1612
+ ],
1613
+ [
1614
+ "Ġ",
1615
+ "L"
1616
+ ],
1617
+ [
1618
+ "Ġh",
1619
+ "a"
1620
+ ],
1621
+ [
1622
+ "er",
1623
+ "s</w>"
1624
+ ],
1625
+ [
1626
+ "r",
1627
+ "i"
1628
+ ],
1629
+ [
1630
+ "t",
1631
+ "h</w>"
1632
+ ],
1633
+ [
1634
+ "t",
1635
+ "ed</w>"
1636
+ ],
1637
+ [
1638
+ "u",
1639
+ "c"
1640
+ ],
1641
+ [
1642
+ "Ġ",
1643
+ "J"
1644
+ ],
1645
+ [
1646
+ "Ġ1",
1647
+ "9"
1648
+ ],
1649
+ [
1650
+ "e",
1651
+ "v"
1652
+ ],
1653
+ [
1654
+ "u",
1655
+ "l"
1656
+ ],
1657
+ [
1658
+ "Ġ",
1659
+ "v"
1660
+ ],
1661
+ [
1662
+ "c",
1663
+ "e</w>"
1664
+ ],
1665
+ [
1666
+ "at",
1667
+ "ion</w>"
1668
+ ],
1669
+ [
1670
+ "ro",
1671
+ "m</w>"
1672
+ ],
1673
+ [
1674
+ "Ġb",
1675
+ "e"
1676
+ ],
1677
+ [
1678
+ "Ġ",
1679
+ "E"
1680
+ ],
1681
+ [
1682
+ "i",
1683
+ "n</w>"
1684
+ ],
1685
+ [
1686
+ "Ġth",
1687
+ "e"
1688
+ ],
1689
+ [
1690
+ "Ġf",
1691
+ "rom</w>"
1692
+ ],
1693
+ [
1694
+ "Ġ",
1695
+ "O"
1696
+ ],
1697
+ [
1698
+ "t",
1699
+ "er</w>"
1700
+ ],
1701
+ [
1702
+ "Ġp",
1703
+ "ro"
1704
+ ],
1705
+ [
1706
+ "Ġa",
1707
+ "r"
1708
+ ],
1709
+ [
1710
+ "a",
1711
+ "d"
1712
+ ],
1713
+ [
1714
+ "Ġc",
1715
+ "om"
1716
+ ],
1717
+ [
1718
+ "i",
1719
+ "c</w>"
1720
+ ],
1721
+ [
1722
+ "a",
1723
+ "g"
1724
+ ],
1725
+ [
1726
+ "Ġh",
1727
+ "is</w>"
1728
+ ],
1729
+ [
1730
+ "Ġs",
1731
+ "h"
1732
+ ],
1733
+ [
1734
+ "Ġa",
1735
+ "t</w>"
1736
+ ],
1737
+ [
1738
+ "o",
1739
+ "v"
1740
+ ],
1741
+ [
1742
+ "i",
1743
+ "es</w>"
1744
+ ],
1745
+ [
1746
+ "o",
1747
+ "o"
1748
+ ],
1749
+ [
1750
+ "p",
1751
+ "p"
1752
+ ],
1753
+ [
1754
+ "s",
1755
+ "t"
1756
+ ],
1757
+ [
1758
+ "c",
1759
+ "h"
1760
+ ],
1761
+ [
1762
+ "Ġ",
1763
+ "r"
1764
+ ],
1765
+ [
1766
+ "Ġ2",
1767
+ "0"
1768
+ ],
1769
+ [
1770
+ "a",
1771
+ "y</w>"
1772
+ ],
1773
+ [
1774
+ "i",
1775
+ "f"
1776
+ ],
1777
+ [
1778
+ "Ġw",
1779
+ "ere</w>"
1780
+ ],
1781
+ [
1782
+ "Ġc",
1783
+ "h"
1784
+ ],
1785
+ [
1786
+ "u",
1787
+ "t</w>"
1788
+ ],
1789
+ [
1790
+ "s",
1791
+ "t</w>"
1792
+ ],
1793
+ [
1794
+ "u",
1795
+ "t"
1796
+ ],
1797
+ [
1798
+ "d",
1799
+ "s</w>"
1800
+ ],
1801
+ [
1802
+ "o",
1803
+ "p"
1804
+ ],
1805
+ [
1806
+ "u",
1807
+ "m"
1808
+ ],
1809
+ [
1810
+ "Ġi",
1811
+ "t</w>"
1812
+ ],
1813
+ [
1814
+ "o",
1815
+ "c"
1816
+ ],
1817
+ [
1818
+ "t",
1819
+ "er"
1820
+ ],
1821
+ [
1822
+ "l",
1823
+ "e"
1824
+ ],
1825
+ [
1826
+ "ig",
1827
+ "h"
1828
+ ],
1829
+ [
1830
+ "u",
1831
+ "d"
1832
+ ],
1833
+ [
1834
+ "Ġe",
1835
+ "x"
1836
+ ],
1837
+ [
1838
+ "ion",
1839
+ "s</w>"
1840
+ ],
1841
+ [
1842
+ "at",
1843
+ "e</w>"
1844
+ ],
1845
+ [
1846
+ "it",
1847
+ "y</w>"
1848
+ ],
1849
+ [
1850
+ "at",
1851
+ "ed</w>"
1852
+ ],
1853
+ [
1854
+ "Ġ",
1855
+ "un"
1856
+ ],
1857
+ [
1858
+ "e",
1859
+ "p"
1860
+ ],
1861
+ [
1862
+ "q",
1863
+ "u"
1864
+ ],
1865
+ [
1866
+ "Ġn",
1867
+ "o"
1868
+ ],
1869
+ [
1870
+ "Ġ",
1871
+ "K"
1872
+ ],
1873
+ [
1874
+ "iv",
1875
+ "e</w>"
1876
+ ],
1877
+ [
1878
+ "is",
1879
+ "t"
1880
+ ],
1881
+ [
1882
+ "Ġo",
1883
+ "n"
1884
+ ],
1885
+ [
1886
+ "am",
1887
+ "e</w>"
1888
+ ],
1889
+ [
1890
+ "ou",
1891
+ "n"
1892
+ ],
1893
+ [
1894
+ "i",
1895
+ "r</w>"
1896
+ ],
1897
+ [
1898
+ "a",
1899
+ "b"
1900
+ ],
1901
+ [
1902
+ "Ġ",
1903
+ "â"
1904
+ ],
1905
+ [
1906
+ "in",
1907
+ "g"
1908
+ ],
1909
+ [
1910
+ "Ġh",
1911
+ "e</w>"
1912
+ ],
1913
+ [
1914
+ "l",
1915
+ "d</w>"
1916
+ ],
1917
+ [
1918
+ "u",
1919
+ "g"
1920
+ ],
1921
+ [
1922
+ "ic",
1923
+ "h</w>"
1924
+ ],
1925
+ [
1926
+ "Ġa",
1927
+ "n</w>"
1928
+ ],
1929
+ [
1930
+ "e",
1931
+ "d"
1932
+ ],
1933
+ [
1934
+ "Ġ",
1935
+ "k"
1936
+ ],
1937
+ [
1938
+ "Ġâ",
1939
+ "Ģ"
1940
+ ],
1941
+ [
1942
+ "Ġha",
1943
+ "d</w>"
1944
+ ],
1945
+ [
1946
+ "v",
1947
+ "e</w>"
1948
+ ],
1949
+ [
1950
+ "a",
1951
+ "in"
1952
+ ],
1953
+ [
1954
+ "Ġs",
1955
+ "e"
1956
+ ],
1957
+ [
1958
+ "t",
1959
+ "ion</w>"
1960
+ ],
1961
+ [
1962
+ "or",
1963
+ "e</w>"
1964
+ ],
1965
+ [
1966
+ "re",
1967
+ "s"
1968
+ ],
1969
+ [
1970
+ "Ġwh",
1971
+ "ich</w>"
1972
+ ],
1973
+ [
1974
+ "ĠI",
1975
+ "n</w>"
1976
+ ],
1977
+ [
1978
+ "o",
1979
+ "d"
1980
+ ],
1981
+ [
1982
+ "th",
1983
+ "er</w>"
1984
+ ],
1985
+ [
1986
+ "a",
1987
+ "k"
1988
+ ],
1989
+ [
1990
+ "Ġs",
1991
+ "p"
1992
+ ],
1993
+ [
1994
+ "a",
1995
+ "r</w>"
1996
+ ],
1997
+ [
1998
+ "Ġ",
1999
+ "y"
2000
+ ],
2001
+ [
2002
+ "ĠC",
2003
+ "h"
2004
+ ],
2005
+ [
2006
+ "on",
2007
+ "g</w>"
2008
+ ],
2009
+ [
2010
+ "Ġa",
2011
+ "c"
2012
+ ],
2013
+ [
2014
+ "es",
2015
+ "t</w>"
2016
+ ],
2017
+ [
2018
+ "Ġ",
2019
+ "U"
2020
+ ],
2021
+ [
2022
+ "a",
2023
+ "p"
2024
+ ],
2025
+ [
2026
+ "f",
2027
+ "f"
2028
+ ],
2029
+ [
2030
+ "al",
2031
+ "ly</w>"
2032
+ ],
2033
+ [
2034
+ "r",
2035
+ "it"
2036
+ ],
2037
+ [
2038
+ "ĠS",
2039
+ "t"
2040
+ ],
2041
+ [
2042
+ "u",
2043
+ "b"
2044
+ ],
2045
+ [
2046
+ "g",
2047
+ "e</w>"
2048
+ ],
2049
+ [
2050
+ "b",
2051
+ "er</w>"
2052
+ ],
2053
+ [
2054
+ "e",
2055
+ "t</w>"
2056
+ ],
2057
+ [
2058
+ "Ġb",
2059
+ "e</w>"
2060
+ ],
2061
+ [
2062
+ "e",
2063
+ "ar"
2064
+ ],
2065
+ [
2066
+ "Ġre",
2067
+ "c"
2068
+ ],
2069
+ [
2070
+ "er",
2071
+ "s"
2072
+ ],
2073
+ [
2074
+ "Ġf",
2075
+ "ir"
2076
+ ],
2077
+ [
2078
+ "o",
2079
+ "t"
2080
+ ],
2081
+ [
2082
+ "Ġar",
2083
+ "e</w>"
2084
+ ],
2085
+ [
2086
+ "Ġa",
2087
+ "n"
2088
+ ],
2089
+ [
2090
+ "c",
2091
+ "h</w>"
2092
+ ],
2093
+ [
2094
+ "o",
2095
+ "g"
2096
+ ],
2097
+ [
2098
+ "i",
2099
+ "a</w>"
2100
+ ],
2101
+ [
2102
+ "es",
2103
+ "t"
2104
+ ],
2105
+ [
2106
+ "in",
2107
+ "e</w>"
2108
+ ],
2109
+ [
2110
+ "il",
2111
+ "l"
2112
+ ],
2113
+ [
2114
+ "an",
2115
+ "d"
2116
+ ],
2117
+ [
2118
+ "e",
2119
+ "l</w>"
2120
+ ],
2121
+ [
2122
+ "ar",
2123
+ "y</w>"
2124
+ ],
2125
+ [
2126
+ "e",
2127
+ "w</w>"
2128
+ ],
2129
+ [
2130
+ "i",
2131
+ "d</w>"
2132
+ ],
2133
+ [
2134
+ "Ġf",
2135
+ "or"
2136
+ ],
2137
+ [
2138
+ "Ġ",
2139
+ ";</w>"
2140
+ ],
2141
+ [
2142
+ "Ġcom",
2143
+ "p"
2144
+ ],
2145
+ [
2146
+ "Ġ",
2147
+ "V"
2148
+ ],
2149
+ [
2150
+ "Ġin",
2151
+ "c"
2152
+ ],
2153
+ [
2154
+ "t",
2155
+ "r"
2156
+ ],
2157
+ [
2158
+ "Ġ20",
2159
+ "0"
2160
+ ],
2161
+ [
2162
+ "Ġthe",
2163
+ "ir</w>"
2164
+ ],
2165
+ [
2166
+ "u",
2167
+ "s</w>"
2168
+ ],
2169
+ [
2170
+ "Ġb",
2171
+ "ut</w>"
2172
+ ],
2173
+ [
2174
+ "r",
2175
+ "an"
2176
+ ],
2177
+ [
2178
+ "ic",
2179
+ "al</w>"
2180
+ ],
2181
+ [
2182
+ "Ġfir",
2183
+ "st</w>"
2184
+ ],
2185
+ [
2186
+ "Ġd",
2187
+ "e"
2188
+ ],
2189
+ [
2190
+ "Ġin",
2191
+ "t"
2192
+ ],
2193
+ [
2194
+ "Ġ",
2195
+ "ro"
2196
+ ],
2197
+ [
2198
+ "s",
2199
+ "o</w>"
2200
+ ],
2201
+ [
2202
+ "ĠâĢ",
2203
+ "ĵ</w>"
2204
+ ],
2205
+ [
2206
+ "Ġno",
2207
+ "t</w>"
2208
+ ],
2209
+ [
2210
+ "d",
2211
+ "ing</w>"
2212
+ ],
2213
+ [
2214
+ "f",
2215
+ "ter</w>"
2216
+ ],
2217
+ [
2218
+ "ur",
2219
+ "e</w>"
2220
+ ],
2221
+ [
2222
+ "Ġp",
2223
+ "ar"
2224
+ ],
2225
+ [
2226
+ "Ġ",
2227
+ ":</w>"
2228
+ ],
2229
+ [
2230
+ "i",
2231
+ "an</w>"
2232
+ ],
2233
+ [
2234
+ "Ġt",
2235
+ "w"
2236
+ ],
2237
+ [
2238
+ "ou",
2239
+ "ld</w>"
2240
+ ],
2241
+ [
2242
+ "Ġal",
2243
+ "so</w>"
2244
+ ],
2245
+ [
2246
+ "Ġi",
2247
+ "ts</w>"
2248
+ ],
2249
+ [
2250
+ "Ġw",
2251
+ "or"
2252
+ ],
2253
+ [
2254
+ "u",
2255
+ "m</w>"
2256
+ ],
2257
+ [
2258
+ "Ġo",
2259
+ "r</w>"
2260
+ ],
2261
+ [
2262
+ "os",
2263
+ "t</w>"
2264
+ ],
2265
+ [
2266
+ "0",
2267
+ "0</w>"
2268
+ ],
2269
+ [
2270
+ "ou",
2271
+ "r"
2272
+ ],
2273
+ [
2274
+ "ar",
2275
+ "d</w>"
2276
+ ],
2277
+ [
2278
+ "Ġre",
2279
+ "s"
2280
+ ],
2281
+ [
2282
+ "m",
2283
+ "p"
2284
+ ],
2285
+ [
2286
+ "u",
2287
+ "e</w>"
2288
+ ],
2289
+ [
2290
+ "Ġa",
2291
+ "b"
2292
+ ],
2293
+ [
2294
+ "is",
2295
+ "h</w>"
2296
+ ],
2297
+ [
2298
+ "Ġcon",
2299
+ "t"
2300
+ ],
2301
+ [
2302
+ "Ġa",
2303
+ "d"
2304
+ ],
2305
+ [
2306
+ "ow",
2307
+ "n</w>"
2308
+ ],
2309
+ [
2310
+ "al",
2311
+ "l</w>"
2312
+ ],
2313
+ [
2314
+ "ou",
2315
+ "g"
2316
+ ],
2317
+ [
2318
+ "Ġh",
2319
+ "er</w>"
2320
+ ],
2321
+ [
2322
+ "as",
2323
+ "t</w>"
2324
+ ],
2325
+ [
2326
+ "Ġ",
2327
+ "en"
2328
+ ],
2329
+ [
2330
+ "om",
2331
+ "e</w>"
2332
+ ],
2333
+ [
2334
+ "al",
2335
+ "l"
2336
+ ],
2337
+ [
2338
+ "d",
2339
+ "ed</w>"
2340
+ ],
2341
+ [
2342
+ "o",
2343
+ "w</w>"
2344
+ ],
2345
+ [
2346
+ "Ġha",
2347
+ "ve</w>"
2348
+ ],
2349
+ [
2350
+ "Ġ",
2351
+ "us"
2352
+ ],
2353
+ [
2354
+ "ea",
2355
+ "r</w>"
2356
+ ],
2357
+ [
2358
+ "ac",
2359
+ "k</w>"
2360
+ ],
2361
+ [
2362
+ "d",
2363
+ "uc"
2364
+ ],
2365
+ [
2366
+ "i",
2367
+ "al</w>"
2368
+ ],
2369
+ [
2370
+ "s",
2371
+ "s"
2372
+ ],
2373
+ [
2374
+ "en",
2375
+ "ts</w>"
2376
+ ],
2377
+ [
2378
+ "a",
2379
+ "in</w>"
2380
+ ],
2381
+ [
2382
+ "t",
2383
+ "ing</w>"
2384
+ ],
2385
+ [
2386
+ "Ġon",
2387
+ "e</w>"
2388
+ ],
2389
+ [
2390
+ "es",
2391
+ "s"
2392
+ ],
2393
+ [
2394
+ "Ġh",
2395
+ "as</w>"
2396
+ ],
2397
+ [
2398
+ "igh",
2399
+ "t</w>"
2400
+ ],
2401
+ [
2402
+ "a",
2403
+ "v"
2404
+ ],
2405
+ [
2406
+ "Ġe",
2407
+ "v"
2408
+ ],
2409
+ [
2410
+ "ou",
2411
+ "t</w>"
2412
+ ],
2413
+ [
2414
+ "a",
2415
+ "y"
2416
+ ],
2417
+ [
2418
+ "en",
2419
+ "ce</w>"
2420
+ ],
2421
+ [
2422
+ "Ġbe",
2423
+ "en</w>"
2424
+ ],
2425
+ [
2426
+ "e",
2427
+ "w"
2428
+ ],
2429
+ [
2430
+ "Ġtw",
2431
+ "o</w>"
2432
+ ],
2433
+ [
2434
+ "Ġc",
2435
+ "l"
2436
+ ],
2437
+ [
2438
+ "d",
2439
+ "er</w>"
2440
+ ],
2441
+ [
2442
+ "im",
2443
+ "e</w>"
2444
+ ],
2445
+ [
2446
+ "k",
2447
+ "s</w>"
2448
+ ],
2449
+ [
2450
+ "es",
2451
+ "s</w>"
2452
+ ],
2453
+ [
2454
+ "is",
2455
+ "h"
2456
+ ],
2457
+ [
2458
+ ".",
2459
+ "@</w>"
2460
+ ],
2461
+ [
2462
+ "Ġ@",
2463
+ ".@</w>"
2464
+ ],
2465
+ [
2466
+ "Ġp",
2467
+ "la"
2468
+ ],
2469
+ [
2470
+ "Ġp",
2471
+ "l"
2472
+ ],
2473
+ [
2474
+ "Ġo",
2475
+ "r"
2476
+ ],
2477
+ [
2478
+ "u",
2479
+ "p</w>"
2480
+ ],
2481
+ [
2482
+ "m",
2483
+ "ent</w>"
2484
+ ],
2485
+ [
2486
+ "ur",
2487
+ "ing</w>"
2488
+ ],
2489
+ [
2490
+ "ol",
2491
+ "l"
2492
+ ],
2493
+ [
2494
+ "ĠI",
2495
+ "n"
2496
+ ],
2497
+ [
2498
+ "Ġth",
2499
+ "is</w>"
2500
+ ],
2501
+ [
2502
+ "Ġb",
2503
+ "ec"
2504
+ ],
2505
+ [
2506
+ "Ġcom",
2507
+ "m"
2508
+ ],
2509
+ [
2510
+ "Ġd",
2511
+ "is"
2512
+ ],
2513
+ [
2514
+ "at",
2515
+ "er</w>"
2516
+ ],
2517
+ [
2518
+ "ag",
2519
+ "e</w>"
2520
+ ],
2521
+ [
2522
+ "Ġa",
2523
+ "pp"
2524
+ ],
2525
+ [
2526
+ "ou",
2527
+ "s</w>"
2528
+ ],
2529
+ [
2530
+ "e",
2531
+ "y</w>"
2532
+ ],
2533
+ [
2534
+ "i",
2535
+ "l</w>"
2536
+ ],
2537
+ [
2538
+ "p",
2539
+ "er"
2540
+ ],
2541
+ [
2542
+ "ĠA",
2543
+ "l"
2544
+ ],
2545
+ [
2546
+ "ion",
2547
+ "al</w>"
2548
+ ],
2549
+ [
2550
+ "l",
2551
+ "ud"
2552
+ ],
2553
+ [
2554
+ "el",
2555
+ "y</w>"
2556
+ ],
2557
+ [
2558
+ "t",
2559
+ "t"
2560
+ ],
2561
+ [
2562
+ "il",
2563
+ "e</w>"
2564
+ ],
2565
+ [
2566
+ "i",
2567
+ "z"
2568
+ ],
2569
+ [
2570
+ "Ġ",
2571
+ "j"
2572
+ ],
2573
+ [
2574
+ "Ġwh",
2575
+ "o</w>"
2576
+ ],
2577
+ [
2578
+ "Ġa",
2579
+ "g"
2580
+ ],
2581
+ [
2582
+ "i",
2583
+ "b"
2584
+ ],
2585
+ [
2586
+ "Ġthe",
2587
+ "y</w>"
2588
+ ],
2589
+ [
2590
+ "f",
2591
+ "or"
2592
+ ],
2593
+ [
2594
+ "Ġo",
2595
+ "v"
2596
+ ],
2597
+ [
2598
+ "at",
2599
+ "h"
2600
+ ],
2601
+ [
2602
+ "e",
2603
+ "g"
2604
+ ],
2605
+ [
2606
+ "Ġs",
2607
+ "c"
2608
+ ],
2609
+ [
2610
+ "i",
2611
+ "p"
2612
+ ],
2613
+ [
2614
+ "Ġ20",
2615
+ "1"
2616
+ ],
2617
+ [
2618
+ "Ġ",
2619
+ "3"
2620
+ ],
2621
+ [
2622
+ "Ġp",
2623
+ "er"
2624
+ ],
2625
+ [
2626
+ "or",
2627
+ "y</w>"
2628
+ ],
2629
+ [
2630
+ "Ġd",
2631
+ "es"
2632
+ ],
2633
+ [
2634
+ "id",
2635
+ "e</w>"
2636
+ ],
2637
+ [
2638
+ "Ġs",
2639
+ "er"
2640
+ ],
2641
+ [
2642
+ "s",
2643
+ "e</w>"
2644
+ ],
2645
+ [
2646
+ "ĠH",
2647
+ "e</w>"
2648
+ ],
2649
+ [
2650
+ "la",
2651
+ "nd</w>"
2652
+ ],
2653
+ [
2654
+ "at",
2655
+ "ions</w>"
2656
+ ],
2657
+ [
2658
+ "r",
2659
+ "ic"
2660
+ ],
2661
+ [
2662
+ "i",
2663
+ "t</w>"
2664
+ ],
2665
+ [
2666
+ "re",
2667
+ "s</w>"
2668
+ ],
2669
+ [
2670
+ "er",
2671
+ "ed</w>"
2672
+ ],
2673
+ [
2674
+ "Ġp",
2675
+ "re"
2676
+ ],
2677
+ [
2678
+ "ĠS",
2679
+ "h"
2680
+ ],
2681
+ [
2682
+ "an",
2683
+ "ce</w>"
2684
+ ],
2685
+ [
2686
+ "or",
2687
+ "t</w>"
2688
+ ],
2689
+ [
2690
+ "an",
2691
+ "t</w>"
2692
+ ],
2693
+ [
2694
+ ",",
2695
+ "@</w>"
2696
+ ],
2697
+ [
2698
+ "Ġ@",
2699
+ ",@</w>"
2700
+ ],
2701
+ [
2702
+ "el",
2703
+ "l</w>"
2704
+ ],
2705
+ [
2706
+ "Ġ",
2707
+ "Y"
2708
+ ],
2709
+ [
2710
+ "n",
2711
+ "ed</w>"
2712
+ ],
2713
+ [
2714
+ "el",
2715
+ "l"
2716
+ ],
2717
+ [
2718
+ "it",
2719
+ "e</w>"
2720
+ ],
2721
+ [
2722
+ "Ġinc",
2723
+ "lud"
2724
+ ],
2725
+ [
2726
+ "Ġre",
2727
+ "p"
2728
+ ],
2729
+ [
2730
+ "Ġa",
2731
+ "fter</w>"
2732
+ ],
2733
+ [
2734
+ "Ġs",
2735
+ "uc"
2736
+ ],
2737
+ [
2738
+ "re",
2739
+ "e</w>"
2740
+ ],
2741
+ [
2742
+ "an",
2743
+ "y</w>"
2744
+ ],
2745
+ [
2746
+ "i",
2747
+ "m</w>"
2748
+ ],
2749
+ [
2750
+ "or",
2751
+ "t"
2752
+ ],
2753
+ [
2754
+ "Ġ1",
2755
+ "8"
2756
+ ],
2757
+ [
2758
+ "Ġs",
2759
+ "u"
2760
+ ],
2761
+ [
2762
+ "ad",
2763
+ "e</w>"
2764
+ ],
2765
+ [
2766
+ "ou",
2767
+ "r</w>"
2768
+ ],
2769
+ [
2770
+ "ĠU",
2771
+ "n"
2772
+ ],
2773
+ [
2774
+ "ĠI",
2775
+ "t</w>"
2776
+ ],
2777
+ [
2778
+ "i",
2779
+ "k"
2780
+ ],
2781
+ [
2782
+ "ĠM",
2783
+ "ar"
2784
+ ],
2785
+ [
2786
+ "em",
2787
+ "ber</w>"
2788
+ ],
2789
+ [
2790
+ "Ġ",
2791
+ "1</w>"
2792
+ ],
2793
+ [
2794
+ "e",
2795
+ "en</w>"
2796
+ ],
2797
+ [
2798
+ "a",
2799
+ "nd</w>"
2800
+ ],
2801
+ [
2802
+ "Ġs",
2803
+ "ec"
2804
+ ],
2805
+ [
2806
+ "ic",
2807
+ "e</w>"
2808
+ ],
2809
+ [
2810
+ "Ġt",
2811
+ "ime</w>"
2812
+ ],
2813
+ [
2814
+ "ĠA",
2815
+ "n"
2816
+ ],
2817
+ [
2818
+ "Ġint",
2819
+ "o</w>"
2820
+ ],
2821
+ [
2822
+ "Ġf",
2823
+ "in"
2824
+ ],
2825
+ [
2826
+ "Ġo",
2827
+ "ther</w>"
2828
+ ],
2829
+ [
2830
+ "Ġa",
2831
+ "tt"
2832
+ ],
2833
+ [
2834
+ "il",
2835
+ "l</w>"
2836
+ ],
2837
+ [
2838
+ "re",
2839
+ "n"
2840
+ ],
2841
+ [
2842
+ "ac",
2843
+ "h"
2844
+ ],
2845
+ [
2846
+ "as",
2847
+ "s"
2848
+ ],
2849
+ [
2850
+ "er",
2851
+ "al</w>"
2852
+ ],
2853
+ [
2854
+ "es",
2855
+ "e</w>"
2856
+ ],
2857
+ [
2858
+ "s",
2859
+ "h"
2860
+ ],
2861
+ [
2862
+ "al",
2863
+ "s</w>"
2864
+ ],
2865
+ [
2866
+ "it",
2867
+ "ion</w>"
2868
+ ],
2869
+ [
2870
+ "oug",
2871
+ "h</w>"
2872
+ ],
2873
+ [
2874
+ "l",
2875
+ "es</w>"
2876
+ ],
2877
+ [
2878
+ "am",
2879
+ "p"
2880
+ ],
2881
+ [
2882
+ "Ġw",
2883
+ "ould</w>"
2884
+ ],
2885
+ [
2886
+ "Ġm",
2887
+ "ore</w>"
2888
+ ],
2889
+ [
2890
+ "ro",
2891
+ "ug"
2892
+ ],
2893
+ [
2894
+ "ri",
2895
+ "b"
2896
+ ],
2897
+ [
2898
+ "er",
2899
+ "y</w>"
2900
+ ],
2901
+ [
2902
+ "ac",
2903
+ "e</w>"
2904
+ ],
2905
+ [
2906
+ "Ġ",
2907
+ "A</w>"
2908
+ ],
2909
+ [
2910
+ "Ġpla",
2911
+ "y"
2912
+ ],
2913
+ [
2914
+ "it",
2915
+ "ed</w>"
2916
+ ],
2917
+ [
2918
+ "k",
2919
+ "ed</w>"
2920
+ ],
2921
+ [
2922
+ "is",
2923
+ "t</w>"
2924
+ ],
2925
+ [
2926
+ "i",
2927
+ "ed</w>"
2928
+ ],
2929
+ [
2930
+ "Ġ",
2931
+ "2</w>"
2932
+ ],
2933
+ [
2934
+ "as",
2935
+ "ed</w>"
2936
+ ],
2937
+ [
2938
+ "ing",
2939
+ "s</w>"
2940
+ ],
2941
+ [
2942
+ "an",
2943
+ "g"
2944
+ ],
2945
+ [
2946
+ "a",
2947
+ "m</w>"
2948
+ ],
2949
+ [
2950
+ "i",
2951
+ "p</w>"
2952
+ ],
2953
+ [
2954
+ "Ġb",
2955
+ "o"
2956
+ ],
2957
+ [
2958
+ "ab",
2959
+ "le</w>"
2960
+ ],
2961
+ [
2962
+ "t",
2963
+ "y</w>"
2964
+ ],
2965
+ [
2966
+ "Ġch",
2967
+ "ar"
2968
+ ],
2969
+ [
2970
+ "Ġc",
2971
+ "ent"
2972
+ ],
2973
+ [
2974
+ "et",
2975
+ "w"
2976
+ ],
2977
+ [
2978
+ "at",
2979
+ "es</w>"
2980
+ ],
2981
+ [
2982
+ "ro",
2983
+ "p"
2984
+ ],
2985
+ [
2986
+ "Ġ",
2987
+ "I</w>"
2988
+ ],
2989
+ [
2990
+ "u",
2991
+ "nd</w>"
2992
+ ],
2993
+ [
2994
+ "ĠA",
2995
+ "m"
2996
+ ],
2997
+ [
2998
+ "c",
2999
+ "es</w>"
3000
+ ],
3001
+ [
3002
+ "o",
3003
+ "in"
3004
+ ],
3005
+ [
3006
+ "Ġin",
3007
+ "ter"
3008
+ ],
3009
+ [
3010
+ "u",
3011
+ "p"
3012
+ ],
3013
+ [
3014
+ "c",
3015
+ "t"
3016
+ ],
3017
+ [
3018
+ "on",
3019
+ "e</w>"
3020
+ ],
3021
+ [
3022
+ "Ġt",
3023
+ "ra"
3024
+ ],
3025
+ [
3026
+ "an",
3027
+ "t"
3028
+ ],
3029
+ [
3030
+ "ec",
3031
+ "t"
3032
+ ],
3033
+ [
3034
+ "Ġal",
3035
+ "l</w>"
3036
+ ],
3037
+ [
3038
+ "e",
3039
+ "f"
3040
+ ],
3041
+ [
3042
+ "Ġcon",
3043
+ "s"
3044
+ ],
3045
+ [
3046
+ "ub",
3047
+ "l"
3048
+ ],
3049
+ [
3050
+ "n",
3051
+ "ing</w>"
3052
+ ],
3053
+ [
3054
+ "an",
3055
+ "s</w>"
3056
+ ],
3057
+ [
3058
+ "Ġf",
3059
+ "e"
3060
+ ],
3061
+ [
3062
+ "us",
3063
+ "t</w>"
3064
+ ],
3065
+ [
3066
+ "Ġ",
3067
+ "0"
3068
+ ],
3069
+ [
3070
+ "Ġre",
3071
+ "m"
3072
+ ],
3073
+ [
3074
+ "as",
3075
+ "e</w>"
3076
+ ],
3077
+ [
3078
+ "on",
3079
+ "g"
3080
+ ],
3081
+ [
3082
+ "Ġwh",
3083
+ "en</w>"
3084
+ ],
3085
+ [
3086
+ "e",
3087
+ "b"
3088
+ ],
3089
+ [
3090
+ "ĠW",
3091
+ "h"
3092
+ ],
3093
+ [
3094
+ "Ġe",
3095
+ "ar"
3096
+ ],
3097
+ [
3098
+ "ev",
3099
+ "er</w>"
3100
+ ],
3101
+ [
3102
+ "Ġov",
3103
+ "er</w>"
3104
+ ],
3105
+ [
3106
+ "Ġk",
3107
+ "n"
3108
+ ],
3109
+ [
3110
+ "a",
3111
+ "us"
3112
+ ],
3113
+ [
3114
+ "Ġp",
3115
+ "os"
3116
+ ],
3117
+ [
3118
+ "a",
3119
+ "d</w>"
3120
+ ],
3121
+ [
3122
+ "er",
3123
+ "m"
3124
+ ],
3125
+ [
3126
+ "Ġsh",
3127
+ "e</w>"
3128
+ ],
3129
+ [
3130
+ "Ġ",
3131
+ "ra"
3132
+ ],
3133
+ [
3134
+ "Ġd",
3135
+ "uring</w>"
3136
+ ],
3137
+ [
3138
+ "as",
3139
+ "on</w>"
3140
+ ],
3141
+ [
3142
+ "v",
3143
+ "i"
3144
+ ],
3145
+ [
3146
+ "Ġex",
3147
+ "p"
3148
+ ],
3149
+ [
3150
+ "Ġl",
3151
+ "ea"
3152
+ ],
3153
+ [
3154
+ "Ġ",
3155
+ "el"
3156
+ ],
3157
+ [
3158
+ "Ġ",
3159
+ "4"
3160
+ ],
3161
+ [
3162
+ "Ġon",
3163
+ "ly</w>"
3164
+ ],
3165
+ [
3166
+ "o",
3167
+ "nd</w>"
3168
+ ],
3169
+ [
3170
+ "Ġd",
3171
+ "ec"
3172
+ ],
3173
+ [
3174
+ "Ġac",
3175
+ "c"
3176
+ ],
3177
+ [
3178
+ "Ġo",
3179
+ "ff"
3180
+ ],
3181
+ [
3182
+ "is",
3183
+ "s"
3184
+ ],
3185
+ [
3186
+ "Ġf",
3187
+ "l"
3188
+ ],
3189
+ [
3190
+ "ĠE",
3191
+ "n"
3192
+ ],
3193
+ [
3194
+ "o",
3195
+ "t</w>"
3196
+ ],
3197
+ [
3198
+ "en",
3199
+ "s"
3200
+ ],
3201
+ [
3202
+ "os",
3203
+ "e</w>"
3204
+ ],
3205
+ [
3206
+ "ak",
3207
+ "e</w>"
3208
+ ],
3209
+ [
3210
+ "o",
3211
+ "m</w>"
3212
+ ],
3213
+ [
3214
+ "Ġs",
3215
+ "ev"
3216
+ ],
3217
+ [
3218
+ "ac",
3219
+ "h</w>"
3220
+ ],
3221
+ [
3222
+ "etw",
3223
+ "een</w>"
3224
+ ],
3225
+ [
3226
+ "er",
3227
+ "n"
3228
+ ],
3229
+ [
3230
+ "Ġ",
3231
+ "3</w>"
3232
+ ],
3233
+ [
3234
+ "Ġp",
3235
+ "r"
3236
+ ],
3237
+ [
3238
+ "Ġg",
3239
+ "ro"
3240
+ ],
3241
+ [
3242
+ "r",
3243
+ "uc"
3244
+ ],
3245
+ [
3246
+ "Ġd",
3247
+ "i"
3248
+ ],
3249
+ [
3250
+ "Ġ19",
3251
+ "9"
3252
+ ],
3253
+ [
3254
+ "ĠA",
3255
+ "r"
3256
+ ],
3257
+ [
3258
+ "Ġg",
3259
+ "ame</w>"
3260
+ ],
3261
+ [
3262
+ "Ġh",
3263
+ "im</w>"
3264
+ ],
3265
+ [
3266
+ "oo",
3267
+ "k</w>"
3268
+ ],
3269
+ [
3270
+ "Ġ",
3271
+ "up</w>"
3272
+ ],
3273
+ [
3274
+ "Ġab",
3275
+ "out</w>"
3276
+ ],
3277
+ [
3278
+ "Ġre",
3279
+ "l"
3280
+ ],
3281
+ [
3282
+ "for",
3283
+ "m"
3284
+ ],
3285
+ [
3286
+ "Ġth",
3287
+ "ree</w>"
3288
+ ],
3289
+ [
3290
+ "at",
3291
+ "t"
3292
+ ],
3293
+ [
3294
+ "ĠC",
3295
+ "om"
3296
+ ],
3297
+ [
3298
+ "Ġs",
3299
+ "a"
3300
+ ],
3301
+ [
3302
+ "ear",
3303
+ "s</w>"
3304
+ ],
3305
+ [
3306
+ "Ġ",
3307
+ "5"
3308
+ ],
3309
+ [
3310
+ "r",
3311
+ "y</w>"
3312
+ ],
3313
+ [
3314
+ "Ġi",
3315
+ "mp"
3316
+ ],
3317
+ [
3318
+ "Ġm",
3319
+ "ost</w>"
3320
+ ],
3321
+ [
3322
+ "f",
3323
+ "er"
3324
+ ],
3325
+ [
3326
+ "Ġp",
3327
+ "res"
3328
+ ],
3329
+ [
3330
+ "Ġf",
3331
+ "il"
3332
+ ],
3333
+ [
3334
+ "Ġb",
3335
+ "etween</w>"
3336
+ ],
3337
+ [
3338
+ "Ġbe",
3339
+ "g"
3340
+ ],
3341
+ [
3342
+ "p",
3343
+ "h"
3344
+ ],
3345
+ [
3346
+ "or",
3347
+ "s</w>"
3348
+ ],
3349
+ [
3350
+ "Ġth",
3351
+ "an</w>"
3352
+ ],
3353
+ [
3354
+ "Ġrec",
3355
+ "or"
3356
+ ],
3357
+ [
3358
+ "o",
3359
+ "b"
3360
+ ],
3361
+ [
3362
+ "er",
3363
+ "ic"
3364
+ ],
3365
+ [
3366
+ "at",
3367
+ "ing</w>"
3368
+ ],
3369
+ [
3370
+ "Ġth",
3371
+ "roug"
3372
+ ],
3373
+ [
3374
+ "k",
3375
+ "ing</w>"
3376
+ ],
3377
+ [
3378
+ "Ġo",
3379
+ "ut</w>"
3380
+ ],
3381
+ [
3382
+ "Ġn",
3383
+ "um"
3384
+ ],
3385
+ [
3386
+ "oo",
3387
+ "d</w>"
3388
+ ],
3389
+ [
3390
+ "oll",
3391
+ "ow"
3392
+ ],
3393
+ [
3394
+ "ac",
3395
+ "t"
3396
+ ],
3397
+ [
3398
+ "u",
3399
+ "il"
3400
+ ],
3401
+ [
3402
+ "Ġc",
3403
+ "re"
3404
+ ],
3405
+ [
3406
+ "ol",
3407
+ "og"
3408
+ ],
3409
+ [
3410
+ "at",
3411
+ "ional</w>"
3412
+ ],
3413
+ [
3414
+ "Ġpro",
3415
+ "duc"
3416
+ ],
3417
+ [
3418
+ "Ġwh",
3419
+ "ile</w>"
3420
+ ],
3421
+ [
3422
+ "Ġl",
3423
+ "ater</w>"
3424
+ ],
3425
+ [
3426
+ "Ġw",
3427
+ "rit"
3428
+ ],
3429
+ [
3430
+ "e",
3431
+ "x"
3432
+ ],
3433
+ [
3434
+ "Ġst",
3435
+ "ar"
3436
+ ],
3437
+ [
3438
+ "Ġsp",
3439
+ "ec"
3440
+ ],
3441
+ [
3442
+ "e",
3443
+ "e"
3444
+ ],
3445
+ [
3446
+ "ish",
3447
+ "ed</w>"
3448
+ ],
3449
+ [
3450
+ "Ġre",
3451
+ "g"
3452
+ ],
3453
+ [
3454
+ "is",
3455
+ "ion</w>"
3456
+ ],
3457
+ [
3458
+ "ou",
3459
+ "th</w>"
3460
+ ],
3461
+ [
3462
+ "Ġre",
3463
+ "le"
3464
+ ],
3465
+ [
3466
+ "Ġa",
3467
+ "ss"
3468
+ ],
3469
+ [
3470
+ "Ġse",
3471
+ "ason</w>"
3472
+ ],
3473
+ [
3474
+ "Ġm",
3475
+ "ade</w>"
3476
+ ],
3477
+ [
3478
+ "il",
3479
+ "y</w>"
3480
+ ],
3481
+ [
3482
+ "r",
3483
+ "u"
3484
+ ],
3485
+ [
3486
+ "o",
3487
+ "y"
3488
+ ],
3489
+ [
3490
+ "t",
3491
+ "ur"
3492
+ ],
3493
+ [
3494
+ "t",
3495
+ "e</w>"
3496
+ ],
3497
+ [
3498
+ "Ġ",
3499
+ "qu"
3500
+ ],
3501
+ [
3502
+ "Ġm",
3503
+ "ov"
3504
+ ],
3505
+ [
3506
+ "ur",
3507
+ "y</w>"
3508
+ ],
3509
+ [
3510
+ "ĠAm",
3511
+ "eric"
3512
+ ],
3513
+ [
3514
+ "em",
3515
+ "ent</w>"
3516
+ ],
3517
+ [
3518
+ "c",
3519
+ "c"
3520
+ ],
3521
+ [
3522
+ "ou",
3523
+ "nd</w>"
3524
+ ],
3525
+ [
3526
+ "Ġl",
3527
+ "ar"
3528
+ ],
3529
+ [
3530
+ "Ġfor",
3531
+ "m"
3532
+ ],
3533
+ [
3534
+ "ec",
3535
+ "t</w>"
3536
+ ],
3537
+ [
3538
+ "Ġde",
3539
+ "f"
3540
+ ],
3541
+ [
3542
+ "Ġm",
3543
+ "us"
3544
+ ],
3545
+ [
3546
+ "ĠP",
3547
+ "ar"
3548
+ ],
3549
+ [
3550
+ "Ġm",
3551
+ "e"
3552
+ ],
3553
+ [
3554
+ "Ġs",
3555
+ "ub"
3556
+ ],
3557
+ [
3558
+ "w",
3559
+ "ay</w>"
3560
+ ],
3561
+ [
3562
+ "o",
3563
+ "p</w>"
3564
+ ],
3565
+ [
3566
+ "o",
3567
+ "h"
3568
+ ],
3569
+ [
3570
+ "el",
3571
+ "d</w>"
3572
+ ],
3573
+ [
3574
+ "i",
3575
+ "e</w>"
3576
+ ],
3577
+ [
3578
+ "em",
3579
+ "p"
3580
+ ],
3581
+ [
3582
+ "am",
3583
+ "es</w>"
3584
+ ],
3585
+ [
3586
+ "er",
3587
+ "n</w>"
3588
+ ],
3589
+ [
3590
+ "Ġn",
3591
+ "or"
3592
+ ],
3593
+ [
3594
+ "iv",
3595
+ "ed</w>"
3596
+ ],
3597
+ [
3598
+ "ev",
3599
+ "el"
3600
+ ],
3601
+ [
3602
+ "Ġsuc",
3603
+ "h</w>"
3604
+ ],
3605
+ [
3606
+ "ar",
3607
+ "ds</w>"
3608
+ ],
3609
+ [
3610
+ "Ġin",
3611
+ "d"
3612
+ ],
3613
+ [
3614
+ "ik",
3615
+ "e</w>"
3616
+ ],
3617
+ [
3618
+ "Ġg",
3619
+ "en"
3620
+ ],
3621
+ [
3622
+ "er",
3623
+ "t"
3624
+ ],
3625
+ [
3626
+ "Ġy",
3627
+ "ear</w>"
3628
+ ],
3629
+ [
3630
+ "Ġus",
3631
+ "ed</w>"
3632
+ ],
3633
+ [
3634
+ "Ġn",
3635
+ "ew</w>"
3636
+ ],
3637
+ [
3638
+ "Ġ",
3639
+ "5</w>"
3640
+ ],
3641
+ [
3642
+ "Ġal",
3643
+ "b"
3644
+ ],
3645
+ [
3646
+ "s",
3647
+ "p"
3648
+ ],
3649
+ [
3650
+ "y",
3651
+ "p"
3652
+ ],
3653
+ [
3654
+ "Ġwit",
3655
+ "h"
3656
+ ],
3657
+ [
3658
+ "Ġwh",
3659
+ "ere</w>"
3660
+ ],
3661
+ [
3662
+ "ic",
3663
+ "s</w>"
3664
+ ],
3665
+ [
3666
+ "ĠTh",
3667
+ "is</w>"
3668
+ ],
3669
+ [
3670
+ "Ġthe",
3671
+ "m</w>"
3672
+ ],
3673
+ [
3674
+ "w",
3675
+ "n</w>"
3676
+ ]
3677
+ ]
3678
+ }
3679
+ }
tokenizer/tokenizer_config.json ADDED
@@ -0,0 +1,31 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "add_prefix_space": false,
3
+ "added_tokens_decoder": {
4
+ "0": {
5
+ "content": "<|startoftext|>",
6
+ "lstrip": false,
7
+ "normalized": true,
8
+ "rstrip": false,
9
+ "single_word": false,
10
+ "special": true
11
+ },
12
+ "1": {
13
+ "content": "<|endoftext|>",
14
+ "lstrip": false,
15
+ "normalized": true,
16
+ "rstrip": false,
17
+ "single_word": false,
18
+ "special": true
19
+ }
20
+ },
21
+ "bos_token": "<|startoftext|>",
22
+ "clean_up_tokenization_spaces": false,
23
+ "do_lower_case": true,
24
+ "eos_token": "<|endoftext|>",
25
+ "errors": "replace",
26
+ "extra_special_tokens": {},
27
+ "model_max_length": 77,
28
+ "pad_token": "<|endoftext|>",
29
+ "tokenizer_class": "CLIPTokenizer",
30
+ "unk_token": "<|endoftext|>"
31
+ }
tokenizer/vocab.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"<|startoftext|>":0,"<|endoftext|>":1,"!":2,"\"":3,"#":4,"$":5,"%":6,"&":7,"'":8,"(":9,")":10,"*":11,"+":12,",":13,"-":14,".":15,"/":16,"0":17,"1":18,"2":19,"3":20,"4":21,"5":22,"6":23,"7":24,"8":25,"9":26,":":27,";":28,"<":29,"=":30,">":31,"?":32,"@":33,"A":34,"B":35,"C":36,"D":37,"E":38,"F":39,"G":40,"H":41,"I":42,"J":43,"K":44,"L":45,"M":46,"N":47,"O":48,"P":49,"Q":50,"R":51,"S":52,"T":53,"U":54,"V":55,"W":56,"X":57,"Y":58,"Z":59,"[":60,"\\":61,"]":62,"^":63,"_":64,"`":65,"a":66,"b":67,"c":68,"d":69,"e":70,"f":71,"g":72,"h":73,"i":74,"j":75,"k":76,"l":77,"m":78,"n":79,"o":80,"p":81,"q":82,"r":83,"s":84,"t":85,"u":86,"v":87,"w":88,"x":89,"y":90,"z":91,"|":92,"}":93,"~":94,"¡":95,"¢":96,"£":97,"¤":98,"¥":99,"¦":100,"§":101,"¨":102,"©":103,"ª":104,"«":105,"¬":106,"®":107,"¯":108,"°":109,"±":110,"²":111,"³":112,"´":113,"µ":114,"¶":115,"·":116,"¸":117,"¹":118,"º":119,"»":120,"¼":121,"½":122,"¾":123,"¿":124,"Â":125,"Ã":126,"Ä":127,"Å":128,"Æ":129,"Ç":130,"È":131,"É":132,"Ê":133,"Ë":134,"Ì":135,"Í":136,"Î":137,"Ï":138,"Ð":139,"Ñ":140,"Ö":141,"×":142,"Ø":143,"Ù":144,"Ü":145,"à":146,"á":147,"â":148,"ã":149,"ä":150,"å":151,"æ":152,"ç":153,"è":154,"é":155,"ë":156,"ì":157,"ï":158,"Ċ":159,"Ġ":160,"Ģ":161,"ģ":162,"Ĥ":163,"ĥ":164,"Ħ":165,"ħ":166,"Ĩ":167,"ĩ":168,"Ī":169,"ī":170,"Ĭ":171,"ĭ":172,"Į":173,"į":174,"İ":175,"ı":176,"IJ":177,"ij":178,"Ĵ":179,"ĵ":180,"Ķ":181,"ķ":182,"ĸ":183,"Ĺ":184,"ĺ":185,"Ļ":186,"ļ":187,"Ľ":188,"ľ":189,"Ŀ":190,"ŀ":191,"Ł":192,"ł":193,"Ń":194,"e</w>":195,"d</w>":196,"a</w>":197,"o</w>":198,"n</w>":199,"±</w>":200,"l</w>":201,"m</w>":202,"h</w>":203,"r</w>":204,"i</w>":205,"s</w>":206,"Z</w>":207,"t</w>":208,"f</w>":209,"k</w>":210,"y</w>":211,"b</w>":212,"F</w>":213,"g</w>":214,"7</w>":215,"0</w>":216,"p</w>":217,"L</w>":218,"H</w>":219,"¡</w>":220,"Ī</w>":221,"1</w>":222,"Ģ</w>":223,"c</w>":224,"ĩ</w>":225,"6</w>":226,"A</w>":227,"z</w>":228,"u</w>":229,"S</w>":230,"2</w>":231,"v</w>":232,"4</w>":233,"M</w>":234,"T</w>":235,"8</w>":236,"I</w>":237,"
N</w>":238,"C</w>":239,"5</w>":240,"¹</w>":241,"9</w>":242,"3</w>":243,"ī</w>":244,"P</w>":245,"E</w>":246,"»</w>":247,"V</w>":248,"İ</w>":249,"w</w>":250,"J</w>":251,"ł</w>":252,".</w>":253,"K</w>":254,"D</w>":255,"Ķ</w>":256,"¸</w>":257,"B</w>":258,"©</w>":259,"º</w>":260,"µ</w>":261,"Ĥ</w>":262,"X</w>":263,"R</w>":264,"O</w>":265,"«</w>":266,"Ļ</w>":267,"U</w>":268,"x</w>":269,"[</w>":270,"¿</w>":271,"³</w>":272,"ģ</w>":273,"W</w>":274,"§</w>":275,"-</w>":276,"ĸ</w>":277,"Ħ</w>":278,",</w>":279,"q</w>":280,"ħ</w>":281,"¨</w>":282,"G</w>":283,"²</w>":284,"ĺ</w>":285,"ª</w>":286,"¯</w>":287,"j</w>":288,"]</w>":289,"ļ</w>":290,"Ŀ</w>":291,"¤</w>":292,"ŀ</w>":293,"½</w>":294,"IJ</w>":295,"'</w>":296,"Ń</w>":297,"°</w>":298,"ľ</w>":299,"></w>":300,"¶</w>":301,"į</w>":302,"¦</w>":303,"|</w>":304,"¼</w>":305,"¢</w>":306,"´</w>":307,"Ĩ</w>":308,"Q</w>":309,"Y</w>":310,"Ľ</w>":311,"ĵ</w>":312,"ij</w>":313,"ķ</w>":314,"Ĭ</w>":315,"¾</w>":316,";</w>":317,"(</w>":318,"¬</w>":319,"@</w>":320,"ĭ</w>":321,"Ĺ</w>":322,"£</w>":323,"Į</w>":324,"#</w>":325,"·</w>":326,"*</w>":327,"Ĵ</w>":328,"®</w>":329,")</w>":330,"^</w>":331,"ı</w>":332,"Ġ</w>":333,"_</w>":334,"Ł</w>":335,"}</w>":336,"ĥ</w>":337,"\\</w>":338,"¥</w>":339,"<</w>":340,"+</w>":341,"=</w>":342,"~</w>":343,"\"</w>":344,"!</w>":345,"?</w>":346,"`</w>":347,"$</w>":348,"Ċ</w>":349,"/</w>":350,"%</w>":351,"&</w>":352,":</w>":353,"Ġt":354,"Ġth":355,"Ġa":356,"Ġthe</w>":357,"in":358,"Ġo":359,"Ġ,</w>":360,"Ġs":361,"ed</w>":362,"Ġw":363,"er":364,"Ġ.</w>":365,"Ġi":366,"re":367,"Ġc":368,"nd</w>":369,"Ġf":370,"Ġb":371,"at":372,"Ġof</w>":373,"er</w>":374,"en":375,"ar":376,"or":377,"it":378,"Ġp":379,"Ġh":380,"Ġand</w>":381,"on":382,"ing</w>":383,"an":384,"ro":385,"Ġm":386,"Ġd":387,"es</w>":388,"Ġin</w>":389,"on</w>":390,"Ġto</w>":391,"ou":392,"is":393,"Ġa</w>":394,"ic":395,"ĠT":396,"al":397,"Ġl":398,"Ġ=</w>":399,"Ġre":400,"Ġ\"</w>":401,"es":402,"ĠS":403,"as</w>":404,"al</w>":405,"il":406,"el":407,"ion</w>":408,"ĠA":409,"ĠC":410,"Ġ1"
:411,"ĠĊ</w>":412,"ur":413,"ĠTh":414,"Ġn":415,"as":416,"Ġ@":417,"ec":418,"om":419,"ac":420,"Ġe":421,"Ġwas</w>":422,"ĠM":423,"or</w>":424,"an</w>":425,"am":426,"en</w>":427,"ol":428,"Ġin":429,"Ġg":430,"Ġ'</w>":431,"ĠB":432,"ly</w>":433,"at</w>":434,"iv":435,"ts</w>":436,"ĠThe</w>":437,"us":438,"-@</w>":439,"Ġ@-@</w>":440,"is</w>":441,"ĠI":442,"Ġwh":443,"ig":444,"ĠH":445,"Ġst":446,"os":447,"un":448,"th":449,"ĠP":450,"Ġwit":451,"Ġthat</w>":452,"ir":453,"Ġas</w>":454,"em":455,"Ġon</w>":456,"ra":457,"Ġfor</w>":458,"ĠR":459,"et":460,"ow":461,"Ġ2":462,"id":463,"ĠD":464,"le</w>":465,"Ġwith</w>":466,"la":467,"ent</w>":468,"im":469,"ĠF":470,"ea":471,"ion":472,"Ġby</w>":473,"Ġ)</w>":474,"Ġ(</w>":475,"Ġal":476,"Ġcon":477,"ent":478,"ĠW":479,"Ġis</w>":480,"ere</w>":481,"ĠG":482,"ĠN":483,"ĠL":484,"Ġha":485,"ers</w>":486,"ri":487,"th</w>":488,"ted</w>":489,"uc":490,"ĠJ":491,"��19":492,"ev":493,"ul":494,"Ġv":495,"ce</w>":496,"ation</w>":497,"rom</w>":498,"Ġbe":499,"ĠE":500,"in</w>":501,"Ġthe":502,"Ġfrom</w>":503,"ĠO":504,"ter</w>":505,"Ġpro":506,"Ġar":507,"ad":508,"Ġcom":509,"ic</w>":510,"ag":511,"Ġhis</w>":512,"Ġsh":513,"Ġat</w>":514,"ov":515,"ies</w>":516,"oo":517,"pp":518,"st":519,"ch":520,"Ġr":521,"Ġ20":522,"ay</w>":523,"if":524,"Ġwere</w>":525,"Ġch":526,"ut</w>":527,"st</w>":528,"ut":529,"ds</w>":530,"op":531,"um":532,"Ġit</w>":533,"oc":534,"ter":535,"le":536,"igh":537,"ud":538,"Ġex":539,"ions</w>":540,"ate</w>":541,"ity</w>":542,"ated</w>":543,"Ġun":544,"ep":545,"qu":546,"Ġno":547,"ĠK":548,"ive</w>":549,"ist":550,"Ġon":551,"ame</w>":552,"oun":553,"ir</w>":554,"ab":555,"Ġâ":556,"ing":557,"Ġhe</w>":558,"ld</w>":559,"ug":560,"ich</w>":561,"Ġan</w>":562,"ed":563,"Ġk":564,"ĠâĢ":565,"Ġhad</w>":566,"ve</w>":567,"ain":568,"Ġse":569,"tion</w>":570,"ore</w>":571,"res":572,"Ġwhich</w>":573,"ĠIn</w>":574,"od":575,"ther</w>":576,"ak":577,"Ġsp":578,"ar</w>":579,"Ġy":580,"ĠCh":581,"ong</w>":582,"Ġac":583,"est</w>":584,"ĠU":585,"ap":586,"ff":587,"ally</w>":588,"rit":589,"ĠSt":590,"ub":591,"ge
</w>":592,"ber</w>":593,"et</w>":594,"Ġbe</w>":595,"ear":596,"Ġrec":597,"ers":598,"Ġfir":599,"ot":600,"Ġare</w>":601,"Ġan":602,"ch</w>":603,"og":604,"ia</w>":605,"est":606,"ine</w>":607,"ill":608,"and":609,"el</w>":610,"ary</w>":611,"ew</w>":612,"id</w>":613,"Ġfor":614,"Ġ;</w>":615,"Ġcomp":616,"ĠV":617,"Ġinc":618,"tr":619,"Ġ200":620,"Ġtheir</w>":621,"us</w>":622,"Ġbut</w>":623,"ran":624,"ical</w>":625,"Ġfirst</w>":626,"Ġde":627,"Ġint":628,"Ġro":629,"so</w>":630,"ĠâĢĵ</w>":631,"Ġnot</w>":632,"ding</w>":633,"fter</w>":634,"ure</w>":635,"Ġpar":636,"Ġ:</w>":637,"ian</w>":638,"Ġtw":639,"ould</w>":640,"Ġalso</w>":641,"Ġits</w>":642,"Ġwor":643,"um</w>":644,"Ġor</w>":645,"ost</w>":646,"00</w>":647,"our":648,"ard</w>":649,"Ġres":650,"mp":651,"ue</w>":652,"Ġab":653,"ish</w>":654,"Ġcont":655,"Ġad":656,"own</w>":657,"all</w>":658,"oug":659,"Ġher</w>":660,"ast</w>":661,"Ġen":662,"ome</w>":663,"all":664,"ded</w>":665,"ow</w>":666,"Ġhave</w>":667,"Ġus":668,"ear</w>":669,"ack</w>":670,"duc":671,"ial</w>":672,"ss":673,"ents</w>":674,"ain</w>":675,"ting</w>":676,"Ġone</w>":677,"ess":678,"Ġhas</w>":679,"ight</w>":680,"av":681,"Ġev":682,"out</w>":683,"ay":684,"ence</w>":685,"Ġbeen</w>":686,"ew":687,"Ġtwo</w>":688,"Ġcl":689,"der</w>":690,"ime</w>":691,"ks</w>":692,"ess</w>":693,"ish":694,".@</w>":695,"Ġ@.@</w>":696,"Ġpla":697,"Ġpl":698,"Ġor":699,"up</w>":700,"ment</w>":701,"uring</w>":702,"oll":703,"ĠIn":704,"Ġthis</w>":705,"Ġbec":706,"Ġcomm":707,"Ġdis":708,"ater</w>":709,"age</w>":710,"Ġapp":711,"ous</w>":712,"ey</w>":713,"il</w>":714,"per":715,"ĠAl":716,"ional</w>":717,"lud":718,"ely</w>":719,"tt":720,"ile</w>":721,"iz":722,"Ġj":723,"Ġwho</w>":724,"Ġag":725,"ib":726,"Ġthey</w>":727,"for":728,"Ġov":729,"ath":730,"eg":731,"Ġsc":732,"ip":733,"Ġ201":734,"Ġ3":735,"Ġper":736,"ory</w>":737,"Ġdes":738,"ide</w>":739,"Ġser":740,"se</w>":741,"ĠHe</w>":742,"land</w>":743,"ations</w>":744,"ric":745,"it</w>":746,"res</w>":747,"ered</w>":748,"Ġpre":749,"ĠSh":750,"ance</w>":751,"ort</w>":752,"ant</w>
":753,",@</w>":754,"Ġ@,@</w>":755,"ell</w>":756,"ĠY":757,"ned</w>":758,"ell":759,"ite</w>":760,"Ġinclud":761,"Ġrep":762,"Ġafter</w>":763,"Ġsuc":764,"ree</w>":765,"any</w>":766,"im</w>":767,"ort":768,"Ġ18":769,"Ġsu":770,"ade</w>":771,"our</w>":772,"ĠUn":773,"ĠIt</w>":774,"ik":775,"ĠMar":776,"ember</w>":777,"Ġ1</w>":778,"een</w>":779,"and</w>":780,"Ġsec":781,"ice</w>":782,"Ġtime</w>":783,"ĠAn":784,"Ġinto</w>":785,"Ġfin":786,"Ġother</w>":787,"Ġatt":788,"ill</w>":789,"ren":790,"ach":791,"ass":792,"eral</w>":793,"ese</w>":794,"sh":795,"als</w>":796,"ition</w>":797,"ough</w>":798,"les</w>":799,"amp":800,"Ġwould</w>":801,"Ġmore</w>":802,"roug":803,"rib":804,"ery</w>":805,"ace</w>":806,"ĠA</w>":807,"Ġplay":808,"ited</w>":809,"ked</w>":810,"ist</w>":811,"ied</w>":812,"Ġ2</w>":813,"ased</w>":814,"ings</w>":815,"ang":816,"am</w>":817,"ip</w>":818,"Ġbo":819,"able</w>":820,"ty</w>":821,"Ġchar":822,"Ġcent":823,"etw":824,"ates</w>":825,"rop":826,"ĠI</w>":827,"und</w>":828,"ĠAm":829,"ces</w>":830,"oin":831,"Ġinter":832,"up":833,"ct":834,"one</w>":835,"Ġtra":836,"ant":837,"ect":838,"Ġall</w>":839,"ef":840,"Ġcons":841,"ubl":842,"ning</w>":843,"ans</w>":844,"Ġfe":845,"ust</w>":846,"Ġ0":847,"Ġrem":848,"ase</w>":849,"ong":850,"Ġwhen</w>":851,"eb":852,"ĠWh":853,"Ġear":854,"ever</w>":855,"Ġover</w>":856,"Ġkn":857,"aus":858,"Ġpos":859,"ad</w>":860,"erm":861,"Ġshe</w>":862,"Ġra":863,"Ġduring</w>":864,"ason</w>":865,"vi":866,"Ġexp":867,"Ġlea":868,"Ġel":869,"Ġ4":870,"Ġonly</w>":871,"ond</w>":872,"Ġdec":873,"Ġacc":874,"Ġoff":875,"iss":876,"Ġfl":877,"ĠEn":878,"ot</w>":879,"ens":880,"ose</w>":881,"ake</w>":882,"om</w>":883,"Ġsev":884,"ach</w>":885,"etween</w>":886,"ern":887,"Ġ3</w>":888,"Ġpr":889,"Ġgro":890,"ruc":891,"Ġdi":892,"Ġ199":893,"ĠAr":894,"Ġgame</w>":895,"Ġhim</w>":896,"ook</w>":897,"Ġup</w>":898,"Ġabout</w>":899,"Ġrel":900,"form":901,"Ġthree</w>":902,"att":903,"ĠCom":904,"Ġsa":905,"ears</w>":906,"Ġ5":907,"ry</w>":908,"Ġimp":909,"Ġmost</w>":910,"fer":911,"Ġpres":912,"Ġfil":913,"Ġbetween
</w>":914,"Ġbeg":915,"ph":916,"ors</w>":917,"Ġthan</w>":918,"Ġrecor":919,"ob":920,"eric":921,"ating</w>":922,"Ġthroug":923,"king</w>":924,"Ġout</w>":925,"Ġnum":926,"ood</w>":927,"ollow":928,"act":929,"uil":930,"Ġcre":931,"olog":932,"ational</w>":933,"Ġproduc":934,"Ġwhile</w>":935,"Ġlater</w>":936,"Ġwrit":937,"ex":938,"Ġstar":939,"Ġspec":940,"ee":941,"ished</w>":942,"Ġreg":943,"ision</w>":944,"outh</w>":945,"Ġrele":946,"Ġass":947,"Ġseason</w>":948,"Ġmade</w>":949,"ily</w>":950,"ru":951,"oy":952,"tur":953,"te</w>":954,"Ġqu":955,"Ġmov":956,"ury</w>":957,"ĠAmeric":958,"ement</w>":959,"cc":960,"ound</w>":961,"Ġlar":962,"Ġform":963,"ect</w>":964,"Ġdef":965,"Ġmus":966,"ĠPar":967,"Ġme":968,"Ġsub":969,"way</w>":970,"op</w>":971,"oh":972,"eld</w>":973,"ie</w>":974,"emp":975,"ames</w>":976,"ern</w>":977,"Ġnor":978,"ived</w>":979,"evel":980,"Ġsuch</w>":981,"ards</w>":982,"Ġind":983,"ike</w>":984,"Ġgen":985,"ert":986,"Ġyear</w>":987,"Ġused</w>":988,"Ġnew</w>":989,"Ġ5</w>":990,"Ġalb":991,"sp":992,"yp":993,"Ġwith":994,"Ġwhere</w>":995,"ics</w>":996,"ĠThis</w>":997,"Ġthem</w>":998,"wn</w>":999}
unet/config.json ADDED
@@ -0,0 +1,62 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_class_name": "UNet2DConditionModel",
3
+ "_diffusers_version": "0.33.1",
4
+ "_name_or_path": "/Users/davidberenstein/.cache/huggingface/hub/models--PrunaAI--tiny-stable-diffusion-pipe-smashed/snapshots/d2b38aca393c0e7a05566b66dc2f264d47bfef65/unet",
5
+ "act_fn": "silu",
6
+ "addition_embed_type": null,
7
+ "addition_embed_type_num_heads": 64,
8
+ "addition_time_embed_dim": null,
9
+ "attention_head_dim": 8,
10
+ "attention_type": "default",
11
+ "block_out_channels": [
12
+ 32,
13
+ 64
14
+ ],
15
+ "center_input_sample": false,
16
+ "class_embed_type": null,
17
+ "class_embeddings_concat": false,
18
+ "conv_in_kernel": 3,
19
+ "conv_out_kernel": 3,
20
+ "cross_attention_dim": 32,
21
+ "cross_attention_norm": null,
22
+ "down_block_types": [
23
+ "DownBlock2D",
24
+ "CrossAttnDownBlock2D"
25
+ ],
26
+ "downsample_padding": 1,
27
+ "dropout": 0.0,
28
+ "dual_cross_attention": false,
29
+ "encoder_hid_dim": null,
30
+ "encoder_hid_dim_type": null,
31
+ "flip_sin_to_cos": true,
32
+ "freq_shift": 0,
33
+ "in_channels": 4,
34
+ "layers_per_block": 2,
35
+ "mid_block_only_cross_attention": null,
36
+ "mid_block_scale_factor": 1,
37
+ "mid_block_type": "UNetMidBlock2DCrossAttn",
38
+ "norm_eps": 1e-05,
39
+ "norm_num_groups": 32,
40
+ "num_attention_heads": null,
41
+ "num_class_embeds": null,
42
+ "only_cross_attention": false,
43
+ "out_channels": 4,
44
+ "projection_class_embeddings_input_dim": null,
45
+ "resnet_out_scale_factor": 1.0,
46
+ "resnet_skip_time_act": false,
47
+ "resnet_time_scale_shift": "default",
48
+ "reverse_transformer_layers_per_block": null,
49
+ "sample_size": 32,
50
+ "time_cond_proj_dim": null,
51
+ "time_embedding_act_fn": null,
52
+ "time_embedding_dim": null,
53
+ "time_embedding_type": "positional",
54
+ "timestep_post_act": null,
55
+ "transformer_layers_per_block": 1,
56
+ "up_block_types": [
57
+ "CrossAttnUpBlock2D",
58
+ "UpBlock2D"
59
+ ],
60
+ "upcast_attention": false,
61
+ "use_linear_projection": false
62
+ }
unet/diffusion_pytorch_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c69e435ef37a4e0fe3471d2c9488924bdf534cb51c08e9450420784d53336d73
3
+ size 5742160
vae/config.json ADDED
@@ -0,0 +1,32 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_class_name": "AutoencoderKL",
3
+ "_diffusers_version": "0.33.1",
4
+ "_name_or_path": "/Users/davidberenstein/.cache/huggingface/hub/models--PrunaAI--tiny-stable-diffusion-pipe-smashed/snapshots/d2b38aca393c0e7a05566b66dc2f264d47bfef65/vae",
5
+ "act_fn": "silu",
6
+ "block_out_channels": [
7
+ 32,
8
+ 64
9
+ ],
10
+ "down_block_types": [
11
+ "DownEncoderBlock2D",
12
+ "DownEncoderBlock2D"
13
+ ],
14
+ "force_upcast": true,
15
+ "in_channels": 3,
16
+ "latent_channels": 4,
17
+ "latents_mean": null,
18
+ "latents_std": null,
19
+ "layers_per_block": 1,
20
+ "mid_block_add_attention": true,
21
+ "norm_num_groups": 32,
22
+ "out_channels": 3,
23
+ "sample_size": 32,
24
+ "scaling_factor": 0.18215,
25
+ "shift_factor": null,
26
+ "up_block_types": [
27
+ "UpDecoderBlock2D",
28
+ "UpDecoderBlock2D"
29
+ ],
30
+ "use_post_quant_conv": true,
31
+ "use_quant_conv": true
32
+ }
vae/diffusion_pytorch_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7999b516094ac4239121d9f62a37e6be99620e7016220011bb99cf8b1a391aad
3
+ size 2646532