hf-transformers-bot committed on
Commit
007838c
·
1 Parent(s): ecc9c00

Upload tiny models for FalconForSequenceClassification

Browse files
Files changed (5) hide show
  1. config.json +34 -0
  2. model.safetensors +3 -0
  3. special_tokens_map.json +22 -0
  4. tokenizer.json +2006 -0
  5. tokenizer_config.json +122 -0
config.json ADDED
@@ -0,0 +1,34 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "alibi": false,
3
+ "architectures": [
4
+ "FalconForSequenceClassification"
5
+ ],
6
+ "attention_dropout": 0.0,
7
+ "attention_probs_dropout_prob": 0.1,
8
+ "bias": false,
9
+ "bos_token_id": 11,
10
+ "eos_token_id": 11,
11
+ "hidden_act": "gelu",
12
+ "hidden_dropout": 0.0,
13
+ "hidden_dropout_prob": 0.1,
14
+ "hidden_size": 32,
15
+ "initializer_range": 0.02,
16
+ "intermediate_size": 37,
17
+ "layer_norm_epsilon": 1e-05,
18
+ "max_position_embeddings": 512,
19
+ "model_type": "falcon",
20
+ "multi_query": true,
21
+ "new_decoder_architecture": true,
22
+ "num_attention_heads": 4,
23
+ "num_hidden_layers": 2,
24
+ "num_kv_heads": 4,
25
+ "pad_token_id": 1,
26
+ "parallel_attn": true,
27
+ "rope_scaling": null,
28
+ "rope_theta": 10000.0,
29
+ "torch_dtype": "float32",
30
+ "transformers_version": "4.36.0.dev0",
31
+ "type_vocab_size": 16,
32
+ "use_cache": true,
33
+ "vocab_size": 1024
34
+ }
model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d40e84bfe1389e41dbc844969ea97726b6fee44f990d24aa76122a1f69a3a25a
3
+ size 232856
special_tokens_map.json ADDED
@@ -0,0 +1,22 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "additional_special_tokens": [
3
+ ">>TITLE<<",
4
+ ">>ABSTRACT<<",
5
+ ">>INTRODUCTION<<",
6
+ ">>SUMMARY<<",
7
+ ">>COMMENT<<",
8
+ ">>ANSWER<<",
9
+ ">>QUESTION<<",
10
+ ">>DOMAIN<<",
11
+ ">>PREFIX<<",
12
+ ">>SUFFIX<<",
13
+ ">>MIDDLE<<"
14
+ ],
15
+ "eos_token": {
16
+ "content": "<|endoftext|>",
17
+ "lstrip": false,
18
+ "normalized": false,
19
+ "rstrip": false,
20
+ "single_word": false
21
+ }
22
+ }
tokenizer.json ADDED
@@ -0,0 +1,2006 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "version": "1.0",
3
+ "truncation": null,
4
+ "padding": null,
5
+ "added_tokens": [
6
+ {
7
+ "id": 0,
8
+ "content": ">>TITLE<<",
9
+ "single_word": false,
10
+ "lstrip": false,
11
+ "rstrip": false,
12
+ "normalized": false,
13
+ "special": true
14
+ },
15
+ {
16
+ "id": 1,
17
+ "content": ">>ABSTRACT<<",
18
+ "single_word": false,
19
+ "lstrip": false,
20
+ "rstrip": false,
21
+ "normalized": false,
22
+ "special": true
23
+ },
24
+ {
25
+ "id": 2,
26
+ "content": ">>INTRODUCTION<<",
27
+ "single_word": false,
28
+ "lstrip": false,
29
+ "rstrip": false,
30
+ "normalized": false,
31
+ "special": true
32
+ },
33
+ {
34
+ "id": 3,
35
+ "content": ">>SUMMARY<<",
36
+ "single_word": false,
37
+ "lstrip": false,
38
+ "rstrip": false,
39
+ "normalized": false,
40
+ "special": true
41
+ },
42
+ {
43
+ "id": 4,
44
+ "content": ">>COMMENT<<",
45
+ "single_word": false,
46
+ "lstrip": false,
47
+ "rstrip": false,
48
+ "normalized": false,
49
+ "special": true
50
+ },
51
+ {
52
+ "id": 5,
53
+ "content": ">>ANSWER<<",
54
+ "single_word": false,
55
+ "lstrip": false,
56
+ "rstrip": false,
57
+ "normalized": false,
58
+ "special": true
59
+ },
60
+ {
61
+ "id": 6,
62
+ "content": ">>QUESTION<<",
63
+ "single_word": false,
64
+ "lstrip": false,
65
+ "rstrip": false,
66
+ "normalized": false,
67
+ "special": true
68
+ },
69
+ {
70
+ "id": 7,
71
+ "content": ">>DOMAIN<<",
72
+ "single_word": false,
73
+ "lstrip": false,
74
+ "rstrip": false,
75
+ "normalized": false,
76
+ "special": true
77
+ },
78
+ {
79
+ "id": 8,
80
+ "content": ">>PREFIX<<",
81
+ "single_word": false,
82
+ "lstrip": false,
83
+ "rstrip": false,
84
+ "normalized": false,
85
+ "special": true
86
+ },
87
+ {
88
+ "id": 9,
89
+ "content": ">>SUFFIX<<",
90
+ "single_word": false,
91
+ "lstrip": false,
92
+ "rstrip": false,
93
+ "normalized": false,
94
+ "special": true
95
+ },
96
+ {
97
+ "id": 10,
98
+ "content": ">>MIDDLE<<",
99
+ "single_word": false,
100
+ "lstrip": false,
101
+ "rstrip": false,
102
+ "normalized": false,
103
+ "special": true
104
+ },
105
+ {
106
+ "id": 11,
107
+ "content": "<|endoftext|>",
108
+ "single_word": false,
109
+ "lstrip": false,
110
+ "rstrip": false,
111
+ "normalized": false,
112
+ "special": true
113
+ }
114
+ ],
115
+ "normalizer": null,
116
+ "pre_tokenizer": {
117
+ "type": "Sequence",
118
+ "pretokenizers": [
119
+ {
120
+ "type": "Punctuation",
121
+ "behavior": "Contiguous"
122
+ },
123
+ {
124
+ "type": "ByteLevel",
125
+ "add_prefix_space": false,
126
+ "trim_offsets": true,
127
+ "use_regex": true
128
+ },
129
+ {
130
+ "type": "Digits",
131
+ "individual_digits": false
132
+ },
133
+ {
134
+ "type": "Split",
135
+ "pattern": {
136
+ "Regex": "[0-9][0-9][0-9]"
137
+ },
138
+ "behavior": "Isolated",
139
+ "invert": false
140
+ }
141
+ ]
142
+ },
143
+ "post_processor": null,
144
+ "decoder": {
145
+ "type": "ByteLevel",
146
+ "add_prefix_space": true,
147
+ "trim_offsets": true,
148
+ "use_regex": true
149
+ },
150
+ "model": {
151
+ "type": "BPE",
152
+ "dropout": null,
153
+ "unk_token": null,
154
+ "continuing_subword_prefix": null,
155
+ "end_of_word_suffix": null,
156
+ "fuse_unk": false,
157
+ "byte_fallback": false,
158
+ "vocab": {
159
+ ">>TITLE<<": 0,
160
+ ">>ABSTRACT<<": 1,
161
+ ">>INTRODUCTION<<": 2,
162
+ ">>SUMMARY<<": 3,
163
+ ">>COMMENT<<": 4,
164
+ ">>ANSWER<<": 5,
165
+ ">>QUESTION<<": 6,
166
+ ">>DOMAIN<<": 7,
167
+ ">>PREFIX<<": 8,
168
+ ">>SUFFIX<<": 9,
169
+ ">>MIDDLE<<": 10,
170
+ "<|endoftext|>": 11,
171
+ "!": 12,
172
+ "\"": 13,
173
+ "#": 14,
174
+ "$": 15,
175
+ "%": 16,
176
+ "&": 17,
177
+ "'": 18,
178
+ "(": 19,
179
+ ")": 20,
180
+ "*": 21,
181
+ "+": 22,
182
+ ",": 23,
183
+ "-": 24,
184
+ ".": 25,
185
+ "/": 26,
186
+ "0": 27,
187
+ "1": 28,
188
+ "2": 29,
189
+ "3": 30,
190
+ "4": 31,
191
+ "5": 32,
192
+ "6": 33,
193
+ "7": 34,
194
+ "8": 35,
195
+ "9": 36,
196
+ ":": 37,
197
+ ";": 38,
198
+ "<": 39,
199
+ "=": 40,
200
+ ">": 41,
201
+ "?": 42,
202
+ "@": 43,
203
+ "A": 44,
204
+ "B": 45,
205
+ "C": 46,
206
+ "D": 47,
207
+ "E": 48,
208
+ "F": 49,
209
+ "G": 50,
210
+ "H": 51,
211
+ "I": 52,
212
+ "J": 53,
213
+ "K": 54,
214
+ "L": 55,
215
+ "M": 56,
216
+ "N": 57,
217
+ "O": 58,
218
+ "P": 59,
219
+ "Q": 60,
220
+ "R": 61,
221
+ "S": 62,
222
+ "T": 63,
223
+ "U": 64,
224
+ "V": 65,
225
+ "W": 66,
226
+ "X": 67,
227
+ "Y": 68,
228
+ "Z": 69,
229
+ "[": 70,
230
+ "\\": 71,
231
+ "]": 72,
232
+ "^": 73,
233
+ "_": 74,
234
+ "`": 75,
235
+ "a": 76,
236
+ "b": 77,
237
+ "c": 78,
238
+ "d": 79,
239
+ "e": 80,
240
+ "f": 81,
241
+ "g": 82,
242
+ "h": 83,
243
+ "i": 84,
244
+ "j": 85,
245
+ "k": 86,
246
+ "l": 87,
247
+ "m": 88,
248
+ "n": 89,
249
+ "o": 90,
250
+ "p": 91,
251
+ "q": 92,
252
+ "r": 93,
253
+ "s": 94,
254
+ "t": 95,
255
+ "u": 96,
256
+ "v": 97,
257
+ "w": 98,
258
+ "x": 99,
259
+ "y": 100,
260
+ "z": 101,
261
+ "|": 102,
262
+ "}": 103,
263
+ "~": 104,
264
+ "¡": 105,
265
+ "¢": 106,
266
+ "£": 107,
267
+ "¤": 108,
268
+ "¥": 109,
269
+ "¦": 110,
270
+ "§": 111,
271
+ "¨": 112,
272
+ "©": 113,
273
+ "ª": 114,
274
+ "«": 115,
275
+ "¬": 116,
276
+ "®": 117,
277
+ "¯": 118,
278
+ "°": 119,
279
+ "±": 120,
280
+ "²": 121,
281
+ "³": 122,
282
+ "´": 123,
283
+ "µ": 124,
284
+ "¶": 125,
285
+ "·": 126,
286
+ "¸": 127,
287
+ "¹": 128,
288
+ "º": 129,
289
+ "»": 130,
290
+ "¼": 131,
291
+ "½": 132,
292
+ "¾": 133,
293
+ "¿": 134,
294
+ "Â": 135,
295
+ "Ã": 136,
296
+ "Ä": 137,
297
+ "Å": 138,
298
+ "Æ": 139,
299
+ "Ç": 140,
300
+ "È": 141,
301
+ "É": 142,
302
+ "Ê": 143,
303
+ "Ë": 144,
304
+ "Ì": 145,
305
+ "Í": 146,
306
+ "Î": 147,
307
+ "Ï": 148,
308
+ "Ð": 149,
309
+ "Ñ": 150,
310
+ "Ö": 151,
311
+ "×": 152,
312
+ "Ø": 153,
313
+ "Ù": 154,
314
+ "Ü": 155,
315
+ "à": 156,
316
+ "á": 157,
317
+ "â": 158,
318
+ "ã": 159,
319
+ "ä": 160,
320
+ "å": 161,
321
+ "æ": 162,
322
+ "ç": 163,
323
+ "è": 164,
324
+ "é": 165,
325
+ "ë": 166,
326
+ "ì": 167,
327
+ "ï": 168,
328
+ "Ċ": 169,
329
+ "Ġ": 170,
330
+ "Ģ": 171,
331
+ "ģ": 172,
332
+ "Ĥ": 173,
333
+ "ĥ": 174,
334
+ "Ħ": 175,
335
+ "ħ": 176,
336
+ "Ĩ": 177,
337
+ "ĩ": 178,
338
+ "Ī": 179,
339
+ "ī": 180,
340
+ "Ĭ": 181,
341
+ "ĭ": 182,
342
+ "Į": 183,
343
+ "į": 184,
344
+ "İ": 185,
345
+ "ı": 186,
346
+ "IJ": 187,
347
+ "ij": 188,
348
+ "Ĵ": 189,
349
+ "ĵ": 190,
350
+ "Ķ": 191,
351
+ "ķ": 192,
352
+ "ĸ": 193,
353
+ "Ĺ": 194,
354
+ "ĺ": 195,
355
+ "Ļ": 196,
356
+ "ļ": 197,
357
+ "Ľ": 198,
358
+ "ľ": 199,
359
+ "Ŀ": 200,
360
+ "ŀ": 201,
361
+ "Ł": 202,
362
+ "ł": 203,
363
+ "Ń": 204,
364
+ "Ġt": 205,
365
+ "he": 206,
366
+ "Ġa": 207,
367
+ "in": 208,
368
+ "Ġthe": 209,
369
+ "er": 210,
370
+ "on": 211,
371
+ "re": 212,
372
+ "Ġs": 213,
373
+ "ed": 214,
374
+ "Ġo": 215,
375
+ "Ġw": 216,
376
+ "nd": 217,
377
+ "at": 218,
378
+ "or": 219,
379
+ "it": 220,
380
+ "Ġc": 221,
381
+ "en": 222,
382
+ "Ġf": 223,
383
+ "is": 224,
384
+ "es": 225,
385
+ "ar": 226,
386
+ "Ġof": 227,
387
+ "Ġb": 228,
388
+ "an": 229,
389
+ "Ġin": 230,
390
+ "al": 231,
391
+ "ing": 232,
392
+ "Ġp": 233,
393
+ "Ġand": 234,
394
+ "as": 235,
395
+ "Ġto": 236,
396
+ "ro": 237,
397
+ "ic": 238,
398
+ "Ġm": 239,
399
+ "Ġd": 240,
400
+ "Ġh": 241,
401
+ "ion": 242,
402
+ "le": 243,
403
+ "ou": 244,
404
+ "ĠT": 245,
405
+ "Ġre": 246,
406
+ "ĠA": 247,
407
+ "ĠS": 248,
408
+ "ent": 249,
409
+ "il": 250,
410
+ "Ġth": 251,
411
+ "st": 252,
412
+ "ĠC": 253,
413
+ "el": 254,
414
+ "om": 255,
415
+ "Ġl": 256,
416
+ "am": 257,
417
+ "ĠĊ": 258,
418
+ "Ġe": 259,
419
+ "Ġn": 260,
420
+ "ad": 261,
421
+ "ac": 262,
422
+ "Ġwas": 263,
423
+ "ĠM": 264,
424
+ "ur": 265,
425
+ "ĠThe": 266,
426
+ "ec": 267,
427
+ "Ġon": 268,
428
+ "ly": 269,
429
+ "ĠB": 270,
430
+ "ĠI": 271,
431
+ "Ġg": 272,
432
+ "et": 273,
433
+ "ol": 274,
434
+ "id": 275,
435
+ "iv": 276,
436
+ "im": 277,
437
+ "Ġfor": 278,
438
+ "ir": 279,
439
+ "-@": 280,
440
+ "@-@": 281,
441
+ "ig": 282,
442
+ "ot": 283,
443
+ "ter": 284,
444
+ "Ġas": 285,
445
+ "ĠH": 286,
446
+ "us": 287,
447
+ "ow": 288,
448
+ "Ġst": 289,
449
+ "ut": 290,
450
+ "ith": 291,
451
+ "ay": 292,
452
+ "ĠP": 293,
453
+ "ation": 294,
454
+ "ver": 295,
455
+ "Ġbe": 296,
456
+ "her": 297,
457
+ "Ġthat": 298,
458
+ "Ġwith": 299,
459
+ "ĠR": 300,
460
+ "ce": 301,
461
+ "th": 302,
462
+ "ĠD": 303,
463
+ "Ġis": 304,
464
+ "un": 305,
465
+ "em": 306,
466
+ "ĠF": 307,
467
+ "Ġwh": 308,
468
+ "ul": 309,
469
+ "Ġby": 310,
470
+ "Ġal": 311,
471
+ "ch": 312,
472
+ "ĠW": 313,
473
+ "Ġcon": 314,
474
+ "ra": 315,
475
+ "ĠG": 316,
476
+ "os": 317,
477
+ "ĠL": 318,
478
+ "ĠN": 319,
479
+ "Ġat": 320,
480
+ "ers": 321,
481
+ "ct": 322,
482
+ "19": 323,
483
+ "Ġit": 324,
484
+ "rom": 325,
485
+ "and": 326,
486
+ "Ġan": 327,
487
+ "um": 328,
488
+ "est": 329,
489
+ "ĠJ": 330,
490
+ "ag": 331,
491
+ "Ġhe": 332,
492
+ "ist": 333,
493
+ "ain": 334,
494
+ "od": 335,
495
+ "av": 336,
496
+ "ri": 337,
497
+ "ĠE": 338,
498
+ "00": 339,
499
+ "ĠO": 340,
500
+ "Ġfrom": 341,
501
+ "Ġcom": 342,
502
+ "Ġhis": 343,
503
+ "op": 344,
504
+ "Ġpro": 345,
505
+ "res": 346,
506
+ "ies": 347,
507
+ "if": 348,
508
+ "Ġv": 349,
509
+ "ort": 350,
510
+ "ere": 351,
511
+ "ill": 352,
512
+ "ld": 353,
513
+ "Ġde": 354,
514
+ "pp": 355,
515
+ "Ġsu": 356,
516
+ "ore": 357,
517
+ "ĠIn": 358,
518
+ "Ġr": 359,
519
+ "Ġse": 360,
520
+ "Ġwere": 361,
521
+ "ew": 362,
522
+ "ong": 363,
523
+ "igh": 364,
524
+ "ard": 365,
525
+ "ate": 366,
526
+ "all": 367,
527
+ "art": 368,
528
+ "ak": 369,
529
+ "ich": 370,
530
+ "Ġch": 371,
531
+ "Ġor": 372,
532
+ "ab": 373,
533
+ "ant": 374,
534
+ "ud": 375,
535
+ "oc": 376,
536
+ "ber": 377,
537
+ "Ġex": 378,
538
+ "gh": 379,
539
+ "ity": 380,
540
+ "ated": 381,
541
+ "pt": 382,
542
+ "ess": 383,
543
+ "ear": 384,
544
+ "ĠK": 385,
545
+ "Ġpl": 386,
546
+ "ame": 387,
547
+ "qu": 388,
548
+ "ive": 389,
549
+ "rou": 390,
550
+ "Ġare": 391,
551
+ "Ġsh": 392,
552
+ "Ġk": 393,
553
+ "ack": 394,
554
+ "ect": 395,
555
+ "âĢ": 396,
556
+ "ĠU": 397,
557
+ "Ġhad": 398,
558
+ "se": 399,
559
+ "Ġwhich": 400,
560
+ "red": 401,
561
+ "ov": 402,
562
+ "ĠSt": 403,
563
+ "ast": 404,
564
+ "Ġsp": 405,
565
+ "ian": 406,
566
+ "Ġy": 407,
567
+ "ment": 408,
568
+ "Ġle": 409,
569
+ "Ġnot": 410,
570
+ "ge": 411,
571
+ "ord": 412,
572
+ "rit": 413,
573
+ "ip": 414,
574
+ "ine": 415,
575
+ "ell": 416,
576
+ "ally": 417,
577
+ "our": 418,
578
+ "ost": 419,
579
+ "ight": 420,
580
+ "ther": 421,
581
+ "ap": 422,
582
+ "Ġu": 423,
583
+ "ish": 424,
584
+ "ĠCh": 425,
585
+ "oun": 426,
586
+ "ia": 427,
587
+ "ave": 428,
588
+ "ary": 429,
589
+ "ust": 430,
590
+ "og": 431,
591
+ "200": 432,
592
+ "Ġun": 433,
593
+ "ous": 434,
594
+ "irst": 435,
595
+ "ĠV": 436,
596
+ "cc": 437,
597
+ "Ġinc": 438,
598
+ "Ġcomp": 439,
599
+ "ru": 440,
600
+ "ions": 441,
601
+ "20": 442,
602
+ "Ġtheir": 443,
603
+ "Ġbut": 444,
604
+ "ide": 445,
605
+ "ure": 446,
606
+ "so": 447,
607
+ "Ġcont": 448,
608
+ "Ġint": 449,
609
+ "fter": 450,
610
+ "ical": 451,
611
+ "ial": 452,
612
+ "Ġar": 453,
613
+ "Ġfirst": 454,
614
+ "ould": 455,
615
+ "Ġits": 456,
616
+ "hed": 457,
617
+ "âĢĵ": 458,
618
+ "Ġwhe": 459,
619
+ "wo": 460,
620
+ "out": 461,
621
+ "ub": 462,
622
+ "ff": 463,
623
+ "ue": 464,
624
+ "Ġher": 465,
625
+ "own": 466,
626
+ "ok": 467,
627
+ "Ġalso": 468,
628
+ "Ġcl": 469,
629
+ "per": 470,
630
+ "ign": 471,
631
+ "ater": 472,
632
+ "ran": 473,
633
+ "orm": 474,
634
+ "ie": 475,
635
+ "ome": 476,
636
+ "ork": 477,
637
+ "ass": 478,
638
+ "ire": 479,
639
+ "end": 480,
640
+ "Ġres": 481,
641
+ "Ġab": 482,
642
+ "Ġad": 483,
643
+ "Ġus": 484,
644
+ "ry": 485,
645
+ "Ġrec": 486,
646
+ "Ġhave": 487,
647
+ "age": 488,
648
+ "ĠHe": 489,
649
+ "Ġro": 490,
650
+ "mer": 491,
651
+ "Ġone": 492,
652
+ "ond": 493,
653
+ "low": 494,
654
+ "Ġhas": 495,
655
+ "ĠTh": 496,
656
+ "du": 497,
657
+ "18": 498,
658
+ "Ġper": 499,
659
+ "Ġbeen": 500,
660
+ "ime": 501,
661
+ "Ġtwo": 502,
662
+ "ence": 503,
663
+ "land": 504,
664
+ ".@": 505,
665
+ "@.@": 506,
666
+ "ult": 507,
667
+ "ree": 508,
668
+ "ough": 509,
669
+ "ile": 510,
670
+ "Ġwho": 511,
671
+ "ĠAl": 512,
672
+ "Ġsc": 513,
673
+ "uring": 514,
674
+ "pl": 515,
675
+ "ory": 516,
676
+ "ition": 517,
677
+ "ric": 518,
678
+ "ations": 519,
679
+ "Ġdis": 520,
680
+ "Ġthis": 521,
681
+ "Ġbec": 522,
682
+ "Ġapp": 523,
683
+ "iz": 524,
684
+ "ĠIt": 525,
685
+ "are": 526,
686
+ "ach": 527,
687
+ "lud": 528,
688
+ "ade": 529,
689
+ "Ġplay": 530,
690
+ "Ġj": 531,
691
+ "Ġman": 532,
692
+ "act": 533,
693
+ "ely": 534,
694
+ "Ġpart": 535,
695
+ "Ġdes": 536,
696
+ "Ġag": 537,
697
+ "Ġthey": 538,
698
+ "Ġyear": 539,
699
+ "ount": 540,
700
+ "201": 541,
701
+ "Ġover": 542,
702
+ "Ġother": 543,
703
+ "ound": 544,
704
+ "Ġafter": 545,
705
+ "ib": 546,
706
+ "over": 547,
707
+ "Ġser": 548,
708
+ "Ġen": 549,
709
+ "Ġoff": 550,
710
+ "Ġim": 551,
711
+ "ction": 552,
712
+ "ĠY": 553,
713
+ "ke": 554,
714
+ "ite": 555,
715
+ ",@": 556,
716
+ "@,@": 557,
717
+ "te": 558,
718
+ "urn": 559,
719
+ "Ġinclud": 560,
720
+ "ress": 561,
721
+ "ance": 562,
722
+ "ang": 563,
723
+ "Ġatt": 564,
724
+ "ice": 565,
725
+ "ace": 566,
726
+ "ark": 567,
727
+ "Ġout": 568,
728
+ "wn": 569,
729
+ "ph": 570,
730
+ "ember": 571,
731
+ "Ġpre": 572,
732
+ "Ġup": 573,
733
+ "ens": 574,
734
+ "man": 575,
735
+ "Ġev": 576,
736
+ "Ġtime": 577,
737
+ "nder": 578,
738
+ "rough": 579,
739
+ "ced": 580,
740
+ "Ġfin": 581,
741
+ "Ġinto": 582,
742
+ "one": 583,
743
+ "port": 584,
744
+ "round": 585,
745
+ "we": 586,
746
+ "ren": 587,
747
+ "les": 588,
748
+ "int": 589,
749
+ "ĠOn": 590,
750
+ "vel": 591,
751
+ "Ġcomm": 592,
752
+ "Ġshe": 593,
753
+ "ason": 594,
754
+ "amp": 595,
755
+ "Ġte": 596,
756
+ "Ġwould": 597,
757
+ "ward": 598,
758
+ "Ġmore": 599,
759
+ "ied": 600,
760
+ "ose": 601,
761
+ "rib": 602,
762
+ "ĠUn": 603,
763
+ "Ġall": 604,
764
+ "ings": 605,
765
+ "tern": 606,
766
+ "ces": 607,
767
+ "able": 608,
768
+ "Ġwe": 609,
769
+ "ited": 610,
770
+ "ever": 611,
771
+ "ents": 612,
772
+ "Ġhim": 613,
773
+ "ased": 614,
774
+ "ors": 615,
775
+ "oy": 616,
776
+ "ood": 617,
777
+ "Ġcent": 618,
778
+ "ix": 619,
779
+ "ase": 620,
780
+ "ild": 621,
781
+ "ĠAn": 622,
782
+ "Ġwork": 623,
783
+ "ates": 624,
784
+ "ious": 625,
785
+ "ath": 626,
786
+ "Ġpo": 627,
787
+ "rop": 628,
788
+ "old": 629,
789
+ "als": 630,
790
+ "iss": 631,
791
+ "ey": 632,
792
+ "ict": 633,
793
+ "Ġfe": 634,
794
+ "Ġthem": 635,
795
+ "gan": 636,
796
+ "Ġsec": 637,
797
+ "Ġbet": 638,
798
+ "Ġwhen": 639,
799
+ "Ġsong": 640,
800
+ "Ġrem": 641,
801
+ "ep": 642,
802
+ "form": 643,
803
+ "ail": 644,
804
+ "fer": 645,
805
+ "Ġear": 646,
806
+ "ubl": 647,
807
+ "aw": 648,
808
+ "Ġkn": 649,
809
+ "ake": 650,
810
+ "aus": 651,
811
+ "Ġmost": 652,
812
+ "Ġcons": 653,
813
+ "Ġduring": 654,
814
+ "ĠAs": 655,
815
+ "orth": 656,
816
+ "Ġnew": 657,
817
+ "ered": 658,
818
+ "ilm": 659,
819
+ "ved": 660,
820
+ "att": 661,
821
+ "Ġonly": 662,
822
+ "Ġdec": 663,
823
+ "ick": 664,
824
+ "Ġgame": 665,
825
+ "ons": 666,
826
+ "ug": 667,
827
+ "Ġtr": 668,
828
+ "ft": 669,
829
+ "oth": 670,
830
+ "ook": 671,
831
+ "ĠMar": 672,
832
+ "reat": 673,
833
+ "way": 674,
834
+ "Ġcan": 675,
835
+ "ollow": 676,
836
+ "outh": 677,
837
+ "ween": 678,
838
+ "ĠEn": 679,
839
+ "199": 680,
840
+ "ters": 681,
841
+ "Ġrel": 682,
842
+ "ind": 683,
843
+ "Ġabout": 684,
844
+ "Ġseason": 685,
845
+ "Ġagain": 686,
846
+ "ral": 687,
847
+ "Ġthree": 688,
848
+ "ational": 689,
849
+ "Ġunder": 690,
850
+ "ular": 691,
851
+ "Ġme": 692,
852
+ "Ġthan": 693,
853
+ "ĠCom": 694,
854
+ "ĠAr": 695,
855
+ "hip": 696,
856
+ "ob": 697,
857
+ "Ġne": 698,
858
+ "Ġbetween": 699,
859
+ "Ġfl": 700,
860
+ "hn": 701,
861
+ "ve": 702,
862
+ "Ġchar": 703,
863
+ "Ġcol": 704,
864
+ "Ġrecord": 705,
865
+ "iew": 706,
866
+ "ron": 707,
867
+ "fore": 708,
868
+ "Ġthrough": 709,
869
+ "ision": 710,
870
+ "orn": 711,
871
+ "ock": 712,
872
+ "Ġver": 713,
873
+ "Ġlater": 714,
874
+ "Ġnum": 715,
875
+ "Ġend": 716,
876
+ "olog": 717,
877
+ "ames": 718,
878
+ "Ġpos": 719,
879
+ "Ġwrit": 720,
880
+ "Ġprodu": 721,
881
+ "Ġwhile": 722,
882
+ "Ġact": 723,
883
+ "Ġrele": 724,
884
+ "Ġfilm": 725,
885
+ "ished": 726,
886
+ "Ġpr": 727,
887
+ "ans": 728,
888
+ "Ġreg": 729,
889
+ "Ġform": 730,
890
+ "Ġass": 731,
891
+ "ĠSe": 732,
892
+ "ury": 733,
893
+ "ted": 734,
894
+ "ts": 735,
895
+ "Ġmade": 736,
896
+ "Ġsub": 737,
897
+ "Ġpe": 738,
898
+ "10": 739,
899
+ "Ġso": 740,
900
+ "orld": 741,
901
+ "Ġret": 742,
902
+ "ĠNew": 743,
903
+ "Ġspec": 744,
904
+ "Ġacc": 745,
905
+ "Ġqu": 746,
906
+ "Ġwhere": 747,
907
+ "ener": 748,
908
+ "Ġmov": 749,
909
+ "hes": 750,
910
+ "meric": 751,
911
+ "ating": 752,
912
+ "Ġinter": 753,
913
+ "ĠLe": 754,
914
+ "ĠAmeric": 755,
915
+ "Ġra": 756,
916
+ "Ġsome": 757,
917
+ "Ġco": 758,
918
+ "Ġlar": 759,
919
+ "Ġbu": 760,
920
+ "Ġdef": 761,
921
+ "bum": 762,
922
+ "Ġac": 763,
923
+ "Ġmus": 764,
924
+ "Ġfollow": 765,
925
+ "ĠAt": 766,
926
+ "ins": 767,
927
+ "ived": 768,
928
+ "ific": 769,
929
+ "ual": 770,
930
+ "Ġam": 771,
931
+ "Ġsuch": 772,
932
+ "Ġsecond": 773,
933
+ "ike": 774,
934
+ "Ġfour": 775,
935
+ "Ġind": 776,
936
+ "ann": 777,
937
+ "hen": 778,
938
+ "Ġused": 779,
939
+ "ĠRe": 780,
940
+ "ics": 781,
941
+ "lect": 782,
942
+ "Ġday": 783,
943
+ "iel": 784,
944
+ "ily": 785,
945
+ "ĠThis": 786,
946
+ "000": 787,
947
+ "Ġpubl": 788,
948
+ "Ġcall": 789,
949
+ "ĠJo": 790,
950
+ "..": 791,
951
+ "ll": 792,
952
+ "Ġalbum": 793,
953
+ "rans": 794,
954
+ "Ġdo": 795,
955
+ "any": 796,
956
+ "Ġbefore": 797,
957
+ "ros": 798,
958
+ "ĠSh": 799,
959
+ "Ġsy": 800,
960
+ "aid": 801,
961
+ "ĠEng": 802,
962
+ "Ġbeing": 803,
963
+ "uc": 804,
964
+ "Ġep": 805,
965
+ "Ġsupp": 806,
966
+ "Ġthere": 807,
967
+ "Ġyears": 808,
968
+ "ars": 809,
969
+ "owever": 810,
970
+ "Ġent": 811,
971
+ "ife": 812,
972
+ "Ġhigh": 813,
973
+ "Ġfound": 814,
974
+ "ird": 815,
975
+ "Ġno": 816,
976
+ "Ġset": 817,
977
+ "16": 818,
978
+ "ines": 819,
979
+ "iver": 820,
980
+ "io": 821,
981
+ "other": 822,
982
+ "ject": 823,
983
+ "Ġsur": 824,
984
+ "aj": 825,
985
+ "ten": 826,
986
+ "Ġtra": 827,
987
+ "ised": 828,
988
+ "ities": 829,
989
+ "velop": 830,
990
+ "Ġbl": 831,
991
+ "ale": 832,
992
+ "Ġseries": 833,
993
+ "12": 834,
994
+ "Ġloc": 835,
995
+ "Ġnumber": 836,
996
+ "Ġpres": 837,
997
+ "ane": 838,
998
+ "ause": 839,
999
+ "ode": 840,
1000
+ "ek": 841,
1001
+ "ton": 842,
1002
+ "ĠSc": 843,
1003
+ "ier": 844,
1004
+ "ise": 845,
1005
+ "Ġsever": 846,
1006
+ "ince": 847,
1007
+ "Ġboth": 848,
1008
+ "ank": 849,
1009
+ "row": 850,
1010
+ "15": 851,
1011
+ "irect": 852,
1012
+ "son": 853,
1013
+ "Ġthen": 854,
1014
+ "ĠBrit": 855,
1015
+ "iet": 856,
1016
+ "Ġepis": 857,
1017
+ "Ġincluding": 858,
1018
+ "17": 859,
1019
+ "its": 860,
1020
+ "igin": 861,
1021
+ "pr": 862,
1022
+ "Ġagainst": 863,
1023
+ "Ġwell": 864,
1024
+ "Ġbecame": 865,
1025
+ "Ġexp": 866,
1026
+ "Ġknown": 867,
1027
+ "Ġtrans": 868,
1028
+ "Ġcharac": 869,
1029
+ "âĢĶ": 870,
1030
+ "ram": 871,
1031
+ "Ġback": 872,
1032
+ "Ġadd": 873,
1033
+ "Ġpop": 874,
1034
+ "Ġgo": 875,
1035
+ "urch": 876,
1036
+ "Ġdesc": 877,
1037
+ "Ġsing": 878,
1038
+ "ield": 879,
1039
+ "Ġperform": 880,
1040
+ "ained": 881,
1041
+ "Ġrece": 882,
1042
+ "ident": 883,
1043
+ "Ġem": 884,
1044
+ "ert": 885,
1045
+ "ures": 886,
1046
+ "Ġinv": 887,
1047
+ "198": 888,
1048
+ "Ġdep": 889,
1049
+ "air": 890,
1050
+ "ern": 891,
1051
+ "ather": 892,
1052
+ "ful": 893,
1053
+ "ĠZ": 894,
1054
+ "Ġmon": 895,
1055
+ "Ġmany": 896,
1056
+ "Ġmain": 897,
1057
+ "Ġstud": 898,
1058
+ "Ġlong": 899,
1059
+ "inn": 900,
1060
+ "though": 901,
1061
+ "up": 902,
1062
+ "ool": 903,
1063
+ "ĠUnited": 904,
1064
+ "led": 905,
1065
+ "ement": 906,
1066
+ "ower": 907,
1067
+ "ĠJohn": 908,
1068
+ "Ġop": 909,
1069
+ "ined": 910,
1070
+ "Ġmet": 911,
1071
+ "ober": 912,
1072
+ "ley": 913,
1073
+ "Ġcentury": 914,
1074
+ "Ġteam": 915,
1075
+ "Ġest": 916,
1076
+ "ĠAfter": 917,
1077
+ "yl": 918,
1078
+ "Ġmin": 919,
1079
+ "uch": 920,
1080
+ "ute": 921,
1081
+ "Ġdevelop": 922,
1082
+ "ĠShe": 923,
1083
+ "iam": 924,
1084
+ "Ġshow": 925,
1085
+ "elf": 926,
1086
+ "Ġrep": 927,
1087
+ "Ġconc": 928,
1088
+ "ative": 929,
1089
+ "Ġcre": 930,
1090
+ "overn": 931,
1091
+ "ared": 932,
1092
+ "194": 933,
1093
+ "Ġorigin": 934,
1094
+ "Ġsm": 935,
1095
+ "ivers": 936,
1096
+ "az": 937,
1097
+ "Ġlead": 938,
1098
+ "Ġseveral": 939,
1099
+ "ah": 940,
1100
+ "Ġob": 941,
1101
+ "Ġrev": 942,
1102
+ "Ġmill": 943,
1103
+ "erm": 944,
1104
+ "ually": 945,
1105
+ "oot": 946,
1106
+ "Ġbegan": 947,
1107
+ "196": 948,
1108
+ "ired": 949,
1109
+ "Ġdif": 950,
1110
+ "Ġcontin": 951,
1111
+ "Ġsign": 952,
1112
+ "ik": 953,
1113
+ "ĠInd": 954,
1114
+ "ments": 955,
1115
+ "ized": 956,
1116
+ "197": 957,
1117
+ "Ġdirect": 958,
1118
+ "au": 959,
1119
+ "Ġext": 960,
1120
+ "ross": 961,
1121
+ "emb": 962,
1122
+ "der": 963,
1123
+ "Ġpol": 964,
1124
+ "Ġmay": 965,
1125
+ "apt": 966,
1126
+ "els": 967,
1127
+ "ĠWh": 968,
1128
+ "Ġcomple": 969,
1129
+ "Ġart": 970,
1130
+ "ĠBr": 971,
1131
+ "ĠIs": 972,
1132
+ "une": 973,
1133
+ "til": 974,
1134
+ "Ġcrit": 975,
1135
+ "Ġhist": 976,
1136
+ "Ġearly": 977,
1137
+ "Ġcould": 978,
1138
+ "ĠCon": 979,
1139
+ "Ġdid": 980,
1140
+ "Ġbel": 981,
1141
+ "Ġcalled": 982,
1142
+ "ued": 983,
1143
+ "Ġnear": 984,
1144
+ "Ġepisode": 985,
1145
+ "yp": 986,
1146
+ "Ġdescrib": 987,
1147
+ "imes": 988,
1148
+ "Ġbro": 989,
1149
+ "roup": 990,
1150
+ "ople": 991,
1151
+ "Ġdown": 992,
1152
+ "Ġrun": 993,
1153
+ "13": 994,
1154
+ "aking": 995,
1155
+ "Ġdisc": 996,
1156
+ "Ġalong": 997,
1157
+ "ccess": 998,
1158
+ "ĠMay": 999,
1159
+ "Ġfeat": 1000,
1160
+ "Ġinst": 1001,
1161
+ "ĠAmerican": 1002,
1162
+ "Ġsaid": 1003,
1163
+ "Ġdist": 1004,
1164
+ "Ġinf": 1005,
1165
+ "Ġimp": 1006,
1166
+ "ink": 1007,
1167
+ "Ġins": 1008,
1168
+ "ty": 1009,
1169
+ "Ġthese": 1010,
1170
+ "Ġmil": 1011,
1171
+ "ven": 1012,
1172
+ "ĠGer": 1013,
1173
+ "gest": 1014,
1174
+ "ium": 1015,
1175
+ "enn": 1016,
1176
+ "ĠBl": 1017,
1177
+ "ĠAust": 1018,
1178
+ "Ġresp": 1019,
1179
+ "ull": 1020,
1180
+ "ruct": 1021,
1181
+ "ured": 1022,
1182
+ "Ġthough": 1023
1183
+ },
1184
+ "merges": [
1185
+ "Ġ t",
1186
+ "h e",
1187
+ "Ġ a",
1188
+ "i n",
1189
+ "Ġt he",
1190
+ "e r",
1191
+ "o n",
1192
+ "r e",
1193
+ "Ġ s",
1194
+ "e d",
1195
+ "Ġ o",
1196
+ "Ġ w",
1197
+ "n d",
1198
+ "a t",
1199
+ "o r",
1200
+ "i t",
1201
+ "Ġ c",
1202
+ "e n",
1203
+ "Ġ f",
1204
+ "i s",
1205
+ "e s",
1206
+ "a r",
1207
+ "Ġo f",
1208
+ "Ġ b",
1209
+ "a n",
1210
+ "Ġ in",
1211
+ "a l",
1212
+ "in g",
1213
+ "Ġ p",
1214
+ "Ġa nd",
1215
+ "a s",
1216
+ "Ġt o",
1217
+ "r o",
1218
+ "i c",
1219
+ "Ġ m",
1220
+ "Ġ d",
1221
+ "Ġ h",
1222
+ "i on",
1223
+ "l e",
1224
+ "o u",
1225
+ "Ġ T",
1226
+ "Ġ re",
1227
+ "Ġ A",
1228
+ "Ġ S",
1229
+ "en t",
1230
+ "i l",
1231
+ "Ġt h",
1232
+ "s t",
1233
+ "Ġ C",
1234
+ "e l",
1235
+ "o m",
1236
+ "Ġ l",
1237
+ "a m",
1238
+ "Ġ Ċ",
1239
+ "Ġ e",
1240
+ "Ġ n",
1241
+ "a d",
1242
+ "a c",
1243
+ "Ġw as",
1244
+ "Ġ M",
1245
+ "u r",
1246
+ "ĠT he",
1247
+ "e c",
1248
+ "Ġ on",
1249
+ "l y",
1250
+ "Ġ B",
1251
+ "Ġ I",
1252
+ "Ġ g",
1253
+ "e t",
1254
+ "o l",
1255
+ "i d",
1256
+ "i v",
1257
+ "i m",
1258
+ "Ġf or",
1259
+ "i r",
1260
+ "- @",
1261
+ "@ -@",
1262
+ "i g",
1263
+ "o t",
1264
+ "t er",
1265
+ "Ġa s",
1266
+ "Ġ H",
1267
+ "u s",
1268
+ "o w",
1269
+ "Ġs t",
1270
+ "u t",
1271
+ "it h",
1272
+ "a y",
1273
+ "Ġ P",
1274
+ "at ion",
1275
+ "v er",
1276
+ "Ġb e",
1277
+ "he r",
1278
+ "Ġth at",
1279
+ "Ġw ith",
1280
+ "Ġ R",
1281
+ "c e",
1282
+ "t h",
1283
+ "Ġ D",
1284
+ "Ġ is",
1285
+ "u n",
1286
+ "e m",
1287
+ "Ġ F",
1288
+ "Ġw h",
1289
+ "u l",
1290
+ "Ġb y",
1291
+ "Ġa l",
1292
+ "c h",
1293
+ "Ġ W",
1294
+ "Ġc on",
1295
+ "r a",
1296
+ "Ġ G",
1297
+ "o s",
1298
+ "Ġ L",
1299
+ "Ġ N",
1300
+ "Ġa t",
1301
+ "er s",
1302
+ "c t",
1303
+ "1 9",
1304
+ "Ġ it",
1305
+ "ro m",
1306
+ "a nd",
1307
+ "Ġa n",
1308
+ "u m",
1309
+ "es t",
1310
+ "Ġ J",
1311
+ "a g",
1312
+ "Ġ he",
1313
+ "is t",
1314
+ "a in",
1315
+ "o d",
1316
+ "a v",
1317
+ "r i",
1318
+ "Ġ E",
1319
+ "0 0",
1320
+ "Ġ O",
1321
+ "Ġf rom",
1322
+ "Ġc om",
1323
+ "Ġh is",
1324
+ "o p",
1325
+ "Ġp ro",
1326
+ "re s",
1327
+ "i es",
1328
+ "i f",
1329
+ "Ġ v",
1330
+ "or t",
1331
+ "er e",
1332
+ "il l",
1333
+ "l d",
1334
+ "Ġd e",
1335
+ "p p",
1336
+ "Ġs u",
1337
+ "o re",
1338
+ "ĠI n",
1339
+ "Ġ r",
1340
+ "Ġs e",
1341
+ "Ġw ere",
1342
+ "e w",
1343
+ "on g",
1344
+ "ig h",
1345
+ "ar d",
1346
+ "at e",
1347
+ "al l",
1348
+ "ar t",
1349
+ "a k",
1350
+ "ic h",
1351
+ "Ġc h",
1352
+ "Ġo r",
1353
+ "a b",
1354
+ "an t",
1355
+ "u d",
1356
+ "o c",
1357
+ "b er",
1358
+ "Ġe x",
1359
+ "g h",
1360
+ "it y",
1361
+ "at ed",
1362
+ "p t",
1363
+ "es s",
1364
+ "e ar",
1365
+ "Ġ K",
1366
+ "Ġp l",
1367
+ "am e",
1368
+ "q u",
1369
+ "iv e",
1370
+ "ro u",
1371
+ "Ġa re",
1372
+ "Ġs h",
1373
+ "Ġ k",
1374
+ "ac k",
1375
+ "ec t",
1376
+ "â Ģ",
1377
+ "Ġ U",
1378
+ "Ġh ad",
1379
+ "s e",
1380
+ "Ġwh ich",
1381
+ "re d",
1382
+ "o v",
1383
+ "ĠS t",
1384
+ "as t",
1385
+ "Ġs p",
1386
+ "i an",
1387
+ "Ġ y",
1388
+ "m ent",
1389
+ "Ġ le",
1390
+ "Ġn ot",
1391
+ "g e",
1392
+ "or d",
1393
+ "r it",
1394
+ "i p",
1395
+ "in e",
1396
+ "el l",
1397
+ "al ly",
1398
+ "ou r",
1399
+ "o st",
1400
+ "igh t",
1401
+ "t her",
1402
+ "a p",
1403
+ "Ġ u",
1404
+ "is h",
1405
+ "ĠC h",
1406
+ "ou n",
1407
+ "i a",
1408
+ "av e",
1409
+ "ar y",
1410
+ "u st",
1411
+ "o g",
1412
+ "2 00",
1413
+ "Ġ un",
1414
+ "ou s",
1415
+ "ir st",
1416
+ "Ġ V",
1417
+ "c c",
1418
+ "Ġin c",
1419
+ "Ġcom p",
1420
+ "r u",
1421
+ "ion s",
1422
+ "2 0",
1423
+ "Ġthe ir",
1424
+ "Ġb ut",
1425
+ "id e",
1426
+ "u re",
1427
+ "s o",
1428
+ "Ġcon t",
1429
+ "Ġin t",
1430
+ "f ter",
1431
+ "ic al",
1432
+ "i al",
1433
+ "Ġa r",
1434
+ "Ġf irst",
1435
+ "ou ld",
1436
+ "Ġit s",
1437
+ "he d",
1438
+ "âĢ ĵ",
1439
+ "Ġw he",
1440
+ "w o",
1441
+ "ou t",
1442
+ "u b",
1443
+ "f f",
1444
+ "u e",
1445
+ "Ġ her",
1446
+ "ow n",
1447
+ "o k",
1448
+ "Ġal so",
1449
+ "Ġc l",
1450
+ "p er",
1451
+ "ig n",
1452
+ "at er",
1453
+ "r an",
1454
+ "or m",
1455
+ "i e",
1456
+ "om e",
1457
+ "or k",
1458
+ "as s",
1459
+ "i re",
1460
+ "e nd",
1461
+ "Ġre s",
1462
+ "Ġa b",
1463
+ "Ġa d",
1464
+ "Ġ us",
1465
+ "r y",
1466
+ "Ġre c",
1467
+ "Ġh ave",
1468
+ "ag e",
1469
+ "ĠH e",
1470
+ "Ġ ro",
1471
+ "m er",
1472
+ "Ġon e",
1473
+ "on d",
1474
+ "l ow",
1475
+ "Ġh as",
1476
+ "ĠT h",
1477
+ "d u",
1478
+ "1 8",
1479
+ "Ġp er",
1480
+ "Ġbe en",
1481
+ "im e",
1482
+ "Ġt wo",
1483
+ "en ce",
1484
+ "l and",
1485
+ ". @",
1486
+ "@ .@",
1487
+ "ul t",
1488
+ "re e",
1489
+ "ou gh",
1490
+ "i le",
1491
+ "Ġwh o",
1492
+ "ĠA l",
1493
+ "Ġs c",
1494
+ "ur ing",
1495
+ "p l",
1496
+ "or y",
1497
+ "it ion",
1498
+ "r ic",
1499
+ "ation s",
1500
+ "Ġd is",
1501
+ "Ġth is",
1502
+ "Ġb ec",
1503
+ "Ġa pp",
1504
+ "i z",
1505
+ "ĠI t",
1506
+ "a re",
1507
+ "ac h",
1508
+ "l ud",
1509
+ "ad e",
1510
+ "Ġpl ay",
1511
+ "Ġ j",
1512
+ "Ġm an",
1513
+ "ac t",
1514
+ "el y",
1515
+ "Ġp art",
1516
+ "Ġd es",
1517
+ "Ġa g",
1518
+ "Ġthe y",
1519
+ "Ġy ear",
1520
+ "oun t",
1521
+ "20 1",
1522
+ "Ġo ver",
1523
+ "Ġo ther",
1524
+ "ou nd",
1525
+ "Ġa fter",
1526
+ "i b",
1527
+ "o ver",
1528
+ "Ġs er",
1529
+ "Ġ en",
1530
+ "Ġof f",
1531
+ "Ġ im",
1532
+ "ct ion",
1533
+ "Ġ Y",
1534
+ "k e",
1535
+ "it e",
1536
+ ", @",
1537
+ "@ ,@",
1538
+ "t e",
1539
+ "ur n",
1540
+ "Ġinc lud",
1541
+ "res s",
1542
+ "an ce",
1543
+ "an g",
1544
+ "Ġat t",
1545
+ "ic e",
1546
+ "ac e",
1547
+ "ar k",
1548
+ "Ġo ut",
1549
+ "w n",
1550
+ "p h",
1551
+ "em ber",
1552
+ "Ġp re",
1553
+ "Ġu p",
1554
+ "en s",
1555
+ "m an",
1556
+ "Ġe v",
1557
+ "Ġt ime",
1558
+ "nd er",
1559
+ "rou gh",
1560
+ "c ed",
1561
+ "Ġf in",
1562
+ "Ġint o",
1563
+ "on e",
1564
+ "p ort",
1565
+ "rou nd",
1566
+ "w e",
1567
+ "re n",
1568
+ "l es",
1569
+ "in t",
1570
+ "ĠO n",
1571
+ "v el",
1572
+ "Ġcom m",
1573
+ "Ġs he",
1574
+ "as on",
1575
+ "am p",
1576
+ "Ġt e",
1577
+ "Ġw ould",
1578
+ "w ard",
1579
+ "Ġm ore",
1580
+ "i ed",
1581
+ "os e",
1582
+ "ri b",
1583
+ "ĠU n",
1584
+ "Ġal l",
1585
+ "ing s",
1586
+ "ter n",
1587
+ "c es",
1588
+ "ab le",
1589
+ "Ġw e",
1590
+ "it ed",
1591
+ "e ver",
1592
+ "ent s",
1593
+ "Ġh im",
1594
+ "as ed",
1595
+ "or s",
1596
+ "o y",
1597
+ "o od",
1598
+ "Ġc ent",
1599
+ "i x",
1600
+ "as e",
1601
+ "il d",
1602
+ "ĠA n",
1603
+ "Ġw ork",
1604
+ "at es",
1605
+ "i ous",
1606
+ "at h",
1607
+ "Ġp o",
1608
+ "ro p",
1609
+ "ol d",
1610
+ "al s",
1611
+ "is s",
1612
+ "e y",
1613
+ "ic t",
1614
+ "Ġf e",
1615
+ "Ġthe m",
1616
+ "g an",
1617
+ "Ġs ec",
1618
+ "Ġb et",
1619
+ "Ġwhe n",
1620
+ "Ġs ong",
1621
+ "Ġre m",
1622
+ "e p",
1623
+ "f orm",
1624
+ "a il",
1625
+ "f er",
1626
+ "Ġe ar",
1627
+ "ub l",
1628
+ "a w",
1629
+ "Ġk n",
1630
+ "ak e",
1631
+ "a us",
1632
+ "Ġm ost",
1633
+ "Ġcon s",
1634
+ "Ġd uring",
1635
+ "ĠA s",
1636
+ "or th",
1637
+ "Ġn ew",
1638
+ "er ed",
1639
+ "il m",
1640
+ "v ed",
1641
+ "at t",
1642
+ "Ġon ly",
1643
+ "Ġd ec",
1644
+ "ic k",
1645
+ "Ġg ame",
1646
+ "on s",
1647
+ "u g",
1648
+ "Ġt r",
1649
+ "f t",
1650
+ "ot h",
1651
+ "o ok",
1652
+ "ĠM ar",
1653
+ "re at",
1654
+ "w ay",
1655
+ "Ġc an",
1656
+ "ol low",
1657
+ "ou th",
1658
+ "we en",
1659
+ "ĠE n",
1660
+ "19 9",
1661
+ "ter s",
1662
+ "Ġre l",
1663
+ "in d",
1664
+ "Ġab out",
1665
+ "Ġse ason",
1666
+ "Ġag ain",
1667
+ "r al",
1668
+ "Ġth ree",
1669
+ "ation al",
1670
+ "Ġu nder",
1671
+ "ul ar",
1672
+ "Ġm e",
1673
+ "Ġth an",
1674
+ "ĠC om",
1675
+ "ĠA r",
1676
+ "h ip",
1677
+ "o b",
1678
+ "Ġn e",
1679
+ "Ġbet ween",
1680
+ "Ġf l",
1681
+ "h n",
1682
+ "v e",
1683
+ "Ġch ar",
1684
+ "Ġc ol",
1685
+ "Ġrec ord",
1686
+ "i ew",
1687
+ "r on",
1688
+ "f ore",
1689
+ "Ġth rough",
1690
+ "is ion",
1691
+ "or n",
1692
+ "oc k",
1693
+ "Ġ ver",
1694
+ "Ġl ater",
1695
+ "Ġn um",
1696
+ "Ġe nd",
1697
+ "ol og",
1698
+ "am es",
1699
+ "Ġp os",
1700
+ "Ġw rit",
1701
+ "Ġpro du",
1702
+ "Ġwh ile",
1703
+ "Ġa ct",
1704
+ "Ġre le",
1705
+ "Ġf ilm",
1706
+ "is hed",
1707
+ "Ġp r",
1708
+ "an s",
1709
+ "Ġre g",
1710
+ "Ġfor m",
1711
+ "Ġas s",
1712
+ "ĠS e",
1713
+ "ur y",
1714
+ "t ed",
1715
+ "t s",
1716
+ "Ġm ade",
1717
+ "Ġsu b",
1718
+ "Ġp e",
1719
+ "1 0",
1720
+ "Ġs o",
1721
+ "or ld",
1722
+ "Ġre t",
1723
+ "ĠN ew",
1724
+ "Ġsp ec",
1725
+ "Ġa cc",
1726
+ "Ġ qu",
1727
+ "Ġwhe re",
1728
+ "en er",
1729
+ "Ġm ov",
1730
+ "he s",
1731
+ "mer ic",
1732
+ "at ing",
1733
+ "Ġin ter",
1734
+ "ĠL e",
1735
+ "ĠA meric",
1736
+ "Ġ ra",
1737
+ "Ġs ome",
1738
+ "Ġc o",
1739
+ "Ġl ar",
1740
+ "Ġb u",
1741
+ "Ġde f",
1742
+ "b um",
1743
+ "Ġa c",
1744
+ "Ġm us",
1745
+ "Ġf ollow",
1746
+ "ĠA t",
1747
+ "in s",
1748
+ "iv ed",
1749
+ "if ic",
1750
+ "u al",
1751
+ "Ġa m",
1752
+ "Ġsu ch",
1753
+ "Ġsec ond",
1754
+ "i ke",
1755
+ "Ġf our",
1756
+ "Ġin d",
1757
+ "an n",
1758
+ "he n",
1759
+ "Ġus ed",
1760
+ "ĠR e",
1761
+ "ic s",
1762
+ "le ct",
1763
+ "Ġd ay",
1764
+ "i el",
1765
+ "il y",
1766
+ "ĠTh is",
1767
+ "00 0",
1768
+ "Ġp ubl",
1769
+ "Ġc all",
1770
+ "ĠJ o",
1771
+ ". .",
1772
+ "l l",
1773
+ "Ġal bum",
1774
+ "ran s",
1775
+ "Ġd o",
1776
+ "an y",
1777
+ "Ġbe fore",
1778
+ "ro s",
1779
+ "ĠS h",
1780
+ "Ġs y",
1781
+ "a id",
1782
+ "ĠEn g",
1783
+ "Ġbe ing",
1784
+ "u c",
1785
+ "Ġe p",
1786
+ "Ġsu pp",
1787
+ "Ġthe re",
1788
+ "Ġyear s",
1789
+ "ar s",
1790
+ "ow ever",
1791
+ "Ġ ent",
1792
+ "if e",
1793
+ "Ġh igh",
1794
+ "Ġf ound",
1795
+ "ir d",
1796
+ "Ġn o",
1797
+ "Ġs et",
1798
+ "1 6",
1799
+ "in es",
1800
+ "iv er",
1801
+ "i o",
1802
+ "ot her",
1803
+ "j ect",
1804
+ "Ġs ur",
1805
+ "a j",
1806
+ "t en",
1807
+ "Ġt ra",
1808
+ "is ed",
1809
+ "it ies",
1810
+ "vel op",
1811
+ "Ġb l",
1812
+ "al e",
1813
+ "Ġser ies",
1814
+ "1 2",
1815
+ "Ġl oc",
1816
+ "Ġnum ber",
1817
+ "Ġp res",
1818
+ "an e",
1819
+ "aus e",
1820
+ "od e",
1821
+ "e k",
1822
+ "t on",
1823
+ "ĠS c",
1824
+ "i er",
1825
+ "is e",
1826
+ "Ġse ver",
1827
+ "in ce",
1828
+ "Ġb oth",
1829
+ "an k",
1830
+ "ro w",
1831
+ "1 5",
1832
+ "ire ct",
1833
+ "s on",
1834
+ "Ġthe n",
1835
+ "ĠB rit",
1836
+ "i et",
1837
+ "Ġep is",
1838
+ "Ġinclud ing",
1839
+ "1 7",
1840
+ "it s",
1841
+ "ig in",
1842
+ "p r",
1843
+ "Ġagain st",
1844
+ "Ġw ell",
1845
+ "Ġbec ame",
1846
+ "Ġex p",
1847
+ "Ġkn own",
1848
+ "Ġt rans",
1849
+ "Ġchar ac",
1850
+ "âĢ Ķ",
1851
+ "r am",
1852
+ "Ġb ack",
1853
+ "Ġad d",
1854
+ "Ġp op",
1855
+ "Ġg o",
1856
+ "ur ch",
1857
+ "Ġdes c",
1858
+ "Ġs ing",
1859
+ "iel d",
1860
+ "Ġper form",
1861
+ "ain ed",
1862
+ "Ġre ce",
1863
+ "id ent",
1864
+ "Ġe m",
1865
+ "er t",
1866
+ "u res",
1867
+ "Ġin v",
1868
+ "19 8",
1869
+ "Ġde p",
1870
+ "a ir",
1871
+ "er n",
1872
+ "at her",
1873
+ "f ul",
1874
+ "Ġ Z",
1875
+ "Ġm on",
1876
+ "Ġman y",
1877
+ "Ġm ain",
1878
+ "Ġst ud",
1879
+ "Ġl ong",
1880
+ "in n",
1881
+ "th ough",
1882
+ "u p",
1883
+ "o ol",
1884
+ "ĠUn ited",
1885
+ "l ed",
1886
+ "em ent",
1887
+ "ow er",
1888
+ "ĠJo hn",
1889
+ "Ġo p",
1890
+ "in ed",
1891
+ "Ġm et",
1892
+ "o ber",
1893
+ "le y",
1894
+ "Ġcent ury",
1895
+ "Ġte am",
1896
+ "Ġ est",
1897
+ "ĠA fter",
1898
+ "y l",
1899
+ "Ġm in",
1900
+ "u ch",
1901
+ "ut e",
1902
+ "Ġde velop",
1903
+ "ĠS he",
1904
+ "i am",
1905
+ "Ġsh ow",
1906
+ "el f",
1907
+ "Ġre p",
1908
+ "Ġcon c",
1909
+ "at ive",
1910
+ "Ġc re",
1911
+ "over n",
1912
+ "a red",
1913
+ "19 4",
1914
+ "Ġor igin",
1915
+ "Ġs m",
1916
+ "iv ers",
1917
+ "a z",
1918
+ "Ġle ad",
1919
+ "Ġsever al",
1920
+ "a h",
1921
+ "Ġo b",
1922
+ "Ġre v",
1923
+ "Ġm ill",
1924
+ "er m",
1925
+ "u ally",
1926
+ "o ot",
1927
+ "Ġbe gan",
1928
+ "19 6",
1929
+ "i red",
1930
+ "Ġd if",
1931
+ "Ġcont in",
1932
+ "Ġs ign",
1933
+ "i k",
1934
+ "ĠI nd",
1935
+ "ment s",
1936
+ "iz ed",
1937
+ "19 7",
1938
+ "Ġd irect",
1939
+ "a u",
1940
+ "Ġex t",
1941
+ "ros s",
1942
+ "em b",
1943
+ "d er",
1944
+ "Ġp ol",
1945
+ "Ġm ay",
1946
+ "a pt",
1947
+ "el s",
1948
+ "ĠW h",
1949
+ "Ġcomp le",
1950
+ "Ġar t",
1951
+ "ĠB r",
1952
+ "ĠI s",
1953
+ "un e",
1954
+ "t il",
1955
+ "Ġc rit",
1956
+ "Ġh ist",
1957
+ "Ġear ly",
1958
+ "Ġc ould",
1959
+ "ĠC on",
1960
+ "Ġd id",
1961
+ "Ġb el",
1962
+ "Ġcall ed",
1963
+ "u ed",
1964
+ "Ġn ear",
1965
+ "Ġepis ode",
1966
+ "y p",
1967
+ "Ġdesc rib",
1968
+ "im es",
1969
+ "Ġb ro",
1970
+ "rou p",
1971
+ "op le",
1972
+ "Ġd own",
1973
+ "Ġr un",
1974
+ "1 3",
1975
+ "ak ing",
1976
+ "Ġdis c",
1977
+ "Ġal ong",
1978
+ "cc ess",
1979
+ "ĠM ay",
1980
+ "Ġfe at",
1981
+ "Ġin st",
1982
+ "ĠAmeric an",
1983
+ "Ġs aid",
1984
+ "Ġd ist",
1985
+ "Ġin f",
1986
+ "Ġim p",
1987
+ "in k",
1988
+ "Ġin s",
1989
+ "t y",
1990
+ "Ġthe se",
1991
+ "Ġm il",
1992
+ "v en",
1993
+ "ĠG er",
1994
+ "g est",
1995
+ "i um",
1996
+ "en n",
1997
+ "ĠB l",
1998
+ "ĠA ust",
1999
+ "Ġres p",
2000
+ "ul l",
2001
+ "ru ct",
2002
+ "u red",
2003
+ "Ġth ough"
2004
+ ]
2005
+ }
2006
+ }
tokenizer_config.json ADDED
@@ -0,0 +1,122 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "add_prefix_space": false,
3
+ "added_tokens_decoder": {
4
+ "0": {
5
+ "content": ">>TITLE<<",
6
+ "lstrip": false,
7
+ "normalized": false,
8
+ "rstrip": false,
9
+ "single_word": false,
10
+ "special": true
11
+ },
12
+ "1": {
13
+ "content": ">>ABSTRACT<<",
14
+ "lstrip": false,
15
+ "normalized": false,
16
+ "rstrip": false,
17
+ "single_word": false,
18
+ "special": true
19
+ },
20
+ "2": {
21
+ "content": ">>INTRODUCTION<<",
22
+ "lstrip": false,
23
+ "normalized": false,
24
+ "rstrip": false,
25
+ "single_word": false,
26
+ "special": true
27
+ },
28
+ "3": {
29
+ "content": ">>SUMMARY<<",
30
+ "lstrip": false,
31
+ "normalized": false,
32
+ "rstrip": false,
33
+ "single_word": false,
34
+ "special": true
35
+ },
36
+ "4": {
37
+ "content": ">>COMMENT<<",
38
+ "lstrip": false,
39
+ "normalized": false,
40
+ "rstrip": false,
41
+ "single_word": false,
42
+ "special": true
43
+ },
44
+ "5": {
45
+ "content": ">>ANSWER<<",
46
+ "lstrip": false,
47
+ "normalized": false,
48
+ "rstrip": false,
49
+ "single_word": false,
50
+ "special": true
51
+ },
52
+ "6": {
53
+ "content": ">>QUESTION<<",
54
+ "lstrip": false,
55
+ "normalized": false,
56
+ "rstrip": false,
57
+ "single_word": false,
58
+ "special": true
59
+ },
60
+ "7": {
61
+ "content": ">>DOMAIN<<",
62
+ "lstrip": false,
63
+ "normalized": false,
64
+ "rstrip": false,
65
+ "single_word": false,
66
+ "special": true
67
+ },
68
+ "8": {
69
+ "content": ">>PREFIX<<",
70
+ "lstrip": false,
71
+ "normalized": false,
72
+ "rstrip": false,
73
+ "single_word": false,
74
+ "special": true
75
+ },
76
+ "9": {
77
+ "content": ">>SUFFIX<<",
78
+ "lstrip": false,
79
+ "normalized": false,
80
+ "rstrip": false,
81
+ "single_word": false,
82
+ "special": true
83
+ },
84
+ "10": {
85
+ "content": ">>MIDDLE<<",
86
+ "lstrip": false,
87
+ "normalized": false,
88
+ "rstrip": false,
89
+ "single_word": false,
90
+ "special": true
91
+ },
92
+ "11": {
93
+ "content": "<|endoftext|>",
94
+ "lstrip": false,
95
+ "normalized": false,
96
+ "rstrip": false,
97
+ "single_word": false,
98
+ "special": true
99
+ }
100
+ },
101
+ "additional_special_tokens": [
102
+ ">>TITLE<<",
103
+ ">>ABSTRACT<<",
104
+ ">>INTRODUCTION<<",
105
+ ">>SUMMARY<<",
106
+ ">>COMMENT<<",
107
+ ">>ANSWER<<",
108
+ ">>QUESTION<<",
109
+ ">>DOMAIN<<",
110
+ ">>PREFIX<<",
111
+ ">>SUFFIX<<",
112
+ ">>MIDDLE<<"
113
+ ],
114
+ "clean_up_tokenization_spaces": true,
115
+ "eos_token": "<|endoftext|>",
116
+ "model_input_names": [
117
+ "input_ids",
118
+ "attention_mask"
119
+ ],
120
+ "model_max_length": 512,
121
+ "tokenizer_class": "PreTrainedTokenizerFast"
122
+ }