Cleo3927 committed on
Commit
fc051ee
·
verified ·
1 Parent(s): f8a2cf4

Training in progress, step 240

Browse files
config.json CHANGED
@@ -3,6 +3,7 @@
3
  "EncoderDecoderModel"
4
  ],
5
  "decoder": {
 
6
  "_name_or_path": "",
7
  "add_cross_attention": true,
8
  "architectures": null,
@@ -78,10 +79,11 @@
78
  "typical_p": 1.0,
79
  "use_bfloat16": false,
80
  "use_cache": true,
81
- "vocab_size": 53
82
  },
83
  "decoder_start_token_id": 2,
84
  "encoder": {
 
85
  "_name_or_path": "",
86
  "add_cross_attention": false,
87
  "architectures": null,
@@ -157,13 +159,13 @@
157
  "typical_p": 1.0,
158
  "use_bfloat16": false,
159
  "use_cache": true,
160
- "vocab_size": 53
161
  },
162
  "eos_token_id": 0,
163
  "is_encoder_decoder": true,
164
  "model_type": "encoder-decoder",
165
  "pad_token_id": 3,
166
  "torch_dtype": "float32",
167
- "transformers_version": "4.38.1",
168
  "unk_token_id": null
169
  }
 
3
  "EncoderDecoderModel"
4
  ],
5
  "decoder": {
6
+ "_attn_implementation_autoset": false,
7
  "_name_or_path": "",
8
  "add_cross_attention": true,
9
  "architectures": null,
 
79
  "typical_p": 1.0,
80
  "use_bfloat16": false,
81
  "use_cache": true,
82
+ "vocab_size": 52
83
  },
84
  "decoder_start_token_id": 2,
85
  "encoder": {
86
+ "_attn_implementation_autoset": false,
87
  "_name_or_path": "",
88
  "add_cross_attention": false,
89
  "architectures": null,
 
159
  "typical_p": 1.0,
160
  "use_bfloat16": false,
161
  "use_cache": true,
162
+ "vocab_size": 52
163
  },
164
  "eos_token_id": 0,
165
  "is_encoder_decoder": true,
166
  "model_type": "encoder-decoder",
167
  "pad_token_id": 3,
168
  "torch_dtype": "float32",
169
+ "transformers_version": "4.48.3",
170
  "unk_token_id": null
171
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:36d9c024e1e3d7d9a5df926e8039a15c4bd48836b296e195124e53acefbe0cdb
3
- size 31207604
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b03dd9866b16e1489cafed293ba084665b8b1265bce390aca66bcbf89c4a9e18
3
+ size 31205552
runs/Mar03_20-16-38_8d7670e5dd92/events.out.tfevents.1741032999.8d7670e5dd92.554.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:222a6d199bb099581572501f0e2ea2fc213d84a59f2a30e38c05fce03befb4c2
3
+ size 9132
runs/Mar03_20-17-28_8d7670e5dd92/events.out.tfevents.1741033049.8d7670e5dd92.554.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4ac091c7296f21a778a638ad702c2e0183ac4c578b17d5da027c1faeb9f0aef3
3
+ size 9132
runs/Mar03_20-28-52_8d7670e5dd92/events.out.tfevents.1741033733.8d7670e5dd92.554.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:27be49082bfed6bb918edc34e3f44496da5b43396b8c9b1fd423817cf8a0310d
3
+ size 27952
tokenizer.json CHANGED
@@ -95,6 +95,7 @@
95
  "end_of_word_suffix": null,
96
  "fuse_unk": false,
97
  "byte_fallback": false,
 
98
  "vocab": {
99
  "[EOS]": 0,
100
  "[UNK]": 1,
@@ -112,81 +113,188 @@
112
  "7": 13,
113
  "8": 14,
114
  "9": 15,
115
- "=": 16,
116
  "99": 17,
117
- "10": 18,
118
- "98": 19,
119
- "11": 20,
120
  "12": 21,
121
- "97": 22,
122
  "13": 23,
123
- "96": 24,
124
  "95": 25,
125
- "14": 26,
126
  "94": 27,
127
- "15": 28,
128
  "16": 29,
129
- "93": 30,
130
- "17": 31,
131
- "92": 32,
132
- "91": 33,
133
- "18": 34,
134
- "19": 35,
135
- "90": 36,
136
  "20": 37,
137
- "89": 38,
138
  "21": 39,
139
- "88": 40,
140
- "22": 41,
141
- "87": 42,
142
  "23": 43,
143
- "86": 44,
144
- "24": 45,
145
- "85": 46,
146
  "25": 47,
147
- "84": 48,
148
- "26": 49,
149
- "83": 50,
150
- "27": 51,
151
- "82": 52
152
  },
153
  "merges": [
154
- "9 9",
155
- "1 0",
156
- "9 8",
157
- "1 1",
158
- "1 2",
159
- "9 7",
160
- "1 3",
161
- "9 6",
162
- "9 5",
163
- "1 4",
164
- "9 4",
165
- "1 5",
166
- "1 6",
167
- "9 3",
168
- "1 7",
169
- "9 2",
170
- "9 1",
171
- "1 8",
172
- "1 9",
173
- "9 0",
174
- "2 0",
175
- "8 9",
176
- "2 1",
177
- "8 8",
178
- "2 2",
179
- "8 7",
180
- "2 3",
181
- "8 6",
182
- "2 4",
183
- "8 5",
184
- "2 5",
185
- "8 4",
186
- "2 6",
187
- "8 3",
188
- "2 7",
189
- "8 2"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
190
  ]
191
  }
192
  }
 
95
  "end_of_word_suffix": null,
96
  "fuse_unk": false,
97
  "byte_fallback": false,
98
+ "ignore_merges": false,
99
  "vocab": {
100
  "[EOS]": 0,
101
  "[UNK]": 1,
 
113
  "7": 13,
114
  "8": 14,
115
  "9": 15,
116
+ "10": 16,
117
  "99": 17,
118
+ "98": 18,
119
+ "11": 19,
120
+ "97": 20,
121
  "12": 21,
122
+ "96": 22,
123
  "13": 23,
124
+ "14": 24,
125
  "95": 25,
126
+ "15": 26,
127
  "94": 27,
128
+ "93": 28,
129
  "16": 29,
130
+ "17": 30,
131
+ "92": 31,
132
+ "91": 32,
133
+ "18": 33,
134
+ "19": 34,
135
+ "90": 35,
136
+ "89": 36,
137
  "20": 37,
138
+ "88": 38,
139
  "21": 39,
140
+ "22": 40,
141
+ "87": 41,
142
+ "86": 42,
143
  "23": 43,
144
+ "24": 44,
145
+ "85": 45,
146
+ "84": 46,
147
  "25": 47,
148
+ "26": 48,
149
+ "83": 49,
150
+ "27": 50,
151
+ "82": 51
 
152
  },
153
  "merges": [
154
+ [
155
+ "1",
156
+ "0"
157
+ ],
158
+ [
159
+ "9",
160
+ "9"
161
+ ],
162
+ [
163
+ "9",
164
+ "8"
165
+ ],
166
+ [
167
+ "1",
168
+ "1"
169
+ ],
170
+ [
171
+ "9",
172
+ "7"
173
+ ],
174
+ [
175
+ "1",
176
+ "2"
177
+ ],
178
+ [
179
+ "9",
180
+ "6"
181
+ ],
182
+ [
183
+ "1",
184
+ "3"
185
+ ],
186
+ [
187
+ "1",
188
+ "4"
189
+ ],
190
+ [
191
+ "9",
192
+ "5"
193
+ ],
194
+ [
195
+ "1",
196
+ "5"
197
+ ],
198
+ [
199
+ "9",
200
+ "4"
201
+ ],
202
+ [
203
+ "9",
204
+ "3"
205
+ ],
206
+ [
207
+ "1",
208
+ "6"
209
+ ],
210
+ [
211
+ "1",
212
+ "7"
213
+ ],
214
+ [
215
+ "9",
216
+ "2"
217
+ ],
218
+ [
219
+ "9",
220
+ "1"
221
+ ],
222
+ [
223
+ "1",
224
+ "8"
225
+ ],
226
+ [
227
+ "1",
228
+ "9"
229
+ ],
230
+ [
231
+ "9",
232
+ "0"
233
+ ],
234
+ [
235
+ "8",
236
+ "9"
237
+ ],
238
+ [
239
+ "2",
240
+ "0"
241
+ ],
242
+ [
243
+ "8",
244
+ "8"
245
+ ],
246
+ [
247
+ "2",
248
+ "1"
249
+ ],
250
+ [
251
+ "2",
252
+ "2"
253
+ ],
254
+ [
255
+ "8",
256
+ "7"
257
+ ],
258
+ [
259
+ "8",
260
+ "6"
261
+ ],
262
+ [
263
+ "2",
264
+ "3"
265
+ ],
266
+ [
267
+ "2",
268
+ "4"
269
+ ],
270
+ [
271
+ "8",
272
+ "5"
273
+ ],
274
+ [
275
+ "8",
276
+ "4"
277
+ ],
278
+ [
279
+ "2",
280
+ "5"
281
+ ],
282
+ [
283
+ "2",
284
+ "6"
285
+ ],
286
+ [
287
+ "8",
288
+ "3"
289
+ ],
290
+ [
291
+ "2",
292
+ "7"
293
+ ],
294
+ [
295
+ "8",
296
+ "2"
297
+ ]
298
  ]
299
  }
300
  }
tokenizer_config.json CHANGED
@@ -33,9 +33,10 @@
33
  "special": true
34
  }
35
  },
36
- "clean_up_tokenization_spaces": true,
37
  "cls_token": "[CLS]",
38
  "eos_token": "[EOS]",
 
39
  "model_max_length": 1000000000000000019884624838656,
40
  "pad_token": "[PAD]",
41
  "tokenizer_class": "PreTrainedTokenizerFast"
 
33
  "special": true
34
  }
35
  },
36
+ "clean_up_tokenization_spaces": false,
37
  "cls_token": "[CLS]",
38
  "eos_token": "[EOS]",
39
+ "extra_special_tokens": {},
40
  "model_max_length": 1000000000000000019884624838656,
41
  "pad_token": "[PAD]",
42
  "tokenizer_class": "PreTrainedTokenizerFast"
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d3f63b88acd55144274e10cea203015237b824f2edc459fa6207a536b4ed9983
3
- size 5112
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5608d1a93fb9374e9f46c3ce223d0542685ffcc484bd6cb7ef470ec61f58bb2f
3
+ size 5496