neginr commited on
Commit
7904a45
·
verified ·
1 Parent(s): 1604df7

Training in progress, epoch 2

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f10ad0c990899f705f5d432a4532d775a7d3d084dd9c9f9be0ae23bba0d48cb0
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a5e6a24a4b33bebb769025034352144593b686d63194976104f33c3822616fb8
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:96ebfc4bc368c86172b060c19329e902f5b2d7215c73ae1602382f0e4d50a991
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4eb73807cf55566f5292d1156b7471e74707cba5bbb56affb94936879d311d0b
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:710d9b234280555cc0d13db7a3e4ceb2173890cd133c1b13549e8ea06ca65233
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0bc6eec6a4aa0c6b76330b9442a032ad047a0fe3b3cc8bbe4cfb7a789080b9fe
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e7b4bf9e938fcecc3ac08a2ddbacfc246eddb1bf4a97fa7ffbdeeb3425a0a6a2
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4bf274cd83f46328ae4382bd619460fd7105c242b7a21b742bfcf4e99d2763a4
3
  size 1089994880
trainer_log.jsonl CHANGED
@@ -222,3 +222,114 @@
222
  {"current_steps": 221, "total_steps": 555, "loss": 0.5589, "lr": 6.0290081411946785e-05, "epoch": 1.9887514060742406, "percentage": 39.82, "elapsed_time": "7:17:46", "remaining_time": "11:01:36"}
223
  {"current_steps": 222, "total_steps": 555, "loss": 0.5489, "lr": 6.007265327506734e-05, "epoch": 1.9977502812148482, "percentage": 40.0, "elapsed_time": "7:19:43", "remaining_time": "10:59:35"}
224
  {"current_steps": 223, "total_steps": 555, "loss": 0.9973, "lr": 5.985442952494643e-05, "epoch": 2.0067491563554554, "percentage": 40.18, "elapsed_time": "7:23:29", "remaining_time": "11:00:16"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
222
  {"current_steps": 221, "total_steps": 555, "loss": 0.5589, "lr": 6.0290081411946785e-05, "epoch": 1.9887514060742406, "percentage": 39.82, "elapsed_time": "7:17:46", "remaining_time": "11:01:36"}
223
  {"current_steps": 222, "total_steps": 555, "loss": 0.5489, "lr": 6.007265327506734e-05, "epoch": 1.9977502812148482, "percentage": 40.0, "elapsed_time": "7:19:43", "remaining_time": "10:59:35"}
224
  {"current_steps": 223, "total_steps": 555, "loss": 0.9973, "lr": 5.985442952494643e-05, "epoch": 2.0067491563554554, "percentage": 40.18, "elapsed_time": "7:23:29", "remaining_time": "11:00:16"}
225
+ {"current_steps": 224, "total_steps": 555, "loss": 0.5251, "lr": 5.9635418811248e-05, "epoch": 2.015748031496063, "percentage": 40.36, "elapsed_time": "7:25:27", "remaining_time": "10:58:14"}
226
+ {"current_steps": 225, "total_steps": 555, "loss": 0.5222, "lr": 5.941562981482859e-05, "epoch": 2.0247469066366706, "percentage": 40.54, "elapsed_time": "7:27:24", "remaining_time": "10:56:11"}
227
+ {"current_steps": 226, "total_steps": 555, "loss": 0.5175, "lr": 5.9195071247393325e-05, "epoch": 2.0337457817772777, "percentage": 40.72, "elapsed_time": "7:29:21", "remaining_time": "10:54:09"}
228
+ {"current_steps": 227, "total_steps": 555, "loss": 0.5219, "lr": 5.897375185115052e-05, "epoch": 2.0427446569178853, "percentage": 40.9, "elapsed_time": "7:31:17", "remaining_time": "10:52:04"}
229
+ {"current_steps": 228, "total_steps": 555, "loss": 0.5248, "lr": 5.8751680398465244e-05, "epoch": 2.0517435320584925, "percentage": 41.08, "elapsed_time": "7:33:12", "remaining_time": "10:49:59"}
230
+ {"current_steps": 229, "total_steps": 555, "loss": 0.531, "lr": 5.8528865691511564e-05, "epoch": 2.0607424071991, "percentage": 41.26, "elapsed_time": "7:35:08", "remaining_time": "10:47:56"}
231
+ {"current_steps": 230, "total_steps": 555, "loss": 0.5185, "lr": 5.83053165619237e-05, "epoch": 2.0697412823397077, "percentage": 41.44, "elapsed_time": "7:37:05", "remaining_time": "10:45:52"}
232
+ {"current_steps": 231, "total_steps": 555, "loss": 0.5238, "lr": 5.808104187044592e-05, "epoch": 2.078740157480315, "percentage": 41.62, "elapsed_time": "7:39:03", "remaining_time": "10:43:52"}
233
+ {"current_steps": 232, "total_steps": 555, "loss": 0.5116, "lr": 5.785605050658134e-05, "epoch": 2.0877390326209224, "percentage": 41.8, "elapsed_time": "7:41:00", "remaining_time": "10:41:50"}
234
+ {"current_steps": 233, "total_steps": 555, "loss": 0.5188, "lr": 5.7630351388239654e-05, "epoch": 2.09673790776153, "percentage": 41.98, "elapsed_time": "7:42:58", "remaining_time": "10:39:48"}
235
+ {"current_steps": 234, "total_steps": 555, "loss": 0.5189, "lr": 5.7403953461383515e-05, "epoch": 2.105736782902137, "percentage": 42.16, "elapsed_time": "7:44:55", "remaining_time": "10:37:46"}
236
+ {"current_steps": 235, "total_steps": 555, "loss": 0.513, "lr": 5.717686569967406e-05, "epoch": 2.1147356580427448, "percentage": 42.34, "elapsed_time": "7:46:51", "remaining_time": "10:35:43"}
237
+ {"current_steps": 236, "total_steps": 555, "loss": 0.5136, "lr": 5.694909710411517e-05, "epoch": 2.123734533183352, "percentage": 42.52, "elapsed_time": "7:48:48", "remaining_time": "10:33:41"}
238
+ {"current_steps": 237, "total_steps": 555, "loss": 0.5226, "lr": 5.672065670269674e-05, "epoch": 2.1327334083239595, "percentage": 42.7, "elapsed_time": "7:50:45", "remaining_time": "10:31:39"}
239
+ {"current_steps": 238, "total_steps": 555, "loss": 0.517, "lr": 5.649155355003677e-05, "epoch": 2.141732283464567, "percentage": 42.88, "elapsed_time": "7:52:41", "remaining_time": "10:29:35"}
240
+ {"current_steps": 239, "total_steps": 555, "loss": 0.5166, "lr": 5.6261796727022575e-05, "epoch": 2.1507311586051743, "percentage": 43.06, "elapsed_time": "7:54:38", "remaining_time": "10:27:33"}
241
+ {"current_steps": 240, "total_steps": 555, "loss": 0.5112, "lr": 5.603139534045075e-05, "epoch": 2.159730033745782, "percentage": 43.24, "elapsed_time": "7:56:36", "remaining_time": "10:25:32"}
242
+ {"current_steps": 241, "total_steps": 555, "loss": 0.5078, "lr": 5.5800358522666254e-05, "epoch": 2.168728908886389, "percentage": 43.42, "elapsed_time": "7:58:34", "remaining_time": "10:23:31"}
243
+ {"current_steps": 242, "total_steps": 555, "loss": 0.5194, "lr": 5.556869543120043e-05, "epoch": 2.1777277840269966, "percentage": 43.6, "elapsed_time": "8:00:29", "remaining_time": "10:21:27"}
244
+ {"current_steps": 243, "total_steps": 555, "loss": 0.5177, "lr": 5.533641524840805e-05, "epoch": 2.1867266591676042, "percentage": 43.78, "elapsed_time": "8:02:25", "remaining_time": "10:19:25"}
245
+ {"current_steps": 244, "total_steps": 555, "loss": 0.5169, "lr": 5.5103527181103266e-05, "epoch": 2.1957255343082114, "percentage": 43.96, "elapsed_time": "8:04:22", "remaining_time": "10:17:22"}
246
+ {"current_steps": 245, "total_steps": 555, "loss": 0.5166, "lr": 5.4870040460194834e-05, "epoch": 2.204724409448819, "percentage": 44.14, "elapsed_time": "8:06:18", "remaining_time": "10:15:20"}
247
+ {"current_steps": 246, "total_steps": 555, "loss": 0.5162, "lr": 5.463596434032011e-05, "epoch": 2.213723284589426, "percentage": 44.32, "elapsed_time": "8:08:14", "remaining_time": "10:13:17"}
248
+ {"current_steps": 247, "total_steps": 555, "loss": 0.5211, "lr": 5.440130809947824e-05, "epoch": 2.2227221597300337, "percentage": 44.5, "elapsed_time": "8:10:08", "remaining_time": "10:11:11"}
249
+ {"current_steps": 248, "total_steps": 555, "loss": 0.5114, "lr": 5.4166081038662484e-05, "epoch": 2.2317210348706413, "percentage": 44.68, "elapsed_time": "8:12:04", "remaining_time": "10:09:08"}
250
+ {"current_steps": 249, "total_steps": 555, "loss": 0.5101, "lr": 5.3930292481491494e-05, "epoch": 2.2407199100112485, "percentage": 44.86, "elapsed_time": "8:14:03", "remaining_time": "10:07:08"}
251
+ {"current_steps": 250, "total_steps": 555, "loss": 0.5111, "lr": 5.3693951773839736e-05, "epoch": 2.249718785151856, "percentage": 45.05, "elapsed_time": "8:16:00", "remaining_time": "10:05:07"}
252
+ {"current_steps": 251, "total_steps": 555, "loss": 0.516, "lr": 5.345706828346715e-05, "epoch": 2.2587176602924632, "percentage": 45.23, "elapsed_time": "8:17:58", "remaining_time": "10:03:07"}
253
+ {"current_steps": 252, "total_steps": 555, "loss": 0.5168, "lr": 5.3219651399647716e-05, "epoch": 2.267716535433071, "percentage": 45.41, "elapsed_time": "8:19:56", "remaining_time": "10:01:07"}
254
+ {"current_steps": 253, "total_steps": 555, "loss": 0.5089, "lr": 5.298171053279739e-05, "epoch": 2.2767154105736784, "percentage": 45.59, "elapsed_time": "8:21:55", "remaining_time": "9:59:08"}
255
+ {"current_steps": 254, "total_steps": 555, "loss": 0.5165, "lr": 5.274325511410106e-05, "epoch": 2.2857142857142856, "percentage": 45.77, "elapsed_time": "8:23:55", "remaining_time": "9:57:10"}
256
+ {"current_steps": 255, "total_steps": 555, "loss": 0.5148, "lr": 5.250429459513876e-05, "epoch": 2.294713160854893, "percentage": 45.95, "elapsed_time": "8:25:53", "remaining_time": "9:55:10"}
257
+ {"current_steps": 256, "total_steps": 555, "loss": 0.5098, "lr": 5.226483844751099e-05, "epoch": 2.303712035995501, "percentage": 46.13, "elapsed_time": "8:27:51", "remaining_time": "9:53:09"}
258
+ {"current_steps": 257, "total_steps": 555, "loss": 0.5158, "lr": 5.202489616246333e-05, "epoch": 2.312710911136108, "percentage": 46.31, "elapsed_time": "8:29:48", "remaining_time": "9:51:08"}
259
+ {"current_steps": 258, "total_steps": 555, "loss": 0.5137, "lr": 5.178447725051026e-05, "epoch": 2.3217097862767155, "percentage": 46.49, "elapsed_time": "8:31:50", "remaining_time": "9:49:12"}
260
+ {"current_steps": 259, "total_steps": 555, "loss": 0.5149, "lr": 5.154359124105814e-05, "epoch": 2.3307086614173227, "percentage": 46.67, "elapsed_time": "8:33:50", "remaining_time": "9:47:14"}
261
+ {"current_steps": 260, "total_steps": 555, "loss": 0.5122, "lr": 5.1302247682027494e-05, "epoch": 2.3397075365579303, "percentage": 46.85, "elapsed_time": "8:35:48", "remaining_time": "9:45:14"}
262
+ {"current_steps": 261, "total_steps": 555, "loss": 0.5106, "lr": 5.106045613947466e-05, "epoch": 2.3487064116985374, "percentage": 47.03, "elapsed_time": "8:37:44", "remaining_time": "9:43:11"}
263
+ {"current_steps": 262, "total_steps": 555, "loss": 0.5098, "lr": 5.08182261972125e-05, "epoch": 2.357705286839145, "percentage": 47.21, "elapsed_time": "8:39:40", "remaining_time": "9:41:10"}
264
+ {"current_steps": 263, "total_steps": 555, "loss": 0.5152, "lr": 5.057556745643058e-05, "epoch": 2.3667041619797526, "percentage": 47.39, "elapsed_time": "8:41:37", "remaining_time": "9:39:08"}
265
+ {"current_steps": 264, "total_steps": 555, "loss": 0.5096, "lr": 5.033248953531466e-05, "epoch": 2.37570303712036, "percentage": 47.57, "elapsed_time": "8:43:33", "remaining_time": "9:37:06"}
266
+ {"current_steps": 265, "total_steps": 555, "loss": 0.5108, "lr": 5.0089002068665376e-05, "epoch": 2.3847019122609674, "percentage": 47.75, "elapsed_time": "8:45:29", "remaining_time": "9:35:04"}
267
+ {"current_steps": 266, "total_steps": 555, "loss": 0.5169, "lr": 4.9845114707516395e-05, "epoch": 2.393700787401575, "percentage": 47.93, "elapsed_time": "8:47:27", "remaining_time": "9:33:04"}
268
+ {"current_steps": 267, "total_steps": 555, "loss": 0.5077, "lr": 4.9600837118751874e-05, "epoch": 2.402699662542182, "percentage": 48.11, "elapsed_time": "8:49:23", "remaining_time": "9:31:02"}
269
+ {"current_steps": 268, "total_steps": 555, "loss": 0.5211, "lr": 4.93561789847233e-05, "epoch": 2.4116985376827897, "percentage": 48.29, "elapsed_time": "8:51:19", "remaining_time": "9:28:59"}
270
+ {"current_steps": 269, "total_steps": 555, "loss": 0.5098, "lr": 4.91111500028657e-05, "epoch": 2.420697412823397, "percentage": 48.47, "elapsed_time": "8:53:15", "remaining_time": "9:26:57"}
271
+ {"current_steps": 270, "total_steps": 555, "loss": 0.5175, "lr": 4.886575988531329e-05, "epoch": 2.4296962879640045, "percentage": 48.65, "elapsed_time": "8:55:12", "remaining_time": "9:24:56"}
272
+ {"current_steps": 271, "total_steps": 555, "loss": 0.5136, "lr": 4.862001835851449e-05, "epoch": 2.438695163104612, "percentage": 48.83, "elapsed_time": "8:57:08", "remaining_time": "9:22:55"}
273
+ {"current_steps": 272, "total_steps": 555, "loss": 0.5099, "lr": 4.837393516284642e-05, "epoch": 2.4476940382452193, "percentage": 49.01, "elapsed_time": "8:59:04", "remaining_time": "9:20:53"}
274
+ {"current_steps": 273, "total_steps": 555, "loss": 0.5165, "lr": 4.8127520052228815e-05, "epoch": 2.456692913385827, "percentage": 49.19, "elapsed_time": "9:01:05", "remaining_time": "9:18:55"}
275
+ {"current_steps": 274, "total_steps": 555, "loss": 0.5084, "lr": 4.788078279373744e-05, "epoch": 2.465691788526434, "percentage": 49.37, "elapsed_time": "9:03:03", "remaining_time": "9:16:56"}
276
+ {"current_steps": 275, "total_steps": 555, "loss": 0.5134, "lr": 4.763373316721687e-05, "epoch": 2.4746906636670416, "percentage": 49.55, "elapsed_time": "9:05:00", "remaining_time": "9:14:54"}
277
+ {"current_steps": 276, "total_steps": 555, "loss": 0.5137, "lr": 4.7386380964892984e-05, "epoch": 2.483689538807649, "percentage": 49.73, "elapsed_time": "9:06:58", "remaining_time": "9:12:55"}
278
+ {"current_steps": 277, "total_steps": 555, "loss": 0.5128, "lr": 4.713873599098471e-05, "epoch": 2.4926884139482564, "percentage": 49.91, "elapsed_time": "9:08:56", "remaining_time": "9:10:55"}
279
+ {"current_steps": 278, "total_steps": 555, "loss": 0.5114, "lr": 4.689080806131547e-05, "epoch": 2.501687289088864, "percentage": 50.09, "elapsed_time": "9:10:53", "remaining_time": "9:08:54"}
280
+ {"current_steps": 279, "total_steps": 555, "loss": 0.5095, "lr": 4.664260700292416e-05, "epoch": 2.5106861642294716, "percentage": 50.27, "elapsed_time": "9:12:52", "remaining_time": "9:06:55"}
281
+ {"current_steps": 280, "total_steps": 555, "loss": 0.509, "lr": 4.639414265367554e-05, "epoch": 2.5196850393700787, "percentage": 50.45, "elapsed_time": "9:14:51", "remaining_time": "9:04:56"}
282
+ {"current_steps": 281, "total_steps": 555, "loss": 0.5135, "lr": 4.614542486187033e-05, "epoch": 2.5286839145106863, "percentage": 50.63, "elapsed_time": "9:16:46", "remaining_time": "9:02:54"}
283
+ {"current_steps": 282, "total_steps": 555, "loss": 0.5129, "lr": 4.589646348585494e-05, "epoch": 2.5376827896512935, "percentage": 50.81, "elapsed_time": "9:18:42", "remaining_time": "9:00:52"}
284
+ {"current_steps": 283, "total_steps": 555, "loss": 0.5119, "lr": 4.564726839363059e-05, "epoch": 2.546681664791901, "percentage": 50.99, "elapsed_time": "9:20:38", "remaining_time": "8:58:50"}
285
+ {"current_steps": 284, "total_steps": 555, "loss": 0.5226, "lr": 4.539784946246225e-05, "epoch": 2.555680539932508, "percentage": 51.17, "elapsed_time": "9:22:35", "remaining_time": "8:56:49"}
286
+ {"current_steps": 285, "total_steps": 555, "loss": 0.5205, "lr": 4.5148216578487134e-05, "epoch": 2.564679415073116, "percentage": 51.35, "elapsed_time": "9:24:30", "remaining_time": "8:54:48"}
287
+ {"current_steps": 286, "total_steps": 555, "loss": 0.5078, "lr": 4.4898379636322815e-05, "epoch": 2.5736782902137234, "percentage": 51.53, "elapsed_time": "9:26:26", "remaining_time": "8:52:46"}
288
+ {"current_steps": 287, "total_steps": 555, "loss": 0.5146, "lr": 4.4648348538675064e-05, "epoch": 2.5826771653543306, "percentage": 51.71, "elapsed_time": "9:28:22", "remaining_time": "8:50:44"}
289
+ {"current_steps": 288, "total_steps": 555, "loss": 0.5124, "lr": 4.4398133195945326e-05, "epoch": 2.591676040494938, "percentage": 51.89, "elapsed_time": "9:30:18", "remaining_time": "8:48:43"}
290
+ {"current_steps": 289, "total_steps": 555, "loss": 0.5141, "lr": 4.414774352583791e-05, "epoch": 2.6006749156355458, "percentage": 52.07, "elapsed_time": "9:32:15", "remaining_time": "8:46:43"}
291
+ {"current_steps": 290, "total_steps": 555, "loss": 0.5126, "lr": 4.3897189452966895e-05, "epoch": 2.609673790776153, "percentage": 52.25, "elapsed_time": "9:34:12", "remaining_time": "8:44:42"}
292
+ {"current_steps": 291, "total_steps": 555, "loss": 0.5133, "lr": 4.364648090846271e-05, "epoch": 2.6186726659167605, "percentage": 52.43, "elapsed_time": "9:36:07", "remaining_time": "8:42:40"}
293
+ {"current_steps": 292, "total_steps": 555, "loss": 0.5083, "lr": 4.339562782957857e-05, "epoch": 2.6276715410573677, "percentage": 52.61, "elapsed_time": "9:38:05", "remaining_time": "8:40:40"}
294
+ {"current_steps": 293, "total_steps": 555, "loss": 0.5194, "lr": 4.314464015929649e-05, "epoch": 2.6366704161979753, "percentage": 52.79, "elapsed_time": "9:39:59", "remaining_time": "8:38:37"}
295
+ {"current_steps": 294, "total_steps": 555, "loss": 0.5128, "lr": 4.28935278459333e-05, "epoch": 2.6456692913385824, "percentage": 52.97, "elapsed_time": "9:41:55", "remaining_time": "8:36:36"}
296
+ {"current_steps": 295, "total_steps": 555, "loss": 0.5148, "lr": 4.264230084274624e-05, "epoch": 2.65466816647919, "percentage": 53.15, "elapsed_time": "9:43:50", "remaining_time": "8:34:34"}
297
+ {"current_steps": 296, "total_steps": 555, "loss": 0.5097, "lr": 4.239096910753846e-05, "epoch": 2.6636670416197976, "percentage": 53.33, "elapsed_time": "9:45:47", "remaining_time": "8:32:34"}
298
+ {"current_steps": 297, "total_steps": 555, "loss": 0.5108, "lr": 4.213954260226438e-05, "epoch": 2.6726659167604048, "percentage": 53.51, "elapsed_time": "9:47:44", "remaining_time": "8:30:34"}
299
+ {"current_steps": 298, "total_steps": 555, "loss": 0.5084, "lr": 4.188803129263476e-05, "epoch": 2.6816647919010124, "percentage": 53.69, "elapsed_time": "9:49:41", "remaining_time": "8:28:33"}
300
+ {"current_steps": 299, "total_steps": 555, "loss": 0.5078, "lr": 4.163644514772172e-05, "epoch": 2.69066366704162, "percentage": 53.87, "elapsed_time": "9:51:38", "remaining_time": "8:26:33"}
301
+ {"current_steps": 300, "total_steps": 555, "loss": 0.5177, "lr": 4.1384794139563614e-05, "epoch": 2.699662542182227, "percentage": 54.05, "elapsed_time": "9:53:34", "remaining_time": "8:24:32"}
302
+ {"current_steps": 301, "total_steps": 555, "loss": 0.5149, "lr": 4.113308824276977e-05, "epoch": 2.7086614173228347, "percentage": 54.23, "elapsed_time": "9:55:30", "remaining_time": "8:22:31"}
303
+ {"current_steps": 302, "total_steps": 555, "loss": 0.5088, "lr": 4.0881337434125086e-05, "epoch": 2.7176602924634423, "percentage": 54.41, "elapsed_time": "9:57:31", "remaining_time": "8:20:34"}
304
+ {"current_steps": 303, "total_steps": 555, "loss": 0.509, "lr": 4.0629551692194634e-05, "epoch": 2.7266591676040495, "percentage": 54.59, "elapsed_time": "9:59:27", "remaining_time": "8:18:33"}
305
+ {"current_steps": 304, "total_steps": 555, "loss": 0.5143, "lr": 4.037774099692815e-05, "epoch": 2.735658042744657, "percentage": 54.77, "elapsed_time": "10:01:23", "remaining_time": "8:16:32"}
306
+ {"current_steps": 305, "total_steps": 555, "loss": 0.5123, "lr": 4.0125915329264396e-05, "epoch": 2.7446569178852642, "percentage": 54.95, "elapsed_time": "10:03:19", "remaining_time": "8:14:31"}
307
+ {"current_steps": 306, "total_steps": 555, "loss": 0.5132, "lr": 3.9874084670735624e-05, "epoch": 2.753655793025872, "percentage": 55.14, "elapsed_time": "10:05:16", "remaining_time": "8:12:31"}
308
+ {"current_steps": 307, "total_steps": 555, "loss": 0.5088, "lr": 3.962225900307187e-05, "epoch": 2.762654668166479, "percentage": 55.32, "elapsed_time": "10:07:12", "remaining_time": "8:10:30"}
309
+ {"current_steps": 308, "total_steps": 555, "loss": 0.5115, "lr": 3.937044830780537e-05, "epoch": 2.7716535433070866, "percentage": 55.5, "elapsed_time": "10:09:09", "remaining_time": "8:08:30"}
310
+ {"current_steps": 309, "total_steps": 555, "loss": 0.5088, "lr": 3.9118662565874934e-05, "epoch": 2.780652418447694, "percentage": 55.68, "elapsed_time": "10:11:06", "remaining_time": "8:06:30"}
311
+ {"current_steps": 310, "total_steps": 555, "loss": 0.515, "lr": 3.886691175723025e-05, "epoch": 2.7896512935883013, "percentage": 55.86, "elapsed_time": "10:13:01", "remaining_time": "8:04:29"}
312
+ {"current_steps": 311, "total_steps": 555, "loss": 0.5102, "lr": 3.8615205860436406e-05, "epoch": 2.798650168728909, "percentage": 56.04, "elapsed_time": "10:14:57", "remaining_time": "8:02:28"}
313
+ {"current_steps": 312, "total_steps": 555, "loss": 0.5142, "lr": 3.83635548522783e-05, "epoch": 2.8076490438695165, "percentage": 56.22, "elapsed_time": "10:16:53", "remaining_time": "8:00:27"}
314
+ {"current_steps": 313, "total_steps": 555, "loss": 0.5143, "lr": 3.811196870736526e-05, "epoch": 2.8166479190101237, "percentage": 56.4, "elapsed_time": "10:18:49", "remaining_time": "7:58:27"}
315
+ {"current_steps": 314, "total_steps": 555, "loss": 0.5066, "lr": 3.786045739773564e-05, "epoch": 2.8256467941507313, "percentage": 56.58, "elapsed_time": "10:20:46", "remaining_time": "7:56:27"}
316
+ {"current_steps": 315, "total_steps": 555, "loss": 0.5077, "lr": 3.7609030892461554e-05, "epoch": 2.8346456692913384, "percentage": 56.76, "elapsed_time": "10:22:42", "remaining_time": "7:54:26"}
317
+ {"current_steps": 316, "total_steps": 555, "loss": 0.5104, "lr": 3.735769915725378e-05, "epoch": 2.843644544431946, "percentage": 56.94, "elapsed_time": "10:24:37", "remaining_time": "7:52:25"}
318
+ {"current_steps": 317, "total_steps": 555, "loss": 0.5076, "lr": 3.710647215406672e-05, "epoch": 2.852643419572553, "percentage": 57.12, "elapsed_time": "10:26:36", "remaining_time": "7:50:26"}
319
+ {"current_steps": 318, "total_steps": 555, "loss": 0.5117, "lr": 3.6855359840703525e-05, "epoch": 2.861642294713161, "percentage": 57.3, "elapsed_time": "10:28:34", "remaining_time": "7:48:27"}
320
+ {"current_steps": 319, "total_steps": 555, "loss": 0.515, "lr": 3.660437217042145e-05, "epoch": 2.8706411698537684, "percentage": 57.48, "elapsed_time": "10:30:32", "remaining_time": "7:46:29"}
321
+ {"current_steps": 320, "total_steps": 555, "loss": 0.5114, "lr": 3.63535190915373e-05, "epoch": 2.8796400449943755, "percentage": 57.66, "elapsed_time": "10:32:30", "remaining_time": "7:44:30"}
322
+ {"current_steps": 321, "total_steps": 555, "loss": 0.512, "lr": 3.610281054703311e-05, "epoch": 2.888638920134983, "percentage": 57.84, "elapsed_time": "10:34:28", "remaining_time": "7:42:31"}
323
+ {"current_steps": 322, "total_steps": 555, "loss": 0.513, "lr": 3.58522564741621e-05, "epoch": 2.8976377952755907, "percentage": 58.02, "elapsed_time": "10:36:24", "remaining_time": "7:40:30"}
324
+ {"current_steps": 323, "total_steps": 555, "loss": 0.5092, "lr": 3.560186680405469e-05, "epoch": 2.906636670416198, "percentage": 58.2, "elapsed_time": "10:38:22", "remaining_time": "7:38:31"}
325
+ {"current_steps": 324, "total_steps": 555, "loss": 0.5143, "lr": 3.535165146132494e-05, "epoch": 2.9156355455568055, "percentage": 58.38, "elapsed_time": "10:40:18", "remaining_time": "7:36:31"}
326
+ {"current_steps": 325, "total_steps": 555, "loss": 0.5044, "lr": 3.51016203636772e-05, "epoch": 2.924634420697413, "percentage": 58.56, "elapsed_time": "10:42:14", "remaining_time": "7:34:30"}
327
+ {"current_steps": 326, "total_steps": 555, "loss": 0.5151, "lr": 3.485178342151287e-05, "epoch": 2.9336332958380202, "percentage": 58.74, "elapsed_time": "10:44:11", "remaining_time": "7:32:30"}
328
+ {"current_steps": 327, "total_steps": 555, "loss": 0.506, "lr": 3.460215053753776e-05, "epoch": 2.942632170978628, "percentage": 58.92, "elapsed_time": "10:46:07", "remaining_time": "7:30:30"}
329
+ {"current_steps": 328, "total_steps": 555, "loss": 0.5106, "lr": 3.435273160636942e-05, "epoch": 2.951631046119235, "percentage": 59.1, "elapsed_time": "10:48:03", "remaining_time": "7:28:30"}
330
+ {"current_steps": 329, "total_steps": 555, "loss": 0.509, "lr": 3.410353651414507e-05, "epoch": 2.9606299212598426, "percentage": 59.28, "elapsed_time": "10:50:00", "remaining_time": "7:26:30"}
331
+ {"current_steps": 330, "total_steps": 555, "loss": 0.5119, "lr": 3.385457513812968e-05, "epoch": 2.9696287964004497, "percentage": 59.46, "elapsed_time": "10:51:56", "remaining_time": "7:24:30"}
332
+ {"current_steps": 331, "total_steps": 555, "loss": 0.5105, "lr": 3.360585734632448e-05, "epoch": 2.9786276715410573, "percentage": 59.64, "elapsed_time": "10:53:51", "remaining_time": "7:22:29"}
333
+ {"current_steps": 332, "total_steps": 555, "loss": 0.51, "lr": 3.3357392997075854e-05, "epoch": 2.987626546681665, "percentage": 59.82, "elapsed_time": "10:55:49", "remaining_time": "7:20:30"}
334
+ {"current_steps": 333, "total_steps": 555, "loss": 0.5096, "lr": 3.3109191938684535e-05, "epoch": 2.996625421822272, "percentage": 60.0, "elapsed_time": "10:57:47", "remaining_time": "7:18:31"}
335
+ {"current_steps": 334, "total_steps": 555, "loss": 0.9217, "lr": 3.28612640090153e-05, "epoch": 3.0056242969628797, "percentage": 60.18, "elapsed_time": "11:01:34", "remaining_time": "7:17:44"}