sedrickkeh commited on
Commit
9a213fc
·
verified ·
1 Parent(s): 74fcb74

Training in progress, epoch 2

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:dbbc85295a0f747318048947ff76d73957719b02ad7e574bb97089c6a90e5cc6
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:56a2845d11c95bfe85f53e7d4f08a21124d2eefd63af0cf5b8fe0e86158f0226
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f0140e7104568ddb51835633a91919aedc336d63586b7b3cd10a7e207179d970
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4686484a9ba5a32d6d58ac5c6bb31eedde12b81bee3cfbc3a3f36fc90b35325c
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f88e8e51c9504fde9e1f8db68e13dc82df5a3a29455a3fb815f6bb03f501a864
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1453d82db80365b683dafcf4913ce594c47b6f5708856bbdbacc5da894887095
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8440328864a5d28d87af68b2ed409efc60e6d6fa66b833fc4b939da825157e86
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:537500fd46fc15b5313e71b758e751ab0ee8e9447c474457ef2729a417ecaaf1
3
  size 1089994880
trainer_log.jsonl CHANGED
@@ -293,3 +293,150 @@
293
  {"current_steps": 293, "total_steps": 735, "loss": 0.6882, "lr": 6.0219118809536794e-05, "epoch": 1.9872827469266638, "percentage": 39.86, "elapsed_time": "18:01:41", "remaining_time": "1 day, 3:11:46"}
294
  {"current_steps": 294, "total_steps": 735, "loss": 0.6769, "lr": 6.0054855343047914e-05, "epoch": 1.9940652818991098, "percentage": 40.0, "elapsed_time": "18:05:22", "remaining_time": "1 day, 3:08:03"}
295
  {"current_steps": 295, "total_steps": 735, "loss": 1.0693, "lr": 5.989013885847117e-05, "epoch": 2.0008478168715556, "percentage": 40.14, "elapsed_time": "18:10:35", "remaining_time": "1 day, 3:06:38"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
293
  {"current_steps": 293, "total_steps": 735, "loss": 0.6882, "lr": 6.0219118809536794e-05, "epoch": 1.9872827469266638, "percentage": 39.86, "elapsed_time": "18:01:41", "remaining_time": "1 day, 3:11:46"}
294
  {"current_steps": 294, "total_steps": 735, "loss": 0.6769, "lr": 6.0054855343047914e-05, "epoch": 1.9940652818991098, "percentage": 40.0, "elapsed_time": "18:05:22", "remaining_time": "1 day, 3:08:03"}
295
  {"current_steps": 295, "total_steps": 735, "loss": 1.0693, "lr": 5.989013885847117e-05, "epoch": 2.0008478168715556, "percentage": 40.14, "elapsed_time": "18:10:35", "remaining_time": "1 day, 3:06:38"}
296
+ {"current_steps": 296, "total_steps": 735, "loss": 0.6673, "lr": 5.972497307657869e-05, "epoch": 2.0076303518440017, "percentage": 40.27, "elapsed_time": "18:14:16", "remaining_time": "1 day, 3:02:55"}
297
+ {"current_steps": 297, "total_steps": 735, "loss": 0.6676, "lr": 5.955936172829179e-05, "epoch": 2.0144128868164475, "percentage": 40.41, "elapsed_time": "18:17:57", "remaining_time": "1 day, 2:59:13"}
298
+ {"current_steps": 298, "total_steps": 735, "loss": 0.6551, "lr": 5.939330855459661e-05, "epoch": 2.0211954217888937, "percentage": 40.54, "elapsed_time": "18:21:39", "remaining_time": "1 day, 2:55:30"}
299
+ {"current_steps": 299, "total_steps": 735, "loss": 0.6723, "lr": 5.922681730645968e-05, "epoch": 2.0279779567613394, "percentage": 40.68, "elapsed_time": "18:25:20", "remaining_time": "1 day, 2:51:48"}
300
+ {"current_steps": 300, "total_steps": 735, "loss": 0.6509, "lr": 5.905989174474319e-05, "epoch": 2.0347604917337856, "percentage": 40.82, "elapsed_time": "18:29:01", "remaining_time": "1 day, 2:48:05"}
301
+ {"current_steps": 301, "total_steps": 735, "loss": 0.6577, "lr": 5.889253564011999e-05, "epoch": 2.0415430267062313, "percentage": 40.95, "elapsed_time": "18:32:43", "remaining_time": "1 day, 2:44:23"}
302
+ {"current_steps": 302, "total_steps": 735, "loss": 0.6665, "lr": 5.872475277298847e-05, "epoch": 2.0483255616786775, "percentage": 41.09, "elapsed_time": "18:36:24", "remaining_time": "1 day, 2:40:40"}
303
+ {"current_steps": 303, "total_steps": 735, "loss": 0.6556, "lr": 5.855654693338711e-05, "epoch": 2.0551080966511233, "percentage": 41.22, "elapsed_time": "18:40:04", "remaining_time": "1 day, 2:36:56"}
304
+ {"current_steps": 304, "total_steps": 735, "loss": 0.6604, "lr": 5.838792192090889e-05, "epoch": 2.0618906316235694, "percentage": 41.36, "elapsed_time": "18:43:45", "remaining_time": "1 day, 2:33:13"}
305
+ {"current_steps": 305, "total_steps": 735, "loss": 0.6593, "lr": 5.821888154461549e-05, "epoch": 2.068673166596015, "percentage": 41.5, "elapsed_time": "18:47:26", "remaining_time": "1 day, 2:29:30"}
306
+ {"current_steps": 306, "total_steps": 735, "loss": 0.6637, "lr": 5.8049429622951194e-05, "epoch": 2.0754557015684614, "percentage": 41.63, "elapsed_time": "18:51:08", "remaining_time": "1 day, 2:25:48"}
307
+ {"current_steps": 307, "total_steps": 735, "loss": 0.6433, "lr": 5.7879569983656694e-05, "epoch": 2.082238236540907, "percentage": 41.77, "elapsed_time": "18:54:49", "remaining_time": "1 day, 2:22:06"}
308
+ {"current_steps": 308, "total_steps": 735, "loss": 0.6681, "lr": 5.770930646368257e-05, "epoch": 2.0890207715133533, "percentage": 41.9, "elapsed_time": "18:58:30", "remaining_time": "1 day, 2:18:23"}
309
+ {"current_steps": 309, "total_steps": 735, "loss": 0.6571, "lr": 5.7538642909102654e-05, "epoch": 2.095803306485799, "percentage": 42.04, "elapsed_time": "19:02:11", "remaining_time": "1 day, 2:14:40"}
310
+ {"current_steps": 310, "total_steps": 735, "loss": 0.6462, "lr": 5.736758317502714e-05, "epoch": 2.1025858414582452, "percentage": 42.18, "elapsed_time": "19:05:52", "remaining_time": "1 day, 2:10:56"}
311
+ {"current_steps": 311, "total_steps": 735, "loss": 0.642, "lr": 5.719613112551546e-05, "epoch": 2.109368376430691, "percentage": 42.31, "elapsed_time": "19:09:33", "remaining_time": "1 day, 2:07:14"}
312
+ {"current_steps": 312, "total_steps": 735, "loss": 0.6523, "lr": 5.702429063348912e-05, "epoch": 2.1161509114031367, "percentage": 42.45, "elapsed_time": "19:13:14", "remaining_time": "1 day, 2:03:31"}
313
+ {"current_steps": 313, "total_steps": 735, "loss": 0.6485, "lr": 5.685206558064407e-05, "epoch": 2.122933446375583, "percentage": 42.59, "elapsed_time": "19:16:55", "remaining_time": "1 day, 1:59:48"}
314
+ {"current_steps": 314, "total_steps": 735, "loss": 0.6622, "lr": 5.667945985736308e-05, "epoch": 2.1297159813480286, "percentage": 42.72, "elapsed_time": "19:20:36", "remaining_time": "1 day, 1:56:05"}
315
+ {"current_steps": 315, "total_steps": 735, "loss": 0.6598, "lr": 5.6506477362627926e-05, "epoch": 2.136498516320475, "percentage": 42.86, "elapsed_time": "19:24:17", "remaining_time": "1 day, 1:52:23"}
316
+ {"current_steps": 316, "total_steps": 735, "loss": 0.6631, "lr": 5.6333122003931186e-05, "epoch": 2.1432810512929206, "percentage": 42.99, "elapsed_time": "19:27:58", "remaining_time": "1 day, 1:48:40"}
317
+ {"current_steps": 317, "total_steps": 735, "loss": 0.6543, "lr": 5.615939769718809e-05, "epoch": 2.1500635862653668, "percentage": 43.13, "elapsed_time": "19:31:40", "remaining_time": "1 day, 1:44:58"}
318
+ {"current_steps": 318, "total_steps": 735, "loss": 0.6453, "lr": 5.5985308366647985e-05, "epoch": 2.1568461212378125, "percentage": 43.27, "elapsed_time": "19:35:21", "remaining_time": "1 day, 1:41:15"}
319
+ {"current_steps": 319, "total_steps": 735, "loss": 0.6466, "lr": 5.5810857944805744e-05, "epoch": 2.1636286562102587, "percentage": 43.4, "elapsed_time": "19:39:01", "remaining_time": "1 day, 1:37:32"}
320
+ {"current_steps": 320, "total_steps": 735, "loss": 0.6776, "lr": 5.5636050372312896e-05, "epoch": 2.1704111911827044, "percentage": 43.54, "elapsed_time": "19:42:42", "remaining_time": "1 day, 1:33:49"}
321
+ {"current_steps": 321, "total_steps": 735, "loss": 0.6517, "lr": 5.546088959788862e-05, "epoch": 2.1771937261551506, "percentage": 43.67, "elapsed_time": "19:46:23", "remaining_time": "1 day, 1:30:06"}
322
+ {"current_steps": 322, "total_steps": 735, "loss": 0.6565, "lr": 5.528537957823061e-05, "epoch": 2.1839762611275964, "percentage": 43.81, "elapsed_time": "19:50:04", "remaining_time": "1 day, 1:26:23"}
323
+ {"current_steps": 323, "total_steps": 735, "loss": 0.6587, "lr": 5.510952427792559e-05, "epoch": 2.1907587961000425, "percentage": 43.95, "elapsed_time": "19:53:45", "remaining_time": "1 day, 1:22:41"}
324
+ {"current_steps": 324, "total_steps": 735, "loss": 0.6433, "lr": 5.493332766935981e-05, "epoch": 2.1975413310724883, "percentage": 44.08, "elapsed_time": "19:57:26", "remaining_time": "1 day, 1:18:58"}
325
+ {"current_steps": 325, "total_steps": 735, "loss": 0.6578, "lr": 5.4756793732629335e-05, "epoch": 2.2043238660449345, "percentage": 44.22, "elapsed_time": "20:01:07", "remaining_time": "1 day, 1:15:15"}
326
+ {"current_steps": 326, "total_steps": 735, "loss": 0.6499, "lr": 5.45799264554501e-05, "epoch": 2.21110640101738, "percentage": 44.35, "elapsed_time": "20:04:48", "remaining_time": "1 day, 1:11:32"}
327
+ {"current_steps": 327, "total_steps": 735, "loss": 0.6394, "lr": 5.440272983306789e-05, "epoch": 2.2178889359898264, "percentage": 44.49, "elapsed_time": "20:08:29", "remaining_time": "1 day, 1:07:50"}
328
+ {"current_steps": 328, "total_steps": 735, "loss": 0.6554, "lr": 5.4225207868167994e-05, "epoch": 2.224671470962272, "percentage": 44.63, "elapsed_time": "20:12:09", "remaining_time": "1 day, 1:04:07"}
329
+ {"current_steps": 329, "total_steps": 735, "loss": 0.6482, "lr": 5.404736457078489e-05, "epoch": 2.231454005934718, "percentage": 44.76, "elapsed_time": "20:15:50", "remaining_time": "1 day, 1:00:24"}
330
+ {"current_steps": 330, "total_steps": 735, "loss": 0.6503, "lr": 5.38692039582116e-05, "epoch": 2.238236540907164, "percentage": 44.9, "elapsed_time": "20:19:31", "remaining_time": "1 day, 0:56:41"}
331
+ {"current_steps": 331, "total_steps": 735, "loss": 0.6468, "lr": 5.3690730054908985e-05, "epoch": 2.24501907587961, "percentage": 45.03, "elapsed_time": "20:23:13", "remaining_time": "1 day, 0:52:59"}
332
+ {"current_steps": 332, "total_steps": 735, "loss": 0.6518, "lr": 5.3511946892414775e-05, "epoch": 2.251801610852056, "percentage": 45.17, "elapsed_time": "20:26:53", "remaining_time": "1 day, 0:49:16"}
333
+ {"current_steps": 333, "total_steps": 735, "loss": 0.6565, "lr": 5.333285850925256e-05, "epoch": 2.2585841458245017, "percentage": 45.31, "elapsed_time": "20:30:34", "remaining_time": "1 day, 0:45:33"}
334
+ {"current_steps": 334, "total_steps": 735, "loss": 0.6564, "lr": 5.315346895084056e-05, "epoch": 2.265366680796948, "percentage": 45.44, "elapsed_time": "20:34:15", "remaining_time": "1 day, 0:41:51"}
335
+ {"current_steps": 335, "total_steps": 735, "loss": 0.6516, "lr": 5.297378226940019e-05, "epoch": 2.2721492157693937, "percentage": 45.58, "elapsed_time": "20:37:56", "remaining_time": "1 day, 0:38:08"}
336
+ {"current_steps": 336, "total_steps": 735, "loss": 0.6626, "lr": 5.279380252386461e-05, "epoch": 2.27893175074184, "percentage": 45.71, "elapsed_time": "20:41:38", "remaining_time": "1 day, 0:34:26"}
337
+ {"current_steps": 337, "total_steps": 735, "loss": 0.6663, "lr": 5.2613533779786945e-05, "epoch": 2.2857142857142856, "percentage": 45.85, "elapsed_time": "20:45:19", "remaining_time": "1 day, 0:30:44"}
338
+ {"current_steps": 338, "total_steps": 735, "loss": 0.6408, "lr": 5.243298010924852e-05, "epoch": 2.2924968206867318, "percentage": 45.99, "elapsed_time": "20:48:59", "remaining_time": "1 day, 0:27:00"}
339
+ {"current_steps": 339, "total_steps": 735, "loss": 0.6435, "lr": 5.225214559076683e-05, "epoch": 2.2992793556591775, "percentage": 46.12, "elapsed_time": "20:52:40", "remaining_time": "1 day, 0:23:18"}
340
+ {"current_steps": 340, "total_steps": 735, "loss": 0.6395, "lr": 5.207103430920345e-05, "epoch": 2.3060618906316237, "percentage": 46.26, "elapsed_time": "20:56:22", "remaining_time": "1 day, 0:19:36"}
341
+ {"current_steps": 341, "total_steps": 735, "loss": 0.654, "lr": 5.1889650355671725e-05, "epoch": 2.3128444256040694, "percentage": 46.39, "elapsed_time": "21:00:03", "remaining_time": "1 day, 0:15:53"}
342
+ {"current_steps": 342, "total_steps": 735, "loss": 0.6546, "lr": 5.1707997827444394e-05, "epoch": 2.3196269605765156, "percentage": 46.53, "elapsed_time": "21:03:44", "remaining_time": "1 day, 0:12:11"}
343
+ {"current_steps": 343, "total_steps": 735, "loss": 0.6646, "lr": 5.152608082786098e-05, "epoch": 2.3264094955489614, "percentage": 46.67, "elapsed_time": "21:07:24", "remaining_time": "1 day, 0:08:28"}
344
+ {"current_steps": 344, "total_steps": 735, "loss": 0.648, "lr": 5.1343903466235174e-05, "epoch": 2.3331920305214076, "percentage": 46.8, "elapsed_time": "21:11:05", "remaining_time": "1 day, 0:04:45"}
345
+ {"current_steps": 345, "total_steps": 735, "loss": 0.6593, "lr": 5.116146985776194e-05, "epoch": 2.3399745654938533, "percentage": 46.94, "elapsed_time": "21:14:45", "remaining_time": "1 day, 0:01:01"}
346
+ {"current_steps": 346, "total_steps": 735, "loss": 0.6516, "lr": 5.0978784123424617e-05, "epoch": 2.3467571004662995, "percentage": 47.07, "elapsed_time": "21:18:25", "remaining_time": "23:57:18"}
347
+ {"current_steps": 347, "total_steps": 735, "loss": 0.6638, "lr": 5.0795850389901784e-05, "epoch": 2.3535396354387452, "percentage": 47.21, "elapsed_time": "21:22:06", "remaining_time": "23:53:35"}
348
+ {"current_steps": 348, "total_steps": 735, "loss": 0.6457, "lr": 5.061267278947408e-05, "epoch": 2.360322170411191, "percentage": 47.35, "elapsed_time": "21:25:46", "remaining_time": "23:49:52"}
349
+ {"current_steps": 349, "total_steps": 735, "loss": 0.6584, "lr": 5.042925545993079e-05, "epoch": 2.367104705383637, "percentage": 47.48, "elapsed_time": "21:29:27", "remaining_time": "23:46:09"}
350
+ {"current_steps": 350, "total_steps": 735, "loss": 0.6348, "lr": 5.02456025444765e-05, "epoch": 2.373887240356083, "percentage": 47.62, "elapsed_time": "21:33:08", "remaining_time": "23:42:27"}
351
+ {"current_steps": 351, "total_steps": 735, "loss": 0.6574, "lr": 5.0061718191637394e-05, "epoch": 2.380669775328529, "percentage": 47.76, "elapsed_time": "21:36:49", "remaining_time": "23:38:45"}
352
+ {"current_steps": 352, "total_steps": 735, "loss": 0.6502, "lr": 4.987760655516757e-05, "epoch": 2.387452310300975, "percentage": 47.89, "elapsed_time": "21:40:31", "remaining_time": "23:35:03"}
353
+ {"current_steps": 353, "total_steps": 735, "loss": 0.6468, "lr": 4.9693271793955255e-05, "epoch": 2.394234845273421, "percentage": 48.03, "elapsed_time": "21:44:11", "remaining_time": "23:31:20"}
354
+ {"current_steps": 354, "total_steps": 735, "loss": 0.6486, "lr": 4.95087180719288e-05, "epoch": 2.4010173802458668, "percentage": 48.16, "elapsed_time": "21:47:52", "remaining_time": "23:27:37"}
355
+ {"current_steps": 355, "total_steps": 735, "loss": 0.6477, "lr": 4.9323949557962684e-05, "epoch": 2.407799915218313, "percentage": 48.3, "elapsed_time": "21:51:32", "remaining_time": "23:23:54"}
356
+ {"current_steps": 356, "total_steps": 735, "loss": 0.6479, "lr": 4.913897042578327e-05, "epoch": 2.4145824501907587, "percentage": 48.44, "elapsed_time": "21:55:14", "remaining_time": "23:20:12"}
357
+ {"current_steps": 357, "total_steps": 735, "loss": 0.6605, "lr": 4.8953784853874624e-05, "epoch": 2.421364985163205, "percentage": 48.57, "elapsed_time": "21:58:55", "remaining_time": "23:16:30"}
358
+ {"current_steps": 358, "total_steps": 735, "loss": 0.6414, "lr": 4.8768397025383996e-05, "epoch": 2.4281475201356506, "percentage": 48.71, "elapsed_time": "22:02:36", "remaining_time": "23:12:48"}
359
+ {"current_steps": 359, "total_steps": 735, "loss": 0.6526, "lr": 4.858281112802745e-05, "epoch": 2.434930055108097, "percentage": 48.84, "elapsed_time": "22:06:17", "remaining_time": "23:09:06"}
360
+ {"current_steps": 360, "total_steps": 735, "loss": 0.6503, "lr": 4.83970313539952e-05, "epoch": 2.4417125900805425, "percentage": 48.98, "elapsed_time": "22:09:59", "remaining_time": "23:05:24"}
361
+ {"current_steps": 361, "total_steps": 735, "loss": 0.6447, "lr": 4.821106189985693e-05, "epoch": 2.4484951250529887, "percentage": 49.12, "elapsed_time": "22:13:39", "remaining_time": "23:01:41"}
362
+ {"current_steps": 362, "total_steps": 735, "loss": 0.6566, "lr": 4.8024906966467e-05, "epoch": 2.4552776600254345, "percentage": 49.25, "elapsed_time": "22:17:21", "remaining_time": "22:58:00"}
363
+ {"current_steps": 363, "total_steps": 735, "loss": 0.6614, "lr": 4.783857075886956e-05, "epoch": 2.4620601949978806, "percentage": 49.39, "elapsed_time": "22:21:02", "remaining_time": "22:54:17"}
364
+ {"current_steps": 364, "total_steps": 735, "loss": 0.6446, "lr": 4.7652057486203525e-05, "epoch": 2.4688427299703264, "percentage": 49.52, "elapsed_time": "22:24:43", "remaining_time": "22:50:35"}
365
+ {"current_steps": 365, "total_steps": 735, "loss": 0.6563, "lr": 4.746537136160757e-05, "epoch": 2.4756252649427726, "percentage": 49.66, "elapsed_time": "22:28:25", "remaining_time": "22:46:53"}
366
+ {"current_steps": 366, "total_steps": 735, "loss": 0.6502, "lr": 4.727851660212487e-05, "epoch": 2.4824077999152183, "percentage": 49.8, "elapsed_time": "22:32:06", "remaining_time": "22:43:11"}
367
+ {"current_steps": 367, "total_steps": 735, "loss": 0.6424, "lr": 4.709149742860792e-05, "epoch": 2.489190334887664, "percentage": 49.93, "elapsed_time": "22:35:47", "remaining_time": "22:39:29"}
368
+ {"current_steps": 368, "total_steps": 735, "loss": 0.6496, "lr": 4.690431806562311e-05, "epoch": 2.4959728698601102, "percentage": 50.07, "elapsed_time": "22:39:28", "remaining_time": "22:35:46"}
369
+ {"current_steps": 369, "total_steps": 735, "loss": 0.6533, "lr": 4.6716982741355386e-05, "epoch": 2.5027554048325564, "percentage": 50.2, "elapsed_time": "22:43:09", "remaining_time": "22:32:04"}
370
+ {"current_steps": 370, "total_steps": 735, "loss": 0.6402, "lr": 4.652949568751267e-05, "epoch": 2.509537939805002, "percentage": 50.34, "elapsed_time": "22:46:50", "remaining_time": "22:28:22"}
371
+ {"current_steps": 371, "total_steps": 735, "loss": 0.6482, "lr": 4.63418611392303e-05, "epoch": 2.516320474777448, "percentage": 50.48, "elapsed_time": "22:50:31", "remaining_time": "22:24:40"}
372
+ {"current_steps": 372, "total_steps": 735, "loss": 0.6522, "lr": 4.615408333497538e-05, "epoch": 2.523103009749894, "percentage": 50.61, "elapsed_time": "22:54:12", "remaining_time": "22:20:57"}
373
+ {"current_steps": 373, "total_steps": 735, "loss": 0.6573, "lr": 4.5966166516450985e-05, "epoch": 2.52988554472234, "percentage": 50.75, "elapsed_time": "22:57:53", "remaining_time": "22:17:15"}
374
+ {"current_steps": 374, "total_steps": 735, "loss": 0.6598, "lr": 4.577811492850039e-05, "epoch": 2.536668079694786, "percentage": 50.88, "elapsed_time": "23:01:34", "remaining_time": "22:13:33"}
375
+ {"current_steps": 375, "total_steps": 735, "loss": 0.6465, "lr": 4.558993281901116e-05, "epoch": 2.5434506146672318, "percentage": 51.02, "elapsed_time": "23:05:15", "remaining_time": "22:09:50"}
376
+ {"current_steps": 376, "total_steps": 735, "loss": 0.6488, "lr": 4.540162443881922e-05, "epoch": 2.550233149639678, "percentage": 51.16, "elapsed_time": "23:08:55", "remaining_time": "22:06:07"}
377
+ {"current_steps": 377, "total_steps": 735, "loss": 0.648, "lr": 4.5213194041612824e-05, "epoch": 2.5570156846121237, "percentage": 51.29, "elapsed_time": "23:12:36", "remaining_time": "22:02:25"}
378
+ {"current_steps": 378, "total_steps": 735, "loss": 0.6579, "lr": 4.5024645883836426e-05, "epoch": 2.56379821958457, "percentage": 51.43, "elapsed_time": "23:16:17", "remaining_time": "21:58:42"}
379
+ {"current_steps": 379, "total_steps": 735, "loss": 0.6621, "lr": 4.4835984224594586e-05, "epoch": 2.5705807545570156, "percentage": 51.56, "elapsed_time": "23:19:57", "remaining_time": "21:55:00"}
380
+ {"current_steps": 380, "total_steps": 735, "loss": 0.6512, "lr": 4.464721332555577e-05, "epoch": 2.577363289529462, "percentage": 51.7, "elapsed_time": "23:23:38", "remaining_time": "21:51:17"}
381
+ {"current_steps": 381, "total_steps": 735, "loss": 0.6492, "lr": 4.445833745085602e-05, "epoch": 2.5841458245019076, "percentage": 51.84, "elapsed_time": "23:27:19", "remaining_time": "21:47:35"}
382
+ {"current_steps": 382, "total_steps": 735, "loss": 0.6589, "lr": 4.4269360867002675e-05, "epoch": 2.5909283594743533, "percentage": 51.97, "elapsed_time": "23:31:00", "remaining_time": "21:43:53"}
383
+ {"current_steps": 383, "total_steps": 735, "loss": 0.6493, "lr": 4.408028784277799e-05, "epoch": 2.5977108944467995, "percentage": 52.11, "elapsed_time": "23:34:41", "remaining_time": "21:40:11"}
384
+ {"current_steps": 384, "total_steps": 735, "loss": 0.6589, "lr": 4.389112264914273e-05, "epoch": 2.6044934294192457, "percentage": 52.24, "elapsed_time": "23:38:23", "remaining_time": "21:36:29"}
385
+ {"current_steps": 385, "total_steps": 735, "loss": 0.6561, "lr": 4.370186955913962e-05, "epoch": 2.6112759643916914, "percentage": 52.38, "elapsed_time": "23:42:04", "remaining_time": "21:32:47"}
386
+ {"current_steps": 386, "total_steps": 735, "loss": 0.6552, "lr": 4.351253284779692e-05, "epoch": 2.618058499364137, "percentage": 52.52, "elapsed_time": "23:45:45", "remaining_time": "21:29:05"}
387
+ {"current_steps": 387, "total_steps": 735, "loss": 0.6364, "lr": 4.332311679203177e-05, "epoch": 2.6248410343365833, "percentage": 52.65, "elapsed_time": "23:49:26", "remaining_time": "21:25:23"}
388
+ {"current_steps": 388, "total_steps": 735, "loss": 0.6502, "lr": 4.313362567055367e-05, "epoch": 2.6316235693090295, "percentage": 52.79, "elapsed_time": "23:53:07", "remaining_time": "21:21:41"}
389
+ {"current_steps": 389, "total_steps": 735, "loss": 0.6561, "lr": 4.294406376376771e-05, "epoch": 2.6384061042814753, "percentage": 52.93, "elapsed_time": "23:56:48", "remaining_time": "21:17:59"}
390
+ {"current_steps": 390, "total_steps": 735, "loss": 0.6567, "lr": 4.2754435353677985e-05, "epoch": 2.645188639253921, "percentage": 53.06, "elapsed_time": "1 day, 0:00:29", "remaining_time": "21:14:16"}
391
+ {"current_steps": 391, "total_steps": 735, "loss": 0.6568, "lr": 4.2564744723790835e-05, "epoch": 2.651971174226367, "percentage": 53.2, "elapsed_time": "1 day, 0:04:10", "remaining_time": "21:10:34"}
392
+ {"current_steps": 392, "total_steps": 735, "loss": 0.6552, "lr": 4.237499615901805e-05, "epoch": 2.658753709198813, "percentage": 53.33, "elapsed_time": "1 day, 0:07:51", "remaining_time": "21:06:52"}
393
+ {"current_steps": 393, "total_steps": 735, "loss": 0.6333, "lr": 4.218519394558013e-05, "epoch": 2.665536244171259, "percentage": 53.47, "elapsed_time": "1 day, 0:11:32", "remaining_time": "21:03:10"}
394
+ {"current_steps": 394, "total_steps": 735, "loss": 0.6501, "lr": 4.199534237090943e-05, "epoch": 2.672318779143705, "percentage": 53.61, "elapsed_time": "1 day, 0:15:13", "remaining_time": "20:59:28"}
395
+ {"current_steps": 395, "total_steps": 735, "loss": 0.648, "lr": 4.1805445723553346e-05, "epoch": 2.679101314116151, "percentage": 53.74, "elapsed_time": "1 day, 0:18:54", "remaining_time": "20:55:46"}
396
+ {"current_steps": 396, "total_steps": 735, "loss": 0.6544, "lr": 4.1615508293077394e-05, "epoch": 2.685883849088597, "percentage": 53.88, "elapsed_time": "1 day, 0:22:35", "remaining_time": "20:52:03"}
397
+ {"current_steps": 397, "total_steps": 735, "loss": 0.6558, "lr": 4.142553436996834e-05, "epoch": 2.692666384061043, "percentage": 54.01, "elapsed_time": "1 day, 0:26:16", "remaining_time": "20:48:22"}
398
+ {"current_steps": 398, "total_steps": 735, "loss": 0.6354, "lr": 4.12355282455373e-05, "epoch": 2.6994489190334887, "percentage": 54.15, "elapsed_time": "1 day, 0:29:57", "remaining_time": "20:44:39"}
399
+ {"current_steps": 399, "total_steps": 735, "loss": 0.6493, "lr": 4.1045494211822756e-05, "epoch": 2.706231454005935, "percentage": 54.29, "elapsed_time": "1 day, 0:33:37", "remaining_time": "20:40:57"}
400
+ {"current_steps": 400, "total_steps": 735, "loss": 0.6397, "lr": 4.085543656149365e-05, "epoch": 2.7130139889783806, "percentage": 54.42, "elapsed_time": "1 day, 0:37:18", "remaining_time": "20:37:15"}
401
+ {"current_steps": 401, "total_steps": 735, "loss": 0.6537, "lr": 4.0665359587752394e-05, "epoch": 2.7197965239508264, "percentage": 54.56, "elapsed_time": "1 day, 0:41:00", "remaining_time": "20:33:33"}
402
+ {"current_steps": 402, "total_steps": 735, "loss": 0.656, "lr": 4.04752675842379e-05, "epoch": 2.7265790589232726, "percentage": 54.69, "elapsed_time": "1 day, 0:44:40", "remaining_time": "20:29:50"}
403
+ {"current_steps": 403, "total_steps": 735, "loss": 0.6424, "lr": 4.028516484492857e-05, "epoch": 2.7333615938957188, "percentage": 54.83, "elapsed_time": "1 day, 0:48:21", "remaining_time": "20:26:08"}
404
+ {"current_steps": 404, "total_steps": 735, "loss": 0.6377, "lr": 4.009505566404535e-05, "epoch": 2.7401441288681645, "percentage": 54.97, "elapsed_time": "1 day, 0:52:02", "remaining_time": "20:22:26"}
405
+ {"current_steps": 405, "total_steps": 735, "loss": 0.6518, "lr": 3.990494433595466e-05, "epoch": 2.7469266638406102, "percentage": 55.1, "elapsed_time": "1 day, 0:55:43", "remaining_time": "20:18:43"}
406
+ {"current_steps": 406, "total_steps": 735, "loss": 0.6536, "lr": 3.9714835155071435e-05, "epoch": 2.7537091988130564, "percentage": 55.24, "elapsed_time": "1 day, 0:59:23", "remaining_time": "20:15:01"}
407
+ {"current_steps": 407, "total_steps": 735, "loss": 0.6583, "lr": 3.952473241576211e-05, "epoch": 2.760491733785502, "percentage": 55.37, "elapsed_time": "1 day, 1:03:05", "remaining_time": "20:11:19"}
408
+ {"current_steps": 408, "total_steps": 735, "loss": 0.6545, "lr": 3.933464041224761e-05, "epoch": 2.7672742687579484, "percentage": 55.51, "elapsed_time": "1 day, 1:06:46", "remaining_time": "20:07:38"}
409
+ {"current_steps": 409, "total_steps": 735, "loss": 0.6513, "lr": 3.914456343850637e-05, "epoch": 2.774056803730394, "percentage": 55.65, "elapsed_time": "1 day, 1:10:28", "remaining_time": "20:03:56"}
410
+ {"current_steps": 410, "total_steps": 735, "loss": 0.6548, "lr": 3.895450578817727e-05, "epoch": 2.7808393387028403, "percentage": 55.78, "elapsed_time": "1 day, 1:14:08", "remaining_time": "20:00:14"}
411
+ {"current_steps": 411, "total_steps": 735, "loss": 0.654, "lr": 3.8764471754462714e-05, "epoch": 2.787621873675286, "percentage": 55.92, "elapsed_time": "1 day, 1:17:49", "remaining_time": "19:56:32"}
412
+ {"current_steps": 412, "total_steps": 735, "loss": 0.651, "lr": 3.857446563003167e-05, "epoch": 2.794404408647732, "percentage": 56.05, "elapsed_time": "1 day, 1:21:31", "remaining_time": "19:52:50"}
413
+ {"current_steps": 413, "total_steps": 735, "loss": 0.6418, "lr": 3.838449170692262e-05, "epoch": 2.801186943620178, "percentage": 56.19, "elapsed_time": "1 day, 1:25:12", "remaining_time": "19:49:08"}
414
+ {"current_steps": 414, "total_steps": 735, "loss": 0.6566, "lr": 3.819455427644666e-05, "epoch": 2.807969478592624, "percentage": 56.33, "elapsed_time": "1 day, 1:28:53", "remaining_time": "19:45:27"}
415
+ {"current_steps": 415, "total_steps": 735, "loss": 0.6494, "lr": 3.800465762909057e-05, "epoch": 2.81475201356507, "percentage": 56.46, "elapsed_time": "1 day, 1:32:34", "remaining_time": "19:41:44"}
416
+ {"current_steps": 416, "total_steps": 735, "loss": 0.6504, "lr": 3.781480605441989e-05, "epoch": 2.821534548537516, "percentage": 56.6, "elapsed_time": "1 day, 1:36:16", "remaining_time": "19:38:03"}
417
+ {"current_steps": 417, "total_steps": 735, "loss": 0.6515, "lr": 3.7625003840981976e-05, "epoch": 2.828317083509962, "percentage": 56.73, "elapsed_time": "1 day, 1:39:56", "remaining_time": "19:34:20"}
418
+ {"current_steps": 418, "total_steps": 735, "loss": 0.6482, "lr": 3.743525527620918e-05, "epoch": 2.835099618482408, "percentage": 56.87, "elapsed_time": "1 day, 1:43:36", "remaining_time": "19:30:38"}
419
+ {"current_steps": 419, "total_steps": 735, "loss": 0.6558, "lr": 3.724556464632203e-05, "epoch": 2.8418821534548537, "percentage": 57.01, "elapsed_time": "1 day, 1:47:18", "remaining_time": "19:26:56"}
420
+ {"current_steps": 420, "total_steps": 735, "loss": 0.6283, "lr": 3.7055936236232296e-05, "epoch": 2.8486646884272995, "percentage": 57.14, "elapsed_time": "1 day, 1:50:58", "remaining_time": "19:23:13"}
421
+ {"current_steps": 421, "total_steps": 735, "loss": 0.6524, "lr": 3.686637432944634e-05, "epoch": 2.8554472233997457, "percentage": 57.28, "elapsed_time": "1 day, 1:54:39", "remaining_time": "19:19:32"}
422
+ {"current_steps": 422, "total_steps": 735, "loss": 0.6407, "lr": 3.6676883207968226e-05, "epoch": 2.862229758372192, "percentage": 57.41, "elapsed_time": "1 day, 1:58:20", "remaining_time": "19:15:50"}
423
+ {"current_steps": 423, "total_steps": 735, "loss": 0.6431, "lr": 3.648746715220309e-05, "epoch": 2.8690122933446376, "percentage": 57.55, "elapsed_time": "1 day, 2:02:03", "remaining_time": "19:12:09"}
424
+ {"current_steps": 424, "total_steps": 735, "loss": 0.6457, "lr": 3.6298130440860394e-05, "epoch": 2.8757948283170833, "percentage": 57.69, "elapsed_time": "1 day, 2:05:46", "remaining_time": "19:08:28"}
425
+ {"current_steps": 425, "total_steps": 735, "loss": 0.6413, "lr": 3.6108877350857296e-05, "epoch": 2.8825773632895295, "percentage": 57.82, "elapsed_time": "1 day, 2:09:28", "remaining_time": "19:04:47"}
426
+ {"current_steps": 426, "total_steps": 735, "loss": 0.6493, "lr": 3.5919712157222014e-05, "epoch": 2.8893598982619753, "percentage": 57.96, "elapsed_time": "1 day, 2:13:09", "remaining_time": "19:01:05"}
427
+ {"current_steps": 427, "total_steps": 735, "loss": 0.6471, "lr": 3.573063913299733e-05, "epoch": 2.8961424332344214, "percentage": 58.1, "elapsed_time": "1 day, 2:16:50", "remaining_time": "18:57:23"}
428
+ {"current_steps": 428, "total_steps": 735, "loss": 0.6525, "lr": 3.554166254914399e-05, "epoch": 2.902924968206867, "percentage": 58.23, "elapsed_time": "1 day, 2:20:31", "remaining_time": "18:53:41"}
429
+ {"current_steps": 429, "total_steps": 735, "loss": 0.6435, "lr": 3.535278667444423e-05, "epoch": 2.9097075031793134, "percentage": 58.37, "elapsed_time": "1 day, 2:24:12", "remaining_time": "18:49:59"}
430
+ {"current_steps": 430, "total_steps": 735, "loss": 0.6537, "lr": 3.5164015775405414e-05, "epoch": 2.916490038151759, "percentage": 58.5, "elapsed_time": "1 day, 2:27:53", "remaining_time": "18:46:17"}
431
+ {"current_steps": 431, "total_steps": 735, "loss": 0.6528, "lr": 3.4975354116163594e-05, "epoch": 2.9232725731242053, "percentage": 58.64, "elapsed_time": "1 day, 2:31:34", "remaining_time": "18:42:35"}
432
+ {"current_steps": 432, "total_steps": 735, "loss": 0.6552, "lr": 3.478680595838719e-05, "epoch": 2.930055108096651, "percentage": 58.78, "elapsed_time": "1 day, 2:35:15", "remaining_time": "18:38:53"}
433
+ {"current_steps": 433, "total_steps": 735, "loss": 0.6477, "lr": 3.4598375561180783e-05, "epoch": 2.9368376430690972, "percentage": 58.91, "elapsed_time": "1 day, 2:38:56", "remaining_time": "18:35:11"}
434
+ {"current_steps": 434, "total_steps": 735, "loss": 0.6415, "lr": 3.441006718098885e-05, "epoch": 2.943620178041543, "percentage": 59.05, "elapsed_time": "1 day, 2:42:37", "remaining_time": "18:31:29"}
435
+ {"current_steps": 435, "total_steps": 735, "loss": 0.66, "lr": 3.422188507149962e-05, "epoch": 2.9504027130139887, "percentage": 59.18, "elapsed_time": "1 day, 2:46:18", "remaining_time": "18:27:47"}
436
+ {"current_steps": 436, "total_steps": 735, "loss": 0.6392, "lr": 3.403383348354902e-05, "epoch": 2.957185247986435, "percentage": 59.32, "elapsed_time": "1 day, 2:49:59", "remaining_time": "18:24:05"}
437
+ {"current_steps": 437, "total_steps": 735, "loss": 0.6571, "lr": 3.3845916665024626e-05, "epoch": 2.963967782958881, "percentage": 59.46, "elapsed_time": "1 day, 2:53:40", "remaining_time": "18:20:24"}
438
+ {"current_steps": 438, "total_steps": 735, "loss": 0.658, "lr": 3.36581388607697e-05, "epoch": 2.970750317931327, "percentage": 59.59, "elapsed_time": "1 day, 2:57:21", "remaining_time": "18:16:42"}
439
+ {"current_steps": 439, "total_steps": 735, "loss": 0.6445, "lr": 3.347050431248735e-05, "epoch": 2.9775328529037726, "percentage": 59.73, "elapsed_time": "1 day, 3:01:01", "remaining_time": "18:12:59"}
440
+ {"current_steps": 440, "total_steps": 735, "loss": 0.6514, "lr": 3.3283017258644634e-05, "epoch": 2.9843153878762188, "percentage": 59.86, "elapsed_time": "1 day, 3:04:42", "remaining_time": "18:09:17"}
441
+ {"current_steps": 441, "total_steps": 735, "loss": 0.6479, "lr": 3.30956819343769e-05, "epoch": 2.991097922848665, "percentage": 60.0, "elapsed_time": "1 day, 3:08:23", "remaining_time": "18:05:35"}
442
+ {"current_steps": 442, "total_steps": 735, "loss": 0.7446, "lr": 3.290850257139209e-05, "epoch": 2.9978804578211107, "percentage": 60.14, "elapsed_time": "1 day, 3:11:36", "remaining_time": "18:01:34"}