Training in progress, epoch 3
Browse files
model-00001-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4877660776
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5e838278fcda23dcb4c51ad07023be536a6ab301cb18cc65d3022c9f7669495b
|
3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4932751008
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2c7112cef37666be84dcf4634a088c54ea034c1325046a3704f024ca786a3b8c
|
3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4330865200
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:44f52f7ff0a9878e03e7f9081240fabc0f77c32e6b7ecb65b207138533269953
|
3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1089994880
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bf7e9824b9fc57116f959223b8012c770d9ede8672b0fec0c4099345aa856595
|
3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
@@ -440,3 +440,151 @@
|
|
440 |
{"current_steps": 440, "total_steps": 735, "loss": 0.6514, "lr": 3.3283017258644634e-05, "epoch": 2.9843153878762188, "percentage": 59.86, "elapsed_time": "1 day, 3:04:42", "remaining_time": "18:09:17"}
|
441 |
{"current_steps": 441, "total_steps": 735, "loss": 0.6479, "lr": 3.30956819343769e-05, "epoch": 2.991097922848665, "percentage": 60.0, "elapsed_time": "1 day, 3:08:23", "remaining_time": "18:05:35"}
|
442 |
{"current_steps": 442, "total_steps": 735, "loss": 0.7446, "lr": 3.290850257139209e-05, "epoch": 2.9978804578211107, "percentage": 60.14, "elapsed_time": "1 day, 3:11:36", "remaining_time": "18:01:34"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
440 |
{"current_steps": 440, "total_steps": 735, "loss": 0.6514, "lr": 3.3283017258644634e-05, "epoch": 2.9843153878762188, "percentage": 59.86, "elapsed_time": "1 day, 3:04:42", "remaining_time": "18:09:17"}
|
441 |
{"current_steps": 441, "total_steps": 735, "loss": 0.6479, "lr": 3.30956819343769e-05, "epoch": 2.991097922848665, "percentage": 60.0, "elapsed_time": "1 day, 3:08:23", "remaining_time": "18:05:35"}
|
442 |
{"current_steps": 442, "total_steps": 735, "loss": 0.7446, "lr": 3.290850257139209e-05, "epoch": 2.9978804578211107, "percentage": 60.14, "elapsed_time": "1 day, 3:11:36", "remaining_time": "18:01:34"}
|
443 |
+
{"current_steps": 443, "total_steps": 735, "loss": 0.9011, "lr": 3.2721483397875135e-05, "epoch": 3.0046629927935564, "percentage": 60.27, "elapsed_time": "1 day, 3:16:50", "remaining_time": "17:58:54"}
|
444 |
+
{"current_steps": 444, "total_steps": 735, "loss": 0.6098, "lr": 3.253462863839243e-05, "epoch": 3.0114455277660026, "percentage": 60.41, "elapsed_time": "1 day, 3:20:31", "remaining_time": "17:55:12"}
|
445 |
+
{"current_steps": 445, "total_steps": 735, "loss": 0.6367, "lr": 3.2347942513796475e-05, "epoch": 3.0182280627384483, "percentage": 60.54, "elapsed_time": "1 day, 3:24:12", "remaining_time": "17:51:30"}
|
446 |
+
{"current_steps": 446, "total_steps": 735, "loss": 0.6285, "lr": 3.216142924113046e-05, "epoch": 3.0250105977108945, "percentage": 60.68, "elapsed_time": "1 day, 3:27:53", "remaining_time": "17:47:48"}
|
447 |
+
{"current_steps": 447, "total_steps": 735, "loss": 0.6332, "lr": 3.1975093033533003e-05, "epoch": 3.0317931326833403, "percentage": 60.82, "elapsed_time": "1 day, 3:31:34", "remaining_time": "17:44:06"}
|
448 |
+
{"current_steps": 448, "total_steps": 735, "loss": 0.6246, "lr": 3.1788938100143086e-05, "epoch": 3.0385756676557865, "percentage": 60.95, "elapsed_time": "1 day, 3:35:16", "remaining_time": "17:40:24"}
|
449 |
+
{"current_steps": 449, "total_steps": 735, "loss": 0.6193, "lr": 3.160296864600482e-05, "epoch": 3.045358202628232, "percentage": 61.09, "elapsed_time": "1 day, 3:38:57", "remaining_time": "17:36:42"}
|
450 |
+
{"current_steps": 450, "total_steps": 735, "loss": 0.6264, "lr": 3.1417188871972554e-05, "epoch": 3.0521407376006784, "percentage": 61.22, "elapsed_time": "1 day, 3:42:38", "remaining_time": "17:33:00"}
|
451 |
+
{"current_steps": 451, "total_steps": 735, "loss": 0.631, "lr": 3.123160297461601e-05, "epoch": 3.058923272573124, "percentage": 61.36, "elapsed_time": "1 day, 3:46:19", "remaining_time": "17:29:18"}
|
452 |
+
{"current_steps": 452, "total_steps": 735, "loss": 0.6344, "lr": 3.104621514612538e-05, "epoch": 3.0657058075455703, "percentage": 61.5, "elapsed_time": "1 day, 3:49:59", "remaining_time": "17:25:35"}
|
453 |
+
{"current_steps": 453, "total_steps": 735, "loss": 0.6129, "lr": 3.086102957421672e-05, "epoch": 3.072488342518016, "percentage": 61.63, "elapsed_time": "1 day, 3:53:40", "remaining_time": "17:21:53"}
|
454 |
+
{"current_steps": 454, "total_steps": 735, "loss": 0.6269, "lr": 3.0676050442037336e-05, "epoch": 3.0792708774904622, "percentage": 61.77, "elapsed_time": "1 day, 3:57:20", "remaining_time": "17:18:10"}
|
455 |
+
{"current_steps": 455, "total_steps": 735, "loss": 0.6221, "lr": 3.0491281928071217e-05, "epoch": 3.086053412462908, "percentage": 61.9, "elapsed_time": "1 day, 4:01:01", "remaining_time": "17:14:28"}
|
456 |
+
{"current_steps": 456, "total_steps": 735, "loss": 0.6256, "lr": 3.030672820604476e-05, "epoch": 3.092835947435354, "percentage": 62.04, "elapsed_time": "1 day, 4:04:42", "remaining_time": "17:10:46"}
|
457 |
+
{"current_steps": 457, "total_steps": 735, "loss": 0.6177, "lr": 3.012239344483244e-05, "epoch": 3.0996184824078, "percentage": 62.18, "elapsed_time": "1 day, 4:08:23", "remaining_time": "17:07:04"}
|
458 |
+
{"current_steps": 458, "total_steps": 735, "loss": 0.6113, "lr": 2.993828180836262e-05, "epoch": 3.1064010173802457, "percentage": 62.31, "elapsed_time": "1 day, 4:12:03", "remaining_time": "17:03:21"}
|
459 |
+
{"current_steps": 459, "total_steps": 735, "loss": 0.6297, "lr": 2.9754397455523497e-05, "epoch": 3.113183552352692, "percentage": 62.45, "elapsed_time": "1 day, 4:15:45", "remaining_time": "16:59:40"}
|
460 |
+
{"current_steps": 460, "total_steps": 735, "loss": 0.6196, "lr": 2.957074454006921e-05, "epoch": 3.1199660873251376, "percentage": 62.59, "elapsed_time": "1 day, 4:19:26", "remaining_time": "16:55:58"}
|
461 |
+
{"current_steps": 461, "total_steps": 735, "loss": 0.6188, "lr": 2.9387327210525942e-05, "epoch": 3.1267486222975838, "percentage": 62.72, "elapsed_time": "1 day, 4:23:07", "remaining_time": "16:52:16"}
|
462 |
+
{"current_steps": 462, "total_steps": 735, "loss": 0.6281, "lr": 2.9204149610098223e-05, "epoch": 3.1335311572700295, "percentage": 62.86, "elapsed_time": "1 day, 4:26:48", "remaining_time": "16:48:34"}
|
463 |
+
{"current_steps": 463, "total_steps": 735, "loss": 0.6157, "lr": 2.902121587657539e-05, "epoch": 3.1403136922424757, "percentage": 62.99, "elapsed_time": "1 day, 4:30:29", "remaining_time": "16:44:52"}
|
464 |
+
{"current_steps": 464, "total_steps": 735, "loss": 0.626, "lr": 2.8838530142238076e-05, "epoch": 3.1470962272149214, "percentage": 63.13, "elapsed_time": "1 day, 4:34:10", "remaining_time": "16:41:10"}
|
465 |
+
{"current_steps": 465, "total_steps": 735, "loss": 0.6199, "lr": 2.865609653376484e-05, "epoch": 3.1538787621873676, "percentage": 63.27, "elapsed_time": "1 day, 4:37:51", "remaining_time": "16:37:28"}
|
466 |
+
{"current_steps": 466, "total_steps": 735, "loss": 0.635, "lr": 2.8473919172139034e-05, "epoch": 3.1606612971598134, "percentage": 63.4, "elapsed_time": "1 day, 4:41:33", "remaining_time": "16:33:46"}
|
467 |
+
{"current_steps": 467, "total_steps": 735, "loss": 0.6181, "lr": 2.8292002172555616e-05, "epoch": 3.1674438321322596, "percentage": 63.54, "elapsed_time": "1 day, 4:45:14", "remaining_time": "16:30:04"}
|
468 |
+
{"current_steps": 468, "total_steps": 735, "loss": 0.6304, "lr": 2.8110349644328275e-05, "epoch": 3.1742263671047053, "percentage": 63.67, "elapsed_time": "1 day, 4:48:55", "remaining_time": "16:26:22"}
|
469 |
+
{"current_steps": 469, "total_steps": 735, "loss": 0.6351, "lr": 2.7928965690796562e-05, "epoch": 3.1810089020771515, "percentage": 63.81, "elapsed_time": "1 day, 4:52:36", "remaining_time": "16:22:40"}
|
470 |
+
{"current_steps": 470, "total_steps": 735, "loss": 0.6301, "lr": 2.7747854409233187e-05, "epoch": 3.187791437049597, "percentage": 63.95, "elapsed_time": "1 day, 4:56:17", "remaining_time": "16:18:58"}
|
471 |
+
{"current_steps": 471, "total_steps": 735, "loss": 0.6207, "lr": 2.7567019890751493e-05, "epoch": 3.1945739720220434, "percentage": 64.08, "elapsed_time": "1 day, 4:59:58", "remaining_time": "16:15:16"}
|
472 |
+
{"current_steps": 472, "total_steps": 735, "loss": 0.6213, "lr": 2.7386466220213065e-05, "epoch": 3.201356506994489, "percentage": 64.22, "elapsed_time": "1 day, 5:03:39", "remaining_time": "16:11:34"}
|
473 |
+
{"current_steps": 473, "total_steps": 735, "loss": 0.6212, "lr": 2.7206197476135403e-05, "epoch": 3.2081390419669353, "percentage": 64.35, "elapsed_time": "1 day, 5:07:20", "remaining_time": "16:07:52"}
|
474 |
+
{"current_steps": 474, "total_steps": 735, "loss": 0.6284, "lr": 2.7026217730599814e-05, "epoch": 3.214921576939381, "percentage": 64.49, "elapsed_time": "1 day, 5:11:01", "remaining_time": "16:04:10"}
|
475 |
+
{"current_steps": 475, "total_steps": 735, "loss": 0.627, "lr": 2.6846531049159454e-05, "epoch": 3.2217041119118273, "percentage": 64.63, "elapsed_time": "1 day, 5:14:42", "remaining_time": "16:00:28"}
|
476 |
+
{"current_steps": 476, "total_steps": 735, "loss": 0.6236, "lr": 2.6667141490747454e-05, "epoch": 3.228486646884273, "percentage": 64.76, "elapsed_time": "1 day, 5:18:23", "remaining_time": "15:56:46"}
|
477 |
+
{"current_steps": 477, "total_steps": 735, "loss": 0.6242, "lr": 2.648805310758524e-05, "epoch": 3.2352691818567187, "percentage": 64.9, "elapsed_time": "1 day, 5:22:04", "remaining_time": "15:53:04"}
|
478 |
+
{"current_steps": 478, "total_steps": 735, "loss": 0.6135, "lr": 2.6309269945091025e-05, "epoch": 3.242051716829165, "percentage": 65.03, "elapsed_time": "1 day, 5:25:45", "remaining_time": "15:49:22"}
|
479 |
+
{"current_steps": 479, "total_steps": 735, "loss": 0.6401, "lr": 2.6130796041788404e-05, "epoch": 3.2488342518016107, "percentage": 65.17, "elapsed_time": "1 day, 5:29:25", "remaining_time": "15:45:40"}
|
480 |
+
{"current_steps": 480, "total_steps": 735, "loss": 0.6303, "lr": 2.5952635429215117e-05, "epoch": 3.255616786774057, "percentage": 65.31, "elapsed_time": "1 day, 5:33:06", "remaining_time": "15:41:57"}
|
481 |
+
{"current_steps": 481, "total_steps": 735, "loss": 0.6213, "lr": 2.5774792131832012e-05, "epoch": 3.2623993217465026, "percentage": 65.44, "elapsed_time": "1 day, 5:36:47", "remaining_time": "15:38:15"}
|
482 |
+
{"current_steps": 482, "total_steps": 735, "loss": 0.6368, "lr": 2.559727016693212e-05, "epoch": 3.269181856718949, "percentage": 65.58, "elapsed_time": "1 day, 5:40:28", "remaining_time": "15:34:34"}
|
483 |
+
{"current_steps": 483, "total_steps": 735, "loss": 0.641, "lr": 2.54200735445499e-05, "epoch": 3.2759643916913945, "percentage": 65.71, "elapsed_time": "1 day, 5:44:09", "remaining_time": "15:30:52"}
|
484 |
+
{"current_steps": 484, "total_steps": 735, "loss": 0.6204, "lr": 2.5243206267370685e-05, "epoch": 3.2827469266638407, "percentage": 65.85, "elapsed_time": "1 day, 5:47:50", "remaining_time": "15:27:09"}
|
485 |
+
{"current_steps": 485, "total_steps": 735, "loss": 0.6207, "lr": 2.506667233064021e-05, "epoch": 3.2895294616362865, "percentage": 65.99, "elapsed_time": "1 day, 5:51:31", "remaining_time": "15:23:27"}
|
486 |
+
{"current_steps": 486, "total_steps": 735, "loss": 0.6371, "lr": 2.489047572207442e-05, "epoch": 3.2963119966087326, "percentage": 66.12, "elapsed_time": "1 day, 5:55:12", "remaining_time": "15:19:45"}
|
487 |
+
{"current_steps": 487, "total_steps": 735, "loss": 0.6285, "lr": 2.4714620421769394e-05, "epoch": 3.3030945315811784, "percentage": 66.26, "elapsed_time": "1 day, 5:58:53", "remaining_time": "15:16:03"}
|
488 |
+
{"current_steps": 488, "total_steps": 735, "loss": 0.631, "lr": 2.4539110402111383e-05, "epoch": 3.3098770665536246, "percentage": 66.39, "elapsed_time": "1 day, 6:02:33", "remaining_time": "15:12:21"}
|
489 |
+
{"current_steps": 489, "total_steps": 735, "loss": 0.6276, "lr": 2.436394962768712e-05, "epoch": 3.3166596015260703, "percentage": 66.53, "elapsed_time": "1 day, 6:06:14", "remaining_time": "15:08:39"}
|
490 |
+
{"current_steps": 490, "total_steps": 735, "loss": 0.6244, "lr": 2.4189142055194276e-05, "epoch": 3.3234421364985165, "percentage": 66.67, "elapsed_time": "1 day, 6:09:56", "remaining_time": "15:04:58"}
|
491 |
+
{"current_steps": 491, "total_steps": 735, "loss": 0.6101, "lr": 2.4014691633352038e-05, "epoch": 3.3302246714709622, "percentage": 66.8, "elapsed_time": "1 day, 6:13:36", "remaining_time": "15:01:15"}
|
492 |
+
{"current_steps": 492, "total_steps": 735, "loss": 0.6135, "lr": 2.3840602302811923e-05, "epoch": 3.337007206443408, "percentage": 66.94, "elapsed_time": "1 day, 6:17:17", "remaining_time": "14:57:33"}
|
493 |
+
{"current_steps": 493, "total_steps": 735, "loss": 0.6288, "lr": 2.3666877996068824e-05, "epoch": 3.343789741415854, "percentage": 67.07, "elapsed_time": "1 day, 6:20:58", "remaining_time": "14:53:51"}
|
494 |
+
{"current_steps": 494, "total_steps": 735, "loss": 0.6326, "lr": 2.3493522637372087e-05, "epoch": 3.3505722763883004, "percentage": 67.21, "elapsed_time": "1 day, 6:24:39", "remaining_time": "14:50:09"}
|
495 |
+
{"current_steps": 495, "total_steps": 735, "loss": 0.6259, "lr": 2.332054014263692e-05, "epoch": 3.357354811360746, "percentage": 67.35, "elapsed_time": "1 day, 6:28:19", "remaining_time": "14:46:27"}
|
496 |
+
{"current_steps": 496, "total_steps": 735, "loss": 0.6245, "lr": 2.3147934419355935e-05, "epoch": 3.364137346333192, "percentage": 67.48, "elapsed_time": "1 day, 6:32:00", "remaining_time": "14:42:45"}
|
497 |
+
{"current_steps": 497, "total_steps": 735, "loss": 0.6316, "lr": 2.2975709366510887e-05, "epoch": 3.370919881305638, "percentage": 67.62, "elapsed_time": "1 day, 6:35:41", "remaining_time": "14:39:03"}
|
498 |
+
{"current_steps": 498, "total_steps": 735, "loss": 0.6383, "lr": 2.2803868874484536e-05, "epoch": 3.3777024162780838, "percentage": 67.76, "elapsed_time": "1 day, 6:39:22", "remaining_time": "14:35:21"}
|
499 |
+
{"current_steps": 499, "total_steps": 735, "loss": 0.614, "lr": 2.2632416824972886e-05, "epoch": 3.38448495125053, "percentage": 67.89, "elapsed_time": "1 day, 6:43:03", "remaining_time": "14:31:39"}
|
500 |
+
{"current_steps": 500, "total_steps": 735, "loss": 0.6317, "lr": 2.2461357090897352e-05, "epoch": 3.3912674862229757, "percentage": 68.03, "elapsed_time": "1 day, 6:46:44", "remaining_time": "14:27:58"}
|
501 |
+
{"current_steps": 501, "total_steps": 735, "loss": 0.6226, "lr": 2.2290693536317444e-05, "epoch": 3.398050021195422, "percentage": 68.16, "elapsed_time": "1 day, 6:50:25", "remaining_time": "14:24:16"}
|
502 |
+
{"current_steps": 502, "total_steps": 735, "loss": 0.6306, "lr": 2.212043001634332e-05, "epoch": 3.4048325561678676, "percentage": 68.3, "elapsed_time": "1 day, 6:54:06", "remaining_time": "14:20:34"}
|
503 |
+
{"current_steps": 503, "total_steps": 735, "loss": 0.6144, "lr": 2.1950570377048813e-05, "epoch": 3.411615091140314, "percentage": 68.44, "elapsed_time": "1 day, 6:57:47", "remaining_time": "14:16:52"}
|
504 |
+
{"current_steps": 504, "total_steps": 735, "loss": 0.6317, "lr": 2.178111845538453e-05, "epoch": 3.4183976261127595, "percentage": 68.57, "elapsed_time": "1 day, 7:01:29", "remaining_time": "14:13:10"}
|
505 |
+
{"current_steps": 505, "total_steps": 735, "loss": 0.6227, "lr": 2.1612078079091125e-05, "epoch": 3.4251801610852057, "percentage": 68.71, "elapsed_time": "1 day, 7:05:10", "remaining_time": "14:09:29"}
|
506 |
+
{"current_steps": 506, "total_steps": 735, "loss": 0.6179, "lr": 2.144345306661291e-05, "epoch": 3.4319626960576515, "percentage": 68.84, "elapsed_time": "1 day, 7:08:51", "remaining_time": "14:05:47"}
|
507 |
+
{"current_steps": 507, "total_steps": 735, "loss": 0.6218, "lr": 2.1275247227011536e-05, "epoch": 3.4387452310300977, "percentage": 68.98, "elapsed_time": "1 day, 7:12:32", "remaining_time": "14:02:05"}
|
508 |
+
{"current_steps": 508, "total_steps": 735, "loss": 0.6313, "lr": 2.1107464359880022e-05, "epoch": 3.4455277660025434, "percentage": 69.12, "elapsed_time": "1 day, 7:16:13", "remaining_time": "13:58:23"}
|
509 |
+
{"current_steps": 509, "total_steps": 735, "loss": 0.6309, "lr": 2.0940108255256823e-05, "epoch": 3.4523103009749896, "percentage": 69.25, "elapsed_time": "1 day, 7:19:54", "remaining_time": "13:54:41"}
|
510 |
+
{"current_steps": 510, "total_steps": 735, "loss": 0.6076, "lr": 2.0773182693540325e-05, "epoch": 3.4590928359474353, "percentage": 69.39, "elapsed_time": "1 day, 7:23:35", "remaining_time": "13:50:59"}
|
511 |
+
{"current_steps": 511, "total_steps": 735, "loss": 0.6238, "lr": 2.0606691445403398e-05, "epoch": 3.465875370919881, "percentage": 69.52, "elapsed_time": "1 day, 7:27:16", "remaining_time": "13:47:17"}
|
512 |
+
{"current_steps": 512, "total_steps": 735, "loss": 0.6135, "lr": 2.0440638271708226e-05, "epoch": 3.4726579058923273, "percentage": 69.66, "elapsed_time": "1 day, 7:30:57", "remaining_time": "13:43:36"}
|
513 |
+
{"current_steps": 513, "total_steps": 735, "loss": 0.6347, "lr": 2.0275026923421315e-05, "epoch": 3.4794404408647734, "percentage": 69.8, "elapsed_time": "1 day, 7:34:38", "remaining_time": "13:39:54"}
|
514 |
+
{"current_steps": 514, "total_steps": 735, "loss": 0.6289, "lr": 2.0109861141528853e-05, "epoch": 3.486222975837219, "percentage": 69.93, "elapsed_time": "1 day, 7:38:19", "remaining_time": "13:36:12"}
|
515 |
+
{"current_steps": 515, "total_steps": 735, "loss": 0.6128, "lr": 1.9945144656952103e-05, "epoch": 3.493005510809665, "percentage": 70.07, "elapsed_time": "1 day, 7:42:00", "remaining_time": "13:32:30"}
|
516 |
+
{"current_steps": 516, "total_steps": 735, "loss": 0.634, "lr": 1.9780881190463222e-05, "epoch": 3.499788045782111, "percentage": 70.2, "elapsed_time": "1 day, 7:45:41", "remaining_time": "13:28:48"}
|
517 |
+
{"current_steps": 517, "total_steps": 735, "loss": 0.6322, "lr": 1.9617074452601113e-05, "epoch": 3.506570580754557, "percentage": 70.34, "elapsed_time": "1 day, 7:49:22", "remaining_time": "13:25:06"}
|
518 |
+
{"current_steps": 518, "total_steps": 735, "loss": 0.6231, "lr": 1.9453728143587697e-05, "epoch": 3.513353115727003, "percentage": 70.48, "elapsed_time": "1 day, 7:53:03", "remaining_time": "13:21:24"}
|
519 |
+
{"current_steps": 519, "total_steps": 735, "loss": 0.625, "lr": 1.9290845953244307e-05, "epoch": 3.520135650699449, "percentage": 70.61, "elapsed_time": "1 day, 7:56:44", "remaining_time": "13:17:43"}
|
520 |
+
{"current_steps": 520, "total_steps": 735, "loss": 0.6191, "lr": 1.9128431560908263e-05, "epoch": 3.526918185671895, "percentage": 70.75, "elapsed_time": "1 day, 8:00:25", "remaining_time": "13:14:01"}
|
521 |
+
{"current_steps": 521, "total_steps": 735, "loss": 0.622, "lr": 1.896648863534988e-05, "epoch": 3.5337007206443407, "percentage": 70.88, "elapsed_time": "1 day, 8:04:05", "remaining_time": "13:10:18"}
|
522 |
+
{"current_steps": 522, "total_steps": 735, "loss": 0.6194, "lr": 1.8805020834689487e-05, "epoch": 3.540483255616787, "percentage": 71.02, "elapsed_time": "1 day, 8:07:45", "remaining_time": "13:06:36"}
|
523 |
+
{"current_steps": 523, "total_steps": 735, "loss": 0.6255, "lr": 1.864403180631489e-05, "epoch": 3.5472657905892326, "percentage": 71.16, "elapsed_time": "1 day, 8:11:26", "remaining_time": "13:02:55"}
|
524 |
+
{"current_steps": 524, "total_steps": 735, "loss": 0.6253, "lr": 1.8483525186798875e-05, "epoch": 3.554048325561679, "percentage": 71.29, "elapsed_time": "1 day, 8:15:06", "remaining_time": "12:59:12"}
|
525 |
+
{"current_steps": 525, "total_steps": 735, "loss": 0.62, "lr": 1.832350460181717e-05, "epoch": 3.5608308605341246, "percentage": 71.43, "elapsed_time": "1 day, 8:18:47", "remaining_time": "12:55:30"}
|
526 |
+
{"current_steps": 526, "total_steps": 735, "loss": 0.629, "lr": 1.8163973666066473e-05, "epoch": 3.5676133955065703, "percentage": 71.56, "elapsed_time": "1 day, 8:22:27", "remaining_time": "12:51:48"}
|
527 |
+
{"current_steps": 527, "total_steps": 735, "loss": 0.6344, "lr": 1.8004935983182835e-05, "epoch": 3.5743959304790165, "percentage": 71.7, "elapsed_time": "1 day, 8:26:09", "remaining_time": "12:48:07"}
|
528 |
+
{"current_steps": 528, "total_steps": 735, "loss": 0.6284, "lr": 1.784639514566021e-05, "epoch": 3.5811784654514627, "percentage": 71.84, "elapsed_time": "1 day, 8:29:49", "remaining_time": "12:44:25"}
|
529 |
+
{"current_steps": 529, "total_steps": 735, "loss": 0.6245, "lr": 1.7688354734769378e-05, "epoch": 3.5879610004239084, "percentage": 71.97, "elapsed_time": "1 day, 8:33:29", "remaining_time": "12:40:43"}
|
530 |
+
{"current_steps": 530, "total_steps": 735, "loss": 0.6241, "lr": 1.753081832047697e-05, "epoch": 3.594743535396354, "percentage": 72.11, "elapsed_time": "1 day, 8:37:10", "remaining_time": "12:37:01"}
|
531 |
+
{"current_steps": 531, "total_steps": 735, "loss": 0.6296, "lr": 1.7373789461364904e-05, "epoch": 3.6015260703688003, "percentage": 72.24, "elapsed_time": "1 day, 8:40:51", "remaining_time": "12:33:19"}
|
532 |
+
{"current_steps": 532, "total_steps": 735, "loss": 0.6335, "lr": 1.7217271704549913e-05, "epoch": 3.6083086053412465, "percentage": 72.38, "elapsed_time": "1 day, 8:44:32", "remaining_time": "12:29:37"}
|
533 |
+
{"current_steps": 533, "total_steps": 735, "loss": 0.6307, "lr": 1.7061268585603507e-05, "epoch": 3.6150911403136923, "percentage": 72.52, "elapsed_time": "1 day, 8:48:13", "remaining_time": "12:25:55"}
|
534 |
+
{"current_steps": 534, "total_steps": 735, "loss": 0.6347, "lr": 1.6905783628472074e-05, "epoch": 3.621873675286138, "percentage": 72.65, "elapsed_time": "1 day, 8:51:53", "remaining_time": "12:22:13"}
|
535 |
+
{"current_steps": 535, "total_steps": 735, "loss": 0.6265, "lr": 1.6750820345397217e-05, "epoch": 3.628656210258584, "percentage": 72.79, "elapsed_time": "1 day, 8:55:34", "remaining_time": "12:18:32"}
|
536 |
+
{"current_steps": 536, "total_steps": 735, "loss": 0.6287, "lr": 1.659638223683653e-05, "epoch": 3.63543874523103, "percentage": 72.93, "elapsed_time": "1 day, 8:59:15", "remaining_time": "12:14:50"}
|
537 |
+
{"current_steps": 537, "total_steps": 735, "loss": 0.6361, "lr": 1.644247279138442e-05, "epoch": 3.642221280203476, "percentage": 73.06, "elapsed_time": "1 day, 9:02:56", "remaining_time": "12:11:08"}
|
538 |
+
{"current_steps": 538, "total_steps": 735, "loss": 0.6251, "lr": 1.628909548569339e-05, "epoch": 3.649003815175922, "percentage": 73.2, "elapsed_time": "1 day, 9:06:37", "remaining_time": "12:07:26"}
|
539 |
+
{"current_steps": 539, "total_steps": 735, "loss": 0.629, "lr": 1.6136253784395455e-05, "epoch": 3.655786350148368, "percentage": 73.33, "elapsed_time": "1 day, 9:10:18", "remaining_time": "12:03:44"}
|
540 |
+
{"current_steps": 540, "total_steps": 735, "loss": 0.6174, "lr": 1.5983951140023864e-05, "epoch": 3.662568885120814, "percentage": 73.47, "elapsed_time": "1 day, 9:13:59", "remaining_time": "12:00:03"}
|
541 |
+
{"current_steps": 541, "total_steps": 735, "loss": 0.6192, "lr": 1.583219099293516e-05, "epoch": 3.66935142009326, "percentage": 73.61, "elapsed_time": "1 day, 9:17:39", "remaining_time": "11:56:21"}
|
542 |
+
{"current_steps": 542, "total_steps": 735, "loss": 0.6193, "lr": 1.568097677123146e-05, "epoch": 3.6761339550657057, "percentage": 73.74, "elapsed_time": "1 day, 9:21:20", "remaining_time": "11:52:39"}
|
543 |
+
{"current_steps": 543, "total_steps": 735, "loss": 0.6126, "lr": 1.5530311890682946e-05, "epoch": 3.682916490038152, "percentage": 73.88, "elapsed_time": "1 day, 9:25:01", "remaining_time": "11:48:57"}
|
544 |
+
{"current_steps": 544, "total_steps": 735, "loss": 0.6204, "lr": 1.5380199754650838e-05, "epoch": 3.6896990250105977, "percentage": 74.01, "elapsed_time": "1 day, 9:28:42", "remaining_time": "11:45:15"}
|
545 |
+
{"current_steps": 545, "total_steps": 735, "loss": 0.634, "lr": 1.5230643754010355e-05, "epoch": 3.6964815599830434, "percentage": 74.15, "elapsed_time": "1 day, 9:32:23", "remaining_time": "11:41:34"}
|
546 |
+
{"current_steps": 546, "total_steps": 735, "loss": 0.6132, "lr": 1.508164726707427e-05, "epoch": 3.7032640949554896, "percentage": 74.29, "elapsed_time": "1 day, 9:36:04", "remaining_time": "11:37:52"}
|
547 |
+
{"current_steps": 547, "total_steps": 735, "loss": 0.6263, "lr": 1.4933213659516485e-05, "epoch": 3.7100466299279358, "percentage": 74.42, "elapsed_time": "1 day, 9:39:45", "remaining_time": "11:34:10"}
|
548 |
+
{"current_steps": 548, "total_steps": 735, "loss": 0.6158, "lr": 1.4785346284296078e-05, "epoch": 3.7168291649003815, "percentage": 74.56, "elapsed_time": "1 day, 9:43:26", "remaining_time": "11:30:28"}
|
549 |
+
{"current_steps": 549, "total_steps": 735, "loss": 0.6235, "lr": 1.4638048481581537e-05, "epoch": 3.7236116998728273, "percentage": 74.69, "elapsed_time": "1 day, 9:47:07", "remaining_time": "11:26:47"}
|
550 |
+
{"current_steps": 550, "total_steps": 735, "loss": 0.6137, "lr": 1.4491323578675265e-05, "epoch": 3.7303942348452734, "percentage": 74.83, "elapsed_time": "1 day, 9:50:48", "remaining_time": "11:23:05"}
|
551 |
+
{"current_steps": 551, "total_steps": 735, "loss": 0.6329, "lr": 1.4345174889938514e-05, "epoch": 3.7371767698177196, "percentage": 74.97, "elapsed_time": "1 day, 9:54:28", "remaining_time": "11:19:23"}
|
552 |
+
{"current_steps": 552, "total_steps": 735, "loss": 0.6272, "lr": 1.4199605716716414e-05, "epoch": 3.7439593047901654, "percentage": 75.1, "elapsed_time": "1 day, 9:58:09", "remaining_time": "11:15:41"}
|
553 |
+
{"current_steps": 553, "total_steps": 735, "loss": 0.6363, "lr": 1.4054619347263487e-05, "epoch": 3.750741839762611, "percentage": 75.24, "elapsed_time": "1 day, 10:01:49", "remaining_time": "11:11:59"}
|
554 |
+
{"current_steps": 554, "total_steps": 735, "loss": 0.6218, "lr": 1.3910219056669335e-05, "epoch": 3.7575243747350573, "percentage": 75.37, "elapsed_time": "1 day, 10:05:29", "remaining_time": "11:08:17"}
|
555 |
+
{"current_steps": 555, "total_steps": 735, "loss": 0.6278, "lr": 1.3766408106784601e-05, "epoch": 3.764306909707503, "percentage": 75.51, "elapsed_time": "1 day, 10:09:10", "remaining_time": "11:04:35"}
|
556 |
+
{"current_steps": 556, "total_steps": 735, "loss": 0.6227, "lr": 1.3623189746147398e-05, "epoch": 3.771089444679949, "percentage": 75.65, "elapsed_time": "1 day, 10:12:51", "remaining_time": "11:00:54"}
|
557 |
+
{"current_steps": 557, "total_steps": 735, "loss": 0.6296, "lr": 1.3480567209909863e-05, "epoch": 3.777871979652395, "percentage": 75.78, "elapsed_time": "1 day, 10:16:32", "remaining_time": "10:57:12"}
|
558 |
+
{"current_steps": 558, "total_steps": 735, "loss": 0.6175, "lr": 1.333854371976505e-05, "epoch": 3.784654514624841, "percentage": 75.92, "elapsed_time": "1 day, 10:20:13", "remaining_time": "10:53:30"}
|
559 |
+
{"current_steps": 559, "total_steps": 735, "loss": 0.6259, "lr": 1.319712248387424e-05, "epoch": 3.791437049597287, "percentage": 76.05, "elapsed_time": "1 day, 10:23:53", "remaining_time": "10:49:48"}
|
560 |
+
{"current_steps": 560, "total_steps": 735, "loss": 0.6259, "lr": 1.3056306696794377e-05, "epoch": 3.798219584569733, "percentage": 76.19, "elapsed_time": "1 day, 10:27:34", "remaining_time": "10:46:06"}
|
561 |
+
{"current_steps": 561, "total_steps": 735, "loss": 0.623, "lr": 1.2916099539405997e-05, "epoch": 3.805002119542179, "percentage": 76.33, "elapsed_time": "1 day, 10:31:15", "remaining_time": "10:42:25"}
|
562 |
+
{"current_steps": 562, "total_steps": 735, "loss": 0.629, "lr": 1.2776504178841291e-05, "epoch": 3.811784654514625, "percentage": 76.46, "elapsed_time": "1 day, 10:34:56", "remaining_time": "10:38:43"}
|
563 |
+
{"current_steps": 563, "total_steps": 735, "loss": 0.6239, "lr": 1.2637523768412633e-05, "epoch": 3.8185671894870707, "percentage": 76.6, "elapsed_time": "1 day, 10:38:37", "remaining_time": "10:35:01"}
|
564 |
+
{"current_steps": 564, "total_steps": 735, "loss": 0.6213, "lr": 1.249916144754133e-05, "epoch": 3.8253497244595165, "percentage": 76.73, "elapsed_time": "1 day, 10:42:18", "remaining_time": "10:31:20"}
|
565 |
+
{"current_steps": 565, "total_steps": 735, "loss": 0.6205, "lr": 1.2361420341686641e-05, "epoch": 3.8321322594319627, "percentage": 76.87, "elapsed_time": "1 day, 10:45:59", "remaining_time": "10:27:38"}
|
566 |
+
{"current_steps": 566, "total_steps": 735, "loss": 0.6221, "lr": 1.22243035622753e-05, "epoch": 3.838914794404409, "percentage": 77.01, "elapsed_time": "1 day, 10:49:40", "remaining_time": "10:23:56"}
|
567 |
+
{"current_steps": 567, "total_steps": 735, "loss": 0.6212, "lr": 1.2087814206631095e-05, "epoch": 3.8456973293768546, "percentage": 77.14, "elapsed_time": "1 day, 10:53:21", "remaining_time": "10:20:15"}
|
568 |
+
{"current_steps": 568, "total_steps": 735, "loss": 0.6199, "lr": 1.1951955357905033e-05, "epoch": 3.8524798643493003, "percentage": 77.28, "elapsed_time": "1 day, 10:57:02", "remaining_time": "10:16:33"}
|
569 |
+
{"current_steps": 569, "total_steps": 735, "loss": 0.6198, "lr": 1.1816730085005603e-05, "epoch": 3.8592623993217465, "percentage": 77.41, "elapsed_time": "1 day, 11:00:43", "remaining_time": "10:12:51"}
|
570 |
+
{"current_steps": 570, "total_steps": 735, "loss": 0.6256, "lr": 1.1682141442529473e-05, "epoch": 3.8660449342941927, "percentage": 77.55, "elapsed_time": "1 day, 11:04:24", "remaining_time": "10:09:10"}
|
571 |
+
{"current_steps": 571, "total_steps": 735, "loss": 0.6157, "lr": 1.1548192470692516e-05, "epoch": 3.8728274692666385, "percentage": 77.69, "elapsed_time": "1 day, 11:08:05", "remaining_time": "10:05:28"}
|
572 |
+
{"current_steps": 572, "total_steps": 735, "loss": 0.6262, "lr": 1.1414886195261135e-05, "epoch": 3.879610004239084, "percentage": 77.82, "elapsed_time": "1 day, 11:11:46", "remaining_time": "10:01:46"}
|
573 |
+
{"current_steps": 573, "total_steps": 735, "loss": 0.6218, "lr": 1.128222562748384e-05, "epoch": 3.8863925392115304, "percentage": 77.96, "elapsed_time": "1 day, 11:15:27", "remaining_time": "9:58:05"}
|
574 |
+
{"current_steps": 574, "total_steps": 735, "loss": 0.6264, "lr": 1.1150213764023357e-05, "epoch": 3.893175074183976, "percentage": 78.1, "elapsed_time": "1 day, 11:19:09", "remaining_time": "9:54:23"}
|
575 |
+
{"current_steps": 575, "total_steps": 735, "loss": 0.6217, "lr": 1.1018853586888794e-05, "epoch": 3.8999576091564223, "percentage": 78.23, "elapsed_time": "1 day, 11:22:52", "remaining_time": "9:50:42"}
|
576 |
+
{"current_steps": 576, "total_steps": 735, "loss": 0.6271, "lr": 1.0888148063368411e-05, "epoch": 3.906740144128868, "percentage": 78.37, "elapsed_time": "1 day, 11:26:34", "remaining_time": "9:47:01"}
|
577 |
+
{"current_steps": 577, "total_steps": 735, "loss": 0.6246, "lr": 1.075810014596248e-05, "epoch": 3.9135226791013142, "percentage": 78.5, "elapsed_time": "1 day, 11:30:16", "remaining_time": "9:43:19"}
|
578 |
+
{"current_steps": 578, "total_steps": 735, "loss": 0.6186, "lr": 1.0628712772316682e-05, "epoch": 3.92030521407376, "percentage": 78.64, "elapsed_time": "1 day, 11:33:56", "remaining_time": "9:39:38"}
|
579 |
+
{"current_steps": 579, "total_steps": 735, "loss": 0.6237, "lr": 1.04999888651557e-05, "epoch": 3.927087749046206, "percentage": 78.78, "elapsed_time": "1 day, 11:37:37", "remaining_time": "9:35:56"}
|
580 |
+
{"current_steps": 580, "total_steps": 735, "loss": 0.6247, "lr": 1.0371931332217175e-05, "epoch": 3.933870284018652, "percentage": 78.91, "elapsed_time": "1 day, 11:41:18", "remaining_time": "9:32:14"}
|
581 |
+
{"current_steps": 581, "total_steps": 735, "loss": 0.623, "lr": 1.0244543066186102e-05, "epoch": 3.940652818991098, "percentage": 79.05, "elapsed_time": "1 day, 11:44:59", "remaining_time": "9:28:33"}
|
582 |
+
{"current_steps": 582, "total_steps": 735, "loss": 0.6311, "lr": 1.0117826944629425e-05, "epoch": 3.947435353963544, "percentage": 79.18, "elapsed_time": "1 day, 11:48:40", "remaining_time": "9:24:51"}
|
583 |
+
{"current_steps": 583, "total_steps": 735, "loss": 0.6352, "lr": 9.991785829931024e-06, "epoch": 3.9542178889359896, "percentage": 79.32, "elapsed_time": "1 day, 11:52:21", "remaining_time": "9:21:09"}
|
584 |
+
{"current_steps": 584, "total_steps": 735, "loss": 0.616, "lr": 9.866422569227133e-06, "epoch": 3.9610004239084358, "percentage": 79.46, "elapsed_time": "1 day, 11:56:02", "remaining_time": "9:17:28"}
|
585 |
+
{"current_steps": 585, "total_steps": 735, "loss": 0.6267, "lr": 9.74173999434192e-06, "epoch": 3.967782958880882, "percentage": 79.59, "elapsed_time": "1 day, 11:59:43", "remaining_time": "9:13:46"}
|
586 |
+
{"current_steps": 586, "total_steps": 735, "loss": 0.6228, "lr": 9.61774092172362e-06, "epoch": 3.9745654938533277, "percentage": 79.73, "elapsed_time": "1 day, 12:03:24", "remaining_time": "9:10:04"}
|
587 |
+
{"current_steps": 587, "total_steps": 735, "loss": 0.6249, "lr": 9.494428152380868e-06, "epoch": 3.9813480288257734, "percentage": 79.86, "elapsed_time": "1 day, 12:07:06", "remaining_time": "9:06:23"}
|
588 |
+
{"current_steps": 588, "total_steps": 735, "loss": 0.6327, "lr": 9.371804471819401e-06, "epoch": 3.9881305637982196, "percentage": 80.0, "elapsed_time": "1 day, 12:10:47", "remaining_time": "9:02:41"}
|
589 |
+
{"current_steps": 589, "total_steps": 735, "loss": 0.6303, "lr": 9.249872649979203e-06, "epoch": 3.994913098770666, "percentage": 80.14, "elapsed_time": "1 day, 12:14:28", "remaining_time": "8:59:00"}
|
590 |
+
{"current_steps": 590, "total_steps": 735, "loss": 0.947, "lr": 9.128635441171854e-06, "epoch": 4.001695633743111, "percentage": 80.27, "elapsed_time": "1 day, 12:19:44", "remaining_time": "8:55:41"}
|