Training in progress, epoch 4
Browse files
model-00001-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4877660776
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a067be9d34801d63561c233b216d553b4cbedda0b89fe91c9fd07ed6f8d84950
|
3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4932751008
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:de6cce5f8a23bd25d358bad7c8522b136b5906ed717c4e04d9dd8f2047537567
|
3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4330865200
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5db00ac5dbd78f78b33087892bb24fd28292d8cb2d1a1b71799a1f36b6380f9c
|
3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1089994880
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c28e145d07b9f2d85aebad83f6f8b5d6f74c456cc6b0074e12dea8a14a7c216c
|
3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
@@ -588,3 +588,149 @@
|
|
588 |
{"current_steps": 588, "total_steps": 735, "loss": 0.6327, "lr": 9.371804471819401e-06, "epoch": 3.9881305637982196, "percentage": 80.0, "elapsed_time": "1 day, 12:10:47", "remaining_time": "9:02:41"}
|
589 |
{"current_steps": 589, "total_steps": 735, "loss": 0.6303, "lr": 9.249872649979203e-06, "epoch": 3.994913098770666, "percentage": 80.14, "elapsed_time": "1 day, 12:14:28", "remaining_time": "8:59:00"}
|
590 |
{"current_steps": 590, "total_steps": 735, "loss": 0.947, "lr": 9.128635441171854e-06, "epoch": 4.001695633743111, "percentage": 80.27, "elapsed_time": "1 day, 12:19:44", "remaining_time": "8:55:41"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
588 |
{"current_steps": 588, "total_steps": 735, "loss": 0.6327, "lr": 9.371804471819401e-06, "epoch": 3.9881305637982196, "percentage": 80.0, "elapsed_time": "1 day, 12:10:47", "remaining_time": "9:02:41"}
|
589 |
{"current_steps": 589, "total_steps": 735, "loss": 0.6303, "lr": 9.249872649979203e-06, "epoch": 3.994913098770666, "percentage": 80.14, "elapsed_time": "1 day, 12:14:28", "remaining_time": "8:59:00"}
|
590 |
{"current_steps": 590, "total_steps": 735, "loss": 0.947, "lr": 9.128635441171854e-06, "epoch": 4.001695633743111, "percentage": 80.27, "elapsed_time": "1 day, 12:19:44", "remaining_time": "8:55:41"}
|
591 |
+
{"current_steps": 591, "total_steps": 735, "loss": 0.6138, "lr": 9.008095584018406e-06, "epoch": 4.008478168715557, "percentage": 80.41, "elapsed_time": "1 day, 12:23:25", "remaining_time": "8:52:00"}
|
592 |
+
{"current_steps": 592, "total_steps": 735, "loss": 0.6084, "lr": 8.888255801387417e-06, "epoch": 4.0152607036880035, "percentage": 80.54, "elapsed_time": "1 day, 12:27:06", "remaining_time": "8:48:18"}
|
593 |
+
{"current_steps": 593, "total_steps": 735, "loss": 0.6196, "lr": 8.76911880033354e-06, "epoch": 4.02204323866045, "percentage": 80.68, "elapsed_time": "1 day, 12:30:46", "remaining_time": "8:44:36"}
|
594 |
+
{"current_steps": 594, "total_steps": 735, "loss": 0.6193, "lr": 8.65068727203633e-06, "epoch": 4.028825773632895, "percentage": 80.82, "elapsed_time": "1 day, 12:34:27", "remaining_time": "8:40:54"}
|
595 |
+
{"current_steps": 595, "total_steps": 735, "loss": 0.5971, "lr": 8.53296389173941e-06, "epoch": 4.035608308605341, "percentage": 80.95, "elapsed_time": "1 day, 12:38:08", "remaining_time": "8:37:12"}
|
596 |
+
{"current_steps": 596, "total_steps": 735, "loss": 0.6085, "lr": 8.415951318690134e-06, "epoch": 4.042390843577787, "percentage": 81.09, "elapsed_time": "1 day, 12:41:48", "remaining_time": "8:33:30"}
|
597 |
+
{"current_steps": 597, "total_steps": 735, "loss": 0.6001, "lr": 8.299652196079462e-06, "epoch": 4.0491733785502335, "percentage": 81.22, "elapsed_time": "1 day, 12:45:30", "remaining_time": "8:29:48"}
|
598 |
+
{"current_steps": 598, "total_steps": 735, "loss": 0.6105, "lr": 8.184069150982217e-06, "epoch": 4.055955913522679, "percentage": 81.36, "elapsed_time": "1 day, 12:49:11", "remaining_time": "8:26:07"}
|
599 |
+
{"current_steps": 599, "total_steps": 735, "loss": 0.6055, "lr": 8.069204794297843e-06, "epoch": 4.062738448495125, "percentage": 81.5, "elapsed_time": "1 day, 12:52:52", "remaining_time": "8:22:25"}
|
600 |
+
{"current_steps": 600, "total_steps": 735, "loss": 0.6032, "lr": 7.955061720691315e-06, "epoch": 4.069520983467571, "percentage": 81.63, "elapsed_time": "1 day, 12:56:34", "remaining_time": "8:18:43"}
|
601 |
+
{"current_steps": 601, "total_steps": 735, "loss": 0.6123, "lr": 7.841642508534617e-06, "epoch": 4.076303518440017, "percentage": 81.77, "elapsed_time": "1 day, 13:00:16", "remaining_time": "8:15:02"}
|
602 |
+
{"current_steps": 602, "total_steps": 735, "loss": 0.6153, "lr": 7.728949719848464e-06, "epoch": 4.083086053412463, "percentage": 81.9, "elapsed_time": "1 day, 13:03:57", "remaining_time": "8:11:20"}
|
603 |
+
{"current_steps": 603, "total_steps": 735, "loss": 0.6168, "lr": 7.6169859002443954e-06, "epoch": 4.089868588384909, "percentage": 82.04, "elapsed_time": "1 day, 13:07:38", "remaining_time": "8:07:38"}
|
604 |
+
{"current_steps": 604, "total_steps": 735, "loss": 0.6151, "lr": 7.505753578867354e-06, "epoch": 4.096651123357355, "percentage": 82.18, "elapsed_time": "1 day, 13:11:18", "remaining_time": "8:03:56"}
|
605 |
+
{"current_steps": 605, "total_steps": 735, "loss": 0.6166, "lr": 7.395255268338459e-06, "epoch": 4.1034336583298, "percentage": 82.31, "elapsed_time": "1 day, 13:14:59", "remaining_time": "8:00:14"}
|
606 |
+
{"current_steps": 606, "total_steps": 735, "loss": 0.6103, "lr": 7.285493464698343e-06, "epoch": 4.1102161933022465, "percentage": 82.45, "elapsed_time": "1 day, 13:18:40", "remaining_time": "7:56:32"}
|
607 |
+
{"current_steps": 607, "total_steps": 735, "loss": 0.6213, "lr": 7.176470647350675e-06, "epoch": 4.116998728274693, "percentage": 82.59, "elapsed_time": "1 day, 13:22:21", "remaining_time": "7:52:51"}
|
608 |
+
{"current_steps": 608, "total_steps": 735, "loss": 0.6099, "lr": 7.068189279006237e-06, "epoch": 4.123781263247139, "percentage": 82.72, "elapsed_time": "1 day, 13:26:02", "remaining_time": "7:49:09"}
|
609 |
+
{"current_steps": 609, "total_steps": 735, "loss": 0.5961, "lr": 6.960651805627248e-06, "epoch": 4.130563798219584, "percentage": 82.86, "elapsed_time": "1 day, 13:29:43", "remaining_time": "7:45:27"}
|
610 |
+
{"current_steps": 610, "total_steps": 735, "loss": 0.6001, "lr": 6.853860656372125e-06, "epoch": 4.13734633319203, "percentage": 82.99, "elapsed_time": "1 day, 13:33:25", "remaining_time": "7:41:46"}
|
611 |
+
{"current_steps": 611, "total_steps": 735, "loss": 0.6068, "lr": 6.747818243540587e-06, "epoch": 4.144128868164477, "percentage": 83.13, "elapsed_time": "1 day, 13:37:06", "remaining_time": "7:38:04"}
|
612 |
+
{"current_steps": 612, "total_steps": 735, "loss": 0.6083, "lr": 6.642526962519218e-06, "epoch": 4.150911403136923, "percentage": 83.27, "elapsed_time": "1 day, 13:40:47", "remaining_time": "7:34:22"}
|
613 |
+
{"current_steps": 613, "total_steps": 735, "loss": 0.6026, "lr": 6.537989191727292e-06, "epoch": 4.157693938109368, "percentage": 83.4, "elapsed_time": "1 day, 13:44:29", "remaining_time": "7:30:40"}
|
614 |
+
{"current_steps": 614, "total_steps": 735, "loss": 0.6019, "lr": 6.4342072925631125e-06, "epoch": 4.164476473081814, "percentage": 83.54, "elapsed_time": "1 day, 13:48:10", "remaining_time": "7:26:59"}
|
615 |
+
{"current_steps": 615, "total_steps": 735, "loss": 0.5954, "lr": 6.331183609350602e-06, "epoch": 4.17125900805426, "percentage": 83.67, "elapsed_time": "1 day, 13:51:51", "remaining_time": "7:23:17"}
|
616 |
+
{"current_steps": 616, "total_steps": 735, "loss": 0.6117, "lr": 6.228920469286408e-06, "epoch": 4.178041543026707, "percentage": 83.81, "elapsed_time": "1 day, 13:55:32", "remaining_time": "7:19:35"}
|
617 |
+
{"current_steps": 617, "total_steps": 735, "loss": 0.5946, "lr": 6.127420182387314e-06, "epoch": 4.184824077999152, "percentage": 83.95, "elapsed_time": "1 day, 13:59:13", "remaining_time": "7:15:53"}
|
618 |
+
{"current_steps": 618, "total_steps": 735, "loss": 0.6034, "lr": 6.026685041438018e-06, "epoch": 4.191606612971598, "percentage": 84.08, "elapsed_time": "1 day, 14:02:54", "remaining_time": "7:12:12"}
|
619 |
+
{"current_steps": 619, "total_steps": 735, "loss": 0.6048, "lr": 5.926717321939417e-06, "epoch": 4.198389147944044, "percentage": 84.22, "elapsed_time": "1 day, 14:06:35", "remaining_time": "7:08:30"}
|
620 |
+
{"current_steps": 620, "total_steps": 735, "loss": 0.6037, "lr": 5.827519282057128e-06, "epoch": 4.2051716829164905, "percentage": 84.35, "elapsed_time": "1 day, 14:10:17", "remaining_time": "7:04:48"}
|
621 |
+
{"current_steps": 621, "total_steps": 735, "loss": 0.607, "lr": 5.729093162570545e-06, "epoch": 4.211954217888936, "percentage": 84.49, "elapsed_time": "1 day, 14:13:57", "remaining_time": "7:01:06"}
|
622 |
+
{"current_steps": 622, "total_steps": 735, "loss": 0.6135, "lr": 5.631441186822168e-06, "epoch": 4.218736752861382, "percentage": 84.63, "elapsed_time": "1 day, 14:17:38", "remaining_time": "6:57:24"}
|
623 |
+
{"current_steps": 623, "total_steps": 735, "loss": 0.5981, "lr": 5.534565560667426e-06, "epoch": 4.225519287833828, "percentage": 84.76, "elapsed_time": "1 day, 14:21:19", "remaining_time": "6:53:43"}
|
624 |
+
{"current_steps": 624, "total_steps": 735, "loss": 0.6118, "lr": 5.4384684724248096e-06, "epoch": 4.232301822806273, "percentage": 84.9, "elapsed_time": "1 day, 14:25:00", "remaining_time": "6:50:01"}
|
625 |
+
{"current_steps": 625, "total_steps": 735, "loss": 0.6184, "lr": 5.343152092826476e-06, "epoch": 4.23908435777872, "percentage": 85.03, "elapsed_time": "1 day, 14:28:42", "remaining_time": "6:46:19"}
|
626 |
+
{"current_steps": 626, "total_steps": 735, "loss": 0.6058, "lr": 5.2486185749691665e-06, "epoch": 4.245866892751166, "percentage": 85.17, "elapsed_time": "1 day, 14:32:23", "remaining_time": "6:42:38"}
|
627 |
+
{"current_steps": 627, "total_steps": 735, "loss": 0.6071, "lr": 5.154870054265635e-06, "epoch": 4.252649427723612, "percentage": 85.31, "elapsed_time": "1 day, 14:36:04", "remaining_time": "6:38:56"}
|
628 |
+
{"current_steps": 628, "total_steps": 735, "loss": 0.6019, "lr": 5.061908648396338e-06, "epoch": 4.259431962696057, "percentage": 85.44, "elapsed_time": "1 day, 14:39:45", "remaining_time": "6:35:14"}
|
629 |
+
{"current_steps": 629, "total_steps": 735, "loss": 0.604, "lr": 4.969736457261669e-06, "epoch": 4.2662144976685035, "percentage": 85.58, "elapsed_time": "1 day, 14:43:27", "remaining_time": "6:31:33"}
|
630 |
+
{"current_steps": 630, "total_steps": 735, "loss": 0.6103, "lr": 4.878355562934465e-06, "epoch": 4.27299703264095, "percentage": 85.71, "elapsed_time": "1 day, 14:47:08", "remaining_time": "6:27:51"}
|
631 |
+
{"current_steps": 631, "total_steps": 735, "loss": 0.6102, "lr": 4.787768029613014e-06, "epoch": 4.279779567613396, "percentage": 85.85, "elapsed_time": "1 day, 14:50:48", "remaining_time": "6:24:09"}
|
632 |
+
{"current_steps": 632, "total_steps": 735, "loss": 0.6044, "lr": 4.697975903574419e-06, "epoch": 4.286562102585841, "percentage": 85.99, "elapsed_time": "1 day, 14:54:30", "remaining_time": "6:20:27"}
|
633 |
+
{"current_steps": 633, "total_steps": 735, "loss": 0.6104, "lr": 4.608981213128347e-06, "epoch": 4.293344637558287, "percentage": 86.12, "elapsed_time": "1 day, 14:58:11", "remaining_time": "6:16:46"}
|
634 |
+
{"current_steps": 634, "total_steps": 735, "loss": 0.6103, "lr": 4.520785968571266e-06, "epoch": 4.3001271725307335, "percentage": 86.26, "elapsed_time": "1 day, 15:01:51", "remaining_time": "6:13:04"}
|
635 |
+
{"current_steps": 635, "total_steps": 735, "loss": 0.6127, "lr": 4.433392162140968e-06, "epoch": 4.30690970750318, "percentage": 86.39, "elapsed_time": "1 day, 15:05:33", "remaining_time": "6:09:22"}
|
636 |
+
{"current_steps": 636, "total_steps": 735, "loss": 0.6258, "lr": 4.3468017679716245e-06, "epoch": 4.313692242475625, "percentage": 86.53, "elapsed_time": "1 day, 15:09:14", "remaining_time": "6:05:41"}
|
637 |
+
{"current_steps": 637, "total_steps": 735, "loss": 0.617, "lr": 4.261016742049155e-06, "epoch": 4.320474777448071, "percentage": 86.67, "elapsed_time": "1 day, 15:12:55", "remaining_time": "6:01:59"}
|
638 |
+
{"current_steps": 638, "total_steps": 735, "loss": 0.6086, "lr": 4.176039022167064e-06, "epoch": 4.327257312420517, "percentage": 86.8, "elapsed_time": "1 day, 15:16:35", "remaining_time": "5:58:17"}
|
639 |
+
{"current_steps": 639, "total_steps": 735, "loss": 0.6108, "lr": 4.0918705278826685e-06, "epoch": 4.3340398473929636, "percentage": 86.94, "elapsed_time": "1 day, 15:20:16", "remaining_time": "5:54:35"}
|
640 |
+
{"current_steps": 640, "total_steps": 735, "loss": 0.6122, "lr": 4.008513160473726e-06, "epoch": 4.340822382365409, "percentage": 87.07, "elapsed_time": "1 day, 15:23:57", "remaining_time": "5:50:54"}
|
641 |
+
{"current_steps": 641, "total_steps": 735, "loss": 0.6059, "lr": 3.925968802895477e-06, "epoch": 4.347604917337855, "percentage": 87.21, "elapsed_time": "1 day, 15:27:38", "remaining_time": "5:47:12"}
|
642 |
+
{"current_steps": 642, "total_steps": 735, "loss": 0.6159, "lr": 3.8442393197381456e-06, "epoch": 4.354387452310301, "percentage": 87.35, "elapsed_time": "1 day, 15:31:19", "remaining_time": "5:43:30"}
|
643 |
+
{"current_steps": 643, "total_steps": 735, "loss": 0.6053, "lr": 3.7633265571847787e-06, "epoch": 4.3611699872827465, "percentage": 87.48, "elapsed_time": "1 day, 15:35:00", "remaining_time": "5:39:48"}
|
644 |
+
{"current_steps": 644, "total_steps": 735, "loss": 0.6185, "lr": 3.683232342969594e-06, "epoch": 4.367952522255193, "percentage": 87.62, "elapsed_time": "1 day, 15:38:41", "remaining_time": "5:36:07"}
|
645 |
+
{"current_steps": 645, "total_steps": 735, "loss": 0.6311, "lr": 3.603958486336625e-06, "epoch": 4.374735057227639, "percentage": 87.76, "elapsed_time": "1 day, 15:42:21", "remaining_time": "5:32:25"}
|
646 |
+
{"current_steps": 646, "total_steps": 735, "loss": 0.6158, "lr": 3.5255067779989173e-06, "epoch": 4.381517592200085, "percentage": 87.89, "elapsed_time": "1 day, 15:46:02", "remaining_time": "5:28:43"}
|
647 |
+
{"current_steps": 647, "total_steps": 735, "loss": 0.6176, "lr": 3.4478789900980545e-06, "epoch": 4.38830012717253, "percentage": 88.03, "elapsed_time": "1 day, 15:49:44", "remaining_time": "5:25:02"}
|
648 |
+
{"current_steps": 648, "total_steps": 735, "loss": 0.614, "lr": 3.371076876164101e-06, "epoch": 4.395082662144977, "percentage": 88.16, "elapsed_time": "1 day, 15:53:25", "remaining_time": "5:21:20"}
|
649 |
+
{"current_steps": 649, "total_steps": 735, "loss": 0.6098, "lr": 3.295102171076039e-06, "epoch": 4.401865197117423, "percentage": 88.3, "elapsed_time": "1 day, 15:57:06", "remaining_time": "5:17:38"}
|
650 |
+
{"current_steps": 650, "total_steps": 735, "loss": 0.5976, "lr": 3.2199565910225305e-06, "epoch": 4.408647732089869, "percentage": 88.44, "elapsed_time": "1 day, 16:00:48", "remaining_time": "5:13:57"}
|
651 |
+
{"current_steps": 651, "total_steps": 735, "loss": 0.6164, "lr": 3.145641833463198e-06, "epoch": 4.415430267062314, "percentage": 88.57, "elapsed_time": "1 day, 16:04:29", "remaining_time": "5:10:15"}
|
652 |
+
{"current_steps": 652, "total_steps": 735, "loss": 0.6156, "lr": 3.0721595770902435e-06, "epoch": 4.42221280203476, "percentage": 88.71, "elapsed_time": "1 day, 16:08:10", "remaining_time": "5:06:33"}
|
653 |
+
{"current_steps": 653, "total_steps": 735, "loss": 0.6001, "lr": 2.9995114817905493e-06, "epoch": 4.428995337007207, "percentage": 88.84, "elapsed_time": "1 day, 16:11:51", "remaining_time": "5:02:52"}
|
654 |
+
{"current_steps": 654, "total_steps": 735, "loss": 0.607, "lr": 2.927699188608171e-06, "epoch": 4.435777871979653, "percentage": 88.98, "elapsed_time": "1 day, 16:15:32", "remaining_time": "4:59:10"}
|
655 |
+
{"current_steps": 655, "total_steps": 735, "loss": 0.6169, "lr": 2.856724319707289e-06, "epoch": 4.442560406952098, "percentage": 89.12, "elapsed_time": "1 day, 16:19:14", "remaining_time": "4:55:28"}
|
656 |
+
{"current_steps": 656, "total_steps": 735, "loss": 0.6179, "lr": 2.7865884783355234e-06, "epoch": 4.449342941924544, "percentage": 89.25, "elapsed_time": "1 day, 16:22:55", "remaining_time": "4:51:47"}
|
657 |
+
{"current_steps": 657, "total_steps": 735, "loss": 0.6201, "lr": 2.717293248787769e-06, "epoch": 4.4561254768969905, "percentage": 89.39, "elapsed_time": "1 day, 16:26:37", "remaining_time": "4:48:05"}
|
658 |
+
{"current_steps": 658, "total_steps": 735, "loss": 0.6019, "lr": 2.648840196370368e-06, "epoch": 4.462908011869436, "percentage": 89.52, "elapsed_time": "1 day, 16:30:17", "remaining_time": "4:44:23"}
|
659 |
+
{"current_steps": 659, "total_steps": 735, "loss": 0.5977, "lr": 2.5812308673657825e-06, "epoch": 4.469690546841882, "percentage": 89.66, "elapsed_time": "1 day, 16:33:59", "remaining_time": "4:40:42"}
|
660 |
+
{"current_steps": 660, "total_steps": 735, "loss": 0.6017, "lr": 2.5144667889976316e-06, "epoch": 4.476473081814328, "percentage": 89.8, "elapsed_time": "1 day, 16:37:40", "remaining_time": "4:37:00"}
|
661 |
+
{"current_steps": 661, "total_steps": 735, "loss": 0.6086, "lr": 2.4485494693962197e-06, "epoch": 4.483255616786774, "percentage": 89.93, "elapsed_time": "1 day, 16:41:21", "remaining_time": "4:33:18"}
|
662 |
+
{"current_steps": 662, "total_steps": 735, "loss": 0.6182, "lr": 2.3834803975644772e-06, "epoch": 4.49003815175922, "percentage": 90.07, "elapsed_time": "1 day, 16:45:02", "remaining_time": "4:29:37"}
|
663 |
+
{"current_steps": 663, "total_steps": 735, "loss": 0.6074, "lr": 2.3192610433442784e-06, "epoch": 4.496820686731666, "percentage": 90.2, "elapsed_time": "1 day, 16:48:43", "remaining_time": "4:25:55"}
|
664 |
+
{"current_steps": 664, "total_steps": 735, "loss": 0.6076, "lr": 2.2558928573833016e-06, "epoch": 4.503603221704112, "percentage": 90.34, "elapsed_time": "1 day, 16:52:25", "remaining_time": "4:22:13"}
|
665 |
+
{"current_steps": 665, "total_steps": 735, "loss": 0.6019, "lr": 2.1933772711021995e-06, "epoch": 4.510385756676558, "percentage": 90.48, "elapsed_time": "1 day, 16:56:07", "remaining_time": "4:18:32"}
|
666 |
+
{"current_steps": 666, "total_steps": 735, "loss": 0.5995, "lr": 2.1317156966623243e-06, "epoch": 4.5171682916490035, "percentage": 90.61, "elapsed_time": "1 day, 16:59:48", "remaining_time": "4:14:50"}
|
667 |
+
{"current_steps": 667, "total_steps": 735, "loss": 0.6023, "lr": 2.0709095269337755e-06, "epoch": 4.52395082662145, "percentage": 90.75, "elapsed_time": "1 day, 17:03:30", "remaining_time": "4:11:09"}
|
668 |
+
{"current_steps": 668, "total_steps": 735, "loss": 0.6143, "lr": 2.0109601354639706e-06, "epoch": 4.530733361593896, "percentage": 90.88, "elapsed_time": "1 day, 17:07:10", "remaining_time": "4:07:27"}
|
669 |
+
{"current_steps": 669, "total_steps": 735, "loss": 0.6143, "lr": 1.9518688764466096e-06, "epoch": 4.537515896566342, "percentage": 91.02, "elapsed_time": "1 day, 17:10:51", "remaining_time": "4:03:45"}
|
670 |
+
{"current_steps": 670, "total_steps": 735, "loss": 0.6092, "lr": 1.8936370846910845e-06, "epoch": 4.544298431538787, "percentage": 91.16, "elapsed_time": "1 day, 17:14:32", "remaining_time": "4:00:04"}
|
671 |
+
{"current_steps": 671, "total_steps": 735, "loss": 0.6186, "lr": 1.8362660755923079e-06, "epoch": 4.5510809665112335, "percentage": 91.29, "elapsed_time": "1 day, 17:18:13", "remaining_time": "3:56:22"}
|
672 |
+
{"current_steps": 672, "total_steps": 735, "loss": 0.5983, "lr": 1.7797571451010442e-06, "epoch": 4.55786350148368, "percentage": 91.43, "elapsed_time": "1 day, 17:21:55", "remaining_time": "3:52:40"}
|
673 |
+
{"current_steps": 673, "total_steps": 735, "loss": 0.6132, "lr": 1.7241115696945821e-06, "epoch": 4.564646036456125, "percentage": 91.56, "elapsed_time": "1 day, 17:25:36", "remaining_time": "3:48:59"}
|
674 |
+
{"current_steps": 674, "total_steps": 735, "loss": 0.5962, "lr": 1.669330606347952e-06, "epoch": 4.571428571428571, "percentage": 91.7, "elapsed_time": "1 day, 17:29:17", "remaining_time": "3:45:17"}
|
675 |
+
{"current_steps": 675, "total_steps": 735, "loss": 0.6141, "lr": 1.6154154925054878e-06, "epoch": 4.578211106401017, "percentage": 91.84, "elapsed_time": "1 day, 17:32:58", "remaining_time": "3:41:35"}
|
676 |
+
{"current_steps": 676, "total_steps": 735, "loss": 0.6024, "lr": 1.5623674460529014e-06, "epoch": 4.5849936413734635, "percentage": 91.97, "elapsed_time": "1 day, 17:36:39", "remaining_time": "3:37:54"}
|
677 |
+
{"current_steps": 677, "total_steps": 735, "loss": 0.6086, "lr": 1.510187665289773e-06, "epoch": 4.59177617634591, "percentage": 92.11, "elapsed_time": "1 day, 17:40:20", "remaining_time": "3:34:12"}
|
678 |
+
{"current_steps": 678, "total_steps": 735, "loss": 0.6052, "lr": 1.458877328902455e-06, "epoch": 4.598558711318355, "percentage": 92.24, "elapsed_time": "1 day, 17:44:01", "remaining_time": "3:30:30"}
|
679 |
+
{"current_steps": 679, "total_steps": 735, "loss": 0.6072, "lr": 1.4084375959374864e-06, "epoch": 4.605341246290801, "percentage": 92.38, "elapsed_time": "1 day, 17:47:43", "remaining_time": "3:26:49"}
|
680 |
+
{"current_steps": 680, "total_steps": 735, "loss": 0.6089, "lr": 1.3588696057753725e-06, "epoch": 4.612123781263247, "percentage": 92.52, "elapsed_time": "1 day, 17:51:24", "remaining_time": "3:23:07"}
|
681 |
+
{"current_steps": 681, "total_steps": 735, "loss": 0.6016, "lr": 1.3101744781048774e-06, "epoch": 4.618906316235693, "percentage": 92.65, "elapsed_time": "1 day, 17:55:04", "remaining_time": "3:19:26"}
|
682 |
+
{"current_steps": 682, "total_steps": 735, "loss": 0.6075, "lr": 1.262353312897715e-06, "epoch": 4.625688851208139, "percentage": 92.79, "elapsed_time": "1 day, 17:58:45", "remaining_time": "3:15:44"}
|
683 |
+
{"current_steps": 683, "total_steps": 735, "loss": 0.6157, "lr": 1.2154071903837107e-06, "epoch": 4.632471386180585, "percentage": 92.93, "elapsed_time": "1 day, 18:02:26", "remaining_time": "3:12:02"}
|
684 |
+
{"current_steps": 684, "total_steps": 735, "loss": 0.6049, "lr": 1.1693371710263857e-06, "epoch": 4.639253921153031, "percentage": 93.06, "elapsed_time": "1 day, 18:06:07", "remaining_time": "3:08:21"}
|
685 |
+
{"current_steps": 685, "total_steps": 735, "loss": 0.6048, "lr": 1.1241442954990301e-06, "epoch": 4.6460364561254766, "percentage": 93.2, "elapsed_time": "1 day, 18:09:48", "remaining_time": "3:04:39"}
|
686 |
+
{"current_steps": 686, "total_steps": 735, "loss": 0.5989, "lr": 1.0798295846611562e-06, "epoch": 4.652818991097923, "percentage": 93.33, "elapsed_time": "1 day, 18:13:29", "remaining_time": "3:00:57"}
|
687 |
+
{"current_steps": 687, "total_steps": 735, "loss": 0.6098, "lr": 1.0363940395354777e-06, "epoch": 4.659601526070369, "percentage": 93.47, "elapsed_time": "1 day, 18:17:11", "remaining_time": "2:57:16"}
|
688 |
+
{"current_steps": 688, "total_steps": 735, "loss": 0.6149, "lr": 9.938386412852652e-07, "epoch": 4.666384061042815, "percentage": 93.61, "elapsed_time": "1 day, 18:20:52", "remaining_time": "2:53:34"}
|
689 |
+
{"current_steps": 689, "total_steps": 735, "loss": 0.6088, "lr": 9.52164351192213e-07, "epoch": 4.67316659601526, "percentage": 93.74, "elapsed_time": "1 day, 18:24:33", "remaining_time": "2:49:53"}
|
690 |
+
{"current_steps": 690, "total_steps": 735, "loss": 0.5989, "lr": 9.113721106346918e-07, "epoch": 4.679949130987707, "percentage": 93.88, "elapsed_time": "1 day, 18:28:14", "remaining_time": "2:46:11"}
|
691 |
+
{"current_steps": 691, "total_steps": 735, "loss": 0.6172, "lr": 8.714628410665082e-07, "epoch": 4.686731665960153, "percentage": 94.01, "elapsed_time": "1 day, 18:31:56", "remaining_time": "2:42:29"}
|
692 |
+
{"current_steps": 692, "total_steps": 735, "loss": 0.6067, "lr": 8.324374439960947e-07, "epoch": 4.693514200932599, "percentage": 94.15, "elapsed_time": "1 day, 18:35:37", "remaining_time": "2:38:48"}
|
693 |
+
{"current_steps": 693, "total_steps": 735, "loss": 0.6142, "lr": 7.942968009661123e-07, "epoch": 4.700296735905044, "percentage": 94.29, "elapsed_time": "1 day, 18:39:19", "remaining_time": "2:35:06"}
|
694 |
+
{"current_steps": 694, "total_steps": 735, "loss": 0.614, "lr": 7.570417735335733e-07, "epoch": 4.7070792708774905, "percentage": 94.42, "elapsed_time": "1 day, 18:42:59", "remaining_time": "2:31:24"}
|
695 |
+
{"current_steps": 695, "total_steps": 735, "loss": 0.5969, "lr": 7.206732032503638e-07, "epoch": 4.713861805849937, "percentage": 94.56, "elapsed_time": "1 day, 18:46:39", "remaining_time": "2:27:43"}
|
696 |
+
{"current_steps": 696, "total_steps": 735, "loss": 0.6122, "lr": 6.851919116442274e-07, "epoch": 4.720644340822382, "percentage": 94.69, "elapsed_time": "1 day, 18:50:20", "remaining_time": "2:24:01"}
|
697 |
+
{"current_steps": 697, "total_steps": 735, "loss": 0.6092, "lr": 6.505987002002245e-07, "epoch": 4.727426875794828, "percentage": 94.83, "elapsed_time": "1 day, 18:54:01", "remaining_time": "2:20:20"}
|
698 |
+
{"current_steps": 698, "total_steps": 735, "loss": 0.6038, "lr": 6.168943503426139e-07, "epoch": 4.734209410767274, "percentage": 94.97, "elapsed_time": "1 day, 18:57:42", "remaining_time": "2:16:38"}
|
699 |
+
{"current_steps": 699, "total_steps": 735, "loss": 0.5943, "lr": 5.840796234172085e-07, "epoch": 4.7409919457397205, "percentage": 95.1, "elapsed_time": "1 day, 19:01:23", "remaining_time": "2:12:56"}
|
700 |
+
{"current_steps": 700, "total_steps": 735, "loss": 0.6066, "lr": 5.521552606741765e-07, "epoch": 4.747774480712166, "percentage": 95.24, "elapsed_time": "1 day, 19:05:04", "remaining_time": "2:09:15"}
|
701 |
+
{"current_steps": 701, "total_steps": 735, "loss": 0.6114, "lr": 5.211219832512893e-07, "epoch": 4.754557015684612, "percentage": 95.37, "elapsed_time": "1 day, 19:08:46", "remaining_time": "2:05:33"}
|
702 |
+
{"current_steps": 702, "total_steps": 735, "loss": 0.6185, "lr": 4.909804921576466e-07, "epoch": 4.761339550657058, "percentage": 95.51, "elapsed_time": "1 day, 19:12:27", "remaining_time": "2:01:52"}
|
703 |
+
{"current_steps": 703, "total_steps": 735, "loss": 0.6067, "lr": 4.6173146825782224e-07, "epoch": 4.768122085629504, "percentage": 95.65, "elapsed_time": "1 day, 19:16:07", "remaining_time": "1:58:10"}
|
704 |
+
{"current_steps": 704, "total_steps": 735, "loss": 0.6047, "lr": 4.3337557225650695e-07, "epoch": 4.77490462060195, "percentage": 95.78, "elapsed_time": "1 day, 19:19:48", "remaining_time": "1:54:28"}
|
705 |
+
{"current_steps": 705, "total_steps": 735, "loss": 0.6118, "lr": 4.0591344468355666e-07, "epoch": 4.781687155574396, "percentage": 95.92, "elapsed_time": "1 day, 19:23:29", "remaining_time": "1:50:47"}
|
706 |
+
{"current_steps": 706, "total_steps": 735, "loss": 0.6189, "lr": 3.793457058795591e-07, "epoch": 4.788469690546842, "percentage": 96.05, "elapsed_time": "1 day, 19:27:10", "remaining_time": "1:47:05"}
|
707 |
+
{"current_steps": 707, "total_steps": 735, "loss": 0.6085, "lr": 3.5367295598178307e-07, "epoch": 4.795252225519288, "percentage": 96.19, "elapsed_time": "1 day, 19:30:51", "remaining_time": "1:43:24"}
|
708 |
+
{"current_steps": 708, "total_steps": 735, "loss": 0.6045, "lr": 3.2889577491064693e-07, "epoch": 4.8020347604917335, "percentage": 96.33, "elapsed_time": "1 day, 19:34:32", "remaining_time": "1:39:42"}
|
709 |
+
{"current_steps": 709, "total_steps": 735, "loss": 0.6122, "lr": 3.050147223566091e-07, "epoch": 4.80881729546418, "percentage": 96.46, "elapsed_time": "1 day, 19:38:13", "remaining_time": "1:36:00"}
|
710 |
+
{"current_steps": 710, "total_steps": 735, "loss": 0.6033, "lr": 2.8203033776752487e-07, "epoch": 4.815599830436626, "percentage": 96.6, "elapsed_time": "1 day, 19:41:54", "remaining_time": "1:32:19"}
|
711 |
+
{"current_steps": 711, "total_steps": 735, "loss": 0.6094, "lr": 2.599431403364694e-07, "epoch": 4.822382365409071, "percentage": 96.73, "elapsed_time": "1 day, 19:45:35", "remaining_time": "1:28:37"}
|
712 |
+
{"current_steps": 712, "total_steps": 735, "loss": 0.604, "lr": 2.3875362899000054e-07, "epoch": 4.829164900381517, "percentage": 96.87, "elapsed_time": "1 day, 19:49:16", "remaining_time": "1:24:56"}
|
713 |
+
{"current_steps": 713, "total_steps": 735, "loss": 0.6087, "lr": 2.1846228237689226e-07, "epoch": 4.8359474353539635, "percentage": 97.01, "elapsed_time": "1 day, 19:52:58", "remaining_time": "1:21:14"}
|
714 |
+
{"current_steps": 714, "total_steps": 735, "loss": 0.6091, "lr": 1.9906955885732104e-07, "epoch": 4.84272997032641, "percentage": 97.14, "elapsed_time": "1 day, 19:56:39", "remaining_time": "1:17:32"}
|
715 |
+
{"current_steps": 715, "total_steps": 735, "loss": 0.6146, "lr": 1.8057589649251862e-07, "epoch": 4.849512505298856, "percentage": 97.28, "elapsed_time": "1 day, 20:00:20", "remaining_time": "1:13:51"}
|
716 |
+
{"current_steps": 716, "total_steps": 735, "loss": 0.6042, "lr": 1.62981713034851e-07, "epoch": 4.856295040271301, "percentage": 97.41, "elapsed_time": "1 day, 20:04:01", "remaining_time": "1:10:09"}
|
717 |
+
{"current_steps": 717, "total_steps": 735, "loss": 0.6086, "lr": 1.462874059184305e-07, "epoch": 4.863077575243747, "percentage": 97.55, "elapsed_time": "1 day, 20:07:42", "remaining_time": "1:06:28"}
|
718 |
+
{"current_steps": 718, "total_steps": 735, "loss": 0.6295, "lr": 1.3049335225009175e-07, "epoch": 4.869860110216194, "percentage": 97.69, "elapsed_time": "1 day, 20:11:23", "remaining_time": "1:02:46"}
|
719 |
+
{"current_steps": 719, "total_steps": 735, "loss": 0.6085, "lr": 1.1559990880089189e-07, "epoch": 4.876642645188639, "percentage": 97.82, "elapsed_time": "1 day, 20:15:03", "remaining_time": "0:59:05"}
|
720 |
+
{"current_steps": 720, "total_steps": 735, "loss": 0.5998, "lr": 1.0160741199805036e-07, "epoch": 4.883425180161085, "percentage": 97.96, "elapsed_time": "1 day, 20:18:44", "remaining_time": "0:55:23"}
|
721 |
+
{"current_steps": 721, "total_steps": 735, "loss": 0.6145, "lr": 8.851617791735933e-08, "epoch": 4.890207715133531, "percentage": 98.1, "elapsed_time": "1 day, 20:22:24", "remaining_time": "0:51:41"}
|
722 |
+
{"current_steps": 722, "total_steps": 735, "loss": 0.604, "lr": 7.632650227602511e-08, "epoch": 4.896990250105977, "percentage": 98.23, "elapsed_time": "1 day, 20:26:06", "remaining_time": "0:48:00"}
|
723 |
+
{"current_steps": 723, "total_steps": 735, "loss": 0.6187, "lr": 6.503866042599338e-08, "epoch": 4.903772785078423, "percentage": 98.37, "elapsed_time": "1 day, 20:29:47", "remaining_time": "0:44:18"}
|
724 |
+
{"current_steps": 724, "total_steps": 735, "loss": 0.6166, "lr": 5.4652907347745307e-08, "epoch": 4.910555320050869, "percentage": 98.5, "elapsed_time": "1 day, 20:33:28", "remaining_time": "0:40:37"}
|
725 |
+
{"current_steps": 725, "total_steps": 735, "loss": 0.6156, "lr": 4.516947764451107e-08, "epoch": 4.917337855023315, "percentage": 98.64, "elapsed_time": "1 day, 20:37:10", "remaining_time": "0:36:55"}
|
726 |
+
{"current_steps": 726, "total_steps": 735, "loss": 0.6085, "lr": 3.6588585537002955e-08, "epoch": 4.924120389995761, "percentage": 98.78, "elapsed_time": "1 day, 20:40:52", "remaining_time": "0:33:14"}
|
727 |
+
{"current_steps": 727, "total_steps": 735, "loss": 0.6026, "lr": 2.8910424858543673e-08, "epoch": 4.930902924968207, "percentage": 98.91, "elapsed_time": "1 day, 20:44:35", "remaining_time": "0:29:32"}
|
728 |
+
{"current_steps": 728, "total_steps": 735, "loss": 0.6012, "lr": 2.213516905070101e-08, "epoch": 4.937685459940653, "percentage": 99.05, "elapsed_time": "1 day, 20:48:17", "remaining_time": "0:25:50"}
|
729 |
+
{"current_steps": 729, "total_steps": 735, "loss": 0.6146, "lr": 1.6262971159384243e-08, "epoch": 4.944467994913099, "percentage": 99.18, "elapsed_time": "1 day, 20:51:58", "remaining_time": "0:22:09"}
|
730 |
+
{"current_steps": 730, "total_steps": 735, "loss": 0.6116, "lr": 1.1293963831366939e-08, "epoch": 4.951250529885545, "percentage": 99.32, "elapsed_time": "1 day, 20:55:38", "remaining_time": "0:18:27"}
|
731 |
+
{"current_steps": 731, "total_steps": 735, "loss": 0.602, "lr": 7.228259311293784e-09, "epoch": 4.9580330648579904, "percentage": 99.46, "elapsed_time": "1 day, 20:59:19", "remaining_time": "0:14:46"}
|
732 |
+
{"current_steps": 732, "total_steps": 735, "loss": 0.6099, "lr": 4.065949439158168e-09, "epoch": 4.964815599830437, "percentage": 99.59, "elapsed_time": "1 day, 21:03:00", "remaining_time": "0:11:04"}
|
733 |
+
{"current_steps": 733, "total_steps": 735, "loss": 0.615, "lr": 1.8071056482105166e-09, "epoch": 4.971598134802883, "percentage": 99.73, "elapsed_time": "1 day, 21:06:41", "remaining_time": "0:07:23"}
|
734 |
+
{"current_steps": 734, "total_steps": 735, "loss": 0.6104, "lr": 4.517789633551317e-10, "epoch": 4.978380669775328, "percentage": 99.86, "elapsed_time": "1 day, 21:10:22", "remaining_time": "0:03:41"}
|
735 |
+
{"current_steps": 735, "total_steps": 735, "loss": 0.6111, "lr": 0.0, "epoch": 4.985163204747774, "percentage": 100.0, "elapsed_time": "1 day, 21:14:04", "remaining_time": "0:00:00"}
|
736 |
+
{"current_steps": 735, "total_steps": 735, "epoch": 4.985163204747774, "percentage": 100.0, "elapsed_time": "1 day, 21:15:37", "remaining_time": "0:00:00"}
|