Training in progress, epoch 4
Browse files- model-00001-of-00004.safetensors +1 -1
- model-00002-of-00004.safetensors +1 -1
- model-00003-of-00004.safetensors +1 -1
- model-00004-of-00004.safetensors +1 -1
- trainer_log.jsonl +266 -0
- training_args.bin +2 -2
model-00001-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4877660776
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d26e400ba0320dc4126695afead1442d3b232d7bdee1591d4e7197d34ed487dd
|
3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4932751008
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5a25b88afb609149aa0ca55b03a981162ae951be4d1f45808b49b60e8a776a05
|
3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4330865200
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0fd4e6e587e41df2dd7bdd3060e4099f873d17428b7e9436ec7526fbbad8e3ac
|
3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1089994880
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fb50831507fbb9e5f945095e4e69b411903977b431d69fcbaa95572b80c27bd9
|
3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
@@ -718,3 +718,269 @@
|
|
718 |
{"current_steps": 718, "total_steps": 895, "loss": 0.7133, "lr": 9.169522193895614e-06, "epoch": 3.991660875608061, "percentage": 80.22, "elapsed_time": "20:31:57", "remaining_time": "5:03:42"}
|
719 |
{"current_steps": 719, "total_steps": 895, "loss": 0.6978, "lr": 9.070299749108184e-06, "epoch": 3.9972202918693536, "percentage": 80.34, "elapsed_time": "20:33:39", "remaining_time": "5:01:58"}
|
720 |
{"current_steps": 720, "total_steps": 895, "loss": 0.6916, "lr": 8.971548371823205e-06, "epoch": 4.002779708130646, "percentage": 80.45, "elapsed_time": "20:37:10", "remaining_time": "5:00:42"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
718 |
{"current_steps": 718, "total_steps": 895, "loss": 0.7133, "lr": 9.169522193895614e-06, "epoch": 3.991660875608061, "percentage": 80.22, "elapsed_time": "20:31:57", "remaining_time": "5:03:42"}
|
719 |
{"current_steps": 719, "total_steps": 895, "loss": 0.6978, "lr": 9.070299749108184e-06, "epoch": 3.9972202918693536, "percentage": 80.34, "elapsed_time": "20:33:39", "remaining_time": "5:01:58"}
|
720 |
{"current_steps": 720, "total_steps": 895, "loss": 0.6916, "lr": 8.971548371823205e-06, "epoch": 4.002779708130646, "percentage": 80.45, "elapsed_time": "20:37:10", "remaining_time": "5:00:42"}
|
721 |
+
{"current_steps": 721, "total_steps": 895, "loss": 0.692, "lr": 8.873269566050262e-06, "epoch": 4.008339124391939, "percentage": 80.56, "elapsed_time": "20:38:51", "remaining_time": "4:58:58"}
|
722 |
+
{"current_steps": 722, "total_steps": 895, "loss": 0.6844, "lr": 8.775464828601477e-06, "epoch": 4.013898540653232, "percentage": 80.67, "elapsed_time": "20:40:34", "remaining_time": "4:57:15"}
|
723 |
+
{"current_steps": 723, "total_steps": 895, "loss": 0.6765, "lr": 8.678135649068862e-06, "epoch": 4.019457956914524, "percentage": 80.78, "elapsed_time": "20:42:15", "remaining_time": "4:55:31"}
|
724 |
+
{"current_steps": 724, "total_steps": 895, "loss": 0.6818, "lr": 8.581283509801501e-06, "epoch": 4.0250173731758165, "percentage": 80.89, "elapsed_time": "20:43:59", "remaining_time": "4:53:49"}
|
725 |
+
{"current_steps": 725, "total_steps": 895, "loss": 0.6799, "lr": 8.484909885883073e-06, "epoch": 4.030576789437109, "percentage": 81.01, "elapsed_time": "20:45:41", "remaining_time": "4:52:05"}
|
726 |
+
{"current_steps": 726, "total_steps": 895, "loss": 0.6803, "lr": 8.389016245109305e-06, "epoch": 4.036136205698401, "percentage": 81.12, "elapsed_time": "20:47:22", "remaining_time": "4:50:21"}
|
727 |
+
{"current_steps": 727, "total_steps": 895, "loss": 0.6735, "lr": 8.293604047965677e-06, "epoch": 4.041695621959694, "percentage": 81.23, "elapsed_time": "20:49:03", "remaining_time": "4:48:38"}
|
728 |
+
{"current_steps": 728, "total_steps": 895, "loss": 0.6725, "lr": 8.19867474760514e-06, "epoch": 4.047255038220987, "percentage": 81.34, "elapsed_time": "20:50:46", "remaining_time": "4:46:55"}
|
729 |
+
{"current_steps": 729, "total_steps": 895, "loss": 0.674, "lr": 8.104229789825994e-06, "epoch": 4.052814454482279, "percentage": 81.45, "elapsed_time": "20:52:27", "remaining_time": "4:45:11"}
|
730 |
+
{"current_steps": 730, "total_steps": 895, "loss": 0.6725, "lr": 8.010270613049918e-06, "epoch": 4.058373870743572, "percentage": 81.56, "elapsed_time": "20:54:10", "remaining_time": "4:43:28"}
|
731 |
+
{"current_steps": 731, "total_steps": 895, "loss": 0.6673, "lr": 7.916798648299964e-06, "epoch": 4.063933287004865, "percentage": 81.68, "elapsed_time": "20:55:53", "remaining_time": "4:41:45"}
|
732 |
+
{"current_steps": 732, "total_steps": 895, "loss": 0.6816, "lr": 7.823815319178844e-06, "epoch": 4.069492703266157, "percentage": 81.79, "elapsed_time": "20:57:34", "remaining_time": "4:40:02"}
|
733 |
+
{"current_steps": 733, "total_steps": 895, "loss": 0.6709, "lr": 7.731322041847207e-06, "epoch": 4.07505211952745, "percentage": 81.9, "elapsed_time": "20:59:17", "remaining_time": "4:38:19"}
|
734 |
+
{"current_steps": 734, "total_steps": 895, "loss": 0.6769, "lr": 7.639320225002106e-06, "epoch": 4.0806115357887425, "percentage": 82.01, "elapsed_time": "21:00:59", "remaining_time": "4:36:35"}
|
735 |
+
{"current_steps": 735, "total_steps": 895, "loss": 0.6625, "lr": 7.547811269855501e-06, "epoch": 4.086170952050034, "percentage": 82.12, "elapsed_time": "21:02:41", "remaining_time": "4:34:52"}
|
736 |
+
{"current_steps": 736, "total_steps": 895, "loss": 0.6942, "lr": 7.456796570112939e-06, "epoch": 4.091730368311327, "percentage": 82.23, "elapsed_time": "21:04:22", "remaining_time": "4:33:08"}
|
737 |
+
{"current_steps": 737, "total_steps": 895, "loss": 0.6816, "lr": 7.366277511952326e-06, "epoch": 4.09728978457262, "percentage": 82.35, "elapsed_time": "21:06:02", "remaining_time": "4:31:25"}
|
738 |
+
{"current_steps": 738, "total_steps": 895, "loss": 0.6962, "lr": 7.2762554740028445e-06, "epoch": 4.102849200833912, "percentage": 82.46, "elapsed_time": "21:07:44", "remaining_time": "4:29:41"}
|
739 |
+
{"current_steps": 739, "total_steps": 895, "loss": 0.6881, "lr": 7.186731827323883e-06, "epoch": 4.108408617095205, "percentage": 82.57, "elapsed_time": "21:09:25", "remaining_time": "4:27:58"}
|
740 |
+
{"current_steps": 740, "total_steps": 895, "loss": 0.6879, "lr": 7.097707935384232e-06, "epoch": 4.113968033356498, "percentage": 82.68, "elapsed_time": "21:11:09", "remaining_time": "4:26:15"}
|
741 |
+
{"current_steps": 741, "total_steps": 895, "loss": 0.667, "lr": 7.009185154041258e-06, "epoch": 4.11952744961779, "percentage": 82.79, "elapsed_time": "21:12:50", "remaining_time": "4:24:31"}
|
742 |
+
{"current_steps": 742, "total_steps": 895, "loss": 0.6883, "lr": 6.921164831520322e-06, "epoch": 4.125086865879083, "percentage": 82.91, "elapsed_time": "21:14:32", "remaining_time": "4:22:48"}
|
743 |
+
{"current_steps": 743, "total_steps": 895, "loss": 0.675, "lr": 6.833648308394156e-06, "epoch": 4.1306462821403755, "percentage": 83.02, "elapsed_time": "21:16:14", "remaining_time": "4:21:05"}
|
744 |
+
{"current_steps": 744, "total_steps": 895, "loss": 0.672, "lr": 6.7466369175625475e-06, "epoch": 4.1362056984016675, "percentage": 83.13, "elapsed_time": "21:17:56", "remaining_time": "4:19:22"}
|
745 |
+
{"current_steps": 745, "total_steps": 895, "loss": 0.6786, "lr": 6.660131984231917e-06, "epoch": 4.14176511466296, "percentage": 83.24, "elapsed_time": "21:19:38", "remaining_time": "4:17:38"}
|
746 |
+
{"current_steps": 746, "total_steps": 895, "loss": 0.6738, "lr": 6.574134825895276e-06, "epoch": 4.147324530924253, "percentage": 83.35, "elapsed_time": "21:21:19", "remaining_time": "4:15:55"}
|
747 |
+
{"current_steps": 747, "total_steps": 895, "loss": 0.6843, "lr": 6.488646752312031e-06, "epoch": 4.152883947185545, "percentage": 83.46, "elapsed_time": "21:23:03", "remaining_time": "4:14:12"}
|
748 |
+
{"current_steps": 748, "total_steps": 895, "loss": 0.6806, "lr": 6.403669065488141e-06, "epoch": 4.158443363446838, "percentage": 83.58, "elapsed_time": "21:24:46", "remaining_time": "4:12:29"}
|
749 |
+
{"current_steps": 749, "total_steps": 895, "loss": 0.7094, "lr": 6.3192030596562e-06, "epoch": 4.164002779708131, "percentage": 83.69, "elapsed_time": "21:26:30", "remaining_time": "4:10:46"}
|
750 |
+
{"current_steps": 750, "total_steps": 895, "loss": 0.6786, "lr": 6.235250021255788e-06, "epoch": 4.169562195969423, "percentage": 83.8, "elapsed_time": "21:28:12", "remaining_time": "4:09:03"}
|
751 |
+
{"current_steps": 751, "total_steps": 895, "loss": 0.6772, "lr": 6.15181122891384e-06, "epoch": 4.175121612230716, "percentage": 83.91, "elapsed_time": "21:29:56", "remaining_time": "4:07:20"}
|
752 |
+
{"current_steps": 752, "total_steps": 895, "loss": 0.6678, "lr": 6.068887953425213e-06, "epoch": 4.180681028492009, "percentage": 84.02, "elapsed_time": "21:31:38", "remaining_time": "4:05:37"}
|
753 |
+
{"current_steps": 753, "total_steps": 895, "loss": 0.6856, "lr": 5.986481457733284e-06, "epoch": 4.186240444753301, "percentage": 84.13, "elapsed_time": "21:33:20", "remaining_time": "4:03:53"}
|
754 |
+
{"current_steps": 754, "total_steps": 895, "loss": 0.6722, "lr": 5.904592996910739e-06, "epoch": 4.1917998610145935, "percentage": 84.25, "elapsed_time": "21:35:03", "remaining_time": "4:02:10"}
|
755 |
+
{"current_steps": 755, "total_steps": 895, "loss": 0.6969, "lr": 5.823223818140458e-06, "epoch": 4.197359277275886, "percentage": 84.36, "elapsed_time": "21:36:44", "remaining_time": "4:00:27"}
|
756 |
+
{"current_steps": 756, "total_steps": 895, "loss": 0.703, "lr": 5.7423751606965296e-06, "epoch": 4.202918693537178, "percentage": 84.47, "elapsed_time": "21:38:26", "remaining_time": "3:58:44"}
|
757 |
+
{"current_steps": 757, "total_steps": 895, "loss": 0.6916, "lr": 5.662048255925357e-06, "epoch": 4.208478109798471, "percentage": 84.58, "elapsed_time": "21:40:08", "remaining_time": "3:57:00"}
|
758 |
+
{"current_steps": 758, "total_steps": 895, "loss": 0.6684, "lr": 5.582244327226907e-06, "epoch": 4.214037526059764, "percentage": 84.69, "elapsed_time": "21:41:50", "remaining_time": "3:55:17"}
|
759 |
+
{"current_steps": 759, "total_steps": 895, "loss": 0.6814, "lr": 5.502964590036093e-06, "epoch": 4.219596942321056, "percentage": 84.8, "elapsed_time": "21:43:32", "remaining_time": "3:53:34"}
|
760 |
+
{"current_steps": 760, "total_steps": 895, "loss": 0.6726, "lr": 5.424210251804227e-06, "epoch": 4.225156358582349, "percentage": 84.92, "elapsed_time": "21:45:16", "remaining_time": "3:51:51"}
|
761 |
+
{"current_steps": 761, "total_steps": 895, "loss": 0.6839, "lr": 5.345982511980707e-06, "epoch": 4.230715774843642, "percentage": 85.03, "elapsed_time": "21:46:57", "remaining_time": "3:50:08"}
|
762 |
+
{"current_steps": 762, "total_steps": 895, "loss": 0.6558, "lr": 5.268282561994658e-06, "epoch": 4.236275191104934, "percentage": 85.14, "elapsed_time": "21:48:40", "remaining_time": "3:48:25"}
|
763 |
+
{"current_steps": 763, "total_steps": 895, "loss": 0.689, "lr": 5.191111585236828e-06, "epoch": 4.2418346073662265, "percentage": 85.25, "elapsed_time": "21:50:23", "remaining_time": "3:46:41"}
|
764 |
+
{"current_steps": 764, "total_steps": 895, "loss": 0.6886, "lr": 5.114470757041572e-06, "epoch": 4.247394023627519, "percentage": 85.36, "elapsed_time": "21:52:06", "remaining_time": "3:44:58"}
|
765 |
+
{"current_steps": 765, "total_steps": 895, "loss": 0.6917, "lr": 5.038361244668952e-06, "epoch": 4.252953439888811, "percentage": 85.47, "elapsed_time": "21:53:47", "remaining_time": "3:43:15"}
|
766 |
+
{"current_steps": 766, "total_steps": 895, "loss": 0.6874, "lr": 4.96278420728693e-06, "epoch": 4.258512856150104, "percentage": 85.59, "elapsed_time": "21:55:30", "remaining_time": "3:41:32"}
|
767 |
+
{"current_steps": 767, "total_steps": 895, "loss": 0.69, "lr": 4.887740795953764e-06, "epoch": 4.264072272411397, "percentage": 85.7, "elapsed_time": "21:57:12", "remaining_time": "3:39:49"}
|
768 |
+
{"current_steps": 768, "total_steps": 895, "loss": 0.6864, "lr": 4.813232153600393e-06, "epoch": 4.269631688672689, "percentage": 85.81, "elapsed_time": "21:58:54", "remaining_time": "3:38:06"}
|
769 |
+
{"current_steps": 769, "total_steps": 895, "loss": 0.6791, "lr": 4.739259415013138e-06, "epoch": 4.275191104933982, "percentage": 85.92, "elapsed_time": "22:00:37", "remaining_time": "3:36:23"}
|
770 |
+
{"current_steps": 770, "total_steps": 895, "loss": 0.6856, "lr": 4.6658237068163285e-06, "epoch": 4.280750521195275, "percentage": 86.03, "elapsed_time": "22:02:20", "remaining_time": "3:34:39"}
|
771 |
+
{"current_steps": 720, "total_steps": 895, "loss": 0.6835, "lr": 8.971548371823205e-06, "epoch": 4.0222376650451706, "percentage": 80.45, "elapsed_time": "0:01:56", "remaining_time": "0:00:28"}
|
772 |
+
{"current_steps": 721, "total_steps": 895, "loss": 0.6883, "lr": 8.873269566050262e-06, "epoch": 4.0277970813064625, "percentage": 80.56, "elapsed_time": "0:03:41", "remaining_time": "0:00:53"}
|
773 |
+
{"current_steps": 722, "total_steps": 895, "loss": 0.674, "lr": 8.775464828601477e-06, "epoch": 4.033356497567755, "percentage": 80.67, "elapsed_time": "0:05:27", "remaining_time": "0:01:18"}
|
774 |
+
{"current_steps": 723, "total_steps": 895, "loss": 0.677, "lr": 8.678135649068862e-06, "epoch": 4.038915913829048, "percentage": 80.78, "elapsed_time": "0:07:14", "remaining_time": "0:01:43"}
|
775 |
+
{"current_steps": 724, "total_steps": 895, "loss": 0.6761, "lr": 8.581283509801501e-06, "epoch": 4.04447533009034, "percentage": 80.89, "elapsed_time": "0:09:01", "remaining_time": "0:02:07"}
|
776 |
+
{"current_steps": 725, "total_steps": 895, "loss": 0.6744, "lr": 8.484909885883073e-06, "epoch": 4.050034746351633, "percentage": 81.01, "elapsed_time": "0:10:50", "remaining_time": "0:02:32"}
|
777 |
+
{"current_steps": 726, "total_steps": 895, "loss": 0.6704, "lr": 8.389016245109305e-06, "epoch": 4.055594162612926, "percentage": 81.12, "elapsed_time": "0:12:37", "remaining_time": "0:02:56"}
|
778 |
+
{"current_steps": 727, "total_steps": 895, "loss": 0.6671, "lr": 8.293604047965677e-06, "epoch": 4.061153578874218, "percentage": 81.23, "elapsed_time": "0:14:24", "remaining_time": "0:03:19"}
|
779 |
+
{"current_steps": 728, "total_steps": 895, "loss": 0.679, "lr": 8.19867474760514e-06, "epoch": 4.066712995135511, "percentage": 81.34, "elapsed_time": "0:16:11", "remaining_time": "0:03:42"}
|
780 |
+
{"current_steps": 729, "total_steps": 895, "loss": 0.6812, "lr": 8.104229789825994e-06, "epoch": 4.072272411396804, "percentage": 81.45, "elapsed_time": "0:17:59", "remaining_time": "0:04:05"}
|
781 |
+
{"current_steps": 730, "total_steps": 895, "loss": 0.6646, "lr": 8.010270613049918e-06, "epoch": 4.077831827658096, "percentage": 81.56, "elapsed_time": "0:19:46", "remaining_time": "0:04:28"}
|
782 |
+
{"current_steps": 731, "total_steps": 895, "loss": 0.6721, "lr": 7.916798648299964e-06, "epoch": 4.0833912439193885, "percentage": 81.68, "elapsed_time": "0:21:33", "remaining_time": "0:04:50"}
|
783 |
+
{"current_steps": 732, "total_steps": 895, "loss": 0.6757, "lr": 7.823815319178844e-06, "epoch": 4.088950660180681, "percentage": 81.79, "elapsed_time": "0:23:20", "remaining_time": "0:05:11"}
|
784 |
+
{"current_steps": 733, "total_steps": 895, "loss": 0.6966, "lr": 7.731322041847207e-06, "epoch": 4.094510076441973, "percentage": 81.9, "elapsed_time": "0:25:06", "remaining_time": "0:05:32"}
|
785 |
+
{"current_steps": 734, "total_steps": 895, "loss": 0.6849, "lr": 7.639320225002106e-06, "epoch": 4.100069492703266, "percentage": 82.01, "elapsed_time": "0:26:53", "remaining_time": "0:05:53"}
|
786 |
+
{"current_steps": 735, "total_steps": 895, "loss": 0.6922, "lr": 7.547811269855501e-06, "epoch": 4.105628908964559, "percentage": 82.12, "elapsed_time": "0:28:40", "remaining_time": "0:06:14"}
|
787 |
+
{"current_steps": 736, "total_steps": 895, "loss": 0.6896, "lr": 7.456796570112939e-06, "epoch": 4.111188325225851, "percentage": 82.23, "elapsed_time": "0:30:27", "remaining_time": "0:06:34"}
|
788 |
+
{"current_steps": 737, "total_steps": 895, "loss": 0.6782, "lr": 7.366277511952326e-06, "epoch": 4.116747741487144, "percentage": 82.35, "elapsed_time": "0:32:15", "remaining_time": "0:06:54"}
|
789 |
+
{"current_steps": 738, "total_steps": 895, "loss": 0.6782, "lr": 7.2762554740028445e-06, "epoch": 4.122307157748437, "percentage": 82.46, "elapsed_time": "0:34:01", "remaining_time": "0:07:14"}
|
790 |
+
{"current_steps": 739, "total_steps": 895, "loss": 0.6783, "lr": 7.186731827323883e-06, "epoch": 4.127866574009729, "percentage": 82.57, "elapsed_time": "0:35:49", "remaining_time": "0:07:33"}
|
791 |
+
{"current_steps": 740, "total_steps": 895, "loss": 0.6726, "lr": 7.097707935384232e-06, "epoch": 4.1334259902710215, "percentage": 82.68, "elapsed_time": "0:37:36", "remaining_time": "0:07:52"}
|
792 |
+
{"current_steps": 741, "total_steps": 895, "loss": 0.675, "lr": 7.009185154041258e-06, "epoch": 4.138985406532314, "percentage": 82.79, "elapsed_time": "0:39:24", "remaining_time": "0:08:11"}
|
793 |
+
{"current_steps": 742, "total_steps": 895, "loss": 0.6777, "lr": 6.921164831520322e-06, "epoch": 4.144544822793606, "percentage": 82.91, "elapsed_time": "0:41:13", "remaining_time": "0:08:30"}
|
794 |
+
{"current_steps": 743, "total_steps": 895, "loss": 0.6837, "lr": 6.833648308394156e-06, "epoch": 4.150104239054899, "percentage": 83.02, "elapsed_time": "0:43:01", "remaining_time": "0:08:48"}
|
795 |
+
{"current_steps": 744, "total_steps": 895, "loss": 0.6806, "lr": 6.7466369175625475e-06, "epoch": 4.155663655316192, "percentage": 83.13, "elapsed_time": "0:44:47", "remaining_time": "0:09:05"}
|
796 |
+
{"current_steps": 745, "total_steps": 895, "loss": 0.6851, "lr": 6.660131984231917e-06, "epoch": 4.161223071577484, "percentage": 83.24, "elapsed_time": "0:46:34", "remaining_time": "0:09:22"}
|
797 |
+
{"current_steps": 746, "total_steps": 895, "loss": 0.6935, "lr": 6.574134825895276e-06, "epoch": 4.166782487838777, "percentage": 83.35, "elapsed_time": "0:48:20", "remaining_time": "0:09:39"}
|
798 |
+
{"current_steps": 747, "total_steps": 895, "loss": 0.6874, "lr": 6.488646752312031e-06, "epoch": 4.17234190410007, "percentage": 83.46, "elapsed_time": "0:50:09", "remaining_time": "0:09:56"}
|
799 |
+
{"current_steps": 748, "total_steps": 895, "loss": 0.6721, "lr": 6.403669065488141e-06, "epoch": 4.177901320361362, "percentage": 83.58, "elapsed_time": "0:51:56", "remaining_time": "0:10:12"}
|
800 |
+
{"current_steps": 749, "total_steps": 895, "loss": 0.6701, "lr": 6.3192030596562e-06, "epoch": 4.183460736622655, "percentage": 83.69, "elapsed_time": "0:53:42", "remaining_time": "0:10:28"}
|
801 |
+
{"current_steps": 750, "total_steps": 895, "loss": 0.6803, "lr": 6.235250021255788e-06, "epoch": 4.1890201528839475, "percentage": 83.8, "elapsed_time": "0:55:29", "remaining_time": "0:10:43"}
|
802 |
+
{"current_steps": 751, "total_steps": 895, "loss": 0.6833, "lr": 6.15181122891384e-06, "epoch": 4.194579569145239, "percentage": 83.91, "elapsed_time": "0:57:15", "remaining_time": "0:10:58"}
|
803 |
+
{"current_steps": 752, "total_steps": 895, "loss": 0.702, "lr": 6.068887953425213e-06, "epoch": 4.200138985406532, "percentage": 84.02, "elapsed_time": "0:59:03", "remaining_time": "0:11:13"}
|
804 |
+
{"current_steps": 753, "total_steps": 895, "loss": 0.6985, "lr": 5.986481457733284e-06, "epoch": 4.205698401667825, "percentage": 84.13, "elapsed_time": "1:00:49", "remaining_time": "0:11:28"}
|
805 |
+
{"current_steps": 754, "total_steps": 895, "loss": 0.6766, "lr": 5.904592996910739e-06, "epoch": 4.211257817929117, "percentage": 84.25, "elapsed_time": "1:02:35", "remaining_time": "0:11:42"}
|
806 |
+
{"current_steps": 755, "total_steps": 895, "loss": 0.6803, "lr": 5.823223818140458e-06, "epoch": 4.21681723419041, "percentage": 84.36, "elapsed_time": "1:04:21", "remaining_time": "0:11:56"}
|
807 |
+
{"current_steps": 720, "total_steps": 895, "loss": 0.6835, "lr": 8.971548371823205e-06, "epoch": 4.0222376650451706, "percentage": 80.45, "elapsed_time": "0:02:03", "remaining_time": "0:00:29"}
|
808 |
+
{"current_steps": 721, "total_steps": 895, "loss": 0.6883, "lr": 8.873269566050262e-06, "epoch": 4.0277970813064625, "percentage": 80.56, "elapsed_time": "0:03:49", "remaining_time": "0:00:55"}
|
809 |
+
{"current_steps": 722, "total_steps": 895, "loss": 0.674, "lr": 8.775464828601477e-06, "epoch": 4.033356497567755, "percentage": 80.67, "elapsed_time": "0:05:39", "remaining_time": "0:01:21"}
|
810 |
+
{"current_steps": 720, "total_steps": 895, "loss": 0.6835, "lr": 8.971548371823205e-06, "epoch": 4.0222376650451706, "percentage": 80.45, "elapsed_time": "0:01:55", "remaining_time": "0:00:28"}
|
811 |
+
{"current_steps": 721, "total_steps": 895, "loss": 0.6883, "lr": 8.873269566050262e-06, "epoch": 4.0277970813064625, "percentage": 80.56, "elapsed_time": "0:03:34", "remaining_time": "0:00:51"}
|
812 |
+
{"current_steps": 722, "total_steps": 895, "loss": 0.674, "lr": 8.775464828601477e-06, "epoch": 4.033356497567755, "percentage": 80.67, "elapsed_time": "0:05:14", "remaining_time": "0:01:15"}
|
813 |
+
{"current_steps": 723, "total_steps": 895, "loss": 0.677, "lr": 8.678135649068862e-06, "epoch": 4.038915913829048, "percentage": 80.78, "elapsed_time": "0:06:54", "remaining_time": "0:01:38"}
|
814 |
+
{"current_steps": 724, "total_steps": 895, "loss": 0.6761, "lr": 8.581283509801501e-06, "epoch": 4.04447533009034, "percentage": 80.89, "elapsed_time": "0:08:35", "remaining_time": "0:02:01"}
|
815 |
+
{"current_steps": 725, "total_steps": 895, "loss": 0.6744, "lr": 8.484909885883073e-06, "epoch": 4.050034746351633, "percentage": 81.01, "elapsed_time": "0:10:16", "remaining_time": "0:02:24"}
|
816 |
+
{"current_steps": 726, "total_steps": 895, "loss": 0.6703, "lr": 8.389016245109305e-06, "epoch": 4.055594162612926, "percentage": 81.12, "elapsed_time": "0:11:55", "remaining_time": "0:02:46"}
|
817 |
+
{"current_steps": 727, "total_steps": 895, "loss": 0.6671, "lr": 8.293604047965677e-06, "epoch": 4.061153578874218, "percentage": 81.23, "elapsed_time": "0:13:35", "remaining_time": "0:03:08"}
|
818 |
+
{"current_steps": 728, "total_steps": 895, "loss": 0.679, "lr": 8.19867474760514e-06, "epoch": 4.066712995135511, "percentage": 81.34, "elapsed_time": "0:15:15", "remaining_time": "0:03:30"}
|
819 |
+
{"current_steps": 729, "total_steps": 895, "loss": 0.6812, "lr": 8.104229789825994e-06, "epoch": 4.072272411396804, "percentage": 81.45, "elapsed_time": "0:16:54", "remaining_time": "0:03:51"}
|
820 |
+
{"current_steps": 730, "total_steps": 895, "loss": 0.6646, "lr": 8.010270613049918e-06, "epoch": 4.077831827658096, "percentage": 81.56, "elapsed_time": "0:18:34", "remaining_time": "0:04:11"}
|
821 |
+
{"current_steps": 731, "total_steps": 895, "loss": 0.672, "lr": 7.916798648299964e-06, "epoch": 4.0833912439193885, "percentage": 81.68, "elapsed_time": "0:20:14", "remaining_time": "0:04:32"}
|
822 |
+
{"current_steps": 732, "total_steps": 895, "loss": 0.6757, "lr": 7.823815319178844e-06, "epoch": 4.088950660180681, "percentage": 81.79, "elapsed_time": "0:21:55", "remaining_time": "0:04:52"}
|
823 |
+
{"current_steps": 733, "total_steps": 895, "loss": 0.6966, "lr": 7.731322041847207e-06, "epoch": 4.094510076441973, "percentage": 81.9, "elapsed_time": "0:23:34", "remaining_time": "0:05:12"}
|
824 |
+
{"current_steps": 734, "total_steps": 895, "loss": 0.6849, "lr": 7.639320225002106e-06, "epoch": 4.100069492703266, "percentage": 82.01, "elapsed_time": "0:25:13", "remaining_time": "0:05:32"}
|
825 |
+
{"current_steps": 735, "total_steps": 895, "loss": 0.6922, "lr": 7.547811269855501e-06, "epoch": 4.105628908964559, "percentage": 82.12, "elapsed_time": "0:26:53", "remaining_time": "0:05:51"}
|
826 |
+
{"current_steps": 736, "total_steps": 895, "loss": 0.6896, "lr": 7.456796570112939e-06, "epoch": 4.111188325225851, "percentage": 82.23, "elapsed_time": "0:28:32", "remaining_time": "0:06:10"}
|
827 |
+
{"current_steps": 737, "total_steps": 895, "loss": 0.6781, "lr": 7.366277511952326e-06, "epoch": 4.116747741487144, "percentage": 82.35, "elapsed_time": "0:30:12", "remaining_time": "0:06:28"}
|
828 |
+
{"current_steps": 738, "total_steps": 895, "loss": 0.6781, "lr": 7.2762554740028445e-06, "epoch": 4.122307157748437, "percentage": 82.46, "elapsed_time": "0:31:51", "remaining_time": "0:06:46"}
|
829 |
+
{"current_steps": 739, "total_steps": 895, "loss": 0.6783, "lr": 7.186731827323883e-06, "epoch": 4.127866574009729, "percentage": 82.57, "elapsed_time": "0:33:30", "remaining_time": "0:07:04"}
|
830 |
+
{"current_steps": 740, "total_steps": 895, "loss": 0.6726, "lr": 7.097707935384232e-06, "epoch": 4.1334259902710215, "percentage": 82.68, "elapsed_time": "0:35:09", "remaining_time": "0:07:21"}
|
831 |
+
{"current_steps": 741, "total_steps": 895, "loss": 0.6751, "lr": 7.009185154041258e-06, "epoch": 4.138985406532314, "percentage": 82.79, "elapsed_time": "0:36:49", "remaining_time": "0:07:39"}
|
832 |
+
{"current_steps": 742, "total_steps": 895, "loss": 0.6777, "lr": 6.921164831520322e-06, "epoch": 4.144544822793606, "percentage": 82.91, "elapsed_time": "0:38:30", "remaining_time": "0:07:56"}
|
833 |
+
{"current_steps": 743, "total_steps": 895, "loss": 0.6838, "lr": 6.833648308394156e-06, "epoch": 4.150104239054899, "percentage": 83.02, "elapsed_time": "0:40:10", "remaining_time": "0:08:13"}
|
834 |
+
{"current_steps": 744, "total_steps": 895, "loss": 0.6807, "lr": 6.7466369175625475e-06, "epoch": 4.155663655316192, "percentage": 83.13, "elapsed_time": "0:41:49", "remaining_time": "0:08:29"}
|
835 |
+
{"current_steps": 745, "total_steps": 895, "loss": 0.6852, "lr": 6.660131984231917e-06, "epoch": 4.161223071577484, "percentage": 83.24, "elapsed_time": "0:43:29", "remaining_time": "0:08:45"}
|
836 |
+
{"current_steps": 746, "total_steps": 895, "loss": 0.6936, "lr": 6.574134825895276e-06, "epoch": 4.166782487838777, "percentage": 83.35, "elapsed_time": "0:45:08", "remaining_time": "0:09:01"}
|
837 |
+
{"current_steps": 747, "total_steps": 895, "loss": 0.6875, "lr": 6.488646752312031e-06, "epoch": 4.17234190410007, "percentage": 83.46, "elapsed_time": "0:46:49", "remaining_time": "0:09:16"}
|
838 |
+
{"current_steps": 748, "total_steps": 895, "loss": 0.6722, "lr": 6.403669065488141e-06, "epoch": 4.177901320361362, "percentage": 83.58, "elapsed_time": "0:48:28", "remaining_time": "0:09:31"}
|
839 |
+
{"current_steps": 749, "total_steps": 895, "loss": 0.6703, "lr": 6.3192030596562e-06, "epoch": 4.183460736622655, "percentage": 83.69, "elapsed_time": "0:50:07", "remaining_time": "0:09:46"}
|
840 |
+
{"current_steps": 750, "total_steps": 895, "loss": 0.6804, "lr": 6.235250021255788e-06, "epoch": 4.1890201528839475, "percentage": 83.8, "elapsed_time": "0:51:47", "remaining_time": "0:10:00"}
|
841 |
+
{"current_steps": 751, "total_steps": 895, "loss": 0.6835, "lr": 6.15181122891384e-06, "epoch": 4.194579569145239, "percentage": 83.91, "elapsed_time": "0:53:26", "remaining_time": "0:10:14"}
|
842 |
+
{"current_steps": 752, "total_steps": 895, "loss": 0.7022, "lr": 6.068887953425213e-06, "epoch": 4.200138985406532, "percentage": 84.02, "elapsed_time": "0:55:06", "remaining_time": "0:10:28"}
|
843 |
+
{"current_steps": 753, "total_steps": 895, "loss": 0.6986, "lr": 5.986481457733284e-06, "epoch": 4.205698401667825, "percentage": 84.13, "elapsed_time": "0:56:46", "remaining_time": "0:10:42"}
|
844 |
+
{"current_steps": 754, "total_steps": 895, "loss": 0.6767, "lr": 5.904592996910739e-06, "epoch": 4.211257817929117, "percentage": 84.25, "elapsed_time": "0:58:25", "remaining_time": "0:10:55"}
|
845 |
+
{"current_steps": 755, "total_steps": 895, "loss": 0.6804, "lr": 5.823223818140458e-06, "epoch": 4.21681723419041, "percentage": 84.36, "elapsed_time": "1:00:05", "remaining_time": "0:11:08"}
|
846 |
+
{"current_steps": 756, "total_steps": 895, "loss": 0.6763, "lr": 5.7423751606965296e-06, "epoch": 4.222376650451703, "percentage": 84.47, "elapsed_time": "1:01:45", "remaining_time": "0:11:21"}
|
847 |
+
{"current_steps": 757, "total_steps": 895, "loss": 0.6726, "lr": 5.662048255925357e-06, "epoch": 4.227936066712995, "percentage": 84.58, "elapsed_time": "1:03:25", "remaining_time": "0:11:33"}
|
848 |
+
{"current_steps": 758, "total_steps": 895, "loss": 0.6785, "lr": 5.582244327226907e-06, "epoch": 4.233495482974288, "percentage": 84.69, "elapsed_time": "1:05:05", "remaining_time": "0:11:45"}
|
849 |
+
{"current_steps": 759, "total_steps": 895, "loss": 0.6682, "lr": 5.502964590036093e-06, "epoch": 4.2390548992355805, "percentage": 84.8, "elapsed_time": "1:06:44", "remaining_time": "0:11:57"}
|
850 |
+
{"current_steps": 760, "total_steps": 895, "loss": 0.6891, "lr": 5.424210251804227e-06, "epoch": 4.2446143154968725, "percentage": 84.92, "elapsed_time": "1:08:24", "remaining_time": "0:12:09"}
|
851 |
+
{"current_steps": 761, "total_steps": 895, "loss": 0.6927, "lr": 5.345982511980707e-06, "epoch": 4.250173731758165, "percentage": 85.03, "elapsed_time": "1:10:04", "remaining_time": "0:12:20"}
|
852 |
+
{"current_steps": 762, "total_steps": 895, "loss": 0.6831, "lr": 5.268282561994658e-06, "epoch": 4.255733148019458, "percentage": 85.14, "elapsed_time": "1:11:43", "remaining_time": "0:12:31"}
|
853 |
+
{"current_steps": 763, "total_steps": 895, "loss": 0.6925, "lr": 5.191111585236828e-06, "epoch": 4.26129256428075, "percentage": 85.25, "elapsed_time": "1:13:23", "remaining_time": "0:12:41"}
|
854 |
+
{"current_steps": 764, "total_steps": 895, "loss": 0.6845, "lr": 5.114470757041572e-06, "epoch": 4.266851980542043, "percentage": 85.36, "elapsed_time": "1:15:02", "remaining_time": "0:12:52"}
|
855 |
+
{"current_steps": 765, "total_steps": 895, "loss": 0.6915, "lr": 5.038361244668952e-06, "epoch": 4.272411396803336, "percentage": 85.47, "elapsed_time": "1:16:41", "remaining_time": "0:13:02"}
|
856 |
+
{"current_steps": 766, "total_steps": 895, "loss": 0.6757, "lr": 4.96278420728693e-06, "epoch": 4.277970813064628, "percentage": 85.59, "elapsed_time": "1:18:21", "remaining_time": "0:13:11"}
|
857 |
+
{"current_steps": 767, "total_steps": 895, "loss": 0.6922, "lr": 4.887740795953764e-06, "epoch": 4.283530229325921, "percentage": 85.7, "elapsed_time": "1:20:00", "remaining_time": "0:13:21"}
|
858 |
+
{"current_steps": 768, "total_steps": 895, "loss": 0.6847, "lr": 4.813232153600393e-06, "epoch": 4.289089645587214, "percentage": 85.81, "elapsed_time": "1:21:40", "remaining_time": "0:13:30"}
|
859 |
+
{"current_steps": 769, "total_steps": 895, "loss": 0.6761, "lr": 4.739259415013138e-06, "epoch": 4.294649061848506, "percentage": 85.92, "elapsed_time": "1:23:20", "remaining_time": "0:13:39"}
|
860 |
+
{"current_steps": 770, "total_steps": 895, "loss": 0.6729, "lr": 4.6658237068163285e-06, "epoch": 4.3002084781097984, "percentage": 86.03, "elapsed_time": "1:24:59", "remaining_time": "0:13:47"}
|
861 |
+
{"current_steps": 771, "total_steps": 895, "loss": 0.6765, "lr": 4.5929261474552164e-06, "epoch": 4.305767894371091, "percentage": 86.15, "elapsed_time": "1:26:40", "remaining_time": "0:13:56"}
|
862 |
+
{"current_steps": 772, "total_steps": 895, "loss": 0.6922, "lr": 4.520567847178847e-06, "epoch": 4.311327310632383, "percentage": 86.26, "elapsed_time": "1:28:20", "remaining_time": "0:14:04"}
|
863 |
+
{"current_steps": 773, "total_steps": 895, "loss": 0.6757, "lr": 4.4487499080232685e-06, "epoch": 4.316886726893676, "percentage": 86.37, "elapsed_time": "1:29:59", "remaining_time": "0:14:12"}
|
864 |
+
{"current_steps": 774, "total_steps": 895, "loss": 0.6827, "lr": 4.377473423794643e-06, "epoch": 4.322446143154969, "percentage": 86.48, "elapsed_time": "1:31:38", "remaining_time": "0:14:19"}
|
865 |
+
{"current_steps": 775, "total_steps": 895, "loss": 0.6798, "lr": 4.30673948005266e-06, "epoch": 4.328005559416261, "percentage": 86.59, "elapsed_time": "1:33:18", "remaining_time": "0:14:26"}
|
866 |
+
{"current_steps": 776, "total_steps": 895, "loss": 0.6639, "lr": 4.236549154093954e-06, "epoch": 4.333564975677554, "percentage": 86.7, "elapsed_time": "1:34:58", "remaining_time": "0:14:33"}
|
867 |
+
{"current_steps": 777, "total_steps": 895, "loss": 0.6843, "lr": 4.1669035149357255e-06, "epoch": 4.339124391938847, "percentage": 86.82, "elapsed_time": "1:36:37", "remaining_time": "0:14:40"}
|
868 |
+
{"current_steps": 778, "total_steps": 895, "loss": 0.68, "lr": 4.097803623299443e-06, "epoch": 4.344683808200139, "percentage": 86.93, "elapsed_time": "1:38:16", "remaining_time": "0:14:46"}
|
869 |
+
{"current_steps": 779, "total_steps": 895, "loss": 0.6808, "lr": 4.029250531594722e-06, "epoch": 4.3502432244614315, "percentage": 87.04, "elapsed_time": "1:39:56", "remaining_time": "0:14:52"}
|
870 |
+
{"current_steps": 780, "total_steps": 895, "loss": 0.6937, "lr": 3.961245283903239e-06, "epoch": 4.355802640722724, "percentage": 87.15, "elapsed_time": "1:41:35", "remaining_time": "0:14:58"}
|
871 |
+
{"current_steps": 781, "total_steps": 895, "loss": 0.6851, "lr": 3.893788915962873e-06, "epoch": 4.361362056984016, "percentage": 87.26, "elapsed_time": "1:43:15", "remaining_time": "0:15:04"}
|
872 |
+
{"current_steps": 782, "total_steps": 895, "loss": 0.6791, "lr": 3.8268824551519214e-06, "epoch": 4.366921473245309, "percentage": 87.37, "elapsed_time": "1:44:54", "remaining_time": "0:15:09"}
|
873 |
+
{"current_steps": 783, "total_steps": 895, "loss": 0.6833, "lr": 3.760526920473462e-06, "epoch": 4.372480889506602, "percentage": 87.49, "elapsed_time": "1:46:33", "remaining_time": "0:15:14"}
|
874 |
+
{"current_steps": 784, "total_steps": 895, "loss": 0.6778, "lr": 3.6947233225397993e-06, "epoch": 4.378040305767894, "percentage": 87.6, "elapsed_time": "1:48:13", "remaining_time": "0:15:19"}
|
875 |
+
{"current_steps": 785, "total_steps": 895, "loss": 0.678, "lr": 3.62947266355711e-06, "epoch": 4.383599722029187, "percentage": 87.71, "elapsed_time": "1:49:52", "remaining_time": "0:15:23"}
|
876 |
+
{"current_steps": 786, "total_steps": 895, "loss": 0.6756, "lr": 3.5647759373101585e-06, "epoch": 4.38915913829048, "percentage": 87.82, "elapsed_time": "1:51:32", "remaining_time": "0:15:28"}
|
877 |
+
{"current_steps": 787, "total_steps": 895, "loss": 0.6741, "lr": 3.500634129147167e-06, "epoch": 4.394718554551772, "percentage": 87.93, "elapsed_time": "1:53:11", "remaining_time": "0:15:32"}
|
878 |
+
{"current_steps": 788, "total_steps": 895, "loss": 0.6983, "lr": 3.437048215964827e-06, "epoch": 4.400277970813065, "percentage": 88.04, "elapsed_time": "1:54:51", "remaining_time": "0:15:35"}
|
879 |
+
{"current_steps": 789, "total_steps": 895, "loss": 0.6847, "lr": 3.3740191661933764e-06, "epoch": 4.4058373870743575, "percentage": 88.16, "elapsed_time": "1:56:31", "remaining_time": "0:15:39"}
|
880 |
+
{"current_steps": 790, "total_steps": 895, "loss": 0.6731, "lr": 3.311547939781887e-06, "epoch": 4.411396803335649, "percentage": 88.27, "elapsed_time": "1:58:10", "remaining_time": "0:15:42"}
|
881 |
+
{"current_steps": 791, "total_steps": 895, "loss": 0.69, "lr": 3.2496354881836268e-06, "epoch": 4.416956219596942, "percentage": 88.38, "elapsed_time": "1:59:50", "remaining_time": "0:15:45"}
|
882 |
+
{"current_steps": 792, "total_steps": 895, "loss": 0.6722, "lr": 3.188282754341603e-06, "epoch": 4.422515635858235, "percentage": 88.49, "elapsed_time": "2:01:29", "remaining_time": "0:15:47"}
|
883 |
+
{"current_steps": 793, "total_steps": 895, "loss": 0.6868, "lr": 3.1274906726741317e-06, "epoch": 4.428075052119527, "percentage": 88.6, "elapsed_time": "2:03:09", "remaining_time": "0:15:50"}
|
884 |
+
{"current_steps": 794, "total_steps": 895, "loss": 0.6919, "lr": 3.067260169060697e-06, "epoch": 4.43363446838082, "percentage": 88.72, "elapsed_time": "2:04:48", "remaining_time": "0:15:52"}
|
885 |
+
{"current_steps": 795, "total_steps": 895, "loss": 0.6728, "lr": 3.0075921608277415e-06, "epoch": 4.439193884642113, "percentage": 88.83, "elapsed_time": "2:06:27", "remaining_time": "0:15:54"}
|
886 |
+
{"current_steps": 796, "total_steps": 895, "loss": 0.6733, "lr": 2.9484875567348117e-06, "epoch": 4.444753300903405, "percentage": 88.94, "elapsed_time": "2:08:07", "remaining_time": "0:15:56"}
|
887 |
+
{"current_steps": 797, "total_steps": 895, "loss": 0.6817, "lr": 2.8899472569606166e-06, "epoch": 4.450312717164698, "percentage": 89.05, "elapsed_time": "2:09:46", "remaining_time": "0:15:57"}
|
888 |
+
{"current_steps": 798, "total_steps": 895, "loss": 0.6833, "lr": 2.8319721530894084e-06, "epoch": 4.4558721334259905, "percentage": 89.16, "elapsed_time": "2:11:25", "remaining_time": "0:15:58"}
|
889 |
+
{"current_steps": 799, "total_steps": 895, "loss": 0.6857, "lr": 2.7745631280973005e-06, "epoch": 4.4614315496872825, "percentage": 89.27, "elapsed_time": "2:13:05", "remaining_time": "0:15:59"}
|
890 |
+
{"current_steps": 800, "total_steps": 895, "loss": 0.6643, "lr": 2.7177210563389178e-06, "epoch": 4.466990965948575, "percentage": 89.39, "elapsed_time": "2:14:45", "remaining_time": "0:16:00"}
|
891 |
+
{"current_steps": 801, "total_steps": 895, "loss": 0.6838, "lr": 2.6614468035340137e-06, "epoch": 4.472550382209868, "percentage": 89.5, "elapsed_time": "2:16:24", "remaining_time": "0:16:00"}
|
892 |
+
{"current_steps": 802, "total_steps": 895, "loss": 0.6642, "lr": 2.6057412267543347e-06, "epoch": 4.47810979847116, "percentage": 89.61, "elapsed_time": "2:18:04", "remaining_time": "0:16:00"}
|
893 |
+
{"current_steps": 803, "total_steps": 895, "loss": 0.6896, "lr": 2.550605174410512e-06, "epoch": 4.483669214732453, "percentage": 89.72, "elapsed_time": "2:19:43", "remaining_time": "0:16:00"}
|
894 |
+
{"current_steps": 804, "total_steps": 895, "loss": 0.6706, "lr": 2.49603948623919e-06, "epoch": 4.489228630993746, "percentage": 89.83, "elapsed_time": "2:21:22", "remaining_time": "0:16:00"}
|
895 |
+
{"current_steps": 805, "total_steps": 895, "loss": 0.6693, "lr": 2.442044993290198e-06, "epoch": 4.494788047255038, "percentage": 89.94, "elapsed_time": "2:23:01", "remaining_time": "0:15:59"}
|
896 |
+
{"current_steps": 806, "total_steps": 895, "loss": 0.6951, "lr": 2.388622517913937e-06, "epoch": 4.500347463516331, "percentage": 90.06, "elapsed_time": "2:24:41", "remaining_time": "0:15:58"}
|
897 |
+
{"current_steps": 807, "total_steps": 895, "loss": 0.6738, "lr": 2.335772873748807e-06, "epoch": 4.505906879777624, "percentage": 90.17, "elapsed_time": "2:26:20", "remaining_time": "0:15:57"}
|
898 |
+
{"current_steps": 808, "total_steps": 895, "loss": 0.667, "lr": 2.283496865708843e-06, "epoch": 4.511466296038916, "percentage": 90.28, "elapsed_time": "2:27:59", "remaining_time": "0:15:56"}
|
899 |
+
{"current_steps": 809, "total_steps": 895, "loss": 0.6727, "lr": 2.231795289971448e-06, "epoch": 4.517025712300208, "percentage": 90.39, "elapsed_time": "2:29:39", "remaining_time": "0:15:54"}
|
900 |
+
{"current_steps": 810, "total_steps": 895, "loss": 0.6861, "lr": 2.1806689339652864e-06, "epoch": 4.522585128561501, "percentage": 90.5, "elapsed_time": "2:31:18", "remaining_time": "0:15:52"}
|
901 |
+
{"current_steps": 811, "total_steps": 895, "loss": 0.6901, "lr": 2.130118576358249e-06, "epoch": 4.528144544822793, "percentage": 90.61, "elapsed_time": "2:32:57", "remaining_time": "0:15:50"}
|
902 |
+
{"current_steps": 812, "total_steps": 895, "loss": 0.6914, "lr": 2.0801449870456424e-06, "epoch": 4.533703961084086, "percentage": 90.73, "elapsed_time": "2:34:37", "remaining_time": "0:15:48"}
|
903 |
+
{"current_steps": 813, "total_steps": 895, "loss": 0.6742, "lr": 2.0307489271384107e-06, "epoch": 4.539263377345379, "percentage": 90.84, "elapsed_time": "2:36:16", "remaining_time": "0:15:45"}
|
904 |
+
{"current_steps": 814, "total_steps": 895, "loss": 0.6788, "lr": 1.9819311489516122e-06, "epoch": 4.544822793606671, "percentage": 90.95, "elapsed_time": "2:37:56", "remaining_time": "0:15:42"}
|
905 |
+
{"current_steps": 815, "total_steps": 895, "loss": 0.6753, "lr": 1.9336923959928855e-06, "epoch": 4.550382209867964, "percentage": 91.06, "elapsed_time": "2:39:35", "remaining_time": "0:15:39"}
|
906 |
+
{"current_steps": 816, "total_steps": 895, "loss": 0.6888, "lr": 1.8860334029511795e-06, "epoch": 4.555941626129257, "percentage": 91.17, "elapsed_time": "2:41:16", "remaining_time": "0:15:36"}
|
907 |
+
{"current_steps": 817, "total_steps": 895, "loss": 0.6676, "lr": 1.8389548956855474e-06, "epoch": 4.561501042390549, "percentage": 91.28, "elapsed_time": "2:42:56", "remaining_time": "0:15:33"}
|
908 |
+
{"current_steps": 818, "total_steps": 895, "loss": 0.6816, "lr": 1.7924575912140785e-06, "epoch": 4.5670604586518415, "percentage": 91.4, "elapsed_time": "2:44:35", "remaining_time": "0:15:29"}
|
909 |
+
{"current_steps": 819, "total_steps": 895, "loss": 0.668, "lr": 1.7465421977030094e-06, "epoch": 4.572619874913134, "percentage": 91.51, "elapsed_time": "2:46:15", "remaining_time": "0:15:25"}
|
910 |
+
{"current_steps": 820, "total_steps": 895, "loss": 0.6906, "lr": 1.7012094144558932e-06, "epoch": 4.578179291174426, "percentage": 91.62, "elapsed_time": "2:47:54", "remaining_time": "0:15:21"}
|
911 |
+
{"current_steps": 821, "total_steps": 895, "loss": 0.671, "lr": 1.656459931903016e-06, "epoch": 4.583738707435719, "percentage": 91.73, "elapsed_time": "2:49:33", "remaining_time": "0:15:17"}
|
912 |
+
{"current_steps": 822, "total_steps": 895, "loss": 0.6904, "lr": 1.6122944315907841e-06, "epoch": 4.589298123697012, "percentage": 91.84, "elapsed_time": "2:51:13", "remaining_time": "0:15:12"}
|
913 |
+
{"current_steps": 823, "total_steps": 895, "loss": 0.6864, "lr": 1.568713586171451e-06, "epoch": 4.594857539958304, "percentage": 91.96, "elapsed_time": "2:52:52", "remaining_time": "0:15:07"}
|
914 |
+
{"current_steps": 824, "total_steps": 895, "loss": 0.6739, "lr": 1.5257180593927845e-06, "epoch": 4.600416956219597, "percentage": 92.07, "elapsed_time": "2:54:31", "remaining_time": "0:15:02"}
|
915 |
+
{"current_steps": 825, "total_steps": 895, "loss": 0.69, "lr": 1.4833085060880349e-06, "epoch": 4.60597637248089, "percentage": 92.18, "elapsed_time": "2:56:11", "remaining_time": "0:14:56"}
|
916 |
+
{"current_steps": 826, "total_steps": 895, "loss": 0.6771, "lr": 1.4414855721658705e-06, "epoch": 4.611535788742182, "percentage": 92.29, "elapsed_time": "2:57:50", "remaining_time": "0:14:51"}
|
917 |
+
{"current_steps": 827, "total_steps": 895, "loss": 0.6873, "lr": 1.400249894600636e-06, "epoch": 4.617095205003475, "percentage": 92.4, "elapsed_time": "2:59:29", "remaining_time": "0:14:45"}
|
918 |
+
{"current_steps": 828, "total_steps": 895, "loss": 0.6769, "lr": 1.3596021014225858e-06, "epoch": 4.6226546212647674, "percentage": 92.51, "elapsed_time": "3:01:08", "remaining_time": "0:14:39"}
|
919 |
+
{"current_steps": 829, "total_steps": 895, "loss": 0.6814, "lr": 1.3195428117083453e-06, "epoch": 4.628214037526059, "percentage": 92.63, "elapsed_time": "3:02:48", "remaining_time": "0:14:33"}
|
920 |
+
{"current_steps": 830, "total_steps": 895, "loss": 0.6728, "lr": 1.2800726355714743e-06, "epoch": 4.633773453787352, "percentage": 92.74, "elapsed_time": "3:04:27", "remaining_time": "0:14:26"}
|
921 |
+
{"current_steps": 831, "total_steps": 895, "loss": 0.6945, "lr": 1.2411921741531807e-06, "epoch": 4.639332870048645, "percentage": 92.85, "elapsed_time": "3:06:06", "remaining_time": "0:14:20"}
|
922 |
+
{"current_steps": 832, "total_steps": 895, "loss": 0.7003, "lr": 1.2029020196131502e-06, "epoch": 4.644892286309937, "percentage": 92.96, "elapsed_time": "3:07:46", "remaining_time": "0:14:13"}
|
923 |
+
{"current_steps": 833, "total_steps": 895, "loss": 0.6682, "lr": 1.165202755120558e-06, "epoch": 4.65045170257123, "percentage": 93.07, "elapsed_time": "3:09:26", "remaining_time": "0:14:05"}
|
924 |
+
{"current_steps": 834, "total_steps": 895, "loss": 0.6832, "lr": 1.1280949548451559e-06, "epoch": 4.656011118832523, "percentage": 93.18, "elapsed_time": "3:11:05", "remaining_time": "0:13:58"}
|
925 |
+
{"current_steps": 835, "total_steps": 895, "loss": 0.6839, "lr": 1.0915791839485412e-06, "epoch": 4.661570535093815, "percentage": 93.3, "elapsed_time": "3:12:45", "remaining_time": "0:13:51"}
|
926 |
+
{"current_steps": 836, "total_steps": 895, "loss": 0.6813, "lr": 1.0556559985755377e-06, "epoch": 4.667129951355108, "percentage": 93.41, "elapsed_time": "3:14:24", "remaining_time": "0:13:43"}
|
927 |
+
{"current_steps": 837, "total_steps": 895, "loss": 0.6887, "lr": 1.020325945845757e-06, "epoch": 4.6726893676164005, "percentage": 93.52, "elapsed_time": "3:16:03", "remaining_time": "0:13:35"}
|
928 |
+
{"current_steps": 838, "total_steps": 895, "loss": 0.6751, "lr": 9.855895638452284e-07, "epoch": 4.6782487838776925, "percentage": 93.63, "elapsed_time": "3:17:43", "remaining_time": "0:13:26"}
|
929 |
+
{"current_steps": 839, "total_steps": 895, "loss": 0.6704, "lr": 9.514473816182179e-07, "epoch": 4.683808200138985, "percentage": 93.74, "elapsed_time": "3:19:23", "remaining_time": "0:13:18"}
|
930 |
+
{"current_steps": 840, "total_steps": 895, "loss": 0.6874, "lr": 9.17899919159182e-07, "epoch": 4.689367616400278, "percentage": 93.85, "elapsed_time": "3:21:04", "remaining_time": "0:13:09"}
|
931 |
+
{"current_steps": 841, "total_steps": 895, "loss": 0.6948, "lr": 8.849476874048313e-07, "epoch": 4.69492703266157, "percentage": 93.97, "elapsed_time": "3:22:44", "remaining_time": "0:13:01"}
|
932 |
+
{"current_steps": 842, "total_steps": 895, "loss": 0.6719, "lr": 8.525911882263593e-07, "epoch": 4.700486448922863, "percentage": 94.08, "elapsed_time": "3:24:23", "remaining_time": "0:12:51"}
|
933 |
+
{"current_steps": 843, "total_steps": 895, "loss": 0.6735, "lr": 8.208309144217907e-07, "epoch": 4.706045865184156, "percentage": 94.19, "elapsed_time": "3:26:03", "remaining_time": "0:12:42"}
|
934 |
+
{"current_steps": 844, "total_steps": 895, "loss": 0.6829, "lr": 7.896673497084806e-07, "epoch": 4.711605281445448, "percentage": 94.3, "elapsed_time": "3:27:43", "remaining_time": "0:12:33"}
|
935 |
+
{"current_steps": 845, "total_steps": 895, "loss": 0.6727, "lr": 7.591009687157513e-07, "epoch": 4.717164697706741, "percentage": 94.41, "elapsed_time": "3:29:22", "remaining_time": "0:12:23"}
|
936 |
+
{"current_steps": 846, "total_steps": 895, "loss": 0.6903, "lr": 7.291322369776587e-07, "epoch": 4.722724113968034, "percentage": 94.53, "elapsed_time": "3:31:01", "remaining_time": "0:12:13"}
|
937 |
+
{"current_steps": 847, "total_steps": 895, "loss": 0.6814, "lr": 6.997616109258953e-07, "epoch": 4.728283530229326, "percentage": 94.64, "elapsed_time": "3:32:41", "remaining_time": "0:12:03"}
|
938 |
+
{"current_steps": 848, "total_steps": 895, "loss": 0.6812, "lr": 6.709895378828624e-07, "epoch": 4.733842946490618, "percentage": 94.75, "elapsed_time": "3:34:20", "remaining_time": "0:11:52"}
|
939 |
+
{"current_steps": 849, "total_steps": 895, "loss": 0.6712, "lr": 6.428164560548134e-07, "epoch": 4.739402362751911, "percentage": 94.86, "elapsed_time": "3:35:59", "remaining_time": "0:11:42"}
|
940 |
+
{"current_steps": 850, "total_steps": 895, "loss": 0.678, "lr": 6.152427945252415e-07, "epoch": 4.744961779013203, "percentage": 94.97, "elapsed_time": "3:37:39", "remaining_time": "0:11:31"}
|
941 |
+
{"current_steps": 851, "total_steps": 895, "loss": 0.6757, "lr": 5.882689732482849e-07, "epoch": 4.750521195274496, "percentage": 95.08, "elapsed_time": "3:39:18", "remaining_time": "0:11:20"}
|
942 |
+
{"current_steps": 852, "total_steps": 895, "loss": 0.6752, "lr": 5.618954030423629e-07, "epoch": 4.756080611535789, "percentage": 95.2, "elapsed_time": "3:40:57", "remaining_time": "0:11:09"}
|
943 |
+
{"current_steps": 853, "total_steps": 895, "loss": 0.683, "lr": 5.361224855839231e-07, "epoch": 4.761640027797081, "percentage": 95.31, "elapsed_time": "3:42:37", "remaining_time": "0:10:57"}
|
944 |
+
{"current_steps": 854, "total_steps": 895, "loss": 0.6859, "lr": 5.109506134012954e-07, "epoch": 4.767199444058374, "percentage": 95.42, "elapsed_time": "3:44:16", "remaining_time": "0:10:46"}
|
945 |
+
{"current_steps": 855, "total_steps": 895, "loss": 0.6862, "lr": 4.863801698687409e-07, "epoch": 4.772758860319667, "percentage": 95.53, "elapsed_time": "3:45:55", "remaining_time": "0:10:34"}
|
946 |
+
{"current_steps": 856, "total_steps": 895, "loss": 0.6738, "lr": 4.6241152920060817e-07, "epoch": 4.778318276580959, "percentage": 95.64, "elapsed_time": "3:47:35", "remaining_time": "0:10:22"}
|
947 |
+
{"current_steps": 857, "total_steps": 895, "loss": 0.6896, "lr": 4.390450564456172e-07, "epoch": 4.7838776928422515, "percentage": 95.75, "elapsed_time": "3:49:14", "remaining_time": "0:10:09"}
|
948 |
+
{"current_steps": 858, "total_steps": 895, "loss": 0.6782, "lr": 4.1628110748132664e-07, "epoch": 4.789437109103544, "percentage": 95.87, "elapsed_time": "3:50:53", "remaining_time": "0:09:57"}
|
949 |
+
{"current_steps": 859, "total_steps": 895, "loss": 0.6816, "lr": 3.941200290086844e-07, "epoch": 4.794996525364836, "percentage": 95.98, "elapsed_time": "3:52:33", "remaining_time": "0:09:44"}
|
950 |
+
{"current_steps": 860, "total_steps": 895, "loss": 0.6705, "lr": 3.725621585467698e-07, "epoch": 4.800555941626129, "percentage": 96.09, "elapsed_time": "3:54:12", "remaining_time": "0:09:31"}
|
951 |
+
{"current_steps": 861, "total_steps": 895, "loss": 0.6899, "lr": 3.5160782442764216e-07, "epoch": 4.806115357887422, "percentage": 96.2, "elapsed_time": "3:55:52", "remaining_time": "0:09:18"}
|
952 |
+
{"current_steps": 862, "total_steps": 895, "loss": 0.6777, "lr": 3.3125734579134484e-07, "epoch": 4.811674774148714, "percentage": 96.31, "elapsed_time": "3:57:31", "remaining_time": "0:09:05"}
|
953 |
+
{"current_steps": 863, "total_steps": 895, "loss": 0.6854, "lr": 3.115110325810422e-07, "epoch": 4.817234190410007, "percentage": 96.42, "elapsed_time": "3:59:11", "remaining_time": "0:08:52"}
|
954 |
+
{"current_steps": 864, "total_steps": 895, "loss": 0.6763, "lr": 2.9236918553829486e-07, "epoch": 4.8227936066713, "percentage": 96.54, "elapsed_time": "4:00:51", "remaining_time": "0:08:38"}
|
955 |
+
{"current_steps": 865, "total_steps": 895, "loss": 0.6897, "lr": 2.738320961984897e-07, "epoch": 4.828353022932592, "percentage": 96.65, "elapsed_time": "4:02:30", "remaining_time": "0:08:24"}
|
956 |
+
{"current_steps": 866, "total_steps": 895, "loss": 0.6762, "lr": 2.559000468863948e-07, "epoch": 4.833912439193885, "percentage": 96.76, "elapsed_time": "4:04:09", "remaining_time": "0:08:10"}
|
957 |
+
{"current_steps": 867, "total_steps": 895, "loss": 0.6844, "lr": 2.3857331071185595e-07, "epoch": 4.839471855455177, "percentage": 96.87, "elapsed_time": "4:05:49", "remaining_time": "0:07:56"}
|
958 |
+
{"current_steps": 868, "total_steps": 895, "loss": 0.6807, "lr": 2.2185215156563578e-07, "epoch": 4.845031271716469, "percentage": 96.98, "elapsed_time": "4:07:28", "remaining_time": "0:07:41"}
|
959 |
+
{"current_steps": 869, "total_steps": 895, "loss": 0.6864, "lr": 2.057368241154123e-07, "epoch": 4.850590687977762, "percentage": 97.09, "elapsed_time": "4:09:07", "remaining_time": "0:07:27"}
|
960 |
+
{"current_steps": 870, "total_steps": 895, "loss": 0.6746, "lr": 1.9022757380186662e-07, "epoch": 4.856150104239055, "percentage": 97.21, "elapsed_time": "4:10:47", "remaining_time": "0:07:12"}
|
961 |
+
{"current_steps": 871, "total_steps": 895, "loss": 0.6953, "lr": 1.7532463683499258e-07, "epoch": 4.861709520500347, "percentage": 97.32, "elapsed_time": "4:12:26", "remaining_time": "0:06:57"}
|
962 |
+
{"current_steps": 872, "total_steps": 895, "loss": 0.6804, "lr": 1.6102824019043728e-07, "epoch": 4.86726893676164, "percentage": 97.43, "elapsed_time": "4:14:05", "remaining_time": "0:06:42"}
|
963 |
+
{"current_steps": 873, "total_steps": 895, "loss": 0.6888, "lr": 1.473386016061129e-07, "epoch": 4.872828353022933, "percentage": 97.54, "elapsed_time": "4:15:44", "remaining_time": "0:06:26"}
|
964 |
+
{"current_steps": 874, "total_steps": 895, "loss": 0.6764, "lr": 1.3425592957881707e-07, "epoch": 4.878387769284225, "percentage": 97.65, "elapsed_time": "4:17:24", "remaining_time": "0:06:11"}
|
965 |
+
{"current_steps": 875, "total_steps": 895, "loss": 0.6928, "lr": 1.2178042336111084e-07, "epoch": 4.883947185545518, "percentage": 97.77, "elapsed_time": "4:19:03", "remaining_time": "0:05:55"}
|
966 |
+
{"current_steps": 876, "total_steps": 895, "loss": 0.6773, "lr": 1.0991227295824136e-07, "epoch": 4.8895066018068105, "percentage": 97.88, "elapsed_time": "4:20:42", "remaining_time": "0:05:39"}
|
967 |
+
{"current_steps": 877, "total_steps": 895, "loss": 0.689, "lr": 9.865165912527286e-08, "epoch": 4.8950660180681025, "percentage": 97.99, "elapsed_time": "4:22:22", "remaining_time": "0:05:23"}
|
968 |
+
{"current_steps": 878, "total_steps": 895, "loss": 0.674, "lr": 8.799875336433339e-08, "epoch": 4.900625434329395, "percentage": 98.1, "elapsed_time": "4:24:01", "remaining_time": "0:05:06"}
|
969 |
+
{"current_steps": 879, "total_steps": 895, "loss": 0.6724, "lr": 7.795371792198136e-08, "epoch": 4.906184850590688, "percentage": 98.21, "elapsed_time": "4:25:40", "remaining_time": "0:04:50"}
|
970 |
+
{"current_steps": 880, "total_steps": 895, "loss": 0.6667, "lr": 6.851670578677195e-08, "epoch": 4.91174426685198, "percentage": 98.32, "elapsed_time": "4:27:20", "remaining_time": "0:04:33"}
|
971 |
+
{"current_steps": 881, "total_steps": 895, "loss": 0.6853, "lr": 5.968786068688115e-08, "epoch": 4.917303683113273, "percentage": 98.44, "elapsed_time": "4:29:00", "remaining_time": "0:04:16"}
|
972 |
+
{"current_steps": 882, "total_steps": 895, "loss": 0.6806, "lr": 5.146731708795649e-08, "epoch": 4.922863099374566, "percentage": 98.55, "elapsed_time": "4:30:39", "remaining_time": "0:03:59"}
|
973 |
+
{"current_steps": 883, "total_steps": 895, "loss": 0.6859, "lr": 4.3855200191043056e-08, "epoch": 4.928422515635858, "percentage": 98.66, "elapsed_time": "4:32:18", "remaining_time": "0:03:42"}
|
974 |
+
{"current_steps": 884, "total_steps": 895, "loss": 0.6827, "lr": 3.685162593070057e-08, "epoch": 4.933981931897151, "percentage": 98.77, "elapsed_time": "4:33:58", "remaining_time": "0:03:24"}
|
975 |
+
{"current_steps": 885, "total_steps": 895, "loss": 0.6887, "lr": 3.0456700973204854e-08, "epoch": 4.939541348158444, "percentage": 98.88, "elapsed_time": "4:35:37", "remaining_time": "0:03:06"}
|
976 |
+
{"current_steps": 886, "total_steps": 895, "loss": 0.6689, "lr": 2.4670522714957955e-08, "epoch": 4.945100764419736, "percentage": 98.99, "elapsed_time": "4:37:16", "remaining_time": "0:02:48"}
|
977 |
+
{"current_steps": 887, "total_steps": 895, "loss": 0.6838, "lr": 1.949317928097827e-08, "epoch": 4.950660180681028, "percentage": 99.11, "elapsed_time": "4:38:56", "remaining_time": "0:02:30"}
|
978 |
+
{"current_steps": 888, "total_steps": 895, "loss": 0.6764, "lr": 1.4924749523572703e-08, "epoch": 4.956219596942321, "percentage": 99.22, "elapsed_time": "4:40:35", "remaining_time": "0:02:12"}
|
979 |
+
{"current_steps": 889, "total_steps": 895, "loss": 0.6877, "lr": 1.0965303021142071e-08, "epoch": 4.961779013203613, "percentage": 99.33, "elapsed_time": "4:42:15", "remaining_time": "0:01:54"}
|
980 |
+
{"current_steps": 890, "total_steps": 895, "loss": 0.6903, "lr": 7.614900077093091e-09, "epoch": 4.967338429464906, "percentage": 99.44, "elapsed_time": "4:43:54", "remaining_time": "0:01:35"}
|
981 |
+
{"current_steps": 891, "total_steps": 895, "loss": 0.685, "lr": 4.873591718945747e-09, "epoch": 4.972897845726199, "percentage": 99.55, "elapsed_time": "4:45:33", "remaining_time": "0:01:16"}
|
982 |
+
{"current_steps": 892, "total_steps": 895, "loss": 0.6779, "lr": 2.741419697560588e-09, "epoch": 4.978457261987491, "percentage": 99.66, "elapsed_time": "4:47:13", "remaining_time": "0:00:57"}
|
983 |
+
{"current_steps": 893, "total_steps": 895, "loss": 0.6931, "lr": 1.2184164864725845e-09, "epoch": 4.984016678248784, "percentage": 99.78, "elapsed_time": "4:48:52", "remaining_time": "0:00:38"}
|
984 |
+
{"current_steps": 894, "total_steps": 895, "loss": 0.6791, "lr": 3.0460528142040033e-10, "epoch": 4.989576094510077, "percentage": 99.89, "elapsed_time": "4:50:31", "remaining_time": "0:00:19"}
|
985 |
+
{"current_steps": 895, "total_steps": 895, "loss": 0.6829, "lr": 0.0, "epoch": 4.995135510771369, "percentage": 100.0, "elapsed_time": "4:52:10", "remaining_time": "0:00:00"}
|
986 |
+
{"current_steps": 895, "total_steps": 895, "epoch": 4.995135510771369, "percentage": 100.0, "elapsed_time": "4:55:26", "remaining_time": "0:00:00"}
|
training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c873563ab41b2f44bcaf05f347c480badbd4337d8e0746816274dfefa9c354ca
|
3 |
+
size 7416
|