Training in progress, epoch 3
Browse files
model-00001-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4877660776
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:29d76fbbdd1ab6dc6c700c5509b40401ba2bda28eeac4e712d7f46bae58908ce
|
3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4932751008
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d60c99a36df83e9799b073080c9964a644a71e9ddac044e0a12f082f6b201631
|
3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4330865200
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:802dcfb2a237a15a2cc90737ba2001b14981432a4f2209584a9e055b2c27bf30
|
3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1089994880
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d3da32877c6d45a6090c5107d807e2538ca1a661f45093dfb315a8e7cac43a00
|
3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
@@ -751,3 +751,250 @@
|
|
751 |
{"current_steps": 751, "total_steps": 1230, "loss": 0.4417, "lr": 1.5802911561074944e-05, "epoch": 3.042025316455696, "percentage": 61.06, "elapsed_time": "2:12:05", "remaining_time": "1:24:14"}
|
752 |
{"current_steps": 752, "total_steps": 1230, "loss": 0.4641, "lr": 1.5747433727755595e-05, "epoch": 3.0460759493670886, "percentage": 61.14, "elapsed_time": "2:12:15", "remaining_time": "1:24:03"}
|
753 |
{"current_steps": 753, "total_steps": 1230, "loss": 0.4487, "lr": 1.5691990144020376e-05, "epoch": 3.050126582278481, "percentage": 61.22, "elapsed_time": "2:12:25", "remaining_time": "1:23:53"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
751 |
{"current_steps": 751, "total_steps": 1230, "loss": 0.4417, "lr": 1.5802911561074944e-05, "epoch": 3.042025316455696, "percentage": 61.06, "elapsed_time": "2:12:05", "remaining_time": "1:24:14"}
|
752 |
{"current_steps": 752, "total_steps": 1230, "loss": 0.4641, "lr": 1.5747433727755595e-05, "epoch": 3.0460759493670886, "percentage": 61.14, "elapsed_time": "2:12:15", "remaining_time": "1:24:03"}
|
753 |
{"current_steps": 753, "total_steps": 1230, "loss": 0.4487, "lr": 1.5691990144020376e-05, "epoch": 3.050126582278481, "percentage": 61.22, "elapsed_time": "2:12:25", "remaining_time": "1:23:53"}
|
754 |
+
{"current_steps": 754, "total_steps": 1230, "loss": 0.4426, "lr": 1.5636581256404297e-05, "epoch": 3.0541772151898736, "percentage": 61.3, "elapsed_time": "2:12:35", "remaining_time": "1:23:42"}
|
755 |
+
{"current_steps": 755, "total_steps": 1230, "loss": 0.4345, "lr": 1.558120751116291e-05, "epoch": 3.0582278481012657, "percentage": 61.38, "elapsed_time": "2:12:45", "remaining_time": "1:23:31"}
|
756 |
+
{"current_steps": 756, "total_steps": 1230, "loss": 0.4369, "lr": 1.552586935426876e-05, "epoch": 3.062278481012658, "percentage": 61.46, "elapsed_time": "2:12:55", "remaining_time": "1:23:20"}
|
757 |
+
{"current_steps": 757, "total_steps": 1230, "loss": 0.4471, "lr": 1.547056723140774e-05, "epoch": 3.0663291139240507, "percentage": 61.54, "elapsed_time": "2:13:05", "remaining_time": "1:23:09"}
|
758 |
+
{"current_steps": 758, "total_steps": 1230, "loss": 0.4458, "lr": 1.5415301587975565e-05, "epoch": 3.0703797468354432, "percentage": 61.63, "elapsed_time": "2:13:15", "remaining_time": "1:22:58"}
|
759 |
+
{"current_steps": 759, "total_steps": 1230, "loss": 0.4503, "lr": 1.536007286907411e-05, "epoch": 3.0744303797468353, "percentage": 61.71, "elapsed_time": "2:13:25", "remaining_time": "1:22:47"}
|
760 |
+
{"current_steps": 760, "total_steps": 1230, "loss": 0.4339, "lr": 1.5304881519507896e-05, "epoch": 3.078481012658228, "percentage": 61.79, "elapsed_time": "2:13:35", "remaining_time": "1:22:37"}
|
761 |
+
{"current_steps": 761, "total_steps": 1230, "loss": 0.4514, "lr": 1.5249727983780453e-05, "epoch": 3.0825316455696203, "percentage": 61.87, "elapsed_time": "2:13:45", "remaining_time": "1:22:26"}
|
762 |
+
{"current_steps": 762, "total_steps": 1230, "loss": 0.4629, "lr": 1.5194612706090786e-05, "epoch": 3.086582278481013, "percentage": 61.95, "elapsed_time": "2:13:55", "remaining_time": "1:22:15"}
|
763 |
+
{"current_steps": 763, "total_steps": 1230, "loss": 0.4291, "lr": 1.5139536130329771e-05, "epoch": 3.090632911392405, "percentage": 62.03, "elapsed_time": "2:14:06", "remaining_time": "1:22:04"}
|
764 |
+
{"current_steps": 764, "total_steps": 1230, "loss": 0.4473, "lr": 1.508449870007656e-05, "epoch": 3.0946835443037974, "percentage": 62.11, "elapsed_time": "2:14:16", "remaining_time": "1:21:53"}
|
765 |
+
{"current_steps": 765, "total_steps": 1230, "loss": 0.4517, "lr": 1.5029500858595056e-05, "epoch": 3.09873417721519, "percentage": 62.2, "elapsed_time": "2:14:26", "remaining_time": "1:21:42"}
|
766 |
+
{"current_steps": 766, "total_steps": 1230, "loss": 0.4459, "lr": 1.4974543048830328e-05, "epoch": 3.1027848101265825, "percentage": 62.28, "elapsed_time": "2:14:36", "remaining_time": "1:21:32"}
|
767 |
+
{"current_steps": 767, "total_steps": 1230, "loss": 0.4337, "lr": 1.4919625713405e-05, "epoch": 3.1068354430379745, "percentage": 62.36, "elapsed_time": "2:14:46", "remaining_time": "1:21:21"}
|
768 |
+
{"current_steps": 768, "total_steps": 1230, "loss": 0.4339, "lr": 1.4864749294615756e-05, "epoch": 3.110886075949367, "percentage": 62.44, "elapsed_time": "2:14:56", "remaining_time": "1:21:10"}
|
769 |
+
{"current_steps": 769, "total_steps": 1230, "loss": 0.459, "lr": 1.4809914234429716e-05, "epoch": 3.1149367088607596, "percentage": 62.52, "elapsed_time": "2:15:06", "remaining_time": "1:20:59"}
|
770 |
+
{"current_steps": 770, "total_steps": 1230, "loss": 0.4664, "lr": 1.4755120974480923e-05, "epoch": 3.118987341772152, "percentage": 62.6, "elapsed_time": "2:15:16", "remaining_time": "1:20:48"}
|
771 |
+
{"current_steps": 771, "total_steps": 1230, "loss": 0.4423, "lr": 1.4700369956066771e-05, "epoch": 3.123037974683544, "percentage": 62.68, "elapsed_time": "2:15:26", "remaining_time": "1:20:38"}
|
772 |
+
{"current_steps": 772, "total_steps": 1230, "loss": 0.4472, "lr": 1.4645661620144413e-05, "epoch": 3.1270886075949367, "percentage": 62.76, "elapsed_time": "2:15:36", "remaining_time": "1:20:27"}
|
773 |
+
{"current_steps": 773, "total_steps": 1230, "loss": 0.4506, "lr": 1.4590996407327284e-05, "epoch": 3.131139240506329, "percentage": 62.85, "elapsed_time": "2:15:46", "remaining_time": "1:20:16"}
|
774 |
+
{"current_steps": 774, "total_steps": 1230, "loss": 0.4419, "lr": 1.4536374757881487e-05, "epoch": 3.1351898734177217, "percentage": 62.93, "elapsed_time": "2:15:56", "remaining_time": "1:20:05"}
|
775 |
+
{"current_steps": 775, "total_steps": 1230, "loss": 0.4434, "lr": 1.4481797111722271e-05, "epoch": 3.1392405063291138, "percentage": 63.01, "elapsed_time": "2:16:06", "remaining_time": "1:19:54"}
|
776 |
+
{"current_steps": 776, "total_steps": 1230, "loss": 0.4764, "lr": 1.4427263908410507e-05, "epoch": 3.1432911392405063, "percentage": 63.09, "elapsed_time": "2:16:16", "remaining_time": "1:19:43"}
|
777 |
+
{"current_steps": 777, "total_steps": 1230, "loss": 0.4384, "lr": 1.4372775587149108e-05, "epoch": 3.147341772151899, "percentage": 63.17, "elapsed_time": "2:16:26", "remaining_time": "1:19:33"}
|
778 |
+
{"current_steps": 778, "total_steps": 1230, "loss": 0.4629, "lr": 1.4318332586779522e-05, "epoch": 3.1513924050632913, "percentage": 63.25, "elapsed_time": "2:16:36", "remaining_time": "1:19:22"}
|
779 |
+
{"current_steps": 779, "total_steps": 1230, "loss": 0.4629, "lr": 1.4263935345778202e-05, "epoch": 3.1554430379746834, "percentage": 63.33, "elapsed_time": "2:16:47", "remaining_time": "1:19:11"}
|
780 |
+
{"current_steps": 780, "total_steps": 1230, "loss": 0.4664, "lr": 1.420958430225303e-05, "epoch": 3.159493670886076, "percentage": 63.41, "elapsed_time": "2:16:57", "remaining_time": "1:19:00"}
|
781 |
+
{"current_steps": 781, "total_steps": 1230, "loss": 0.4529, "lr": 1.415527989393985e-05, "epoch": 3.1635443037974684, "percentage": 63.5, "elapsed_time": "2:17:07", "remaining_time": "1:18:49"}
|
782 |
+
{"current_steps": 782, "total_steps": 1230, "loss": 0.4549, "lr": 1.410102255819891e-05, "epoch": 3.167594936708861, "percentage": 63.58, "elapsed_time": "2:17:17", "remaining_time": "1:18:39"}
|
783 |
+
{"current_steps": 783, "total_steps": 1230, "loss": 0.4488, "lr": 1.404681273201131e-05, "epoch": 3.171645569620253, "percentage": 63.66, "elapsed_time": "2:17:27", "remaining_time": "1:18:28"}
|
784 |
+
{"current_steps": 784, "total_steps": 1230, "loss": 0.4483, "lr": 1.399265085197556e-05, "epoch": 3.1756962025316455, "percentage": 63.74, "elapsed_time": "2:17:37", "remaining_time": "1:18:17"}
|
785 |
+
{"current_steps": 785, "total_steps": 1230, "loss": 0.4409, "lr": 1.393853735430398e-05, "epoch": 3.179746835443038, "percentage": 63.82, "elapsed_time": "2:17:47", "remaining_time": "1:18:06"}
|
786 |
+
{"current_steps": 786, "total_steps": 1230, "loss": 0.4477, "lr": 1.3884472674819246e-05, "epoch": 3.1837974683544306, "percentage": 63.9, "elapsed_time": "2:17:57", "remaining_time": "1:17:55"}
|
787 |
+
{"current_steps": 787, "total_steps": 1230, "loss": 0.4614, "lr": 1.3830457248950864e-05, "epoch": 3.1878481012658226, "percentage": 63.98, "elapsed_time": "2:18:07", "remaining_time": "1:17:44"}
|
788 |
+
{"current_steps": 788, "total_steps": 1230, "loss": 0.4547, "lr": 1.377649151173163e-05, "epoch": 3.191898734177215, "percentage": 64.07, "elapsed_time": "2:18:17", "remaining_time": "1:17:34"}
|
789 |
+
{"current_steps": 789, "total_steps": 1230, "loss": 0.4568, "lr": 1.3722575897794181e-05, "epoch": 3.1959493670886077, "percentage": 64.15, "elapsed_time": "2:18:27", "remaining_time": "1:17:23"}
|
790 |
+
{"current_steps": 790, "total_steps": 1230, "loss": 0.4329, "lr": 1.3668710841367472e-05, "epoch": 3.2, "percentage": 64.23, "elapsed_time": "2:18:37", "remaining_time": "1:17:12"}
|
791 |
+
{"current_steps": 791, "total_steps": 1230, "loss": 0.447, "lr": 1.361489677627324e-05, "epoch": 3.2040506329113922, "percentage": 64.31, "elapsed_time": "2:18:47", "remaining_time": "1:17:01"}
|
792 |
+
{"current_steps": 792, "total_steps": 1230, "loss": 0.4493, "lr": 1.3561134135922585e-05, "epoch": 3.2081012658227848, "percentage": 64.39, "elapsed_time": "2:18:57", "remaining_time": "1:16:51"}
|
793 |
+
{"current_steps": 793, "total_steps": 1230, "loss": 0.4625, "lr": 1.350742335331241e-05, "epoch": 3.2121518987341773, "percentage": 64.47, "elapsed_time": "2:19:07", "remaining_time": "1:16:40"}
|
794 |
+
{"current_steps": 794, "total_steps": 1230, "loss": 0.4523, "lr": 1.345376486102198e-05, "epoch": 3.21620253164557, "percentage": 64.55, "elapsed_time": "2:19:17", "remaining_time": "1:16:29"}
|
795 |
+
{"current_steps": 795, "total_steps": 1230, "loss": 0.4491, "lr": 1.3400159091209414e-05, "epoch": 3.220253164556962, "percentage": 64.63, "elapsed_time": "2:19:27", "remaining_time": "1:16:18"}
|
796 |
+
{"current_steps": 796, "total_steps": 1230, "loss": 0.4573, "lr": 1.3346606475608216e-05, "epoch": 3.2243037974683544, "percentage": 64.72, "elapsed_time": "2:19:37", "remaining_time": "1:16:07"}
|
797 |
+
{"current_steps": 797, "total_steps": 1230, "loss": 0.4762, "lr": 1.3293107445523781e-05, "epoch": 3.228354430379747, "percentage": 64.8, "elapsed_time": "2:19:48", "remaining_time": "1:15:57"}
|
798 |
+
{"current_steps": 798, "total_steps": 1230, "loss": 0.4618, "lr": 1.3239662431829949e-05, "epoch": 3.2324050632911394, "percentage": 64.88, "elapsed_time": "2:19:58", "remaining_time": "1:15:46"}
|
799 |
+
{"current_steps": 799, "total_steps": 1230, "loss": 0.4583, "lr": 1.3186271864965509e-05, "epoch": 3.2364556962025315, "percentage": 64.96, "elapsed_time": "2:20:08", "remaining_time": "1:15:35"}
|
800 |
+
{"current_steps": 800, "total_steps": 1230, "loss": 0.4573, "lr": 1.3132936174930756e-05, "epoch": 3.240506329113924, "percentage": 65.04, "elapsed_time": "2:20:18", "remaining_time": "1:15:24"}
|
801 |
+
{"current_steps": 801, "total_steps": 1230, "loss": 0.4477, "lr": 1.3079655791283995e-05, "epoch": 3.2445569620253165, "percentage": 65.12, "elapsed_time": "2:20:28", "remaining_time": "1:15:13"}
|
802 |
+
{"current_steps": 802, "total_steps": 1230, "loss": 0.4445, "lr": 1.3026431143138108e-05, "epoch": 3.248607594936709, "percentage": 65.2, "elapsed_time": "2:20:38", "remaining_time": "1:15:03"}
|
803 |
+
{"current_steps": 803, "total_steps": 1230, "loss": 0.45, "lr": 1.2973262659157114e-05, "epoch": 3.252658227848101, "percentage": 65.28, "elapsed_time": "2:20:48", "remaining_time": "1:14:52"}
|
804 |
+
{"current_steps": 804, "total_steps": 1230, "loss": 0.4551, "lr": 1.2920150767552651e-05, "epoch": 3.2567088607594936, "percentage": 65.37, "elapsed_time": "2:20:58", "remaining_time": "1:14:41"}
|
805 |
+
{"current_steps": 805, "total_steps": 1230, "loss": 0.4589, "lr": 1.2867095896080607e-05, "epoch": 3.260759493670886, "percentage": 65.45, "elapsed_time": "2:21:08", "remaining_time": "1:14:30"}
|
806 |
+
{"current_steps": 806, "total_steps": 1230, "loss": 0.4557, "lr": 1.2814098472037612e-05, "epoch": 3.2648101265822786, "percentage": 65.53, "elapsed_time": "2:21:18", "remaining_time": "1:14:20"}
|
807 |
+
{"current_steps": 807, "total_steps": 1230, "loss": 0.4541, "lr": 1.276115892225764e-05, "epoch": 3.2688607594936707, "percentage": 65.61, "elapsed_time": "2:21:28", "remaining_time": "1:14:09"}
|
808 |
+
{"current_steps": 808, "total_steps": 1230, "loss": 0.4577, "lr": 1.2708277673108555e-05, "epoch": 3.2729113924050632, "percentage": 65.69, "elapsed_time": "2:21:38", "remaining_time": "1:13:58"}
|
809 |
+
{"current_steps": 809, "total_steps": 1230, "loss": 0.4408, "lr": 1.2655455150488649e-05, "epoch": 3.2769620253164558, "percentage": 65.77, "elapsed_time": "2:21:48", "remaining_time": "1:13:47"}
|
810 |
+
{"current_steps": 810, "total_steps": 1230, "loss": 0.4532, "lr": 1.2602691779823272e-05, "epoch": 3.2810126582278483, "percentage": 65.85, "elapsed_time": "2:21:58", "remaining_time": "1:13:37"}
|
811 |
+
{"current_steps": 811, "total_steps": 1230, "loss": 0.4519, "lr": 1.2549987986061355e-05, "epoch": 3.2850632911392403, "percentage": 65.93, "elapsed_time": "2:22:08", "remaining_time": "1:13:26"}
|
812 |
+
{"current_steps": 812, "total_steps": 1230, "loss": 0.462, "lr": 1.2497344193672005e-05, "epoch": 3.289113924050633, "percentage": 66.02, "elapsed_time": "2:22:18", "remaining_time": "1:13:15"}
|
813 |
+
{"current_steps": 813, "total_steps": 1230, "loss": 0.4525, "lr": 1.2444760826641092e-05, "epoch": 3.2931645569620254, "percentage": 66.1, "elapsed_time": "2:22:28", "remaining_time": "1:13:04"}
|
814 |
+
{"current_steps": 814, "total_steps": 1230, "loss": 0.4517, "lr": 1.2392238308467817e-05, "epoch": 3.297215189873418, "percentage": 66.18, "elapsed_time": "2:22:38", "remaining_time": "1:12:54"}
|
815 |
+
{"current_steps": 815, "total_steps": 1230, "loss": 0.4571, "lr": 1.2339777062161326e-05, "epoch": 3.30126582278481, "percentage": 66.26, "elapsed_time": "2:22:49", "remaining_time": "1:12:43"}
|
816 |
+
{"current_steps": 816, "total_steps": 1230, "loss": 0.4446, "lr": 1.2287377510237293e-05, "epoch": 3.3053164556962025, "percentage": 66.34, "elapsed_time": "2:22:59", "remaining_time": "1:12:32"}
|
817 |
+
{"current_steps": 817, "total_steps": 1230, "loss": 0.458, "lr": 1.2235040074714488e-05, "epoch": 3.309367088607595, "percentage": 66.42, "elapsed_time": "2:23:09", "remaining_time": "1:12:21"}
|
818 |
+
{"current_steps": 818, "total_steps": 1230, "loss": 0.4663, "lr": 1.2182765177111434e-05, "epoch": 3.3134177215189875, "percentage": 66.5, "elapsed_time": "2:23:19", "remaining_time": "1:12:11"}
|
819 |
+
{"current_steps": 819, "total_steps": 1230, "loss": 0.4443, "lr": 1.213055323844297e-05, "epoch": 3.3174683544303796, "percentage": 66.59, "elapsed_time": "2:23:29", "remaining_time": "1:12:00"}
|
820 |
+
{"current_steps": 820, "total_steps": 1230, "loss": 0.4452, "lr": 1.2078404679216864e-05, "epoch": 3.321518987341772, "percentage": 66.67, "elapsed_time": "2:23:39", "remaining_time": "1:11:49"}
|
821 |
+
{"current_steps": 821, "total_steps": 1230, "loss": 0.4511, "lr": 1.2026319919430458e-05, "epoch": 3.3255696202531646, "percentage": 66.75, "elapsed_time": "2:23:49", "remaining_time": "1:11:39"}
|
822 |
+
{"current_steps": 822, "total_steps": 1230, "loss": 0.4554, "lr": 1.1974299378567227e-05, "epoch": 3.329620253164557, "percentage": 66.83, "elapsed_time": "2:23:59", "remaining_time": "1:11:28"}
|
823 |
+
{"current_steps": 823, "total_steps": 1230, "loss": 0.4307, "lr": 1.1922343475593462e-05, "epoch": 3.333670886075949, "percentage": 66.91, "elapsed_time": "2:24:09", "remaining_time": "1:11:17"}
|
824 |
+
{"current_steps": 824, "total_steps": 1230, "loss": 0.4552, "lr": 1.187045262895488e-05, "epoch": 3.3377215189873417, "percentage": 66.99, "elapsed_time": "2:24:19", "remaining_time": "1:11:06"}
|
825 |
+
{"current_steps": 825, "total_steps": 1230, "loss": 0.4528, "lr": 1.1818627256573203e-05, "epoch": 3.3417721518987342, "percentage": 67.07, "elapsed_time": "2:24:29", "remaining_time": "1:10:56"}
|
826 |
+
{"current_steps": 826, "total_steps": 1230, "loss": 0.4592, "lr": 1.1766867775842864e-05, "epoch": 3.3458227848101267, "percentage": 67.15, "elapsed_time": "2:24:39", "remaining_time": "1:10:45"}
|
827 |
+
{"current_steps": 827, "total_steps": 1230, "loss": 0.4734, "lr": 1.1715174603627615e-05, "epoch": 3.349873417721519, "percentage": 67.24, "elapsed_time": "2:24:49", "remaining_time": "1:10:34"}
|
828 |
+
{"current_steps": 828, "total_steps": 1230, "loss": 0.4645, "lr": 1.1663548156257147e-05, "epoch": 3.3539240506329113, "percentage": 67.32, "elapsed_time": "2:25:00", "remaining_time": "1:10:23"}
|
829 |
+
{"current_steps": 829, "total_steps": 1230, "loss": 0.4442, "lr": 1.161198884952377e-05, "epoch": 3.357974683544304, "percentage": 67.4, "elapsed_time": "2:25:10", "remaining_time": "1:10:13"}
|
830 |
+
{"current_steps": 830, "total_steps": 1230, "loss": 0.4636, "lr": 1.1560497098679056e-05, "epoch": 3.3620253164556964, "percentage": 67.48, "elapsed_time": "2:25:20", "remaining_time": "1:10:02"}
|
831 |
+
{"current_steps": 831, "total_steps": 1230, "loss": 0.437, "lr": 1.1509073318430479e-05, "epoch": 3.3660759493670884, "percentage": 67.56, "elapsed_time": "2:25:30", "remaining_time": "1:09:51"}
|
832 |
+
{"current_steps": 832, "total_steps": 1230, "loss": 0.4599, "lr": 1.1457717922938116e-05, "epoch": 3.370126582278481, "percentage": 67.64, "elapsed_time": "2:25:40", "remaining_time": "1:09:41"}
|
833 |
+
{"current_steps": 833, "total_steps": 1230, "loss": 0.4408, "lr": 1.1406431325811233e-05, "epoch": 3.3741772151898735, "percentage": 67.72, "elapsed_time": "2:25:50", "remaining_time": "1:09:30"}
|
834 |
+
{"current_steps": 834, "total_steps": 1230, "loss": 0.4545, "lr": 1.135521394010506e-05, "epoch": 3.378227848101266, "percentage": 67.8, "elapsed_time": "2:26:00", "remaining_time": "1:09:19"}
|
835 |
+
{"current_steps": 835, "total_steps": 1230, "loss": 0.4545, "lr": 1.1304066178317367e-05, "epoch": 3.382278481012658, "percentage": 67.89, "elapsed_time": "2:26:10", "remaining_time": "1:09:08"}
|
836 |
+
{"current_steps": 836, "total_steps": 1230, "loss": 0.4541, "lr": 1.1252988452385199e-05, "epoch": 3.3863291139240506, "percentage": 67.97, "elapsed_time": "2:26:20", "remaining_time": "1:08:58"}
|
837 |
+
{"current_steps": 837, "total_steps": 1230, "loss": 0.4522, "lr": 1.1201981173681536e-05, "epoch": 3.390379746835443, "percentage": 68.05, "elapsed_time": "2:26:30", "remaining_time": "1:08:47"}
|
838 |
+
{"current_steps": 838, "total_steps": 1230, "loss": 0.4617, "lr": 1.1151044753011991e-05, "epoch": 3.3944303797468356, "percentage": 68.13, "elapsed_time": "2:26:40", "remaining_time": "1:08:36"}
|
839 |
+
{"current_steps": 839, "total_steps": 1230, "loss": 0.4446, "lr": 1.1100179600611491e-05, "epoch": 3.3984810126582277, "percentage": 68.21, "elapsed_time": "2:26:50", "remaining_time": "1:08:26"}
|
840 |
+
{"current_steps": 840, "total_steps": 1230, "loss": 0.4471, "lr": 1.1049386126140985e-05, "epoch": 3.40253164556962, "percentage": 68.29, "elapsed_time": "2:27:00", "remaining_time": "1:08:15"}
|
841 |
+
{"current_steps": 841, "total_steps": 1230, "loss": 0.4418, "lr": 1.0998664738684128e-05, "epoch": 3.4065822784810127, "percentage": 68.37, "elapsed_time": "2:27:11", "remaining_time": "1:08:04"}
|
842 |
+
{"current_steps": 842, "total_steps": 1230, "loss": 0.4548, "lr": 1.0948015846744e-05, "epoch": 3.410632911392405, "percentage": 68.46, "elapsed_time": "2:27:21", "remaining_time": "1:07:54"}
|
843 |
+
{"current_steps": 843, "total_steps": 1230, "loss": 0.4523, "lr": 1.0897439858239832e-05, "epoch": 3.4146835443037973, "percentage": 68.54, "elapsed_time": "2:27:31", "remaining_time": "1:07:43"}
|
844 |
+
{"current_steps": 844, "total_steps": 1230, "loss": 0.4488, "lr": 1.0846937180503652e-05, "epoch": 3.41873417721519, "percentage": 68.62, "elapsed_time": "2:27:41", "remaining_time": "1:07:32"}
|
845 |
+
{"current_steps": 845, "total_steps": 1230, "loss": 0.4586, "lr": 1.0796508220277117e-05, "epoch": 3.4227848101265823, "percentage": 68.7, "elapsed_time": "2:27:51", "remaining_time": "1:07:21"}
|
846 |
+
{"current_steps": 846, "total_steps": 1230, "loss": 0.4345, "lr": 1.0746153383708107e-05, "epoch": 3.426835443037975, "percentage": 68.78, "elapsed_time": "2:28:01", "remaining_time": "1:07:11"}
|
847 |
+
{"current_steps": 847, "total_steps": 1230, "loss": 0.4508, "lr": 1.0695873076347579e-05, "epoch": 3.430886075949367, "percentage": 68.86, "elapsed_time": "2:28:11", "remaining_time": "1:07:00"}
|
848 |
+
{"current_steps": 848, "total_steps": 1230, "loss": 0.4565, "lr": 1.0645667703146205e-05, "epoch": 3.4349367088607594, "percentage": 68.94, "elapsed_time": "2:28:21", "remaining_time": "1:06:49"}
|
849 |
+
{"current_steps": 849, "total_steps": 1230, "loss": 0.4498, "lr": 1.0595537668451161e-05, "epoch": 3.438987341772152, "percentage": 69.02, "elapsed_time": "2:28:31", "remaining_time": "1:06:39"}
|
850 |
+
{"current_steps": 850, "total_steps": 1230, "loss": 0.4698, "lr": 1.0545483376002854e-05, "epoch": 3.4430379746835444, "percentage": 69.11, "elapsed_time": "2:28:41", "remaining_time": "1:06:28"}
|
851 |
+
{"current_steps": 851, "total_steps": 1230, "loss": 0.4513, "lr": 1.0495505228931676e-05, "epoch": 3.4470886075949365, "percentage": 69.19, "elapsed_time": "2:28:51", "remaining_time": "1:06:17"}
|
852 |
+
{"current_steps": 852, "total_steps": 1230, "loss": 0.4644, "lr": 1.044560362975474e-05, "epoch": 3.451139240506329, "percentage": 69.27, "elapsed_time": "2:29:01", "remaining_time": "1:06:07"}
|
853 |
+
{"current_steps": 853, "total_steps": 1230, "loss": 0.4414, "lr": 1.0395778980372695e-05, "epoch": 3.4551898734177215, "percentage": 69.35, "elapsed_time": "2:29:11", "remaining_time": "1:05:56"}
|
854 |
+
{"current_steps": 854, "total_steps": 1230, "loss": 0.4464, "lr": 1.0346031682066381e-05, "epoch": 3.459240506329114, "percentage": 69.43, "elapsed_time": "2:29:21", "remaining_time": "1:05:45"}
|
855 |
+
{"current_steps": 855, "total_steps": 1230, "loss": 0.4774, "lr": 1.0296362135493724e-05, "epoch": 3.463291139240506, "percentage": 69.51, "elapsed_time": "2:29:32", "remaining_time": "1:05:35"}
|
856 |
+
{"current_steps": 856, "total_steps": 1230, "loss": 0.4681, "lr": 1.0246770740686422e-05, "epoch": 3.4673417721518986, "percentage": 69.59, "elapsed_time": "2:29:42", "remaining_time": "1:05:24"}
|
857 |
+
{"current_steps": 857, "total_steps": 1230, "loss": 0.451, "lr": 1.0197257897046743e-05, "epoch": 3.471392405063291, "percentage": 69.67, "elapsed_time": "2:29:52", "remaining_time": "1:05:13"}
|
858 |
+
{"current_steps": 858, "total_steps": 1230, "loss": 0.4542, "lr": 1.014782400334433e-05, "epoch": 3.4754430379746837, "percentage": 69.76, "elapsed_time": "2:30:02", "remaining_time": "1:05:03"}
|
859 |
+
{"current_steps": 859, "total_steps": 1230, "loss": 0.4567, "lr": 1.009846945771296e-05, "epoch": 3.479493670886076, "percentage": 69.84, "elapsed_time": "2:30:12", "remaining_time": "1:04:52"}
|
860 |
+
{"current_steps": 860, "total_steps": 1230, "loss": 0.4685, "lr": 1.0049194657647363e-05, "epoch": 3.4835443037974683, "percentage": 69.92, "elapsed_time": "2:30:22", "remaining_time": "1:04:41"}
|
861 |
+
{"current_steps": 861, "total_steps": 1230, "loss": 0.4448, "lr": 1.0000000000000006e-05, "epoch": 3.487594936708861, "percentage": 70.0, "elapsed_time": "2:30:32", "remaining_time": "1:04:31"}
|
862 |
+
{"current_steps": 862, "total_steps": 1230, "loss": 0.4496, "lr": 9.950885880977891e-06, "epoch": 3.4916455696202533, "percentage": 70.08, "elapsed_time": "2:30:42", "remaining_time": "1:04:20"}
|
863 |
+
{"current_steps": 863, "total_steps": 1230, "loss": 0.4473, "lr": 9.901852696139382e-06, "epoch": 3.4956962025316454, "percentage": 70.16, "elapsed_time": "2:30:52", "remaining_time": "1:04:09"}
|
864 |
+
{"current_steps": 864, "total_steps": 1230, "loss": 0.4569, "lr": 9.852900840391027e-06, "epoch": 3.499746835443038, "percentage": 70.24, "elapsed_time": "2:31:02", "remaining_time": "1:03:59"}
|
865 |
+
{"current_steps": 865, "total_steps": 1230, "loss": 0.458, "lr": 9.804030707984313e-06, "epoch": 3.5037974683544304, "percentage": 70.33, "elapsed_time": "2:31:12", "remaining_time": "1:03:48"}
|
866 |
+
{"current_steps": 866, "total_steps": 1230, "loss": 0.4514, "lr": 9.755242692512599e-06, "epoch": 3.507848101265823, "percentage": 70.41, "elapsed_time": "2:31:22", "remaining_time": "1:03:37"}
|
867 |
+
{"current_steps": 867, "total_steps": 1230, "loss": 0.4563, "lr": 9.70653718690782e-06, "epoch": 3.5118987341772154, "percentage": 70.49, "elapsed_time": "2:31:32", "remaining_time": "1:03:27"}
|
868 |
+
{"current_steps": 868, "total_steps": 1230, "loss": 0.4487, "lr": 9.657914583437454e-06, "epoch": 3.5159493670886075, "percentage": 70.57, "elapsed_time": "2:31:42", "remaining_time": "1:03:16"}
|
869 |
+
{"current_steps": 869, "total_steps": 1230, "loss": 0.4509, "lr": 9.609375273701246e-06, "epoch": 3.52, "percentage": 70.65, "elapsed_time": "2:31:52", "remaining_time": "1:03:05"}
|
870 |
+
{"current_steps": 870, "total_steps": 1230, "loss": 0.4627, "lr": 9.560919648628133e-06, "epoch": 3.5240506329113925, "percentage": 70.73, "elapsed_time": "2:32:03", "remaining_time": "1:02:55"}
|
871 |
+
{"current_steps": 871, "total_steps": 1230, "loss": 0.4484, "lr": 9.512548098473047e-06, "epoch": 3.5281012658227846, "percentage": 70.81, "elapsed_time": "2:32:13", "remaining_time": "1:02:44"}
|
872 |
+
{"current_steps": 872, "total_steps": 1230, "loss": 0.4562, "lr": 9.464261012813825e-06, "epoch": 3.532151898734177, "percentage": 70.89, "elapsed_time": "2:32:23", "remaining_time": "1:02:33"}
|
873 |
+
{"current_steps": 873, "total_steps": 1230, "loss": 0.4402, "lr": 9.416058780547987e-06, "epoch": 3.5362025316455696, "percentage": 70.98, "elapsed_time": "2:32:33", "remaining_time": "1:02:23"}
|
874 |
+
{"current_steps": 874, "total_steps": 1230, "loss": 0.4475, "lr": 9.367941789889714e-06, "epoch": 3.540253164556962, "percentage": 71.06, "elapsed_time": "2:32:43", "remaining_time": "1:02:12"}
|
875 |
+
{"current_steps": 875, "total_steps": 1230, "loss": 0.4423, "lr": 9.319910428366607e-06, "epoch": 3.5443037974683547, "percentage": 71.14, "elapsed_time": "2:32:53", "remaining_time": "1:02:01"}
|
876 |
+
{"current_steps": 876, "total_steps": 1230, "loss": 0.4499, "lr": 9.271965082816667e-06, "epoch": 3.5483544303797467, "percentage": 71.22, "elapsed_time": "2:33:03", "remaining_time": "1:01:51"}
|
877 |
+
{"current_steps": 877, "total_steps": 1230, "loss": 0.447, "lr": 9.224106139385111e-06, "epoch": 3.5524050632911393, "percentage": 71.3, "elapsed_time": "2:33:13", "remaining_time": "1:01:40"}
|
878 |
+
{"current_steps": 878, "total_steps": 1230, "loss": 0.4571, "lr": 9.176333983521291e-06, "epoch": 3.5564556962025318, "percentage": 71.38, "elapsed_time": "2:33:23", "remaining_time": "1:01:29"}
|
879 |
+
{"current_steps": 879, "total_steps": 1230, "loss": 0.4485, "lr": 9.12864899997558e-06, "epoch": 3.560506329113924, "percentage": 71.46, "elapsed_time": "2:33:33", "remaining_time": "1:01:19"}
|
880 |
+
{"current_steps": 880, "total_steps": 1230, "loss": 0.4551, "lr": 9.08105157279628e-06, "epoch": 3.5645569620253164, "percentage": 71.54, "elapsed_time": "2:33:43", "remaining_time": "1:01:08"}
|
881 |
+
{"current_steps": 881, "total_steps": 1230, "loss": 0.4472, "lr": 9.03354208532653e-06, "epoch": 3.568607594936709, "percentage": 71.63, "elapsed_time": "2:33:53", "remaining_time": "1:00:57"}
|
882 |
+
{"current_steps": 882, "total_steps": 1230, "loss": 0.4673, "lr": 8.986120920201205e-06, "epoch": 3.5726582278481014, "percentage": 71.71, "elapsed_time": "2:34:03", "remaining_time": "1:00:47"}
|
883 |
+
{"current_steps": 883, "total_steps": 1230, "loss": 0.4582, "lr": 8.938788459343852e-06, "epoch": 3.576708860759494, "percentage": 71.79, "elapsed_time": "2:34:13", "remaining_time": "1:00:36"}
|
884 |
+
{"current_steps": 884, "total_steps": 1230, "loss": 0.4635, "lr": 8.8915450839636e-06, "epoch": 3.580759493670886, "percentage": 71.87, "elapsed_time": "2:34:23", "remaining_time": "1:00:25"}
|
885 |
+
{"current_steps": 885, "total_steps": 1230, "loss": 0.4457, "lr": 8.844391174552116e-06, "epoch": 3.5848101265822785, "percentage": 71.95, "elapsed_time": "2:34:33", "remaining_time": "1:00:15"}
|
886 |
+
{"current_steps": 886, "total_steps": 1230, "loss": 0.4485, "lr": 8.797327110880479e-06, "epoch": 3.588860759493671, "percentage": 72.03, "elapsed_time": "2:34:43", "remaining_time": "1:00:04"}
|
887 |
+
{"current_steps": 887, "total_steps": 1230, "loss": 0.4532, "lr": 8.750353271996206e-06, "epoch": 3.592911392405063, "percentage": 72.11, "elapsed_time": "2:34:53", "remaining_time": "0:59:53"}
|
888 |
+
{"current_steps": 888, "total_steps": 1230, "loss": 0.4646, "lr": 8.703470036220132e-06, "epoch": 3.5969620253164556, "percentage": 72.2, "elapsed_time": "2:35:03", "remaining_time": "0:59:43"}
|
889 |
+
{"current_steps": 889, "total_steps": 1230, "loss": 0.4625, "lr": 8.656677781143394e-06, "epoch": 3.601012658227848, "percentage": 72.28, "elapsed_time": "2:35:13", "remaining_time": "0:59:32"}
|
890 |
+
{"current_steps": 890, "total_steps": 1230, "loss": 0.4402, "lr": 8.609976883624377e-06, "epoch": 3.6050632911392406, "percentage": 72.36, "elapsed_time": "2:35:24", "remaining_time": "0:59:22"}
|
891 |
+
{"current_steps": 891, "total_steps": 1230, "loss": 0.4495, "lr": 8.563367719785698e-06, "epoch": 3.609113924050633, "percentage": 72.44, "elapsed_time": "2:35:34", "remaining_time": "0:59:11"}
|
892 |
+
{"current_steps": 892, "total_steps": 1230, "loss": 0.4506, "lr": 8.516850665011138e-06, "epoch": 3.613164556962025, "percentage": 72.52, "elapsed_time": "2:35:44", "remaining_time": "0:59:00"}
|
893 |
+
{"current_steps": 893, "total_steps": 1230, "loss": 0.4515, "lr": 8.47042609394269e-06, "epoch": 3.6172151898734177, "percentage": 72.6, "elapsed_time": "2:35:54", "remaining_time": "0:58:50"}
|
894 |
+
{"current_steps": 894, "total_steps": 1230, "loss": 0.4529, "lr": 8.424094380477432e-06, "epoch": 3.6212658227848102, "percentage": 72.68, "elapsed_time": "2:36:04", "remaining_time": "0:58:39"}
|
895 |
+
{"current_steps": 895, "total_steps": 1230, "loss": 0.4556, "lr": 8.37785589776465e-06, "epoch": 3.6253164556962023, "percentage": 72.76, "elapsed_time": "2:36:14", "remaining_time": "0:58:28"}
|
896 |
+
{"current_steps": 896, "total_steps": 1230, "loss": 0.46, "lr": 8.331711018202694e-06, "epoch": 3.629367088607595, "percentage": 72.85, "elapsed_time": "2:36:24", "remaining_time": "0:58:18"}
|
897 |
+
{"current_steps": 897, "total_steps": 1230, "loss": 0.4576, "lr": 8.285660113436104e-06, "epoch": 3.6334177215189873, "percentage": 72.93, "elapsed_time": "2:36:34", "remaining_time": "0:58:07"}
|
898 |
+
{"current_steps": 898, "total_steps": 1230, "loss": 0.446, "lr": 8.239703554352527e-06, "epoch": 3.63746835443038, "percentage": 73.01, "elapsed_time": "2:36:44", "remaining_time": "0:57:56"}
|
899 |
+
{"current_steps": 899, "total_steps": 1230, "loss": 0.4669, "lr": 8.193841711079775e-06, "epoch": 3.6415189873417724, "percentage": 73.09, "elapsed_time": "2:36:54", "remaining_time": "0:57:46"}
|
900 |
+
{"current_steps": 900, "total_steps": 1230, "loss": 0.4541, "lr": 8.148074952982828e-06, "epoch": 3.6455696202531644, "percentage": 73.17, "elapsed_time": "2:37:05", "remaining_time": "0:57:35"}
|
901 |
+
{"current_steps": 901, "total_steps": 1230, "loss": 0.4446, "lr": 8.102403648660859e-06, "epoch": 3.649620253164557, "percentage": 73.25, "elapsed_time": "2:37:15", "remaining_time": "0:57:25"}
|
902 |
+
{"current_steps": 902, "total_steps": 1230, "loss": 0.4445, "lr": 8.056828165944282e-06, "epoch": 3.6536708860759495, "percentage": 73.33, "elapsed_time": "2:37:25", "remaining_time": "0:57:14"}
|
903 |
+
{"current_steps": 903, "total_steps": 1230, "loss": 0.4502, "lr": 8.011348871891762e-06, "epoch": 3.6577215189873415, "percentage": 73.41, "elapsed_time": "2:37:35", "remaining_time": "0:57:03"}
|
904 |
+
{"current_steps": 904, "total_steps": 1230, "loss": 0.4537, "lr": 7.965966132787287e-06, "epoch": 3.661772151898734, "percentage": 73.5, "elapsed_time": "2:37:45", "remaining_time": "0:56:53"}
|
905 |
+
{"current_steps": 905, "total_steps": 1230, "loss": 0.4513, "lr": 7.920680314137189e-06, "epoch": 3.6658227848101266, "percentage": 73.58, "elapsed_time": "2:37:55", "remaining_time": "0:56:42"}
|
906 |
+
{"current_steps": 906, "total_steps": 1230, "loss": 0.4586, "lr": 7.875491780667246e-06, "epoch": 3.669873417721519, "percentage": 73.66, "elapsed_time": "2:38:05", "remaining_time": "0:56:32"}
|
907 |
+
{"current_steps": 907, "total_steps": 1230, "loss": 0.4471, "lr": 7.830400896319667e-06, "epoch": 3.6739240506329116, "percentage": 73.74, "elapsed_time": "2:38:15", "remaining_time": "0:56:21"}
|
908 |
+
{"current_steps": 908, "total_steps": 1230, "loss": 0.4462, "lr": 7.785408024250259e-06, "epoch": 3.6779746835443037, "percentage": 73.82, "elapsed_time": "2:38:25", "remaining_time": "0:56:10"}
|
909 |
+
{"current_steps": 909, "total_steps": 1230, "loss": 0.46, "lr": 7.74051352682542e-06, "epoch": 3.682025316455696, "percentage": 73.9, "elapsed_time": "2:38:35", "remaining_time": "0:56:00"}
|
910 |
+
{"current_steps": 910, "total_steps": 1230, "loss": 0.4466, "lr": 7.695717765619257e-06, "epoch": 3.6860759493670887, "percentage": 73.98, "elapsed_time": "2:38:45", "remaining_time": "0:55:49"}
|
911 |
+
{"current_steps": 911, "total_steps": 1230, "loss": 0.452, "lr": 7.651021101410673e-06, "epoch": 3.690126582278481, "percentage": 74.07, "elapsed_time": "2:38:55", "remaining_time": "0:55:39"}
|
912 |
+
{"current_steps": 912, "total_steps": 1230, "loss": 0.4515, "lr": 7.606423894180464e-06, "epoch": 3.6941772151898733, "percentage": 74.15, "elapsed_time": "2:39:05", "remaining_time": "0:55:28"}
|
913 |
+
{"current_steps": 913, "total_steps": 1230, "loss": 0.4458, "lr": 7.56192650310839e-06, "epoch": 3.698227848101266, "percentage": 74.23, "elapsed_time": "2:39:15", "remaining_time": "0:55:17"}
|
914 |
+
{"current_steps": 914, "total_steps": 1230, "loss": 0.4541, "lr": 7.517529286570349e-06, "epoch": 3.7022784810126583, "percentage": 74.31, "elapsed_time": "2:39:26", "remaining_time": "0:55:07"}
|
915 |
+
{"current_steps": 915, "total_steps": 1230, "loss": 0.4563, "lr": 7.473232602135387e-06, "epoch": 3.706329113924051, "percentage": 74.39, "elapsed_time": "2:39:36", "remaining_time": "0:54:56"}
|
916 |
+
{"current_steps": 916, "total_steps": 1230, "loss": 0.4305, "lr": 7.429036806562935e-06, "epoch": 3.710379746835443, "percentage": 74.47, "elapsed_time": "2:39:46", "remaining_time": "0:54:46"}
|
917 |
+
{"current_steps": 917, "total_steps": 1230, "loss": 0.4578, "lr": 7.3849422557998455e-06, "epoch": 3.7144303797468354, "percentage": 74.55, "elapsed_time": "2:39:56", "remaining_time": "0:54:35"}
|
918 |
+
{"current_steps": 918, "total_steps": 1230, "loss": 0.463, "lr": 7.340949304977567e-06, "epoch": 3.718481012658228, "percentage": 74.63, "elapsed_time": "2:40:06", "remaining_time": "0:54:24"}
|
919 |
+
{"current_steps": 919, "total_steps": 1230, "loss": 0.4475, "lr": 7.297058308409282e-06, "epoch": 3.72253164556962, "percentage": 74.72, "elapsed_time": "2:40:16", "remaining_time": "0:54:14"}
|
920 |
+
{"current_steps": 920, "total_steps": 1230, "loss": 0.4505, "lr": 7.25326961958704e-06, "epoch": 3.7265822784810125, "percentage": 74.8, "elapsed_time": "2:40:26", "remaining_time": "0:54:03"}
|
921 |
+
{"current_steps": 921, "total_steps": 1230, "loss": 0.4535, "lr": 7.209583591178921e-06, "epoch": 3.730632911392405, "percentage": 74.88, "elapsed_time": "2:40:36", "remaining_time": "0:53:53"}
|
922 |
+
{"current_steps": 922, "total_steps": 1230, "loss": 0.4526, "lr": 7.1660005750261925e-06, "epoch": 3.7346835443037976, "percentage": 74.96, "elapsed_time": "2:40:46", "remaining_time": "0:53:42"}
|
923 |
+
{"current_steps": 923, "total_steps": 1230, "loss": 0.4627, "lr": 7.1225209221404765e-06, "epoch": 3.73873417721519, "percentage": 75.04, "elapsed_time": "2:40:56", "remaining_time": "0:53:31"}
|
924 |
+
{"current_steps": 924, "total_steps": 1230, "loss": 0.474, "lr": 7.079144982700909e-06, "epoch": 3.742784810126582, "percentage": 75.12, "elapsed_time": "2:41:07", "remaining_time": "0:53:21"}
|
925 |
+
{"current_steps": 925, "total_steps": 1230, "loss": 0.4406, "lr": 7.0358731060513695e-06, "epoch": 3.7468354430379747, "percentage": 75.2, "elapsed_time": "2:41:17", "remaining_time": "0:53:10"}
|
926 |
+
{"current_steps": 926, "total_steps": 1230, "loss": 0.4538, "lr": 6.99270564069757e-06, "epoch": 3.750886075949367, "percentage": 75.28, "elapsed_time": "2:41:27", "remaining_time": "0:53:00"}
|
927 |
+
{"current_steps": 927, "total_steps": 1230, "loss": 0.4454, "lr": 6.949642934304375e-06, "epoch": 3.7549367088607593, "percentage": 75.37, "elapsed_time": "2:41:37", "remaining_time": "0:52:49"}
|
928 |
+
{"current_steps": 928, "total_steps": 1230, "loss": 0.4532, "lr": 6.906685333692871e-06, "epoch": 3.7589873417721518, "percentage": 75.45, "elapsed_time": "2:41:47", "remaining_time": "0:52:39"}
|
929 |
+
{"current_steps": 929, "total_steps": 1230, "loss": 0.4527, "lr": 6.86383318483769e-06, "epoch": 3.7630379746835443, "percentage": 75.53, "elapsed_time": "2:41:57", "remaining_time": "0:52:28"}
|
930 |
+
{"current_steps": 930, "total_steps": 1230, "loss": 0.4549, "lr": 6.821086832864139e-06, "epoch": 3.767088607594937, "percentage": 75.61, "elapsed_time": "2:42:07", "remaining_time": "0:52:17"}
|
931 |
+
{"current_steps": 931, "total_steps": 1230, "loss": 0.4379, "lr": 6.77844662204546e-06, "epoch": 3.7711392405063293, "percentage": 75.69, "elapsed_time": "2:42:17", "remaining_time": "0:52:07"}
|
932 |
+
{"current_steps": 932, "total_steps": 1230, "loss": 0.4555, "lr": 6.7359128958000455e-06, "epoch": 3.7751898734177214, "percentage": 75.77, "elapsed_time": "2:42:27", "remaining_time": "0:51:56"}
|
933 |
+
{"current_steps": 933, "total_steps": 1230, "loss": 0.4594, "lr": 6.693485996688695e-06, "epoch": 3.779240506329114, "percentage": 75.85, "elapsed_time": "2:42:37", "remaining_time": "0:51:46"}
|
934 |
+
{"current_steps": 934, "total_steps": 1230, "loss": 0.4516, "lr": 6.651166266411801e-06, "epoch": 3.7832911392405064, "percentage": 75.93, "elapsed_time": "2:42:48", "remaining_time": "0:51:35"}
|
935 |
+
{"current_steps": 935, "total_steps": 1230, "loss": 0.4534, "lr": 6.6089540458066725e-06, "epoch": 3.7873417721518985, "percentage": 76.02, "elapsed_time": "2:42:58", "remaining_time": "0:51:25"}
|
936 |
+
{"current_steps": 936, "total_steps": 1230, "loss": 0.4483, "lr": 6.566849674844711e-06, "epoch": 3.791392405063291, "percentage": 76.1, "elapsed_time": "2:43:08", "remaining_time": "0:51:14"}
|
937 |
+
{"current_steps": 937, "total_steps": 1230, "loss": 0.4354, "lr": 6.524853492628747e-06, "epoch": 3.7954430379746835, "percentage": 76.18, "elapsed_time": "2:43:18", "remaining_time": "0:51:03"}
|
938 |
+
{"current_steps": 938, "total_steps": 1230, "loss": 0.4423, "lr": 6.4829658373902536e-06, "epoch": 3.799493670886076, "percentage": 76.26, "elapsed_time": "2:43:28", "remaining_time": "0:50:53"}
|
939 |
+
{"current_steps": 939, "total_steps": 1230, "loss": 0.4541, "lr": 6.441187046486648e-06, "epoch": 3.8035443037974686, "percentage": 76.34, "elapsed_time": "2:43:38", "remaining_time": "0:50:42"}
|
940 |
+
{"current_steps": 940, "total_steps": 1230, "loss": 0.4308, "lr": 6.399517456398567e-06, "epoch": 3.8075949367088606, "percentage": 76.42, "elapsed_time": "2:43:48", "remaining_time": "0:50:32"}
|
941 |
+
{"current_steps": 941, "total_steps": 1230, "loss": 0.4321, "lr": 6.357957402727164e-06, "epoch": 3.811645569620253, "percentage": 76.5, "elapsed_time": "2:43:58", "remaining_time": "0:50:21"}
|
942 |
+
{"current_steps": 942, "total_steps": 1230, "loss": 0.4473, "lr": 6.316507220191395e-06, "epoch": 3.8156962025316457, "percentage": 76.59, "elapsed_time": "2:44:08", "remaining_time": "0:50:11"}
|
943 |
+
{"current_steps": 943, "total_steps": 1230, "loss": 0.4358, "lr": 6.275167242625331e-06, "epoch": 3.8197468354430377, "percentage": 76.67, "elapsed_time": "2:44:18", "remaining_time": "0:50:00"}
|
944 |
+
{"current_steps": 944, "total_steps": 1230, "loss": 0.4448, "lr": 6.233937802975471e-06, "epoch": 3.8237974683544302, "percentage": 76.75, "elapsed_time": "2:44:28", "remaining_time": "0:49:49"}
|
945 |
+
{"current_steps": 945, "total_steps": 1230, "loss": 0.4457, "lr": 6.192819233298046e-06, "epoch": 3.8278481012658228, "percentage": 76.83, "elapsed_time": "2:44:38", "remaining_time": "0:49:39"}
|
946 |
+
{"current_steps": 946, "total_steps": 1230, "loss": 0.4488, "lr": 6.151811864756383e-06, "epoch": 3.8318987341772153, "percentage": 76.91, "elapsed_time": "2:44:49", "remaining_time": "0:49:28"}
|
947 |
+
{"current_steps": 947, "total_steps": 1230, "loss": 0.4626, "lr": 6.1109160276181655e-06, "epoch": 3.835949367088608, "percentage": 76.99, "elapsed_time": "2:44:59", "remaining_time": "0:49:18"}
|
948 |
+
{"current_steps": 948, "total_steps": 1230, "loss": 0.4538, "lr": 6.070132051252868e-06, "epoch": 3.84, "percentage": 77.07, "elapsed_time": "2:45:09", "remaining_time": "0:49:07"}
|
949 |
+
{"current_steps": 949, "total_steps": 1230, "loss": 0.4476, "lr": 6.0294602641290034e-06, "epoch": 3.8440506329113924, "percentage": 77.15, "elapsed_time": "2:45:19", "remaining_time": "0:48:57"}
|
950 |
+
{"current_steps": 950, "total_steps": 1230, "loss": 0.435, "lr": 5.988900993811575e-06, "epoch": 3.848101265822785, "percentage": 77.24, "elapsed_time": "2:45:29", "remaining_time": "0:48:46"}
|
951 |
+
{"current_steps": 951, "total_steps": 1230, "loss": 0.4423, "lr": 5.948454566959363e-06, "epoch": 3.852151898734177, "percentage": 77.32, "elapsed_time": "2:45:39", "remaining_time": "0:48:35"}
|
952 |
+
{"current_steps": 952, "total_steps": 1230, "loss": 0.4494, "lr": 5.908121309322328e-06, "epoch": 3.8562025316455695, "percentage": 77.4, "elapsed_time": "2:45:49", "remaining_time": "0:48:25"}
|
953 |
+
{"current_steps": 953, "total_steps": 1230, "loss": 0.462, "lr": 5.867901545738976e-06, "epoch": 3.860253164556962, "percentage": 77.48, "elapsed_time": "2:45:59", "remaining_time": "0:48:14"}
|
954 |
+
{"current_steps": 954, "total_steps": 1230, "loss": 0.4496, "lr": 5.827795600133774e-06, "epoch": 3.8643037974683545, "percentage": 77.56, "elapsed_time": "2:46:09", "remaining_time": "0:48:04"}
|
955 |
+
{"current_steps": 955, "total_steps": 1230, "loss": 0.4481, "lr": 5.787803795514466e-06, "epoch": 3.868354430379747, "percentage": 77.64, "elapsed_time": "2:46:19", "remaining_time": "0:47:53"}
|
956 |
+
{"current_steps": 956, "total_steps": 1230, "loss": 0.4502, "lr": 5.747926453969576e-06, "epoch": 3.872405063291139, "percentage": 77.72, "elapsed_time": "2:46:29", "remaining_time": "0:47:43"}
|
957 |
+
{"current_steps": 957, "total_steps": 1230, "loss": 0.4424, "lr": 5.708163896665708e-06, "epoch": 3.8764556962025316, "percentage": 77.8, "elapsed_time": "2:46:39", "remaining_time": "0:47:32"}
|
958 |
+
{"current_steps": 958, "total_steps": 1230, "loss": 0.4491, "lr": 5.668516443845047e-06, "epoch": 3.880506329113924, "percentage": 77.89, "elapsed_time": "2:46:49", "remaining_time": "0:47:22"}
|
959 |
+
{"current_steps": 959, "total_steps": 1230, "loss": 0.4478, "lr": 5.6289844148227225e-06, "epoch": 3.884556962025316, "percentage": 77.97, "elapsed_time": "2:46:59", "remaining_time": "0:47:11"}
|
960 |
+
{"current_steps": 960, "total_steps": 1230, "loss": 0.4532, "lr": 5.5895681279842615e-06, "epoch": 3.8886075949367087, "percentage": 78.05, "elapsed_time": "2:47:09", "remaining_time": "0:47:00"}
|
961 |
+
{"current_steps": 961, "total_steps": 1230, "loss": 0.4521, "lr": 5.550267900783019e-06, "epoch": 3.8926582278481012, "percentage": 78.13, "elapsed_time": "2:47:19", "remaining_time": "0:46:50"}
|
962 |
+
{"current_steps": 962, "total_steps": 1230, "loss": 0.4529, "lr": 5.511084049737623e-06, "epoch": 3.8967088607594937, "percentage": 78.21, "elapsed_time": "2:47:29", "remaining_time": "0:46:39"}
|
963 |
+
{"current_steps": 963, "total_steps": 1230, "loss": 0.4452, "lr": 5.4720168904294215e-06, "epoch": 3.9007594936708863, "percentage": 78.29, "elapsed_time": "2:47:39", "remaining_time": "0:46:29"}
|
964 |
+
{"current_steps": 964, "total_steps": 1230, "loss": 0.4449, "lr": 5.433066737499948e-06, "epoch": 3.9048101265822783, "percentage": 78.37, "elapsed_time": "2:47:50", "remaining_time": "0:46:18"}
|
965 |
+
{"current_steps": 965, "total_steps": 1230, "loss": 0.4613, "lr": 5.394233904648376e-06, "epoch": 3.908860759493671, "percentage": 78.46, "elapsed_time": "2:48:00", "remaining_time": "0:46:08"}
|
966 |
+
{"current_steps": 966, "total_steps": 1230, "loss": 0.4378, "lr": 5.355518704628997e-06, "epoch": 3.9129113924050634, "percentage": 78.54, "elapsed_time": "2:48:10", "remaining_time": "0:45:57"}
|
967 |
+
{"current_steps": 967, "total_steps": 1230, "loss": 0.4693, "lr": 5.316921449248731e-06, "epoch": 3.9169620253164554, "percentage": 78.62, "elapsed_time": "2:48:20", "remaining_time": "0:45:47"}
|
968 |
+
{"current_steps": 968, "total_steps": 1230, "loss": 0.4443, "lr": 5.278442449364538e-06, "epoch": 3.921012658227848, "percentage": 78.7, "elapsed_time": "2:48:30", "remaining_time": "0:45:36"}
|
969 |
+
{"current_steps": 969, "total_steps": 1230, "loss": 0.4459, "lr": 5.240082014881016e-06, "epoch": 3.9250632911392405, "percentage": 78.78, "elapsed_time": "2:48:40", "remaining_time": "0:45:25"}
|
970 |
+
{"current_steps": 970, "total_steps": 1230, "loss": 0.4569, "lr": 5.201840454747822e-06, "epoch": 3.929113924050633, "percentage": 78.86, "elapsed_time": "2:48:50", "remaining_time": "0:45:15"}
|
971 |
+
{"current_steps": 971, "total_steps": 1230, "loss": 0.4411, "lr": 5.163718076957223e-06, "epoch": 3.9331645569620255, "percentage": 78.94, "elapsed_time": "2:49:00", "remaining_time": "0:45:04"}
|
972 |
+
{"current_steps": 972, "total_steps": 1230, "loss": 0.4579, "lr": 5.125715188541609e-06, "epoch": 3.9372151898734176, "percentage": 79.02, "elapsed_time": "2:49:10", "remaining_time": "0:44:54"}
|
973 |
+
{"current_steps": 973, "total_steps": 1230, "loss": 0.4491, "lr": 5.087832095571021e-06, "epoch": 3.94126582278481, "percentage": 79.11, "elapsed_time": "2:49:20", "remaining_time": "0:44:43"}
|
974 |
+
{"current_steps": 974, "total_steps": 1230, "loss": 0.4649, "lr": 5.0500691031506766e-06, "epoch": 3.9453164556962026, "percentage": 79.19, "elapsed_time": "2:49:30", "remaining_time": "0:44:33"}
|
975 |
+
{"current_steps": 975, "total_steps": 1230, "loss": 0.4682, "lr": 5.01242651541854e-06, "epoch": 3.9493670886075947, "percentage": 79.27, "elapsed_time": "2:49:40", "remaining_time": "0:44:22"}
|
976 |
+
{"current_steps": 976, "total_steps": 1230, "loss": 0.4503, "lr": 4.974904635542815e-06, "epoch": 3.953417721518987, "percentage": 79.35, "elapsed_time": "2:49:50", "remaining_time": "0:44:12"}
|
977 |
+
{"current_steps": 977, "total_steps": 1230, "loss": 0.4562, "lr": 4.937503765719582e-06, "epoch": 3.9574683544303797, "percentage": 79.43, "elapsed_time": "2:50:00", "remaining_time": "0:44:01"}
|
978 |
+
{"current_steps": 978, "total_steps": 1230, "loss": 0.4421, "lr": 4.900224207170299e-06, "epoch": 3.961518987341772, "percentage": 79.51, "elapsed_time": "2:50:11", "remaining_time": "0:43:51"}
|
979 |
+
{"current_steps": 979, "total_steps": 1230, "loss": 0.4353, "lr": 4.8630662601394065e-06, "epoch": 3.9655696202531647, "percentage": 79.59, "elapsed_time": "2:50:21", "remaining_time": "0:43:40"}
|
980 |
+
{"current_steps": 980, "total_steps": 1230, "loss": 0.4301, "lr": 4.8260302238918995e-06, "epoch": 3.969620253164557, "percentage": 79.67, "elapsed_time": "2:50:31", "remaining_time": "0:43:29"}
|
981 |
+
{"current_steps": 981, "total_steps": 1230, "loss": 0.4647, "lr": 4.789116396710924e-06, "epoch": 3.9736708860759493, "percentage": 79.76, "elapsed_time": "2:50:41", "remaining_time": "0:43:19"}
|
982 |
+
{"current_steps": 982, "total_steps": 1230, "loss": 0.4412, "lr": 4.752325075895368e-06, "epoch": 3.977721518987342, "percentage": 79.84, "elapsed_time": "2:50:51", "remaining_time": "0:43:08"}
|
983 |
+
{"current_steps": 983, "total_steps": 1230, "loss": 0.4462, "lr": 4.715656557757473e-06, "epoch": 3.981772151898734, "percentage": 79.92, "elapsed_time": "2:51:01", "remaining_time": "0:42:58"}
|
984 |
+
{"current_steps": 984, "total_steps": 1230, "loss": 0.4455, "lr": 4.679111137620442e-06, "epoch": 3.9858227848101264, "percentage": 80.0, "elapsed_time": "2:51:11", "remaining_time": "0:42:47"}
|
985 |
+
{"current_steps": 985, "total_steps": 1230, "loss": 0.4425, "lr": 4.6426891098160585e-06, "epoch": 3.989873417721519, "percentage": 80.08, "elapsed_time": "2:51:21", "remaining_time": "0:42:37"}
|
986 |
+
{"current_steps": 986, "total_steps": 1230, "loss": 0.4614, "lr": 4.6063907676823474e-06, "epoch": 3.9939240506329114, "percentage": 80.16, "elapsed_time": "2:51:31", "remaining_time": "0:42:26"}
|
987 |
+
{"current_steps": 987, "total_steps": 1230, "loss": 0.4396, "lr": 4.570216403561141e-06, "epoch": 3.997974683544304, "percentage": 80.24, "elapsed_time": "2:51:41", "remaining_time": "0:42:16"}
|
988 |
+
{"current_steps": 988, "total_steps": 1230, "loss": 0.404, "lr": 4.534166308795815e-06, "epoch": 4.002025316455696, "percentage": 80.33, "elapsed_time": "2:53:49", "remaining_time": "0:42:34"}
|
989 |
+
{"current_steps": 989, "total_steps": 1230, "loss": 0.3586, "lr": 4.498240773728859e-06, "epoch": 4.006075949367089, "percentage": 80.41, "elapsed_time": "2:53:59", "remaining_time": "0:42:23"}
|
990 |
+
{"current_steps": 990, "total_steps": 1230, "loss": 0.3485, "lr": 4.462440087699609e-06, "epoch": 4.010126582278481, "percentage": 80.49, "elapsed_time": "2:54:09", "remaining_time": "0:42:13"}
|
991 |
+
{"current_steps": 991, "total_steps": 1230, "loss": 0.3574, "lr": 4.426764539041861e-06, "epoch": 4.014177215189873, "percentage": 80.57, "elapsed_time": "2:54:19", "remaining_time": "0:42:02"}
|
992 |
+
{"current_steps": 992, "total_steps": 1230, "loss": 0.3477, "lr": 4.391214415081582e-06, "epoch": 4.018227848101266, "percentage": 80.65, "elapsed_time": "2:54:29", "remaining_time": "0:41:51"}
|
993 |
+
{"current_steps": 993, "total_steps": 1230, "loss": 0.3532, "lr": 4.355790002134579e-06, "epoch": 4.022278481012658, "percentage": 80.73, "elapsed_time": "2:54:39", "remaining_time": "0:41:41"}
|
994 |
+
{"current_steps": 994, "total_steps": 1230, "loss": 0.3523, "lr": 4.320491585504207e-06, "epoch": 4.02632911392405, "percentage": 80.81, "elapsed_time": "2:54:49", "remaining_time": "0:41:30"}
|
995 |
+
{"current_steps": 995, "total_steps": 1230, "loss": 0.3603, "lr": 4.2853194494790615e-06, "epoch": 4.030379746835443, "percentage": 80.89, "elapsed_time": "2:54:59", "remaining_time": "0:41:19"}
|
996 |
+
{"current_steps": 996, "total_steps": 1230, "loss": 0.3564, "lr": 4.250273877330691e-06, "epoch": 4.034430379746835, "percentage": 80.98, "elapsed_time": "2:55:09", "remaining_time": "0:41:09"}
|
997 |
+
{"current_steps": 997, "total_steps": 1230, "loss": 0.3513, "lr": 4.215355151311313e-06, "epoch": 4.038481012658228, "percentage": 81.06, "elapsed_time": "2:55:19", "remaining_time": "0:40:58"}
|
998 |
+
{"current_steps": 998, "total_steps": 1230, "loss": 0.3497, "lr": 4.180563552651542e-06, "epoch": 4.04253164556962, "percentage": 81.14, "elapsed_time": "2:55:30", "remaining_time": "0:40:47"}
|
999 |
+
{"current_steps": 999, "total_steps": 1230, "loss": 0.3445, "lr": 4.145899361558147e-06, "epoch": 4.046582278481012, "percentage": 81.22, "elapsed_time": "2:55:40", "remaining_time": "0:40:37"}
|
1000 |
+
{"current_steps": 1000, "total_steps": 1230, "loss": 0.3464, "lr": 4.111362857211738e-06, "epoch": 4.050632911392405, "percentage": 81.3, "elapsed_time": "2:55:50", "remaining_time": "0:40:26"}
|