ryanmarten commited on
Commit
39bdd51
·
verified ·
1 Parent(s): e133bdf

Training in progress, epoch 3

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:af5d3ed62c4965e6d531e1e2390eebfc2170c963ce513d7feba61d77f4660fd2
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:32d66a79801966e00ba95d889d8f91a2808d2a104615ce5e4a0525934ddd9b3b
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:367e16bbbd8f856c9fd3bafe3979b901b25530d44223d81dcf8848d5de2b4fc4
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:208cdf1f0f10f1a9f4f7a85ec7ebeced450beea7c63eb5a0bbc8bd41c4f5b899
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:47d08e62f0b2d7bd3eeaab7b70bcb2133454a35d3f6e491870889c55fa339005
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c4a26943b5d0d1b68316010419400ca4a82357fee4f491b01d53245544b46c21
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1815548a676fd73a732659c75926969ed97d22d9897b1285776783c81d8a2dd6
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1f433fd9d8e68840bb1ed884ddb67d695fa699a182e6dbd4af9dd5abb5f6c97f
3
  size 1089994880
trainer_log.jsonl CHANGED
@@ -750,3 +750,253 @@
750
  {"current_steps": 750, "total_steps": 1230, "loss": 0.185, "lr": 1.585842319716759e-05, "epoch": 3.0425316455696203, "percentage": 60.98, "elapsed_time": "4:06:54", "remaining_time": "2:38:01"}
751
  {"current_steps": 751, "total_steps": 1230, "loss": 0.1502, "lr": 1.5802911561074944e-05, "epoch": 3.046582278481013, "percentage": 61.06, "elapsed_time": "4:07:11", "remaining_time": "2:37:39"}
752
  {"current_steps": 752, "total_steps": 1230, "loss": 0.1887, "lr": 1.5747433727755595e-05, "epoch": 3.050632911392405, "percentage": 61.14, "elapsed_time": "4:07:31", "remaining_time": "2:37:20"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
750
  {"current_steps": 750, "total_steps": 1230, "loss": 0.185, "lr": 1.585842319716759e-05, "epoch": 3.0425316455696203, "percentage": 60.98, "elapsed_time": "4:06:54", "remaining_time": "2:38:01"}
751
  {"current_steps": 751, "total_steps": 1230, "loss": 0.1502, "lr": 1.5802911561074944e-05, "epoch": 3.046582278481013, "percentage": 61.06, "elapsed_time": "4:07:11", "remaining_time": "2:37:39"}
752
  {"current_steps": 752, "total_steps": 1230, "loss": 0.1887, "lr": 1.5747433727755595e-05, "epoch": 3.050632911392405, "percentage": 61.14, "elapsed_time": "4:07:31", "remaining_time": "2:37:20"}
753
+ {"current_steps": 753, "total_steps": 1230, "loss": 0.1792, "lr": 1.5691990144020376e-05, "epoch": 3.0546835443037974, "percentage": 61.22, "elapsed_time": "4:07:50", "remaining_time": "2:36:59"}
754
+ {"current_steps": 754, "total_steps": 1230, "loss": 0.1752, "lr": 1.5636581256404297e-05, "epoch": 3.05873417721519, "percentage": 61.3, "elapsed_time": "4:08:09", "remaining_time": "2:36:39"}
755
+ {"current_steps": 755, "total_steps": 1230, "loss": 0.1705, "lr": 1.558120751116291e-05, "epoch": 3.0627848101265824, "percentage": 61.38, "elapsed_time": "4:08:27", "remaining_time": "2:36:19"}
756
+ {"current_steps": 756, "total_steps": 1230, "loss": 0.1693, "lr": 1.552586935426876e-05, "epoch": 3.0668354430379745, "percentage": 61.46, "elapsed_time": "4:08:45", "remaining_time": "2:35:57"}
757
+ {"current_steps": 757, "total_steps": 1230, "loss": 0.1658, "lr": 1.547056723140774e-05, "epoch": 3.070886075949367, "percentage": 61.54, "elapsed_time": "4:09:03", "remaining_time": "2:35:37"}
758
+ {"current_steps": 758, "total_steps": 1230, "loss": 0.1908, "lr": 1.5415301587975565e-05, "epoch": 3.0749367088607595, "percentage": 61.63, "elapsed_time": "4:09:22", "remaining_time": "2:35:16"}
759
+ {"current_steps": 759, "total_steps": 1230, "loss": 0.1554, "lr": 1.536007286907411e-05, "epoch": 3.078987341772152, "percentage": 61.71, "elapsed_time": "4:09:40", "remaining_time": "2:34:55"}
760
+ {"current_steps": 760, "total_steps": 1230, "loss": 0.1738, "lr": 1.5304881519507896e-05, "epoch": 3.083037974683544, "percentage": 61.79, "elapsed_time": "4:09:57", "remaining_time": "2:34:34"}
761
+ {"current_steps": 761, "total_steps": 1230, "loss": 0.1864, "lr": 1.5249727983780453e-05, "epoch": 3.0870886075949366, "percentage": 61.87, "elapsed_time": "4:10:15", "remaining_time": "2:34:13"}
762
+ {"current_steps": 762, "total_steps": 1230, "loss": 0.1502, "lr": 1.5194612706090786e-05, "epoch": 3.091139240506329, "percentage": 61.95, "elapsed_time": "4:10:32", "remaining_time": "2:33:52"}
763
+ {"current_steps": 763, "total_steps": 1230, "loss": 0.1837, "lr": 1.5139536130329771e-05, "epoch": 3.0951898734177217, "percentage": 62.03, "elapsed_time": "4:10:51", "remaining_time": "2:33:32"}
764
+ {"current_steps": 764, "total_steps": 1230, "loss": 0.1637, "lr": 1.508449870007656e-05, "epoch": 3.0992405063291137, "percentage": 62.11, "elapsed_time": "4:11:08", "remaining_time": "2:33:11"}
765
+ {"current_steps": 765, "total_steps": 1230, "loss": 0.1674, "lr": 1.5029500858595056e-05, "epoch": 3.1032911392405063, "percentage": 62.2, "elapsed_time": "4:11:27", "remaining_time": "2:32:50"}
766
+ {"current_steps": 766, "total_steps": 1230, "loss": 0.1777, "lr": 1.4974543048830328e-05, "epoch": 3.1073417721518988, "percentage": 62.28, "elapsed_time": "4:11:45", "remaining_time": "2:32:30"}
767
+ {"current_steps": 767, "total_steps": 1230, "loss": 0.1739, "lr": 1.4919625713405e-05, "epoch": 3.1113924050632913, "percentage": 62.36, "elapsed_time": "4:12:04", "remaining_time": "2:32:10"}
768
+ {"current_steps": 768, "total_steps": 1230, "loss": 0.1767, "lr": 1.4864749294615756e-05, "epoch": 3.1154430379746834, "percentage": 62.44, "elapsed_time": "4:12:22", "remaining_time": "2:31:49"}
769
+ {"current_steps": 769, "total_steps": 1230, "loss": 0.1638, "lr": 1.4809914234429716e-05, "epoch": 3.119493670886076, "percentage": 62.52, "elapsed_time": "4:12:40", "remaining_time": "2:31:28"}
770
+ {"current_steps": 770, "total_steps": 1230, "loss": 0.1688, "lr": 1.4755120974480923e-05, "epoch": 3.1235443037974684, "percentage": 62.6, "elapsed_time": "4:12:59", "remaining_time": "2:31:08"}
771
+ {"current_steps": 771, "total_steps": 1230, "loss": 0.1871, "lr": 1.4700369956066771e-05, "epoch": 3.127594936708861, "percentage": 62.68, "elapsed_time": "4:13:17", "remaining_time": "2:30:47"}
772
+ {"current_steps": 772, "total_steps": 1230, "loss": 0.1648, "lr": 1.4645661620144413e-05, "epoch": 3.131645569620253, "percentage": 62.76, "elapsed_time": "4:13:35", "remaining_time": "2:30:26"}
773
+ {"current_steps": 773, "total_steps": 1230, "loss": 0.1806, "lr": 1.4590996407327284e-05, "epoch": 3.1356962025316455, "percentage": 62.85, "elapsed_time": "4:13:53", "remaining_time": "2:30:06"}
774
+ {"current_steps": 774, "total_steps": 1230, "loss": 0.1885, "lr": 1.4536374757881487e-05, "epoch": 3.139746835443038, "percentage": 62.93, "elapsed_time": "4:14:12", "remaining_time": "2:29:45"}
775
+ {"current_steps": 775, "total_steps": 1230, "loss": 0.171, "lr": 1.4481797111722271e-05, "epoch": 3.1437974683544305, "percentage": 63.01, "elapsed_time": "4:14:31", "remaining_time": "2:29:26"}
776
+ {"current_steps": 776, "total_steps": 1230, "loss": 0.1772, "lr": 1.4427263908410507e-05, "epoch": 3.1478481012658226, "percentage": 63.09, "elapsed_time": "4:14:51", "remaining_time": "2:29:06"}
777
+ {"current_steps": 777, "total_steps": 1230, "loss": 0.1698, "lr": 1.4372775587149108e-05, "epoch": 3.151898734177215, "percentage": 63.17, "elapsed_time": "4:15:08", "remaining_time": "2:28:45"}
778
+ {"current_steps": 778, "total_steps": 1230, "loss": 0.1782, "lr": 1.4318332586779522e-05, "epoch": 3.1559493670886076, "percentage": 63.25, "elapsed_time": "4:15:25", "remaining_time": "2:28:23"}
779
+ {"current_steps": 779, "total_steps": 1230, "loss": 0.1754, "lr": 1.4263935345778202e-05, "epoch": 3.16, "percentage": 63.33, "elapsed_time": "4:15:45", "remaining_time": "2:28:04"}
780
+ {"current_steps": 780, "total_steps": 1230, "loss": 0.1888, "lr": 1.420958430225303e-05, "epoch": 3.164050632911392, "percentage": 63.41, "elapsed_time": "4:16:06", "remaining_time": "2:27:45"}
781
+ {"current_steps": 781, "total_steps": 1230, "loss": 0.1765, "lr": 1.415527989393985e-05, "epoch": 3.1681012658227847, "percentage": 63.5, "elapsed_time": "4:16:24", "remaining_time": "2:27:24"}
782
+ {"current_steps": 782, "total_steps": 1230, "loss": 0.1764, "lr": 1.410102255819891e-05, "epoch": 3.1721518987341772, "percentage": 63.58, "elapsed_time": "4:16:42", "remaining_time": "2:27:03"}
783
+ {"current_steps": 783, "total_steps": 1230, "loss": 0.1666, "lr": 1.404681273201131e-05, "epoch": 3.1762025316455698, "percentage": 63.66, "elapsed_time": "4:17:01", "remaining_time": "2:26:43"}
784
+ {"current_steps": 784, "total_steps": 1230, "loss": 0.1725, "lr": 1.399265085197556e-05, "epoch": 3.180253164556962, "percentage": 63.74, "elapsed_time": "4:17:19", "remaining_time": "2:26:23"}
785
+ {"current_steps": 785, "total_steps": 1230, "loss": 0.1862, "lr": 1.393853735430398e-05, "epoch": 3.1843037974683543, "percentage": 63.82, "elapsed_time": "4:17:38", "remaining_time": "2:26:03"}
786
+ {"current_steps": 786, "total_steps": 1230, "loss": 0.1702, "lr": 1.3884472674819246e-05, "epoch": 3.188354430379747, "percentage": 63.9, "elapsed_time": "4:17:57", "remaining_time": "2:25:42"}
787
+ {"current_steps": 787, "total_steps": 1230, "loss": 0.1758, "lr": 1.3830457248950864e-05, "epoch": 3.1924050632911394, "percentage": 63.98, "elapsed_time": "4:18:15", "remaining_time": "2:25:22"}
788
+ {"current_steps": 788, "total_steps": 1230, "loss": 0.1778, "lr": 1.377649151173163e-05, "epoch": 3.1964556962025314, "percentage": 64.07, "elapsed_time": "4:18:35", "remaining_time": "2:25:02"}
789
+ {"current_steps": 789, "total_steps": 1230, "loss": 0.1809, "lr": 1.3722575897794181e-05, "epoch": 3.200506329113924, "percentage": 64.15, "elapsed_time": "4:18:53", "remaining_time": "2:24:42"}
790
+ {"current_steps": 790, "total_steps": 1230, "loss": 0.1773, "lr": 1.3668710841367472e-05, "epoch": 3.2045569620253165, "percentage": 64.23, "elapsed_time": "4:19:12", "remaining_time": "2:24:21"}
791
+ {"current_steps": 791, "total_steps": 1230, "loss": 0.178, "lr": 1.361489677627324e-05, "epoch": 3.208607594936709, "percentage": 64.31, "elapsed_time": "4:19:31", "remaining_time": "2:24:02"}
792
+ {"current_steps": 792, "total_steps": 1230, "loss": 0.1505, "lr": 1.3561134135922585e-05, "epoch": 3.212658227848101, "percentage": 64.39, "elapsed_time": "4:19:48", "remaining_time": "2:23:40"}
793
+ {"current_steps": 793, "total_steps": 1230, "loss": 0.172, "lr": 1.350742335331241e-05, "epoch": 3.2167088607594936, "percentage": 64.47, "elapsed_time": "4:20:07", "remaining_time": "2:23:20"}
794
+ {"current_steps": 794, "total_steps": 1230, "loss": 0.1745, "lr": 1.345376486102198e-05, "epoch": 3.220759493670886, "percentage": 64.55, "elapsed_time": "4:20:25", "remaining_time": "2:23:00"}
795
+ {"current_steps": 795, "total_steps": 1230, "loss": 0.1883, "lr": 1.3400159091209414e-05, "epoch": 3.2248101265822786, "percentage": 64.63, "elapsed_time": "4:20:44", "remaining_time": "2:22:40"}
796
+ {"current_steps": 796, "total_steps": 1230, "loss": 0.1575, "lr": 1.3346606475608216e-05, "epoch": 3.2288607594936707, "percentage": 64.72, "elapsed_time": "4:21:03", "remaining_time": "2:22:19"}
797
+ {"current_steps": 797, "total_steps": 1230, "loss": 0.1696, "lr": 1.3293107445523781e-05, "epoch": 3.232911392405063, "percentage": 64.8, "elapsed_time": "4:21:21", "remaining_time": "2:21:59"}
798
+ {"current_steps": 798, "total_steps": 1230, "loss": 0.1749, "lr": 1.3239662431829949e-05, "epoch": 3.2369620253164557, "percentage": 64.88, "elapsed_time": "4:21:39", "remaining_time": "2:21:39"}
799
+ {"current_steps": 799, "total_steps": 1230, "loss": 0.1643, "lr": 1.3186271864965509e-05, "epoch": 3.2410126582278482, "percentage": 64.96, "elapsed_time": "4:21:57", "remaining_time": "2:21:18"}
800
+ {"current_steps": 800, "total_steps": 1230, "loss": 0.1862, "lr": 1.3132936174930756e-05, "epoch": 3.2450632911392403, "percentage": 65.04, "elapsed_time": "4:22:15", "remaining_time": "2:20:57"}
801
+ {"current_steps": 801, "total_steps": 1230, "loss": 0.1756, "lr": 1.3079655791283995e-05, "epoch": 3.249113924050633, "percentage": 65.12, "elapsed_time": "4:22:33", "remaining_time": "2:20:37"}
802
+ {"current_steps": 802, "total_steps": 1230, "loss": 0.1767, "lr": 1.3026431143138108e-05, "epoch": 3.2531645569620253, "percentage": 65.2, "elapsed_time": "4:22:52", "remaining_time": "2:20:16"}
803
+ {"current_steps": 803, "total_steps": 1230, "loss": 0.1725, "lr": 1.2973262659157114e-05, "epoch": 3.257215189873418, "percentage": 65.28, "elapsed_time": "4:23:10", "remaining_time": "2:19:56"}
804
+ {"current_steps": 804, "total_steps": 1230, "loss": 0.1709, "lr": 1.2920150767552651e-05, "epoch": 3.26126582278481, "percentage": 65.37, "elapsed_time": "4:23:30", "remaining_time": "2:19:37"}
805
+ {"current_steps": 805, "total_steps": 1230, "loss": 0.1739, "lr": 1.2867095896080607e-05, "epoch": 3.2653164556962024, "percentage": 65.45, "elapsed_time": "4:23:48", "remaining_time": "2:19:16"}
806
+ {"current_steps": 806, "total_steps": 1230, "loss": 0.1603, "lr": 1.2814098472037612e-05, "epoch": 3.269367088607595, "percentage": 65.53, "elapsed_time": "4:24:06", "remaining_time": "2:18:56"}
807
+ {"current_steps": 807, "total_steps": 1230, "loss": 0.1648, "lr": 1.276115892225764e-05, "epoch": 3.2734177215189875, "percentage": 65.61, "elapsed_time": "4:24:25", "remaining_time": "2:18:36"}
808
+ {"current_steps": 808, "total_steps": 1230, "loss": 0.1726, "lr": 1.2708277673108555e-05, "epoch": 3.27746835443038, "percentage": 65.69, "elapsed_time": "4:24:43", "remaining_time": "2:18:15"}
809
+ {"current_steps": 809, "total_steps": 1230, "loss": 0.1664, "lr": 1.2655455150488649e-05, "epoch": 3.281518987341772, "percentage": 65.77, "elapsed_time": "4:25:00", "remaining_time": "2:17:54"}
810
+ {"current_steps": 810, "total_steps": 1230, "loss": 0.178, "lr": 1.2602691779823272e-05, "epoch": 3.2855696202531646, "percentage": 65.85, "elapsed_time": "4:25:20", "remaining_time": "2:17:34"}
811
+ {"current_steps": 811, "total_steps": 1230, "loss": 0.181, "lr": 1.2549987986061355e-05, "epoch": 3.289620253164557, "percentage": 65.93, "elapsed_time": "4:25:39", "remaining_time": "2:17:15"}
812
+ {"current_steps": 812, "total_steps": 1230, "loss": 0.1783, "lr": 1.2497344193672005e-05, "epoch": 3.293670886075949, "percentage": 66.02, "elapsed_time": "4:25:56", "remaining_time": "2:16:54"}
813
+ {"current_steps": 813, "total_steps": 1230, "loss": 0.1832, "lr": 1.2444760826641092e-05, "epoch": 3.2977215189873417, "percentage": 66.1, "elapsed_time": "4:26:14", "remaining_time": "2:16:33"}
814
+ {"current_steps": 814, "total_steps": 1230, "loss": 0.1701, "lr": 1.2392238308467817e-05, "epoch": 3.301772151898734, "percentage": 66.18, "elapsed_time": "4:26:32", "remaining_time": "2:16:12"}
815
+ {"current_steps": 815, "total_steps": 1230, "loss": 0.1615, "lr": 1.2339777062161326e-05, "epoch": 3.3058227848101267, "percentage": 66.26, "elapsed_time": "4:26:49", "remaining_time": "2:15:52"}
816
+ {"current_steps": 816, "total_steps": 1230, "loss": 0.1817, "lr": 1.2287377510237293e-05, "epoch": 3.309873417721519, "percentage": 66.34, "elapsed_time": "4:27:09", "remaining_time": "2:15:32"}
817
+ {"current_steps": 817, "total_steps": 1230, "loss": 0.1783, "lr": 1.2235040074714488e-05, "epoch": 3.3139240506329113, "percentage": 66.42, "elapsed_time": "4:27:28", "remaining_time": "2:15:12"}
818
+ {"current_steps": 818, "total_steps": 1230, "loss": 0.1824, "lr": 1.2182765177111434e-05, "epoch": 3.317974683544304, "percentage": 66.5, "elapsed_time": "4:27:48", "remaining_time": "2:14:53"}
819
+ {"current_steps": 819, "total_steps": 1230, "loss": 0.179, "lr": 1.213055323844297e-05, "epoch": 3.3220253164556963, "percentage": 66.59, "elapsed_time": "4:28:08", "remaining_time": "2:14:33"}
820
+ {"current_steps": 820, "total_steps": 1230, "loss": 0.1723, "lr": 1.2078404679216864e-05, "epoch": 3.3260759493670884, "percentage": 66.67, "elapsed_time": "4:28:28", "remaining_time": "2:14:14"}
821
+ {"current_steps": 821, "total_steps": 1230, "loss": 0.1594, "lr": 1.2026319919430458e-05, "epoch": 3.330126582278481, "percentage": 66.75, "elapsed_time": "4:28:46", "remaining_time": "2:13:53"}
822
+ {"current_steps": 822, "total_steps": 1230, "loss": 0.1723, "lr": 1.1974299378567227e-05, "epoch": 3.3341772151898734, "percentage": 66.83, "elapsed_time": "4:29:05", "remaining_time": "2:13:34"}
823
+ {"current_steps": 823, "total_steps": 1230, "loss": 0.1617, "lr": 1.1922343475593462e-05, "epoch": 3.338227848101266, "percentage": 66.91, "elapsed_time": "4:29:23", "remaining_time": "2:13:13"}
824
+ {"current_steps": 824, "total_steps": 1230, "loss": 0.1784, "lr": 1.187045262895488e-05, "epoch": 3.3422784810126585, "percentage": 66.99, "elapsed_time": "4:29:43", "remaining_time": "2:12:53"}
825
+ {"current_steps": 825, "total_steps": 1230, "loss": 0.1574, "lr": 1.1818627256573203e-05, "epoch": 3.3463291139240505, "percentage": 67.07, "elapsed_time": "4:30:01", "remaining_time": "2:12:33"}
826
+ {"current_steps": 826, "total_steps": 1230, "loss": 0.1874, "lr": 1.1766867775842864e-05, "epoch": 3.350379746835443, "percentage": 67.15, "elapsed_time": "4:30:19", "remaining_time": "2:12:13"}
827
+ {"current_steps": 827, "total_steps": 1230, "loss": 0.1795, "lr": 1.1715174603627615e-05, "epoch": 3.3544303797468356, "percentage": 67.24, "elapsed_time": "4:30:37", "remaining_time": "2:11:52"}
828
+ {"current_steps": 828, "total_steps": 1230, "loss": 0.1836, "lr": 1.1663548156257147e-05, "epoch": 3.3584810126582276, "percentage": 67.32, "elapsed_time": "4:30:55", "remaining_time": "2:11:32"}
829
+ {"current_steps": 829, "total_steps": 1230, "loss": 0.1537, "lr": 1.161198884952377e-05, "epoch": 3.36253164556962, "percentage": 67.4, "elapsed_time": "4:31:13", "remaining_time": "2:11:11"}
830
+ {"current_steps": 830, "total_steps": 1230, "loss": 0.1745, "lr": 1.1560497098679056e-05, "epoch": 3.3665822784810127, "percentage": 67.48, "elapsed_time": "4:31:30", "remaining_time": "2:10:50"}
831
+ {"current_steps": 831, "total_steps": 1230, "loss": 0.1558, "lr": 1.1509073318430479e-05, "epoch": 3.370632911392405, "percentage": 67.56, "elapsed_time": "4:31:47", "remaining_time": "2:10:30"}
832
+ {"current_steps": 832, "total_steps": 1230, "loss": 0.1771, "lr": 1.1457717922938116e-05, "epoch": 3.3746835443037977, "percentage": 67.64, "elapsed_time": "4:32:06", "remaining_time": "2:10:09"}
833
+ {"current_steps": 833, "total_steps": 1230, "loss": 0.177, "lr": 1.1406431325811233e-05, "epoch": 3.3787341772151898, "percentage": 67.72, "elapsed_time": "4:32:25", "remaining_time": "2:09:49"}
834
+ {"current_steps": 834, "total_steps": 1230, "loss": 0.1724, "lr": 1.135521394010506e-05, "epoch": 3.3827848101265823, "percentage": 67.8, "elapsed_time": "4:32:43", "remaining_time": "2:09:29"}
835
+ {"current_steps": 835, "total_steps": 1230, "loss": 0.1744, "lr": 1.1304066178317367e-05, "epoch": 3.386835443037975, "percentage": 67.89, "elapsed_time": "4:33:02", "remaining_time": "2:09:09"}
836
+ {"current_steps": 836, "total_steps": 1230, "loss": 0.1862, "lr": 1.1252988452385199e-05, "epoch": 3.390886075949367, "percentage": 67.97, "elapsed_time": "4:33:21", "remaining_time": "2:08:49"}
837
+ {"current_steps": 837, "total_steps": 1230, "loss": 0.1765, "lr": 1.1201981173681536e-05, "epoch": 3.3949367088607594, "percentage": 68.05, "elapsed_time": "4:33:40", "remaining_time": "2:08:29"}
838
+ {"current_steps": 838, "total_steps": 1230, "loss": 0.1709, "lr": 1.1151044753011991e-05, "epoch": 3.398987341772152, "percentage": 68.13, "elapsed_time": "4:33:58", "remaining_time": "2:08:09"}
839
+ {"current_steps": 839, "total_steps": 1230, "loss": 0.1679, "lr": 1.1100179600611491e-05, "epoch": 3.4030379746835444, "percentage": 68.21, "elapsed_time": "4:34:16", "remaining_time": "2:07:49"}
840
+ {"current_steps": 840, "total_steps": 1230, "loss": 0.1713, "lr": 1.1049386126140985e-05, "epoch": 3.407088607594937, "percentage": 68.29, "elapsed_time": "4:34:34", "remaining_time": "2:07:28"}
841
+ {"current_steps": 841, "total_steps": 1230, "loss": 0.1662, "lr": 1.0998664738684128e-05, "epoch": 3.411139240506329, "percentage": 68.37, "elapsed_time": "4:34:52", "remaining_time": "2:07:08"}
842
+ {"current_steps": 842, "total_steps": 1230, "loss": 0.1815, "lr": 1.0948015846744e-05, "epoch": 3.4151898734177215, "percentage": 68.46, "elapsed_time": "4:35:11", "remaining_time": "2:06:48"}
843
+ {"current_steps": 843, "total_steps": 1230, "loss": 0.1653, "lr": 1.0897439858239832e-05, "epoch": 3.419240506329114, "percentage": 68.54, "elapsed_time": "4:35:29", "remaining_time": "2:06:28"}
844
+ {"current_steps": 844, "total_steps": 1230, "loss": 0.1801, "lr": 1.0846937180503652e-05, "epoch": 3.423291139240506, "percentage": 68.62, "elapsed_time": "4:35:50", "remaining_time": "2:06:09"}
845
+ {"current_steps": 845, "total_steps": 1230, "loss": 0.1641, "lr": 1.0796508220277117e-05, "epoch": 3.4273417721518986, "percentage": 68.7, "elapsed_time": "4:36:07", "remaining_time": "2:05:48"}
846
+ {"current_steps": 846, "total_steps": 1230, "loss": 0.186, "lr": 1.0746153383708107e-05, "epoch": 3.431392405063291, "percentage": 68.78, "elapsed_time": "4:36:26", "remaining_time": "2:05:28"}
847
+ {"current_steps": 847, "total_steps": 1230, "loss": 0.1615, "lr": 1.0695873076347579e-05, "epoch": 3.4354430379746836, "percentage": 68.86, "elapsed_time": "4:36:43", "remaining_time": "2:05:08"}
848
+ {"current_steps": 848, "total_steps": 1230, "loss": 0.1573, "lr": 1.0645667703146205e-05, "epoch": 3.439493670886076, "percentage": 68.94, "elapsed_time": "4:37:02", "remaining_time": "2:04:47"}
849
+ {"current_steps": 849, "total_steps": 1230, "loss": 0.1697, "lr": 1.0595537668451161e-05, "epoch": 3.4435443037974682, "percentage": 69.02, "elapsed_time": "4:37:20", "remaining_time": "2:04:27"}
850
+ {"current_steps": 850, "total_steps": 1230, "loss": 0.1642, "lr": 1.0545483376002854e-05, "epoch": 3.4475949367088607, "percentage": 69.11, "elapsed_time": "4:37:38", "remaining_time": "2:04:07"}
851
+ {"current_steps": 851, "total_steps": 1230, "loss": 0.1735, "lr": 1.0495505228931676e-05, "epoch": 3.4516455696202533, "percentage": 69.19, "elapsed_time": "4:37:56", "remaining_time": "2:03:47"}
852
+ {"current_steps": 852, "total_steps": 1230, "loss": 0.1726, "lr": 1.044560362975474e-05, "epoch": 3.4556962025316453, "percentage": 69.27, "elapsed_time": "4:38:14", "remaining_time": "2:03:26"}
853
+ {"current_steps": 853, "total_steps": 1230, "loss": 0.1654, "lr": 1.0395778980372695e-05, "epoch": 3.459746835443038, "percentage": 69.35, "elapsed_time": "4:38:33", "remaining_time": "2:03:06"}
854
+ {"current_steps": 854, "total_steps": 1230, "loss": 0.1799, "lr": 1.0346031682066381e-05, "epoch": 3.4637974683544304, "percentage": 69.43, "elapsed_time": "4:38:52", "remaining_time": "2:02:47"}
855
+ {"current_steps": 855, "total_steps": 1230, "loss": 0.1581, "lr": 1.0296362135493724e-05, "epoch": 3.467848101265823, "percentage": 69.51, "elapsed_time": "4:39:10", "remaining_time": "2:02:26"}
856
+ {"current_steps": 856, "total_steps": 1230, "loss": 0.1596, "lr": 1.0246770740686422e-05, "epoch": 3.4718987341772154, "percentage": 69.59, "elapsed_time": "4:39:27", "remaining_time": "2:02:06"}
857
+ {"current_steps": 857, "total_steps": 1230, "loss": 0.1825, "lr": 1.0197257897046743e-05, "epoch": 3.4759493670886075, "percentage": 69.67, "elapsed_time": "4:39:46", "remaining_time": "2:01:46"}
858
+ {"current_steps": 858, "total_steps": 1230, "loss": 0.1785, "lr": 1.014782400334433e-05, "epoch": 3.48, "percentage": 69.76, "elapsed_time": "4:40:05", "remaining_time": "2:01:26"}
859
+ {"current_steps": 859, "total_steps": 1230, "loss": 0.1821, "lr": 1.009846945771296e-05, "epoch": 3.4840506329113925, "percentage": 69.84, "elapsed_time": "4:40:24", "remaining_time": "2:01:06"}
860
+ {"current_steps": 860, "total_steps": 1230, "loss": 0.1731, "lr": 1.0049194657647363e-05, "epoch": 3.4881012658227846, "percentage": 69.92, "elapsed_time": "4:40:42", "remaining_time": "2:00:46"}
861
+ {"current_steps": 861, "total_steps": 1230, "loss": 0.1447, "lr": 1.0000000000000006e-05, "epoch": 3.492151898734177, "percentage": 70.0, "elapsed_time": "4:40:59", "remaining_time": "2:00:25"}
862
+ {"current_steps": 862, "total_steps": 1230, "loss": 0.1651, "lr": 9.950885880977891e-06, "epoch": 3.4962025316455696, "percentage": 70.08, "elapsed_time": "4:41:18", "remaining_time": "2:00:05"}
863
+ {"current_steps": 863, "total_steps": 1230, "loss": 0.1483, "lr": 9.901852696139382e-06, "epoch": 3.500253164556962, "percentage": 70.16, "elapsed_time": "4:41:35", "remaining_time": "1:59:45"}
864
+ {"current_steps": 864, "total_steps": 1230, "loss": 0.1676, "lr": 9.852900840391027e-06, "epoch": 3.5043037974683546, "percentage": 70.24, "elapsed_time": "4:41:55", "remaining_time": "1:59:25"}
865
+ {"current_steps": 865, "total_steps": 1230, "loss": 0.1682, "lr": 9.804030707984313e-06, "epoch": 3.5083544303797467, "percentage": 70.33, "elapsed_time": "4:42:12", "remaining_time": "1:59:04"}
866
+ {"current_steps": 866, "total_steps": 1230, "loss": 0.1675, "lr": 9.755242692512599e-06, "epoch": 3.512405063291139, "percentage": 70.41, "elapsed_time": "4:42:31", "remaining_time": "1:58:45"}
867
+ {"current_steps": 867, "total_steps": 1230, "loss": 0.1782, "lr": 9.70653718690782e-06, "epoch": 3.5164556962025317, "percentage": 70.49, "elapsed_time": "4:42:50", "remaining_time": "1:58:25"}
868
+ {"current_steps": 868, "total_steps": 1230, "loss": 0.1668, "lr": 9.657914583437454e-06, "epoch": 3.520506329113924, "percentage": 70.57, "elapsed_time": "4:43:11", "remaining_time": "1:58:06"}
869
+ {"current_steps": 869, "total_steps": 1230, "loss": 0.1825, "lr": 9.609375273701246e-06, "epoch": 3.5245569620253163, "percentage": 70.65, "elapsed_time": "4:43:30", "remaining_time": "1:57:46"}
870
+ {"current_steps": 870, "total_steps": 1230, "loss": 0.1629, "lr": 9.560919648628133e-06, "epoch": 3.528607594936709, "percentage": 70.73, "elapsed_time": "4:43:46", "remaining_time": "1:57:25"}
871
+ {"current_steps": 871, "total_steps": 1230, "loss": 0.171, "lr": 9.512548098473047e-06, "epoch": 3.5326582278481014, "percentage": 70.81, "elapsed_time": "4:44:05", "remaining_time": "1:57:05"}
872
+ {"current_steps": 872, "total_steps": 1230, "loss": 0.1761, "lr": 9.464261012813825e-06, "epoch": 3.536708860759494, "percentage": 70.89, "elapsed_time": "4:44:25", "remaining_time": "1:56:46"}
873
+ {"current_steps": 873, "total_steps": 1230, "loss": 0.1741, "lr": 9.416058780547987e-06, "epoch": 3.540759493670886, "percentage": 70.98, "elapsed_time": "4:44:44", "remaining_time": "1:56:26"}
874
+ {"current_steps": 874, "total_steps": 1230, "loss": 0.1812, "lr": 9.367941789889714e-06, "epoch": 3.5448101265822785, "percentage": 71.06, "elapsed_time": "4:45:04", "remaining_time": "1:56:06"}
875
+ {"current_steps": 875, "total_steps": 1230, "loss": 0.1593, "lr": 9.319910428366607e-06, "epoch": 3.548860759493671, "percentage": 71.14, "elapsed_time": "4:45:21", "remaining_time": "1:55:46"}
876
+ {"current_steps": 876, "total_steps": 1230, "loss": 0.1699, "lr": 9.271965082816667e-06, "epoch": 3.552911392405063, "percentage": 71.22, "elapsed_time": "4:45:39", "remaining_time": "1:55:26"}
877
+ {"current_steps": 877, "total_steps": 1230, "loss": 0.1627, "lr": 9.224106139385111e-06, "epoch": 3.5569620253164556, "percentage": 71.3, "elapsed_time": "4:45:57", "remaining_time": "1:55:06"}
878
+ {"current_steps": 878, "total_steps": 1230, "loss": 0.1796, "lr": 9.176333983521291e-06, "epoch": 3.561012658227848, "percentage": 71.38, "elapsed_time": "4:46:18", "remaining_time": "1:54:47"}
879
+ {"current_steps": 879, "total_steps": 1230, "loss": 0.1808, "lr": 9.12864899997558e-06, "epoch": 3.5650632911392406, "percentage": 71.46, "elapsed_time": "4:46:40", "remaining_time": "1:54:28"}
880
+ {"current_steps": 880, "total_steps": 1230, "loss": 0.1624, "lr": 9.08105157279628e-06, "epoch": 3.569113924050633, "percentage": 71.54, "elapsed_time": "4:46:57", "remaining_time": "1:54:07"}
881
+ {"current_steps": 881, "total_steps": 1230, "loss": 0.162, "lr": 9.03354208532653e-06, "epoch": 3.573164556962025, "percentage": 71.63, "elapsed_time": "4:47:15", "remaining_time": "1:53:47"}
882
+ {"current_steps": 882, "total_steps": 1230, "loss": 0.1727, "lr": 8.986120920201205e-06, "epoch": 3.5772151898734177, "percentage": 71.71, "elapsed_time": "4:47:33", "remaining_time": "1:53:27"}
883
+ {"current_steps": 883, "total_steps": 1230, "loss": 0.1798, "lr": 8.938788459343852e-06, "epoch": 3.58126582278481, "percentage": 71.79, "elapsed_time": "4:47:52", "remaining_time": "1:53:07"}
884
+ {"current_steps": 884, "total_steps": 1230, "loss": 0.1645, "lr": 8.8915450839636e-06, "epoch": 3.5853164556962023, "percentage": 71.87, "elapsed_time": "4:48:12", "remaining_time": "1:52:48"}
885
+ {"current_steps": 885, "total_steps": 1230, "loss": 0.1743, "lr": 8.844391174552116e-06, "epoch": 3.589367088607595, "percentage": 71.95, "elapsed_time": "4:48:31", "remaining_time": "1:52:28"}
886
+ {"current_steps": 886, "total_steps": 1230, "loss": 0.1613, "lr": 8.797327110880479e-06, "epoch": 3.5934177215189873, "percentage": 72.03, "elapsed_time": "4:48:49", "remaining_time": "1:52:08"}
887
+ {"current_steps": 887, "total_steps": 1230, "loss": 0.1485, "lr": 8.750353271996206e-06, "epoch": 3.59746835443038, "percentage": 72.11, "elapsed_time": "4:49:06", "remaining_time": "1:51:47"}
888
+ {"current_steps": 888, "total_steps": 1230, "loss": 0.1702, "lr": 8.703470036220132e-06, "epoch": 3.6015189873417723, "percentage": 72.2, "elapsed_time": "4:49:25", "remaining_time": "1:51:28"}
889
+ {"current_steps": 889, "total_steps": 1230, "loss": 0.1784, "lr": 8.656677781143394e-06, "epoch": 3.6055696202531644, "percentage": 72.28, "elapsed_time": "4:49:44", "remaining_time": "1:51:08"}
890
+ {"current_steps": 890, "total_steps": 1230, "loss": 0.1881, "lr": 8.609976883624377e-06, "epoch": 3.609620253164557, "percentage": 72.36, "elapsed_time": "4:50:04", "remaining_time": "1:50:49"}
891
+ {"current_steps": 891, "total_steps": 1230, "loss": 0.1704, "lr": 8.563367719785698e-06, "epoch": 3.6136708860759494, "percentage": 72.44, "elapsed_time": "4:50:23", "remaining_time": "1:50:29"}
892
+ {"current_steps": 892, "total_steps": 1230, "loss": 0.1569, "lr": 8.516850665011138e-06, "epoch": 3.6177215189873415, "percentage": 72.52, "elapsed_time": "4:50:41", "remaining_time": "1:50:08"}
893
+ {"current_steps": 893, "total_steps": 1230, "loss": 0.1596, "lr": 8.47042609394269e-06, "epoch": 3.621772151898734, "percentage": 72.6, "elapsed_time": "4:50:59", "remaining_time": "1:49:48"}
894
+ {"current_steps": 894, "total_steps": 1230, "loss": 0.1696, "lr": 8.424094380477432e-06, "epoch": 3.6258227848101265, "percentage": 72.68, "elapsed_time": "4:51:19", "remaining_time": "1:49:29"}
895
+ {"current_steps": 895, "total_steps": 1230, "loss": 0.1577, "lr": 8.37785589776465e-06, "epoch": 3.629873417721519, "percentage": 72.76, "elapsed_time": "4:51:36", "remaining_time": "1:49:09"}
896
+ {"current_steps": 896, "total_steps": 1230, "loss": 0.1834, "lr": 8.331711018202694e-06, "epoch": 3.6339240506329116, "percentage": 72.85, "elapsed_time": "4:51:55", "remaining_time": "1:48:49"}
897
+ {"current_steps": 897, "total_steps": 1230, "loss": 0.1708, "lr": 8.285660113436104e-06, "epoch": 3.6379746835443036, "percentage": 72.93, "elapsed_time": "4:52:14", "remaining_time": "1:48:29"}
898
+ {"current_steps": 898, "total_steps": 1230, "loss": 0.1603, "lr": 8.239703554352527e-06, "epoch": 3.642025316455696, "percentage": 73.01, "elapsed_time": "4:52:32", "remaining_time": "1:48:09"}
899
+ {"current_steps": 899, "total_steps": 1230, "loss": 0.168, "lr": 8.193841711079775e-06, "epoch": 3.6460759493670887, "percentage": 73.09, "elapsed_time": "4:52:50", "remaining_time": "1:47:49"}
900
+ {"current_steps": 900, "total_steps": 1230, "loss": 0.1795, "lr": 8.148074952982828e-06, "epoch": 3.6501265822784807, "percentage": 73.17, "elapsed_time": "4:53:09", "remaining_time": "1:47:29"}
901
+ {"current_steps": 901, "total_steps": 1230, "loss": 0.1595, "lr": 8.102403648660859e-06, "epoch": 3.6541772151898733, "percentage": 73.25, "elapsed_time": "4:53:28", "remaining_time": "1:47:09"}
902
+ {"current_steps": 902, "total_steps": 1230, "loss": 0.1739, "lr": 8.056828165944282e-06, "epoch": 3.6582278481012658, "percentage": 73.33, "elapsed_time": "4:53:47", "remaining_time": "1:46:49"}
903
+ {"current_steps": 903, "total_steps": 1230, "loss": 0.1568, "lr": 8.011348871891762e-06, "epoch": 3.6622784810126583, "percentage": 73.41, "elapsed_time": "4:54:04", "remaining_time": "1:46:29"}
904
+ {"current_steps": 904, "total_steps": 1230, "loss": 0.1648, "lr": 7.965966132787287e-06, "epoch": 3.666329113924051, "percentage": 73.5, "elapsed_time": "4:54:21", "remaining_time": "1:46:09"}
905
+ {"current_steps": 905, "total_steps": 1230, "loss": 0.1903, "lr": 7.920680314137189e-06, "epoch": 3.670379746835443, "percentage": 73.58, "elapsed_time": "4:54:40", "remaining_time": "1:45:49"}
906
+ {"current_steps": 906, "total_steps": 1230, "loss": 0.1786, "lr": 7.875491780667246e-06, "epoch": 3.6744303797468354, "percentage": 73.66, "elapsed_time": "4:55:01", "remaining_time": "1:45:30"}
907
+ {"current_steps": 907, "total_steps": 1230, "loss": 0.1591, "lr": 7.830400896319667e-06, "epoch": 3.678481012658228, "percentage": 73.74, "elapsed_time": "4:55:18", "remaining_time": "1:45:09"}
908
+ {"current_steps": 908, "total_steps": 1230, "loss": 0.168, "lr": 7.785408024250259e-06, "epoch": 3.68253164556962, "percentage": 73.82, "elapsed_time": "4:55:36", "remaining_time": "1:44:49"}
909
+ {"current_steps": 909, "total_steps": 1230, "loss": 0.1664, "lr": 7.74051352682542e-06, "epoch": 3.6865822784810125, "percentage": 73.9, "elapsed_time": "4:55:54", "remaining_time": "1:44:29"}
910
+ {"current_steps": 910, "total_steps": 1230, "loss": 0.1754, "lr": 7.695717765619257e-06, "epoch": 3.690632911392405, "percentage": 73.98, "elapsed_time": "4:56:14", "remaining_time": "1:44:10"}
911
+ {"current_steps": 911, "total_steps": 1230, "loss": 0.1645, "lr": 7.651021101410673e-06, "epoch": 3.6946835443037975, "percentage": 74.07, "elapsed_time": "4:56:31", "remaining_time": "1:43:50"}
912
+ {"current_steps": 912, "total_steps": 1230, "loss": 0.1536, "lr": 7.606423894180464e-06, "epoch": 3.69873417721519, "percentage": 74.15, "elapsed_time": "4:56:49", "remaining_time": "1:43:29"}
913
+ {"current_steps": 913, "total_steps": 1230, "loss": 0.1569, "lr": 7.56192650310839e-06, "epoch": 3.702784810126582, "percentage": 74.23, "elapsed_time": "4:57:07", "remaining_time": "1:43:09"}
914
+ {"current_steps": 914, "total_steps": 1230, "loss": 0.1527, "lr": 7.517529286570349e-06, "epoch": 3.7068354430379746, "percentage": 74.31, "elapsed_time": "4:57:26", "remaining_time": "1:42:50"}
915
+ {"current_steps": 915, "total_steps": 1230, "loss": 0.1674, "lr": 7.473232602135387e-06, "epoch": 3.710886075949367, "percentage": 74.39, "elapsed_time": "4:57:46", "remaining_time": "1:42:30"}
916
+ {"current_steps": 916, "total_steps": 1230, "loss": 0.165, "lr": 7.429036806562935e-06, "epoch": 3.714936708860759, "percentage": 74.47, "elapsed_time": "4:58:04", "remaining_time": "1:42:10"}
917
+ {"current_steps": 917, "total_steps": 1230, "loss": 0.176, "lr": 7.3849422557998455e-06, "epoch": 3.7189873417721517, "percentage": 74.55, "elapsed_time": "4:58:22", "remaining_time": "1:41:50"}
918
+ {"current_steps": 918, "total_steps": 1230, "loss": 0.1791, "lr": 7.340949304977567e-06, "epoch": 3.7230379746835442, "percentage": 74.63, "elapsed_time": "4:58:42", "remaining_time": "1:41:31"}
919
+ {"current_steps": 919, "total_steps": 1230, "loss": 0.1779, "lr": 7.297058308409282e-06, "epoch": 3.7270886075949368, "percentage": 74.72, "elapsed_time": "4:59:00", "remaining_time": "1:41:11"}
920
+ {"current_steps": 920, "total_steps": 1230, "loss": 0.1595, "lr": 7.25326961958704e-06, "epoch": 3.7311392405063293, "percentage": 74.8, "elapsed_time": "4:59:19", "remaining_time": "1:40:51"}
921
+ {"current_steps": 921, "total_steps": 1230, "loss": 0.15, "lr": 7.209583591178921e-06, "epoch": 3.7351898734177214, "percentage": 74.88, "elapsed_time": "4:59:36", "remaining_time": "1:40:31"}
922
+ {"current_steps": 922, "total_steps": 1230, "loss": 0.1751, "lr": 7.1660005750261925e-06, "epoch": 3.739240506329114, "percentage": 74.96, "elapsed_time": "4:59:53", "remaining_time": "1:40:10"}
923
+ {"current_steps": 923, "total_steps": 1230, "loss": 0.1543, "lr": 7.1225209221404765e-06, "epoch": 3.7432911392405064, "percentage": 75.04, "elapsed_time": "5:00:13", "remaining_time": "1:39:51"}
924
+ {"current_steps": 924, "total_steps": 1230, "loss": 0.1833, "lr": 7.079144982700909e-06, "epoch": 3.747341772151899, "percentage": 75.12, "elapsed_time": "5:00:33", "remaining_time": "1:39:32"}
925
+ {"current_steps": 925, "total_steps": 1230, "loss": 0.1697, "lr": 7.0358731060513695e-06, "epoch": 3.7513924050632914, "percentage": 75.2, "elapsed_time": "5:00:52", "remaining_time": "1:39:12"}
926
+ {"current_steps": 926, "total_steps": 1230, "loss": 0.1627, "lr": 6.99270564069757e-06, "epoch": 3.7554430379746835, "percentage": 75.28, "elapsed_time": "5:01:10", "remaining_time": "1:38:52"}
927
+ {"current_steps": 927, "total_steps": 1230, "loss": 0.1722, "lr": 6.949642934304375e-06, "epoch": 3.759493670886076, "percentage": 75.37, "elapsed_time": "5:01:30", "remaining_time": "1:38:33"}
928
+ {"current_steps": 928, "total_steps": 1230, "loss": 0.1667, "lr": 6.906685333692871e-06, "epoch": 3.7635443037974685, "percentage": 75.45, "elapsed_time": "5:01:50", "remaining_time": "1:38:13"}
929
+ {"current_steps": 929, "total_steps": 1230, "loss": 0.1762, "lr": 6.86383318483769e-06, "epoch": 3.7675949367088606, "percentage": 75.53, "elapsed_time": "5:02:10", "remaining_time": "1:37:54"}
930
+ {"current_steps": 930, "total_steps": 1230, "loss": 0.1512, "lr": 6.821086832864139e-06, "epoch": 3.771645569620253, "percentage": 75.61, "elapsed_time": "5:02:27", "remaining_time": "1:37:34"}
931
+ {"current_steps": 931, "total_steps": 1230, "loss": 0.1852, "lr": 6.77844662204546e-06, "epoch": 3.7756962025316456, "percentage": 75.69, "elapsed_time": "5:02:46", "remaining_time": "1:37:14"}
932
+ {"current_steps": 932, "total_steps": 1230, "loss": 0.1543, "lr": 6.7359128958000455e-06, "epoch": 3.779746835443038, "percentage": 75.77, "elapsed_time": "5:03:05", "remaining_time": "1:36:54"}
933
+ {"current_steps": 933, "total_steps": 1230, "loss": 0.1714, "lr": 6.693485996688695e-06, "epoch": 3.7837974683544306, "percentage": 75.85, "elapsed_time": "5:03:23", "remaining_time": "1:36:34"}
934
+ {"current_steps": 934, "total_steps": 1230, "loss": 0.1626, "lr": 6.651166266411801e-06, "epoch": 3.7878481012658227, "percentage": 75.93, "elapsed_time": "5:03:41", "remaining_time": "1:36:14"}
935
+ {"current_steps": 935, "total_steps": 1230, "loss": 0.1691, "lr": 6.6089540458066725e-06, "epoch": 3.7918987341772152, "percentage": 76.02, "elapsed_time": "5:03:59", "remaining_time": "1:35:54"}
936
+ {"current_steps": 936, "total_steps": 1230, "loss": 0.1727, "lr": 6.566849674844711e-06, "epoch": 3.7959493670886078, "percentage": 76.1, "elapsed_time": "5:04:19", "remaining_time": "1:35:35"}
937
+ {"current_steps": 937, "total_steps": 1230, "loss": 0.1439, "lr": 6.524853492628747e-06, "epoch": 3.8, "percentage": 76.18, "elapsed_time": "5:04:36", "remaining_time": "1:35:15"}
938
+ {"current_steps": 938, "total_steps": 1230, "loss": 0.1899, "lr": 6.4829658373902536e-06, "epoch": 3.8040506329113923, "percentage": 76.26, "elapsed_time": "5:04:58", "remaining_time": "1:34:56"}
939
+ {"current_steps": 939, "total_steps": 1230, "loss": 0.1646, "lr": 6.441187046486648e-06, "epoch": 3.808101265822785, "percentage": 76.34, "elapsed_time": "5:05:15", "remaining_time": "1:34:36"}
940
+ {"current_steps": 940, "total_steps": 1230, "loss": 0.1596, "lr": 6.399517456398567e-06, "epoch": 3.8121518987341774, "percentage": 76.42, "elapsed_time": "5:05:35", "remaining_time": "1:34:16"}
941
+ {"current_steps": 941, "total_steps": 1230, "loss": 0.1708, "lr": 6.357957402727164e-06, "epoch": 3.81620253164557, "percentage": 76.5, "elapsed_time": "5:05:53", "remaining_time": "1:33:56"}
942
+ {"current_steps": 942, "total_steps": 1230, "loss": 0.1569, "lr": 6.316507220191395e-06, "epoch": 3.820253164556962, "percentage": 76.59, "elapsed_time": "5:06:10", "remaining_time": "1:33:36"}
943
+ {"current_steps": 943, "total_steps": 1230, "loss": 0.1601, "lr": 6.275167242625331e-06, "epoch": 3.8243037974683545, "percentage": 76.67, "elapsed_time": "5:06:28", "remaining_time": "1:33:16"}
944
+ {"current_steps": 944, "total_steps": 1230, "loss": 0.1652, "lr": 6.233937802975471e-06, "epoch": 3.828354430379747, "percentage": 76.75, "elapsed_time": "5:06:47", "remaining_time": "1:32:56"}
945
+ {"current_steps": 945, "total_steps": 1230, "loss": 0.1593, "lr": 6.192819233298046e-06, "epoch": 3.832405063291139, "percentage": 76.83, "elapsed_time": "5:07:05", "remaining_time": "1:32:36"}
946
+ {"current_steps": 946, "total_steps": 1230, "loss": 0.1715, "lr": 6.151811864756383e-06, "epoch": 3.8364556962025316, "percentage": 76.91, "elapsed_time": "5:07:24", "remaining_time": "1:32:17"}
947
+ {"current_steps": 947, "total_steps": 1230, "loss": 0.1517, "lr": 6.1109160276181655e-06, "epoch": 3.840506329113924, "percentage": 76.99, "elapsed_time": "5:07:42", "remaining_time": "1:31:57"}
948
+ {"current_steps": 948, "total_steps": 1230, "loss": 0.1637, "lr": 6.070132051252868e-06, "epoch": 3.8445569620253166, "percentage": 77.07, "elapsed_time": "5:08:00", "remaining_time": "1:31:37"}
949
+ {"current_steps": 949, "total_steps": 1230, "loss": 0.1605, "lr": 6.0294602641290034e-06, "epoch": 3.848607594936709, "percentage": 77.15, "elapsed_time": "5:08:19", "remaining_time": "1:31:17"}
950
+ {"current_steps": 950, "total_steps": 1230, "loss": 0.1745, "lr": 5.988900993811575e-06, "epoch": 3.852658227848101, "percentage": 77.24, "elapsed_time": "5:08:37", "remaining_time": "1:30:57"}
951
+ {"current_steps": 951, "total_steps": 1230, "loss": 0.1604, "lr": 5.948454566959363e-06, "epoch": 3.8567088607594937, "percentage": 77.32, "elapsed_time": "5:08:55", "remaining_time": "1:30:37"}
952
+ {"current_steps": 952, "total_steps": 1230, "loss": 0.15, "lr": 5.908121309322328e-06, "epoch": 3.8607594936708862, "percentage": 77.4, "elapsed_time": "5:09:13", "remaining_time": "1:30:18"}
953
+ {"current_steps": 953, "total_steps": 1230, "loss": 0.158, "lr": 5.867901545738976e-06, "epoch": 3.8648101265822783, "percentage": 77.48, "elapsed_time": "5:09:32", "remaining_time": "1:29:58"}
954
+ {"current_steps": 954, "total_steps": 1230, "loss": 0.1598, "lr": 5.827795600133774e-06, "epoch": 3.868860759493671, "percentage": 77.56, "elapsed_time": "5:09:51", "remaining_time": "1:29:38"}
955
+ {"current_steps": 955, "total_steps": 1230, "loss": 0.1812, "lr": 5.787803795514466e-06, "epoch": 3.8729113924050633, "percentage": 77.64, "elapsed_time": "5:10:10", "remaining_time": "1:29:18"}
956
+ {"current_steps": 956, "total_steps": 1230, "loss": 0.1713, "lr": 5.747926453969576e-06, "epoch": 3.876962025316456, "percentage": 77.72, "elapsed_time": "5:10:29", "remaining_time": "1:28:59"}
957
+ {"current_steps": 957, "total_steps": 1230, "loss": 0.1664, "lr": 5.708163896665708e-06, "epoch": 3.8810126582278484, "percentage": 77.8, "elapsed_time": "5:10:48", "remaining_time": "1:28:39"}
958
+ {"current_steps": 958, "total_steps": 1230, "loss": 0.157, "lr": 5.668516443845047e-06, "epoch": 3.8850632911392404, "percentage": 77.89, "elapsed_time": "5:11:05", "remaining_time": "1:28:19"}
959
+ {"current_steps": 959, "total_steps": 1230, "loss": 0.1708, "lr": 5.6289844148227225e-06, "epoch": 3.889113924050633, "percentage": 77.97, "elapsed_time": "5:11:23", "remaining_time": "1:27:59"}
960
+ {"current_steps": 960, "total_steps": 1230, "loss": 0.179, "lr": 5.5895681279842615e-06, "epoch": 3.8931645569620255, "percentage": 78.05, "elapsed_time": "5:11:42", "remaining_time": "1:27:39"}
961
+ {"current_steps": 961, "total_steps": 1230, "loss": 0.1666, "lr": 5.550267900783019e-06, "epoch": 3.8972151898734175, "percentage": 78.13, "elapsed_time": "5:11:59", "remaining_time": "1:27:19"}
962
+ {"current_steps": 962, "total_steps": 1230, "loss": 0.1565, "lr": 5.511084049737623e-06, "epoch": 3.90126582278481, "percentage": 78.21, "elapsed_time": "5:12:17", "remaining_time": "1:26:59"}
963
+ {"current_steps": 963, "total_steps": 1230, "loss": 0.1431, "lr": 5.4720168904294215e-06, "epoch": 3.9053164556962026, "percentage": 78.29, "elapsed_time": "5:12:33", "remaining_time": "1:26:39"}
964
+ {"current_steps": 964, "total_steps": 1230, "loss": 0.1672, "lr": 5.433066737499948e-06, "epoch": 3.909367088607595, "percentage": 78.37, "elapsed_time": "5:12:52", "remaining_time": "1:26:19"}
965
+ {"current_steps": 965, "total_steps": 1230, "loss": 0.1782, "lr": 5.394233904648376e-06, "epoch": 3.9134177215189876, "percentage": 78.46, "elapsed_time": "5:13:09", "remaining_time": "1:25:59"}
966
+ {"current_steps": 966, "total_steps": 1230, "loss": 0.1687, "lr": 5.355518704628997e-06, "epoch": 3.9174683544303797, "percentage": 78.54, "elapsed_time": "5:13:29", "remaining_time": "1:25:40"}
967
+ {"current_steps": 967, "total_steps": 1230, "loss": 0.168, "lr": 5.316921449248731e-06, "epoch": 3.921518987341772, "percentage": 78.62, "elapsed_time": "5:13:48", "remaining_time": "1:25:20"}
968
+ {"current_steps": 968, "total_steps": 1230, "loss": 0.1788, "lr": 5.278442449364538e-06, "epoch": 3.9255696202531647, "percentage": 78.7, "elapsed_time": "5:14:06", "remaining_time": "1:25:01"}
969
+ {"current_steps": 969, "total_steps": 1230, "loss": 0.17, "lr": 5.240082014881016e-06, "epoch": 3.9296202531645568, "percentage": 78.78, "elapsed_time": "5:14:25", "remaining_time": "1:24:41"}
970
+ {"current_steps": 970, "total_steps": 1230, "loss": 0.159, "lr": 5.201840454747822e-06, "epoch": 3.9336708860759493, "percentage": 78.86, "elapsed_time": "5:14:44", "remaining_time": "1:24:21"}
971
+ {"current_steps": 971, "total_steps": 1230, "loss": 0.1452, "lr": 5.163718076957223e-06, "epoch": 3.937721518987342, "percentage": 78.94, "elapsed_time": "5:15:02", "remaining_time": "1:24:01"}
972
+ {"current_steps": 972, "total_steps": 1230, "loss": 0.1682, "lr": 5.125715188541609e-06, "epoch": 3.9417721518987343, "percentage": 79.02, "elapsed_time": "5:15:21", "remaining_time": "1:23:42"}
973
+ {"current_steps": 973, "total_steps": 1230, "loss": 0.1713, "lr": 5.087832095571021e-06, "epoch": 3.945822784810127, "percentage": 79.11, "elapsed_time": "5:15:41", "remaining_time": "1:23:22"}
974
+ {"current_steps": 974, "total_steps": 1230, "loss": 0.1583, "lr": 5.0500691031506766e-06, "epoch": 3.949873417721519, "percentage": 79.19, "elapsed_time": "5:16:00", "remaining_time": "1:23:03"}
975
+ {"current_steps": 975, "total_steps": 1230, "loss": 0.1724, "lr": 5.01242651541854e-06, "epoch": 3.9539240506329114, "percentage": 79.27, "elapsed_time": "5:16:18", "remaining_time": "1:22:43"}
976
+ {"current_steps": 976, "total_steps": 1230, "loss": 0.1724, "lr": 4.974904635542815e-06, "epoch": 3.957974683544304, "percentage": 79.35, "elapsed_time": "5:16:37", "remaining_time": "1:22:23"}
977
+ {"current_steps": 977, "total_steps": 1230, "loss": 0.1557, "lr": 4.937503765719582e-06, "epoch": 3.962025316455696, "percentage": 79.43, "elapsed_time": "5:16:54", "remaining_time": "1:22:04"}
978
+ {"current_steps": 978, "total_steps": 1230, "loss": 0.1697, "lr": 4.900224207170299e-06, "epoch": 3.9660759493670885, "percentage": 79.51, "elapsed_time": "5:17:12", "remaining_time": "1:21:44"}
979
+ {"current_steps": 979, "total_steps": 1230, "loss": 0.1558, "lr": 4.8630662601394065e-06, "epoch": 3.970126582278481, "percentage": 79.59, "elapsed_time": "5:17:29", "remaining_time": "1:21:24"}
980
+ {"current_steps": 980, "total_steps": 1230, "loss": 0.1723, "lr": 4.8260302238918995e-06, "epoch": 3.9741772151898735, "percentage": 79.67, "elapsed_time": "5:17:49", "remaining_time": "1:21:04"}
981
+ {"current_steps": 981, "total_steps": 1230, "loss": 0.1661, "lr": 4.789116396710924e-06, "epoch": 3.978227848101266, "percentage": 79.76, "elapsed_time": "5:18:07", "remaining_time": "1:20:44"}
982
+ {"current_steps": 982, "total_steps": 1230, "loss": 0.1602, "lr": 4.752325075895368e-06, "epoch": 3.982278481012658, "percentage": 79.84, "elapsed_time": "5:18:25", "remaining_time": "1:20:25"}
983
+ {"current_steps": 983, "total_steps": 1230, "loss": 0.1528, "lr": 4.715656557757473e-06, "epoch": 3.9863291139240506, "percentage": 79.92, "elapsed_time": "5:18:45", "remaining_time": "1:20:05"}
984
+ {"current_steps": 984, "total_steps": 1230, "loss": 0.1556, "lr": 4.679111137620442e-06, "epoch": 3.990379746835443, "percentage": 80.0, "elapsed_time": "5:19:02", "remaining_time": "1:19:45"}
985
+ {"current_steps": 985, "total_steps": 1230, "loss": 0.1744, "lr": 4.6426891098160585e-06, "epoch": 3.9944303797468352, "percentage": 80.08, "elapsed_time": "5:19:21", "remaining_time": "1:19:26"}
986
+ {"current_steps": 986, "total_steps": 1230, "loss": 0.1919, "lr": 4.6063907676823474e-06, "epoch": 3.9984810126582278, "percentage": 80.16, "elapsed_time": "5:19:41", "remaining_time": "1:19:06"}
987
+ {"current_steps": 987, "total_steps": 1230, "loss": 0.1229, "lr": 4.570216403561141e-06, "epoch": 4.004050632911392, "percentage": 80.24, "elapsed_time": "5:21:15", "remaining_time": "1:19:05"}
988
+ {"current_steps": 988, "total_steps": 1230, "loss": 0.1015, "lr": 4.534166308795815e-06, "epoch": 4.008101265822785, "percentage": 80.33, "elapsed_time": "5:21:33", "remaining_time": "1:18:45"}
989
+ {"current_steps": 989, "total_steps": 1230, "loss": 0.105, "lr": 4.498240773728859e-06, "epoch": 4.012151898734177, "percentage": 80.41, "elapsed_time": "5:21:52", "remaining_time": "1:18:25"}
990
+ {"current_steps": 990, "total_steps": 1230, "loss": 0.0978, "lr": 4.462440087699609e-06, "epoch": 4.01620253164557, "percentage": 80.49, "elapsed_time": "5:22:10", "remaining_time": "1:18:06"}
991
+ {"current_steps": 991, "total_steps": 1230, "loss": 0.1072, "lr": 4.426764539041861e-06, "epoch": 4.020253164556962, "percentage": 80.57, "elapsed_time": "5:22:30", "remaining_time": "1:17:46"}
992
+ {"current_steps": 992, "total_steps": 1230, "loss": 0.0941, "lr": 4.391214415081582e-06, "epoch": 4.024303797468354, "percentage": 80.65, "elapsed_time": "5:22:48", "remaining_time": "1:17:26"}
993
+ {"current_steps": 993, "total_steps": 1230, "loss": 0.0986, "lr": 4.355790002134579e-06, "epoch": 4.028354430379747, "percentage": 80.73, "elapsed_time": "5:23:08", "remaining_time": "1:17:07"}
994
+ {"current_steps": 994, "total_steps": 1230, "loss": 0.1114, "lr": 4.320491585504207e-06, "epoch": 4.032405063291139, "percentage": 80.81, "elapsed_time": "5:23:27", "remaining_time": "1:16:47"}
995
+ {"current_steps": 995, "total_steps": 1230, "loss": 0.1133, "lr": 4.2853194494790615e-06, "epoch": 4.036455696202531, "percentage": 80.89, "elapsed_time": "5:23:47", "remaining_time": "1:16:28"}
996
+ {"current_steps": 996, "total_steps": 1230, "loss": 0.1024, "lr": 4.250273877330691e-06, "epoch": 4.040506329113924, "percentage": 80.98, "elapsed_time": "5:24:08", "remaining_time": "1:16:09"}
997
+ {"current_steps": 997, "total_steps": 1230, "loss": 0.106, "lr": 4.215355151311313e-06, "epoch": 4.044556962025316, "percentage": 81.06, "elapsed_time": "5:24:27", "remaining_time": "1:15:49"}
998
+ {"current_steps": 998, "total_steps": 1230, "loss": 0.108, "lr": 4.180563552651542e-06, "epoch": 4.048607594936709, "percentage": 81.14, "elapsed_time": "5:24:48", "remaining_time": "1:15:30"}
999
+ {"current_steps": 999, "total_steps": 1230, "loss": 0.1007, "lr": 4.145899361558147e-06, "epoch": 4.052658227848101, "percentage": 81.22, "elapsed_time": "5:25:06", "remaining_time": "1:15:10"}
1000
+ {"current_steps": 1000, "total_steps": 1230, "loss": 0.106, "lr": 4.111362857211738e-06, "epoch": 4.056708860759493, "percentage": 81.3, "elapsed_time": "5:25:27", "remaining_time": "1:14:51"}
1001
+ {"current_steps": 1001, "total_steps": 1230, "loss": 0.0943, "lr": 4.076954317764592e-06, "epoch": 4.060759493670886, "percentage": 81.38, "elapsed_time": "5:25:45", "remaining_time": "1:14:31"}
1002
+ {"current_steps": 1002, "total_steps": 1230, "loss": 0.1024, "lr": 4.042674020338335e-06, "epoch": 4.0648101265822785, "percentage": 81.46, "elapsed_time": "5:26:04", "remaining_time": "1:14:11"}