sedrickkeh commited on
Commit
7173a40
·
verified ·
1 Parent(s): 03c5858

Training in progress, epoch 3

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4fc5ca1ed4b2f59591392ef2f55fe876722fc409d285094d9f6d667343df3028
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1567ca1bacfc0123187f34cfbc9cc462153ae798104fc457c79d505e2bcd1b06
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a37b70cfa48c7efa19bcafaf2995f82f0714eb1bb27067b7f1864f1aaf4a362c
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9883e7cb812f9d7c9e2629b56e6a153b70163b043c8c9f226499ac4528830ec0
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cf6aa2037750d707c2f0597579fd3cb0830c0328c838b5970ccd11224754ac08
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:37dbee9c60ec45d79dc5ef0176945aa42e22df393aed478ecab9f05c8956237b
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d3678420e13d8e13518a8715b14440ad817adf6d6f3842b26aec79a4680e019e
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:473d543ee74cb9f62bf8246307dfd5e2986d56b482a449599b52f3432e332175
3
  size 1089994880
trainer_log.jsonl CHANGED
@@ -740,3 +740,249 @@
740
  {"current_steps": 740, "total_steps": 1230, "loss": 0.4085, "lr": 1.6415300222223788e-05, "epoch": 2.9974683544303797, "percentage": 60.16, "elapsed_time": "21:03:37", "remaining_time": "13:56:43"}
741
  {"current_steps": 741, "total_steps": 1230, "loss": 0.4219, "lr": 1.6359475191103958e-05, "epoch": 3.0015189873417722, "percentage": 60.24, "elapsed_time": "21:06:32", "remaining_time": "13:55:48"}
742
  {"current_steps": 742, "total_steps": 1230, "loss": 0.289, "lr": 1.6303679480270466e-05, "epoch": 3.0055696202531648, "percentage": 60.33, "elapsed_time": "21:08:05", "remaining_time": "13:53:59"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
740
  {"current_steps": 740, "total_steps": 1230, "loss": 0.4085, "lr": 1.6415300222223788e-05, "epoch": 2.9974683544303797, "percentage": 60.16, "elapsed_time": "21:03:37", "remaining_time": "13:56:43"}
741
  {"current_steps": 741, "total_steps": 1230, "loss": 0.4219, "lr": 1.6359475191103958e-05, "epoch": 3.0015189873417722, "percentage": 60.24, "elapsed_time": "21:06:32", "remaining_time": "13:55:48"}
742
  {"current_steps": 742, "total_steps": 1230, "loss": 0.289, "lr": 1.6303679480270466e-05, "epoch": 3.0055696202531648, "percentage": 60.33, "elapsed_time": "21:08:05", "remaining_time": "13:53:59"}
743
+ {"current_steps": 743, "total_steps": 1230, "loss": 0.2974, "lr": 1.624791353909428e-05, "epoch": 3.009620253164557, "percentage": 60.41, "elapsed_time": "21:09:41", "remaining_time": "13:52:13"}
744
+ {"current_steps": 744, "total_steps": 1230, "loss": 0.2942, "lr": 1.619217781670663e-05, "epoch": 3.0136708860759494, "percentage": 60.49, "elapsed_time": "21:11:19", "remaining_time": "13:50:27"}
745
+ {"current_steps": 745, "total_steps": 1230, "loss": 0.3141, "lr": 1.6136472761995373e-05, "epoch": 3.017721518987342, "percentage": 60.57, "elapsed_time": "21:12:58", "remaining_time": "13:48:43"}
746
+ {"current_steps": 746, "total_steps": 1230, "loss": 0.2926, "lr": 1.608079882360134e-05, "epoch": 3.0217721518987344, "percentage": 60.65, "elapsed_time": "21:14:43", "remaining_time": "13:47:02"}
747
+ {"current_steps": 747, "total_steps": 1230, "loss": 0.3036, "lr": 1.60251564499148e-05, "epoch": 3.0258227848101265, "percentage": 60.73, "elapsed_time": "21:16:31", "remaining_time": "13:45:23"}
748
+ {"current_steps": 748, "total_steps": 1230, "loss": 0.2931, "lr": 1.596954608907176e-05, "epoch": 3.029873417721519, "percentage": 60.81, "elapsed_time": "21:18:24", "remaining_time": "13:43:47"}
749
+ {"current_steps": 749, "total_steps": 1230, "loss": 0.3076, "lr": 1.591396818895043e-05, "epoch": 3.0339240506329115, "percentage": 60.89, "elapsed_time": "21:20:17", "remaining_time": "13:42:11"}
750
+ {"current_steps": 750, "total_steps": 1230, "loss": 0.2919, "lr": 1.585842319716759e-05, "epoch": 3.037974683544304, "percentage": 60.98, "elapsed_time": "21:22:09", "remaining_time": "13:40:34"}
751
+ {"current_steps": 751, "total_steps": 1230, "loss": 0.2892, "lr": 1.5802911561074944e-05, "epoch": 3.042025316455696, "percentage": 61.06, "elapsed_time": "21:23:50", "remaining_time": "13:38:51"}
752
+ {"current_steps": 752, "total_steps": 1230, "loss": 0.2977, "lr": 1.5747433727755595e-05, "epoch": 3.0460759493670886, "percentage": 61.14, "elapsed_time": "21:25:13", "remaining_time": "13:36:56"}
753
+ {"current_steps": 753, "total_steps": 1230, "loss": 0.3139, "lr": 1.5691990144020376e-05, "epoch": 3.050126582278481, "percentage": 61.22, "elapsed_time": "21:27:07", "remaining_time": "13:35:21"}
754
+ {"current_steps": 754, "total_steps": 1230, "loss": 0.283, "lr": 1.5636581256404297e-05, "epoch": 3.0541772151898736, "percentage": 61.3, "elapsed_time": "21:28:46", "remaining_time": "13:33:36"}
755
+ {"current_steps": 755, "total_steps": 1230, "loss": 0.3032, "lr": 1.558120751116291e-05, "epoch": 3.0582278481012657, "percentage": 61.38, "elapsed_time": "21:30:18", "remaining_time": "13:31:46"}
756
+ {"current_steps": 756, "total_steps": 1230, "loss": 0.2796, "lr": 1.552586935426876e-05, "epoch": 3.062278481012658, "percentage": 61.46, "elapsed_time": "21:31:49", "remaining_time": "13:29:57"}
757
+ {"current_steps": 757, "total_steps": 1230, "loss": 0.2941, "lr": 1.547056723140774e-05, "epoch": 3.0663291139240507, "percentage": 61.54, "elapsed_time": "21:33:22", "remaining_time": "13:28:08"}
758
+ {"current_steps": 758, "total_steps": 1230, "loss": 0.3041, "lr": 1.5415301587975565e-05, "epoch": 3.0703797468354432, "percentage": 61.63, "elapsed_time": "21:35:07", "remaining_time": "13:26:27"}
759
+ {"current_steps": 759, "total_steps": 1230, "loss": 0.3016, "lr": 1.536007286907411e-05, "epoch": 3.0744303797468353, "percentage": 61.71, "elapsed_time": "21:36:54", "remaining_time": "13:24:47"}
760
+ {"current_steps": 760, "total_steps": 1230, "loss": 0.3069, "lr": 1.5304881519507896e-05, "epoch": 3.078481012658228, "percentage": 61.79, "elapsed_time": "21:38:52", "remaining_time": "13:23:15"}
761
+ {"current_steps": 761, "total_steps": 1230, "loss": 0.2879, "lr": 1.5249727983780453e-05, "epoch": 3.0825316455696203, "percentage": 61.87, "elapsed_time": "21:40:24", "remaining_time": "13:21:26"}
762
+ {"current_steps": 762, "total_steps": 1230, "loss": 0.3212, "lr": 1.5194612706090786e-05, "epoch": 3.086582278481013, "percentage": 61.95, "elapsed_time": "21:42:06", "remaining_time": "13:19:43"}
763
+ {"current_steps": 763, "total_steps": 1230, "loss": 0.283, "lr": 1.5139536130329771e-05, "epoch": 3.090632911392405, "percentage": 62.03, "elapsed_time": "21:43:48", "remaining_time": "13:18:00"}
764
+ {"current_steps": 764, "total_steps": 1230, "loss": 0.2866, "lr": 1.508449870007656e-05, "epoch": 3.0946835443037974, "percentage": 62.11, "elapsed_time": "21:45:30", "remaining_time": "13:16:17"}
765
+ {"current_steps": 765, "total_steps": 1230, "loss": 0.3163, "lr": 1.5029500858595056e-05, "epoch": 3.09873417721519, "percentage": 62.2, "elapsed_time": "21:47:10", "remaining_time": "13:14:33"}
766
+ {"current_steps": 766, "total_steps": 1230, "loss": 0.285, "lr": 1.4974543048830328e-05, "epoch": 3.1027848101265825, "percentage": 62.28, "elapsed_time": "21:48:46", "remaining_time": "13:12:46"}
767
+ {"current_steps": 767, "total_steps": 1230, "loss": 0.2892, "lr": 1.4919625713405e-05, "epoch": 3.1068354430379745, "percentage": 62.36, "elapsed_time": "21:50:27", "remaining_time": "13:11:03"}
768
+ {"current_steps": 768, "total_steps": 1230, "loss": 0.2857, "lr": 1.4864749294615756e-05, "epoch": 3.110886075949367, "percentage": 62.44, "elapsed_time": "21:52:04", "remaining_time": "13:09:17"}
769
+ {"current_steps": 769, "total_steps": 1230, "loss": 0.2885, "lr": 1.4809914234429716e-05, "epoch": 3.1149367088607596, "percentage": 62.52, "elapsed_time": "21:53:41", "remaining_time": "13:07:31"}
770
+ {"current_steps": 770, "total_steps": 1230, "loss": 0.3264, "lr": 1.4755120974480923e-05, "epoch": 3.118987341772152, "percentage": 62.6, "elapsed_time": "21:55:22", "remaining_time": "13:05:48"}
771
+ {"current_steps": 771, "total_steps": 1230, "loss": 0.2911, "lr": 1.4700369956066771e-05, "epoch": 3.123037974683544, "percentage": 62.68, "elapsed_time": "21:57:08", "remaining_time": "13:04:07"}
772
+ {"current_steps": 772, "total_steps": 1230, "loss": 0.2874, "lr": 1.4645661620144413e-05, "epoch": 3.1270886075949367, "percentage": 62.76, "elapsed_time": "21:58:31", "remaining_time": "13:02:13"}
773
+ {"current_steps": 773, "total_steps": 1230, "loss": 0.2979, "lr": 1.4590996407327284e-05, "epoch": 3.131139240506329, "percentage": 62.85, "elapsed_time": "22:00:04", "remaining_time": "13:00:26"}
774
+ {"current_steps": 774, "total_steps": 1230, "loss": 0.2939, "lr": 1.4536374757881487e-05, "epoch": 3.1351898734177217, "percentage": 62.93, "elapsed_time": "22:01:50", "remaining_time": "12:58:45"}
775
+ {"current_steps": 775, "total_steps": 1230, "loss": 0.2928, "lr": 1.4481797111722271e-05, "epoch": 3.1392405063291138, "percentage": 63.01, "elapsed_time": "22:03:34", "remaining_time": "12:57:04"}
776
+ {"current_steps": 776, "total_steps": 1230, "loss": 0.2697, "lr": 1.4427263908410507e-05, "epoch": 3.1432911392405063, "percentage": 63.09, "elapsed_time": "22:05:25", "remaining_time": "12:55:26"}
777
+ {"current_steps": 777, "total_steps": 1230, "loss": 0.291, "lr": 1.4372775587149108e-05, "epoch": 3.147341772151899, "percentage": 63.17, "elapsed_time": "22:07:10", "remaining_time": "12:53:45"}
778
+ {"current_steps": 778, "total_steps": 1230, "loss": 0.2951, "lr": 1.4318332586779522e-05, "epoch": 3.1513924050632913, "percentage": 63.25, "elapsed_time": "22:08:47", "remaining_time": "12:52:00"}
779
+ {"current_steps": 779, "total_steps": 1230, "loss": 0.2852, "lr": 1.4263935345778202e-05, "epoch": 3.1554430379746834, "percentage": 63.33, "elapsed_time": "22:10:29", "remaining_time": "12:50:17"}
780
+ {"current_steps": 780, "total_steps": 1230, "loss": 0.296, "lr": 1.420958430225303e-05, "epoch": 3.159493670886076, "percentage": 63.41, "elapsed_time": "22:12:13", "remaining_time": "12:48:35"}
781
+ {"current_steps": 781, "total_steps": 1230, "loss": 0.2991, "lr": 1.415527989393985e-05, "epoch": 3.1635443037974684, "percentage": 63.5, "elapsed_time": "22:14:13", "remaining_time": "12:47:03"}
782
+ {"current_steps": 782, "total_steps": 1230, "loss": 0.2774, "lr": 1.410102255819891e-05, "epoch": 3.167594936708861, "percentage": 63.58, "elapsed_time": "22:15:46", "remaining_time": "12:45:14"}
783
+ {"current_steps": 783, "total_steps": 1230, "loss": 0.3017, "lr": 1.404681273201131e-05, "epoch": 3.171645569620253, "percentage": 63.66, "elapsed_time": "22:17:34", "remaining_time": "12:43:35"}
784
+ {"current_steps": 784, "total_steps": 1230, "loss": 0.2964, "lr": 1.399265085197556e-05, "epoch": 3.1756962025316455, "percentage": 63.74, "elapsed_time": "22:19:20", "remaining_time": "12:41:55"}
785
+ {"current_steps": 785, "total_steps": 1230, "loss": 0.2937, "lr": 1.393853735430398e-05, "epoch": 3.179746835443038, "percentage": 63.82, "elapsed_time": "22:20:48", "remaining_time": "12:40:04"}
786
+ {"current_steps": 786, "total_steps": 1230, "loss": 0.28, "lr": 1.3884472674819246e-05, "epoch": 3.1837974683544306, "percentage": 63.9, "elapsed_time": "22:22:26", "remaining_time": "12:38:19"}
787
+ {"current_steps": 787, "total_steps": 1230, "loss": 0.2879, "lr": 1.3830457248950864e-05, "epoch": 3.1878481012658226, "percentage": 63.98, "elapsed_time": "22:24:15", "remaining_time": "12:36:41"}
788
+ {"current_steps": 788, "total_steps": 1230, "loss": 0.2936, "lr": 1.377649151173163e-05, "epoch": 3.191898734177215, "percentage": 64.07, "elapsed_time": "22:25:56", "remaining_time": "12:34:57"}
789
+ {"current_steps": 789, "total_steps": 1230, "loss": 0.2998, "lr": 1.3722575897794181e-05, "epoch": 3.1959493670886077, "percentage": 64.15, "elapsed_time": "22:27:43", "remaining_time": "12:33:17"}
790
+ {"current_steps": 790, "total_steps": 1230, "loss": 0.3084, "lr": 1.3668710841367472e-05, "epoch": 3.2, "percentage": 64.23, "elapsed_time": "22:29:44", "remaining_time": "12:31:45"}
791
+ {"current_steps": 791, "total_steps": 1230, "loss": 0.2911, "lr": 1.361489677627324e-05, "epoch": 3.2040506329113922, "percentage": 64.31, "elapsed_time": "22:31:27", "remaining_time": "12:30:02"}
792
+ {"current_steps": 792, "total_steps": 1230, "loss": 0.2708, "lr": 1.3561134135922585e-05, "epoch": 3.2081012658227848, "percentage": 64.39, "elapsed_time": "22:33:02", "remaining_time": "12:28:16"}
793
+ {"current_steps": 793, "total_steps": 1230, "loss": 0.3148, "lr": 1.350742335331241e-05, "epoch": 3.2121518987341773, "percentage": 64.47, "elapsed_time": "22:34:55", "remaining_time": "12:26:39"}
794
+ {"current_steps": 794, "total_steps": 1230, "loss": 0.2933, "lr": 1.345376486102198e-05, "epoch": 3.21620253164557, "percentage": 64.55, "elapsed_time": "22:36:35", "remaining_time": "12:24:55"}
795
+ {"current_steps": 795, "total_steps": 1230, "loss": 0.3016, "lr": 1.3400159091209414e-05, "epoch": 3.220253164556962, "percentage": 64.63, "elapsed_time": "22:38:07", "remaining_time": "12:23:07"}
796
+ {"current_steps": 796, "total_steps": 1230, "loss": 0.306, "lr": 1.3346606475608216e-05, "epoch": 3.2243037974683544, "percentage": 64.72, "elapsed_time": "22:39:49", "remaining_time": "12:21:24"}
797
+ {"current_steps": 797, "total_steps": 1230, "loss": 0.2833, "lr": 1.3293107445523781e-05, "epoch": 3.228354430379747, "percentage": 64.8, "elapsed_time": "22:41:34", "remaining_time": "12:19:43"}
798
+ {"current_steps": 798, "total_steps": 1230, "loss": 0.3131, "lr": 1.3239662431829949e-05, "epoch": 3.2324050632911394, "percentage": 64.88, "elapsed_time": "22:43:26", "remaining_time": "12:18:06"}
799
+ {"current_steps": 799, "total_steps": 1230, "loss": 0.2921, "lr": 1.3186271864965509e-05, "epoch": 3.2364556962025315, "percentage": 64.96, "elapsed_time": "22:44:55", "remaining_time": "12:16:16"}
800
+ {"current_steps": 800, "total_steps": 1230, "loss": 0.308, "lr": 1.3132936174930756e-05, "epoch": 3.240506329113924, "percentage": 65.04, "elapsed_time": "22:46:54", "remaining_time": "12:14:42"}
801
+ {"current_steps": 801, "total_steps": 1230, "loss": 0.2828, "lr": 1.3079655791283995e-05, "epoch": 3.2445569620253165, "percentage": 65.12, "elapsed_time": "22:48:29", "remaining_time": "12:12:56"}
802
+ {"current_steps": 802, "total_steps": 1230, "loss": 0.2937, "lr": 1.3026431143138108e-05, "epoch": 3.248607594936709, "percentage": 65.2, "elapsed_time": "22:50:06", "remaining_time": "12:11:11"}
803
+ {"current_steps": 803, "total_steps": 1230, "loss": 0.3009, "lr": 1.2973262659157114e-05, "epoch": 3.252658227848101, "percentage": 65.28, "elapsed_time": "22:52:03", "remaining_time": "12:09:36"}
804
+ {"current_steps": 804, "total_steps": 1230, "loss": 0.2868, "lr": 1.2920150767552651e-05, "epoch": 3.2567088607594936, "percentage": 65.37, "elapsed_time": "22:53:45", "remaining_time": "12:07:53"}
805
+ {"current_steps": 805, "total_steps": 1230, "loss": 0.3087, "lr": 1.2867095896080607e-05, "epoch": 3.260759493670886, "percentage": 65.45, "elapsed_time": "22:55:36", "remaining_time": "12:06:15"}
806
+ {"current_steps": 806, "total_steps": 1230, "loss": 0.2844, "lr": 1.2814098472037612e-05, "epoch": 3.2648101265822786, "percentage": 65.53, "elapsed_time": "22:57:18", "remaining_time": "12:04:32"}
807
+ {"current_steps": 807, "total_steps": 1230, "loss": 0.304, "lr": 1.276115892225764e-05, "epoch": 3.2688607594936707, "percentage": 65.61, "elapsed_time": "22:59:00", "remaining_time": "12:02:49"}
808
+ {"current_steps": 808, "total_steps": 1230, "loss": 0.2851, "lr": 1.2708277673108555e-05, "epoch": 3.2729113924050632, "percentage": 65.69, "elapsed_time": "23:00:31", "remaining_time": "12:01:01"}
809
+ {"current_steps": 809, "total_steps": 1230, "loss": 0.2975, "lr": 1.2655455150488649e-05, "epoch": 3.2769620253164558, "percentage": 65.77, "elapsed_time": "23:02:13", "remaining_time": "11:59:17"}
810
+ {"current_steps": 810, "total_steps": 1230, "loss": 0.2952, "lr": 1.2602691779823272e-05, "epoch": 3.2810126582278483, "percentage": 65.85, "elapsed_time": "23:03:57", "remaining_time": "11:57:36"}
811
+ {"current_steps": 811, "total_steps": 1230, "loss": 0.2951, "lr": 1.2549987986061355e-05, "epoch": 3.2850632911392403, "percentage": 65.93, "elapsed_time": "23:05:51", "remaining_time": "11:55:59"}
812
+ {"current_steps": 812, "total_steps": 1230, "loss": 0.2945, "lr": 1.2497344193672005e-05, "epoch": 3.289113924050633, "percentage": 66.02, "elapsed_time": "23:07:30", "remaining_time": "11:54:15"}
813
+ {"current_steps": 813, "total_steps": 1230, "loss": 0.2803, "lr": 1.2444760826641092e-05, "epoch": 3.2931645569620254, "percentage": 66.1, "elapsed_time": "23:09:00", "remaining_time": "11:52:26"}
814
+ {"current_steps": 814, "total_steps": 1230, "loss": 0.2942, "lr": 1.2392238308467817e-05, "epoch": 3.297215189873418, "percentage": 66.18, "elapsed_time": "23:10:32", "remaining_time": "11:50:38"}
815
+ {"current_steps": 815, "total_steps": 1230, "loss": 0.301, "lr": 1.2339777062161326e-05, "epoch": 3.30126582278481, "percentage": 66.26, "elapsed_time": "23:12:19", "remaining_time": "11:48:58"}
816
+ {"current_steps": 816, "total_steps": 1230, "loss": 0.2944, "lr": 1.2287377510237293e-05, "epoch": 3.3053164556962025, "percentage": 66.34, "elapsed_time": "23:14:04", "remaining_time": "11:47:17"}
817
+ {"current_steps": 817, "total_steps": 1230, "loss": 0.2917, "lr": 1.2235040074714488e-05, "epoch": 3.309367088607595, "percentage": 66.42, "elapsed_time": "23:15:50", "remaining_time": "11:45:36"}
818
+ {"current_steps": 818, "total_steps": 1230, "loss": 0.2927, "lr": 1.2182765177111434e-05, "epoch": 3.3134177215189875, "percentage": 66.5, "elapsed_time": "23:17:34", "remaining_time": "11:43:54"}
819
+ {"current_steps": 819, "total_steps": 1230, "loss": 0.2986, "lr": 1.213055323844297e-05, "epoch": 3.3174683544303796, "percentage": 66.59, "elapsed_time": "23:19:14", "remaining_time": "11:42:10"}
820
+ {"current_steps": 820, "total_steps": 1230, "loss": 0.3, "lr": 1.2078404679216864e-05, "epoch": 3.321518987341772, "percentage": 66.67, "elapsed_time": "23:20:51", "remaining_time": "11:40:25"}
821
+ {"current_steps": 821, "total_steps": 1230, "loss": 0.3088, "lr": 1.2026319919430458e-05, "epoch": 3.3255696202531646, "percentage": 66.75, "elapsed_time": "23:22:20", "remaining_time": "11:38:36"}
822
+ {"current_steps": 822, "total_steps": 1230, "loss": 0.2859, "lr": 1.1974299378567227e-05, "epoch": 3.329620253164557, "percentage": 66.83, "elapsed_time": "23:24:02", "remaining_time": "11:36:53"}
823
+ {"current_steps": 823, "total_steps": 1230, "loss": 0.3035, "lr": 1.1922343475593462e-05, "epoch": 3.333670886075949, "percentage": 66.91, "elapsed_time": "23:25:53", "remaining_time": "11:35:15"}
824
+ {"current_steps": 824, "total_steps": 1230, "loss": 0.2831, "lr": 1.187045262895488e-05, "epoch": 3.3377215189873417, "percentage": 66.99, "elapsed_time": "23:27:21", "remaining_time": "11:33:25"}
825
+ {"current_steps": 825, "total_steps": 1230, "loss": 0.3094, "lr": 1.1818627256573203e-05, "epoch": 3.3417721518987342, "percentage": 67.07, "elapsed_time": "23:29:13", "remaining_time": "11:31:48"}
826
+ {"current_steps": 826, "total_steps": 1230, "loss": 0.3071, "lr": 1.1766867775842864e-05, "epoch": 3.3458227848101267, "percentage": 67.15, "elapsed_time": "23:31:07", "remaining_time": "11:30:11"}
827
+ {"current_steps": 827, "total_steps": 1230, "loss": 0.297, "lr": 1.1715174603627615e-05, "epoch": 3.349873417721519, "percentage": 67.24, "elapsed_time": "23:32:42", "remaining_time": "11:28:25"}
828
+ {"current_steps": 828, "total_steps": 1230, "loss": 0.3051, "lr": 1.1663548156257147e-05, "epoch": 3.3539240506329113, "percentage": 67.32, "elapsed_time": "23:34:26", "remaining_time": "11:26:43"}
829
+ {"current_steps": 829, "total_steps": 1230, "loss": 0.2786, "lr": 1.161198884952377e-05, "epoch": 3.357974683544304, "percentage": 67.4, "elapsed_time": "23:36:00", "remaining_time": "11:24:56"}
830
+ {"current_steps": 830, "total_steps": 1230, "loss": 0.2898, "lr": 1.1560497098679056e-05, "epoch": 3.3620253164556964, "percentage": 67.48, "elapsed_time": "23:37:48", "remaining_time": "11:23:16"}
831
+ {"current_steps": 831, "total_steps": 1230, "loss": 0.3266, "lr": 1.1509073318430479e-05, "epoch": 3.3660759493670884, "percentage": 67.56, "elapsed_time": "23:39:38", "remaining_time": "11:21:38"}
832
+ {"current_steps": 832, "total_steps": 1230, "loss": 0.2842, "lr": 1.1457717922938116e-05, "epoch": 3.370126582278481, "percentage": 67.64, "elapsed_time": "23:41:26", "remaining_time": "11:19:57"}
833
+ {"current_steps": 833, "total_steps": 1230, "loss": 0.303, "lr": 1.1406431325811233e-05, "epoch": 3.3741772151898735, "percentage": 67.72, "elapsed_time": "23:43:05", "remaining_time": "11:18:13"}
834
+ {"current_steps": 834, "total_steps": 1230, "loss": 0.2966, "lr": 1.135521394010506e-05, "epoch": 3.378227848101266, "percentage": 67.8, "elapsed_time": "23:44:54", "remaining_time": "11:16:34"}
835
+ {"current_steps": 835, "total_steps": 1230, "loss": 0.2947, "lr": 1.1304066178317367e-05, "epoch": 3.382278481012658, "percentage": 67.89, "elapsed_time": "23:46:25", "remaining_time": "11:14:46"}
836
+ {"current_steps": 836, "total_steps": 1230, "loss": 0.2915, "lr": 1.1252988452385199e-05, "epoch": 3.3863291139240506, "percentage": 67.97, "elapsed_time": "23:48:15", "remaining_time": "11:13:07"}
837
+ {"current_steps": 837, "total_steps": 1230, "loss": 0.3064, "lr": 1.1201981173681536e-05, "epoch": 3.390379746835443, "percentage": 68.05, "elapsed_time": "23:50:22", "remaining_time": "11:11:36"}
838
+ {"current_steps": 838, "total_steps": 1230, "loss": 0.2713, "lr": 1.1151044753011991e-05, "epoch": 3.3944303797468356, "percentage": 68.13, "elapsed_time": "23:51:54", "remaining_time": "11:09:49"}
839
+ {"current_steps": 839, "total_steps": 1230, "loss": 0.2785, "lr": 1.1100179600611491e-05, "epoch": 3.3984810126582277, "percentage": 68.21, "elapsed_time": "23:53:27", "remaining_time": "11:08:02"}
840
+ {"current_steps": 840, "total_steps": 1230, "loss": 0.2877, "lr": 1.1049386126140985e-05, "epoch": 3.40253164556962, "percentage": 68.29, "elapsed_time": "23:55:14", "remaining_time": "11:06:21"}
841
+ {"current_steps": 841, "total_steps": 1230, "loss": 0.3069, "lr": 1.0998664738684128e-05, "epoch": 3.4065822784810127, "percentage": 68.37, "elapsed_time": "23:56:51", "remaining_time": "11:04:36"}
842
+ {"current_steps": 842, "total_steps": 1230, "loss": 0.3047, "lr": 1.0948015846744e-05, "epoch": 3.410632911392405, "percentage": 68.46, "elapsed_time": "23:58:26", "remaining_time": "11:02:50"}
843
+ {"current_steps": 843, "total_steps": 1230, "loss": 0.2737, "lr": 1.0897439858239832e-05, "epoch": 3.4146835443037973, "percentage": 68.54, "elapsed_time": "1 day, 0:00:01", "remaining_time": "11:01:04"}
844
+ {"current_steps": 844, "total_steps": 1230, "loss": 0.3024, "lr": 1.0846937180503652e-05, "epoch": 3.41873417721519, "percentage": 68.62, "elapsed_time": "1 day, 0:02:02", "remaining_time": "10:59:30"}
845
+ {"current_steps": 845, "total_steps": 1230, "loss": 0.282, "lr": 1.0796508220277117e-05, "epoch": 3.4227848101265823, "percentage": 68.7, "elapsed_time": "1 day, 0:03:41", "remaining_time": "10:57:46"}
846
+ {"current_steps": 846, "total_steps": 1230, "loss": 0.3057, "lr": 1.0746153383708107e-05, "epoch": 3.426835443037975, "percentage": 68.78, "elapsed_time": "1 day, 0:05:21", "remaining_time": "10:56:02"}
847
+ {"current_steps": 847, "total_steps": 1230, "loss": 0.3004, "lr": 1.0695873076347579e-05, "epoch": 3.430886075949367, "percentage": 68.86, "elapsed_time": "1 day, 0:07:02", "remaining_time": "10:54:19"}
848
+ {"current_steps": 848, "total_steps": 1230, "loss": 0.3068, "lr": 1.0645667703146205e-05, "epoch": 3.4349367088607594, "percentage": 68.94, "elapsed_time": "1 day, 0:08:51", "remaining_time": "10:52:40"}
849
+ {"current_steps": 849, "total_steps": 1230, "loss": 0.2739, "lr": 1.0595537668451161e-05, "epoch": 3.438987341772152, "percentage": 69.02, "elapsed_time": "1 day, 0:10:27", "remaining_time": "10:50:54"}
850
+ {"current_steps": 850, "total_steps": 1230, "loss": 0.2953, "lr": 1.0545483376002854e-05, "epoch": 3.4430379746835444, "percentage": 69.11, "elapsed_time": "1 day, 0:12:22", "remaining_time": "10:49:17"}
851
+ {"current_steps": 851, "total_steps": 1230, "loss": 0.3058, "lr": 1.0495505228931676e-05, "epoch": 3.4470886075949365, "percentage": 69.19, "elapsed_time": "1 day, 0:13:47", "remaining_time": "10:47:27"}
852
+ {"current_steps": 852, "total_steps": 1230, "loss": 0.304, "lr": 1.044560362975474e-05, "epoch": 3.451139240506329, "percentage": 69.27, "elapsed_time": "1 day, 0:15:21", "remaining_time": "10:45:41"}
853
+ {"current_steps": 853, "total_steps": 1230, "loss": 0.2851, "lr": 1.0395778980372695e-05, "epoch": 3.4551898734177215, "percentage": 69.35, "elapsed_time": "1 day, 0:16:59", "remaining_time": "10:43:56"}
854
+ {"current_steps": 854, "total_steps": 1230, "loss": 0.2926, "lr": 1.0346031682066381e-05, "epoch": 3.459240506329114, "percentage": 69.43, "elapsed_time": "1 day, 0:18:50", "remaining_time": "10:42:17"}
855
+ {"current_steps": 855, "total_steps": 1230, "loss": 0.2994, "lr": 1.0296362135493724e-05, "epoch": 3.463291139240506, "percentage": 69.51, "elapsed_time": "1 day, 0:20:34", "remaining_time": "10:40:35"}
856
+ {"current_steps": 856, "total_steps": 1230, "loss": 0.3285, "lr": 1.0246770740686422e-05, "epoch": 3.4673417721518986, "percentage": 69.59, "elapsed_time": "1 day, 0:22:38", "remaining_time": "10:39:02"}
857
+ {"current_steps": 857, "total_steps": 1230, "loss": 0.3057, "lr": 1.0197257897046743e-05, "epoch": 3.471392405063291, "percentage": 69.67, "elapsed_time": "1 day, 0:24:25", "remaining_time": "10:37:22"}
858
+ {"current_steps": 858, "total_steps": 1230, "loss": 0.2892, "lr": 1.014782400334433e-05, "epoch": 3.4754430379746837, "percentage": 69.76, "elapsed_time": "1 day, 0:26:10", "remaining_time": "10:35:41"}
859
+ {"current_steps": 859, "total_steps": 1230, "loss": 0.2843, "lr": 1.009846945771296e-05, "epoch": 3.479493670886076, "percentage": 69.84, "elapsed_time": "1 day, 0:27:55", "remaining_time": "10:33:59"}
860
+ {"current_steps": 860, "total_steps": 1230, "loss": 0.2976, "lr": 1.0049194657647363e-05, "epoch": 3.4835443037974683, "percentage": 69.92, "elapsed_time": "1 day, 0:29:44", "remaining_time": "10:32:19"}
861
+ {"current_steps": 861, "total_steps": 1230, "loss": 0.3056, "lr": 1.0000000000000006e-05, "epoch": 3.487594936708861, "percentage": 70.0, "elapsed_time": "1 day, 0:31:36", "remaining_time": "10:30:41"}
862
+ {"current_steps": 862, "total_steps": 1230, "loss": 0.2894, "lr": 9.950885880977891e-06, "epoch": 3.4916455696202533, "percentage": 70.08, "elapsed_time": "1 day, 0:33:22", "remaining_time": "10:29:00"}
863
+ {"current_steps": 863, "total_steps": 1230, "loss": 0.2884, "lr": 9.901852696139382e-06, "epoch": 3.4956962025316454, "percentage": 70.16, "elapsed_time": "1 day, 0:35:02", "remaining_time": "10:27:16"}
864
+ {"current_steps": 864, "total_steps": 1230, "loss": 0.309, "lr": 9.852900840391027e-06, "epoch": 3.499746835443038, "percentage": 70.24, "elapsed_time": "1 day, 0:36:45", "remaining_time": "10:25:34"}
865
+ {"current_steps": 865, "total_steps": 1230, "loss": 0.2906, "lr": 9.804030707984313e-06, "epoch": 3.5037974683544304, "percentage": 70.33, "elapsed_time": "1 day, 0:38:28", "remaining_time": "10:23:51"}
866
+ {"current_steps": 866, "total_steps": 1230, "loss": 0.287, "lr": 9.755242692512599e-06, "epoch": 3.507848101265823, "percentage": 70.41, "elapsed_time": "1 day, 0:40:10", "remaining_time": "10:22:09"}
867
+ {"current_steps": 867, "total_steps": 1230, "loss": 0.2981, "lr": 9.70653718690782e-06, "epoch": 3.5118987341772154, "percentage": 70.49, "elapsed_time": "1 day, 0:42:00", "remaining_time": "10:20:29"}
868
+ {"current_steps": 868, "total_steps": 1230, "loss": 0.303, "lr": 9.657914583437454e-06, "epoch": 3.5159493670886075, "percentage": 70.57, "elapsed_time": "1 day, 0:43:38", "remaining_time": "10:18:45"}
869
+ {"current_steps": 869, "total_steps": 1230, "loss": 0.2822, "lr": 9.609375273701246e-06, "epoch": 3.52, "percentage": 70.65, "elapsed_time": "1 day, 0:45:03", "remaining_time": "10:16:55"}
870
+ {"current_steps": 870, "total_steps": 1230, "loss": 0.2925, "lr": 9.560919648628133e-06, "epoch": 3.5240506329113925, "percentage": 70.73, "elapsed_time": "1 day, 0:46:56", "remaining_time": "10:15:17"}
871
+ {"current_steps": 871, "total_steps": 1230, "loss": 0.3262, "lr": 9.512548098473047e-06, "epoch": 3.5281012658227846, "percentage": 70.81, "elapsed_time": "1 day, 0:48:59", "remaining_time": "10:13:43"}
872
+ {"current_steps": 872, "total_steps": 1230, "loss": 0.2799, "lr": 9.464261012813825e-06, "epoch": 3.532151898734177, "percentage": 70.89, "elapsed_time": "1 day, 0:50:24", "remaining_time": "10:11:53"}
873
+ {"current_steps": 873, "total_steps": 1230, "loss": 0.2848, "lr": 9.416058780547987e-06, "epoch": 3.5362025316455696, "percentage": 70.98, "elapsed_time": "1 day, 0:52:08", "remaining_time": "10:10:11"}
874
+ {"current_steps": 874, "total_steps": 1230, "loss": 0.2908, "lr": 9.367941789889714e-06, "epoch": 3.540253164556962, "percentage": 71.06, "elapsed_time": "1 day, 0:53:49", "remaining_time": "10:08:27"}
875
+ {"current_steps": 875, "total_steps": 1230, "loss": 0.3001, "lr": 9.319910428366607e-06, "epoch": 3.5443037974683547, "percentage": 71.14, "elapsed_time": "1 day, 0:55:25", "remaining_time": "10:06:42"}
876
+ {"current_steps": 876, "total_steps": 1230, "loss": 0.3016, "lr": 9.271965082816667e-06, "epoch": 3.5483544303797467, "percentage": 71.22, "elapsed_time": "1 day, 0:57:11", "remaining_time": "10:05:01"}
877
+ {"current_steps": 877, "total_steps": 1230, "loss": 0.3073, "lr": 9.224106139385111e-06, "epoch": 3.5524050632911393, "percentage": 71.3, "elapsed_time": "1 day, 0:59:03", "remaining_time": "10:03:23"}
878
+ {"current_steps": 878, "total_steps": 1230, "loss": 0.2773, "lr": 9.176333983521291e-06, "epoch": 3.5564556962025318, "percentage": 71.38, "elapsed_time": "1 day, 1:00:46", "remaining_time": "10:01:40"}
879
+ {"current_steps": 879, "total_steps": 1230, "loss": 0.2995, "lr": 9.12864899997558e-06, "epoch": 3.560506329113924, "percentage": 71.46, "elapsed_time": "1 day, 1:02:30", "remaining_time": "9:59:58"}
880
+ {"current_steps": 880, "total_steps": 1230, "loss": 0.2937, "lr": 9.08105157279628e-06, "epoch": 3.5645569620253164, "percentage": 71.54, "elapsed_time": "1 day, 1:04:11", "remaining_time": "9:58:15"}
881
+ {"current_steps": 881, "total_steps": 1230, "loss": 0.2769, "lr": 9.03354208532653e-06, "epoch": 3.568607594936709, "percentage": 71.63, "elapsed_time": "1 day, 1:05:49", "remaining_time": "9:56:31"}
882
+ {"current_steps": 882, "total_steps": 1230, "loss": 0.307, "lr": 8.986120920201205e-06, "epoch": 3.5726582278481014, "percentage": 71.71, "elapsed_time": "1 day, 1:07:34", "remaining_time": "9:54:49"}
883
+ {"current_steps": 883, "total_steps": 1230, "loss": 0.2804, "lr": 8.938788459343852e-06, "epoch": 3.576708860759494, "percentage": 71.79, "elapsed_time": "1 day, 1:09:01", "remaining_time": "9:53:01"}
884
+ {"current_steps": 884, "total_steps": 1230, "loss": 0.3235, "lr": 8.8915450839636e-06, "epoch": 3.580759493670886, "percentage": 71.87, "elapsed_time": "1 day, 1:10:47", "remaining_time": "9:51:19"}
885
+ {"current_steps": 885, "total_steps": 1230, "loss": 0.2753, "lr": 8.844391174552116e-06, "epoch": 3.5848101265822785, "percentage": 71.95, "elapsed_time": "1 day, 1:12:20", "remaining_time": "9:49:33"}
886
+ {"current_steps": 886, "total_steps": 1230, "loss": 0.2809, "lr": 8.797327110880479e-06, "epoch": 3.588860759493671, "percentage": 72.03, "elapsed_time": "1 day, 1:13:56", "remaining_time": "9:47:48"}
887
+ {"current_steps": 887, "total_steps": 1230, "loss": 0.289, "lr": 8.750353271996206e-06, "epoch": 3.592911392405063, "percentage": 72.11, "elapsed_time": "1 day, 1:15:44", "remaining_time": "9:46:07"}
888
+ {"current_steps": 888, "total_steps": 1230, "loss": 0.3059, "lr": 8.703470036220132e-06, "epoch": 3.5969620253164556, "percentage": 72.2, "elapsed_time": "1 day, 1:17:23", "remaining_time": "9:44:24"}
889
+ {"current_steps": 889, "total_steps": 1230, "loss": 0.289, "lr": 8.656677781143394e-06, "epoch": 3.601012658227848, "percentage": 72.28, "elapsed_time": "1 day, 1:19:05", "remaining_time": "9:42:41"}
890
+ {"current_steps": 890, "total_steps": 1230, "loss": 0.2962, "lr": 8.609976883624377e-06, "epoch": 3.6050632911392406, "percentage": 72.36, "elapsed_time": "1 day, 1:20:46", "remaining_time": "9:40:58"}
891
+ {"current_steps": 891, "total_steps": 1230, "loss": 0.2963, "lr": 8.563367719785698e-06, "epoch": 3.609113924050633, "percentage": 72.44, "elapsed_time": "1 day, 1:22:35", "remaining_time": "9:39:18"}
892
+ {"current_steps": 892, "total_steps": 1230, "loss": 0.2762, "lr": 8.516850665011138e-06, "epoch": 3.613164556962025, "percentage": 72.52, "elapsed_time": "1 day, 1:24:10", "remaining_time": "9:37:32"}
893
+ {"current_steps": 893, "total_steps": 1230, "loss": 0.2989, "lr": 8.47042609394269e-06, "epoch": 3.6172151898734177, "percentage": 72.6, "elapsed_time": "1 day, 1:25:51", "remaining_time": "9:35:49"}
894
+ {"current_steps": 894, "total_steps": 1230, "loss": 0.2839, "lr": 8.424094380477432e-06, "epoch": 3.6212658227848102, "percentage": 72.68, "elapsed_time": "1 day, 1:27:24", "remaining_time": "9:34:03"}
895
+ {"current_steps": 895, "total_steps": 1230, "loss": 0.2933, "lr": 8.37785589776465e-06, "epoch": 3.6253164556962023, "percentage": 72.76, "elapsed_time": "1 day, 1:29:19", "remaining_time": "9:32:25"}
896
+ {"current_steps": 896, "total_steps": 1230, "loss": 0.2862, "lr": 8.331711018202694e-06, "epoch": 3.629367088607595, "percentage": 72.85, "elapsed_time": "1 day, 1:31:08", "remaining_time": "9:30:45"}
897
+ {"current_steps": 897, "total_steps": 1230, "loss": 0.2974, "lr": 8.285660113436104e-06, "epoch": 3.6334177215189873, "percentage": 72.93, "elapsed_time": "1 day, 1:32:44", "remaining_time": "9:29:00"}
898
+ {"current_steps": 898, "total_steps": 1230, "loss": 0.2791, "lr": 8.239703554352527e-06, "epoch": 3.63746835443038, "percentage": 73.01, "elapsed_time": "1 day, 1:34:31", "remaining_time": "9:27:19"}
899
+ {"current_steps": 899, "total_steps": 1230, "loss": 0.3033, "lr": 8.193841711079775e-06, "epoch": 3.6415189873417724, "percentage": 73.09, "elapsed_time": "1 day, 1:36:25", "remaining_time": "9:25:41"}
900
+ {"current_steps": 900, "total_steps": 1230, "loss": 0.2914, "lr": 8.148074952982828e-06, "epoch": 3.6455696202531644, "percentage": 73.17, "elapsed_time": "1 day, 1:38:05", "remaining_time": "9:23:58"}
901
+ {"current_steps": 901, "total_steps": 1230, "loss": 0.3078, "lr": 8.102403648660859e-06, "epoch": 3.649620253164557, "percentage": 73.25, "elapsed_time": "1 day, 1:39:31", "remaining_time": "9:22:09"}
902
+ {"current_steps": 902, "total_steps": 1230, "loss": 0.2981, "lr": 8.056828165944282e-06, "epoch": 3.6536708860759495, "percentage": 73.33, "elapsed_time": "1 day, 1:41:15", "remaining_time": "9:20:27"}
903
+ {"current_steps": 903, "total_steps": 1230, "loss": 0.3039, "lr": 8.011348871891762e-06, "epoch": 3.6577215189873415, "percentage": 73.41, "elapsed_time": "1 day, 1:42:52", "remaining_time": "9:18:42"}
904
+ {"current_steps": 904, "total_steps": 1230, "loss": 0.2957, "lr": 7.965966132787287e-06, "epoch": 3.661772151898734, "percentage": 73.5, "elapsed_time": "1 day, 1:44:30", "remaining_time": "9:16:58"}
905
+ {"current_steps": 905, "total_steps": 1230, "loss": 0.3017, "lr": 7.920680314137189e-06, "epoch": 3.6658227848101266, "percentage": 73.58, "elapsed_time": "1 day, 1:46:26", "remaining_time": "9:15:21"}
906
+ {"current_steps": 906, "total_steps": 1230, "loss": 0.3053, "lr": 7.875491780667246e-06, "epoch": 3.669873417721519, "percentage": 73.66, "elapsed_time": "1 day, 1:48:13", "remaining_time": "9:13:40"}
907
+ {"current_steps": 907, "total_steps": 1230, "loss": 0.2993, "lr": 7.830400896319667e-06, "epoch": 3.6739240506329116, "percentage": 73.74, "elapsed_time": "1 day, 1:49:48", "remaining_time": "9:11:55"}
908
+ {"current_steps": 908, "total_steps": 1230, "loss": 0.2797, "lr": 7.785408024250259e-06, "epoch": 3.6779746835443037, "percentage": 73.82, "elapsed_time": "1 day, 1:51:25", "remaining_time": "9:10:10"}
909
+ {"current_steps": 909, "total_steps": 1230, "loss": 0.3125, "lr": 7.74051352682542e-06, "epoch": 3.682025316455696, "percentage": 73.9, "elapsed_time": "1 day, 1:53:20", "remaining_time": "9:08:32"}
910
+ {"current_steps": 910, "total_steps": 1230, "loss": 0.2908, "lr": 7.695717765619257e-06, "epoch": 3.6860759493670887, "percentage": 73.98, "elapsed_time": "1 day, 1:54:54", "remaining_time": "9:06:46"}
911
+ {"current_steps": 911, "total_steps": 1230, "loss": 0.3064, "lr": 7.651021101410673e-06, "epoch": 3.690126582278481, "percentage": 74.07, "elapsed_time": "1 day, 1:56:41", "remaining_time": "9:05:06"}
912
+ {"current_steps": 912, "total_steps": 1230, "loss": 0.2776, "lr": 7.606423894180464e-06, "epoch": 3.6941772151898733, "percentage": 74.15, "elapsed_time": "1 day, 1:58:21", "remaining_time": "9:03:22"}
913
+ {"current_steps": 913, "total_steps": 1230, "loss": 0.3043, "lr": 7.56192650310839e-06, "epoch": 3.698227848101266, "percentage": 74.23, "elapsed_time": "1 day, 2:00:10", "remaining_time": "9:01:42"}
914
+ {"current_steps": 914, "total_steps": 1230, "loss": 0.301, "lr": 7.517529286570349e-06, "epoch": 3.7022784810126583, "percentage": 74.31, "elapsed_time": "1 day, 2:02:02", "remaining_time": "9:00:03"}
915
+ {"current_steps": 915, "total_steps": 1230, "loss": 0.2635, "lr": 7.473232602135387e-06, "epoch": 3.706329113924051, "percentage": 74.39, "elapsed_time": "1 day, 2:03:34", "remaining_time": "8:58:16"}
916
+ {"current_steps": 916, "total_steps": 1230, "loss": 0.304, "lr": 7.429036806562935e-06, "epoch": 3.710379746835443, "percentage": 74.47, "elapsed_time": "1 day, 2:05:02", "remaining_time": "8:56:29"}
917
+ {"current_steps": 917, "total_steps": 1230, "loss": 0.2754, "lr": 7.3849422557998455e-06, "epoch": 3.7144303797468354, "percentage": 74.55, "elapsed_time": "1 day, 2:06:48", "remaining_time": "8:54:48"}
918
+ {"current_steps": 918, "total_steps": 1230, "loss": 0.3059, "lr": 7.340949304977567e-06, "epoch": 3.718481012658228, "percentage": 74.63, "elapsed_time": "1 day, 2:08:25", "remaining_time": "8:53:03"}
919
+ {"current_steps": 919, "total_steps": 1230, "loss": 0.2983, "lr": 7.297058308409282e-06, "epoch": 3.72253164556962, "percentage": 74.72, "elapsed_time": "1 day, 2:10:08", "remaining_time": "8:51:21"}
920
+ {"current_steps": 920, "total_steps": 1230, "loss": 0.2919, "lr": 7.25326961958704e-06, "epoch": 3.7265822784810125, "percentage": 74.8, "elapsed_time": "1 day, 2:11:43", "remaining_time": "8:49:36"}
921
+ {"current_steps": 921, "total_steps": 1230, "loss": 0.2881, "lr": 7.209583591178921e-06, "epoch": 3.730632911392405, "percentage": 74.88, "elapsed_time": "1 day, 2:13:18", "remaining_time": "8:47:51"}
922
+ {"current_steps": 922, "total_steps": 1230, "loss": 0.2776, "lr": 7.1660005750261925e-06, "epoch": 3.7346835443037976, "percentage": 74.96, "elapsed_time": "1 day, 2:14:50", "remaining_time": "8:46:05"}
923
+ {"current_steps": 923, "total_steps": 1230, "loss": 0.3029, "lr": 7.1225209221404765e-06, "epoch": 3.73873417721519, "percentage": 75.04, "elapsed_time": "1 day, 2:16:36", "remaining_time": "8:44:23"}
924
+ {"current_steps": 924, "total_steps": 1230, "loss": 0.2904, "lr": 7.079144982700909e-06, "epoch": 3.742784810126582, "percentage": 75.12, "elapsed_time": "1 day, 2:18:10", "remaining_time": "8:42:38"}
925
+ {"current_steps": 925, "total_steps": 1230, "loss": 0.3018, "lr": 7.0358731060513695e-06, "epoch": 3.7468354430379747, "percentage": 75.2, "elapsed_time": "1 day, 2:20:00", "remaining_time": "8:40:58"}
926
+ {"current_steps": 926, "total_steps": 1230, "loss": 0.31, "lr": 6.99270564069757e-06, "epoch": 3.750886075949367, "percentage": 75.28, "elapsed_time": "1 day, 2:21:54", "remaining_time": "8:39:19"}
927
+ {"current_steps": 927, "total_steps": 1230, "loss": 0.3073, "lr": 6.949642934304375e-06, "epoch": 3.7549367088607593, "percentage": 75.37, "elapsed_time": "1 day, 2:23:45", "remaining_time": "8:37:40"}
928
+ {"current_steps": 928, "total_steps": 1230, "loss": 0.2877, "lr": 6.906685333692871e-06, "epoch": 3.7589873417721518, "percentage": 75.45, "elapsed_time": "1 day, 2:25:23", "remaining_time": "8:35:56"}
929
+ {"current_steps": 929, "total_steps": 1230, "loss": 0.294, "lr": 6.86383318483769e-06, "epoch": 3.7630379746835443, "percentage": 75.53, "elapsed_time": "1 day, 2:27:04", "remaining_time": "8:34:13"}
930
+ {"current_steps": 930, "total_steps": 1230, "loss": 0.2887, "lr": 6.821086832864139e-06, "epoch": 3.767088607594937, "percentage": 75.61, "elapsed_time": "1 day, 2:28:41", "remaining_time": "8:32:28"}
931
+ {"current_steps": 931, "total_steps": 1230, "loss": 0.3072, "lr": 6.77844662204546e-06, "epoch": 3.7711392405063293, "percentage": 75.69, "elapsed_time": "1 day, 2:30:31", "remaining_time": "8:30:48"}
932
+ {"current_steps": 932, "total_steps": 1230, "loss": 0.2925, "lr": 6.7359128958000455e-06, "epoch": 3.7751898734177214, "percentage": 75.77, "elapsed_time": "1 day, 2:32:16", "remaining_time": "8:29:07"}
933
+ {"current_steps": 933, "total_steps": 1230, "loss": 0.2903, "lr": 6.693485996688695e-06, "epoch": 3.779240506329114, "percentage": 75.85, "elapsed_time": "1 day, 2:33:56", "remaining_time": "8:27:23"}
934
+ {"current_steps": 934, "total_steps": 1230, "loss": 0.296, "lr": 6.651166266411801e-06, "epoch": 3.7832911392405064, "percentage": 75.93, "elapsed_time": "1 day, 2:35:33", "remaining_time": "8:25:39"}
935
+ {"current_steps": 935, "total_steps": 1230, "loss": 0.3007, "lr": 6.6089540458066725e-06, "epoch": 3.7873417721518985, "percentage": 76.02, "elapsed_time": "1 day, 2:37:34", "remaining_time": "8:24:02"}
936
+ {"current_steps": 936, "total_steps": 1230, "loss": 0.2918, "lr": 6.566849674844711e-06, "epoch": 3.791392405063291, "percentage": 76.1, "elapsed_time": "1 day, 2:39:15", "remaining_time": "8:22:19"}
937
+ {"current_steps": 937, "total_steps": 1230, "loss": 0.3015, "lr": 6.524853492628747e-06, "epoch": 3.7954430379746835, "percentage": 76.18, "elapsed_time": "1 day, 2:40:52", "remaining_time": "8:20:35"}
938
+ {"current_steps": 938, "total_steps": 1230, "loss": 0.2767, "lr": 6.4829658373902536e-06, "epoch": 3.799493670886076, "percentage": 76.26, "elapsed_time": "1 day, 2:42:20", "remaining_time": "8:18:48"}
939
+ {"current_steps": 939, "total_steps": 1230, "loss": 0.2995, "lr": 6.441187046486648e-06, "epoch": 3.8035443037974686, "percentage": 76.34, "elapsed_time": "1 day, 2:44:00", "remaining_time": "8:17:05"}
940
+ {"current_steps": 940, "total_steps": 1230, "loss": 0.292, "lr": 6.399517456398567e-06, "epoch": 3.8075949367088606, "percentage": 76.42, "elapsed_time": "1 day, 2:45:43", "remaining_time": "8:15:23"}
941
+ {"current_steps": 941, "total_steps": 1230, "loss": 0.3031, "lr": 6.357957402727164e-06, "epoch": 3.811645569620253, "percentage": 76.5, "elapsed_time": "1 day, 2:47:31", "remaining_time": "8:13:42"}
942
+ {"current_steps": 942, "total_steps": 1230, "loss": 0.301, "lr": 6.316507220191395e-06, "epoch": 3.8156962025316457, "percentage": 76.59, "elapsed_time": "1 day, 2:49:18", "remaining_time": "8:12:00"}
943
+ {"current_steps": 943, "total_steps": 1230, "loss": 0.2988, "lr": 6.275167242625331e-06, "epoch": 3.8197468354430377, "percentage": 76.67, "elapsed_time": "1 day, 2:50:54", "remaining_time": "8:10:16"}
944
+ {"current_steps": 944, "total_steps": 1230, "loss": 0.2716, "lr": 6.233937802975471e-06, "epoch": 3.8237974683544302, "percentage": 76.75, "elapsed_time": "1 day, 2:52:30", "remaining_time": "8:08:32"}
945
+ {"current_steps": 945, "total_steps": 1230, "loss": 0.2994, "lr": 6.192819233298046e-06, "epoch": 3.8278481012658228, "percentage": 76.83, "elapsed_time": "1 day, 2:54:13", "remaining_time": "8:06:49"}
946
+ {"current_steps": 946, "total_steps": 1230, "loss": 0.3066, "lr": 6.151811864756383e-06, "epoch": 3.8318987341772153, "percentage": 76.91, "elapsed_time": "1 day, 2:55:59", "remaining_time": "8:05:08"}
947
+ {"current_steps": 947, "total_steps": 1230, "loss": 0.297, "lr": 6.1109160276181655e-06, "epoch": 3.835949367088608, "percentage": 76.99, "elapsed_time": "1 day, 2:57:30", "remaining_time": "8:03:22"}
948
+ {"current_steps": 948, "total_steps": 1230, "loss": 0.284, "lr": 6.070132051252868e-06, "epoch": 3.84, "percentage": 77.07, "elapsed_time": "1 day, 2:59:15", "remaining_time": "8:01:40"}
949
+ {"current_steps": 949, "total_steps": 1230, "loss": 0.2879, "lr": 6.0294602641290034e-06, "epoch": 3.8440506329113924, "percentage": 77.15, "elapsed_time": "1 day, 3:00:52", "remaining_time": "7:59:56"}
950
+ {"current_steps": 950, "total_steps": 1230, "loss": 0.2872, "lr": 5.988900993811575e-06, "epoch": 3.848101265822785, "percentage": 77.24, "elapsed_time": "1 day, 3:02:25", "remaining_time": "7:58:11"}
951
+ {"current_steps": 951, "total_steps": 1230, "loss": 0.2993, "lr": 5.948454566959363e-06, "epoch": 3.852151898734177, "percentage": 77.32, "elapsed_time": "1 day, 3:04:17", "remaining_time": "7:56:31"}
952
+ {"current_steps": 952, "total_steps": 1230, "loss": 0.2911, "lr": 5.908121309322328e-06, "epoch": 3.8562025316455695, "percentage": 77.4, "elapsed_time": "1 day, 3:06:14", "remaining_time": "7:54:53"}
953
+ {"current_steps": 953, "total_steps": 1230, "loss": 0.3034, "lr": 5.867901545738976e-06, "epoch": 3.860253164556962, "percentage": 77.48, "elapsed_time": "1 day, 3:07:57", "remaining_time": "7:53:10"}
954
+ {"current_steps": 954, "total_steps": 1230, "loss": 0.276, "lr": 5.827795600133774e-06, "epoch": 3.8643037974683545, "percentage": 77.56, "elapsed_time": "1 day, 3:09:22", "remaining_time": "7:51:23"}
955
+ {"current_steps": 955, "total_steps": 1230, "loss": 0.2859, "lr": 5.787803795514466e-06, "epoch": 3.868354430379747, "percentage": 77.64, "elapsed_time": "1 day, 3:10:52", "remaining_time": "7:49:37"}
956
+ {"current_steps": 956, "total_steps": 1230, "loss": 0.3253, "lr": 5.747926453969576e-06, "epoch": 3.872405063291139, "percentage": 77.72, "elapsed_time": "1 day, 3:12:31", "remaining_time": "7:47:54"}
957
+ {"current_steps": 957, "total_steps": 1230, "loss": 0.2816, "lr": 5.708163896665708e-06, "epoch": 3.8764556962025316, "percentage": 77.8, "elapsed_time": "1 day, 3:14:09", "remaining_time": "7:46:10"}
958
+ {"current_steps": 958, "total_steps": 1230, "loss": 0.295, "lr": 5.668516443845047e-06, "epoch": 3.880506329113924, "percentage": 77.89, "elapsed_time": "1 day, 3:16:03", "remaining_time": "7:44:30"}
959
+ {"current_steps": 959, "total_steps": 1230, "loss": 0.2967, "lr": 5.6289844148227225e-06, "epoch": 3.884556962025316, "percentage": 77.97, "elapsed_time": "1 day, 3:17:35", "remaining_time": "7:42:45"}
960
+ {"current_steps": 960, "total_steps": 1230, "loss": 0.2901, "lr": 5.5895681279842615e-06, "epoch": 3.8886075949367087, "percentage": 78.05, "elapsed_time": "1 day, 3:19:16", "remaining_time": "7:41:02"}
961
+ {"current_steps": 961, "total_steps": 1230, "loss": 0.2692, "lr": 5.550267900783019e-06, "epoch": 3.8926582278481012, "percentage": 78.13, "elapsed_time": "1 day, 3:20:47", "remaining_time": "7:39:17"}
962
+ {"current_steps": 962, "total_steps": 1230, "loss": 0.3041, "lr": 5.511084049737623e-06, "epoch": 3.8967088607594937, "percentage": 78.21, "elapsed_time": "1 day, 3:22:29", "remaining_time": "7:37:34"}
963
+ {"current_steps": 963, "total_steps": 1230, "loss": 0.2858, "lr": 5.4720168904294215e-06, "epoch": 3.9007594936708863, "percentage": 78.29, "elapsed_time": "1 day, 3:24:09", "remaining_time": "7:35:51"}
964
+ {"current_steps": 964, "total_steps": 1230, "loss": 0.2928, "lr": 5.433066737499948e-06, "epoch": 3.9048101265822783, "percentage": 78.37, "elapsed_time": "1 day, 3:25:47", "remaining_time": "7:34:07"}
965
+ {"current_steps": 965, "total_steps": 1230, "loss": 0.2921, "lr": 5.394233904648376e-06, "epoch": 3.908860759493671, "percentage": 78.46, "elapsed_time": "1 day, 3:27:42", "remaining_time": "7:32:28"}
966
+ {"current_steps": 966, "total_steps": 1230, "loss": 0.295, "lr": 5.355518704628997e-06, "epoch": 3.9129113924050634, "percentage": 78.54, "elapsed_time": "1 day, 3:29:42", "remaining_time": "7:30:51"}
967
+ {"current_steps": 967, "total_steps": 1230, "loss": 0.3041, "lr": 5.316921449248731e-06, "epoch": 3.9169620253164554, "percentage": 78.62, "elapsed_time": "1 day, 3:31:27", "remaining_time": "7:29:09"}
968
+ {"current_steps": 968, "total_steps": 1230, "loss": 0.3088, "lr": 5.278442449364538e-06, "epoch": 3.921012658227848, "percentage": 78.7, "elapsed_time": "1 day, 3:33:12", "remaining_time": "7:27:27"}
969
+ {"current_steps": 969, "total_steps": 1230, "loss": 0.3103, "lr": 5.240082014881016e-06, "epoch": 3.9250632911392405, "percentage": 78.78, "elapsed_time": "1 day, 3:35:14", "remaining_time": "7:25:50"}
970
+ {"current_steps": 970, "total_steps": 1230, "loss": 0.288, "lr": 5.201840454747822e-06, "epoch": 3.929113924050633, "percentage": 78.86, "elapsed_time": "1 day, 3:36:37", "remaining_time": "7:24:02"}
971
+ {"current_steps": 971, "total_steps": 1230, "loss": 0.2808, "lr": 5.163718076957223e-06, "epoch": 3.9331645569620255, "percentage": 78.94, "elapsed_time": "1 day, 3:38:09", "remaining_time": "7:22:17"}
972
+ {"current_steps": 972, "total_steps": 1230, "loss": 0.2969, "lr": 5.125715188541609e-06, "epoch": 3.9372151898734176, "percentage": 79.02, "elapsed_time": "1 day, 3:40:04", "remaining_time": "7:20:38"}
973
+ {"current_steps": 973, "total_steps": 1230, "loss": 0.314, "lr": 5.087832095571021e-06, "epoch": 3.94126582278481, "percentage": 79.11, "elapsed_time": "1 day, 3:41:56", "remaining_time": "7:18:58"}
974
+ {"current_steps": 974, "total_steps": 1230, "loss": 0.3061, "lr": 5.0500691031506766e-06, "epoch": 3.9453164556962026, "percentage": 79.19, "elapsed_time": "1 day, 3:43:54", "remaining_time": "7:17:19"}
975
+ {"current_steps": 975, "total_steps": 1230, "loss": 0.2756, "lr": 5.01242651541854e-06, "epoch": 3.9493670886075947, "percentage": 79.27, "elapsed_time": "1 day, 3:45:34", "remaining_time": "7:15:36"}
976
+ {"current_steps": 976, "total_steps": 1230, "loss": 0.3076, "lr": 4.974904635542815e-06, "epoch": 3.953417721518987, "percentage": 79.35, "elapsed_time": "1 day, 3:47:24", "remaining_time": "7:13:56"}
977
+ {"current_steps": 977, "total_steps": 1230, "loss": 0.2779, "lr": 4.937503765719582e-06, "epoch": 3.9574683544303797, "percentage": 79.43, "elapsed_time": "1 day, 3:49:00", "remaining_time": "7:12:11"}
978
+ {"current_steps": 978, "total_steps": 1230, "loss": 0.3014, "lr": 4.900224207170299e-06, "epoch": 3.961518987341772, "percentage": 79.51, "elapsed_time": "1 day, 3:50:51", "remaining_time": "7:10:31"}
979
+ {"current_steps": 979, "total_steps": 1230, "loss": 0.2875, "lr": 4.8630662601394065e-06, "epoch": 3.9655696202531647, "percentage": 79.59, "elapsed_time": "1 day, 3:52:32", "remaining_time": "7:08:48"}
980
+ {"current_steps": 980, "total_steps": 1230, "loss": 0.2837, "lr": 4.8260302238918995e-06, "epoch": 3.969620253164557, "percentage": 79.67, "elapsed_time": "1 day, 3:54:07", "remaining_time": "7:07:04"}
981
+ {"current_steps": 981, "total_steps": 1230, "loss": 0.2956, "lr": 4.789116396710924e-06, "epoch": 3.9736708860759493, "percentage": 79.76, "elapsed_time": "1 day, 3:55:43", "remaining_time": "7:05:20"}
982
+ {"current_steps": 982, "total_steps": 1230, "loss": 0.2942, "lr": 4.752325075895368e-06, "epoch": 3.977721518987342, "percentage": 79.84, "elapsed_time": "1 day, 3:57:28", "remaining_time": "7:03:38"}
983
+ {"current_steps": 983, "total_steps": 1230, "loss": 0.2762, "lr": 4.715656557757473e-06, "epoch": 3.981772151898734, "percentage": 79.92, "elapsed_time": "1 day, 3:59:08", "remaining_time": "7:01:55"}
984
+ {"current_steps": 984, "total_steps": 1230, "loss": 0.3, "lr": 4.679111137620442e-06, "epoch": 3.9858227848101264, "percentage": 80.0, "elapsed_time": "1 day, 4:00:55", "remaining_time": "7:00:13"}
985
+ {"current_steps": 985, "total_steps": 1230, "loss": 0.2968, "lr": 4.6426891098160585e-06, "epoch": 3.989873417721519, "percentage": 80.08, "elapsed_time": "1 day, 4:02:30", "remaining_time": "6:58:29"}
986
+ {"current_steps": 986, "total_steps": 1230, "loss": 0.3046, "lr": 4.6063907676823474e-06, "epoch": 3.9939240506329114, "percentage": 80.16, "elapsed_time": "1 day, 4:04:16", "remaining_time": "6:56:47"}
987
+ {"current_steps": 987, "total_steps": 1230, "loss": 0.336, "lr": 4.570216403561141e-06, "epoch": 3.997974683544304, "percentage": 80.24, "elapsed_time": "1 day, 4:05:52", "remaining_time": "6:55:03"}
988
+ {"current_steps": 988, "total_steps": 1230, "loss": 0.2641, "lr": 4.534166308795815e-06, "epoch": 4.002025316455696, "percentage": 80.33, "elapsed_time": "1 day, 4:08:48", "remaining_time": "6:53:39"}