gsmyrnis commited on
Commit
3a87dbd
·
verified ·
1 Parent(s): 5c86b26

Training in progress, epoch 5

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:167eddde8e328c0c985ba86a9ea8dfb42e2000161dd3cc6d0b81afc5ccbc5c60
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:461417812296ba3498ffc22735c52f07b476f3714d83dcae51d7e9017dc3e831
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b02e9bf9ee646b742c2299df4a43d2f1b5e0aeb7cd4fb8e53813bbb1f02445a3
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2826b1e963ca5f0601b1fa1e74d70fee5385b90d0b31c07c167b69315e110e4c
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9e5301d4077952da1b276a1feaf1b506f95f4398f32a05a2a7887933d6f40fae
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3512cec777a2ade732ee807892e8203505d4b85bdec6adb06fb39f0ed7d3dd5c
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:76ce4d0495143ab4ca739eb80fee1ca7781bbb8a463b31b98687cf5317c3db01
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:40ffb3a0df4a2baf7988afe09d62e1de5d278306d1e3e5a1c8479c258ab11165
3
  size 1089994880
trainer_log.jsonl CHANGED
@@ -747,3 +747,490 @@
747
  {"current_steps": 747, "total_steps": 1235, "loss": 0.3223, "lr": 1.620572014799777e-05, "epoch": 3.0242914979757085, "percentage": 60.49, "elapsed_time": "4:09:09", "remaining_time": "2:42:46"}
748
  {"current_steps": 748, "total_steps": 1235, "loss": 0.3214, "lr": 1.6150208128905857e-05, "epoch": 3.02834008097166, "percentage": 60.57, "elapsed_time": "4:09:25", "remaining_time": "2:42:23"}
749
  {"current_steps": 749, "total_steps": 1235, "loss": 0.3165, "lr": 1.6094726892647147e-05, "epoch": 3.032388663967611, "percentage": 60.65, "elapsed_time": "4:09:45", "remaining_time": "2:42:03"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
747
  {"current_steps": 747, "total_steps": 1235, "loss": 0.3223, "lr": 1.620572014799777e-05, "epoch": 3.0242914979757085, "percentage": 60.49, "elapsed_time": "4:09:09", "remaining_time": "2:42:46"}
748
  {"current_steps": 748, "total_steps": 1235, "loss": 0.3214, "lr": 1.6150208128905857e-05, "epoch": 3.02834008097166, "percentage": 60.57, "elapsed_time": "4:09:25", "remaining_time": "2:42:23"}
749
  {"current_steps": 749, "total_steps": 1235, "loss": 0.3165, "lr": 1.6094726892647147e-05, "epoch": 3.032388663967611, "percentage": 60.65, "elapsed_time": "4:09:45", "remaining_time": "2:42:03"}
750
+ {"current_steps": 750, "total_steps": 1235, "loss": 0.3264, "lr": 1.6039276882848135e-05, "epoch": 3.0364372469635628, "percentage": 60.73, "elapsed_time": "4:10:05", "remaining_time": "2:41:43"}
751
+ {"current_steps": 751, "total_steps": 1235, "loss": 0.3294, "lr": 1.5983858542885635e-05, "epoch": 3.0404858299595143, "percentage": 60.81, "elapsed_time": "4:10:23", "remaining_time": "2:41:22"}
752
+ {"current_steps": 752, "total_steps": 1235, "loss": 0.3289, "lr": 1.5928472315883203e-05, "epoch": 3.0445344129554655, "percentage": 60.89, "elapsed_time": "4:10:45", "remaining_time": "2:41:03"}
753
+ {"current_steps": 753, "total_steps": 1235, "loss": 0.3143, "lr": 1.5873118644707633e-05, "epoch": 3.048582995951417, "percentage": 60.97, "elapsed_time": "4:11:02", "remaining_time": "2:40:41"}
754
+ {"current_steps": 754, "total_steps": 1235, "loss": 0.3314, "lr": 1.5817797971965413e-05, "epoch": 3.0526315789473686, "percentage": 61.05, "elapsed_time": "4:11:23", "remaining_time": "2:40:22"}
755
+ {"current_steps": 755, "total_steps": 1235, "loss": 0.3312, "lr": 1.576251073999917e-05, "epoch": 3.0566801619433197, "percentage": 61.13, "elapsed_time": "4:11:42", "remaining_time": "2:40:01"}
756
+ {"current_steps": 756, "total_steps": 1235, "loss": 0.3272, "lr": 1.5707257390884126e-05, "epoch": 3.0607287449392713, "percentage": 61.21, "elapsed_time": "4:11:58", "remaining_time": "2:39:39"}
757
+ {"current_steps": 757, "total_steps": 1235, "loss": 0.3272, "lr": 1.5652038366424595e-05, "epoch": 3.064777327935223, "percentage": 61.3, "elapsed_time": "4:12:17", "remaining_time": "2:39:18"}
758
+ {"current_steps": 758, "total_steps": 1235, "loss": 0.3304, "lr": 1.5596854108150424e-05, "epoch": 3.068825910931174, "percentage": 61.38, "elapsed_time": "4:12:34", "remaining_time": "2:38:56"}
759
+ {"current_steps": 759, "total_steps": 1235, "loss": 0.3383, "lr": 1.5541705057313476e-05, "epoch": 3.0728744939271255, "percentage": 61.46, "elapsed_time": "4:12:54", "remaining_time": "2:38:36"}
760
+ {"current_steps": 760, "total_steps": 1235, "loss": 0.339, "lr": 1.5486591654884086e-05, "epoch": 3.076923076923077, "percentage": 61.54, "elapsed_time": "4:13:13", "remaining_time": "2:38:15"}
761
+ {"current_steps": 761, "total_steps": 1235, "loss": 0.3253, "lr": 1.543151434154755e-05, "epoch": 3.080971659919028, "percentage": 61.62, "elapsed_time": "4:13:32", "remaining_time": "2:37:55"}
762
+ {"current_steps": 762, "total_steps": 1235, "loss": 0.3149, "lr": 1.5376473557700615e-05, "epoch": 3.08502024291498, "percentage": 61.7, "elapsed_time": "4:13:48", "remaining_time": "2:37:32"}
763
+ {"current_steps": 763, "total_steps": 1235, "loss": 0.3494, "lr": 1.5321469743447893e-05, "epoch": 3.0890688259109313, "percentage": 61.78, "elapsed_time": "4:14:09", "remaining_time": "2:37:13"}
764
+ {"current_steps": 764, "total_steps": 1235, "loss": 0.3377, "lr": 1.5266503338598434e-05, "epoch": 3.0931174089068825, "percentage": 61.86, "elapsed_time": "4:14:29", "remaining_time": "2:36:53"}
765
+ {"current_steps": 765, "total_steps": 1235, "loss": 0.3353, "lr": 1.5211574782662149e-05, "epoch": 3.097165991902834, "percentage": 61.94, "elapsed_time": "4:14:52", "remaining_time": "2:36:35"}
766
+ {"current_steps": 766, "total_steps": 1235, "loss": 0.334, "lr": 1.5156684514846307e-05, "epoch": 3.1012145748987856, "percentage": 62.02, "elapsed_time": "4:15:12", "remaining_time": "2:36:15"}
767
+ {"current_steps": 767, "total_steps": 1235, "loss": 0.3271, "lr": 1.5101832974052012e-05, "epoch": 3.1052631578947367, "percentage": 62.11, "elapsed_time": "4:15:35", "remaining_time": "2:35:57"}
768
+ {"current_steps": 768, "total_steps": 1235, "loss": 0.333, "lr": 1.5047020598870737e-05, "epoch": 3.1093117408906883, "percentage": 62.19, "elapsed_time": "4:15:53", "remaining_time": "2:35:35"}
769
+ {"current_steps": 769, "total_steps": 1235, "loss": 0.341, "lr": 1.4992247827580778e-05, "epoch": 3.11336032388664, "percentage": 62.27, "elapsed_time": "4:16:11", "remaining_time": "2:35:14"}
770
+ {"current_steps": 770, "total_steps": 1235, "loss": 0.3262, "lr": 1.493751509814374e-05, "epoch": 3.117408906882591, "percentage": 62.35, "elapsed_time": "4:16:31", "remaining_time": "2:34:54"}
771
+ {"current_steps": 771, "total_steps": 1235, "loss": 0.3342, "lr": 1.4882822848201073e-05, "epoch": 3.1214574898785425, "percentage": 62.43, "elapsed_time": "4:16:50", "remaining_time": "2:34:34"}
772
+ {"current_steps": 772, "total_steps": 1235, "loss": 0.333, "lr": 1.4828171515070553e-05, "epoch": 3.125506072874494, "percentage": 62.51, "elapsed_time": "4:17:09", "remaining_time": "2:34:13"}
773
+ {"current_steps": 773, "total_steps": 1235, "loss": 0.3126, "lr": 1.4773561535742793e-05, "epoch": 3.1295546558704452, "percentage": 62.59, "elapsed_time": "4:17:26", "remaining_time": "2:33:52"}
774
+ {"current_steps": 774, "total_steps": 1235, "loss": 0.3279, "lr": 1.4718993346877715e-05, "epoch": 3.133603238866397, "percentage": 62.67, "elapsed_time": "4:17:47", "remaining_time": "2:33:32"}
775
+ {"current_steps": 775, "total_steps": 1235, "loss": 0.3364, "lr": 1.466446738480111e-05, "epoch": 3.1376518218623484, "percentage": 62.75, "elapsed_time": "4:18:09", "remaining_time": "2:33:13"}
776
+ {"current_steps": 776, "total_steps": 1235, "loss": 0.3238, "lr": 1.460998408550112e-05, "epoch": 3.1417004048582995, "percentage": 62.83, "elapsed_time": "4:18:29", "remaining_time": "2:32:53"}
777
+ {"current_steps": 777, "total_steps": 1235, "loss": 0.3357, "lr": 1.4555543884624751e-05, "epoch": 3.145748987854251, "percentage": 62.91, "elapsed_time": "4:18:47", "remaining_time": "2:32:32"}
778
+ {"current_steps": 778, "total_steps": 1235, "loss": 0.3163, "lr": 1.4501147217474402e-05, "epoch": 3.1497975708502026, "percentage": 63.0, "elapsed_time": "4:19:04", "remaining_time": "2:32:11"}
779
+ {"current_steps": 779, "total_steps": 1235, "loss": 0.3372, "lr": 1.444679451900437e-05, "epoch": 3.1538461538461537, "percentage": 63.08, "elapsed_time": "4:19:24", "remaining_time": "2:31:51"}
780
+ {"current_steps": 780, "total_steps": 1235, "loss": 0.3298, "lr": 1.4392486223817397e-05, "epoch": 3.1578947368421053, "percentage": 63.16, "elapsed_time": "4:19:46", "remaining_time": "2:31:32"}
781
+ {"current_steps": 781, "total_steps": 1235, "loss": 0.3338, "lr": 1.4338222766161143e-05, "epoch": 3.161943319838057, "percentage": 63.24, "elapsed_time": "4:20:05", "remaining_time": "2:31:11"}
782
+ {"current_steps": 782, "total_steps": 1235, "loss": 0.3259, "lr": 1.4284004579924777e-05, "epoch": 3.165991902834008, "percentage": 63.32, "elapsed_time": "4:20:23", "remaining_time": "2:30:50"}
783
+ {"current_steps": 783, "total_steps": 1235, "loss": 0.3505, "lr": 1.4229832098635479e-05, "epoch": 3.1700404858299596, "percentage": 63.4, "elapsed_time": "4:20:44", "remaining_time": "2:30:31"}
784
+ {"current_steps": 784, "total_steps": 1235, "loss": 0.3337, "lr": 1.4175705755454963e-05, "epoch": 3.174089068825911, "percentage": 63.48, "elapsed_time": "4:21:03", "remaining_time": "2:30:10"}
785
+ {"current_steps": 785, "total_steps": 1235, "loss": 0.3255, "lr": 1.412162598317602e-05, "epoch": 3.1781376518218623, "percentage": 63.56, "elapsed_time": "4:21:23", "remaining_time": "2:29:50"}
786
+ {"current_steps": 786, "total_steps": 1235, "loss": 0.3371, "lr": 1.406759321421907e-05, "epoch": 3.182186234817814, "percentage": 63.64, "elapsed_time": "4:21:43", "remaining_time": "2:29:30"}
787
+ {"current_steps": 787, "total_steps": 1235, "loss": 0.3316, "lr": 1.401360788062871e-05, "epoch": 3.1862348178137654, "percentage": 63.72, "elapsed_time": "4:22:02", "remaining_time": "2:29:10"}
788
+ {"current_steps": 788, "total_steps": 1235, "loss": 0.3198, "lr": 1.3959670414070204e-05, "epoch": 3.1902834008097165, "percentage": 63.81, "elapsed_time": "4:22:23", "remaining_time": "2:28:50"}
789
+ {"current_steps": 789, "total_steps": 1235, "loss": 0.3267, "lr": 1.3905781245826108e-05, "epoch": 3.194331983805668, "percentage": 63.89, "elapsed_time": "4:22:42", "remaining_time": "2:28:29"}
790
+ {"current_steps": 790, "total_steps": 1235, "loss": 0.3412, "lr": 1.3851940806792778e-05, "epoch": 3.1983805668016196, "percentage": 63.97, "elapsed_time": "4:23:03", "remaining_time": "2:28:10"}
791
+ {"current_steps": 791, "total_steps": 1235, "loss": 0.3409, "lr": 1.379814952747693e-05, "epoch": 3.2024291497975708, "percentage": 64.05, "elapsed_time": "4:23:25", "remaining_time": "2:27:51"}
792
+ {"current_steps": 792, "total_steps": 1235, "loss": 0.3286, "lr": 1.3744407837992193e-05, "epoch": 3.2064777327935223, "percentage": 64.13, "elapsed_time": "4:23:44", "remaining_time": "2:27:31"}
793
+ {"current_steps": 793, "total_steps": 1235, "loss": 0.326, "lr": 1.3690716168055692e-05, "epoch": 3.2105263157894735, "percentage": 64.21, "elapsed_time": "4:24:05", "remaining_time": "2:27:12"}
794
+ {"current_steps": 794, "total_steps": 1235, "loss": 0.3337, "lr": 1.363707494698459e-05, "epoch": 3.214574898785425, "percentage": 64.29, "elapsed_time": "4:24:25", "remaining_time": "2:26:51"}
795
+ {"current_steps": 795, "total_steps": 1235, "loss": 0.3289, "lr": 1.358348460369265e-05, "epoch": 3.2186234817813766, "percentage": 64.37, "elapsed_time": "4:24:44", "remaining_time": "2:26:31"}
796
+ {"current_steps": 796, "total_steps": 1235, "loss": 0.3304, "lr": 1.352994556668684e-05, "epoch": 3.2226720647773277, "percentage": 64.45, "elapsed_time": "4:25:03", "remaining_time": "2:26:10"}
797
+ {"current_steps": 797, "total_steps": 1235, "loss": 0.3305, "lr": 1.3476458264063865e-05, "epoch": 3.2267206477732793, "percentage": 64.53, "elapsed_time": "4:25:23", "remaining_time": "2:25:50"}
798
+ {"current_steps": 798, "total_steps": 1235, "loss": 0.3265, "lr": 1.342302312350678e-05, "epoch": 3.230769230769231, "percentage": 64.62, "elapsed_time": "4:25:42", "remaining_time": "2:25:30"}
799
+ {"current_steps": 799, "total_steps": 1235, "loss": 0.334, "lr": 1.3369640572281537e-05, "epoch": 3.234817813765182, "percentage": 64.7, "elapsed_time": "4:25:59", "remaining_time": "2:25:08"}
800
+ {"current_steps": 800, "total_steps": 1235, "loss": 0.3373, "lr": 1.3316311037233596e-05, "epoch": 3.2388663967611335, "percentage": 64.78, "elapsed_time": "4:26:18", "remaining_time": "2:24:48"}
801
+ {"current_steps": 801, "total_steps": 1235, "loss": 0.332, "lr": 1.326303494478451e-05, "epoch": 3.242914979757085, "percentage": 64.86, "elapsed_time": "4:26:34", "remaining_time": "2:24:26"}
802
+ {"current_steps": 802, "total_steps": 1235, "loss": 0.3414, "lr": 1.3209812720928472e-05, "epoch": 3.246963562753036, "percentage": 64.94, "elapsed_time": "4:26:56", "remaining_time": "2:24:07"}
803
+ {"current_steps": 803, "total_steps": 1235, "loss": 0.328, "lr": 1.315664479122898e-05, "epoch": 3.251012145748988, "percentage": 65.02, "elapsed_time": "4:27:13", "remaining_time": "2:23:45"}
804
+ {"current_steps": 804, "total_steps": 1235, "loss": 0.3347, "lr": 1.3103531580815378e-05, "epoch": 3.2550607287449393, "percentage": 65.1, "elapsed_time": "4:27:35", "remaining_time": "2:23:26"}
805
+ {"current_steps": 805, "total_steps": 1235, "loss": 0.3272, "lr": 1.3050473514379488e-05, "epoch": 3.2591093117408905, "percentage": 65.18, "elapsed_time": "4:27:56", "remaining_time": "2:23:07"}
806
+ {"current_steps": 806, "total_steps": 1235, "loss": 0.3298, "lr": 1.2997471016172188e-05, "epoch": 3.263157894736842, "percentage": 65.26, "elapsed_time": "4:28:11", "remaining_time": "2:22:44"}
807
+ {"current_steps": 807, "total_steps": 1235, "loss": 0.3265, "lr": 1.2944524510000042e-05, "epoch": 3.2672064777327936, "percentage": 65.34, "elapsed_time": "4:28:30", "remaining_time": "2:22:24"}
808
+ {"current_steps": 808, "total_steps": 1235, "loss": 0.3436, "lr": 1.2891634419221908e-05, "epoch": 3.2712550607287447, "percentage": 65.43, "elapsed_time": "4:28:50", "remaining_time": "2:22:04"}
809
+ {"current_steps": 809, "total_steps": 1235, "loss": 0.3401, "lr": 1.2838801166745545e-05, "epoch": 3.2753036437246963, "percentage": 65.51, "elapsed_time": "4:29:11", "remaining_time": "2:21:44"}
810
+ {"current_steps": 810, "total_steps": 1235, "loss": 0.3241, "lr": 1.2786025175024216e-05, "epoch": 3.279352226720648, "percentage": 65.59, "elapsed_time": "4:29:33", "remaining_time": "2:21:26"}
811
+ {"current_steps": 811, "total_steps": 1235, "loss": 0.3325, "lr": 1.2733306866053357e-05, "epoch": 3.283400809716599, "percentage": 65.67, "elapsed_time": "4:29:55", "remaining_time": "2:21:06"}
812
+ {"current_steps": 812, "total_steps": 1235, "loss": 0.3297, "lr": 1.2680646661367163e-05, "epoch": 3.2874493927125505, "percentage": 65.75, "elapsed_time": "4:30:12", "remaining_time": "2:20:45"}
813
+ {"current_steps": 813, "total_steps": 1235, "loss": 0.3409, "lr": 1.2628044982035219e-05, "epoch": 3.291497975708502, "percentage": 65.83, "elapsed_time": "4:30:33", "remaining_time": "2:20:25"}
814
+ {"current_steps": 814, "total_steps": 1235, "loss": 0.3371, "lr": 1.2575502248659155e-05, "epoch": 3.2955465587044532, "percentage": 65.91, "elapsed_time": "4:30:49", "remaining_time": "2:20:04"}
815
+ {"current_steps": 815, "total_steps": 1235, "loss": 0.3277, "lr": 1.2523018881369269e-05, "epoch": 3.299595141700405, "percentage": 65.99, "elapsed_time": "4:31:09", "remaining_time": "2:19:44"}
816
+ {"current_steps": 816, "total_steps": 1235, "loss": 0.3289, "lr": 1.2470595299821176e-05, "epoch": 3.3036437246963564, "percentage": 66.07, "elapsed_time": "4:31:27", "remaining_time": "2:19:23"}
817
+ {"current_steps": 817, "total_steps": 1235, "loss": 0.3268, "lr": 1.2418231923192416e-05, "epoch": 3.3076923076923075, "percentage": 66.15, "elapsed_time": "4:31:47", "remaining_time": "2:19:03"}
818
+ {"current_steps": 818, "total_steps": 1235, "loss": 0.3369, "lr": 1.2365929170179165e-05, "epoch": 3.311740890688259, "percentage": 66.23, "elapsed_time": "4:32:08", "remaining_time": "2:18:43"}
819
+ {"current_steps": 819, "total_steps": 1235, "loss": 0.3259, "lr": 1.2313687458992848e-05, "epoch": 3.3157894736842106, "percentage": 66.32, "elapsed_time": "4:32:28", "remaining_time": "2:18:24"}
820
+ {"current_steps": 820, "total_steps": 1235, "loss": 0.3298, "lr": 1.2261507207356785e-05, "epoch": 3.3198380566801617, "percentage": 66.4, "elapsed_time": "4:32:49", "remaining_time": "2:18:04"}
821
+ {"current_steps": 821, "total_steps": 1235, "loss": 0.3351, "lr": 1.220938883250288e-05, "epoch": 3.3238866396761133, "percentage": 66.48, "elapsed_time": "4:33:08", "remaining_time": "2:17:43"}
822
+ {"current_steps": 822, "total_steps": 1235, "loss": 0.3241, "lr": 1.215733275116827e-05, "epoch": 3.327935222672065, "percentage": 66.56, "elapsed_time": "4:33:27", "remaining_time": "2:17:23"}
823
+ {"current_steps": 823, "total_steps": 1235, "loss": 0.3286, "lr": 1.2105339379592005e-05, "epoch": 3.331983805668016, "percentage": 66.64, "elapsed_time": "4:33:45", "remaining_time": "2:17:02"}
824
+ {"current_steps": 824, "total_steps": 1235, "loss": 0.3222, "lr": 1.2053409133511681e-05, "epoch": 3.3360323886639676, "percentage": 66.72, "elapsed_time": "4:34:03", "remaining_time": "2:16:41"}
825
+ {"current_steps": 825, "total_steps": 1235, "loss": 0.3274, "lr": 1.2001542428160173e-05, "epoch": 3.340080971659919, "percentage": 66.8, "elapsed_time": "4:34:18", "remaining_time": "2:16:19"}
826
+ {"current_steps": 826, "total_steps": 1235, "loss": 0.3294, "lr": 1.1949739678262278e-05, "epoch": 3.3441295546558703, "percentage": 66.88, "elapsed_time": "4:34:38", "remaining_time": "2:15:59"}
827
+ {"current_steps": 827, "total_steps": 1235, "loss": 0.3243, "lr": 1.189800129803139e-05, "epoch": 3.348178137651822, "percentage": 66.96, "elapsed_time": "4:34:56", "remaining_time": "2:15:38"}
828
+ {"current_steps": 828, "total_steps": 1235, "loss": 0.3412, "lr": 1.1846327701166228e-05, "epoch": 3.3522267206477734, "percentage": 67.04, "elapsed_time": "4:35:17", "remaining_time": "2:15:19"}
829
+ {"current_steps": 829, "total_steps": 1235, "loss": 0.3324, "lr": 1.1794719300847493e-05, "epoch": 3.3562753036437245, "percentage": 67.13, "elapsed_time": "4:35:40", "remaining_time": "2:15:00"}
830
+ {"current_steps": 830, "total_steps": 1235, "loss": 0.3322, "lr": 1.1743176509734582e-05, "epoch": 3.360323886639676, "percentage": 67.21, "elapsed_time": "4:35:59", "remaining_time": "2:14:40"}
831
+ {"current_steps": 831, "total_steps": 1235, "loss": 0.332, "lr": 1.1691699739962275e-05, "epoch": 3.3643724696356276, "percentage": 67.29, "elapsed_time": "4:36:18", "remaining_time": "2:14:19"}
832
+ {"current_steps": 832, "total_steps": 1235, "loss": 0.3274, "lr": 1.1640289403137456e-05, "epoch": 3.3684210526315788, "percentage": 67.37, "elapsed_time": "4:36:37", "remaining_time": "2:13:59"}
833
+ {"current_steps": 833, "total_steps": 1235, "loss": 0.3246, "lr": 1.1588945910335802e-05, "epoch": 3.3724696356275303, "percentage": 67.45, "elapsed_time": "4:36:59", "remaining_time": "2:13:40"}
834
+ {"current_steps": 834, "total_steps": 1235, "loss": 0.3332, "lr": 1.1537669672098517e-05, "epoch": 3.376518218623482, "percentage": 67.53, "elapsed_time": "4:37:16", "remaining_time": "2:13:19"}
835
+ {"current_steps": 835, "total_steps": 1235, "loss": 0.3217, "lr": 1.1486461098429036e-05, "epoch": 3.380566801619433, "percentage": 67.61, "elapsed_time": "4:37:37", "remaining_time": "2:12:59"}
836
+ {"current_steps": 836, "total_steps": 1235, "loss": 0.3308, "lr": 1.1435320598789747e-05, "epoch": 3.3846153846153846, "percentage": 67.69, "elapsed_time": "4:37:57", "remaining_time": "2:12:39"}
837
+ {"current_steps": 837, "total_steps": 1235, "loss": 0.3264, "lr": 1.1384248582098736e-05, "epoch": 3.388663967611336, "percentage": 67.77, "elapsed_time": "4:38:16", "remaining_time": "2:12:19"}
838
+ {"current_steps": 838, "total_steps": 1235, "loss": 0.3267, "lr": 1.1333245456726467e-05, "epoch": 3.3927125506072873, "percentage": 67.85, "elapsed_time": "4:38:37", "remaining_time": "2:11:59"}
839
+ {"current_steps": 839, "total_steps": 1235, "loss": 0.3242, "lr": 1.128231163049258e-05, "epoch": 3.396761133603239, "percentage": 67.94, "elapsed_time": "4:38:54", "remaining_time": "2:11:38"}
840
+ {"current_steps": 840, "total_steps": 1235, "loss": 0.3353, "lr": 1.123144751066259e-05, "epoch": 3.4008097165991904, "percentage": 68.02, "elapsed_time": "4:39:13", "remaining_time": "2:11:18"}
841
+ {"current_steps": 841, "total_steps": 1235, "loss": 0.3345, "lr": 1.1180653503944657e-05, "epoch": 3.4048582995951415, "percentage": 68.1, "elapsed_time": "4:39:34", "remaining_time": "2:10:58"}
842
+ {"current_steps": 842, "total_steps": 1235, "loss": 0.3316, "lr": 1.1129930016486287e-05, "epoch": 3.408906882591093, "percentage": 68.18, "elapsed_time": "4:39:50", "remaining_time": "2:10:36"}
843
+ {"current_steps": 843, "total_steps": 1235, "loss": 0.3448, "lr": 1.107927745387114e-05, "epoch": 3.4129554655870447, "percentage": 68.26, "elapsed_time": "4:40:11", "remaining_time": "2:10:17"}
844
+ {"current_steps": 844, "total_steps": 1235, "loss": 0.328, "lr": 1.1028696221115766e-05, "epoch": 3.417004048582996, "percentage": 68.34, "elapsed_time": "4:40:28", "remaining_time": "2:09:56"}
845
+ {"current_steps": 845, "total_steps": 1235, "loss": 0.3279, "lr": 1.0978186722666341e-05, "epoch": 3.4210526315789473, "percentage": 68.42, "elapsed_time": "4:40:49", "remaining_time": "2:09:36"}
846
+ {"current_steps": 846, "total_steps": 1235, "loss": 0.3135, "lr": 1.0927749362395475e-05, "epoch": 3.425101214574899, "percentage": 68.5, "elapsed_time": "4:41:09", "remaining_time": "2:09:16"}
847
+ {"current_steps": 847, "total_steps": 1235, "loss": 0.3272, "lr": 1.0877384543598954e-05, "epoch": 3.42914979757085, "percentage": 68.58, "elapsed_time": "4:41:26", "remaining_time": "2:08:55"}
848
+ {"current_steps": 848, "total_steps": 1235, "loss": 0.3284, "lr": 1.0827092668992529e-05, "epoch": 3.4331983805668016, "percentage": 68.66, "elapsed_time": "4:41:44", "remaining_time": "2:08:34"}
849
+ {"current_steps": 849, "total_steps": 1235, "loss": 0.3408, "lr": 1.077687414070869e-05, "epoch": 3.437246963562753, "percentage": 68.74, "elapsed_time": "4:42:04", "remaining_time": "2:08:14"}
850
+ {"current_steps": 850, "total_steps": 1235, "loss": 0.3365, "lr": 1.0726729360293451e-05, "epoch": 3.4412955465587043, "percentage": 68.83, "elapsed_time": "4:42:26", "remaining_time": "2:07:55"}
851
+ {"current_steps": 851, "total_steps": 1235, "loss": 0.3422, "lr": 1.0676658728703147e-05, "epoch": 3.445344129554656, "percentage": 68.91, "elapsed_time": "4:42:49", "remaining_time": "2:07:37"}
852
+ {"current_steps": 852, "total_steps": 1235, "loss": 0.3398, "lr": 1.0626662646301198e-05, "epoch": 3.4493927125506074, "percentage": 68.99, "elapsed_time": "4:43:11", "remaining_time": "2:07:18"}
853
+ {"current_steps": 853, "total_steps": 1235, "loss": 0.3247, "lr": 1.0576741512854958e-05, "epoch": 3.4534412955465585, "percentage": 69.07, "elapsed_time": "4:43:29", "remaining_time": "2:06:57"}
854
+ {"current_steps": 854, "total_steps": 1235, "loss": 0.3441, "lr": 1.052689572753247e-05, "epoch": 3.45748987854251, "percentage": 69.15, "elapsed_time": "4:43:51", "remaining_time": "2:06:38"}
855
+ {"current_steps": 855, "total_steps": 1235, "loss": 0.3334, "lr": 1.0477125688899328e-05, "epoch": 3.4615384615384617, "percentage": 69.23, "elapsed_time": "4:44:10", "remaining_time": "2:06:18"}
856
+ {"current_steps": 856, "total_steps": 1235, "loss": 0.3365, "lr": 1.0427431794915406e-05, "epoch": 3.465587044534413, "percentage": 69.31, "elapsed_time": "4:44:32", "remaining_time": "2:05:58"}
857
+ {"current_steps": 857, "total_steps": 1235, "loss": 0.3246, "lr": 1.0377814442931769e-05, "epoch": 3.4696356275303644, "percentage": 69.39, "elapsed_time": "4:44:49", "remaining_time": "2:05:37"}
858
+ {"current_steps": 858, "total_steps": 1235, "loss": 0.3316, "lr": 1.0328274029687439e-05, "epoch": 3.473684210526316, "percentage": 69.47, "elapsed_time": "4:45:10", "remaining_time": "2:05:18"}
859
+ {"current_steps": 859, "total_steps": 1235, "loss": 0.3365, "lr": 1.0278810951306253e-05, "epoch": 3.477732793522267, "percentage": 69.55, "elapsed_time": "4:45:30", "remaining_time": "2:04:58"}
860
+ {"current_steps": 860, "total_steps": 1235, "loss": 0.3229, "lr": 1.0229425603293647e-05, "epoch": 3.4817813765182186, "percentage": 69.64, "elapsed_time": "4:45:51", "remaining_time": "2:04:38"}
861
+ {"current_steps": 861, "total_steps": 1235, "loss": 0.3469, "lr": 1.0180118380533558e-05, "epoch": 3.48582995951417, "percentage": 69.72, "elapsed_time": "4:46:12", "remaining_time": "2:04:19"}
862
+ {"current_steps": 862, "total_steps": 1235, "loss": 0.3192, "lr": 1.0130889677285225e-05, "epoch": 3.4898785425101213, "percentage": 69.8, "elapsed_time": "4:46:31", "remaining_time": "2:03:59"}
863
+ {"current_steps": 863, "total_steps": 1235, "loss": 0.3302, "lr": 1.008173988718005e-05, "epoch": 3.493927125506073, "percentage": 69.88, "elapsed_time": "4:46:52", "remaining_time": "2:03:39"}
864
+ {"current_steps": 864, "total_steps": 1235, "loss": 0.3247, "lr": 1.0032669403218439e-05, "epoch": 3.4979757085020244, "percentage": 69.96, "elapsed_time": "4:47:12", "remaining_time": "2:03:19"}
865
+ {"current_steps": 865, "total_steps": 1235, "loss": 0.3272, "lr": 9.983678617766677e-06, "epoch": 3.5020242914979756, "percentage": 70.04, "elapsed_time": "4:47:32", "remaining_time": "2:02:59"}
866
+ {"current_steps": 866, "total_steps": 1235, "loss": 0.3298, "lr": 9.934767922553788e-06, "epoch": 3.506072874493927, "percentage": 70.12, "elapsed_time": "4:47:53", "remaining_time": "2:02:40"}
867
+ {"current_steps": 867, "total_steps": 1235, "loss": 0.335, "lr": 9.885937708668371e-06, "epoch": 3.5101214574898787, "percentage": 70.2, "elapsed_time": "4:48:14", "remaining_time": "2:02:20"}
868
+ {"current_steps": 868, "total_steps": 1235, "loss": 0.3415, "lr": 9.837188366555524e-06, "epoch": 3.51417004048583, "percentage": 70.28, "elapsed_time": "4:48:33", "remaining_time": "2:02:00"}
869
+ {"current_steps": 869, "total_steps": 1235, "loss": 0.3408, "lr": 9.788520286013691e-06, "epoch": 3.5182186234817814, "percentage": 70.36, "elapsed_time": "4:48:53", "remaining_time": "2:01:40"}
870
+ {"current_steps": 870, "total_steps": 1235, "loss": 0.3297, "lr": 9.739933856191537e-06, "epoch": 3.522267206477733, "percentage": 70.45, "elapsed_time": "4:49:14", "remaining_time": "2:01:20"}
871
+ {"current_steps": 871, "total_steps": 1235, "loss": 0.3238, "lr": 9.691429465584866e-06, "epoch": 3.526315789473684, "percentage": 70.53, "elapsed_time": "4:49:32", "remaining_time": "2:00:59"}
872
+ {"current_steps": 872, "total_steps": 1235, "loss": 0.3243, "lr": 9.643007502033492e-06, "epoch": 3.5303643724696356, "percentage": 70.61, "elapsed_time": "4:49:51", "remaining_time": "2:00:39"}
873
+ {"current_steps": 873, "total_steps": 1235, "loss": 0.3375, "lr": 9.594668352718152e-06, "epoch": 3.534412955465587, "percentage": 70.69, "elapsed_time": "4:50:10", "remaining_time": "2:00:19"}
874
+ {"current_steps": 874, "total_steps": 1235, "loss": 0.3279, "lr": 9.546412404157383e-06, "epoch": 3.5384615384615383, "percentage": 70.77, "elapsed_time": "4:50:27", "remaining_time": "1:59:58"}
875
+ {"current_steps": 875, "total_steps": 1235, "loss": 0.3253, "lr": 9.498240042204471e-06, "epoch": 3.54251012145749, "percentage": 70.85, "elapsed_time": "4:50:47", "remaining_time": "1:59:38"}
876
+ {"current_steps": 876, "total_steps": 1235, "loss": 0.3249, "lr": 9.450151652044339e-06, "epoch": 3.5465587044534415, "percentage": 70.93, "elapsed_time": "4:51:06", "remaining_time": "1:59:17"}
877
+ {"current_steps": 877, "total_steps": 1235, "loss": 0.3319, "lr": 9.402147618190472e-06, "epoch": 3.5506072874493926, "percentage": 71.01, "elapsed_time": "4:51:27", "remaining_time": "1:58:58"}
878
+ {"current_steps": 878, "total_steps": 1235, "loss": 0.3333, "lr": 9.354228324481841e-06, "epoch": 3.554655870445344, "percentage": 71.09, "elapsed_time": "4:51:47", "remaining_time": "1:58:38"}
879
+ {"current_steps": 879, "total_steps": 1235, "loss": 0.3411, "lr": 9.306394154079852e-06, "epoch": 3.5587044534412957, "percentage": 71.17, "elapsed_time": "4:52:07", "remaining_time": "1:58:18"}
880
+ {"current_steps": 880, "total_steps": 1235, "loss": 0.3352, "lr": 9.258645489465254e-06, "epoch": 3.562753036437247, "percentage": 71.26, "elapsed_time": "4:52:28", "remaining_time": "1:57:59"}
881
+ {"current_steps": 881, "total_steps": 1235, "loss": 0.3266, "lr": 9.21098271243509e-06, "epoch": 3.5668016194331984, "percentage": 71.34, "elapsed_time": "4:52:46", "remaining_time": "1:57:38"}
882
+ {"current_steps": 882, "total_steps": 1235, "loss": 0.3315, "lr": 9.163406204099659e-06, "epoch": 3.57085020242915, "percentage": 71.42, "elapsed_time": "4:53:04", "remaining_time": "1:57:17"}
883
+ {"current_steps": 883, "total_steps": 1235, "loss": 0.3368, "lr": 9.115916344879452e-06, "epoch": 3.574898785425101, "percentage": 71.5, "elapsed_time": "4:53:24", "remaining_time": "1:56:57"}
884
+ {"current_steps": 884, "total_steps": 1235, "loss": 0.3413, "lr": 9.068513514502126e-06, "epoch": 3.5789473684210527, "percentage": 71.58, "elapsed_time": "4:53:45", "remaining_time": "1:56:38"}
885
+ {"current_steps": 885, "total_steps": 1235, "loss": 0.3414, "lr": 9.021198091999439e-06, "epoch": 3.582995951417004, "percentage": 71.66, "elapsed_time": "4:54:07", "remaining_time": "1:56:19"}
886
+ {"current_steps": 886, "total_steps": 1235, "loss": 0.3308, "lr": 8.973970455704251e-06, "epoch": 3.5870445344129553, "percentage": 71.74, "elapsed_time": "4:54:31", "remaining_time": "1:56:00"}
887
+ {"current_steps": 887, "total_steps": 1235, "loss": 0.3329, "lr": 8.926830983247495e-06, "epoch": 3.591093117408907, "percentage": 71.82, "elapsed_time": "4:54:53", "remaining_time": "1:55:41"}
888
+ {"current_steps": 888, "total_steps": 1235, "loss": 0.3361, "lr": 8.879780051555116e-06, "epoch": 3.5951417004048585, "percentage": 71.9, "elapsed_time": "4:55:13", "remaining_time": "1:55:21"}
889
+ {"current_steps": 889, "total_steps": 1235, "loss": 0.3379, "lr": 8.83281803684512e-06, "epoch": 3.5991902834008096, "percentage": 71.98, "elapsed_time": "4:55:31", "remaining_time": "1:55:01"}
890
+ {"current_steps": 890, "total_steps": 1235, "loss": 0.3269, "lr": 8.785945314624532e-06, "epoch": 3.603238866396761, "percentage": 72.06, "elapsed_time": "4:55:48", "remaining_time": "1:54:40"}
891
+ {"current_steps": 891, "total_steps": 1235, "loss": 0.3368, "lr": 8.739162259686385e-06, "epoch": 3.6072874493927127, "percentage": 72.15, "elapsed_time": "4:56:11", "remaining_time": "1:54:21"}
892
+ {"current_steps": 892, "total_steps": 1235, "loss": 0.3302, "lr": 8.692469246106734e-06, "epoch": 3.611336032388664, "percentage": 72.23, "elapsed_time": "4:56:29", "remaining_time": "1:54:00"}
893
+ {"current_steps": 893, "total_steps": 1235, "loss": 0.3287, "lr": 8.645866647241677e-06, "epoch": 3.6153846153846154, "percentage": 72.31, "elapsed_time": "4:56:48", "remaining_time": "1:53:40"}
894
+ {"current_steps": 894, "total_steps": 1235, "loss": 0.3367, "lr": 8.599354835724348e-06, "epoch": 3.619433198380567, "percentage": 72.39, "elapsed_time": "4:57:07", "remaining_time": "1:53:19"}
895
+ {"current_steps": 895, "total_steps": 1235, "loss": 0.334, "lr": 8.552934183461958e-06, "epoch": 3.623481781376518, "percentage": 72.47, "elapsed_time": "4:57:27", "remaining_time": "1:52:59"}
896
+ {"current_steps": 896, "total_steps": 1235, "loss": 0.3234, "lr": 8.506605061632805e-06, "epoch": 3.6275303643724697, "percentage": 72.55, "elapsed_time": "4:57:47", "remaining_time": "1:52:40"}
897
+ {"current_steps": 897, "total_steps": 1235, "loss": 0.3248, "lr": 8.460367840683308e-06, "epoch": 3.6315789473684212, "percentage": 72.63, "elapsed_time": "4:58:05", "remaining_time": "1:52:19"}
898
+ {"current_steps": 898, "total_steps": 1235, "loss": 0.3302, "lr": 8.414222890325065e-06, "epoch": 3.6356275303643724, "percentage": 72.71, "elapsed_time": "4:58:24", "remaining_time": "1:51:59"}
899
+ {"current_steps": 899, "total_steps": 1235, "loss": 0.3415, "lr": 8.368170579531855e-06, "epoch": 3.639676113360324, "percentage": 72.79, "elapsed_time": "4:58:42", "remaining_time": "1:51:38"}
900
+ {"current_steps": 900, "total_steps": 1235, "loss": 0.3391, "lr": 8.322211276536733e-06, "epoch": 3.6437246963562755, "percentage": 72.87, "elapsed_time": "4:58:59", "remaining_time": "1:51:17"}
901
+ {"current_steps": 901, "total_steps": 1235, "loss": 0.3312, "lr": 8.27634534882907e-06, "epoch": 3.6477732793522266, "percentage": 72.96, "elapsed_time": "4:59:22", "remaining_time": "1:50:58"}
902
+ {"current_steps": 902, "total_steps": 1235, "loss": 0.3175, "lr": 8.230573163151585e-06, "epoch": 3.651821862348178, "percentage": 73.04, "elapsed_time": "4:59:40", "remaining_time": "1:50:38"}
903
+ {"current_steps": 903, "total_steps": 1235, "loss": 0.3396, "lr": 8.184895085497466e-06, "epoch": 3.6558704453441297, "percentage": 73.12, "elapsed_time": "4:59:57", "remaining_time": "1:50:17"}
904
+ {"current_steps": 904, "total_steps": 1235, "loss": 0.3387, "lr": 8.139311481107401e-06, "epoch": 3.659919028340081, "percentage": 73.2, "elapsed_time": "5:00:18", "remaining_time": "1:49:57"}
905
+ {"current_steps": 905, "total_steps": 1235, "loss": 0.3248, "lr": 8.093822714466686e-06, "epoch": 3.6639676113360324, "percentage": 73.28, "elapsed_time": "5:00:35", "remaining_time": "1:49:36"}
906
+ {"current_steps": 906, "total_steps": 1235, "loss": 0.3428, "lr": 8.048429149302271e-06, "epoch": 3.668016194331984, "percentage": 73.36, "elapsed_time": "5:00:55", "remaining_time": "1:49:16"}
907
+ {"current_steps": 907, "total_steps": 1235, "loss": 0.3348, "lr": 8.003131148579902e-06, "epoch": 3.672064777327935, "percentage": 73.44, "elapsed_time": "5:01:16", "remaining_time": "1:48:57"}
908
+ {"current_steps": 908, "total_steps": 1235, "loss": 0.3318, "lr": 7.957929074501182e-06, "epoch": 3.6761133603238867, "percentage": 73.52, "elapsed_time": "5:01:35", "remaining_time": "1:48:36"}
909
+ {"current_steps": 909, "total_steps": 1235, "loss": 0.3336, "lr": 7.912823288500695e-06, "epoch": 3.6801619433198383, "percentage": 73.6, "elapsed_time": "5:01:57", "remaining_time": "1:48:17"}
910
+ {"current_steps": 910, "total_steps": 1235, "loss": 0.3334, "lr": 7.867814151243102e-06, "epoch": 3.6842105263157894, "percentage": 73.68, "elapsed_time": "5:02:21", "remaining_time": "1:47:59"}
911
+ {"current_steps": 911, "total_steps": 1235, "loss": 0.3277, "lr": 7.822902022620267e-06, "epoch": 3.688259109311741, "percentage": 73.77, "elapsed_time": "5:02:44", "remaining_time": "1:47:40"}
912
+ {"current_steps": 912, "total_steps": 1235, "loss": 0.3297, "lr": 7.778087261748377e-06, "epoch": 3.6923076923076925, "percentage": 73.85, "elapsed_time": "5:03:04", "remaining_time": "1:47:20"}
913
+ {"current_steps": 913, "total_steps": 1235, "loss": 0.3396, "lr": 7.733370226965056e-06, "epoch": 3.6963562753036436, "percentage": 73.93, "elapsed_time": "5:03:25", "remaining_time": "1:47:00"}
914
+ {"current_steps": 914, "total_steps": 1235, "loss": 0.3465, "lr": 7.688751275826527e-06, "epoch": 3.700404858299595, "percentage": 74.01, "elapsed_time": "5:03:47", "remaining_time": "1:46:41"}
915
+ {"current_steps": 915, "total_steps": 1235, "loss": 0.3181, "lr": 7.644230765104735e-06, "epoch": 3.7044534412955468, "percentage": 74.09, "elapsed_time": "5:04:06", "remaining_time": "1:46:21"}
916
+ {"current_steps": 916, "total_steps": 1235, "loss": 0.337, "lr": 7.599809050784502e-06, "epoch": 3.708502024291498, "percentage": 74.17, "elapsed_time": "5:04:25", "remaining_time": "1:46:01"}
917
+ {"current_steps": 917, "total_steps": 1235, "loss": 0.3327, "lr": 7.555486488060661e-06, "epoch": 3.7125506072874495, "percentage": 74.25, "elapsed_time": "5:04:45", "remaining_time": "1:45:41"}
918
+ {"current_steps": 918, "total_steps": 1235, "loss": 0.3275, "lr": 7.511263431335249e-06, "epoch": 3.716599190283401, "percentage": 74.33, "elapsed_time": "5:05:05", "remaining_time": "1:45:21"}
919
+ {"current_steps": 919, "total_steps": 1235, "loss": 0.3444, "lr": 7.467140234214656e-06, "epoch": 3.720647773279352, "percentage": 74.41, "elapsed_time": "5:05:24", "remaining_time": "1:45:00"}
920
+ {"current_steps": 920, "total_steps": 1235, "loss": 0.3212, "lr": 7.423117249506777e-06, "epoch": 3.7246963562753037, "percentage": 74.49, "elapsed_time": "5:05:42", "remaining_time": "1:44:40"}
921
+ {"current_steps": 921, "total_steps": 1235, "loss": 0.3328, "lr": 7.379194829218231e-06, "epoch": 3.7287449392712553, "percentage": 74.57, "elapsed_time": "5:06:06", "remaining_time": "1:44:21"}
922
+ {"current_steps": 922, "total_steps": 1235, "loss": 0.3431, "lr": 7.335373324551518e-06, "epoch": 3.7327935222672064, "percentage": 74.66, "elapsed_time": "5:06:27", "remaining_time": "1:44:02"}
923
+ {"current_steps": 923, "total_steps": 1235, "loss": 0.327, "lr": 7.291653085902224e-06, "epoch": 3.736842105263158, "percentage": 74.74, "elapsed_time": "5:06:50", "remaining_time": "1:43:43"}
924
+ {"current_steps": 924, "total_steps": 1235, "loss": 0.3432, "lr": 7.248034462856213e-06, "epoch": 3.7408906882591095, "percentage": 74.82, "elapsed_time": "5:07:12", "remaining_time": "1:43:23"}
925
+ {"current_steps": 925, "total_steps": 1235, "loss": 0.3304, "lr": 7.20451780418683e-06, "epoch": 3.7449392712550607, "percentage": 74.9, "elapsed_time": "5:07:30", "remaining_time": "1:43:03"}
926
+ {"current_steps": 926, "total_steps": 1235, "loss": 0.3209, "lr": 7.161103457852128e-06, "epoch": 3.748987854251012, "percentage": 74.98, "elapsed_time": "5:07:52", "remaining_time": "1:42:44"}
927
+ {"current_steps": 927, "total_steps": 1235, "loss": 0.3304, "lr": 7.117791770992046e-06, "epoch": 3.753036437246964, "percentage": 75.06, "elapsed_time": "5:08:12", "remaining_time": "1:42:24"}
928
+ {"current_steps": 928, "total_steps": 1235, "loss": 0.3326, "lr": 7.074583089925688e-06, "epoch": 3.757085020242915, "percentage": 75.14, "elapsed_time": "5:08:30", "remaining_time": "1:42:03"}
929
+ {"current_steps": 929, "total_steps": 1235, "loss": 0.328, "lr": 7.0314777601485155e-06, "epoch": 3.7611336032388665, "percentage": 75.22, "elapsed_time": "5:08:45", "remaining_time": "1:41:42"}
930
+ {"current_steps": 930, "total_steps": 1235, "loss": 0.3371, "lr": 6.988476126329604e-06, "epoch": 3.765182186234818, "percentage": 75.3, "elapsed_time": "5:09:03", "remaining_time": "1:41:21"}
931
+ {"current_steps": 931, "total_steps": 1235, "loss": 0.3275, "lr": 6.945578532308857e-06, "epoch": 3.769230769230769, "percentage": 75.38, "elapsed_time": "5:09:23", "remaining_time": "1:41:01"}
932
+ {"current_steps": 932, "total_steps": 1235, "loss": 0.3286, "lr": 6.902785321094301e-06, "epoch": 3.7732793522267207, "percentage": 75.47, "elapsed_time": "5:09:45", "remaining_time": "1:40:42"}
933
+ {"current_steps": 933, "total_steps": 1235, "loss": 0.3162, "lr": 6.8600968348593115e-06, "epoch": 3.7773279352226723, "percentage": 75.55, "elapsed_time": "5:10:04", "remaining_time": "1:40:22"}
934
+ {"current_steps": 934, "total_steps": 1235, "loss": 0.3453, "lr": 6.817513414939892e-06, "epoch": 3.7813765182186234, "percentage": 75.63, "elapsed_time": "5:10:26", "remaining_time": "1:40:02"}
935
+ {"current_steps": 935, "total_steps": 1235, "loss": 0.3378, "lr": 6.775035401831924e-06, "epoch": 3.785425101214575, "percentage": 75.71, "elapsed_time": "5:10:46", "remaining_time": "1:39:42"}
936
+ {"current_steps": 936, "total_steps": 1235, "loss": 0.334, "lr": 6.732663135188473e-06, "epoch": 3.7894736842105265, "percentage": 75.79, "elapsed_time": "5:11:02", "remaining_time": "1:39:21"}
937
+ {"current_steps": 937, "total_steps": 1235, "loss": 0.332, "lr": 6.690396953817055e-06, "epoch": 3.7935222672064777, "percentage": 75.87, "elapsed_time": "5:11:23", "remaining_time": "1:39:02"}
938
+ {"current_steps": 938, "total_steps": 1235, "loss": 0.326, "lr": 6.648237195676927e-06, "epoch": 3.7975708502024292, "percentage": 75.95, "elapsed_time": "5:11:42", "remaining_time": "1:38:41"}
939
+ {"current_steps": 939, "total_steps": 1235, "loss": 0.3378, "lr": 6.606184197876395e-06, "epoch": 3.801619433198381, "percentage": 76.03, "elapsed_time": "5:12:03", "remaining_time": "1:38:22"}
940
+ {"current_steps": 940, "total_steps": 1235, "loss": 0.3312, "lr": 6.564238296670109e-06, "epoch": 3.805668016194332, "percentage": 76.11, "elapsed_time": "5:12:24", "remaining_time": "1:38:02"}
941
+ {"current_steps": 941, "total_steps": 1235, "loss": 0.3427, "lr": 6.52239982745638e-06, "epoch": 3.8097165991902835, "percentage": 76.19, "elapsed_time": "5:12:44", "remaining_time": "1:37:42"}
942
+ {"current_steps": 942, "total_steps": 1235, "loss": 0.343, "lr": 6.480669124774484e-06, "epoch": 3.813765182186235, "percentage": 76.28, "elapsed_time": "5:13:02", "remaining_time": "1:37:21"}
943
+ {"current_steps": 943, "total_steps": 1235, "loss": 0.3238, "lr": 6.439046522302013e-06, "epoch": 3.817813765182186, "percentage": 76.36, "elapsed_time": "5:13:21", "remaining_time": "1:37:01"}
944
+ {"current_steps": 944, "total_steps": 1235, "loss": 0.3248, "lr": 6.397532352852191e-06, "epoch": 3.8218623481781377, "percentage": 76.44, "elapsed_time": "5:13:39", "remaining_time": "1:36:41"}
945
+ {"current_steps": 945, "total_steps": 1235, "loss": 0.3287, "lr": 6.356126948371202e-06, "epoch": 3.8259109311740893, "percentage": 76.52, "elapsed_time": "5:13:59", "remaining_time": "1:36:21"}
946
+ {"current_steps": 946, "total_steps": 1235, "loss": 0.3275, "lr": 6.314830639935559e-06, "epoch": 3.8299595141700404, "percentage": 76.6, "elapsed_time": "5:14:20", "remaining_time": "1:36:01"}
947
+ {"current_steps": 947, "total_steps": 1235, "loss": 0.3187, "lr": 6.273643757749448e-06, "epoch": 3.834008097165992, "percentage": 76.68, "elapsed_time": "5:14:41", "remaining_time": "1:35:42"}
948
+ {"current_steps": 948, "total_steps": 1235, "loss": 0.3219, "lr": 6.2325666311420856e-06, "epoch": 3.8380566801619436, "percentage": 76.76, "elapsed_time": "5:15:02", "remaining_time": "1:35:22"}
949
+ {"current_steps": 949, "total_steps": 1235, "loss": 0.3315, "lr": 6.1915995885650675e-06, "epoch": 3.8421052631578947, "percentage": 76.84, "elapsed_time": "5:15:19", "remaining_time": "1:35:01"}
950
+ {"current_steps": 950, "total_steps": 1235, "loss": 0.3189, "lr": 6.150742957589784e-06, "epoch": 3.8461538461538463, "percentage": 76.92, "elapsed_time": "5:15:40", "remaining_time": "1:34:42"}
951
+ {"current_steps": 951, "total_steps": 1235, "loss": 0.3373, "lr": 6.109997064904774e-06, "epoch": 3.850202429149798, "percentage": 77.0, "elapsed_time": "5:16:04", "remaining_time": "1:34:23"}
952
+ {"current_steps": 952, "total_steps": 1235, "loss": 0.3218, "lr": 6.069362236313092e-06, "epoch": 3.854251012145749, "percentage": 77.09, "elapsed_time": "5:16:24", "remaining_time": "1:34:03"}
953
+ {"current_steps": 953, "total_steps": 1235, "loss": 0.3207, "lr": 6.0288387967297565e-06, "epoch": 3.8582995951417005, "percentage": 77.17, "elapsed_time": "5:16:42", "remaining_time": "1:33:43"}
954
+ {"current_steps": 954, "total_steps": 1235, "loss": 0.3268, "lr": 5.988427070179108e-06, "epoch": 3.862348178137652, "percentage": 77.25, "elapsed_time": "5:17:02", "remaining_time": "1:33:22"}
955
+ {"current_steps": 955, "total_steps": 1235, "loss": 0.3238, "lr": 5.948127379792234e-06, "epoch": 3.866396761133603, "percentage": 77.33, "elapsed_time": "5:17:22", "remaining_time": "1:33:03"}
956
+ {"current_steps": 956, "total_steps": 1235, "loss": 0.3367, "lr": 5.90794004780439e-06, "epoch": 3.8704453441295548, "percentage": 77.41, "elapsed_time": "5:17:42", "remaining_time": "1:32:43"}
957
+ {"current_steps": 957, "total_steps": 1235, "loss": 0.3347, "lr": 5.867865395552405e-06, "epoch": 3.8744939271255063, "percentage": 77.49, "elapsed_time": "5:18:01", "remaining_time": "1:32:23"}
958
+ {"current_steps": 958, "total_steps": 1235, "loss": 0.3301, "lr": 5.8279037434721364e-06, "epoch": 3.8785425101214575, "percentage": 77.57, "elapsed_time": "5:18:22", "remaining_time": "1:32:03"}
959
+ {"current_steps": 959, "total_steps": 1235, "loss": 0.3237, "lr": 5.788055411095892e-06, "epoch": 3.882591093117409, "percentage": 77.65, "elapsed_time": "5:18:43", "remaining_time": "1:31:43"}
960
+ {"current_steps": 960, "total_steps": 1235, "loss": 0.3239, "lr": 5.7483207170498625e-06, "epoch": 3.8866396761133606, "percentage": 77.73, "elapsed_time": "5:19:02", "remaining_time": "1:31:23"}
961
+ {"current_steps": 961, "total_steps": 1235, "loss": 0.3232, "lr": 5.708699979051613e-06, "epoch": 3.8906882591093117, "percentage": 77.81, "elapsed_time": "5:19:22", "remaining_time": "1:31:03"}
962
+ {"current_steps": 962, "total_steps": 1235, "loss": 0.3351, "lr": 5.66919351390751e-06, "epoch": 3.8947368421052633, "percentage": 77.89, "elapsed_time": "5:19:40", "remaining_time": "1:30:42"}
963
+ {"current_steps": 963, "total_steps": 1235, "loss": 0.3311, "lr": 5.629801637510188e-06, "epoch": 3.898785425101215, "percentage": 77.98, "elapsed_time": "5:19:56", "remaining_time": "1:30:22"}
964
+ {"current_steps": 964, "total_steps": 1235, "loss": 0.319, "lr": 5.590524664836043e-06, "epoch": 3.902834008097166, "percentage": 78.06, "elapsed_time": "5:20:17", "remaining_time": "1:30:02"}
965
+ {"current_steps": 965, "total_steps": 1235, "loss": 0.3303, "lr": 5.551362909942708e-06, "epoch": 3.9068825910931175, "percentage": 78.14, "elapsed_time": "5:20:33", "remaining_time": "1:29:41"}
966
+ {"current_steps": 966, "total_steps": 1235, "loss": 0.329, "lr": 5.51231668596653e-06, "epoch": 3.910931174089069, "percentage": 78.22, "elapsed_time": "5:20:56", "remaining_time": "1:29:22"}
967
+ {"current_steps": 967, "total_steps": 1235, "loss": 0.3311, "lr": 5.47338630512007e-06, "epoch": 3.91497975708502, "percentage": 78.3, "elapsed_time": "5:21:13", "remaining_time": "1:29:01"}
968
+ {"current_steps": 968, "total_steps": 1235, "loss": 0.3317, "lr": 5.434572078689617e-06, "epoch": 3.919028340080972, "percentage": 78.38, "elapsed_time": "5:21:32", "remaining_time": "1:28:41"}
969
+ {"current_steps": 969, "total_steps": 1235, "loss": 0.3323, "lr": 5.395874317032694e-06, "epoch": 3.9230769230769234, "percentage": 78.46, "elapsed_time": "5:21:51", "remaining_time": "1:28:21"}
970
+ {"current_steps": 970, "total_steps": 1235, "loss": 0.3298, "lr": 5.357293329575573e-06, "epoch": 3.9271255060728745, "percentage": 78.54, "elapsed_time": "5:22:09", "remaining_time": "1:28:00"}
971
+ {"current_steps": 971, "total_steps": 1235, "loss": 0.3325, "lr": 5.318829424810797e-06, "epoch": 3.931174089068826, "percentage": 78.62, "elapsed_time": "5:22:31", "remaining_time": "1:27:41"}
972
+ {"current_steps": 972, "total_steps": 1235, "loss": 0.3284, "lr": 5.280482910294728e-06, "epoch": 3.9352226720647776, "percentage": 78.7, "elapsed_time": "5:22:51", "remaining_time": "1:27:21"}
973
+ {"current_steps": 973, "total_steps": 1235, "loss": 0.3225, "lr": 5.242254092645078e-06, "epoch": 3.9392712550607287, "percentage": 78.79, "elapsed_time": "5:23:12", "remaining_time": "1:27:01"}
974
+ {"current_steps": 974, "total_steps": 1235, "loss": 0.3335, "lr": 5.2041432775384445e-06, "epoch": 3.9433198380566803, "percentage": 78.87, "elapsed_time": "5:23:33", "remaining_time": "1:26:42"}
975
+ {"current_steps": 975, "total_steps": 1235, "loss": 0.3146, "lr": 5.166150769707892e-06, "epoch": 3.9473684210526314, "percentage": 78.95, "elapsed_time": "5:23:50", "remaining_time": "1:26:21"}
976
+ {"current_steps": 976, "total_steps": 1235, "loss": 0.3332, "lr": 5.128276872940503e-06, "epoch": 3.951417004048583, "percentage": 79.03, "elapsed_time": "5:24:10", "remaining_time": "1:26:01"}
977
+ {"current_steps": 977, "total_steps": 1235, "loss": 0.3175, "lr": 5.090521890074953e-06, "epoch": 3.9554655870445345, "percentage": 79.11, "elapsed_time": "5:24:25", "remaining_time": "1:25:40"}
978
+ {"current_steps": 978, "total_steps": 1235, "loss": 0.3271, "lr": 5.0528861229990675e-06, "epoch": 3.9595141700404857, "percentage": 79.19, "elapsed_time": "5:24:45", "remaining_time": "1:25:20"}
979
+ {"current_steps": 979, "total_steps": 1235, "loss": 0.3293, "lr": 5.015369872647442e-06, "epoch": 3.9635627530364372, "percentage": 79.27, "elapsed_time": "5:25:07", "remaining_time": "1:25:01"}
980
+ {"current_steps": 980, "total_steps": 1235, "loss": 0.3275, "lr": 4.9779734389990195e-06, "epoch": 3.967611336032389, "percentage": 79.35, "elapsed_time": "5:25:27", "remaining_time": "1:24:41"}
981
+ {"current_steps": 981, "total_steps": 1235, "loss": 0.325, "lr": 4.940697121074675e-06, "epoch": 3.97165991902834, "percentage": 79.43, "elapsed_time": "5:25:45", "remaining_time": "1:24:20"}
982
+ {"current_steps": 982, "total_steps": 1235, "loss": 0.3217, "lr": 4.903541216934864e-06, "epoch": 3.9757085020242915, "percentage": 79.51, "elapsed_time": "5:26:05", "remaining_time": "1:24:00"}
983
+ {"current_steps": 983, "total_steps": 1235, "loss": 0.3294, "lr": 4.8665060236772e-06, "epoch": 3.979757085020243, "percentage": 79.6, "elapsed_time": "5:26:25", "remaining_time": "1:23:40"}
984
+ {"current_steps": 984, "total_steps": 1235, "loss": 0.328, "lr": 4.829591837434102e-06, "epoch": 3.983805668016194, "percentage": 79.68, "elapsed_time": "5:26:42", "remaining_time": "1:23:20"}
985
+ {"current_steps": 985, "total_steps": 1235, "loss": 0.3326, "lr": 4.792798953370424e-06, "epoch": 3.9878542510121457, "percentage": 79.76, "elapsed_time": "5:26:59", "remaining_time": "1:22:59"}
986
+ {"current_steps": 986, "total_steps": 1235, "loss": 0.3353, "lr": 4.756127665681083e-06, "epoch": 3.9919028340080973, "percentage": 79.84, "elapsed_time": "5:27:18", "remaining_time": "1:22:39"}
987
+ {"current_steps": 987, "total_steps": 1235, "loss": 0.327, "lr": 4.719578267588725e-06, "epoch": 3.9959514170040484, "percentage": 79.92, "elapsed_time": "5:27:38", "remaining_time": "1:22:19"}
988
+ {"current_steps": 988, "total_steps": 1235, "loss": 0.32, "lr": 4.6831510513413525e-06, "epoch": 4.0, "percentage": 80.0, "elapsed_time": "5:28:01", "remaining_time": "1:22:00"}
989
+ {"current_steps": 989, "total_steps": 1235, "loss": 0.2803, "lr": 4.6468463082100176e-06, "epoch": 4.004048582995951, "percentage": 80.08, "elapsed_time": "5:30:04", "remaining_time": "1:22:06"}
990
+ {"current_steps": 990, "total_steps": 1235, "loss": 0.2553, "lr": 4.610664328486485e-06, "epoch": 4.008097165991903, "percentage": 80.16, "elapsed_time": "5:30:22", "remaining_time": "1:21:45"}
991
+ {"current_steps": 991, "total_steps": 1235, "loss": 0.2605, "lr": 4.5746054014809e-06, "epoch": 4.012145748987854, "percentage": 80.24, "elapsed_time": "5:30:42", "remaining_time": "1:21:25"}
992
+ {"current_steps": 992, "total_steps": 1235, "loss": 0.2578, "lr": 4.5386698155194766e-06, "epoch": 4.016194331983805, "percentage": 80.32, "elapsed_time": "5:31:00", "remaining_time": "1:21:05"}
993
+ {"current_steps": 993, "total_steps": 1235, "loss": 0.2684, "lr": 4.502857857942204e-06, "epoch": 4.020242914979757, "percentage": 80.4, "elapsed_time": "5:31:18", "remaining_time": "1:20:44"}
994
+ {"current_steps": 994, "total_steps": 1235, "loss": 0.2719, "lr": 4.467169815100549e-06, "epoch": 4.0242914979757085, "percentage": 80.49, "elapsed_time": "5:31:40", "remaining_time": "1:20:24"}
995
+ {"current_steps": 995, "total_steps": 1235, "loss": 0.2797, "lr": 4.431605972355137e-06, "epoch": 4.02834008097166, "percentage": 80.57, "elapsed_time": "5:32:01", "remaining_time": "1:20:05"}
996
+ {"current_steps": 996, "total_steps": 1235, "loss": 0.2587, "lr": 4.396166614073516e-06, "epoch": 4.032388663967612, "percentage": 80.65, "elapsed_time": "5:32:19", "remaining_time": "1:19:44"}
997
+ {"current_steps": 997, "total_steps": 1235, "loss": 0.2616, "lr": 4.360852023627846e-06, "epoch": 4.036437246963563, "percentage": 80.73, "elapsed_time": "5:32:38", "remaining_time": "1:19:24"}
998
+ {"current_steps": 998, "total_steps": 1235, "loss": 0.2582, "lr": 4.325662483392656e-06, "epoch": 4.040485829959514, "percentage": 80.81, "elapsed_time": "5:32:55", "remaining_time": "1:19:03"}
999
+ {"current_steps": 999, "total_steps": 1235, "loss": 0.248, "lr": 4.29059827474257e-06, "epoch": 4.044534412955466, "percentage": 80.89, "elapsed_time": "5:33:14", "remaining_time": "1:18:43"}
1000
+ {"current_steps": 1000, "total_steps": 1235, "loss": 0.273, "lr": 4.255659678050063e-06, "epoch": 4.048582995951417, "percentage": 80.97, "elapsed_time": "5:33:35", "remaining_time": "1:18:23"}
1001
+ {"current_steps": 1001, "total_steps": 1235, "loss": 0.2592, "lr": 4.22084697268323e-06, "epoch": 4.052631578947368, "percentage": 81.05, "elapsed_time": "5:33:55", "remaining_time": "1:18:03"}
1002
+ {"current_steps": 1002, "total_steps": 1235, "loss": 0.2661, "lr": 4.186160437003535e-06, "epoch": 4.05668016194332, "percentage": 81.13, "elapsed_time": "5:34:16", "remaining_time": "1:17:43"}
1003
+ {"current_steps": 1003, "total_steps": 1235, "loss": 0.2477, "lr": 4.151600348363582e-06, "epoch": 4.060728744939271, "percentage": 81.21, "elapsed_time": "5:34:32", "remaining_time": "1:17:22"}
1004
+ {"current_steps": 1004, "total_steps": 1235, "loss": 0.2572, "lr": 4.11716698310493e-06, "epoch": 4.064777327935222, "percentage": 81.3, "elapsed_time": "5:34:54", "remaining_time": "1:17:03"}
1005
+ {"current_steps": 1005, "total_steps": 1235, "loss": 0.2584, "lr": 4.082860616555848e-06, "epoch": 4.068825910931174, "percentage": 81.38, "elapsed_time": "5:35:16", "remaining_time": "1:16:43"}
1006
+ {"current_steps": 1006, "total_steps": 1235, "loss": 0.2651, "lr": 4.048681523029125e-06, "epoch": 4.0728744939271255, "percentage": 81.46, "elapsed_time": "5:35:34", "remaining_time": "1:16:23"}
1007
+ {"current_steps": 1007, "total_steps": 1235, "loss": 0.2622, "lr": 4.014629975819882e-06, "epoch": 4.076923076923077, "percentage": 81.54, "elapsed_time": "5:35:54", "remaining_time": "1:16:03"}
1008
+ {"current_steps": 1008, "total_steps": 1235, "loss": 0.2596, "lr": 3.9807062472033855e-06, "epoch": 4.080971659919029, "percentage": 81.62, "elapsed_time": "5:36:09", "remaining_time": "1:15:42"}
1009
+ {"current_steps": 1009, "total_steps": 1235, "loss": 0.2598, "lr": 3.94691060843287e-06, "epoch": 4.08502024291498, "percentage": 81.7, "elapsed_time": "5:36:30", "remaining_time": "1:15:22"}
1010
+ {"current_steps": 1010, "total_steps": 1235, "loss": 0.2605, "lr": 3.913243329737353e-06, "epoch": 4.089068825910931, "percentage": 81.78, "elapsed_time": "5:36:50", "remaining_time": "1:15:02"}
1011
+ {"current_steps": 1011, "total_steps": 1235, "loss": 0.2653, "lr": 3.879704680319503e-06, "epoch": 4.093117408906883, "percentage": 81.86, "elapsed_time": "5:37:12", "remaining_time": "1:14:42"}
1012
+ {"current_steps": 1012, "total_steps": 1235, "loss": 0.2493, "lr": 3.846294928353471e-06, "epoch": 4.097165991902834, "percentage": 81.94, "elapsed_time": "5:37:28", "remaining_time": "1:14:21"}
1013
+ {"current_steps": 1013, "total_steps": 1235, "loss": 0.2651, "lr": 3.8130143409827345e-06, "epoch": 4.101214574898785, "percentage": 82.02, "elapsed_time": "5:37:45", "remaining_time": "1:14:01"}
1014
+ {"current_steps": 1014, "total_steps": 1235, "loss": 0.2725, "lr": 3.7798631843179887e-06, "epoch": 4.105263157894737, "percentage": 82.11, "elapsed_time": "5:38:05", "remaining_time": "1:13:41"}
1015
+ {"current_steps": 1015, "total_steps": 1235, "loss": 0.266, "lr": 3.7468417234349973e-06, "epoch": 4.109311740890688, "percentage": 82.19, "elapsed_time": "5:38:25", "remaining_time": "1:13:21"}
1016
+ {"current_steps": 1016, "total_steps": 1235, "loss": 0.2679, "lr": 3.7139502223724823e-06, "epoch": 4.113360323886639, "percentage": 82.27, "elapsed_time": "5:38:42", "remaining_time": "1:13:00"}
1017
+ {"current_steps": 1017, "total_steps": 1235, "loss": 0.2619, "lr": 3.6811889441300095e-06, "epoch": 4.117408906882591, "percentage": 82.35, "elapsed_time": "5:39:02", "remaining_time": "1:12:40"}
1018
+ {"current_steps": 1018, "total_steps": 1235, "loss": 0.2589, "lr": 3.648558150665886e-06, "epoch": 4.1214574898785425, "percentage": 82.43, "elapsed_time": "5:39:21", "remaining_time": "1:12:20"}
1019
+ {"current_steps": 1019, "total_steps": 1235, "loss": 0.2722, "lr": 3.616058102895075e-06, "epoch": 4.125506072874494, "percentage": 82.51, "elapsed_time": "5:39:40", "remaining_time": "1:12:00"}
1020
+ {"current_steps": 1020, "total_steps": 1235, "loss": 0.25, "lr": 3.583689060687079e-06, "epoch": 4.129554655870446, "percentage": 82.59, "elapsed_time": "5:40:00", "remaining_time": "1:11:40"}
1021
+ {"current_steps": 1021, "total_steps": 1235, "loss": 0.2569, "lr": 3.5514512828639023e-06, "epoch": 4.133603238866397, "percentage": 82.67, "elapsed_time": "5:40:19", "remaining_time": "1:11:19"}
1022
+ {"current_steps": 1022, "total_steps": 1235, "loss": 0.269, "lr": 3.51934502719796e-06, "epoch": 4.137651821862348, "percentage": 82.75, "elapsed_time": "5:40:42", "remaining_time": "1:11:00"}
1023
+ {"current_steps": 1023, "total_steps": 1235, "loss": 0.2631, "lr": 3.4873705504100185e-06, "epoch": 4.1417004048583, "percentage": 82.83, "elapsed_time": "5:41:03", "remaining_time": "1:10:40"}
1024
+ {"current_steps": 1024, "total_steps": 1235, "loss": 0.2639, "lr": 3.4555281081671345e-06, "epoch": 4.145748987854251, "percentage": 82.91, "elapsed_time": "5:41:22", "remaining_time": "1:10:20"}
1025
+ {"current_steps": 1025, "total_steps": 1235, "loss": 0.262, "lr": 3.4238179550806326e-06, "epoch": 4.149797570850202, "percentage": 83.0, "elapsed_time": "5:41:42", "remaining_time": "1:10:00"}
1026
+ {"current_steps": 1026, "total_steps": 1235, "loss": 0.2694, "lr": 3.3922403447040497e-06, "epoch": 4.153846153846154, "percentage": 83.08, "elapsed_time": "5:42:02", "remaining_time": "1:09:40"}
1027
+ {"current_steps": 1027, "total_steps": 1235, "loss": 0.2571, "lr": 3.3607955295311247e-06, "epoch": 4.157894736842105, "percentage": 83.16, "elapsed_time": "5:42:22", "remaining_time": "1:09:20"}
1028
+ {"current_steps": 1028, "total_steps": 1235, "loss": 0.2643, "lr": 3.32948376099375e-06, "epoch": 4.161943319838056, "percentage": 83.24, "elapsed_time": "5:42:39", "remaining_time": "1:08:59"}
1029
+ {"current_steps": 1029, "total_steps": 1235, "loss": 0.2602, "lr": 3.2983052894599976e-06, "epoch": 4.165991902834008, "percentage": 83.32, "elapsed_time": "5:43:00", "remaining_time": "1:08:40"}
1030
+ {"current_steps": 1030, "total_steps": 1235, "loss": 0.2498, "lr": 3.2672603642320945e-06, "epoch": 4.17004048582996, "percentage": 83.4, "elapsed_time": "5:43:20", "remaining_time": "1:08:20"}
1031
+ {"current_steps": 1031, "total_steps": 1235, "loss": 0.2677, "lr": 3.236349233544438e-06, "epoch": 4.174089068825911, "percentage": 83.48, "elapsed_time": "5:43:41", "remaining_time": "1:08:00"}
1032
+ {"current_steps": 1032, "total_steps": 1235, "loss": 0.2616, "lr": 3.205572144561604e-06, "epoch": 4.178137651821863, "percentage": 83.56, "elapsed_time": "5:44:02", "remaining_time": "1:07:40"}
1033
+ {"current_steps": 1033, "total_steps": 1235, "loss": 0.2483, "lr": 3.174929343376374e-06, "epoch": 4.182186234817814, "percentage": 83.64, "elapsed_time": "5:44:21", "remaining_time": "1:07:20"}
1034
+ {"current_steps": 1034, "total_steps": 1235, "loss": 0.2742, "lr": 3.1444210750077777e-06, "epoch": 4.186234817813765, "percentage": 83.72, "elapsed_time": "5:44:43", "remaining_time": "1:07:00"}
1035
+ {"current_steps": 1035, "total_steps": 1235, "loss": 0.2808, "lr": 3.1140475833991046e-06, "epoch": 4.190283400809717, "percentage": 83.81, "elapsed_time": "5:45:04", "remaining_time": "1:06:40"}
1036
+ {"current_steps": 1036, "total_steps": 1235, "loss": 0.2504, "lr": 3.0838091114159895e-06, "epoch": 4.194331983805668, "percentage": 83.89, "elapsed_time": "5:45:20", "remaining_time": "1:06:20"}
1037
+ {"current_steps": 1037, "total_steps": 1235, "loss": 0.2669, "lr": 3.0537059008444524e-06, "epoch": 4.198380566801619, "percentage": 83.97, "elapsed_time": "5:45:37", "remaining_time": "1:05:59"}
1038
+ {"current_steps": 1038, "total_steps": 1235, "loss": 0.2743, "lr": 3.0237381923889563e-06, "epoch": 4.202429149797571, "percentage": 84.05, "elapsed_time": "5:45:58", "remaining_time": "1:05:39"}
1039
+ {"current_steps": 1039, "total_steps": 1235, "loss": 0.2677, "lr": 2.9939062256704997e-06, "epoch": 4.206477732793522, "percentage": 84.13, "elapsed_time": "5:46:21", "remaining_time": "1:05:20"}
1040
+ {"current_steps": 1040, "total_steps": 1235, "loss": 0.2496, "lr": 2.964210239224696e-06, "epoch": 4.2105263157894735, "percentage": 84.21, "elapsed_time": "5:46:42", "remaining_time": "1:05:00"}
1041
+ {"current_steps": 1041, "total_steps": 1235, "loss": 0.2582, "lr": 2.934650470499869e-06, "epoch": 4.2145748987854255, "percentage": 84.29, "elapsed_time": "5:47:02", "remaining_time": "1:04:40"}
1042
+ {"current_steps": 1042, "total_steps": 1235, "loss": 0.2554, "lr": 2.905227155855128e-06, "epoch": 4.218623481781377, "percentage": 84.37, "elapsed_time": "5:47:23", "remaining_time": "1:04:20"}
1043
+ {"current_steps": 1043, "total_steps": 1235, "loss": 0.2726, "lr": 2.875940530558519e-06, "epoch": 4.222672064777328, "percentage": 84.45, "elapsed_time": "5:47:45", "remaining_time": "1:04:01"}
1044
+ {"current_steps": 1044, "total_steps": 1235, "loss": 0.2659, "lr": 2.8467908287851154e-06, "epoch": 4.22672064777328, "percentage": 84.53, "elapsed_time": "5:48:04", "remaining_time": "1:03:40"}
1045
+ {"current_steps": 1045, "total_steps": 1235, "loss": 0.2515, "lr": 2.8177782836151603e-06, "epoch": 4.230769230769231, "percentage": 84.62, "elapsed_time": "5:48:26", "remaining_time": "1:03:21"}
1046
+ {"current_steps": 1046, "total_steps": 1235, "loss": 0.2634, "lr": 2.7889031270321874e-06, "epoch": 4.234817813765182, "percentage": 84.7, "elapsed_time": "5:48:48", "remaining_time": "1:03:01"}
1047
+ {"current_steps": 1047, "total_steps": 1235, "loss": 0.261, "lr": 2.760165589921184e-06, "epoch": 4.238866396761134, "percentage": 84.78, "elapsed_time": "5:49:09", "remaining_time": "1:02:41"}
1048
+ {"current_steps": 1048, "total_steps": 1235, "loss": 0.2412, "lr": 2.7315659020667305e-06, "epoch": 4.242914979757085, "percentage": 84.86, "elapsed_time": "5:49:28", "remaining_time": "1:02:21"}
1049
+ {"current_steps": 1049, "total_steps": 1235, "loss": 0.2541, "lr": 2.703104292151164e-06, "epoch": 4.246963562753036, "percentage": 84.94, "elapsed_time": "5:49:45", "remaining_time": "1:02:00"}
1050
+ {"current_steps": 1050, "total_steps": 1235, "loss": 0.2656, "lr": 2.6747809877527607e-06, "epoch": 4.251012145748988, "percentage": 85.02, "elapsed_time": "5:50:01", "remaining_time": "1:01:40"}
1051
+ {"current_steps": 1051, "total_steps": 1235, "loss": 0.2722, "lr": 2.6465962153439082e-06, "epoch": 4.255060728744939, "percentage": 85.1, "elapsed_time": "5:50:25", "remaining_time": "1:01:20"}
1052
+ {"current_steps": 1052, "total_steps": 1235, "loss": 0.2706, "lr": 2.618550200289303e-06, "epoch": 4.2591093117408905, "percentage": 85.18, "elapsed_time": "5:50:43", "remaining_time": "1:01:00"}
1053
+ {"current_steps": 1053, "total_steps": 1235, "loss": 0.2643, "lr": 2.59064316684412e-06, "epoch": 4.2631578947368425, "percentage": 85.26, "elapsed_time": "5:51:02", "remaining_time": "1:00:40"}
1054
+ {"current_steps": 1054, "total_steps": 1235, "loss": 0.2521, "lr": 2.562875338152264e-06, "epoch": 4.267206477732794, "percentage": 85.34, "elapsed_time": "5:51:18", "remaining_time": "1:00:19"}
1055
+ {"current_steps": 1055, "total_steps": 1235, "loss": 0.2455, "lr": 2.5352469362445552e-06, "epoch": 4.271255060728745, "percentage": 85.43, "elapsed_time": "5:51:37", "remaining_time": "0:59:59"}
1056
+ {"current_steps": 1056, "total_steps": 1235, "loss": 0.2661, "lr": 2.5077581820369523e-06, "epoch": 4.275303643724697, "percentage": 85.51, "elapsed_time": "5:51:57", "remaining_time": "0:59:39"}
1057
+ {"current_steps": 1057, "total_steps": 1235, "loss": 0.2503, "lr": 2.480409295328803e-06, "epoch": 4.279352226720648, "percentage": 85.59, "elapsed_time": "5:52:18", "remaining_time": "0:59:19"}
1058
+ {"current_steps": 1058, "total_steps": 1235, "loss": 0.263, "lr": 2.45320049480108e-06, "epoch": 4.283400809716599, "percentage": 85.67, "elapsed_time": "5:52:40", "remaining_time": "0:59:00"}
1059
+ {"current_steps": 1059, "total_steps": 1235, "loss": 0.2687, "lr": 2.4261319980146293e-06, "epoch": 4.287449392712551, "percentage": 85.75, "elapsed_time": "5:53:03", "remaining_time": "0:58:40"}
1060
+ {"current_steps": 1060, "total_steps": 1235, "loss": 0.2681, "lr": 2.399204021408421e-06, "epoch": 4.291497975708502, "percentage": 85.83, "elapsed_time": "5:53:23", "remaining_time": "0:58:20"}
1061
+ {"current_steps": 1061, "total_steps": 1235, "loss": 0.252, "lr": 2.3724167802978395e-06, "epoch": 4.295546558704453, "percentage": 85.91, "elapsed_time": "5:53:44", "remaining_time": "0:58:00"}
1062
+ {"current_steps": 1062, "total_steps": 1235, "loss": 0.2697, "lr": 2.3457704888729625e-06, "epoch": 4.299595141700405, "percentage": 85.99, "elapsed_time": "5:54:04", "remaining_time": "0:57:40"}
1063
+ {"current_steps": 1063, "total_steps": 1235, "loss": 0.2592, "lr": 2.3192653601968162e-06, "epoch": 4.303643724696356, "percentage": 86.07, "elapsed_time": "5:54:26", "remaining_time": "0:57:20"}
1064
+ {"current_steps": 1064, "total_steps": 1235, "loss": 0.2566, "lr": 2.2929016062037057e-06, "epoch": 4.3076923076923075, "percentage": 86.15, "elapsed_time": "5:54:44", "remaining_time": "0:57:00"}
1065
+ {"current_steps": 1065, "total_steps": 1235, "loss": 0.2601, "lr": 2.2666794376975055e-06, "epoch": 4.3117408906882595, "percentage": 86.23, "elapsed_time": "5:55:01", "remaining_time": "0:56:40"}
1066
+ {"current_steps": 1066, "total_steps": 1235, "loss": 0.2574, "lr": 2.24059906434998e-06, "epoch": 4.315789473684211, "percentage": 86.32, "elapsed_time": "5:55:20", "remaining_time": "0:56:20"}
1067
+ {"current_steps": 1067, "total_steps": 1235, "loss": 0.2589, "lr": 2.214660694699091e-06, "epoch": 4.319838056680162, "percentage": 86.4, "elapsed_time": "5:55:39", "remaining_time": "0:55:59"}
1068
+ {"current_steps": 1068, "total_steps": 1235, "loss": 0.2639, "lr": 2.188864536147355e-06, "epoch": 4.323886639676114, "percentage": 86.48, "elapsed_time": "5:56:03", "remaining_time": "0:55:40"}
1069
+ {"current_steps": 1069, "total_steps": 1235, "loss": 0.2698, "lr": 2.1632107949601757e-06, "epoch": 4.327935222672065, "percentage": 86.56, "elapsed_time": "5:56:23", "remaining_time": "0:55:20"}
1070
+ {"current_steps": 1070, "total_steps": 1235, "loss": 0.2642, "lr": 2.137699676264171e-06, "epoch": 4.331983805668016, "percentage": 86.64, "elapsed_time": "5:56:44", "remaining_time": "0:55:00"}
1071
+ {"current_steps": 1071, "total_steps": 1235, "loss": 0.257, "lr": 2.1123313840455738e-06, "epoch": 4.336032388663968, "percentage": 86.72, "elapsed_time": "5:57:02", "remaining_time": "0:54:40"}
1072
+ {"current_steps": 1072, "total_steps": 1235, "loss": 0.2551, "lr": 2.08710612114857e-06, "epoch": 4.340080971659919, "percentage": 86.8, "elapsed_time": "5:57:22", "remaining_time": "0:54:20"}
1073
+ {"current_steps": 1073, "total_steps": 1235, "loss": 0.2479, "lr": 2.0620240892736953e-06, "epoch": 4.34412955465587, "percentage": 86.88, "elapsed_time": "5:57:41", "remaining_time": "0:54:00"}
1074
+ {"current_steps": 1074, "total_steps": 1235, "loss": 0.2686, "lr": 2.0370854889762e-06, "epoch": 4.348178137651822, "percentage": 86.96, "elapsed_time": "5:58:00", "remaining_time": "0:53:40"}
1075
+ {"current_steps": 1075, "total_steps": 1235, "loss": 0.2501, "lr": 2.0122905196644726e-06, "epoch": 4.352226720647773, "percentage": 87.04, "elapsed_time": "5:58:18", "remaining_time": "0:53:19"}
1076
+ {"current_steps": 1076, "total_steps": 1235, "loss": 0.2529, "lr": 1.987639379598427e-06, "epoch": 4.3562753036437245, "percentage": 87.13, "elapsed_time": "5:58:42", "remaining_time": "0:53:00"}
1077
+ {"current_steps": 1077, "total_steps": 1235, "loss": 0.2533, "lr": 1.963132265887919e-06, "epoch": 4.3603238866396765, "percentage": 87.21, "elapsed_time": "5:58:57", "remaining_time": "0:52:39"}
1078
+ {"current_steps": 1078, "total_steps": 1235, "loss": 0.2584, "lr": 1.9387693744911784e-06, "epoch": 4.364372469635628, "percentage": 87.29, "elapsed_time": "5:59:17", "remaining_time": "0:52:19"}
1079
+ {"current_steps": 1079, "total_steps": 1235, "loss": 0.2631, "lr": 1.9145509002132368e-06, "epoch": 4.368421052631579, "percentage": 87.37, "elapsed_time": "5:59:36", "remaining_time": "0:51:59"}
1080
+ {"current_steps": 1080, "total_steps": 1235, "loss": 0.2512, "lr": 1.8904770367043723e-06, "epoch": 4.372469635627531, "percentage": 87.45, "elapsed_time": "5:59:57", "remaining_time": "0:51:39"}
1081
+ {"current_steps": 1081, "total_steps": 1235, "loss": 0.2653, "lr": 1.8665479764585504e-06, "epoch": 4.376518218623482, "percentage": 87.53, "elapsed_time": "6:00:17", "remaining_time": "0:51:19"}
1082
+ {"current_steps": 1082, "total_steps": 1235, "loss": 0.2568, "lr": 1.8427639108118977e-06, "epoch": 4.380566801619433, "percentage": 87.61, "elapsed_time": "6:00:37", "remaining_time": "0:50:59"}
1083
+ {"current_steps": 1083, "total_steps": 1235, "loss": 0.2613, "lr": 1.8191250299411755e-06, "epoch": 4.384615384615385, "percentage": 87.69, "elapsed_time": "6:01:00", "remaining_time": "0:50:40"}
1084
+ {"current_steps": 1084, "total_steps": 1235, "loss": 0.2728, "lr": 1.7956315228622446e-06, "epoch": 4.388663967611336, "percentage": 87.77, "elapsed_time": "6:01:20", "remaining_time": "0:50:20"}
1085
+ {"current_steps": 1085, "total_steps": 1235, "loss": 0.2597, "lr": 1.7722835774285553e-06, "epoch": 4.392712550607287, "percentage": 87.85, "elapsed_time": "6:01:37", "remaining_time": "0:49:59"}
1086
+ {"current_steps": 1086, "total_steps": 1235, "loss": 0.2569, "lr": 1.7490813803296624e-06, "epoch": 4.396761133603239, "percentage": 87.94, "elapsed_time": "6:01:55", "remaining_time": "0:49:39"}
1087
+ {"current_steps": 1087, "total_steps": 1235, "loss": 0.2653, "lr": 1.726025117089718e-06, "epoch": 4.40080971659919, "percentage": 88.02, "elapsed_time": "6:02:17", "remaining_time": "0:49:19"}
1088
+ {"current_steps": 1088, "total_steps": 1235, "loss": 0.2676, "lr": 1.70311497206598e-06, "epoch": 4.4048582995951415, "percentage": 88.1, "elapsed_time": "6:02:38", "remaining_time": "0:48:59"}
1089
+ {"current_steps": 1089, "total_steps": 1235, "loss": 0.2553, "lr": 1.6803511284473638e-06, "epoch": 4.4089068825910935, "percentage": 88.18, "elapsed_time": "6:02:54", "remaining_time": "0:48:39"}
1090
+ {"current_steps": 1090, "total_steps": 1235, "loss": 0.2475, "lr": 1.6577337682529538e-06, "epoch": 4.412955465587045, "percentage": 88.26, "elapsed_time": "6:03:13", "remaining_time": "0:48:19"}
1091
+ {"current_steps": 1091, "total_steps": 1235, "loss": 0.2627, "lr": 1.6352630723305617e-06, "epoch": 4.417004048582996, "percentage": 88.34, "elapsed_time": "6:03:32", "remaining_time": "0:47:59"}
1092
+ {"current_steps": 1092, "total_steps": 1235, "loss": 0.2512, "lr": 1.612939220355272e-06, "epoch": 4.421052631578947, "percentage": 88.42, "elapsed_time": "6:03:50", "remaining_time": "0:47:38"}
1093
+ {"current_steps": 1093, "total_steps": 1235, "loss": 0.2684, "lr": 1.5907623908280112e-06, "epoch": 4.425101214574899, "percentage": 88.5, "elapsed_time": "6:04:10", "remaining_time": "0:47:18"}
1094
+ {"current_steps": 1094, "total_steps": 1235, "loss": 0.2617, "lr": 1.568732761074121e-06, "epoch": 4.42914979757085, "percentage": 88.58, "elapsed_time": "6:04:31", "remaining_time": "0:46:58"}
1095
+ {"current_steps": 1095, "total_steps": 1235, "loss": 0.2399, "lr": 1.5468505072419237e-06, "epoch": 4.433198380566802, "percentage": 88.66, "elapsed_time": "6:04:49", "remaining_time": "0:46:38"}
1096
+ {"current_steps": 1096, "total_steps": 1235, "loss": 0.2628, "lr": 1.5251158043013448e-06, "epoch": 4.437246963562753, "percentage": 88.74, "elapsed_time": "6:05:09", "remaining_time": "0:46:18"}
1097
+ {"current_steps": 1097, "total_steps": 1235, "loss": 0.2555, "lr": 1.5035288260424885e-06, "epoch": 4.441295546558704, "percentage": 88.83, "elapsed_time": "6:05:25", "remaining_time": "0:45:58"}
1098
+ {"current_steps": 1098, "total_steps": 1235, "loss": 0.2623, "lr": 1.4820897450742623e-06, "epoch": 4.445344129554655, "percentage": 88.91, "elapsed_time": "6:05:48", "remaining_time": "0:45:38"}
1099
+ {"current_steps": 1099, "total_steps": 1235, "loss": 0.2661, "lr": 1.4607987328229767e-06, "epoch": 4.449392712550607, "percentage": 88.99, "elapsed_time": "6:06:09", "remaining_time": "0:45:18"}
1100
+ {"current_steps": 1100, "total_steps": 1235, "loss": 0.232, "lr": 1.4396559595310056e-06, "epoch": 4.4534412955465585, "percentage": 89.07, "elapsed_time": "6:06:26", "remaining_time": "0:44:58"}
1101
+ {"current_steps": 1101, "total_steps": 1235, "loss": 0.2476, "lr": 1.4186615942553973e-06, "epoch": 4.4574898785425106, "percentage": 89.15, "elapsed_time": "6:06:47", "remaining_time": "0:44:38"}
1102
+ {"current_steps": 1102, "total_steps": 1235, "loss": 0.264, "lr": 1.3978158048665424e-06, "epoch": 4.461538461538462, "percentage": 89.23, "elapsed_time": "6:07:07", "remaining_time": "0:44:18"}
1103
+ {"current_steps": 1103, "total_steps": 1235, "loss": 0.242, "lr": 1.3771187580468115e-06, "epoch": 4.465587044534413, "percentage": 89.31, "elapsed_time": "6:07:28", "remaining_time": "0:43:58"}
1104
+ {"current_steps": 1104, "total_steps": 1235, "loss": 0.2592, "lr": 1.3565706192892392e-06, "epoch": 4.469635627530364, "percentage": 89.39, "elapsed_time": "6:07:46", "remaining_time": "0:43:38"}
1105
+ {"current_steps": 1105, "total_steps": 1235, "loss": 0.2539, "lr": 1.3361715528961993e-06, "epoch": 4.473684210526316, "percentage": 89.47, "elapsed_time": "6:08:06", "remaining_time": "0:43:18"}
1106
+ {"current_steps": 1106, "total_steps": 1235, "loss": 0.2533, "lr": 1.3159217219780817e-06, "epoch": 4.477732793522267, "percentage": 89.55, "elapsed_time": "6:08:25", "remaining_time": "0:42:58"}
1107
+ {"current_steps": 1107, "total_steps": 1235, "loss": 0.2588, "lr": 1.2958212884519949e-06, "epoch": 4.481781376518219, "percentage": 89.64, "elapsed_time": "6:08:48", "remaining_time": "0:42:38"}
1108
+ {"current_steps": 1108, "total_steps": 1235, "loss": 0.2592, "lr": 1.2758704130404675e-06, "epoch": 4.48582995951417, "percentage": 89.72, "elapsed_time": "6:09:06", "remaining_time": "0:42:18"}
1109
+ {"current_steps": 1109, "total_steps": 1235, "loss": 0.2618, "lr": 1.2560692552701738e-06, "epoch": 4.489878542510121, "percentage": 89.8, "elapsed_time": "6:09:26", "remaining_time": "0:41:58"}
1110
+ {"current_steps": 1110, "total_steps": 1235, "loss": 0.2658, "lr": 1.2364179734706382e-06, "epoch": 4.493927125506072, "percentage": 89.88, "elapsed_time": "6:09:47", "remaining_time": "0:41:38"}
1111
+ {"current_steps": 1111, "total_steps": 1235, "loss": 0.2686, "lr": 1.2169167247729852e-06, "epoch": 4.497975708502024, "percentage": 89.96, "elapsed_time": "6:10:07", "remaining_time": "0:41:18"}
1112
+ {"current_steps": 1112, "total_steps": 1235, "loss": 0.2787, "lr": 1.1975656651086864e-06, "epoch": 4.502024291497976, "percentage": 90.04, "elapsed_time": "6:10:26", "remaining_time": "0:40:58"}
1113
+ {"current_steps": 1113, "total_steps": 1235, "loss": 0.2535, "lr": 1.1783649492082926e-06, "epoch": 4.506072874493928, "percentage": 90.12, "elapsed_time": "6:10:46", "remaining_time": "0:40:38"}
1114
+ {"current_steps": 1114, "total_steps": 1235, "loss": 0.2672, "lr": 1.1593147306002183e-06, "epoch": 4.510121457489879, "percentage": 90.2, "elapsed_time": "6:11:06", "remaining_time": "0:40:18"}
1115
+ {"current_steps": 1115, "total_steps": 1235, "loss": 0.272, "lr": 1.140415161609505e-06, "epoch": 4.51417004048583, "percentage": 90.28, "elapsed_time": "6:11:28", "remaining_time": "0:39:58"}
1116
+ {"current_steps": 1116, "total_steps": 1235, "loss": 0.2668, "lr": 1.121666393356604e-06, "epoch": 4.518218623481781, "percentage": 90.36, "elapsed_time": "6:11:46", "remaining_time": "0:39:38"}
1117
+ {"current_steps": 1117, "total_steps": 1235, "loss": 0.2458, "lr": 1.1030685757561632e-06, "epoch": 4.522267206477733, "percentage": 90.45, "elapsed_time": "6:12:03", "remaining_time": "0:39:18"}
1118
+ {"current_steps": 1118, "total_steps": 1235, "loss": 0.2539, "lr": 1.0846218575158373e-06, "epoch": 4.526315789473684, "percentage": 90.53, "elapsed_time": "6:12:23", "remaining_time": "0:38:58"}
1119
+ {"current_steps": 1119, "total_steps": 1235, "loss": 0.2659, "lr": 1.066326386135097e-06, "epoch": 4.530364372469636, "percentage": 90.61, "elapsed_time": "6:12:46", "remaining_time": "0:38:38"}
1120
+ {"current_steps": 1120, "total_steps": 1235, "loss": 0.2642, "lr": 1.0481823079040398e-06, "epoch": 4.534412955465587, "percentage": 90.69, "elapsed_time": "6:13:06", "remaining_time": "0:38:18"}
1121
+ {"current_steps": 1121, "total_steps": 1235, "loss": 0.2546, "lr": 1.0301897679022344e-06, "epoch": 4.538461538461538, "percentage": 90.77, "elapsed_time": "6:13:26", "remaining_time": "0:37:58"}
1122
+ {"current_steps": 1122, "total_steps": 1235, "loss": 0.2717, "lr": 1.0123489099975491e-06, "epoch": 4.5425101214574894, "percentage": 90.85, "elapsed_time": "6:13:47", "remaining_time": "0:37:38"}
1123
+ {"current_steps": 1123, "total_steps": 1235, "loss": 0.2691, "lr": 9.9465987684501e-07, "epoch": 4.5465587044534415, "percentage": 90.93, "elapsed_time": "6:14:10", "remaining_time": "0:37:19"}
1124
+ {"current_steps": 1124, "total_steps": 1235, "loss": 0.2783, "lr": 9.771228098856534e-07, "epoch": 4.550607287449393, "percentage": 91.01, "elapsed_time": "6:14:29", "remaining_time": "0:36:58"}
1125
+ {"current_steps": 1125, "total_steps": 1235, "loss": 0.2541, "lr": 9.597378493454013e-07, "epoch": 4.554655870445345, "percentage": 91.09, "elapsed_time": "6:14:49", "remaining_time": "0:36:38"}
1126
+ {"current_steps": 1126, "total_steps": 1235, "loss": 0.258, "lr": 9.425051342339353e-07, "epoch": 4.558704453441296, "percentage": 91.17, "elapsed_time": "6:15:09", "remaining_time": "0:36:18"}
1127
+ {"current_steps": 1127, "total_steps": 1235, "loss": 0.2614, "lr": 9.254248023435864e-07, "epoch": 4.562753036437247, "percentage": 91.26, "elapsed_time": "6:15:26", "remaining_time": "0:35:58"}
1128
+ {"current_steps": 1128, "total_steps": 1235, "loss": 0.2541, "lr": 9.084969902482288e-07, "epoch": 4.566801619433198, "percentage": 91.34, "elapsed_time": "6:15:45", "remaining_time": "0:35:38"}
1129
+ {"current_steps": 1129, "total_steps": 1235, "loss": 0.2512, "lr": 8.917218333021993e-07, "epoch": 4.57085020242915, "percentage": 91.42, "elapsed_time": "6:16:06", "remaining_time": "0:35:18"}
1130
+ {"current_steps": 1130, "total_steps": 1235, "loss": 0.2417, "lr": 8.750994656392109e-07, "epoch": 4.574898785425101, "percentage": 91.5, "elapsed_time": "6:16:21", "remaining_time": "0:34:58"}
1131
+ {"current_steps": 1131, "total_steps": 1235, "loss": 0.262, "lr": 8.58630020171265e-07, "epoch": 4.578947368421053, "percentage": 91.58, "elapsed_time": "6:16:41", "remaining_time": "0:34:38"}
1132
+ {"current_steps": 1132, "total_steps": 1235, "loss": 0.2523, "lr": 8.423136285876099e-07, "epoch": 4.582995951417004, "percentage": 91.66, "elapsed_time": "6:17:00", "remaining_time": "0:34:18"}
1133
+ {"current_steps": 1133, "total_steps": 1235, "loss": 0.2649, "lr": 8.26150421353682e-07, "epoch": 4.587044534412955, "percentage": 91.74, "elapsed_time": "6:17:22", "remaining_time": "0:33:58"}
1134
+ {"current_steps": 1134, "total_steps": 1235, "loss": 0.2558, "lr": 8.101405277100549e-07, "epoch": 4.5910931174089065, "percentage": 91.82, "elapsed_time": "6:17:42", "remaining_time": "0:33:38"}
1135
+ {"current_steps": 1135, "total_steps": 1235, "loss": 0.2697, "lr": 7.942840756714077e-07, "epoch": 4.5951417004048585, "percentage": 91.9, "elapsed_time": "6:18:02", "remaining_time": "0:33:18"}
1136
+ {"current_steps": 1136, "total_steps": 1235, "loss": 0.2743, "lr": 7.785811920255093e-07, "epoch": 4.59919028340081, "percentage": 91.98, "elapsed_time": "6:18:23", "remaining_time": "0:32:58"}
1137
+ {"current_steps": 1137, "total_steps": 1235, "loss": 0.2655, "lr": 7.630320023322024e-07, "epoch": 4.603238866396762, "percentage": 92.06, "elapsed_time": "6:18:43", "remaining_time": "0:32:38"}
1138
+ {"current_steps": 1138, "total_steps": 1235, "loss": 0.2687, "lr": 7.476366309223903e-07, "epoch": 4.607287449392713, "percentage": 92.15, "elapsed_time": "6:19:05", "remaining_time": "0:32:18"}
1139
+ {"current_steps": 1139, "total_steps": 1235, "loss": 0.2573, "lr": 7.323952008970537e-07, "epoch": 4.611336032388664, "percentage": 92.23, "elapsed_time": "6:19:22", "remaining_time": "0:31:58"}
1140
+ {"current_steps": 1140, "total_steps": 1235, "loss": 0.2447, "lr": 7.173078341262618e-07, "epoch": 4.615384615384615, "percentage": 92.31, "elapsed_time": "6:19:40", "remaining_time": "0:31:38"}
1141
+ {"current_steps": 1141, "total_steps": 1235, "loss": 0.2536, "lr": 7.023746512481989e-07, "epoch": 4.619433198380567, "percentage": 92.39, "elapsed_time": "6:20:02", "remaining_time": "0:31:18"}
1142
+ {"current_steps": 1142, "total_steps": 1235, "loss": 0.2487, "lr": 6.875957716681902e-07, "epoch": 4.623481781376518, "percentage": 92.47, "elapsed_time": "6:20:19", "remaining_time": "0:30:58"}
1143
+ {"current_steps": 1143, "total_steps": 1235, "loss": 0.2634, "lr": 6.729713135577687e-07, "epoch": 4.62753036437247, "percentage": 92.55, "elapsed_time": "6:20:39", "remaining_time": "0:30:38"}
1144
+ {"current_steps": 1144, "total_steps": 1235, "loss": 0.2771, "lr": 6.585013938537143e-07, "epoch": 4.631578947368421, "percentage": 92.63, "elapsed_time": "6:20:59", "remaining_time": "0:30:18"}
1145
+ {"current_steps": 1145, "total_steps": 1235, "loss": 0.2682, "lr": 6.441861282571115e-07, "epoch": 4.635627530364372, "percentage": 92.71, "elapsed_time": "6:21:13", "remaining_time": "0:29:57"}
1146
+ {"current_steps": 1146, "total_steps": 1235, "loss": 0.2616, "lr": 6.300256312324471e-07, "epoch": 4.6396761133603235, "percentage": 92.79, "elapsed_time": "6:21:32", "remaining_time": "0:29:37"}
1147
+ {"current_steps": 1147, "total_steps": 1235, "loss": 0.2699, "lr": 6.160200160066776e-07, "epoch": 4.6437246963562755, "percentage": 92.87, "elapsed_time": "6:21:53", "remaining_time": "0:29:17"}
1148
+ {"current_steps": 1148, "total_steps": 1235, "loss": 0.2695, "lr": 6.021693945683327e-07, "epoch": 4.647773279352227, "percentage": 92.96, "elapsed_time": "6:22:14", "remaining_time": "0:28:58"}
1149
+ {"current_steps": 1149, "total_steps": 1235, "loss": 0.2557, "lr": 5.884738776666044e-07, "epoch": 4.651821862348179, "percentage": 93.04, "elapsed_time": "6:22:30", "remaining_time": "0:28:37"}
1150
+ {"current_steps": 1150, "total_steps": 1235, "loss": 0.2651, "lr": 5.749335748104878e-07, "epoch": 4.65587044534413, "percentage": 93.12, "elapsed_time": "6:22:47", "remaining_time": "0:28:17"}
1151
+ {"current_steps": 1151, "total_steps": 1235, "loss": 0.2652, "lr": 5.615485942678778e-07, "epoch": 4.659919028340081, "percentage": 93.2, "elapsed_time": "6:23:07", "remaining_time": "0:27:57"}
1152
+ {"current_steps": 1152, "total_steps": 1235, "loss": 0.2693, "lr": 5.483190430647289e-07, "epoch": 4.663967611336032, "percentage": 93.28, "elapsed_time": "6:23:29", "remaining_time": "0:27:37"}
1153
+ {"current_steps": 1153, "total_steps": 1235, "loss": 0.2535, "lr": 5.352450269841747e-07, "epoch": 4.668016194331984, "percentage": 93.36, "elapsed_time": "6:23:49", "remaining_time": "0:27:17"}
1154
+ {"current_steps": 1154, "total_steps": 1235, "loss": 0.2719, "lr": 5.22326650565701e-07, "epoch": 4.672064777327935, "percentage": 93.44, "elapsed_time": "6:24:07", "remaining_time": "0:26:57"}
1155
+ {"current_steps": 1155, "total_steps": 1235, "loss": 0.2824, "lr": 5.095640171043048e-07, "epoch": 4.676113360323887, "percentage": 93.52, "elapsed_time": "6:24:27", "remaining_time": "0:26:37"}
1156
+ {"current_steps": 1156, "total_steps": 1235, "loss": 0.2402, "lr": 4.969572286496594e-07, "epoch": 4.680161943319838, "percentage": 93.6, "elapsed_time": "6:24:44", "remaining_time": "0:26:17"}
1157
+ {"current_steps": 1157, "total_steps": 1235, "loss": 0.2563, "lr": 4.845063860053079e-07, "epoch": 4.684210526315789, "percentage": 93.68, "elapsed_time": "6:25:00", "remaining_time": "0:25:57"}
1158
+ {"current_steps": 1158, "total_steps": 1235, "loss": 0.2517, "lr": 4.7221158872785997e-07, "epoch": 4.6882591093117405, "percentage": 93.77, "elapsed_time": "6:25:20", "remaining_time": "0:25:37"}
1159
+ {"current_steps": 1159, "total_steps": 1235, "loss": 0.2688, "lr": 4.600729351261857e-07, "epoch": 4.6923076923076925, "percentage": 93.85, "elapsed_time": "6:25:43", "remaining_time": "0:25:17"}
1160
+ {"current_steps": 1160, "total_steps": 1235, "loss": 0.2722, "lr": 4.4809052226063355e-07, "epoch": 4.696356275303644, "percentage": 93.93, "elapsed_time": "6:26:03", "remaining_time": "0:24:57"}
1161
+ {"current_steps": 1161, "total_steps": 1235, "loss": 0.2773, "lr": 4.3626444594226046e-07, "epoch": 4.700404858299595, "percentage": 94.01, "elapsed_time": "6:26:24", "remaining_time": "0:24:37"}
1162
+ {"current_steps": 1162, "total_steps": 1235, "loss": 0.2646, "lr": 4.245948007320588e-07, "epoch": 4.704453441295547, "percentage": 94.09, "elapsed_time": "6:26:42", "remaining_time": "0:24:17"}
1163
+ {"current_steps": 1163, "total_steps": 1235, "loss": 0.2534, "lr": 4.130816799401971e-07, "epoch": 4.708502024291498, "percentage": 94.17, "elapsed_time": "6:27:00", "remaining_time": "0:23:57"}
1164
+ {"current_steps": 1164, "total_steps": 1235, "loss": 0.2643, "lr": 4.017251756252827e-07, "epoch": 4.712550607287449, "percentage": 94.25, "elapsed_time": "6:27:19", "remaining_time": "0:23:37"}
1165
+ {"current_steps": 1165, "total_steps": 1235, "loss": 0.258, "lr": 3.9052537859362473e-07, "epoch": 4.716599190283401, "percentage": 94.33, "elapsed_time": "6:27:36", "remaining_time": "0:23:17"}
1166
+ {"current_steps": 1166, "total_steps": 1235, "loss": 0.252, "lr": 3.7948237839849687e-07, "epoch": 4.720647773279352, "percentage": 94.41, "elapsed_time": "6:27:51", "remaining_time": "0:22:57"}
1167
+ {"current_steps": 1167, "total_steps": 1235, "loss": 0.2572, "lr": 3.6859626333943797e-07, "epoch": 4.724696356275303, "percentage": 94.49, "elapsed_time": "6:28:09", "remaining_time": "0:22:37"}
1168
+ {"current_steps": 1168, "total_steps": 1235, "loss": 0.2545, "lr": 3.578671204615347e-07, "epoch": 4.728744939271255, "percentage": 94.57, "elapsed_time": "6:28:29", "remaining_time": "0:22:17"}
1169
+ {"current_steps": 1169, "total_steps": 1235, "loss": 0.2505, "lr": 3.472950355547267e-07, "epoch": 4.732793522267206, "percentage": 94.66, "elapsed_time": "6:28:46", "remaining_time": "0:21:56"}
1170
+ {"current_steps": 1170, "total_steps": 1235, "loss": 0.2525, "lr": 3.3688009315312244e-07, "epoch": 4.7368421052631575, "percentage": 94.74, "elapsed_time": "6:29:05", "remaining_time": "0:21:36"}
1171
+ {"current_steps": 1171, "total_steps": 1235, "loss": 0.2446, "lr": 3.266223765343224e-07, "epoch": 4.7408906882591095, "percentage": 94.82, "elapsed_time": "6:29:23", "remaining_time": "0:21:16"}
1172
+ {"current_steps": 1172, "total_steps": 1235, "loss": 0.2597, "lr": 3.16521967718757e-07, "epoch": 4.744939271255061, "percentage": 94.9, "elapsed_time": "6:29:47", "remaining_time": "0:20:57"}
1173
+ {"current_steps": 1173, "total_steps": 1235, "loss": 0.2514, "lr": 3.0657894746902726e-07, "epoch": 4.748987854251012, "percentage": 94.98, "elapsed_time": "6:30:04", "remaining_time": "0:20:37"}
1174
+ {"current_steps": 1174, "total_steps": 1235, "loss": 0.2582, "lr": 2.9679339528925654e-07, "epoch": 4.753036437246964, "percentage": 95.06, "elapsed_time": "6:30:25", "remaining_time": "0:20:17"}
1175
+ {"current_steps": 1175, "total_steps": 1235, "loss": 0.2567, "lr": 2.871653894244597e-07, "epoch": 4.757085020242915, "percentage": 95.14, "elapsed_time": "6:30:45", "remaining_time": "0:19:57"}
1176
+ {"current_steps": 1176, "total_steps": 1235, "loss": 0.2622, "lr": 2.7769500685991266e-07, "epoch": 4.761133603238866, "percentage": 95.22, "elapsed_time": "6:31:05", "remaining_time": "0:19:37"}
1177
+ {"current_steps": 1177, "total_steps": 1235, "loss": 0.2571, "lr": 2.683823233205485e-07, "epoch": 4.765182186234818, "percentage": 95.3, "elapsed_time": "6:31:26", "remaining_time": "0:19:17"}
1178
+ {"current_steps": 1178, "total_steps": 1235, "loss": 0.2675, "lr": 2.592274132703287e-07, "epoch": 4.769230769230769, "percentage": 95.38, "elapsed_time": "6:31:47", "remaining_time": "0:18:57"}
1179
+ {"current_steps": 1179, "total_steps": 1235, "loss": 0.2643, "lr": 2.502303499116754e-07, "epoch": 4.77327935222672, "percentage": 95.47, "elapsed_time": "6:32:08", "remaining_time": "0:18:37"}
1180
+ {"current_steps": 1180, "total_steps": 1235, "loss": 0.2597, "lr": 2.413912051848666e-07, "epoch": 4.777327935222672, "percentage": 95.55, "elapsed_time": "6:32:30", "remaining_time": "0:18:17"}
1181
+ {"current_steps": 1181, "total_steps": 1235, "loss": 0.2607, "lr": 2.3271004976746613e-07, "epoch": 4.781376518218623, "percentage": 95.63, "elapsed_time": "6:32:48", "remaining_time": "0:17:57"}
1182
+ {"current_steps": 1182, "total_steps": 1235, "loss": 0.2616, "lr": 2.2418695307376393e-07, "epoch": 4.7854251012145745, "percentage": 95.71, "elapsed_time": "6:33:08", "remaining_time": "0:17:37"}
1183
+ {"current_steps": 1183, "total_steps": 1235, "loss": 0.2644, "lr": 2.1582198325420968e-07, "epoch": 4.7894736842105265, "percentage": 95.79, "elapsed_time": "6:33:28", "remaining_time": "0:17:17"}
1184
+ {"current_steps": 1184, "total_steps": 1235, "loss": 0.265, "lr": 2.0761520719488447e-07, "epoch": 4.793522267206478, "percentage": 95.87, "elapsed_time": "6:33:47", "remaining_time": "0:16:57"}
1185
+ {"current_steps": 1185, "total_steps": 1235, "loss": 0.262, "lr": 1.9956669051694798e-07, "epoch": 4.797570850202429, "percentage": 95.95, "elapsed_time": "6:34:08", "remaining_time": "0:16:37"}
1186
+ {"current_steps": 1186, "total_steps": 1235, "loss": 0.2609, "lr": 1.916764975761254e-07, "epoch": 4.801619433198381, "percentage": 96.03, "elapsed_time": "6:34:26", "remaining_time": "0:16:17"}
1187
+ {"current_steps": 1187, "total_steps": 1235, "loss": 0.2551, "lr": 1.839446914621923e-07, "epoch": 4.805668016194332, "percentage": 96.11, "elapsed_time": "6:34:41", "remaining_time": "0:15:57"}
1188
+ {"current_steps": 1188, "total_steps": 1235, "loss": 0.2612, "lr": 1.7637133399845962e-07, "epoch": 4.809716599190283, "percentage": 96.19, "elapsed_time": "6:35:03", "remaining_time": "0:15:37"}
1189
+ {"current_steps": 1189, "total_steps": 1235, "loss": 0.264, "lr": 1.6895648574129397e-07, "epoch": 4.813765182186235, "percentage": 96.28, "elapsed_time": "6:35:24", "remaining_time": "0:15:17"}
1190
+ {"current_steps": 1190, "total_steps": 1235, "loss": 0.2753, "lr": 1.6170020597962465e-07, "epoch": 4.817813765182186, "percentage": 96.36, "elapsed_time": "6:35:41", "remaining_time": "0:14:57"}
1191
+ {"current_steps": 1191, "total_steps": 1235, "loss": 0.2623, "lr": 1.5460255273447078e-07, "epoch": 4.821862348178137, "percentage": 96.44, "elapsed_time": "6:36:02", "remaining_time": "0:14:37"}
1192
+ {"current_steps": 1192, "total_steps": 1235, "loss": 0.2679, "lr": 1.4766358275847715e-07, "epoch": 4.825910931174089, "percentage": 96.52, "elapsed_time": "6:36:23", "remaining_time": "0:14:17"}
1193
+ {"current_steps": 1193, "total_steps": 1235, "loss": 0.2544, "lr": 1.4088335153546573e-07, "epoch": 4.82995951417004, "percentage": 96.6, "elapsed_time": "6:36:44", "remaining_time": "0:13:58"}
1194
+ {"current_steps": 1194, "total_steps": 1235, "loss": 0.2499, "lr": 1.3426191327998496e-07, "epoch": 4.834008097165992, "percentage": 96.68, "elapsed_time": "6:37:02", "remaining_time": "0:13:38"}
1195
+ {"current_steps": 1195, "total_steps": 1235, "loss": 0.278, "lr": 1.277993209368744e-07, "epoch": 4.838056680161944, "percentage": 96.76, "elapsed_time": "6:37:24", "remaining_time": "0:13:18"}
1196
+ {"current_steps": 1196, "total_steps": 1235, "loss": 0.253, "lr": 1.214956261808542e-07, "epoch": 4.842105263157895, "percentage": 96.84, "elapsed_time": "6:37:40", "remaining_time": "0:12:58"}
1197
+ {"current_steps": 1197, "total_steps": 1235, "loss": 0.2681, "lr": 1.1535087941609846e-07, "epoch": 4.846153846153846, "percentage": 96.92, "elapsed_time": "6:38:03", "remaining_time": "0:12:38"}
1198
+ {"current_steps": 1198, "total_steps": 1235, "loss": 0.2695, "lr": 1.0936512977583802e-07, "epoch": 4.850202429149798, "percentage": 97.0, "elapsed_time": "6:38:22", "remaining_time": "0:12:18"}
1199
+ {"current_steps": 1199, "total_steps": 1235, "loss": 0.2648, "lr": 1.0353842512196732e-07, "epoch": 4.854251012145749, "percentage": 97.09, "elapsed_time": "6:38:44", "remaining_time": "0:11:58"}
1200
+ {"current_steps": 1200, "total_steps": 1235, "loss": 0.2494, "lr": 9.787081204466253e-08, "epoch": 4.8582995951417, "percentage": 97.17, "elapsed_time": "6:39:04", "remaining_time": "0:11:38"}
1201
+ {"current_steps": 1201, "total_steps": 1235, "loss": 0.2619, "lr": 9.236233586200627e-08, "epoch": 4.862348178137652, "percentage": 97.25, "elapsed_time": "6:39:21", "remaining_time": "0:11:18"}
1202
+ {"current_steps": 1202, "total_steps": 1235, "loss": 0.2677, "lr": 8.70130406196279e-08, "epoch": 4.866396761133603, "percentage": 97.33, "elapsed_time": "6:39:41", "remaining_time": "0:10:58"}
1203
+ {"current_steps": 1203, "total_steps": 1235, "loss": 0.2792, "lr": 8.182296909035047e-08, "epoch": 4.870445344129554, "percentage": 97.41, "elapsed_time": "6:40:02", "remaining_time": "0:10:38"}
1204
+ {"current_steps": 1204, "total_steps": 1235, "loss": 0.2699, "lr": 7.679216277384439e-08, "epoch": 4.874493927125506, "percentage": 97.49, "elapsed_time": "6:40:23", "remaining_time": "0:10:18"}
1205
+ {"current_steps": 1205, "total_steps": 1235, "loss": 0.2688, "lr": 7.19206618963053e-08, "epoch": 4.8785425101214575, "percentage": 97.57, "elapsed_time": "6:40:43", "remaining_time": "0:09:58"}
1206
+ {"current_steps": 1206, "total_steps": 1235, "loss": 0.2678, "lr": 6.720850541012347e-08, "epoch": 4.882591093117409, "percentage": 97.65, "elapsed_time": "6:41:06", "remaining_time": "0:09:38"}
1207
+ {"current_steps": 1207, "total_steps": 1235, "loss": 0.267, "lr": 6.265573099357714e-08, "epoch": 4.886639676113361, "percentage": 97.73, "elapsed_time": "6:41:26", "remaining_time": "0:09:18"}
1208
+ {"current_steps": 1208, "total_steps": 1235, "loss": 0.2606, "lr": 5.826237505053067e-08, "epoch": 4.890688259109312, "percentage": 97.81, "elapsed_time": "6:41:46", "remaining_time": "0:08:58"}
1209
+ {"current_steps": 1209, "total_steps": 1235, "loss": 0.2618, "lr": 5.4028472710137e-08, "epoch": 4.894736842105263, "percentage": 97.89, "elapsed_time": "6:42:05", "remaining_time": "0:08:38"}
1210
+ {"current_steps": 1210, "total_steps": 1235, "loss": 0.2604, "lr": 4.9954057826571146e-08, "epoch": 4.898785425101215, "percentage": 97.98, "elapsed_time": "6:42:27", "remaining_time": "0:08:18"}
1211
+ {"current_steps": 1211, "total_steps": 1235, "loss": 0.2614, "lr": 4.6039162978743776e-08, "epoch": 4.902834008097166, "percentage": 98.06, "elapsed_time": "6:42:47", "remaining_time": "0:07:58"}
1212
+ {"current_steps": 1212, "total_steps": 1235, "loss": 0.2629, "lr": 4.228381947004812e-08, "epoch": 4.906882591093117, "percentage": 98.14, "elapsed_time": "6:43:08", "remaining_time": "0:07:39"}
1213
+ {"current_steps": 1213, "total_steps": 1235, "loss": 0.2514, "lr": 3.868805732811343e-08, "epoch": 4.910931174089069, "percentage": 98.22, "elapsed_time": "6:43:30", "remaining_time": "0:07:19"}
1214
+ {"current_steps": 1214, "total_steps": 1235, "loss": 0.2677, "lr": 3.525190530455636e-08, "epoch": 4.91497975708502, "percentage": 98.3, "elapsed_time": "6:43:50", "remaining_time": "0:06:59"}
1215
+ {"current_steps": 1215, "total_steps": 1235, "loss": 0.2546, "lr": 3.197539087475887e-08, "epoch": 4.919028340080971, "percentage": 98.38, "elapsed_time": "6:44:08", "remaining_time": "0:06:39"}
1216
+ {"current_steps": 1216, "total_steps": 1235, "loss": 0.2572, "lr": 2.8858540237641786e-08, "epoch": 4.923076923076923, "percentage": 98.46, "elapsed_time": "6:44:25", "remaining_time": "0:06:19"}
1217
+ {"current_steps": 1217, "total_steps": 1235, "loss": 0.2589, "lr": 2.5901378315458247e-08, "epoch": 4.9271255060728745, "percentage": 98.54, "elapsed_time": "6:44:45", "remaining_time": "0:05:59"}
1218
+ {"current_steps": 1218, "total_steps": 1235, "loss": 0.2551, "lr": 2.3103928753598347e-08, "epoch": 4.931174089068826, "percentage": 98.62, "elapsed_time": "6:45:07", "remaining_time": "0:05:39"}
1219
+ {"current_steps": 1219, "total_steps": 1235, "loss": 0.249, "lr": 2.0466213920393718e-08, "epoch": 4.935222672064778, "percentage": 98.7, "elapsed_time": "6:45:28", "remaining_time": "0:05:19"}
1220
+ {"current_steps": 1220, "total_steps": 1235, "loss": 0.2661, "lr": 1.7988254906942115e-08, "epoch": 4.939271255060729, "percentage": 98.79, "elapsed_time": "6:45:47", "remaining_time": "0:04:59"}
1221
+ {"current_steps": 1221, "total_steps": 1235, "loss": 0.2507, "lr": 1.5670071526936447e-08, "epoch": 4.94331983805668, "percentage": 98.87, "elapsed_time": "6:46:03", "remaining_time": "0:04:39"}
1222
+ {"current_steps": 1222, "total_steps": 1235, "loss": 0.2647, "lr": 1.3511682316509344e-08, "epoch": 4.947368421052632, "percentage": 98.95, "elapsed_time": "6:46:19", "remaining_time": "0:04:19"}
1223
+ {"current_steps": 1223, "total_steps": 1235, "loss": 0.2593, "lr": 1.1513104534086605e-08, "epoch": 4.951417004048583, "percentage": 99.03, "elapsed_time": "6:46:37", "remaining_time": "0:03:59"}
1224
+ {"current_steps": 1224, "total_steps": 1235, "loss": 0.2505, "lr": 9.67435416023843e-09, "epoch": 4.955465587044534, "percentage": 99.11, "elapsed_time": "6:46:55", "remaining_time": "0:03:39"}
1225
+ {"current_steps": 1225, "total_steps": 1235, "loss": 0.2582, "lr": 7.995445897566178e-09, "epoch": 4.959514170040486, "percentage": 99.19, "elapsed_time": "6:47:14", "remaining_time": "0:03:19"}
1226
+ {"current_steps": 1226, "total_steps": 1235, "loss": 0.2582, "lr": 6.476393170578021e-09, "epoch": 4.963562753036437, "percentage": 99.27, "elapsed_time": "6:47:33", "remaining_time": "0:02:59"}
1227
+ {"current_steps": 1227, "total_steps": 1235, "loss": 0.2624, "lr": 5.11720812557348e-09, "epoch": 4.967611336032388, "percentage": 99.35, "elapsed_time": "6:47:55", "remaining_time": "0:02:39"}
1228
+ {"current_steps": 1228, "total_steps": 1235, "loss": 0.2623, "lr": 3.917901630563492e-09, "epoch": 4.97165991902834, "percentage": 99.43, "elapsed_time": "6:48:17", "remaining_time": "0:02:19"}
1229
+ {"current_steps": 1229, "total_steps": 1235, "loss": 0.2536, "lr": 2.878483275170485e-09, "epoch": 4.9757085020242915, "percentage": 99.51, "elapsed_time": "6:48:35", "remaining_time": "0:01:59"}
1230
+ {"current_steps": 1230, "total_steps": 1235, "loss": 0.2598, "lr": 1.998961370555108e-09, "epoch": 4.979757085020243, "percentage": 99.6, "elapsed_time": "6:48:55", "remaining_time": "0:01:39"}
1231
+ {"current_steps": 1231, "total_steps": 1235, "loss": 0.2649, "lr": 1.2793429493518361e-09, "epoch": 4.983805668016195, "percentage": 99.68, "elapsed_time": "6:49:16", "remaining_time": "0:01:19"}
1232
+ {"current_steps": 1232, "total_steps": 1235, "loss": 0.2573, "lr": 7.196337656112384e-10, "epoch": 4.987854251012146, "percentage": 99.76, "elapsed_time": "6:49:34", "remaining_time": "0:00:59"}
1233
+ {"current_steps": 1233, "total_steps": 1235, "loss": 0.2533, "lr": 3.198382947511292e-10, "epoch": 4.991902834008097, "percentage": 99.84, "elapsed_time": "6:49:55", "remaining_time": "0:00:39"}
1234
+ {"current_steps": 1234, "total_steps": 1235, "loss": 0.2629, "lr": 7.995973352770137e-11, "epoch": 4.995951417004049, "percentage": 99.92, "elapsed_time": "6:50:11", "remaining_time": "0:00:19"}
1235
+ {"current_steps": 1235, "total_steps": 1235, "loss": 0.258, "lr": 0.0, "epoch": 5.0, "percentage": 100.0, "elapsed_time": "6:50:30", "remaining_time": "0:00:00"}
1236
+ {"current_steps": 1235, "total_steps": 1235, "epoch": 5.0, "percentage": 100.0, "elapsed_time": "6:54:10", "remaining_time": "0:00:00"}