gsmyrnis commited on
Commit
2f2b96d
·
verified ·
1 Parent(s): a7da946

Training in progress, epoch 2

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:552ed359425e49db60643998fe1f7c02970bd06a9a780b38e176a8e99aae1f39
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:53ef9972f8ab44ee3f98bfd40217e015db9403822de59929f1115471df74a4c2
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a211104c63871d635fbd0e9cd5d635f0cebac1cc737dbeff63c0d7874c4bfb45
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eec38113a86d3accf6b2b13633749bed075bbcc04a81a40a8ab1e4dd3cbb9c62
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8447aff97e7bdf052e59d28fd3ba49437d7f8b5740e273d2203989236834d651
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d92b0bc05604445569784f8f8ac6c3483aecfbeb6a56ea26e5c7acc5d52f8292
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bfc592c99c44ed8d8e21b7d56e17efefbb2fa4618b37f58141b3fb56742f9533
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:469387ce4c0e890cb706d29e730abe5a2df5340a0ed970ebf07e3f2de112a09f
3
  size 1089994880
trainer_log.jsonl CHANGED
@@ -692,3 +692,336 @@
692
  {"current_steps": 692, "total_steps": 1026, "loss": 0.5208, "lr": 2.897625618079769e-06, "epoch": 2.0214216163583254, "percentage": 67.45, "elapsed_time": "2:53:16", "remaining_time": "1:23:38"}
693
  {"current_steps": 693, "total_steps": 1026, "loss": 0.5438, "lr": 2.88219697999927e-06, "epoch": 2.024342745861733, "percentage": 67.54, "elapsed_time": "2:53:33", "remaining_time": "1:23:24"}
694
  {"current_steps": 694, "total_steps": 1026, "loss": 0.5444, "lr": 2.8667928766603115e-06, "epoch": 2.0272638753651413, "percentage": 67.64, "elapsed_time": "2:53:47", "remaining_time": "1:23:08"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
692
  {"current_steps": 692, "total_steps": 1026, "loss": 0.5208, "lr": 2.897625618079769e-06, "epoch": 2.0214216163583254, "percentage": 67.45, "elapsed_time": "2:53:16", "remaining_time": "1:23:38"}
693
  {"current_steps": 693, "total_steps": 1026, "loss": 0.5438, "lr": 2.88219697999927e-06, "epoch": 2.024342745861733, "percentage": 67.54, "elapsed_time": "2:53:33", "remaining_time": "1:23:24"}
694
  {"current_steps": 694, "total_steps": 1026, "loss": 0.5444, "lr": 2.8667928766603115e-06, "epoch": 2.0272638753651413, "percentage": 67.64, "elapsed_time": "2:53:47", "remaining_time": "1:23:08"}
695
+ {"current_steps": 695, "total_steps": 1026, "loss": 0.4634, "lr": 2.851413486519388e-06, "epoch": 2.030185004868549, "percentage": 67.74, "elapsed_time": "2:53:58", "remaining_time": "1:22:51"}
696
+ {"current_steps": 696, "total_steps": 1026, "loss": 0.5391, "lr": 2.8360589877466848e-06, "epoch": 2.033106134371957, "percentage": 67.84, "elapsed_time": "2:54:14", "remaining_time": "1:22:36"}
697
+ {"current_steps": 697, "total_steps": 1026, "loss": 0.4871, "lr": 2.8207295582240248e-06, "epoch": 2.036027263875365, "percentage": 67.93, "elapsed_time": "2:54:27", "remaining_time": "1:22:20"}
698
+ {"current_steps": 698, "total_steps": 1026, "loss": 0.5574, "lr": 2.8054253755428017e-06, "epoch": 2.038948393378773, "percentage": 68.03, "elapsed_time": "2:54:42", "remaining_time": "1:22:06"}
699
+ {"current_steps": 699, "total_steps": 1026, "loss": 0.4977, "lr": 2.7901466170019242e-06, "epoch": 2.0418695228821813, "percentage": 68.13, "elapsed_time": "2:55:00", "remaining_time": "1:21:52"}
700
+ {"current_steps": 700, "total_steps": 1026, "loss": 0.56, "lr": 2.774893459605766e-06, "epoch": 2.044790652385589, "percentage": 68.23, "elapsed_time": "2:55:14", "remaining_time": "1:21:36"}
701
+ {"current_steps": 701, "total_steps": 1026, "loss": 0.5028, "lr": 2.7596660800621076e-06, "epoch": 2.047711781888997, "percentage": 68.32, "elapsed_time": "2:55:27", "remaining_time": "1:21:20"}
702
+ {"current_steps": 702, "total_steps": 1026, "loss": 0.5174, "lr": 2.744464654780096e-06, "epoch": 2.050632911392405, "percentage": 68.42, "elapsed_time": "2:55:40", "remaining_time": "1:21:04"}
703
+ {"current_steps": 703, "total_steps": 1026, "loss": 0.5104, "lr": 2.7292893598681934e-06, "epoch": 2.053554040895813, "percentage": 68.52, "elapsed_time": "2:55:56", "remaining_time": "1:20:50"}
704
+ {"current_steps": 704, "total_steps": 1026, "loss": 0.5375, "lr": 2.714140371132149e-06, "epoch": 2.0564751703992212, "percentage": 68.62, "elapsed_time": "2:56:11", "remaining_time": "1:20:35"}
705
+ {"current_steps": 705, "total_steps": 1026, "loss": 0.5105, "lr": 2.69901786407295e-06, "epoch": 2.059396299902629, "percentage": 68.71, "elapsed_time": "2:56:25", "remaining_time": "1:20:19"}
706
+ {"current_steps": 706, "total_steps": 1026, "loss": 0.4899, "lr": 2.6839220138847966e-06, "epoch": 2.062317429406037, "percentage": 68.81, "elapsed_time": "2:56:40", "remaining_time": "1:20:04"}
707
+ {"current_steps": 707, "total_steps": 1026, "loss": 0.5388, "lr": 2.6688529954530612e-06, "epoch": 2.065238558909445, "percentage": 68.91, "elapsed_time": "2:56:56", "remaining_time": "1:19:50"}
708
+ {"current_steps": 708, "total_steps": 1026, "loss": 0.5822, "lr": 2.653810983352282e-06, "epoch": 2.068159688412853, "percentage": 69.01, "elapsed_time": "2:57:07", "remaining_time": "1:19:33"}
709
+ {"current_steps": 709, "total_steps": 1026, "loss": 0.4639, "lr": 2.6387961518441223e-06, "epoch": 2.0710808179162608, "percentage": 69.1, "elapsed_time": "2:57:21", "remaining_time": "1:19:17"}
710
+ {"current_steps": 710, "total_steps": 1026, "loss": 0.5153, "lr": 2.6238086748753587e-06, "epoch": 2.074001947419669, "percentage": 69.2, "elapsed_time": "2:57:35", "remaining_time": "1:19:02"}
711
+ {"current_steps": 711, "total_steps": 1026, "loss": 0.5245, "lr": 2.6088487260758643e-06, "epoch": 2.076923076923077, "percentage": 69.3, "elapsed_time": "2:57:50", "remaining_time": "1:18:47"}
712
+ {"current_steps": 712, "total_steps": 1026, "loss": 0.4816, "lr": 2.593916478756605e-06, "epoch": 2.079844206426485, "percentage": 69.4, "elapsed_time": "2:58:04", "remaining_time": "1:18:31"}
713
+ {"current_steps": 713, "total_steps": 1026, "loss": 0.5824, "lr": 2.579012105907619e-06, "epoch": 2.082765335929893, "percentage": 69.49, "elapsed_time": "2:58:17", "remaining_time": "1:18:16"}
714
+ {"current_steps": 714, "total_steps": 1026, "loss": 0.4738, "lr": 2.5641357801960186e-06, "epoch": 2.0856864654333007, "percentage": 69.59, "elapsed_time": "2:58:27", "remaining_time": "1:17:58"}
715
+ {"current_steps": 715, "total_steps": 1026, "loss": 0.5299, "lr": 2.5492876739639912e-06, "epoch": 2.088607594936709, "percentage": 69.69, "elapsed_time": "2:58:41", "remaining_time": "1:17:43"}
716
+ {"current_steps": 716, "total_steps": 1026, "loss": 0.5162, "lr": 2.534467959226806e-06, "epoch": 2.091528724440117, "percentage": 69.79, "elapsed_time": "2:58:58", "remaining_time": "1:17:29"}
717
+ {"current_steps": 717, "total_steps": 1026, "loss": 0.5081, "lr": 2.519676807670811e-06, "epoch": 2.094449853943525, "percentage": 69.88, "elapsed_time": "2:59:14", "remaining_time": "1:17:14"}
718
+ {"current_steps": 718, "total_steps": 1026, "loss": 0.5576, "lr": 2.504914390651453e-06, "epoch": 2.097370983446933, "percentage": 69.98, "elapsed_time": "2:59:29", "remaining_time": "1:16:59"}
719
+ {"current_steps": 719, "total_steps": 1026, "loss": 0.4998, "lr": 2.4901808791912864e-06, "epoch": 2.1002921129503407, "percentage": 70.08, "elapsed_time": "2:59:44", "remaining_time": "1:16:44"}
720
+ {"current_steps": 720, "total_steps": 1026, "loss": 0.5696, "lr": 2.475476443977996e-06, "epoch": 2.103213242453749, "percentage": 70.18, "elapsed_time": "3:00:01", "remaining_time": "1:16:30"}
721
+ {"current_steps": 721, "total_steps": 1026, "loss": 0.4764, "lr": 2.460801255362425e-06, "epoch": 2.1061343719571566, "percentage": 70.27, "elapsed_time": "3:00:17", "remaining_time": "1:16:15"}
722
+ {"current_steps": 722, "total_steps": 1026, "loss": 0.5357, "lr": 2.446155483356582e-06, "epoch": 2.1090555014605648, "percentage": 70.37, "elapsed_time": "3:00:29", "remaining_time": "1:15:59"}
723
+ {"current_steps": 723, "total_steps": 1026, "loss": 0.4915, "lr": 2.4315392976316923e-06, "epoch": 2.111976630963973, "percentage": 70.47, "elapsed_time": "3:00:44", "remaining_time": "1:15:44"}
724
+ {"current_steps": 724, "total_steps": 1026, "loss": 0.4838, "lr": 2.4169528675162256e-06, "epoch": 2.1148977604673806, "percentage": 70.57, "elapsed_time": "3:00:58", "remaining_time": "1:15:29"}
725
+ {"current_steps": 725, "total_steps": 1026, "loss": 0.537, "lr": 2.40239636199393e-06, "epoch": 2.117818889970789, "percentage": 70.66, "elapsed_time": "3:01:13", "remaining_time": "1:15:14"}
726
+ {"current_steps": 726, "total_steps": 1026, "loss": 0.549, "lr": 2.3878699497018763e-06, "epoch": 2.1207400194741965, "percentage": 70.76, "elapsed_time": "3:01:28", "remaining_time": "1:14:59"}
727
+ {"current_steps": 727, "total_steps": 1026, "loss": 0.5042, "lr": 2.373373798928507e-06, "epoch": 2.1236611489776047, "percentage": 70.86, "elapsed_time": "3:01:39", "remaining_time": "1:14:42"}
728
+ {"current_steps": 728, "total_steps": 1026, "loss": 0.5795, "lr": 2.358908077611684e-06, "epoch": 2.1265822784810124, "percentage": 70.96, "elapsed_time": "3:01:56", "remaining_time": "1:14:28"}
729
+ {"current_steps": 729, "total_steps": 1026, "loss": 0.468, "lr": 2.344472953336747e-06, "epoch": 2.1295034079844206, "percentage": 71.05, "elapsed_time": "3:02:09", "remaining_time": "1:14:12"}
730
+ {"current_steps": 730, "total_steps": 1026, "loss": 0.5022, "lr": 2.3300685933345656e-06, "epoch": 2.132424537487829, "percentage": 71.15, "elapsed_time": "3:02:24", "remaining_time": "1:13:57"}
731
+ {"current_steps": 731, "total_steps": 1026, "loss": 0.5877, "lr": 2.3156951644796065e-06, "epoch": 2.1353456669912365, "percentage": 71.25, "elapsed_time": "3:02:40", "remaining_time": "1:13:43"}
732
+ {"current_steps": 732, "total_steps": 1026, "loss": 0.4814, "lr": 2.3013528332879976e-06, "epoch": 2.1382667964946447, "percentage": 71.35, "elapsed_time": "3:02:54", "remaining_time": "1:13:27"}
733
+ {"current_steps": 733, "total_steps": 1026, "loss": 0.4953, "lr": 2.287041765915606e-06, "epoch": 2.1411879259980524, "percentage": 71.44, "elapsed_time": "3:03:10", "remaining_time": "1:13:13"}
734
+ {"current_steps": 734, "total_steps": 1026, "loss": 0.5269, "lr": 2.272762128156101e-06, "epoch": 2.1441090555014606, "percentage": 71.54, "elapsed_time": "3:03:27", "remaining_time": "1:12:59"}
735
+ {"current_steps": 735, "total_steps": 1026, "loss": 0.5244, "lr": 2.2585140854390432e-06, "epoch": 2.1470301850048688, "percentage": 71.64, "elapsed_time": "3:03:40", "remaining_time": "1:12:43"}
736
+ {"current_steps": 736, "total_steps": 1026, "loss": 0.5341, "lr": 2.2442978028279634e-06, "epoch": 2.1499513145082765, "percentage": 71.73, "elapsed_time": "3:03:56", "remaining_time": "1:12:28"}
737
+ {"current_steps": 737, "total_steps": 1026, "loss": 0.5243, "lr": 2.2301134450184535e-06, "epoch": 2.1528724440116846, "percentage": 71.83, "elapsed_time": "3:04:12", "remaining_time": "1:12:13"}
738
+ {"current_steps": 738, "total_steps": 1026, "loss": 0.5157, "lr": 2.215961176336255e-06, "epoch": 2.1557935735150924, "percentage": 71.93, "elapsed_time": "3:04:25", "remaining_time": "1:11:58"}
739
+ {"current_steps": 739, "total_steps": 1026, "loss": 0.4653, "lr": 2.2018411607353572e-06, "epoch": 2.1587147030185005, "percentage": 72.03, "elapsed_time": "3:04:41", "remaining_time": "1:11:43"}
740
+ {"current_steps": 740, "total_steps": 1026, "loss": 0.5521, "lr": 2.187753561796097e-06, "epoch": 2.1616358325219083, "percentage": 72.12, "elapsed_time": "3:04:58", "remaining_time": "1:11:29"}
741
+ {"current_steps": 741, "total_steps": 1026, "loss": 0.5736, "lr": 2.1736985427232684e-06, "epoch": 2.1645569620253164, "percentage": 72.22, "elapsed_time": "3:05:15", "remaining_time": "1:11:15"}
742
+ {"current_steps": 742, "total_steps": 1026, "loss": 0.4856, "lr": 2.159676266344222e-06, "epoch": 2.1674780915287246, "percentage": 72.32, "elapsed_time": "3:05:28", "remaining_time": "1:10:59"}
743
+ {"current_steps": 743, "total_steps": 1026, "loss": 0.513, "lr": 2.1456868951069875e-06, "epoch": 2.1703992210321323, "percentage": 72.42, "elapsed_time": "3:05:46", "remaining_time": "1:10:45"}
744
+ {"current_steps": 744, "total_steps": 1026, "loss": 0.5183, "lr": 2.1317305910783886e-06, "epoch": 2.1733203505355405, "percentage": 72.51, "elapsed_time": "3:06:01", "remaining_time": "1:10:30"}
745
+ {"current_steps": 745, "total_steps": 1026, "loss": 0.5169, "lr": 2.117807515942163e-06, "epoch": 2.1762414800389482, "percentage": 72.61, "elapsed_time": "3:06:16", "remaining_time": "1:10:15"}
746
+ {"current_steps": 746, "total_steps": 1026, "loss": 0.5256, "lr": 2.1039178309970975e-06, "epoch": 2.1791626095423564, "percentage": 72.71, "elapsed_time": "3:06:30", "remaining_time": "1:10:00"}
747
+ {"current_steps": 747, "total_steps": 1026, "loss": 0.5264, "lr": 2.090061697155147e-06, "epoch": 2.1820837390457646, "percentage": 72.81, "elapsed_time": "3:06:45", "remaining_time": "1:09:45"}
748
+ {"current_steps": 748, "total_steps": 1026, "loss": 0.497, "lr": 2.076239274939582e-06, "epoch": 2.1850048685491723, "percentage": 72.9, "elapsed_time": "3:07:00", "remaining_time": "1:09:30"}
749
+ {"current_steps": 749, "total_steps": 1026, "loss": 0.492, "lr": 2.062450724483118e-06, "epoch": 2.1879259980525805, "percentage": 73.0, "elapsed_time": "3:07:10", "remaining_time": "1:09:13"}
750
+ {"current_steps": 750, "total_steps": 1026, "loss": 0.4833, "lr": 2.0486962055260744e-06, "epoch": 2.190847127555988, "percentage": 73.1, "elapsed_time": "3:07:26", "remaining_time": "1:08:58"}
751
+ {"current_steps": 751, "total_steps": 1026, "loss": 0.5325, "lr": 2.03497587741451e-06, "epoch": 2.1937682570593964, "percentage": 73.2, "elapsed_time": "3:07:40", "remaining_time": "1:08:43"}
752
+ {"current_steps": 752, "total_steps": 1026, "loss": 0.5753, "lr": 2.021289899098384e-06, "epoch": 2.196689386562804, "percentage": 73.29, "elapsed_time": "3:07:55", "remaining_time": "1:08:28"}
753
+ {"current_steps": 753, "total_steps": 1026, "loss": 0.5095, "lr": 2.0076384291297134e-06, "epoch": 2.1996105160662123, "percentage": 73.39, "elapsed_time": "3:08:08", "remaining_time": "1:08:12"}
754
+ {"current_steps": 754, "total_steps": 1026, "loss": 0.5004, "lr": 1.994021625660737e-06, "epoch": 2.2025316455696204, "percentage": 73.49, "elapsed_time": "3:08:21", "remaining_time": "1:07:56"}
755
+ {"current_steps": 755, "total_steps": 1026, "loss": 0.5377, "lr": 1.9804396464420798e-06, "epoch": 2.205452775073028, "percentage": 73.59, "elapsed_time": "3:08:36", "remaining_time": "1:07:41"}
756
+ {"current_steps": 756, "total_steps": 1026, "loss": 0.5214, "lr": 1.966892648820932e-06, "epoch": 2.2083739045764363, "percentage": 73.68, "elapsed_time": "3:08:46", "remaining_time": "1:07:25"}
757
+ {"current_steps": 757, "total_steps": 1026, "loss": 0.522, "lr": 1.953380789739216e-06, "epoch": 2.211295034079844, "percentage": 73.78, "elapsed_time": "3:09:01", "remaining_time": "1:07:10"}
758
+ {"current_steps": 758, "total_steps": 1026, "loss": 0.5279, "lr": 1.939904225731783e-06, "epoch": 2.2142161635832522, "percentage": 73.88, "elapsed_time": "3:09:19", "remaining_time": "1:06:56"}
759
+ {"current_steps": 759, "total_steps": 1026, "loss": 0.5082, "lr": 1.9264631129245836e-06, "epoch": 2.21713729308666, "percentage": 73.98, "elapsed_time": "3:09:34", "remaining_time": "1:06:41"}
760
+ {"current_steps": 760, "total_steps": 1026, "loss": 0.5129, "lr": 1.9130576070328695e-06, "epoch": 2.220058422590068, "percentage": 74.07, "elapsed_time": "3:09:48", "remaining_time": "1:06:26"}
761
+ {"current_steps": 761, "total_steps": 1026, "loss": 0.499, "lr": 1.8996878633593829e-06, "epoch": 2.2229795520934763, "percentage": 74.17, "elapsed_time": "3:10:04", "remaining_time": "1:06:11"}
762
+ {"current_steps": 762, "total_steps": 1026, "loss": 0.5343, "lr": 1.8863540367925676e-06, "epoch": 2.225900681596884, "percentage": 74.27, "elapsed_time": "3:10:16", "remaining_time": "1:05:55"}
763
+ {"current_steps": 763, "total_steps": 1026, "loss": 0.4869, "lr": 1.873056281804762e-06, "epoch": 2.228821811100292, "percentage": 74.37, "elapsed_time": "3:10:29", "remaining_time": "1:05:39"}
764
+ {"current_steps": 764, "total_steps": 1026, "loss": 0.5201, "lr": 1.8597947524504178e-06, "epoch": 2.2317429406037, "percentage": 74.46, "elapsed_time": "3:10:44", "remaining_time": "1:05:24"}
765
+ {"current_steps": 765, "total_steps": 1026, "loss": 0.5354, "lr": 1.8465696023643115e-06, "epoch": 2.234664070107108, "percentage": 74.56, "elapsed_time": "3:11:01", "remaining_time": "1:05:10"}
766
+ {"current_steps": 766, "total_steps": 1026, "loss": 0.558, "lr": 1.8333809847597644e-06, "epoch": 2.2375851996105163, "percentage": 74.66, "elapsed_time": "3:11:15", "remaining_time": "1:04:55"}
767
+ {"current_steps": 767, "total_steps": 1026, "loss": 0.4795, "lr": 1.8202290524268761e-06, "epoch": 2.240506329113924, "percentage": 74.76, "elapsed_time": "3:11:29", "remaining_time": "1:04:39"}
768
+ {"current_steps": 768, "total_steps": 1026, "loss": 0.5228, "lr": 1.8071139577307416e-06, "epoch": 2.243427458617332, "percentage": 74.85, "elapsed_time": "3:11:42", "remaining_time": "1:04:24"}
769
+ {"current_steps": 769, "total_steps": 1026, "loss": 0.4903, "lr": 1.7940358526096885e-06, "epoch": 2.24634858812074, "percentage": 74.95, "elapsed_time": "3:11:57", "remaining_time": "1:04:09"}
770
+ {"current_steps": 770, "total_steps": 1026, "loss": 0.5906, "lr": 1.7809948885735295e-06, "epoch": 2.249269717624148, "percentage": 75.05, "elapsed_time": "3:12:13", "remaining_time": "1:03:54"}
771
+ {"current_steps": 771, "total_steps": 1026, "loss": 0.4726, "lr": 1.7679912167017922e-06, "epoch": 2.252190847127556, "percentage": 75.15, "elapsed_time": "3:12:29", "remaining_time": "1:03:39"}
772
+ {"current_steps": 772, "total_steps": 1026, "loss": 0.5263, "lr": 1.7550249876419746e-06, "epoch": 2.255111976630964, "percentage": 75.24, "elapsed_time": "3:12:45", "remaining_time": "1:03:25"}
773
+ {"current_steps": 773, "total_steps": 1026, "loss": 0.5207, "lr": 1.7420963516078016e-06, "epoch": 2.258033106134372, "percentage": 75.34, "elapsed_time": "3:13:02", "remaining_time": "1:03:11"}
774
+ {"current_steps": 774, "total_steps": 1026, "loss": 0.5634, "lr": 1.7292054583774809e-06, "epoch": 2.26095423563778, "percentage": 75.44, "elapsed_time": "3:13:19", "remaining_time": "1:02:56"}
775
+ {"current_steps": 775, "total_steps": 1026, "loss": 0.5167, "lr": 1.7163524572919748e-06, "epoch": 2.263875365141188, "percentage": 75.54, "elapsed_time": "3:13:33", "remaining_time": "1:02:41"}
776
+ {"current_steps": 776, "total_steps": 1026, "loss": 0.4734, "lr": 1.7035374972532593e-06, "epoch": 2.2667964946445958, "percentage": 75.63, "elapsed_time": "3:13:48", "remaining_time": "1:02:26"}
777
+ {"current_steps": 777, "total_steps": 1026, "loss": 0.5436, "lr": 1.6907607267226079e-06, "epoch": 2.269717624148004, "percentage": 75.73, "elapsed_time": "3:14:04", "remaining_time": "1:02:11"}
778
+ {"current_steps": 778, "total_steps": 1026, "loss": 0.5207, "lr": 1.6780222937188662e-06, "epoch": 2.272638753651412, "percentage": 75.83, "elapsed_time": "3:14:22", "remaining_time": "1:01:57"}
779
+ {"current_steps": 779, "total_steps": 1026, "loss": 0.5304, "lr": 1.665322345816746e-06, "epoch": 2.27555988315482, "percentage": 75.93, "elapsed_time": "3:14:35", "remaining_time": "1:01:42"}
780
+ {"current_steps": 780, "total_steps": 1026, "loss": 0.4604, "lr": 1.6526610301451028e-06, "epoch": 2.278481012658228, "percentage": 76.02, "elapsed_time": "3:14:50", "remaining_time": "1:01:26"}
781
+ {"current_steps": 781, "total_steps": 1026, "loss": 0.508, "lr": 1.6400384933852403e-06, "epoch": 2.2814021421616357, "percentage": 76.12, "elapsed_time": "3:15:01", "remaining_time": "1:01:10"}
782
+ {"current_steps": 782, "total_steps": 1026, "loss": 0.5429, "lr": 1.6274548817692088e-06, "epoch": 2.284323271665044, "percentage": 76.22, "elapsed_time": "3:15:16", "remaining_time": "1:00:55"}
783
+ {"current_steps": 783, "total_steps": 1026, "loss": 0.5126, "lr": 1.6149103410781086e-06, "epoch": 2.2872444011684516, "percentage": 76.32, "elapsed_time": "3:15:27", "remaining_time": "1:00:39"}
784
+ {"current_steps": 784, "total_steps": 1026, "loss": 0.4995, "lr": 1.6024050166404097e-06, "epoch": 2.29016553067186, "percentage": 76.41, "elapsed_time": "3:15:41", "remaining_time": "1:00:24"}
785
+ {"current_steps": 785, "total_steps": 1026, "loss": 0.5333, "lr": 1.5899390533302538e-06, "epoch": 2.293086660175268, "percentage": 76.51, "elapsed_time": "3:15:54", "remaining_time": "1:00:08"}
786
+ {"current_steps": 786, "total_steps": 1026, "loss": 0.5012, "lr": 1.5775125955657877e-06, "epoch": 2.2960077896786757, "percentage": 76.61, "elapsed_time": "3:16:11", "remaining_time": "0:59:54"}
787
+ {"current_steps": 787, "total_steps": 1026, "loss": 0.5413, "lr": 1.5651257873074898e-06, "epoch": 2.298928919182084, "percentage": 76.71, "elapsed_time": "3:16:24", "remaining_time": "0:59:38"}
788
+ {"current_steps": 788, "total_steps": 1026, "loss": 0.5229, "lr": 1.5527787720564946e-06, "epoch": 2.3018500486854916, "percentage": 76.8, "elapsed_time": "3:16:40", "remaining_time": "0:59:24"}
789
+ {"current_steps": 789, "total_steps": 1026, "loss": 0.5079, "lr": 1.5404716928529356e-06, "epoch": 2.3047711781888998, "percentage": 76.9, "elapsed_time": "3:16:53", "remaining_time": "0:59:08"}
790
+ {"current_steps": 790, "total_steps": 1026, "loss": 0.5056, "lr": 1.5282046922742876e-06, "epoch": 2.3076923076923075, "percentage": 77.0, "elapsed_time": "3:17:07", "remaining_time": "0:58:53"}
791
+ {"current_steps": 791, "total_steps": 1026, "loss": 0.5279, "lr": 1.515977912433717e-06, "epoch": 2.3106134371957157, "percentage": 77.1, "elapsed_time": "3:17:23", "remaining_time": "0:58:38"}
792
+ {"current_steps": 792, "total_steps": 1026, "loss": 0.5483, "lr": 1.50379149497843e-06, "epoch": 2.313534566699124, "percentage": 77.19, "elapsed_time": "3:17:37", "remaining_time": "0:58:23"}
793
+ {"current_steps": 793, "total_steps": 1026, "loss": 0.4898, "lr": 1.4916455810880358e-06, "epoch": 2.3164556962025316, "percentage": 77.29, "elapsed_time": "3:17:51", "remaining_time": "0:58:08"}
794
+ {"current_steps": 794, "total_steps": 1026, "loss": 0.5101, "lr": 1.4795403114729095e-06, "epoch": 2.3193768257059397, "percentage": 77.39, "elapsed_time": "3:18:05", "remaining_time": "0:57:52"}
795
+ {"current_steps": 795, "total_steps": 1026, "loss": 0.5854, "lr": 1.4674758263725614e-06, "epoch": 2.3222979552093475, "percentage": 77.49, "elapsed_time": "3:18:18", "remaining_time": "0:57:37"}
796
+ {"current_steps": 796, "total_steps": 1026, "loss": 0.4989, "lr": 1.4554522655540176e-06, "epoch": 2.3252190847127556, "percentage": 77.58, "elapsed_time": "3:18:34", "remaining_time": "0:57:22"}
797
+ {"current_steps": 797, "total_steps": 1026, "loss": 0.516, "lr": 1.4434697683101928e-06, "epoch": 2.3281402142161634, "percentage": 77.68, "elapsed_time": "3:18:48", "remaining_time": "0:57:07"}
798
+ {"current_steps": 798, "total_steps": 1026, "loss": 0.4936, "lr": 1.4315284734582802e-06, "epoch": 2.3310613437195715, "percentage": 77.78, "elapsed_time": "3:19:01", "remaining_time": "0:56:51"}
799
+ {"current_steps": 799, "total_steps": 1026, "loss": 0.5665, "lr": 1.4196285193381431e-06, "epoch": 2.3339824732229797, "percentage": 77.88, "elapsed_time": "3:19:14", "remaining_time": "0:56:36"}
800
+ {"current_steps": 800, "total_steps": 1026, "loss": 0.5191, "lr": 1.4077700438107183e-06, "epoch": 2.3369036027263874, "percentage": 77.97, "elapsed_time": "3:19:28", "remaining_time": "0:56:21"}
801
+ {"current_steps": 801, "total_steps": 1026, "loss": 0.4785, "lr": 1.3959531842564046e-06, "epoch": 2.3398247322297956, "percentage": 78.07, "elapsed_time": "3:19:41", "remaining_time": "0:56:05"}
802
+ {"current_steps": 802, "total_steps": 1026, "loss": 0.5643, "lr": 1.3841780775734847e-06, "epoch": 2.3427458617332033, "percentage": 78.17, "elapsed_time": "3:19:54", "remaining_time": "0:55:49"}
803
+ {"current_steps": 803, "total_steps": 1026, "loss": 0.5629, "lr": 1.3724448601765328e-06, "epoch": 2.3456669912366115, "percentage": 78.27, "elapsed_time": "3:20:07", "remaining_time": "0:55:34"}
804
+ {"current_steps": 804, "total_steps": 1026, "loss": 0.456, "lr": 1.3607536679948397e-06, "epoch": 2.3485881207400197, "percentage": 78.36, "elapsed_time": "3:20:22", "remaining_time": "0:55:19"}
805
+ {"current_steps": 805, "total_steps": 1026, "loss": 0.52, "lr": 1.3491046364708294e-06, "epoch": 2.3515092502434274, "percentage": 78.46, "elapsed_time": "3:20:38", "remaining_time": "0:55:05"}
806
+ {"current_steps": 806, "total_steps": 1026, "loss": 0.5231, "lr": 1.337497900558497e-06, "epoch": 2.3544303797468356, "percentage": 78.56, "elapsed_time": "3:20:51", "remaining_time": "0:54:49"}
807
+ {"current_steps": 807, "total_steps": 1026, "loss": 0.5191, "lr": 1.325933594721841e-06, "epoch": 2.3573515092502433, "percentage": 78.65, "elapsed_time": "3:21:06", "remaining_time": "0:54:34"}
808
+ {"current_steps": 808, "total_steps": 1026, "loss": 0.4641, "lr": 1.3144118529333126e-06, "epoch": 2.3602726387536515, "percentage": 78.75, "elapsed_time": "3:21:21", "remaining_time": "0:54:19"}
809
+ {"current_steps": 809, "total_steps": 1026, "loss": 0.5363, "lr": 1.3029328086722537e-06, "epoch": 2.3631937682570596, "percentage": 78.85, "elapsed_time": "3:21:36", "remaining_time": "0:54:04"}
810
+ {"current_steps": 810, "total_steps": 1026, "loss": 0.5278, "lr": 1.2914965949233572e-06, "epoch": 2.3661148977604674, "percentage": 78.95, "elapsed_time": "3:21:49", "remaining_time": "0:53:49"}
811
+ {"current_steps": 811, "total_steps": 1026, "loss": 0.4919, "lr": 1.2801033441751244e-06, "epoch": 2.3690360272638755, "percentage": 79.04, "elapsed_time": "3:22:03", "remaining_time": "0:53:33"}
812
+ {"current_steps": 812, "total_steps": 1026, "loss": 0.5063, "lr": 1.268753188418329e-06, "epoch": 2.3719571567672832, "percentage": 79.14, "elapsed_time": "3:22:18", "remaining_time": "0:53:19"}
813
+ {"current_steps": 813, "total_steps": 1026, "loss": 0.5185, "lr": 1.257446259144494e-06, "epoch": 2.3748782862706914, "percentage": 79.24, "elapsed_time": "3:22:32", "remaining_time": "0:53:03"}
814
+ {"current_steps": 814, "total_steps": 1026, "loss": 0.5426, "lr": 1.24618268734436e-06, "epoch": 2.377799415774099, "percentage": 79.34, "elapsed_time": "3:22:50", "remaining_time": "0:52:49"}
815
+ {"current_steps": 815, "total_steps": 1026, "loss": 0.4996, "lr": 1.2349626035063705e-06, "epoch": 2.3807205452775073, "percentage": 79.43, "elapsed_time": "3:23:05", "remaining_time": "0:52:34"}
816
+ {"current_steps": 816, "total_steps": 1026, "loss": 0.5392, "lr": 1.2237861376151632e-06, "epoch": 2.3836416747809155, "percentage": 79.53, "elapsed_time": "3:23:16", "remaining_time": "0:52:18"}
817
+ {"current_steps": 817, "total_steps": 1026, "loss": 0.5361, "lr": 1.2126534191500622e-06, "epoch": 2.386562804284323, "percentage": 79.63, "elapsed_time": "3:23:27", "remaining_time": "0:52:02"}
818
+ {"current_steps": 818, "total_steps": 1026, "loss": 0.4732, "lr": 1.2015645770835765e-06, "epoch": 2.3894839337877314, "percentage": 79.73, "elapsed_time": "3:23:41", "remaining_time": "0:51:47"}
819
+ {"current_steps": 819, "total_steps": 1026, "loss": 0.5227, "lr": 1.1905197398799074e-06, "epoch": 2.392405063291139, "percentage": 79.82, "elapsed_time": "3:23:59", "remaining_time": "0:51:33"}
820
+ {"current_steps": 820, "total_steps": 1026, "loss": 0.5606, "lr": 1.1795190354934587e-06, "epoch": 2.3953261927945473, "percentage": 79.92, "elapsed_time": "3:24:14", "remaining_time": "0:51:18"}
821
+ {"current_steps": 821, "total_steps": 1026, "loss": 0.5035, "lr": 1.168562591367361e-06, "epoch": 2.398247322297955, "percentage": 80.02, "elapsed_time": "3:24:32", "remaining_time": "0:51:04"}
822
+ {"current_steps": 822, "total_steps": 1026, "loss": 0.5485, "lr": 1.1576505344319843e-06, "epoch": 2.401168451801363, "percentage": 80.12, "elapsed_time": "3:24:46", "remaining_time": "0:50:49"}
823
+ {"current_steps": 823, "total_steps": 1026, "loss": 0.5122, "lr": 1.146782991103475e-06, "epoch": 2.4040895813047714, "percentage": 80.21, "elapsed_time": "3:25:03", "remaining_time": "0:50:34"}
824
+ {"current_steps": 824, "total_steps": 1026, "loss": 0.528, "lr": 1.1359600872822879e-06, "epoch": 2.407010710808179, "percentage": 80.31, "elapsed_time": "3:25:20", "remaining_time": "0:50:20"}
825
+ {"current_steps": 825, "total_steps": 1026, "loss": 0.5335, "lr": 1.1251819483517334e-06, "epoch": 2.4099318403115872, "percentage": 80.41, "elapsed_time": "3:25:36", "remaining_time": "0:50:05"}
826
+ {"current_steps": 826, "total_steps": 1026, "loss": 0.519, "lr": 1.1144486991765175e-06, "epoch": 2.412852969814995, "percentage": 80.51, "elapsed_time": "3:25:52", "remaining_time": "0:49:50"}
827
+ {"current_steps": 827, "total_steps": 1026, "loss": 0.5488, "lr": 1.1037604641012995e-06, "epoch": 2.415774099318403, "percentage": 80.6, "elapsed_time": "3:26:10", "remaining_time": "0:49:36"}
828
+ {"current_steps": 828, "total_steps": 1026, "loss": 0.4853, "lr": 1.0931173669492472e-06, "epoch": 2.418695228821811, "percentage": 80.7, "elapsed_time": "3:26:24", "remaining_time": "0:49:21"}
829
+ {"current_steps": 829, "total_steps": 1026, "loss": 0.5224, "lr": 1.0825195310206132e-06, "epoch": 2.421616358325219, "percentage": 80.8, "elapsed_time": "3:26:39", "remaining_time": "0:49:06"}
830
+ {"current_steps": 830, "total_steps": 1026, "loss": 0.4971, "lr": 1.0719670790912928e-06, "epoch": 2.424537487828627, "percentage": 80.9, "elapsed_time": "3:26:55", "remaining_time": "0:48:51"}
831
+ {"current_steps": 831, "total_steps": 1026, "loss": 0.5404, "lr": 1.0614601334114099e-06, "epoch": 2.427458617332035, "percentage": 80.99, "elapsed_time": "3:27:08", "remaining_time": "0:48:36"}
832
+ {"current_steps": 832, "total_steps": 1026, "loss": 0.5179, "lr": 1.0509988157038952e-06, "epoch": 2.430379746835443, "percentage": 81.09, "elapsed_time": "3:27:24", "remaining_time": "0:48:21"}
833
+ {"current_steps": 833, "total_steps": 1026, "loss": 0.4465, "lr": 1.0405832471630862e-06, "epoch": 2.433300876338851, "percentage": 81.19, "elapsed_time": "3:27:39", "remaining_time": "0:48:06"}
834
+ {"current_steps": 834, "total_steps": 1026, "loss": 0.5782, "lr": 1.030213548453311e-06, "epoch": 2.436222005842259, "percentage": 81.29, "elapsed_time": "3:27:55", "remaining_time": "0:47:52"}
835
+ {"current_steps": 835, "total_steps": 1026, "loss": 0.471, "lr": 1.019889839707498e-06, "epoch": 2.439143135345667, "percentage": 81.38, "elapsed_time": "3:28:07", "remaining_time": "0:47:36"}
836
+ {"current_steps": 836, "total_steps": 1026, "loss": 0.525, "lr": 1.0096122405257802e-06, "epoch": 2.442064264849075, "percentage": 81.48, "elapsed_time": "3:28:21", "remaining_time": "0:47:21"}
837
+ {"current_steps": 837, "total_steps": 1026, "loss": 0.55, "lr": 9.99380869974116e-07, "epoch": 2.444985394352483, "percentage": 81.58, "elapsed_time": "3:28:32", "remaining_time": "0:47:05"}
838
+ {"current_steps": 838, "total_steps": 1026, "loss": 0.4883, "lr": 9.891958465828999e-07, "epoch": 2.447906523855891, "percentage": 81.68, "elapsed_time": "3:28:48", "remaining_time": "0:46:50"}
839
+ {"current_steps": 839, "total_steps": 1026, "loss": 0.5127, "lr": 9.790572883455974e-07, "epoch": 2.450827653359299, "percentage": 81.77, "elapsed_time": "3:29:03", "remaining_time": "0:46:35"}
840
+ {"current_steps": 840, "total_steps": 1026, "loss": 0.5376, "lr": 9.689653127173743e-07, "epoch": 2.453748782862707, "percentage": 81.87, "elapsed_time": "3:29:18", "remaining_time": "0:46:20"}
841
+ {"current_steps": 841, "total_steps": 1026, "loss": 0.5108, "lr": 9.589200366137375e-07, "epoch": 2.456669912366115, "percentage": 81.97, "elapsed_time": "3:29:34", "remaining_time": "0:46:06"}
842
+ {"current_steps": 842, "total_steps": 1026, "loss": 0.5436, "lr": 9.489215764091813e-07, "epoch": 2.459591041869523, "percentage": 82.07, "elapsed_time": "3:29:48", "remaining_time": "0:45:50"}
843
+ {"current_steps": 843, "total_steps": 1026, "loss": 0.4733, "lr": 9.389700479358365e-07, "epoch": 2.4625121713729308, "percentage": 82.16, "elapsed_time": "3:30:01", "remaining_time": "0:45:35"}
844
+ {"current_steps": 844, "total_steps": 1026, "loss": 0.5599, "lr": 9.290655664821296e-07, "epoch": 2.465433300876339, "percentage": 82.26, "elapsed_time": "3:30:14", "remaining_time": "0:45:20"}
845
+ {"current_steps": 845, "total_steps": 1026, "loss": 0.4792, "lr": 9.192082467914465e-07, "epoch": 2.4683544303797467, "percentage": 82.36, "elapsed_time": "3:30:28", "remaining_time": "0:45:05"}
846
+ {"current_steps": 846, "total_steps": 1026, "loss": 0.5397, "lr": 9.093982030608095e-07, "epoch": 2.471275559883155, "percentage": 82.46, "elapsed_time": "3:30:40", "remaining_time": "0:44:49"}
847
+ {"current_steps": 847, "total_steps": 1026, "loss": 0.4975, "lr": 8.996355489395442e-07, "epoch": 2.474196689386563, "percentage": 82.55, "elapsed_time": "3:30:55", "remaining_time": "0:44:34"}
848
+ {"current_steps": 848, "total_steps": 1026, "loss": 0.4914, "lr": 8.899203975279674e-07, "epoch": 2.4771178188899707, "percentage": 82.65, "elapsed_time": "3:31:08", "remaining_time": "0:44:19"}
849
+ {"current_steps": 849, "total_steps": 1026, "loss": 0.5599, "lr": 8.802528613760775e-07, "epoch": 2.480038948393379, "percentage": 82.75, "elapsed_time": "3:31:25", "remaining_time": "0:44:04"}
850
+ {"current_steps": 850, "total_steps": 1026, "loss": 0.4598, "lr": 8.706330524822548e-07, "epoch": 2.4829600778967866, "percentage": 82.85, "elapsed_time": "3:31:45", "remaining_time": "0:43:50"}
851
+ {"current_steps": 851, "total_steps": 1026, "loss": 0.5195, "lr": 8.610610822919546e-07, "epoch": 2.485881207400195, "percentage": 82.94, "elapsed_time": "3:32:01", "remaining_time": "0:43:36"}
852
+ {"current_steps": 852, "total_steps": 1026, "loss": 0.5181, "lr": 8.515370616964219e-07, "epoch": 2.4888023369036025, "percentage": 83.04, "elapsed_time": "3:32:17", "remaining_time": "0:43:21"}
853
+ {"current_steps": 853, "total_steps": 1026, "loss": 0.5267, "lr": 8.420611010314062e-07, "epoch": 2.4917234664070107, "percentage": 83.14, "elapsed_time": "3:32:33", "remaining_time": "0:43:06"}
854
+ {"current_steps": 854, "total_steps": 1026, "loss": 0.5086, "lr": 8.326333100758843e-07, "epoch": 2.494644595910419, "percentage": 83.24, "elapsed_time": "3:32:49", "remaining_time": "0:42:51"}
855
+ {"current_steps": 855, "total_steps": 1026, "loss": 0.5536, "lr": 8.232537980507848e-07, "epoch": 2.4975657254138266, "percentage": 83.33, "elapsed_time": "3:33:04", "remaining_time": "0:42:36"}
856
+ {"current_steps": 856, "total_steps": 1026, "loss": 0.5238, "lr": 8.13922673617727e-07, "epoch": 2.5004868549172348, "percentage": 83.43, "elapsed_time": "3:33:18", "remaining_time": "0:42:21"}
857
+ {"current_steps": 857, "total_steps": 1026, "loss": 0.4823, "lr": 8.046400448777575e-07, "epoch": 2.5034079844206425, "percentage": 83.53, "elapsed_time": "3:33:34", "remaining_time": "0:42:07"}
858
+ {"current_steps": 858, "total_steps": 1026, "loss": 0.5466, "lr": 7.954060193701019e-07, "epoch": 2.5063291139240507, "percentage": 83.63, "elapsed_time": "3:33:52", "remaining_time": "0:41:52"}
859
+ {"current_steps": 859, "total_steps": 1026, "loss": 0.5104, "lr": 7.862207040709191e-07, "epoch": 2.5092502434274584, "percentage": 83.72, "elapsed_time": "3:34:10", "remaining_time": "0:41:38"}
860
+ {"current_steps": 860, "total_steps": 1026, "loss": 0.5379, "lr": 7.770842053920585e-07, "epoch": 2.5121713729308666, "percentage": 83.82, "elapsed_time": "3:34:24", "remaining_time": "0:41:23"}
861
+ {"current_steps": 861, "total_steps": 1026, "loss": 0.482, "lr": 7.679966291798297e-07, "epoch": 2.5150925024342747, "percentage": 83.92, "elapsed_time": "3:34:41", "remaining_time": "0:41:08"}
862
+ {"current_steps": 862, "total_steps": 1026, "loss": 0.5032, "lr": 7.589580807137742e-07, "epoch": 2.5180136319376825, "percentage": 84.02, "elapsed_time": "3:34:55", "remaining_time": "0:40:53"}
863
+ {"current_steps": 863, "total_steps": 1026, "loss": 0.5706, "lr": 7.4996866470545e-07, "epoch": 2.5209347614410906, "percentage": 84.11, "elapsed_time": "3:35:11", "remaining_time": "0:40:38"}
864
+ {"current_steps": 864, "total_steps": 1026, "loss": 0.5204, "lr": 7.410284852972127e-07, "epoch": 2.523855890944499, "percentage": 84.21, "elapsed_time": "3:35:29", "remaining_time": "0:40:24"}
865
+ {"current_steps": 865, "total_steps": 1026, "loss": 0.4916, "lr": 7.321376460610136e-07, "epoch": 2.5267770204479065, "percentage": 84.31, "elapsed_time": "3:35:44", "remaining_time": "0:40:09"}
866
+ {"current_steps": 866, "total_steps": 1026, "loss": 0.5395, "lr": 7.232962499972002e-07, "epoch": 2.5296981499513143, "percentage": 84.41, "elapsed_time": "3:35:59", "remaining_time": "0:39:54"}
867
+ {"current_steps": 867, "total_steps": 1026, "loss": 0.4924, "lr": 7.145043995333173e-07, "epoch": 2.5326192794547224, "percentage": 84.5, "elapsed_time": "3:36:15", "remaining_time": "0:39:39"}
868
+ {"current_steps": 868, "total_steps": 1026, "loss": 0.513, "lr": 7.057621965229267e-07, "epoch": 2.5355404089581306, "percentage": 84.6, "elapsed_time": "3:36:26", "remaining_time": "0:39:23"}
869
+ {"current_steps": 869, "total_steps": 1026, "loss": 0.5695, "lr": 6.970697422444228e-07, "epoch": 2.5384615384615383, "percentage": 84.7, "elapsed_time": "3:36:41", "remaining_time": "0:39:08"}
870
+ {"current_steps": 870, "total_steps": 1026, "loss": 0.4925, "lr": 6.884271373998608e-07, "epoch": 2.5413826679649465, "percentage": 84.8, "elapsed_time": "3:36:55", "remaining_time": "0:38:53"}
871
+ {"current_steps": 871, "total_steps": 1026, "loss": 0.5083, "lr": 6.798344821137947e-07, "epoch": 2.5443037974683547, "percentage": 84.89, "elapsed_time": "3:37:10", "remaining_time": "0:38:38"}
872
+ {"current_steps": 872, "total_steps": 1026, "loss": 0.5352, "lr": 6.71291875932108e-07, "epoch": 2.5472249269717624, "percentage": 84.99, "elapsed_time": "3:37:23", "remaining_time": "0:38:23"}
873
+ {"current_steps": 873, "total_steps": 1026, "loss": 0.5262, "lr": 6.62799417820868e-07, "epoch": 2.5501460564751706, "percentage": 85.09, "elapsed_time": "3:37:35", "remaining_time": "0:38:08"}
874
+ {"current_steps": 874, "total_steps": 1026, "loss": 0.5399, "lr": 6.543572061651738e-07, "epoch": 2.5530671859785783, "percentage": 85.19, "elapsed_time": "3:37:49", "remaining_time": "0:37:52"}
875
+ {"current_steps": 875, "total_steps": 1026, "loss": 0.4725, "lr": 6.459653387680248e-07, "epoch": 2.5559883154819865, "percentage": 85.28, "elapsed_time": "3:38:00", "remaining_time": "0:37:37"}
876
+ {"current_steps": 876, "total_steps": 1026, "loss": 0.5122, "lr": 6.376239128491784e-07, "epoch": 2.558909444985394, "percentage": 85.38, "elapsed_time": "3:38:11", "remaining_time": "0:37:21"}
877
+ {"current_steps": 877, "total_steps": 1026, "loss": 0.4941, "lr": 6.293330250440277e-07, "epoch": 2.5618305744888024, "percentage": 85.48, "elapsed_time": "3:38:23", "remaining_time": "0:37:06"}
878
+ {"current_steps": 878, "total_steps": 1026, "loss": 0.5592, "lr": 6.210927714024834e-07, "epoch": 2.5647517039922105, "percentage": 85.58, "elapsed_time": "3:38:36", "remaining_time": "0:36:50"}
879
+ {"current_steps": 879, "total_steps": 1026, "loss": 0.5282, "lr": 6.129032473878582e-07, "epoch": 2.5676728334956183, "percentage": 85.67, "elapsed_time": "3:38:49", "remaining_time": "0:36:35"}
880
+ {"current_steps": 880, "total_steps": 1026, "loss": 0.4562, "lr": 6.047645478757635e-07, "epoch": 2.5705939629990264, "percentage": 85.77, "elapsed_time": "3:39:01", "remaining_time": "0:36:20"}
881
+ {"current_steps": 881, "total_steps": 1026, "loss": 0.5501, "lr": 5.966767671530078e-07, "epoch": 2.573515092502434, "percentage": 85.87, "elapsed_time": "3:39:18", "remaining_time": "0:36:05"}
882
+ {"current_steps": 882, "total_steps": 1026, "loss": 0.5359, "lr": 5.88639998916506e-07, "epoch": 2.5764362220058423, "percentage": 85.96, "elapsed_time": "3:39:34", "remaining_time": "0:35:50"}
883
+ {"current_steps": 883, "total_steps": 1026, "loss": 0.5274, "lr": 5.806543362721945e-07, "epoch": 2.57935735150925, "percentage": 86.06, "elapsed_time": "3:39:50", "remaining_time": "0:35:36"}
884
+ {"current_steps": 884, "total_steps": 1026, "loss": 0.4765, "lr": 5.727198717339511e-07, "epoch": 2.5822784810126582, "percentage": 86.16, "elapsed_time": "3:40:01", "remaining_time": "0:35:20"}
885
+ {"current_steps": 885, "total_steps": 1026, "loss": 0.5282, "lr": 5.648366972225222e-07, "epoch": 2.5851996105160664, "percentage": 86.26, "elapsed_time": "3:40:17", "remaining_time": "0:35:05"}
886
+ {"current_steps": 886, "total_steps": 1026, "loss": 0.5137, "lr": 5.570049040644609e-07, "epoch": 2.588120740019474, "percentage": 86.35, "elapsed_time": "3:40:32", "remaining_time": "0:34:50"}
887
+ {"current_steps": 887, "total_steps": 1026, "loss": 0.4973, "lr": 5.492245829910664e-07, "epoch": 2.5910418695228823, "percentage": 86.45, "elapsed_time": "3:40:43", "remaining_time": "0:34:35"}
888
+ {"current_steps": 888, "total_steps": 1026, "loss": 0.4881, "lr": 5.414958241373358e-07, "epoch": 2.59396299902629, "percentage": 86.55, "elapsed_time": "3:40:57", "remaining_time": "0:34:20"}
889
+ {"current_steps": 889, "total_steps": 1026, "loss": 0.5446, "lr": 5.33818717040917e-07, "epoch": 2.596884128529698, "percentage": 86.65, "elapsed_time": "3:41:13", "remaining_time": "0:34:05"}
890
+ {"current_steps": 890, "total_steps": 1026, "loss": 0.5544, "lr": 5.261933506410722e-07, "epoch": 2.599805258033106, "percentage": 86.74, "elapsed_time": "3:41:31", "remaining_time": "0:33:51"}
891
+ {"current_steps": 891, "total_steps": 1026, "loss": 0.4792, "lr": 5.186198132776459e-07, "epoch": 2.602726387536514, "percentage": 86.84, "elapsed_time": "3:41:47", "remaining_time": "0:33:36"}
892
+ {"current_steps": 892, "total_steps": 1026, "loss": 0.5271, "lr": 5.110981926900488e-07, "epoch": 2.6056475170399223, "percentage": 86.94, "elapsed_time": "3:42:01", "remaining_time": "0:33:21"}
893
+ {"current_steps": 893, "total_steps": 1026, "loss": 0.4772, "lr": 5.036285760162307e-07, "epoch": 2.60856864654333, "percentage": 87.04, "elapsed_time": "3:42:13", "remaining_time": "0:33:05"}
894
+ {"current_steps": 894, "total_steps": 1026, "loss": 0.5078, "lr": 4.962110497916789e-07, "epoch": 2.611489776046738, "percentage": 87.13, "elapsed_time": "3:42:28", "remaining_time": "0:32:50"}
895
+ {"current_steps": 895, "total_steps": 1026, "loss": 0.5177, "lr": 4.888456999484098e-07, "epoch": 2.6144109055501463, "percentage": 87.23, "elapsed_time": "3:42:44", "remaining_time": "0:32:36"}
896
+ {"current_steps": 896, "total_steps": 1026, "loss": 0.5068, "lr": 4.815326118139813e-07, "epoch": 2.617332035053554, "percentage": 87.33, "elapsed_time": "3:43:01", "remaining_time": "0:32:21"}
897
+ {"current_steps": 897, "total_steps": 1026, "loss": 0.4836, "lr": 4.742718701104965e-07, "epoch": 2.620253164556962, "percentage": 87.43, "elapsed_time": "3:43:16", "remaining_time": "0:32:06"}
898
+ {"current_steps": 898, "total_steps": 1026, "loss": 0.5688, "lr": 4.670635589536254e-07, "epoch": 2.62317429406037, "percentage": 87.52, "elapsed_time": "3:43:31", "remaining_time": "0:31:51"}
899
+ {"current_steps": 899, "total_steps": 1026, "loss": 0.5213, "lr": 4.599077618516312e-07, "epoch": 2.626095423563778, "percentage": 87.62, "elapsed_time": "3:43:44", "remaining_time": "0:31:36"}
900
+ {"current_steps": 900, "total_steps": 1026, "loss": 0.515, "lr": 4.528045617044019e-07, "epoch": 2.629016553067186, "percentage": 87.72, "elapsed_time": "3:44:03", "remaining_time": "0:31:22"}
901
+ {"current_steps": 901, "total_steps": 1026, "loss": 0.5119, "lr": 4.457540408024896e-07, "epoch": 2.631937682570594, "percentage": 87.82, "elapsed_time": "3:44:15", "remaining_time": "0:31:06"}
902
+ {"current_steps": 902, "total_steps": 1026, "loss": 0.5273, "lr": 4.387562808261575e-07, "epoch": 2.634858812074002, "percentage": 87.91, "elapsed_time": "3:44:30", "remaining_time": "0:30:51"}
903
+ {"current_steps": 903, "total_steps": 1026, "loss": 0.4994, "lr": 4.3181136284443204e-07, "epoch": 2.63777994157741, "percentage": 88.01, "elapsed_time": "3:44:48", "remaining_time": "0:30:37"}
904
+ {"current_steps": 904, "total_steps": 1026, "loss": 0.5186, "lr": 4.249193673141694e-07, "epoch": 2.6407010710808176, "percentage": 88.11, "elapsed_time": "3:45:01", "remaining_time": "0:30:22"}
905
+ {"current_steps": 905, "total_steps": 1026, "loss": 0.5319, "lr": 4.180803740791156e-07, "epoch": 2.643622200584226, "percentage": 88.21, "elapsed_time": "3:45:16", "remaining_time": "0:30:07"}
906
+ {"current_steps": 906, "total_steps": 1026, "loss": 0.5178, "lr": 4.112944623689863e-07, "epoch": 2.646543330087634, "percentage": 88.3, "elapsed_time": "3:45:32", "remaining_time": "0:29:52"}
907
+ {"current_steps": 907, "total_steps": 1026, "loss": 0.4951, "lr": 4.0456171079854833e-07, "epoch": 2.6494644595910417, "percentage": 88.4, "elapsed_time": "3:45:46", "remaining_time": "0:29:37"}
908
+ {"current_steps": 908, "total_steps": 1026, "loss": 0.4837, "lr": 3.978821973667074e-07, "epoch": 2.65238558909445, "percentage": 88.5, "elapsed_time": "3:46:02", "remaining_time": "0:29:22"}
909
+ {"current_steps": 909, "total_steps": 1026, "loss": 0.5526, "lr": 3.9125599945560866e-07, "epoch": 2.655306718597858, "percentage": 88.6, "elapsed_time": "3:46:18", "remaining_time": "0:29:07"}
910
+ {"current_steps": 910, "total_steps": 1026, "loss": 0.5158, "lr": 3.846831938297324e-07, "epoch": 2.6582278481012658, "percentage": 88.69, "elapsed_time": "3:46:32", "remaining_time": "0:28:52"}
911
+ {"current_steps": 911, "total_steps": 1026, "loss": 0.4809, "lr": 3.7816385663501097e-07, "epoch": 2.661148977604674, "percentage": 88.79, "elapsed_time": "3:46:44", "remaining_time": "0:28:37"}
912
+ {"current_steps": 912, "total_steps": 1026, "loss": 0.5363, "lr": 3.716980633979489e-07, "epoch": 2.6640701071080817, "percentage": 88.89, "elapsed_time": "3:47:01", "remaining_time": "0:28:22"}
913
+ {"current_steps": 913, "total_steps": 1026, "loss": 0.508, "lr": 3.6528588902473905e-07, "epoch": 2.66699123661149, "percentage": 88.99, "elapsed_time": "3:47:17", "remaining_time": "0:28:07"}
914
+ {"current_steps": 914, "total_steps": 1026, "loss": 0.5489, "lr": 3.589274078004029e-07, "epoch": 2.6699123661148976, "percentage": 89.08, "elapsed_time": "3:47:31", "remaining_time": "0:27:52"}
915
+ {"current_steps": 915, "total_steps": 1026, "loss": 0.526, "lr": 3.5262269338792623e-07, "epoch": 2.6728334956183057, "percentage": 89.18, "elapsed_time": "3:47:46", "remaining_time": "0:27:37"}
916
+ {"current_steps": 916, "total_steps": 1026, "loss": 0.5332, "lr": 3.463718188274046e-07, "epoch": 2.675754625121714, "percentage": 89.28, "elapsed_time": "3:48:04", "remaining_time": "0:27:23"}
917
+ {"current_steps": 917, "total_steps": 1026, "loss": 0.4997, "lr": 3.401748565352031e-07, "epoch": 2.6786757546251216, "percentage": 89.38, "elapsed_time": "3:48:18", "remaining_time": "0:27:08"}
918
+ {"current_steps": 918, "total_steps": 1026, "loss": 0.4804, "lr": 3.340318783031099e-07, "epoch": 2.68159688412853, "percentage": 89.47, "elapsed_time": "3:48:32", "remaining_time": "0:26:53"}
919
+ {"current_steps": 919, "total_steps": 1026, "loss": 0.57, "lr": 3.279429552975094e-07, "epoch": 2.6845180136319375, "percentage": 89.57, "elapsed_time": "3:48:48", "remaining_time": "0:26:38"}
920
+ {"current_steps": 920, "total_steps": 1026, "loss": 0.418, "lr": 3.219081580585548e-07, "epoch": 2.6874391431353457, "percentage": 89.67, "elapsed_time": "3:49:00", "remaining_time": "0:26:23"}
921
+ {"current_steps": 921, "total_steps": 1026, "loss": 0.562, "lr": 3.159275564993558e-07, "epoch": 2.6903602726387534, "percentage": 89.77, "elapsed_time": "3:49:16", "remaining_time": "0:26:08"}
922
+ {"current_steps": 922, "total_steps": 1026, "loss": 0.48, "lr": 3.100012199051627e-07, "epoch": 2.6932814021421616, "percentage": 89.86, "elapsed_time": "3:49:30", "remaining_time": "0:25:53"}
923
+ {"current_steps": 923, "total_steps": 1026, "loss": 0.5802, "lr": 3.0412921693256657e-07, "epoch": 2.6962025316455698, "percentage": 89.96, "elapsed_time": "3:49:46", "remaining_time": "0:25:38"}
924
+ {"current_steps": 924, "total_steps": 1026, "loss": 0.5124, "lr": 2.9831161560870346e-07, "epoch": 2.6991236611489775, "percentage": 90.06, "elapsed_time": "3:50:02", "remaining_time": "0:25:23"}
925
+ {"current_steps": 925, "total_steps": 1026, "loss": 0.4959, "lr": 2.9254848333046817e-07, "epoch": 2.7020447906523857, "percentage": 90.16, "elapsed_time": "3:50:15", "remaining_time": "0:25:08"}
926
+ {"current_steps": 926, "total_steps": 1026, "loss": 0.529, "lr": 2.8683988686372956e-07, "epoch": 2.704965920155794, "percentage": 90.25, "elapsed_time": "3:50:30", "remaining_time": "0:24:53"}
927
+ {"current_steps": 927, "total_steps": 1026, "loss": 0.5184, "lr": 2.811858923425609e-07, "epoch": 2.7078870496592016, "percentage": 90.35, "elapsed_time": "3:50:45", "remaining_time": "0:24:38"}
928
+ {"current_steps": 928, "total_steps": 1026, "loss": 0.5438, "lr": 2.755865652684703e-07, "epoch": 2.7108081791626093, "percentage": 90.45, "elapsed_time": "3:51:02", "remaining_time": "0:24:23"}
929
+ {"current_steps": 929, "total_steps": 1026, "loss": 0.4978, "lr": 2.7004197050964744e-07, "epoch": 2.7137293086660175, "percentage": 90.55, "elapsed_time": "3:51:19", "remaining_time": "0:24:09"}
930
+ {"current_steps": 930, "total_steps": 1026, "loss": 0.5041, "lr": 2.645521723002037e-07, "epoch": 2.7166504381694256, "percentage": 90.64, "elapsed_time": "3:51:32", "remaining_time": "0:23:54"}
931
+ {"current_steps": 931, "total_steps": 1026, "loss": 0.5587, "lr": 2.591172342394349e-07, "epoch": 2.7195715676728334, "percentage": 90.74, "elapsed_time": "3:51:48", "remaining_time": "0:23:39"}
932
+ {"current_steps": 932, "total_steps": 1026, "loss": 0.5175, "lr": 2.537372192910825e-07, "epoch": 2.7224926971762415, "percentage": 90.84, "elapsed_time": "3:52:03", "remaining_time": "0:23:24"}
933
+ {"current_steps": 933, "total_steps": 1026, "loss": 0.5033, "lr": 2.4841218978260194e-07, "epoch": 2.7254138266796497, "percentage": 90.94, "elapsed_time": "3:52:17", "remaining_time": "0:23:09"}
934
+ {"current_steps": 934, "total_steps": 1026, "loss": 0.5192, "lr": 2.4314220740444595e-07, "epoch": 2.7283349561830574, "percentage": 91.03, "elapsed_time": "3:52:30", "remaining_time": "0:22:54"}
935
+ {"current_steps": 935, "total_steps": 1026, "loss": 0.5193, "lr": 2.3792733320934348e-07, "epoch": 2.731256085686465, "percentage": 91.13, "elapsed_time": "3:52:45", "remaining_time": "0:22:39"}
936
+ {"current_steps": 936, "total_steps": 1026, "loss": 0.5226, "lr": 2.3276762761159588e-07, "epoch": 2.7341772151898733, "percentage": 91.23, "elapsed_time": "3:52:59", "remaining_time": "0:22:24"}
937
+ {"current_steps": 937, "total_steps": 1026, "loss": 0.5234, "lr": 2.276631503863763e-07, "epoch": 2.7370983446932815, "percentage": 91.33, "elapsed_time": "3:53:15", "remaining_time": "0:22:09"}
938
+ {"current_steps": 938, "total_steps": 1026, "loss": 0.4968, "lr": 2.2261396066903916e-07, "epoch": 2.7400194741966892, "percentage": 91.42, "elapsed_time": "3:53:30", "remaining_time": "0:21:54"}
939
+ {"current_steps": 939, "total_steps": 1026, "loss": 0.5135, "lr": 2.176201169544312e-07, "epoch": 2.7429406037000974, "percentage": 91.52, "elapsed_time": "3:53:45", "remaining_time": "0:21:39"}
940
+ {"current_steps": 940, "total_steps": 1026, "loss": 0.5459, "lr": 2.12681677096217e-07, "epoch": 2.7458617332035056, "percentage": 91.62, "elapsed_time": "3:53:59", "remaining_time": "0:21:24"}
941
+ {"current_steps": 941, "total_steps": 1026, "loss": 0.4538, "lr": 2.0779869830620692e-07, "epoch": 2.7487828627069133, "percentage": 91.72, "elapsed_time": "3:54:10", "remaining_time": "0:21:09"}
942
+ {"current_steps": 942, "total_steps": 1026, "loss": 0.4839, "lr": 2.029712371536957e-07, "epoch": 2.7517039922103215, "percentage": 91.81, "elapsed_time": "3:54:27", "remaining_time": "0:20:54"}
943
+ {"current_steps": 943, "total_steps": 1026, "loss": 0.5445, "lr": 1.9819934956480603e-07, "epoch": 2.754625121713729, "percentage": 91.91, "elapsed_time": "3:54:40", "remaining_time": "0:20:39"}
944
+ {"current_steps": 944, "total_steps": 1026, "loss": 0.4934, "lr": 1.9348309082184102e-07, "epoch": 2.7575462512171374, "percentage": 92.01, "elapsed_time": "3:54:54", "remaining_time": "0:20:24"}
945
+ {"current_steps": 945, "total_steps": 1026, "loss": 0.5456, "lr": 1.888225155626433e-07, "epoch": 2.760467380720545, "percentage": 92.11, "elapsed_time": "3:55:08", "remaining_time": "0:20:09"}
946
+ {"current_steps": 946, "total_steps": 1026, "loss": 0.4462, "lr": 1.8421767777996425e-07, "epoch": 2.7633885102239533, "percentage": 92.2, "elapsed_time": "3:55:22", "remaining_time": "0:19:54"}
947
+ {"current_steps": 947, "total_steps": 1026, "loss": 0.5427, "lr": 1.7966863082083507e-07, "epoch": 2.7663096397273614, "percentage": 92.3, "elapsed_time": "3:55:38", "remaining_time": "0:19:39"}
948
+ {"current_steps": 948, "total_steps": 1026, "loss": 0.5568, "lr": 1.7517542738595071e-07, "epoch": 2.769230769230769, "percentage": 92.4, "elapsed_time": "3:55:54", "remaining_time": "0:19:24"}
949
+ {"current_steps": 949, "total_steps": 1026, "loss": 0.5083, "lr": 1.7073811952905862e-07, "epoch": 2.7721518987341773, "percentage": 92.5, "elapsed_time": "3:56:10", "remaining_time": "0:19:09"}
950
+ {"current_steps": 950, "total_steps": 1026, "loss": 0.4505, "lr": 1.6635675865635859e-07, "epoch": 2.775073028237585, "percentage": 92.59, "elapsed_time": "3:56:22", "remaining_time": "0:18:54"}
951
+ {"current_steps": 951, "total_steps": 1026, "loss": 0.5831, "lr": 1.6203139552590175e-07, "epoch": 2.7779941577409932, "percentage": 92.69, "elapsed_time": "3:56:39", "remaining_time": "0:18:39"}
952
+ {"current_steps": 952, "total_steps": 1026, "loss": 0.4751, "lr": 1.5776208024700702e-07, "epoch": 2.780915287244401, "percentage": 92.79, "elapsed_time": "3:56:51", "remaining_time": "0:18:24"}
953
+ {"current_steps": 953, "total_steps": 1026, "loss": 0.532, "lr": 1.5354886227967934e-07, "epoch": 2.783836416747809, "percentage": 92.88, "elapsed_time": "3:57:02", "remaining_time": "0:18:09"}
954
+ {"current_steps": 954, "total_steps": 1026, "loss": 0.5347, "lr": 1.4939179043403474e-07, "epoch": 2.7867575462512173, "percentage": 92.98, "elapsed_time": "3:57:15", "remaining_time": "0:17:54"}
955
+ {"current_steps": 955, "total_steps": 1026, "loss": 0.5459, "lr": 1.4529091286973994e-07, "epoch": 2.789678675754625, "percentage": 93.08, "elapsed_time": "3:57:31", "remaining_time": "0:17:39"}
956
+ {"current_steps": 956, "total_steps": 1026, "loss": 0.4918, "lr": 1.4124627709544814e-07, "epoch": 2.792599805258033, "percentage": 93.18, "elapsed_time": "3:57:47", "remaining_time": "0:17:24"}
957
+ {"current_steps": 957, "total_steps": 1026, "loss": 0.5016, "lr": 1.3725792996825083e-07, "epoch": 2.7955209347614414, "percentage": 93.27, "elapsed_time": "3:57:59", "remaining_time": "0:17:09"}
958
+ {"current_steps": 958, "total_steps": 1026, "loss": 0.5043, "lr": 1.3332591769314006e-07, "epoch": 2.798442064264849, "percentage": 93.37, "elapsed_time": "3:58:12", "remaining_time": "0:16:54"}
959
+ {"current_steps": 959, "total_steps": 1026, "loss": 0.5637, "lr": 1.2945028582246445e-07, "epoch": 2.801363193768257, "percentage": 93.47, "elapsed_time": "3:58:24", "remaining_time": "0:16:39"}
960
+ {"current_steps": 960, "total_steps": 1026, "loss": 0.5017, "lr": 1.2563107925540774e-07, "epoch": 2.804284323271665, "percentage": 93.57, "elapsed_time": "3:58:39", "remaining_time": "0:16:24"}
961
+ {"current_steps": 961, "total_steps": 1026, "loss": 0.5136, "lr": 1.2186834223746612e-07, "epoch": 2.807205452775073, "percentage": 93.66, "elapsed_time": "3:58:55", "remaining_time": "0:16:09"}
962
+ {"current_steps": 962, "total_steps": 1026, "loss": 0.4964, "lr": 1.1816211835993684e-07, "epoch": 2.810126582278481, "percentage": 93.76, "elapsed_time": "3:59:09", "remaining_time": "0:15:54"}
963
+ {"current_steps": 963, "total_steps": 1026, "loss": 0.5112, "lr": 1.1451245055941251e-07, "epoch": 2.813047711781889, "percentage": 93.86, "elapsed_time": "3:59:24", "remaining_time": "0:15:39"}
964
+ {"current_steps": 964, "total_steps": 1026, "loss": 0.5273, "lr": 1.1091938111728374e-07, "epoch": 2.8159688412852972, "percentage": 93.96, "elapsed_time": "3:59:40", "remaining_time": "0:15:24"}
965
+ {"current_steps": 965, "total_steps": 1026, "loss": 0.5398, "lr": 1.0738295165924783e-07, "epoch": 2.818889970788705, "percentage": 94.05, "elapsed_time": "3:59:54", "remaining_time": "0:15:09"}
966
+ {"current_steps": 966, "total_steps": 1026, "loss": 0.5062, "lr": 1.0390320315482982e-07, "epoch": 2.8218111002921127, "percentage": 94.15, "elapsed_time": "4:00:09", "remaining_time": "0:14:54"}
967
+ {"current_steps": 967, "total_steps": 1026, "loss": 0.5114, "lr": 1.0048017591690607e-07, "epoch": 2.824732229795521, "percentage": 94.25, "elapsed_time": "4:00:22", "remaining_time": "0:14:39"}
968
+ {"current_steps": 968, "total_steps": 1026, "loss": 0.5359, "lr": 9.711390960123634e-08, "epoch": 2.827653359298929, "percentage": 94.35, "elapsed_time": "4:00:37", "remaining_time": "0:14:25"}
969
+ {"current_steps": 969, "total_steps": 1026, "loss": 0.4684, "lr": 9.380444320600591e-08, "epoch": 2.8305744888023368, "percentage": 94.44, "elapsed_time": "4:00:50", "remaining_time": "0:14:10"}
970
+ {"current_steps": 970, "total_steps": 1026, "loss": 0.5426, "lr": 9.055181507137245e-08, "epoch": 2.833495618305745, "percentage": 94.54, "elapsed_time": "4:01:02", "remaining_time": "0:13:54"}
971
+ {"current_steps": 971, "total_steps": 1026, "loss": 0.5258, "lr": 8.73560628790232e-08, "epoch": 2.836416747809153, "percentage": 94.64, "elapsed_time": "4:01:19", "remaining_time": "0:13:40"}
972
+ {"current_steps": 972, "total_steps": 1026, "loss": 0.553, "lr": 8.421722365173856e-08, "epoch": 2.839337877312561, "percentage": 94.74, "elapsed_time": "4:01:33", "remaining_time": "0:13:25"}
973
+ {"current_steps": 973, "total_steps": 1026, "loss": 0.4804, "lr": 8.113533375295968e-08, "epoch": 2.842259006815969, "percentage": 94.83, "elapsed_time": "4:01:49", "remaining_time": "0:13:10"}
974
+ {"current_steps": 974, "total_steps": 1026, "loss": 0.5268, "lr": 7.81104288863721e-08, "epoch": 2.8451801363193767, "percentage": 94.93, "elapsed_time": "4:02:06", "remaining_time": "0:12:55"}
975
+ {"current_steps": 975, "total_steps": 1026, "loss": 0.5059, "lr": 7.514254409549005e-08, "epoch": 2.848101265822785, "percentage": 95.03, "elapsed_time": "4:02:21", "remaining_time": "0:12:40"}
976
+ {"current_steps": 976, "total_steps": 1026, "loss": 0.5401, "lr": 7.223171376325e-08, "epoch": 2.8510223953261926, "percentage": 95.13, "elapsed_time": "4:02:34", "remaining_time": "0:12:25"}
977
+ {"current_steps": 977, "total_steps": 1026, "loss": 0.5179, "lr": 6.93779716116122e-08, "epoch": 2.853943524829601, "percentage": 95.22, "elapsed_time": "4:02:48", "remaining_time": "0:12:10"}
978
+ {"current_steps": 978, "total_steps": 1026, "loss": 0.479, "lr": 6.658135070116978e-08, "epoch": 2.856864654333009, "percentage": 95.32, "elapsed_time": "4:03:05", "remaining_time": "0:11:55"}
979
+ {"current_steps": 979, "total_steps": 1026, "loss": 0.4933, "lr": 6.384188343076914e-08, "epoch": 2.8597857838364167, "percentage": 95.42, "elapsed_time": "4:03:17", "remaining_time": "0:11:40"}
980
+ {"current_steps": 980, "total_steps": 1026, "loss": 0.5225, "lr": 6.115960153712963e-08, "epoch": 2.862706913339825, "percentage": 95.52, "elapsed_time": "4:03:32", "remaining_time": "0:11:25"}
981
+ {"current_steps": 981, "total_steps": 1026, "loss": 0.5649, "lr": 5.8534536094478345e-08, "epoch": 2.8656280428432326, "percentage": 95.61, "elapsed_time": "4:03:46", "remaining_time": "0:11:10"}
982
+ {"current_steps": 982, "total_steps": 1026, "loss": 0.474, "lr": 5.596671751419147e-08, "epoch": 2.8685491723466408, "percentage": 95.71, "elapsed_time": "4:04:03", "remaining_time": "0:10:56"}
983
+ {"current_steps": 983, "total_steps": 1026, "loss": 0.529, "lr": 5.3456175544437936e-08, "epoch": 2.8714703018500485, "percentage": 95.81, "elapsed_time": "4:04:17", "remaining_time": "0:10:41"}
984
+ {"current_steps": 984, "total_steps": 1026, "loss": 0.4909, "lr": 5.100293926984023e-08, "epoch": 2.8743914313534566, "percentage": 95.91, "elapsed_time": "4:04:31", "remaining_time": "0:10:26"}
985
+ {"current_steps": 985, "total_steps": 1026, "loss": 0.5029, "lr": 4.860703711113246e-08, "epoch": 2.877312560856865, "percentage": 96.0, "elapsed_time": "4:04:46", "remaining_time": "0:10:11"}
986
+ {"current_steps": 986, "total_steps": 1026, "loss": 0.5376, "lr": 4.626849682483392e-08, "epoch": 2.8802336903602725, "percentage": 96.1, "elapsed_time": "4:05:00", "remaining_time": "0:09:56"}
987
+ {"current_steps": 987, "total_steps": 1026, "loss": 0.5467, "lr": 4.398734550292716e-08, "epoch": 2.8831548198636807, "percentage": 96.2, "elapsed_time": "4:05:16", "remaining_time": "0:09:41"}
988
+ {"current_steps": 988, "total_steps": 1026, "loss": 0.4568, "lr": 4.176360957254266e-08, "epoch": 2.8860759493670884, "percentage": 96.3, "elapsed_time": "4:05:29", "remaining_time": "0:09:26"}
989
+ {"current_steps": 989, "total_steps": 1026, "loss": 0.5319, "lr": 3.959731479565465e-08, "epoch": 2.8889970788704966, "percentage": 96.39, "elapsed_time": "4:05:44", "remaining_time": "0:09:11"}
990
+ {"current_steps": 990, "total_steps": 1026, "loss": 0.5782, "lr": 3.748848626878132e-08, "epoch": 2.8919182083739043, "percentage": 96.49, "elapsed_time": "4:05:59", "remaining_time": "0:08:56"}
991
+ {"current_steps": 991, "total_steps": 1026, "loss": 0.462, "lr": 3.543714842269508e-08, "epoch": 2.8948393378773125, "percentage": 96.59, "elapsed_time": "4:06:13", "remaining_time": "0:08:41"}
992
+ {"current_steps": 992, "total_steps": 1026, "loss": 0.5218, "lr": 3.344332502213887e-08, "epoch": 2.8977604673807207, "percentage": 96.69, "elapsed_time": "4:06:27", "remaining_time": "0:08:26"}
993
+ {"current_steps": 993, "total_steps": 1026, "loss": 0.4832, "lr": 3.150703916554976e-08, "epoch": 2.9006815968841284, "percentage": 96.78, "elapsed_time": "4:06:41", "remaining_time": "0:08:11"}
994
+ {"current_steps": 994, "total_steps": 1026, "loss": 0.5087, "lr": 2.962831328479465e-08, "epoch": 2.9036027263875366, "percentage": 96.88, "elapsed_time": "4:06:55", "remaining_time": "0:07:56"}
995
+ {"current_steps": 995, "total_steps": 1026, "loss": 0.5639, "lr": 2.7807169144906108e-08, "epoch": 2.9065238558909448, "percentage": 96.98, "elapsed_time": "4:07:12", "remaining_time": "0:07:42"}
996
+ {"current_steps": 996, "total_steps": 1026, "loss": 0.534, "lr": 2.6043627843834185e-08, "epoch": 2.9094449853943525, "percentage": 97.08, "elapsed_time": "4:07:27", "remaining_time": "0:07:27"}
997
+ {"current_steps": 997, "total_steps": 1026, "loss": 0.471, "lr": 2.4337709812199405e-08, "epoch": 2.91236611489776, "percentage": 97.17, "elapsed_time": "4:07:41", "remaining_time": "0:07:12"}
998
+ {"current_steps": 998, "total_steps": 1026, "loss": 0.5252, "lr": 2.2689434813056856e-08, "epoch": 2.9152872444011684, "percentage": 97.27, "elapsed_time": "4:07:56", "remaining_time": "0:06:57"}
999
+ {"current_steps": 999, "total_steps": 1026, "loss": 0.5683, "lr": 2.1098821941667457e-08, "epoch": 2.9182083739045765, "percentage": 97.37, "elapsed_time": "4:08:11", "remaining_time": "0:06:42"}
1000
+ {"current_steps": 1000, "total_steps": 1026, "loss": 0.4844, "lr": 1.9565889625275945e-08, "epoch": 2.9211295034079843, "percentage": 97.47, "elapsed_time": "4:08:22", "remaining_time": "0:06:27"}
1001
+ {"current_steps": 1001, "total_steps": 1026, "loss": 0.4881, "lr": 1.8090655622899356e-08, "epoch": 2.9240506329113924, "percentage": 97.56, "elapsed_time": "4:08:35", "remaining_time": "0:06:12"}
1002
+ {"current_steps": 1002, "total_steps": 1026, "loss": 0.5576, "lr": 1.6673137025118303e-08, "epoch": 2.9269717624148006, "percentage": 97.66, "elapsed_time": "4:08:51", "remaining_time": "0:05:57"}
1003
+ {"current_steps": 1003, "total_steps": 1026, "loss": 0.5248, "lr": 1.5313350253882143e-08, "epoch": 2.9298928919182083, "percentage": 97.76, "elapsed_time": "4:09:07", "remaining_time": "0:05:42"}
1004
+ {"current_steps": 1004, "total_steps": 1026, "loss": 0.5207, "lr": 1.4011311062316347e-08, "epoch": 2.9328140214216165, "percentage": 97.86, "elapsed_time": "4:09:23", "remaining_time": "0:05:27"}
1005
+ {"current_steps": 1005, "total_steps": 1026, "loss": 0.483, "lr": 1.2767034534540978e-08, "epoch": 2.9357351509250242, "percentage": 97.95, "elapsed_time": "4:09:36", "remaining_time": "0:05:12"}
1006
+ {"current_steps": 1006, "total_steps": 1026, "loss": 0.4624, "lr": 1.158053508549528e-08, "epoch": 2.9386562804284324, "percentage": 98.05, "elapsed_time": "4:09:49", "remaining_time": "0:04:58"}
1007
+ {"current_steps": 1007, "total_steps": 1026, "loss": 0.5295, "lr": 1.0451826460772252e-08, "epoch": 2.94157740993184, "percentage": 98.15, "elapsed_time": "4:10:07", "remaining_time": "0:04:43"}
1008
+ {"current_steps": 1008, "total_steps": 1026, "loss": 0.5164, "lr": 9.38092173645766e-09, "epoch": 2.9444985394352483, "percentage": 98.25, "elapsed_time": "4:10:23", "remaining_time": "0:04:28"}
1009
+ {"current_steps": 1009, "total_steps": 1026, "loss": 0.5474, "lr": 8.367833318980168e-09, "epoch": 2.9474196689386565, "percentage": 98.34, "elapsed_time": "4:10:40", "remaining_time": "0:04:13"}
1010
+ {"current_steps": 1010, "total_steps": 1026, "loss": 0.4825, "lr": 7.412572944965335e-09, "epoch": 2.950340798442064, "percentage": 98.44, "elapsed_time": "4:10:53", "remaining_time": "0:03:58"}
1011
+ {"current_steps": 1011, "total_steps": 1026, "loss": 0.507, "lr": 6.515151681101284e-09, "epoch": 2.9532619279454724, "percentage": 98.54, "elapsed_time": "4:11:09", "remaining_time": "0:03:43"}
1012
+ {"current_steps": 1012, "total_steps": 1026, "loss": 0.5173, "lr": 5.675579924011576e-09, "epoch": 2.95618305744888, "percentage": 98.64, "elapsed_time": "4:11:24", "remaining_time": "0:03:28"}
1013
+ {"current_steps": 1013, "total_steps": 1026, "loss": 0.4984, "lr": 4.89386740013198e-09, "epoch": 2.9591041869522883, "percentage": 98.73, "elapsed_time": "4:11:41", "remaining_time": "0:03:13"}
1014
+ {"current_steps": 1014, "total_steps": 1026, "loss": 0.5463, "lr": 4.170023165600001e-09, "epoch": 2.962025316455696, "percentage": 98.83, "elapsed_time": "4:11:56", "remaining_time": "0:02:58"}
1015
+ {"current_steps": 1015, "total_steps": 1026, "loss": 0.4929, "lr": 3.5040556061483043e-09, "epoch": 2.964946445959104, "percentage": 98.93, "elapsed_time": "4:12:14", "remaining_time": "0:02:44"}
1016
+ {"current_steps": 1016, "total_steps": 1026, "loss": 0.5618, "lr": 2.8959724370092313e-09, "epoch": 2.9678675754625123, "percentage": 99.03, "elapsed_time": "4:12:29", "remaining_time": "0:02:29"}
1017
+ {"current_steps": 1017, "total_steps": 1026, "loss": 0.5245, "lr": 2.3457807028248734e-09, "epoch": 2.97078870496592, "percentage": 99.12, "elapsed_time": "4:12:44", "remaining_time": "0:02:14"}
1018
+ {"current_steps": 1018, "total_steps": 1026, "loss": 0.5129, "lr": 1.8534867775649169e-09, "epoch": 2.9737098344693282, "percentage": 99.22, "elapsed_time": "4:12:59", "remaining_time": "0:01:59"}
1019
+ {"current_steps": 1019, "total_steps": 1026, "loss": 0.4844, "lr": 1.4190963644522549e-09, "epoch": 2.976630963972736, "percentage": 99.32, "elapsed_time": "4:13:14", "remaining_time": "0:01:44"}
1020
+ {"current_steps": 1020, "total_steps": 1026, "loss": 0.5588, "lr": 1.0426144958985974e-09, "epoch": 2.979552093476144, "percentage": 99.42, "elapsed_time": "4:13:31", "remaining_time": "0:01:29"}
1021
+ {"current_steps": 1021, "total_steps": 1026, "loss": 0.4614, "lr": 7.240455334456276e-10, "epoch": 2.982473222979552, "percentage": 99.51, "elapsed_time": "4:13:46", "remaining_time": "0:01:14"}
1022
+ {"current_steps": 1022, "total_steps": 1026, "loss": 0.5183, "lr": 4.633931677139325e-10, "epoch": 2.98539435248296, "percentage": 99.61, "elapsed_time": "4:13:58", "remaining_time": "0:00:59"}
1023
+ {"current_steps": 1023, "total_steps": 1026, "loss": 0.5797, "lr": 2.60660418360259e-10, "epoch": 2.988315481986368, "percentage": 99.71, "elapsed_time": "4:14:14", "remaining_time": "0:00:44"}
1024
+ {"current_steps": 1024, "total_steps": 1026, "loss": 0.5132, "lr": 1.158496340419868e-10, "epoch": 2.991236611489776, "percentage": 99.81, "elapsed_time": "4:14:27", "remaining_time": "0:00:29"}
1025
+ {"current_steps": 1025, "total_steps": 1026, "loss": 0.5159, "lr": 2.8962492393258546e-11, "epoch": 2.994157740993184, "percentage": 99.9, "elapsed_time": "4:14:40", "remaining_time": "0:00:14"}
1026
+ {"current_steps": 1026, "total_steps": 1026, "loss": 0.5245, "lr": 0.0, "epoch": 2.9970788704965923, "percentage": 100.0, "elapsed_time": "4:14:58", "remaining_time": "0:00:00"}
1027
+ {"current_steps": 1026, "total_steps": 1026, "epoch": 2.9970788704965923, "percentage": 100.0, "elapsed_time": "4:17:05", "remaining_time": "0:00:00"}