neginr commited on
Commit
39424d0
·
verified ·
1 Parent(s): 5cd5bea

Training in progress, epoch 5

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f3b1916b0620b47f9a8f7c35beee8fe22a64a1e29097d647a735e12813ac7508
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3a46caa95559fb9a17c4f90e323b16bab425cfa44c80d0f28c3c9fe4b6f05503
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:efdd687e6d8b3e13c352ad92f086b6ea74ea31c5f3242158ade55e0c470d76b8
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fbcb5009eeb03af18a7781370bc5d529365bab91a1bba8551b94bc5fe4c17c2f
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:621a23f90ae0aaa7606478100ba3c63db23cb19093651ff5bc3dfb90b9571bec
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f1c1143a5c10c6296963cd9f2453e3b34343d85b73e1aedccb21da6accb89d51
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3534f511c6c7c6bf69ee5b28b6cf951607dde1b1add09eb309c1767abc5ad86e
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:35be0b2cc3860226c3f84b548ae0b4e6192449be8da36f5d2cffc8011f727242
3
  size 1089994880
trainer_log.jsonl CHANGED
@@ -966,3 +966,236 @@
966
  {"current_steps": 966, "total_steps": 1200, "loss": 0.3679, "lr": 4.4570807708605825e-06, "epoch": 4.025, "percentage": 80.5, "elapsed_time": "6:23:50", "remaining_time": "1:32:58"}
967
  {"current_steps": 967, "total_steps": 1200, "loss": 0.3851, "lr": 4.420534205145293e-06, "epoch": 4.029166666666667, "percentage": 80.58, "elapsed_time": "6:24:12", "remaining_time": "1:32:34"}
968
  {"current_steps": 968, "total_steps": 1200, "loss": 0.3817, "lr": 4.384119466466816e-06, "epoch": 4.033333333333333, "percentage": 80.67, "elapsed_time": "6:24:36", "remaining_time": "1:32:10"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
966
  {"current_steps": 966, "total_steps": 1200, "loss": 0.3679, "lr": 4.4570807708605825e-06, "epoch": 4.025, "percentage": 80.5, "elapsed_time": "6:23:50", "remaining_time": "1:32:58"}
967
  {"current_steps": 967, "total_steps": 1200, "loss": 0.3851, "lr": 4.420534205145293e-06, "epoch": 4.029166666666667, "percentage": 80.58, "elapsed_time": "6:24:12", "remaining_time": "1:32:34"}
968
  {"current_steps": 968, "total_steps": 1200, "loss": 0.3817, "lr": 4.384119466466816e-06, "epoch": 4.033333333333333, "percentage": 80.67, "elapsed_time": "6:24:36", "remaining_time": "1:32:10"}
969
+ {"current_steps": 969, "total_steps": 1200, "loss": 0.3786, "lr": 4.347836862951722e-06, "epoch": 4.0375, "percentage": 80.75, "elapsed_time": "6:25:00", "remaining_time": "1:31:46"}
970
+ {"current_steps": 970, "total_steps": 1200, "loss": 0.4043, "lr": 4.311686701608486e-06, "epoch": 4.041666666666667, "percentage": 80.83, "elapsed_time": "6:25:24", "remaining_time": "1:31:23"}
971
+ {"current_steps": 971, "total_steps": 1200, "loss": 0.3808, "lr": 4.2756692883249176e-06, "epoch": 4.045833333333333, "percentage": 80.92, "elapsed_time": "6:25:49", "remaining_time": "1:30:59"}
972
+ {"current_steps": 972, "total_steps": 1200, "loss": 0.3893, "lr": 4.239784927865562e-06, "epoch": 4.05, "percentage": 81.0, "elapsed_time": "6:26:12", "remaining_time": "1:30:35"}
973
+ {"current_steps": 973, "total_steps": 1200, "loss": 0.3974, "lr": 4.204033923869135e-06, "epoch": 4.054166666666666, "percentage": 81.08, "elapsed_time": "6:26:35", "remaining_time": "1:30:11"}
974
+ {"current_steps": 974, "total_steps": 1200, "loss": 0.3689, "lr": 4.168416578845936e-06, "epoch": 4.058333333333334, "percentage": 81.17, "elapsed_time": "6:26:59", "remaining_time": "1:29:47"}
975
+ {"current_steps": 975, "total_steps": 1200, "loss": 0.3874, "lr": 4.132933194175299e-06, "epoch": 4.0625, "percentage": 81.25, "elapsed_time": "6:27:22", "remaining_time": "1:29:23"}
976
+ {"current_steps": 976, "total_steps": 1200, "loss": 0.4063, "lr": 4.097584070103042e-06, "epoch": 4.066666666666666, "percentage": 81.33, "elapsed_time": "6:27:45", "remaining_time": "1:28:59"}
977
+ {"current_steps": 977, "total_steps": 1200, "loss": 0.3971, "lr": 4.0623695057389415e-06, "epoch": 4.070833333333334, "percentage": 81.42, "elapsed_time": "6:28:08", "remaining_time": "1:28:35"}
978
+ {"current_steps": 978, "total_steps": 1200, "loss": 0.3813, "lr": 4.027289799054148e-06, "epoch": 4.075, "percentage": 81.5, "elapsed_time": "6:28:32", "remaining_time": "1:28:11"}
979
+ {"current_steps": 979, "total_steps": 1200, "loss": 0.39, "lr": 3.992345246878726e-06, "epoch": 4.079166666666667, "percentage": 81.58, "elapsed_time": "6:28:56", "remaining_time": "1:27:47"}
980
+ {"current_steps": 980, "total_steps": 1200, "loss": 0.4023, "lr": 3.957536144899123e-06, "epoch": 4.083333333333333, "percentage": 81.67, "elapsed_time": "6:29:19", "remaining_time": "1:27:23"}
981
+ {"current_steps": 981, "total_steps": 1200, "loss": 0.3952, "lr": 3.922862787655654e-06, "epoch": 4.0875, "percentage": 81.75, "elapsed_time": "6:29:42", "remaining_time": "1:26:59"}
982
+ {"current_steps": 982, "total_steps": 1200, "loss": 0.3868, "lr": 3.888325468540013e-06, "epoch": 4.091666666666667, "percentage": 81.83, "elapsed_time": "6:30:05", "remaining_time": "1:26:35"}
983
+ {"current_steps": 983, "total_steps": 1200, "loss": 0.393, "lr": 3.853924479792803e-06, "epoch": 4.095833333333333, "percentage": 81.92, "elapsed_time": "6:30:28", "remaining_time": "1:26:11"}
984
+ {"current_steps": 984, "total_steps": 1200, "loss": 0.3889, "lr": 3.819660112501053e-06, "epoch": 4.1, "percentage": 82.0, "elapsed_time": "6:30:51", "remaining_time": "1:25:47"}
985
+ {"current_steps": 985, "total_steps": 1200, "loss": 0.3945, "lr": 3.7855326565957563e-06, "epoch": 4.104166666666667, "percentage": 82.08, "elapsed_time": "6:31:15", "remaining_time": "1:25:24"}
986
+ {"current_steps": 986, "total_steps": 1200, "loss": 0.3921, "lr": 3.7515424008494195e-06, "epoch": 4.108333333333333, "percentage": 82.17, "elapsed_time": "6:31:38", "remaining_time": "1:25:00"}
987
+ {"current_steps": 987, "total_steps": 1200, "loss": 0.383, "lr": 3.717689632873618e-06, "epoch": 4.1125, "percentage": 82.25, "elapsed_time": "6:32:01", "remaining_time": "1:24:35"}
988
+ {"current_steps": 988, "total_steps": 1200, "loss": 0.4101, "lr": 3.683974639116563e-06, "epoch": 4.116666666666666, "percentage": 82.33, "elapsed_time": "6:32:24", "remaining_time": "1:24:12"}
989
+ {"current_steps": 989, "total_steps": 1200, "loss": 0.4102, "lr": 3.650397704860673e-06, "epoch": 4.120833333333334, "percentage": 82.42, "elapsed_time": "6:32:47", "remaining_time": "1:23:48"}
990
+ {"current_steps": 990, "total_steps": 1200, "loss": 0.385, "lr": 3.616959114220162e-06, "epoch": 4.125, "percentage": 82.5, "elapsed_time": "6:33:11", "remaining_time": "1:23:24"}
991
+ {"current_steps": 991, "total_steps": 1200, "loss": 0.381, "lr": 3.583659150138661e-06, "epoch": 4.129166666666666, "percentage": 82.58, "elapsed_time": "6:33:35", "remaining_time": "1:23:00"}
992
+ {"current_steps": 992, "total_steps": 1200, "loss": 0.3873, "lr": 3.5504980943867538e-06, "epoch": 4.133333333333334, "percentage": 82.67, "elapsed_time": "6:33:57", "remaining_time": "1:22:36"}
993
+ {"current_steps": 993, "total_steps": 1200, "loss": 0.3894, "lr": 3.5174762275596864e-06, "epoch": 4.1375, "percentage": 82.75, "elapsed_time": "6:34:21", "remaining_time": "1:22:12"}
994
+ {"current_steps": 994, "total_steps": 1200, "loss": 0.3906, "lr": 3.484593829074918e-06, "epoch": 4.141666666666667, "percentage": 82.83, "elapsed_time": "6:34:44", "remaining_time": "1:21:48"}
995
+ {"current_steps": 995, "total_steps": 1200, "loss": 0.4021, "lr": 3.451851177169789e-06, "epoch": 4.145833333333333, "percentage": 82.92, "elapsed_time": "6:35:07", "remaining_time": "1:21:24"}
996
+ {"current_steps": 996, "total_steps": 1200, "loss": 0.3866, "lr": 3.419248548899168e-06, "epoch": 4.15, "percentage": 83.0, "elapsed_time": "6:35:31", "remaining_time": "1:21:00"}
997
+ {"current_steps": 997, "total_steps": 1200, "loss": 0.3692, "lr": 3.3867862201330916e-06, "epoch": 4.154166666666667, "percentage": 83.08, "elapsed_time": "6:35:54", "remaining_time": "1:20:36"}
998
+ {"current_steps": 998, "total_steps": 1200, "loss": 0.3906, "lr": 3.354464465554448e-06, "epoch": 4.158333333333333, "percentage": 83.17, "elapsed_time": "6:36:17", "remaining_time": "1:20:12"}
999
+ {"current_steps": 999, "total_steps": 1200, "loss": 0.3938, "lr": 3.3222835586566384e-06, "epoch": 4.1625, "percentage": 83.25, "elapsed_time": "6:36:40", "remaining_time": "1:19:48"}
1000
+ {"current_steps": 1000, "total_steps": 1200, "loss": 0.3988, "lr": 3.290243771741275e-06, "epoch": 4.166666666666667, "percentage": 83.33, "elapsed_time": "6:37:02", "remaining_time": "1:19:24"}
1001
+ {"current_steps": 1001, "total_steps": 1200, "loss": 0.3951, "lr": 3.2583453759158634e-06, "epoch": 4.170833333333333, "percentage": 83.42, "elapsed_time": "6:37:26", "remaining_time": "1:19:00"}
1002
+ {"current_steps": 1002, "total_steps": 1200, "loss": 0.3935, "lr": 3.2265886410915214e-06, "epoch": 4.175, "percentage": 83.5, "elapsed_time": "6:37:50", "remaining_time": "1:18:36"}
1003
+ {"current_steps": 1003, "total_steps": 1200, "loss": 0.3829, "lr": 3.1949738359806905e-06, "epoch": 4.179166666666666, "percentage": 83.58, "elapsed_time": "6:38:13", "remaining_time": "1:18:12"}
1004
+ {"current_steps": 1004, "total_steps": 1200, "loss": 0.3947, "lr": 3.1635012280948496e-06, "epoch": 4.183333333333334, "percentage": 83.67, "elapsed_time": "6:38:36", "remaining_time": "1:17:49"}
1005
+ {"current_steps": 1005, "total_steps": 1200, "loss": 0.4171, "lr": 3.13217108374229e-06, "epoch": 4.1875, "percentage": 83.75, "elapsed_time": "6:39:00", "remaining_time": "1:17:25"}
1006
+ {"current_steps": 1006, "total_steps": 1200, "loss": 0.3934, "lr": 3.1009836680257965e-06, "epoch": 4.191666666666666, "percentage": 83.83, "elapsed_time": "6:39:24", "remaining_time": "1:17:01"}
1007
+ {"current_steps": 1007, "total_steps": 1200, "loss": 0.3857, "lr": 3.0699392448404787e-06, "epoch": 4.195833333333334, "percentage": 83.92, "elapsed_time": "6:39:47", "remaining_time": "1:16:37"}
1008
+ {"current_steps": 1008, "total_steps": 1200, "loss": 0.3959, "lr": 3.039038076871481e-06, "epoch": 4.2, "percentage": 84.0, "elapsed_time": "6:40:10", "remaining_time": "1:16:13"}
1009
+ {"current_steps": 1009, "total_steps": 1200, "loss": 0.3966, "lr": 3.00828042559179e-06, "epoch": 4.204166666666667, "percentage": 84.08, "elapsed_time": "6:40:32", "remaining_time": "1:15:49"}
1010
+ {"current_steps": 1010, "total_steps": 1200, "loss": 0.397, "lr": 2.9776665512600054e-06, "epoch": 4.208333333333333, "percentage": 84.17, "elapsed_time": "6:40:55", "remaining_time": "1:15:25"}
1011
+ {"current_steps": 1011, "total_steps": 1200, "loss": 0.397, "lr": 2.947196712918157e-06, "epoch": 4.2125, "percentage": 84.25, "elapsed_time": "6:41:18", "remaining_time": "1:15:01"}
1012
+ {"current_steps": 1012, "total_steps": 1200, "loss": 0.3964, "lr": 2.9168711683894903e-06, "epoch": 4.216666666666667, "percentage": 84.33, "elapsed_time": "6:41:41", "remaining_time": "1:14:37"}
1013
+ {"current_steps": 1013, "total_steps": 1200, "loss": 0.3973, "lr": 2.886690174276301e-06, "epoch": 4.220833333333333, "percentage": 84.42, "elapsed_time": "6:42:05", "remaining_time": "1:14:13"}
1014
+ {"current_steps": 1014, "total_steps": 1200, "loss": 0.3999, "lr": 2.8566539859577558e-06, "epoch": 4.225, "percentage": 84.5, "elapsed_time": "6:42:28", "remaining_time": "1:13:49"}
1015
+ {"current_steps": 1015, "total_steps": 1200, "loss": 0.3836, "lr": 2.8267628575877414e-06, "epoch": 4.229166666666667, "percentage": 84.58, "elapsed_time": "6:42:52", "remaining_time": "1:13:25"}
1016
+ {"current_steps": 1016, "total_steps": 1200, "loss": 0.3838, "lr": 2.7970170420926957e-06, "epoch": 4.233333333333333, "percentage": 84.67, "elapsed_time": "6:43:16", "remaining_time": "1:13:02"}
1017
+ {"current_steps": 1017, "total_steps": 1200, "loss": 0.3882, "lr": 2.7674167911694837e-06, "epoch": 4.2375, "percentage": 84.75, "elapsed_time": "6:43:39", "remaining_time": "1:12:38"}
1018
+ {"current_steps": 1018, "total_steps": 1200, "loss": 0.3927, "lr": 2.737962355283272e-06, "epoch": 4.241666666666666, "percentage": 84.83, "elapsed_time": "6:44:02", "remaining_time": "1:12:14"}
1019
+ {"current_steps": 1019, "total_steps": 1200, "loss": 0.398, "lr": 2.7086539836653923e-06, "epoch": 4.245833333333334, "percentage": 84.92, "elapsed_time": "6:44:25", "remaining_time": "1:11:50"}
1020
+ {"current_steps": 1020, "total_steps": 1200, "loss": 0.3984, "lr": 2.679491924311226e-06, "epoch": 4.25, "percentage": 85.0, "elapsed_time": "6:44:49", "remaining_time": "1:11:26"}
1021
+ {"current_steps": 1021, "total_steps": 1200, "loss": 0.3887, "lr": 2.65047642397815e-06, "epoch": 4.254166666666666, "percentage": 85.08, "elapsed_time": "6:45:12", "remaining_time": "1:11:02"}
1022
+ {"current_steps": 1022, "total_steps": 1200, "loss": 0.3893, "lr": 2.6216077281833976e-06, "epoch": 4.258333333333334, "percentage": 85.17, "elapsed_time": "6:45:35", "remaining_time": "1:10:38"}
1023
+ {"current_steps": 1023, "total_steps": 1200, "loss": 0.3929, "lr": 2.5928860812020063e-06, "epoch": 4.2625, "percentage": 85.25, "elapsed_time": "6:45:58", "remaining_time": "1:10:14"}
1024
+ {"current_steps": 1024, "total_steps": 1200, "loss": 0.3846, "lr": 2.564311726064754e-06, "epoch": 4.266666666666667, "percentage": 85.33, "elapsed_time": "6:46:21", "remaining_time": "1:09:50"}
1025
+ {"current_steps": 1025, "total_steps": 1200, "loss": 0.3758, "lr": 2.535884904556085e-06, "epoch": 4.270833333333333, "percentage": 85.42, "elapsed_time": "6:46:45", "remaining_time": "1:09:26"}
1026
+ {"current_steps": 1026, "total_steps": 1200, "loss": 0.3927, "lr": 2.5076058572120855e-06, "epoch": 4.275, "percentage": 85.5, "elapsed_time": "6:47:08", "remaining_time": "1:09:02"}
1027
+ {"current_steps": 1027, "total_steps": 1200, "loss": 0.3877, "lr": 2.4794748233184285e-06, "epoch": 4.279166666666667, "percentage": 85.58, "elapsed_time": "6:47:31", "remaining_time": "1:08:38"}
1028
+ {"current_steps": 1028, "total_steps": 1200, "loss": 0.3892, "lr": 2.4514920409083586e-06, "epoch": 4.283333333333333, "percentage": 85.67, "elapsed_time": "6:47:53", "remaining_time": "1:08:14"}
1029
+ {"current_steps": 1029, "total_steps": 1200, "loss": 0.3848, "lr": 2.423657746760695e-06, "epoch": 4.2875, "percentage": 85.75, "elapsed_time": "6:48:17", "remaining_time": "1:07:51"}
1030
+ {"current_steps": 1030, "total_steps": 1200, "loss": 0.4155, "lr": 2.3959721763977805e-06, "epoch": 4.291666666666667, "percentage": 85.83, "elapsed_time": "6:48:40", "remaining_time": "1:07:27"}
1031
+ {"current_steps": 1031, "total_steps": 1200, "loss": 0.3843, "lr": 2.3684355640835334e-06, "epoch": 4.295833333333333, "percentage": 85.92, "elapsed_time": "6:49:03", "remaining_time": "1:07:03"}
1032
+ {"current_steps": 1032, "total_steps": 1200, "loss": 0.3884, "lr": 2.3410481428214602e-06, "epoch": 4.3, "percentage": 86.0, "elapsed_time": "6:49:26", "remaining_time": "1:06:39"}
1033
+ {"current_steps": 1033, "total_steps": 1200, "loss": 0.3806, "lr": 2.313810144352664e-06, "epoch": 4.304166666666666, "percentage": 86.08, "elapsed_time": "6:49:48", "remaining_time": "1:06:15"}
1034
+ {"current_steps": 1034, "total_steps": 1200, "loss": 0.3886, "lr": 2.2867217991538793e-06, "epoch": 4.308333333333334, "percentage": 86.17, "elapsed_time": "6:50:12", "remaining_time": "1:05:51"}
1035
+ {"current_steps": 1035, "total_steps": 1200, "loss": 0.3943, "lr": 2.259783336435566e-06, "epoch": 4.3125, "percentage": 86.25, "elapsed_time": "6:50:36", "remaining_time": "1:05:27"}
1036
+ {"current_steps": 1036, "total_steps": 1200, "loss": 0.3876, "lr": 2.2329949841399223e-06, "epoch": 4.316666666666666, "percentage": 86.33, "elapsed_time": "6:50:59", "remaining_time": "1:05:03"}
1037
+ {"current_steps": 1037, "total_steps": 1200, "loss": 0.3901, "lr": 2.206356968938965e-06, "epoch": 4.320833333333334, "percentage": 86.42, "elapsed_time": "6:51:22", "remaining_time": "1:04:39"}
1038
+ {"current_steps": 1038, "total_steps": 1200, "loss": 0.3963, "lr": 2.1798695162326444e-06, "epoch": 4.325, "percentage": 86.5, "elapsed_time": "6:51:45", "remaining_time": "1:04:15"}
1039
+ {"current_steps": 1039, "total_steps": 1200, "loss": 0.3935, "lr": 2.1535328501468935e-06, "epoch": 4.329166666666667, "percentage": 86.58, "elapsed_time": "6:52:08", "remaining_time": "1:03:51"}
1040
+ {"current_steps": 1040, "total_steps": 1200, "loss": 0.4077, "lr": 2.127347193531757e-06, "epoch": 4.333333333333333, "percentage": 86.67, "elapsed_time": "6:52:31", "remaining_time": "1:03:27"}
1041
+ {"current_steps": 1041, "total_steps": 1200, "loss": 0.395, "lr": 2.1013127679595002e-06, "epoch": 4.3375, "percentage": 86.75, "elapsed_time": "6:52:53", "remaining_time": "1:03:03"}
1042
+ {"current_steps": 1042, "total_steps": 1200, "loss": 0.3948, "lr": 2.0754297937227317e-06, "epoch": 4.341666666666667, "percentage": 86.83, "elapsed_time": "6:53:17", "remaining_time": "1:02:40"}
1043
+ {"current_steps": 1043, "total_steps": 1200, "loss": 0.4002, "lr": 2.04969848983255e-06, "epoch": 4.345833333333333, "percentage": 86.92, "elapsed_time": "6:53:41", "remaining_time": "1:02:16"}
1044
+ {"current_steps": 1044, "total_steps": 1200, "loss": 0.3981, "lr": 2.024119074016664e-06, "epoch": 4.35, "percentage": 87.0, "elapsed_time": "6:54:04", "remaining_time": "1:01:52"}
1045
+ {"current_steps": 1045, "total_steps": 1200, "loss": 0.3999, "lr": 1.998691762717577e-06, "epoch": 4.354166666666667, "percentage": 87.08, "elapsed_time": "6:54:28", "remaining_time": "1:01:28"}
1046
+ {"current_steps": 1046, "total_steps": 1200, "loss": 0.3878, "lr": 1.973416771090755e-06, "epoch": 4.358333333333333, "percentage": 87.17, "elapsed_time": "6:54:52", "remaining_time": "1:01:04"}
1047
+ {"current_steps": 1047, "total_steps": 1200, "loss": 0.3888, "lr": 1.948294313002792e-06, "epoch": 4.3625, "percentage": 87.25, "elapsed_time": "6:55:15", "remaining_time": "1:00:40"}
1048
+ {"current_steps": 1048, "total_steps": 1200, "loss": 0.3849, "lr": 1.9233246010295903e-06, "epoch": 4.366666666666666, "percentage": 87.33, "elapsed_time": "6:55:38", "remaining_time": "1:00:17"}
1049
+ {"current_steps": 1049, "total_steps": 1200, "loss": 0.3745, "lr": 1.8985078464546002e-06, "epoch": 4.370833333333334, "percentage": 87.42, "elapsed_time": "6:56:01", "remaining_time": "0:59:53"}
1050
+ {"current_steps": 1050, "total_steps": 1200, "loss": 0.3843, "lr": 1.8738442592670014e-06, "epoch": 4.375, "percentage": 87.5, "elapsed_time": "6:56:23", "remaining_time": "0:59:29"}
1051
+ {"current_steps": 1051, "total_steps": 1200, "loss": 0.3816, "lr": 1.8493340481599275e-06, "epoch": 4.379166666666666, "percentage": 87.58, "elapsed_time": "6:56:46", "remaining_time": "0:59:05"}
1052
+ {"current_steps": 1052, "total_steps": 1200, "loss": 0.3805, "lr": 1.8249774205287151e-06, "epoch": 4.383333333333334, "percentage": 87.67, "elapsed_time": "6:57:10", "remaining_time": "0:58:41"}
1053
+ {"current_steps": 1053, "total_steps": 1200, "loss": 0.3851, "lr": 1.800774582469138e-06, "epoch": 4.3875, "percentage": 87.75, "elapsed_time": "6:57:33", "remaining_time": "0:58:17"}
1054
+ {"current_steps": 1054, "total_steps": 1200, "loss": 0.4012, "lr": 1.7767257387756599e-06, "epoch": 4.391666666666667, "percentage": 87.83, "elapsed_time": "6:57:56", "remaining_time": "0:57:53"}
1055
+ {"current_steps": 1055, "total_steps": 1200, "loss": 0.3834, "lr": 1.7528310929397196e-06, "epoch": 4.395833333333333, "percentage": 87.92, "elapsed_time": "6:58:20", "remaining_time": "0:57:29"}
1056
+ {"current_steps": 1056, "total_steps": 1200, "loss": 0.3883, "lr": 1.7290908471479805e-06, "epoch": 4.4, "percentage": 88.0, "elapsed_time": "6:58:42", "remaining_time": "0:57:05"}
1057
+ {"current_steps": 1057, "total_steps": 1200, "loss": 0.3889, "lr": 1.7055052022806595e-06, "epoch": 4.404166666666667, "percentage": 88.08, "elapsed_time": "6:59:06", "remaining_time": "0:56:41"}
1058
+ {"current_steps": 1058, "total_steps": 1200, "loss": 0.3762, "lr": 1.682074357909782e-06, "epoch": 4.408333333333333, "percentage": 88.17, "elapsed_time": "6:59:28", "remaining_time": "0:56:18"}
1059
+ {"current_steps": 1059, "total_steps": 1200, "loss": 0.3817, "lr": 1.6587985122975193e-06, "epoch": 4.4125, "percentage": 88.25, "elapsed_time": "6:59:52", "remaining_time": "0:55:54"}
1060
+ {"current_steps": 1060, "total_steps": 1200, "loss": 0.384, "lr": 1.6356778623945223e-06, "epoch": 4.416666666666667, "percentage": 88.33, "elapsed_time": "7:00:15", "remaining_time": "0:55:30"}
1061
+ {"current_steps": 1061, "total_steps": 1200, "loss": 0.3908, "lr": 1.612712603838218e-06, "epoch": 4.420833333333333, "percentage": 88.42, "elapsed_time": "7:00:39", "remaining_time": "0:55:06"}
1062
+ {"current_steps": 1062, "total_steps": 1200, "loss": 0.3861, "lr": 1.5899029309511926e-06, "epoch": 4.425, "percentage": 88.5, "elapsed_time": "7:01:02", "remaining_time": "0:54:42"}
1063
+ {"current_steps": 1063, "total_steps": 1200, "loss": 0.3828, "lr": 1.5672490367395244e-06, "epoch": 4.429166666666666, "percentage": 88.58, "elapsed_time": "7:01:25", "remaining_time": "0:54:18"}
1064
+ {"current_steps": 1064, "total_steps": 1200, "loss": 0.4043, "lr": 1.5447511128911542e-06, "epoch": 4.433333333333334, "percentage": 88.67, "elapsed_time": "7:01:48", "remaining_time": "0:53:54"}
1065
+ {"current_steps": 1065, "total_steps": 1200, "loss": 0.3782, "lr": 1.5224093497742654e-06, "epoch": 4.4375, "percentage": 88.75, "elapsed_time": "7:02:10", "remaining_time": "0:53:30"}
1066
+ {"current_steps": 1066, "total_steps": 1200, "loss": 0.3973, "lr": 1.5002239364356784e-06, "epoch": 4.441666666666666, "percentage": 88.83, "elapsed_time": "7:02:33", "remaining_time": "0:53:07"}
1067
+ {"current_steps": 1067, "total_steps": 1200, "loss": 0.3862, "lr": 1.4781950605992434e-06, "epoch": 4.445833333333334, "percentage": 88.92, "elapsed_time": "7:02:57", "remaining_time": "0:52:43"}
1068
+ {"current_steps": 1068, "total_steps": 1200, "loss": 0.3909, "lr": 1.4563229086642538e-06, "epoch": 4.45, "percentage": 89.0, "elapsed_time": "7:03:19", "remaining_time": "0:52:19"}
1069
+ {"current_steps": 1069, "total_steps": 1200, "loss": 0.3883, "lr": 1.4346076657038689e-06, "epoch": 4.454166666666667, "percentage": 89.08, "elapsed_time": "7:03:43", "remaining_time": "0:51:55"}
1070
+ {"current_steps": 1070, "total_steps": 1200, "loss": 0.3832, "lr": 1.4130495154635494e-06, "epoch": 4.458333333333333, "percentage": 89.17, "elapsed_time": "7:04:06", "remaining_time": "0:51:31"}
1071
+ {"current_steps": 1071, "total_steps": 1200, "loss": 0.3681, "lr": 1.3916486403595108e-06, "epoch": 4.4625, "percentage": 89.25, "elapsed_time": "7:04:29", "remaining_time": "0:51:07"}
1072
+ {"current_steps": 1072, "total_steps": 1200, "loss": 0.3782, "lr": 1.3704052214771513e-06, "epoch": 4.466666666666667, "percentage": 89.33, "elapsed_time": "7:04:53", "remaining_time": "0:50:43"}
1073
+ {"current_steps": 1073, "total_steps": 1200, "loss": 0.3876, "lr": 1.3493194385695608e-06, "epoch": 4.470833333333333, "percentage": 89.42, "elapsed_time": "7:05:16", "remaining_time": "0:50:20"}
1074
+ {"current_steps": 1074, "total_steps": 1200, "loss": 0.3909, "lr": 1.3283914700559675e-06, "epoch": 4.475, "percentage": 89.5, "elapsed_time": "7:05:40", "remaining_time": "0:49:56"}
1075
+ {"current_steps": 1075, "total_steps": 1200, "loss": 0.3777, "lr": 1.3076214930202324e-06, "epoch": 4.479166666666667, "percentage": 89.58, "elapsed_time": "7:06:02", "remaining_time": "0:49:32"}
1076
+ {"current_steps": 1076, "total_steps": 1200, "loss": 0.3833, "lr": 1.2870096832093726e-06, "epoch": 4.483333333333333, "percentage": 89.67, "elapsed_time": "7:06:24", "remaining_time": "0:49:08"}
1077
+ {"current_steps": 1077, "total_steps": 1200, "loss": 0.3909, "lr": 1.2665562150320487e-06, "epoch": 4.4875, "percentage": 89.75, "elapsed_time": "7:06:46", "remaining_time": "0:48:44"}
1078
+ {"current_steps": 1078, "total_steps": 1200, "loss": 0.4034, "lr": 1.2462612615571046e-06, "epoch": 4.491666666666666, "percentage": 89.83, "elapsed_time": "7:07:09", "remaining_time": "0:48:20"}
1079
+ {"current_steps": 1079, "total_steps": 1200, "loss": 0.3979, "lr": 1.2261249945120922e-06, "epoch": 4.495833333333334, "percentage": 89.92, "elapsed_time": "7:07:32", "remaining_time": "0:47:56"}
1080
+ {"current_steps": 1080, "total_steps": 1200, "loss": 0.4179, "lr": 1.2061475842818337e-06, "epoch": 4.5, "percentage": 90.0, "elapsed_time": "7:07:55", "remaining_time": "0:47:32"}
1081
+ {"current_steps": 1081, "total_steps": 1200, "loss": 0.3716, "lr": 1.1863291999069592e-06, "epoch": 4.504166666666666, "percentage": 90.08, "elapsed_time": "7:08:17", "remaining_time": "0:47:08"}
1082
+ {"current_steps": 1082, "total_steps": 1200, "loss": 0.388, "lr": 1.1666700090824956e-06, "epoch": 4.508333333333333, "percentage": 90.17, "elapsed_time": "7:08:39", "remaining_time": "0:46:44"}
1083
+ {"current_steps": 1083, "total_steps": 1200, "loss": 0.3931, "lr": 1.1471701781564316e-06, "epoch": 4.5125, "percentage": 90.25, "elapsed_time": "7:09:02", "remaining_time": "0:46:21"}
1084
+ {"current_steps": 1084, "total_steps": 1200, "loss": 0.3958, "lr": 1.12782987212833e-06, "epoch": 4.516666666666667, "percentage": 90.33, "elapsed_time": "7:09:25", "remaining_time": "0:45:57"}
1085
+ {"current_steps": 1085, "total_steps": 1200, "loss": 0.3921, "lr": 1.1086492546479065e-06, "epoch": 4.520833333333333, "percentage": 90.42, "elapsed_time": "7:09:48", "remaining_time": "0:45:33"}
1086
+ {"current_steps": 1086, "total_steps": 1200, "loss": 0.3716, "lr": 1.0896284880136632e-06, "epoch": 4.525, "percentage": 90.5, "elapsed_time": "7:10:11", "remaining_time": "0:45:09"}
1087
+ {"current_steps": 1087, "total_steps": 1200, "loss": 0.3964, "lr": 1.070767733171514e-06, "epoch": 4.529166666666667, "percentage": 90.58, "elapsed_time": "7:10:34", "remaining_time": "0:44:45"}
1088
+ {"current_steps": 1088, "total_steps": 1200, "loss": 0.3982, "lr": 1.052067149713416e-06, "epoch": 4.533333333333333, "percentage": 90.67, "elapsed_time": "7:10:56", "remaining_time": "0:44:21"}
1089
+ {"current_steps": 1089, "total_steps": 1200, "loss": 0.3895, "lr": 1.0335268958760135e-06, "epoch": 4.5375, "percentage": 90.75, "elapsed_time": "7:11:19", "remaining_time": "0:43:57"}
1090
+ {"current_steps": 1090, "total_steps": 1200, "loss": 0.3962, "lr": 1.0151471285393223e-06, "epoch": 4.541666666666667, "percentage": 90.83, "elapsed_time": "7:11:43", "remaining_time": "0:43:34"}
1091
+ {"current_steps": 1091, "total_steps": 1200, "loss": 0.4045, "lr": 9.96928003225377e-07, "epoch": 4.545833333333333, "percentage": 90.92, "elapsed_time": "7:12:07", "remaining_time": "0:43:10"}
1092
+ {"current_steps": 1092, "total_steps": 1200, "loss": 0.3936, "lr": 9.788696740969295e-07, "epoch": 4.55, "percentage": 91.0, "elapsed_time": "7:12:30", "remaining_time": "0:42:46"}
1093
+ {"current_steps": 1093, "total_steps": 1200, "loss": 0.4077, "lr": 9.609722939561373e-07, "epoch": 4.554166666666667, "percentage": 91.08, "elapsed_time": "7:12:53", "remaining_time": "0:42:22"}
1094
+ {"current_steps": 1094, "total_steps": 1200, "loss": 0.3984, "lr": 9.432360142432761e-07, "epoch": 4.558333333333334, "percentage": 91.17, "elapsed_time": "7:13:15", "remaining_time": "0:41:58"}
1095
+ {"current_steps": 1095, "total_steps": 1200, "loss": 0.385, "lr": 9.256609850354636e-07, "epoch": 4.5625, "percentage": 91.25, "elapsed_time": "7:13:38", "remaining_time": "0:41:34"}
1096
+ {"current_steps": 1096, "total_steps": 1200, "loss": 0.3945, "lr": 9.082473550453619e-07, "epoch": 4.566666666666666, "percentage": 91.33, "elapsed_time": "7:14:02", "remaining_time": "0:41:11"}
1097
+ {"current_steps": 1097, "total_steps": 1200, "loss": 0.3908, "lr": 8.909952716199566e-07, "epoch": 4.570833333333333, "percentage": 91.42, "elapsed_time": "7:14:24", "remaining_time": "0:40:47"}
1098
+ {"current_steps": 1098, "total_steps": 1200, "loss": 0.3889, "lr": 8.739048807392913e-07, "epoch": 4.575, "percentage": 91.5, "elapsed_time": "7:14:48", "remaining_time": "0:40:23"}
1099
+ {"current_steps": 1099, "total_steps": 1200, "loss": 0.3844, "lr": 8.569763270152265e-07, "epoch": 4.579166666666667, "percentage": 91.58, "elapsed_time": "7:15:11", "remaining_time": "0:39:59"}
1100
+ {"current_steps": 1100, "total_steps": 1200, "loss": 0.3863, "lr": 8.402097536902221e-07, "epoch": 4.583333333333333, "percentage": 91.67, "elapsed_time": "7:15:34", "remaining_time": "0:39:35"}
1101
+ {"current_steps": 1101, "total_steps": 1200, "loss": 0.382, "lr": 8.23605302636139e-07, "epoch": 4.5875, "percentage": 91.75, "elapsed_time": "7:15:58", "remaining_time": "0:39:12"}
1102
+ {"current_steps": 1102, "total_steps": 1200, "loss": 0.3861, "lr": 8.071631143530178e-07, "epoch": 4.591666666666667, "percentage": 91.83, "elapsed_time": "7:16:21", "remaining_time": "0:38:48"}
1103
+ {"current_steps": 1103, "total_steps": 1200, "loss": 0.3838, "lr": 7.908833279678885e-07, "epoch": 4.595833333333333, "percentage": 91.92, "elapsed_time": "7:16:43", "remaining_time": "0:38:24"}
1104
+ {"current_steps": 1104, "total_steps": 1200, "loss": 0.4004, "lr": 7.747660812336221e-07, "epoch": 4.6, "percentage": 92.0, "elapsed_time": "7:17:06", "remaining_time": "0:38:00"}
1105
+ {"current_steps": 1105, "total_steps": 1200, "loss": 0.3785, "lr": 7.588115105277372e-07, "epoch": 4.604166666666667, "percentage": 92.08, "elapsed_time": "7:17:29", "remaining_time": "0:37:36"}
1106
+ {"current_steps": 1106, "total_steps": 1200, "loss": 0.384, "lr": 7.430197508512482e-07, "epoch": 4.608333333333333, "percentage": 92.17, "elapsed_time": "7:17:52", "remaining_time": "0:37:12"}
1107
+ {"current_steps": 1107, "total_steps": 1200, "loss": 0.381, "lr": 7.273909358275411e-07, "epoch": 4.6125, "percentage": 92.25, "elapsed_time": "7:18:15", "remaining_time": "0:36:49"}
1108
+ {"current_steps": 1108, "total_steps": 1200, "loss": 0.3796, "lr": 7.11925197701222e-07, "epoch": 4.616666666666667, "percentage": 92.33, "elapsed_time": "7:18:38", "remaining_time": "0:36:25"}
1109
+ {"current_steps": 1109, "total_steps": 1200, "loss": 0.3811, "lr": 6.966226673370125e-07, "epoch": 4.620833333333334, "percentage": 92.42, "elapsed_time": "7:19:02", "remaining_time": "0:36:01"}
1110
+ {"current_steps": 1110, "total_steps": 1200, "loss": 0.3971, "lr": 6.814834742186361e-07, "epoch": 4.625, "percentage": 92.5, "elapsed_time": "7:19:25", "remaining_time": "0:35:37"}
1111
+ {"current_steps": 1111, "total_steps": 1200, "loss": 0.381, "lr": 6.665077464477198e-07, "epoch": 4.629166666666666, "percentage": 92.58, "elapsed_time": "7:19:49", "remaining_time": "0:35:14"}
1112
+ {"current_steps": 1112, "total_steps": 1200, "loss": 0.4016, "lr": 6.516956107427241e-07, "epoch": 4.633333333333333, "percentage": 92.67, "elapsed_time": "7:20:13", "remaining_time": "0:34:50"}
1113
+ {"current_steps": 1113, "total_steps": 1200, "loss": 0.3776, "lr": 6.370471924378474e-07, "epoch": 4.6375, "percentage": 92.75, "elapsed_time": "7:20:36", "remaining_time": "0:34:26"}
1114
+ {"current_steps": 1114, "total_steps": 1200, "loss": 0.3808, "lr": 6.225626154819852e-07, "epoch": 4.641666666666667, "percentage": 92.83, "elapsed_time": "7:20:59", "remaining_time": "0:34:02"}
1115
+ {"current_steps": 1115, "total_steps": 1200, "loss": 0.397, "lr": 6.082420024376801e-07, "epoch": 4.645833333333333, "percentage": 92.92, "elapsed_time": "7:21:23", "remaining_time": "0:33:38"}
1116
+ {"current_steps": 1116, "total_steps": 1200, "loss": 0.3919, "lr": 5.940854744800706e-07, "epoch": 4.65, "percentage": 93.0, "elapsed_time": "7:21:46", "remaining_time": "0:33:15"}
1117
+ {"current_steps": 1117, "total_steps": 1200, "loss": 0.4142, "lr": 5.800931513958796e-07, "epoch": 4.654166666666667, "percentage": 93.08, "elapsed_time": "7:22:10", "remaining_time": "0:32:51"}
1118
+ {"current_steps": 1118, "total_steps": 1200, "loss": 0.3872, "lr": 5.66265151582397e-07, "epoch": 4.658333333333333, "percentage": 93.17, "elapsed_time": "7:22:33", "remaining_time": "0:32:27"}
1119
+ {"current_steps": 1119, "total_steps": 1200, "loss": 0.4013, "lr": 5.526015920464689e-07, "epoch": 4.6625, "percentage": 93.25, "elapsed_time": "7:22:56", "remaining_time": "0:32:03"}
1120
+ {"current_steps": 1120, "total_steps": 1200, "loss": 0.3826, "lr": 5.391025884035239e-07, "epoch": 4.666666666666667, "percentage": 93.33, "elapsed_time": "7:23:19", "remaining_time": "0:31:39"}
1121
+ {"current_steps": 1121, "total_steps": 1200, "loss": 0.3813, "lr": 5.257682548765841e-07, "epoch": 4.670833333333333, "percentage": 93.42, "elapsed_time": "7:23:42", "remaining_time": "0:31:16"}
1122
+ {"current_steps": 1122, "total_steps": 1200, "loss": 0.3879, "lr": 5.125987042952973e-07, "epoch": 4.675, "percentage": 93.5, "elapsed_time": "7:24:06", "remaining_time": "0:30:52"}
1123
+ {"current_steps": 1123, "total_steps": 1200, "loss": 0.3768, "lr": 4.99594048094989e-07, "epoch": 4.679166666666667, "percentage": 93.58, "elapsed_time": "7:24:29", "remaining_time": "0:30:28"}
1124
+ {"current_steps": 1124, "total_steps": 1200, "loss": 0.4001, "lr": 4.867543963157162e-07, "epoch": 4.683333333333334, "percentage": 93.67, "elapsed_time": "7:24:52", "remaining_time": "0:30:04"}
1125
+ {"current_steps": 1125, "total_steps": 1200, "loss": 0.398, "lr": 4.740798576013328e-07, "epoch": 4.6875, "percentage": 93.75, "elapsed_time": "7:25:15", "remaining_time": "0:29:41"}
1126
+ {"current_steps": 1126, "total_steps": 1200, "loss": 0.3934, "lr": 4.615705391985814e-07, "epoch": 4.691666666666666, "percentage": 93.83, "elapsed_time": "7:25:38", "remaining_time": "0:29:17"}
1127
+ {"current_steps": 1127, "total_steps": 1200, "loss": 0.3996, "lr": 4.492265469561696e-07, "epoch": 4.695833333333333, "percentage": 93.92, "elapsed_time": "7:26:01", "remaining_time": "0:28:53"}
1128
+ {"current_steps": 1128, "total_steps": 1200, "loss": 0.3907, "lr": 4.3704798532388624e-07, "epoch": 4.7, "percentage": 94.0, "elapsed_time": "7:26:24", "remaining_time": "0:28:29"}
1129
+ {"current_steps": 1129, "total_steps": 1200, "loss": 0.4026, "lr": 4.2503495735171987e-07, "epoch": 4.704166666666667, "percentage": 94.08, "elapsed_time": "7:26:47", "remaining_time": "0:28:05"}
1130
+ {"current_steps": 1130, "total_steps": 1200, "loss": 0.3891, "lr": 4.1318756468897047e-07, "epoch": 4.708333333333333, "percentage": 94.17, "elapsed_time": "7:27:11", "remaining_time": "0:27:42"}
1131
+ {"current_steps": 1131, "total_steps": 1200, "loss": 0.3795, "lr": 4.0150590758340826e-07, "epoch": 4.7125, "percentage": 94.25, "elapsed_time": "7:27:34", "remaining_time": "0:27:18"}
1132
+ {"current_steps": 1132, "total_steps": 1200, "loss": 0.383, "lr": 3.899900848804139e-07, "epoch": 4.716666666666667, "percentage": 94.33, "elapsed_time": "7:27:57", "remaining_time": "0:26:54"}
1133
+ {"current_steps": 1133, "total_steps": 1200, "loss": 0.3852, "lr": 3.7864019402214845e-07, "epoch": 4.720833333333333, "percentage": 94.42, "elapsed_time": "7:28:20", "remaining_time": "0:26:30"}
1134
+ {"current_steps": 1134, "total_steps": 1200, "loss": 0.3958, "lr": 3.674563310467205e-07, "epoch": 4.725, "percentage": 94.5, "elapsed_time": "7:28:43", "remaining_time": "0:26:07"}
1135
+ {"current_steps": 1135, "total_steps": 1200, "loss": 0.4072, "lr": 3.5643859058738686e-07, "epoch": 4.729166666666667, "percentage": 94.58, "elapsed_time": "7:29:06", "remaining_time": "0:25:43"}
1136
+ {"current_steps": 1136, "total_steps": 1200, "loss": 0.3698, "lr": 3.455870658717353e-07, "epoch": 4.733333333333333, "percentage": 94.67, "elapsed_time": "7:29:29", "remaining_time": "0:25:19"}
1137
+ {"current_steps": 1137, "total_steps": 1200, "loss": 0.3898, "lr": 3.349018487209099e-07, "epoch": 4.7375, "percentage": 94.75, "elapsed_time": "7:29:53", "remaining_time": "0:24:55"}
1138
+ {"current_steps": 1138, "total_steps": 1200, "loss": 0.3901, "lr": 3.2438302954882486e-07, "epoch": 4.741666666666667, "percentage": 94.83, "elapsed_time": "7:30:17", "remaining_time": "0:24:31"}
1139
+ {"current_steps": 1139, "total_steps": 1200, "loss": 0.3812, "lr": 3.1403069736140715e-07, "epoch": 4.745833333333334, "percentage": 94.92, "elapsed_time": "7:30:39", "remaining_time": "0:24:08"}
1140
+ {"current_steps": 1140, "total_steps": 1200, "loss": 0.3938, "lr": 3.038449397558396e-07, "epoch": 4.75, "percentage": 95.0, "elapsed_time": "7:31:03", "remaining_time": "0:23:44"}
1141
+ {"current_steps": 1141, "total_steps": 1200, "loss": 0.4035, "lr": 2.9382584291981265e-07, "epoch": 4.754166666666666, "percentage": 95.08, "elapsed_time": "7:31:25", "remaining_time": "0:23:20"}
1142
+ {"current_steps": 1142, "total_steps": 1200, "loss": 0.3984, "lr": 2.839734916308068e-07, "epoch": 4.758333333333333, "percentage": 95.17, "elapsed_time": "7:31:48", "remaining_time": "0:22:56"}
1143
+ {"current_steps": 1143, "total_steps": 1200, "loss": 0.3836, "lr": 2.7428796925537127e-07, "epoch": 4.7625, "percentage": 95.25, "elapsed_time": "7:32:13", "remaining_time": "0:22:33"}
1144
+ {"current_steps": 1144, "total_steps": 1200, "loss": 0.3972, "lr": 2.647693577484156e-07, "epoch": 4.766666666666667, "percentage": 95.33, "elapsed_time": "7:32:35", "remaining_time": "0:22:09"}
1145
+ {"current_steps": 1145, "total_steps": 1200, "loss": 0.3904, "lr": 2.554177376525191e-07, "epoch": 4.770833333333333, "percentage": 95.42, "elapsed_time": "7:32:58", "remaining_time": "0:21:45"}
1146
+ {"current_steps": 1146, "total_steps": 1200, "loss": 0.3911, "lr": 2.462331880972468e-07, "epoch": 4.775, "percentage": 95.5, "elapsed_time": "7:33:21", "remaining_time": "0:21:21"}
1147
+ {"current_steps": 1147, "total_steps": 1200, "loss": 0.3998, "lr": 2.3721578679848146e-07, "epoch": 4.779166666666667, "percentage": 95.58, "elapsed_time": "7:33:44", "remaining_time": "0:20:57"}
1148
+ {"current_steps": 1148, "total_steps": 1200, "loss": 0.3965, "lr": 2.2836561005776803e-07, "epoch": 4.783333333333333, "percentage": 95.67, "elapsed_time": "7:34:09", "remaining_time": "0:20:34"}
1149
+ {"current_steps": 1149, "total_steps": 1200, "loss": 0.3813, "lr": 2.1968273276166352e-07, "epoch": 4.7875, "percentage": 95.75, "elapsed_time": "7:34:32", "remaining_time": "0:20:10"}
1150
+ {"current_steps": 1150, "total_steps": 1200, "loss": 0.4015, "lr": 2.111672283811106e-07, "epoch": 4.791666666666667, "percentage": 95.83, "elapsed_time": "7:34:56", "remaining_time": "0:19:46"}
1151
+ {"current_steps": 1151, "total_steps": 1200, "loss": 0.3849, "lr": 2.0281916897080477e-07, "epoch": 4.795833333333333, "percentage": 95.92, "elapsed_time": "7:35:19", "remaining_time": "0:19:23"}
1152
+ {"current_steps": 1152, "total_steps": 1200, "loss": 0.399, "lr": 1.9463862516859277e-07, "epoch": 4.8, "percentage": 96.0, "elapsed_time": "7:35:43", "remaining_time": "0:18:59"}
1153
+ {"current_steps": 1153, "total_steps": 1200, "loss": 0.4107, "lr": 1.8662566619487954e-07, "epoch": 4.804166666666667, "percentage": 96.08, "elapsed_time": "7:36:06", "remaining_time": "0:18:35"}
1154
+ {"current_steps": 1154, "total_steps": 1200, "loss": 0.39, "lr": 1.7878035985202657e-07, "epoch": 4.808333333333334, "percentage": 96.17, "elapsed_time": "7:36:30", "remaining_time": "0:18:11"}
1155
+ {"current_steps": 1155, "total_steps": 1200, "loss": 0.4039, "lr": 1.7110277252379238e-07, "epoch": 4.8125, "percentage": 96.25, "elapsed_time": "7:36:53", "remaining_time": "0:17:48"}
1156
+ {"current_steps": 1156, "total_steps": 1200, "loss": 0.3935, "lr": 1.6359296917476619e-07, "epoch": 4.816666666666666, "percentage": 96.33, "elapsed_time": "7:37:17", "remaining_time": "0:17:24"}
1157
+ {"current_steps": 1157, "total_steps": 1200, "loss": 0.3855, "lr": 1.5625101334981742e-07, "epoch": 4.820833333333333, "percentage": 96.42, "elapsed_time": "7:37:40", "remaining_time": "0:17:00"}
1158
+ {"current_steps": 1158, "total_steps": 1200, "loss": 0.3853, "lr": 1.4907696717356035e-07, "epoch": 4.825, "percentage": 96.5, "elapsed_time": "7:38:03", "remaining_time": "0:16:36"}
1159
+ {"current_steps": 1159, "total_steps": 1200, "loss": 0.3882, "lr": 1.4207089134982143e-07, "epoch": 4.829166666666667, "percentage": 96.58, "elapsed_time": "7:38:26", "remaining_time": "0:16:13"}
1160
+ {"current_steps": 1160, "total_steps": 1200, "loss": 0.384, "lr": 1.3523284516113955e-07, "epoch": 4.833333333333333, "percentage": 96.67, "elapsed_time": "7:38:49", "remaining_time": "0:15:49"}
1161
+ {"current_steps": 1161, "total_steps": 1200, "loss": 0.3811, "lr": 1.2856288646825087e-07, "epoch": 4.8375, "percentage": 96.75, "elapsed_time": "7:39:11", "remaining_time": "0:15:25"}
1162
+ {"current_steps": 1162, "total_steps": 1200, "loss": 0.3898, "lr": 1.2206107170960046e-07, "epoch": 4.841666666666667, "percentage": 96.83, "elapsed_time": "7:39:34", "remaining_time": "0:15:01"}
1163
+ {"current_steps": 1163, "total_steps": 1200, "loss": 0.3892, "lr": 1.1572745590087586e-07, "epoch": 4.845833333333333, "percentage": 96.92, "elapsed_time": "7:39:58", "remaining_time": "0:14:38"}
1164
+ {"current_steps": 1164, "total_steps": 1200, "loss": 0.3982, "lr": 1.0956209263453421e-07, "epoch": 4.85, "percentage": 97.0, "elapsed_time": "7:40:21", "remaining_time": "0:14:14"}
1165
+ {"current_steps": 1165, "total_steps": 1200, "loss": 0.3941, "lr": 1.0356503407934038e-07, "epoch": 4.854166666666667, "percentage": 97.08, "elapsed_time": "7:40:45", "remaining_time": "0:13:50"}
1166
+ {"current_steps": 1166, "total_steps": 1200, "loss": 0.3991, "lr": 9.77363309799384e-08, "epoch": 4.858333333333333, "percentage": 97.17, "elapsed_time": "7:41:09", "remaining_time": "0:13:26"}
1167
+ {"current_steps": 1167, "total_steps": 1200, "loss": 0.3826, "lr": 9.207603265642296e-08, "epoch": 4.8625, "percentage": 97.25, "elapsed_time": "7:41:32", "remaining_time": "0:13:03"}
1168
+ {"current_steps": 1168, "total_steps": 1200, "loss": 0.3966, "lr": 8.658418700391302e-08, "epoch": 4.866666666666667, "percentage": 97.33, "elapsed_time": "7:41:55", "remaining_time": "0:12:39"}
1169
+ {"current_steps": 1169, "total_steps": 1200, "loss": 0.3961, "lr": 8.126084049214334e-08, "epoch": 4.870833333333334, "percentage": 97.42, "elapsed_time": "7:42:19", "remaining_time": "0:12:15"}
1170
+ {"current_steps": 1170, "total_steps": 1200, "loss": 0.3845, "lr": 7.61060381650891e-08, "epoch": 4.875, "percentage": 97.5, "elapsed_time": "7:42:42", "remaining_time": "0:11:51"}
1171
+ {"current_steps": 1171, "total_steps": 1200, "loss": 0.3805, "lr": 7.111982364056857e-08, "epoch": 4.879166666666666, "percentage": 97.58, "elapsed_time": "7:43:05", "remaining_time": "0:11:28"}
1172
+ {"current_steps": 1172, "total_steps": 1200, "loss": 0.3994, "lr": 6.630223910987887e-08, "epoch": 4.883333333333333, "percentage": 97.67, "elapsed_time": "7:43:28", "remaining_time": "0:11:04"}
1173
+ {"current_steps": 1173, "total_steps": 1200, "loss": 0.3735, "lr": 6.165332533744072e-08, "epoch": 4.8875, "percentage": 97.75, "elapsed_time": "7:43:51", "remaining_time": "0:10:40"}
1174
+ {"current_steps": 1174, "total_steps": 1200, "loss": 0.4078, "lr": 5.717312166045208e-08, "epoch": 4.891666666666667, "percentage": 97.83, "elapsed_time": "7:44:14", "remaining_time": "0:10:16"}
1175
+ {"current_steps": 1175, "total_steps": 1200, "loss": 0.4021, "lr": 5.286166598855502e-08, "epoch": 4.895833333333333, "percentage": 97.92, "elapsed_time": "7:44:37", "remaining_time": "0:09:53"}
1176
+ {"current_steps": 1176, "total_steps": 1200, "loss": 0.3907, "lr": 4.871899480351605e-08, "epoch": 4.9, "percentage": 98.0, "elapsed_time": "7:45:00", "remaining_time": "0:09:29"}
1177
+ {"current_steps": 1177, "total_steps": 1200, "loss": 0.4049, "lr": 4.474514315891299e-08, "epoch": 4.904166666666667, "percentage": 98.08, "elapsed_time": "7:45:23", "remaining_time": "0:09:05"}
1178
+ {"current_steps": 1178, "total_steps": 1200, "loss": 0.3998, "lr": 4.0940144679852963e-08, "epoch": 4.908333333333333, "percentage": 98.17, "elapsed_time": "7:45:46", "remaining_time": "0:08:41"}
1179
+ {"current_steps": 1179, "total_steps": 1200, "loss": 0.3884, "lr": 3.73040315626616e-08, "epoch": 4.9125, "percentage": 98.25, "elapsed_time": "7:46:10", "remaining_time": "0:08:18"}
1180
+ {"current_steps": 1180, "total_steps": 1200, "loss": 0.4044, "lr": 3.383683457463649e-08, "epoch": 4.916666666666667, "percentage": 98.33, "elapsed_time": "7:46:34", "remaining_time": "0:07:54"}
1181
+ {"current_steps": 1181, "total_steps": 1200, "loss": 0.3987, "lr": 3.053858305377411e-08, "epoch": 4.920833333333333, "percentage": 98.42, "elapsed_time": "7:46:57", "remaining_time": "0:07:30"}
1182
+ {"current_steps": 1182, "total_steps": 1200, "loss": 0.3925, "lr": 2.740930490852334e-08, "epoch": 4.925, "percentage": 98.5, "elapsed_time": "7:47:20", "remaining_time": "0:07:07"}
1183
+ {"current_steps": 1183, "total_steps": 1200, "loss": 0.4001, "lr": 2.4449026617547887e-08, "epoch": 4.929166666666667, "percentage": 98.58, "elapsed_time": "7:47:42", "remaining_time": "0:06:43"}
1184
+ {"current_steps": 1184, "total_steps": 1200, "loss": 0.3888, "lr": 2.1657773229508684e-08, "epoch": 4.933333333333334, "percentage": 98.67, "elapsed_time": "7:48:06", "remaining_time": "0:06:19"}
1185
+ {"current_steps": 1185, "total_steps": 1200, "loss": 0.3909, "lr": 1.9035568362844037e-08, "epoch": 4.9375, "percentage": 98.75, "elapsed_time": "7:48:30", "remaining_time": "0:05:55"}
1186
+ {"current_steps": 1186, "total_steps": 1200, "loss": 0.4057, "lr": 1.658243420557426e-08, "epoch": 4.941666666666666, "percentage": 98.83, "elapsed_time": "7:48:53", "remaining_time": "0:05:32"}
1187
+ {"current_steps": 1187, "total_steps": 1200, "loss": 0.3865, "lr": 1.42983915151107e-08, "epoch": 4.945833333333333, "percentage": 98.92, "elapsed_time": "7:49:16", "remaining_time": "0:05:08"}
1188
+ {"current_steps": 1188, "total_steps": 1200, "loss": 0.3896, "lr": 1.2183459618084759e-08, "epoch": 4.95, "percentage": 99.0, "elapsed_time": "7:49:40", "remaining_time": "0:04:44"}
1189
+ {"current_steps": 1189, "total_steps": 1200, "loss": 0.3893, "lr": 1.0237656410181374e-08, "epoch": 4.954166666666667, "percentage": 99.08, "elapsed_time": "7:50:03", "remaining_time": "0:04:20"}
1190
+ {"current_steps": 1190, "total_steps": 1200, "loss": 0.4016, "lr": 8.460998355988014e-09, "epoch": 4.958333333333333, "percentage": 99.17, "elapsed_time": "7:50:26", "remaining_time": "0:03:57"}
1191
+ {"current_steps": 1191, "total_steps": 1200, "loss": 0.3937, "lr": 6.853500488854803e-09, "epoch": 4.9625, "percentage": 99.25, "elapsed_time": "7:50:49", "remaining_time": "0:03:33"}
1192
+ {"current_steps": 1192, "total_steps": 1200, "loss": 0.3893, "lr": 5.415176410765721e-09, "epoch": 4.966666666666667, "percentage": 99.33, "elapsed_time": "7:51:12", "remaining_time": "0:03:09"}
1193
+ {"current_steps": 1193, "total_steps": 1200, "loss": 0.3935, "lr": 4.1460382922320355e-09, "epoch": 4.970833333333333, "percentage": 99.42, "elapsed_time": "7:51:36", "remaining_time": "0:02:46"}
1194
+ {"current_steps": 1194, "total_steps": 1200, "loss": 0.386, "lr": 3.0460968721746086e-09, "epoch": 4.975, "percentage": 99.5, "elapsed_time": "7:51:59", "remaining_time": "0:02:22"}
1195
+ {"current_steps": 1195, "total_steps": 1200, "loss": 0.3837, "lr": 2.1153614578506286e-09, "epoch": 4.979166666666667, "percentage": 99.58, "elapsed_time": "7:52:22", "remaining_time": "0:01:58"}
1196
+ {"current_steps": 1196, "total_steps": 1200, "loss": 0.4026, "lr": 1.3538399247559064e-09, "epoch": 4.983333333333333, "percentage": 99.67, "elapsed_time": "7:52:45", "remaining_time": "0:01:34"}
1197
+ {"current_steps": 1197, "total_steps": 1200, "loss": 0.3893, "lr": 7.615387165738065e-10, "epoch": 4.9875, "percentage": 99.75, "elapsed_time": "7:53:08", "remaining_time": "0:01:11"}
1198
+ {"current_steps": 1198, "total_steps": 1200, "loss": 0.3933, "lr": 3.384628451152949e-10, "epoch": 4.991666666666667, "percentage": 99.83, "elapsed_time": "7:53:32", "remaining_time": "0:00:47"}
1199
+ {"current_steps": 1199, "total_steps": 1200, "loss": 0.3833, "lr": 8.461589027453087e-11, "epoch": 4.995833333333334, "percentage": 99.92, "elapsed_time": "7:53:55", "remaining_time": "0:00:23"}
1200
+ {"current_steps": 1200, "total_steps": 1200, "loss": 0.3754, "lr": 0.0, "epoch": 5.0, "percentage": 100.0, "elapsed_time": "7:54:17", "remaining_time": "0:00:00"}
1201
+ {"current_steps": 1200, "total_steps": 1200, "epoch": 5.0, "percentage": 100.0, "elapsed_time": "7:59:22", "remaining_time": "0:00:00"}