gsmyrnis commited on
Commit
92ead4e
·
verified ·
1 Parent(s): d70103c

Training in progress, epoch 4

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:dad095630fb9cef750a6d69b8087a7d54100c780a07d4b1825a8495468dd0498
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:47ed62012645ee058b345a8bd70885b7174094455ab2fda24fc4ff59de43eb3d
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:51bad2c4120c5f6d191c187c5864145771780d79350c4be5797f2b41c3589cd7
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:91314e27f47b3ee0d325ac08f5b054d821798ad70d4341b7ec39f351f334fcc5
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4caaed04dd04ce5b73b2281049211fa1d3128a53d0100e32162e35bddc21895c
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f3e5ae2f96e159ffc0273a0892d1b94bd303bc07071872bc29530bb780509cd3
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cdd63485ba0cbd72e48e0fb9846ff802d6441993d89e18e3c9a51f6d5ba993d2
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f0c235b899c8f7aefed906942982c48edba07d711349f403f79bbe60635cc95e
3
  size 1089994880
trainer_log.jsonl CHANGED
@@ -916,3 +916,218 @@
916
  {"current_steps": 889, "total_steps": 1105, "loss": 1.0207, "lr": 4.482305921809669e-06, "epoch": 4.020293122886133, "percentage": 80.45, "elapsed_time": "3:05:02", "remaining_time": "0:44:57"}
917
  {"current_steps": 890, "total_steps": 1105, "loss": 1.025, "lr": 4.442505193950129e-06, "epoch": 4.024802705749718, "percentage": 80.54, "elapsed_time": "3:05:27", "remaining_time": "0:44:47"}
918
  {"current_steps": 891, "total_steps": 1105, "loss": 1.0192, "lr": 4.402859871552932e-06, "epoch": 4.029312288613303, "percentage": 80.63, "elapsed_time": "3:05:51", "remaining_time": "0:44:38"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
916
  {"current_steps": 889, "total_steps": 1105, "loss": 1.0207, "lr": 4.482305921809669e-06, "epoch": 4.020293122886133, "percentage": 80.45, "elapsed_time": "3:05:02", "remaining_time": "0:44:57"}
917
  {"current_steps": 890, "total_steps": 1105, "loss": 1.025, "lr": 4.442505193950129e-06, "epoch": 4.024802705749718, "percentage": 80.54, "elapsed_time": "3:05:27", "remaining_time": "0:44:47"}
918
  {"current_steps": 891, "total_steps": 1105, "loss": 1.0192, "lr": 4.402859871552932e-06, "epoch": 4.029312288613303, "percentage": 80.63, "elapsed_time": "3:05:51", "remaining_time": "0:44:38"}
919
+ {"current_steps": 892, "total_steps": 1105, "loss": 1.0209, "lr": 4.363370350639405e-06, "epoch": 4.0338218714768885, "percentage": 80.72, "elapsed_time": "3:06:15", "remaining_time": "0:44:28"}
920
+ {"current_steps": 893, "total_steps": 1105, "loss": 1.0271, "lr": 4.3240370256745435e-06, "epoch": 4.038331454340473, "percentage": 80.81, "elapsed_time": "3:06:39", "remaining_time": "0:44:18"}
921
+ {"current_steps": 894, "total_steps": 1105, "loss": 1.0492, "lr": 4.284860289563102e-06, "epoch": 4.042841037204059, "percentage": 80.9, "elapsed_time": "3:07:03", "remaining_time": "0:44:08"}
922
+ {"current_steps": 895, "total_steps": 1105, "loss": 1.0271, "lr": 4.2458405336456395e-06, "epoch": 4.047350620067644, "percentage": 81.0, "elapsed_time": "3:07:27", "remaining_time": "0:43:59"}
923
+ {"current_steps": 896, "total_steps": 1105, "loss": 1.0174, "lr": 4.206978147694625e-06, "epoch": 4.051860202931229, "percentage": 81.09, "elapsed_time": "3:07:51", "remaining_time": "0:43:49"}
924
+ {"current_steps": 897, "total_steps": 1105, "loss": 1.0112, "lr": 4.168273519910547e-06, "epoch": 4.056369785794814, "percentage": 81.18, "elapsed_time": "3:08:15", "remaining_time": "0:43:39"}
925
+ {"current_steps": 898, "total_steps": 1105, "loss": 1.0113, "lr": 4.129727036918032e-06, "epoch": 4.060879368658399, "percentage": 81.27, "elapsed_time": "3:08:39", "remaining_time": "0:43:29"}
926
+ {"current_steps": 899, "total_steps": 1105, "loss": 0.9981, "lr": 4.091339083761983e-06, "epoch": 4.065388951521984, "percentage": 81.36, "elapsed_time": "3:09:03", "remaining_time": "0:43:19"}
927
+ {"current_steps": 900, "total_steps": 1105, "loss": 0.994, "lr": 4.053110043903717e-06, "epoch": 4.069898534385569, "percentage": 81.45, "elapsed_time": "3:09:27", "remaining_time": "0:43:09"}
928
+ {"current_steps": 901, "total_steps": 1105, "loss": 1.0267, "lr": 4.015040299217168e-06, "epoch": 4.074408117249154, "percentage": 81.54, "elapsed_time": "3:09:51", "remaining_time": "0:42:59"}
929
+ {"current_steps": 902, "total_steps": 1105, "loss": 0.9911, "lr": 3.977130229985038e-06, "epoch": 4.07891770011274, "percentage": 81.63, "elapsed_time": "3:10:15", "remaining_time": "0:42:49"}
930
+ {"current_steps": 903, "total_steps": 1105, "loss": 0.9979, "lr": 3.939380214895025e-06, "epoch": 4.0834272829763245, "percentage": 81.72, "elapsed_time": "3:10:39", "remaining_time": "0:42:38"}
931
+ {"current_steps": 904, "total_steps": 1105, "loss": 1.0451, "lr": 3.901790631036033e-06, "epoch": 4.08793686583991, "percentage": 81.81, "elapsed_time": "3:11:03", "remaining_time": "0:42:28"}
932
+ {"current_steps": 905, "total_steps": 1105, "loss": 1.0086, "lr": 3.864361853894378e-06, "epoch": 4.092446448703495, "percentage": 81.9, "elapsed_time": "3:11:27", "remaining_time": "0:42:18"}
933
+ {"current_steps": 906, "total_steps": 1105, "loss": 1.0102, "lr": 3.827094257350092e-06, "epoch": 4.09695603156708, "percentage": 81.99, "elapsed_time": "3:11:51", "remaining_time": "0:42:08"}
934
+ {"current_steps": 907, "total_steps": 1105, "loss": 1.0098, "lr": 3.7899882136731304e-06, "epoch": 4.101465614430666, "percentage": 82.08, "elapsed_time": "3:12:15", "remaining_time": "0:41:58"}
935
+ {"current_steps": 908, "total_steps": 1105, "loss": 1.0123, "lr": 3.7530440935197e-06, "epoch": 4.10597519729425, "percentage": 82.17, "elapsed_time": "3:12:39", "remaining_time": "0:41:47"}
936
+ {"current_steps": 909, "total_steps": 1105, "loss": 1.0369, "lr": 3.7162622659285185e-06, "epoch": 4.110484780157836, "percentage": 82.26, "elapsed_time": "3:13:03", "remaining_time": "0:41:37"}
937
+ {"current_steps": 910, "total_steps": 1105, "loss": 1.0073, "lr": 3.679643098317158e-06, "epoch": 4.11499436302142, "percentage": 82.35, "elapsed_time": "3:13:26", "remaining_time": "0:41:27"}
938
+ {"current_steps": 911, "total_steps": 1105, "loss": 1.0227, "lr": 3.6431869564783617e-06, "epoch": 4.119503945885006, "percentage": 82.44, "elapsed_time": "3:13:50", "remaining_time": "0:41:16"}
939
+ {"current_steps": 912, "total_steps": 1105, "loss": 0.9934, "lr": 3.6068942045763944e-06, "epoch": 4.12401352874859, "percentage": 82.53, "elapsed_time": "3:14:15", "remaining_time": "0:41:06"}
940
+ {"current_steps": 913, "total_steps": 1105, "loss": 1.0642, "lr": 3.5707652051433917e-06, "epoch": 4.128523111612176, "percentage": 82.62, "elapsed_time": "3:14:39", "remaining_time": "0:40:56"}
941
+ {"current_steps": 914, "total_steps": 1105, "loss": 1.0028, "lr": 3.5348003190757442e-06, "epoch": 4.133032694475761, "percentage": 82.71, "elapsed_time": "3:15:03", "remaining_time": "0:40:45"}
942
+ {"current_steps": 915, "total_steps": 1105, "loss": 1.0318, "lr": 3.49899990563052e-06, "epoch": 4.137542277339346, "percentage": 82.81, "elapsed_time": "3:15:27", "remaining_time": "0:40:35"}
943
+ {"current_steps": 916, "total_steps": 1105, "loss": 1.0156, "lr": 3.463364322421827e-06, "epoch": 4.1420518602029315, "percentage": 82.9, "elapsed_time": "3:15:50", "remaining_time": "0:40:24"}
944
+ {"current_steps": 917, "total_steps": 1105, "loss": 1.015, "lr": 3.427893925417285e-06, "epoch": 4.146561443066516, "percentage": 82.99, "elapsed_time": "3:16:14", "remaining_time": "0:40:14"}
945
+ {"current_steps": 918, "total_steps": 1105, "loss": 1.05, "lr": 3.39258906893444e-06, "epoch": 4.151071025930102, "percentage": 83.08, "elapsed_time": "3:16:38", "remaining_time": "0:40:03"}
946
+ {"current_steps": 919, "total_steps": 1105, "loss": 1.0294, "lr": 3.3574501056372455e-06, "epoch": 4.155580608793686, "percentage": 83.17, "elapsed_time": "3:17:02", "remaining_time": "0:39:52"}
947
+ {"current_steps": 920, "total_steps": 1105, "loss": 1.0456, "lr": 3.3224773865325257e-06, "epoch": 4.160090191657272, "percentage": 83.26, "elapsed_time": "3:17:26", "remaining_time": "0:39:42"}
948
+ {"current_steps": 921, "total_steps": 1105, "loss": 1.0403, "lr": 3.287671260966463e-06, "epoch": 4.164599774520857, "percentage": 83.35, "elapsed_time": "3:17:50", "remaining_time": "0:39:31"}
949
+ {"current_steps": 922, "total_steps": 1105, "loss": 1.0375, "lr": 3.253032076621141e-06, "epoch": 4.169109357384442, "percentage": 83.44, "elapsed_time": "3:18:14", "remaining_time": "0:39:20"}
950
+ {"current_steps": 923, "total_steps": 1105, "loss": 1.0028, "lr": 3.21856017951103e-06, "epoch": 4.173618940248027, "percentage": 83.53, "elapsed_time": "3:18:38", "remaining_time": "0:39:10"}
951
+ {"current_steps": 924, "total_steps": 1105, "loss": 1.0391, "lr": 3.1842559139795637e-06, "epoch": 4.178128523111612, "percentage": 83.62, "elapsed_time": "3:19:03", "remaining_time": "0:38:59"}
952
+ {"current_steps": 925, "total_steps": 1105, "loss": 1.0293, "lr": 3.15011962269568e-06, "epoch": 4.182638105975197, "percentage": 83.71, "elapsed_time": "3:19:27", "remaining_time": "0:38:48"}
953
+ {"current_steps": 926, "total_steps": 1105, "loss": 1.0058, "lr": 3.1161516466504117e-06, "epoch": 4.187147688838783, "percentage": 83.8, "elapsed_time": "3:19:51", "remaining_time": "0:38:38"}
954
+ {"current_steps": 927, "total_steps": 1105, "loss": 1.0351, "lr": 3.082352325153459e-06, "epoch": 4.1916572717023675, "percentage": 83.89, "elapsed_time": "3:20:15", "remaining_time": "0:38:27"}
955
+ {"current_steps": 928, "total_steps": 1105, "loss": 0.9942, "lr": 3.048721995829829e-06, "epoch": 4.196166854565953, "percentage": 83.98, "elapsed_time": "3:20:39", "remaining_time": "0:38:16"}
956
+ {"current_steps": 929, "total_steps": 1105, "loss": 1.031, "lr": 3.015260994616431e-06, "epoch": 4.200676437429538, "percentage": 84.07, "elapsed_time": "3:21:03", "remaining_time": "0:38:05"}
957
+ {"current_steps": 930, "total_steps": 1105, "loss": 1.026, "lr": 2.981969655758756e-06, "epoch": 4.205186020293123, "percentage": 84.16, "elapsed_time": "3:21:26", "remaining_time": "0:37:54"}
958
+ {"current_steps": 931, "total_steps": 1105, "loss": 1.0614, "lr": 2.948848311807515e-06, "epoch": 4.209695603156708, "percentage": 84.25, "elapsed_time": "3:21:50", "remaining_time": "0:37:43"}
959
+ {"current_steps": 932, "total_steps": 1105, "loss": 1.0387, "lr": 2.9158972936153065e-06, "epoch": 4.214205186020293, "percentage": 84.34, "elapsed_time": "3:22:15", "remaining_time": "0:37:32"}
960
+ {"current_steps": 933, "total_steps": 1105, "loss": 1.0024, "lr": 2.8831169303333517e-06, "epoch": 4.218714768883879, "percentage": 84.43, "elapsed_time": "3:22:39", "remaining_time": "0:37:21"}
961
+ {"current_steps": 934, "total_steps": 1105, "loss": 1.0472, "lr": 2.850507549408157e-06, "epoch": 4.223224351747463, "percentage": 84.52, "elapsed_time": "3:23:03", "remaining_time": "0:37:10"}
962
+ {"current_steps": 935, "total_steps": 1105, "loss": 1.054, "lr": 2.8180694765782914e-06, "epoch": 4.227733934611049, "percentage": 84.62, "elapsed_time": "3:23:28", "remaining_time": "0:36:59"}
963
+ {"current_steps": 936, "total_steps": 1105, "loss": 1.0062, "lr": 2.7858030358710884e-06, "epoch": 4.232243517474633, "percentage": 84.71, "elapsed_time": "3:23:52", "remaining_time": "0:36:48"}
964
+ {"current_steps": 937, "total_steps": 1105, "loss": 1.0276, "lr": 2.753708549599443e-06, "epoch": 4.236753100338219, "percentage": 84.8, "elapsed_time": "3:24:15", "remaining_time": "0:36:37"}
965
+ {"current_steps": 938, "total_steps": 1105, "loss": 1.0304, "lr": 2.721786338358583e-06, "epoch": 4.241262683201803, "percentage": 84.89, "elapsed_time": "3:24:39", "remaining_time": "0:36:26"}
966
+ {"current_steps": 939, "total_steps": 1105, "loss": 0.9777, "lr": 2.690036721022844e-06, "epoch": 4.245772266065389, "percentage": 84.98, "elapsed_time": "3:25:03", "remaining_time": "0:36:15"}
967
+ {"current_steps": 940, "total_steps": 1105, "loss": 1.0059, "lr": 2.658460014742523e-06, "epoch": 4.250281848928974, "percentage": 85.07, "elapsed_time": "3:25:27", "remaining_time": "0:36:03"}
968
+ {"current_steps": 941, "total_steps": 1105, "loss": 1.0265, "lr": 2.6270565349406728e-06, "epoch": 4.254791431792559, "percentage": 85.16, "elapsed_time": "3:25:52", "remaining_time": "0:35:52"}
969
+ {"current_steps": 942, "total_steps": 1105, "loss": 0.9855, "lr": 2.595826595309987e-06, "epoch": 4.2593010146561445, "percentage": 85.25, "elapsed_time": "3:26:15", "remaining_time": "0:35:41"}
970
+ {"current_steps": 943, "total_steps": 1105, "loss": 0.9845, "lr": 2.5647705078096265e-06, "epoch": 4.263810597519729, "percentage": 85.34, "elapsed_time": "3:26:39", "remaining_time": "0:35:30"}
971
+ {"current_steps": 944, "total_steps": 1105, "loss": 1.0556, "lr": 2.533888582662145e-06, "epoch": 4.268320180383315, "percentage": 85.43, "elapsed_time": "3:27:03", "remaining_time": "0:35:18"}
972
+ {"current_steps": 945, "total_steps": 1105, "loss": 0.9949, "lr": 2.5031811283503648e-06, "epoch": 4.2728297632469, "percentage": 85.52, "elapsed_time": "3:27:27", "remaining_time": "0:35:07"}
973
+ {"current_steps": 946, "total_steps": 1105, "loss": 1.0141, "lr": 2.4726484516142856e-06, "epoch": 4.277339346110485, "percentage": 85.61, "elapsed_time": "3:27:51", "remaining_time": "0:34:56"}
974
+ {"current_steps": 947, "total_steps": 1105, "loss": 0.9866, "lr": 2.4422908574480598e-06, "epoch": 4.28184892897407, "percentage": 85.7, "elapsed_time": "3:28:15", "remaining_time": "0:34:44"}
975
+ {"current_steps": 948, "total_steps": 1105, "loss": 1.0017, "lr": 2.412108649096898e-06, "epoch": 4.286358511837655, "percentage": 85.79, "elapsed_time": "3:28:39", "remaining_time": "0:34:33"}
976
+ {"current_steps": 949, "total_steps": 1105, "loss": 1.0495, "lr": 2.382102128054078e-06, "epoch": 4.29086809470124, "percentage": 85.88, "elapsed_time": "3:29:03", "remaining_time": "0:34:21"}
977
+ {"current_steps": 950, "total_steps": 1105, "loss": 1.0231, "lr": 2.3522715940579176e-06, "epoch": 4.295377677564825, "percentage": 85.97, "elapsed_time": "3:29:27", "remaining_time": "0:34:10"}
978
+ {"current_steps": 951, "total_steps": 1105, "loss": 1.068, "lr": 2.322617345088778e-06, "epoch": 4.29988726042841, "percentage": 86.06, "elapsed_time": "3:29:52", "remaining_time": "0:33:59"}
979
+ {"current_steps": 952, "total_steps": 1105, "loss": 1.0163, "lr": 2.2931396773660876e-06, "epoch": 4.304396843291996, "percentage": 86.15, "elapsed_time": "3:30:16", "remaining_time": "0:33:47"}
980
+ {"current_steps": 953, "total_steps": 1105, "loss": 1.007, "lr": 2.263838885345393e-06, "epoch": 4.3089064261555805, "percentage": 86.24, "elapsed_time": "3:30:40", "remaining_time": "0:33:36"}
981
+ {"current_steps": 954, "total_steps": 1105, "loss": 1.0024, "lr": 2.2347152617154055e-06, "epoch": 4.313416009019166, "percentage": 86.33, "elapsed_time": "3:31:04", "remaining_time": "0:33:24"}
982
+ {"current_steps": 955, "total_steps": 1105, "loss": 1.0653, "lr": 2.205769097395081e-06, "epoch": 4.317925591882751, "percentage": 86.43, "elapsed_time": "3:31:28", "remaining_time": "0:33:12"}
983
+ {"current_steps": 956, "total_steps": 1105, "loss": 1.0504, "lr": 2.177000681530721e-06, "epoch": 4.322435174746336, "percentage": 86.52, "elapsed_time": "3:31:53", "remaining_time": "0:33:01"}
984
+ {"current_steps": 957, "total_steps": 1105, "loss": 1.0532, "lr": 2.148410301493078e-06, "epoch": 4.326944757609921, "percentage": 86.61, "elapsed_time": "3:32:17", "remaining_time": "0:32:49"}
985
+ {"current_steps": 958, "total_steps": 1105, "loss": 1.0474, "lr": 2.119998242874488e-06, "epoch": 4.331454340473506, "percentage": 86.7, "elapsed_time": "3:32:41", "remaining_time": "0:32:38"}
986
+ {"current_steps": 959, "total_steps": 1105, "loss": 1.0406, "lr": 2.0917647894860018e-06, "epoch": 4.335963923337092, "percentage": 86.79, "elapsed_time": "3:33:05", "remaining_time": "0:32:26"}
987
+ {"current_steps": 960, "total_steps": 1105, "loss": 1.0382, "lr": 2.0637102233545847e-06, "epoch": 4.340473506200676, "percentage": 86.88, "elapsed_time": "3:33:29", "remaining_time": "0:32:14"}
988
+ {"current_steps": 961, "total_steps": 1105, "loss": 1.0291, "lr": 2.0358348247202577e-06, "epoch": 4.344983089064262, "percentage": 86.97, "elapsed_time": "3:33:53", "remaining_time": "0:32:02"}
989
+ {"current_steps": 962, "total_steps": 1105, "loss": 1.0375, "lr": 2.0081388720333382e-06, "epoch": 4.349492671927846, "percentage": 87.06, "elapsed_time": "3:34:17", "remaining_time": "0:31:51"}
990
+ {"current_steps": 963, "total_steps": 1105, "loss": 1.0073, "lr": 1.9806226419516195e-06, "epoch": 4.354002254791432, "percentage": 87.15, "elapsed_time": "3:34:41", "remaining_time": "0:31:39"}
991
+ {"current_steps": 964, "total_steps": 1105, "loss": 1.0487, "lr": 1.95328640933764e-06, "epoch": 4.358511837655017, "percentage": 87.24, "elapsed_time": "3:35:04", "remaining_time": "0:31:27"}
992
+ {"current_steps": 965, "total_steps": 1105, "loss": 1.0134, "lr": 1.926130447255925e-06, "epoch": 4.363021420518602, "percentage": 87.33, "elapsed_time": "3:35:29", "remaining_time": "0:31:15"}
993
+ {"current_steps": 966, "total_steps": 1105, "loss": 0.9751, "lr": 1.8991550269702475e-06, "epoch": 4.3675310033821875, "percentage": 87.42, "elapsed_time": "3:35:53", "remaining_time": "0:31:03"}
994
+ {"current_steps": 967, "total_steps": 1105, "loss": 0.9989, "lr": 1.8723604179409415e-06, "epoch": 4.372040586245772, "percentage": 87.51, "elapsed_time": "3:36:17", "remaining_time": "0:30:52"}
995
+ {"current_steps": 968, "total_steps": 1105, "loss": 1.0428, "lr": 1.8457468878221885e-06, "epoch": 4.376550169109358, "percentage": 87.6, "elapsed_time": "3:36:41", "remaining_time": "0:30:40"}
996
+ {"current_steps": 969, "total_steps": 1105, "loss": 0.9669, "lr": 1.8193147024593604e-06, "epoch": 4.381059751972942, "percentage": 87.69, "elapsed_time": "3:37:05", "remaining_time": "0:30:28"}
997
+ {"current_steps": 970, "total_steps": 1105, "loss": 1.074, "lr": 1.7930641258863501e-06, "epoch": 4.385569334836528, "percentage": 87.78, "elapsed_time": "3:37:30", "remaining_time": "0:30:16"}
998
+ {"current_steps": 971, "total_steps": 1105, "loss": 1.0294, "lr": 1.7669954203229545e-06, "epoch": 4.390078917700112, "percentage": 87.87, "elapsed_time": "3:37:54", "remaining_time": "0:30:04"}
999
+ {"current_steps": 972, "total_steps": 1105, "loss": 1.0098, "lr": 1.7411088461722281e-06, "epoch": 4.394588500563698, "percentage": 87.96, "elapsed_time": "3:38:18", "remaining_time": "0:29:52"}
1000
+ {"current_steps": 973, "total_steps": 1105, "loss": 0.9963, "lr": 1.7154046620178966e-06, "epoch": 4.399098083427283, "percentage": 88.05, "elapsed_time": "3:38:42", "remaining_time": "0:29:40"}
1001
+ {"current_steps": 974, "total_steps": 1105, "loss": 1.0725, "lr": 1.6898831246217805e-06, "epoch": 4.403607666290868, "percentage": 88.14, "elapsed_time": "3:39:06", "remaining_time": "0:29:28"}
1002
+ {"current_steps": 975, "total_steps": 1105, "loss": 1.0174, "lr": 1.6645444889212158e-06, "epoch": 4.408117249154453, "percentage": 88.24, "elapsed_time": "3:39:30", "remaining_time": "0:29:16"}
1003
+ {"current_steps": 976, "total_steps": 1105, "loss": 0.9963, "lr": 1.6393890080265173e-06, "epoch": 4.412626832018038, "percentage": 88.33, "elapsed_time": "3:39:54", "remaining_time": "0:29:03"}
1004
+ {"current_steps": 977, "total_steps": 1105, "loss": 1.0336, "lr": 1.6144169332184456e-06, "epoch": 4.4171364148816235, "percentage": 88.42, "elapsed_time": "3:40:18", "remaining_time": "0:28:51"}
1005
+ {"current_steps": 978, "total_steps": 1105, "loss": 1.0174, "lr": 1.5896285139457046e-06, "epoch": 4.421645997745209, "percentage": 88.51, "elapsed_time": "3:40:42", "remaining_time": "0:28:39"}
1006
+ {"current_steps": 979, "total_steps": 1105, "loss": 1.0222, "lr": 1.5650239978224346e-06, "epoch": 4.4261555806087935, "percentage": 88.6, "elapsed_time": "3:41:06", "remaining_time": "0:28:27"}
1007
+ {"current_steps": 980, "total_steps": 1105, "loss": 0.9948, "lr": 1.5406036306257477e-06, "epoch": 4.430665163472379, "percentage": 88.69, "elapsed_time": "3:41:29", "remaining_time": "0:28:15"}
1008
+ {"current_steps": 981, "total_steps": 1105, "loss": 1.0121, "lr": 1.5163676562932828e-06, "epoch": 4.435174746335964, "percentage": 88.78, "elapsed_time": "3:41:53", "remaining_time": "0:28:02"}
1009
+ {"current_steps": 982, "total_steps": 1105, "loss": 1.0336, "lr": 1.4923163169207456e-06, "epoch": 4.439684329199549, "percentage": 88.87, "elapsed_time": "3:42:17", "remaining_time": "0:27:50"}
1010
+ {"current_steps": 983, "total_steps": 1105, "loss": 0.9924, "lr": 1.4684498527595147e-06, "epoch": 4.444193912063134, "percentage": 88.96, "elapsed_time": "3:42:41", "remaining_time": "0:27:38"}
1011
+ {"current_steps": 984, "total_steps": 1105, "loss": 1.0497, "lr": 1.4447685022142288e-06, "epoch": 4.448703494926719, "percentage": 89.05, "elapsed_time": "3:43:05", "remaining_time": "0:27:25"}
1012
+ {"current_steps": 985, "total_steps": 1105, "loss": 0.9923, "lr": 1.4212725018404072e-06, "epoch": 4.453213077790305, "percentage": 89.14, "elapsed_time": "3:43:29", "remaining_time": "0:27:13"}
1013
+ {"current_steps": 986, "total_steps": 1105, "loss": 1.0515, "lr": 1.397962086342075e-06, "epoch": 4.457722660653889, "percentage": 89.23, "elapsed_time": "3:43:53", "remaining_time": "0:27:01"}
1014
+ {"current_steps": 987, "total_steps": 1105, "loss": 1.0174, "lr": 1.3748374885694516e-06, "epoch": 4.462232243517475, "percentage": 89.32, "elapsed_time": "3:44:17", "remaining_time": "0:26:48"}
1015
+ {"current_steps": 988, "total_steps": 1105, "loss": 1.058, "lr": 1.3518989395165848e-06, "epoch": 4.466741826381059, "percentage": 89.41, "elapsed_time": "3:44:41", "remaining_time": "0:26:36"}
1016
+ {"current_steps": 989, "total_steps": 1105, "loss": 1.0205, "lr": 1.329146668319068e-06, "epoch": 4.471251409244645, "percentage": 89.5, "elapsed_time": "3:45:05", "remaining_time": "0:26:24"}
1017
+ {"current_steps": 990, "total_steps": 1105, "loss": 1.0191, "lr": 1.3065809022517506e-06, "epoch": 4.4757609921082295, "percentage": 89.59, "elapsed_time": "3:45:29", "remaining_time": "0:26:11"}
1018
+ {"current_steps": 991, "total_steps": 1105, "loss": 1.0353, "lr": 1.2842018667264533e-06, "epoch": 4.480270574971815, "percentage": 89.68, "elapsed_time": "3:45:53", "remaining_time": "0:25:59"}
1019
+ {"current_steps": 992, "total_steps": 1105, "loss": 1.0341, "lr": 1.2620097852897394e-06, "epoch": 4.4847801578354005, "percentage": 89.77, "elapsed_time": "3:46:16", "remaining_time": "0:25:46"}
1020
+ {"current_steps": 993, "total_steps": 1105, "loss": 1.025, "lr": 1.240004879620651e-06, "epoch": 4.489289740698985, "percentage": 89.86, "elapsed_time": "3:46:40", "remaining_time": "0:25:34"}
1021
+ {"current_steps": 994, "total_steps": 1105, "loss": 1.0452, "lr": 1.2181873695285251e-06, "epoch": 4.493799323562571, "percentage": 89.95, "elapsed_time": "3:47:05", "remaining_time": "0:25:21"}
1022
+ {"current_steps": 995, "total_steps": 1105, "loss": 1.0354, "lr": 1.1965574729507746e-06, "epoch": 4.498308906426155, "percentage": 90.05, "elapsed_time": "3:47:29", "remaining_time": "0:25:09"}
1023
+ {"current_steps": 996, "total_steps": 1105, "loss": 1.0255, "lr": 1.1751154059507308e-06, "epoch": 4.502818489289741, "percentage": 90.14, "elapsed_time": "3:47:53", "remaining_time": "0:24:56"}
1024
+ {"current_steps": 997, "total_steps": 1105, "loss": 1.0162, "lr": 1.1538613827154688e-06, "epoch": 4.507328072153326, "percentage": 90.23, "elapsed_time": "3:48:18", "remaining_time": "0:24:43"}
1025
+ {"current_steps": 998, "total_steps": 1105, "loss": 1.0288, "lr": 1.1327956155536746e-06, "epoch": 4.511837655016911, "percentage": 90.32, "elapsed_time": "3:48:42", "remaining_time": "0:24:31"}
1026
+ {"current_steps": 999, "total_steps": 1105, "loss": 1.0719, "lr": 1.1119183148935298e-06, "epoch": 4.516347237880496, "percentage": 90.41, "elapsed_time": "3:49:06", "remaining_time": "0:24:18"}
1027
+ {"current_steps": 1000, "total_steps": 1105, "loss": 1.0291, "lr": 1.0912296892805952e-06, "epoch": 4.520856820744081, "percentage": 90.5, "elapsed_time": "3:49:30", "remaining_time": "0:24:05"}
1028
+ {"current_steps": 1001, "total_steps": 1105, "loss": 0.9935, "lr": 1.0707299453757481e-06, "epoch": 4.525366403607666, "percentage": 90.59, "elapsed_time": "3:49:54", "remaining_time": "0:23:53"}
1029
+ {"current_steps": 1002, "total_steps": 1105, "loss": 1.0203, "lr": 1.0504192879530928e-06, "epoch": 4.529875986471252, "percentage": 90.68, "elapsed_time": "3:50:18", "remaining_time": "0:23:40"}
1030
+ {"current_steps": 1003, "total_steps": 1105, "loss": 0.9729, "lr": 1.0302979198979425e-06, "epoch": 4.5343855693348365, "percentage": 90.77, "elapsed_time": "3:50:42", "remaining_time": "0:23:27"}
1031
+ {"current_steps": 1004, "total_steps": 1105, "loss": 0.9821, "lr": 1.0103660422047712e-06, "epoch": 4.538895152198422, "percentage": 90.86, "elapsed_time": "3:51:06", "remaining_time": "0:23:14"}
1032
+ {"current_steps": 1005, "total_steps": 1105, "loss": 1.0874, "lr": 9.906238539752122e-07, "epoch": 4.543404735062007, "percentage": 90.95, "elapsed_time": "3:51:30", "remaining_time": "0:23:02"}
1033
+ {"current_steps": 1006, "total_steps": 1105, "loss": 0.9841, "lr": 9.710715524160785e-07, "epoch": 4.547914317925592, "percentage": 91.04, "elapsed_time": "3:51:54", "remaining_time": "0:22:49"}
1034
+ {"current_steps": 1007, "total_steps": 1105, "loss": 1.0535, "lr": 9.517093328373739e-07, "epoch": 4.552423900789177, "percentage": 91.13, "elapsed_time": "3:52:18", "remaining_time": "0:22:36"}
1035
+ {"current_steps": 1008, "total_steps": 1105, "loss": 1.0435, "lr": 9.325373886503652e-07, "epoch": 4.556933483652762, "percentage": 91.22, "elapsed_time": "3:52:42", "remaining_time": "0:22:23"}
1036
+ {"current_steps": 1009, "total_steps": 1105, "loss": 1.0348, "lr": 9.135559113656245e-07, "epoch": 4.561443066516347, "percentage": 91.31, "elapsed_time": "3:53:06", "remaining_time": "0:22:10"}
1037
+ {"current_steps": 1010, "total_steps": 1105, "loss": 1.0268, "lr": 8.947650905911431e-07, "epoch": 4.565952649379932, "percentage": 91.4, "elapsed_time": "3:53:30", "remaining_time": "0:21:57"}
1038
+ {"current_steps": 1011, "total_steps": 1105, "loss": 1.0381, "lr": 8.761651140304184e-07, "epoch": 4.570462232243518, "percentage": 91.49, "elapsed_time": "3:53:54", "remaining_time": "0:21:44"}
1039
+ {"current_steps": 1012, "total_steps": 1105, "loss": 1.0275, "lr": 8.577561674805856e-07, "epoch": 4.574971815107102, "percentage": 91.58, "elapsed_time": "3:54:17", "remaining_time": "0:21:31"}
1040
+ {"current_steps": 1013, "total_steps": 1105, "loss": 0.9977, "lr": 8.395384348305602e-07, "epoch": 4.579481397970688, "percentage": 91.67, "elapsed_time": "3:54:41", "remaining_time": "0:21:18"}
1041
+ {"current_steps": 1014, "total_steps": 1105, "loss": 1.0414, "lr": 8.215120980591984e-07, "epoch": 4.5839909808342725, "percentage": 91.76, "elapsed_time": "3:55:05", "remaining_time": "0:21:05"}
1042
+ {"current_steps": 1015, "total_steps": 1105, "loss": 1.0303, "lr": 8.036773372334905e-07, "epoch": 4.588500563697858, "percentage": 91.86, "elapsed_time": "3:55:30", "remaining_time": "0:20:52"}
1043
+ {"current_steps": 1016, "total_steps": 1105, "loss": 0.9987, "lr": 7.860343305067441e-07, "epoch": 4.5930101465614435, "percentage": 91.95, "elapsed_time": "3:55:54", "remaining_time": "0:20:39"}
1044
+ {"current_steps": 1017, "total_steps": 1105, "loss": 1.0318, "lr": 7.685832541168281e-07, "epoch": 4.597519729425028, "percentage": 92.04, "elapsed_time": "3:56:18", "remaining_time": "0:20:26"}
1045
+ {"current_steps": 1018, "total_steps": 1105, "loss": 1.0009, "lr": 7.513242823843892e-07, "epoch": 4.602029312288614, "percentage": 92.13, "elapsed_time": "3:56:42", "remaining_time": "0:20:13"}
1046
+ {"current_steps": 1019, "total_steps": 1105, "loss": 1.016, "lr": 7.342575877111225e-07, "epoch": 4.606538895152198, "percentage": 92.22, "elapsed_time": "3:57:06", "remaining_time": "0:20:00"}
1047
+ {"current_steps": 1020, "total_steps": 1105, "loss": 1.0222, "lr": 7.173833405780439e-07, "epoch": 4.611048478015784, "percentage": 92.31, "elapsed_time": "3:57:29", "remaining_time": "0:19:47"}
1048
+ {"current_steps": 1021, "total_steps": 1105, "loss": 1.0526, "lr": 7.007017095438029e-07, "epoch": 4.615558060879369, "percentage": 92.4, "elapsed_time": "3:57:54", "remaining_time": "0:19:34"}
1049
+ {"current_steps": 1022, "total_steps": 1105, "loss": 0.9788, "lr": 6.842128612429677e-07, "epoch": 4.620067643742954, "percentage": 92.49, "elapsed_time": "3:58:18", "remaining_time": "0:19:21"}
1050
+ {"current_steps": 1023, "total_steps": 1105, "loss": 1.0264, "lr": 6.67916960384396e-07, "epoch": 4.624577226606539, "percentage": 92.58, "elapsed_time": "3:58:42", "remaining_time": "0:19:08"}
1051
+ {"current_steps": 1024, "total_steps": 1105, "loss": 0.9908, "lr": 6.51814169749565e-07, "epoch": 4.629086809470124, "percentage": 92.67, "elapsed_time": "3:59:06", "remaining_time": "0:18:54"}
1052
+ {"current_steps": 1025, "total_steps": 1105, "loss": 1.0425, "lr": 6.359046501909527e-07, "epoch": 4.633596392333709, "percentage": 92.76, "elapsed_time": "3:59:30", "remaining_time": "0:18:41"}
1053
+ {"current_steps": 1026, "total_steps": 1105, "loss": 1.0332, "lr": 6.20188560630437e-07, "epoch": 4.638105975197294, "percentage": 92.85, "elapsed_time": "3:59:54", "remaining_time": "0:18:28"}
1054
+ {"current_steps": 1027, "total_steps": 1105, "loss": 1.0296, "lr": 6.046660580576968e-07, "epoch": 4.642615558060879, "percentage": 92.94, "elapsed_time": "4:00:19", "remaining_time": "0:18:15"}
1055
+ {"current_steps": 1028, "total_steps": 1105, "loss": 0.995, "lr": 5.89337297528656e-07, "epoch": 4.647125140924464, "percentage": 93.03, "elapsed_time": "4:00:43", "remaining_time": "0:18:01"}
1056
+ {"current_steps": 1029, "total_steps": 1105, "loss": 0.9963, "lr": 5.742024321639217e-07, "epoch": 4.6516347237880495, "percentage": 93.12, "elapsed_time": "4:01:07", "remaining_time": "0:17:48"}
1057
+ {"current_steps": 1030, "total_steps": 1105, "loss": 1.0056, "lr": 5.592616131472727e-07, "epoch": 4.656144306651635, "percentage": 93.21, "elapsed_time": "4:01:31", "remaining_time": "0:17:35"}
1058
+ {"current_steps": 1031, "total_steps": 1105, "loss": 1.0245, "lr": 5.445149897241275e-07, "epoch": 4.66065388951522, "percentage": 93.3, "elapsed_time": "4:01:55", "remaining_time": "0:17:21"}
1059
+ {"current_steps": 1032, "total_steps": 1105, "loss": 1.0151, "lr": 5.29962709200067e-07, "epoch": 4.665163472378805, "percentage": 93.39, "elapsed_time": "4:02:19", "remaining_time": "0:17:08"}
1060
+ {"current_steps": 1033, "total_steps": 1105, "loss": 1.0037, "lr": 5.156049169393673e-07, "epoch": 4.66967305524239, "percentage": 93.48, "elapsed_time": "4:02:42", "remaining_time": "0:16:55"}
1061
+ {"current_steps": 1034, "total_steps": 1105, "loss": 1.0042, "lr": 5.014417563635276e-07, "epoch": 4.674182638105975, "percentage": 93.57, "elapsed_time": "4:03:06", "remaining_time": "0:16:41"}
1062
+ {"current_steps": 1035, "total_steps": 1105, "loss": 1.0164, "lr": 4.874733689498645e-07, "epoch": 4.678692220969561, "percentage": 93.67, "elapsed_time": "4:03:30", "remaining_time": "0:16:28"}
1063
+ {"current_steps": 1036, "total_steps": 1105, "loss": 0.9919, "lr": 4.73699894230073e-07, "epoch": 4.683201803833145, "percentage": 93.76, "elapsed_time": "4:03:54", "remaining_time": "0:16:14"}
1064
+ {"current_steps": 1037, "total_steps": 1105, "loss": 1.0171, "lr": 4.6012146978885677e-07, "epoch": 4.687711386696731, "percentage": 93.85, "elapsed_time": "4:04:18", "remaining_time": "0:16:01"}
1065
+ {"current_steps": 1038, "total_steps": 1105, "loss": 1.0286, "lr": 4.46738231262529e-07, "epoch": 4.692220969560315, "percentage": 93.94, "elapsed_time": "4:04:42", "remaining_time": "0:15:47"}
1066
+ {"current_steps": 1039, "total_steps": 1105, "loss": 1.0506, "lr": 4.3355031233767607e-07, "epoch": 4.696730552423901, "percentage": 94.03, "elapsed_time": "4:05:06", "remaining_time": "0:15:34"}
1067
+ {"current_steps": 1040, "total_steps": 1105, "loss": 0.9963, "lr": 4.205578447498204e-07, "epoch": 4.7012401352874855, "percentage": 94.12, "elapsed_time": "4:05:30", "remaining_time": "0:15:20"}
1068
+ {"current_steps": 1041, "total_steps": 1105, "loss": 0.989, "lr": 4.0776095828209074e-07, "epoch": 4.705749718151071, "percentage": 94.21, "elapsed_time": "4:05:55", "remaining_time": "0:15:07"}
1069
+ {"current_steps": 1042, "total_steps": 1105, "loss": 1.0065, "lr": 3.9515978076394293e-07, "epoch": 4.7102593010146565, "percentage": 94.3, "elapsed_time": "4:06:18", "remaining_time": "0:14:53"}
1070
+ {"current_steps": 1043, "total_steps": 1105, "loss": 1.0051, "lr": 3.8275443806987446e-07, "epoch": 4.714768883878241, "percentage": 94.39, "elapsed_time": "4:06:42", "remaining_time": "0:14:39"}
1071
+ {"current_steps": 1044, "total_steps": 1105, "loss": 1.0428, "lr": 3.7054505411816543e-07, "epoch": 4.719278466741827, "percentage": 94.48, "elapsed_time": "4:07:06", "remaining_time": "0:14:26"}
1072
+ {"current_steps": 1045, "total_steps": 1105, "loss": 1.048, "lr": 3.5853175086964176e-07, "epoch": 4.723788049605411, "percentage": 94.57, "elapsed_time": "4:07:30", "remaining_time": "0:14:12"}
1073
+ {"current_steps": 1046, "total_steps": 1105, "loss": 1.0315, "lr": 3.467146483264672e-07, "epoch": 4.728297632468997, "percentage": 94.66, "elapsed_time": "4:07:54", "remaining_time": "0:13:58"}
1074
+ {"current_steps": 1047, "total_steps": 1105, "loss": 1.0532, "lr": 3.350938645309243e-07, "epoch": 4.732807215332581, "percentage": 94.75, "elapsed_time": "4:08:18", "remaining_time": "0:13:45"}
1075
+ {"current_steps": 1048, "total_steps": 1105, "loss": 1.0143, "lr": 3.236695155642555e-07, "epoch": 4.737316798196167, "percentage": 94.84, "elapsed_time": "4:08:42", "remaining_time": "0:13:31"}
1076
+ {"current_steps": 1049, "total_steps": 1105, "loss": 1.0477, "lr": 3.124417155454884e-07, "epoch": 4.741826381059752, "percentage": 94.93, "elapsed_time": "4:09:06", "remaining_time": "0:13:17"}
1077
+ {"current_steps": 1050, "total_steps": 1105, "loss": 1.0488, "lr": 3.0141057663030773e-07, "epoch": 4.746335963923337, "percentage": 95.02, "elapsed_time": "4:09:30", "remaining_time": "0:13:04"}
1078
+ {"current_steps": 1051, "total_steps": 1105, "loss": 1.0023, "lr": 2.905762090099318e-07, "epoch": 4.750845546786922, "percentage": 95.11, "elapsed_time": "4:09:54", "remaining_time": "0:12:50"}
1079
+ {"current_steps": 1052, "total_steps": 1105, "loss": 1.0308, "lr": 2.799387209100002e-07, "epoch": 4.755355129650507, "percentage": 95.2, "elapsed_time": "4:10:19", "remaining_time": "0:12:36"}
1080
+ {"current_steps": 1053, "total_steps": 1105, "loss": 1.0129, "lr": 2.6949821858951007e-07, "epoch": 4.7598647125140925, "percentage": 95.29, "elapsed_time": "4:10:42", "remaining_time": "0:12:22"}
1081
+ {"current_steps": 1054, "total_steps": 1105, "loss": 1.0176, "lr": 2.5925480633974154e-07, "epoch": 4.764374295377678, "percentage": 95.38, "elapsed_time": "4:11:06", "remaining_time": "0:12:09"}
1082
+ {"current_steps": 1055, "total_steps": 1105, "loss": 1.0089, "lr": 2.492085864832272e-07, "epoch": 4.768883878241263, "percentage": 95.48, "elapsed_time": "4:11:30", "remaining_time": "0:11:55"}
1083
+ {"current_steps": 1056, "total_steps": 1105, "loss": 1.0065, "lr": 2.393596593727199e-07, "epoch": 4.773393461104848, "percentage": 95.57, "elapsed_time": "4:11:54", "remaining_time": "0:11:41"}
1084
+ {"current_steps": 1057, "total_steps": 1105, "loss": 1.0002, "lr": 2.29708123390191e-07, "epoch": 4.777903043968433, "percentage": 95.66, "elapsed_time": "4:12:19", "remaining_time": "0:11:27"}
1085
+ {"current_steps": 1058, "total_steps": 1105, "loss": 1.0396, "lr": 2.202540749458626e-07, "epoch": 4.782412626832018, "percentage": 95.75, "elapsed_time": "4:12:43", "remaining_time": "0:11:13"}
1086
+ {"current_steps": 1059, "total_steps": 1105, "loss": 1.0345, "lr": 2.1099760847721696e-07, "epoch": 4.786922209695603, "percentage": 95.84, "elapsed_time": "4:13:07", "remaining_time": "0:10:59"}
1087
+ {"current_steps": 1060, "total_steps": 1105, "loss": 0.9979, "lr": 2.01938816448084e-07, "epoch": 4.791431792559188, "percentage": 95.93, "elapsed_time": "4:13:31", "remaining_time": "0:10:45"}
1088
+ {"current_steps": 1061, "total_steps": 1105, "loss": 1.0055, "lr": 1.9307778934769316e-07, "epoch": 4.795941375422774, "percentage": 96.02, "elapsed_time": "4:13:55", "remaining_time": "0:10:31"}
1089
+ {"current_steps": 1062, "total_steps": 1105, "loss": 1.0618, "lr": 1.844146156897808e-07, "epoch": 4.800450958286358, "percentage": 96.11, "elapsed_time": "4:14:19", "remaining_time": "0:10:17"}
1090
+ {"current_steps": 1063, "total_steps": 1105, "loss": 1.0315, "lr": 1.7594938201170863e-07, "epoch": 4.804960541149944, "percentage": 96.2, "elapsed_time": "4:14:43", "remaining_time": "0:10:03"}
1091
+ {"current_steps": 1064, "total_steps": 1105, "loss": 1.0378, "lr": 1.676821728735889e-07, "epoch": 4.8094701240135285, "percentage": 96.29, "elapsed_time": "4:15:08", "remaining_time": "0:09:49"}
1092
+ {"current_steps": 1065, "total_steps": 1105, "loss": 1.0235, "lr": 1.596130708574517e-07, "epoch": 4.813979706877114, "percentage": 96.38, "elapsed_time": "4:15:32", "remaining_time": "0:09:35"}
1093
+ {"current_steps": 1066, "total_steps": 1105, "loss": 1.0427, "lr": 1.517421565664101e-07, "epoch": 4.818489289740699, "percentage": 96.47, "elapsed_time": "4:15:56", "remaining_time": "0:09:21"}
1094
+ {"current_steps": 1067, "total_steps": 1105, "loss": 1.0378, "lr": 1.440695086238586e-07, "epoch": 4.822998872604284, "percentage": 96.56, "elapsed_time": "4:16:20", "remaining_time": "0:09:07"}
1095
+ {"current_steps": 1068, "total_steps": 1105, "loss": 1.0141, "lr": 1.3659520367269142e-07, "epoch": 4.8275084554678696, "percentage": 96.65, "elapsed_time": "4:16:44", "remaining_time": "0:08:53"}
1096
+ {"current_steps": 1069, "total_steps": 1105, "loss": 1.0116, "lr": 1.293193163745299e-07, "epoch": 4.832018038331454, "percentage": 96.74, "elapsed_time": "4:17:08", "remaining_time": "0:08:39"}
1097
+ {"current_steps": 1070, "total_steps": 1105, "loss": 1.0422, "lr": 1.2224191940898521e-07, "epoch": 4.83652762119504, "percentage": 96.83, "elapsed_time": "4:17:31", "remaining_time": "0:08:25"}
1098
+ {"current_steps": 1071, "total_steps": 1105, "loss": 0.9952, "lr": 1.1536308347292357e-07, "epoch": 4.841037204058624, "percentage": 96.92, "elapsed_time": "4:17:54", "remaining_time": "0:08:11"}
1099
+ {"current_steps": 1072, "total_steps": 1105, "loss": 0.9925, "lr": 1.0868287727976434e-07, "epoch": 4.84554678692221, "percentage": 97.01, "elapsed_time": "4:18:19", "remaining_time": "0:07:57"}
1100
+ {"current_steps": 1073, "total_steps": 1105, "loss": 1.0123, "lr": 1.0220136755879407e-07, "epoch": 4.850056369785795, "percentage": 97.1, "elapsed_time": "4:18:43", "remaining_time": "0:07:42"}
1101
+ {"current_steps": 1074, "total_steps": 1105, "loss": 0.9797, "lr": 9.59186190545025e-08, "epoch": 4.85456595264938, "percentage": 97.19, "elapsed_time": "4:19:07", "remaining_time": "0:07:28"}
1102
+ {"current_steps": 1075, "total_steps": 1105, "loss": 1.0002, "lr": 8.983469452592542e-08, "epoch": 4.859075535512965, "percentage": 97.29, "elapsed_time": "4:19:31", "remaining_time": "0:07:14"}
1103
+ {"current_steps": 1076, "total_steps": 1105, "loss": 1.055, "lr": 8.394965474602945e-08, "epoch": 4.86358511837655, "percentage": 97.38, "elapsed_time": "4:19:55", "remaining_time": "0:07:00"}
1104
+ {"current_steps": 1077, "total_steps": 1105, "loss": 1.0411, "lr": 7.826355850110378e-08, "epoch": 4.868094701240135, "percentage": 97.47, "elapsed_time": "4:20:19", "remaining_time": "0:06:46"}
1105
+ {"current_steps": 1078, "total_steps": 1105, "loss": 1.0188, "lr": 7.277646259016058e-08, "epoch": 4.87260428410372, "percentage": 97.56, "elapsed_time": "4:20:43", "remaining_time": "0:06:31"}
1106
+ {"current_steps": 1079, "total_steps": 1105, "loss": 1.0482, "lr": 6.748842182438654e-08, "epoch": 4.8771138669673055, "percentage": 97.65, "elapsed_time": "4:21:07", "remaining_time": "0:06:17"}
1107
+ {"current_steps": 1080, "total_steps": 1105, "loss": 1.0822, "lr": 6.239948902657667e-08, "epoch": 4.881623449830891, "percentage": 97.74, "elapsed_time": "4:21:31", "remaining_time": "0:06:03"}
1108
+ {"current_steps": 1081, "total_steps": 1105, "loss": 0.9551, "lr": 5.7509715030621414e-08, "epoch": 4.886133032694476, "percentage": 97.83, "elapsed_time": "4:21:55", "remaining_time": "0:05:48"}
1109
+ {"current_steps": 1082, "total_steps": 1105, "loss": 1.0322, "lr": 5.281914868098925e-08, "epoch": 4.890642615558061, "percentage": 97.92, "elapsed_time": "4:22:19", "remaining_time": "0:05:34"}
1110
+ {"current_steps": 1083, "total_steps": 1105, "loss": 1.02, "lr": 4.8327836832244846e-08, "epoch": 4.895152198421646, "percentage": 98.01, "elapsed_time": "4:22:43", "remaining_time": "0:05:20"}
1111
+ {"current_steps": 1084, "total_steps": 1105, "loss": 1.0162, "lr": 4.403582434857834e-08, "epoch": 4.899661781285231, "percentage": 98.1, "elapsed_time": "4:23:07", "remaining_time": "0:05:05"}
1112
+ {"current_steps": 1085, "total_steps": 1105, "loss": 1.0376, "lr": 3.9943154103356805e-08, "epoch": 4.904171364148816, "percentage": 98.19, "elapsed_time": "4:23:32", "remaining_time": "0:04:51"}
1113
+ {"current_steps": 1086, "total_steps": 1105, "loss": 1.0141, "lr": 3.6049866978693504e-08, "epoch": 4.908680947012401, "percentage": 98.28, "elapsed_time": "4:23:56", "remaining_time": "0:04:37"}
1114
+ {"current_steps": 1087, "total_steps": 1105, "loss": 1.0248, "lr": 3.235600186505039e-08, "epoch": 4.913190529875987, "percentage": 98.37, "elapsed_time": "4:24:20", "remaining_time": "0:04:22"}
1115
+ {"current_steps": 1088, "total_steps": 1105, "loss": 1.0362, "lr": 2.886159566083402e-08, "epoch": 4.917700112739571, "percentage": 98.46, "elapsed_time": "4:24:43", "remaining_time": "0:04:08"}
1116
+ {"current_steps": 1089, "total_steps": 1105, "loss": 0.9985, "lr": 2.556668327203582e-08, "epoch": 4.922209695603157, "percentage": 98.55, "elapsed_time": "4:25:08", "remaining_time": "0:03:53"}
1117
+ {"current_steps": 1090, "total_steps": 1105, "loss": 1.0511, "lr": 2.2471297611890154e-08, "epoch": 4.9267192784667415, "percentage": 98.64, "elapsed_time": "4:25:32", "remaining_time": "0:03:39"}
1118
+ {"current_steps": 1091, "total_steps": 1105, "loss": 1.0296, "lr": 1.957546960052792e-08, "epoch": 4.931228861330327, "percentage": 98.73, "elapsed_time": "4:25:56", "remaining_time": "0:03:24"}
1119
+ {"current_steps": 1092, "total_steps": 1105, "loss": 1.0352, "lr": 1.687922816468346e-08, "epoch": 4.9357384441939125, "percentage": 98.82, "elapsed_time": "4:26:19", "remaining_time": "0:03:10"}
1120
+ {"current_steps": 1093, "total_steps": 1105, "loss": 1.0032, "lr": 1.4382600237394794e-08, "epoch": 4.940248027057497, "percentage": 98.91, "elapsed_time": "4:26:43", "remaining_time": "0:02:55"}
1121
+ {"current_steps": 1094, "total_steps": 1105, "loss": 1.0472, "lr": 1.2085610757746057e-08, "epoch": 4.944757609921083, "percentage": 99.0, "elapsed_time": "4:27:08", "remaining_time": "0:02:41"}
1122
+ {"current_steps": 1095, "total_steps": 1105, "loss": 1.0006, "lr": 9.988282670607696e-09, "epoch": 4.949267192784667, "percentage": 99.1, "elapsed_time": "4:27:32", "remaining_time": "0:02:26"}
1123
+ {"current_steps": 1096, "total_steps": 1105, "loss": 1.0547, "lr": 8.090636926409989e-09, "epoch": 4.953776775648253, "percentage": 99.19, "elapsed_time": "4:27:56", "remaining_time": "0:02:12"}
1124
+ {"current_steps": 1097, "total_steps": 1105, "loss": 1.0623, "lr": 6.392692480938767e-09, "epoch": 4.958286358511837, "percentage": 99.28, "elapsed_time": "4:28:21", "remaining_time": "0:01:57"}
1125
+ {"current_steps": 1098, "total_steps": 1105, "loss": 1.0375, "lr": 4.89446629514001e-09, "epoch": 4.962795941375423, "percentage": 99.37, "elapsed_time": "4:28:45", "remaining_time": "0:01:42"}
1126
+ {"current_steps": 1099, "total_steps": 1105, "loss": 1.0433, "lr": 3.5959733349555382e-09, "epoch": 4.967305524239007, "percentage": 99.46, "elapsed_time": "4:29:09", "remaining_time": "0:01:28"}
1127
+ {"current_steps": 1100, "total_steps": 1105, "loss": 0.9994, "lr": 2.4972265711653563e-09, "epoch": 4.971815107102593, "percentage": 99.55, "elapsed_time": "4:29:33", "remaining_time": "0:01:13"}
1128
+ {"current_steps": 1101, "total_steps": 1105, "loss": 1.0461, "lr": 1.5982369792699737e-09, "epoch": 4.976324689966178, "percentage": 99.64, "elapsed_time": "4:29:57", "remaining_time": "0:00:58"}
1129
+ {"current_steps": 1102, "total_steps": 1105, "loss": 1.0319, "lr": 8.990135393727173e-10, "epoch": 4.980834272829763, "percentage": 99.73, "elapsed_time": "4:30:21", "remaining_time": "0:00:44"}
1130
+ {"current_steps": 1103, "total_steps": 1105, "loss": 1.0478, "lr": 3.995632360864754e-10, "epoch": 4.9853438556933485, "percentage": 99.82, "elapsed_time": "4:30:45", "remaining_time": "0:00:29"}
1131
+ {"current_steps": 1104, "total_steps": 1105, "loss": 1.0286, "lr": 9.989105847818536e-11, "epoch": 4.989853438556933, "percentage": 99.91, "elapsed_time": "4:31:09", "remaining_time": "0:00:14"}
1132
+ {"current_steps": 1105, "total_steps": 1105, "loss": 0.9683, "lr": 0.0, "epoch": 4.994363021420519, "percentage": 100.0, "elapsed_time": "4:31:34", "remaining_time": "0:00:00"}
1133
+ {"current_steps": 1105, "total_steps": 1105, "epoch": 4.994363021420519, "percentage": 100.0, "elapsed_time": "4:36:16", "remaining_time": "0:00:00"}