Training in progress, epoch 4
Browse files
model-00001-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4877660776
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f3b1916b0620b47f9a8f7c35beee8fe22a64a1e29097d647a735e12813ac7508
|
3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4932751008
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:efdd687e6d8b3e13c352ad92f086b6ea74ea31c5f3242158ade55e0c470d76b8
|
3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4330865200
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:621a23f90ae0aaa7606478100ba3c63db23cb19093651ff5bc3dfb90b9571bec
|
3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1089994880
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3534f511c6c7c6bf69ee5b28b6cf951607dde1b1add09eb309c1767abc5ad86e
|
3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
@@ -725,3 +725,244 @@
|
|
725 |
{"current_steps": 725, "total_steps": 1200, "loss": 0.4256, "lr": 1.6240944911997765e-05, "epoch": 3.0208333333333335, "percentage": 60.42, "elapsed_time": "4:47:20", "remaining_time": "3:08:15"}
|
726 |
{"current_steps": 726, "total_steps": 1200, "loss": 0.4304, "lr": 1.6183820092469103e-05, "epoch": 3.025, "percentage": 60.5, "elapsed_time": "4:47:42", "remaining_time": "3:07:50"}
|
727 |
{"current_steps": 727, "total_steps": 1200, "loss": 0.437, "lr": 1.6126727563886485e-05, "epoch": 3.029166666666667, "percentage": 60.58, "elapsed_time": "4:48:05", "remaining_time": "3:07:26"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
725 |
{"current_steps": 725, "total_steps": 1200, "loss": 0.4256, "lr": 1.6240944911997765e-05, "epoch": 3.0208333333333335, "percentage": 60.42, "elapsed_time": "4:47:20", "remaining_time": "3:08:15"}
|
726 |
{"current_steps": 726, "total_steps": 1200, "loss": 0.4304, "lr": 1.6183820092469103e-05, "epoch": 3.025, "percentage": 60.5, "elapsed_time": "4:47:42", "remaining_time": "3:07:50"}
|
727 |
{"current_steps": 727, "total_steps": 1200, "loss": 0.437, "lr": 1.6126727563886485e-05, "epoch": 3.029166666666667, "percentage": 60.58, "elapsed_time": "4:48:05", "remaining_time": "3:07:26"}
|
728 |
+
{"current_steps": 728, "total_steps": 1200, "loss": 0.4282, "lr": 1.6069667809343396e-05, "epoch": 3.033333333333333, "percentage": 60.67, "elapsed_time": "4:48:28", "remaining_time": "3:07:02"}
|
729 |
+
{"current_steps": 729, "total_steps": 1200, "loss": 0.44, "lr": 1.601264131165606e-05, "epoch": 3.0375, "percentage": 60.75, "elapsed_time": "4:48:52", "remaining_time": "3:06:38"}
|
730 |
+
{"current_steps": 730, "total_steps": 1200, "loss": 0.4316, "lr": 1.5955648553359247e-05, "epoch": 3.0416666666666665, "percentage": 60.83, "elapsed_time": "4:49:15", "remaining_time": "3:06:14"}
|
731 |
+
{"current_steps": 731, "total_steps": 1200, "loss": 0.4341, "lr": 1.5898690016702253e-05, "epoch": 3.0458333333333334, "percentage": 60.92, "elapsed_time": "4:49:39", "remaining_time": "3:05:50"}
|
732 |
+
{"current_steps": 732, "total_steps": 1200, "loss": 0.4333, "lr": 1.584176618364482e-05, "epoch": 3.05, "percentage": 61.0, "elapsed_time": "4:50:02", "remaining_time": "3:05:26"}
|
733 |
+
{"current_steps": 733, "total_steps": 1200, "loss": 0.4268, "lr": 1.5784877535853014e-05, "epoch": 3.0541666666666667, "percentage": 61.08, "elapsed_time": "4:50:26", "remaining_time": "3:05:02"}
|
734 |
+
{"current_steps": 734, "total_steps": 1200, "loss": 0.4389, "lr": 1.5728024554695204e-05, "epoch": 3.058333333333333, "percentage": 61.17, "elapsed_time": "4:50:49", "remaining_time": "3:04:38"}
|
735 |
+
{"current_steps": 735, "total_steps": 1200, "loss": 0.4442, "lr": 1.5671207721237945e-05, "epoch": 3.0625, "percentage": 61.25, "elapsed_time": "4:51:12", "remaining_time": "3:04:14"}
|
736 |
+
{"current_steps": 736, "total_steps": 1200, "loss": 0.4384, "lr": 1.561442751624193e-05, "epoch": 3.066666666666667, "percentage": 61.33, "elapsed_time": "4:51:35", "remaining_time": "3:03:49"}
|
737 |
+
{"current_steps": 737, "total_steps": 1200, "loss": 0.4284, "lr": 1.555768442015794e-05, "epoch": 3.0708333333333333, "percentage": 61.42, "elapsed_time": "4:51:58", "remaining_time": "3:03:25"}
|
738 |
+
{"current_steps": 738, "total_steps": 1200, "loss": 0.422, "lr": 1.5500978913122702e-05, "epoch": 3.075, "percentage": 61.5, "elapsed_time": "4:52:22", "remaining_time": "3:03:01"}
|
739 |
+
{"current_steps": 739, "total_steps": 1200, "loss": 0.4191, "lr": 1.5444311474954932e-05, "epoch": 3.0791666666666666, "percentage": 61.58, "elapsed_time": "4:52:45", "remaining_time": "3:02:37"}
|
740 |
+
{"current_steps": 740, "total_steps": 1200, "loss": 0.4337, "lr": 1.53876825851512e-05, "epoch": 3.0833333333333335, "percentage": 61.67, "elapsed_time": "4:53:08", "remaining_time": "3:02:13"}
|
741 |
+
{"current_steps": 741, "total_steps": 1200, "loss": 0.4263, "lr": 1.53310927228819e-05, "epoch": 3.0875, "percentage": 61.75, "elapsed_time": "4:53:31", "remaining_time": "3:01:49"}
|
742 |
+
{"current_steps": 742, "total_steps": 1200, "loss": 0.417, "lr": 1.5274542366987174e-05, "epoch": 3.091666666666667, "percentage": 61.83, "elapsed_time": "4:53:55", "remaining_time": "3:01:25"}
|
743 |
+
{"current_steps": 743, "total_steps": 1200, "loss": 0.4251, "lr": 1.5218031995972917e-05, "epoch": 3.095833333333333, "percentage": 61.92, "elapsed_time": "4:54:18", "remaining_time": "3:01:01"}
|
744 |
+
{"current_steps": 744, "total_steps": 1200, "loss": 0.4315, "lr": 1.5161562088006649e-05, "epoch": 3.1, "percentage": 62.0, "elapsed_time": "4:54:42", "remaining_time": "3:00:37"}
|
745 |
+
{"current_steps": 745, "total_steps": 1200, "loss": 0.415, "lr": 1.5105133120913524e-05, "epoch": 3.1041666666666665, "percentage": 62.08, "elapsed_time": "4:55:05", "remaining_time": "3:00:13"}
|
746 |
+
{"current_steps": 746, "total_steps": 1200, "loss": 0.4263, "lr": 1.5048745572172286e-05, "epoch": 3.1083333333333334, "percentage": 62.17, "elapsed_time": "4:55:28", "remaining_time": "2:59:49"}
|
747 |
+
{"current_steps": 747, "total_steps": 1200, "loss": 0.4254, "lr": 1.4992399918911168e-05, "epoch": 3.1125, "percentage": 62.25, "elapsed_time": "4:55:51", "remaining_time": "2:59:24"}
|
748 |
+
{"current_steps": 748, "total_steps": 1200, "loss": 0.4177, "lr": 1.4936096637903967e-05, "epoch": 3.1166666666666667, "percentage": 62.33, "elapsed_time": "4:56:13", "remaining_time": "2:59:00"}
|
749 |
+
{"current_steps": 749, "total_steps": 1200, "loss": 0.4216, "lr": 1.4879836205565887e-05, "epoch": 3.120833333333333, "percentage": 62.42, "elapsed_time": "4:56:36", "remaining_time": "2:58:36"}
|
750 |
+
{"current_steps": 750, "total_steps": 1200, "loss": 0.4281, "lr": 1.4823619097949584e-05, "epoch": 3.125, "percentage": 62.5, "elapsed_time": "4:57:00", "remaining_time": "2:58:12"}
|
751 |
+
{"current_steps": 751, "total_steps": 1200, "loss": 0.4169, "lr": 1.4767445790741133e-05, "epoch": 3.129166666666667, "percentage": 62.58, "elapsed_time": "4:57:22", "remaining_time": "2:57:47"}
|
752 |
+
{"current_steps": 752, "total_steps": 1200, "loss": 0.4394, "lr": 1.4711316759255963e-05, "epoch": 3.1333333333333333, "percentage": 62.67, "elapsed_time": "4:57:46", "remaining_time": "2:57:23"}
|
753 |
+
{"current_steps": 753, "total_steps": 1200, "loss": 0.4275, "lr": 1.4655232478434864e-05, "epoch": 3.1375, "percentage": 62.75, "elapsed_time": "4:58:09", "remaining_time": "2:56:59"}
|
754 |
+
{"current_steps": 754, "total_steps": 1200, "loss": 0.4347, "lr": 1.4599193422839987e-05, "epoch": 3.1416666666666666, "percentage": 62.83, "elapsed_time": "4:58:33", "remaining_time": "2:56:35"}
|
755 |
+
{"current_steps": 755, "total_steps": 1200, "loss": 0.4293, "lr": 1.4543200066650786e-05, "epoch": 3.1458333333333335, "percentage": 62.92, "elapsed_time": "4:58:57", "remaining_time": "2:56:12"}
|
756 |
+
{"current_steps": 756, "total_steps": 1200, "loss": 0.4202, "lr": 1.4487252883660019e-05, "epoch": 3.15, "percentage": 63.0, "elapsed_time": "4:59:20", "remaining_time": "2:55:48"}
|
757 |
+
{"current_steps": 757, "total_steps": 1200, "loss": 0.4327, "lr": 1.4431352347269769e-05, "epoch": 3.154166666666667, "percentage": 63.08, "elapsed_time": "4:59:43", "remaining_time": "2:55:24"}
|
758 |
+
{"current_steps": 758, "total_steps": 1200, "loss": 0.4311, "lr": 1.4375498930487388e-05, "epoch": 3.158333333333333, "percentage": 63.17, "elapsed_time": "5:00:07", "remaining_time": "2:55:00"}
|
759 |
+
{"current_steps": 759, "total_steps": 1200, "loss": 0.4422, "lr": 1.4319693105921548e-05, "epoch": 3.1625, "percentage": 63.25, "elapsed_time": "5:00:30", "remaining_time": "2:54:36"}
|
760 |
+
{"current_steps": 760, "total_steps": 1200, "loss": 0.4241, "lr": 1.4263935345778202e-05, "epoch": 3.1666666666666665, "percentage": 63.33, "elapsed_time": "5:00:53", "remaining_time": "2:54:12"}
|
761 |
+
{"current_steps": 761, "total_steps": 1200, "loss": 0.4322, "lr": 1.4208226121856586e-05, "epoch": 3.1708333333333334, "percentage": 63.42, "elapsed_time": "5:01:17", "remaining_time": "2:53:48"}
|
762 |
+
{"current_steps": 762, "total_steps": 1200, "loss": 0.4213, "lr": 1.4152565905545268e-05, "epoch": 3.175, "percentage": 63.5, "elapsed_time": "5:01:40", "remaining_time": "2:53:24"}
|
763 |
+
{"current_steps": 763, "total_steps": 1200, "loss": 0.431, "lr": 1.4096955167818128e-05, "epoch": 3.1791666666666667, "percentage": 63.58, "elapsed_time": "5:02:03", "remaining_time": "2:53:00"}
|
764 |
+
{"current_steps": 764, "total_steps": 1200, "loss": 0.422, "lr": 1.404139437923036e-05, "epoch": 3.183333333333333, "percentage": 63.67, "elapsed_time": "5:02:26", "remaining_time": "2:52:36"}
|
765 |
+
{"current_steps": 765, "total_steps": 1200, "loss": 0.4131, "lr": 1.3985884009914542e-05, "epoch": 3.1875, "percentage": 63.75, "elapsed_time": "5:02:50", "remaining_time": "2:52:12"}
|
766 |
+
{"current_steps": 766, "total_steps": 1200, "loss": 0.4289, "lr": 1.3930424529576593e-05, "epoch": 3.191666666666667, "percentage": 63.83, "elapsed_time": "5:03:13", "remaining_time": "2:51:47"}
|
767 |
+
{"current_steps": 767, "total_steps": 1200, "loss": 0.4241, "lr": 1.387501640749184e-05, "epoch": 3.1958333333333333, "percentage": 63.92, "elapsed_time": "5:03:36", "remaining_time": "2:51:24"}
|
768 |
+
{"current_steps": 768, "total_steps": 1200, "loss": 0.4338, "lr": 1.3819660112501054e-05, "epoch": 3.2, "percentage": 64.0, "elapsed_time": "5:03:59", "remaining_time": "2:50:59"}
|
769 |
+
{"current_steps": 769, "total_steps": 1200, "loss": 0.4337, "lr": 1.3764356113006441e-05, "epoch": 3.2041666666666666, "percentage": 64.08, "elapsed_time": "5:04:22", "remaining_time": "2:50:35"}
|
770 |
+
{"current_steps": 770, "total_steps": 1200, "loss": 0.4209, "lr": 1.3709104876967732e-05, "epoch": 3.2083333333333335, "percentage": 64.17, "elapsed_time": "5:04:46", "remaining_time": "2:50:11"}
|
771 |
+
{"current_steps": 771, "total_steps": 1200, "loss": 0.444, "lr": 1.3653906871898161e-05, "epoch": 3.2125, "percentage": 64.25, "elapsed_time": "5:05:09", "remaining_time": "2:49:47"}
|
772 |
+
{"current_steps": 772, "total_steps": 1200, "loss": 0.4355, "lr": 1.3598762564860569e-05, "epoch": 3.216666666666667, "percentage": 64.33, "elapsed_time": "5:05:32", "remaining_time": "2:49:23"}
|
773 |
+
{"current_steps": 773, "total_steps": 1200, "loss": 0.4168, "lr": 1.3543672422463426e-05, "epoch": 3.220833333333333, "percentage": 64.42, "elapsed_time": "5:05:55", "remaining_time": "2:48:59"}
|
774 |
+
{"current_steps": 774, "total_steps": 1200, "loss": 0.4406, "lr": 1.3488636910856871e-05, "epoch": 3.225, "percentage": 64.5, "elapsed_time": "5:06:17", "remaining_time": "2:48:34"}
|
775 |
+
{"current_steps": 775, "total_steps": 1200, "loss": 0.4341, "lr": 1.3433656495728781e-05, "epoch": 3.2291666666666665, "percentage": 64.58, "elapsed_time": "5:06:39", "remaining_time": "2:48:09"}
|
776 |
+
{"current_steps": 776, "total_steps": 1200, "loss": 0.4186, "lr": 1.3378731642300841e-05, "epoch": 3.2333333333333334, "percentage": 64.67, "elapsed_time": "5:07:02", "remaining_time": "2:47:45"}
|
777 |
+
{"current_steps": 777, "total_steps": 1200, "loss": 0.4331, "lr": 1.3323862815324585e-05, "epoch": 3.2375, "percentage": 64.75, "elapsed_time": "5:07:24", "remaining_time": "2:47:21"}
|
778 |
+
{"current_steps": 778, "total_steps": 1200, "loss": 0.4301, "lr": 1.3269050479077472e-05, "epoch": 3.2416666666666667, "percentage": 64.83, "elapsed_time": "5:07:48", "remaining_time": "2:46:57"}
|
779 |
+
{"current_steps": 779, "total_steps": 1200, "loss": 0.4279, "lr": 1.321429509735898e-05, "epoch": 3.245833333333333, "percentage": 64.92, "elapsed_time": "5:08:11", "remaining_time": "2:46:33"}
|
780 |
+
{"current_steps": 780, "total_steps": 1200, "loss": 0.4294, "lr": 1.3159597133486628e-05, "epoch": 3.25, "percentage": 65.0, "elapsed_time": "5:08:34", "remaining_time": "2:46:09"}
|
781 |
+
{"current_steps": 781, "total_steps": 1200, "loss": 0.4412, "lr": 1.3104957050292117e-05, "epoch": 3.2541666666666664, "percentage": 65.08, "elapsed_time": "5:08:58", "remaining_time": "2:45:45"}
|
782 |
+
{"current_steps": 782, "total_steps": 1200, "loss": 0.4332, "lr": 1.3050375310117374e-05, "epoch": 3.2583333333333333, "percentage": 65.17, "elapsed_time": "5:09:21", "remaining_time": "2:45:21"}
|
783 |
+
{"current_steps": 783, "total_steps": 1200, "loss": 0.4411, "lr": 1.2995852374810652e-05, "epoch": 3.2625, "percentage": 65.25, "elapsed_time": "5:09:45", "remaining_time": "2:44:57"}
|
784 |
+
{"current_steps": 784, "total_steps": 1200, "loss": 0.4269, "lr": 1.2941388705722627e-05, "epoch": 3.2666666666666666, "percentage": 65.33, "elapsed_time": "5:10:07", "remaining_time": "2:44:33"}
|
785 |
+
{"current_steps": 785, "total_steps": 1200, "loss": 0.4364, "lr": 1.2886984763702474e-05, "epoch": 3.2708333333333335, "percentage": 65.42, "elapsed_time": "5:10:30", "remaining_time": "2:44:09"}
|
786 |
+
{"current_steps": 786, "total_steps": 1200, "loss": 0.427, "lr": 1.2832641009093995e-05, "epoch": 3.275, "percentage": 65.5, "elapsed_time": "5:10:53", "remaining_time": "2:43:44"}
|
787 |
+
{"current_steps": 787, "total_steps": 1200, "loss": 0.436, "lr": 1.2778357901731714e-05, "epoch": 3.279166666666667, "percentage": 65.58, "elapsed_time": "5:11:16", "remaining_time": "2:43:20"}
|
788 |
+
{"current_steps": 788, "total_steps": 1200, "loss": 0.4284, "lr": 1.2724135900936979e-05, "epoch": 3.283333333333333, "percentage": 65.67, "elapsed_time": "5:11:39", "remaining_time": "2:42:57"}
|
789 |
+
{"current_steps": 789, "total_steps": 1200, "loss": 0.4289, "lr": 1.2669975465514057e-05, "epoch": 3.2875, "percentage": 65.75, "elapsed_time": "5:12:02", "remaining_time": "2:42:32"}
|
790 |
+
{"current_steps": 790, "total_steps": 1200, "loss": 0.432, "lr": 1.2615877053746315e-05, "epoch": 3.2916666666666665, "percentage": 65.83, "elapsed_time": "5:12:26", "remaining_time": "2:42:09"}
|
791 |
+
{"current_steps": 791, "total_steps": 1200, "loss": 0.4295, "lr": 1.2561841123392266e-05, "epoch": 3.2958333333333334, "percentage": 65.92, "elapsed_time": "5:12:49", "remaining_time": "2:41:44"}
|
792 |
+
{"current_steps": 792, "total_steps": 1200, "loss": 0.4289, "lr": 1.250786813168176e-05, "epoch": 3.3, "percentage": 66.0, "elapsed_time": "5:13:12", "remaining_time": "2:41:21"}
|
793 |
+
{"current_steps": 793, "total_steps": 1200, "loss": 0.418, "lr": 1.2453958535312064e-05, "epoch": 3.3041666666666667, "percentage": 66.08, "elapsed_time": "5:13:35", "remaining_time": "2:40:56"}
|
794 |
+
{"current_steps": 794, "total_steps": 1200, "loss": 0.423, "lr": 1.2400112790444024e-05, "epoch": 3.3083333333333336, "percentage": 66.17, "elapsed_time": "5:13:58", "remaining_time": "2:40:32"}
|
795 |
+
{"current_steps": 795, "total_steps": 1200, "loss": 0.4415, "lr": 1.2346331352698206e-05, "epoch": 3.3125, "percentage": 66.25, "elapsed_time": "5:14:21", "remaining_time": "2:40:08"}
|
796 |
+
{"current_steps": 796, "total_steps": 1200, "loss": 0.44, "lr": 1.2292614677151038e-05, "epoch": 3.3166666666666664, "percentage": 66.33, "elapsed_time": "5:14:44", "remaining_time": "2:39:44"}
|
797 |
+
{"current_steps": 797, "total_steps": 1200, "loss": 0.4293, "lr": 1.2238963218330944e-05, "epoch": 3.3208333333333333, "percentage": 66.42, "elapsed_time": "5:15:07", "remaining_time": "2:39:20"}
|
798 |
+
{"current_steps": 798, "total_steps": 1200, "loss": 0.424, "lr": 1.218537743021453e-05, "epoch": 3.325, "percentage": 66.5, "elapsed_time": "5:15:29", "remaining_time": "2:38:55"}
|
799 |
+
{"current_steps": 799, "total_steps": 1200, "loss": 0.4257, "lr": 1.2131857766222703e-05, "epoch": 3.3291666666666666, "percentage": 66.58, "elapsed_time": "5:15:53", "remaining_time": "2:38:32"}
|
800 |
+
{"current_steps": 800, "total_steps": 1200, "loss": 0.4325, "lr": 1.2078404679216864e-05, "epoch": 3.3333333333333335, "percentage": 66.67, "elapsed_time": "5:16:16", "remaining_time": "2:38:08"}
|
801 |
+
{"current_steps": 801, "total_steps": 1200, "loss": 0.4223, "lr": 1.2025018621495077e-05, "epoch": 3.3375, "percentage": 66.75, "elapsed_time": "5:16:38", "remaining_time": "2:37:43"}
|
802 |
+
{"current_steps": 802, "total_steps": 1200, "loss": 0.4262, "lr": 1.1971700044788213e-05, "epoch": 3.341666666666667, "percentage": 66.83, "elapsed_time": "5:17:02", "remaining_time": "2:37:19"}
|
803 |
+
{"current_steps": 803, "total_steps": 1200, "loss": 0.434, "lr": 1.191844940025617e-05, "epoch": 3.345833333333333, "percentage": 66.92, "elapsed_time": "5:17:24", "remaining_time": "2:36:55"}
|
804 |
+
{"current_steps": 804, "total_steps": 1200, "loss": 0.4309, "lr": 1.1865267138484e-05, "epoch": 3.35, "percentage": 67.0, "elapsed_time": "5:17:48", "remaining_time": "2:36:32"}
|
805 |
+
{"current_steps": 805, "total_steps": 1200, "loss": 0.4369, "lr": 1.1812153709478149e-05, "epoch": 3.3541666666666665, "percentage": 67.08, "elapsed_time": "5:18:12", "remaining_time": "2:36:08"}
|
806 |
+
{"current_steps": 806, "total_steps": 1200, "loss": 0.4325, "lr": 1.1759109562662633e-05, "epoch": 3.3583333333333334, "percentage": 67.17, "elapsed_time": "5:18:34", "remaining_time": "2:35:44"}
|
807 |
+
{"current_steps": 807, "total_steps": 1200, "loss": 0.4351, "lr": 1.1706135146875224e-05, "epoch": 3.3625, "percentage": 67.25, "elapsed_time": "5:18:58", "remaining_time": "2:35:20"}
|
808 |
+
{"current_steps": 808, "total_steps": 1200, "loss": 0.4115, "lr": 1.1653230910363645e-05, "epoch": 3.3666666666666667, "percentage": 67.33, "elapsed_time": "5:19:22", "remaining_time": "2:34:56"}
|
809 |
+
{"current_steps": 809, "total_steps": 1200, "loss": 0.4041, "lr": 1.1600397300781811e-05, "epoch": 3.3708333333333336, "percentage": 67.42, "elapsed_time": "5:19:45", "remaining_time": "2:34:32"}
|
810 |
+
{"current_steps": 810, "total_steps": 1200, "loss": 0.4322, "lr": 1.1547634765186016e-05, "epoch": 3.375, "percentage": 67.5, "elapsed_time": "5:20:11", "remaining_time": "2:34:09"}
|
811 |
+
{"current_steps": 811, "total_steps": 1200, "loss": 0.4313, "lr": 1.1494943750031144e-05, "epoch": 3.3791666666666664, "percentage": 67.58, "elapsed_time": "5:20:34", "remaining_time": "2:33:46"}
|
812 |
+
{"current_steps": 812, "total_steps": 1200, "loss": 0.4216, "lr": 1.144232470116692e-05, "epoch": 3.3833333333333333, "percentage": 67.67, "elapsed_time": "5:20:58", "remaining_time": "2:33:22"}
|
813 |
+
{"current_steps": 813, "total_steps": 1200, "loss": 0.431, "lr": 1.1389778063834094e-05, "epoch": 3.3875, "percentage": 67.75, "elapsed_time": "5:21:21", "remaining_time": "2:32:58"}
|
814 |
+
{"current_steps": 814, "total_steps": 1200, "loss": 0.4521, "lr": 1.1337304282660746e-05, "epoch": 3.3916666666666666, "percentage": 67.83, "elapsed_time": "5:21:45", "remaining_time": "2:32:34"}
|
815 |
+
{"current_steps": 815, "total_steps": 1200, "loss": 0.437, "lr": 1.1284903801658418e-05, "epoch": 3.3958333333333335, "percentage": 67.92, "elapsed_time": "5:22:09", "remaining_time": "2:32:10"}
|
816 |
+
{"current_steps": 816, "total_steps": 1200, "loss": 0.4372, "lr": 1.123257706421845e-05, "epoch": 3.4, "percentage": 68.0, "elapsed_time": "5:22:32", "remaining_time": "2:31:47"}
|
817 |
+
{"current_steps": 817, "total_steps": 1200, "loss": 0.448, "lr": 1.1180324513108203e-05, "epoch": 3.404166666666667, "percentage": 68.08, "elapsed_time": "5:22:56", "remaining_time": "2:31:23"}
|
818 |
+
{"current_steps": 818, "total_steps": 1200, "loss": 0.4445, "lr": 1.112814659046729e-05, "epoch": 3.408333333333333, "percentage": 68.17, "elapsed_time": "5:23:20", "remaining_time": "2:30:59"}
|
819 |
+
{"current_steps": 819, "total_steps": 1200, "loss": 0.429, "lr": 1.1076043737803825e-05, "epoch": 3.4125, "percentage": 68.25, "elapsed_time": "5:23:45", "remaining_time": "2:30:36"}
|
820 |
+
{"current_steps": 820, "total_steps": 1200, "loss": 0.4517, "lr": 1.1024016395990758e-05, "epoch": 3.4166666666666665, "percentage": 68.33, "elapsed_time": "5:24:09", "remaining_time": "2:30:13"}
|
821 |
+
{"current_steps": 821, "total_steps": 1200, "loss": 0.4271, "lr": 1.0972065005262067e-05, "epoch": 3.4208333333333334, "percentage": 68.42, "elapsed_time": "5:24:31", "remaining_time": "2:29:48"}
|
822 |
+
{"current_steps": 822, "total_steps": 1200, "loss": 0.4173, "lr": 1.0920190005209066e-05, "epoch": 3.425, "percentage": 68.5, "elapsed_time": "5:24:55", "remaining_time": "2:29:24"}
|
823 |
+
{"current_steps": 823, "total_steps": 1200, "loss": 0.4364, "lr": 1.086839183477669e-05, "epoch": 3.4291666666666667, "percentage": 68.58, "elapsed_time": "5:25:18", "remaining_time": "2:29:00"}
|
824 |
+
{"current_steps": 824, "total_steps": 1200, "loss": 0.432, "lr": 1.0816670932259763e-05, "epoch": 3.4333333333333336, "percentage": 68.67, "elapsed_time": "5:25:41", "remaining_time": "2:28:37"}
|
825 |
+
{"current_steps": 825, "total_steps": 1200, "loss": 0.4209, "lr": 1.0765027735299327e-05, "epoch": 3.4375, "percentage": 68.75, "elapsed_time": "5:26:05", "remaining_time": "2:28:13"}
|
826 |
+
{"current_steps": 826, "total_steps": 1200, "loss": 0.4218, "lr": 1.0713462680878864e-05, "epoch": 3.4416666666666664, "percentage": 68.83, "elapsed_time": "5:26:28", "remaining_time": "2:27:49"}
|
827 |
+
{"current_steps": 827, "total_steps": 1200, "loss": 0.4343, "lr": 1.066197620532068e-05, "epoch": 3.4458333333333333, "percentage": 68.92, "elapsed_time": "5:26:52", "remaining_time": "2:27:25"}
|
828 |
+
{"current_steps": 828, "total_steps": 1200, "loss": 0.4268, "lr": 1.061056874428219e-05, "epoch": 3.45, "percentage": 69.0, "elapsed_time": "5:27:15", "remaining_time": "2:27:01"}
|
829 |
+
{"current_steps": 829, "total_steps": 1200, "loss": 0.4262, "lr": 1.055924073275218e-05, "epoch": 3.4541666666666666, "percentage": 69.08, "elapsed_time": "5:27:38", "remaining_time": "2:26:37"}
|
830 |
+
{"current_steps": 830, "total_steps": 1200, "loss": 0.4351, "lr": 1.0507992605047193e-05, "epoch": 3.4583333333333335, "percentage": 69.17, "elapsed_time": "5:28:02", "remaining_time": "2:26:13"}
|
831 |
+
{"current_steps": 831, "total_steps": 1200, "loss": 0.4159, "lr": 1.0456824794807832e-05, "epoch": 3.4625, "percentage": 69.25, "elapsed_time": "5:28:24", "remaining_time": "2:25:49"}
|
832 |
+
{"current_steps": 832, "total_steps": 1200, "loss": 0.417, "lr": 1.0405737734995083e-05, "epoch": 3.466666666666667, "percentage": 69.33, "elapsed_time": "5:28:47", "remaining_time": "2:25:25"}
|
833 |
+
{"current_steps": 833, "total_steps": 1200, "loss": 0.4268, "lr": 1.0354731857886628e-05, "epoch": 3.470833333333333, "percentage": 69.42, "elapsed_time": "5:29:09", "remaining_time": "2:25:01"}
|
834 |
+
{"current_steps": 834, "total_steps": 1200, "loss": 0.4295, "lr": 1.0303807595073262e-05, "epoch": 3.475, "percentage": 69.5, "elapsed_time": "5:29:33", "remaining_time": "2:24:37"}
|
835 |
+
{"current_steps": 835, "total_steps": 1200, "loss": 0.4367, "lr": 1.0252965377455155e-05, "epoch": 3.4791666666666665, "percentage": 69.58, "elapsed_time": "5:29:56", "remaining_time": "2:24:13"}
|
836 |
+
{"current_steps": 836, "total_steps": 1200, "loss": 0.4212, "lr": 1.0202205635238263e-05, "epoch": 3.4833333333333334, "percentage": 69.67, "elapsed_time": "5:30:18", "remaining_time": "2:23:49"}
|
837 |
+
{"current_steps": 837, "total_steps": 1200, "loss": 0.428, "lr": 1.0151528797930662e-05, "epoch": 3.4875, "percentage": 69.75, "elapsed_time": "5:30:41", "remaining_time": "2:23:25"}
|
838 |
+
{"current_steps": 838, "total_steps": 1200, "loss": 0.4333, "lr": 1.010093529433892e-05, "epoch": 3.4916666666666667, "percentage": 69.83, "elapsed_time": "5:31:04", "remaining_time": "2:23:01"}
|
839 |
+
{"current_steps": 839, "total_steps": 1200, "loss": 0.444, "lr": 1.0050425552564475e-05, "epoch": 3.4958333333333336, "percentage": 69.92, "elapsed_time": "5:31:28", "remaining_time": "2:22:37"}
|
840 |
+
{"current_steps": 840, "total_steps": 1200, "loss": 0.4275, "lr": 1.0000000000000006e-05, "epoch": 3.5, "percentage": 70.0, "elapsed_time": "5:31:51", "remaining_time": "2:22:13"}
|
841 |
+
{"current_steps": 841, "total_steps": 1200, "loss": 0.4354, "lr": 9.949659063325801e-06, "epoch": 3.5041666666666664, "percentage": 70.08, "elapsed_time": "5:32:14", "remaining_time": "2:21:49"}
|
842 |
+
{"current_steps": 842, "total_steps": 1200, "loss": 0.425, "lr": 9.899403168506206e-06, "epoch": 3.5083333333333333, "percentage": 70.17, "elapsed_time": "5:32:37", "remaining_time": "2:21:25"}
|
843 |
+
{"current_steps": 843, "total_steps": 1200, "loss": 0.4165, "lr": 9.849232740785923e-06, "epoch": 3.5125, "percentage": 70.25, "elapsed_time": "5:33:00", "remaining_time": "2:21:01"}
|
844 |
+
{"current_steps": 844, "total_steps": 1200, "loss": 0.4222, "lr": 9.799148204686495e-06, "epoch": 3.5166666666666666, "percentage": 70.33, "elapsed_time": "5:33:24", "remaining_time": "2:20:38"}
|
845 |
+
{"current_steps": 845, "total_steps": 1200, "loss": 0.4313, "lr": 9.749149984002697e-06, "epoch": 3.5208333333333335, "percentage": 70.42, "elapsed_time": "5:33:47", "remaining_time": "2:20:14"}
|
846 |
+
{"current_steps": 846, "total_steps": 1200, "loss": 0.4349, "lr": 9.699238501798916e-06, "epoch": 3.525, "percentage": 70.5, "elapsed_time": "5:34:10", "remaining_time": "2:19:50"}
|
847 |
+
{"current_steps": 847, "total_steps": 1200, "loss": 0.4308, "lr": 9.649414180405605e-06, "epoch": 3.529166666666667, "percentage": 70.58, "elapsed_time": "5:34:34", "remaining_time": "2:19:26"}
|
848 |
+
{"current_steps": 848, "total_steps": 1200, "loss": 0.4305, "lr": 9.599677441415694e-06, "epoch": 3.533333333333333, "percentage": 70.67, "elapsed_time": "5:34:58", "remaining_time": "2:19:02"}
|
849 |
+
{"current_steps": 849, "total_steps": 1200, "loss": 0.4181, "lr": 9.550028705681024e-06, "epoch": 3.5375, "percentage": 70.75, "elapsed_time": "5:35:21", "remaining_time": "2:18:38"}
|
850 |
+
{"current_steps": 850, "total_steps": 1200, "loss": 0.4336, "lr": 9.5004683933088e-06, "epoch": 3.5416666666666665, "percentage": 70.83, "elapsed_time": "5:35:46", "remaining_time": "2:18:15"}
|
851 |
+
{"current_steps": 851, "total_steps": 1200, "loss": 0.424, "lr": 9.450996923658011e-06, "epoch": 3.5458333333333334, "percentage": 70.92, "elapsed_time": "5:36:08", "remaining_time": "2:17:51"}
|
852 |
+
{"current_steps": 852, "total_steps": 1200, "loss": 0.4414, "lr": 9.401614715335905e-06, "epoch": 3.55, "percentage": 71.0, "elapsed_time": "5:36:31", "remaining_time": "2:17:27"}
|
853 |
+
{"current_steps": 853, "total_steps": 1200, "loss": 0.4207, "lr": 9.352322186194434e-06, "epoch": 3.5541666666666667, "percentage": 71.08, "elapsed_time": "5:36:54", "remaining_time": "2:17:03"}
|
854 |
+
{"current_steps": 854, "total_steps": 1200, "loss": 0.4302, "lr": 9.30311975332672e-06, "epoch": 3.5583333333333336, "percentage": 71.17, "elapsed_time": "5:37:18", "remaining_time": "2:16:39"}
|
855 |
+
{"current_steps": 855, "total_steps": 1200, "loss": 0.4169, "lr": 9.254007833063521e-06, "epoch": 3.5625, "percentage": 71.25, "elapsed_time": "5:37:41", "remaining_time": "2:16:15"}
|
856 |
+
{"current_steps": 856, "total_steps": 1200, "loss": 0.4377, "lr": 9.204986840969749e-06, "epoch": 3.5666666666666664, "percentage": 71.33, "elapsed_time": "5:38:03", "remaining_time": "2:15:51"}
|
857 |
+
{"current_steps": 857, "total_steps": 1200, "loss": 0.4379, "lr": 9.15605719184086e-06, "epoch": 3.5708333333333333, "percentage": 71.42, "elapsed_time": "5:38:26", "remaining_time": "2:15:27"}
|
858 |
+
{"current_steps": 858, "total_steps": 1200, "loss": 0.4266, "lr": 9.107219299699459e-06, "epoch": 3.575, "percentage": 71.5, "elapsed_time": "5:38:49", "remaining_time": "2:15:03"}
|
859 |
+
{"current_steps": 859, "total_steps": 1200, "loss": 0.4213, "lr": 9.058473577791708e-06, "epoch": 3.5791666666666666, "percentage": 71.58, "elapsed_time": "5:39:12", "remaining_time": "2:14:39"}
|
860 |
+
{"current_steps": 860, "total_steps": 1200, "loss": 0.4235, "lr": 9.009820438583881e-06, "epoch": 3.5833333333333335, "percentage": 71.67, "elapsed_time": "5:39:35", "remaining_time": "2:14:15"}
|
861 |
+
{"current_steps": 861, "total_steps": 1200, "loss": 0.4254, "lr": 8.961260293758838e-06, "epoch": 3.5875, "percentage": 71.75, "elapsed_time": "5:39:59", "remaining_time": "2:13:51"}
|
862 |
+
{"current_steps": 862, "total_steps": 1200, "loss": 0.4277, "lr": 8.912793554212571e-06, "epoch": 3.591666666666667, "percentage": 71.83, "elapsed_time": "5:40:21", "remaining_time": "2:13:27"}
|
863 |
+
{"current_steps": 863, "total_steps": 1200, "loss": 0.4254, "lr": 8.864420630050713e-06, "epoch": 3.595833333333333, "percentage": 71.92, "elapsed_time": "5:40:44", "remaining_time": "2:13:03"}
|
864 |
+
{"current_steps": 864, "total_steps": 1200, "loss": 0.4348, "lr": 8.816141930585067e-06, "epoch": 3.6, "percentage": 72.0, "elapsed_time": "5:41:06", "remaining_time": "2:12:39"}
|
865 |
+
{"current_steps": 865, "total_steps": 1200, "loss": 0.423, "lr": 8.767957864330145e-06, "epoch": 3.6041666666666665, "percentage": 72.08, "elapsed_time": "5:41:29", "remaining_time": "2:12:15"}
|
866 |
+
{"current_steps": 866, "total_steps": 1200, "loss": 0.4223, "lr": 8.719868838999717e-06, "epoch": 3.6083333333333334, "percentage": 72.17, "elapsed_time": "5:41:52", "remaining_time": "2:11:51"}
|
867 |
+
{"current_steps": 867, "total_steps": 1200, "loss": 0.4177, "lr": 8.67187526150335e-06, "epoch": 3.6125, "percentage": 72.25, "elapsed_time": "5:42:15", "remaining_time": "2:11:27"}
|
868 |
+
{"current_steps": 868, "total_steps": 1200, "loss": 0.432, "lr": 8.623977537942969e-06, "epoch": 3.6166666666666667, "percentage": 72.33, "elapsed_time": "5:42:37", "remaining_time": "2:11:03"}
|
869 |
+
{"current_steps": 869, "total_steps": 1200, "loss": 0.4222, "lr": 8.576176073609425e-06, "epoch": 3.6208333333333336, "percentage": 72.42, "elapsed_time": "5:43:01", "remaining_time": "2:10:39"}
|
870 |
+
{"current_steps": 870, "total_steps": 1200, "loss": 0.4249, "lr": 8.528471272979083e-06, "epoch": 3.625, "percentage": 72.5, "elapsed_time": "5:43:23", "remaining_time": "2:10:15"}
|
871 |
+
{"current_steps": 871, "total_steps": 1200, "loss": 0.4339, "lr": 8.480863539710333e-06, "epoch": 3.6291666666666664, "percentage": 72.58, "elapsed_time": "5:43:47", "remaining_time": "2:09:51"}
|
872 |
+
{"current_steps": 872, "total_steps": 1200, "loss": 0.4245, "lr": 8.43335327664027e-06, "epoch": 3.6333333333333333, "percentage": 72.67, "elapsed_time": "5:44:09", "remaining_time": "2:09:27"}
|
873 |
+
{"current_steps": 873, "total_steps": 1200, "loss": 0.4611, "lr": 8.385940885781205e-06, "epoch": 3.6375, "percentage": 72.75, "elapsed_time": "5:44:33", "remaining_time": "2:09:03"}
|
874 |
+
{"current_steps": 874, "total_steps": 1200, "loss": 0.4273, "lr": 8.338626768317306e-06, "epoch": 3.6416666666666666, "percentage": 72.83, "elapsed_time": "5:44:57", "remaining_time": "2:08:39"}
|
875 |
+
{"current_steps": 875, "total_steps": 1200, "loss": 0.4035, "lr": 8.291411324601191e-06, "epoch": 3.6458333333333335, "percentage": 72.92, "elapsed_time": "5:45:20", "remaining_time": "2:08:16"}
|
876 |
+
{"current_steps": 876, "total_steps": 1200, "loss": 0.4294, "lr": 8.24429495415054e-06, "epoch": 3.65, "percentage": 73.0, "elapsed_time": "5:45:44", "remaining_time": "2:07:52"}
|
877 |
+
{"current_steps": 877, "total_steps": 1200, "loss": 0.4251, "lr": 8.197278055644715e-06, "epoch": 3.654166666666667, "percentage": 73.08, "elapsed_time": "5:46:06", "remaining_time": "2:07:28"}
|
878 |
+
{"current_steps": 878, "total_steps": 1200, "loss": 0.4321, "lr": 8.15036102692139e-06, "epoch": 3.658333333333333, "percentage": 73.17, "elapsed_time": "5:46:29", "remaining_time": "2:07:04"}
|
879 |
+
{"current_steps": 879, "total_steps": 1200, "loss": 0.4295, "lr": 8.103544264973178e-06, "epoch": 3.6625, "percentage": 73.25, "elapsed_time": "5:46:53", "remaining_time": "2:06:40"}
|
880 |
+
{"current_steps": 880, "total_steps": 1200, "loss": 0.4304, "lr": 8.056828165944282e-06, "epoch": 3.6666666666666665, "percentage": 73.33, "elapsed_time": "5:47:15", "remaining_time": "2:06:16"}
|
881 |
+
{"current_steps": 881, "total_steps": 1200, "loss": 0.4192, "lr": 8.010213125127128e-06, "epoch": 3.6708333333333334, "percentage": 73.42, "elapsed_time": "5:47:39", "remaining_time": "2:05:52"}
|
882 |
+
{"current_steps": 882, "total_steps": 1200, "loss": 0.4334, "lr": 7.963699536959032e-06, "epoch": 3.675, "percentage": 73.5, "elapsed_time": "5:48:02", "remaining_time": "2:05:29"}
|
883 |
+
{"current_steps": 883, "total_steps": 1200, "loss": 0.4464, "lr": 7.917287795018874e-06, "epoch": 3.6791666666666667, "percentage": 73.58, "elapsed_time": "5:48:26", "remaining_time": "2:05:05"}
|
884 |
+
{"current_steps": 884, "total_steps": 1200, "loss": 0.4391, "lr": 7.870978292023739e-06, "epoch": 3.6833333333333336, "percentage": 73.67, "elapsed_time": "5:48:50", "remaining_time": "2:04:41"}
|
885 |
+
{"current_steps": 885, "total_steps": 1200, "loss": 0.4327, "lr": 7.824771419825588e-06, "epoch": 3.6875, "percentage": 73.75, "elapsed_time": "5:49:13", "remaining_time": "2:04:18"}
|
886 |
+
{"current_steps": 886, "total_steps": 1200, "loss": 0.4364, "lr": 7.778667569408006e-06, "epoch": 3.6916666666666664, "percentage": 73.83, "elapsed_time": "5:49:36", "remaining_time": "2:03:54"}
|
887 |
+
{"current_steps": 887, "total_steps": 1200, "loss": 0.4414, "lr": 7.732667130882819e-06, "epoch": 3.6958333333333333, "percentage": 73.92, "elapsed_time": "5:49:59", "remaining_time": "2:03:30"}
|
888 |
+
{"current_steps": 888, "total_steps": 1200, "loss": 0.4397, "lr": 7.686770493486835e-06, "epoch": 3.7, "percentage": 74.0, "elapsed_time": "5:50:22", "remaining_time": "2:03:06"}
|
889 |
+
{"current_steps": 889, "total_steps": 1200, "loss": 0.4185, "lr": 7.640978045578538e-06, "epoch": 3.7041666666666666, "percentage": 74.08, "elapsed_time": "5:50:46", "remaining_time": "2:02:42"}
|
890 |
+
{"current_steps": 890, "total_steps": 1200, "loss": 0.4196, "lr": 7.595290174634802e-06, "epoch": 3.7083333333333335, "percentage": 74.17, "elapsed_time": "5:51:10", "remaining_time": "2:02:19"}
|
891 |
+
{"current_steps": 891, "total_steps": 1200, "loss": 0.4223, "lr": 7.549707267247612e-06, "epoch": 3.7125, "percentage": 74.25, "elapsed_time": "5:51:34", "remaining_time": "2:01:55"}
|
892 |
+
{"current_steps": 892, "total_steps": 1200, "loss": 0.4331, "lr": 7.504229709120801e-06, "epoch": 3.716666666666667, "percentage": 74.33, "elapsed_time": "5:51:57", "remaining_time": "2:01:31"}
|
893 |
+
{"current_steps": 893, "total_steps": 1200, "loss": 0.4293, "lr": 7.4588578850667634e-06, "epoch": 3.720833333333333, "percentage": 74.42, "elapsed_time": "5:52:20", "remaining_time": "2:01:07"}
|
894 |
+
{"current_steps": 894, "total_steps": 1200, "loss": 0.4328, "lr": 7.413592179003255e-06, "epoch": 3.725, "percentage": 74.5, "elapsed_time": "5:52:43", "remaining_time": "2:00:43"}
|
895 |
+
{"current_steps": 895, "total_steps": 1200, "loss": 0.4374, "lr": 7.368432973950053e-06, "epoch": 3.7291666666666665, "percentage": 74.58, "elapsed_time": "5:53:06", "remaining_time": "2:00:20"}
|
896 |
+
{"current_steps": 896, "total_steps": 1200, "loss": 0.4214, "lr": 7.323380652025794e-06, "epoch": 3.7333333333333334, "percentage": 74.67, "elapsed_time": "5:53:33", "remaining_time": "1:59:57"}
|
897 |
+
{"current_steps": 897, "total_steps": 1200, "loss": 0.43, "lr": 7.278435594444719e-06, "epoch": 3.7375, "percentage": 74.75, "elapsed_time": "5:53:57", "remaining_time": "1:59:33"}
|
898 |
+
{"current_steps": 898, "total_steps": 1200, "loss": 0.4115, "lr": 7.2335981815134415e-06, "epoch": 3.7416666666666667, "percentage": 74.83, "elapsed_time": "5:54:21", "remaining_time": "1:59:10"}
|
899 |
+
{"current_steps": 899, "total_steps": 1200, "loss": 0.4338, "lr": 7.1888687926276965e-06, "epoch": 3.7458333333333336, "percentage": 74.92, "elapsed_time": "5:54:44", "remaining_time": "1:58:46"}
|
900 |
+
{"current_steps": 900, "total_steps": 1200, "loss": 0.4365, "lr": 7.1442478062692135e-06, "epoch": 3.75, "percentage": 75.0, "elapsed_time": "5:55:06", "remaining_time": "1:58:22"}
|
901 |
+
{"current_steps": 901, "total_steps": 1200, "loss": 0.4277, "lr": 7.09973560000244e-06, "epoch": 3.7541666666666664, "percentage": 75.08, "elapsed_time": "5:55:30", "remaining_time": "1:57:58"}
|
902 |
+
{"current_steps": 902, "total_steps": 1200, "loss": 0.4257, "lr": 7.055332550471354e-06, "epoch": 3.7583333333333333, "percentage": 75.17, "elapsed_time": "5:55:53", "remaining_time": "1:57:34"}
|
903 |
+
{"current_steps": 903, "total_steps": 1200, "loss": 0.4346, "lr": 7.01103903339633e-06, "epoch": 3.7625, "percentage": 75.25, "elapsed_time": "5:56:17", "remaining_time": "1:57:10"}
|
904 |
+
{"current_steps": 904, "total_steps": 1200, "loss": 0.4261, "lr": 6.966855423570898e-06, "epoch": 3.7666666666666666, "percentage": 75.33, "elapsed_time": "5:56:39", "remaining_time": "1:56:46"}
|
905 |
+
{"current_steps": 905, "total_steps": 1200, "loss": 0.4227, "lr": 6.922782094858609e-06, "epoch": 3.7708333333333335, "percentage": 75.42, "elapsed_time": "5:57:03", "remaining_time": "1:56:23"}
|
906 |
+
{"current_steps": 906, "total_steps": 1200, "loss": 0.4283, "lr": 6.878819420189857e-06, "epoch": 3.775, "percentage": 75.5, "elapsed_time": "5:57:26", "remaining_time": "1:55:59"}
|
907 |
+
{"current_steps": 907, "total_steps": 1200, "loss": 0.4268, "lr": 6.834967771558722e-06, "epoch": 3.779166666666667, "percentage": 75.58, "elapsed_time": "5:57:49", "remaining_time": "1:55:35"}
|
908 |
+
{"current_steps": 908, "total_steps": 1200, "loss": 0.4179, "lr": 6.7912275200198496e-06, "epoch": 3.783333333333333, "percentage": 75.67, "elapsed_time": "5:58:12", "remaining_time": "1:55:11"}
|
909 |
+
{"current_steps": 909, "total_steps": 1200, "loss": 0.4276, "lr": 6.747599035685255e-06, "epoch": 3.7875, "percentage": 75.75, "elapsed_time": "5:58:35", "remaining_time": "1:54:47"}
|
910 |
+
{"current_steps": 910, "total_steps": 1200, "loss": 0.4103, "lr": 6.704082687721243e-06, "epoch": 3.7916666666666665, "percentage": 75.83, "elapsed_time": "5:58:57", "remaining_time": "1:54:23"}
|
911 |
+
{"current_steps": 911, "total_steps": 1200, "loss": 0.4278, "lr": 6.660678844345276e-06, "epoch": 3.7958333333333334, "percentage": 75.92, "elapsed_time": "5:59:20", "remaining_time": "1:53:59"}
|
912 |
+
{"current_steps": 912, "total_steps": 1200, "loss": 0.4394, "lr": 6.617387872822842e-06, "epoch": 3.8, "percentage": 76.0, "elapsed_time": "5:59:43", "remaining_time": "1:53:35"}
|
913 |
+
{"current_steps": 913, "total_steps": 1200, "loss": 0.4272, "lr": 6.57421013946433e-06, "epoch": 3.8041666666666667, "percentage": 76.08, "elapsed_time": "6:00:06", "remaining_time": "1:53:11"}
|
914 |
+
{"current_steps": 914, "total_steps": 1200, "loss": 0.4245, "lr": 6.531146009621994e-06, "epoch": 3.8083333333333336, "percentage": 76.17, "elapsed_time": "6:00:28", "remaining_time": "1:52:47"}
|
915 |
+
{"current_steps": 915, "total_steps": 1200, "loss": 0.4293, "lr": 6.488195847686795e-06, "epoch": 3.8125, "percentage": 76.25, "elapsed_time": "6:00:52", "remaining_time": "1:52:24"}
|
916 |
+
{"current_steps": 916, "total_steps": 1200, "loss": 0.4271, "lr": 6.445360017085356e-06, "epoch": 3.8166666666666664, "percentage": 76.33, "elapsed_time": "6:01:15", "remaining_time": "1:52:00"}
|
917 |
+
{"current_steps": 917, "total_steps": 1200, "loss": 0.4181, "lr": 6.402638880276868e-06, "epoch": 3.8208333333333333, "percentage": 76.42, "elapsed_time": "6:01:39", "remaining_time": "1:51:36"}
|
918 |
+
{"current_steps": 918, "total_steps": 1200, "loss": 0.4288, "lr": 6.360032798750033e-06, "epoch": 3.825, "percentage": 76.5, "elapsed_time": "6:02:02", "remaining_time": "1:51:12"}
|
919 |
+
{"current_steps": 919, "total_steps": 1200, "loss": 0.4369, "lr": 6.317542133020005e-06, "epoch": 3.8291666666666666, "percentage": 76.58, "elapsed_time": "6:02:25", "remaining_time": "1:50:49"}
|
920 |
+
{"current_steps": 920, "total_steps": 1200, "loss": 0.4305, "lr": 6.275167242625331e-06, "epoch": 3.8333333333333335, "percentage": 76.67, "elapsed_time": "6:02:49", "remaining_time": "1:50:25"}
|
921 |
+
{"current_steps": 921, "total_steps": 1200, "loss": 0.4298, "lr": 6.232908486124918e-06, "epoch": 3.8375, "percentage": 76.75, "elapsed_time": "6:03:12", "remaining_time": "1:50:01"}
|
922 |
+
{"current_steps": 922, "total_steps": 1200, "loss": 0.4209, "lr": 6.190766221095013e-06, "epoch": 3.841666666666667, "percentage": 76.83, "elapsed_time": "6:03:36", "remaining_time": "1:49:37"}
|
923 |
+
{"current_steps": 923, "total_steps": 1200, "loss": 0.4318, "lr": 6.148740804126121e-06, "epoch": 3.845833333333333, "percentage": 76.92, "elapsed_time": "6:03:59", "remaining_time": "1:49:14"}
|
924 |
+
{"current_steps": 924, "total_steps": 1200, "loss": 0.4278, "lr": 6.106832590820053e-06, "epoch": 3.85, "percentage": 77.0, "elapsed_time": "6:04:22", "remaining_time": "1:48:50"}
|
925 |
+
{"current_steps": 925, "total_steps": 1200, "loss": 0.4278, "lr": 6.065041935786906e-06, "epoch": 3.8541666666666665, "percentage": 77.08, "elapsed_time": "6:04:45", "remaining_time": "1:48:26"}
|
926 |
+
{"current_steps": 926, "total_steps": 1200, "loss": 0.4248, "lr": 6.023369192641999e-06, "epoch": 3.8583333333333334, "percentage": 77.17, "elapsed_time": "6:05:08", "remaining_time": "1:48:02"}
|
927 |
+
{"current_steps": 927, "total_steps": 1200, "loss": 0.43, "lr": 5.981814714002982e-06, "epoch": 3.8625, "percentage": 77.25, "elapsed_time": "6:05:32", "remaining_time": "1:47:39"}
|
928 |
+
{"current_steps": 928, "total_steps": 1200, "loss": 0.4237, "lr": 5.940378851486766e-06, "epoch": 3.8666666666666667, "percentage": 77.33, "elapsed_time": "6:05:55", "remaining_time": "1:47:15"}
|
929 |
+
{"current_steps": 929, "total_steps": 1200, "loss": 0.4277, "lr": 5.899061955706593e-06, "epoch": 3.8708333333333336, "percentage": 77.42, "elapsed_time": "6:06:18", "remaining_time": "1:46:51"}
|
930 |
+
{"current_steps": 930, "total_steps": 1200, "loss": 0.4254, "lr": 5.857864376269051e-06, "epoch": 3.875, "percentage": 77.5, "elapsed_time": "6:06:41", "remaining_time": "1:46:27"}
|
931 |
+
{"current_steps": 931, "total_steps": 1200, "loss": 0.4413, "lr": 5.816786461771129e-06, "epoch": 3.8791666666666664, "percentage": 77.58, "elapsed_time": "6:07:05", "remaining_time": "1:46:03"}
|
932 |
+
{"current_steps": 932, "total_steps": 1200, "loss": 0.419, "lr": 5.7758285597972585e-06, "epoch": 3.8833333333333333, "percentage": 77.67, "elapsed_time": "6:07:28", "remaining_time": "1:45:40"}
|
933 |
+
{"current_steps": 933, "total_steps": 1200, "loss": 0.4263, "lr": 5.734991016916372e-06, "epoch": 3.8875, "percentage": 77.75, "elapsed_time": "6:07:51", "remaining_time": "1:45:16"}
|
934 |
+
{"current_steps": 934, "total_steps": 1200, "loss": 0.428, "lr": 5.694274178678973e-06, "epoch": 3.8916666666666666, "percentage": 77.83, "elapsed_time": "6:08:15", "remaining_time": "1:44:52"}
|
935 |
+
{"current_steps": 935, "total_steps": 1200, "loss": 0.4297, "lr": 5.65367838961421e-06, "epoch": 3.8958333333333335, "percentage": 77.92, "elapsed_time": "6:08:39", "remaining_time": "1:44:29"}
|
936 |
+
{"current_steps": 936, "total_steps": 1200, "loss": 0.4234, "lr": 5.613203993226981e-06, "epoch": 3.9, "percentage": 78.0, "elapsed_time": "6:09:02", "remaining_time": "1:44:05"}
|
937 |
+
{"current_steps": 937, "total_steps": 1200, "loss": 0.427, "lr": 5.5728513319949725e-06, "epoch": 3.904166666666667, "percentage": 78.08, "elapsed_time": "6:09:25", "remaining_time": "1:43:41"}
|
938 |
+
{"current_steps": 938, "total_steps": 1200, "loss": 0.4224, "lr": 5.53262074736584e-06, "epoch": 3.908333333333333, "percentage": 78.17, "elapsed_time": "6:09:48", "remaining_time": "1:43:17"}
|
939 |
+
{"current_steps": 939, "total_steps": 1200, "loss": 0.4247, "lr": 5.492512579754252e-06, "epoch": 3.9125, "percentage": 78.25, "elapsed_time": "6:10:11", "remaining_time": "1:42:53"}
|
940 |
+
{"current_steps": 940, "total_steps": 1200, "loss": 0.4276, "lr": 5.452527168539026e-06, "epoch": 3.9166666666666665, "percentage": 78.33, "elapsed_time": "6:10:34", "remaining_time": "1:42:29"}
|
941 |
+
{"current_steps": 941, "total_steps": 1200, "loss": 0.4276, "lr": 5.412664852060294e-06, "epoch": 3.9208333333333334, "percentage": 78.42, "elapsed_time": "6:10:56", "remaining_time": "1:42:05"}
|
942 |
+
{"current_steps": 942, "total_steps": 1200, "loss": 0.4306, "lr": 5.372925967616591e-06, "epoch": 3.925, "percentage": 78.5, "elapsed_time": "6:11:18", "remaining_time": "1:41:41"}
|
943 |
+
{"current_steps": 943, "total_steps": 1200, "loss": 0.4333, "lr": 5.333310851462026e-06, "epoch": 3.9291666666666667, "percentage": 78.58, "elapsed_time": "6:11:41", "remaining_time": "1:41:17"}
|
944 |
+
{"current_steps": 944, "total_steps": 1200, "loss": 0.435, "lr": 5.293819838803429e-06, "epoch": 3.9333333333333336, "percentage": 78.67, "elapsed_time": "6:12:05", "remaining_time": "1:40:54"}
|
945 |
+
{"current_steps": 945, "total_steps": 1200, "loss": 0.4233, "lr": 5.254453263797521e-06, "epoch": 3.9375, "percentage": 78.75, "elapsed_time": "6:12:28", "remaining_time": "1:40:30"}
|
946 |
+
{"current_steps": 946, "total_steps": 1200, "loss": 0.4266, "lr": 5.215211459548082e-06, "epoch": 3.9416666666666664, "percentage": 78.83, "elapsed_time": "6:12:52", "remaining_time": "1:40:06"}
|
947 |
+
{"current_steps": 947, "total_steps": 1200, "loss": 0.4168, "lr": 5.17609475810313e-06, "epoch": 3.9458333333333333, "percentage": 78.92, "elapsed_time": "6:13:15", "remaining_time": "1:39:43"}
|
948 |
+
{"current_steps": 948, "total_steps": 1200, "loss": 0.4417, "lr": 5.137103490452113e-06, "epoch": 3.95, "percentage": 79.0, "elapsed_time": "6:13:39", "remaining_time": "1:39:19"}
|
949 |
+
{"current_steps": 949, "total_steps": 1200, "loss": 0.4159, "lr": 5.098237986523129e-06, "epoch": 3.9541666666666666, "percentage": 79.08, "elapsed_time": "6:14:02", "remaining_time": "1:38:55"}
|
950 |
+
{"current_steps": 950, "total_steps": 1200, "loss": 0.4222, "lr": 5.059498575180084e-06, "epoch": 3.9583333333333335, "percentage": 79.17, "elapsed_time": "6:14:26", "remaining_time": "1:38:32"}
|
951 |
+
{"current_steps": 951, "total_steps": 1200, "loss": 0.4249, "lr": 5.0208855842199565e-06, "epoch": 3.9625, "percentage": 79.25, "elapsed_time": "6:14:48", "remaining_time": "1:38:08"}
|
952 |
+
{"current_steps": 952, "total_steps": 1200, "loss": 0.402, "lr": 4.982399340370017e-06, "epoch": 3.966666666666667, "percentage": 79.33, "elapsed_time": "6:15:11", "remaining_time": "1:37:44"}
|
953 |
+
{"current_steps": 953, "total_steps": 1200, "loss": 0.4386, "lr": 4.944040169285043e-06, "epoch": 3.970833333333333, "percentage": 79.42, "elapsed_time": "6:15:34", "remaining_time": "1:37:20"}
|
954 |
+
{"current_steps": 954, "total_steps": 1200, "loss": 0.4287, "lr": 4.90580839554456e-06, "epoch": 3.975, "percentage": 79.5, "elapsed_time": "6:15:57", "remaining_time": "1:36:56"}
|
955 |
+
{"current_steps": 955, "total_steps": 1200, "loss": 0.4003, "lr": 4.867704342650143e-06, "epoch": 3.9791666666666665, "percentage": 79.58, "elapsed_time": "6:16:21", "remaining_time": "1:36:33"}
|
956 |
+
{"current_steps": 956, "total_steps": 1200, "loss": 0.4319, "lr": 4.829728333022623e-06, "epoch": 3.9833333333333334, "percentage": 79.67, "elapsed_time": "6:16:44", "remaining_time": "1:36:09"}
|
957 |
+
{"current_steps": 957, "total_steps": 1200, "loss": 0.4149, "lr": 4.791880687999382e-06, "epoch": 3.9875, "percentage": 79.75, "elapsed_time": "6:17:07", "remaining_time": "1:35:45"}
|
958 |
+
{"current_steps": 958, "total_steps": 1200, "loss": 0.4033, "lr": 4.754161727831643e-06, "epoch": 3.9916666666666667, "percentage": 79.83, "elapsed_time": "6:17:30", "remaining_time": "1:35:21"}
|
959 |
+
{"current_steps": 959, "total_steps": 1200, "loss": 0.4175, "lr": 4.716571771681737e-06, "epoch": 3.9958333333333336, "percentage": 79.92, "elapsed_time": "6:17:53", "remaining_time": "1:34:57"}
|
960 |
+
{"current_steps": 960, "total_steps": 1200, "loss": 0.4229, "lr": 4.679111137620442e-06, "epoch": 4.0, "percentage": 80.0, "elapsed_time": "6:18:15", "remaining_time": "1:34:33"}
|
961 |
+
{"current_steps": 961, "total_steps": 1200, "loss": 0.3881, "lr": 4.641780142624231e-06, "epoch": 4.004166666666666, "percentage": 80.08, "elapsed_time": "6:21:54", "remaining_time": "1:34:58"}
|
962 |
+
{"current_steps": 962, "total_steps": 1200, "loss": 0.4078, "lr": 4.604579102572641e-06, "epoch": 4.008333333333334, "percentage": 80.17, "elapsed_time": "6:22:18", "remaining_time": "1:34:34"}
|
963 |
+
{"current_steps": 963, "total_steps": 1200, "loss": 0.4066, "lr": 4.567508332245605e-06, "epoch": 4.0125, "percentage": 80.25, "elapsed_time": "6:22:41", "remaining_time": "1:34:10"}
|
964 |
+
{"current_steps": 964, "total_steps": 1200, "loss": 0.3988, "lr": 4.530568145320724e-06, "epoch": 4.016666666666667, "percentage": 80.33, "elapsed_time": "6:23:05", "remaining_time": "1:33:47"}
|
965 |
+
{"current_steps": 965, "total_steps": 1200, "loss": 0.3932, "lr": 4.493758854370682e-06, "epoch": 4.020833333333333, "percentage": 80.42, "elapsed_time": "6:23:27", "remaining_time": "1:33:22"}
|
966 |
+
{"current_steps": 966, "total_steps": 1200, "loss": 0.3679, "lr": 4.4570807708605825e-06, "epoch": 4.025, "percentage": 80.5, "elapsed_time": "6:23:50", "remaining_time": "1:32:58"}
|
967 |
+
{"current_steps": 967, "total_steps": 1200, "loss": 0.3851, "lr": 4.420534205145293e-06, "epoch": 4.029166666666667, "percentage": 80.58, "elapsed_time": "6:24:12", "remaining_time": "1:32:34"}
|
968 |
+
{"current_steps": 968, "total_steps": 1200, "loss": 0.3817, "lr": 4.384119466466816e-06, "epoch": 4.033333333333333, "percentage": 80.67, "elapsed_time": "6:24:36", "remaining_time": "1:32:10"}
|