Training in progress, epoch 3
Browse files
model-00001-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4877660776
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dad095630fb9cef750a6d69b8087a7d54100c780a07d4b1825a8495468dd0498
|
3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4932751008
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:51bad2c4120c5f6d191c187c5864145771780d79350c4be5797f2b41c3589cd7
|
3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4330865200
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4caaed04dd04ce5b73b2281049211fa1d3128a53d0100e32162e35bddc21895c
|
3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1089994880
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cdd63485ba0cbd72e48e0fb9846ff802d6441993d89e18e3c9a51f6d5ba993d2
|
3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
@@ -694,3 +694,225 @@
|
|
694 |
{"current_steps": 667, "total_steps": 1105, "loss": 1.116, "lr": 1.6292119893295567e-05, "epoch": 3.0169109357384443, "percentage": 60.36, "elapsed_time": "1:33:22", "remaining_time": "1:01:18"}
|
695 |
{"current_steps": 668, "total_steps": 1105, "loss": 1.0563, "lr": 1.6230023207179653e-05, "epoch": 3.0214205186020293, "percentage": 60.45, "elapsed_time": "1:33:46", "remaining_time": "1:01:20"}
|
696 |
{"current_steps": 669, "total_steps": 1105, "loss": 1.0638, "lr": 1.6167964179760954e-05, "epoch": 3.0259301014656144, "percentage": 60.54, "elapsed_time": "1:34:10", "remaining_time": "1:01:22"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
694 |
{"current_steps": 667, "total_steps": 1105, "loss": 1.116, "lr": 1.6292119893295567e-05, "epoch": 3.0169109357384443, "percentage": 60.36, "elapsed_time": "1:33:22", "remaining_time": "1:01:18"}
|
695 |
{"current_steps": 668, "total_steps": 1105, "loss": 1.0563, "lr": 1.6230023207179653e-05, "epoch": 3.0214205186020293, "percentage": 60.45, "elapsed_time": "1:33:46", "remaining_time": "1:01:20"}
|
696 |
{"current_steps": 669, "total_steps": 1105, "loss": 1.0638, "lr": 1.6167964179760954e-05, "epoch": 3.0259301014656144, "percentage": 60.54, "elapsed_time": "1:34:10", "remaining_time": "1:01:22"}
|
697 |
+
{"current_steps": 670, "total_steps": 1105, "loss": 1.0399, "lr": 1.6105943430953686e-05, "epoch": 3.0304396843291994, "percentage": 60.63, "elapsed_time": "1:34:34", "remaining_time": "1:01:24"}
|
698 |
+
{"current_steps": 671, "total_steps": 1105, "loss": 1.0728, "lr": 1.6043961580289656e-05, "epoch": 3.0349492671927845, "percentage": 60.72, "elapsed_time": "1:34:58", "remaining_time": "1:01:25"}
|
699 |
+
{"current_steps": 672, "total_steps": 1105, "loss": 1.0542, "lr": 1.5982019246912146e-05, "epoch": 3.03945885005637, "percentage": 60.81, "elapsed_time": "1:35:22", "remaining_time": "1:01:27"}
|
700 |
+
{"current_steps": 673, "total_steps": 1105, "loss": 1.0684, "lr": 1.5920117049569666e-05, "epoch": 3.043968432919955, "percentage": 60.9, "elapsed_time": "1:35:46", "remaining_time": "1:01:28"}
|
701 |
+
{"current_steps": 674, "total_steps": 1105, "loss": 1.0525, "lr": 1.585825560660983e-05, "epoch": 3.04847801578354, "percentage": 61.0, "elapsed_time": "1:36:10", "remaining_time": "1:01:30"}
|
702 |
+
{"current_steps": 675, "total_steps": 1105, "loss": 1.088, "lr": 1.5796435535973124e-05, "epoch": 3.052987598647125, "percentage": 61.09, "elapsed_time": "1:36:35", "remaining_time": "1:01:31"}
|
703 |
+
{"current_steps": 676, "total_steps": 1105, "loss": 1.0925, "lr": 1.5734657455186794e-05, "epoch": 3.05749718151071, "percentage": 61.18, "elapsed_time": "1:36:58", "remaining_time": "1:01:32"}
|
704 |
+
{"current_steps": 677, "total_steps": 1105, "loss": 1.0764, "lr": 1.5672921981358625e-05, "epoch": 3.062006764374295, "percentage": 61.27, "elapsed_time": "1:37:22", "remaining_time": "1:01:33"}
|
705 |
+
{"current_steps": 678, "total_steps": 1105, "loss": 1.0603, "lr": 1.5611229731170793e-05, "epoch": 3.0665163472378807, "percentage": 61.36, "elapsed_time": "1:37:47", "remaining_time": "1:01:35"}
|
706 |
+
{"current_steps": 679, "total_steps": 1105, "loss": 1.0888, "lr": 1.5549581320873715e-05, "epoch": 3.0710259301014657, "percentage": 61.45, "elapsed_time": "1:38:10", "remaining_time": "1:01:35"}
|
707 |
+
{"current_steps": 680, "total_steps": 1105, "loss": 1.0454, "lr": 1.5487977366279888e-05, "epoch": 3.075535512965051, "percentage": 61.54, "elapsed_time": "1:38:34", "remaining_time": "1:01:36"}
|
708 |
+
{"current_steps": 681, "total_steps": 1105, "loss": 1.0838, "lr": 1.5426418482757742e-05, "epoch": 3.080045095828636, "percentage": 61.63, "elapsed_time": "1:38:58", "remaining_time": "1:01:37"}
|
709 |
+
{"current_steps": 682, "total_steps": 1105, "loss": 1.09, "lr": 1.536490528522547e-05, "epoch": 3.084554678692221, "percentage": 61.72, "elapsed_time": "1:39:22", "remaining_time": "1:01:38"}
|
710 |
+
{"current_steps": 683, "total_steps": 1105, "loss": 1.0436, "lr": 1.530343838814492e-05, "epoch": 3.089064261555806, "percentage": 61.81, "elapsed_time": "1:39:46", "remaining_time": "1:01:38"}
|
711 |
+
{"current_steps": 684, "total_steps": 1105, "loss": 1.0667, "lr": 1.5242018405515438e-05, "epoch": 3.0935738444193914, "percentage": 61.9, "elapsed_time": "1:40:10", "remaining_time": "1:01:39"}
|
712 |
+
{"current_steps": 685, "total_steps": 1105, "loss": 1.0482, "lr": 1.5180645950867714e-05, "epoch": 3.0980834272829765, "percentage": 61.99, "elapsed_time": "1:40:34", "remaining_time": "1:01:40"}
|
713 |
+
{"current_steps": 686, "total_steps": 1105, "loss": 1.0888, "lr": 1.5119321637257711e-05, "epoch": 3.1025930101465615, "percentage": 62.08, "elapsed_time": "1:40:59", "remaining_time": "1:01:41"}
|
714 |
+
{"current_steps": 687, "total_steps": 1105, "loss": 1.088, "lr": 1.5058046077260477e-05, "epoch": 3.1071025930101466, "percentage": 62.17, "elapsed_time": "1:41:24", "remaining_time": "1:01:42"}
|
715 |
+
{"current_steps": 688, "total_steps": 1105, "loss": 1.0343, "lr": 1.499681988296408e-05, "epoch": 3.1116121758737316, "percentage": 62.26, "elapsed_time": "1:41:48", "remaining_time": "1:01:42"}
|
716 |
+
{"current_steps": 689, "total_steps": 1105, "loss": 1.0673, "lr": 1.493564366596344e-05, "epoch": 3.1161217587373167, "percentage": 62.35, "elapsed_time": "1:42:12", "remaining_time": "1:01:42"}
|
717 |
+
{"current_steps": 690, "total_steps": 1105, "loss": 1.0887, "lr": 1.4874518037354274e-05, "epoch": 3.1206313416009017, "percentage": 62.44, "elapsed_time": "1:42:36", "remaining_time": "1:01:42"}
|
718 |
+
{"current_steps": 691, "total_steps": 1105, "loss": 1.0574, "lr": 1.481344360772695e-05, "epoch": 3.125140924464487, "percentage": 62.53, "elapsed_time": "1:43:00", "remaining_time": "1:01:42"}
|
719 |
+
{"current_steps": 692, "total_steps": 1105, "loss": 1.0809, "lr": 1.4752420987160423e-05, "epoch": 3.1296505073280723, "percentage": 62.62, "elapsed_time": "1:43:24", "remaining_time": "1:01:42"}
|
720 |
+
{"current_steps": 693, "total_steps": 1105, "loss": 1.0943, "lr": 1.4691450785216095e-05, "epoch": 3.1341600901916573, "percentage": 62.71, "elapsed_time": "1:43:48", "remaining_time": "1:01:42"}
|
721 |
+
{"current_steps": 694, "total_steps": 1105, "loss": 1.0993, "lr": 1.4630533610931765e-05, "epoch": 3.1386696730552424, "percentage": 62.81, "elapsed_time": "1:44:12", "remaining_time": "1:01:43"}
|
722 |
+
{"current_steps": 695, "total_steps": 1105, "loss": 1.0353, "lr": 1.4569670072815552e-05, "epoch": 3.1431792559188274, "percentage": 62.9, "elapsed_time": "1:44:37", "remaining_time": "1:01:43"}
|
723 |
+
{"current_steps": 696, "total_steps": 1105, "loss": 1.0544, "lr": 1.450886077883976e-05, "epoch": 3.1476888387824125, "percentage": 62.99, "elapsed_time": "1:45:01", "remaining_time": "1:01:42"}
|
724 |
+
{"current_steps": 697, "total_steps": 1105, "loss": 1.0474, "lr": 1.444810633643488e-05, "epoch": 3.152198421645998, "percentage": 63.08, "elapsed_time": "1:45:25", "remaining_time": "1:01:42"}
|
725 |
+
{"current_steps": 698, "total_steps": 1105, "loss": 1.0767, "lr": 1.4387407352483452e-05, "epoch": 3.156708004509583, "percentage": 63.17, "elapsed_time": "1:45:48", "remaining_time": "1:01:41"}
|
726 |
+
{"current_steps": 699, "total_steps": 1105, "loss": 1.0993, "lr": 1.4326764433314066e-05, "epoch": 3.161217587373168, "percentage": 63.26, "elapsed_time": "1:46:13", "remaining_time": "1:01:41"}
|
727 |
+
{"current_steps": 700, "total_steps": 1105, "loss": 1.0832, "lr": 1.4266178184695253e-05, "epoch": 3.165727170236753, "percentage": 63.35, "elapsed_time": "1:46:37", "remaining_time": "1:01:41"}
|
728 |
+
{"current_steps": 701, "total_steps": 1105, "loss": 1.073, "lr": 1.4205649211829471e-05, "epoch": 3.170236753100338, "percentage": 63.44, "elapsed_time": "1:47:01", "remaining_time": "1:01:40"}
|
729 |
+
{"current_steps": 702, "total_steps": 1105, "loss": 1.0608, "lr": 1.4145178119347026e-05, "epoch": 3.174746335963923, "percentage": 63.53, "elapsed_time": "1:47:25", "remaining_time": "1:01:40"}
|
730 |
+
{"current_steps": 703, "total_steps": 1105, "loss": 1.0754, "lr": 1.4084765511300065e-05, "epoch": 3.1792559188275087, "percentage": 63.62, "elapsed_time": "1:47:49", "remaining_time": "1:01:39"}
|
731 |
+
{"current_steps": 704, "total_steps": 1105, "loss": 1.0505, "lr": 1.4024411991156534e-05, "epoch": 3.1837655016910937, "percentage": 63.71, "elapsed_time": "1:48:13", "remaining_time": "1:01:38"}
|
732 |
+
{"current_steps": 705, "total_steps": 1105, "loss": 1.0596, "lr": 1.3964118161794118e-05, "epoch": 3.188275084554679, "percentage": 63.8, "elapsed_time": "1:48:37", "remaining_time": "1:01:37"}
|
733 |
+
{"current_steps": 706, "total_steps": 1105, "loss": 1.0819, "lr": 1.390388462549427e-05, "epoch": 3.192784667418264, "percentage": 63.89, "elapsed_time": "1:49:01", "remaining_time": "1:01:37"}
|
734 |
+
{"current_steps": 707, "total_steps": 1105, "loss": 1.0698, "lr": 1.3843711983936156e-05, "epoch": 3.197294250281849, "percentage": 63.98, "elapsed_time": "1:49:25", "remaining_time": "1:01:35"}
|
735 |
+
{"current_steps": 708, "total_steps": 1105, "loss": 1.1177, "lr": 1.378360083819067e-05, "epoch": 3.201803833145434, "percentage": 64.07, "elapsed_time": "1:49:49", "remaining_time": "1:01:34"}
|
736 |
+
{"current_steps": 709, "total_steps": 1105, "loss": 1.0851, "lr": 1.3723551788714395e-05, "epoch": 3.206313416009019, "percentage": 64.16, "elapsed_time": "1:50:13", "remaining_time": "1:01:33"}
|
737 |
+
{"current_steps": 710, "total_steps": 1105, "loss": 1.0254, "lr": 1.3663565435343656e-05, "epoch": 3.2108229988726045, "percentage": 64.25, "elapsed_time": "1:50:37", "remaining_time": "1:01:32"}
|
738 |
+
{"current_steps": 711, "total_steps": 1105, "loss": 1.0893, "lr": 1.3603642377288485e-05, "epoch": 3.2153325817361895, "percentage": 64.34, "elapsed_time": "1:51:01", "remaining_time": "1:01:31"}
|
739 |
+
{"current_steps": 712, "total_steps": 1105, "loss": 1.1153, "lr": 1.3543783213126638e-05, "epoch": 3.2198421645997746, "percentage": 64.43, "elapsed_time": "1:51:26", "remaining_time": "1:01:30"}
|
740 |
+
{"current_steps": 713, "total_steps": 1105, "loss": 1.0859, "lr": 1.3483988540797652e-05, "epoch": 3.2243517474633596, "percentage": 64.52, "elapsed_time": "1:51:50", "remaining_time": "1:01:29"}
|
741 |
+
{"current_steps": 714, "total_steps": 1105, "loss": 1.1081, "lr": 1.3424258957596839e-05, "epoch": 3.2288613303269447, "percentage": 64.62, "elapsed_time": "1:52:14", "remaining_time": "1:01:27"}
|
742 |
+
{"current_steps": 715, "total_steps": 1105, "loss": 1.0498, "lr": 1.336459506016933e-05, "epoch": 3.2333709131905297, "percentage": 64.71, "elapsed_time": "1:52:38", "remaining_time": "1:01:26"}
|
743 |
+
{"current_steps": 716, "total_steps": 1105, "loss": 1.0548, "lr": 1.3304997444504099e-05, "epoch": 3.2378804960541148, "percentage": 64.8, "elapsed_time": "1:53:03", "remaining_time": "1:01:25"}
|
744 |
+
{"current_steps": 717, "total_steps": 1105, "loss": 1.0474, "lr": 1.3245466705928052e-05, "epoch": 3.2423900789177003, "percentage": 64.89, "elapsed_time": "1:53:27", "remaining_time": "1:01:23"}
|
745 |
+
{"current_steps": 718, "total_steps": 1105, "loss": 1.04, "lr": 1.3186003439100035e-05, "epoch": 3.2468996617812853, "percentage": 64.98, "elapsed_time": "1:53:51", "remaining_time": "1:01:22"}
|
746 |
+
{"current_steps": 719, "total_steps": 1105, "loss": 1.0746, "lr": 1.3126608238004904e-05, "epoch": 3.2514092446448704, "percentage": 65.07, "elapsed_time": "1:54:15", "remaining_time": "1:01:20"}
|
747 |
+
{"current_steps": 720, "total_steps": 1105, "loss": 1.0429, "lr": 1.3067281695947619e-05, "epoch": 3.2559188275084554, "percentage": 65.16, "elapsed_time": "1:54:39", "remaining_time": "1:01:18"}
|
748 |
+
{"current_steps": 721, "total_steps": 1105, "loss": 1.0721, "lr": 1.300802440554728e-05, "epoch": 3.2604284103720405, "percentage": 65.25, "elapsed_time": "1:55:03", "remaining_time": "1:01:16"}
|
749 |
+
{"current_steps": 722, "total_steps": 1105, "loss": 1.0751, "lr": 1.2948836958731245e-05, "epoch": 3.264937993235626, "percentage": 65.34, "elapsed_time": "1:55:27", "remaining_time": "1:01:15"}
|
750 |
+
{"current_steps": 723, "total_steps": 1105, "loss": 1.1017, "lr": 1.2889719946729176e-05, "epoch": 3.269447576099211, "percentage": 65.43, "elapsed_time": "1:55:51", "remaining_time": "1:01:12"}
|
751 |
+
{"current_steps": 724, "total_steps": 1105, "loss": 1.0906, "lr": 1.2830673960067173e-05, "epoch": 3.273957158962796, "percentage": 65.52, "elapsed_time": "1:56:15", "remaining_time": "1:01:10"}
|
752 |
+
{"current_steps": 725, "total_steps": 1105, "loss": 1.0721, "lr": 1.277169958856183e-05, "epoch": 3.278466741826381, "percentage": 65.61, "elapsed_time": "1:56:40", "remaining_time": "1:01:08"}
|
753 |
+
{"current_steps": 726, "total_steps": 1105, "loss": 1.0736, "lr": 1.2712797421314403e-05, "epoch": 3.282976324689966, "percentage": 65.7, "elapsed_time": "1:57:04", "remaining_time": "1:01:06"}
|
754 |
+
{"current_steps": 727, "total_steps": 1105, "loss": 1.0951, "lr": 1.265396804670487e-05, "epoch": 3.287485907553551, "percentage": 65.79, "elapsed_time": "1:57:28", "remaining_time": "1:01:04"}
|
755 |
+
{"current_steps": 728, "total_steps": 1105, "loss": 1.0484, "lr": 1.2595212052386073e-05, "epoch": 3.2919954904171362, "percentage": 65.88, "elapsed_time": "1:57:52", "remaining_time": "1:01:02"}
|
756 |
+
{"current_steps": 729, "total_steps": 1105, "loss": 1.0496, "lr": 1.2536530025277868e-05, "epoch": 3.2965050732807217, "percentage": 65.97, "elapsed_time": "1:58:16", "remaining_time": "1:01:00"}
|
757 |
+
{"current_steps": 730, "total_steps": 1105, "loss": 1.0515, "lr": 1.2477922551561226e-05, "epoch": 3.301014656144307, "percentage": 66.06, "elapsed_time": "1:58:40", "remaining_time": "1:00:57"}
|
758 |
+
{"current_steps": 731, "total_steps": 1105, "loss": 1.0632, "lr": 1.2419390216672421e-05, "epoch": 3.305524239007892, "percentage": 66.15, "elapsed_time": "1:59:04", "remaining_time": "1:00:55"}
|
759 |
+
{"current_steps": 732, "total_steps": 1105, "loss": 1.0279, "lr": 1.2360933605297128e-05, "epoch": 3.310033821871477, "percentage": 66.24, "elapsed_time": "1:59:28", "remaining_time": "1:00:52"}
|
760 |
+
{"current_steps": 733, "total_steps": 1105, "loss": 1.054, "lr": 1.2302553301364629e-05, "epoch": 3.314543404735062, "percentage": 66.33, "elapsed_time": "1:59:52", "remaining_time": "1:00:50"}
|
761 |
+
{"current_steps": 734, "total_steps": 1105, "loss": 1.0927, "lr": 1.2244249888041955e-05, "epoch": 3.319052987598647, "percentage": 66.43, "elapsed_time": "2:00:16", "remaining_time": "1:00:47"}
|
762 |
+
{"current_steps": 735, "total_steps": 1105, "loss": 1.0371, "lr": 1.218602394772809e-05, "epoch": 3.323562570462232, "percentage": 66.52, "elapsed_time": "2:00:40", "remaining_time": "1:00:44"}
|
763 |
+
{"current_steps": 736, "total_steps": 1105, "loss": 1.1787, "lr": 1.2127876062048096e-05, "epoch": 3.3280721533258175, "percentage": 66.61, "elapsed_time": "2:01:04", "remaining_time": "1:00:42"}
|
764 |
+
{"current_steps": 737, "total_steps": 1105, "loss": 1.0904, "lr": 1.2069806811847362e-05, "epoch": 3.3325817361894026, "percentage": 66.7, "elapsed_time": "2:01:28", "remaining_time": "1:00:39"}
|
765 |
+
{"current_steps": 738, "total_steps": 1105, "loss": 1.0964, "lr": 1.2011816777185785e-05, "epoch": 3.3370913190529876, "percentage": 66.79, "elapsed_time": "2:01:52", "remaining_time": "1:00:36"}
|
766 |
+
{"current_steps": 739, "total_steps": 1105, "loss": 1.0868, "lr": 1.1953906537331942e-05, "epoch": 3.3416009019165727, "percentage": 66.88, "elapsed_time": "2:02:16", "remaining_time": "1:00:33"}
|
767 |
+
{"current_steps": 740, "total_steps": 1105, "loss": 1.066, "lr": 1.1896076670757367e-05, "epoch": 3.3461104847801577, "percentage": 66.97, "elapsed_time": "2:02:40", "remaining_time": "1:00:30"}
|
768 |
+
{"current_steps": 741, "total_steps": 1105, "loss": 1.0535, "lr": 1.1838327755130701e-05, "epoch": 3.3506200676437428, "percentage": 67.06, "elapsed_time": "2:03:05", "remaining_time": "1:00:28"}
|
769 |
+
{"current_steps": 742, "total_steps": 1105, "loss": 1.0704, "lr": 1.1780660367311993e-05, "epoch": 3.3551296505073283, "percentage": 67.15, "elapsed_time": "2:03:30", "remaining_time": "1:00:25"}
|
770 |
+
{"current_steps": 743, "total_steps": 1105, "loss": 1.0786, "lr": 1.1723075083346873e-05, "epoch": 3.3596392333709133, "percentage": 67.24, "elapsed_time": "2:03:53", "remaining_time": "1:00:21"}
|
771 |
+
{"current_steps": 744, "total_steps": 1105, "loss": 1.069, "lr": 1.166557247846083e-05, "epoch": 3.3641488162344984, "percentage": 67.33, "elapsed_time": "2:04:17", "remaining_time": "1:00:18"}
|
772 |
+
{"current_steps": 745, "total_steps": 1105, "loss": 1.0971, "lr": 1.1608153127053487e-05, "epoch": 3.3686583990980834, "percentage": 67.42, "elapsed_time": "2:04:41", "remaining_time": "1:00:15"}
|
773 |
+
{"current_steps": 746, "total_steps": 1105, "loss": 1.0853, "lr": 1.1550817602692815e-05, "epoch": 3.3731679819616684, "percentage": 67.51, "elapsed_time": "2:05:05", "remaining_time": "1:00:11"}
|
774 |
+
{"current_steps": 747, "total_steps": 1105, "loss": 1.0992, "lr": 1.1493566478109441e-05, "epoch": 3.3776775648252535, "percentage": 67.6, "elapsed_time": "2:05:29", "remaining_time": "1:00:08"}
|
775 |
+
{"current_steps": 748, "total_steps": 1105, "loss": 1.0851, "lr": 1.1436400325190898e-05, "epoch": 3.382187147688839, "percentage": 67.69, "elapsed_time": "2:05:53", "remaining_time": "1:00:05"}
|
776 |
+
{"current_steps": 749, "total_steps": 1105, "loss": 1.0612, "lr": 1.1379319714975949e-05, "epoch": 3.386696730552424, "percentage": 67.78, "elapsed_time": "2:06:17", "remaining_time": "1:00:01"}
|
777 |
+
{"current_steps": 750, "total_steps": 1105, "loss": 1.0356, "lr": 1.132232521764884e-05, "epoch": 3.391206313416009, "percentage": 67.87, "elapsed_time": "2:06:41", "remaining_time": "0:59:58"}
|
778 |
+
{"current_steps": 751, "total_steps": 1105, "loss": 1.034, "lr": 1.1265417402533645e-05, "epoch": 3.395715896279594, "percentage": 67.96, "elapsed_time": "2:07:05", "remaining_time": "0:59:54"}
|
779 |
+
{"current_steps": 752, "total_steps": 1105, "loss": 1.0765, "lr": 1.120859683808856e-05, "epoch": 3.400225479143179, "percentage": 68.05, "elapsed_time": "2:07:31", "remaining_time": "0:59:51"}
|
780 |
+
{"current_steps": 753, "total_steps": 1105, "loss": 1.0675, "lr": 1.1151864091900199e-05, "epoch": 3.4047350620067642, "percentage": 68.14, "elapsed_time": "2:07:55", "remaining_time": "0:59:47"}
|
781 |
+
{"current_steps": 754, "total_steps": 1105, "loss": 1.0464, "lr": 1.1095219730677988e-05, "epoch": 3.4092446448703493, "percentage": 68.24, "elapsed_time": "2:08:18", "remaining_time": "0:59:44"}
|
782 |
+
{"current_steps": 755, "total_steps": 1105, "loss": 1.0826, "lr": 1.103866432024843e-05, "epoch": 3.4137542277339348, "percentage": 68.33, "elapsed_time": "2:08:44", "remaining_time": "0:59:40"}
|
783 |
+
{"current_steps": 756, "total_steps": 1105, "loss": 1.0735, "lr": 1.0982198425549526e-05, "epoch": 3.41826381059752, "percentage": 68.42, "elapsed_time": "2:09:07", "remaining_time": "0:59:36"}
|
784 |
+
{"current_steps": 757, "total_steps": 1105, "loss": 1.0447, "lr": 1.0925822610625052e-05, "epoch": 3.422773393461105, "percentage": 68.51, "elapsed_time": "2:09:32", "remaining_time": "0:59:32"}
|
785 |
+
{"current_steps": 758, "total_steps": 1105, "loss": 1.08, "lr": 1.0869537438619003e-05, "epoch": 3.42728297632469, "percentage": 68.6, "elapsed_time": "2:09:56", "remaining_time": "0:59:28"}
|
786 |
+
{"current_steps": 759, "total_steps": 1105, "loss": 1.073, "lr": 1.0813343471769917e-05, "epoch": 3.431792559188275, "percentage": 68.69, "elapsed_time": "2:10:19", "remaining_time": "0:59:24"}
|
787 |
+
{"current_steps": 760, "total_steps": 1105, "loss": 1.0719, "lr": 1.0757241271405285e-05, "epoch": 3.43630214205186, "percentage": 68.78, "elapsed_time": "2:10:43", "remaining_time": "0:59:20"}
|
788 |
+
{"current_steps": 761, "total_steps": 1105, "loss": 1.0486, "lr": 1.0701231397935921e-05, "epoch": 3.4408117249154455, "percentage": 68.87, "elapsed_time": "2:11:07", "remaining_time": "0:59:16"}
|
789 |
+
{"current_steps": 762, "total_steps": 1105, "loss": 1.0799, "lr": 1.0645314410850368e-05, "epoch": 3.4453213077790306, "percentage": 68.96, "elapsed_time": "2:11:31", "remaining_time": "0:59:12"}
|
790 |
+
{"current_steps": 763, "total_steps": 1105, "loss": 1.123, "lr": 1.0589490868709342e-05, "epoch": 3.4498308906426156, "percentage": 69.05, "elapsed_time": "2:11:54", "remaining_time": "0:59:07"}
|
791 |
+
{"current_steps": 764, "total_steps": 1105, "loss": 1.0659, "lr": 1.0533761329140106e-05, "epoch": 3.4543404735062007, "percentage": 69.14, "elapsed_time": "2:12:18", "remaining_time": "0:59:03"}
|
792 |
+
{"current_steps": 765, "total_steps": 1105, "loss": 1.0782, "lr": 1.0478126348830933e-05, "epoch": 3.4588500563697857, "percentage": 69.23, "elapsed_time": "2:12:42", "remaining_time": "0:58:58"}
|
793 |
+
{"current_steps": 766, "total_steps": 1105, "loss": 1.0813, "lr": 1.0422586483525528e-05, "epoch": 3.4633596392333708, "percentage": 69.32, "elapsed_time": "2:13:06", "remaining_time": "0:58:54"}
|
794 |
+
{"current_steps": 767, "total_steps": 1105, "loss": 1.1173, "lr": 1.0367142288017495e-05, "epoch": 3.4678692220969562, "percentage": 69.41, "elapsed_time": "2:13:30", "remaining_time": "0:58:50"}
|
795 |
+
{"current_steps": 768, "total_steps": 1105, "loss": 1.0558, "lr": 1.0311794316144756e-05, "epoch": 3.4723788049605413, "percentage": 69.5, "elapsed_time": "2:13:54", "remaining_time": "0:58:45"}
|
796 |
+
{"current_steps": 769, "total_steps": 1105, "loss": 1.0615, "lr": 1.0256543120784074e-05, "epoch": 3.4768883878241263, "percentage": 69.59, "elapsed_time": "2:14:18", "remaining_time": "0:58:41"}
|
797 |
+
{"current_steps": 770, "total_steps": 1105, "loss": 1.0584, "lr": 1.0201389253845475e-05, "epoch": 3.4813979706877114, "percentage": 69.68, "elapsed_time": "2:14:42", "remaining_time": "0:58:36"}
|
798 |
+
{"current_steps": 771, "total_steps": 1105, "loss": 1.0374, "lr": 1.0146333266266779e-05, "epoch": 3.4859075535512964, "percentage": 69.77, "elapsed_time": "2:15:06", "remaining_time": "0:58:31"}
|
799 |
+
{"current_steps": 772, "total_steps": 1105, "loss": 1.0712, "lr": 1.0091375708008084e-05, "epoch": 3.4904171364148815, "percentage": 69.86, "elapsed_time": "2:15:31", "remaining_time": "0:58:27"}
|
800 |
+
{"current_steps": 773, "total_steps": 1105, "loss": 1.1248, "lr": 1.003651712804624e-05, "epoch": 3.4949267192784665, "percentage": 69.95, "elapsed_time": "2:15:55", "remaining_time": "0:58:22"}
|
801 |
+
{"current_steps": 774, "total_steps": 1105, "loss": 1.0864, "lr": 9.981758074369422e-06, "epoch": 3.499436302142052, "percentage": 70.05, "elapsed_time": "2:16:20", "remaining_time": "0:58:18"}
|
802 |
+
{"current_steps": 775, "total_steps": 1105, "loss": 1.0892, "lr": 9.927099093971598e-06, "epoch": 3.503945885005637, "percentage": 70.14, "elapsed_time": "2:16:44", "remaining_time": "0:58:13"}
|
803 |
+
{"current_steps": 776, "total_steps": 1105, "loss": 1.067, "lr": 9.872540732847126e-06, "epoch": 3.508455467869222, "percentage": 70.23, "elapsed_time": "2:17:08", "remaining_time": "0:58:08"}
|
804 |
+
{"current_steps": 777, "total_steps": 1105, "loss": 1.0372, "lr": 9.81808353598524e-06, "epoch": 3.512965050732807, "percentage": 70.32, "elapsed_time": "2:17:32", "remaining_time": "0:58:03"}
|
805 |
+
{"current_steps": 778, "total_steps": 1105, "loss": 1.0768, "lr": 9.76372804736464e-06, "epoch": 3.5174746335963922, "percentage": 70.41, "elapsed_time": "2:17:55", "remaining_time": "0:57:58"}
|
806 |
+
{"current_steps": 779, "total_steps": 1105, "loss": 1.0651, "lr": 9.709474809948072e-06, "epoch": 3.5219842164599777, "percentage": 70.5, "elapsed_time": "2:18:19", "remaining_time": "0:57:53"}
|
807 |
+
{"current_steps": 780, "total_steps": 1105, "loss": 1.017, "lr": 9.655324365676845e-06, "epoch": 3.5264937993235623, "percentage": 70.59, "elapsed_time": "2:18:43", "remaining_time": "0:57:48"}
|
808 |
+
{"current_steps": 781, "total_steps": 1105, "loss": 1.0533, "lr": 9.601277255465502e-06, "epoch": 3.531003382187148, "percentage": 70.68, "elapsed_time": "2:19:08", "remaining_time": "0:57:43"}
|
809 |
+
{"current_steps": 782, "total_steps": 1105, "loss": 1.0956, "lr": 9.547334019196325e-06, "epoch": 3.535512965050733, "percentage": 70.77, "elapsed_time": "2:19:31", "remaining_time": "0:57:37"}
|
810 |
+
{"current_steps": 783, "total_steps": 1105, "loss": 1.0486, "lr": 9.493495195714028e-06, "epoch": 3.540022547914318, "percentage": 70.86, "elapsed_time": "2:19:55", "remaining_time": "0:57:32"}
|
811 |
+
{"current_steps": 784, "total_steps": 1105, "loss": 1.1089, "lr": 9.439761322820306e-06, "epoch": 3.544532130777903, "percentage": 70.95, "elapsed_time": "2:20:19", "remaining_time": "0:57:27"}
|
812 |
+
{"current_steps": 785, "total_steps": 1105, "loss": 1.0674, "lr": 9.386132937268506e-06, "epoch": 3.549041713641488, "percentage": 71.04, "elapsed_time": "2:20:43", "remaining_time": "0:57:21"}
|
813 |
+
{"current_steps": 786, "total_steps": 1105, "loss": 1.0855, "lr": 9.332610574758259e-06, "epoch": 3.5535512965050735, "percentage": 71.13, "elapsed_time": "2:21:07", "remaining_time": "0:57:16"}
|
814 |
+
{"current_steps": 787, "total_steps": 1105, "loss": 1.0352, "lr": 9.27919476993009e-06, "epoch": 3.5580608793686586, "percentage": 71.22, "elapsed_time": "2:21:31", "remaining_time": "0:57:11"}
|
815 |
+
{"current_steps": 788, "total_steps": 1105, "loss": 1.0722, "lr": 9.225886056360145e-06, "epoch": 3.5625704622322436, "percentage": 71.31, "elapsed_time": "2:21:55", "remaining_time": "0:57:05"}
|
816 |
+
{"current_steps": 789, "total_steps": 1105, "loss": 1.0818, "lr": 9.172684966554792e-06, "epoch": 3.5670800450958287, "percentage": 71.4, "elapsed_time": "2:22:19", "remaining_time": "0:57:00"}
|
817 |
+
{"current_steps": 790, "total_steps": 1105, "loss": 1.0651, "lr": 9.119592031945354e-06, "epoch": 3.5715896279594137, "percentage": 71.49, "elapsed_time": "2:22:43", "remaining_time": "0:56:54"}
|
818 |
+
{"current_steps": 791, "total_steps": 1105, "loss": 1.0291, "lr": 9.066607782882776e-06, "epoch": 3.5760992108229988, "percentage": 71.58, "elapsed_time": "2:23:07", "remaining_time": "0:56:48"}
|
819 |
+
{"current_steps": 792, "total_steps": 1105, "loss": 1.009, "lr": 9.013732748632338e-06, "epoch": 3.580608793686584, "percentage": 71.67, "elapsed_time": "2:23:31", "remaining_time": "0:56:43"}
|
820 |
+
{"current_steps": 793, "total_steps": 1105, "loss": 1.0517, "lr": 8.960967457368338e-06, "epoch": 3.5851183765501693, "percentage": 71.76, "elapsed_time": "2:23:55", "remaining_time": "0:56:37"}
|
821 |
+
{"current_steps": 794, "total_steps": 1105, "loss": 1.0757, "lr": 8.908312436168866e-06, "epoch": 3.5896279594137543, "percentage": 71.86, "elapsed_time": "2:24:18", "remaining_time": "0:56:31"}
|
822 |
+
{"current_steps": 795, "total_steps": 1105, "loss": 1.092, "lr": 8.855768211010503e-06, "epoch": 3.5941375422773394, "percentage": 71.95, "elapsed_time": "2:24:42", "remaining_time": "0:56:25"}
|
823 |
+
{"current_steps": 796, "total_steps": 1105, "loss": 1.0726, "lr": 8.803335306763065e-06, "epoch": 3.5986471251409244, "percentage": 72.04, "elapsed_time": "2:25:06", "remaining_time": "0:56:19"}
|
824 |
+
{"current_steps": 797, "total_steps": 1105, "loss": 1.088, "lr": 8.751014247184388e-06, "epoch": 3.6031567080045095, "percentage": 72.13, "elapsed_time": "2:25:31", "remaining_time": "0:56:14"}
|
825 |
+
{"current_steps": 798, "total_steps": 1105, "loss": 1.059, "lr": 8.698805554915074e-06, "epoch": 3.6076662908680945, "percentage": 72.22, "elapsed_time": "2:25:55", "remaining_time": "0:56:08"}
|
826 |
+
{"current_steps": 799, "total_steps": 1105, "loss": 1.0382, "lr": 8.646709751473288e-06, "epoch": 3.6121758737316796, "percentage": 72.31, "elapsed_time": "2:26:19", "remaining_time": "0:56:02"}
|
827 |
+
{"current_steps": 800, "total_steps": 1105, "loss": 1.0464, "lr": 8.594727357249506e-06, "epoch": 3.616685456595265, "percentage": 72.4, "elapsed_time": "2:26:43", "remaining_time": "0:55:56"}
|
828 |
+
{"current_steps": 801, "total_steps": 1105, "loss": 1.0706, "lr": 8.542858891501385e-06, "epoch": 3.62119503945885, "percentage": 72.49, "elapsed_time": "2:27:07", "remaining_time": "0:55:50"}
|
829 |
+
{"current_steps": 802, "total_steps": 1105, "loss": 1.0092, "lr": 8.491104872348506e-06, "epoch": 3.625704622322435, "percentage": 72.58, "elapsed_time": "2:27:31", "remaining_time": "0:55:44"}
|
830 |
+
{"current_steps": 803, "total_steps": 1105, "loss": 1.0812, "lr": 8.43946581676724e-06, "epoch": 3.6302142051860202, "percentage": 72.67, "elapsed_time": "2:27:55", "remaining_time": "0:55:37"}
|
831 |
+
{"current_steps": 804, "total_steps": 1105, "loss": 1.0498, "lr": 8.387942240585587e-06, "epoch": 3.6347237880496053, "percentage": 72.76, "elapsed_time": "2:28:19", "remaining_time": "0:55:31"}
|
832 |
+
{"current_steps": 805, "total_steps": 1105, "loss": 1.1054, "lr": 8.336534658478004e-06, "epoch": 3.6392333709131908, "percentage": 72.85, "elapsed_time": "2:28:43", "remaining_time": "0:55:25"}
|
833 |
+
{"current_steps": 806, "total_steps": 1105, "loss": 1.1096, "lr": 8.285243583960276e-06, "epoch": 3.6437429537767754, "percentage": 72.94, "elapsed_time": "2:29:06", "remaining_time": "0:55:19"}
|
834 |
+
{"current_steps": 807, "total_steps": 1105, "loss": 1.0884, "lr": 8.23406952938436e-06, "epoch": 3.648252536640361, "percentage": 73.03, "elapsed_time": "2:29:31", "remaining_time": "0:55:12"}
|
835 |
+
{"current_steps": 808, "total_steps": 1105, "loss": 1.0782, "lr": 8.18301300593332e-06, "epoch": 3.652762119503946, "percentage": 73.12, "elapsed_time": "2:29:55", "remaining_time": "0:55:06"}
|
836 |
+
{"current_steps": 809, "total_steps": 1105, "loss": 1.0923, "lr": 8.132074523616158e-06, "epoch": 3.657271702367531, "percentage": 73.21, "elapsed_time": "2:30:19", "remaining_time": "0:55:00"}
|
837 |
+
{"current_steps": 810, "total_steps": 1105, "loss": 1.1009, "lr": 8.08125459126278e-06, "epoch": 3.661781285231116, "percentage": 73.3, "elapsed_time": "2:30:43", "remaining_time": "0:54:53"}
|
838 |
+
{"current_steps": 811, "total_steps": 1105, "loss": 1.0776, "lr": 8.030553716518853e-06, "epoch": 3.666290868094701, "percentage": 73.39, "elapsed_time": "2:31:07", "remaining_time": "0:54:47"}
|
839 |
+
{"current_steps": 812, "total_steps": 1105, "loss": 1.0619, "lr": 7.979972405840795e-06, "epoch": 3.6708004509582866, "percentage": 73.48, "elapsed_time": "2:31:32", "remaining_time": "0:54:40"}
|
840 |
+
{"current_steps": 813, "total_steps": 1105, "loss": 1.1126, "lr": 7.92951116449067e-06, "epoch": 3.6753100338218716, "percentage": 73.57, "elapsed_time": "2:31:56", "remaining_time": "0:54:34"}
|
841 |
+
{"current_steps": 814, "total_steps": 1105, "loss": 1.0797, "lr": 7.879170496531153e-06, "epoch": 3.6798196166854567, "percentage": 73.67, "elapsed_time": "2:32:20", "remaining_time": "0:54:27"}
|
842 |
+
{"current_steps": 815, "total_steps": 1105, "loss": 1.0836, "lr": 7.828950904820514e-06, "epoch": 3.6843291995490417, "percentage": 73.76, "elapsed_time": "2:32:44", "remaining_time": "0:54:20"}
|
843 |
+
{"current_steps": 816, "total_steps": 1105, "loss": 1.0715, "lr": 7.778852891007559e-06, "epoch": 3.6888387824126267, "percentage": 73.85, "elapsed_time": "2:33:09", "remaining_time": "0:54:14"}
|
844 |
+
{"current_steps": 817, "total_steps": 1105, "loss": 1.0575, "lr": 7.728876955526654e-06, "epoch": 3.693348365276212, "percentage": 73.94, "elapsed_time": "2:33:32", "remaining_time": "0:54:07"}
|
845 |
+
{"current_steps": 818, "total_steps": 1105, "loss": 1.0581, "lr": 7.679023597592713e-06, "epoch": 3.697857948139797, "percentage": 74.03, "elapsed_time": "2:33:56", "remaining_time": "0:54:00"}
|
846 |
+
{"current_steps": 819, "total_steps": 1105, "loss": 1.0785, "lr": 7.629293315196209e-06, "epoch": 3.7023675310033823, "percentage": 74.12, "elapsed_time": "2:34:20", "remaining_time": "0:53:53"}
|
847 |
+
{"current_steps": 820, "total_steps": 1105, "loss": 1.0996, "lr": 7.579686605098193e-06, "epoch": 3.7068771138669674, "percentage": 74.21, "elapsed_time": "2:34:44", "remaining_time": "0:53:47"}
|
848 |
+
{"current_steps": 821, "total_steps": 1105, "loss": 1.0673, "lr": 7.530203962825331e-06, "epoch": 3.7113866967305524, "percentage": 74.3, "elapsed_time": "2:35:09", "remaining_time": "0:53:40"}
|
849 |
+
{"current_steps": 822, "total_steps": 1105, "loss": 1.0736, "lr": 7.4808458826649935e-06, "epoch": 3.7158962795941375, "percentage": 74.39, "elapsed_time": "2:35:33", "remaining_time": "0:53:33"}
|
850 |
+
{"current_steps": 823, "total_steps": 1105, "loss": 1.0832, "lr": 7.431612857660248e-06, "epoch": 3.7204058624577225, "percentage": 74.48, "elapsed_time": "2:35:57", "remaining_time": "0:53:26"}
|
851 |
+
{"current_steps": 824, "total_steps": 1105, "loss": 1.0435, "lr": 7.382505379605005e-06, "epoch": 3.724915445321308, "percentage": 74.57, "elapsed_time": "2:36:20", "remaining_time": "0:53:19"}
|
852 |
+
{"current_steps": 825, "total_steps": 1105, "loss": 1.0953, "lr": 7.333523939039057e-06, "epoch": 3.7294250281848926, "percentage": 74.66, "elapsed_time": "2:36:45", "remaining_time": "0:53:12"}
|
853 |
+
{"current_steps": 826, "total_steps": 1105, "loss": 1.0529, "lr": 7.28466902524321e-06, "epoch": 3.733934611048478, "percentage": 74.75, "elapsed_time": "2:37:09", "remaining_time": "0:53:05"}
|
854 |
+
{"current_steps": 827, "total_steps": 1105, "loss": 1.0584, "lr": 7.235941126234349e-06, "epoch": 3.738444193912063, "percentage": 74.84, "elapsed_time": "2:37:34", "remaining_time": "0:52:58"}
|
855 |
+
{"current_steps": 828, "total_steps": 1105, "loss": 1.0881, "lr": 7.187340728760632e-06, "epoch": 3.7429537767756482, "percentage": 74.93, "elapsed_time": "2:37:58", "remaining_time": "0:52:50"}
|
856 |
+
{"current_steps": 829, "total_steps": 1105, "loss": 1.1157, "lr": 7.138868318296566e-06, "epoch": 3.7474633596392333, "percentage": 75.02, "elapsed_time": "2:38:22", "remaining_time": "0:52:43"}
|
857 |
+
{"current_steps": 830, "total_steps": 1105, "loss": 1.0638, "lr": 7.090524379038184e-06, "epoch": 3.7519729425028183, "percentage": 75.11, "elapsed_time": "2:38:45", "remaining_time": "0:52:36"}
|
858 |
+
{"current_steps": 831, "total_steps": 1105, "loss": 1.0688, "lr": 7.042309393898219e-06, "epoch": 3.756482525366404, "percentage": 75.2, "elapsed_time": "2:39:09", "remaining_time": "0:52:28"}
|
859 |
+
{"current_steps": 832, "total_steps": 1105, "loss": 1.0273, "lr": 6.99422384450126e-06, "epoch": 3.760992108229989, "percentage": 75.29, "elapsed_time": "2:39:33", "remaining_time": "0:52:21"}
|
860 |
+
{"current_steps": 833, "total_steps": 1105, "loss": 1.066, "lr": 6.946268211178957e-06, "epoch": 3.765501691093574, "percentage": 75.38, "elapsed_time": "2:39:57", "remaining_time": "0:52:13"}
|
861 |
+
{"current_steps": 834, "total_steps": 1105, "loss": 1.064, "lr": 6.8984429729651935e-06, "epoch": 3.770011273957159, "percentage": 75.48, "elapsed_time": "2:40:21", "remaining_time": "0:52:06"}
|
862 |
+
{"current_steps": 835, "total_steps": 1105, "loss": 1.0259, "lr": 6.850748607591351e-06, "epoch": 3.774520856820744, "percentage": 75.57, "elapsed_time": "2:40:44", "remaining_time": "0:51:58"}
|
863 |
+
{"current_steps": 836, "total_steps": 1105, "loss": 1.0653, "lr": 6.803185591481478e-06, "epoch": 3.779030439684329, "percentage": 75.66, "elapsed_time": "2:41:09", "remaining_time": "0:51:51"}
|
864 |
+
{"current_steps": 837, "total_steps": 1105, "loss": 1.0816, "lr": 6.755754399747587e-06, "epoch": 3.783540022547914, "percentage": 75.75, "elapsed_time": "2:41:33", "remaining_time": "0:51:43"}
|
865 |
+
{"current_steps": 838, "total_steps": 1105, "loss": 1.1054, "lr": 6.708455506184875e-06, "epoch": 3.7880496054114996, "percentage": 75.84, "elapsed_time": "2:41:57", "remaining_time": "0:51:36"}
|
866 |
+
{"current_steps": 839, "total_steps": 1105, "loss": 1.0559, "lr": 6.661289383266984e-06, "epoch": 3.7925591882750846, "percentage": 75.93, "elapsed_time": "2:42:21", "remaining_time": "0:51:28"}
|
867 |
+
{"current_steps": 840, "total_steps": 1105, "loss": 1.0415, "lr": 6.614256502141325e-06, "epoch": 3.7970687711386697, "percentage": 76.02, "elapsed_time": "2:42:45", "remaining_time": "0:51:20"}
|
868 |
+
{"current_steps": 841, "total_steps": 1105, "loss": 1.0511, "lr": 6.567357332624309e-06, "epoch": 3.8015783540022547, "percentage": 76.11, "elapsed_time": "2:43:09", "remaining_time": "0:51:13"}
|
869 |
+
{"current_steps": 842, "total_steps": 1105, "loss": 1.0931, "lr": 6.520592343196716e-06, "epoch": 3.80608793686584, "percentage": 76.2, "elapsed_time": "2:43:33", "remaining_time": "0:51:05"}
|
870 |
+
{"current_steps": 843, "total_steps": 1105, "loss": 1.1137, "lr": 6.47396200099897e-06, "epoch": 3.8105975197294253, "percentage": 76.29, "elapsed_time": "2:43:58", "remaining_time": "0:50:57"}
|
871 |
+
{"current_steps": 844, "total_steps": 1105, "loss": 1.0804, "lr": 6.427466771826494e-06, "epoch": 3.81510710259301, "percentage": 76.38, "elapsed_time": "2:44:22", "remaining_time": "0:50:49"}
|
872 |
+
{"current_steps": 845, "total_steps": 1105, "loss": 1.1133, "lr": 6.381107120125063e-06, "epoch": 3.8196166854565954, "percentage": 76.47, "elapsed_time": "2:44:46", "remaining_time": "0:50:41"}
|
873 |
+
{"current_steps": 846, "total_steps": 1105, "loss": 1.0807, "lr": 6.334883508986132e-06, "epoch": 3.8241262683201804, "percentage": 76.56, "elapsed_time": "2:45:09", "remaining_time": "0:50:33"}
|
874 |
+
{"current_steps": 847, "total_steps": 1105, "loss": 1.0759, "lr": 6.288796400142256e-06, "epoch": 3.8286358511837655, "percentage": 76.65, "elapsed_time": "2:45:33", "remaining_time": "0:50:25"}
|
875 |
+
{"current_steps": 848, "total_steps": 1105, "loss": 1.0655, "lr": 6.242846253962433e-06, "epoch": 3.8331454340473505, "percentage": 76.74, "elapsed_time": "2:45:57", "remaining_time": "0:50:17"}
|
876 |
+
{"current_steps": 849, "total_steps": 1105, "loss": 1.0735, "lr": 6.197033529447551e-06, "epoch": 3.8376550169109356, "percentage": 76.83, "elapsed_time": "2:46:21", "remaining_time": "0:50:09"}
|
877 |
+
{"current_steps": 850, "total_steps": 1105, "loss": 1.0923, "lr": 6.1513586842257476e-06, "epoch": 3.842164599774521, "percentage": 76.92, "elapsed_time": "2:46:44", "remaining_time": "0:50:01"}
|
878 |
+
{"current_steps": 851, "total_steps": 1105, "loss": 1.1053, "lr": 6.1058221745478976e-06, "epoch": 3.846674182638106, "percentage": 77.01, "elapsed_time": "2:47:09", "remaining_time": "0:49:53"}
|
879 |
+
{"current_steps": 852, "total_steps": 1105, "loss": 1.0845, "lr": 6.060424455283011e-06, "epoch": 3.851183765501691, "percentage": 77.1, "elapsed_time": "2:47:33", "remaining_time": "0:49:45"}
|
880 |
+
{"current_steps": 853, "total_steps": 1105, "loss": 1.0836, "lr": 6.01516597991372e-06, "epoch": 3.855693348365276, "percentage": 77.19, "elapsed_time": "2:47:57", "remaining_time": "0:49:37"}
|
881 |
+
{"current_steps": 854, "total_steps": 1105, "loss": 1.0624, "lr": 5.970047200531719e-06, "epoch": 3.8602029312288613, "percentage": 77.29, "elapsed_time": "2:48:21", "remaining_time": "0:49:28"}
|
882 |
+
{"current_steps": 855, "total_steps": 1105, "loss": 1.0705, "lr": 5.925068567833263e-06, "epoch": 3.8647125140924463, "percentage": 77.38, "elapsed_time": "2:48:45", "remaining_time": "0:49:20"}
|
883 |
+
{"current_steps": 856, "total_steps": 1105, "loss": 1.0893, "lr": 5.88023053111469e-06, "epoch": 3.8692220969560314, "percentage": 77.47, "elapsed_time": "2:49:09", "remaining_time": "0:49:12"}
|
884 |
+
{"current_steps": 857, "total_steps": 1105, "loss": 1.0625, "lr": 5.835533538267875e-06, "epoch": 3.873731679819617, "percentage": 77.56, "elapsed_time": "2:49:33", "remaining_time": "0:49:04"}
|
885 |
+
{"current_steps": 858, "total_steps": 1105, "loss": 1.0677, "lr": 5.790978035775836e-06, "epoch": 3.878241262683202, "percentage": 77.65, "elapsed_time": "2:49:57", "remaining_time": "0:48:55"}
|
886 |
+
{"current_steps": 859, "total_steps": 1105, "loss": 1.0596, "lr": 5.746564468708183e-06, "epoch": 3.882750845546787, "percentage": 77.74, "elapsed_time": "2:50:21", "remaining_time": "0:48:47"}
|
887 |
+
{"current_steps": 860, "total_steps": 1105, "loss": 1.0699, "lr": 5.702293280716753e-06, "epoch": 3.887260428410372, "percentage": 77.83, "elapsed_time": "2:50:44", "remaining_time": "0:48:38"}
|
888 |
+
{"current_steps": 861, "total_steps": 1105, "loss": 1.0561, "lr": 5.6581649140311216e-06, "epoch": 3.891770011273957, "percentage": 77.92, "elapsed_time": "2:51:08", "remaining_time": "0:48:29"}
|
889 |
+
{"current_steps": 862, "total_steps": 1105, "loss": 1.068, "lr": 5.614179809454207e-06, "epoch": 3.8962795941375425, "percentage": 78.01, "elapsed_time": "2:51:32", "remaining_time": "0:48:21"}
|
890 |
+
{"current_steps": 863, "total_steps": 1105, "loss": 1.0508, "lr": 5.570338406357885e-06, "epoch": 3.900789177001127, "percentage": 78.1, "elapsed_time": "2:51:56", "remaining_time": "0:48:12"}
|
891 |
+
{"current_steps": 864, "total_steps": 1105, "loss": 1.0763, "lr": 5.526641142678568e-06, "epoch": 3.9052987598647126, "percentage": 78.19, "elapsed_time": "2:52:20", "remaining_time": "0:48:04"}
|
892 |
+
{"current_steps": 865, "total_steps": 1105, "loss": 1.0121, "lr": 5.483088454912855e-06, "epoch": 3.9098083427282977, "percentage": 78.28, "elapsed_time": "2:52:43", "remaining_time": "0:47:55"}
|
893 |
+
{"current_steps": 866, "total_steps": 1105, "loss": 1.0204, "lr": 5.439680778113141e-06, "epoch": 3.9143179255918827, "percentage": 78.37, "elapsed_time": "2:53:07", "remaining_time": "0:47:46"}
|
894 |
+
{"current_steps": 867, "total_steps": 1105, "loss": 1.038, "lr": 5.396418545883318e-06, "epoch": 3.918827508455468, "percentage": 78.46, "elapsed_time": "2:53:32", "remaining_time": "0:47:38"}
|
895 |
+
{"current_steps": 868, "total_steps": 1105, "loss": 1.0988, "lr": 5.35330219037439e-06, "epoch": 3.923337091319053, "percentage": 78.55, "elapsed_time": "2:53:56", "remaining_time": "0:47:29"}
|
896 |
+
{"current_steps": 869, "total_steps": 1105, "loss": 1.0501, "lr": 5.3103321422802075e-06, "epoch": 3.9278466741826383, "percentage": 78.64, "elapsed_time": "2:54:20", "remaining_time": "0:47:20"}
|
897 |
+
{"current_steps": 870, "total_steps": 1105, "loss": 1.0479, "lr": 5.267508830833121e-06, "epoch": 3.9323562570462234, "percentage": 78.73, "elapsed_time": "2:54:44", "remaining_time": "0:47:12"}
|
898 |
+
{"current_steps": 871, "total_steps": 1105, "loss": 1.0977, "lr": 5.224832683799721e-06, "epoch": 3.9368658399098084, "percentage": 78.82, "elapsed_time": "2:55:08", "remaining_time": "0:47:03"}
|
899 |
+
{"current_steps": 872, "total_steps": 1105, "loss": 1.0865, "lr": 5.182304127476568e-06, "epoch": 3.9413754227733935, "percentage": 78.91, "elapsed_time": "2:55:32", "remaining_time": "0:46:54"}
|
900 |
+
{"current_steps": 873, "total_steps": 1105, "loss": 1.0523, "lr": 5.1399235866859e-06, "epoch": 3.9458850056369785, "percentage": 79.0, "elapsed_time": "2:55:56", "remaining_time": "0:46:45"}
|
901 |
+
{"current_steps": 874, "total_steps": 1105, "loss": 1.0891, "lr": 5.097691484771434e-06, "epoch": 3.9503945885005636, "percentage": 79.1, "elapsed_time": "2:56:20", "remaining_time": "0:46:36"}
|
902 |
+
{"current_steps": 875, "total_steps": 1105, "loss": 1.0852, "lr": 5.055608243594097e-06, "epoch": 3.9549041713641486, "percentage": 79.19, "elapsed_time": "2:56:44", "remaining_time": "0:46:27"}
|
903 |
+
{"current_steps": 876, "total_steps": 1105, "loss": 1.0637, "lr": 5.01367428352785e-06, "epoch": 3.959413754227734, "percentage": 79.28, "elapsed_time": "2:57:08", "remaining_time": "0:46:18"}
|
904 |
+
{"current_steps": 877, "total_steps": 1105, "loss": 1.0631, "lr": 4.97189002345545e-06, "epoch": 3.963923337091319, "percentage": 79.37, "elapsed_time": "2:57:32", "remaining_time": "0:46:09"}
|
905 |
+
{"current_steps": 878, "total_steps": 1105, "loss": 1.0769, "lr": 4.930255880764294e-06, "epoch": 3.968432919954904, "percentage": 79.46, "elapsed_time": "2:57:56", "remaining_time": "0:46:00"}
|
906 |
+
{"current_steps": 879, "total_steps": 1105, "loss": 1.0705, "lr": 4.8887722713422526e-06, "epoch": 3.9729425028184893, "percentage": 79.55, "elapsed_time": "2:58:20", "remaining_time": "0:45:51"}
|
907 |
+
{"current_steps": 880, "total_steps": 1105, "loss": 1.0705, "lr": 4.847439609573475e-06, "epoch": 3.9774520856820743, "percentage": 79.64, "elapsed_time": "2:58:44", "remaining_time": "0:45:42"}
|
908 |
+
{"current_steps": 881, "total_steps": 1105, "loss": 1.0912, "lr": 4.806258308334306e-06, "epoch": 3.9819616685456594, "percentage": 79.73, "elapsed_time": "2:59:08", "remaining_time": "0:45:32"}
|
909 |
+
{"current_steps": 882, "total_steps": 1105, "loss": 1.0411, "lr": 4.765228778989113e-06, "epoch": 3.9864712514092444, "percentage": 79.82, "elapsed_time": "2:59:33", "remaining_time": "0:45:23"}
|
910 |
+
{"current_steps": 883, "total_steps": 1105, "loss": 1.0693, "lr": 4.724351431386211e-06, "epoch": 3.99098083427283, "percentage": 79.91, "elapsed_time": "2:59:57", "remaining_time": "0:45:14"}
|
911 |
+
{"current_steps": 884, "total_steps": 1105, "loss": 1.0555, "lr": 4.683626673853758e-06, "epoch": 3.995490417136415, "percentage": 80.0, "elapsed_time": "3:00:21", "remaining_time": "0:45:05"}
|
912 |
+
{"current_steps": 885, "total_steps": 1105, "loss": 1.0406, "lr": 4.643054913195666e-06, "epoch": 4.002254791431793, "percentage": 80.09, "elapsed_time": "3:03:27", "remaining_time": "0:45:36"}
|
913 |
+
{"current_steps": 886, "total_steps": 1105, "loss": 0.9927, "lr": 4.602636554687545e-06, "epoch": 4.006764374295377, "percentage": 80.18, "elapsed_time": "3:03:51", "remaining_time": "0:45:26"}
|
914 |
+
{"current_steps": 887, "total_steps": 1105, "loss": 1.0148, "lr": 4.5623720020726505e-06, "epoch": 4.011273957158963, "percentage": 80.27, "elapsed_time": "3:04:15", "remaining_time": "0:45:17"}
|
915 |
+
{"current_steps": 888, "total_steps": 1105, "loss": 0.9822, "lr": 4.5222616575578695e-06, "epoch": 4.015783540022548, "percentage": 80.36, "elapsed_time": "3:04:38", "remaining_time": "0:45:07"}
|
916 |
+
{"current_steps": 889, "total_steps": 1105, "loss": 1.0207, "lr": 4.482305921809669e-06, "epoch": 4.020293122886133, "percentage": 80.45, "elapsed_time": "3:05:02", "remaining_time": "0:44:57"}
|
917 |
+
{"current_steps": 890, "total_steps": 1105, "loss": 1.025, "lr": 4.442505193950129e-06, "epoch": 4.024802705749718, "percentage": 80.54, "elapsed_time": "3:05:27", "remaining_time": "0:44:47"}
|
918 |
+
{"current_steps": 891, "total_steps": 1105, "loss": 1.0192, "lr": 4.402859871552932e-06, "epoch": 4.029312288613303, "percentage": 80.63, "elapsed_time": "3:05:51", "remaining_time": "0:44:38"}
|