neginr commited on
Commit
8d556d6
·
verified ·
1 Parent(s): edeae45

Training in progress, epoch 4

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bf0c2794ab0fa726350553c2a9a6c471e3fe9e9af7c62f206edff6287d5a993c
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:af9ccd3044c2808f22c0e3da9f882399b4873fba119e662f86f939950732d586
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4921c5c8909ab409dd0b93009469f26723c514b7a1131f5378d383237b534db5
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9a001678faaae80088c14d188eae2c2cd0c2a05e5f12875b58842194a50323f8
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f109dd0bedc4215ccacc440dec1e303cf980f76f6d22de463da9ef80aaad8c07
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c320fac219f3868d7b2ab3a2bfe65fcec52e3474b386625bdf67c1cbbc93b075
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e9243f2e22d8de829fbb4337df4a3fd0f706873beab14e87acf44635d3a6af57
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0cd7cfb4a537b69058a6ecd057174a003a08b4416c32fed3be233a47d2b049c0
3
  size 1089994880
trainer_log.jsonl CHANGED
@@ -571,3 +571,146 @@
571
  {"current_steps": 571, "total_steps": 715, "loss": 0.3311, "lr": 9.498253328252023e-06, "epoch": 3.985645933014354, "percentage": 79.86, "elapsed_time": "15:50:38", "remaining_time": "3:59:44"}
572
  {"current_steps": 572, "total_steps": 715, "loss": 0.3316, "lr": 9.372184811749544e-06, "epoch": 3.9926054806437583, "percentage": 80.0, "elapsed_time": "15:52:17", "remaining_time": "3:58:04"}
573
  {"current_steps": 573, "total_steps": 715, "loss": 0.3252, "lr": 9.246847422467718e-06, "epoch": 4.003479773814702, "percentage": 80.14, "elapsed_time": "15:55:47", "remaining_time": "3:56:51"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
571
  {"current_steps": 571, "total_steps": 715, "loss": 0.3311, "lr": 9.498253328252023e-06, "epoch": 3.985645933014354, "percentage": 79.86, "elapsed_time": "15:50:38", "remaining_time": "3:59:44"}
572
  {"current_steps": 572, "total_steps": 715, "loss": 0.3316, "lr": 9.372184811749544e-06, "epoch": 3.9926054806437583, "percentage": 80.0, "elapsed_time": "15:52:17", "remaining_time": "3:58:04"}
573
  {"current_steps": 573, "total_steps": 715, "loss": 0.3252, "lr": 9.246847422467718e-06, "epoch": 4.003479773814702, "percentage": 80.14, "elapsed_time": "15:55:47", "remaining_time": "3:56:51"}
574
+ {"current_steps": 574, "total_steps": 715, "loss": 0.3121, "lr": 9.122244152378919e-06, "epoch": 4.010439321444106, "percentage": 80.28, "elapsed_time": "15:57:26", "remaining_time": "3:55:11"}
575
+ {"current_steps": 575, "total_steps": 715, "loss": 0.3038, "lr": 8.998377975931096e-06, "epoch": 4.01739886907351, "percentage": 80.42, "elapsed_time": "15:59:06", "remaining_time": "3:53:31"}
576
+ {"current_steps": 576, "total_steps": 715, "loss": 0.3086, "lr": 8.875251849976823e-06, "epoch": 4.024358416702914, "percentage": 80.56, "elapsed_time": "16:00:45", "remaining_time": "3:51:50"}
577
+ {"current_steps": 577, "total_steps": 715, "loss": 0.3109, "lr": 8.752868713702617e-06, "epoch": 4.0313179643323185, "percentage": 80.7, "elapsed_time": "16:02:24", "remaining_time": "3:50:10"}
578
+ {"current_steps": 578, "total_steps": 715, "loss": 0.3054, "lr": 8.63123148855888e-06, "epoch": 4.038277511961723, "percentage": 80.84, "elapsed_time": "16:04:03", "remaining_time": "3:48:30"}
579
+ {"current_steps": 579, "total_steps": 715, "loss": 0.3147, "lr": 8.510343078190075e-06, "epoch": 4.045237059591127, "percentage": 80.98, "elapsed_time": "16:05:42", "remaining_time": "3:46:50"}
580
+ {"current_steps": 580, "total_steps": 715, "loss": 0.3075, "lr": 8.39020636836545e-06, "epoch": 4.052196607220531, "percentage": 81.12, "elapsed_time": "16:07:22", "remaining_time": "3:45:09"}
581
+ {"current_steps": 581, "total_steps": 715, "loss": 0.3078, "lr": 8.270824226910163e-06, "epoch": 4.059156154849934, "percentage": 81.26, "elapsed_time": "16:09:01", "remaining_time": "3:43:29"}
582
+ {"current_steps": 582, "total_steps": 715, "loss": 0.3108, "lr": 8.152199503636819e-06, "epoch": 4.066115702479339, "percentage": 81.4, "elapsed_time": "16:10:41", "remaining_time": "3:41:49"}
583
+ {"current_steps": 583, "total_steps": 715, "loss": 0.3034, "lr": 8.034335030277406e-06, "epoch": 4.073075250108743, "percentage": 81.54, "elapsed_time": "16:12:20", "remaining_time": "3:40:09"}
584
+ {"current_steps": 584, "total_steps": 715, "loss": 0.3101, "lr": 7.917233620415716e-06, "epoch": 4.080034797738147, "percentage": 81.68, "elapsed_time": "16:13:59", "remaining_time": "3:38:28"}
585
+ {"current_steps": 585, "total_steps": 715, "loss": 0.3119, "lr": 7.800898069420203e-06, "epoch": 4.086994345367551, "percentage": 81.82, "elapsed_time": "16:15:39", "remaining_time": "3:36:48"}
586
+ {"current_steps": 586, "total_steps": 715, "loss": 0.3108, "lr": 7.685331154377254e-06, "epoch": 4.0939538929969554, "percentage": 81.96, "elapsed_time": "16:17:18", "remaining_time": "3:35:08"}
587
+ {"current_steps": 587, "total_steps": 715, "loss": 0.3116, "lr": 7.570535634024847e-06, "epoch": 4.10091344062636, "percentage": 82.1, "elapsed_time": "16:18:57", "remaining_time": "3:33:28"}
588
+ {"current_steps": 588, "total_steps": 715, "loss": 0.313, "lr": 7.456514248686737e-06, "epoch": 4.107872988255763, "percentage": 82.24, "elapsed_time": "16:20:36", "remaining_time": "3:31:47"}
589
+ {"current_steps": 589, "total_steps": 715, "loss": 0.3187, "lr": 7.343269720207051e-06, "epoch": 4.114832535885167, "percentage": 82.38, "elapsed_time": "16:22:15", "remaining_time": "3:30:07"}
590
+ {"current_steps": 590, "total_steps": 715, "loss": 0.3054, "lr": 7.2308047518852895e-06, "epoch": 4.121792083514571, "percentage": 82.52, "elapsed_time": "16:23:55", "remaining_time": "3:28:27"}
591
+ {"current_steps": 591, "total_steps": 715, "loss": 0.3094, "lr": 7.119122028411798e-06, "epoch": 4.128751631143976, "percentage": 82.66, "elapsed_time": "16:25:34", "remaining_time": "3:26:47"}
592
+ {"current_steps": 592, "total_steps": 715, "loss": 0.3149, "lr": 7.008224215803672e-06, "epoch": 4.13571117877338, "percentage": 82.8, "elapsed_time": "16:27:13", "remaining_time": "3:25:06"}
593
+ {"current_steps": 593, "total_steps": 715, "loss": 0.3101, "lr": 6.898113961341128e-06, "epoch": 4.142670726402784, "percentage": 82.94, "elapsed_time": "16:28:52", "remaining_time": "3:23:26"}
594
+ {"current_steps": 594, "total_steps": 715, "loss": 0.3052, "lr": 6.788793893504335e-06, "epoch": 4.149630274032188, "percentage": 83.08, "elapsed_time": "16:30:32", "remaining_time": "3:21:46"}
595
+ {"current_steps": 595, "total_steps": 715, "loss": 0.3096, "lr": 6.680266621910632e-06, "epoch": 4.156589821661592, "percentage": 83.22, "elapsed_time": "16:32:11", "remaining_time": "3:20:06"}
596
+ {"current_steps": 596, "total_steps": 715, "loss": 0.3137, "lr": 6.5725347372522204e-06, "epoch": 4.163549369290996, "percentage": 83.36, "elapsed_time": "16:33:50", "remaining_time": "3:18:26"}
597
+ {"current_steps": 597, "total_steps": 715, "loss": 0.3108, "lr": 6.465600811234356e-06, "epoch": 4.1705089169204, "percentage": 83.5, "elapsed_time": "16:35:29", "remaining_time": "3:16:45"}
598
+ {"current_steps": 598, "total_steps": 715, "loss": 0.3079, "lr": 6.3594673965139675e-06, "epoch": 4.177468464549804, "percentage": 83.64, "elapsed_time": "16:37:08", "remaining_time": "3:15:05"}
599
+ {"current_steps": 599, "total_steps": 715, "loss": 0.3063, "lr": 6.254137026638676e-06, "epoch": 4.184428012179208, "percentage": 83.78, "elapsed_time": "16:38:48", "remaining_time": "3:13:25"}
600
+ {"current_steps": 600, "total_steps": 715, "loss": 0.3067, "lr": 6.149612215986334e-06, "epoch": 4.1913875598086126, "percentage": 83.92, "elapsed_time": "16:40:27", "remaining_time": "3:11:45"}
601
+ {"current_steps": 601, "total_steps": 715, "loss": 0.3106, "lr": 6.045895459705042e-06, "epoch": 4.198347107438017, "percentage": 84.06, "elapsed_time": "16:42:06", "remaining_time": "3:10:05"}
602
+ {"current_steps": 602, "total_steps": 715, "loss": 0.3075, "lr": 5.94298923365352e-06, "epoch": 4.205306655067421, "percentage": 84.2, "elapsed_time": "16:43:45", "remaining_time": "3:08:24"}
603
+ {"current_steps": 603, "total_steps": 715, "loss": 0.3115, "lr": 5.840895994342068e-06, "epoch": 4.212266202696824, "percentage": 84.34, "elapsed_time": "16:45:25", "remaining_time": "3:06:44"}
604
+ {"current_steps": 604, "total_steps": 715, "loss": 0.3115, "lr": 5.7396181788738735e-06, "epoch": 4.2192257503262285, "percentage": 84.48, "elapsed_time": "16:47:04", "remaining_time": "3:05:04"}
605
+ {"current_steps": 605, "total_steps": 715, "loss": 0.3135, "lr": 5.639158204886861e-06, "epoch": 4.226185297955633, "percentage": 84.62, "elapsed_time": "16:48:43", "remaining_time": "3:03:24"}
606
+ {"current_steps": 606, "total_steps": 715, "loss": 0.3122, "lr": 5.539518470495991e-06, "epoch": 4.233144845585037, "percentage": 84.76, "elapsed_time": "16:50:23", "remaining_time": "3:01:44"}
607
+ {"current_steps": 607, "total_steps": 715, "loss": 0.3064, "lr": 5.440701354235995e-06, "epoch": 4.240104393214441, "percentage": 84.9, "elapsed_time": "16:52:02", "remaining_time": "3:00:03"}
608
+ {"current_steps": 608, "total_steps": 715, "loss": 0.3075, "lr": 5.3427092150045975e-06, "epoch": 4.247063940843845, "percentage": 85.03, "elapsed_time": "16:53:41", "remaining_time": "2:58:23"}
609
+ {"current_steps": 609, "total_steps": 715, "loss": 0.3094, "lr": 5.24554439200621e-06, "epoch": 4.2540234884732495, "percentage": 85.17, "elapsed_time": "16:55:20", "remaining_time": "2:56:43"}
610
+ {"current_steps": 610, "total_steps": 715, "loss": 0.3129, "lr": 5.149209204696073e-06, "epoch": 4.260983036102654, "percentage": 85.31, "elapsed_time": "16:57:00", "remaining_time": "2:55:03"}
611
+ {"current_steps": 611, "total_steps": 715, "loss": 0.3129, "lr": 5.05370595272495e-06, "epoch": 4.267942583732057, "percentage": 85.45, "elapsed_time": "16:58:39", "remaining_time": "2:53:23"}
612
+ {"current_steps": 612, "total_steps": 715, "loss": 0.3176, "lr": 4.959036915884134e-06, "epoch": 4.274902131361461, "percentage": 85.59, "elapsed_time": "17:00:18", "remaining_time": "2:51:43"}
613
+ {"current_steps": 613, "total_steps": 715, "loss": 0.3031, "lr": 4.865204354051129e-06, "epoch": 4.2818616789908654, "percentage": 85.73, "elapsed_time": "17:01:57", "remaining_time": "2:50:02"}
614
+ {"current_steps": 614, "total_steps": 715, "loss": 0.3083, "lr": 4.7722105071356065e-06, "epoch": 4.28882122662027, "percentage": 85.87, "elapsed_time": "17:03:36", "remaining_time": "2:48:22"}
615
+ {"current_steps": 615, "total_steps": 715, "loss": 0.3089, "lr": 4.68005759502602e-06, "epoch": 4.295780774249674, "percentage": 86.01, "elapsed_time": "17:05:16", "remaining_time": "2:46:42"}
616
+ {"current_steps": 616, "total_steps": 715, "loss": 0.3157, "lr": 4.588747817536563e-06, "epoch": 4.302740321879078, "percentage": 86.15, "elapsed_time": "17:06:55", "remaining_time": "2:45:02"}
617
+ {"current_steps": 617, "total_steps": 715, "loss": 0.3049, "lr": 4.498283354354654e-06, "epoch": 4.309699869508482, "percentage": 86.29, "elapsed_time": "17:08:34", "remaining_time": "2:43:22"}
618
+ {"current_steps": 618, "total_steps": 715, "loss": 0.3146, "lr": 4.408666364988938e-06, "epoch": 4.3166594171378865, "percentage": 86.43, "elapsed_time": "17:10:13", "remaining_time": "2:41:42"}
619
+ {"current_steps": 619, "total_steps": 715, "loss": 0.3121, "lr": 4.31989898871771e-06, "epoch": 4.32361896476729, "percentage": 86.57, "elapsed_time": "17:11:52", "remaining_time": "2:40:02"}
620
+ {"current_steps": 620, "total_steps": 715, "loss": 0.3056, "lr": 4.231983344537875e-06, "epoch": 4.330578512396694, "percentage": 86.71, "elapsed_time": "17:13:32", "remaining_time": "2:38:21"}
621
+ {"current_steps": 621, "total_steps": 715, "loss": 0.3092, "lr": 4.144921531114317e-06, "epoch": 4.337538060026098, "percentage": 86.85, "elapsed_time": "17:15:11", "remaining_time": "2:36:41"}
622
+ {"current_steps": 622, "total_steps": 715, "loss": 0.3087, "lr": 4.058715626729837e-06, "epoch": 4.344497607655502, "percentage": 86.99, "elapsed_time": "17:16:50", "remaining_time": "2:35:01"}
623
+ {"current_steps": 623, "total_steps": 715, "loss": 0.3124, "lr": 3.973367689235548e-06, "epoch": 4.351457155284907, "percentage": 87.13, "elapsed_time": "17:18:29", "remaining_time": "2:33:21"}
624
+ {"current_steps": 624, "total_steps": 715, "loss": 0.3097, "lr": 3.888879756001726e-06, "epoch": 4.358416702914311, "percentage": 87.27, "elapsed_time": "17:20:09", "remaining_time": "2:31:41"}
625
+ {"current_steps": 625, "total_steps": 715, "loss": 0.3082, "lr": 3.805253843869179e-06, "epoch": 4.365376250543715, "percentage": 87.41, "elapsed_time": "17:21:48", "remaining_time": "2:30:01"}
626
+ {"current_steps": 626, "total_steps": 715, "loss": 0.3172, "lr": 3.72249194910113e-06, "epoch": 4.372335798173118, "percentage": 87.55, "elapsed_time": "17:23:27", "remaining_time": "2:28:21"}
627
+ {"current_steps": 627, "total_steps": 715, "loss": 0.3082, "lr": 3.6405960473355183e-06, "epoch": 4.3792953458025226, "percentage": 87.69, "elapsed_time": "17:25:06", "remaining_time": "2:26:40"}
628
+ {"current_steps": 628, "total_steps": 715, "loss": 0.3098, "lr": 3.5595680935378972e-06, "epoch": 4.386254893431927, "percentage": 87.83, "elapsed_time": "17:26:46", "remaining_time": "2:25:00"}
629
+ {"current_steps": 629, "total_steps": 715, "loss": 0.3132, "lr": 3.4794100219546967e-06, "epoch": 4.393214441061331, "percentage": 87.97, "elapsed_time": "17:28:25", "remaining_time": "2:23:20"}
630
+ {"current_steps": 630, "total_steps": 715, "loss": 0.3057, "lr": 3.400123746067099e-06, "epoch": 4.400173988690735, "percentage": 88.11, "elapsed_time": "17:30:04", "remaining_time": "2:21:40"}
631
+ {"current_steps": 631, "total_steps": 715, "loss": 0.3092, "lr": 3.321711158545351e-06, "epoch": 4.407133536320139, "percentage": 88.25, "elapsed_time": "17:31:43", "remaining_time": "2:20:00"}
632
+ {"current_steps": 632, "total_steps": 715, "loss": 0.309, "lr": 3.2441741312036014e-06, "epoch": 4.414093083949544, "percentage": 88.39, "elapsed_time": "17:33:23", "remaining_time": "2:18:20"}
633
+ {"current_steps": 633, "total_steps": 715, "loss": 0.3105, "lr": 3.167514514955157e-06, "epoch": 4.421052631578947, "percentage": 88.53, "elapsed_time": "17:35:02", "remaining_time": "2:16:40"}
634
+ {"current_steps": 634, "total_steps": 715, "loss": 0.3071, "lr": 3.0917341397683633e-06, "epoch": 4.428012179208351, "percentage": 88.67, "elapsed_time": "17:36:41", "remaining_time": "2:15:00"}
635
+ {"current_steps": 635, "total_steps": 715, "loss": 0.3099, "lr": 3.0168348146228842e-06, "epoch": 4.434971726837755, "percentage": 88.81, "elapsed_time": "17:38:20", "remaining_time": "2:13:20"}
636
+ {"current_steps": 636, "total_steps": 715, "loss": 0.3102, "lr": 2.942818327466559e-06, "epoch": 4.4419312744671595, "percentage": 88.95, "elapsed_time": "17:39:59", "remaining_time": "2:11:39"}
637
+ {"current_steps": 637, "total_steps": 715, "loss": 0.3167, "lr": 2.8696864451726614e-06, "epoch": 4.448890822096564, "percentage": 89.09, "elapsed_time": "17:41:39", "remaining_time": "2:09:59"}
638
+ {"current_steps": 638, "total_steps": 715, "loss": 0.3076, "lr": 2.79744091349778e-06, "epoch": 4.455850369725968, "percentage": 89.23, "elapsed_time": "17:43:18", "remaining_time": "2:08:19"}
639
+ {"current_steps": 639, "total_steps": 715, "loss": 0.3124, "lr": 2.7260834570400986e-06, "epoch": 4.462809917355372, "percentage": 89.37, "elapsed_time": "17:44:57", "remaining_time": "2:06:39"}
640
+ {"current_steps": 640, "total_steps": 715, "loss": 0.3079, "lr": 2.6556157791982707e-06, "epoch": 4.469769464984776, "percentage": 89.51, "elapsed_time": "17:46:36", "remaining_time": "2:04:59"}
641
+ {"current_steps": 641, "total_steps": 715, "loss": 0.3047, "lr": 2.586039562130722e-06, "epoch": 4.4767290126141805, "percentage": 89.65, "elapsed_time": "17:48:15", "remaining_time": "2:03:19"}
642
+ {"current_steps": 642, "total_steps": 715, "loss": 0.3117, "lr": 2.5173564667155015e-06, "epoch": 4.483688560243584, "percentage": 89.79, "elapsed_time": "17:49:55", "remaining_time": "2:01:39"}
643
+ {"current_steps": 643, "total_steps": 715, "loss": 0.3086, "lr": 2.4495681325106535e-06, "epoch": 4.490648107872988, "percentage": 89.93, "elapsed_time": "17:51:34", "remaining_time": "1:59:59"}
644
+ {"current_steps": 644, "total_steps": 715, "loss": 0.3075, "lr": 2.3826761777150643e-06, "epoch": 4.497607655502392, "percentage": 90.07, "elapsed_time": "17:53:13", "remaining_time": "1:58:19"}
645
+ {"current_steps": 645, "total_steps": 715, "loss": 0.3116, "lr": 2.3166821991298384e-06, "epoch": 4.5045672031317965, "percentage": 90.21, "elapsed_time": "17:54:52", "remaining_time": "1:56:39"}
646
+ {"current_steps": 646, "total_steps": 715, "loss": 0.313, "lr": 2.2515877721201697e-06, "epoch": 4.511526750761201, "percentage": 90.35, "elapsed_time": "17:56:31", "remaining_time": "1:54:59"}
647
+ {"current_steps": 647, "total_steps": 715, "loss": 0.3097, "lr": 2.1873944505777447e-06, "epoch": 4.518486298390605, "percentage": 90.49, "elapsed_time": "17:58:10", "remaining_time": "1:53:19"}
648
+ {"current_steps": 648, "total_steps": 715, "loss": 0.3093, "lr": 2.124103766883661e-06, "epoch": 4.525445846020009, "percentage": 90.63, "elapsed_time": "17:59:50", "remaining_time": "1:51:38"}
649
+ {"current_steps": 649, "total_steps": 715, "loss": 0.3109, "lr": 2.0617172318718205e-06, "epoch": 4.532405393649412, "percentage": 90.77, "elapsed_time": "18:01:29", "remaining_time": "1:49:58"}
650
+ {"current_steps": 650, "total_steps": 715, "loss": 0.306, "lr": 2.000236334792871e-06, "epoch": 4.539364941278817, "percentage": 90.91, "elapsed_time": "18:03:08", "remaining_time": "1:48:18"}
651
+ {"current_steps": 651, "total_steps": 715, "loss": 0.308, "lr": 1.9396625432786866e-06, "epoch": 4.546324488908221, "percentage": 91.05, "elapsed_time": "18:04:47", "remaining_time": "1:46:38"}
652
+ {"current_steps": 652, "total_steps": 715, "loss": 0.3132, "lr": 1.879997303307297e-06, "epoch": 4.553284036537625, "percentage": 91.19, "elapsed_time": "18:06:27", "remaining_time": "1:44:58"}
653
+ {"current_steps": 653, "total_steps": 715, "loss": 0.312, "lr": 1.8212420391683761e-06, "epoch": 4.560243584167029, "percentage": 91.33, "elapsed_time": "18:08:06", "remaining_time": "1:43:18"}
654
+ {"current_steps": 654, "total_steps": 715, "loss": 0.3101, "lr": 1.7633981534292565e-06, "epoch": 4.5672031317964334, "percentage": 91.47, "elapsed_time": "18:09:45", "remaining_time": "1:41:38"}
655
+ {"current_steps": 655, "total_steps": 715, "loss": 0.3065, "lr": 1.7064670269014306e-06, "epoch": 4.574162679425838, "percentage": 91.61, "elapsed_time": "18:11:25", "remaining_time": "1:39:58"}
656
+ {"current_steps": 656, "total_steps": 715, "loss": 0.3083, "lr": 1.65045001860761e-06, "epoch": 4.581122227055241, "percentage": 91.75, "elapsed_time": "18:13:04", "remaining_time": "1:38:18"}
657
+ {"current_steps": 657, "total_steps": 715, "loss": 0.3129, "lr": 1.5953484657492734e-06, "epoch": 4.588081774684645, "percentage": 91.89, "elapsed_time": "18:14:43", "remaining_time": "1:36:38"}
658
+ {"current_steps": 658, "total_steps": 715, "loss": 0.3111, "lr": 1.5411636836747357e-06, "epoch": 4.595041322314049, "percentage": 92.03, "elapsed_time": "18:16:22", "remaining_time": "1:34:58"}
659
+ {"current_steps": 659, "total_steps": 715, "loss": 0.3151, "lr": 1.4878969658477505e-06, "epoch": 4.602000869943454, "percentage": 92.17, "elapsed_time": "18:18:02", "remaining_time": "1:33:18"}
660
+ {"current_steps": 660, "total_steps": 715, "loss": 0.3081, "lr": 1.435549583816669e-06, "epoch": 4.608960417572858, "percentage": 92.31, "elapsed_time": "18:19:41", "remaining_time": "1:31:38"}
661
+ {"current_steps": 661, "total_steps": 715, "loss": 0.3133, "lr": 1.3841227871840278e-06, "epoch": 4.615919965202262, "percentage": 92.45, "elapsed_time": "18:21:20", "remaining_time": "1:29:58"}
662
+ {"current_steps": 662, "total_steps": 715, "loss": 0.3094, "lr": 1.3336178035767612e-06, "epoch": 4.622879512831666, "percentage": 92.59, "elapsed_time": "18:22:59", "remaining_time": "1:28:18"}
663
+ {"current_steps": 663, "total_steps": 715, "loss": 0.3038, "lr": 1.2840358386168972e-06, "epoch": 4.62983906046107, "percentage": 92.73, "elapsed_time": "18:24:39", "remaining_time": "1:26:38"}
664
+ {"current_steps": 664, "total_steps": 715, "loss": 0.311, "lr": 1.2353780758927347e-06, "epoch": 4.636798608090475, "percentage": 92.87, "elapsed_time": "18:26:18", "remaining_time": "1:24:58"}
665
+ {"current_steps": 665, "total_steps": 715, "loss": 0.3124, "lr": 1.1876456769306554e-06, "epoch": 4.643758155719878, "percentage": 93.01, "elapsed_time": "18:27:57", "remaining_time": "1:23:18"}
666
+ {"current_steps": 666, "total_steps": 715, "loss": 0.3105, "lr": 1.1408397811673376e-06, "epoch": 4.650717703349282, "percentage": 93.15, "elapsed_time": "18:29:36", "remaining_time": "1:21:38"}
667
+ {"current_steps": 667, "total_steps": 715, "loss": 0.3039, "lr": 1.0949615059225871e-06, "epoch": 4.657677250978686, "percentage": 93.29, "elapsed_time": "18:31:15", "remaining_time": "1:19:58"}
668
+ {"current_steps": 668, "total_steps": 715, "loss": 0.3147, "lr": 1.0500119463726467e-06, "epoch": 4.6646367986080906, "percentage": 93.43, "elapsed_time": "18:32:55", "remaining_time": "1:18:18"}
669
+ {"current_steps": 669, "total_steps": 715, "loss": 0.3114, "lr": 1.0059921755240797e-06, "epoch": 4.671596346237495, "percentage": 93.57, "elapsed_time": "18:34:34", "remaining_time": "1:16:38"}
670
+ {"current_steps": 670, "total_steps": 715, "loss": 0.312, "lr": 9.62903244188147e-07, "epoch": 4.678555893866899, "percentage": 93.71, "elapsed_time": "18:36:13", "remaining_time": "1:14:58"}
671
+ {"current_steps": 671, "total_steps": 715, "loss": 0.3115, "lr": 9.207461809556872e-07, "epoch": 4.685515441496303, "percentage": 93.85, "elapsed_time": "18:37:52", "remaining_time": "1:13:18"}
672
+ {"current_steps": 672, "total_steps": 715, "loss": 0.3122, "lr": 8.795219921726139e-07, "epoch": 4.6924749891257065, "percentage": 93.99, "elapsed_time": "18:39:31", "remaining_time": "1:11:38"}
673
+ {"current_steps": 673, "total_steps": 715, "loss": 0.3074, "lr": 8.392316619158669e-07, "epoch": 4.699434536755111, "percentage": 94.13, "elapsed_time": "18:41:11", "remaining_time": "1:09:58"}
674
+ {"current_steps": 674, "total_steps": 715, "loss": 0.3107, "lr": 7.998761519699205e-07, "epoch": 4.706394084384515, "percentage": 94.27, "elapsed_time": "18:42:50", "remaining_time": "1:08:18"}
675
+ {"current_steps": 675, "total_steps": 715, "loss": 0.314, "lr": 7.61456401803824e-07, "epoch": 4.713353632013919, "percentage": 94.41, "elapsed_time": "18:44:29", "remaining_time": "1:06:38"}
676
+ {"current_steps": 676, "total_steps": 715, "loss": 0.3053, "lr": 7.239733285487882e-07, "epoch": 4.720313179643323, "percentage": 94.55, "elapsed_time": "18:46:08", "remaining_time": "1:04:58"}
677
+ {"current_steps": 677, "total_steps": 715, "loss": 0.3098, "lr": 6.874278269762924e-07, "epoch": 4.7272727272727275, "percentage": 94.69, "elapsed_time": "18:47:48", "remaining_time": "1:03:18"}
678
+ {"current_steps": 678, "total_steps": 715, "loss": 0.3111, "lr": 6.518207694766965e-07, "epoch": 4.734232274902132, "percentage": 94.83, "elapsed_time": "18:49:27", "remaining_time": "1:01:38"}
679
+ {"current_steps": 679, "total_steps": 715, "loss": 0.3057, "lr": 6.171530060384445e-07, "epoch": 4.741191822531535, "percentage": 94.97, "elapsed_time": "18:51:06", "remaining_time": "0:59:58"}
680
+ {"current_steps": 680, "total_steps": 715, "loss": 0.3085, "lr": 5.834253642277655e-07, "epoch": 4.748151370160939, "percentage": 95.1, "elapsed_time": "18:52:45", "remaining_time": "0:58:18"}
681
+ {"current_steps": 681, "total_steps": 715, "loss": 0.307, "lr": 5.506386491689197e-07, "epoch": 4.7551109177903434, "percentage": 95.24, "elapsed_time": "18:54:25", "remaining_time": "0:56:38"}
682
+ {"current_steps": 682, "total_steps": 715, "loss": 0.3086, "lr": 5.187936435249796e-07, "epoch": 4.762070465419748, "percentage": 95.38, "elapsed_time": "18:56:04", "remaining_time": "0:54:58"}
683
+ {"current_steps": 683, "total_steps": 715, "loss": 0.3121, "lr": 4.878911074791371e-07, "epoch": 4.769030013049152, "percentage": 95.52, "elapsed_time": "18:57:43", "remaining_time": "0:53:18"}
684
+ {"current_steps": 684, "total_steps": 715, "loss": 0.3062, "lr": 4.57931778716576e-07, "epoch": 4.775989560678556, "percentage": 95.66, "elapsed_time": "18:59:23", "remaining_time": "0:51:38"}
685
+ {"current_steps": 685, "total_steps": 715, "loss": 0.3119, "lr": 4.2891637240684234e-07, "epoch": 4.78294910830796, "percentage": 95.8, "elapsed_time": "19:01:02", "remaining_time": "0:49:58"}
686
+ {"current_steps": 686, "total_steps": 715, "loss": 0.3081, "lr": 4.0084558118678173e-07, "epoch": 4.789908655937364, "percentage": 95.94, "elapsed_time": "19:02:41", "remaining_time": "0:48:18"}
687
+ {"current_steps": 687, "total_steps": 715, "loss": 0.3114, "lr": 3.7372007514401063e-07, "epoch": 4.796868203566768, "percentage": 96.08, "elapsed_time": "19:04:21", "remaining_time": "0:46:38"}
688
+ {"current_steps": 688, "total_steps": 715, "loss": 0.3016, "lr": 3.4754050180090704e-07, "epoch": 4.803827751196172, "percentage": 96.22, "elapsed_time": "19:06:00", "remaining_time": "0:44:58"}
689
+ {"current_steps": 689, "total_steps": 715, "loss": 0.3113, "lr": 3.223074860991693e-07, "epoch": 4.810787298825576, "percentage": 96.36, "elapsed_time": "19:07:39", "remaining_time": "0:43:18"}
690
+ {"current_steps": 690, "total_steps": 715, "loss": 0.3082, "lr": 2.980216303848815e-07, "epoch": 4.81774684645498, "percentage": 96.5, "elapsed_time": "19:09:18", "remaining_time": "0:41:38"}
691
+ {"current_steps": 691, "total_steps": 715, "loss": 0.3076, "lr": 2.746835143941473e-07, "epoch": 4.824706394084385, "percentage": 96.64, "elapsed_time": "19:10:57", "remaining_time": "0:39:58"}
692
+ {"current_steps": 692, "total_steps": 715, "loss": 0.3079, "lr": 2.5229369523923853e-07, "epoch": 4.831665941713789, "percentage": 96.78, "elapsed_time": "19:12:37", "remaining_time": "0:38:18"}
693
+ {"current_steps": 693, "total_steps": 715, "loss": 0.3095, "lr": 2.3085270739531706e-07, "epoch": 4.838625489343193, "percentage": 96.92, "elapsed_time": "19:14:16", "remaining_time": "0:36:38"}
694
+ {"current_steps": 694, "total_steps": 715, "loss": 0.3087, "lr": 2.1036106268765398e-07, "epoch": 4.845585036972597, "percentage": 97.06, "elapsed_time": "19:15:55", "remaining_time": "0:34:58"}
695
+ {"current_steps": 695, "total_steps": 715, "loss": 0.3104, "lr": 1.908192502794215e-07, "epoch": 4.8525445846020006, "percentage": 97.2, "elapsed_time": "19:17:34", "remaining_time": "0:33:18"}
696
+ {"current_steps": 696, "total_steps": 715, "loss": 0.3113, "lr": 1.7222773666001336e-07, "epoch": 4.859504132231405, "percentage": 97.34, "elapsed_time": "19:19:13", "remaining_time": "0:31:38"}
697
+ {"current_steps": 697, "total_steps": 715, "loss": 0.3086, "lr": 1.545869656339072e-07, "epoch": 4.866463679860809, "percentage": 97.48, "elapsed_time": "19:20:53", "remaining_time": "0:29:58"}
698
+ {"current_steps": 698, "total_steps": 715, "loss": 0.3124, "lr": 1.3789735831009064e-07, "epoch": 4.873423227490213, "percentage": 97.62, "elapsed_time": "19:22:32", "remaining_time": "0:28:18"}
699
+ {"current_steps": 699, "total_steps": 715, "loss": 0.3092, "lr": 1.2215931309197626e-07, "epoch": 4.880382775119617, "percentage": 97.76, "elapsed_time": "19:24:11", "remaining_time": "0:26:38"}
700
+ {"current_steps": 700, "total_steps": 715, "loss": 0.311, "lr": 1.0737320566790221e-07, "epoch": 4.887342322749022, "percentage": 97.9, "elapsed_time": "19:25:50", "remaining_time": "0:24:58"}
701
+ {"current_steps": 701, "total_steps": 715, "loss": 0.3135, "lr": 9.35393890021885e-08, "epoch": 4.894301870378426, "percentage": 98.04, "elapsed_time": "19:27:30", "remaining_time": "0:23:19"}
702
+ {"current_steps": 702, "total_steps": 715, "loss": 0.3063, "lr": 8.065819332667702e-08, "epoch": 4.901261418007829, "percentage": 98.18, "elapsed_time": "19:29:09", "remaining_time": "0:21:39"}
703
+ {"current_steps": 703, "total_steps": 715, "loss": 0.311, "lr": 6.872992613286223e-08, "epoch": 4.908220965637233, "percentage": 98.32, "elapsed_time": "19:30:48", "remaining_time": "0:19:59"}
704
+ {"current_steps": 704, "total_steps": 715, "loss": 0.3123, "lr": 5.775487216456377e-08, "epoch": 4.9151805132666375, "percentage": 98.46, "elapsed_time": "19:32:28", "remaining_time": "0:18:19"}
705
+ {"current_steps": 705, "total_steps": 715, "loss": 0.3155, "lr": 4.7733293411105216e-08, "epoch": 4.922140060896042, "percentage": 98.6, "elapsed_time": "19:34:07", "remaining_time": "0:16:39"}
706
+ {"current_steps": 706, "total_steps": 715, "loss": 0.3044, "lr": 3.8665429101070185e-08, "epoch": 4.929099608525446, "percentage": 98.74, "elapsed_time": "19:35:46", "remaining_time": "0:14:59"}
707
+ {"current_steps": 707, "total_steps": 715, "loss": 0.3121, "lr": 3.055149569660909e-08, "epoch": 4.93605915615485, "percentage": 98.88, "elapsed_time": "19:37:26", "remaining_time": "0:13:19"}
708
+ {"current_steps": 708, "total_steps": 715, "loss": 0.3123, "lr": 2.3391686888238894e-08, "epoch": 4.943018703784254, "percentage": 99.02, "elapsed_time": "19:39:05", "remaining_time": "0:11:39"}
709
+ {"current_steps": 709, "total_steps": 715, "loss": 0.3037, "lr": 1.7186173590251208e-08, "epoch": 4.949978251413658, "percentage": 99.16, "elapsed_time": "19:40:44", "remaining_time": "0:09:59"}
710
+ {"current_steps": 710, "total_steps": 715, "loss": 0.3109, "lr": 1.1935103936600023e-08, "epoch": 4.956937799043062, "percentage": 99.3, "elapsed_time": "19:42:24", "remaining_time": "0:08:19"}
711
+ {"current_steps": 711, "total_steps": 715, "loss": 0.315, "lr": 7.63860327740229e-09, "epoch": 4.963897346672466, "percentage": 99.44, "elapsed_time": "19:44:03", "remaining_time": "0:06:39"}
712
+ {"current_steps": 712, "total_steps": 715, "loss": 0.3114, "lr": 4.296774175918117e-09, "epoch": 4.97085689430187, "percentage": 99.58, "elapsed_time": "19:45:43", "remaining_time": "0:04:59"}
713
+ {"current_steps": 713, "total_steps": 715, "loss": 0.3132, "lr": 1.909696406103834e-09, "epoch": 4.9778164419312745, "percentage": 99.72, "elapsed_time": "19:47:23", "remaining_time": "0:03:19"}
714
+ {"current_steps": 714, "total_steps": 715, "loss": 0.3053, "lr": 4.77426950733495e-10, "epoch": 4.984775989560679, "percentage": 99.86, "elapsed_time": "19:49:02", "remaining_time": "0:01:39"}
715
+ {"current_steps": 715, "total_steps": 715, "loss": 0.3097, "lr": 0.0, "epoch": 4.991735537190083, "percentage": 100.0, "elapsed_time": "19:50:42", "remaining_time": "0:00:00"}
716
+ {"current_steps": 715, "total_steps": 715, "epoch": 4.991735537190083, "percentage": 100.0, "elapsed_time": "19:53:48", "remaining_time": "0:00:00"}