Training in progress, epoch 3
Browse files
model-00001-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4877660776
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:859999415129a8904d509cc6346c9539b26b55bd8880b66aabc76b2dc6b30c46
|
3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4932751008
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d3eab6206f90615b1e4570389ac8bbe2e1413273af34b0501e30f107e0883dc0
|
3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4330865200
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e8372f6bb480a88ba3bbbfe18f6df82cf5a5da35b749636005844195f58722b6
|
3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1089994880
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e5a8a224f8fb12e29002a71d3bb3bd17da1751758f311cf58a189ada904b08f6
|
3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
@@ -486,3 +486,242 @@
|
|
486 |
{"current_steps": 486, "total_steps": 1200, "loss": 0.484, "lr": 2.9696192404926747e-05, "epoch": 2.025, "percentage": 40.5, "elapsed_time": "3:12:18", "remaining_time": "4:42:32"}
|
487 |
{"current_steps": 487, "total_steps": 1200, "loss": 0.485, "lr": 2.964526814211338e-05, "epoch": 2.029166666666667, "percentage": 40.58, "elapsed_time": "3:12:42", "remaining_time": "4:42:08"}
|
488 |
{"current_steps": 488, "total_steps": 1200, "loss": 0.4809, "lr": 2.959426226500493e-05, "epoch": 2.033333333333333, "percentage": 40.67, "elapsed_time": "3:13:07", "remaining_time": "4:41:46"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
486 |
{"current_steps": 486, "total_steps": 1200, "loss": 0.484, "lr": 2.9696192404926747e-05, "epoch": 2.025, "percentage": 40.5, "elapsed_time": "3:12:18", "remaining_time": "4:42:32"}
|
487 |
{"current_steps": 487, "total_steps": 1200, "loss": 0.485, "lr": 2.964526814211338e-05, "epoch": 2.029166666666667, "percentage": 40.58, "elapsed_time": "3:12:42", "remaining_time": "4:42:08"}
|
488 |
{"current_steps": 488, "total_steps": 1200, "loss": 0.4809, "lr": 2.959426226500493e-05, "epoch": 2.033333333333333, "percentage": 40.67, "elapsed_time": "3:13:07", "remaining_time": "4:41:46"}
|
489 |
+
{"current_steps": 489, "total_steps": 1200, "loss": 0.4661, "lr": 2.954317520519217e-05, "epoch": 2.0375, "percentage": 40.75, "elapsed_time": "3:13:30", "remaining_time": "4:41:22"}
|
490 |
+
{"current_steps": 490, "total_steps": 1200, "loss": 0.483, "lr": 2.9492007394952812e-05, "epoch": 2.0416666666666665, "percentage": 40.83, "elapsed_time": "3:13:54", "remaining_time": "4:40:57"}
|
491 |
+
{"current_steps": 491, "total_steps": 1200, "loss": 0.4672, "lr": 2.9440759267247828e-05, "epoch": 2.0458333333333334, "percentage": 40.92, "elapsed_time": "3:14:17", "remaining_time": "4:40:32"}
|
492 |
+
{"current_steps": 492, "total_steps": 1200, "loss": 0.4781, "lr": 2.938943125571782e-05, "epoch": 2.05, "percentage": 41.0, "elapsed_time": "3:14:40", "remaining_time": "4:40:08"}
|
493 |
+
{"current_steps": 493, "total_steps": 1200, "loss": 0.4736, "lr": 2.933802379467932e-05, "epoch": 2.0541666666666667, "percentage": 41.08, "elapsed_time": "3:15:04", "remaining_time": "4:39:44"}
|
494 |
+
{"current_steps": 494, "total_steps": 1200, "loss": 0.4795, "lr": 2.9286537319121143e-05, "epoch": 2.058333333333333, "percentage": 41.17, "elapsed_time": "3:15:28", "remaining_time": "4:39:21"}
|
495 |
+
{"current_steps": 495, "total_steps": 1200, "loss": 0.5018, "lr": 2.9234972264700687e-05, "epoch": 2.0625, "percentage": 41.25, "elapsed_time": "3:15:50", "remaining_time": "4:38:55"}
|
496 |
+
{"current_steps": 496, "total_steps": 1200, "loss": 0.4698, "lr": 2.9183329067740235e-05, "epoch": 2.066666666666667, "percentage": 41.33, "elapsed_time": "3:16:13", "remaining_time": "4:38:30"}
|
497 |
+
{"current_steps": 497, "total_steps": 1200, "loss": 0.4755, "lr": 2.9131608165223313e-05, "epoch": 2.0708333333333333, "percentage": 41.42, "elapsed_time": "3:16:35", "remaining_time": "4:38:05"}
|
498 |
+
{"current_steps": 498, "total_steps": 1200, "loss": 0.5212, "lr": 2.9079809994790937e-05, "epoch": 2.075, "percentage": 41.5, "elapsed_time": "3:16:57", "remaining_time": "4:37:39"}
|
499 |
+
{"current_steps": 499, "total_steps": 1200, "loss": 0.4897, "lr": 2.902793499473794e-05, "epoch": 2.0791666666666666, "percentage": 41.58, "elapsed_time": "3:17:21", "remaining_time": "4:37:14"}
|
500 |
+
{"current_steps": 500, "total_steps": 1200, "loss": 0.4785, "lr": 2.897598360400925e-05, "epoch": 2.0833333333333335, "percentage": 41.67, "elapsed_time": "3:17:44", "remaining_time": "4:36:49"}
|
501 |
+
{"current_steps": 501, "total_steps": 1200, "loss": 0.4776, "lr": 2.8923956262196178e-05, "epoch": 2.0875, "percentage": 41.75, "elapsed_time": "3:18:07", "remaining_time": "4:36:25"}
|
502 |
+
{"current_steps": 502, "total_steps": 1200, "loss": 0.5005, "lr": 2.8871853409532727e-05, "epoch": 2.091666666666667, "percentage": 41.83, "elapsed_time": "3:18:30", "remaining_time": "4:36:00"}
|
503 |
+
{"current_steps": 503, "total_steps": 1200, "loss": 0.4657, "lr": 2.88196754868918e-05, "epoch": 2.095833333333333, "percentage": 41.92, "elapsed_time": "3:18:52", "remaining_time": "4:35:35"}
|
504 |
+
{"current_steps": 504, "total_steps": 1200, "loss": 0.4723, "lr": 2.876742293578155e-05, "epoch": 2.1, "percentage": 42.0, "elapsed_time": "3:19:15", "remaining_time": "4:35:10"}
|
505 |
+
{"current_steps": 505, "total_steps": 1200, "loss": 0.4727, "lr": 2.871509619834159e-05, "epoch": 2.1041666666666665, "percentage": 42.08, "elapsed_time": "3:19:39", "remaining_time": "4:34:46"}
|
506 |
+
{"current_steps": 506, "total_steps": 1200, "loss": 0.4715, "lr": 2.8662695717339263e-05, "epoch": 2.1083333333333334, "percentage": 42.17, "elapsed_time": "3:20:02", "remaining_time": "4:34:21"}
|
507 |
+
{"current_steps": 507, "total_steps": 1200, "loss": 0.482, "lr": 2.8610221936165906e-05, "epoch": 2.1125, "percentage": 42.25, "elapsed_time": "3:20:26", "remaining_time": "4:33:58"}
|
508 |
+
{"current_steps": 508, "total_steps": 1200, "loss": 0.485, "lr": 2.8557675298833086e-05, "epoch": 2.1166666666666667, "percentage": 42.33, "elapsed_time": "3:20:48", "remaining_time": "4:33:32"}
|
509 |
+
{"current_steps": 509, "total_steps": 1200, "loss": 0.4873, "lr": 2.8505056249968864e-05, "epoch": 2.120833333333333, "percentage": 42.42, "elapsed_time": "3:21:11", "remaining_time": "4:33:07"}
|
510 |
+
{"current_steps": 510, "total_steps": 1200, "loss": 0.4823, "lr": 2.8452365234813992e-05, "epoch": 2.125, "percentage": 42.5, "elapsed_time": "3:21:33", "remaining_time": "4:32:41"}
|
511 |
+
{"current_steps": 511, "total_steps": 1200, "loss": 0.4914, "lr": 2.8399602699218194e-05, "epoch": 2.129166666666667, "percentage": 42.58, "elapsed_time": "3:21:56", "remaining_time": "4:32:17"}
|
512 |
+
{"current_steps": 512, "total_steps": 1200, "loss": 0.4818, "lr": 2.834676908963636e-05, "epoch": 2.1333333333333333, "percentage": 42.67, "elapsed_time": "3:22:20", "remaining_time": "4:31:53"}
|
513 |
+
{"current_steps": 513, "total_steps": 1200, "loss": 0.4661, "lr": 2.8293864853124783e-05, "epoch": 2.1375, "percentage": 42.75, "elapsed_time": "3:22:42", "remaining_time": "4:31:27"}
|
514 |
+
{"current_steps": 514, "total_steps": 1200, "loss": 0.4712, "lr": 2.8240890437337373e-05, "epoch": 2.1416666666666666, "percentage": 42.83, "elapsed_time": "3:23:05", "remaining_time": "4:31:02"}
|
515 |
+
{"current_steps": 515, "total_steps": 1200, "loss": 0.4785, "lr": 2.8187846290521852e-05, "epoch": 2.1458333333333335, "percentage": 42.92, "elapsed_time": "3:23:28", "remaining_time": "4:30:38"}
|
516 |
+
{"current_steps": 516, "total_steps": 1200, "loss": 0.4756, "lr": 2.813473286151601e-05, "epoch": 2.15, "percentage": 43.0, "elapsed_time": "3:23:50", "remaining_time": "4:30:13"}
|
517 |
+
{"current_steps": 517, "total_steps": 1200, "loss": 0.475, "lr": 2.8081550599743835e-05, "epoch": 2.154166666666667, "percentage": 43.08, "elapsed_time": "3:24:14", "remaining_time": "4:29:49"}
|
518 |
+
{"current_steps": 518, "total_steps": 1200, "loss": 0.4827, "lr": 2.8028299955211785e-05, "epoch": 2.158333333333333, "percentage": 43.17, "elapsed_time": "3:24:38", "remaining_time": "4:29:25"}
|
519 |
+
{"current_steps": 519, "total_steps": 1200, "loss": 0.4774, "lr": 2.7974981378504926e-05, "epoch": 2.1625, "percentage": 43.25, "elapsed_time": "3:25:02", "remaining_time": "4:29:03"}
|
520 |
+
{"current_steps": 520, "total_steps": 1200, "loss": 0.4865, "lr": 2.792159532078314e-05, "epoch": 2.1666666666666665, "percentage": 43.33, "elapsed_time": "3:25:25", "remaining_time": "4:28:38"}
|
521 |
+
{"current_steps": 521, "total_steps": 1200, "loss": 0.4804, "lr": 2.7868142233777305e-05, "epoch": 2.1708333333333334, "percentage": 43.42, "elapsed_time": "3:25:49", "remaining_time": "4:28:14"}
|
522 |
+
{"current_steps": 522, "total_steps": 1200, "loss": 0.473, "lr": 2.7814622569785474e-05, "epoch": 2.175, "percentage": 43.5, "elapsed_time": "3:26:12", "remaining_time": "4:27:50"}
|
523 |
+
{"current_steps": 523, "total_steps": 1200, "loss": 0.4804, "lr": 2.776103678166906e-05, "epoch": 2.1791666666666667, "percentage": 43.58, "elapsed_time": "3:26:36", "remaining_time": "4:27:26"}
|
524 |
+
{"current_steps": 524, "total_steps": 1200, "loss": 0.481, "lr": 2.770738532284897e-05, "epoch": 2.183333333333333, "percentage": 43.67, "elapsed_time": "3:26:59", "remaining_time": "4:27:02"}
|
525 |
+
{"current_steps": 525, "total_steps": 1200, "loss": 0.486, "lr": 2.7653668647301797e-05, "epoch": 2.1875, "percentage": 43.75, "elapsed_time": "3:27:22", "remaining_time": "4:26:38"}
|
526 |
+
{"current_steps": 526, "total_steps": 1200, "loss": 0.4704, "lr": 2.7599887209555986e-05, "epoch": 2.191666666666667, "percentage": 43.83, "elapsed_time": "3:27:46", "remaining_time": "4:26:13"}
|
527 |
+
{"current_steps": 527, "total_steps": 1200, "loss": 0.4735, "lr": 2.7546041464687942e-05, "epoch": 2.1958333333333333, "percentage": 43.92, "elapsed_time": "3:28:09", "remaining_time": "4:25:49"}
|
528 |
+
{"current_steps": 528, "total_steps": 1200, "loss": 0.4906, "lr": 2.7492131868318247e-05, "epoch": 2.2, "percentage": 44.0, "elapsed_time": "3:28:32", "remaining_time": "4:25:24"}
|
529 |
+
{"current_steps": 529, "total_steps": 1200, "loss": 0.478, "lr": 2.7438158876607732e-05, "epoch": 2.2041666666666666, "percentage": 44.08, "elapsed_time": "3:28:56", "remaining_time": "4:25:01"}
|
530 |
+
{"current_steps": 530, "total_steps": 1200, "loss": 0.4926, "lr": 2.738412294625369e-05, "epoch": 2.2083333333333335, "percentage": 44.17, "elapsed_time": "3:29:20", "remaining_time": "4:24:38"}
|
531 |
+
{"current_steps": 531, "total_steps": 1200, "loss": 0.4726, "lr": 2.7330024534485948e-05, "epoch": 2.2125, "percentage": 44.25, "elapsed_time": "3:29:42", "remaining_time": "4:24:12"}
|
532 |
+
{"current_steps": 532, "total_steps": 1200, "loss": 0.4732, "lr": 2.7275864099063033e-05, "epoch": 2.216666666666667, "percentage": 44.33, "elapsed_time": "3:30:05", "remaining_time": "4:23:48"}
|
533 |
+
{"current_steps": 533, "total_steps": 1200, "loss": 0.4946, "lr": 2.7221642098268292e-05, "epoch": 2.220833333333333, "percentage": 44.42, "elapsed_time": "3:30:28", "remaining_time": "4:23:23"}
|
534 |
+
{"current_steps": 534, "total_steps": 1200, "loss": 0.4831, "lr": 2.7167358990906e-05, "epoch": 2.225, "percentage": 44.5, "elapsed_time": "3:30:51", "remaining_time": "4:22:58"}
|
535 |
+
{"current_steps": 535, "total_steps": 1200, "loss": 0.477, "lr": 2.7113015236297537e-05, "epoch": 2.2291666666666665, "percentage": 44.58, "elapsed_time": "3:31:14", "remaining_time": "4:22:34"}
|
536 |
+
{"current_steps": 536, "total_steps": 1200, "loss": 0.4698, "lr": 2.7058611294277378e-05, "epoch": 2.2333333333333334, "percentage": 44.67, "elapsed_time": "3:31:38", "remaining_time": "4:22:11"}
|
537 |
+
{"current_steps": 537, "total_steps": 1200, "loss": 0.4719, "lr": 2.7004147625189353e-05, "epoch": 2.2375, "percentage": 44.75, "elapsed_time": "3:32:02", "remaining_time": "4:21:47"}
|
538 |
+
{"current_steps": 538, "total_steps": 1200, "loss": 0.4898, "lr": 2.694962468988263e-05, "epoch": 2.2416666666666667, "percentage": 44.83, "elapsed_time": "3:32:25", "remaining_time": "4:21:22"}
|
539 |
+
{"current_steps": 539, "total_steps": 1200, "loss": 0.4922, "lr": 2.6895042949707886e-05, "epoch": 2.245833333333333, "percentage": 44.92, "elapsed_time": "3:32:47", "remaining_time": "4:20:57"}
|
540 |
+
{"current_steps": 540, "total_steps": 1200, "loss": 0.4862, "lr": 2.684040286651338e-05, "epoch": 2.25, "percentage": 45.0, "elapsed_time": "3:33:11", "remaining_time": "4:20:33"}
|
541 |
+
{"current_steps": 541, "total_steps": 1200, "loss": 0.4751, "lr": 2.6785704902641024e-05, "epoch": 2.2541666666666664, "percentage": 45.08, "elapsed_time": "3:33:34", "remaining_time": "4:20:10"}
|
542 |
+
{"current_steps": 542, "total_steps": 1200, "loss": 0.4719, "lr": 2.673094952092253e-05, "epoch": 2.2583333333333333, "percentage": 45.17, "elapsed_time": "3:33:57", "remaining_time": "4:19:45"}
|
543 |
+
{"current_steps": 543, "total_steps": 1200, "loss": 0.4807, "lr": 2.667613718467542e-05, "epoch": 2.2625, "percentage": 45.25, "elapsed_time": "3:34:20", "remaining_time": "4:19:20"}
|
544 |
+
{"current_steps": 544, "total_steps": 1200, "loss": 0.4706, "lr": 2.6621268357699165e-05, "epoch": 2.2666666666666666, "percentage": 45.33, "elapsed_time": "3:34:43", "remaining_time": "4:18:56"}
|
545 |
+
{"current_steps": 545, "total_steps": 1200, "loss": 0.4708, "lr": 2.6566343504271227e-05, "epoch": 2.2708333333333335, "percentage": 45.42, "elapsed_time": "3:35:06", "remaining_time": "4:18:31"}
|
546 |
+
{"current_steps": 546, "total_steps": 1200, "loss": 0.4791, "lr": 2.6511363089143137e-05, "epoch": 2.275, "percentage": 45.5, "elapsed_time": "3:35:30", "remaining_time": "4:18:08"}
|
547 |
+
{"current_steps": 547, "total_steps": 1200, "loss": 0.4773, "lr": 2.645632757753658e-05, "epoch": 2.279166666666667, "percentage": 45.58, "elapsed_time": "3:35:53", "remaining_time": "4:17:43"}
|
548 |
+
{"current_steps": 548, "total_steps": 1200, "loss": 0.4782, "lr": 2.640123743513943e-05, "epoch": 2.283333333333333, "percentage": 45.67, "elapsed_time": "3:36:16", "remaining_time": "4:17:18"}
|
549 |
+
{"current_steps": 549, "total_steps": 1200, "loss": 0.4904, "lr": 2.6346093128101847e-05, "epoch": 2.2875, "percentage": 45.75, "elapsed_time": "3:36:39", "remaining_time": "4:16:54"}
|
550 |
+
{"current_steps": 550, "total_steps": 1200, "loss": 0.4737, "lr": 2.6290895123032277e-05, "epoch": 2.2916666666666665, "percentage": 45.83, "elapsed_time": "3:37:02", "remaining_time": "4:16:29"}
|
551 |
+
{"current_steps": 551, "total_steps": 1200, "loss": 0.4717, "lr": 2.623564388699356e-05, "epoch": 2.2958333333333334, "percentage": 45.92, "elapsed_time": "3:37:25", "remaining_time": "4:16:05"}
|
552 |
+
{"current_steps": 552, "total_steps": 1200, "loss": 0.4958, "lr": 2.618033988749895e-05, "epoch": 2.3, "percentage": 46.0, "elapsed_time": "3:37:48", "remaining_time": "4:15:41"}
|
553 |
+
{"current_steps": 553, "total_steps": 1200, "loss": 0.4863, "lr": 2.6124983592508164e-05, "epoch": 2.3041666666666667, "percentage": 46.08, "elapsed_time": "3:38:12", "remaining_time": "4:15:17"}
|
554 |
+
{"current_steps": 554, "total_steps": 1200, "loss": 0.4751, "lr": 2.6069575470423417e-05, "epoch": 2.3083333333333336, "percentage": 46.17, "elapsed_time": "3:38:34", "remaining_time": "4:14:52"}
|
555 |
+
{"current_steps": 555, "total_steps": 1200, "loss": 0.4857, "lr": 2.601411599008546e-05, "epoch": 2.3125, "percentage": 46.25, "elapsed_time": "3:38:57", "remaining_time": "4:14:27"}
|
556 |
+
{"current_steps": 556, "total_steps": 1200, "loss": 0.4971, "lr": 2.595860562076964e-05, "epoch": 2.3166666666666664, "percentage": 46.33, "elapsed_time": "3:39:19", "remaining_time": "4:14:02"}
|
557 |
+
{"current_steps": 557, "total_steps": 1200, "loss": 0.4771, "lr": 2.590304483218188e-05, "epoch": 2.3208333333333333, "percentage": 46.42, "elapsed_time": "3:39:43", "remaining_time": "4:13:38"}
|
558 |
+
{"current_steps": 558, "total_steps": 1200, "loss": 0.4678, "lr": 2.5847434094454737e-05, "epoch": 2.325, "percentage": 46.5, "elapsed_time": "3:40:06", "remaining_time": "4:13:14"}
|
559 |
+
{"current_steps": 559, "total_steps": 1200, "loss": 0.4874, "lr": 2.5791773878143423e-05, "epoch": 2.3291666666666666, "percentage": 46.58, "elapsed_time": "3:40:29", "remaining_time": "4:12:50"}
|
560 |
+
{"current_steps": 560, "total_steps": 1200, "loss": 0.4846, "lr": 2.5736064654221808e-05, "epoch": 2.3333333333333335, "percentage": 46.67, "elapsed_time": "3:40:52", "remaining_time": "4:12:26"}
|
561 |
+
{"current_steps": 561, "total_steps": 1200, "loss": 0.4717, "lr": 2.568030689407846e-05, "epoch": 2.3375, "percentage": 46.75, "elapsed_time": "3:41:16", "remaining_time": "4:12:02"}
|
562 |
+
{"current_steps": 562, "total_steps": 1200, "loss": 0.4896, "lr": 2.5624501069512614e-05, "epoch": 2.341666666666667, "percentage": 46.83, "elapsed_time": "3:41:40", "remaining_time": "4:11:38"}
|
563 |
+
{"current_steps": 563, "total_steps": 1200, "loss": 0.4793, "lr": 2.556864765273024e-05, "epoch": 2.345833333333333, "percentage": 46.92, "elapsed_time": "3:42:03", "remaining_time": "4:11:14"}
|
564 |
+
{"current_steps": 564, "total_steps": 1200, "loss": 0.4728, "lr": 2.5512747116339985e-05, "epoch": 2.35, "percentage": 47.0, "elapsed_time": "3:42:25", "remaining_time": "4:10:49"}
|
565 |
+
{"current_steps": 565, "total_steps": 1200, "loss": 0.4858, "lr": 2.5456799933349224e-05, "epoch": 2.3541666666666665, "percentage": 47.08, "elapsed_time": "3:42:49", "remaining_time": "4:10:25"}
|
566 |
+
{"current_steps": 566, "total_steps": 1200, "loss": 0.4756, "lr": 2.540080657716002e-05, "epoch": 2.3583333333333334, "percentage": 47.17, "elapsed_time": "3:43:13", "remaining_time": "4:10:02"}
|
567 |
+
{"current_steps": 567, "total_steps": 1200, "loss": 0.4834, "lr": 2.534476752156514e-05, "epoch": 2.3625, "percentage": 47.25, "elapsed_time": "3:43:36", "remaining_time": "4:09:38"}
|
568 |
+
{"current_steps": 568, "total_steps": 1200, "loss": 0.4726, "lr": 2.528868324074405e-05, "epoch": 2.3666666666666667, "percentage": 47.33, "elapsed_time": "3:44:00", "remaining_time": "4:09:14"}
|
569 |
+
{"current_steps": 569, "total_steps": 1200, "loss": 0.4878, "lr": 2.523255420925887e-05, "epoch": 2.3708333333333336, "percentage": 47.42, "elapsed_time": "3:44:23", "remaining_time": "4:08:50"}
|
570 |
+
{"current_steps": 570, "total_steps": 1200, "loss": 0.4842, "lr": 2.5176380902050418e-05, "epoch": 2.375, "percentage": 47.5, "elapsed_time": "3:44:46", "remaining_time": "4:08:26"}
|
571 |
+
{"current_steps": 571, "total_steps": 1200, "loss": 0.4676, "lr": 2.512016379443412e-05, "epoch": 2.3791666666666664, "percentage": 47.58, "elapsed_time": "3:45:10", "remaining_time": "4:08:03"}
|
572 |
+
{"current_steps": 572, "total_steps": 1200, "loss": 0.4777, "lr": 2.506390336209604e-05, "epoch": 2.3833333333333333, "percentage": 47.67, "elapsed_time": "3:45:33", "remaining_time": "4:07:38"}
|
573 |
+
{"current_steps": 573, "total_steps": 1200, "loss": 0.472, "lr": 2.5007600081088833e-05, "epoch": 2.3875, "percentage": 47.75, "elapsed_time": "3:45:55", "remaining_time": "4:07:13"}
|
574 |
+
{"current_steps": 574, "total_steps": 1200, "loss": 0.4939, "lr": 2.4951254427827723e-05, "epoch": 2.3916666666666666, "percentage": 47.83, "elapsed_time": "3:46:19", "remaining_time": "4:06:49"}
|
575 |
+
{"current_steps": 575, "total_steps": 1200, "loss": 0.4677, "lr": 2.4894866879086478e-05, "epoch": 2.3958333333333335, "percentage": 47.92, "elapsed_time": "3:46:41", "remaining_time": "4:06:24"}
|
576 |
+
{"current_steps": 576, "total_steps": 1200, "loss": 0.4809, "lr": 2.4838437911993355e-05, "epoch": 2.4, "percentage": 48.0, "elapsed_time": "3:47:05", "remaining_time": "4:06:01"}
|
577 |
+
{"current_steps": 577, "total_steps": 1200, "loss": 0.4875, "lr": 2.478196800402709e-05, "epoch": 2.404166666666667, "percentage": 48.08, "elapsed_time": "3:47:28", "remaining_time": "4:05:37"}
|
578 |
+
{"current_steps": 578, "total_steps": 1200, "loss": 0.4786, "lr": 2.4725457633012836e-05, "epoch": 2.408333333333333, "percentage": 48.17, "elapsed_time": "3:47:51", "remaining_time": "4:05:12"}
|
579 |
+
{"current_steps": 579, "total_steps": 1200, "loss": 0.4742, "lr": 2.4668907277118114e-05, "epoch": 2.4125, "percentage": 48.25, "elapsed_time": "3:48:15", "remaining_time": "4:04:48"}
|
580 |
+
{"current_steps": 580, "total_steps": 1200, "loss": 0.494, "lr": 2.4612317414848804e-05, "epoch": 2.4166666666666665, "percentage": 48.33, "elapsed_time": "3:48:38", "remaining_time": "4:04:25"}
|
581 |
+
{"current_steps": 581, "total_steps": 1200, "loss": 0.4741, "lr": 2.455568852504507e-05, "epoch": 2.4208333333333334, "percentage": 48.42, "elapsed_time": "3:49:02", "remaining_time": "4:04:00"}
|
582 |
+
{"current_steps": 582, "total_steps": 1200, "loss": 0.4887, "lr": 2.4499021086877304e-05, "epoch": 2.425, "percentage": 48.5, "elapsed_time": "3:49:25", "remaining_time": "4:03:37"}
|
583 |
+
{"current_steps": 583, "total_steps": 1200, "loss": 0.4777, "lr": 2.4442315579842068e-05, "epoch": 2.4291666666666667, "percentage": 48.58, "elapsed_time": "3:49:49", "remaining_time": "4:03:14"}
|
584 |
+
{"current_steps": 584, "total_steps": 1200, "loss": 0.4984, "lr": 2.4385572483758066e-05, "epoch": 2.4333333333333336, "percentage": 48.67, "elapsed_time": "3:50:12", "remaining_time": "4:02:49"}
|
585 |
+
{"current_steps": 585, "total_steps": 1200, "loss": 0.4779, "lr": 2.4328792278762058e-05, "epoch": 2.4375, "percentage": 48.75, "elapsed_time": "3:50:36", "remaining_time": "4:02:25"}
|
586 |
+
{"current_steps": 586, "total_steps": 1200, "loss": 0.4771, "lr": 2.4271975445304806e-05, "epoch": 2.4416666666666664, "percentage": 48.83, "elapsed_time": "3:50:59", "remaining_time": "4:02:01"}
|
587 |
+
{"current_steps": 587, "total_steps": 1200, "loss": 0.4708, "lr": 2.4215122464146996e-05, "epoch": 2.4458333333333333, "percentage": 48.92, "elapsed_time": "3:51:22", "remaining_time": "4:01:37"}
|
588 |
+
{"current_steps": 588, "total_steps": 1200, "loss": 0.4797, "lr": 2.4158233816355185e-05, "epoch": 2.45, "percentage": 49.0, "elapsed_time": "3:51:45", "remaining_time": "4:01:13"}
|
589 |
+
{"current_steps": 589, "total_steps": 1200, "loss": 0.4921, "lr": 2.4101309983297757e-05, "epoch": 2.4541666666666666, "percentage": 49.08, "elapsed_time": "3:52:08", "remaining_time": "4:00:48"}
|
590 |
+
{"current_steps": 590, "total_steps": 1200, "loss": 0.4783, "lr": 2.4044351446640763e-05, "epoch": 2.4583333333333335, "percentage": 49.17, "elapsed_time": "3:52:30", "remaining_time": "4:00:23"}
|
591 |
+
{"current_steps": 591, "total_steps": 1200, "loss": 0.4876, "lr": 2.3987358688343946e-05, "epoch": 2.4625, "percentage": 49.25, "elapsed_time": "3:52:54", "remaining_time": "3:59:59"}
|
592 |
+
{"current_steps": 592, "total_steps": 1200, "loss": 0.4796, "lr": 2.3930332190656604e-05, "epoch": 2.466666666666667, "percentage": 49.33, "elapsed_time": "3:53:17", "remaining_time": "3:59:35"}
|
593 |
+
{"current_steps": 593, "total_steps": 1200, "loss": 0.4913, "lr": 2.3873272436113525e-05, "epoch": 2.470833333333333, "percentage": 49.42, "elapsed_time": "3:53:41", "remaining_time": "3:59:12"}
|
594 |
+
{"current_steps": 594, "total_steps": 1200, "loss": 0.473, "lr": 2.38161799075309e-05, "epoch": 2.475, "percentage": 49.5, "elapsed_time": "3:54:04", "remaining_time": "3:58:47"}
|
595 |
+
{"current_steps": 595, "total_steps": 1200, "loss": 0.4784, "lr": 2.375905508800224e-05, "epoch": 2.4791666666666665, "percentage": 49.58, "elapsed_time": "3:54:26", "remaining_time": "3:58:23"}
|
596 |
+
{"current_steps": 596, "total_steps": 1200, "loss": 0.4756, "lr": 2.370189846089429e-05, "epoch": 2.4833333333333334, "percentage": 49.67, "elapsed_time": "3:54:48", "remaining_time": "3:57:57"}
|
597 |
+
{"current_steps": 597, "total_steps": 1200, "loss": 0.4809, "lr": 2.3644710509842956e-05, "epoch": 2.4875, "percentage": 49.75, "elapsed_time": "3:55:12", "remaining_time": "3:57:34"}
|
598 |
+
{"current_steps": 598, "total_steps": 1200, "loss": 0.4953, "lr": 2.358749171874915e-05, "epoch": 2.4916666666666667, "percentage": 49.83, "elapsed_time": "3:55:34", "remaining_time": "3:57:09"}
|
599 |
+
{"current_steps": 599, "total_steps": 1200, "loss": 0.4902, "lr": 2.3530242571774787e-05, "epoch": 2.4958333333333336, "percentage": 49.92, "elapsed_time": "3:55:58", "remaining_time": "3:56:45"}
|
600 |
+
{"current_steps": 600, "total_steps": 1200, "loss": 0.4934, "lr": 2.3472963553338614e-05, "epoch": 2.5, "percentage": 50.0, "elapsed_time": "3:56:21", "remaining_time": "3:56:21"}
|
601 |
+
{"current_steps": 601, "total_steps": 1200, "loss": 0.4834, "lr": 2.341565514811214e-05, "epoch": 2.5041666666666664, "percentage": 50.08, "elapsed_time": "3:56:45", "remaining_time": "3:55:57"}
|
602 |
+
{"current_steps": 602, "total_steps": 1200, "loss": 0.4942, "lr": 2.3358317841015547e-05, "epoch": 2.5083333333333333, "percentage": 50.17, "elapsed_time": "3:57:09", "remaining_time": "3:55:34"}
|
603 |
+
{"current_steps": 603, "total_steps": 1200, "loss": 0.4884, "lr": 2.3300952117213552e-05, "epoch": 2.5125, "percentage": 50.25, "elapsed_time": "3:57:32", "remaining_time": "3:55:10"}
|
604 |
+
{"current_steps": 604, "total_steps": 1200, "loss": 0.4823, "lr": 2.3243558462111354e-05, "epoch": 2.5166666666666666, "percentage": 50.33, "elapsed_time": "3:57:54", "remaining_time": "3:54:45"}
|
605 |
+
{"current_steps": 605, "total_steps": 1200, "loss": 0.4809, "lr": 2.3186137361350455e-05, "epoch": 2.5208333333333335, "percentage": 50.42, "elapsed_time": "3:58:17", "remaining_time": "3:54:21"}
|
606 |
+
{"current_steps": 606, "total_steps": 1200, "loss": 0.4833, "lr": 2.312868930080462e-05, "epoch": 2.525, "percentage": 50.5, "elapsed_time": "3:58:40", "remaining_time": "3:53:57"}
|
607 |
+
{"current_steps": 607, "total_steps": 1200, "loss": 0.4882, "lr": 2.3071214766575722e-05, "epoch": 2.529166666666667, "percentage": 50.58, "elapsed_time": "3:59:04", "remaining_time": "3:53:33"}
|
608 |
+
{"current_steps": 608, "total_steps": 1200, "loss": 0.4704, "lr": 2.3013714244989665e-05, "epoch": 2.533333333333333, "percentage": 50.67, "elapsed_time": "3:59:28", "remaining_time": "3:53:09"}
|
609 |
+
{"current_steps": 609, "total_steps": 1200, "loss": 0.474, "lr": 2.2956188222592218e-05, "epoch": 2.5375, "percentage": 50.75, "elapsed_time": "3:59:51", "remaining_time": "3:52:45"}
|
610 |
+
{"current_steps": 610, "total_steps": 1200, "loss": 0.4877, "lr": 2.2898637186144935e-05, "epoch": 2.5416666666666665, "percentage": 50.83, "elapsed_time": "4:00:14", "remaining_time": "3:52:21"}
|
611 |
+
{"current_steps": 611, "total_steps": 1200, "loss": 0.4804, "lr": 2.2841061622621052e-05, "epoch": 2.5458333333333334, "percentage": 50.92, "elapsed_time": "4:00:36", "remaining_time": "3:51:56"}
|
612 |
+
{"current_steps": 612, "total_steps": 1200, "loss": 0.4834, "lr": 2.278346201920131e-05, "epoch": 2.55, "percentage": 51.0, "elapsed_time": "4:00:59", "remaining_time": "3:51:32"}
|
613 |
+
{"current_steps": 613, "total_steps": 1200, "loss": 0.4658, "lr": 2.2725838863269894e-05, "epoch": 2.5541666666666667, "percentage": 51.08, "elapsed_time": "4:01:23", "remaining_time": "3:51:08"}
|
614 |
+
{"current_steps": 614, "total_steps": 1200, "loss": 0.4819, "lr": 2.2668192642410257e-05, "epoch": 2.5583333333333336, "percentage": 51.17, "elapsed_time": "4:01:44", "remaining_time": "3:50:43"}
|
615 |
+
{"current_steps": 615, "total_steps": 1200, "loss": 0.4885, "lr": 2.261052384440104e-05, "epoch": 2.5625, "percentage": 51.25, "elapsed_time": "4:02:08", "remaining_time": "3:50:19"}
|
616 |
+
{"current_steps": 616, "total_steps": 1200, "loss": 0.4803, "lr": 2.25528329572119e-05, "epoch": 2.5666666666666664, "percentage": 51.33, "elapsed_time": "4:02:31", "remaining_time": "3:49:55"}
|
617 |
+
{"current_steps": 617, "total_steps": 1200, "loss": 0.4904, "lr": 2.249512046899941e-05, "epoch": 2.5708333333333333, "percentage": 51.42, "elapsed_time": "4:02:53", "remaining_time": "3:49:30"}
|
618 |
+
{"current_steps": 618, "total_steps": 1200, "loss": 0.481, "lr": 2.243738686810295e-05, "epoch": 2.575, "percentage": 51.5, "elapsed_time": "4:03:16", "remaining_time": "3:49:06"}
|
619 |
+
{"current_steps": 619, "total_steps": 1200, "loss": 0.4826, "lr": 2.237963264304051e-05, "epoch": 2.5791666666666666, "percentage": 51.58, "elapsed_time": "4:03:39", "remaining_time": "3:48:41"}
|
620 |
+
{"current_steps": 620, "total_steps": 1200, "loss": 0.4962, "lr": 2.2321858282504606e-05, "epoch": 2.5833333333333335, "percentage": 51.67, "elapsed_time": "4:04:02", "remaining_time": "3:48:17"}
|
621 |
+
{"current_steps": 621, "total_steps": 1200, "loss": 0.4878, "lr": 2.226406427535814e-05, "epoch": 2.5875, "percentage": 51.75, "elapsed_time": "4:04:26", "remaining_time": "3:47:54"}
|
622 |
+
{"current_steps": 622, "total_steps": 1200, "loss": 0.4862, "lr": 2.220625111063024e-05, "epoch": 2.591666666666667, "percentage": 51.83, "elapsed_time": "4:04:49", "remaining_time": "3:47:30"}
|
623 |
+
{"current_steps": 623, "total_steps": 1200, "loss": 0.4743, "lr": 2.214841927751215e-05, "epoch": 2.595833333333333, "percentage": 51.92, "elapsed_time": "4:05:12", "remaining_time": "3:47:06"}
|
624 |
+
{"current_steps": 624, "total_steps": 1200, "loss": 0.4823, "lr": 2.209056926535307e-05, "epoch": 2.6, "percentage": 52.0, "elapsed_time": "4:05:35", "remaining_time": "3:46:41"}
|
625 |
+
{"current_steps": 625, "total_steps": 1200, "loss": 0.4932, "lr": 2.203270156365604e-05, "epoch": 2.6041666666666665, "percentage": 52.08, "elapsed_time": "4:05:58", "remaining_time": "3:46:17"}
|
626 |
+
{"current_steps": 626, "total_steps": 1200, "loss": 0.4956, "lr": 2.1974816662073758e-05, "epoch": 2.6083333333333334, "percentage": 52.17, "elapsed_time": "4:06:21", "remaining_time": "3:45:54"}
|
627 |
+
{"current_steps": 627, "total_steps": 1200, "loss": 0.4814, "lr": 2.1916915050404482e-05, "epoch": 2.6125, "percentage": 52.25, "elapsed_time": "4:06:44", "remaining_time": "3:45:29"}
|
628 |
+
{"current_steps": 628, "total_steps": 1200, "loss": 0.4851, "lr": 2.185899721858785e-05, "epoch": 2.6166666666666667, "percentage": 52.33, "elapsed_time": "4:07:06", "remaining_time": "3:45:04"}
|
629 |
+
{"current_steps": 629, "total_steps": 1200, "loss": 0.4821, "lr": 2.1801063656700747e-05, "epoch": 2.6208333333333336, "percentage": 52.42, "elapsed_time": "4:07:30", "remaining_time": "3:44:41"}
|
630 |
+
{"current_steps": 630, "total_steps": 1200, "loss": 0.4954, "lr": 2.174311485495317e-05, "epoch": 2.625, "percentage": 52.5, "elapsed_time": "4:07:53", "remaining_time": "3:44:16"}
|
631 |
+
{"current_steps": 631, "total_steps": 1200, "loss": 0.4781, "lr": 2.168515130368406e-05, "epoch": 2.6291666666666664, "percentage": 52.58, "elapsed_time": "4:08:15", "remaining_time": "3:43:51"}
|
632 |
+
{"current_steps": 632, "total_steps": 1200, "loss": 0.4803, "lr": 2.1627173493357167e-05, "epoch": 2.6333333333333333, "percentage": 52.67, "elapsed_time": "4:08:38", "remaining_time": "3:43:27"}
|
633 |
+
{"current_steps": 633, "total_steps": 1200, "loss": 0.4826, "lr": 2.1569181914556904e-05, "epoch": 2.6375, "percentage": 52.75, "elapsed_time": "4:09:01", "remaining_time": "3:43:03"}
|
634 |
+
{"current_steps": 634, "total_steps": 1200, "loss": 0.4779, "lr": 2.1511177057984164e-05, "epoch": 2.6416666666666666, "percentage": 52.83, "elapsed_time": "4:09:25", "remaining_time": "3:42:40"}
|
635 |
+
{"current_steps": 635, "total_steps": 1200, "loss": 0.4884, "lr": 2.1453159414452216e-05, "epoch": 2.6458333333333335, "percentage": 52.92, "elapsed_time": "4:09:48", "remaining_time": "3:42:16"}
|
636 |
+
{"current_steps": 636, "total_steps": 1200, "loss": 0.4851, "lr": 2.1395129474882507e-05, "epoch": 2.65, "percentage": 53.0, "elapsed_time": "4:10:11", "remaining_time": "3:41:52"}
|
637 |
+
{"current_steps": 637, "total_steps": 1200, "loss": 0.4781, "lr": 2.133708773030055e-05, "epoch": 2.654166666666667, "percentage": 53.08, "elapsed_time": "4:10:35", "remaining_time": "3:41:28"}
|
638 |
+
{"current_steps": 638, "total_steps": 1200, "loss": 0.4784, "lr": 2.1279034671831714e-05, "epoch": 2.658333333333333, "percentage": 53.17, "elapsed_time": "4:10:58", "remaining_time": "3:41:04"}
|
639 |
+
{"current_steps": 639, "total_steps": 1200, "loss": 0.4917, "lr": 2.1220970790697142e-05, "epoch": 2.6625, "percentage": 53.25, "elapsed_time": "4:11:21", "remaining_time": "3:40:40"}
|
640 |
+
{"current_steps": 640, "total_steps": 1200, "loss": 0.4719, "lr": 2.1162896578209517e-05, "epoch": 2.6666666666666665, "percentage": 53.33, "elapsed_time": "4:11:44", "remaining_time": "3:40:16"}
|
641 |
+
{"current_steps": 641, "total_steps": 1200, "loss": 0.4868, "lr": 2.1104812525768974e-05, "epoch": 2.6708333333333334, "percentage": 53.42, "elapsed_time": "4:12:08", "remaining_time": "3:39:53"}
|
642 |
+
{"current_steps": 642, "total_steps": 1200, "loss": 0.4861, "lr": 2.1046719124858882e-05, "epoch": 2.675, "percentage": 53.5, "elapsed_time": "4:12:31", "remaining_time": "3:39:29"}
|
643 |
+
{"current_steps": 643, "total_steps": 1200, "loss": 0.4894, "lr": 2.0988616867041724e-05, "epoch": 2.6791666666666667, "percentage": 53.58, "elapsed_time": "4:12:55", "remaining_time": "3:39:05"}
|
644 |
+
{"current_steps": 644, "total_steps": 1200, "loss": 0.4804, "lr": 2.093050624395494e-05, "epoch": 2.6833333333333336, "percentage": 53.67, "elapsed_time": "4:13:18", "remaining_time": "3:38:41"}
|
645 |
+
{"current_steps": 645, "total_steps": 1200, "loss": 0.4846, "lr": 2.0872387747306725e-05, "epoch": 2.6875, "percentage": 53.75, "elapsed_time": "4:13:41", "remaining_time": "3:38:17"}
|
646 |
+
{"current_steps": 646, "total_steps": 1200, "loss": 0.4799, "lr": 2.081426186887192e-05, "epoch": 2.6916666666666664, "percentage": 53.83, "elapsed_time": "4:14:04", "remaining_time": "3:37:53"}
|
647 |
+
{"current_steps": 647, "total_steps": 1200, "loss": 0.48, "lr": 2.0756129100487824e-05, "epoch": 2.6958333333333333, "percentage": 53.92, "elapsed_time": "4:14:28", "remaining_time": "3:37:29"}
|
648 |
+
{"current_steps": 648, "total_steps": 1200, "loss": 0.4907, "lr": 2.0697989934050025e-05, "epoch": 2.7, "percentage": 54.0, "elapsed_time": "4:14:52", "remaining_time": "3:37:06"}
|
649 |
+
{"current_steps": 649, "total_steps": 1200, "loss": 0.4734, "lr": 2.063984486150826e-05, "epoch": 2.7041666666666666, "percentage": 54.08, "elapsed_time": "4:15:16", "remaining_time": "3:36:43"}
|
650 |
+
{"current_steps": 650, "total_steps": 1200, "loss": 0.4947, "lr": 2.058169437486223e-05, "epoch": 2.7083333333333335, "percentage": 54.17, "elapsed_time": "4:15:39", "remaining_time": "3:36:19"}
|
651 |
+
{"current_steps": 651, "total_steps": 1200, "loss": 0.4835, "lr": 2.0523538966157467e-05, "epoch": 2.7125, "percentage": 54.25, "elapsed_time": "4:16:02", "remaining_time": "3:35:55"}
|
652 |
+
{"current_steps": 652, "total_steps": 1200, "loss": 0.4772, "lr": 2.0465379127481127e-05, "epoch": 2.716666666666667, "percentage": 54.33, "elapsed_time": "4:16:26", "remaining_time": "3:35:32"}
|
653 |
+
{"current_steps": 653, "total_steps": 1200, "loss": 0.4683, "lr": 2.0407215350957874e-05, "epoch": 2.720833333333333, "percentage": 54.42, "elapsed_time": "4:16:49", "remaining_time": "3:35:08"}
|
654 |
+
{"current_steps": 654, "total_steps": 1200, "loss": 0.4803, "lr": 2.0349048128745673e-05, "epoch": 2.725, "percentage": 54.5, "elapsed_time": "4:17:13", "remaining_time": "3:34:44"}
|
655 |
+
{"current_steps": 655, "total_steps": 1200, "loss": 0.478, "lr": 2.029087795303166e-05, "epoch": 2.7291666666666665, "percentage": 54.58, "elapsed_time": "4:17:34", "remaining_time": "3:34:19"}
|
656 |
+
{"current_steps": 656, "total_steps": 1200, "loss": 0.4652, "lr": 2.0232705316027946e-05, "epoch": 2.7333333333333334, "percentage": 54.67, "elapsed_time": "4:17:59", "remaining_time": "3:33:56"}
|
657 |
+
{"current_steps": 657, "total_steps": 1200, "loss": 0.4826, "lr": 2.017453070996748e-05, "epoch": 2.7375, "percentage": 54.75, "elapsed_time": "4:18:25", "remaining_time": "3:33:34"}
|
658 |
+
{"current_steps": 658, "total_steps": 1200, "loss": 0.477, "lr": 2.011635462709988e-05, "epoch": 2.7416666666666667, "percentage": 54.83, "elapsed_time": "4:18:48", "remaining_time": "3:33:11"}
|
659 |
+
{"current_steps": 659, "total_steps": 1200, "loss": 0.478, "lr": 2.0058177559687243e-05, "epoch": 2.7458333333333336, "percentage": 54.92, "elapsed_time": "4:19:12", "remaining_time": "3:32:47"}
|
660 |
+
{"current_steps": 660, "total_steps": 1200, "loss": 0.4815, "lr": 2e-05, "epoch": 2.75, "percentage": 55.0, "elapsed_time": "4:19:35", "remaining_time": "3:32:23"}
|
661 |
+
{"current_steps": 661, "total_steps": 1200, "loss": 0.481, "lr": 1.9941822440312767e-05, "epoch": 2.7541666666666664, "percentage": 55.08, "elapsed_time": "4:19:59", "remaining_time": "3:32:00"}
|
662 |
+
{"current_steps": 662, "total_steps": 1200, "loss": 0.4768, "lr": 1.9883645372900123e-05, "epoch": 2.7583333333333333, "percentage": 55.17, "elapsed_time": "4:20:22", "remaining_time": "3:31:36"}
|
663 |
+
{"current_steps": 663, "total_steps": 1200, "loss": 0.4805, "lr": 1.9825469290032525e-05, "epoch": 2.7625, "percentage": 55.25, "elapsed_time": "4:20:47", "remaining_time": "3:31:13"}
|
664 |
+
{"current_steps": 664, "total_steps": 1200, "loss": 0.4722, "lr": 1.9767294683972064e-05, "epoch": 2.7666666666666666, "percentage": 55.33, "elapsed_time": "4:21:10", "remaining_time": "3:30:49"}
|
665 |
+
{"current_steps": 665, "total_steps": 1200, "loss": 0.4831, "lr": 1.9709122046968347e-05, "epoch": 2.7708333333333335, "percentage": 55.42, "elapsed_time": "4:21:33", "remaining_time": "3:30:25"}
|
666 |
+
{"current_steps": 666, "total_steps": 1200, "loss": 0.4719, "lr": 1.965095187125433e-05, "epoch": 2.775, "percentage": 55.5, "elapsed_time": "4:21:56", "remaining_time": "3:30:01"}
|
667 |
+
{"current_steps": 667, "total_steps": 1200, "loss": 0.4816, "lr": 1.9592784649042126e-05, "epoch": 2.779166666666667, "percentage": 55.58, "elapsed_time": "4:22:20", "remaining_time": "3:29:37"}
|
668 |
+
{"current_steps": 668, "total_steps": 1200, "loss": 0.4698, "lr": 1.9534620872518877e-05, "epoch": 2.783333333333333, "percentage": 55.67, "elapsed_time": "4:22:43", "remaining_time": "3:29:13"}
|
669 |
+
{"current_steps": 669, "total_steps": 1200, "loss": 0.4726, "lr": 1.9476461033842543e-05, "epoch": 2.7875, "percentage": 55.75, "elapsed_time": "4:23:06", "remaining_time": "3:28:50"}
|
670 |
+
{"current_steps": 670, "total_steps": 1200, "loss": 0.4741, "lr": 1.9418305625137773e-05, "epoch": 2.7916666666666665, "percentage": 55.83, "elapsed_time": "4:23:29", "remaining_time": "3:28:25"}
|
671 |
+
{"current_steps": 671, "total_steps": 1200, "loss": 0.4943, "lr": 1.936015513849175e-05, "epoch": 2.7958333333333334, "percentage": 55.92, "elapsed_time": "4:23:52", "remaining_time": "3:28:02"}
|
672 |
+
{"current_steps": 672, "total_steps": 1200, "loss": 0.473, "lr": 1.930201006594999e-05, "epoch": 2.8, "percentage": 56.0, "elapsed_time": "4:24:16", "remaining_time": "3:27:38"}
|
673 |
+
{"current_steps": 673, "total_steps": 1200, "loss": 0.4751, "lr": 1.9243870899512183e-05, "epoch": 2.8041666666666667, "percentage": 56.08, "elapsed_time": "4:24:39", "remaining_time": "3:27:14"}
|
674 |
+
{"current_steps": 674, "total_steps": 1200, "loss": 0.4835, "lr": 1.9185738131128085e-05, "epoch": 2.8083333333333336, "percentage": 56.17, "elapsed_time": "4:25:02", "remaining_time": "3:26:50"}
|
675 |
+
{"current_steps": 675, "total_steps": 1200, "loss": 0.4795, "lr": 1.9127612252693285e-05, "epoch": 2.8125, "percentage": 56.25, "elapsed_time": "4:25:26", "remaining_time": "3:26:26"}
|
676 |
+
{"current_steps": 676, "total_steps": 1200, "loss": 0.4897, "lr": 1.9069493756045066e-05, "epoch": 2.8166666666666664, "percentage": 56.33, "elapsed_time": "4:25:48", "remaining_time": "3:26:02"}
|
677 |
+
{"current_steps": 677, "total_steps": 1200, "loss": 0.4822, "lr": 1.9011383132958283e-05, "epoch": 2.8208333333333333, "percentage": 56.42, "elapsed_time": "4:26:10", "remaining_time": "3:25:37"}
|
678 |
+
{"current_steps": 678, "total_steps": 1200, "loss": 0.4808, "lr": 1.8953280875141125e-05, "epoch": 2.825, "percentage": 56.5, "elapsed_time": "4:26:33", "remaining_time": "3:25:13"}
|
679 |
+
{"current_steps": 679, "total_steps": 1200, "loss": 0.4628, "lr": 1.8895187474231033e-05, "epoch": 2.8291666666666666, "percentage": 56.58, "elapsed_time": "4:26:55", "remaining_time": "3:24:48"}
|
680 |
+
{"current_steps": 680, "total_steps": 1200, "loss": 0.4849, "lr": 1.8837103421790486e-05, "epoch": 2.8333333333333335, "percentage": 56.67, "elapsed_time": "4:27:19", "remaining_time": "3:24:25"}
|
681 |
+
{"current_steps": 681, "total_steps": 1200, "loss": 0.482, "lr": 1.877902920930286e-05, "epoch": 2.8375, "percentage": 56.75, "elapsed_time": "4:27:42", "remaining_time": "3:24:01"}
|
682 |
+
{"current_steps": 682, "total_steps": 1200, "loss": 0.4791, "lr": 1.872096532816829e-05, "epoch": 2.841666666666667, "percentage": 56.83, "elapsed_time": "4:28:05", "remaining_time": "3:23:37"}
|
683 |
+
{"current_steps": 683, "total_steps": 1200, "loss": 0.4795, "lr": 1.866291226969946e-05, "epoch": 2.845833333333333, "percentage": 56.92, "elapsed_time": "4:28:28", "remaining_time": "3:23:13"}
|
684 |
+
{"current_steps": 684, "total_steps": 1200, "loss": 0.4725, "lr": 1.8604870525117496e-05, "epoch": 2.85, "percentage": 57.0, "elapsed_time": "4:28:50", "remaining_time": "3:22:48"}
|
685 |
+
{"current_steps": 685, "total_steps": 1200, "loss": 0.4892, "lr": 1.854684058554779e-05, "epoch": 2.8541666666666665, "percentage": 57.08, "elapsed_time": "4:29:13", "remaining_time": "3:22:24"}
|
686 |
+
{"current_steps": 686, "total_steps": 1200, "loss": 0.4796, "lr": 1.8488822942015846e-05, "epoch": 2.8583333333333334, "percentage": 57.17, "elapsed_time": "4:29:36", "remaining_time": "3:22:00"}
|
687 |
+
{"current_steps": 687, "total_steps": 1200, "loss": 0.4825, "lr": 1.8430818085443106e-05, "epoch": 2.8625, "percentage": 57.25, "elapsed_time": "4:30:00", "remaining_time": "3:21:37"}
|
688 |
+
{"current_steps": 688, "total_steps": 1200, "loss": 0.4716, "lr": 1.837282650664284e-05, "epoch": 2.8666666666666667, "percentage": 57.33, "elapsed_time": "4:30:24", "remaining_time": "3:21:14"}
|
689 |
+
{"current_steps": 689, "total_steps": 1200, "loss": 0.4727, "lr": 1.8314848696315944e-05, "epoch": 2.8708333333333336, "percentage": 57.42, "elapsed_time": "4:30:47", "remaining_time": "3:20:50"}
|
690 |
+
{"current_steps": 690, "total_steps": 1200, "loss": 0.4749, "lr": 1.8256885145046837e-05, "epoch": 2.875, "percentage": 57.5, "elapsed_time": "4:31:10", "remaining_time": "3:20:26"}
|
691 |
+
{"current_steps": 691, "total_steps": 1200, "loss": 0.4904, "lr": 1.8198936343299263e-05, "epoch": 2.8791666666666664, "percentage": 57.58, "elapsed_time": "4:31:34", "remaining_time": "3:20:02"}
|
692 |
+
{"current_steps": 692, "total_steps": 1200, "loss": 0.4783, "lr": 1.814100278141216e-05, "epoch": 2.8833333333333333, "percentage": 57.67, "elapsed_time": "4:31:58", "remaining_time": "3:19:39"}
|
693 |
+
{"current_steps": 693, "total_steps": 1200, "loss": 0.4787, "lr": 1.808308494959552e-05, "epoch": 2.8875, "percentage": 57.75, "elapsed_time": "4:32:20", "remaining_time": "3:19:14"}
|
694 |
+
{"current_steps": 694, "total_steps": 1200, "loss": 0.4798, "lr": 1.8025183337926246e-05, "epoch": 2.8916666666666666, "percentage": 57.83, "elapsed_time": "4:32:42", "remaining_time": "3:18:49"}
|
695 |
+
{"current_steps": 695, "total_steps": 1200, "loss": 0.476, "lr": 1.7967298436343962e-05, "epoch": 2.8958333333333335, "percentage": 57.92, "elapsed_time": "4:33:05", "remaining_time": "3:18:26"}
|
696 |
+
{"current_steps": 696, "total_steps": 1200, "loss": 0.4811, "lr": 1.7909430734646936e-05, "epoch": 2.9, "percentage": 58.0, "elapsed_time": "4:33:28", "remaining_time": "3:18:02"}
|
697 |
+
{"current_steps": 697, "total_steps": 1200, "loss": 0.4785, "lr": 1.785158072248786e-05, "epoch": 2.904166666666667, "percentage": 58.08, "elapsed_time": "4:33:51", "remaining_time": "3:17:37"}
|
698 |
+
{"current_steps": 698, "total_steps": 1200, "loss": 0.48, "lr": 1.7793748889369765e-05, "epoch": 2.908333333333333, "percentage": 58.17, "elapsed_time": "4:34:12", "remaining_time": "3:17:12"}
|
699 |
+
{"current_steps": 699, "total_steps": 1200, "loss": 0.4748, "lr": 1.773593572464187e-05, "epoch": 2.9125, "percentage": 58.25, "elapsed_time": "4:34:35", "remaining_time": "3:16:48"}
|
700 |
+
{"current_steps": 700, "total_steps": 1200, "loss": 0.4818, "lr": 1.7678141717495394e-05, "epoch": 2.9166666666666665, "percentage": 58.33, "elapsed_time": "4:34:59", "remaining_time": "3:16:25"}
|
701 |
+
{"current_steps": 701, "total_steps": 1200, "loss": 0.4799, "lr": 1.7620367356959496e-05, "epoch": 2.9208333333333334, "percentage": 58.42, "elapsed_time": "4:35:22", "remaining_time": "3:16:01"}
|
702 |
+
{"current_steps": 702, "total_steps": 1200, "loss": 0.4911, "lr": 1.7562613131897056e-05, "epoch": 2.925, "percentage": 58.5, "elapsed_time": "4:35:46", "remaining_time": "3:15:37"}
|
703 |
+
{"current_steps": 703, "total_steps": 1200, "loss": 0.4773, "lr": 1.7504879531000586e-05, "epoch": 2.9291666666666667, "percentage": 58.58, "elapsed_time": "4:36:08", "remaining_time": "3:15:13"}
|
704 |
+
{"current_steps": 704, "total_steps": 1200, "loss": 0.4742, "lr": 1.7447167042788108e-05, "epoch": 2.9333333333333336, "percentage": 58.67, "elapsed_time": "4:36:32", "remaining_time": "3:14:49"}
|
705 |
+
{"current_steps": 705, "total_steps": 1200, "loss": 0.4785, "lr": 1.7389476155598974e-05, "epoch": 2.9375, "percentage": 58.75, "elapsed_time": "4:36:54", "remaining_time": "3:14:25"}
|
706 |
+
{"current_steps": 706, "total_steps": 1200, "loss": 0.484, "lr": 1.7331807357589746e-05, "epoch": 2.9416666666666664, "percentage": 58.83, "elapsed_time": "4:37:17", "remaining_time": "3:14:01"}
|
707 |
+
{"current_steps": 707, "total_steps": 1200, "loss": 0.4859, "lr": 1.7274161136730113e-05, "epoch": 2.9458333333333333, "percentage": 58.92, "elapsed_time": "4:37:40", "remaining_time": "3:13:37"}
|
708 |
+
{"current_steps": 708, "total_steps": 1200, "loss": 0.4841, "lr": 1.72165379807987e-05, "epoch": 2.95, "percentage": 59.0, "elapsed_time": "4:38:03", "remaining_time": "3:13:13"}
|
709 |
+
{"current_steps": 709, "total_steps": 1200, "loss": 0.4693, "lr": 1.715893837737895e-05, "epoch": 2.9541666666666666, "percentage": 59.08, "elapsed_time": "4:38:27", "remaining_time": "3:12:50"}
|
710 |
+
{"current_steps": 710, "total_steps": 1200, "loss": 0.4841, "lr": 1.7101362813855068e-05, "epoch": 2.9583333333333335, "percentage": 59.17, "elapsed_time": "4:38:50", "remaining_time": "3:12:26"}
|
711 |
+
{"current_steps": 711, "total_steps": 1200, "loss": 0.4746, "lr": 1.704381177740779e-05, "epoch": 2.9625, "percentage": 59.25, "elapsed_time": "4:39:14", "remaining_time": "3:12:02"}
|
712 |
+
{"current_steps": 712, "total_steps": 1200, "loss": 0.4927, "lr": 1.698628575501034e-05, "epoch": 2.966666666666667, "percentage": 59.33, "elapsed_time": "4:39:37", "remaining_time": "3:11:39"}
|
713 |
+
{"current_steps": 713, "total_steps": 1200, "loss": 0.49, "lr": 1.692878523342428e-05, "epoch": 2.970833333333333, "percentage": 59.42, "elapsed_time": "4:40:00", "remaining_time": "3:11:15"}
|
714 |
+
{"current_steps": 714, "total_steps": 1200, "loss": 0.4819, "lr": 1.687131069919538e-05, "epoch": 2.975, "percentage": 59.5, "elapsed_time": "4:40:24", "remaining_time": "3:10:51"}
|
715 |
+
{"current_steps": 715, "total_steps": 1200, "loss": 0.4665, "lr": 1.6813862638649552e-05, "epoch": 2.9791666666666665, "percentage": 59.58, "elapsed_time": "4:40:47", "remaining_time": "3:10:28"}
|
716 |
+
{"current_steps": 716, "total_steps": 1200, "loss": 0.4891, "lr": 1.6756441537888656e-05, "epoch": 2.9833333333333334, "percentage": 59.67, "elapsed_time": "4:41:10", "remaining_time": "3:10:04"}
|
717 |
+
{"current_steps": 717, "total_steps": 1200, "loss": 0.4724, "lr": 1.6699047882786448e-05, "epoch": 2.9875, "percentage": 59.75, "elapsed_time": "4:41:33", "remaining_time": "3:09:40"}
|
718 |
+
{"current_steps": 718, "total_steps": 1200, "loss": 0.4761, "lr": 1.664168215898446e-05, "epoch": 2.9916666666666667, "percentage": 59.83, "elapsed_time": "4:41:56", "remaining_time": "3:09:16"}
|
719 |
+
{"current_steps": 719, "total_steps": 1200, "loss": 0.4938, "lr": 1.658434485188787e-05, "epoch": 2.9958333333333336, "percentage": 59.92, "elapsed_time": "4:42:19", "remaining_time": "3:08:52"}
|
720 |
+
{"current_steps": 720, "total_steps": 1200, "loss": 0.4882, "lr": 1.6527036446661396e-05, "epoch": 3.0, "percentage": 60.0, "elapsed_time": "4:42:42", "remaining_time": "3:08:28"}
|
721 |
+
{"current_steps": 721, "total_steps": 1200, "loss": 0.442, "lr": 1.6469757428225223e-05, "epoch": 3.004166666666667, "percentage": 60.08, "elapsed_time": "4:45:48", "remaining_time": "3:09:52"}
|
722 |
+
{"current_steps": 722, "total_steps": 1200, "loss": 0.4253, "lr": 1.641250828125085e-05, "epoch": 3.0083333333333333, "percentage": 60.17, "elapsed_time": "4:46:11", "remaining_time": "3:09:28"}
|
723 |
+
{"current_steps": 723, "total_steps": 1200, "loss": 0.4277, "lr": 1.635528949015705e-05, "epoch": 3.0125, "percentage": 60.25, "elapsed_time": "4:46:33", "remaining_time": "3:09:03"}
|
724 |
+
{"current_steps": 724, "total_steps": 1200, "loss": 0.43, "lr": 1.6298101539105712e-05, "epoch": 3.0166666666666666, "percentage": 60.33, "elapsed_time": "4:46:56", "remaining_time": "3:08:39"}
|
725 |
+
{"current_steps": 725, "total_steps": 1200, "loss": 0.4256, "lr": 1.6240944911997765e-05, "epoch": 3.0208333333333335, "percentage": 60.42, "elapsed_time": "4:47:20", "remaining_time": "3:08:15"}
|
726 |
+
{"current_steps": 726, "total_steps": 1200, "loss": 0.4304, "lr": 1.6183820092469103e-05, "epoch": 3.025, "percentage": 60.5, "elapsed_time": "4:47:42", "remaining_time": "3:07:50"}
|
727 |
+
{"current_steps": 727, "total_steps": 1200, "loss": 0.437, "lr": 1.6126727563886485e-05, "epoch": 3.029166666666667, "percentage": 60.58, "elapsed_time": "4:48:05", "remaining_time": "3:07:26"}
|