d1_code_python_0.3k / trainer_log.jsonl
ryanmarten's picture
Training in progress, epoch 3
09c87f9 verified
raw
history blame
8.02 kB
{"current_steps": 1, "total_steps": 117, "loss": 1.0254, "lr": 8.333333333333333e-07, "epoch": 0.10126582278481013, "percentage": 0.85, "elapsed_time": "0:00:38", "remaining_time": "1:14:07"}
{"current_steps": 2, "total_steps": 117, "loss": 1.0615, "lr": 1.6666666666666667e-06, "epoch": 0.20253164556962025, "percentage": 1.71, "elapsed_time": "0:01:21", "remaining_time": "1:17:49"}
{"current_steps": 3, "total_steps": 117, "loss": 1.0233, "lr": 2.5e-06, "epoch": 0.3037974683544304, "percentage": 2.56, "elapsed_time": "0:02:04", "remaining_time": "1:18:52"}
{"current_steps": 4, "total_steps": 117, "loss": 1.0127, "lr": 3.3333333333333333e-06, "epoch": 0.4050632911392405, "percentage": 3.42, "elapsed_time": "0:02:46", "remaining_time": "1:18:36"}
{"current_steps": 5, "total_steps": 117, "loss": 1.0077, "lr": 4.166666666666667e-06, "epoch": 0.5063291139240507, "percentage": 4.27, "elapsed_time": "0:03:30", "remaining_time": "1:18:25"}
{"current_steps": 6, "total_steps": 117, "loss": 0.9553, "lr": 5e-06, "epoch": 0.6075949367088608, "percentage": 5.13, "elapsed_time": "0:04:09", "remaining_time": "1:16:52"}
{"current_steps": 7, "total_steps": 117, "loss": 0.9506, "lr": 5.833333333333334e-06, "epoch": 0.7088607594936709, "percentage": 5.98, "elapsed_time": "0:04:53", "remaining_time": "1:16:55"}
{"current_steps": 8, "total_steps": 117, "loss": 0.9288, "lr": 6.666666666666667e-06, "epoch": 0.810126582278481, "percentage": 6.84, "elapsed_time": "0:05:30", "remaining_time": "1:15:01"}
{"current_steps": 9, "total_steps": 117, "loss": 0.9344, "lr": 7.500000000000001e-06, "epoch": 0.9113924050632911, "percentage": 7.69, "elapsed_time": "0:06:16", "remaining_time": "1:15:23"}
{"current_steps": 10, "total_steps": 117, "loss": 0.9483, "lr": 8.333333333333334e-06, "epoch": 1.0506329113924051, "percentage": 8.55, "elapsed_time": "0:07:41", "remaining_time": "1:22:15"}
{"current_steps": 11, "total_steps": 117, "loss": 0.8686, "lr": 9.166666666666666e-06, "epoch": 1.1518987341772151, "percentage": 9.4, "elapsed_time": "0:08:19", "remaining_time": "1:20:13"}
{"current_steps": 12, "total_steps": 117, "loss": 0.8883, "lr": 1e-05, "epoch": 1.2531645569620253, "percentage": 10.26, "elapsed_time": "0:08:52", "remaining_time": "1:17:42"}
{"current_steps": 13, "total_steps": 117, "loss": 0.8377, "lr": 9.997762161417517e-06, "epoch": 1.3544303797468356, "percentage": 11.11, "elapsed_time": "0:09:32", "remaining_time": "1:16:16"}
{"current_steps": 14, "total_steps": 117, "loss": 0.8419, "lr": 9.991050648838676e-06, "epoch": 1.4556962025316456, "percentage": 11.97, "elapsed_time": "0:10:09", "remaining_time": "1:14:43"}
{"current_steps": 15, "total_steps": 117, "loss": 0.7982, "lr": 9.979871469976197e-06, "epoch": 1.5569620253164556, "percentage": 12.82, "elapsed_time": "0:10:52", "remaining_time": "1:13:59"}
{"current_steps": 16, "total_steps": 117, "loss": 0.7941, "lr": 9.964234631709188e-06, "epoch": 1.6582278481012658, "percentage": 13.68, "elapsed_time": "0:11:38", "remaining_time": "1:13:27"}
{"current_steps": 17, "total_steps": 117, "loss": 0.8057, "lr": 9.944154131125643e-06, "epoch": 1.759493670886076, "percentage": 14.53, "elapsed_time": "0:12:23", "remaining_time": "1:12:51"}
{"current_steps": 18, "total_steps": 117, "loss": 0.7861, "lr": 9.91964794299315e-06, "epoch": 1.8607594936708862, "percentage": 15.38, "elapsed_time": "0:13:02", "remaining_time": "1:11:46"}
{"current_steps": 19, "total_steps": 117, "loss": 0.7739, "lr": 9.890738003669029e-06, "epoch": 1.9620253164556962, "percentage": 16.24, "elapsed_time": "0:13:44", "remaining_time": "1:10:51"}
{"current_steps": 20, "total_steps": 117, "loss": 0.7816, "lr": 9.857450191464337e-06, "epoch": 2.1012658227848102, "percentage": 17.09, "elapsed_time": "0:15:19", "remaining_time": "1:14:18"}
{"current_steps": 21, "total_steps": 117, "loss": 0.7302, "lr": 9.819814303479268e-06, "epoch": 2.2025316455696204, "percentage": 17.95, "elapsed_time": "0:15:58", "remaining_time": "1:13:00"}
{"current_steps": 22, "total_steps": 117, "loss": 0.725, "lr": 9.777864028930705e-06, "epoch": 2.3037974683544302, "percentage": 18.8, "elapsed_time": "0:16:42", "remaining_time": "1:12:08"}
{"current_steps": 23, "total_steps": 117, "loss": 0.7069, "lr": 9.731636918995821e-06, "epoch": 2.4050632911392404, "percentage": 19.66, "elapsed_time": "0:17:24", "remaining_time": "1:11:09"}
{"current_steps": 24, "total_steps": 117, "loss": 0.7035, "lr": 9.681174353198687e-06, "epoch": 2.5063291139240507, "percentage": 20.51, "elapsed_time": "0:18:03", "remaining_time": "1:10:00"}
{"current_steps": 25, "total_steps": 117, "loss": 0.7033, "lr": 9.626521502369984e-06, "epoch": 2.607594936708861, "percentage": 21.37, "elapsed_time": "0:18:42", "remaining_time": "1:08:52"}
{"current_steps": 26, "total_steps": 117, "loss": 0.6926, "lr": 9.567727288213005e-06, "epoch": 2.708860759493671, "percentage": 22.22, "elapsed_time": "0:19:24", "remaining_time": "1:07:54"}
{"current_steps": 27, "total_steps": 117, "loss": 0.6847, "lr": 9.504844339512096e-06, "epoch": 2.810126582278481, "percentage": 23.08, "elapsed_time": "0:20:09", "remaining_time": "1:07:12"}
{"current_steps": 28, "total_steps": 117, "loss": 0.6755, "lr": 9.437928945022772e-06, "epoch": 2.911392405063291, "percentage": 23.93, "elapsed_time": "0:20:46", "remaining_time": "1:06:03"}
{"current_steps": 29, "total_steps": 117, "loss": 0.651, "lr": 9.36704100308565e-06, "epoch": 3.050632911392405, "percentage": 24.79, "elapsed_time": "0:22:16", "remaining_time": "1:07:35"}
{"current_steps": 30, "total_steps": 117, "loss": 0.6295, "lr": 9.292243968009332e-06, "epoch": 3.151898734177215, "percentage": 25.64, "elapsed_time": "0:22:58", "remaining_time": "1:06:37"}
{"current_steps": 31, "total_steps": 117, "loss": 0.6384, "lr": 9.213604793270196e-06, "epoch": 3.2531645569620253, "percentage": 26.5, "elapsed_time": "0:23:41", "remaining_time": "1:05:44"}
{"current_steps": 32, "total_steps": 117, "loss": 0.6182, "lr": 9.131193871579975e-06, "epoch": 3.3544303797468356, "percentage": 27.35, "elapsed_time": "0:24:23", "remaining_time": "1:04:47"}
{"current_steps": 33, "total_steps": 117, "loss": 0.6218, "lr": 9.045084971874738e-06, "epoch": 3.4556962025316453, "percentage": 28.21, "elapsed_time": "0:25:05", "remaining_time": "1:03:53"}
{"current_steps": 34, "total_steps": 117, "loss": 0.6392, "lr": 8.955355173281709e-06, "epoch": 3.5569620253164556, "percentage": 29.06, "elapsed_time": "0:25:49", "remaining_time": "1:03:02"}
{"current_steps": 35, "total_steps": 117, "loss": 0.6261, "lr": 8.862084796122998e-06, "epoch": 3.6582278481012658, "percentage": 29.91, "elapsed_time": "0:26:31", "remaining_time": "1:02:08"}
{"current_steps": 36, "total_steps": 117, "loss": 0.6191, "lr": 8.765357330018056e-06, "epoch": 3.759493670886076, "percentage": 30.77, "elapsed_time": "0:27:09", "remaining_time": "1:01:06"}
{"current_steps": 37, "total_steps": 117, "loss": 0.6017, "lr": 8.665259359149132e-06, "epoch": 3.8607594936708862, "percentage": 31.62, "elapsed_time": "0:27:54", "remaining_time": "1:00:21"}
{"current_steps": 38, "total_steps": 117, "loss": 0.5768, "lr": 8.561880484756726e-06, "epoch": 3.962025316455696, "percentage": 32.48, "elapsed_time": "0:28:32", "remaining_time": "0:59:19"}
{"current_steps": 39, "total_steps": 117, "loss": 0.5861, "lr": 8.455313244934324e-06, "epoch": 4.10126582278481, "percentage": 33.33, "elapsed_time": "0:30:10", "remaining_time": "1:00:21"}
{"current_steps": 40, "total_steps": 117, "loss": 0.5407, "lr": 8.345653031794292e-06, "epoch": 4.2025316455696204, "percentage": 34.19, "elapsed_time": "0:30:49", "remaining_time": "0:59:20"}
{"current_steps": 41, "total_steps": 117, "loss": 0.5468, "lr": 8.232998006078998e-06, "epoch": 4.30379746835443, "percentage": 35.04, "elapsed_time": "0:31:31", "remaining_time": "0:58:26"}
{"current_steps": 42, "total_steps": 117, "loss": 0.5338, "lr": 8.117449009293668e-06, "epoch": 4.405063291139241, "percentage": 35.9, "elapsed_time": "0:32:14", "remaining_time": "0:57:34"}