Training in progress, epoch 2
Browse files
model-00001-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4877660776
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cafee2ebcb91ecd189b88b75865eb1a49ca38405f2983f12c6e4951bdb234d41
|
3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4932751008
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e9c3eada553cf7ac15c8c2c700d9a10314412c6914c000c2500aac9b15bf93c0
|
3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4330865200
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8e3644248b6be5029c8f0e4a1ef9684697170c8078ea81dc8dd8113ae99bae4a
|
3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1089994880
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8ff5425278bac4180f9c5c19eb48a4d9565faac3f923475b0ea6241897253baf
|
3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
@@ -219,3 +219,114 @@
|
|
219 |
{"current_steps": 219, "total_steps": 550, "loss": 0.3918, "lr": 6.021945019389719e-05, "epoch": 1.9841628959276019, "percentage": 39.82, "elapsed_time": "5:56:39", "remaining_time": "8:59:03"}
|
220 |
{"current_steps": 220, "total_steps": 550, "loss": 0.385, "lr": 6.000000000000001e-05, "epoch": 1.993212669683258, "percentage": 40.0, "elapsed_time": "5:58:16", "remaining_time": "8:57:24"}
|
221 |
{"current_steps": 221, "total_steps": 550, "loss": 0.6705, "lr": 5.977974420901908e-05, "epoch": 2.004524886877828, "percentage": 40.18, "elapsed_time": "6:01:27", "remaining_time": "8:58:05"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
219 |
{"current_steps": 219, "total_steps": 550, "loss": 0.3918, "lr": 6.021945019389719e-05, "epoch": 1.9841628959276019, "percentage": 39.82, "elapsed_time": "5:56:39", "remaining_time": "8:59:03"}
|
220 |
{"current_steps": 220, "total_steps": 550, "loss": 0.385, "lr": 6.000000000000001e-05, "epoch": 1.993212669683258, "percentage": 40.0, "elapsed_time": "5:58:16", "remaining_time": "8:57:24"}
|
221 |
{"current_steps": 221, "total_steps": 550, "loss": 0.6705, "lr": 5.977974420901908e-05, "epoch": 2.004524886877828, "percentage": 40.18, "elapsed_time": "6:01:27", "remaining_time": "8:58:05"}
|
222 |
+
{"current_steps": 222, "total_steps": 550, "loss": 0.364, "lr": 5.955869169282556e-05, "epoch": 2.013574660633484, "percentage": 40.36, "elapsed_time": "6:03:03", "remaining_time": "8:56:25"}
|
223 |
+
{"current_steps": 223, "total_steps": 550, "loss": 0.3695, "lr": 5.9336851355382557e-05, "epoch": 2.02262443438914, "percentage": 40.55, "elapsed_time": "6:04:41", "remaining_time": "8:54:46"}
|
224 |
+
{"current_steps": 224, "total_steps": 550, "loss": 0.3643, "lr": 5.911423213238653e-05, "epoch": 2.0316742081447963, "percentage": 40.73, "elapsed_time": "6:06:18", "remaining_time": "8:53:06"}
|
225 |
+
{"current_steps": 225, "total_steps": 550, "loss": 0.3601, "lr": 5.889084299090732e-05, "epoch": 2.0407239819004523, "percentage": 40.91, "elapsed_time": "6:07:55", "remaining_time": "8:51:27"}
|
226 |
+
{"current_steps": 226, "total_steps": 550, "loss": 0.3645, "lr": 5.866669292902695e-05, "epoch": 2.0497737556561084, "percentage": 41.09, "elapsed_time": "6:09:32", "remaining_time": "8:49:47"}
|
227 |
+
{"current_steps": 227, "total_steps": 550, "loss": 0.363, "lr": 5.844179097547725e-05, "epoch": 2.0588235294117645, "percentage": 41.27, "elapsed_time": "6:11:09", "remaining_time": "8:48:07"}
|
228 |
+
{"current_steps": 228, "total_steps": 550, "loss": 0.3593, "lr": 5.821614618927613e-05, "epoch": 2.067873303167421, "percentage": 41.45, "elapsed_time": "6:12:46", "remaining_time": "8:46:28"}
|
229 |
+
{"current_steps": 229, "total_steps": 550, "loss": 0.3647, "lr": 5.798976765936264e-05, "epoch": 2.076923076923077, "percentage": 41.64, "elapsed_time": "6:14:23", "remaining_time": "8:44:48"}
|
230 |
+
{"current_steps": 230, "total_steps": 550, "loss": 0.3587, "lr": 5.776266450423097e-05, "epoch": 2.085972850678733, "percentage": 41.82, "elapsed_time": "6:16:01", "remaining_time": "8:43:09"}
|
231 |
+
{"current_steps": 231, "total_steps": 550, "loss": 0.3627, "lr": 5.75348458715631e-05, "epoch": 2.0950226244343892, "percentage": 42.0, "elapsed_time": "6:17:38", "remaining_time": "8:41:29"}
|
232 |
+
{"current_steps": 232, "total_steps": 550, "loss": 0.3541, "lr": 5.7306320937860336e-05, "epoch": 2.1040723981900453, "percentage": 42.18, "elapsed_time": "6:19:15", "remaining_time": "8:39:50"}
|
233 |
+
{"current_steps": 233, "total_steps": 550, "loss": 0.3651, "lr": 5.7077098908073676e-05, "epoch": 2.1131221719457014, "percentage": 42.36, "elapsed_time": "6:20:52", "remaining_time": "8:38:11"}
|
234 |
+
{"current_steps": 234, "total_steps": 550, "loss": 0.3556, "lr": 5.684718901523307e-05, "epoch": 2.1221719457013575, "percentage": 42.55, "elapsed_time": "6:22:30", "remaining_time": "8:36:32"}
|
235 |
+
{"current_steps": 235, "total_steps": 550, "loss": 0.3596, "lr": 5.661660052007547e-05, "epoch": 2.1312217194570136, "percentage": 42.73, "elapsed_time": "6:24:07", "remaining_time": "8:34:53"}
|
236 |
+
{"current_steps": 236, "total_steps": 550, "loss": 0.3549, "lr": 5.6385342710671815e-05, "epoch": 2.1402714932126696, "percentage": 42.91, "elapsed_time": "6:25:44", "remaining_time": "8:33:13"}
|
237 |
+
{"current_steps": 237, "total_steps": 550, "loss": 0.3576, "lr": 5.6153424902053e-05, "epoch": 2.1493212669683257, "percentage": 43.09, "elapsed_time": "6:27:20", "remaining_time": "8:31:33"}
|
238 |
+
{"current_steps": 238, "total_steps": 550, "loss": 0.3577, "lr": 5.59208564358345e-05, "epoch": 2.158371040723982, "percentage": 43.27, "elapsed_time": "6:28:57", "remaining_time": "8:29:54"}
|
239 |
+
{"current_steps": 239, "total_steps": 550, "loss": 0.3656, "lr": 5.568764667984022e-05, "epoch": 2.167420814479638, "percentage": 43.45, "elapsed_time": "6:30:34", "remaining_time": "8:28:14"}
|
240 |
+
{"current_steps": 240, "total_steps": 550, "loss": 0.3534, "lr": 5.5453805027725145e-05, "epoch": 2.176470588235294, "percentage": 43.64, "elapsed_time": "6:32:11", "remaining_time": "8:26:35"}
|
241 |
+
{"current_steps": 241, "total_steps": 550, "loss": 0.3534, "lr": 5.521934089859692e-05, "epoch": 2.1855203619909505, "percentage": 43.82, "elapsed_time": "6:33:48", "remaining_time": "8:24:55"}
|
242 |
+
{"current_steps": 242, "total_steps": 550, "loss": 0.3579, "lr": 5.4984263736636494e-05, "epoch": 2.1945701357466065, "percentage": 44.0, "elapsed_time": "6:35:25", "remaining_time": "8:23:16"}
|
243 |
+
{"current_steps": 243, "total_steps": 550, "loss": 0.359, "lr": 5.4748583010717636e-05, "epoch": 2.2036199095022626, "percentage": 44.18, "elapsed_time": "6:37:02", "remaining_time": "8:21:36"}
|
244 |
+
{"current_steps": 244, "total_steps": 550, "loss": 0.3627, "lr": 5.451230821402564e-05, "epoch": 2.2126696832579187, "percentage": 44.36, "elapsed_time": "6:38:39", "remaining_time": "8:19:57"}
|
245 |
+
{"current_steps": 245, "total_steps": 550, "loss": 0.3558, "lr": 5.427544886367488e-05, "epoch": 2.2217194570135748, "percentage": 44.55, "elapsed_time": "6:40:16", "remaining_time": "8:18:18"}
|
246 |
+
{"current_steps": 246, "total_steps": 550, "loss": 0.3577, "lr": 5.403801450032544e-05, "epoch": 2.230769230769231, "percentage": 44.73, "elapsed_time": "6:41:54", "remaining_time": "8:16:39"}
|
247 |
+
{"current_steps": 247, "total_steps": 550, "loss": 0.3627, "lr": 5.380001468779883e-05, "epoch": 2.239819004524887, "percentage": 44.91, "elapsed_time": "6:43:31", "remaining_time": "8:15:00"}
|
248 |
+
{"current_steps": 248, "total_steps": 550, "loss": 0.3583, "lr": 5.356145901269282e-05, "epoch": 2.248868778280543, "percentage": 45.09, "elapsed_time": "6:45:08", "remaining_time": "8:13:21"}
|
249 |
+
{"current_steps": 249, "total_steps": 550, "loss": 0.3612, "lr": 5.3322357083995235e-05, "epoch": 2.257918552036199, "percentage": 45.27, "elapsed_time": "6:46:45", "remaining_time": "8:11:42"}
|
250 |
+
{"current_steps": 250, "total_steps": 550, "loss": 0.354, "lr": 5.3082718532696874e-05, "epoch": 2.266968325791855, "percentage": 45.45, "elapsed_time": "6:48:23", "remaining_time": "8:10:03"}
|
251 |
+
{"current_steps": 251, "total_steps": 550, "loss": 0.3528, "lr": 5.284255301140364e-05, "epoch": 2.276018099547511, "percentage": 45.64, "elapsed_time": "6:50:00", "remaining_time": "8:08:24"}
|
252 |
+
{"current_steps": 252, "total_steps": 550, "loss": 0.3504, "lr": 5.2601870193947716e-05, "epoch": 2.2850678733031673, "percentage": 45.82, "elapsed_time": "6:51:37", "remaining_time": "8:06:46"}
|
253 |
+
{"current_steps": 253, "total_steps": 550, "loss": 0.3527, "lr": 5.23606797749979e-05, "epoch": 2.2941176470588234, "percentage": 46.0, "elapsed_time": "6:53:14", "remaining_time": "8:05:07"}
|
254 |
+
{"current_steps": 254, "total_steps": 550, "loss": 0.3545, "lr": 5.21189914696691e-05, "epoch": 2.3031674208144794, "percentage": 46.18, "elapsed_time": "6:54:52", "remaining_time": "8:03:28"}
|
255 |
+
{"current_steps": 255, "total_steps": 550, "loss": 0.3525, "lr": 5.1876815013131e-05, "epoch": 2.3122171945701355, "percentage": 46.36, "elapsed_time": "6:56:29", "remaining_time": "8:01:49"}
|
256 |
+
{"current_steps": 256, "total_steps": 550, "loss": 0.3561, "lr": 5.163416016021597e-05, "epoch": 2.321266968325792, "percentage": 46.55, "elapsed_time": "6:58:06", "remaining_time": "8:00:10"}
|
257 |
+
{"current_steps": 257, "total_steps": 550, "loss": 0.3515, "lr": 5.1391036685026093e-05, "epoch": 2.330316742081448, "percentage": 46.73, "elapsed_time": "6:59:44", "remaining_time": "7:58:31"}
|
258 |
+
{"current_steps": 258, "total_steps": 550, "loss": 0.3513, "lr": 5.114745438053952e-05, "epoch": 2.339366515837104, "percentage": 46.91, "elapsed_time": "7:01:21", "remaining_time": "7:56:52"}
|
259 |
+
{"current_steps": 259, "total_steps": 550, "loss": 0.3557, "lr": 5.0903423058215925e-05, "epoch": 2.3484162895927603, "percentage": 47.09, "elapsed_time": "7:02:58", "remaining_time": "7:55:13"}
|
260 |
+
{"current_steps": 260, "total_steps": 550, "loss": 0.3503, "lr": 5.06589525476014e-05, "epoch": 2.3574660633484164, "percentage": 47.27, "elapsed_time": "7:04:35", "remaining_time": "7:53:34"}
|
261 |
+
{"current_steps": 261, "total_steps": 550, "loss": 0.3568, "lr": 5.0414052695932486e-05, "epoch": 2.3665158371040724, "percentage": 47.45, "elapsed_time": "7:06:12", "remaining_time": "7:51:55"}
|
262 |
+
{"current_steps": 262, "total_steps": 550, "loss": 0.3537, "lr": 5.016873336773949e-05, "epoch": 2.3755656108597285, "percentage": 47.64, "elapsed_time": "7:07:50", "remaining_time": "7:50:17"}
|
263 |
+
{"current_steps": 263, "total_steps": 550, "loss": 0.3587, "lr": 4.992300444444916e-05, "epoch": 2.3846153846153846, "percentage": 47.82, "elapsed_time": "7:09:27", "remaining_time": "7:48:39"}
|
264 |
+
{"current_steps": 264, "total_steps": 550, "loss": 0.3544, "lr": 4.967687582398671e-05, "epoch": 2.3936651583710407, "percentage": 48.0, "elapsed_time": "7:11:05", "remaining_time": "7:47:00"}
|
265 |
+
{"current_steps": 265, "total_steps": 550, "loss": 0.3553, "lr": 4.94303574203771e-05, "epoch": 2.4027149321266967, "percentage": 48.18, "elapsed_time": "7:12:42", "remaining_time": "7:45:21"}
|
266 |
+
{"current_steps": 266, "total_steps": 550, "loss": 0.3516, "lr": 4.9183459163345644e-05, "epoch": 2.411764705882353, "percentage": 48.36, "elapsed_time": "7:14:19", "remaining_time": "7:43:42"}
|
267 |
+
{"current_steps": 267, "total_steps": 550, "loss": 0.3539, "lr": 4.893619099791817e-05, "epoch": 2.420814479638009, "percentage": 48.55, "elapsed_time": "7:15:56", "remaining_time": "7:42:03"}
|
268 |
+
{"current_steps": 268, "total_steps": 550, "loss": 0.3588, "lr": 4.868856288402032e-05, "epoch": 2.4298642533936654, "percentage": 48.73, "elapsed_time": "7:17:33", "remaining_time": "7:40:24"}
|
269 |
+
{"current_steps": 269, "total_steps": 550, "loss": 0.3543, "lr": 4.8440584796076395e-05, "epoch": 2.4389140271493215, "percentage": 48.91, "elapsed_time": "7:19:10", "remaining_time": "7:38:46"}
|
270 |
+
{"current_steps": 270, "total_steps": 550, "loss": 0.3601, "lr": 4.819226672260763e-05, "epoch": 2.4479638009049776, "percentage": 49.09, "elapsed_time": "7:20:48", "remaining_time": "7:37:07"}
|
271 |
+
{"current_steps": 271, "total_steps": 550, "loss": 0.3587, "lr": 4.794361866582982e-05, "epoch": 2.4570135746606336, "percentage": 49.27, "elapsed_time": "7:22:25", "remaining_time": "7:35:28"}
|
272 |
+
{"current_steps": 272, "total_steps": 550, "loss": 0.3558, "lr": 4.7694650641250446e-05, "epoch": 2.4660633484162897, "percentage": 49.45, "elapsed_time": "7:24:02", "remaining_time": "7:33:50"}
|
273 |
+
{"current_steps": 273, "total_steps": 550, "loss": 0.3535, "lr": 4.7445372677265205e-05, "epoch": 2.475113122171946, "percentage": 49.64, "elapsed_time": "7:25:39", "remaining_time": "7:32:11"}
|
274 |
+
{"current_steps": 274, "total_steps": 550, "loss": 0.3584, "lr": 4.719579481475416e-05, "epoch": 2.484162895927602, "percentage": 49.82, "elapsed_time": "7:27:16", "remaining_time": "7:30:32"}
|
275 |
+
{"current_steps": 275, "total_steps": 550, "loss": 0.3555, "lr": 4.694592710667723e-05, "epoch": 2.493212669683258, "percentage": 50.0, "elapsed_time": "7:28:53", "remaining_time": "7:28:53"}
|
276 |
+
{"current_steps": 276, "total_steps": 550, "loss": 0.3563, "lr": 4.6695779617669236e-05, "epoch": 2.502262443438914, "percentage": 50.18, "elapsed_time": "7:30:30", "remaining_time": "7:27:14"}
|
277 |
+
{"current_steps": 277, "total_steps": 550, "loss": 0.359, "lr": 4.6445362423634574e-05, "epoch": 2.51131221719457, "percentage": 50.36, "elapsed_time": "7:32:07", "remaining_time": "7:25:36"}
|
278 |
+
{"current_steps": 278, "total_steps": 550, "loss": 0.3524, "lr": 4.61946856113413e-05, "epoch": 2.520361990950226, "percentage": 50.55, "elapsed_time": "7:33:44", "remaining_time": "7:23:57"}
|
279 |
+
{"current_steps": 279, "total_steps": 550, "loss": 0.3517, "lr": 4.594375927801487e-05, "epoch": 2.5294117647058822, "percentage": 50.73, "elapsed_time": "7:35:21", "remaining_time": "7:22:18"}
|
280 |
+
{"current_steps": 280, "total_steps": 550, "loss": 0.3599, "lr": 4.5692593530931416e-05, "epoch": 2.5384615384615383, "percentage": 50.91, "elapsed_time": "7:36:58", "remaining_time": "7:20:39"}
|
281 |
+
{"current_steps": 281, "total_steps": 550, "loss": 0.3557, "lr": 4.5441198487010574e-05, "epoch": 2.5475113122171944, "percentage": 51.09, "elapsed_time": "7:38:35", "remaining_time": "7:19:00"}
|
282 |
+
{"current_steps": 282, "total_steps": 550, "loss": 0.351, "lr": 4.5189584272408074e-05, "epoch": 2.5565610859728505, "percentage": 51.27, "elapsed_time": "7:40:12", "remaining_time": "7:17:21"}
|
283 |
+
{"current_steps": 283, "total_steps": 550, "loss": 0.3559, "lr": 4.493776102210779e-05, "epoch": 2.5656108597285066, "percentage": 51.45, "elapsed_time": "7:41:49", "remaining_time": "7:15:42"}
|
284 |
+
{"current_steps": 284, "total_steps": 550, "loss": 0.3565, "lr": 4.468573887951354e-05, "epoch": 2.5746606334841626, "percentage": 51.64, "elapsed_time": "7:43:26", "remaining_time": "7:14:03"}
|
285 |
+
{"current_steps": 285, "total_steps": 550, "loss": 0.3532, "lr": 4.4433527996040443e-05, "epoch": 2.583710407239819, "percentage": 51.82, "elapsed_time": "7:45:03", "remaining_time": "7:12:25"}
|
286 |
+
{"current_steps": 286, "total_steps": 550, "loss": 0.3559, "lr": 4.418113853070614e-05, "epoch": 2.5927601809954752, "percentage": 52.0, "elapsed_time": "7:46:40", "remaining_time": "7:10:46"}
|
287 |
+
{"current_steps": 287, "total_steps": 550, "loss": 0.3595, "lr": 4.392858064972149e-05, "epoch": 2.6018099547511313, "percentage": 52.18, "elapsed_time": "7:48:17", "remaining_time": "7:09:07"}
|
288 |
+
{"current_steps": 288, "total_steps": 550, "loss": 0.354, "lr": 4.3675864526081106e-05, "epoch": 2.6108597285067874, "percentage": 52.36, "elapsed_time": "7:49:54", "remaining_time": "7:07:28"}
|
289 |
+
{"current_steps": 289, "total_steps": 550, "loss": 0.3517, "lr": 4.34230003391536e-05, "epoch": 2.6199095022624435, "percentage": 52.55, "elapsed_time": "7:51:31", "remaining_time": "7:05:50"}
|
290 |
+
{"current_steps": 290, "total_steps": 550, "loss": 0.3532, "lr": 4.316999827427154e-05, "epoch": 2.6289592760180995, "percentage": 52.73, "elapsed_time": "7:53:08", "remaining_time": "7:04:11"}
|
291 |
+
{"current_steps": 291, "total_steps": 550, "loss": 0.3576, "lr": 4.2916868522321235e-05, "epoch": 2.6380090497737556, "percentage": 52.91, "elapsed_time": "7:54:45", "remaining_time": "7:02:32"}
|
292 |
+
{"current_steps": 292, "total_steps": 550, "loss": 0.3591, "lr": 4.266362127933216e-05, "epoch": 2.6470588235294117, "percentage": 53.09, "elapsed_time": "7:56:22", "remaining_time": "7:00:54"}
|
293 |
+
{"current_steps": 293, "total_steps": 550, "loss": 0.3528, "lr": 4.2410266746066345e-05, "epoch": 2.6561085972850678, "percentage": 53.27, "elapsed_time": "7:57:59", "remaining_time": "6:59:15"}
|
294 |
+
{"current_steps": 294, "total_steps": 550, "loss": 0.359, "lr": 4.215681512760744e-05, "epoch": 2.665158371040724, "percentage": 53.45, "elapsed_time": "7:59:36", "remaining_time": "6:57:36"}
|
295 |
+
{"current_steps": 295, "total_steps": 550, "loss": 0.3541, "lr": 4.19032766329497e-05, "epoch": 2.6742081447963804, "percentage": 53.64, "elapsed_time": "8:01:13", "remaining_time": "6:55:58"}
|
296 |
+
{"current_steps": 296, "total_steps": 550, "loss": 0.3533, "lr": 4.1649661474586694e-05, "epoch": 2.6832579185520364, "percentage": 53.82, "elapsed_time": "8:02:50", "remaining_time": "6:54:19"}
|
297 |
+
{"current_steps": 297, "total_steps": 550, "loss": 0.3597, "lr": 4.139597986810005e-05, "epoch": 2.6923076923076925, "percentage": 54.0, "elapsed_time": "8:04:27", "remaining_time": "6:52:40"}
|
298 |
+
{"current_steps": 298, "total_steps": 550, "loss": 0.3506, "lr": 4.114224203174785e-05, "epoch": 2.7013574660633486, "percentage": 54.18, "elapsed_time": "8:06:04", "remaining_time": "6:51:02"}
|
299 |
+
{"current_steps": 299, "total_steps": 550, "loss": 0.3556, "lr": 4.0888458186053184e-05, "epoch": 2.7104072398190047, "percentage": 54.36, "elapsed_time": "8:07:41", "remaining_time": "6:49:23"}
|
300 |
+
{"current_steps": 300, "total_steps": 550, "loss": 0.3529, "lr": 4.063463855339232e-05, "epoch": 2.7194570135746607, "percentage": 54.55, "elapsed_time": "8:09:17", "remaining_time": "6:47:44"}
|
301 |
+
{"current_steps": 301, "total_steps": 550, "loss": 0.3482, "lr": 4.0380793357583076e-05, "epoch": 2.728506787330317, "percentage": 54.73, "elapsed_time": "8:10:54", "remaining_time": "6:46:06"}
|
302 |
+
{"current_steps": 302, "total_steps": 550, "loss": 0.3581, "lr": 4.012693282347289e-05, "epoch": 2.737556561085973, "percentage": 54.91, "elapsed_time": "8:12:31", "remaining_time": "6:44:27"}
|
303 |
+
{"current_steps": 303, "total_steps": 550, "loss": 0.3568, "lr": 3.9873067176527114e-05, "epoch": 2.746606334841629, "percentage": 55.09, "elapsed_time": "8:14:09", "remaining_time": "6:42:49"}
|
304 |
+
{"current_steps": 304, "total_steps": 550, "loss": 0.3548, "lr": 3.961920664241694e-05, "epoch": 2.755656108597285, "percentage": 55.27, "elapsed_time": "8:15:46", "remaining_time": "6:41:10"}
|
305 |
+
{"current_steps": 305, "total_steps": 550, "loss": 0.3547, "lr": 3.9365361446607684e-05, "epoch": 2.764705882352941, "percentage": 55.45, "elapsed_time": "8:17:23", "remaining_time": "6:39:32"}
|
306 |
+
{"current_steps": 306, "total_steps": 550, "loss": 0.3602, "lr": 3.911154181394682e-05, "epoch": 2.773755656108597, "percentage": 55.64, "elapsed_time": "8:19:00", "remaining_time": "6:37:53"}
|
307 |
+
{"current_steps": 307, "total_steps": 550, "loss": 0.3562, "lr": 3.885775796825216e-05, "epoch": 2.7828054298642533, "percentage": 55.82, "elapsed_time": "8:20:37", "remaining_time": "6:36:15"}
|
308 |
+
{"current_steps": 308, "total_steps": 550, "loss": 0.3479, "lr": 3.860402013189998e-05, "epoch": 2.7918552036199094, "percentage": 56.0, "elapsed_time": "8:22:14", "remaining_time": "6:34:36"}
|
309 |
+
{"current_steps": 309, "total_steps": 550, "loss": 0.3572, "lr": 3.835033852541332e-05, "epoch": 2.8009049773755654, "percentage": 56.18, "elapsed_time": "8:23:51", "remaining_time": "6:32:58"}
|
310 |
+
{"current_steps": 310, "total_steps": 550, "loss": 0.3519, "lr": 3.809672336705031e-05, "epoch": 2.8099547511312215, "percentage": 56.36, "elapsed_time": "8:25:28", "remaining_time": "6:31:19"}
|
311 |
+
{"current_steps": 311, "total_steps": 550, "loss": 0.3559, "lr": 3.784318487239257e-05, "epoch": 2.8190045248868776, "percentage": 56.55, "elapsed_time": "8:27:05", "remaining_time": "6:29:41"}
|
312 |
+
{"current_steps": 312, "total_steps": 550, "loss": 0.3504, "lr": 3.758973325393367e-05, "epoch": 2.8280542986425337, "percentage": 56.73, "elapsed_time": "8:28:42", "remaining_time": "6:28:02"}
|
313 |
+
{"current_steps": 313, "total_steps": 550, "loss": 0.3569, "lr": 3.7336378720667846e-05, "epoch": 2.83710407239819, "percentage": 56.91, "elapsed_time": "8:30:18", "remaining_time": "6:26:24"}
|
314 |
+
{"current_steps": 314, "total_steps": 550, "loss": 0.3559, "lr": 3.708313147767878e-05, "epoch": 2.8461538461538463, "percentage": 57.09, "elapsed_time": "8:31:55", "remaining_time": "6:24:45"}
|
315 |
+
{"current_steps": 315, "total_steps": 550, "loss": 0.3516, "lr": 3.683000172572846e-05, "epoch": 2.8552036199095023, "percentage": 57.27, "elapsed_time": "8:33:32", "remaining_time": "6:23:07"}
|
316 |
+
{"current_steps": 316, "total_steps": 550, "loss": 0.3575, "lr": 3.657699966084642e-05, "epoch": 2.8642533936651584, "percentage": 57.45, "elapsed_time": "8:35:09", "remaining_time": "6:21:28"}
|
317 |
+
{"current_steps": 317, "total_steps": 550, "loss": 0.3579, "lr": 3.632413547391891e-05, "epoch": 2.8733031674208145, "percentage": 57.64, "elapsed_time": "8:36:46", "remaining_time": "6:19:50"}
|
318 |
+
{"current_steps": 318, "total_steps": 550, "loss": 0.3486, "lr": 3.6071419350278515e-05, "epoch": 2.8823529411764706, "percentage": 57.82, "elapsed_time": "8:38:23", "remaining_time": "6:18:12"}
|
319 |
+
{"current_steps": 319, "total_steps": 550, "loss": 0.3468, "lr": 3.581886146929387e-05, "epoch": 2.8914027149321266, "percentage": 58.0, "elapsed_time": "8:40:00", "remaining_time": "6:16:33"}
|
320 |
+
{"current_steps": 320, "total_steps": 550, "loss": 0.3526, "lr": 3.556647200395956e-05, "epoch": 2.9004524886877827, "percentage": 58.18, "elapsed_time": "8:41:37", "remaining_time": "6:14:55"}
|
321 |
+
{"current_steps": 321, "total_steps": 550, "loss": 0.3498, "lr": 3.5314261120486474e-05, "epoch": 2.909502262443439, "percentage": 58.36, "elapsed_time": "8:43:14", "remaining_time": "6:13:16"}
|
322 |
+
{"current_steps": 322, "total_steps": 550, "loss": 0.353, "lr": 3.5062238977892214e-05, "epoch": 2.918552036199095, "percentage": 58.55, "elapsed_time": "8:44:51", "remaining_time": "6:11:38"}
|
323 |
+
{"current_steps": 323, "total_steps": 550, "loss": 0.3551, "lr": 3.481041572759193e-05, "epoch": 2.9276018099547514, "percentage": 58.73, "elapsed_time": "8:46:29", "remaining_time": "6:10:00"}
|
324 |
+
{"current_steps": 324, "total_steps": 550, "loss": 0.3555, "lr": 3.4558801512989446e-05, "epoch": 2.9366515837104075, "percentage": 58.91, "elapsed_time": "8:48:06", "remaining_time": "6:08:22"}
|
325 |
+
{"current_steps": 325, "total_steps": 550, "loss": 0.3553, "lr": 3.4307406469068604e-05, "epoch": 2.9457013574660635, "percentage": 59.09, "elapsed_time": "8:49:43", "remaining_time": "6:06:43"}
|
326 |
+
{"current_steps": 326, "total_steps": 550, "loss": 0.3574, "lr": 3.405624072198514e-05, "epoch": 2.9547511312217196, "percentage": 59.27, "elapsed_time": "8:51:20", "remaining_time": "6:05:05"}
|
327 |
+
{"current_steps": 327, "total_steps": 550, "loss": 0.3517, "lr": 3.3805314388658714e-05, "epoch": 2.9638009049773757, "percentage": 59.45, "elapsed_time": "8:52:57", "remaining_time": "6:03:27"}
|
328 |
+
{"current_steps": 328, "total_steps": 550, "loss": 0.3449, "lr": 3.3554637576365446e-05, "epoch": 2.9728506787330318, "percentage": 59.64, "elapsed_time": "8:54:34", "remaining_time": "6:01:49"}
|
329 |
+
{"current_steps": 329, "total_steps": 550, "loss": 0.3514, "lr": 3.330422038233078e-05, "epoch": 2.981900452488688, "percentage": 59.82, "elapsed_time": "8:56:11", "remaining_time": "6:00:10"}
|
330 |
+
{"current_steps": 330, "total_steps": 550, "loss": 0.3508, "lr": 3.305407289332279e-05, "epoch": 2.990950226244344, "percentage": 60.0, "elapsed_time": "8:57:48", "remaining_time": "5:58:32"}
|
331 |
+
{"current_steps": 331, "total_steps": 550, "loss": 0.6016, "lr": 3.280420518524585e-05, "epoch": 3.002262443438914, "percentage": 60.18, "elapsed_time": "9:01:00", "remaining_time": "5:57:56"}
|
332 |
+
{"current_steps": 332, "total_steps": 550, "loss": 0.3304, "lr": 3.25546273227348e-05, "epoch": 3.01131221719457, "percentage": 60.36, "elapsed_time": "9:02:36", "remaining_time": "5:56:17"}
|