Training in progress, epoch 4
Browse files
model-00001-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4877660776
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3d5d59da7a5c19bba5863d52f0607e25edc8d98e5f5c69d75a64493a2e7050b3
|
3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4932751008
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fec8ce0169928d45c8348e836230c378b454c50f6d0d851379f5914eef8e7065
|
3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4330865200
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:719849f04ce4fd6f53504351d75cecf61e75914a4963ae7b34dcb2d839c4d1f9
|
3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1089994880
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1cff62e00a7e26669e354f0391328ecfa916e9cf817efdbfc282b396fd2a481b
|
3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
@@ -316,3 +316,66 @@
|
|
316 |
{"current_steps": 316, "total_steps": 380, "loss": 0.434, "lr": 6.715720255058e-06, "epoch": 4.113728675873274, "percentage": 83.16, "elapsed_time": "9:04:00", "remaining_time": "1:50:10"}
|
317 |
{"current_steps": 317, "total_steps": 380, "loss": 0.4246, "lr": 6.513340869498859e-06, "epoch": 4.126726238830219, "percentage": 83.42, "elapsed_time": "9:05:40", "remaining_time": "1:48:26"}
|
318 |
{"current_steps": 318, "total_steps": 380, "loss": 0.4288, "lr": 6.313787120497376e-06, "epoch": 4.139723801787165, "percentage": 83.68, "elapsed_time": "9:07:23", "remaining_time": "1:46:43"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
316 |
{"current_steps": 316, "total_steps": 380, "loss": 0.434, "lr": 6.715720255058e-06, "epoch": 4.113728675873274, "percentage": 83.16, "elapsed_time": "9:04:00", "remaining_time": "1:50:10"}
|
317 |
{"current_steps": 317, "total_steps": 380, "loss": 0.4246, "lr": 6.513340869498859e-06, "epoch": 4.126726238830219, "percentage": 83.42, "elapsed_time": "9:05:40", "remaining_time": "1:48:26"}
|
318 |
{"current_steps": 318, "total_steps": 380, "loss": 0.4288, "lr": 6.313787120497376e-06, "epoch": 4.139723801787165, "percentage": 83.68, "elapsed_time": "9:07:23", "remaining_time": "1:46:43"}
|
319 |
+
{"current_steps": 319, "total_steps": 380, "loss": 0.4236, "lr": 6.117075846591123e-06, "epoch": 4.15272136474411, "percentage": 83.95, "elapsed_time": "9:09:04", "remaining_time": "1:44:59"}
|
320 |
+
{"current_steps": 320, "total_steps": 380, "loss": 0.4258, "lr": 5.923223646466923e-06, "epoch": 4.1657189277010565, "percentage": 84.21, "elapsed_time": "9:10:44", "remaining_time": "1:43:15"}
|
321 |
+
{"current_steps": 321, "total_steps": 380, "loss": 0.4257, "lr": 5.732246877560146e-06, "epoch": 4.178716490658002, "percentage": 84.47, "elapsed_time": "9:12:25", "remaining_time": "1:41:32"}
|
322 |
+
{"current_steps": 322, "total_steps": 380, "loss": 0.4263, "lr": 5.5441616546745646e-06, "epoch": 4.191714053614947, "percentage": 84.74, "elapsed_time": "9:14:05", "remaining_time": "1:39:48"}
|
323 |
+
{"current_steps": 323, "total_steps": 380, "loss": 0.4243, "lr": 5.358983848622452e-06, "epoch": 4.204711616571893, "percentage": 85.0, "elapsed_time": "9:15:47", "remaining_time": "1:38:04"}
|
324 |
+
{"current_steps": 324, "total_steps": 380, "loss": 0.4278, "lr": 5.176729084885508e-06, "epoch": 4.217709179528838, "percentage": 85.26, "elapsed_time": "9:17:27", "remaining_time": "1:36:21"}
|
325 |
+
{"current_steps": 325, "total_steps": 380, "loss": 0.4253, "lr": 4.99741274229625e-06, "epoch": 4.230706742485784, "percentage": 85.53, "elapsed_time": "9:19:08", "remaining_time": "1:34:37"}
|
326 |
+
{"current_steps": 326, "total_steps": 380, "loss": 0.4255, "lr": 4.821049951740442e-06, "epoch": 4.24370430544273, "percentage": 85.79, "elapsed_time": "9:20:49", "remaining_time": "1:32:53"}
|
327 |
+
{"current_steps": 327, "total_steps": 380, "loss": 0.4273, "lr": 4.647655594880225e-06, "epoch": 4.256701868399675, "percentage": 86.05, "elapsed_time": "9:22:29", "remaining_time": "1:31:10"}
|
328 |
+
{"current_steps": 328, "total_steps": 380, "loss": 0.4327, "lr": 4.4772443028985004e-06, "epoch": 4.269699431356621, "percentage": 86.32, "elapsed_time": "9:24:12", "remaining_time": "1:29:26"}
|
329 |
+
{"current_steps": 329, "total_steps": 380, "loss": 0.4295, "lr": 4.3098304552642385e-06, "epoch": 4.282696994313566, "percentage": 86.58, "elapsed_time": "9:25:53", "remaining_time": "1:27:43"}
|
330 |
+
{"current_steps": 330, "total_steps": 380, "loss": 0.4235, "lr": 4.1454281785191995e-06, "epoch": 4.295694557270512, "percentage": 86.84, "elapsed_time": "9:27:37", "remaining_time": "1:26:00"}
|
331 |
+
{"current_steps": 331, "total_steps": 380, "loss": 0.4259, "lr": 3.984051345085855e-06, "epoch": 4.308692120227457, "percentage": 87.11, "elapsed_time": "9:29:18", "remaining_time": "1:24:16"}
|
332 |
+
{"current_steps": 332, "total_steps": 380, "loss": 0.4205, "lr": 3.825713572096903e-06, "epoch": 4.3216896831844025, "percentage": 87.37, "elapsed_time": "9:30:59", "remaining_time": "1:22:33"}
|
333 |
+
{"current_steps": 333, "total_steps": 380, "loss": 0.4263, "lr": 3.6704282202461515e-06, "epoch": 4.334687246141349, "percentage": 87.63, "elapsed_time": "9:32:40", "remaining_time": "1:20:49"}
|
334 |
+
{"current_steps": 334, "total_steps": 380, "loss": 0.424, "lr": 3.518208392661184e-06, "epoch": 4.347684809098294, "percentage": 87.89, "elapsed_time": "9:34:22", "remaining_time": "1:19:06"}
|
335 |
+
{"current_steps": 335, "total_steps": 380, "loss": 0.422, "lr": 3.3690669337977e-06, "epoch": 4.36068237205524, "percentage": 88.16, "elapsed_time": "9:36:02", "remaining_time": "1:17:22"}
|
336 |
+
{"current_steps": 336, "total_steps": 380, "loss": 0.4236, "lr": 3.2230164283556918e-06, "epoch": 4.373679935012185, "percentage": 88.42, "elapsed_time": "9:37:43", "remaining_time": "1:15:39"}
|
337 |
+
{"current_steps": 337, "total_steps": 380, "loss": 0.4257, "lr": 3.080069200217497e-06, "epoch": 4.3866774979691305, "percentage": 88.68, "elapsed_time": "9:39:23", "remaining_time": "1:13:55"}
|
338 |
+
{"current_steps": 338, "total_steps": 380, "loss": 0.4253, "lr": 2.9402373114079295e-06, "epoch": 4.399675060926076, "percentage": 88.95, "elapsed_time": "9:41:04", "remaining_time": "1:12:12"}
|
339 |
+
{"current_steps": 339, "total_steps": 380, "loss": 0.431, "lr": 2.803532561076492e-06, "epoch": 4.412672623883022, "percentage": 89.21, "elapsed_time": "9:42:45", "remaining_time": "1:10:28"}
|
340 |
+
{"current_steps": 340, "total_steps": 380, "loss": 0.4306, "lr": 2.669966484501716e-06, "epoch": 4.425670186839968, "percentage": 89.47, "elapsed_time": "9:44:30", "remaining_time": "1:08:45"}
|
341 |
+
{"current_steps": 341, "total_steps": 380, "loss": 0.4266, "lr": 2.5395503521178143e-06, "epoch": 4.438667749796913, "percentage": 89.74, "elapsed_time": "9:46:14", "remaining_time": "1:07:02"}
|
342 |
+
{"current_steps": 342, "total_steps": 380, "loss": 0.4303, "lr": 2.4122951685636674e-06, "epoch": 4.451665312753859, "percentage": 90.0, "elapsed_time": "9:47:55", "remaining_time": "1:05:19"}
|
343 |
+
{"current_steps": 343, "total_steps": 380, "loss": 0.431, "lr": 2.2882116717542634e-06, "epoch": 4.464662875710804, "percentage": 90.26, "elapsed_time": "9:49:36", "remaining_time": "1:03:36"}
|
344 |
+
{"current_steps": 344, "total_steps": 380, "loss": 0.4238, "lr": 2.1673103319746146e-06, "epoch": 4.477660438667749, "percentage": 90.53, "elapsed_time": "9:51:20", "remaining_time": "1:01:53"}
|
345 |
+
{"current_steps": 345, "total_steps": 380, "loss": 0.423, "lr": 2.049601350996233e-06, "epoch": 4.490658001624696, "percentage": 90.79, "elapsed_time": "9:53:01", "remaining_time": "1:00:09"}
|
346 |
+
{"current_steps": 346, "total_steps": 380, "loss": 0.4243, "lr": 1.93509466121633e-06, "epoch": 4.503655564581641, "percentage": 91.05, "elapsed_time": "9:54:43", "remaining_time": "0:58:26"}
|
347 |
+
{"current_steps": 347, "total_steps": 380, "loss": 0.4277, "lr": 1.8237999248197002e-06, "epoch": 4.516653127538587, "percentage": 91.32, "elapsed_time": "9:56:24", "remaining_time": "0:56:43"}
|
348 |
+
{"current_steps": 348, "total_steps": 380, "loss": 0.4236, "lr": 1.7157265329634354e-06, "epoch": 4.529650690495532, "percentage": 91.58, "elapsed_time": "9:58:05", "remaining_time": "0:54:59"}
|
349 |
+
{"current_steps": 349, "total_steps": 380, "loss": 0.4288, "lr": 1.6108836049844434e-06, "epoch": 4.5426482534524775, "percentage": 91.84, "elapsed_time": "9:59:45", "remaining_time": "0:53:16"}
|
350 |
+
{"current_steps": 350, "total_steps": 380, "loss": 0.4333, "lr": 1.5092799876299835e-06, "epoch": 4.555645816409423, "percentage": 92.11, "elapsed_time": "10:01:26", "remaining_time": "0:51:33"}
|
351 |
+
{"current_steps": 351, "total_steps": 380, "loss": 0.428, "lr": 1.4109242543111834e-06, "epoch": 4.568643379366369, "percentage": 92.37, "elapsed_time": "10:03:06", "remaining_time": "0:49:49"}
|
352 |
+
{"current_steps": 352, "total_steps": 380, "loss": 0.4203, "lr": 1.3158247043795735e-06, "epoch": 4.581640942323315, "percentage": 92.63, "elapsed_time": "10:04:46", "remaining_time": "0:48:06"}
|
353 |
+
{"current_steps": 353, "total_steps": 380, "loss": 0.4263, "lr": 1.2239893624267852e-06, "epoch": 4.59463850528026, "percentage": 92.89, "elapsed_time": "10:06:26", "remaining_time": "0:46:23"}
|
354 |
+
{"current_steps": 354, "total_steps": 380, "loss": 0.4229, "lr": 1.1354259776074472e-06, "epoch": 4.6076360682372055, "percentage": 93.16, "elapsed_time": "10:08:09", "remaining_time": "0:44:40"}
|
355 |
+
{"current_steps": 355, "total_steps": 380, "loss": 0.4253, "lr": 1.050142022985292e-06, "epoch": 4.620633631194151, "percentage": 93.42, "elapsed_time": "10:09:50", "remaining_time": "0:42:56"}
|
356 |
+
{"current_steps": 356, "total_steps": 380, "loss": 0.4245, "lr": 9.681446949025752e-07, "epoch": 4.633631194151096, "percentage": 93.68, "elapsed_time": "10:11:31", "remaining_time": "0:41:13"}
|
357 |
+
{"current_steps": 357, "total_steps": 380, "loss": 0.4179, "lr": 8.89440912372832e-07, "epoch": 4.646628757108042, "percentage": 93.95, "elapsed_time": "10:13:11", "remaining_time": "0:39:30"}
|
358 |
+
{"current_steps": 358, "total_steps": 380, "loss": 0.4301, "lr": 8.140373164970428e-07, "epoch": 4.659626320064988, "percentage": 94.21, "elapsed_time": "10:14:52", "remaining_time": "0:37:47"}
|
359 |
+
{"current_steps": 359, "total_steps": 380, "loss": 0.4227, "lr": 7.419402699032852e-07, "epoch": 4.6726238830219335, "percentage": 94.47, "elapsed_time": "10:16:35", "remaining_time": "0:36:04"}
|
360 |
+
{"current_steps": 360, "total_steps": 380, "loss": 0.4264, "lr": 6.731558562097995e-07, "epoch": 4.685621445978879, "percentage": 94.74, "elapsed_time": "10:18:16", "remaining_time": "0:34:20"}
|
361 |
+
{"current_steps": 361, "total_steps": 380, "loss": 0.4265, "lr": 6.076898795116792e-07, "epoch": 4.698619008935824, "percentage": 95.0, "elapsed_time": "10:19:57", "remaining_time": "0:32:37"}
|
362 |
+
{"current_steps": 362, "total_steps": 380, "loss": 0.4272, "lr": 5.455478638911071e-07, "epoch": 4.71161657189277, "percentage": 95.26, "elapsed_time": "10:21:37", "remaining_time": "0:30:54"}
|
363 |
+
{"current_steps": 363, "total_steps": 380, "loss": 0.4204, "lr": 4.867350529512261e-07, "epoch": 4.724614134849716, "percentage": 95.53, "elapsed_time": "10:23:18", "remaining_time": "0:29:11"}
|
364 |
+
{"current_steps": 364, "total_steps": 380, "loss": 0.4274, "lr": 4.3125640937368373e-07, "epoch": 4.737611697806662, "percentage": 95.79, "elapsed_time": "10:24:58", "remaining_time": "0:27:28"}
|
365 |
+
{"current_steps": 365, "total_steps": 380, "loss": 0.4248, "lr": 3.791166144998704e-07, "epoch": 4.750609260763607, "percentage": 96.05, "elapsed_time": "10:26:38", "remaining_time": "0:25:45"}
|
366 |
+
{"current_steps": 366, "total_steps": 380, "loss": 0.4243, "lr": 3.3032006793590977e-07, "epoch": 4.763606823720552, "percentage": 96.32, "elapsed_time": "10:28:20", "remaining_time": "0:24:02"}
|
367 |
+
{"current_steps": 367, "total_steps": 380, "loss": 0.4267, "lr": 2.848708871814054e-07, "epoch": 4.776604386677498, "percentage": 96.58, "elapsed_time": "10:30:00", "remaining_time": "0:22:18"}
|
368 |
+
{"current_steps": 368, "total_steps": 380, "loss": 0.4217, "lr": 2.4277290728202063e-07, "epoch": 4.789601949634443, "percentage": 96.84, "elapsed_time": "10:31:41", "remaining_time": "0:20:35"}
|
369 |
+
{"current_steps": 369, "total_steps": 380, "loss": 0.4332, "lr": 2.040296805058528e-07, "epoch": 4.802599512591389, "percentage": 97.11, "elapsed_time": "10:33:22", "remaining_time": "0:18:52"}
|
370 |
+
{"current_steps": 370, "total_steps": 380, "loss": 0.4316, "lr": 1.6864447604370004e-07, "epoch": 4.815597075548335, "percentage": 97.37, "elapsed_time": "10:35:02", "remaining_time": "0:17:09"}
|
371 |
+
{"current_steps": 371, "total_steps": 380, "loss": 0.4325, "lr": 1.3662027973320614e-07, "epoch": 4.8285946385052805, "percentage": 97.63, "elapsed_time": "10:36:43", "remaining_time": "0:15:26"}
|
372 |
+
{"current_steps": 372, "total_steps": 380, "loss": 0.4198, "lr": 1.0795979380690657e-07, "epoch": 4.841592201462226, "percentage": 97.89, "elapsed_time": "10:38:24", "remaining_time": "0:13:43"}
|
373 |
+
{"current_steps": 373, "total_steps": 380, "loss": 0.4187, "lr": 8.266543666421544e-08, "epoch": 4.854589764419171, "percentage": 98.16, "elapsed_time": "10:40:04", "remaining_time": "0:12:00"}
|
374 |
+
{"current_steps": 374, "total_steps": 380, "loss": 0.4251, "lr": 6.073934266735303e-08, "epoch": 4.867587327376117, "percentage": 98.42, "elapsed_time": "10:41:45", "remaining_time": "0:10:17"}
|
375 |
+
{"current_steps": 375, "total_steps": 380, "loss": 0.4287, "lr": 4.218336196125439e-08, "epoch": 4.880584890333062, "percentage": 98.68, "elapsed_time": "10:43:26", "remaining_time": "0:08:34"}
|
376 |
+
{"current_steps": 376, "total_steps": 380, "loss": 0.4247, "lr": 2.699906031745414e-08, "epoch": 4.8935824532900085, "percentage": 98.95, "elapsed_time": "10:45:07", "remaining_time": "0:06:51"}
|
377 |
+
{"current_steps": 377, "total_steps": 380, "loss": 0.4235, "lr": 1.5187719001943378e-08, "epoch": 4.906580016246954, "percentage": 99.21, "elapsed_time": "10:46:47", "remaining_time": "0:05:08"}
|
378 |
+
{"current_steps": 378, "total_steps": 380, "loss": 0.4252, "lr": 6.750334667091629e-09, "epoch": 4.919577579203899, "percentage": 99.47, "elapsed_time": "10:48:28", "remaining_time": "0:03:25"}
|
379 |
+
{"current_steps": 379, "total_steps": 380, "loss": 0.429, "lr": 1.6876192675052695e-09, "epoch": 4.932575142160845, "percentage": 99.74, "elapsed_time": "10:50:10", "remaining_time": "0:01:42"}
|
380 |
+
{"current_steps": 380, "total_steps": 380, "loss": 0.4249, "lr": 0.0, "epoch": 4.94557270511779, "percentage": 100.0, "elapsed_time": "10:51:51", "remaining_time": "0:00:00"}
|
381 |
+
{"current_steps": 380, "total_steps": 380, "epoch": 4.94557270511779, "percentage": 100.0, "elapsed_time": "10:54:34", "remaining_time": "0:00:00"}
|