sedrickkeh commited on
Commit
3e37275
·
verified ·
1 Parent(s): 628be32

Training in progress, epoch 14

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e825c07703e25dedda3f586a6135bfe6e48ab3bd0be38c3c2790422e61c7fca7
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:871faef99db0af07d6d1811eb9b2d3f5993c67aca4b44a0892f9f0eeb4b00a5b
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:46df5400b3afaae893ef1b18ffa6cc7187602acbaf6cf699f73afd3bf5954173
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a51f3487d3095a7ee2c7227ae4e358cbcc2b26649dc3a85ddd1ee3b82be76867
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:75eea3438acfc6cd8bb0f007de52f0287deda841a433ed20c3188f3dfeb07265
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b8cfc29da97abc14f328aa8ea044bd2174c21263c40dbed989f8bdff727595d9
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fcf14aacc74c5e5900b205682b0cb8d3bc05e3179f549bb33bd7ba95a0abd44e
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cac9e8426c0d63c87df7e5ef27b575c37cd53ba9cab660b7542498ab6458a4e6
3
  size 1089994880
trainer_log.jsonl CHANGED
@@ -440,3 +440,27 @@
440
  {"current_steps": 440, "total_steps": 465, "loss": 0.0031, "lr": 8.800130808372553e-08, "epoch": 14.08, "percentage": 94.62, "elapsed_time": "4:12:17", "remaining_time": "0:14:20"}
441
  {"current_steps": 441, "total_steps": 465, "loss": 0.002, "lr": 8.11207248201834e-08, "epoch": 14.112, "percentage": 94.84, "elapsed_time": "4:12:54", "remaining_time": "0:13:45"}
442
  {"current_steps": 442, "total_steps": 465, "loss": 0.0024, "lr": 7.45179921325162e-08, "epoch": 14.144, "percentage": 95.05, "elapsed_time": "4:13:22", "remaining_time": "0:13:11"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
440
  {"current_steps": 440, "total_steps": 465, "loss": 0.0031, "lr": 8.800130808372553e-08, "epoch": 14.08, "percentage": 94.62, "elapsed_time": "4:12:17", "remaining_time": "0:14:20"}
441
  {"current_steps": 441, "total_steps": 465, "loss": 0.002, "lr": 8.11207248201834e-08, "epoch": 14.112, "percentage": 94.84, "elapsed_time": "4:12:54", "remaining_time": "0:13:45"}
442
  {"current_steps": 442, "total_steps": 465, "loss": 0.0024, "lr": 7.45179921325162e-08, "epoch": 14.144, "percentage": 95.05, "elapsed_time": "4:13:22", "remaining_time": "0:13:11"}
443
+ {"current_steps": 443, "total_steps": 465, "loss": 0.0026, "lr": 6.819348298638839e-08, "epoch": 14.176, "percentage": 95.27, "elapsed_time": "4:13:56", "remaining_time": "0:12:36"}
444
+ {"current_steps": 444, "total_steps": 465, "loss": 0.0029, "lr": 6.214755463157417e-08, "epoch": 14.208, "percentage": 95.48, "elapsed_time": "4:14:34", "remaining_time": "0:12:02"}
445
+ {"current_steps": 445, "total_steps": 465, "loss": 0.0021, "lr": 5.638054858177644e-08, "epoch": 14.24, "percentage": 95.7, "elapsed_time": "4:15:09", "remaining_time": "0:11:28"}
446
+ {"current_steps": 446, "total_steps": 465, "loss": 0.0043, "lr": 5.089279059533658e-08, "epoch": 14.272, "percentage": 95.91, "elapsed_time": "4:15:40", "remaining_time": "0:10:53"}
447
+ {"current_steps": 447, "total_steps": 465, "loss": 0.0029, "lr": 4.568459065683206e-08, "epoch": 14.304, "percentage": 96.13, "elapsed_time": "4:16:12", "remaining_time": "0:10:19"}
448
+ {"current_steps": 448, "total_steps": 465, "loss": 0.0029, "lr": 4.0756242959567596e-08, "epoch": 14.336, "percentage": 96.34, "elapsed_time": "4:16:39", "remaining_time": "0:09:44"}
449
+ {"current_steps": 449, "total_steps": 465, "loss": 0.0033, "lr": 3.610802588895845e-08, "epoch": 14.368, "percentage": 96.56, "elapsed_time": "4:17:11", "remaining_time": "0:09:09"}
450
+ {"current_steps": 450, "total_steps": 465, "loss": 0.0028, "lr": 3.1740202006804166e-08, "epoch": 14.4, "percentage": 96.77, "elapsed_time": "4:17:49", "remaining_time": "0:08:35"}
451
+ {"current_steps": 451, "total_steps": 465, "loss": 0.0015, "lr": 2.765301803645426e-08, "epoch": 14.432, "percentage": 96.99, "elapsed_time": "4:18:13", "remaining_time": "0:08:00"}
452
+ {"current_steps": 452, "total_steps": 465, "loss": 0.003, "lr": 2.3846704848878298e-08, "epoch": 14.464, "percentage": 97.2, "elapsed_time": "4:18:54", "remaining_time": "0:07:26"}
453
+ {"current_steps": 453, "total_steps": 465, "loss": 0.0027, "lr": 2.0321477449619098e-08, "epoch": 14.496, "percentage": 97.42, "elapsed_time": "4:19:36", "remaining_time": "0:06:52"}
454
+ {"current_steps": 454, "total_steps": 465, "loss": 0.002, "lr": 1.7077534966650767e-08, "epoch": 14.528, "percentage": 97.63, "elapsed_time": "4:20:08", "remaining_time": "0:06:18"}
455
+ {"current_steps": 455, "total_steps": 465, "loss": 0.0032, "lr": 1.411506063912882e-08, "epoch": 14.56, "percentage": 97.85, "elapsed_time": "4:20:40", "remaining_time": "0:05:43"}
456
+ {"current_steps": 456, "total_steps": 465, "loss": 0.0019, "lr": 1.1434221807041234e-08, "epoch": 14.592, "percentage": 98.06, "elapsed_time": "4:21:11", "remaining_time": "0:05:09"}
457
+ {"current_steps": 457, "total_steps": 465, "loss": 0.0021, "lr": 9.035169901754902e-09, "epoch": 14.624, "percentage": 98.28, "elapsed_time": "4:21:37", "remaining_time": "0:04:34"}
458
+ {"current_steps": 458, "total_steps": 465, "loss": 0.0025, "lr": 6.918040437463025e-09, "epoch": 14.656, "percentage": 98.49, "elapsed_time": "4:22:10", "remaining_time": "0:04:00"}
459
+ {"current_steps": 459, "total_steps": 465, "loss": 0.0028, "lr": 5.082953003528457e-09, "epoch": 14.688, "percentage": 98.71, "elapsed_time": "4:22:40", "remaining_time": "0:03:26"}
460
+ {"current_steps": 460, "total_steps": 465, "loss": 0.0028, "lr": 3.530011257730226e-09, "epoch": 14.72, "percentage": 98.92, "elapsed_time": "4:23:12", "remaining_time": "0:02:51"}
461
+ {"current_steps": 461, "total_steps": 465, "loss": 0.0019, "lr": 2.2593029204076578e-09, "epoch": 14.752, "percentage": 99.14, "elapsed_time": "4:23:39", "remaining_time": "0:02:17"}
462
+ {"current_steps": 462, "total_steps": 465, "loss": 0.0035, "lr": 1.2708997695043412e-09, "epoch": 14.784, "percentage": 99.35, "elapsed_time": "4:24:19", "remaining_time": "0:01:42"}
463
+ {"current_steps": 463, "total_steps": 465, "loss": 0.0017, "lr": 5.648576365169245e-10, "epoch": 14.816, "percentage": 99.57, "elapsed_time": "4:24:42", "remaining_time": "0:01:08"}
464
+ {"current_steps": 464, "total_steps": 465, "loss": 0.0029, "lr": 1.4121640333653042e-10, "epoch": 14.848, "percentage": 99.78, "elapsed_time": "4:25:13", "remaining_time": "0:00:34"}
465
+ {"current_steps": 465, "total_steps": 465, "loss": 0.0022, "lr": 0.0, "epoch": 14.88, "percentage": 100.0, "elapsed_time": "4:25:43", "remaining_time": "0:00:00"}
466
+ {"current_steps": 465, "total_steps": 465, "epoch": 14.88, "percentage": 100.0, "elapsed_time": "4:28:21", "remaining_time": "0:00:00"}