ryanmarten commited on
Commit
66958d7
·
verified ·
1 Parent(s): 5fddc6f

Training in progress, epoch 6

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3e6a8c36232b57183f7e013e1ecd560cb8f89e4a500dbd3300edd6aee641d19a
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:69487f4d7d81287eaf542d3b7ce9000516a8d45254e1002df97e87933843bd51
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b9b083404178c90c34dd660a10f11b6d73df620cc1f0022ba09aa3ecb542918e
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:06082780aac1d79f0961ab6d9de99cf50ab299f40f1af86f96b46e495a90305d
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:305f96f6722c9bba2c7b2f40b4d82d73529a41e66bf584bc13a0669f45506fbb
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:563de47b3f14a2fa6e9157afc86544c375328cdc0adf0e479a07314a8f0ce536
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2351d525acd45d6e2e201b8de11b015a75bca17f00aea376227d729123a560e0
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ff595cf9fd25621b7c33fd6115e63901ee1f8f63f3638ec21e7952cdb1da5c62
3
  size 1089994880
trainer_log.jsonl CHANGED
@@ -212,3 +212,31 @@
212
  {"current_steps": 195, "total_steps": 224, "loss": 0.2764, "lr": 1.0097768704058542e-06, "epoch": 5.962025316455696, "percentage": 87.05, "elapsed_time": "6:20:49", "remaining_time": "0:56:38"}
213
  {"current_steps": 196, "total_steps": 224, "loss": 0.2661, "lr": 9.424343531000968e-07, "epoch": 5.992405063291139, "percentage": 87.5, "elapsed_time": "6:22:44", "remaining_time": "0:54:40"}
214
  {"current_steps": 197, "total_steps": 224, "loss": 0.2701, "lr": 8.773044733510338e-07, "epoch": 6.030379746835443, "percentage": 87.95, "elapsed_time": "6:25:36", "remaining_time": "0:52:51"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
212
  {"current_steps": 195, "total_steps": 224, "loss": 0.2764, "lr": 1.0097768704058542e-06, "epoch": 5.962025316455696, "percentage": 87.05, "elapsed_time": "6:20:49", "remaining_time": "0:56:38"}
213
  {"current_steps": 196, "total_steps": 224, "loss": 0.2661, "lr": 9.424343531000968e-07, "epoch": 5.992405063291139, "percentage": 87.5, "elapsed_time": "6:22:44", "remaining_time": "0:54:40"}
214
  {"current_steps": 197, "total_steps": 224, "loss": 0.2701, "lr": 8.773044733510338e-07, "epoch": 6.030379746835443, "percentage": 87.95, "elapsed_time": "6:25:36", "remaining_time": "0:52:51"}
215
+ {"current_steps": 198, "total_steps": 224, "loss": 0.2479, "lr": 8.144031414842012e-07, "epoch": 6.060759493670886, "percentage": 88.39, "elapsed_time": "6:27:27", "remaining_time": "0:50:52"}
216
+ {"current_steps": 199, "total_steps": 224, "loss": 0.2495, "lr": 7.537457234218271e-07, "epoch": 6.091139240506329, "percentage": 88.84, "elapsed_time": "6:29:25", "remaining_time": "0:48:55"}
217
+ {"current_steps": 200, "total_steps": 224, "loss": 0.2705, "lr": 6.953470369291349e-07, "epoch": 6.121518987341772, "percentage": 89.29, "elapsed_time": "6:31:22", "remaining_time": "0:46:57"}
218
+ {"current_steps": 201, "total_steps": 224, "loss": 0.2563, "lr": 6.392213479945852e-07, "epoch": 6.151898734177215, "percentage": 89.73, "elapsed_time": "6:33:14", "remaining_time": "0:44:59"}
219
+ {"current_steps": 202, "total_steps": 224, "loss": 0.2572, "lr": 5.853823673448877e-07, "epoch": 6.182278481012658, "percentage": 90.18, "elapsed_time": "6:35:12", "remaining_time": "0:43:02"}
220
+ {"current_steps": 203, "total_steps": 224, "loss": 0.2615, "lr": 5.33843247095659e-07, "epoch": 6.2126582278481015, "percentage": 90.62, "elapsed_time": "6:37:04", "remaining_time": "0:41:04"}
221
+ {"current_steps": 204, "total_steps": 224, "loss": 0.2498, "lr": 4.846165775385459e-07, "epoch": 6.243037974683545, "percentage": 91.07, "elapsed_time": "6:38:46", "remaining_time": "0:39:05"}
222
+ {"current_steps": 205, "total_steps": 224, "loss": 0.2608, "lr": 4.3771438406559173e-07, "epoch": 6.273417721518987, "percentage": 91.52, "elapsed_time": "6:40:44", "remaining_time": "0:37:08"}
223
+ {"current_steps": 206, "total_steps": 224, "loss": 0.2633, "lr": 3.931481242315993e-07, "epoch": 6.30379746835443, "percentage": 91.96, "elapsed_time": "6:42:40", "remaining_time": "0:35:11"}
224
+ {"current_steps": 207, "total_steps": 224, "loss": 0.2555, "lr": 3.5092868495520294e-07, "epoch": 6.334177215189873, "percentage": 92.41, "elapsed_time": "6:44:42", "remaining_time": "0:33:14"}
225
+ {"current_steps": 208, "total_steps": 224, "loss": 0.264, "lr": 3.110663798593616e-07, "epoch": 6.364556962025317, "percentage": 92.86, "elapsed_time": "6:46:29", "remaining_time": "0:31:16"}
226
+ {"current_steps": 209, "total_steps": 224, "loss": 0.2509, "lr": 2.735709467518699e-07, "epoch": 6.39493670886076, "percentage": 93.3, "elapsed_time": "6:48:29", "remaining_time": "0:29:19"}
227
+ {"current_steps": 210, "total_steps": 224, "loss": 0.2569, "lr": 2.384515452465475e-07, "epoch": 6.425316455696202, "percentage": 93.75, "elapsed_time": "6:50:35", "remaining_time": "0:27:22"}
228
+ {"current_steps": 211, "total_steps": 224, "loss": 0.2554, "lr": 2.0571675452567997e-07, "epoch": 6.455696202531645, "percentage": 94.2, "elapsed_time": "6:52:35", "remaining_time": "0:25:25"}
229
+ {"current_steps": 212, "total_steps": 224, "loss": 0.2567, "lr": 1.7537457124423896e-07, "epoch": 6.4860759493670885, "percentage": 94.64, "elapsed_time": "6:54:44", "remaining_time": "0:23:28"}
230
+ {"current_steps": 213, "total_steps": 224, "loss": 0.2589, "lr": 1.474324075764111e-07, "epoch": 6.516455696202532, "percentage": 95.09, "elapsed_time": "6:56:29", "remaining_time": "0:21:30"}
231
+ {"current_steps": 214, "total_steps": 224, "loss": 0.2508, "lr": 1.2189708940490653e-07, "epoch": 6.546835443037975, "percentage": 95.54, "elapsed_time": "6:58:31", "remaining_time": "0:19:33"}
232
+ {"current_steps": 215, "total_steps": 224, "loss": 0.2515, "lr": 9.877485465349057e-08, "epoch": 6.577215189873417, "percentage": 95.98, "elapsed_time": "7:00:16", "remaining_time": "0:17:35"}
233
+ {"current_steps": 216, "total_steps": 224, "loss": 0.2596, "lr": 7.807135176314707e-08, "epoch": 6.6075949367088604, "percentage": 96.43, "elapsed_time": "7:02:18", "remaining_time": "0:15:38"}
234
+ {"current_steps": 217, "total_steps": 224, "loss": 0.2688, "lr": 5.979163831223988e-08, "epoch": 6.637974683544304, "percentage": 96.88, "elapsed_time": "7:04:11", "remaining_time": "0:13:41"}
235
+ {"current_steps": 218, "total_steps": 224, "loss": 0.2612, "lr": 4.394017978101905e-08, "epoch": 6.668354430379747, "percentage": 97.32, "elapsed_time": "7:06:17", "remaining_time": "0:11:43"}
236
+ {"current_steps": 219, "total_steps": 224, "loss": 0.2717, "lr": 3.0520848460765525e-08, "epoch": 6.69873417721519, "percentage": 97.77, "elapsed_time": "7:08:25", "remaining_time": "0:09:46"}
237
+ {"current_steps": 220, "total_steps": 224, "loss": 0.2736, "lr": 1.9536922507841227e-08, "epoch": 6.729113924050633, "percentage": 98.21, "elapsed_time": "7:10:34", "remaining_time": "0:07:49"}
238
+ {"current_steps": 221, "total_steps": 224, "loss": 0.2457, "lr": 1.099108514288627e-08, "epoch": 6.759493670886076, "percentage": 98.66, "elapsed_time": "7:12:32", "remaining_time": "0:05:52"}
239
+ {"current_steps": 222, "total_steps": 224, "loss": 0.2759, "lr": 4.885423995341088e-09, "epoch": 6.789873417721519, "percentage": 99.11, "elapsed_time": "7:14:21", "remaining_time": "0:03:54"}
240
+ {"current_steps": 223, "total_steps": 224, "loss": 0.2636, "lr": 1.2214305934699078e-09, "epoch": 6.820253164556962, "percentage": 99.55, "elapsed_time": "7:16:21", "remaining_time": "0:01:57"}
241
+ {"current_steps": 224, "total_steps": 224, "loss": 0.2577, "lr": 0.0, "epoch": 6.850632911392405, "percentage": 100.0, "elapsed_time": "7:18:00", "remaining_time": "0:00:00"}
242
+ {"current_steps": 224, "total_steps": 224, "epoch": 6.850632911392405, "percentage": 100.0, "elapsed_time": "7:19:56", "remaining_time": "0:00:00"}