neginr commited on
Commit
a9370b3
·
verified ·
1 Parent(s): 7d895df

Training in progress, epoch 7

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d0d120e057ceca23d213004b724fcbbe67a45af1f565dab7df6387712968d22d
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c146df0f62f81ee0048ae919f77bcfa5e3eeeff401e47f823920077b76c68154
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cb923283f5efbd513fd617e7b1eca6b4aed2638c32dee564e3dee534130f5ac4
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:619752c08fea531e16c00a4f4108a239c6445099a251a8fd3aa1c01045923131
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d4652215f44c9d46f19fc1aeb787f8d85222c58d12d0711d331aee86c9458f95
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f975ff69863c30ba62cdbbda9e16478f7e947ccb82f93d021d8a1ee4329fb71c
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9bdd420700ba49a6dc1b995d52679108a06ec22b912eea0126b4416b0661ec99
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9b8ed04a49a2fcea5eba7d02d1a8668414e9d319f3a1dd913188e9e7cd5d41ea
3
  size 1089994880
trainer_log.jsonl CHANGED
@@ -210,3 +210,23 @@
210
  {"current_steps": 210, "total_steps": 231, "loss": 0.15, "lr": 5.036030109968082e-07, "epoch": 6.363636363636363, "percentage": 90.91, "elapsed_time": "0:52:30", "remaining_time": "0:05:15"}
211
  {"current_steps": 211, "total_steps": 231, "loss": 0.1368, "lr": 4.5714297722121105e-07, "epoch": 6.393939393939394, "percentage": 91.34, "elapsed_time": "0:52:42", "remaining_time": "0:04:59"}
212
  {"current_steps": 212, "total_steps": 231, "loss": 0.1636, "lr": 4.128809507704445e-07, "epoch": 6.424242424242424, "percentage": 91.77, "elapsed_time": "0:52:56", "remaining_time": "0:04:44"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
210
  {"current_steps": 210, "total_steps": 231, "loss": 0.15, "lr": 5.036030109968082e-07, "epoch": 6.363636363636363, "percentage": 90.91, "elapsed_time": "0:52:30", "remaining_time": "0:05:15"}
211
  {"current_steps": 211, "total_steps": 231, "loss": 0.1368, "lr": 4.5714297722121105e-07, "epoch": 6.393939393939394, "percentage": 91.34, "elapsed_time": "0:52:42", "remaining_time": "0:04:59"}
212
  {"current_steps": 212, "total_steps": 231, "loss": 0.1636, "lr": 4.128809507704445e-07, "epoch": 6.424242424242424, "percentage": 91.77, "elapsed_time": "0:52:56", "remaining_time": "0:04:44"}
213
+ {"current_steps": 213, "total_steps": 231, "loss": 0.1135, "lr": 3.708271265220087e-07, "epoch": 6.454545454545454, "percentage": 92.21, "elapsed_time": "0:53:08", "remaining_time": "0:04:29"}
214
+ {"current_steps": 214, "total_steps": 231, "loss": 0.1391, "lr": 3.309911907379393e-07, "epoch": 6.484848484848484, "percentage": 92.64, "elapsed_time": "0:53:18", "remaining_time": "0:04:14"}
215
+ {"current_steps": 215, "total_steps": 231, "loss": 0.1633, "lr": 2.9338231883378365e-07, "epoch": 6.515151515151516, "percentage": 93.07, "elapsed_time": "0:53:28", "remaining_time": "0:03:58"}
216
+ {"current_steps": 216, "total_steps": 231, "loss": 0.1044, "lr": 2.5800917326521013e-07, "epoch": 6.545454545454545, "percentage": 93.51, "elapsed_time": "0:53:41", "remaining_time": "0:03:43"}
217
+ {"current_steps": 217, "total_steps": 231, "loss": 0.1302, "lr": 2.248799015327907e-07, "epoch": 6.575757575757576, "percentage": 93.94, "elapsed_time": "0:53:54", "remaining_time": "0:03:28"}
218
+ {"current_steps": 218, "total_steps": 231, "loss": 0.1377, "lr": 1.9400213430538773e-07, "epoch": 6.606060606060606, "percentage": 94.37, "elapsed_time": "0:54:06", "remaining_time": "0:03:13"}
219
+ {"current_steps": 219, "total_steps": 231, "loss": 0.1713, "lr": 1.6538298366257975e-07, "epoch": 6.636363636363637, "percentage": 94.81, "elapsed_time": "0:54:19", "remaining_time": "0:02:58"}
220
+ {"current_steps": 220, "total_steps": 231, "loss": 0.1478, "lr": 1.3902904145653094e-07, "epoch": 6.666666666666667, "percentage": 95.24, "elapsed_time": "0:54:31", "remaining_time": "0:02:43"}
221
+ {"current_steps": 221, "total_steps": 231, "loss": 0.1182, "lr": 1.1494637779369766e-07, "epoch": 6.696969696969697, "percentage": 95.67, "elapsed_time": "0:54:42", "remaining_time": "0:02:28"}
222
+ {"current_steps": 222, "total_steps": 231, "loss": 0.1542, "lr": 9.314053963669245e-08, "epoch": 6.7272727272727275, "percentage": 96.1, "elapsed_time": "0:54:54", "remaining_time": "0:02:13"}
223
+ {"current_steps": 223, "total_steps": 231, "loss": 0.145, "lr": 7.361654952665608e-08, "epoch": 6.757575757575758, "percentage": 96.54, "elapsed_time": "0:55:05", "remaining_time": "0:01:58"}
224
+ {"current_steps": 224, "total_steps": 231, "loss": 0.1504, "lr": 5.637890442641403e-08, "epoch": 6.787878787878788, "percentage": 96.97, "elapsed_time": "0:55:17", "remaining_time": "0:01:43"}
225
+ {"current_steps": 225, "total_steps": 231, "loss": 0.147, "lr": 4.143157468468717e-08, "epoch": 6.818181818181818, "percentage": 97.4, "elapsed_time": "0:55:29", "remaining_time": "0:01:28"}
226
+ {"current_steps": 226, "total_steps": 231, "loss": 0.147, "lr": 2.8778003121607834e-08, "epoch": 6.848484848484849, "percentage": 97.84, "elapsed_time": "0:55:40", "remaining_time": "0:01:13"}
227
+ {"current_steps": 227, "total_steps": 231, "loss": 0.1384, "lr": 1.8421104235727406e-08, "epoch": 6.878787878787879, "percentage": 98.27, "elapsed_time": "0:55:52", "remaining_time": "0:00:59"}
228
+ {"current_steps": 228, "total_steps": 231, "loss": 0.1421, "lr": 1.0363263532724433e-08, "epoch": 6.909090909090909, "percentage": 98.7, "elapsed_time": "0:56:05", "remaining_time": "0:00:44"}
229
+ {"current_steps": 229, "total_steps": 231, "loss": 0.1359, "lr": 4.606336975948589e-09, "epoch": 6.9393939393939394, "percentage": 99.13, "elapsed_time": "0:56:19", "remaining_time": "0:00:29"}
230
+ {"current_steps": 230, "total_steps": 231, "loss": 0.145, "lr": 1.1516505589381777e-09, "epoch": 6.96969696969697, "percentage": 99.57, "elapsed_time": "0:56:33", "remaining_time": "0:00:14"}
231
+ {"current_steps": 231, "total_steps": 231, "loss": 0.1566, "lr": 0.0, "epoch": 7.0, "percentage": 100.0, "elapsed_time": "0:56:45", "remaining_time": "0:00:00"}
232
+ {"current_steps": 231, "total_steps": 231, "epoch": 7.0, "percentage": 100.0, "elapsed_time": "0:59:31", "remaining_time": "0:00:00"}