neginr commited on
Commit
e9ae020
·
verified ·
1 Parent(s): eef8ff8

Training in progress, epoch 7

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:18ff8ffa2f5469cdf300e96d841480bee238d2cab412a17c21d2d19496a0065f
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9153eb7556a90d2da5117c750b89677f2a2f061ff3c313f46df6c38a4cb87d1a
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:dc2430dab697377bcd6a7e3abb53148144cddea03a58700422a805d9ffafdffb
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:757a133f8b26c33c87fa40d8f1f34b40fde3c9f02c54fc823016fd9b82f15468
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c5aa4872934f5dc719aa8f5eac1f82c0b2f785298efb2ade859990e7e61ca1cb
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a519af5d090231993b18ad2f27344926080d281d33cbc9df1518236c3001a7c3
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:be36aa77955b9a79322a4f73d1bf2e136303bf2630529fbf8b80bff9da74026a
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:32a20c0dfef9fe79a19c6e59029ca4dd7d7a4e0b4c8dbe7524ee570c0e91a440
3
  size 1089994880
trainer_log.jsonl CHANGED
@@ -204,3 +204,29 @@
204
  {"current_steps": 204, "total_steps": 231, "loss": 0.1045, "lr": 8.278869849454718e-07, "epoch": 6.181818181818182, "percentage": 88.31, "elapsed_time": "1:15:36", "remaining_time": "0:10:00"}
205
  {"current_steps": 205, "total_steps": 231, "loss": 0.0925, "lr": 7.684811715985429e-07, "epoch": 6.212121212121212, "percentage": 88.74, "elapsed_time": "1:15:54", "remaining_time": "0:09:37"}
206
  {"current_steps": 206, "total_steps": 231, "loss": 0.074, "lr": 7.1120165501533e-07, "epoch": 6.242424242424242, "percentage": 89.18, "elapsed_time": "1:16:12", "remaining_time": "0:09:14"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
204
  {"current_steps": 204, "total_steps": 231, "loss": 0.1045, "lr": 8.278869849454718e-07, "epoch": 6.181818181818182, "percentage": 88.31, "elapsed_time": "1:15:36", "remaining_time": "0:10:00"}
205
  {"current_steps": 205, "total_steps": 231, "loss": 0.0925, "lr": 7.684811715985429e-07, "epoch": 6.212121212121212, "percentage": 88.74, "elapsed_time": "1:15:54", "remaining_time": "0:09:37"}
206
  {"current_steps": 206, "total_steps": 231, "loss": 0.074, "lr": 7.1120165501533e-07, "epoch": 6.242424242424242, "percentage": 89.18, "elapsed_time": "1:16:12", "remaining_time": "0:09:14"}
207
+ {"current_steps": 207, "total_steps": 231, "loss": 0.0755, "lr": 6.560616283932897e-07, "epoch": 6.2727272727272725, "percentage": 89.61, "elapsed_time": "1:16:32", "remaining_time": "0:08:52"}
208
+ {"current_steps": 208, "total_steps": 231, "loss": 0.0771, "lr": 6.030737921409169e-07, "epoch": 6.303030303030303, "percentage": 90.04, "elapsed_time": "1:16:51", "remaining_time": "0:08:29"}
209
+ {"current_steps": 209, "total_steps": 231, "loss": 0.0765, "lr": 5.522503509524591e-07, "epoch": 6.333333333333333, "percentage": 90.48, "elapsed_time": "1:17:07", "remaining_time": "0:08:07"}
210
+ {"current_steps": 210, "total_steps": 231, "loss": 0.0698, "lr": 5.036030109968082e-07, "epoch": 6.363636363636363, "percentage": 90.91, "elapsed_time": "1:17:27", "remaining_time": "0:07:44"}
211
+ {"current_steps": 211, "total_steps": 231, "loss": 0.0911, "lr": 4.5714297722121105e-07, "epoch": 6.393939393939394, "percentage": 91.34, "elapsed_time": "1:17:48", "remaining_time": "0:07:22"}
212
+ {"current_steps": 212, "total_steps": 231, "loss": 0.0915, "lr": 4.128809507704445e-07, "epoch": 6.424242424242424, "percentage": 91.77, "elapsed_time": "1:18:14", "remaining_time": "0:07:00"}
213
+ {"current_steps": 213, "total_steps": 231, "loss": 0.0951, "lr": 3.708271265220087e-07, "epoch": 6.454545454545454, "percentage": 92.21, "elapsed_time": "1:18:31", "remaining_time": "0:06:38"}
214
+ {"current_steps": 214, "total_steps": 231, "loss": 0.0714, "lr": 3.309911907379393e-07, "epoch": 6.484848484848484, "percentage": 92.64, "elapsed_time": "1:18:50", "remaining_time": "0:06:15"}
215
+ {"current_steps": 215, "total_steps": 231, "loss": 0.0919, "lr": 2.9338231883378365e-07, "epoch": 6.515151515151516, "percentage": 93.07, "elapsed_time": "1:19:10", "remaining_time": "0:05:53"}
216
+ {"current_steps": 216, "total_steps": 231, "loss": 0.0955, "lr": 2.5800917326521013e-07, "epoch": 6.545454545454545, "percentage": 93.51, "elapsed_time": "1:19:30", "remaining_time": "0:05:31"}
217
+ {"current_steps": 217, "total_steps": 231, "loss": 0.0898, "lr": 2.248799015327907e-07, "epoch": 6.575757575757576, "percentage": 93.94, "elapsed_time": "1:19:49", "remaining_time": "0:05:08"}
218
+ {"current_steps": 218, "total_steps": 231, "loss": 0.0875, "lr": 1.9400213430538773e-07, "epoch": 6.606060606060606, "percentage": 94.37, "elapsed_time": "1:20:05", "remaining_time": "0:04:46"}
219
+ {"current_steps": 219, "total_steps": 231, "loss": 0.0776, "lr": 1.6538298366257975e-07, "epoch": 6.636363636363637, "percentage": 94.81, "elapsed_time": "1:20:21", "remaining_time": "0:04:24"}
220
+ {"current_steps": 220, "total_steps": 231, "loss": 0.0698, "lr": 1.3902904145653094e-07, "epoch": 6.666666666666667, "percentage": 95.24, "elapsed_time": "1:20:35", "remaining_time": "0:04:01"}
221
+ {"current_steps": 221, "total_steps": 231, "loss": 0.0977, "lr": 1.1494637779369766e-07, "epoch": 6.696969696969697, "percentage": 95.67, "elapsed_time": "1:20:58", "remaining_time": "0:03:39"}
222
+ {"current_steps": 222, "total_steps": 231, "loss": 0.0729, "lr": 9.314053963669245e-08, "epoch": 6.7272727272727275, "percentage": 96.1, "elapsed_time": "1:21:21", "remaining_time": "0:03:17"}
223
+ {"current_steps": 223, "total_steps": 231, "loss": 0.1075, "lr": 7.361654952665608e-08, "epoch": 6.757575757575758, "percentage": 96.54, "elapsed_time": "1:21:37", "remaining_time": "0:02:55"}
224
+ {"current_steps": 224, "total_steps": 231, "loss": 0.0876, "lr": 5.637890442641403e-08, "epoch": 6.787878787878788, "percentage": 96.97, "elapsed_time": "1:21:54", "remaining_time": "0:02:33"}
225
+ {"current_steps": 225, "total_steps": 231, "loss": 0.0636, "lr": 4.143157468468717e-08, "epoch": 6.818181818181818, "percentage": 97.4, "elapsed_time": "1:22:11", "remaining_time": "0:02:11"}
226
+ {"current_steps": 226, "total_steps": 231, "loss": 0.0849, "lr": 2.8778003121607834e-08, "epoch": 6.848484848484849, "percentage": 97.84, "elapsed_time": "1:22:29", "remaining_time": "0:01:49"}
227
+ {"current_steps": 227, "total_steps": 231, "loss": 0.0816, "lr": 1.8421104235727406e-08, "epoch": 6.878787878787879, "percentage": 98.27, "elapsed_time": "1:22:41", "remaining_time": "0:01:27"}
228
+ {"current_steps": 228, "total_steps": 231, "loss": 0.1109, "lr": 1.0363263532724433e-08, "epoch": 6.909090909090909, "percentage": 98.7, "elapsed_time": "1:23:04", "remaining_time": "0:01:05"}
229
+ {"current_steps": 229, "total_steps": 231, "loss": 0.0824, "lr": 4.606336975948589e-09, "epoch": 6.9393939393939394, "percentage": 99.13, "elapsed_time": "1:23:24", "remaining_time": "0:00:43"}
230
+ {"current_steps": 230, "total_steps": 231, "loss": 0.0673, "lr": 1.1516505589381777e-09, "epoch": 6.96969696969697, "percentage": 99.57, "elapsed_time": "1:23:42", "remaining_time": "0:00:21"}
231
+ {"current_steps": 231, "total_steps": 231, "loss": 0.0905, "lr": 0.0, "epoch": 7.0, "percentage": 100.0, "elapsed_time": "1:24:00", "remaining_time": "0:00:00"}
232
+ {"current_steps": 231, "total_steps": 231, "epoch": 7.0, "percentage": 100.0, "elapsed_time": "1:27:25", "remaining_time": "0:00:00"}