neginr commited on
Commit
e020c6b
·
verified ·
1 Parent(s): 5fc0a8c

Training in progress, epoch 7

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:86df7b6301e7206f1a7a0ad0d65c78f6efaf18ec6367c568bb75faa4908f6f1b
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7ac732aeeee81fc0b4e4143b1012c48de7f6b3e6d202bfa2f93693821f743089
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:52f10facb64bf12df78cc2e4e3fc5027d2fdd824a86841e4e7171bb31b48f5b2
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cbe27b996ff6ead1ea52867303b4319d39e11bc2fbbb6dbdd92de795eb9111e3
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:449b7e1081793d1bc5be797aa516ac10c666463b0a98b57acd2c8bb89a7261c6
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1bae8222c0e42f155fe932620ecb697633b7c3cbf0cc017c2ec427cd6abebb1b
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7caa97156029201abd9363ce9ac82736c830c654cd8e6391e1d1eec71e3eb4e8
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:26536eee75f4a58196852e0dfa9d168bd5e321b718549ae41c9b5773864baf59
3
  size 1089994880
trainer_log.jsonl CHANGED
@@ -208,3 +208,25 @@
208
  {"current_steps": 208, "total_steps": 231, "loss": 0.0848, "lr": 6.030737921409169e-07, "epoch": 6.303030303030303, "percentage": 90.04, "elapsed_time": "0:58:46", "remaining_time": "0:06:29"}
209
  {"current_steps": 209, "total_steps": 231, "loss": 0.0693, "lr": 5.522503509524591e-07, "epoch": 6.333333333333333, "percentage": 90.48, "elapsed_time": "0:59:00", "remaining_time": "0:06:12"}
210
  {"current_steps": 210, "total_steps": 231, "loss": 0.0698, "lr": 5.036030109968082e-07, "epoch": 6.363636363636363, "percentage": 90.91, "elapsed_time": "0:59:13", "remaining_time": "0:05:55"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
208
  {"current_steps": 208, "total_steps": 231, "loss": 0.0848, "lr": 6.030737921409169e-07, "epoch": 6.303030303030303, "percentage": 90.04, "elapsed_time": "0:58:46", "remaining_time": "0:06:29"}
209
  {"current_steps": 209, "total_steps": 231, "loss": 0.0693, "lr": 5.522503509524591e-07, "epoch": 6.333333333333333, "percentage": 90.48, "elapsed_time": "0:59:00", "remaining_time": "0:06:12"}
210
  {"current_steps": 210, "total_steps": 231, "loss": 0.0698, "lr": 5.036030109968082e-07, "epoch": 6.363636363636363, "percentage": 90.91, "elapsed_time": "0:59:13", "remaining_time": "0:05:55"}
211
+ {"current_steps": 211, "total_steps": 231, "loss": 0.0981, "lr": 4.5714297722121105e-07, "epoch": 6.393939393939394, "percentage": 91.34, "elapsed_time": "0:59:29", "remaining_time": "0:05:38"}
212
+ {"current_steps": 212, "total_steps": 231, "loss": 0.0704, "lr": 4.128809507704445e-07, "epoch": 6.424242424242424, "percentage": 91.77, "elapsed_time": "0:59:42", "remaining_time": "0:05:21"}
213
+ {"current_steps": 213, "total_steps": 231, "loss": 0.0925, "lr": 3.708271265220087e-07, "epoch": 6.454545454545454, "percentage": 92.21, "elapsed_time": "0:59:56", "remaining_time": "0:05:03"}
214
+ {"current_steps": 214, "total_steps": 231, "loss": 0.0839, "lr": 3.309911907379393e-07, "epoch": 6.484848484848484, "percentage": 92.64, "elapsed_time": "1:00:14", "remaining_time": "0:04:47"}
215
+ {"current_steps": 215, "total_steps": 231, "loss": 0.089, "lr": 2.9338231883378365e-07, "epoch": 6.515151515151516, "percentage": 93.07, "elapsed_time": "1:00:24", "remaining_time": "0:04:29"}
216
+ {"current_steps": 216, "total_steps": 231, "loss": 0.0791, "lr": 2.5800917326521013e-07, "epoch": 6.545454545454545, "percentage": 93.51, "elapsed_time": "1:00:43", "remaining_time": "0:04:13"}
217
+ {"current_steps": 217, "total_steps": 231, "loss": 0.0794, "lr": 2.248799015327907e-07, "epoch": 6.575757575757576, "percentage": 93.94, "elapsed_time": "1:00:58", "remaining_time": "0:03:56"}
218
+ {"current_steps": 218, "total_steps": 231, "loss": 0.0703, "lr": 1.9400213430538773e-07, "epoch": 6.606060606060606, "percentage": 94.37, "elapsed_time": "1:01:10", "remaining_time": "0:03:38"}
219
+ {"current_steps": 219, "total_steps": 231, "loss": 0.0752, "lr": 1.6538298366257975e-07, "epoch": 6.636363636363637, "percentage": 94.81, "elapsed_time": "1:01:26", "remaining_time": "0:03:21"}
220
+ {"current_steps": 220, "total_steps": 231, "loss": 0.0744, "lr": 1.3902904145653094e-07, "epoch": 6.666666666666667, "percentage": 95.24, "elapsed_time": "1:01:40", "remaining_time": "0:03:05"}
221
+ {"current_steps": 221, "total_steps": 231, "loss": 0.0963, "lr": 1.1494637779369766e-07, "epoch": 6.696969696969697, "percentage": 95.67, "elapsed_time": "1:01:59", "remaining_time": "0:02:48"}
222
+ {"current_steps": 222, "total_steps": 231, "loss": 0.0868, "lr": 9.314053963669245e-08, "epoch": 6.7272727272727275, "percentage": 96.1, "elapsed_time": "1:02:09", "remaining_time": "0:02:31"}
223
+ {"current_steps": 223, "total_steps": 231, "loss": 0.0774, "lr": 7.361654952665608e-08, "epoch": 6.757575757575758, "percentage": 96.54, "elapsed_time": "1:02:21", "remaining_time": "0:02:14"}
224
+ {"current_steps": 224, "total_steps": 231, "loss": 0.0851, "lr": 5.637890442641403e-08, "epoch": 6.787878787878788, "percentage": 96.97, "elapsed_time": "1:02:35", "remaining_time": "0:01:57"}
225
+ {"current_steps": 225, "total_steps": 231, "loss": 0.1035, "lr": 4.143157468468717e-08, "epoch": 6.818181818181818, "percentage": 97.4, "elapsed_time": "1:02:49", "remaining_time": "0:01:40"}
226
+ {"current_steps": 226, "total_steps": 231, "loss": 0.0856, "lr": 2.8778003121607834e-08, "epoch": 6.848484848484849, "percentage": 97.84, "elapsed_time": "1:03:01", "remaining_time": "0:01:23"}
227
+ {"current_steps": 227, "total_steps": 231, "loss": 0.0522, "lr": 1.8421104235727406e-08, "epoch": 6.878787878787879, "percentage": 98.27, "elapsed_time": "1:03:14", "remaining_time": "0:01:06"}
228
+ {"current_steps": 228, "total_steps": 231, "loss": 0.0615, "lr": 1.0363263532724433e-08, "epoch": 6.909090909090909, "percentage": 98.7, "elapsed_time": "1:03:24", "remaining_time": "0:00:50"}
229
+ {"current_steps": 229, "total_steps": 231, "loss": 0.0772, "lr": 4.606336975948589e-09, "epoch": 6.9393939393939394, "percentage": 99.13, "elapsed_time": "1:03:35", "remaining_time": "0:00:33"}
230
+ {"current_steps": 230, "total_steps": 231, "loss": 0.0753, "lr": 1.1516505589381777e-09, "epoch": 6.96969696969697, "percentage": 99.57, "elapsed_time": "1:03:48", "remaining_time": "0:00:16"}
231
+ {"current_steps": 231, "total_steps": 231, "loss": 0.0692, "lr": 0.0, "epoch": 7.0, "percentage": 100.0, "elapsed_time": "1:04:01", "remaining_time": "0:00:00"}
232
+ {"current_steps": 231, "total_steps": 231, "epoch": 7.0, "percentage": 100.0, "elapsed_time": "1:07:20", "remaining_time": "0:00:00"}