neginr committed on
Commit
7543017
·
verified ·
1 Parent(s): 88f589c

Training in progress, epoch 13

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ecce232892ac44c65c0daba70b88d6db50cd6eb695a9ca15e485f37bb55d6692
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ff4157406d2be970ec9e50a9a37e6bae2b211686993cecd7c9777ae672248531
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a036c8484d5d33911c894f7dbc4ea44a3539765a79221fdf48f430b9f5b66fbd
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:27c9f990e8223dd779fd084d890da46e78c194ed4c372ac27ad21f1ec811adcc
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ec6d40cd9fb3a43f3db5b9be63c6efbefab90af8f2dc5d907004cd8d7d84dc63
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5c15e0160675dce8ae8aed1d254f233a410449c7de7d53adcc587c240f7ed9c7
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:84224f4194b8c3ed6b6b81258330dd6916e3cd5f4fdb4f46b881141393242700
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1228d353a83a0c9be92e29165f8d3269e60d72a5a27c429ba396ebcf36f5168f
3
  size 1089994880
trainer_log.jsonl CHANGED
@@ -119,3 +119,13 @@
119
  {"current_steps": 119, "total_steps": 130, "loss": 0.1438, "lr": 2.1651789586287442e-07, "epoch": 11.9, "percentage": 91.54, "elapsed_time": "0:38:55", "remaining_time": "0:03:35"}
120
  {"current_steps": 120, "total_steps": 130, "loss": 0.0711, "lr": 1.7916662733218848e-07, "epoch": 12.0, "percentage": 92.31, "elapsed_time": "0:39:02", "remaining_time": "0:03:15"}
121
  {"current_steps": 121, "total_steps": 130, "loss": 0.1147, "lr": 1.4529091286973994e-07, "epoch": 12.1, "percentage": 93.08, "elapsed_time": "0:41:14", "remaining_time": "0:03:04"}
 
 
 
 
 
 
 
 
 
 
 
119
  {"current_steps": 119, "total_steps": 130, "loss": 0.1438, "lr": 2.1651789586287442e-07, "epoch": 11.9, "percentage": 91.54, "elapsed_time": "0:38:55", "remaining_time": "0:03:35"}
120
  {"current_steps": 120, "total_steps": 130, "loss": 0.0711, "lr": 1.7916662733218848e-07, "epoch": 12.0, "percentage": 92.31, "elapsed_time": "0:39:02", "remaining_time": "0:03:15"}
121
  {"current_steps": 121, "total_steps": 130, "loss": 0.1147, "lr": 1.4529091286973994e-07, "epoch": 12.1, "percentage": 93.08, "elapsed_time": "0:41:14", "remaining_time": "0:03:04"}
122
+ {"current_steps": 122, "total_steps": 130, "loss": 0.0725, "lr": 1.1491517499091498e-07, "epoch": 12.2, "percentage": 93.85, "elapsed_time": "0:41:23", "remaining_time": "0:02:42"}
123
+ {"current_steps": 123, "total_steps": 130, "loss": 0.1093, "lr": 8.80613129216762e-08, "epoch": 12.3, "percentage": 94.62, "elapsed_time": "0:41:32", "remaining_time": "0:02:21"}
124
+ {"current_steps": 124, "total_steps": 130, "loss": 0.0863, "lr": 6.474868681043578e-08, "epoch": 12.4, "percentage": 95.38, "elapsed_time": "0:41:43", "remaining_time": "0:02:01"}
125
+ {"current_steps": 125, "total_steps": 130, "loss": 0.1132, "lr": 4.499410377045765e-08, "epoch": 12.5, "percentage": 96.15, "elapsed_time": "0:41:54", "remaining_time": "0:01:40"}
126
+ {"current_steps": 126, "total_steps": 130, "loss": 0.1052, "lr": 2.8811805762860578e-08, "epoch": 12.6, "percentage": 96.92, "elapsed_time": "0:42:04", "remaining_time": "0:01:20"}
127
+ {"current_steps": 127, "total_steps": 130, "loss": 0.0705, "lr": 1.6213459328950355e-08, "epoch": 12.7, "percentage": 97.69, "elapsed_time": "0:42:11", "remaining_time": "0:00:59"}
128
+ {"current_steps": 128, "total_steps": 130, "loss": 0.1106, "lr": 7.2081471792911914e-09, "epoch": 12.8, "percentage": 98.46, "elapsed_time": "0:42:19", "remaining_time": "0:00:39"}
129
+ {"current_steps": 129, "total_steps": 130, "loss": 0.075, "lr": 1.8023616455731253e-09, "epoch": 12.9, "percentage": 99.23, "elapsed_time": "0:42:25", "remaining_time": "0:00:19"}
130
+ {"current_steps": 130, "total_steps": 130, "loss": 0.1035, "lr": 0.0, "epoch": 13.0, "percentage": 100.0, "elapsed_time": "0:42:35", "remaining_time": "0:00:00"}
131
+ {"current_steps": 130, "total_steps": 130, "epoch": 13.0, "percentage": 100.0, "elapsed_time": "0:47:16", "remaining_time": "0:00:00"}