sedrickkeh commited on
Commit
c6521ec
·
verified ·
1 Parent(s): a96ff32

Training in progress, epoch 12

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f18b8b25f6b2de3e74c05c8c5d733b3a29bdab42bc02d047e8c1293ab338f8c6
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:85acbc9cf83ae371dbac185ab927dc2c0fb87ec4711f4d56ebfcddd1346c2a9f
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:da5861909ed62219ff2817d98df4163d1725a6543906cb8113b911ed0cbcb689
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b2daf2d99097616b68102a2e950dd305f4d6d0b74e88906e33716c55be1eb6b
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:051bafaba83fd72715a1f881b954fb651fc0cf95d6e9debf7624404493df70a9
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:43887f949f28796b05ddf3d10bcf615ca68656698e9e13cf50caf4f0f1a2ee05
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:45748dcc8ef9766321d66a39629bd033628658ab675dbcf0d1a0a8bf08f2d7de
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fb990bd1b00a85af12e9532a1dc8d3c9a6be608405d29db01674659d668064c4
3
  size 1089994880
trainer_log.jsonl CHANGED
@@ -115,3 +115,13 @@
115
  {"current_steps": 115, "total_steps": 130, "loss": 0.3481, "lr": 4.001027817058789e-07, "epoch": 11.04, "percentage": 88.46, "elapsed_time": "1:53:30", "remaining_time": "0:14:48"}
116
  {"current_steps": 116, "total_steps": 130, "loss": 0.2101, "lr": 3.49143333753309e-07, "epoch": 11.136, "percentage": 89.23, "elapsed_time": "1:54:26", "remaining_time": "0:13:48"}
117
  {"current_steps": 117, "total_steps": 130, "loss": 0.2186, "lr": 3.015368960704584e-07, "epoch": 11.232, "percentage": 90.0, "elapsed_time": "1:55:20", "remaining_time": "0:12:48"}
 
 
 
 
 
 
 
 
 
 
 
115
  {"current_steps": 115, "total_steps": 130, "loss": 0.3481, "lr": 4.001027817058789e-07, "epoch": 11.04, "percentage": 88.46, "elapsed_time": "1:53:30", "remaining_time": "0:14:48"}
116
  {"current_steps": 116, "total_steps": 130, "loss": 0.2101, "lr": 3.49143333753309e-07, "epoch": 11.136, "percentage": 89.23, "elapsed_time": "1:54:26", "remaining_time": "0:13:48"}
117
  {"current_steps": 117, "total_steps": 130, "loss": 0.2186, "lr": 3.015368960704584e-07, "epoch": 11.232, "percentage": 90.0, "elapsed_time": "1:55:20", "remaining_time": "0:12:48"}
118
+ {"current_steps": 118, "total_steps": 130, "loss": 0.2138, "lr": 2.573177902642726e-07, "epoch": 11.328, "percentage": 90.77, "elapsed_time": "1:56:11", "remaining_time": "0:11:48"}
119
+ {"current_steps": 119, "total_steps": 130, "loss": 0.2177, "lr": 2.1651789586287442e-07, "epoch": 11.424, "percentage": 91.54, "elapsed_time": "1:57:07", "remaining_time": "0:10:49"}
120
+ {"current_steps": 120, "total_steps": 130, "loss": 0.2061, "lr": 1.7916662733218848e-07, "epoch": 11.52, "percentage": 92.31, "elapsed_time": "1:58:02", "remaining_time": "0:09:50"}
121
+ {"current_steps": 121, "total_steps": 130, "loss": 0.2153, "lr": 1.4529091286973994e-07, "epoch": 11.616, "percentage": 93.08, "elapsed_time": "1:58:52", "remaining_time": "0:08:50"}
122
+ {"current_steps": 122, "total_steps": 130, "loss": 0.2386, "lr": 1.1491517499091498e-07, "epoch": 11.712, "percentage": 93.85, "elapsed_time": "1:59:42", "remaining_time": "0:07:50"}
123
+ {"current_steps": 123, "total_steps": 130, "loss": 0.2242, "lr": 8.80613129216762e-08, "epoch": 11.808, "percentage": 94.62, "elapsed_time": "2:00:36", "remaining_time": "0:06:51"}
124
+ {"current_steps": 124, "total_steps": 130, "loss": 0.2041, "lr": 6.474868681043578e-08, "epoch": 11.904, "percentage": 95.38, "elapsed_time": "2:01:24", "remaining_time": "0:05:52"}
125
+ {"current_steps": 125, "total_steps": 130, "loss": 0.3536, "lr": 4.499410377045765e-08, "epoch": 12.0, "percentage": 96.15, "elapsed_time": "2:02:26", "remaining_time": "0:04:53"}
126
+ {"current_steps": 126, "total_steps": 130, "loss": 0.2289, "lr": 2.8811805762860578e-08, "epoch": 12.096, "percentage": 96.92, "elapsed_time": "2:04:26", "remaining_time": "0:03:57"}
127
+ {"current_steps": 127, "total_steps": 130, "loss": 0.213, "lr": 1.6213459328950355e-08, "epoch": 12.192, "percentage": 97.69, "elapsed_time": "2:05:19", "remaining_time": "0:02:57"}