ryanmarten commited on
Commit
71037f4
·
verified ·
1 Parent(s): 99d11eb

Training in progress, epoch 6

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:908643f5f9c86968afd1568dcefa046d210137aa9d3b31959c426597f0bbe1e8
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1dcb03405f854a31eb5a94e9b8647ab6e2a07055dcc4dda6d622dd7fea888f03
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:416f1313cc70886827d37a7844eb6babcf075e627df1f7ab4cd89d2aee40fb86
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:33634cc11b06be9819ce0ee3d61771dfa1acf897d682186efbd1aeff4c543f63
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cb1942f1a98671cb26d60515fe30d0748b78fcd2898e97fd5914cbc2b4a86812
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bbdd70941027a4bdf2850e034fb84ed6f67e4c98aa4199b707935aa66f7d1cd5
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d2f37cddbf23b7da3ac97c49db6bf2f1d4017c33d7737bd8798d033263f00459
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:19e7508ff7b343e2107818b59c27ca0e7719cb159a9d86b1672eb9e89dc957ec
3
  size 1089994880
trainer_log.jsonl CHANGED
@@ -195,3 +195,31 @@
195
  {"current_steps": 195, "total_steps": 224, "loss": 0.4549, "lr": 1.0097768704058542e-06, "epoch": 5.962025316455696, "percentage": 87.05, "elapsed_time": "6:35:34", "remaining_time": "0:58:49"}
196
  {"current_steps": 196, "total_steps": 224, "loss": 0.4376, "lr": 9.424343531000968e-07, "epoch": 5.992405063291139, "percentage": 87.5, "elapsed_time": "6:37:33", "remaining_time": "0:56:47"}
197
  {"current_steps": 197, "total_steps": 224, "loss": 0.4275, "lr": 8.773044733510338e-07, "epoch": 6.030379746835443, "percentage": 87.95, "elapsed_time": "6:40:33", "remaining_time": "0:54:53"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
195
  {"current_steps": 195, "total_steps": 224, "loss": 0.4549, "lr": 1.0097768704058542e-06, "epoch": 5.962025316455696, "percentage": 87.05, "elapsed_time": "6:35:34", "remaining_time": "0:58:49"}
196
  {"current_steps": 196, "total_steps": 224, "loss": 0.4376, "lr": 9.424343531000968e-07, "epoch": 5.992405063291139, "percentage": 87.5, "elapsed_time": "6:37:33", "remaining_time": "0:56:47"}
197
  {"current_steps": 197, "total_steps": 224, "loss": 0.4275, "lr": 8.773044733510338e-07, "epoch": 6.030379746835443, "percentage": 87.95, "elapsed_time": "6:40:33", "remaining_time": "0:54:53"}
198
+ {"current_steps": 198, "total_steps": 224, "loss": 0.4399, "lr": 8.144031414842012e-07, "epoch": 6.060759493670886, "percentage": 88.39, "elapsed_time": "6:42:41", "remaining_time": "0:52:52"}
199
+ {"current_steps": 199, "total_steps": 224, "loss": 0.4305, "lr": 7.537457234218271e-07, "epoch": 6.091139240506329, "percentage": 88.84, "elapsed_time": "6:44:36", "remaining_time": "0:50:49"}
200
+ {"current_steps": 200, "total_steps": 224, "loss": 0.4333, "lr": 6.953470369291349e-07, "epoch": 6.121518987341772, "percentage": 89.29, "elapsed_time": "6:46:44", "remaining_time": "0:48:48"}
201
+ {"current_steps": 201, "total_steps": 224, "loss": 0.4128, "lr": 6.392213479945852e-07, "epoch": 6.151898734177215, "percentage": 89.73, "elapsed_time": "6:48:36", "remaining_time": "0:46:45"}
202
+ {"current_steps": 202, "total_steps": 224, "loss": 0.4265, "lr": 5.853823673448877e-07, "epoch": 6.182278481012658, "percentage": 90.18, "elapsed_time": "6:50:32", "remaining_time": "0:44:42"}
203
+ {"current_steps": 203, "total_steps": 224, "loss": 0.4233, "lr": 5.33843247095659e-07, "epoch": 6.2126582278481015, "percentage": 90.62, "elapsed_time": "6:52:36", "remaining_time": "0:42:40"}
204
+ {"current_steps": 204, "total_steps": 224, "loss": 0.4267, "lr": 4.846165775385459e-07, "epoch": 6.243037974683545, "percentage": 91.07, "elapsed_time": "6:54:30", "remaining_time": "0:40:38"}
205
+ {"current_steps": 205, "total_steps": 224, "loss": 0.4405, "lr": 4.3771438406559173e-07, "epoch": 6.273417721518987, "percentage": 91.52, "elapsed_time": "6:56:30", "remaining_time": "0:38:36"}
206
+ {"current_steps": 206, "total_steps": 224, "loss": 0.4217, "lr": 3.931481242315993e-07, "epoch": 6.30379746835443, "percentage": 91.96, "elapsed_time": "6:58:27", "remaining_time": "0:36:33"}
207
+ {"current_steps": 207, "total_steps": 224, "loss": 0.4162, "lr": 3.5092868495520294e-07, "epoch": 6.334177215189873, "percentage": 92.41, "elapsed_time": "7:00:19", "remaining_time": "0:34:31"}
208
+ {"current_steps": 208, "total_steps": 224, "loss": 0.4405, "lr": 3.110663798593616e-07, "epoch": 6.364556962025317, "percentage": 92.86, "elapsed_time": "7:02:22", "remaining_time": "0:32:29"}
209
+ {"current_steps": 209, "total_steps": 224, "loss": 0.4126, "lr": 2.735709467518699e-07, "epoch": 6.39493670886076, "percentage": 93.3, "elapsed_time": "7:04:16", "remaining_time": "0:30:27"}
210
+ {"current_steps": 210, "total_steps": 224, "loss": 0.4179, "lr": 2.384515452465475e-07, "epoch": 6.425316455696202, "percentage": 93.75, "elapsed_time": "7:06:08", "remaining_time": "0:28:24"}
211
+ {"current_steps": 211, "total_steps": 224, "loss": 0.4231, "lr": 2.0571675452567997e-07, "epoch": 6.455696202531645, "percentage": 94.2, "elapsed_time": "7:07:52", "remaining_time": "0:26:21"}
212
+ {"current_steps": 212, "total_steps": 224, "loss": 0.4134, "lr": 1.7537457124423896e-07, "epoch": 6.4860759493670885, "percentage": 94.64, "elapsed_time": "7:09:57", "remaining_time": "0:24:20"}
213
+ {"current_steps": 213, "total_steps": 224, "loss": 0.4212, "lr": 1.474324075764111e-07, "epoch": 6.516455696202532, "percentage": 95.09, "elapsed_time": "7:12:00", "remaining_time": "0:22:18"}
214
+ {"current_steps": 214, "total_steps": 224, "loss": 0.4217, "lr": 1.2189708940490653e-07, "epoch": 6.546835443037975, "percentage": 95.54, "elapsed_time": "7:13:54", "remaining_time": "0:20:16"}
215
+ {"current_steps": 215, "total_steps": 224, "loss": 0.4196, "lr": 9.877485465349057e-08, "epoch": 6.577215189873417, "percentage": 95.98, "elapsed_time": "7:15:59", "remaining_time": "0:18:15"}
216
+ {"current_steps": 216, "total_steps": 224, "loss": 0.4107, "lr": 7.807135176314707e-08, "epoch": 6.6075949367088604, "percentage": 96.43, "elapsed_time": "7:17:58", "remaining_time": "0:16:13"}
217
+ {"current_steps": 217, "total_steps": 224, "loss": 0.4114, "lr": 5.979163831223988e-08, "epoch": 6.637974683544304, "percentage": 96.88, "elapsed_time": "7:20:06", "remaining_time": "0:14:11"}
218
+ {"current_steps": 218, "total_steps": 224, "loss": 0.4126, "lr": 4.394017978101905e-08, "epoch": 6.668354430379747, "percentage": 97.32, "elapsed_time": "7:22:12", "remaining_time": "0:12:10"}
219
+ {"current_steps": 219, "total_steps": 224, "loss": 0.423, "lr": 3.0520848460765525e-08, "epoch": 6.69873417721519, "percentage": 97.77, "elapsed_time": "7:24:27", "remaining_time": "0:10:08"}
220
+ {"current_steps": 220, "total_steps": 224, "loss": 0.4318, "lr": 1.9536922507841227e-08, "epoch": 6.729113924050633, "percentage": 98.21, "elapsed_time": "7:26:38", "remaining_time": "0:08:07"}
221
+ {"current_steps": 221, "total_steps": 224, "loss": 0.424, "lr": 1.099108514288627e-08, "epoch": 6.759493670886076, "percentage": 98.66, "elapsed_time": "7:28:47", "remaining_time": "0:06:05"}
222
+ {"current_steps": 222, "total_steps": 224, "loss": 0.4227, "lr": 4.885423995341088e-09, "epoch": 6.789873417721519, "percentage": 99.11, "elapsed_time": "7:30:43", "remaining_time": "0:04:03"}
223
+ {"current_steps": 223, "total_steps": 224, "loss": 0.4047, "lr": 1.2214305934699078e-09, "epoch": 6.820253164556962, "percentage": 99.55, "elapsed_time": "7:32:44", "remaining_time": "0:02:01"}
224
+ {"current_steps": 224, "total_steps": 224, "loss": 0.4324, "lr": 0.0, "epoch": 6.850632911392405, "percentage": 100.0, "elapsed_time": "7:34:48", "remaining_time": "0:00:00"}
225
+ {"current_steps": 224, "total_steps": 224, "epoch": 6.850632911392405, "percentage": 100.0, "elapsed_time": "7:36:48", "remaining_time": "0:00:00"}