Training in progress, epoch 6
Browse files
model-00001-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4877660776
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9799b0e1ad66cfcfd87c9fd4924b81edd5d69f41e7267a83adbb91b4fb7bef4e
|
3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4932751008
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a9cf1d4bcc583ef4cda420e387cff0d2e726a30853b256a9df451f6a5fa497bd
|
3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4330865200
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6f32de4ebec72c5b7f2b8d7f15e38dc9a2741b7db455e8e5c2bd9950038924f4
|
3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1089994880
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:34a2cba4f3fe657317a30f2cb8d83b480f10bcc36ff55634ef2e907957a5396a
|
3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
@@ -195,3 +195,31 @@
|
|
195 |
{"current_steps": 195, "total_steps": 224, "loss": 0.4538, "lr": 1.0097768704058542e-06, "epoch": 5.962025316455696, "percentage": 87.05, "elapsed_time": "5:25:33", "remaining_time": "0:48:24"}
|
196 |
{"current_steps": 196, "total_steps": 224, "loss": 0.4218, "lr": 9.424343531000968e-07, "epoch": 5.992405063291139, "percentage": 87.5, "elapsed_time": "5:27:02", "remaining_time": "0:46:43"}
|
197 |
{"current_steps": 197, "total_steps": 224, "loss": 0.3992, "lr": 8.773044733510338e-07, "epoch": 6.030379746835443, "percentage": 87.95, "elapsed_time": "5:29:50", "remaining_time": "0:45:12"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
195 |
{"current_steps": 195, "total_steps": 224, "loss": 0.4538, "lr": 1.0097768704058542e-06, "epoch": 5.962025316455696, "percentage": 87.05, "elapsed_time": "5:25:33", "remaining_time": "0:48:24"}
|
196 |
{"current_steps": 196, "total_steps": 224, "loss": 0.4218, "lr": 9.424343531000968e-07, "epoch": 5.992405063291139, "percentage": 87.5, "elapsed_time": "5:27:02", "remaining_time": "0:46:43"}
|
197 |
{"current_steps": 197, "total_steps": 224, "loss": 0.3992, "lr": 8.773044733510338e-07, "epoch": 6.030379746835443, "percentage": 87.95, "elapsed_time": "5:29:50", "remaining_time": "0:45:12"}
|
198 |
+
{"current_steps": 198, "total_steps": 224, "loss": 0.4266, "lr": 8.144031414842012e-07, "epoch": 6.060759493670886, "percentage": 88.39, "elapsed_time": "5:31:27", "remaining_time": "0:43:31"}
|
199 |
+
{"current_steps": 199, "total_steps": 224, "loss": 0.4318, "lr": 7.537457234218271e-07, "epoch": 6.091139240506329, "percentage": 88.84, "elapsed_time": "5:33:11", "remaining_time": "0:41:51"}
|
200 |
+
{"current_steps": 200, "total_steps": 224, "loss": 0.3855, "lr": 6.953470369291349e-07, "epoch": 6.121518987341772, "percentage": 89.29, "elapsed_time": "5:34:42", "remaining_time": "0:40:09"}
|
201 |
+
{"current_steps": 201, "total_steps": 224, "loss": 0.3982, "lr": 6.392213479945852e-07, "epoch": 6.151898734177215, "percentage": 89.73, "elapsed_time": "5:36:10", "remaining_time": "0:38:28"}
|
202 |
+
{"current_steps": 202, "total_steps": 224, "loss": 0.3997, "lr": 5.853823673448877e-07, "epoch": 6.182278481012658, "percentage": 90.18, "elapsed_time": "5:37:39", "remaining_time": "0:36:46"}
|
203 |
+
{"current_steps": 203, "total_steps": 224, "loss": 0.4078, "lr": 5.33843247095659e-07, "epoch": 6.2126582278481015, "percentage": 90.62, "elapsed_time": "5:39:22", "remaining_time": "0:35:06"}
|
204 |
+
{"current_steps": 204, "total_steps": 224, "loss": 0.4125, "lr": 4.846165775385459e-07, "epoch": 6.243037974683545, "percentage": 91.07, "elapsed_time": "5:41:04", "remaining_time": "0:33:26"}
|
205 |
+
{"current_steps": 205, "total_steps": 224, "loss": 0.3987, "lr": 4.3771438406559173e-07, "epoch": 6.273417721518987, "percentage": 91.52, "elapsed_time": "5:42:36", "remaining_time": "0:31:45"}
|
206 |
+
{"current_steps": 206, "total_steps": 224, "loss": 0.3957, "lr": 3.931481242315993e-07, "epoch": 6.30379746835443, "percentage": 91.96, "elapsed_time": "5:44:03", "remaining_time": "0:30:03"}
|
207 |
+
{"current_steps": 207, "total_steps": 224, "loss": 0.4177, "lr": 3.5092868495520294e-07, "epoch": 6.334177215189873, "percentage": 92.41, "elapsed_time": "5:45:52", "remaining_time": "0:28:24"}
|
208 |
+
{"current_steps": 208, "total_steps": 224, "loss": 0.3776, "lr": 3.110663798593616e-07, "epoch": 6.364556962025317, "percentage": 92.86, "elapsed_time": "5:47:22", "remaining_time": "0:26:43"}
|
209 |
+
{"current_steps": 209, "total_steps": 224, "loss": 0.3958, "lr": 2.735709467518699e-07, "epoch": 6.39493670886076, "percentage": 93.3, "elapsed_time": "5:49:09", "remaining_time": "0:25:03"}
|
210 |
+
{"current_steps": 210, "total_steps": 224, "loss": 0.4096, "lr": 2.384515452465475e-07, "epoch": 6.425316455696202, "percentage": 93.75, "elapsed_time": "5:50:46", "remaining_time": "0:23:23"}
|
211 |
+
{"current_steps": 211, "total_steps": 224, "loss": 0.4089, "lr": 2.0571675452567997e-07, "epoch": 6.455696202531645, "percentage": 94.2, "elapsed_time": "5:52:26", "remaining_time": "0:21:42"}
|
212 |
+
{"current_steps": 212, "total_steps": 224, "loss": 0.4003, "lr": 1.7537457124423896e-07, "epoch": 6.4860759493670885, "percentage": 94.64, "elapsed_time": "5:54:03", "remaining_time": "0:20:02"}
|
213 |
+
{"current_steps": 213, "total_steps": 224, "loss": 0.393, "lr": 1.474324075764111e-07, "epoch": 6.516455696202532, "percentage": 95.09, "elapsed_time": "5:55:52", "remaining_time": "0:18:22"}
|
214 |
+
{"current_steps": 214, "total_steps": 224, "loss": 0.4313, "lr": 1.2189708940490653e-07, "epoch": 6.546835443037975, "percentage": 95.54, "elapsed_time": "5:57:22", "remaining_time": "0:16:41"}
|
215 |
+
{"current_steps": 215, "total_steps": 224, "loss": 0.4221, "lr": 9.877485465349057e-08, "epoch": 6.577215189873417, "percentage": 95.98, "elapsed_time": "5:58:59", "remaining_time": "0:15:01"}
|
216 |
+
{"current_steps": 216, "total_steps": 224, "loss": 0.3746, "lr": 7.807135176314707e-08, "epoch": 6.6075949367088604, "percentage": 96.43, "elapsed_time": "6:00:40", "remaining_time": "0:13:21"}
|
217 |
+
{"current_steps": 217, "total_steps": 224, "loss": 0.3625, "lr": 5.979163831223988e-08, "epoch": 6.637974683544304, "percentage": 96.88, "elapsed_time": "6:02:18", "remaining_time": "0:11:41"}
|
218 |
+
{"current_steps": 218, "total_steps": 224, "loss": 0.4116, "lr": 4.394017978101905e-08, "epoch": 6.668354430379747, "percentage": 97.32, "elapsed_time": "6:03:58", "remaining_time": "0:10:01"}
|
219 |
+
{"current_steps": 219, "total_steps": 224, "loss": 0.3864, "lr": 3.0520848460765525e-08, "epoch": 6.69873417721519, "percentage": 97.77, "elapsed_time": "6:05:29", "remaining_time": "0:08:20"}
|
220 |
+
{"current_steps": 220, "total_steps": 224, "loss": 0.4204, "lr": 1.9536922507841227e-08, "epoch": 6.729113924050633, "percentage": 98.21, "elapsed_time": "6:07:12", "remaining_time": "0:06:40"}
|
221 |
+
{"current_steps": 221, "total_steps": 224, "loss": 0.3968, "lr": 1.099108514288627e-08, "epoch": 6.759493670886076, "percentage": 98.66, "elapsed_time": "6:08:44", "remaining_time": "0:05:00"}
|
222 |
+
{"current_steps": 222, "total_steps": 224, "loss": 0.4067, "lr": 4.885423995341088e-09, "epoch": 6.789873417721519, "percentage": 99.11, "elapsed_time": "6:10:24", "remaining_time": "0:03:20"}
|
223 |
+
{"current_steps": 223, "total_steps": 224, "loss": 0.3949, "lr": 1.2214305934699078e-09, "epoch": 6.820253164556962, "percentage": 99.55, "elapsed_time": "6:12:07", "remaining_time": "0:01:40"}
|
224 |
+
{"current_steps": 224, "total_steps": 224, "loss": 0.4155, "lr": 0.0, "epoch": 6.850632911392405, "percentage": 100.0, "elapsed_time": "6:13:47", "remaining_time": "0:00:00"}
|
225 |
+
{"current_steps": 224, "total_steps": 224, "epoch": 6.850632911392405, "percentage": 100.0, "elapsed_time": "6:16:00", "remaining_time": "0:00:00"}
|