Training in progress, epoch 5
Browse files
model-00001-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4877660776
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:33f573f37f1faf605923ed02338567c221e6b4846fb7e4e5521c95de52fb3576
|
3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4932751008
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:89675e1c6134de1de248285c8a712c3fe648a1e579b5e75d6de18bfffeb6fb82
|
3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4330865200
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:becebfd12f70af66fd52b6b5a9d974fe503554832b1d7881e7f277d19a576c32
|
3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1089994880
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b3273e84b49c727cbdad40c8479f33c97b14f47a5ff4b64e01b3fd946fc506b1
|
3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
@@ -166,3 +166,37 @@
|
|
166 |
{"current_steps": 166, "total_steps": 224, "loss": 0.1526, "lr": 3.83517761602209e-06, "epoch": 5.0810126582278485, "percentage": 74.11, "elapsed_time": "2:02:14", "remaining_time": "0:42:42"}
|
167 |
{"current_steps": 167, "total_steps": 224, "loss": 0.1462, "lr": 3.712871334091154e-06, "epoch": 5.111392405063291, "percentage": 74.55, "elapsed_time": "2:03:01", "remaining_time": "0:41:59"}
|
168 |
{"current_steps": 168, "total_steps": 224, "loss": 0.146, "lr": 3.592100910419738e-06, "epoch": 5.141772151898734, "percentage": 75.0, "elapsed_time": "2:03:35", "remaining_time": "0:41:11"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
166 |
{"current_steps": 166, "total_steps": 224, "loss": 0.1526, "lr": 3.83517761602209e-06, "epoch": 5.0810126582278485, "percentage": 74.11, "elapsed_time": "2:02:14", "remaining_time": "0:42:42"}
|
167 |
{"current_steps": 167, "total_steps": 224, "loss": 0.1462, "lr": 3.712871334091154e-06, "epoch": 5.111392405063291, "percentage": 74.55, "elapsed_time": "2:03:01", "remaining_time": "0:41:59"}
|
168 |
{"current_steps": 168, "total_steps": 224, "loss": 0.146, "lr": 3.592100910419738e-06, "epoch": 5.141772151898734, "percentage": 75.0, "elapsed_time": "2:03:35", "remaining_time": "0:41:11"}
|
169 |
+
{"current_steps": 169, "total_steps": 224, "loss": 0.1649, "lr": 3.4728958475459052e-06, "epoch": 5.172151898734177, "percentage": 75.45, "elapsed_time": "2:04:09", "remaining_time": "0:40:24"}
|
170 |
+
{"current_steps": 170, "total_steps": 224, "loss": 0.1765, "lr": 3.355285265611784e-06, "epoch": 5.2025316455696204, "percentage": 75.89, "elapsed_time": "2:04:55", "remaining_time": "0:39:40"}
|
171 |
+
{"current_steps": 171, "total_steps": 224, "loss": 0.1491, "lr": 3.2392978952499553e-06, "epoch": 5.232911392405064, "percentage": 76.34, "elapsed_time": "2:05:35", "remaining_time": "0:38:55"}
|
172 |
+
{"current_steps": 172, "total_steps": 224, "loss": 0.15, "lr": 3.1249620705649417e-06, "epoch": 5.263291139240506, "percentage": 76.79, "elapsed_time": "2:06:25", "remaining_time": "0:38:13"}
|
173 |
+
{"current_steps": 173, "total_steps": 224, "loss": 0.1674, "lr": 3.0123057222115835e-06, "epoch": 5.293670886075949, "percentage": 77.23, "elapsed_time": "2:07:06", "remaining_time": "0:37:28"}
|
174 |
+
{"current_steps": 174, "total_steps": 224, "loss": 0.1224, "lr": 2.9013563705719673e-06, "epoch": 5.324050632911392, "percentage": 77.68, "elapsed_time": "2:07:42", "remaining_time": "0:36:41"}
|
175 |
+
{"current_steps": 175, "total_steps": 224, "loss": 0.1749, "lr": 2.7921411190325753e-06, "epoch": 5.3544303797468356, "percentage": 78.12, "elapsed_time": "2:08:29", "remaining_time": "0:35:58"}
|
176 |
+
{"current_steps": 176, "total_steps": 224, "loss": 0.1434, "lr": 2.6846866473633126e-06, "epoch": 5.384810126582279, "percentage": 78.57, "elapsed_time": "2:09:14", "remaining_time": "0:35:14"}
|
177 |
+
{"current_steps": 177, "total_steps": 224, "loss": 0.136, "lr": 2.579019205199992e-06, "epoch": 5.415189873417722, "percentage": 79.02, "elapsed_time": "2:09:54", "remaining_time": "0:34:29"}
|
178 |
+
{"current_steps": 178, "total_steps": 224, "loss": 0.1534, "lr": 2.4751646056319334e-06, "epoch": 5.445569620253164, "percentage": 79.46, "elapsed_time": "2:10:32", "remaining_time": "0:33:44"}
|
179 |
+
{"current_steps": 179, "total_steps": 224, "loss": 0.1533, "lr": 2.373148218896182e-06, "epoch": 5.4759493670886075, "percentage": 79.91, "elapsed_time": "2:11:08", "remaining_time": "0:32:58"}
|
180 |
+
{"current_steps": 180, "total_steps": 224, "loss": 0.1407, "lr": 2.2729949661798876e-06, "epoch": 5.506329113924051, "percentage": 80.36, "elapsed_time": "2:11:45", "remaining_time": "0:32:12"}
|
181 |
+
{"current_steps": 181, "total_steps": 224, "loss": 0.1623, "lr": 2.174729313532433e-06, "epoch": 5.536708860759494, "percentage": 80.8, "elapsed_time": "2:12:30", "remaining_time": "0:31:28"}
|
182 |
+
{"current_steps": 182, "total_steps": 224, "loss": 0.156, "lr": 2.078375265888707e-06, "epoch": 5.567088607594937, "percentage": 81.25, "elapsed_time": "2:13:23", "remaining_time": "0:30:46"}
|
183 |
+
{"current_steps": 183, "total_steps": 224, "loss": 0.1931, "lr": 1.9839563612050273e-06, "epoch": 5.597468354430379, "percentage": 81.7, "elapsed_time": "2:14:12", "remaining_time": "0:30:04"}
|
184 |
+
{"current_steps": 184, "total_steps": 224, "loss": 0.1774, "lr": 1.8914956647091497e-06, "epoch": 5.627848101265823, "percentage": 82.14, "elapsed_time": "2:14:56", "remaining_time": "0:29:20"}
|
185 |
+
{"current_steps": 185, "total_steps": 224, "loss": 0.1459, "lr": 1.8010157632657544e-06, "epoch": 5.658227848101266, "percentage": 82.59, "elapsed_time": "2:15:42", "remaining_time": "0:28:36"}
|
186 |
+
{"current_steps": 186, "total_steps": 224, "loss": 0.1389, "lr": 1.7125387598587862e-06, "epoch": 5.688607594936709, "percentage": 83.04, "elapsed_time": "2:16:13", "remaining_time": "0:27:49"}
|
187 |
+
{"current_steps": 187, "total_steps": 224, "loss": 0.1732, "lr": 1.6260862681919965e-06, "epoch": 5.718987341772152, "percentage": 83.48, "elapsed_time": "2:17:00", "remaining_time": "0:27:06"}
|
188 |
+
{"current_steps": 188, "total_steps": 224, "loss": 0.1417, "lr": 1.5416794074090258e-06, "epoch": 5.749367088607595, "percentage": 83.93, "elapsed_time": "2:17:45", "remaining_time": "0:26:22"}
|
189 |
+
{"current_steps": 189, "total_steps": 224, "loss": 0.1578, "lr": 1.459338796934293e-06, "epoch": 5.779746835443038, "percentage": 84.38, "elapsed_time": "2:18:30", "remaining_time": "0:25:38"}
|
190 |
+
{"current_steps": 190, "total_steps": 224, "loss": 0.139, "lr": 1.3790845514359363e-06, "epoch": 5.810126582278481, "percentage": 84.82, "elapsed_time": "2:19:11", "remaining_time": "0:24:54"}
|
191 |
+
{"current_steps": 191, "total_steps": 224, "loss": 0.1434, "lr": 1.300936275912098e-06, "epoch": 5.840506329113924, "percentage": 85.27, "elapsed_time": "2:19:54", "remaining_time": "0:24:10"}
|
192 |
+
{"current_steps": 192, "total_steps": 224, "loss": 0.1439, "lr": 1.224913060901688e-06, "epoch": 5.870886075949367, "percentage": 85.71, "elapsed_time": "2:20:37", "remaining_time": "0:23:26"}
|
193 |
+
{"current_steps": 193, "total_steps": 224, "loss": 0.1535, "lr": 1.1510334778208332e-06, "epoch": 5.9012658227848105, "percentage": 86.16, "elapsed_time": "2:21:25", "remaining_time": "0:22:42"}
|
194 |
+
{"current_steps": 194, "total_steps": 224, "loss": 0.1739, "lr": 1.0793155744261352e-06, "epoch": 5.931645569620253, "percentage": 86.61, "elapsed_time": "2:22:14", "remaining_time": "0:21:59"}
|
195 |
+
{"current_steps": 195, "total_steps": 224, "loss": 0.1783, "lr": 1.0097768704058542e-06, "epoch": 5.962025316455696, "percentage": 87.05, "elapsed_time": "2:23:12", "remaining_time": "0:21:17"}
|
196 |
+
{"current_steps": 196, "total_steps": 224, "loss": 0.1879, "lr": 9.424343531000968e-07, "epoch": 5.992405063291139, "percentage": 87.5, "elapsed_time": "2:23:59", "remaining_time": "0:20:34"}
|
197 |
+
{"current_steps": 197, "total_steps": 224, "loss": 0.1484, "lr": 8.773044733510338e-07, "epoch": 6.030379746835443, "percentage": 87.95, "elapsed_time": "2:25:35", "remaining_time": "0:19:57"}
|
198 |
+
{"current_steps": 198, "total_steps": 224, "loss": 0.1436, "lr": 8.144031414842012e-07, "epoch": 6.060759493670886, "percentage": 88.39, "elapsed_time": "2:26:21", "remaining_time": "0:19:13"}
|
199 |
+
{"current_steps": 199, "total_steps": 224, "loss": 0.1643, "lr": 7.537457234218271e-07, "epoch": 6.091139240506329, "percentage": 88.84, "elapsed_time": "2:27:16", "remaining_time": "0:18:30"}
|
200 |
+
{"current_steps": 200, "total_steps": 224, "loss": 0.1174, "lr": 6.953470369291349e-07, "epoch": 6.121518987341772, "percentage": 89.29, "elapsed_time": "2:27:50", "remaining_time": "0:17:44"}
|
201 |
+
{"current_steps": 201, "total_steps": 224, "loss": 0.1283, "lr": 6.392213479945852e-07, "epoch": 6.151898734177215, "percentage": 89.73, "elapsed_time": "2:28:35", "remaining_time": "0:17:00"}
|
202 |
+
{"current_steps": 202, "total_steps": 224, "loss": 0.1456, "lr": 5.853823673448877e-07, "epoch": 6.182278481012658, "percentage": 90.18, "elapsed_time": "2:29:21", "remaining_time": "0:16:16"}
|