ryanmarten commited on
Commit
42254b2
·
verified ·
1 Parent(s): 69df4d7

Training in progress, epoch 6

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:78e594347fb358c09be570dcbbfb4511004957738b6a1cb387265c6d96fc0b26
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dd633338ade60607cd74969db123f2a64a191790c12cabbde80b2f5204a5a795
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bc78cbbe9f907ba7dc03886a15103505044886e82dcfb8e2b5301cbe667945f3
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:73534b9e33c4fcaa8ccee5019d44e4ec09a8cb648d4f0cbe0af0de7557b130f3
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0203b04df2e21ef3b4ecfd013b20859b10eedabd327cff424fecd909adc3a8be
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:df1e799804712c323cd9c2abd1cd1fce5af07835981ab8c2eb459e45be2ad31e
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f0c7a0023fee2182f73cdcf31b54052cf778b2350f1b9a1865b2e8c0bfc68d8c
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e0f02fe902a6a6047c3636ffd10acf61eb5f212dec444884b7a48d82289916a3
3
  size 1089994880
trainer_log.jsonl CHANGED
@@ -197,3 +197,29 @@
197
  {"current_steps": 197, "total_steps": 224, "loss": 0.1606, "lr": 8.773044733510338e-07, "epoch": 6.030379746835443, "percentage": 87.95, "elapsed_time": "3:12:52", "remaining_time": "0:26:26"}
198
  {"current_steps": 198, "total_steps": 224, "loss": 0.1829, "lr": 8.144031414842012e-07, "epoch": 6.060759493670886, "percentage": 88.39, "elapsed_time": "3:13:54", "remaining_time": "0:25:27"}
199
  {"current_steps": 199, "total_steps": 224, "loss": 0.1714, "lr": 7.537457234218271e-07, "epoch": 6.091139240506329, "percentage": 88.84, "elapsed_time": "3:14:56", "remaining_time": "0:24:29"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
197
  {"current_steps": 197, "total_steps": 224, "loss": 0.1606, "lr": 8.773044733510338e-07, "epoch": 6.030379746835443, "percentage": 87.95, "elapsed_time": "3:12:52", "remaining_time": "0:26:26"}
198
  {"current_steps": 198, "total_steps": 224, "loss": 0.1829, "lr": 8.144031414842012e-07, "epoch": 6.060759493670886, "percentage": 88.39, "elapsed_time": "3:13:54", "remaining_time": "0:25:27"}
199
  {"current_steps": 199, "total_steps": 224, "loss": 0.1714, "lr": 7.537457234218271e-07, "epoch": 6.091139240506329, "percentage": 88.84, "elapsed_time": "3:14:56", "remaining_time": "0:24:29"}
200
+ {"current_steps": 200, "total_steps": 224, "loss": 0.1902, "lr": 6.953470369291349e-07, "epoch": 6.121518987341772, "percentage": 89.29, "elapsed_time": "3:15:56", "remaining_time": "0:23:30"}
201
+ {"current_steps": 201, "total_steps": 224, "loss": 0.1663, "lr": 6.392213479945852e-07, "epoch": 6.151898734177215, "percentage": 89.73, "elapsed_time": "3:16:51", "remaining_time": "0:22:31"}
202
+ {"current_steps": 202, "total_steps": 224, "loss": 0.1636, "lr": 5.853823673448877e-07, "epoch": 6.182278481012658, "percentage": 90.18, "elapsed_time": "3:17:56", "remaining_time": "0:21:33"}
203
+ {"current_steps": 203, "total_steps": 224, "loss": 0.1589, "lr": 5.33843247095659e-07, "epoch": 6.2126582278481015, "percentage": 90.62, "elapsed_time": "3:19:02", "remaining_time": "0:20:35"}
204
+ {"current_steps": 204, "total_steps": 224, "loss": 0.1649, "lr": 4.846165775385459e-07, "epoch": 6.243037974683545, "percentage": 91.07, "elapsed_time": "3:20:05", "remaining_time": "0:19:37"}
205
+ {"current_steps": 205, "total_steps": 224, "loss": 0.1538, "lr": 4.3771438406559173e-07, "epoch": 6.273417721518987, "percentage": 91.52, "elapsed_time": "3:20:58", "remaining_time": "0:18:37"}
206
+ {"current_steps": 206, "total_steps": 224, "loss": 0.1546, "lr": 3.931481242315993e-07, "epoch": 6.30379746835443, "percentage": 91.96, "elapsed_time": "3:21:53", "remaining_time": "0:17:38"}
207
+ {"current_steps": 207, "total_steps": 224, "loss": 0.1753, "lr": 3.5092868495520294e-07, "epoch": 6.334177215189873, "percentage": 92.41, "elapsed_time": "3:22:52", "remaining_time": "0:16:39"}
208
+ {"current_steps": 208, "total_steps": 224, "loss": 0.1347, "lr": 3.110663798593616e-07, "epoch": 6.364556962025317, "percentage": 92.86, "elapsed_time": "3:23:40", "remaining_time": "0:15:40"}
209
+ {"current_steps": 209, "total_steps": 224, "loss": 0.1493, "lr": 2.735709467518699e-07, "epoch": 6.39493670886076, "percentage": 93.3, "elapsed_time": "3:24:36", "remaining_time": "0:14:41"}
210
+ {"current_steps": 210, "total_steps": 224, "loss": 0.1503, "lr": 2.384515452465475e-07, "epoch": 6.425316455696202, "percentage": 93.75, "elapsed_time": "3:25:26", "remaining_time": "0:13:41"}
211
+ {"current_steps": 211, "total_steps": 224, "loss": 0.1557, "lr": 2.0571675452567997e-07, "epoch": 6.455696202531645, "percentage": 94.2, "elapsed_time": "3:26:11", "remaining_time": "0:12:42"}
212
+ {"current_steps": 212, "total_steps": 224, "loss": 0.1631, "lr": 1.7537457124423896e-07, "epoch": 6.4860759493670885, "percentage": 94.64, "elapsed_time": "3:27:02", "remaining_time": "0:11:43"}
213
+ {"current_steps": 213, "total_steps": 224, "loss": 0.1546, "lr": 1.474324075764111e-07, "epoch": 6.516455696202532, "percentage": 95.09, "elapsed_time": "3:27:52", "remaining_time": "0:10:44"}
214
+ {"current_steps": 214, "total_steps": 224, "loss": 0.1656, "lr": 1.2189708940490653e-07, "epoch": 6.546835443037975, "percentage": 95.54, "elapsed_time": "3:28:53", "remaining_time": "0:09:45"}
215
+ {"current_steps": 215, "total_steps": 224, "loss": 0.1851, "lr": 9.877485465349057e-08, "epoch": 6.577215189873417, "percentage": 95.98, "elapsed_time": "3:29:59", "remaining_time": "0:08:47"}
216
+ {"current_steps": 216, "total_steps": 224, "loss": 0.1618, "lr": 7.807135176314707e-08, "epoch": 6.6075949367088604, "percentage": 96.43, "elapsed_time": "3:30:58", "remaining_time": "0:07:48"}
217
+ {"current_steps": 217, "total_steps": 224, "loss": 0.1752, "lr": 5.979163831223988e-08, "epoch": 6.637974683544304, "percentage": 96.88, "elapsed_time": "3:32:02", "remaining_time": "0:06:50"}
218
+ {"current_steps": 218, "total_steps": 224, "loss": 0.1561, "lr": 4.394017978101905e-08, "epoch": 6.668354430379747, "percentage": 97.32, "elapsed_time": "3:32:59", "remaining_time": "0:05:51"}
219
+ {"current_steps": 219, "total_steps": 224, "loss": 0.1622, "lr": 3.0520848460765525e-08, "epoch": 6.69873417721519, "percentage": 97.77, "elapsed_time": "3:33:55", "remaining_time": "0:04:53"}
220
+ {"current_steps": 220, "total_steps": 224, "loss": 0.1538, "lr": 1.9536922507841227e-08, "epoch": 6.729113924050633, "percentage": 98.21, "elapsed_time": "3:34:49", "remaining_time": "0:03:54"}
221
+ {"current_steps": 221, "total_steps": 224, "loss": 0.1692, "lr": 1.099108514288627e-08, "epoch": 6.759493670886076, "percentage": 98.66, "elapsed_time": "3:35:40", "remaining_time": "0:02:55"}
222
+ {"current_steps": 222, "total_steps": 224, "loss": 0.1701, "lr": 4.885423995341088e-09, "epoch": 6.789873417721519, "percentage": 99.11, "elapsed_time": "3:36:39", "remaining_time": "0:01:57"}
223
+ {"current_steps": 223, "total_steps": 224, "loss": 0.1726, "lr": 1.2214305934699078e-09, "epoch": 6.820253164556962, "percentage": 99.55, "elapsed_time": "3:37:41", "remaining_time": "0:00:58"}
224
+ {"current_steps": 224, "total_steps": 224, "loss": 0.1786, "lr": 0.0, "epoch": 6.850632911392405, "percentage": 100.0, "elapsed_time": "3:38:37", "remaining_time": "0:00:00"}
225
+ {"current_steps": 224, "total_steps": 224, "epoch": 6.850632911392405, "percentage": 100.0, "elapsed_time": "3:40:49", "remaining_time": "0:00:00"}