sedrickkeh commited on
Commit
351bed7
·
verified ·
1 Parent(s): 83cc15d

Training in progress, epoch 2

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c650f71aa81b5b2233cbfcb6cfcfb2ba98937f3f33ce99f1a08e1568c7c2c6d7
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3a2e9f7fe8d3abeb254c17815d5411f88bb48cdac114b4d05fe8e4b8808f815f
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cc33f1f068cbc9016bf15355ac3a52892a33e012a663dda8650bcd8476035767
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:633e67d7f094297a1ce49112aa63550ba926c7910b4499837360d2e64abbb312
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ca01f67353b2afbbe044d730cda0b822013a1f02c5cac55f382f09206838b2c7
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:589e0c01d763a785eddca64b81cb8aaa07b5eca69d5df862f933171bfa1338f1
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0163d1edd7df921e9950312393b738e01bac6a15568b86cc9f217b743edc0e71
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ec10207dd46a8237ca9055c7d978cd93f693b763796afbebc4b7b57ec3754bf1
3
  size 1089994880
trainer_log.jsonl CHANGED
@@ -212,3 +212,102 @@
212
  {"current_steps": 212, "total_steps": 312, "loss": 0.3631, "lr": 5.66116260882442e-06, "epoch": 2.0319488817891376, "percentage": 67.95, "elapsed_time": "1:52:26", "remaining_time": "0:53:02"}
213
  {"current_steps": 213, "total_steps": 312, "loss": 0.4092, "lr": 5.560349359695181e-06, "epoch": 2.0415335463258786, "percentage": 68.27, "elapsed_time": "1:53:00", "remaining_time": "0:52:31"}
214
  {"current_steps": 214, "total_steps": 312, "loss": 0.3753, "lr": 5.460095002604533e-06, "epoch": 2.0511182108626196, "percentage": 68.59, "elapsed_time": "1:53:31", "remaining_time": "0:51:59"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
212
  {"current_steps": 212, "total_steps": 312, "loss": 0.3631, "lr": 5.66116260882442e-06, "epoch": 2.0319488817891376, "percentage": 67.95, "elapsed_time": "1:52:26", "remaining_time": "0:53:02"}
213
  {"current_steps": 213, "total_steps": 312, "loss": 0.4092, "lr": 5.560349359695181e-06, "epoch": 2.0415335463258786, "percentage": 68.27, "elapsed_time": "1:53:00", "remaining_time": "0:52:31"}
214
  {"current_steps": 214, "total_steps": 312, "loss": 0.3753, "lr": 5.460095002604533e-06, "epoch": 2.0511182108626196, "percentage": 68.59, "elapsed_time": "1:53:31", "remaining_time": "0:51:59"}
215
+ {"current_steps": 215, "total_steps": 312, "loss": 0.356, "lr": 5.360412158221661e-06, "epoch": 2.060702875399361, "percentage": 68.91, "elapsed_time": "1:54:05", "remaining_time": "0:51:28"}
216
+ {"current_steps": 216, "total_steps": 312, "loss": 0.4177, "lr": 5.2613133752700145e-06, "epoch": 2.070287539936102, "percentage": 69.23, "elapsed_time": "1:54:33", "remaining_time": "0:50:54"}
217
+ {"current_steps": 217, "total_steps": 312, "loss": 0.3691, "lr": 5.1628111289476025e-06, "epoch": 2.0798722044728435, "percentage": 69.55, "elapsed_time": "1:55:02", "remaining_time": "0:50:21"}
218
+ {"current_steps": 218, "total_steps": 312, "loss": 0.3823, "lr": 5.064917819356532e-06, "epoch": 2.0894568690095845, "percentage": 69.87, "elapsed_time": "1:55:29", "remaining_time": "0:49:47"}
219
+ {"current_steps": 219, "total_steps": 312, "loss": 0.3456, "lr": 4.967645769942e-06, "epoch": 2.099041533546326, "percentage": 70.19, "elapsed_time": "1:56:02", "remaining_time": "0:49:16"}
220
+ {"current_steps": 220, "total_steps": 312, "loss": 0.3792, "lr": 4.87100722594094e-06, "epoch": 2.108626198083067, "percentage": 70.51, "elapsed_time": "1:56:31", "remaining_time": "0:48:43"}
221
+ {"current_steps": 221, "total_steps": 312, "loss": 0.3891, "lr": 4.775014352840512e-06, "epoch": 2.1182108626198084, "percentage": 70.83, "elapsed_time": "1:57:05", "remaining_time": "0:48:12"}
222
+ {"current_steps": 222, "total_steps": 312, "loss": 0.35, "lr": 4.679679234846636e-06, "epoch": 2.1277955271565494, "percentage": 71.15, "elapsed_time": "1:57:31", "remaining_time": "0:47:38"}
223
+ {"current_steps": 223, "total_steps": 312, "loss": 0.3809, "lr": 4.5850138733627435e-06, "epoch": 2.137380191693291, "percentage": 71.47, "elapsed_time": "1:58:06", "remaining_time": "0:47:08"}
224
+ {"current_steps": 224, "total_steps": 312, "loss": 0.3707, "lr": 4.491030185478976e-06, "epoch": 2.146964856230032, "percentage": 71.79, "elapsed_time": "1:58:36", "remaining_time": "0:46:35"}
225
+ {"current_steps": 225, "total_steps": 312, "loss": 0.4152, "lr": 4.397740002471973e-06, "epoch": 2.1565495207667733, "percentage": 72.12, "elapsed_time": "1:59:10", "remaining_time": "0:46:04"}
226
+ {"current_steps": 226, "total_steps": 312, "loss": 0.3372, "lr": 4.305155068315481e-06, "epoch": 2.1661341853035143, "percentage": 72.44, "elapsed_time": "1:59:42", "remaining_time": "0:45:33"}
227
+ {"current_steps": 227, "total_steps": 312, "loss": 0.3655, "lr": 4.213287038201943e-06, "epoch": 2.1757188498402558, "percentage": 72.76, "elapsed_time": "2:00:09", "remaining_time": "0:44:59"}
228
+ {"current_steps": 228, "total_steps": 312, "loss": 0.406, "lr": 4.12214747707527e-06, "epoch": 2.1853035143769968, "percentage": 73.08, "elapsed_time": "2:00:42", "remaining_time": "0:44:28"}
229
+ {"current_steps": 229, "total_steps": 312, "loss": 0.372, "lr": 4.0317478581749644e-06, "epoch": 2.194888178913738, "percentage": 73.4, "elapsed_time": "2:01:11", "remaining_time": "0:43:55"}
230
+ {"current_steps": 230, "total_steps": 312, "loss": 0.4101, "lr": 3.942099561591802e-06, "epoch": 2.2044728434504792, "percentage": 73.72, "elapsed_time": "2:01:42", "remaining_time": "0:43:23"}
231
+ {"current_steps": 231, "total_steps": 312, "loss": 0.3337, "lr": 3.853213872835229e-06, "epoch": 2.2140575079872207, "percentage": 74.04, "elapsed_time": "2:02:16", "remaining_time": "0:42:52"}
232
+ {"current_steps": 232, "total_steps": 312, "loss": 0.4058, "lr": 3.7651019814126656e-06, "epoch": 2.2236421725239617, "percentage": 74.36, "elapsed_time": "2:02:44", "remaining_time": "0:42:19"}
233
+ {"current_steps": 233, "total_steps": 312, "loss": 0.3918, "lr": 3.677774979420904e-06, "epoch": 2.2332268370607027, "percentage": 74.68, "elapsed_time": "2:03:19", "remaining_time": "0:41:48"}
234
+ {"current_steps": 234, "total_steps": 312, "loss": 0.3621, "lr": 3.591243860149759e-06, "epoch": 2.242811501597444, "percentage": 75.0, "elapsed_time": "2:03:47", "remaining_time": "0:41:15"}
235
+ {"current_steps": 235, "total_steps": 312, "loss": 0.3925, "lr": 3.505519516698165e-06, "epoch": 2.252396166134185, "percentage": 75.32, "elapsed_time": "2:04:20", "remaining_time": "0:40:44"}
236
+ {"current_steps": 236, "total_steps": 312, "loss": 0.3365, "lr": 3.4206127406028744e-06, "epoch": 2.2619808306709266, "percentage": 75.64, "elapsed_time": "2:04:52", "remaining_time": "0:40:12"}
237
+ {"current_steps": 237, "total_steps": 312, "loss": 0.3639, "lr": 3.3365342204799613e-06, "epoch": 2.2715654952076676, "percentage": 75.96, "elapsed_time": "2:05:27", "remaining_time": "0:39:42"}
238
+ {"current_steps": 238, "total_steps": 312, "loss": 0.3617, "lr": 3.2532945406792573e-06, "epoch": 2.281150159744409, "percentage": 76.28, "elapsed_time": "2:06:03", "remaining_time": "0:39:11"}
239
+ {"current_steps": 239, "total_steps": 312, "loss": 0.3911, "lr": 3.1709041799519312e-06, "epoch": 2.29073482428115, "percentage": 76.6, "elapsed_time": "2:06:34", "remaining_time": "0:38:39"}
240
+ {"current_steps": 240, "total_steps": 312, "loss": 0.3543, "lr": 3.089373510131354e-06, "epoch": 2.3003194888178915, "percentage": 76.92, "elapsed_time": "2:07:03", "remaining_time": "0:38:07"}
241
+ {"current_steps": 241, "total_steps": 312, "loss": 0.3149, "lr": 3.0087127948274264e-06, "epoch": 2.3099041533546325, "percentage": 77.24, "elapsed_time": "2:07:36", "remaining_time": "0:37:35"}
242
+ {"current_steps": 242, "total_steps": 312, "loss": 0.3974, "lr": 2.9289321881345257e-06, "epoch": 2.319488817891374, "percentage": 77.56, "elapsed_time": "2:08:07", "remaining_time": "0:37:03"}
243
+ {"current_steps": 243, "total_steps": 312, "loss": 0.3367, "lr": 2.850041733353247e-06, "epoch": 2.329073482428115, "percentage": 77.88, "elapsed_time": "2:08:38", "remaining_time": "0:36:31"}
244
+ {"current_steps": 244, "total_steps": 312, "loss": 0.3803, "lr": 2.7720513617260857e-06, "epoch": 2.3386581469648564, "percentage": 78.21, "elapsed_time": "2:09:08", "remaining_time": "0:35:59"}
245
+ {"current_steps": 245, "total_steps": 312, "loss": 0.3815, "lr": 2.694970891187225e-06, "epoch": 2.3482428115015974, "percentage": 78.53, "elapsed_time": "2:09:42", "remaining_time": "0:35:28"}
246
+ {"current_steps": 246, "total_steps": 312, "loss": 0.3935, "lr": 2.6188100251265947e-06, "epoch": 2.357827476038339, "percentage": 78.85, "elapsed_time": "2:10:15", "remaining_time": "0:34:56"}
247
+ {"current_steps": 247, "total_steps": 312, "loss": 0.3229, "lr": 2.5435783511683444e-06, "epoch": 2.36741214057508, "percentage": 79.17, "elapsed_time": "2:10:46", "remaining_time": "0:34:24"}
248
+ {"current_steps": 248, "total_steps": 312, "loss": 0.383, "lr": 2.469285339963892e-06, "epoch": 2.376996805111821, "percentage": 79.49, "elapsed_time": "2:11:21", "remaining_time": "0:33:53"}
249
+ {"current_steps": 249, "total_steps": 312, "loss": 0.3828, "lr": 2.395940343999691e-06, "epoch": 2.3865814696485623, "percentage": 79.81, "elapsed_time": "2:11:54", "remaining_time": "0:33:22"}
250
+ {"current_steps": 250, "total_steps": 312, "loss": 0.3815, "lr": 2.323552596419889e-06, "epoch": 2.3961661341853033, "percentage": 80.13, "elapsed_time": "2:12:24", "remaining_time": "0:32:50"}
251
+ {"current_steps": 251, "total_steps": 312, "loss": 0.3819, "lr": 2.2521312098639914e-06, "epoch": 2.405750798722045, "percentage": 80.45, "elapsed_time": "2:12:51", "remaining_time": "0:32:17"}
252
+ {"current_steps": 252, "total_steps": 312, "loss": 0.4087, "lr": 2.1816851753197023e-06, "epoch": 2.415335463258786, "percentage": 80.77, "elapsed_time": "2:13:23", "remaining_time": "0:31:45"}
253
+ {"current_steps": 253, "total_steps": 312, "loss": 0.3657, "lr": 2.1122233609910903e-06, "epoch": 2.4249201277955272, "percentage": 81.09, "elapsed_time": "2:13:52", "remaining_time": "0:31:13"}
254
+ {"current_steps": 254, "total_steps": 312, "loss": 0.3457, "lr": 2.043754511182191e-06, "epoch": 2.4345047923322682, "percentage": 81.41, "elapsed_time": "2:14:23", "remaining_time": "0:30:41"}
255
+ {"current_steps": 255, "total_steps": 312, "loss": 0.3919, "lr": 1.9762872451962214e-06, "epoch": 2.4440894568690097, "percentage": 81.73, "elapsed_time": "2:14:56", "remaining_time": "0:30:09"}
256
+ {"current_steps": 256, "total_steps": 312, "loss": 0.3691, "lr": 1.9098300562505266e-06, "epoch": 2.4536741214057507, "percentage": 82.05, "elapsed_time": "2:15:29", "remaining_time": "0:29:38"}
257
+ {"current_steps": 257, "total_steps": 312, "loss": 0.364, "lr": 1.8443913104073984e-06, "epoch": 2.463258785942492, "percentage": 82.37, "elapsed_time": "2:15:59", "remaining_time": "0:29:06"}
258
+ {"current_steps": 258, "total_steps": 312, "loss": 0.3308, "lr": 1.7799792455209019e-06, "epoch": 2.472843450479233, "percentage": 82.69, "elapsed_time": "2:16:29", "remaining_time": "0:28:34"}
259
+ {"current_steps": 259, "total_steps": 312, "loss": 0.3769, "lr": 1.716601970199836e-06, "epoch": 2.4824281150159746, "percentage": 83.01, "elapsed_time": "2:16:58", "remaining_time": "0:28:01"}
260
+ {"current_steps": 260, "total_steps": 312, "loss": 0.4193, "lr": 1.6542674627869738e-06, "epoch": 2.4920127795527156, "percentage": 83.33, "elapsed_time": "2:17:31", "remaining_time": "0:27:30"}
261
+ {"current_steps": 261, "total_steps": 312, "loss": 0.3798, "lr": 1.5929835703546992e-06, "epoch": 2.501597444089457, "percentage": 83.65, "elapsed_time": "2:18:03", "remaining_time": "0:26:58"}
262
+ {"current_steps": 262, "total_steps": 312, "loss": 0.3632, "lr": 1.5327580077171589e-06, "epoch": 2.511182108626198, "percentage": 83.97, "elapsed_time": "2:18:36", "remaining_time": "0:26:27"}
263
+ {"current_steps": 263, "total_steps": 312, "loss": 0.3762, "lr": 1.4735983564590784e-06, "epoch": 2.520766773162939, "percentage": 84.29, "elapsed_time": "2:19:03", "remaining_time": "0:25:54"}
264
+ {"current_steps": 264, "total_steps": 312, "loss": 0.3675, "lr": 1.4155120639813392e-06, "epoch": 2.5303514376996805, "percentage": 84.62, "elapsed_time": "2:19:32", "remaining_time": "0:25:22"}
265
+ {"current_steps": 265, "total_steps": 312, "loss": 0.3627, "lr": 1.3585064425634542e-06, "epoch": 2.539936102236422, "percentage": 84.94, "elapsed_time": "2:20:01", "remaining_time": "0:24:50"}
266
+ {"current_steps": 266, "total_steps": 312, "loss": 0.4046, "lr": 1.3025886684430467e-06, "epoch": 2.549520766773163, "percentage": 85.26, "elapsed_time": "2:20:30", "remaining_time": "0:24:17"}
267
+ {"current_steps": 267, "total_steps": 312, "loss": 0.3789, "lr": 1.2477657809124632e-06, "epoch": 2.559105431309904, "percentage": 85.58, "elapsed_time": "2:20:58", "remaining_time": "0:23:45"}
268
+ {"current_steps": 268, "total_steps": 312, "loss": 0.3703, "lr": 1.19404468143262e-06, "epoch": 2.5686900958466454, "percentage": 85.9, "elapsed_time": "2:21:26", "remaining_time": "0:23:13"}
269
+ {"current_steps": 269, "total_steps": 312, "loss": 0.3394, "lr": 1.1414321327642019e-06, "epoch": 2.5782747603833864, "percentage": 86.22, "elapsed_time": "2:21:55", "remaining_time": "0:22:41"}
270
+ {"current_steps": 270, "total_steps": 312, "loss": 0.3589, "lr": 1.0899347581163222e-06, "epoch": 2.587859424920128, "percentage": 86.54, "elapsed_time": "2:22:28", "remaining_time": "0:22:09"}
271
+ {"current_steps": 271, "total_steps": 312, "loss": 0.3832, "lr": 1.0395590403127487e-06, "epoch": 2.597444089456869, "percentage": 86.86, "elapsed_time": "2:22:58", "remaining_time": "0:21:37"}
272
+ {"current_steps": 272, "total_steps": 312, "loss": 0.3646, "lr": 9.903113209758098e-07, "epoch": 2.6070287539936103, "percentage": 87.18, "elapsed_time": "2:23:28", "remaining_time": "0:21:05"}
273
+ {"current_steps": 273, "total_steps": 312, "loss": 0.3973, "lr": 9.421977997280596e-07, "epoch": 2.6166134185303513, "percentage": 87.5, "elapsed_time": "2:24:01", "remaining_time": "0:20:34"}
274
+ {"current_steps": 274, "total_steps": 312, "loss": 0.3828, "lr": 8.952245334118415e-07, "epoch": 2.626198083067093, "percentage": 87.82, "elapsed_time": "2:24:35", "remaining_time": "0:20:03"}
275
+ {"current_steps": 275, "total_steps": 312, "loss": 0.3961, "lr": 8.493974353268019e-07, "epoch": 2.635782747603834, "percentage": 88.14, "elapsed_time": "2:25:09", "remaining_time": "0:19:31"}
276
+ {"current_steps": 276, "total_steps": 312, "loss": 0.3796, "lr": 8.047222744854943e-07, "epoch": 2.6453674121405752, "percentage": 88.46, "elapsed_time": "2:25:41", "remaining_time": "0:19:00"}
277
+ {"current_steps": 277, "total_steps": 312, "loss": 0.3777, "lr": 7.612046748871327e-07, "epoch": 2.6549520766773163, "percentage": 88.78, "elapsed_time": "2:26:13", "remaining_time": "0:18:28"}
278
+ {"current_steps": 278, "total_steps": 312, "loss": 0.354, "lr": 7.188501148096117e-07, "epoch": 2.6645367412140573, "percentage": 89.1, "elapsed_time": "2:26:48", "remaining_time": "0:17:57"}
279
+ {"current_steps": 279, "total_steps": 312, "loss": 0.4123, "lr": 6.776639261198581e-07, "epoch": 2.6741214057507987, "percentage": 89.42, "elapsed_time": "2:27:21", "remaining_time": "0:17:25"}
280
+ {"current_steps": 280, "total_steps": 312, "loss": 0.3542, "lr": 6.37651293602628e-07, "epoch": 2.68370607028754, "percentage": 89.74, "elapsed_time": "2:27:52", "remaining_time": "0:16:53"}
281
+ {"current_steps": 281, "total_steps": 312, "loss": 0.3847, "lr": 5.988172543078097e-07, "epoch": 2.693290734824281, "percentage": 90.06, "elapsed_time": "2:28:20", "remaining_time": "0:16:21"}
282
+ {"current_steps": 282, "total_steps": 312, "loss": 0.374, "lr": 5.611666969163243e-07, "epoch": 2.702875399361022, "percentage": 90.38, "elapsed_time": "2:28:54", "remaining_time": "0:15:50"}
283
+ {"current_steps": 283, "total_steps": 312, "loss": 0.3634, "lr": 5.247043611247127e-07, "epoch": 2.7124600638977636, "percentage": 90.71, "elapsed_time": "2:29:27", "remaining_time": "0:15:18"}
284
+ {"current_steps": 284, "total_steps": 312, "loss": 0.3363, "lr": 4.894348370484648e-07, "epoch": 2.722044728434505, "percentage": 91.03, "elapsed_time": "2:30:00", "remaining_time": "0:14:47"}
285
+ {"current_steps": 285, "total_steps": 312, "loss": 0.3938, "lr": 4.553625646441928e-07, "epoch": 2.731629392971246, "percentage": 91.35, "elapsed_time": "2:30:33", "remaining_time": "0:14:15"}
286
+ {"current_steps": 286, "total_steps": 312, "loss": 0.3544, "lr": 4.224918331506955e-07, "epoch": 2.741214057507987, "percentage": 91.67, "elapsed_time": "2:31:04", "remaining_time": "0:13:44"}
287
+ {"current_steps": 287, "total_steps": 312, "loss": 0.3973, "lr": 3.908267805490051e-07, "epoch": 2.7507987220447285, "percentage": 91.99, "elapsed_time": "2:31:39", "remaining_time": "0:13:12"}
288
+ {"current_steps": 288, "total_steps": 312, "loss": 0.3991, "lr": 3.603713930414676e-07, "epoch": 2.7603833865814695, "percentage": 92.31, "elapsed_time": "2:32:06", "remaining_time": "0:12:40"}
289
+ {"current_steps": 289, "total_steps": 312, "loss": 0.3604, "lr": 3.3112950454993633e-07, "epoch": 2.769968051118211, "percentage": 92.63, "elapsed_time": "2:32:34", "remaining_time": "0:12:08"}
290
+ {"current_steps": 290, "total_steps": 312, "loss": 0.3654, "lr": 3.0310479623313125e-07, "epoch": 2.779552715654952, "percentage": 92.95, "elapsed_time": "2:33:07", "remaining_time": "0:11:36"}
291
+ {"current_steps": 291, "total_steps": 312, "loss": 0.427, "lr": 2.7630079602323447e-07, "epoch": 2.7891373801916934, "percentage": 93.27, "elapsed_time": "2:33:39", "remaining_time": "0:11:05"}
292
+ {"current_steps": 292, "total_steps": 312, "loss": 0.3213, "lr": 2.507208781817638e-07, "epoch": 2.7987220447284344, "percentage": 93.59, "elapsed_time": "2:34:07", "remaining_time": "0:10:33"}
293
+ {"current_steps": 293, "total_steps": 312, "loss": 0.372, "lr": 2.2636826287480872e-07, "epoch": 2.8083067092651754, "percentage": 93.91, "elapsed_time": "2:34:36", "remaining_time": "0:10:01"}
294
+ {"current_steps": 294, "total_steps": 312, "loss": 0.3641, "lr": 2.0324601576764525e-07, "epoch": 2.817891373801917, "percentage": 94.23, "elapsed_time": "2:35:07", "remaining_time": "0:09:29"}
295
+ {"current_steps": 295, "total_steps": 312, "loss": 0.4412, "lr": 1.81357047638816e-07, "epoch": 2.8274760383386583, "percentage": 94.55, "elapsed_time": "2:35:42", "remaining_time": "0:08:58"}
296
+ {"current_steps": 296, "total_steps": 312, "loss": 0.3375, "lr": 1.6070411401370335e-07, "epoch": 2.8370607028753994, "percentage": 94.87, "elapsed_time": "2:36:14", "remaining_time": "0:08:26"}
297
+ {"current_steps": 297, "total_steps": 312, "loss": 0.398, "lr": 1.4128981481764115e-07, "epoch": 2.8466453674121404, "percentage": 95.19, "elapsed_time": "2:36:48", "remaining_time": "0:07:55"}
298
+ {"current_steps": 298, "total_steps": 312, "loss": 0.3686, "lr": 1.231165940486234e-07, "epoch": 2.856230031948882, "percentage": 95.51, "elapsed_time": "2:37:15", "remaining_time": "0:07:23"}
299
+ {"current_steps": 299, "total_steps": 312, "loss": 0.4175, "lr": 1.0618673946963365e-07, "epoch": 2.8658146964856233, "percentage": 95.83, "elapsed_time": "2:37:47", "remaining_time": "0:06:51"}
300
+ {"current_steps": 300, "total_steps": 312, "loss": 0.3317, "lr": 9.0502382320653e-08, "epoch": 2.8753993610223643, "percentage": 96.15, "elapsed_time": "2:38:22", "remaining_time": "0:06:20"}
301
+ {"current_steps": 301, "total_steps": 312, "loss": 0.3893, "lr": 7.606549705035937e-08, "epoch": 2.8849840255591053, "percentage": 96.47, "elapsed_time": "2:38:52", "remaining_time": "0:05:48"}
302
+ {"current_steps": 302, "total_steps": 312, "loss": 0.411, "lr": 6.287790106757396e-08, "epoch": 2.8945686900958467, "percentage": 96.79, "elapsed_time": "2:39:24", "remaining_time": "0:05:16"}
303
+ {"current_steps": 303, "total_steps": 312, "loss": 0.3882, "lr": 5.094125451247656e-08, "epoch": 2.9041533546325877, "percentage": 97.12, "elapsed_time": "2:40:00", "remaining_time": "0:04:45"}
304
+ {"current_steps": 304, "total_steps": 312, "loss": 0.4154, "lr": 4.025706004760932e-08, "epoch": 2.913738019169329, "percentage": 97.44, "elapsed_time": "2:40:30", "remaining_time": "0:04:13"}
305
+ {"current_steps": 305, "total_steps": 312, "loss": 0.3293, "lr": 3.082666266872036e-08, "epoch": 2.92332268370607, "percentage": 97.76, "elapsed_time": "2:40:57", "remaining_time": "0:03:41"}
306
+ {"current_steps": 306, "total_steps": 312, "loss": 0.3585, "lr": 2.265124953543918e-08, "epoch": 2.9329073482428116, "percentage": 98.08, "elapsed_time": "2:41:31", "remaining_time": "0:03:10"}
307
+ {"current_steps": 307, "total_steps": 312, "loss": 0.4593, "lr": 1.5731849821833955e-08, "epoch": 2.9424920127795526, "percentage": 98.4, "elapsed_time": "2:42:00", "remaining_time": "0:02:38"}
308
+ {"current_steps": 308, "total_steps": 312, "loss": 0.3501, "lr": 1.0069334586854106e-08, "epoch": 2.952076677316294, "percentage": 98.72, "elapsed_time": "2:42:33", "remaining_time": "0:02:06"}
309
+ {"current_steps": 309, "total_steps": 312, "loss": 0.3676, "lr": 5.664416664666883e-09, "epoch": 2.961661341853035, "percentage": 99.04, "elapsed_time": "2:43:05", "remaining_time": "0:01:35"}
310
+ {"current_steps": 310, "total_steps": 312, "loss": 0.3948, "lr": 2.5176505749346937e-09, "epoch": 2.9712460063897765, "percentage": 99.36, "elapsed_time": "2:43:36", "remaining_time": "0:01:03"}
311
+ {"current_steps": 311, "total_steps": 312, "loss": 0.3643, "lr": 6.294324529942942e-10, "epoch": 2.9808306709265175, "percentage": 99.68, "elapsed_time": "2:44:07", "remaining_time": "0:00:31"}
312
+ {"current_steps": 312, "total_steps": 312, "loss": 0.3668, "lr": 0.0, "epoch": 2.9904153354632586, "percentage": 100.0, "elapsed_time": "2:44:43", "remaining_time": "0:00:00"}
313
+ {"current_steps": 312, "total_steps": 312, "epoch": 2.9904153354632586, "percentage": 100.0, "elapsed_time": "2:46:14", "remaining_time": "0:00:00"}