sedrickkeh commited on
Commit
c7a0e53
·
verified ·
1 Parent(s): 54c4ab8

Training in progress, epoch 2

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:02e109b74fb94ca219589c8571654b6818674cf7f39c13e2cc1f2f1df756d146
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2aaa7608dd516fd0b8150f8b5e13043a836957a279a2f5b2464c0b485dccf0fd
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bb755fbac0ddac7ca0a0c5fad13fe67d6d10c48f7bb51dc3037304245dd9c4e8
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4590ae01a3fcdb3517524f512e13f393e11eb83d43a983c15614777849584b15
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ea12b045d153ab6be8c13c65e50f2cfaf5f62ad60a97f9b2addf442625d95017
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4325e5026cc0a54744728ccfe898e44429845f99c895f5dcc20dbdcf1f8fea9d
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f23d8cfa56eb926f4d4804fb7bc4a0eacbc86969069807b90569cbb3f0f89b49
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8f8b8135b2122aee9ff3d5f6518f0c98d2e5791cffdf8280e65003410eeda320
3
  size 1089994880
trainer_log.jsonl CHANGED
@@ -208,3 +208,106 @@
208
  {"current_steps": 208, "total_steps": 312, "loss": 0.5447, "lr": 3.0348748417303826e-06, "epoch": 1.9968, "percentage": 66.67, "elapsed_time": "5:26:48", "remaining_time": "2:43:24"}
209
  {"current_steps": 209, "total_steps": 312, "loss": 1.0076, "lr": 2.9834142279959754e-06, "epoch": 2.0064, "percentage": 66.99, "elapsed_time": "5:29:15", "remaining_time": "2:42:15"}
210
  {"current_steps": 210, "total_steps": 312, "loss": 0.5325, "lr": 2.932207475167398e-06, "epoch": 2.016, "percentage": 67.31, "elapsed_time": "5:30:46", "remaining_time": "2:40:39"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
208
  {"current_steps": 208, "total_steps": 312, "loss": 0.5447, "lr": 3.0348748417303826e-06, "epoch": 1.9968, "percentage": 66.67, "elapsed_time": "5:26:48", "remaining_time": "2:43:24"}
209
  {"current_steps": 209, "total_steps": 312, "loss": 1.0076, "lr": 2.9834142279959754e-06, "epoch": 2.0064, "percentage": 66.99, "elapsed_time": "5:29:15", "remaining_time": "2:42:15"}
210
  {"current_steps": 210, "total_steps": 312, "loss": 0.5325, "lr": 2.932207475167398e-06, "epoch": 2.016, "percentage": 67.31, "elapsed_time": "5:30:46", "remaining_time": "2:40:39"}
211
+ {"current_steps": 211, "total_steps": 312, "loss": 0.5812, "lr": 2.8812610294830568e-06, "epoch": 2.0256, "percentage": 67.63, "elapsed_time": "5:32:37", "remaining_time": "2:39:13"}
212
+ {"current_steps": 212, "total_steps": 312, "loss": 0.5126, "lr": 2.83058130441221e-06, "epoch": 2.0352, "percentage": 67.95, "elapsed_time": "5:34:06", "remaining_time": "2:37:35"}
213
+ {"current_steps": 213, "total_steps": 312, "loss": 0.5893, "lr": 2.7801746798475905e-06, "epoch": 2.0448, "percentage": 68.27, "elapsed_time": "5:35:52", "remaining_time": "2:36:06"}
214
+ {"current_steps": 214, "total_steps": 312, "loss": 0.5568, "lr": 2.7300475013022666e-06, "epoch": 2.0544, "percentage": 68.59, "elapsed_time": "5:37:23", "remaining_time": "2:34:30"}
215
+ {"current_steps": 215, "total_steps": 312, "loss": 0.5738, "lr": 2.6802060791108304e-06, "epoch": 2.064, "percentage": 68.91, "elapsed_time": "5:38:44", "remaining_time": "2:32:49"}
216
+ {"current_steps": 216, "total_steps": 312, "loss": 0.4556, "lr": 2.6306566876350072e-06, "epoch": 2.0736, "percentage": 69.23, "elapsed_time": "5:40:05", "remaining_time": "2:31:09"}
217
+ {"current_steps": 217, "total_steps": 312, "loss": 0.5503, "lr": 2.5814055644738013e-06, "epoch": 2.0832, "percentage": 69.55, "elapsed_time": "5:41:58", "remaining_time": "2:29:42"}
218
+ {"current_steps": 218, "total_steps": 312, "loss": 0.507, "lr": 2.532458909678266e-06, "epoch": 2.0928, "percentage": 69.87, "elapsed_time": "5:43:29", "remaining_time": "2:28:06"}
219
+ {"current_steps": 219, "total_steps": 312, "loss": 0.5551, "lr": 2.483822884971e-06, "epoch": 2.1024, "percentage": 70.19, "elapsed_time": "5:45:03", "remaining_time": "2:26:32"}
220
+ {"current_steps": 220, "total_steps": 312, "loss": 0.5125, "lr": 2.43550361297047e-06, "epoch": 2.112, "percentage": 70.51, "elapsed_time": "5:46:38", "remaining_time": "2:24:57"}
221
+ {"current_steps": 221, "total_steps": 312, "loss": 0.5489, "lr": 2.387507176420256e-06, "epoch": 2.1216, "percentage": 70.83, "elapsed_time": "5:48:08", "remaining_time": "2:23:21"}
222
+ {"current_steps": 222, "total_steps": 312, "loss": 0.5195, "lr": 2.339839617423318e-06, "epoch": 2.1312, "percentage": 71.15, "elapsed_time": "5:49:34", "remaining_time": "2:21:43"}
223
+ {"current_steps": 223, "total_steps": 312, "loss": 0.5181, "lr": 2.2925069366813718e-06, "epoch": 2.1408, "percentage": 71.47, "elapsed_time": "5:51:03", "remaining_time": "2:20:06"}
224
+ {"current_steps": 224, "total_steps": 312, "loss": 0.5357, "lr": 2.245515092739488e-06, "epoch": 2.1504, "percentage": 71.79, "elapsed_time": "5:52:50", "remaining_time": "2:18:37"}
225
+ {"current_steps": 225, "total_steps": 312, "loss": 0.5389, "lr": 2.1988700012359865e-06, "epoch": 2.16, "percentage": 72.12, "elapsed_time": "5:54:26", "remaining_time": "2:17:03"}
226
+ {"current_steps": 226, "total_steps": 312, "loss": 0.4976, "lr": 2.1525775341577404e-06, "epoch": 2.1696, "percentage": 72.44, "elapsed_time": "5:55:49", "remaining_time": "2:15:23"}
227
+ {"current_steps": 227, "total_steps": 312, "loss": 0.5311, "lr": 2.1066435191009717e-06, "epoch": 2.1792, "percentage": 72.76, "elapsed_time": "5:57:41", "remaining_time": "2:13:56"}
228
+ {"current_steps": 228, "total_steps": 312, "loss": 0.5153, "lr": 2.061073738537635e-06, "epoch": 2.1888, "percentage": 73.08, "elapsed_time": "5:59:24", "remaining_time": "2:12:24"}
229
+ {"current_steps": 229, "total_steps": 312, "loss": 0.5571, "lr": 2.0158739290874822e-06, "epoch": 2.1984, "percentage": 73.4, "elapsed_time": "6:01:13", "remaining_time": "2:10:55"}
230
+ {"current_steps": 230, "total_steps": 312, "loss": 0.5989, "lr": 1.971049780795901e-06, "epoch": 2.208, "percentage": 73.72, "elapsed_time": "6:02:38", "remaining_time": "2:09:17"}
231
+ {"current_steps": 231, "total_steps": 312, "loss": 0.4818, "lr": 1.9266069364176144e-06, "epoch": 2.2176, "percentage": 74.04, "elapsed_time": "6:03:48", "remaining_time": "2:07:34"}
232
+ {"current_steps": 232, "total_steps": 312, "loss": 0.5287, "lr": 1.8825509907063328e-06, "epoch": 2.2272, "percentage": 74.36, "elapsed_time": "6:05:22", "remaining_time": "2:05:59"}
233
+ {"current_steps": 233, "total_steps": 312, "loss": 0.5527, "lr": 1.838887489710452e-06, "epoch": 2.2368, "percentage": 74.68, "elapsed_time": "6:07:05", "remaining_time": "2:04:27"}
234
+ {"current_steps": 234, "total_steps": 312, "loss": 0.4751, "lr": 1.7956219300748796e-06, "epoch": 2.2464, "percentage": 75.0, "elapsed_time": "6:08:35", "remaining_time": "2:02:51"}
235
+ {"current_steps": 235, "total_steps": 312, "loss": 0.5778, "lr": 1.7527597583490825e-06, "epoch": 2.2560000000000002, "percentage": 75.32, "elapsed_time": "6:10:10", "remaining_time": "2:01:17"}
236
+ {"current_steps": 236, "total_steps": 312, "loss": 0.5591, "lr": 1.7103063703014372e-06, "epoch": 2.2656, "percentage": 75.64, "elapsed_time": "6:11:53", "remaining_time": "1:59:45"}
237
+ {"current_steps": 237, "total_steps": 312, "loss": 0.5066, "lr": 1.6682671102399806e-06, "epoch": 2.2752, "percentage": 75.96, "elapsed_time": "6:13:36", "remaining_time": "1:58:13"}
238
+ {"current_steps": 238, "total_steps": 312, "loss": 0.5288, "lr": 1.6266472703396286e-06, "epoch": 2.2848, "percentage": 76.28, "elapsed_time": "6:15:04", "remaining_time": "1:56:37"}
239
+ {"current_steps": 239, "total_steps": 312, "loss": 0.5317, "lr": 1.5854520899759656e-06, "epoch": 2.2944, "percentage": 76.6, "elapsed_time": "6:16:20", "remaining_time": "1:54:56"}
240
+ {"current_steps": 240, "total_steps": 312, "loss": 0.5226, "lr": 1.544686755065677e-06, "epoch": 2.304, "percentage": 76.92, "elapsed_time": "6:17:47", "remaining_time": "1:53:20"}
241
+ {"current_steps": 241, "total_steps": 312, "loss": 0.5536, "lr": 1.5043563974137132e-06, "epoch": 2.3136, "percentage": 77.24, "elapsed_time": "6:19:11", "remaining_time": "1:51:42"}
242
+ {"current_steps": 242, "total_steps": 312, "loss": 0.5563, "lr": 1.4644660940672628e-06, "epoch": 2.3232, "percentage": 77.56, "elapsed_time": "6:21:04", "remaining_time": "1:50:13"}
243
+ {"current_steps": 243, "total_steps": 312, "loss": 0.4857, "lr": 1.4250208666766235e-06, "epoch": 2.3327999999999998, "percentage": 77.88, "elapsed_time": "6:22:44", "remaining_time": "1:48:40"}
244
+ {"current_steps": 244, "total_steps": 312, "loss": 0.4783, "lr": 1.3860256808630429e-06, "epoch": 2.3424, "percentage": 78.21, "elapsed_time": "6:24:10", "remaining_time": "1:47:04"}
245
+ {"current_steps": 245, "total_steps": 312, "loss": 0.5553, "lr": 1.3474854455936126e-06, "epoch": 2.352, "percentage": 78.53, "elapsed_time": "6:25:41", "remaining_time": "1:45:28"}
246
+ {"current_steps": 246, "total_steps": 312, "loss": 0.5389, "lr": 1.3094050125632973e-06, "epoch": 2.3616, "percentage": 78.85, "elapsed_time": "6:26:56", "remaining_time": "1:43:48"}
247
+ {"current_steps": 247, "total_steps": 312, "loss": 0.4804, "lr": 1.2717891755841722e-06, "epoch": 2.3712, "percentage": 79.17, "elapsed_time": "6:28:23", "remaining_time": "1:42:12"}
248
+ {"current_steps": 248, "total_steps": 312, "loss": 0.5717, "lr": 1.234642669981946e-06, "epoch": 2.3808, "percentage": 79.49, "elapsed_time": "6:29:56", "remaining_time": "1:40:37"}
249
+ {"current_steps": 249, "total_steps": 312, "loss": 0.5226, "lr": 1.1979701719998454e-06, "epoch": 2.3904, "percentage": 79.81, "elapsed_time": "6:31:38", "remaining_time": "1:39:05"}
250
+ {"current_steps": 250, "total_steps": 312, "loss": 0.5395, "lr": 1.1617762982099446e-06, "epoch": 2.4, "percentage": 80.13, "elapsed_time": "6:33:23", "remaining_time": "1:37:33"}
251
+ {"current_steps": 251, "total_steps": 312, "loss": 0.509, "lr": 1.1260656049319957e-06, "epoch": 2.4096, "percentage": 80.45, "elapsed_time": "6:35:04", "remaining_time": "1:36:00"}
252
+ {"current_steps": 252, "total_steps": 312, "loss": 0.5682, "lr": 1.0908425876598512e-06, "epoch": 2.4192, "percentage": 80.77, "elapsed_time": "6:36:48", "remaining_time": "1:34:28"}
253
+ {"current_steps": 253, "total_steps": 312, "loss": 0.5389, "lr": 1.0561116804955451e-06, "epoch": 2.4288, "percentage": 81.09, "elapsed_time": "6:38:24", "remaining_time": "1:32:54"}
254
+ {"current_steps": 254, "total_steps": 312, "loss": 0.4982, "lr": 1.0218772555910955e-06, "epoch": 2.4384, "percentage": 81.41, "elapsed_time": "6:39:57", "remaining_time": "1:31:19"}
255
+ {"current_steps": 255, "total_steps": 312, "loss": 0.5787, "lr": 9.881436225981107e-07, "epoch": 2.448, "percentage": 81.73, "elapsed_time": "6:41:53", "remaining_time": "1:29:50"}
256
+ {"current_steps": 256, "total_steps": 312, "loss": 0.4473, "lr": 9.549150281252633e-07, "epoch": 2.4576000000000002, "percentage": 82.05, "elapsed_time": "6:43:11", "remaining_time": "1:28:11"}
257
+ {"current_steps": 257, "total_steps": 312, "loss": 0.5655, "lr": 9.221956552036992e-07, "epoch": 2.4672, "percentage": 82.37, "elapsed_time": "6:44:56", "remaining_time": "1:26:39"}
258
+ {"current_steps": 258, "total_steps": 312, "loss": 0.5304, "lr": 8.899896227604509e-07, "epoch": 2.4768, "percentage": 82.69, "elapsed_time": "6:46:29", "remaining_time": "1:25:04"}
259
+ {"current_steps": 259, "total_steps": 312, "loss": 0.5282, "lr": 8.58300985099918e-07, "epoch": 2.4864, "percentage": 83.01, "elapsed_time": "6:47:56", "remaining_time": "1:23:28"}
260
+ {"current_steps": 260, "total_steps": 312, "loss": 0.5628, "lr": 8.271337313934869e-07, "epoch": 2.496, "percentage": 83.33, "elapsed_time": "6:49:43", "remaining_time": "1:21:56"}
261
+ {"current_steps": 261, "total_steps": 312, "loss": 0.5245, "lr": 7.964917851773496e-07, "epoch": 2.5056000000000003, "percentage": 83.65, "elapsed_time": "6:51:32", "remaining_time": "1:20:25"}
262
+ {"current_steps": 262, "total_steps": 312, "loss": 0.4994, "lr": 7.663790038585794e-07, "epoch": 2.5152, "percentage": 83.97, "elapsed_time": "6:52:49", "remaining_time": "1:18:47"}
263
+ {"current_steps": 263, "total_steps": 312, "loss": 0.5233, "lr": 7.367991782295392e-07, "epoch": 2.5248, "percentage": 84.29, "elapsed_time": "6:54:05", "remaining_time": "1:17:09"}
264
+ {"current_steps": 264, "total_steps": 312, "loss": 0.5305, "lr": 7.077560319906696e-07, "epoch": 2.5343999999999998, "percentage": 84.62, "elapsed_time": "6:55:49", "remaining_time": "1:15:36"}
265
+ {"current_steps": 265, "total_steps": 312, "loss": 0.5075, "lr": 6.792532212817271e-07, "epoch": 2.544, "percentage": 84.94, "elapsed_time": "6:57:06", "remaining_time": "1:13:58"}
266
+ {"current_steps": 266, "total_steps": 312, "loss": 0.5858, "lr": 6.512943342215234e-07, "epoch": 2.5536, "percentage": 85.26, "elapsed_time": "6:58:43", "remaining_time": "1:12:24"}
267
+ {"current_steps": 267, "total_steps": 312, "loss": 0.5053, "lr": 6.238828904562316e-07, "epoch": 2.5632, "percentage": 85.58, "elapsed_time": "7:00:05", "remaining_time": "1:10:48"}
268
+ {"current_steps": 268, "total_steps": 312, "loss": 0.5295, "lr": 5.9702234071631e-07, "epoch": 2.5728, "percentage": 85.9, "elapsed_time": "7:01:33", "remaining_time": "1:09:12"}
269
+ {"current_steps": 269, "total_steps": 312, "loss": 0.5053, "lr": 5.707160663821009e-07, "epoch": 2.5824, "percentage": 86.22, "elapsed_time": "7:03:11", "remaining_time": "1:07:38"}
270
+ {"current_steps": 270, "total_steps": 312, "loss": 0.5196, "lr": 5.449673790581611e-07, "epoch": 2.592, "percentage": 86.54, "elapsed_time": "7:04:55", "remaining_time": "1:06:05"}
271
+ {"current_steps": 271, "total_steps": 312, "loss": 0.5181, "lr": 5.197795201563744e-07, "epoch": 2.6016, "percentage": 86.86, "elapsed_time": "7:06:26", "remaining_time": "1:04:31"}
272
+ {"current_steps": 272, "total_steps": 312, "loss": 0.5888, "lr": 4.951556604879049e-07, "epoch": 2.6112, "percentage": 87.18, "elapsed_time": "7:08:22", "remaining_time": "1:02:59"}
273
+ {"current_steps": 273, "total_steps": 312, "loss": 0.5424, "lr": 4.710988998640298e-07, "epoch": 2.6208, "percentage": 87.5, "elapsed_time": "7:09:53", "remaining_time": "1:01:24"}
274
+ {"current_steps": 274, "total_steps": 312, "loss": 0.5004, "lr": 4.4761226670592074e-07, "epoch": 2.6304, "percentage": 87.82, "elapsed_time": "7:11:25", "remaining_time": "0:59:50"}
275
+ {"current_steps": 275, "total_steps": 312, "loss": 0.5305, "lr": 4.2469871766340096e-07, "epoch": 2.64, "percentage": 88.14, "elapsed_time": "7:13:06", "remaining_time": "0:58:16"}
276
+ {"current_steps": 276, "total_steps": 312, "loss": 0.5355, "lr": 4.0236113724274716e-07, "epoch": 2.6496, "percentage": 88.46, "elapsed_time": "7:14:23", "remaining_time": "0:56:39"}
277
+ {"current_steps": 277, "total_steps": 312, "loss": 0.5671, "lr": 3.8060233744356634e-07, "epoch": 2.6592000000000002, "percentage": 88.78, "elapsed_time": "7:16:07", "remaining_time": "0:55:06"}
278
+ {"current_steps": 278, "total_steps": 312, "loss": 0.5108, "lr": 3.5942505740480583e-07, "epoch": 2.6688, "percentage": 89.1, "elapsed_time": "7:17:46", "remaining_time": "0:53:32"}
279
+ {"current_steps": 279, "total_steps": 312, "loss": 0.5229, "lr": 3.3883196305992906e-07, "epoch": 2.6784, "percentage": 89.42, "elapsed_time": "7:19:06", "remaining_time": "0:51:56"}
280
+ {"current_steps": 280, "total_steps": 312, "loss": 0.5244, "lr": 3.18825646801314e-07, "epoch": 2.6879999999999997, "percentage": 89.74, "elapsed_time": "7:20:39", "remaining_time": "0:50:21"}
281
+ {"current_steps": 281, "total_steps": 312, "loss": 0.5123, "lr": 2.9940862715390483e-07, "epoch": 2.6976, "percentage": 90.06, "elapsed_time": "7:22:00", "remaining_time": "0:48:45"}
282
+ {"current_steps": 282, "total_steps": 312, "loss": 0.5092, "lr": 2.8058334845816214e-07, "epoch": 2.7072000000000003, "percentage": 90.38, "elapsed_time": "7:23:31", "remaining_time": "0:47:10"}
283
+ {"current_steps": 283, "total_steps": 312, "loss": 0.5442, "lr": 2.6235218056235633e-07, "epoch": 2.7168, "percentage": 90.71, "elapsed_time": "7:25:10", "remaining_time": "0:45:37"}
284
+ {"current_steps": 284, "total_steps": 312, "loss": 0.5711, "lr": 2.447174185242324e-07, "epoch": 2.7264, "percentage": 91.03, "elapsed_time": "7:26:39", "remaining_time": "0:44:02"}
285
+ {"current_steps": 285, "total_steps": 312, "loss": 0.5, "lr": 2.276812823220964e-07, "epoch": 2.7359999999999998, "percentage": 91.35, "elapsed_time": "7:28:10", "remaining_time": "0:42:27"}
286
+ {"current_steps": 286, "total_steps": 312, "loss": 0.5256, "lr": 2.1124591657534776e-07, "epoch": 2.7456, "percentage": 91.67, "elapsed_time": "7:29:40", "remaining_time": "0:40:52"}
287
+ {"current_steps": 287, "total_steps": 312, "loss": 0.5371, "lr": 1.9541339027450256e-07, "epoch": 2.7552, "percentage": 91.99, "elapsed_time": "7:31:25", "remaining_time": "0:39:19"}
288
+ {"current_steps": 288, "total_steps": 312, "loss": 0.5725, "lr": 1.801856965207338e-07, "epoch": 2.7648, "percentage": 92.31, "elapsed_time": "7:33:13", "remaining_time": "0:37:46"}
289
+ {"current_steps": 289, "total_steps": 312, "loss": 0.4762, "lr": 1.6556475227496816e-07, "epoch": 2.7744, "percentage": 92.63, "elapsed_time": "7:34:44", "remaining_time": "0:36:11"}
290
+ {"current_steps": 290, "total_steps": 312, "loss": 0.5404, "lr": 1.5155239811656562e-07, "epoch": 2.784, "percentage": 92.95, "elapsed_time": "7:36:16", "remaining_time": "0:34:36"}
291
+ {"current_steps": 291, "total_steps": 312, "loss": 0.5515, "lr": 1.3815039801161723e-07, "epoch": 2.7936, "percentage": 93.27, "elapsed_time": "7:37:58", "remaining_time": "0:33:02"}
292
+ {"current_steps": 292, "total_steps": 312, "loss": 0.5259, "lr": 1.253604390908819e-07, "epoch": 2.8032, "percentage": 93.59, "elapsed_time": "7:39:17", "remaining_time": "0:31:27"}
293
+ {"current_steps": 293, "total_steps": 312, "loss": 0.5366, "lr": 1.1318413143740436e-07, "epoch": 2.8128, "percentage": 93.91, "elapsed_time": "7:40:45", "remaining_time": "0:29:52"}
294
+ {"current_steps": 294, "total_steps": 312, "loss": 0.5674, "lr": 1.0162300788382263e-07, "epoch": 2.8224, "percentage": 94.23, "elapsed_time": "7:42:20", "remaining_time": "0:28:18"}
295
+ {"current_steps": 295, "total_steps": 312, "loss": 0.4563, "lr": 9.0678523819408e-08, "epoch": 2.832, "percentage": 94.55, "elapsed_time": "7:43:46", "remaining_time": "0:26:43"}
296
+ {"current_steps": 296, "total_steps": 312, "loss": 0.5201, "lr": 8.035205700685167e-08, "epoch": 2.8416, "percentage": 94.87, "elapsed_time": "7:45:03", "remaining_time": "0:25:08"}
297
+ {"current_steps": 297, "total_steps": 312, "loss": 0.574, "lr": 7.064490740882057e-08, "epoch": 2.8512, "percentage": 95.19, "elapsed_time": "7:46:33", "remaining_time": "0:23:33"}
298
+ {"current_steps": 298, "total_steps": 312, "loss": 0.5587, "lr": 6.15582970243117e-08, "epoch": 2.8608000000000002, "percentage": 95.51, "elapsed_time": "7:47:54", "remaining_time": "0:21:58"}
299
+ {"current_steps": 299, "total_steps": 312, "loss": 0.4771, "lr": 5.3093369734816824e-08, "epoch": 2.8704, "percentage": 95.83, "elapsed_time": "7:49:30", "remaining_time": "0:20:24"}
300
+ {"current_steps": 300, "total_steps": 312, "loss": 0.5471, "lr": 4.52511911603265e-08, "epoch": 2.88, "percentage": 96.15, "elapsed_time": "7:51:14", "remaining_time": "0:18:50"}
301
+ {"current_steps": 301, "total_steps": 312, "loss": 0.5279, "lr": 3.8032748525179684e-08, "epoch": 2.8895999999999997, "percentage": 96.47, "elapsed_time": "7:52:44", "remaining_time": "0:17:16"}
302
+ {"current_steps": 302, "total_steps": 312, "loss": 0.5488, "lr": 3.143895053378698e-08, "epoch": 2.8992, "percentage": 96.79, "elapsed_time": "7:54:24", "remaining_time": "0:15:42"}
303
+ {"current_steps": 303, "total_steps": 312, "loss": 0.5458, "lr": 2.547062725623828e-08, "epoch": 2.9088000000000003, "percentage": 97.12, "elapsed_time": "7:56:04", "remaining_time": "0:14:08"}
304
+ {"current_steps": 304, "total_steps": 312, "loss": 0.4718, "lr": 2.012853002380466e-08, "epoch": 2.9184, "percentage": 97.44, "elapsed_time": "7:57:42", "remaining_time": "0:12:34"}
305
+ {"current_steps": 305, "total_steps": 312, "loss": 0.552, "lr": 1.541333133436018e-08, "epoch": 2.928, "percentage": 97.76, "elapsed_time": "7:59:29", "remaining_time": "0:11:00"}
306
+ {"current_steps": 306, "total_steps": 312, "loss": 0.5287, "lr": 1.132562476771959e-08, "epoch": 2.9375999999999998, "percentage": 98.08, "elapsed_time": "8:00:53", "remaining_time": "0:09:25"}
307
+ {"current_steps": 307, "total_steps": 312, "loss": 0.4764, "lr": 7.865924910916977e-09, "epoch": 2.9472, "percentage": 98.4, "elapsed_time": "8:02:15", "remaining_time": "0:07:51"}
308
+ {"current_steps": 308, "total_steps": 312, "loss": 0.5559, "lr": 5.034667293427053e-09, "epoch": 2.9568, "percentage": 98.72, "elapsed_time": "8:03:53", "remaining_time": "0:06:17"}
309
+ {"current_steps": 309, "total_steps": 312, "loss": 0.4897, "lr": 2.8322083323334417e-09, "epoch": 2.9664, "percentage": 99.04, "elapsed_time": "8:05:19", "remaining_time": "0:04:42"}
310
+ {"current_steps": 310, "total_steps": 312, "loss": 0.5773, "lr": 1.2588252874673469e-09, "epoch": 2.976, "percentage": 99.36, "elapsed_time": "8:06:53", "remaining_time": "0:03:08"}
311
+ {"current_steps": 311, "total_steps": 312, "loss": 0.5365, "lr": 3.147162264971471e-10, "epoch": 2.9856, "percentage": 99.68, "elapsed_time": "8:08:25", "remaining_time": "0:01:34"}
312
+ {"current_steps": 312, "total_steps": 312, "loss": 0.5758, "lr": 0.0, "epoch": 2.9952, "percentage": 100.0, "elapsed_time": "8:10:10", "remaining_time": "0:00:00"}
313
+ {"current_steps": 312, "total_steps": 312, "epoch": 2.9952, "percentage": 100.0, "elapsed_time": "8:12:17", "remaining_time": "0:00:00"}