neginr commited on
Commit
1d407cd
·
verified ·
1 Parent(s): 095a287

Training in progress, epoch 0

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cafee2ebcb91ecd189b88b75865eb1a49ca38405f2983f12c6e4951bdb234d41
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3e32710c88092895ee260ec5a8ac0f8f5773d56a2f0f9655f0bae24f076e3878
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e9c3eada553cf7ac15c8c2c700d9a10314412c6914c000c2500aac9b15bf93c0
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:05ae56627f4c096baa5ad34d4e920d071ee8aa0ec98aa6e0f6e4f99a9efd70f5
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8e3644248b6be5029c8f0e4a1ef9684697170c8078ea81dc8dd8113ae99bae4a
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:efaf187383d1e6f0641df3806d03308d765e0572cb5dee80fc959f0b41837d5a
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8ff5425278bac4180f9c5c19eb48a4d9565faac3f923475b0ea6241897253baf
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a05a5fd5a9dd78297c0bd00789ed43d322cce523007f3cab9ab6596a494d5fc6
3
  size 1089994880
trainer_log.jsonl CHANGED
@@ -1,332 +1,138 @@
1
- {"current_steps": 1, "total_steps": 550, "loss": 0.8156, "lr": 1.4545454545454546e-06, "epoch": 0.00904977375565611, "percentage": 0.18, "elapsed_time": "0:02:30", "remaining_time": "22:56:04"}
2
- {"current_steps": 2, "total_steps": 550, "loss": 0.8156, "lr": 2.9090909090909093e-06, "epoch": 0.01809954751131222, "percentage": 0.36, "elapsed_time": "0:04:08", "remaining_time": "18:52:47"}
3
- {"current_steps": 3, "total_steps": 550, "loss": 0.7979, "lr": 4.363636363636364e-06, "epoch": 0.027149321266968326, "percentage": 0.55, "elapsed_time": "0:05:44", "remaining_time": "17:28:13"}
4
- {"current_steps": 4, "total_steps": 550, "loss": 0.7695, "lr": 5.8181818181818185e-06, "epoch": 0.03619909502262444, "percentage": 0.73, "elapsed_time": "0:07:21", "remaining_time": "16:44:41"}
5
- {"current_steps": 5, "total_steps": 550, "loss": 0.7246, "lr": 7.272727272727273e-06, "epoch": 0.04524886877828054, "percentage": 0.91, "elapsed_time": "0:08:58", "remaining_time": "16:18:37"}
6
- {"current_steps": 6, "total_steps": 550, "loss": 0.7081, "lr": 8.727272727272728e-06, "epoch": 0.05429864253393665, "percentage": 1.09, "elapsed_time": "0:10:35", "remaining_time": "16:00:27"}
7
- {"current_steps": 7, "total_steps": 550, "loss": 0.7281, "lr": 1.0181818181818182e-05, "epoch": 0.06334841628959276, "percentage": 1.27, "elapsed_time": "0:12:12", "remaining_time": "15:47:10"}
8
- {"current_steps": 8, "total_steps": 550, "loss": 0.7178, "lr": 1.1636363636363637e-05, "epoch": 0.07239819004524888, "percentage": 1.45, "elapsed_time": "0:13:49", "remaining_time": "15:36:22"}
9
- {"current_steps": 9, "total_steps": 550, "loss": 0.7186, "lr": 1.3090909090909092e-05, "epoch": 0.08144796380090498, "percentage": 1.64, "elapsed_time": "0:15:26", "remaining_time": "15:27:59"}
10
- {"current_steps": 10, "total_steps": 550, "loss": 0.7, "lr": 1.4545454545454546e-05, "epoch": 0.09049773755656108, "percentage": 1.82, "elapsed_time": "0:17:03", "remaining_time": "15:20:49"}
11
- {"current_steps": 11, "total_steps": 550, "loss": 0.663, "lr": 1.6000000000000003e-05, "epoch": 0.09954751131221719, "percentage": 2.0, "elapsed_time": "0:18:40", "remaining_time": "15:14:49"}
12
- {"current_steps": 12, "total_steps": 550, "loss": 0.6339, "lr": 1.7454545454545456e-05, "epoch": 0.1085972850678733, "percentage": 2.18, "elapsed_time": "0:20:17", "remaining_time": "15:09:39"}
13
- {"current_steps": 13, "total_steps": 550, "loss": 0.6293, "lr": 1.8909090909090912e-05, "epoch": 0.11764705882352941, "percentage": 2.36, "elapsed_time": "0:21:54", "remaining_time": "15:05:00"}
14
- {"current_steps": 14, "total_steps": 550, "loss": 0.5996, "lr": 2.0363636363636365e-05, "epoch": 0.12669683257918551, "percentage": 2.55, "elapsed_time": "0:23:31", "remaining_time": "15:00:34"}
15
- {"current_steps": 15, "total_steps": 550, "loss": 0.5915, "lr": 2.1818181818181818e-05, "epoch": 0.13574660633484162, "percentage": 2.73, "elapsed_time": "0:25:08", "remaining_time": "14:56:35"}
16
- {"current_steps": 16, "total_steps": 550, "loss": 0.5795, "lr": 2.3272727272727274e-05, "epoch": 0.14479638009049775, "percentage": 2.91, "elapsed_time": "0:26:45", "remaining_time": "14:52:55"}
17
- {"current_steps": 17, "total_steps": 550, "loss": 0.576, "lr": 2.4727272727272727e-05, "epoch": 0.15384615384615385, "percentage": 3.09, "elapsed_time": "0:28:22", "remaining_time": "14:49:31"}
18
- {"current_steps": 18, "total_steps": 550, "loss": 0.5644, "lr": 2.6181818181818183e-05, "epoch": 0.16289592760180996, "percentage": 3.27, "elapsed_time": "0:29:59", "remaining_time": "14:46:25"}
19
- {"current_steps": 19, "total_steps": 550, "loss": 0.5588, "lr": 2.763636363636364e-05, "epoch": 0.17194570135746606, "percentage": 3.45, "elapsed_time": "0:31:36", "remaining_time": "14:43:24"}
20
- {"current_steps": 20, "total_steps": 550, "loss": 0.5527, "lr": 2.9090909090909093e-05, "epoch": 0.18099547511312217, "percentage": 3.64, "elapsed_time": "0:33:13", "remaining_time": "14:40:32"}
21
- {"current_steps": 21, "total_steps": 550, "loss": 0.537, "lr": 3.054545454545455e-05, "epoch": 0.19004524886877827, "percentage": 3.82, "elapsed_time": "0:34:50", "remaining_time": "14:37:49"}
22
- {"current_steps": 22, "total_steps": 550, "loss": 0.5302, "lr": 3.2000000000000005e-05, "epoch": 0.19909502262443438, "percentage": 4.0, "elapsed_time": "0:36:27", "remaining_time": "14:35:10"}
23
- {"current_steps": 23, "total_steps": 550, "loss": 0.5312, "lr": 3.345454545454546e-05, "epoch": 0.2081447963800905, "percentage": 4.18, "elapsed_time": "0:38:04", "remaining_time": "14:32:34"}
24
- {"current_steps": 24, "total_steps": 550, "loss": 0.5404, "lr": 3.490909090909091e-05, "epoch": 0.2171945701357466, "percentage": 4.36, "elapsed_time": "0:39:41", "remaining_time": "14:30:00"}
25
- {"current_steps": 25, "total_steps": 550, "loss": 0.5403, "lr": 3.6363636363636364e-05, "epoch": 0.22624434389140272, "percentage": 4.55, "elapsed_time": "0:41:18", "remaining_time": "14:27:33"}
26
- {"current_steps": 26, "total_steps": 550, "loss": 0.5293, "lr": 3.7818181818181824e-05, "epoch": 0.23529411764705882, "percentage": 4.73, "elapsed_time": "0:42:55", "remaining_time": "14:25:05"}
27
- {"current_steps": 27, "total_steps": 550, "loss": 0.521, "lr": 3.927272727272728e-05, "epoch": 0.24434389140271492, "percentage": 4.91, "elapsed_time": "0:44:32", "remaining_time": "14:22:43"}
28
- {"current_steps": 28, "total_steps": 550, "loss": 0.5171, "lr": 4.072727272727273e-05, "epoch": 0.25339366515837103, "percentage": 5.09, "elapsed_time": "0:46:09", "remaining_time": "14:20:27"}
29
- {"current_steps": 29, "total_steps": 550, "loss": 0.5131, "lr": 4.218181818181818e-05, "epoch": 0.26244343891402716, "percentage": 5.27, "elapsed_time": "0:47:46", "remaining_time": "14:18:15"}
30
- {"current_steps": 30, "total_steps": 550, "loss": 0.5163, "lr": 4.3636363636363636e-05, "epoch": 0.27149321266968324, "percentage": 5.45, "elapsed_time": "0:49:23", "remaining_time": "14:16:03"}
31
- {"current_steps": 31, "total_steps": 550, "loss": 0.5136, "lr": 4.509090909090909e-05, "epoch": 0.28054298642533937, "percentage": 5.64, "elapsed_time": "0:51:00", "remaining_time": "14:13:55"}
32
- {"current_steps": 32, "total_steps": 550, "loss": 0.5111, "lr": 4.654545454545455e-05, "epoch": 0.2895927601809955, "percentage": 5.82, "elapsed_time": "0:52:37", "remaining_time": "14:11:45"}
33
- {"current_steps": 33, "total_steps": 550, "loss": 0.5057, "lr": 4.8e-05, "epoch": 0.2986425339366516, "percentage": 6.0, "elapsed_time": "0:54:13", "remaining_time": "14:09:38"}
34
- {"current_steps": 34, "total_steps": 550, "loss": 0.5055, "lr": 4.9454545454545454e-05, "epoch": 0.3076923076923077, "percentage": 6.18, "elapsed_time": "0:55:50", "remaining_time": "14:07:33"}
35
- {"current_steps": 35, "total_steps": 550, "loss": 0.4878, "lr": 5.0909090909090914e-05, "epoch": 0.3167420814479638, "percentage": 6.36, "elapsed_time": "0:57:27", "remaining_time": "14:05:32"}
36
- {"current_steps": 36, "total_steps": 550, "loss": 0.4989, "lr": 5.236363636363637e-05, "epoch": 0.3257918552036199, "percentage": 6.55, "elapsed_time": "0:59:04", "remaining_time": "14:03:29"}
37
- {"current_steps": 37, "total_steps": 550, "loss": 0.4893, "lr": 5.381818181818182e-05, "epoch": 0.334841628959276, "percentage": 6.73, "elapsed_time": "1:00:41", "remaining_time": "14:01:27"}
38
- {"current_steps": 38, "total_steps": 550, "loss": 0.487, "lr": 5.527272727272728e-05, "epoch": 0.3438914027149321, "percentage": 6.91, "elapsed_time": "1:02:18", "remaining_time": "13:59:27"}
39
- {"current_steps": 39, "total_steps": 550, "loss": 0.4906, "lr": 5.672727272727273e-05, "epoch": 0.35294117647058826, "percentage": 7.09, "elapsed_time": "1:03:55", "remaining_time": "13:57:30"}
40
- {"current_steps": 40, "total_steps": 550, "loss": 0.4904, "lr": 5.8181818181818185e-05, "epoch": 0.36199095022624433, "percentage": 7.27, "elapsed_time": "1:05:31", "remaining_time": "13:55:32"}
41
- {"current_steps": 41, "total_steps": 550, "loss": 0.484, "lr": 5.9636363636363645e-05, "epoch": 0.37104072398190047, "percentage": 7.45, "elapsed_time": "1:07:08", "remaining_time": "13:53:37"}
42
- {"current_steps": 42, "total_steps": 550, "loss": 0.475, "lr": 6.10909090909091e-05, "epoch": 0.38009049773755654, "percentage": 7.64, "elapsed_time": "1:08:45", "remaining_time": "13:51:41"}
43
- {"current_steps": 43, "total_steps": 550, "loss": 0.4961, "lr": 6.254545454545456e-05, "epoch": 0.3891402714932127, "percentage": 7.82, "elapsed_time": "1:10:22", "remaining_time": "13:49:49"}
44
- {"current_steps": 44, "total_steps": 550, "loss": 0.478, "lr": 6.400000000000001e-05, "epoch": 0.39819004524886875, "percentage": 8.0, "elapsed_time": "1:11:59", "remaining_time": "13:47:55"}
45
- {"current_steps": 45, "total_steps": 550, "loss": 0.4857, "lr": 6.545454545454546e-05, "epoch": 0.4072398190045249, "percentage": 8.18, "elapsed_time": "1:13:36", "remaining_time": "13:46:03"}
46
- {"current_steps": 46, "total_steps": 550, "loss": 0.4826, "lr": 6.690909090909092e-05, "epoch": 0.416289592760181, "percentage": 8.36, "elapsed_time": "1:15:13", "remaining_time": "13:44:12"}
47
- {"current_steps": 47, "total_steps": 550, "loss": 0.4757, "lr": 6.836363636363637e-05, "epoch": 0.4253393665158371, "percentage": 8.55, "elapsed_time": "1:16:50", "remaining_time": "13:42:21"}
48
- {"current_steps": 48, "total_steps": 550, "loss": 0.477, "lr": 6.981818181818182e-05, "epoch": 0.4343891402714932, "percentage": 8.73, "elapsed_time": "1:18:27", "remaining_time": "13:40:31"}
49
- {"current_steps": 49, "total_steps": 550, "loss": 0.475, "lr": 7.127272727272728e-05, "epoch": 0.4434389140271493, "percentage": 8.91, "elapsed_time": "1:20:04", "remaining_time": "13:38:42"}
50
- {"current_steps": 50, "total_steps": 550, "loss": 0.4784, "lr": 7.272727272727273e-05, "epoch": 0.45248868778280543, "percentage": 9.09, "elapsed_time": "1:21:41", "remaining_time": "13:36:51"}
51
- {"current_steps": 51, "total_steps": 550, "loss": 0.5044, "lr": 7.418181818181818e-05, "epoch": 0.46153846153846156, "percentage": 9.27, "elapsed_time": "1:23:18", "remaining_time": "13:35:03"}
52
- {"current_steps": 52, "total_steps": 550, "loss": 0.4854, "lr": 7.563636363636365e-05, "epoch": 0.47058823529411764, "percentage": 9.45, "elapsed_time": "1:24:54", "remaining_time": "13:33:12"}
53
- {"current_steps": 53, "total_steps": 550, "loss": 0.4873, "lr": 7.70909090909091e-05, "epoch": 0.4796380090497738, "percentage": 9.64, "elapsed_time": "1:26:31", "remaining_time": "13:31:24"}
54
- {"current_steps": 54, "total_steps": 550, "loss": 0.4775, "lr": 7.854545454545455e-05, "epoch": 0.48868778280542985, "percentage": 9.82, "elapsed_time": "1:28:08", "remaining_time": "13:29:36"}
55
- {"current_steps": 55, "total_steps": 550, "loss": 0.4818, "lr": 8e-05, "epoch": 0.497737556561086, "percentage": 10.0, "elapsed_time": "1:29:45", "remaining_time": "13:27:51"}
56
- {"current_steps": 56, "total_steps": 550, "loss": 0.5467, "lr": 7.999919440291627e-05, "epoch": 0.5067873303167421, "percentage": 10.18, "elapsed_time": "1:31:22", "remaining_time": "13:26:05"}
57
- {"current_steps": 57, "total_steps": 550, "loss": 0.5014, "lr": 7.999677764411438e-05, "epoch": 0.5158371040723982, "percentage": 10.36, "elapsed_time": "1:32:59", "remaining_time": "13:24:20"}
58
- {"current_steps": 58, "total_steps": 550, "loss": 0.4822, "lr": 7.999274982094104e-05, "epoch": 0.5248868778280543, "percentage": 10.55, "elapsed_time": "1:34:36", "remaining_time": "13:22:34"}
59
- {"current_steps": 59, "total_steps": 550, "loss": 0.4802, "lr": 7.998711109563637e-05, "epoch": 0.5339366515837104, "percentage": 10.73, "elapsed_time": "1:36:13", "remaining_time": "13:20:49"}
60
- {"current_steps": 60, "total_steps": 550, "loss": 0.4745, "lr": 7.997986169532741e-05, "epoch": 0.5429864253393665, "percentage": 10.91, "elapsed_time": "1:37:50", "remaining_time": "13:19:05"}
61
- {"current_steps": 61, "total_steps": 550, "loss": 0.4729, "lr": 7.997100191201896e-05, "epoch": 0.5520361990950227, "percentage": 11.09, "elapsed_time": "1:39:27", "remaining_time": "13:17:20"}
62
- {"current_steps": 62, "total_steps": 550, "loss": 0.46, "lr": 7.996053210258176e-05, "epoch": 0.5610859728506787, "percentage": 11.27, "elapsed_time": "1:41:04", "remaining_time": "13:15:36"}
63
- {"current_steps": 63, "total_steps": 550, "loss": 0.465, "lr": 7.994845268873825e-05, "epoch": 0.5701357466063348, "percentage": 11.45, "elapsed_time": "1:42:41", "remaining_time": "13:13:52"}
64
- {"current_steps": 64, "total_steps": 550, "loss": 0.4579, "lr": 7.993476415704543e-05, "epoch": 0.579185520361991, "percentage": 11.64, "elapsed_time": "1:44:18", "remaining_time": "13:12:09"}
65
- {"current_steps": 65, "total_steps": 550, "loss": 0.4757, "lr": 7.991946705887539e-05, "epoch": 0.5882352941176471, "percentage": 11.82, "elapsed_time": "1:45:56", "remaining_time": "13:10:25"}
66
- {"current_steps": 66, "total_steps": 550, "loss": 0.4714, "lr": 7.990256201039297e-05, "epoch": 0.5972850678733032, "percentage": 12.0, "elapsed_time": "1:47:32", "remaining_time": "13:08:41"}
67
- {"current_steps": 67, "total_steps": 550, "loss": 0.4779, "lr": 7.98840496925311e-05, "epoch": 0.6063348416289592, "percentage": 12.18, "elapsed_time": "1:49:10", "remaining_time": "13:06:58"}
68
- {"current_steps": 68, "total_steps": 550, "loss": 0.4794, "lr": 7.986393085096324e-05, "epoch": 0.6153846153846154, "percentage": 12.36, "elapsed_time": "1:50:46", "remaining_time": "13:05:15"}
69
- {"current_steps": 69, "total_steps": 550, "loss": 0.4708, "lr": 7.984220629607336e-05, "epoch": 0.6244343891402715, "percentage": 12.55, "elapsed_time": "1:52:24", "remaining_time": "13:03:33"}
70
- {"current_steps": 70, "total_steps": 550, "loss": 0.4712, "lr": 7.981887690292339e-05, "epoch": 0.6334841628959276, "percentage": 12.73, "elapsed_time": "1:54:01", "remaining_time": "13:01:50"}
71
- {"current_steps": 71, "total_steps": 550, "loss": 0.4667, "lr": 7.979394361121789e-05, "epoch": 0.6425339366515838, "percentage": 12.91, "elapsed_time": "1:55:38", "remaining_time": "13:00:08"}
72
- {"current_steps": 72, "total_steps": 550, "loss": 0.4682, "lr": 7.97674074252662e-05, "epoch": 0.6515837104072398, "percentage": 13.09, "elapsed_time": "1:57:15", "remaining_time": "12:58:25"}
73
- {"current_steps": 73, "total_steps": 550, "loss": 0.464, "lr": 7.9739269413942e-05, "epoch": 0.6606334841628959, "percentage": 13.27, "elapsed_time": "1:58:52", "remaining_time": "12:56:42"}
74
- {"current_steps": 74, "total_steps": 550, "loss": 0.4601, "lr": 7.970953071064036e-05, "epoch": 0.669683257918552, "percentage": 13.45, "elapsed_time": "2:00:28", "remaining_time": "12:54:59"}
75
- {"current_steps": 75, "total_steps": 550, "loss": 0.4633, "lr": 7.967819251323182e-05, "epoch": 0.6787330316742082, "percentage": 13.64, "elapsed_time": "2:02:05", "remaining_time": "12:53:17"}
76
- {"current_steps": 76, "total_steps": 550, "loss": 0.4577, "lr": 7.964525608401445e-05, "epoch": 0.6877828054298643, "percentage": 13.82, "elapsed_time": "2:03:42", "remaining_time": "12:51:35"}
77
- {"current_steps": 77, "total_steps": 550, "loss": 0.4562, "lr": 7.961072274966282e-05, "epoch": 0.6968325791855203, "percentage": 14.0, "elapsed_time": "2:05:20", "remaining_time": "12:49:54"}
78
- {"current_steps": 78, "total_steps": 550, "loss": 0.4523, "lr": 7.957459390117458e-05, "epoch": 0.7058823529411765, "percentage": 14.18, "elapsed_time": "2:06:57", "remaining_time": "12:48:12"}
79
- {"current_steps": 79, "total_steps": 550, "loss": 0.4602, "lr": 7.95368709938145e-05, "epoch": 0.7149321266968326, "percentage": 14.36, "elapsed_time": "2:08:34", "remaining_time": "12:46:31"}
80
- {"current_steps": 80, "total_steps": 550, "loss": 0.447, "lr": 7.949755554705577e-05, "epoch": 0.7239819004524887, "percentage": 14.55, "elapsed_time": "2:10:10", "remaining_time": "12:44:49"}
81
- {"current_steps": 81, "total_steps": 550, "loss": 0.4485, "lr": 7.945664914451888e-05, "epoch": 0.7330316742081447, "percentage": 14.73, "elapsed_time": "2:11:47", "remaining_time": "12:43:07"}
82
- {"current_steps": 82, "total_steps": 550, "loss": 0.4493, "lr": 7.941415343390773e-05, "epoch": 0.7420814479638009, "percentage": 14.91, "elapsed_time": "2:13:24", "remaining_time": "12:41:25"}
83
- {"current_steps": 83, "total_steps": 550, "loss": 0.4557, "lr": 7.937007012694335e-05, "epoch": 0.751131221719457, "percentage": 15.09, "elapsed_time": "2:15:01", "remaining_time": "12:39:43"}
84
- {"current_steps": 84, "total_steps": 550, "loss": 0.4617, "lr": 7.932440099929493e-05, "epoch": 0.7601809954751131, "percentage": 15.27, "elapsed_time": "2:16:38", "remaining_time": "12:38:02"}
85
- {"current_steps": 85, "total_steps": 550, "loss": 0.463, "lr": 7.927714789050826e-05, "epoch": 0.7692307692307693, "percentage": 15.45, "elapsed_time": "2:18:15", "remaining_time": "12:36:22"}
86
- {"current_steps": 86, "total_steps": 550, "loss": 0.4461, "lr": 7.92283127039317e-05, "epoch": 0.7782805429864253, "percentage": 15.64, "elapsed_time": "2:19:52", "remaining_time": "12:34:41"}
87
- {"current_steps": 87, "total_steps": 550, "loss": 0.4451, "lr": 7.917789740663941e-05, "epoch": 0.7873303167420814, "percentage": 15.82, "elapsed_time": "2:21:29", "remaining_time": "12:33:00"}
88
- {"current_steps": 88, "total_steps": 550, "loss": 0.4421, "lr": 7.912590402935223e-05, "epoch": 0.7963800904977375, "percentage": 16.0, "elapsed_time": "2:23:06", "remaining_time": "12:31:20"}
89
- {"current_steps": 89, "total_steps": 550, "loss": 0.4518, "lr": 7.907233466635582e-05, "epoch": 0.8054298642533937, "percentage": 16.18, "elapsed_time": "2:24:43", "remaining_time": "12:29:40"}
90
- {"current_steps": 90, "total_steps": 550, "loss": 0.4466, "lr": 7.90171914754163e-05, "epoch": 0.8144796380090498, "percentage": 16.36, "elapsed_time": "2:26:20", "remaining_time": "12:27:59"}
91
- {"current_steps": 91, "total_steps": 550, "loss": 0.4465, "lr": 7.896047667769335e-05, "epoch": 0.8235294117647058, "percentage": 16.55, "elapsed_time": "2:27:57", "remaining_time": "12:26:19"}
92
- {"current_steps": 92, "total_steps": 550, "loss": 0.4367, "lr": 7.890219255765077e-05, "epoch": 0.832579185520362, "percentage": 16.73, "elapsed_time": "2:29:35", "remaining_time": "12:24:40"}
93
- {"current_steps": 93, "total_steps": 550, "loss": 0.447, "lr": 7.884234146296442e-05, "epoch": 0.8416289592760181, "percentage": 16.91, "elapsed_time": "2:31:13", "remaining_time": "12:23:05"}
94
- {"current_steps": 94, "total_steps": 550, "loss": 0.4414, "lr": 7.878092580442766e-05, "epoch": 0.8506787330316742, "percentage": 17.09, "elapsed_time": "2:32:51", "remaining_time": "12:21:29"}
95
- {"current_steps": 95, "total_steps": 550, "loss": 0.4491, "lr": 7.871794805585427e-05, "epoch": 0.8597285067873304, "percentage": 17.27, "elapsed_time": "2:34:28", "remaining_time": "12:19:49"}
96
- {"current_steps": 96, "total_steps": 550, "loss": 0.4452, "lr": 7.865341075397874e-05, "epoch": 0.8687782805429864, "percentage": 17.45, "elapsed_time": "2:36:05", "remaining_time": "12:18:09"}
97
- {"current_steps": 97, "total_steps": 550, "loss": 0.4392, "lr": 7.858731649835424e-05, "epoch": 0.8778280542986425, "percentage": 17.64, "elapsed_time": "2:37:42", "remaining_time": "12:16:31"}
98
- {"current_steps": 98, "total_steps": 550, "loss": 0.4434, "lr": 7.85196679512477e-05, "epoch": 0.8868778280542986, "percentage": 17.82, "elapsed_time": "2:39:19", "remaining_time": "12:14:52"}
99
- {"current_steps": 99, "total_steps": 550, "loss": 0.4337, "lr": 7.845046783753276e-05, "epoch": 0.8959276018099548, "percentage": 18.0, "elapsed_time": "2:40:57", "remaining_time": "12:13:14"}
100
- {"current_steps": 100, "total_steps": 550, "loss": 0.4372, "lr": 7.837971894457991e-05, "epoch": 0.9049773755656109, "percentage": 18.18, "elapsed_time": "2:42:35", "remaining_time": "12:11:39"}
101
- {"current_steps": 101, "total_steps": 550, "loss": 0.4414, "lr": 7.830742412214422e-05, "epoch": 0.9140271493212669, "percentage": 18.36, "elapsed_time": "2:44:13", "remaining_time": "12:10:02"}
102
- {"current_steps": 102, "total_steps": 550, "loss": 0.441, "lr": 7.82335862822506e-05, "epoch": 0.9230769230769231, "percentage": 18.55, "elapsed_time": "2:45:50", "remaining_time": "12:08:24"}
103
- {"current_steps": 103, "total_steps": 550, "loss": 0.4304, "lr": 7.815820839907651e-05, "epoch": 0.9321266968325792, "percentage": 18.73, "elapsed_time": "2:47:28", "remaining_time": "12:06:46"}
104
- {"current_steps": 104, "total_steps": 550, "loss": 0.4417, "lr": 7.808129350883207e-05, "epoch": 0.9411764705882353, "percentage": 18.91, "elapsed_time": "2:49:05", "remaining_time": "12:05:09"}
105
- {"current_steps": 105, "total_steps": 550, "loss": 0.4402, "lr": 7.800284470963783e-05, "epoch": 0.9502262443438914, "percentage": 19.09, "elapsed_time": "2:50:42", "remaining_time": "12:03:30"}
106
- {"current_steps": 106, "total_steps": 550, "loss": 0.4363, "lr": 7.792286516139999e-05, "epoch": 0.9592760180995475, "percentage": 19.27, "elapsed_time": "2:52:20", "remaining_time": "12:01:53"}
107
- {"current_steps": 107, "total_steps": 550, "loss": 0.4315, "lr": 7.784135808568308e-05, "epoch": 0.9683257918552036, "percentage": 19.45, "elapsed_time": "2:53:58", "remaining_time": "12:00:16"}
108
- {"current_steps": 108, "total_steps": 550, "loss": 0.4433, "lr": 7.775832676558028e-05, "epoch": 0.9773755656108597, "percentage": 19.64, "elapsed_time": "2:55:35", "remaining_time": "11:58:38"}
109
- {"current_steps": 109, "total_steps": 550, "loss": 0.4382, "lr": 7.7673774545581e-05, "epoch": 0.9864253393665159, "percentage": 19.82, "elapsed_time": "2:57:13", "remaining_time": "11:57:01"}
110
- {"current_steps": 110, "total_steps": 550, "loss": 0.4406, "lr": 7.758770483143634e-05, "epoch": 0.995475113122172, "percentage": 20.0, "elapsed_time": "2:58:50", "remaining_time": "11:55:22"}
111
- {"current_steps": 111, "total_steps": 550, "loss": 0.7405, "lr": 7.750012109002185e-05, "epoch": 1.006787330316742, "percentage": 20.18, "elapsed_time": "3:01:56", "remaining_time": "11:59:34"}
112
- {"current_steps": 112, "total_steps": 550, "loss": 0.4453, "lr": 7.741102684919787e-05, "epoch": 1.0158371040723981, "percentage": 20.36, "elapsed_time": "3:03:34", "remaining_time": "11:57:53"}
113
- {"current_steps": 113, "total_steps": 550, "loss": 0.4238, "lr": 7.732042569766741e-05, "epoch": 1.0248868778280542, "percentage": 20.55, "elapsed_time": "3:05:11", "remaining_time": "11:56:12"}
114
- {"current_steps": 114, "total_steps": 550, "loss": 0.425, "lr": 7.722832128483165e-05, "epoch": 1.0339366515837105, "percentage": 20.73, "elapsed_time": "3:06:49", "remaining_time": "11:54:33"}
115
- {"current_steps": 115, "total_steps": 550, "loss": 0.4176, "lr": 7.71347173206429e-05, "epoch": 1.0429864253393666, "percentage": 20.91, "elapsed_time": "3:08:26", "remaining_time": "11:52:49"}
116
- {"current_steps": 116, "total_steps": 550, "loss": 0.4311, "lr": 7.703961757545522e-05, "epoch": 1.0520361990950227, "percentage": 21.09, "elapsed_time": "3:10:04", "remaining_time": "11:51:08"}
117
- {"current_steps": 117, "total_steps": 550, "loss": 0.4176, "lr": 7.694302587987245e-05, "epoch": 1.0610859728506787, "percentage": 21.27, "elapsed_time": "3:11:41", "remaining_time": "11:49:26"}
118
- {"current_steps": 118, "total_steps": 550, "loss": 0.4218, "lr": 7.6844946124594e-05, "epoch": 1.0701357466063348, "percentage": 21.45, "elapsed_time": "3:13:20", "remaining_time": "11:47:49"}
119
- {"current_steps": 119, "total_steps": 550, "loss": 0.4217, "lr": 7.674538226025815e-05, "epoch": 1.079185520361991, "percentage": 21.64, "elapsed_time": "3:14:58", "remaining_time": "11:46:09"}
120
- {"current_steps": 120, "total_steps": 550, "loss": 0.417, "lr": 7.664433829728279e-05, "epoch": 1.088235294117647, "percentage": 21.82, "elapsed_time": "3:16:36", "remaining_time": "11:44:31"}
121
- {"current_steps": 121, "total_steps": 550, "loss": 0.4089, "lr": 7.654181830570404e-05, "epoch": 1.0972850678733033, "percentage": 22.0, "elapsed_time": "3:18:14", "remaining_time": "11:42:50"}
122
- {"current_steps": 122, "total_steps": 550, "loss": 0.4082, "lr": 7.64378264150122e-05, "epoch": 1.1063348416289593, "percentage": 22.18, "elapsed_time": "3:19:51", "remaining_time": "11:41:09"}
123
- {"current_steps": 123, "total_steps": 550, "loss": 0.4125, "lr": 7.633236681398549e-05, "epoch": 1.1153846153846154, "percentage": 22.36, "elapsed_time": "3:21:29", "remaining_time": "11:39:28"}
124
- {"current_steps": 124, "total_steps": 550, "loss": 0.4219, "lr": 7.622544375052124e-05, "epoch": 1.1244343891402715, "percentage": 22.55, "elapsed_time": "3:23:06", "remaining_time": "11:37:46"}
125
- {"current_steps": 125, "total_steps": 550, "loss": 0.4103, "lr": 7.611706153146486e-05, "epoch": 1.1334841628959276, "percentage": 22.73, "elapsed_time": "3:24:43", "remaining_time": "11:36:03"}
126
- {"current_steps": 126, "total_steps": 550, "loss": 0.4144, "lr": 7.600722452243632e-05, "epoch": 1.1425339366515836, "percentage": 22.91, "elapsed_time": "3:26:20", "remaining_time": "11:34:20"}
127
- {"current_steps": 127, "total_steps": 550, "loss": 0.416, "lr": 7.589593714765434e-05, "epoch": 1.1515837104072397, "percentage": 23.09, "elapsed_time": "3:27:57", "remaining_time": "11:32:38"}
128
- {"current_steps": 128, "total_steps": 550, "loss": 0.4107, "lr": 7.578320388975816e-05, "epoch": 1.160633484162896, "percentage": 23.27, "elapsed_time": "3:29:34", "remaining_time": "11:30:55"}
129
- {"current_steps": 129, "total_steps": 550, "loss": 0.4107, "lr": 7.566902928962694e-05, "epoch": 1.169683257918552, "percentage": 23.45, "elapsed_time": "3:31:11", "remaining_time": "11:29:13"}
130
- {"current_steps": 130, "total_steps": 550, "loss": 0.4193, "lr": 7.555341794619695e-05, "epoch": 1.1787330316742082, "percentage": 23.64, "elapsed_time": "3:32:48", "remaining_time": "11:27:30"}
131
- {"current_steps": 131, "total_steps": 550, "loss": 0.403, "lr": 7.543637451627623e-05, "epoch": 1.1877828054298643, "percentage": 23.82, "elapsed_time": "3:34:25", "remaining_time": "11:25:48"}
132
- {"current_steps": 132, "total_steps": 550, "loss": 0.4066, "lr": 7.531790371435709e-05, "epoch": 1.1968325791855203, "percentage": 24.0, "elapsed_time": "3:36:02", "remaining_time": "11:24:06"}
133
- {"current_steps": 133, "total_steps": 550, "loss": 0.4151, "lr": 7.519801031242613e-05, "epoch": 1.2058823529411764, "percentage": 24.18, "elapsed_time": "3:37:38", "remaining_time": "11:22:24"}
134
- {"current_steps": 134, "total_steps": 550, "loss": 0.4089, "lr": 7.507669913977213e-05, "epoch": 1.2149321266968327, "percentage": 24.36, "elapsed_time": "3:39:15", "remaining_time": "11:20:42"}
135
- {"current_steps": 135, "total_steps": 550, "loss": 0.405, "lr": 7.49539750827914e-05, "epoch": 1.2239819004524888, "percentage": 24.55, "elapsed_time": "3:40:52", "remaining_time": "11:18:59"}
136
- {"current_steps": 136, "total_steps": 550, "loss": 0.4065, "lr": 7.482984308479109e-05, "epoch": 1.2330316742081449, "percentage": 24.73, "elapsed_time": "3:42:29", "remaining_time": "11:17:18"}
137
- {"current_steps": 137, "total_steps": 550, "loss": 0.4113, "lr": 7.470430814578997e-05, "epoch": 1.242081447963801, "percentage": 24.91, "elapsed_time": "3:44:06", "remaining_time": "11:15:36"}
138
- {"current_steps": 138, "total_steps": 550, "loss": 0.4064, "lr": 7.457737532231708e-05, "epoch": 1.251131221719457, "percentage": 25.09, "elapsed_time": "3:45:43", "remaining_time": "11:13:54"}
139
- {"current_steps": 139, "total_steps": 550, "loss": 0.4035, "lr": 7.444904972720803e-05, "epoch": 1.260180995475113, "percentage": 25.27, "elapsed_time": "3:47:20", "remaining_time": "11:12:13"}
140
- {"current_steps": 140, "total_steps": 550, "loss": 0.4118, "lr": 7.431933652939909e-05, "epoch": 1.2692307692307692, "percentage": 25.45, "elapsed_time": "3:48:57", "remaining_time": "11:10:31"}
141
- {"current_steps": 141, "total_steps": 550, "loss": 0.401, "lr": 7.418824095371895e-05, "epoch": 1.2782805429864252, "percentage": 25.64, "elapsed_time": "3:50:34", "remaining_time": "11:08:50"}
142
- {"current_steps": 142, "total_steps": 550, "loss": 0.4099, "lr": 7.405576828067829e-05, "epoch": 1.2873303167420813, "percentage": 25.82, "elapsed_time": "3:52:11", "remaining_time": "11:07:08"}
143
- {"current_steps": 143, "total_steps": 550, "loss": 0.4046, "lr": 7.392192384625704e-05, "epoch": 1.2963800904977376, "percentage": 26.0, "elapsed_time": "3:53:48", "remaining_time": "11:05:26"}
144
- {"current_steps": 144, "total_steps": 550, "loss": 0.4053, "lr": 7.378671304168955e-05, "epoch": 1.3054298642533937, "percentage": 26.18, "elapsed_time": "3:55:25", "remaining_time": "11:03:45"}
145
- {"current_steps": 145, "total_steps": 550, "loss": 0.4048, "lr": 7.365014131324725e-05, "epoch": 1.3144796380090498, "percentage": 26.36, "elapsed_time": "3:57:02", "remaining_time": "11:02:03"}
146
- {"current_steps": 146, "total_steps": 550, "loss": 0.4052, "lr": 7.35122141620195e-05, "epoch": 1.3235294117647058, "percentage": 26.55, "elapsed_time": "3:58:38", "remaining_time": "11:00:22"}
147
- {"current_steps": 147, "total_steps": 550, "loss": 0.3967, "lr": 7.337293714369182e-05, "epoch": 1.332579185520362, "percentage": 26.73, "elapsed_time": "4:00:15", "remaining_time": "10:58:40"}
148
- {"current_steps": 148, "total_steps": 550, "loss": 0.403, "lr": 7.323231586832219e-05, "epoch": 1.3416289592760182, "percentage": 26.91, "elapsed_time": "4:01:52", "remaining_time": "10:57:00"}
149
- {"current_steps": 149, "total_steps": 550, "loss": 0.3994, "lr": 7.30903560001151e-05, "epoch": 1.3506787330316743, "percentage": 27.09, "elapsed_time": "4:03:29", "remaining_time": "10:55:19"}
150
- {"current_steps": 150, "total_steps": 550, "loss": 0.4047, "lr": 7.294706325719331e-05, "epoch": 1.3597285067873304, "percentage": 27.27, "elapsed_time": "4:05:06", "remaining_time": "10:53:38"}
151
- {"current_steps": 151, "total_steps": 550, "loss": 0.4077, "lr": 7.280244341136765e-05, "epoch": 1.3687782805429864, "percentage": 27.45, "elapsed_time": "4:06:43", "remaining_time": "10:51:57"}
152
- {"current_steps": 152, "total_steps": 550, "loss": 0.405, "lr": 7.26565022879044e-05, "epoch": 1.3778280542986425, "percentage": 27.64, "elapsed_time": "4:08:20", "remaining_time": "10:50:16"}
153
- {"current_steps": 153, "total_steps": 550, "loss": 0.403, "lr": 7.250924576529072e-05, "epoch": 1.3868778280542986, "percentage": 27.82, "elapsed_time": "4:09:57", "remaining_time": "10:48:36"}
154
- {"current_steps": 154, "total_steps": 550, "loss": 0.4056, "lr": 7.236067977499791e-05, "epoch": 1.3959276018099547, "percentage": 28.0, "elapsed_time": "4:11:34", "remaining_time": "10:46:55"}
155
- {"current_steps": 155, "total_steps": 550, "loss": 0.4056, "lr": 7.221081030124235e-05, "epoch": 1.4049773755656108, "percentage": 28.18, "elapsed_time": "4:13:11", "remaining_time": "10:45:14"}
156
- {"current_steps": 156, "total_steps": 550, "loss": 0.4043, "lr": 7.205964338074462e-05, "epoch": 1.4140271493212668, "percentage": 28.36, "elapsed_time": "4:14:48", "remaining_time": "10:43:33"}
157
- {"current_steps": 157, "total_steps": 550, "loss": 0.4056, "lr": 7.190718510248622e-05, "epoch": 1.4230769230769231, "percentage": 28.55, "elapsed_time": "4:16:25", "remaining_time": "10:41:52"}
158
- {"current_steps": 158, "total_steps": 550, "loss": 0.4053, "lr": 7.175344160746438e-05, "epoch": 1.4321266968325792, "percentage": 28.73, "elapsed_time": "4:18:02", "remaining_time": "10:40:11"}
159
- {"current_steps": 159, "total_steps": 550, "loss": 0.3935, "lr": 7.159841908844465e-05, "epoch": 1.4411764705882353, "percentage": 28.91, "elapsed_time": "4:19:38", "remaining_time": "10:38:30"}
160
- {"current_steps": 160, "total_steps": 550, "loss": 0.4012, "lr": 7.144212378971151e-05, "epoch": 1.4502262443438914, "percentage": 29.09, "elapsed_time": "4:21:15", "remaining_time": "10:36:49"}
161
- {"current_steps": 161, "total_steps": 550, "loss": 0.3952, "lr": 7.128456200681678e-05, "epoch": 1.4592760180995474, "percentage": 29.27, "elapsed_time": "4:22:52", "remaining_time": "10:35:08"}
162
- {"current_steps": 162, "total_steps": 550, "loss": 0.3905, "lr": 7.11257400863261e-05, "epoch": 1.4683257918552037, "percentage": 29.45, "elapsed_time": "4:24:29", "remaining_time": "10:33:28"}
163
- {"current_steps": 163, "total_steps": 550, "loss": 0.3964, "lr": 7.096566442556331e-05, "epoch": 1.4773755656108598, "percentage": 29.64, "elapsed_time": "4:26:06", "remaining_time": "10:31:48"}
164
- {"current_steps": 164, "total_steps": 550, "loss": 0.3949, "lr": 7.080434147235263e-05, "epoch": 1.4864253393665159, "percentage": 29.82, "elapsed_time": "4:27:43", "remaining_time": "10:30:07"}
165
- {"current_steps": 165, "total_steps": 550, "loss": 0.4037, "lr": 7.064177772475912e-05, "epoch": 1.495475113122172, "percentage": 30.0, "elapsed_time": "4:29:20", "remaining_time": "10:28:27"}
166
- {"current_steps": 166, "total_steps": 550, "loss": 0.4021, "lr": 7.047797973082684e-05, "epoch": 1.504524886877828, "percentage": 30.18, "elapsed_time": "4:30:57", "remaining_time": "10:26:47"}
167
- {"current_steps": 167, "total_steps": 550, "loss": 0.3913, "lr": 7.031295408831508e-05, "epoch": 1.5135746606334841, "percentage": 30.36, "elapsed_time": "4:32:34", "remaining_time": "10:25:07"}
168
- {"current_steps": 168, "total_steps": 550, "loss": 0.4031, "lr": 7.014670744443267e-05, "epoch": 1.5226244343891402, "percentage": 30.55, "elapsed_time": "4:34:11", "remaining_time": "10:23:27"}
169
- {"current_steps": 169, "total_steps": 550, "loss": 0.3981, "lr": 6.997924649557017e-05, "epoch": 1.5316742081447963, "percentage": 30.73, "elapsed_time": "4:35:48", "remaining_time": "10:21:47"}
170
- {"current_steps": 170, "total_steps": 550, "loss": 0.3992, "lr": 6.98105779870302e-05, "epoch": 1.5407239819004523, "percentage": 30.91, "elapsed_time": "4:37:25", "remaining_time": "10:20:07"}
171
- {"current_steps": 171, "total_steps": 550, "loss": 0.3983, "lr": 6.964070871275567e-05, "epoch": 1.5497737556561086, "percentage": 31.09, "elapsed_time": "4:39:02", "remaining_time": "10:18:27"}
172
- {"current_steps": 172, "total_steps": 550, "loss": 0.3993, "lr": 6.94696455150562e-05, "epoch": 1.5588235294117647, "percentage": 31.27, "elapsed_time": "4:40:39", "remaining_time": "10:16:47"}
173
- {"current_steps": 173, "total_steps": 550, "loss": 0.3979, "lr": 6.929739528433244e-05, "epoch": 1.5678733031674208, "percentage": 31.45, "elapsed_time": "4:42:16", "remaining_time": "10:15:07"}
174
- {"current_steps": 174, "total_steps": 550, "loss": 0.3976, "lr": 6.912396495879857e-05, "epoch": 1.5769230769230769, "percentage": 31.64, "elapsed_time": "4:43:53", "remaining_time": "10:13:27"}
175
- {"current_steps": 175, "total_steps": 550, "loss": 0.3985, "lr": 6.89493615242028e-05, "epoch": 1.5859728506787332, "percentage": 31.82, "elapsed_time": "4:45:30", "remaining_time": "10:11:47"}
176
- {"current_steps": 176, "total_steps": 550, "loss": 0.3956, "lr": 6.877359201354606e-05, "epoch": 1.5950226244343892, "percentage": 32.0, "elapsed_time": "4:47:07", "remaining_time": "10:10:07"}
177
- {"current_steps": 177, "total_steps": 550, "loss": 0.3976, "lr": 6.859666350679854e-05, "epoch": 1.6040723981900453, "percentage": 32.18, "elapsed_time": "4:48:44", "remaining_time": "10:08:28"}
178
- {"current_steps": 178, "total_steps": 550, "loss": 0.3924, "lr": 6.841858313061477e-05, "epoch": 1.6131221719457014, "percentage": 32.36, "elapsed_time": "4:50:21", "remaining_time": "10:06:48"}
179
- {"current_steps": 179, "total_steps": 550, "loss": 0.3994, "lr": 6.823935805804626e-05, "epoch": 1.6221719457013575, "percentage": 32.55, "elapsed_time": "4:51:58", "remaining_time": "10:05:08"}
180
- {"current_steps": 180, "total_steps": 550, "loss": 0.3899, "lr": 6.805899550825285e-05, "epoch": 1.6312217194570136, "percentage": 32.73, "elapsed_time": "4:53:34", "remaining_time": "10:03:28"}
181
- {"current_steps": 181, "total_steps": 550, "loss": 0.3872, "lr": 6.787750274621175e-05, "epoch": 1.6402714932126696, "percentage": 32.91, "elapsed_time": "4:55:11", "remaining_time": "10:01:48"}
182
- {"current_steps": 182, "total_steps": 550, "loss": 0.395, "lr": 6.769488708242492e-05, "epoch": 1.6493212669683257, "percentage": 33.09, "elapsed_time": "4:56:48", "remaining_time": "10:00:08"}
183
- {"current_steps": 183, "total_steps": 550, "loss": 0.3936, "lr": 6.751115587262469e-05, "epoch": 1.6583710407239818, "percentage": 33.27, "elapsed_time": "4:58:25", "remaining_time": "9:58:29"}
184
- {"current_steps": 184, "total_steps": 550, "loss": 0.3905, "lr": 6.732631651747739e-05, "epoch": 1.6674208144796379, "percentage": 33.45, "elapsed_time": "5:00:02", "remaining_time": "9:56:49"}
185
- {"current_steps": 185, "total_steps": 550, "loss": 0.3936, "lr": 6.714037646228529e-05, "epoch": 1.6764705882352942, "percentage": 33.64, "elapsed_time": "5:01:39", "remaining_time": "9:55:10"}
186
- {"current_steps": 186, "total_steps": 550, "loss": 0.3918, "lr": 6.695334319668672e-05, "epoch": 1.6855203619909502, "percentage": 33.82, "elapsed_time": "5:03:16", "remaining_time": "9:53:30"}
187
- {"current_steps": 187, "total_steps": 550, "loss": 0.3964, "lr": 6.676522425435433e-05, "epoch": 1.6945701357466063, "percentage": 34.0, "elapsed_time": "5:04:53", "remaining_time": "9:51:51"}
188
- {"current_steps": 188, "total_steps": 550, "loss": 0.3955, "lr": 6.65760272126917e-05, "epoch": 1.7036199095022626, "percentage": 34.18, "elapsed_time": "5:06:30", "remaining_time": "9:50:12"}
189
- {"current_steps": 189, "total_steps": 550, "loss": 0.388, "lr": 6.638575969252806e-05, "epoch": 1.7126696832579187, "percentage": 34.36, "elapsed_time": "5:08:07", "remaining_time": "9:48:32"}
190
- {"current_steps": 190, "total_steps": 550, "loss": 0.3943, "lr": 6.619442935781141e-05, "epoch": 1.7217194570135748, "percentage": 34.55, "elapsed_time": "5:09:44", "remaining_time": "9:46:53"}
191
- {"current_steps": 191, "total_steps": 550, "loss": 0.3929, "lr": 6.600204391529971e-05, "epoch": 1.7307692307692308, "percentage": 34.73, "elapsed_time": "5:11:21", "remaining_time": "9:45:14"}
192
- {"current_steps": 192, "total_steps": 550, "loss": 0.3929, "lr": 6.580861111425053e-05, "epoch": 1.739819004524887, "percentage": 34.91, "elapsed_time": "5:12:58", "remaining_time": "9:43:34"}
193
- {"current_steps": 193, "total_steps": 550, "loss": 0.3899, "lr": 6.56141387461089e-05, "epoch": 1.748868778280543, "percentage": 35.09, "elapsed_time": "5:14:35", "remaining_time": "9:41:55"}
194
- {"current_steps": 194, "total_steps": 550, "loss": 0.395, "lr": 6.541863464419346e-05, "epoch": 1.757918552036199, "percentage": 35.27, "elapsed_time": "5:16:12", "remaining_time": "9:40:16"}
195
- {"current_steps": 195, "total_steps": 550, "loss": 0.3845, "lr": 6.52221066833809e-05, "epoch": 1.7669683257918551, "percentage": 35.45, "elapsed_time": "5:17:49", "remaining_time": "9:38:36"}
196
- {"current_steps": 196, "total_steps": 550, "loss": 0.39, "lr": 6.502456277978887e-05, "epoch": 1.7760180995475112, "percentage": 35.64, "elapsed_time": "5:19:26", "remaining_time": "9:36:57"}
197
- {"current_steps": 197, "total_steps": 550, "loss": 0.3878, "lr": 6.482601089045696e-05, "epoch": 1.7850678733031673, "percentage": 35.82, "elapsed_time": "5:21:03", "remaining_time": "9:35:18"}
198
- {"current_steps": 198, "total_steps": 550, "loss": 0.3827, "lr": 6.462645901302633e-05, "epoch": 1.7941176470588234, "percentage": 36.0, "elapsed_time": "5:22:40", "remaining_time": "9:33:38"}
199
- {"current_steps": 199, "total_steps": 550, "loss": 0.383, "lr": 6.442591518541753e-05, "epoch": 1.8031674208144797, "percentage": 36.18, "elapsed_time": "5:24:17", "remaining_time": "9:31:59"}
200
- {"current_steps": 200, "total_steps": 550, "loss": 0.3867, "lr": 6.422438748550667e-05, "epoch": 1.8122171945701357, "percentage": 36.36, "elapsed_time": "5:25:54", "remaining_time": "9:30:20"}
201
- {"current_steps": 201, "total_steps": 550, "loss": 0.3906, "lr": 6.402188403080013e-05, "epoch": 1.8212669683257918, "percentage": 36.55, "elapsed_time": "5:27:31", "remaining_time": "9:28:41"}
202
- {"current_steps": 202, "total_steps": 550, "loss": 0.3856, "lr": 6.381841297810753e-05, "epoch": 1.8303167420814481, "percentage": 36.73, "elapsed_time": "5:29:08", "remaining_time": "9:27:02"}
203
- {"current_steps": 203, "total_steps": 550, "loss": 0.3893, "lr": 6.361398252321321e-05, "epoch": 1.8393665158371042, "percentage": 36.91, "elapsed_time": "5:30:45", "remaining_time": "9:25:23"}
204
- {"current_steps": 204, "total_steps": 550, "loss": 0.3851, "lr": 6.340860090054608e-05, "epoch": 1.8484162895927603, "percentage": 37.09, "elapsed_time": "5:32:22", "remaining_time": "9:23:44"}
205
- {"current_steps": 205, "total_steps": 550, "loss": 0.3868, "lr": 6.320227638284793e-05, "epoch": 1.8574660633484164, "percentage": 37.27, "elapsed_time": "5:33:59", "remaining_time": "9:22:05"}
206
- {"current_steps": 206, "total_steps": 550, "loss": 0.3921, "lr": 6.29950172808403e-05, "epoch": 1.8665158371040724, "percentage": 37.45, "elapsed_time": "5:35:36", "remaining_time": "9:20:25"}
207
- {"current_steps": 207, "total_steps": 550, "loss": 0.3849, "lr": 6.278683194288956e-05, "epoch": 1.8755656108597285, "percentage": 37.64, "elapsed_time": "5:37:13", "remaining_time": "9:18:46"}
208
- {"current_steps": 208, "total_steps": 550, "loss": 0.3904, "lr": 6.257772875467078e-05, "epoch": 1.8846153846153846, "percentage": 37.82, "elapsed_time": "5:38:51", "remaining_time": "9:17:09"}
209
- {"current_steps": 209, "total_steps": 550, "loss": 0.3918, "lr": 6.236771613882987e-05, "epoch": 1.8936651583710407, "percentage": 38.0, "elapsed_time": "5:40:28", "remaining_time": "9:15:30"}
210
- {"current_steps": 210, "total_steps": 550, "loss": 0.3871, "lr": 6.215680255464442e-05, "epoch": 1.9027149321266967, "percentage": 38.18, "elapsed_time": "5:42:05", "remaining_time": "9:13:51"}
211
- {"current_steps": 211, "total_steps": 550, "loss": 0.3898, "lr": 6.194499649768281e-05, "epoch": 1.9117647058823528, "percentage": 38.36, "elapsed_time": "5:43:42", "remaining_time": "9:12:12"}
212
- {"current_steps": 212, "total_steps": 550, "loss": 0.3843, "lr": 6.173230649946213e-05, "epoch": 1.9208144796380089, "percentage": 38.55, "elapsed_time": "5:45:19", "remaining_time": "9:10:33"}
213
- {"current_steps": 213, "total_steps": 550, "loss": 0.3831, "lr": 6.15187411271045e-05, "epoch": 1.9298642533936652, "percentage": 38.73, "elapsed_time": "5:46:56", "remaining_time": "9:08:55"}
214
- {"current_steps": 214, "total_steps": 550, "loss": 0.3857, "lr": 6.130430898299199e-05, "epoch": 1.9389140271493213, "percentage": 38.91, "elapsed_time": "5:48:33", "remaining_time": "9:07:16"}
215
- {"current_steps": 215, "total_steps": 550, "loss": 0.3873, "lr": 6.10890187044201e-05, "epoch": 1.9479638009049773, "percentage": 39.09, "elapsed_time": "5:50:10", "remaining_time": "9:05:37"}
216
- {"current_steps": 216, "total_steps": 550, "loss": 0.3859, "lr": 6.087287896324984e-05, "epoch": 1.9570135746606336, "percentage": 39.27, "elapsed_time": "5:51:47", "remaining_time": "9:03:58"}
217
- {"current_steps": 217, "total_steps": 550, "loss": 0.3913, "lr": 6.0655898465558484e-05, "epoch": 1.9660633484162897, "percentage": 39.45, "elapsed_time": "5:53:24", "remaining_time": "9:02:19"}
218
- {"current_steps": 218, "total_steps": 550, "loss": 0.3829, "lr": 6.043808595128883e-05, "epoch": 1.9751131221719458, "percentage": 39.64, "elapsed_time": "5:55:02", "remaining_time": "9:00:41"}
219
- {"current_steps": 219, "total_steps": 550, "loss": 0.3918, "lr": 6.021945019389719e-05, "epoch": 1.9841628959276019, "percentage": 39.82, "elapsed_time": "5:56:39", "remaining_time": "8:59:03"}
220
- {"current_steps": 220, "total_steps": 550, "loss": 0.385, "lr": 6.000000000000001e-05, "epoch": 1.993212669683258, "percentage": 40.0, "elapsed_time": "5:58:16", "remaining_time": "8:57:24"}
221
- {"current_steps": 221, "total_steps": 550, "loss": 0.6705, "lr": 5.977974420901908e-05, "epoch": 2.004524886877828, "percentage": 40.18, "elapsed_time": "6:01:27", "remaining_time": "8:58:05"}
222
- {"current_steps": 222, "total_steps": 550, "loss": 0.364, "lr": 5.955869169282556e-05, "epoch": 2.013574660633484, "percentage": 40.36, "elapsed_time": "6:03:03", "remaining_time": "8:56:25"}
223
- {"current_steps": 223, "total_steps": 550, "loss": 0.3695, "lr": 5.9336851355382557e-05, "epoch": 2.02262443438914, "percentage": 40.55, "elapsed_time": "6:04:41", "remaining_time": "8:54:46"}
224
- {"current_steps": 224, "total_steps": 550, "loss": 0.3643, "lr": 5.911423213238653e-05, "epoch": 2.0316742081447963, "percentage": 40.73, "elapsed_time": "6:06:18", "remaining_time": "8:53:06"}
225
- {"current_steps": 225, "total_steps": 550, "loss": 0.3601, "lr": 5.889084299090732e-05, "epoch": 2.0407239819004523, "percentage": 40.91, "elapsed_time": "6:07:55", "remaining_time": "8:51:27"}
226
- {"current_steps": 226, "total_steps": 550, "loss": 0.3645, "lr": 5.866669292902695e-05, "epoch": 2.0497737556561084, "percentage": 41.09, "elapsed_time": "6:09:32", "remaining_time": "8:49:47"}
227
- {"current_steps": 227, "total_steps": 550, "loss": 0.363, "lr": 5.844179097547725e-05, "epoch": 2.0588235294117645, "percentage": 41.27, "elapsed_time": "6:11:09", "remaining_time": "8:48:07"}
228
- {"current_steps": 228, "total_steps": 550, "loss": 0.3593, "lr": 5.821614618927613e-05, "epoch": 2.067873303167421, "percentage": 41.45, "elapsed_time": "6:12:46", "remaining_time": "8:46:28"}
229
- {"current_steps": 229, "total_steps": 550, "loss": 0.3647, "lr": 5.798976765936264e-05, "epoch": 2.076923076923077, "percentage": 41.64, "elapsed_time": "6:14:23", "remaining_time": "8:44:48"}
230
- {"current_steps": 230, "total_steps": 550, "loss": 0.3587, "lr": 5.776266450423097e-05, "epoch": 2.085972850678733, "percentage": 41.82, "elapsed_time": "6:16:01", "remaining_time": "8:43:09"}
231
- {"current_steps": 231, "total_steps": 550, "loss": 0.3627, "lr": 5.75348458715631e-05, "epoch": 2.0950226244343892, "percentage": 42.0, "elapsed_time": "6:17:38", "remaining_time": "8:41:29"}
232
- {"current_steps": 232, "total_steps": 550, "loss": 0.3541, "lr": 5.7306320937860336e-05, "epoch": 2.1040723981900453, "percentage": 42.18, "elapsed_time": "6:19:15", "remaining_time": "8:39:50"}
233
- {"current_steps": 233, "total_steps": 550, "loss": 0.3651, "lr": 5.7077098908073676e-05, "epoch": 2.1131221719457014, "percentage": 42.36, "elapsed_time": "6:20:52", "remaining_time": "8:38:11"}
234
- {"current_steps": 234, "total_steps": 550, "loss": 0.3556, "lr": 5.684718901523307e-05, "epoch": 2.1221719457013575, "percentage": 42.55, "elapsed_time": "6:22:30", "remaining_time": "8:36:32"}
235
- {"current_steps": 235, "total_steps": 550, "loss": 0.3596, "lr": 5.661660052007547e-05, "epoch": 2.1312217194570136, "percentage": 42.73, "elapsed_time": "6:24:07", "remaining_time": "8:34:53"}
236
- {"current_steps": 236, "total_steps": 550, "loss": 0.3549, "lr": 5.6385342710671815e-05, "epoch": 2.1402714932126696, "percentage": 42.91, "elapsed_time": "6:25:44", "remaining_time": "8:33:13"}
237
- {"current_steps": 237, "total_steps": 550, "loss": 0.3576, "lr": 5.6153424902053e-05, "epoch": 2.1493212669683257, "percentage": 43.09, "elapsed_time": "6:27:20", "remaining_time": "8:31:33"}
238
- {"current_steps": 238, "total_steps": 550, "loss": 0.3577, "lr": 5.59208564358345e-05, "epoch": 2.158371040723982, "percentage": 43.27, "elapsed_time": "6:28:57", "remaining_time": "8:29:54"}
239
- {"current_steps": 239, "total_steps": 550, "loss": 0.3656, "lr": 5.568764667984022e-05, "epoch": 2.167420814479638, "percentage": 43.45, "elapsed_time": "6:30:34", "remaining_time": "8:28:14"}
240
- {"current_steps": 240, "total_steps": 550, "loss": 0.3534, "lr": 5.5453805027725145e-05, "epoch": 2.176470588235294, "percentage": 43.64, "elapsed_time": "6:32:11", "remaining_time": "8:26:35"}
241
- {"current_steps": 241, "total_steps": 550, "loss": 0.3534, "lr": 5.521934089859692e-05, "epoch": 2.1855203619909505, "percentage": 43.82, "elapsed_time": "6:33:48", "remaining_time": "8:24:55"}
242
- {"current_steps": 242, "total_steps": 550, "loss": 0.3579, "lr": 5.4984263736636494e-05, "epoch": 2.1945701357466065, "percentage": 44.0, "elapsed_time": "6:35:25", "remaining_time": "8:23:16"}
243
- {"current_steps": 243, "total_steps": 550, "loss": 0.359, "lr": 5.4748583010717636e-05, "epoch": 2.2036199095022626, "percentage": 44.18, "elapsed_time": "6:37:02", "remaining_time": "8:21:36"}
244
- {"current_steps": 244, "total_steps": 550, "loss": 0.3627, "lr": 5.451230821402564e-05, "epoch": 2.2126696832579187, "percentage": 44.36, "elapsed_time": "6:38:39", "remaining_time": "8:19:57"}
245
- {"current_steps": 245, "total_steps": 550, "loss": 0.3558, "lr": 5.427544886367488e-05, "epoch": 2.2217194570135748, "percentage": 44.55, "elapsed_time": "6:40:16", "remaining_time": "8:18:18"}
246
- {"current_steps": 246, "total_steps": 550, "loss": 0.3577, "lr": 5.403801450032544e-05, "epoch": 2.230769230769231, "percentage": 44.73, "elapsed_time": "6:41:54", "remaining_time": "8:16:39"}
247
- {"current_steps": 247, "total_steps": 550, "loss": 0.3627, "lr": 5.380001468779883e-05, "epoch": 2.239819004524887, "percentage": 44.91, "elapsed_time": "6:43:31", "remaining_time": "8:15:00"}
248
- {"current_steps": 248, "total_steps": 550, "loss": 0.3583, "lr": 5.356145901269282e-05, "epoch": 2.248868778280543, "percentage": 45.09, "elapsed_time": "6:45:08", "remaining_time": "8:13:21"}
249
- {"current_steps": 249, "total_steps": 550, "loss": 0.3612, "lr": 5.3322357083995235e-05, "epoch": 2.257918552036199, "percentage": 45.27, "elapsed_time": "6:46:45", "remaining_time": "8:11:42"}
250
- {"current_steps": 250, "total_steps": 550, "loss": 0.354, "lr": 5.3082718532696874e-05, "epoch": 2.266968325791855, "percentage": 45.45, "elapsed_time": "6:48:23", "remaining_time": "8:10:03"}
251
- {"current_steps": 251, "total_steps": 550, "loss": 0.3528, "lr": 5.284255301140364e-05, "epoch": 2.276018099547511, "percentage": 45.64, "elapsed_time": "6:50:00", "remaining_time": "8:08:24"}
252
- {"current_steps": 252, "total_steps": 550, "loss": 0.3504, "lr": 5.2601870193947716e-05, "epoch": 2.2850678733031673, "percentage": 45.82, "elapsed_time": "6:51:37", "remaining_time": "8:06:46"}
253
- {"current_steps": 253, "total_steps": 550, "loss": 0.3527, "lr": 5.23606797749979e-05, "epoch": 2.2941176470588234, "percentage": 46.0, "elapsed_time": "6:53:14", "remaining_time": "8:05:07"}
254
- {"current_steps": 254, "total_steps": 550, "loss": 0.3545, "lr": 5.21189914696691e-05, "epoch": 2.3031674208144794, "percentage": 46.18, "elapsed_time": "6:54:52", "remaining_time": "8:03:28"}
255
- {"current_steps": 255, "total_steps": 550, "loss": 0.3525, "lr": 5.1876815013131e-05, "epoch": 2.3122171945701355, "percentage": 46.36, "elapsed_time": "6:56:29", "remaining_time": "8:01:49"}
256
- {"current_steps": 256, "total_steps": 550, "loss": 0.3561, "lr": 5.163416016021597e-05, "epoch": 2.321266968325792, "percentage": 46.55, "elapsed_time": "6:58:06", "remaining_time": "8:00:10"}
257
- {"current_steps": 257, "total_steps": 550, "loss": 0.3515, "lr": 5.1391036685026093e-05, "epoch": 2.330316742081448, "percentage": 46.73, "elapsed_time": "6:59:44", "remaining_time": "7:58:31"}
258
- {"current_steps": 258, "total_steps": 550, "loss": 0.3513, "lr": 5.114745438053952e-05, "epoch": 2.339366515837104, "percentage": 46.91, "elapsed_time": "7:01:21", "remaining_time": "7:56:52"}
259
- {"current_steps": 259, "total_steps": 550, "loss": 0.3557, "lr": 5.0903423058215925e-05, "epoch": 2.3484162895927603, "percentage": 47.09, "elapsed_time": "7:02:58", "remaining_time": "7:55:13"}
260
- {"current_steps": 260, "total_steps": 550, "loss": 0.3503, "lr": 5.06589525476014e-05, "epoch": 2.3574660633484164, "percentage": 47.27, "elapsed_time": "7:04:35", "remaining_time": "7:53:34"}
261
- {"current_steps": 261, "total_steps": 550, "loss": 0.3568, "lr": 5.0414052695932486e-05, "epoch": 2.3665158371040724, "percentage": 47.45, "elapsed_time": "7:06:12", "remaining_time": "7:51:55"}
262
- {"current_steps": 262, "total_steps": 550, "loss": 0.3537, "lr": 5.016873336773949e-05, "epoch": 2.3755656108597285, "percentage": 47.64, "elapsed_time": "7:07:50", "remaining_time": "7:50:17"}
263
- {"current_steps": 263, "total_steps": 550, "loss": 0.3587, "lr": 4.992300444444916e-05, "epoch": 2.3846153846153846, "percentage": 47.82, "elapsed_time": "7:09:27", "remaining_time": "7:48:39"}
264
- {"current_steps": 264, "total_steps": 550, "loss": 0.3544, "lr": 4.967687582398671e-05, "epoch": 2.3936651583710407, "percentage": 48.0, "elapsed_time": "7:11:05", "remaining_time": "7:47:00"}
265
- {"current_steps": 265, "total_steps": 550, "loss": 0.3553, "lr": 4.94303574203771e-05, "epoch": 2.4027149321266967, "percentage": 48.18, "elapsed_time": "7:12:42", "remaining_time": "7:45:21"}
266
- {"current_steps": 266, "total_steps": 550, "loss": 0.3516, "lr": 4.9183459163345644e-05, "epoch": 2.411764705882353, "percentage": 48.36, "elapsed_time": "7:14:19", "remaining_time": "7:43:42"}
267
- {"current_steps": 267, "total_steps": 550, "loss": 0.3539, "lr": 4.893619099791817e-05, "epoch": 2.420814479638009, "percentage": 48.55, "elapsed_time": "7:15:56", "remaining_time": "7:42:03"}
268
- {"current_steps": 268, "total_steps": 550, "loss": 0.3588, "lr": 4.868856288402032e-05, "epoch": 2.4298642533936654, "percentage": 48.73, "elapsed_time": "7:17:33", "remaining_time": "7:40:24"}
269
- {"current_steps": 269, "total_steps": 550, "loss": 0.3543, "lr": 4.8440584796076395e-05, "epoch": 2.4389140271493215, "percentage": 48.91, "elapsed_time": "7:19:10", "remaining_time": "7:38:46"}
270
- {"current_steps": 270, "total_steps": 550, "loss": 0.3601, "lr": 4.819226672260763e-05, "epoch": 2.4479638009049776, "percentage": 49.09, "elapsed_time": "7:20:48", "remaining_time": "7:37:07"}
271
- {"current_steps": 271, "total_steps": 550, "loss": 0.3587, "lr": 4.794361866582982e-05, "epoch": 2.4570135746606336, "percentage": 49.27, "elapsed_time": "7:22:25", "remaining_time": "7:35:28"}
272
- {"current_steps": 272, "total_steps": 550, "loss": 0.3558, "lr": 4.7694650641250446e-05, "epoch": 2.4660633484162897, "percentage": 49.45, "elapsed_time": "7:24:02", "remaining_time": "7:33:50"}
273
- {"current_steps": 273, "total_steps": 550, "loss": 0.3535, "lr": 4.7445372677265205e-05, "epoch": 2.475113122171946, "percentage": 49.64, "elapsed_time": "7:25:39", "remaining_time": "7:32:11"}
274
- {"current_steps": 274, "total_steps": 550, "loss": 0.3584, "lr": 4.719579481475416e-05, "epoch": 2.484162895927602, "percentage": 49.82, "elapsed_time": "7:27:16", "remaining_time": "7:30:32"}
275
- {"current_steps": 275, "total_steps": 550, "loss": 0.3555, "lr": 4.694592710667723e-05, "epoch": 2.493212669683258, "percentage": 50.0, "elapsed_time": "7:28:53", "remaining_time": "7:28:53"}
276
- {"current_steps": 276, "total_steps": 550, "loss": 0.3563, "lr": 4.6695779617669236e-05, "epoch": 2.502262443438914, "percentage": 50.18, "elapsed_time": "7:30:30", "remaining_time": "7:27:14"}
277
- {"current_steps": 277, "total_steps": 550, "loss": 0.359, "lr": 4.6445362423634574e-05, "epoch": 2.51131221719457, "percentage": 50.36, "elapsed_time": "7:32:07", "remaining_time": "7:25:36"}
278
- {"current_steps": 278, "total_steps": 550, "loss": 0.3524, "lr": 4.61946856113413e-05, "epoch": 2.520361990950226, "percentage": 50.55, "elapsed_time": "7:33:44", "remaining_time": "7:23:57"}
279
- {"current_steps": 279, "total_steps": 550, "loss": 0.3517, "lr": 4.594375927801487e-05, "epoch": 2.5294117647058822, "percentage": 50.73, "elapsed_time": "7:35:21", "remaining_time": "7:22:18"}
280
- {"current_steps": 280, "total_steps": 550, "loss": 0.3599, "lr": 4.5692593530931416e-05, "epoch": 2.5384615384615383, "percentage": 50.91, "elapsed_time": "7:36:58", "remaining_time": "7:20:39"}
281
- {"current_steps": 281, "total_steps": 550, "loss": 0.3557, "lr": 4.5441198487010574e-05, "epoch": 2.5475113122171944, "percentage": 51.09, "elapsed_time": "7:38:35", "remaining_time": "7:19:00"}
282
- {"current_steps": 282, "total_steps": 550, "loss": 0.351, "lr": 4.5189584272408074e-05, "epoch": 2.5565610859728505, "percentage": 51.27, "elapsed_time": "7:40:12", "remaining_time": "7:17:21"}
283
- {"current_steps": 283, "total_steps": 550, "loss": 0.3559, "lr": 4.493776102210779e-05, "epoch": 2.5656108597285066, "percentage": 51.45, "elapsed_time": "7:41:49", "remaining_time": "7:15:42"}
284
- {"current_steps": 284, "total_steps": 550, "loss": 0.3565, "lr": 4.468573887951354e-05, "epoch": 2.5746606334841626, "percentage": 51.64, "elapsed_time": "7:43:26", "remaining_time": "7:14:03"}
285
- {"current_steps": 285, "total_steps": 550, "loss": 0.3532, "lr": 4.4433527996040443e-05, "epoch": 2.583710407239819, "percentage": 51.82, "elapsed_time": "7:45:03", "remaining_time": "7:12:25"}
286
- {"current_steps": 286, "total_steps": 550, "loss": 0.3559, "lr": 4.418113853070614e-05, "epoch": 2.5927601809954752, "percentage": 52.0, "elapsed_time": "7:46:40", "remaining_time": "7:10:46"}
287
- {"current_steps": 287, "total_steps": 550, "loss": 0.3595, "lr": 4.392858064972149e-05, "epoch": 2.6018099547511313, "percentage": 52.18, "elapsed_time": "7:48:17", "remaining_time": "7:09:07"}
288
- {"current_steps": 288, "total_steps": 550, "loss": 0.354, "lr": 4.3675864526081106e-05, "epoch": 2.6108597285067874, "percentage": 52.36, "elapsed_time": "7:49:54", "remaining_time": "7:07:28"}
289
- {"current_steps": 289, "total_steps": 550, "loss": 0.3517, "lr": 4.34230003391536e-05, "epoch": 2.6199095022624435, "percentage": 52.55, "elapsed_time": "7:51:31", "remaining_time": "7:05:50"}
290
- {"current_steps": 290, "total_steps": 550, "loss": 0.3532, "lr": 4.316999827427154e-05, "epoch": 2.6289592760180995, "percentage": 52.73, "elapsed_time": "7:53:08", "remaining_time": "7:04:11"}
291
- {"current_steps": 291, "total_steps": 550, "loss": 0.3576, "lr": 4.2916868522321235e-05, "epoch": 2.6380090497737556, "percentage": 52.91, "elapsed_time": "7:54:45", "remaining_time": "7:02:32"}
292
- {"current_steps": 292, "total_steps": 550, "loss": 0.3591, "lr": 4.266362127933216e-05, "epoch": 2.6470588235294117, "percentage": 53.09, "elapsed_time": "7:56:22", "remaining_time": "7:00:54"}
293
- {"current_steps": 293, "total_steps": 550, "loss": 0.3528, "lr": 4.2410266746066345e-05, "epoch": 2.6561085972850678, "percentage": 53.27, "elapsed_time": "7:57:59", "remaining_time": "6:59:15"}
294
- {"current_steps": 294, "total_steps": 550, "loss": 0.359, "lr": 4.215681512760744e-05, "epoch": 2.665158371040724, "percentage": 53.45, "elapsed_time": "7:59:36", "remaining_time": "6:57:36"}
295
- {"current_steps": 295, "total_steps": 550, "loss": 0.3541, "lr": 4.19032766329497e-05, "epoch": 2.6742081447963804, "percentage": 53.64, "elapsed_time": "8:01:13", "remaining_time": "6:55:58"}
296
- {"current_steps": 296, "total_steps": 550, "loss": 0.3533, "lr": 4.1649661474586694e-05, "epoch": 2.6832579185520364, "percentage": 53.82, "elapsed_time": "8:02:50", "remaining_time": "6:54:19"}
297
- {"current_steps": 297, "total_steps": 550, "loss": 0.3597, "lr": 4.139597986810005e-05, "epoch": 2.6923076923076925, "percentage": 54.0, "elapsed_time": "8:04:27", "remaining_time": "6:52:40"}
298
- {"current_steps": 298, "total_steps": 550, "loss": 0.3506, "lr": 4.114224203174785e-05, "epoch": 2.7013574660633486, "percentage": 54.18, "elapsed_time": "8:06:04", "remaining_time": "6:51:02"}
299
- {"current_steps": 299, "total_steps": 550, "loss": 0.3556, "lr": 4.0888458186053184e-05, "epoch": 2.7104072398190047, "percentage": 54.36, "elapsed_time": "8:07:41", "remaining_time": "6:49:23"}
300
- {"current_steps": 300, "total_steps": 550, "loss": 0.3529, "lr": 4.063463855339232e-05, "epoch": 2.7194570135746607, "percentage": 54.55, "elapsed_time": "8:09:17", "remaining_time": "6:47:44"}
301
- {"current_steps": 301, "total_steps": 550, "loss": 0.3482, "lr": 4.0380793357583076e-05, "epoch": 2.728506787330317, "percentage": 54.73, "elapsed_time": "8:10:54", "remaining_time": "6:46:06"}
302
- {"current_steps": 302, "total_steps": 550, "loss": 0.3581, "lr": 4.012693282347289e-05, "epoch": 2.737556561085973, "percentage": 54.91, "elapsed_time": "8:12:31", "remaining_time": "6:44:27"}
303
- {"current_steps": 303, "total_steps": 550, "loss": 0.3568, "lr": 3.9873067176527114e-05, "epoch": 2.746606334841629, "percentage": 55.09, "elapsed_time": "8:14:09", "remaining_time": "6:42:49"}
304
- {"current_steps": 304, "total_steps": 550, "loss": 0.3548, "lr": 3.961920664241694e-05, "epoch": 2.755656108597285, "percentage": 55.27, "elapsed_time": "8:15:46", "remaining_time": "6:41:10"}
305
- {"current_steps": 305, "total_steps": 550, "loss": 0.3547, "lr": 3.9365361446607684e-05, "epoch": 2.764705882352941, "percentage": 55.45, "elapsed_time": "8:17:23", "remaining_time": "6:39:32"}
306
- {"current_steps": 306, "total_steps": 550, "loss": 0.3602, "lr": 3.911154181394682e-05, "epoch": 2.773755656108597, "percentage": 55.64, "elapsed_time": "8:19:00", "remaining_time": "6:37:53"}
307
- {"current_steps": 307, "total_steps": 550, "loss": 0.3562, "lr": 3.885775796825216e-05, "epoch": 2.7828054298642533, "percentage": 55.82, "elapsed_time": "8:20:37", "remaining_time": "6:36:15"}
308
- {"current_steps": 308, "total_steps": 550, "loss": 0.3479, "lr": 3.860402013189998e-05, "epoch": 2.7918552036199094, "percentage": 56.0, "elapsed_time": "8:22:14", "remaining_time": "6:34:36"}
309
- {"current_steps": 309, "total_steps": 550, "loss": 0.3572, "lr": 3.835033852541332e-05, "epoch": 2.8009049773755654, "percentage": 56.18, "elapsed_time": "8:23:51", "remaining_time": "6:32:58"}
310
- {"current_steps": 310, "total_steps": 550, "loss": 0.3519, "lr": 3.809672336705031e-05, "epoch": 2.8099547511312215, "percentage": 56.36, "elapsed_time": "8:25:28", "remaining_time": "6:31:19"}
311
- {"current_steps": 311, "total_steps": 550, "loss": 0.3559, "lr": 3.784318487239257e-05, "epoch": 2.8190045248868776, "percentage": 56.55, "elapsed_time": "8:27:05", "remaining_time": "6:29:41"}
312
- {"current_steps": 312, "total_steps": 550, "loss": 0.3504, "lr": 3.758973325393367e-05, "epoch": 2.8280542986425337, "percentage": 56.73, "elapsed_time": "8:28:42", "remaining_time": "6:28:02"}
313
- {"current_steps": 313, "total_steps": 550, "loss": 0.3569, "lr": 3.7336378720667846e-05, "epoch": 2.83710407239819, "percentage": 56.91, "elapsed_time": "8:30:18", "remaining_time": "6:26:24"}
314
- {"current_steps": 314, "total_steps": 550, "loss": 0.3559, "lr": 3.708313147767878e-05, "epoch": 2.8461538461538463, "percentage": 57.09, "elapsed_time": "8:31:55", "remaining_time": "6:24:45"}
315
- {"current_steps": 315, "total_steps": 550, "loss": 0.3516, "lr": 3.683000172572846e-05, "epoch": 2.8552036199095023, "percentage": 57.27, "elapsed_time": "8:33:32", "remaining_time": "6:23:07"}
316
- {"current_steps": 316, "total_steps": 550, "loss": 0.3575, "lr": 3.657699966084642e-05, "epoch": 2.8642533936651584, "percentage": 57.45, "elapsed_time": "8:35:09", "remaining_time": "6:21:28"}
317
- {"current_steps": 317, "total_steps": 550, "loss": 0.3579, "lr": 3.632413547391891e-05, "epoch": 2.8733031674208145, "percentage": 57.64, "elapsed_time": "8:36:46", "remaining_time": "6:19:50"}
318
- {"current_steps": 318, "total_steps": 550, "loss": 0.3486, "lr": 3.6071419350278515e-05, "epoch": 2.8823529411764706, "percentage": 57.82, "elapsed_time": "8:38:23", "remaining_time": "6:18:12"}
319
- {"current_steps": 319, "total_steps": 550, "loss": 0.3468, "lr": 3.581886146929387e-05, "epoch": 2.8914027149321266, "percentage": 58.0, "elapsed_time": "8:40:00", "remaining_time": "6:16:33"}
320
- {"current_steps": 320, "total_steps": 550, "loss": 0.3526, "lr": 3.556647200395956e-05, "epoch": 2.9004524886877827, "percentage": 58.18, "elapsed_time": "8:41:37", "remaining_time": "6:14:55"}
321
- {"current_steps": 321, "total_steps": 550, "loss": 0.3498, "lr": 3.5314261120486474e-05, "epoch": 2.909502262443439, "percentage": 58.36, "elapsed_time": "8:43:14", "remaining_time": "6:13:16"}
322
- {"current_steps": 322, "total_steps": 550, "loss": 0.353, "lr": 3.5062238977892214e-05, "epoch": 2.918552036199095, "percentage": 58.55, "elapsed_time": "8:44:51", "remaining_time": "6:11:38"}
323
- {"current_steps": 323, "total_steps": 550, "loss": 0.3551, "lr": 3.481041572759193e-05, "epoch": 2.9276018099547514, "percentage": 58.73, "elapsed_time": "8:46:29", "remaining_time": "6:10:00"}
324
- {"current_steps": 324, "total_steps": 550, "loss": 0.3555, "lr": 3.4558801512989446e-05, "epoch": 2.9366515837104075, "percentage": 58.91, "elapsed_time": "8:48:06", "remaining_time": "6:08:22"}
325
- {"current_steps": 325, "total_steps": 550, "loss": 0.3553, "lr": 3.4307406469068604e-05, "epoch": 2.9457013574660635, "percentage": 59.09, "elapsed_time": "8:49:43", "remaining_time": "6:06:43"}
326
- {"current_steps": 326, "total_steps": 550, "loss": 0.3574, "lr": 3.405624072198514e-05, "epoch": 2.9547511312217196, "percentage": 59.27, "elapsed_time": "8:51:20", "remaining_time": "6:05:05"}
327
- {"current_steps": 327, "total_steps": 550, "loss": 0.3517, "lr": 3.3805314388658714e-05, "epoch": 2.9638009049773757, "percentage": 59.45, "elapsed_time": "8:52:57", "remaining_time": "6:03:27"}
328
- {"current_steps": 328, "total_steps": 550, "loss": 0.3449, "lr": 3.3554637576365446e-05, "epoch": 2.9728506787330318, "percentage": 59.64, "elapsed_time": "8:54:34", "remaining_time": "6:01:49"}
329
- {"current_steps": 329, "total_steps": 550, "loss": 0.3514, "lr": 3.330422038233078e-05, "epoch": 2.981900452488688, "percentage": 59.82, "elapsed_time": "8:56:11", "remaining_time": "6:00:10"}
330
- {"current_steps": 330, "total_steps": 550, "loss": 0.3508, "lr": 3.305407289332279e-05, "epoch": 2.990950226244344, "percentage": 60.0, "elapsed_time": "8:57:48", "remaining_time": "5:58:32"}
331
- {"current_steps": 331, "total_steps": 550, "loss": 0.6016, "lr": 3.280420518524585e-05, "epoch": 3.002262443438914, "percentage": 60.18, "elapsed_time": "9:01:00", "remaining_time": "5:57:56"}
332
- {"current_steps": 332, "total_steps": 550, "loss": 0.3304, "lr": 3.25546273227348e-05, "epoch": 3.01131221719457, "percentage": 60.36, "elapsed_time": "9:02:36", "remaining_time": "5:56:17"}
 
1
+ {"current_steps": 1, "total_steps": 550, "loss": 0.8197, "lr": 1.4545454545454546e-06, "epoch": 0.00904977375565611, "percentage": 0.18, "elapsed_time": "0:01:05", "remaining_time": "10:02:17"}
2
+ {"current_steps": 2, "total_steps": 550, "loss": 0.8224, "lr": 2.9090909090909093e-06, "epoch": 0.01809954751131222, "percentage": 0.36, "elapsed_time": "0:01:57", "remaining_time": "8:57:27"}
3
+ {"current_steps": 3, "total_steps": 550, "loss": 0.8034, "lr": 4.363636363636364e-06, "epoch": 0.027149321266968326, "percentage": 0.55, "elapsed_time": "0:02:48", "remaining_time": "8:31:57"}
4
+ {"current_steps": 4, "total_steps": 550, "loss": 0.7741, "lr": 5.8181818181818185e-06, "epoch": 0.03619909502262444, "percentage": 0.73, "elapsed_time": "0:03:39", "remaining_time": "8:19:57"}
5
+ {"current_steps": 5, "total_steps": 550, "loss": 0.7292, "lr": 7.272727272727273e-06, "epoch": 0.04524886877828054, "percentage": 0.91, "elapsed_time": "0:04:31", "remaining_time": "8:12:41"}
6
+ {"current_steps": 6, "total_steps": 550, "loss": 0.7138, "lr": 8.727272727272728e-06, "epoch": 0.05429864253393665, "percentage": 1.09, "elapsed_time": "0:05:22", "remaining_time": "8:07:31"}
7
+ {"current_steps": 7, "total_steps": 550, "loss": 0.732, "lr": 1.0181818181818182e-05, "epoch": 0.06334841628959276, "percentage": 1.27, "elapsed_time": "0:06:14", "remaining_time": "8:03:46"}
8
+ {"current_steps": 8, "total_steps": 550, "loss": 0.723, "lr": 1.1636363636363637e-05, "epoch": 0.07239819004524888, "percentage": 1.45, "elapsed_time": "0:07:05", "remaining_time": "8:00:35"}
9
+ {"current_steps": 9, "total_steps": 550, "loss": 0.7228, "lr": 1.3090909090909092e-05, "epoch": 0.08144796380090498, "percentage": 1.64, "elapsed_time": "0:07:57", "remaining_time": "7:58:14"}
10
+ {"current_steps": 10, "total_steps": 550, "loss": 0.7034, "lr": 1.4545454545454546e-05, "epoch": 0.09049773755656108, "percentage": 1.82, "elapsed_time": "0:08:48", "remaining_time": "7:55:51"}
11
+ {"current_steps": 11, "total_steps": 550, "loss": 0.6666, "lr": 1.6000000000000003e-05, "epoch": 0.09954751131221719, "percentage": 2.0, "elapsed_time": "0:09:39", "remaining_time": "7:53:35"}
12
+ {"current_steps": 12, "total_steps": 550, "loss": 0.6361, "lr": 1.7454545454545456e-05, "epoch": 0.1085972850678733, "percentage": 2.18, "elapsed_time": "0:10:31", "remaining_time": "7:52:05"}
13
+ {"current_steps": 13, "total_steps": 550, "loss": 0.633, "lr": 1.8909090909090912e-05, "epoch": 0.11764705882352941, "percentage": 2.36, "elapsed_time": "0:11:23", "remaining_time": "7:50:32"}
14
+ {"current_steps": 14, "total_steps": 550, "loss": 0.6039, "lr": 2.0363636363636365e-05, "epoch": 0.12669683257918551, "percentage": 2.55, "elapsed_time": "0:12:14", "remaining_time": "7:48:59"}
15
+ {"current_steps": 15, "total_steps": 550, "loss": 0.5948, "lr": 2.1818181818181818e-05, "epoch": 0.13574660633484162, "percentage": 2.73, "elapsed_time": "0:13:06", "remaining_time": "7:47:22"}
16
+ {"current_steps": 16, "total_steps": 550, "loss": 0.581, "lr": 2.3272727272727274e-05, "epoch": 0.14479638009049775, "percentage": 2.91, "elapsed_time": "0:13:57", "remaining_time": "7:46:01"}
17
+ {"current_steps": 17, "total_steps": 550, "loss": 0.5777, "lr": 2.4727272727272727e-05, "epoch": 0.15384615384615385, "percentage": 3.09, "elapsed_time": "0:14:49", "remaining_time": "7:44:57"}
18
+ {"current_steps": 18, "total_steps": 550, "loss": 0.567, "lr": 2.6181818181818183e-05, "epoch": 0.16289592760180996, "percentage": 3.27, "elapsed_time": "0:15:41", "remaining_time": "7:43:48"}
19
+ {"current_steps": 19, "total_steps": 550, "loss": 0.5617, "lr": 2.763636363636364e-05, "epoch": 0.17194570135746606, "percentage": 3.45, "elapsed_time": "0:16:33", "remaining_time": "7:42:44"}
20
+ {"current_steps": 20, "total_steps": 550, "loss": 0.5546, "lr": 2.9090909090909093e-05, "epoch": 0.18099547511312217, "percentage": 3.64, "elapsed_time": "0:17:24", "remaining_time": "7:41:29"}
21
+ {"current_steps": 21, "total_steps": 550, "loss": 0.5388, "lr": 3.054545454545455e-05, "epoch": 0.19004524886877827, "percentage": 3.82, "elapsed_time": "0:18:18", "remaining_time": "7:41:05"}
22
+ {"current_steps": 22, "total_steps": 550, "loss": 0.5357, "lr": 3.2000000000000005e-05, "epoch": 0.19909502262443438, "percentage": 4.0, "elapsed_time": "0:19:10", "remaining_time": "7:40:12"}
23
+ {"current_steps": 23, "total_steps": 550, "loss": 0.537, "lr": 3.345454545454546e-05, "epoch": 0.2081447963800905, "percentage": 4.18, "elapsed_time": "0:20:02", "remaining_time": "7:39:09"}
24
+ {"current_steps": 24, "total_steps": 550, "loss": 0.5304, "lr": 3.490909090909091e-05, "epoch": 0.2171945701357466, "percentage": 4.36, "elapsed_time": "0:20:53", "remaining_time": "7:37:59"}
25
+ {"current_steps": 25, "total_steps": 550, "loss": 0.5316, "lr": 3.6363636363636364e-05, "epoch": 0.22624434389140272, "percentage": 4.55, "elapsed_time": "0:21:46", "remaining_time": "7:37:12"}
26
+ {"current_steps": 1, "total_steps": 550, "loss": 0.8197, "lr": 1.4545454545454546e-06, "epoch": 0.00904977375565611, "percentage": 0.18, "elapsed_time": "0:01:04", "remaining_time": "9:46:21"}
27
+ {"current_steps": 2, "total_steps": 550, "loss": 0.8224, "lr": 2.9090909090909093e-06, "epoch": 0.01809954751131222, "percentage": 0.36, "elapsed_time": "0:01:54", "remaining_time": "8:42:21"}
28
+ {"current_steps": 3, "total_steps": 550, "loss": 0.8034, "lr": 4.363636363636364e-06, "epoch": 0.027149321266968326, "percentage": 0.55, "elapsed_time": "0:02:43", "remaining_time": "8:17:36"}
29
+ {"current_steps": 4, "total_steps": 550, "loss": 0.774, "lr": 5.8181818181818185e-06, "epoch": 0.03619909502262444, "percentage": 0.73, "elapsed_time": "0:03:32", "remaining_time": "8:04:32"}
30
+ {"current_steps": 5, "total_steps": 550, "loss": 0.7292, "lr": 7.272727272727273e-06, "epoch": 0.04524886877828054, "percentage": 0.91, "elapsed_time": "0:04:22", "remaining_time": "7:56:51"}
31
+ {"current_steps": 6, "total_steps": 550, "loss": 0.7138, "lr": 8.727272727272728e-06, "epoch": 0.05429864253393665, "percentage": 1.09, "elapsed_time": "0:05:12", "remaining_time": "7:51:34"}
32
+ {"current_steps": 7, "total_steps": 550, "loss": 0.7317, "lr": 1.0181818181818182e-05, "epoch": 0.06334841628959276, "percentage": 1.27, "elapsed_time": "0:06:01", "remaining_time": "7:46:57"}
33
+ {"current_steps": 8, "total_steps": 550, "loss": 0.7227, "lr": 1.1636363636363637e-05, "epoch": 0.07239819004524888, "percentage": 1.45, "elapsed_time": "0:06:50", "remaining_time": "7:43:10"}
34
+ {"current_steps": 9, "total_steps": 550, "loss": 0.7225, "lr": 1.3090909090909092e-05, "epoch": 0.08144796380090498, "percentage": 1.64, "elapsed_time": "0:07:39", "remaining_time": "7:40:26"}
35
+ {"current_steps": 10, "total_steps": 550, "loss": 0.7032, "lr": 1.4545454545454546e-05, "epoch": 0.09049773755656108, "percentage": 1.82, "elapsed_time": "0:08:28", "remaining_time": "7:37:52"}
36
+ {"current_steps": 11, "total_steps": 550, "loss": 0.6662, "lr": 1.6000000000000003e-05, "epoch": 0.09954751131221719, "percentage": 2.0, "elapsed_time": "0:09:17", "remaining_time": "7:35:32"}
37
+ {"current_steps": 12, "total_steps": 550, "loss": 0.6361, "lr": 1.7454545454545456e-05, "epoch": 0.1085972850678733, "percentage": 2.18, "elapsed_time": "0:10:07", "remaining_time": "7:34:04"}
38
+ {"current_steps": 13, "total_steps": 550, "loss": 0.6328, "lr": 1.8909090909090912e-05, "epoch": 0.11764705882352941, "percentage": 2.36, "elapsed_time": "0:10:56", "remaining_time": "7:32:06"}
39
+ {"current_steps": 14, "total_steps": 550, "loss": 0.6038, "lr": 2.0363636363636365e-05, "epoch": 0.12669683257918551, "percentage": 2.55, "elapsed_time": "0:11:45", "remaining_time": "7:30:13"}
40
+ {"current_steps": 15, "total_steps": 550, "loss": 0.5949, "lr": 2.1818181818181818e-05, "epoch": 0.13574660633484162, "percentage": 2.73, "elapsed_time": "0:12:34", "remaining_time": "7:28:25"}
41
+ {"current_steps": 16, "total_steps": 550, "loss": 0.5812, "lr": 2.3272727272727274e-05, "epoch": 0.14479638009049775, "percentage": 2.91, "elapsed_time": "0:13:23", "remaining_time": "7:26:56"}
42
+ {"current_steps": 17, "total_steps": 550, "loss": 0.5777, "lr": 2.4727272727272727e-05, "epoch": 0.15384615384615385, "percentage": 3.09, "elapsed_time": "0:14:12", "remaining_time": "7:25:32"}
43
+ {"current_steps": 18, "total_steps": 550, "loss": 0.5671, "lr": 2.6181818181818183e-05, "epoch": 0.16289592760180996, "percentage": 3.27, "elapsed_time": "0:15:02", "remaining_time": "7:24:23"}
44
+ {"current_steps": 19, "total_steps": 550, "loss": 0.5617, "lr": 2.763636363636364e-05, "epoch": 0.17194570135746606, "percentage": 3.45, "elapsed_time": "0:15:51", "remaining_time": "7:23:20"}
45
+ {"current_steps": 20, "total_steps": 550, "loss": 0.5547, "lr": 2.9090909090909093e-05, "epoch": 0.18099547511312217, "percentage": 3.64, "elapsed_time": "0:16:41", "remaining_time": "7:22:08"}
46
+ {"current_steps": 21, "total_steps": 550, "loss": 0.5392, "lr": 3.054545454545455e-05, "epoch": 0.19004524886877827, "percentage": 3.82, "elapsed_time": "0:17:31", "remaining_time": "7:21:31"}
47
+ {"current_steps": 22, "total_steps": 550, "loss": 0.5373, "lr": 3.2000000000000005e-05, "epoch": 0.19909502262443438, "percentage": 4.0, "elapsed_time": "0:18:20", "remaining_time": "7:20:10"}
48
+ {"current_steps": 23, "total_steps": 550, "loss": 0.534, "lr": 3.345454545454546e-05, "epoch": 0.2081447963800905, "percentage": 4.18, "elapsed_time": "0:19:09", "remaining_time": "7:18:57"}
49
+ {"current_steps": 24, "total_steps": 550, "loss": 0.5286, "lr": 3.490909090909091e-05, "epoch": 0.2171945701357466, "percentage": 4.36, "elapsed_time": "0:19:58", "remaining_time": "7:17:52"}
50
+ {"current_steps": 25, "total_steps": 550, "loss": 0.5301, "lr": 3.6363636363636364e-05, "epoch": 0.22624434389140272, "percentage": 4.55, "elapsed_time": "0:20:47", "remaining_time": "7:16:38"}
51
+ {"current_steps": 26, "total_steps": 550, "loss": 0.5214, "lr": 3.7818181818181824e-05, "epoch": 0.23529411764705882, "percentage": 4.73, "elapsed_time": "0:21:37", "remaining_time": "7:15:42"}
52
+ {"current_steps": 27, "total_steps": 550, "loss": 0.5115, "lr": 3.927272727272728e-05, "epoch": 0.24434389140271492, "percentage": 4.91, "elapsed_time": "0:22:26", "remaining_time": "7:14:36"}
53
+ {"current_steps": 28, "total_steps": 550, "loss": 0.5095, "lr": 4.072727272727273e-05, "epoch": 0.25339366515837103, "percentage": 5.09, "elapsed_time": "0:23:15", "remaining_time": "7:13:36"}
54
+ {"current_steps": 29, "total_steps": 550, "loss": 0.5087, "lr": 4.218181818181818e-05, "epoch": 0.26244343891402716, "percentage": 5.27, "elapsed_time": "0:24:04", "remaining_time": "7:12:31"}
55
+ {"current_steps": 30, "total_steps": 550, "loss": 0.5111, "lr": 4.3636363636363636e-05, "epoch": 0.27149321266968324, "percentage": 5.45, "elapsed_time": "0:24:54", "remaining_time": "7:11:38"}
56
+ {"current_steps": 31, "total_steps": 550, "loss": 0.5072, "lr": 4.509090909090909e-05, "epoch": 0.28054298642533937, "percentage": 5.64, "elapsed_time": "0:25:43", "remaining_time": "7:10:33"}
57
+ {"current_steps": 32, "total_steps": 550, "loss": 0.5046, "lr": 4.654545454545455e-05, "epoch": 0.2895927601809955, "percentage": 5.82, "elapsed_time": "0:26:32", "remaining_time": "7:09:34"}
58
+ {"current_steps": 33, "total_steps": 550, "loss": 0.503, "lr": 4.8e-05, "epoch": 0.2986425339366516, "percentage": 6.0, "elapsed_time": "0:27:21", "remaining_time": "7:08:35"}
59
+ {"current_steps": 34, "total_steps": 550, "loss": 0.5011, "lr": 4.9454545454545454e-05, "epoch": 0.3076923076923077, "percentage": 6.18, "elapsed_time": "0:28:10", "remaining_time": "7:07:35"}
60
+ {"current_steps": 35, "total_steps": 550, "loss": 0.4895, "lr": 5.0909090909090914e-05, "epoch": 0.3167420814479638, "percentage": 6.36, "elapsed_time": "0:28:59", "remaining_time": "7:06:36"}
61
+ {"current_steps": 36, "total_steps": 550, "loss": 0.4956, "lr": 5.236363636363637e-05, "epoch": 0.3257918552036199, "percentage": 6.55, "elapsed_time": "0:29:48", "remaining_time": "7:05:34"}
62
+ {"current_steps": 37, "total_steps": 550, "loss": 0.4887, "lr": 5.381818181818182e-05, "epoch": 0.334841628959276, "percentage": 6.73, "elapsed_time": "0:30:37", "remaining_time": "7:04:43"}
63
+ {"current_steps": 38, "total_steps": 550, "loss": 0.487, "lr": 5.527272727272728e-05, "epoch": 0.3438914027149321, "percentage": 6.91, "elapsed_time": "0:31:26", "remaining_time": "7:03:39"}
64
+ {"current_steps": 39, "total_steps": 550, "loss": 0.4854, "lr": 5.672727272727273e-05, "epoch": 0.35294117647058826, "percentage": 7.09, "elapsed_time": "0:32:15", "remaining_time": "7:02:43"}
65
+ {"current_steps": 40, "total_steps": 550, "loss": 0.4943, "lr": 5.8181818181818185e-05, "epoch": 0.36199095022624433, "percentage": 7.27, "elapsed_time": "0:33:05", "remaining_time": "7:01:49"}
66
+ {"current_steps": 41, "total_steps": 550, "loss": 0.4846, "lr": 5.9636363636363645e-05, "epoch": 0.37104072398190047, "percentage": 7.45, "elapsed_time": "0:33:54", "remaining_time": "7:00:57"}
67
+ {"current_steps": 42, "total_steps": 550, "loss": 0.4765, "lr": 6.10909090909091e-05, "epoch": 0.38009049773755654, "percentage": 7.64, "elapsed_time": "0:34:43", "remaining_time": "7:00:06"}
68
+ {"current_steps": 43, "total_steps": 550, "loss": 0.4865, "lr": 6.254545454545456e-05, "epoch": 0.3891402714932127, "percentage": 7.82, "elapsed_time": "0:35:32", "remaining_time": "6:59:09"}
69
+ {"current_steps": 44, "total_steps": 550, "loss": 0.4858, "lr": 6.400000000000001e-05, "epoch": 0.39819004524886875, "percentage": 8.0, "elapsed_time": "0:36:21", "remaining_time": "6:58:12"}
70
+ {"current_steps": 45, "total_steps": 550, "loss": 0.4949, "lr": 6.545454545454546e-05, "epoch": 0.4072398190045249, "percentage": 8.18, "elapsed_time": "0:37:10", "remaining_time": "6:57:14"}
71
+ {"current_steps": 46, "total_steps": 550, "loss": 0.4799, "lr": 6.690909090909092e-05, "epoch": 0.416289592760181, "percentage": 8.36, "elapsed_time": "0:37:59", "remaining_time": "6:56:17"}
72
+ {"current_steps": 47, "total_steps": 550, "loss": 0.4779, "lr": 6.836363636363637e-05, "epoch": 0.4253393665158371, "percentage": 8.55, "elapsed_time": "0:38:48", "remaining_time": "6:55:19"}
73
+ {"current_steps": 48, "total_steps": 550, "loss": 0.4776, "lr": 6.981818181818182e-05, "epoch": 0.4343891402714932, "percentage": 8.73, "elapsed_time": "0:39:37", "remaining_time": "6:54:20"}
74
+ {"current_steps": 49, "total_steps": 550, "loss": 0.4731, "lr": 7.127272727272728e-05, "epoch": 0.4434389140271493, "percentage": 8.91, "elapsed_time": "0:40:25", "remaining_time": "6:53:23"}
75
+ {"current_steps": 50, "total_steps": 550, "loss": 0.4702, "lr": 7.272727272727273e-05, "epoch": 0.45248868778280543, "percentage": 9.09, "elapsed_time": "0:41:14", "remaining_time": "6:52:28"}
76
+ {"current_steps": 51, "total_steps": 550, "loss": 0.4853, "lr": 7.418181818181818e-05, "epoch": 0.46153846153846156, "percentage": 9.27, "elapsed_time": "0:42:03", "remaining_time": "6:51:34"}
77
+ {"current_steps": 52, "total_steps": 550, "loss": 0.4663, "lr": 7.563636363636365e-05, "epoch": 0.47058823529411764, "percentage": 9.45, "elapsed_time": "0:42:52", "remaining_time": "6:50:38"}
78
+ {"current_steps": 53, "total_steps": 550, "loss": 0.4819, "lr": 7.70909090909091e-05, "epoch": 0.4796380090497738, "percentage": 9.64, "elapsed_time": "0:43:41", "remaining_time": "6:49:41"}
79
+ {"current_steps": 54, "total_steps": 550, "loss": 0.4765, "lr": 7.854545454545455e-05, "epoch": 0.48868778280542985, "percentage": 9.82, "elapsed_time": "0:44:30", "remaining_time": "6:48:49"}
80
+ {"current_steps": 55, "total_steps": 550, "loss": 0.4764, "lr": 8e-05, "epoch": 0.497737556561086, "percentage": 10.0, "elapsed_time": "0:45:19", "remaining_time": "6:47:52"}
81
+ {"current_steps": 56, "total_steps": 550, "loss": 0.4853, "lr": 7.999919440291627e-05, "epoch": 0.5067873303167421, "percentage": 10.18, "elapsed_time": "0:46:08", "remaining_time": "6:46:58"}
82
+ {"current_steps": 57, "total_steps": 550, "loss": 0.4766, "lr": 7.999677764411438e-05, "epoch": 0.5158371040723982, "percentage": 10.36, "elapsed_time": "0:46:57", "remaining_time": "6:46:05"}
83
+ {"current_steps": 58, "total_steps": 550, "loss": 0.4697, "lr": 7.999274982094104e-05, "epoch": 0.5248868778280543, "percentage": 10.55, "elapsed_time": "0:47:46", "remaining_time": "6:45:14"}
84
+ {"current_steps": 59, "total_steps": 550, "loss": 0.4753, "lr": 7.998711109563637e-05, "epoch": 0.5339366515837104, "percentage": 10.73, "elapsed_time": "0:48:35", "remaining_time": "6:44:20"}
85
+ {"current_steps": 60, "total_steps": 550, "loss": 0.4646, "lr": 7.997986169532741e-05, "epoch": 0.5429864253393665, "percentage": 10.91, "elapsed_time": "0:49:24", "remaining_time": "6:43:26"}
86
+ {"current_steps": 61, "total_steps": 550, "loss": 0.4719, "lr": 7.997100191201896e-05, "epoch": 0.5520361990950227, "percentage": 11.09, "elapsed_time": "0:50:13", "remaining_time": "6:42:34"}
87
+ {"current_steps": 62, "total_steps": 550, "loss": 0.4597, "lr": 7.996053210258176e-05, "epoch": 0.5610859728506787, "percentage": 11.27, "elapsed_time": "0:51:01", "remaining_time": "6:41:39"}
88
+ {"current_steps": 63, "total_steps": 550, "loss": 0.4631, "lr": 7.994845268873825e-05, "epoch": 0.5701357466063348, "percentage": 11.45, "elapsed_time": "0:51:50", "remaining_time": "6:40:46"}
89
+ {"current_steps": 64, "total_steps": 550, "loss": 0.4557, "lr": 7.993476415704543e-05, "epoch": 0.579185520361991, "percentage": 11.64, "elapsed_time": "0:52:39", "remaining_time": "6:39:50"}
90
+ {"current_steps": 65, "total_steps": 550, "loss": 0.4601, "lr": 7.991946705887539e-05, "epoch": 0.5882352941176471, "percentage": 11.82, "elapsed_time": "0:53:28", "remaining_time": "6:39:00"}
91
+ {"current_steps": 66, "total_steps": 550, "loss": 0.4616, "lr": 7.990256201039297e-05, "epoch": 0.5972850678733032, "percentage": 12.0, "elapsed_time": "0:54:17", "remaining_time": "6:38:10"}
92
+ {"current_steps": 67, "total_steps": 550, "loss": 0.4536, "lr": 7.98840496925311e-05, "epoch": 0.6063348416289592, "percentage": 12.18, "elapsed_time": "0:55:07", "remaining_time": "6:37:24"}
93
+ {"current_steps": 68, "total_steps": 550, "loss": 0.4483, "lr": 7.986393085096324e-05, "epoch": 0.6153846153846154, "percentage": 12.36, "elapsed_time": "0:55:56", "remaining_time": "6:36:33"}
94
+ {"current_steps": 69, "total_steps": 550, "loss": 0.4508, "lr": 7.984220629607336e-05, "epoch": 0.6244343891402715, "percentage": 12.55, "elapsed_time": "0:56:45", "remaining_time": "6:35:40"}
95
+ {"current_steps": 70, "total_steps": 550, "loss": 0.4494, "lr": 7.981887690292339e-05, "epoch": 0.6334841628959276, "percentage": 12.73, "elapsed_time": "0:57:34", "remaining_time": "6:34:50"}
96
+ {"current_steps": 71, "total_steps": 550, "loss": 0.4519, "lr": 7.979394361121789e-05, "epoch": 0.6425339366515838, "percentage": 12.91, "elapsed_time": "0:58:23", "remaining_time": "6:33:59"}
97
+ {"current_steps": 72, "total_steps": 550, "loss": 0.4555, "lr": 7.97674074252662e-05, "epoch": 0.6515837104072398, "percentage": 13.09, "elapsed_time": "0:59:12", "remaining_time": "6:33:06"}
98
+ {"current_steps": 73, "total_steps": 550, "loss": 0.4521, "lr": 7.9739269413942e-05, "epoch": 0.6606334841628959, "percentage": 13.27, "elapsed_time": "1:00:01", "remaining_time": "6:32:12"}
99
+ {"current_steps": 74, "total_steps": 550, "loss": 0.4531, "lr": 7.970953071064036e-05, "epoch": 0.669683257918552, "percentage": 13.45, "elapsed_time": "1:00:50", "remaining_time": "6:31:19"}
100
+ {"current_steps": 75, "total_steps": 550, "loss": 0.4705, "lr": 7.967819251323182e-05, "epoch": 0.6787330316742082, "percentage": 13.64, "elapsed_time": "1:01:39", "remaining_time": "6:30:29"}
101
+ {"current_steps": 76, "total_steps": 550, "loss": 0.4488, "lr": 7.964525608401445e-05, "epoch": 0.6877828054298643, "percentage": 13.82, "elapsed_time": "1:02:28", "remaining_time": "6:29:38"}
102
+ {"current_steps": 77, "total_steps": 550, "loss": 0.4551, "lr": 7.961072274966282e-05, "epoch": 0.6968325791855203, "percentage": 14.0, "elapsed_time": "1:03:17", "remaining_time": "6:28:44"}
103
+ {"current_steps": 78, "total_steps": 550, "loss": 0.4457, "lr": 7.957459390117458e-05, "epoch": 0.7058823529411765, "percentage": 14.18, "elapsed_time": "1:04:05", "remaining_time": "6:27:52"}
104
+ {"current_steps": 79, "total_steps": 550, "loss": 0.454, "lr": 7.95368709938145e-05, "epoch": 0.7149321266968326, "percentage": 14.36, "elapsed_time": "1:04:55", "remaining_time": "6:27:02"}
105
+ {"current_steps": 80, "total_steps": 550, "loss": 0.441, "lr": 7.949755554705577e-05, "epoch": 0.7239819004524887, "percentage": 14.55, "elapsed_time": "1:05:44", "remaining_time": "6:26:11"}
106
+ {"current_steps": 81, "total_steps": 550, "loss": 0.4442, "lr": 7.945664914451888e-05, "epoch": 0.7330316742081447, "percentage": 14.73, "elapsed_time": "1:06:33", "remaining_time": "6:25:23"}
107
+ {"current_steps": 82, "total_steps": 550, "loss": 0.4406, "lr": 7.941415343390773e-05, "epoch": 0.7420814479638009, "percentage": 14.91, "elapsed_time": "1:07:22", "remaining_time": "6:24:31"}
108
+ {"current_steps": 83, "total_steps": 550, "loss": 0.4507, "lr": 7.937007012694335e-05, "epoch": 0.751131221719457, "percentage": 15.09, "elapsed_time": "1:08:10", "remaining_time": "6:23:37"}
109
+ {"current_steps": 84, "total_steps": 550, "loss": 0.4532, "lr": 7.932440099929493e-05, "epoch": 0.7601809954751131, "percentage": 15.27, "elapsed_time": "1:08:59", "remaining_time": "6:22:44"}
110
+ {"current_steps": 85, "total_steps": 550, "loss": 0.4454, "lr": 7.927714789050826e-05, "epoch": 0.7692307692307693, "percentage": 15.45, "elapsed_time": "1:09:48", "remaining_time": "6:21:53"}
111
+ {"current_steps": 86, "total_steps": 550, "loss": 0.4367, "lr": 7.92283127039317e-05, "epoch": 0.7782805429864253, "percentage": 15.64, "elapsed_time": "1:10:37", "remaining_time": "6:21:02"}
112
+ {"current_steps": 87, "total_steps": 550, "loss": 0.4332, "lr": 7.917789740663941e-05, "epoch": 0.7873303167420814, "percentage": 15.82, "elapsed_time": "1:11:26", "remaining_time": "6:20:10"}
113
+ {"current_steps": 88, "total_steps": 550, "loss": 0.4345, "lr": 7.912590402935223e-05, "epoch": 0.7963800904977375, "percentage": 16.0, "elapsed_time": "1:12:14", "remaining_time": "6:19:18"}
114
+ {"current_steps": 89, "total_steps": 550, "loss": 0.4419, "lr": 7.907233466635582e-05, "epoch": 0.8054298642533937, "percentage": 16.18, "elapsed_time": "1:13:03", "remaining_time": "6:18:25"}
115
+ {"current_steps": 90, "total_steps": 550, "loss": 0.4383, "lr": 7.90171914754163e-05, "epoch": 0.8144796380090498, "percentage": 16.36, "elapsed_time": "1:13:51", "remaining_time": "6:17:32"}
116
+ {"current_steps": 91, "total_steps": 550, "loss": 0.4348, "lr": 7.896047667769335e-05, "epoch": 0.8235294117647058, "percentage": 16.55, "elapsed_time": "1:14:40", "remaining_time": "6:16:40"}
117
+ {"current_steps": 92, "total_steps": 550, "loss": 0.4293, "lr": 7.890219255765077e-05, "epoch": 0.832579185520362, "percentage": 16.73, "elapsed_time": "1:15:30", "remaining_time": "6:15:54"}
118
+ {"current_steps": 93, "total_steps": 550, "loss": 0.4375, "lr": 7.884234146296442e-05, "epoch": 0.8416289592760181, "percentage": 16.91, "elapsed_time": "1:16:19", "remaining_time": "6:15:01"}
119
+ {"current_steps": 94, "total_steps": 550, "loss": 0.4301, "lr": 7.878092580442766e-05, "epoch": 0.8506787330316742, "percentage": 17.09, "elapsed_time": "1:17:08", "remaining_time": "6:14:12"}
120
+ {"current_steps": 95, "total_steps": 550, "loss": 0.4377, "lr": 7.871794805585427e-05, "epoch": 0.8597285067873304, "percentage": 17.27, "elapsed_time": "1:17:57", "remaining_time": "6:13:20"}
121
+ {"current_steps": 96, "total_steps": 550, "loss": 0.4303, "lr": 7.865341075397874e-05, "epoch": 0.8687782805429864, "percentage": 17.45, "elapsed_time": "1:18:45", "remaining_time": "6:12:28"}
122
+ {"current_steps": 97, "total_steps": 550, "loss": 0.4321, "lr": 7.858731649835424e-05, "epoch": 0.8778280542986425, "percentage": 17.64, "elapsed_time": "1:19:34", "remaining_time": "6:11:37"}
123
+ {"current_steps": 98, "total_steps": 550, "loss": 0.4369, "lr": 7.85196679512477e-05, "epoch": 0.8868778280542986, "percentage": 17.82, "elapsed_time": "1:20:23", "remaining_time": "6:10:48"}
124
+ {"current_steps": 99, "total_steps": 550, "loss": 0.4229, "lr": 7.845046783753276e-05, "epoch": 0.8959276018099548, "percentage": 18.0, "elapsed_time": "1:21:12", "remaining_time": "6:09:56"}
125
+ {"current_steps": 100, "total_steps": 550, "loss": 0.4294, "lr": 7.837971894457991e-05, "epoch": 0.9049773755656109, "percentage": 18.18, "elapsed_time": "1:22:01", "remaining_time": "6:09:07"}
126
+ {"current_steps": 101, "total_steps": 550, "loss": 0.4276, "lr": 7.830742412214422e-05, "epoch": 0.9140271493212669, "percentage": 18.36, "elapsed_time": "1:22:50", "remaining_time": "6:08:16"}
127
+ {"current_steps": 102, "total_steps": 550, "loss": 0.4284, "lr": 7.82335862822506e-05, "epoch": 0.9230769230769231, "percentage": 18.55, "elapsed_time": "1:23:39", "remaining_time": "6:07:25"}
128
+ {"current_steps": 103, "total_steps": 550, "loss": 0.4237, "lr": 7.815820839907651e-05, "epoch": 0.9321266968325792, "percentage": 18.73, "elapsed_time": "1:24:28", "remaining_time": "6:06:34"}
129
+ {"current_steps": 104, "total_steps": 550, "loss": 0.4325, "lr": 7.808129350883207e-05, "epoch": 0.9411764705882353, "percentage": 18.91, "elapsed_time": "1:25:16", "remaining_time": "6:05:42"}
130
+ {"current_steps": 105, "total_steps": 550, "loss": 0.4282, "lr": 7.800284470963783e-05, "epoch": 0.9502262443438914, "percentage": 19.09, "elapsed_time": "1:26:05", "remaining_time": "6:04:50"}
131
+ {"current_steps": 106, "total_steps": 550, "loss": 0.426, "lr": 7.792286516139999e-05, "epoch": 0.9592760180995475, "percentage": 19.27, "elapsed_time": "1:26:53", "remaining_time": "6:03:58"}
132
+ {"current_steps": 107, "total_steps": 550, "loss": 0.4241, "lr": 7.784135808568308e-05, "epoch": 0.9683257918552036, "percentage": 19.45, "elapsed_time": "1:27:42", "remaining_time": "6:03:08"}
133
+ {"current_steps": 108, "total_steps": 550, "loss": 0.4356, "lr": 7.775832676558028e-05, "epoch": 0.9773755656108597, "percentage": 19.64, "elapsed_time": "1:28:31", "remaining_time": "6:02:17"}
134
+ {"current_steps": 109, "total_steps": 550, "loss": 0.4366, "lr": 7.7673774545581e-05, "epoch": 0.9864253393665159, "percentage": 19.82, "elapsed_time": "1:29:19", "remaining_time": "6:01:24"}
135
+ {"current_steps": 110, "total_steps": 550, "loss": 0.4329, "lr": 7.758770483143634e-05, "epoch": 0.995475113122172, "percentage": 20.0, "elapsed_time": "1:30:08", "remaining_time": "6:00:33"}
136
+ {"current_steps": 111, "total_steps": 550, "loss": 0.4137, "lr": 7.750012109002185e-05, "epoch": 1.006787330316742, "percentage": 20.18, "elapsed_time": "1:32:46", "remaining_time": "6:06:54"}
137
+ {"current_steps": 112, "total_steps": 550, "loss": 0.414, "lr": 7.741102684919787e-05, "epoch": 1.0158371040723981, "percentage": 20.36, "elapsed_time": "1:33:35", "remaining_time": "6:05:59"}
138
+ {"current_steps": 113, "total_steps": 550, "loss": 0.4059, "lr": 7.732042569766741e-05, "epoch": 1.0248868778280542, "percentage": 20.55, "elapsed_time": "1:34:24", "remaining_time": "6:05:04"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5e181380a1d815202a0f1016792dbdff776dd2f8e5e0f1f05cbfd42792051ea6
3
- size 7160
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cc1409cdfa320cecaf01b23c7cc425d4df9cf6a45c18f326509576976f8812c9
3
+ size 7288