neginr commited on
Commit
1604df7
·
verified ·
1 Parent(s): cb97bca

Training in progress, epoch 1

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2bd51b5b2ad4e088fa46a43be088a5b087fb002ace122ed7940e307bd5dfdc90
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f10ad0c990899f705f5d432a4532d775a7d3d084dd9c9f9be0ae23bba0d48cb0
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a9a321df940364d3062620ac1d54c04773a2f96adbe4bf75d2692828289cb708
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:96ebfc4bc368c86172b060c19329e902f5b2d7215c73ae1602382f0e4d50a991
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3d7463019e2b09248de5a8ddd0cf053920b4f1ecd1e918a8fc55eeeb72fe10e9
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:710d9b234280555cc0d13db7a3e4ceb2173890cd133c1b13549e8ea06ca65233
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:38541c915a5e6c6dbc72d2e4b11faa12621e56e1dbc531e8d5ce25518bec7628
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e7b4bf9e938fcecc3ac08a2ddbacfc246eddb1bf4a97fa7ffbdeeb3425a0a6a2
3
  size 1089994880
trainer_log.jsonl CHANGED
@@ -111,3 +111,114 @@
111
  {"current_steps": 110, "total_steps": 555, "loss": 0.6088, "lr": 7.77105607722978e-05, "epoch": 0.9898762654668166, "percentage": 19.82, "elapsed_time": "3:37:01", "remaining_time": "14:37:56"}
112
  {"current_steps": 111, "total_steps": 555, "loss": 0.6027, "lr": 7.762583821310548e-05, "epoch": 0.9988751406074241, "percentage": 20.0, "elapsed_time": "3:38:58", "remaining_time": "14:35:53"}
113
  {"current_steps": 112, "total_steps": 555, "loss": 1.109, "lr": 7.753962429077881e-05, "epoch": 1.0078740157480315, "percentage": 20.18, "elapsed_time": "3:42:50", "remaining_time": "14:41:23"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
111
  {"current_steps": 110, "total_steps": 555, "loss": 0.6088, "lr": 7.77105607722978e-05, "epoch": 0.9898762654668166, "percentage": 19.82, "elapsed_time": "3:37:01", "remaining_time": "14:37:56"}
112
  {"current_steps": 111, "total_steps": 555, "loss": 0.6027, "lr": 7.762583821310548e-05, "epoch": 0.9988751406074241, "percentage": 20.0, "elapsed_time": "3:38:58", "remaining_time": "14:35:53"}
113
  {"current_steps": 112, "total_steps": 555, "loss": 1.109, "lr": 7.753962429077881e-05, "epoch": 1.0078740157480315, "percentage": 20.18, "elapsed_time": "3:42:50", "remaining_time": "14:41:23"}
114
+ {"current_steps": 113, "total_steps": 555, "loss": 0.5896, "lr": 7.7451922422551e-05, "epoch": 1.0168728908886389, "percentage": 20.36, "elapsed_time": "3:44:49", "remaining_time": "14:39:23"}
115
+ {"current_steps": 114, "total_steps": 555, "loss": 0.5776, "lr": 7.736273608463253e-05, "epoch": 1.0258717660292462, "percentage": 20.54, "elapsed_time": "3:46:47", "remaining_time": "14:37:19"}
116
+ {"current_steps": 115, "total_steps": 555, "loss": 0.5907, "lr": 7.727206881207334e-05, "epoch": 1.0348706411698538, "percentage": 20.72, "elapsed_time": "3:48:44", "remaining_time": "14:35:12"}
117
+ {"current_steps": 116, "total_steps": 555, "loss": 0.5873, "lr": 7.717992419862268e-05, "epoch": 1.0438695163104612, "percentage": 20.9, "elapsed_time": "3:50:44", "remaining_time": "14:33:12"}
118
+ {"current_steps": 117, "total_steps": 555, "loss": 0.5835, "lr": 7.708630589658667e-05, "epoch": 1.0528683914510686, "percentage": 21.08, "elapsed_time": "3:52:44", "remaining_time": "14:31:16"}
119
+ {"current_steps": 118, "total_steps": 555, "loss": 0.5794, "lr": 7.699121761668355e-05, "epoch": 1.061867266591676, "percentage": 21.26, "elapsed_time": "3:54:43", "remaining_time": "14:29:16"}
120
+ {"current_steps": 119, "total_steps": 555, "loss": 0.582, "lr": 7.689466312789661e-05, "epoch": 1.0708661417322836, "percentage": 21.44, "elapsed_time": "3:56:42", "remaining_time": "14:27:16"}
121
+ {"current_steps": 120, "total_steps": 555, "loss": 0.5907, "lr": 7.679664625732478e-05, "epoch": 1.079865016872891, "percentage": 21.62, "elapsed_time": "3:58:42", "remaining_time": "14:25:18"}
122
+ {"current_steps": 121, "total_steps": 555, "loss": 0.5742, "lr": 7.669717089003094e-05, "epoch": 1.0888638920134983, "percentage": 21.8, "elapsed_time": "4:00:43", "remaining_time": "14:23:23"}
123
+ {"current_steps": 122, "total_steps": 555, "loss": 0.5831, "lr": 7.659624096888792e-05, "epoch": 1.0978627671541057, "percentage": 21.98, "elapsed_time": "4:02:40", "remaining_time": "14:21:18"}
124
+ {"current_steps": 123, "total_steps": 555, "loss": 0.5827, "lr": 7.649386049442223e-05, "epoch": 1.106861642294713, "percentage": 22.16, "elapsed_time": "4:04:39", "remaining_time": "14:19:16"}
125
+ {"current_steps": 124, "total_steps": 555, "loss": 0.5745, "lr": 7.639003352465551e-05, "epoch": 1.1158605174353207, "percentage": 22.34, "elapsed_time": "4:06:39", "remaining_time": "14:17:18"}
126
+ {"current_steps": 125, "total_steps": 555, "loss": 0.5839, "lr": 7.628476417494368e-05, "epoch": 1.124859392575928, "percentage": 22.52, "elapsed_time": "4:08:37", "remaining_time": "14:15:15"}
127
+ {"current_steps": 126, "total_steps": 555, "loss": 0.5754, "lr": 7.617805661781374e-05, "epoch": 1.1338582677165354, "percentage": 22.7, "elapsed_time": "4:10:34", "remaining_time": "14:13:08"}
128
+ {"current_steps": 127, "total_steps": 555, "loss": 0.5772, "lr": 7.60699150827985e-05, "epoch": 1.1428571428571428, "percentage": 22.88, "elapsed_time": "4:12:34", "remaining_time": "14:11:10"}
129
+ {"current_steps": 128, "total_steps": 555, "loss": 0.5727, "lr": 7.596034385626888e-05, "epoch": 1.1518560179977504, "percentage": 23.06, "elapsed_time": "4:14:33", "remaining_time": "14:09:12"}
130
+ {"current_steps": 129, "total_steps": 555, "loss": 0.5736, "lr": 7.584934728126403e-05, "epoch": 1.1608548931383578, "percentage": 23.24, "elapsed_time": "4:16:32", "remaining_time": "14:07:12"}
131
+ {"current_steps": 130, "total_steps": 555, "loss": 0.5677, "lr": 7.573692975731914e-05, "epoch": 1.1698537682789651, "percentage": 23.42, "elapsed_time": "4:18:30", "remaining_time": "14:05:08"}
132
+ {"current_steps": 131, "total_steps": 555, "loss": 0.5796, "lr": 7.562309574029112e-05, "epoch": 1.1788526434195725, "percentage": 23.6, "elapsed_time": "4:20:30", "remaining_time": "14:03:08"}
133
+ {"current_steps": 132, "total_steps": 555, "loss": 0.5669, "lr": 7.550784974218195e-05, "epoch": 1.18785151856018, "percentage": 23.78, "elapsed_time": "4:22:29", "remaining_time": "14:01:09"}
134
+ {"current_steps": 133, "total_steps": 555, "loss": 0.5641, "lr": 7.539119633095983e-05, "epoch": 1.1968503937007875, "percentage": 23.96, "elapsed_time": "4:24:28", "remaining_time": "13:59:08"}
135
+ {"current_steps": 134, "total_steps": 555, "loss": 0.5763, "lr": 7.527314013037815e-05, "epoch": 1.2058492688413949, "percentage": 24.14, "elapsed_time": "4:26:26", "remaining_time": "13:57:04"}
136
+ {"current_steps": 135, "total_steps": 555, "loss": 0.5703, "lr": 7.515368581979224e-05, "epoch": 1.2148481439820022, "percentage": 24.32, "elapsed_time": "4:28:24", "remaining_time": "13:55:03"}
137
+ {"current_steps": 136, "total_steps": 555, "loss": 0.5703, "lr": 7.503283813397379e-05, "epoch": 1.2238470191226096, "percentage": 24.5, "elapsed_time": "4:30:23", "remaining_time": "13:53:01"}
138
+ {"current_steps": 137, "total_steps": 555, "loss": 0.5715, "lr": 7.491060186292331e-05, "epoch": 1.232845894263217, "percentage": 24.68, "elapsed_time": "4:32:21", "remaining_time": "13:50:59"}
139
+ {"current_steps": 138, "total_steps": 555, "loss": 0.5714, "lr": 7.478698185168019e-05, "epoch": 1.2418447694038246, "percentage": 24.86, "elapsed_time": "4:34:23", "remaining_time": "13:49:07"}
140
+ {"current_steps": 139, "total_steps": 555, "loss": 0.5761, "lr": 7.466198300013066e-05, "epoch": 1.250843644544432, "percentage": 25.05, "elapsed_time": "4:36:23", "remaining_time": "13:47:11"}
141
+ {"current_steps": 140, "total_steps": 555, "loss": 0.5697, "lr": 7.453561026281366e-05, "epoch": 1.2598425196850394, "percentage": 25.23, "elapsed_time": "4:38:21", "remaining_time": "13:45:06"}
142
+ {"current_steps": 141, "total_steps": 555, "loss": 0.5725, "lr": 7.440786864872433e-05, "epoch": 1.2688413948256467, "percentage": 25.41, "elapsed_time": "4:40:19", "remaining_time": "13:43:05"}
143
+ {"current_steps": 142, "total_steps": 555, "loss": 0.5737, "lr": 7.427876322111558e-05, "epoch": 1.277840269966254, "percentage": 25.59, "elapsed_time": "4:42:19", "remaining_time": "13:41:06"}
144
+ {"current_steps": 143, "total_steps": 555, "loss": 0.5724, "lr": 7.414829909729727e-05, "epoch": 1.2868391451068617, "percentage": 25.77, "elapsed_time": "4:44:18", "remaining_time": "13:39:07"}
145
+ {"current_steps": 144, "total_steps": 555, "loss": 0.5725, "lr": 7.40164814484336e-05, "epoch": 1.295838020247469, "percentage": 25.95, "elapsed_time": "4:46:17", "remaining_time": "13:37:07"}
146
+ {"current_steps": 145, "total_steps": 555, "loss": 0.5743, "lr": 7.388331549933787e-05, "epoch": 1.3048368953880765, "percentage": 26.13, "elapsed_time": "4:48:15", "remaining_time": "13:35:04"}
147
+ {"current_steps": 146, "total_steps": 555, "loss": 0.5658, "lr": 7.37488065282656e-05, "epoch": 1.3138357705286838, "percentage": 26.31, "elapsed_time": "4:50:13", "remaining_time": "13:33:01"}
148
+ {"current_steps": 147, "total_steps": 555, "loss": 0.5708, "lr": 7.361295986670522e-05, "epoch": 1.3228346456692912, "percentage": 26.49, "elapsed_time": "4:52:10", "remaining_time": "13:30:57"}
149
+ {"current_steps": 148, "total_steps": 555, "loss": 0.5629, "lr": 7.347578089916672e-05, "epoch": 1.3318335208098988, "percentage": 26.67, "elapsed_time": "4:54:09", "remaining_time": "13:28:55"}
150
+ {"current_steps": 149, "total_steps": 555, "loss": 0.5711, "lr": 7.333727506296831e-05, "epoch": 1.3408323959505062, "percentage": 26.85, "elapsed_time": "4:56:08", "remaining_time": "13:26:56"}
151
+ {"current_steps": 150, "total_steps": 555, "loss": 0.5701, "lr": 7.319744784802087e-05, "epoch": 1.3498312710911136, "percentage": 27.03, "elapsed_time": "4:58:07", "remaining_time": "13:24:55"}
152
+ {"current_steps": 151, "total_steps": 555, "loss": 0.568, "lr": 7.305630479661033e-05, "epoch": 1.3588301462317212, "percentage": 27.21, "elapsed_time": "5:00:04", "remaining_time": "13:22:52"}
153
+ {"current_steps": 152, "total_steps": 555, "loss": 0.5704, "lr": 7.291385150317796e-05, "epoch": 1.3678290213723285, "percentage": 27.39, "elapsed_time": "5:02:04", "remaining_time": "13:20:53"}
154
+ {"current_steps": 153, "total_steps": 555, "loss": 0.5626, "lr": 7.277009361409874e-05, "epoch": 1.376827896512936, "percentage": 27.57, "elapsed_time": "5:04:03", "remaining_time": "13:18:53"}
155
+ {"current_steps": 154, "total_steps": 555, "loss": 0.5682, "lr": 7.262503682745744e-05, "epoch": 1.3858267716535433, "percentage": 27.75, "elapsed_time": "5:06:00", "remaining_time": "13:16:49"}
156
+ {"current_steps": 155, "total_steps": 555, "loss": 0.5652, "lr": 7.247868689282283e-05, "epoch": 1.3948256467941507, "percentage": 27.93, "elapsed_time": "5:07:58", "remaining_time": "13:14:47"}
157
+ {"current_steps": 156, "total_steps": 555, "loss": 0.5702, "lr": 7.233104961101974e-05, "epoch": 1.4038245219347583, "percentage": 28.11, "elapsed_time": "5:09:56", "remaining_time": "13:12:44"}
158
+ {"current_steps": 157, "total_steps": 555, "loss": 0.5656, "lr": 7.21821308338992e-05, "epoch": 1.4128233970753656, "percentage": 28.29, "elapsed_time": "5:11:54", "remaining_time": "13:10:41"}
159
+ {"current_steps": 158, "total_steps": 555, "loss": 0.5625, "lr": 7.203193646410642e-05, "epoch": 1.421822272215973, "percentage": 28.47, "elapsed_time": "5:13:51", "remaining_time": "13:08:38"}
160
+ {"current_steps": 159, "total_steps": 555, "loss": 0.5622, "lr": 7.188047245484686e-05, "epoch": 1.4308211473565804, "percentage": 28.65, "elapsed_time": "5:15:50", "remaining_time": "13:06:38"}
161
+ {"current_steps": 160, "total_steps": 555, "loss": 0.5663, "lr": 7.172774480965033e-05, "epoch": 1.4398200224971878, "percentage": 28.83, "elapsed_time": "5:17:47", "remaining_time": "13:04:33"}
162
+ {"current_steps": 161, "total_steps": 555, "loss": 0.5604, "lr": 7.157375958213288e-05, "epoch": 1.4488188976377954, "percentage": 29.01, "elapsed_time": "5:19:45", "remaining_time": "13:02:30"}
163
+ {"current_steps": 162, "total_steps": 555, "loss": 0.5644, "lr": 7.141852287575701e-05, "epoch": 1.4578177727784027, "percentage": 29.19, "elapsed_time": "5:21:43", "remaining_time": "13:00:29"}
164
+ {"current_steps": 163, "total_steps": 555, "loss": 0.5543, "lr": 7.126204084358963e-05, "epoch": 1.4668166479190101, "percentage": 29.37, "elapsed_time": "5:23:40", "remaining_time": "12:58:24"}
165
+ {"current_steps": 164, "total_steps": 555, "loss": 0.5667, "lr": 7.110431968805825e-05, "epoch": 1.4758155230596175, "percentage": 29.55, "elapsed_time": "5:25:36", "remaining_time": "12:56:17"}
166
+ {"current_steps": 165, "total_steps": 555, "loss": 0.5649, "lr": 7.094536566070514e-05, "epoch": 1.4848143982002249, "percentage": 29.73, "elapsed_time": "5:27:34", "remaining_time": "12:54:16"}
167
+ {"current_steps": 166, "total_steps": 555, "loss": 0.5597, "lr": 7.078518506193945e-05, "epoch": 1.4938132733408325, "percentage": 29.91, "elapsed_time": "5:29:32", "remaining_time": "12:52:13"}
168
+ {"current_steps": 167, "total_steps": 555, "loss": 0.5683, "lr": 7.062378424078758e-05, "epoch": 1.5028121484814398, "percentage": 30.09, "elapsed_time": "5:31:29", "remaining_time": "12:50:11"}
169
+ {"current_steps": 168, "total_steps": 555, "loss": 0.5627, "lr": 7.046116959464149e-05, "epoch": 1.5118110236220472, "percentage": 30.27, "elapsed_time": "5:33:27", "remaining_time": "12:48:07"}
170
+ {"current_steps": 169, "total_steps": 555, "loss": 0.5619, "lr": 7.02973475690051e-05, "epoch": 1.5208098987626548, "percentage": 30.45, "elapsed_time": "5:35:25", "remaining_time": "12:46:08"}
171
+ {"current_steps": 170, "total_steps": 555, "loss": 0.5685, "lr": 7.013232465723888e-05, "epoch": 1.529808773903262, "percentage": 30.63, "elapsed_time": "5:37:24", "remaining_time": "12:44:08"}
172
+ {"current_steps": 171, "total_steps": 555, "loss": 0.5649, "lr": 6.996610740030237e-05, "epoch": 1.5388076490438696, "percentage": 30.81, "elapsed_time": "5:39:23", "remaining_time": "12:42:08"}
173
+ {"current_steps": 172, "total_steps": 555, "loss": 0.5641, "lr": 6.979870238649506e-05, "epoch": 1.547806524184477, "percentage": 30.99, "elapsed_time": "5:41:22", "remaining_time": "12:40:08"}
174
+ {"current_steps": 173, "total_steps": 555, "loss": 0.5607, "lr": 6.963011625119514e-05, "epoch": 1.5568053993250843, "percentage": 31.17, "elapsed_time": "5:43:20", "remaining_time": "12:38:07"}
175
+ {"current_steps": 174, "total_steps": 555, "loss": 0.5632, "lr": 6.94603556765965e-05, "epoch": 1.565804274465692, "percentage": 31.35, "elapsed_time": "5:45:18", "remaining_time": "12:36:06"}
176
+ {"current_steps": 175, "total_steps": 555, "loss": 0.5561, "lr": 6.928942739144394e-05, "epoch": 1.574803149606299, "percentage": 31.53, "elapsed_time": "5:47:15", "remaining_time": "12:34:03"}
177
+ {"current_steps": 176, "total_steps": 555, "loss": 0.5684, "lr": 6.911733817076638e-05, "epoch": 1.5838020247469067, "percentage": 31.71, "elapsed_time": "5:49:13", "remaining_time": "12:32:01"}
178
+ {"current_steps": 177, "total_steps": 555, "loss": 0.5636, "lr": 6.894409483560845e-05, "epoch": 1.592800899887514, "percentage": 31.89, "elapsed_time": "5:51:12", "remaining_time": "12:30:02"}
179
+ {"current_steps": 178, "total_steps": 555, "loss": 0.5636, "lr": 6.876970425275993e-05, "epoch": 1.6017997750281214, "percentage": 32.07, "elapsed_time": "5:53:10", "remaining_time": "12:28:00"}
180
+ {"current_steps": 179, "total_steps": 555, "loss": 0.5657, "lr": 6.859417333448376e-05, "epoch": 1.610798650168729, "percentage": 32.25, "elapsed_time": "5:55:08", "remaining_time": "12:26:00"}
181
+ {"current_steps": 180, "total_steps": 555, "loss": 0.553, "lr": 6.841750903824196e-05, "epoch": 1.6197975253093362, "percentage": 32.43, "elapsed_time": "5:57:08", "remaining_time": "12:24:03"}
182
+ {"current_steps": 181, "total_steps": 555, "loss": 0.553, "lr": 6.823971836641988e-05, "epoch": 1.6287964004499438, "percentage": 32.61, "elapsed_time": "5:59:07", "remaining_time": "12:22:02"}
183
+ {"current_steps": 182, "total_steps": 555, "loss": 0.5606, "lr": 6.806080836604868e-05, "epoch": 1.6377952755905512, "percentage": 32.79, "elapsed_time": "6:01:05", "remaining_time": "12:20:02"}
184
+ {"current_steps": 183, "total_steps": 555, "loss": 0.5611, "lr": 6.788078612852596e-05, "epoch": 1.6467941507311585, "percentage": 32.97, "elapsed_time": "6:03:05", "remaining_time": "12:18:04"}
185
+ {"current_steps": 184, "total_steps": 555, "loss": 0.5589, "lr": 6.769965878933468e-05, "epoch": 1.6557930258717661, "percentage": 33.15, "elapsed_time": "6:05:02", "remaining_time": "12:16:02"}
186
+ {"current_steps": 185, "total_steps": 555, "loss": 0.5513, "lr": 6.751743352776041e-05, "epoch": 1.6647919010123733, "percentage": 33.33, "elapsed_time": "6:07:00", "remaining_time": "12:14:00"}
187
+ {"current_steps": 186, "total_steps": 555, "loss": 0.561, "lr": 6.733411756660668e-05, "epoch": 1.6737907761529809, "percentage": 33.51, "elapsed_time": "6:09:00", "remaining_time": "12:12:03"}
188
+ {"current_steps": 187, "total_steps": 555, "loss": 0.5565, "lr": 6.714971817190872e-05, "epoch": 1.6827896512935883, "percentage": 33.69, "elapsed_time": "6:10:59", "remaining_time": "12:10:05"}
189
+ {"current_steps": 188, "total_steps": 555, "loss": 0.5554, "lr": 6.696424265264549e-05, "epoch": 1.6917885264341956, "percentage": 33.87, "elapsed_time": "6:13:00", "remaining_time": "12:08:09"}
190
+ {"current_steps": 189, "total_steps": 555, "loss": 0.5603, "lr": 6.677769836044991e-05, "epoch": 1.7007874015748032, "percentage": 34.05, "elapsed_time": "6:15:02", "remaining_time": "12:06:15"}
191
+ {"current_steps": 190, "total_steps": 555, "loss": 0.5574, "lr": 6.659009268931756e-05, "epoch": 1.7097862767154106, "percentage": 34.23, "elapsed_time": "6:17:02", "remaining_time": "12:04:18"}
192
+ {"current_steps": 191, "total_steps": 555, "loss": 0.5507, "lr": 6.64014330753135e-05, "epoch": 1.718785151856018, "percentage": 34.41, "elapsed_time": "6:19:00", "remaining_time": "12:02:17"}
193
+ {"current_steps": 192, "total_steps": 555, "loss": 0.5551, "lr": 6.621172699627761e-05, "epoch": 1.7277840269966256, "percentage": 34.59, "elapsed_time": "6:20:59", "remaining_time": "12:00:17"}
194
+ {"current_steps": 193, "total_steps": 555, "loss": 0.555, "lr": 6.602098197152817e-05, "epoch": 1.7367829021372327, "percentage": 34.77, "elapsed_time": "6:22:58", "remaining_time": "11:58:19"}
195
+ {"current_steps": 194, "total_steps": 555, "loss": 0.5631, "lr": 6.582920556156378e-05, "epoch": 1.7457817772778403, "percentage": 34.95, "elapsed_time": "6:24:56", "remaining_time": "11:56:18"}
196
+ {"current_steps": 195, "total_steps": 555, "loss": 0.56, "lr": 6.563640536776375e-05, "epoch": 1.7547806524184477, "percentage": 35.14, "elapsed_time": "6:26:53", "remaining_time": "11:54:16"}
197
+ {"current_steps": 196, "total_steps": 555, "loss": 0.5518, "lr": 6.544258903208679e-05, "epoch": 1.763779527559055, "percentage": 35.32, "elapsed_time": "6:28:51", "remaining_time": "11:52:15"}
198
+ {"current_steps": 197, "total_steps": 555, "loss": 0.55, "lr": 6.524776423676806e-05, "epoch": 1.7727784026996627, "percentage": 35.5, "elapsed_time": "6:30:47", "remaining_time": "11:50:09"}
199
+ {"current_steps": 198, "total_steps": 555, "loss": 0.5579, "lr": 6.505193870401472e-05, "epoch": 1.7817772778402698, "percentage": 35.68, "elapsed_time": "6:32:45", "remaining_time": "11:48:09"}
200
+ {"current_steps": 199, "total_steps": 555, "loss": 0.5628, "lr": 6.485512019569986e-05, "epoch": 1.7907761529808774, "percentage": 35.86, "elapsed_time": "6:34:43", "remaining_time": "11:46:09"}
201
+ {"current_steps": 200, "total_steps": 555, "loss": 0.5561, "lr": 6.465731651305475e-05, "epoch": 1.7997750281214848, "percentage": 36.04, "elapsed_time": "6:36:41", "remaining_time": "11:44:07"}
202
+ {"current_steps": 201, "total_steps": 555, "loss": 0.5589, "lr": 6.445853549635982e-05, "epoch": 1.8087739032620922, "percentage": 36.22, "elapsed_time": "6:38:39", "remaining_time": "11:42:06"}
203
+ {"current_steps": 202, "total_steps": 555, "loss": 0.5464, "lr": 6.425878502463363e-05, "epoch": 1.8177727784026998, "percentage": 36.4, "elapsed_time": "6:40:36", "remaining_time": "11:40:04"}
204
+ {"current_steps": 203, "total_steps": 555, "loss": 0.5583, "lr": 6.405807301532082e-05, "epoch": 1.826771653543307, "percentage": 36.58, "elapsed_time": "6:42:34", "remaining_time": "11:38:04"}
205
+ {"current_steps": 204, "total_steps": 555, "loss": 0.5515, "lr": 6.38564074239781e-05, "epoch": 1.8357705286839145, "percentage": 36.76, "elapsed_time": "6:44:32", "remaining_time": "11:36:03"}
206
+ {"current_steps": 205, "total_steps": 555, "loss": 0.5545, "lr": 6.365379624395911e-05, "epoch": 1.844769403824522, "percentage": 36.94, "elapsed_time": "6:46:30", "remaining_time": "11:34:02"}
207
+ {"current_steps": 206, "total_steps": 555, "loss": 0.5511, "lr": 6.345024750609735e-05, "epoch": 1.8537682789651293, "percentage": 37.12, "elapsed_time": "6:48:27", "remaining_time": "11:31:59"}
208
+ {"current_steps": 207, "total_steps": 555, "loss": 0.5569, "lr": 6.324576927838811e-05, "epoch": 1.862767154105737, "percentage": 37.3, "elapsed_time": "6:50:25", "remaining_time": "11:29:59"}
209
+ {"current_steps": 208, "total_steps": 555, "loss": 0.5507, "lr": 6.30403696656685e-05, "epoch": 1.871766029246344, "percentage": 37.48, "elapsed_time": "6:52:24", "remaining_time": "11:27:59"}
210
+ {"current_steps": 209, "total_steps": 555, "loss": 0.551, "lr": 6.28340568092963e-05, "epoch": 1.8807649043869517, "percentage": 37.66, "elapsed_time": "6:54:19", "remaining_time": "11:25:55"}
211
+ {"current_steps": 210, "total_steps": 555, "loss": 0.5552, "lr": 6.26268388868272e-05, "epoch": 1.889763779527559, "percentage": 37.84, "elapsed_time": "6:56:17", "remaining_time": "11:23:53"}
212
+ {"current_steps": 211, "total_steps": 555, "loss": 0.5515, "lr": 6.241872411169075e-05, "epoch": 1.8987626546681664, "percentage": 38.02, "elapsed_time": "6:58:14", "remaining_time": "11:21:51"}
213
+ {"current_steps": 212, "total_steps": 555, "loss": 0.5452, "lr": 6.220972073286469e-05, "epoch": 1.907761529808774, "percentage": 38.2, "elapsed_time": "7:00:10", "remaining_time": "11:19:49"}
214
+ {"current_steps": 213, "total_steps": 555, "loss": 0.5509, "lr": 6.199983703454813e-05, "epoch": 1.9167604049493814, "percentage": 38.38, "elapsed_time": "7:02:08", "remaining_time": "11:17:48"}
215
+ {"current_steps": 214, "total_steps": 555, "loss": 0.5456, "lr": 6.178908133583306e-05, "epoch": 1.9257592800899888, "percentage": 38.56, "elapsed_time": "7:04:06", "remaining_time": "11:15:47"}
216
+ {"current_steps": 215, "total_steps": 555, "loss": 0.5525, "lr": 6.157746199037473e-05, "epoch": 1.9347581552305961, "percentage": 38.74, "elapsed_time": "7:06:02", "remaining_time": "11:13:45"}
217
+ {"current_steps": 216, "total_steps": 555, "loss": 0.5494, "lr": 6.136498738606038e-05, "epoch": 1.9437570303712035, "percentage": 38.92, "elapsed_time": "7:08:00", "remaining_time": "11:11:43"}
218
+ {"current_steps": 217, "total_steps": 555, "loss": 0.5578, "lr": 6.115166594467696e-05, "epoch": 1.952755905511811, "percentage": 39.1, "elapsed_time": "7:09:57", "remaining_time": "11:09:42"}
219
+ {"current_steps": 218, "total_steps": 555, "loss": 0.5501, "lr": 6.093750612157719e-05, "epoch": 1.9617547806524185, "percentage": 39.28, "elapsed_time": "7:11:55", "remaining_time": "11:07:41"}
220
+ {"current_steps": 219, "total_steps": 555, "loss": 0.5544, "lr": 6.0722516405344436e-05, "epoch": 1.9707536557930259, "percentage": 39.46, "elapsed_time": "7:13:51", "remaining_time": "11:05:38"}
221
+ {"current_steps": 220, "total_steps": 555, "loss": 0.5436, "lr": 6.050670531745629e-05, "epoch": 1.9797525309336335, "percentage": 39.64, "elapsed_time": "7:15:47", "remaining_time": "11:03:36"}
222
+ {"current_steps": 221, "total_steps": 555, "loss": 0.5589, "lr": 6.0290081411946785e-05, "epoch": 1.9887514060742406, "percentage": 39.82, "elapsed_time": "7:17:46", "remaining_time": "11:01:36"}
223
+ {"current_steps": 222, "total_steps": 555, "loss": 0.5489, "lr": 6.007265327506734e-05, "epoch": 1.9977502812148482, "percentage": 40.0, "elapsed_time": "7:19:43", "remaining_time": "10:59:35"}
224
+ {"current_steps": 223, "total_steps": 555, "loss": 0.9973, "lr": 5.985442952494643e-05, "epoch": 2.0067491563554554, "percentage": 40.18, "elapsed_time": "7:23:29", "remaining_time": "11:00:16"}