Training in progress, epoch 0
Browse files- model-00001-of-00004.safetensors +1 -1
- model-00002-of-00004.safetensors +1 -1
- model-00003-of-00004.safetensors +1 -1
- model-00004-of-00004.safetensors +1 -1
- trainer_log.jsonl +138 -332
- training_args.bin +2 -2
model-00001-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4877660776
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3e32710c88092895ee260ec5a8ac0f8f5773d56a2f0f9655f0bae24f076e3878
|
3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4932751008
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:05ae56627f4c096baa5ad34d4e920d071ee8aa0ec98aa6e0f6e4f99a9efd70f5
|
3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4330865200
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:efaf187383d1e6f0641df3806d03308d765e0572cb5dee80fc959f0b41837d5a
|
3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1089994880
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a05a5fd5a9dd78297c0bd00789ed43d322cce523007f3cab9ab6596a494d5fc6
|
3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
@@ -1,332 +1,138 @@
|
|
1 |
-
{"current_steps": 1, "total_steps": 550, "loss": 0.
|
2 |
-
{"current_steps": 2, "total_steps": 550, "loss": 0.
|
3 |
-
{"current_steps": 3, "total_steps": 550, "loss": 0.
|
4 |
-
{"current_steps": 4, "total_steps": 550, "loss": 0.
|
5 |
-
{"current_steps": 5, "total_steps": 550, "loss": 0.
|
6 |
-
{"current_steps": 6, "total_steps": 550, "loss": 0.
|
7 |
-
{"current_steps": 7, "total_steps": 550, "loss": 0.
|
8 |
-
{"current_steps": 8, "total_steps": 550, "loss": 0.
|
9 |
-
{"current_steps": 9, "total_steps": 550, "loss": 0.
|
10 |
-
{"current_steps": 10, "total_steps": 550, "loss": 0.
|
11 |
-
{"current_steps": 11, "total_steps": 550, "loss": 0.
|
12 |
-
{"current_steps": 12, "total_steps": 550, "loss": 0.
|
13 |
-
{"current_steps": 13, "total_steps": 550, "loss": 0.
|
14 |
-
{"current_steps": 14, "total_steps": 550, "loss": 0.
|
15 |
-
{"current_steps": 15, "total_steps": 550, "loss": 0.
|
16 |
-
{"current_steps": 16, "total_steps": 550, "loss": 0.
|
17 |
-
{"current_steps": 17, "total_steps": 550, "loss": 0.
|
18 |
-
{"current_steps": 18, "total_steps": 550, "loss": 0.
|
19 |
-
{"current_steps": 19, "total_steps": 550, "loss": 0.
|
20 |
-
{"current_steps": 20, "total_steps": 550, "loss": 0.
|
21 |
-
{"current_steps": 21, "total_steps": 550, "loss": 0.
|
22 |
-
{"current_steps": 22, "total_steps": 550, "loss": 0.
|
23 |
-
{"current_steps": 23, "total_steps": 550, "loss": 0.
|
24 |
-
{"current_steps": 24, "total_steps": 550, "loss": 0.
|
25 |
-
{"current_steps": 25, "total_steps": 550, "loss": 0.
|
26 |
-
{"current_steps":
|
27 |
-
{"current_steps":
|
28 |
-
{"current_steps":
|
29 |
-
{"current_steps":
|
30 |
-
{"current_steps":
|
31 |
-
{"current_steps":
|
32 |
-
{"current_steps":
|
33 |
-
{"current_steps":
|
34 |
-
{"current_steps":
|
35 |
-
{"current_steps":
|
36 |
-
{"current_steps":
|
37 |
-
{"current_steps":
|
38 |
-
{"current_steps":
|
39 |
-
{"current_steps":
|
40 |
-
{"current_steps":
|
41 |
-
{"current_steps":
|
42 |
-
{"current_steps":
|
43 |
-
{"current_steps":
|
44 |
-
{"current_steps":
|
45 |
-
{"current_steps":
|
46 |
-
{"current_steps":
|
47 |
-
{"current_steps":
|
48 |
-
{"current_steps":
|
49 |
-
{"current_steps":
|
50 |
-
{"current_steps":
|
51 |
-
{"current_steps":
|
52 |
-
{"current_steps":
|
53 |
-
{"current_steps":
|
54 |
-
{"current_steps":
|
55 |
-
{"current_steps":
|
56 |
-
{"current_steps":
|
57 |
-
{"current_steps":
|
58 |
-
{"current_steps":
|
59 |
-
{"current_steps":
|
60 |
-
{"current_steps":
|
61 |
-
{"current_steps":
|
62 |
-
{"current_steps":
|
63 |
-
{"current_steps":
|
64 |
-
{"current_steps":
|
65 |
-
{"current_steps":
|
66 |
-
{"current_steps":
|
67 |
-
{"current_steps":
|
68 |
-
{"current_steps":
|
69 |
-
{"current_steps":
|
70 |
-
{"current_steps":
|
71 |
-
{"current_steps":
|
72 |
-
{"current_steps":
|
73 |
-
{"current_steps":
|
74 |
-
{"current_steps":
|
75 |
-
{"current_steps":
|
76 |
-
{"current_steps":
|
77 |
-
{"current_steps":
|
78 |
-
{"current_steps":
|
79 |
-
{"current_steps":
|
80 |
-
{"current_steps":
|
81 |
-
{"current_steps":
|
82 |
-
{"current_steps":
|
83 |
-
{"current_steps":
|
84 |
-
{"current_steps":
|
85 |
-
{"current_steps":
|
86 |
-
{"current_steps":
|
87 |
-
{"current_steps":
|
88 |
-
{"current_steps":
|
89 |
-
{"current_steps":
|
90 |
-
{"current_steps":
|
91 |
-
{"current_steps":
|
92 |
-
{"current_steps":
|
93 |
-
{"current_steps":
|
94 |
-
{"current_steps":
|
95 |
-
{"current_steps":
|
96 |
-
{"current_steps":
|
97 |
-
{"current_steps":
|
98 |
-
{"current_steps":
|
99 |
-
{"current_steps":
|
100 |
-
{"current_steps":
|
101 |
-
{"current_steps":
|
102 |
-
{"current_steps":
|
103 |
-
{"current_steps":
|
104 |
-
{"current_steps":
|
105 |
-
{"current_steps":
|
106 |
-
{"current_steps":
|
107 |
-
{"current_steps":
|
108 |
-
{"current_steps":
|
109 |
-
{"current_steps":
|
110 |
-
{"current_steps":
|
111 |
-
{"current_steps":
|
112 |
-
{"current_steps":
|
113 |
-
{"current_steps":
|
114 |
-
{"current_steps":
|
115 |
-
{"current_steps":
|
116 |
-
{"current_steps":
|
117 |
-
{"current_steps":
|
118 |
-
{"current_steps":
|
119 |
-
{"current_steps":
|
120 |
-
{"current_steps":
|
121 |
-
{"current_steps":
|
122 |
-
{"current_steps":
|
123 |
-
{"current_steps":
|
124 |
-
{"current_steps":
|
125 |
-
{"current_steps":
|
126 |
-
{"current_steps":
|
127 |
-
{"current_steps":
|
128 |
-
{"current_steps":
|
129 |
-
{"current_steps":
|
130 |
-
{"current_steps":
|
131 |
-
{"current_steps":
|
132 |
-
{"current_steps":
|
133 |
-
{"current_steps":
|
134 |
-
{"current_steps":
|
135 |
-
{"current_steps":
|
136 |
-
{"current_steps":
|
137 |
-
{"current_steps":
|
138 |
-
{"current_steps":
|
139 |
-
{"current_steps": 139, "total_steps": 550, "loss": 0.4035, "lr": 7.444904972720803e-05, "epoch": 1.260180995475113, "percentage": 25.27, "elapsed_time": "3:47:20", "remaining_time": "11:12:13"}
|
140 |
-
{"current_steps": 140, "total_steps": 550, "loss": 0.4118, "lr": 7.431933652939909e-05, "epoch": 1.2692307692307692, "percentage": 25.45, "elapsed_time": "3:48:57", "remaining_time": "11:10:31"}
|
141 |
-
{"current_steps": 141, "total_steps": 550, "loss": 0.401, "lr": 7.418824095371895e-05, "epoch": 1.2782805429864252, "percentage": 25.64, "elapsed_time": "3:50:34", "remaining_time": "11:08:50"}
|
142 |
-
{"current_steps": 142, "total_steps": 550, "loss": 0.4099, "lr": 7.405576828067829e-05, "epoch": 1.2873303167420813, "percentage": 25.82, "elapsed_time": "3:52:11", "remaining_time": "11:07:08"}
|
143 |
-
{"current_steps": 143, "total_steps": 550, "loss": 0.4046, "lr": 7.392192384625704e-05, "epoch": 1.2963800904977376, "percentage": 26.0, "elapsed_time": "3:53:48", "remaining_time": "11:05:26"}
|
144 |
-
{"current_steps": 144, "total_steps": 550, "loss": 0.4053, "lr": 7.378671304168955e-05, "epoch": 1.3054298642533937, "percentage": 26.18, "elapsed_time": "3:55:25", "remaining_time": "11:03:45"}
|
145 |
-
{"current_steps": 145, "total_steps": 550, "loss": 0.4048, "lr": 7.365014131324725e-05, "epoch": 1.3144796380090498, "percentage": 26.36, "elapsed_time": "3:57:02", "remaining_time": "11:02:03"}
|
146 |
-
{"current_steps": 146, "total_steps": 550, "loss": 0.4052, "lr": 7.35122141620195e-05, "epoch": 1.3235294117647058, "percentage": 26.55, "elapsed_time": "3:58:38", "remaining_time": "11:00:22"}
|
147 |
-
{"current_steps": 147, "total_steps": 550, "loss": 0.3967, "lr": 7.337293714369182e-05, "epoch": 1.332579185520362, "percentage": 26.73, "elapsed_time": "4:00:15", "remaining_time": "10:58:40"}
|
148 |
-
{"current_steps": 148, "total_steps": 550, "loss": 0.403, "lr": 7.323231586832219e-05, "epoch": 1.3416289592760182, "percentage": 26.91, "elapsed_time": "4:01:52", "remaining_time": "10:57:00"}
|
149 |
-
{"current_steps": 149, "total_steps": 550, "loss": 0.3994, "lr": 7.30903560001151e-05, "epoch": 1.3506787330316743, "percentage": 27.09, "elapsed_time": "4:03:29", "remaining_time": "10:55:19"}
|
150 |
-
{"current_steps": 150, "total_steps": 550, "loss": 0.4047, "lr": 7.294706325719331e-05, "epoch": 1.3597285067873304, "percentage": 27.27, "elapsed_time": "4:05:06", "remaining_time": "10:53:38"}
|
151 |
-
{"current_steps": 151, "total_steps": 550, "loss": 0.4077, "lr": 7.280244341136765e-05, "epoch": 1.3687782805429864, "percentage": 27.45, "elapsed_time": "4:06:43", "remaining_time": "10:51:57"}
|
152 |
-
{"current_steps": 152, "total_steps": 550, "loss": 0.405, "lr": 7.26565022879044e-05, "epoch": 1.3778280542986425, "percentage": 27.64, "elapsed_time": "4:08:20", "remaining_time": "10:50:16"}
|
153 |
-
{"current_steps": 153, "total_steps": 550, "loss": 0.403, "lr": 7.250924576529072e-05, "epoch": 1.3868778280542986, "percentage": 27.82, "elapsed_time": "4:09:57", "remaining_time": "10:48:36"}
|
154 |
-
{"current_steps": 154, "total_steps": 550, "loss": 0.4056, "lr": 7.236067977499791e-05, "epoch": 1.3959276018099547, "percentage": 28.0, "elapsed_time": "4:11:34", "remaining_time": "10:46:55"}
|
155 |
-
{"current_steps": 155, "total_steps": 550, "loss": 0.4056, "lr": 7.221081030124235e-05, "epoch": 1.4049773755656108, "percentage": 28.18, "elapsed_time": "4:13:11", "remaining_time": "10:45:14"}
|
156 |
-
{"current_steps": 156, "total_steps": 550, "loss": 0.4043, "lr": 7.205964338074462e-05, "epoch": 1.4140271493212668, "percentage": 28.36, "elapsed_time": "4:14:48", "remaining_time": "10:43:33"}
|
157 |
-
{"current_steps": 157, "total_steps": 550, "loss": 0.4056, "lr": 7.190718510248622e-05, "epoch": 1.4230769230769231, "percentage": 28.55, "elapsed_time": "4:16:25", "remaining_time": "10:41:52"}
|
158 |
-
{"current_steps": 158, "total_steps": 550, "loss": 0.4053, "lr": 7.175344160746438e-05, "epoch": 1.4321266968325792, "percentage": 28.73, "elapsed_time": "4:18:02", "remaining_time": "10:40:11"}
|
159 |
-
{"current_steps": 159, "total_steps": 550, "loss": 0.3935, "lr": 7.159841908844465e-05, "epoch": 1.4411764705882353, "percentage": 28.91, "elapsed_time": "4:19:38", "remaining_time": "10:38:30"}
|
160 |
-
{"current_steps": 160, "total_steps": 550, "loss": 0.4012, "lr": 7.144212378971151e-05, "epoch": 1.4502262443438914, "percentage": 29.09, "elapsed_time": "4:21:15", "remaining_time": "10:36:49"}
|
161 |
-
{"current_steps": 161, "total_steps": 550, "loss": 0.3952, "lr": 7.128456200681678e-05, "epoch": 1.4592760180995474, "percentage": 29.27, "elapsed_time": "4:22:52", "remaining_time": "10:35:08"}
|
162 |
-
{"current_steps": 162, "total_steps": 550, "loss": 0.3905, "lr": 7.11257400863261e-05, "epoch": 1.4683257918552037, "percentage": 29.45, "elapsed_time": "4:24:29", "remaining_time": "10:33:28"}
|
163 |
-
{"current_steps": 163, "total_steps": 550, "loss": 0.3964, "lr": 7.096566442556331e-05, "epoch": 1.4773755656108598, "percentage": 29.64, "elapsed_time": "4:26:06", "remaining_time": "10:31:48"}
|
164 |
-
{"current_steps": 164, "total_steps": 550, "loss": 0.3949, "lr": 7.080434147235263e-05, "epoch": 1.4864253393665159, "percentage": 29.82, "elapsed_time": "4:27:43", "remaining_time": "10:30:07"}
|
165 |
-
{"current_steps": 165, "total_steps": 550, "loss": 0.4037, "lr": 7.064177772475912e-05, "epoch": 1.495475113122172, "percentage": 30.0, "elapsed_time": "4:29:20", "remaining_time": "10:28:27"}
|
166 |
-
{"current_steps": 166, "total_steps": 550, "loss": 0.4021, "lr": 7.047797973082684e-05, "epoch": 1.504524886877828, "percentage": 30.18, "elapsed_time": "4:30:57", "remaining_time": "10:26:47"}
|
167 |
-
{"current_steps": 167, "total_steps": 550, "loss": 0.3913, "lr": 7.031295408831508e-05, "epoch": 1.5135746606334841, "percentage": 30.36, "elapsed_time": "4:32:34", "remaining_time": "10:25:07"}
|
168 |
-
{"current_steps": 168, "total_steps": 550, "loss": 0.4031, "lr": 7.014670744443267e-05, "epoch": 1.5226244343891402, "percentage": 30.55, "elapsed_time": "4:34:11", "remaining_time": "10:23:27"}
|
169 |
-
{"current_steps": 169, "total_steps": 550, "loss": 0.3981, "lr": 6.997924649557017e-05, "epoch": 1.5316742081447963, "percentage": 30.73, "elapsed_time": "4:35:48", "remaining_time": "10:21:47"}
|
170 |
-
{"current_steps": 170, "total_steps": 550, "loss": 0.3992, "lr": 6.98105779870302e-05, "epoch": 1.5407239819004523, "percentage": 30.91, "elapsed_time": "4:37:25", "remaining_time": "10:20:07"}
|
171 |
-
{"current_steps": 171, "total_steps": 550, "loss": 0.3983, "lr": 6.964070871275567e-05, "epoch": 1.5497737556561086, "percentage": 31.09, "elapsed_time": "4:39:02", "remaining_time": "10:18:27"}
|
172 |
-
{"current_steps": 172, "total_steps": 550, "loss": 0.3993, "lr": 6.94696455150562e-05, "epoch": 1.5588235294117647, "percentage": 31.27, "elapsed_time": "4:40:39", "remaining_time": "10:16:47"}
|
173 |
-
{"current_steps": 173, "total_steps": 550, "loss": 0.3979, "lr": 6.929739528433244e-05, "epoch": 1.5678733031674208, "percentage": 31.45, "elapsed_time": "4:42:16", "remaining_time": "10:15:07"}
|
174 |
-
{"current_steps": 174, "total_steps": 550, "loss": 0.3976, "lr": 6.912396495879857e-05, "epoch": 1.5769230769230769, "percentage": 31.64, "elapsed_time": "4:43:53", "remaining_time": "10:13:27"}
|
175 |
-
{"current_steps": 175, "total_steps": 550, "loss": 0.3985, "lr": 6.89493615242028e-05, "epoch": 1.5859728506787332, "percentage": 31.82, "elapsed_time": "4:45:30", "remaining_time": "10:11:47"}
|
176 |
-
{"current_steps": 176, "total_steps": 550, "loss": 0.3956, "lr": 6.877359201354606e-05, "epoch": 1.5950226244343892, "percentage": 32.0, "elapsed_time": "4:47:07", "remaining_time": "10:10:07"}
|
177 |
-
{"current_steps": 177, "total_steps": 550, "loss": 0.3976, "lr": 6.859666350679854e-05, "epoch": 1.6040723981900453, "percentage": 32.18, "elapsed_time": "4:48:44", "remaining_time": "10:08:28"}
|
178 |
-
{"current_steps": 178, "total_steps": 550, "loss": 0.3924, "lr": 6.841858313061477e-05, "epoch": 1.6131221719457014, "percentage": 32.36, "elapsed_time": "4:50:21", "remaining_time": "10:06:48"}
|
179 |
-
{"current_steps": 179, "total_steps": 550, "loss": 0.3994, "lr": 6.823935805804626e-05, "epoch": 1.6221719457013575, "percentage": 32.55, "elapsed_time": "4:51:58", "remaining_time": "10:05:08"}
|
180 |
-
{"current_steps": 180, "total_steps": 550, "loss": 0.3899, "lr": 6.805899550825285e-05, "epoch": 1.6312217194570136, "percentage": 32.73, "elapsed_time": "4:53:34", "remaining_time": "10:03:28"}
|
181 |
-
{"current_steps": 181, "total_steps": 550, "loss": 0.3872, "lr": 6.787750274621175e-05, "epoch": 1.6402714932126696, "percentage": 32.91, "elapsed_time": "4:55:11", "remaining_time": "10:01:48"}
|
182 |
-
{"current_steps": 182, "total_steps": 550, "loss": 0.395, "lr": 6.769488708242492e-05, "epoch": 1.6493212669683257, "percentage": 33.09, "elapsed_time": "4:56:48", "remaining_time": "10:00:08"}
|
183 |
-
{"current_steps": 183, "total_steps": 550, "loss": 0.3936, "lr": 6.751115587262469e-05, "epoch": 1.6583710407239818, "percentage": 33.27, "elapsed_time": "4:58:25", "remaining_time": "9:58:29"}
|
184 |
-
{"current_steps": 184, "total_steps": 550, "loss": 0.3905, "lr": 6.732631651747739e-05, "epoch": 1.6674208144796379, "percentage": 33.45, "elapsed_time": "5:00:02", "remaining_time": "9:56:49"}
|
185 |
-
{"current_steps": 185, "total_steps": 550, "loss": 0.3936, "lr": 6.714037646228529e-05, "epoch": 1.6764705882352942, "percentage": 33.64, "elapsed_time": "5:01:39", "remaining_time": "9:55:10"}
|
186 |
-
{"current_steps": 186, "total_steps": 550, "loss": 0.3918, "lr": 6.695334319668672e-05, "epoch": 1.6855203619909502, "percentage": 33.82, "elapsed_time": "5:03:16", "remaining_time": "9:53:30"}
|
187 |
-
{"current_steps": 187, "total_steps": 550, "loss": 0.3964, "lr": 6.676522425435433e-05, "epoch": 1.6945701357466063, "percentage": 34.0, "elapsed_time": "5:04:53", "remaining_time": "9:51:51"}
|
188 |
-
{"current_steps": 188, "total_steps": 550, "loss": 0.3955, "lr": 6.65760272126917e-05, "epoch": 1.7036199095022626, "percentage": 34.18, "elapsed_time": "5:06:30", "remaining_time": "9:50:12"}
|
189 |
-
{"current_steps": 189, "total_steps": 550, "loss": 0.388, "lr": 6.638575969252806e-05, "epoch": 1.7126696832579187, "percentage": 34.36, "elapsed_time": "5:08:07", "remaining_time": "9:48:32"}
|
190 |
-
{"current_steps": 190, "total_steps": 550, "loss": 0.3943, "lr": 6.619442935781141e-05, "epoch": 1.7217194570135748, "percentage": 34.55, "elapsed_time": "5:09:44", "remaining_time": "9:46:53"}
|
191 |
-
{"current_steps": 191, "total_steps": 550, "loss": 0.3929, "lr": 6.600204391529971e-05, "epoch": 1.7307692307692308, "percentage": 34.73, "elapsed_time": "5:11:21", "remaining_time": "9:45:14"}
|
192 |
-
{"current_steps": 192, "total_steps": 550, "loss": 0.3929, "lr": 6.580861111425053e-05, "epoch": 1.739819004524887, "percentage": 34.91, "elapsed_time": "5:12:58", "remaining_time": "9:43:34"}
|
193 |
-
{"current_steps": 193, "total_steps": 550, "loss": 0.3899, "lr": 6.56141387461089e-05, "epoch": 1.748868778280543, "percentage": 35.09, "elapsed_time": "5:14:35", "remaining_time": "9:41:55"}
|
194 |
-
{"current_steps": 194, "total_steps": 550, "loss": 0.395, "lr": 6.541863464419346e-05, "epoch": 1.757918552036199, "percentage": 35.27, "elapsed_time": "5:16:12", "remaining_time": "9:40:16"}
|
195 |
-
{"current_steps": 195, "total_steps": 550, "loss": 0.3845, "lr": 6.52221066833809e-05, "epoch": 1.7669683257918551, "percentage": 35.45, "elapsed_time": "5:17:49", "remaining_time": "9:38:36"}
|
196 |
-
{"current_steps": 196, "total_steps": 550, "loss": 0.39, "lr": 6.502456277978887e-05, "epoch": 1.7760180995475112, "percentage": 35.64, "elapsed_time": "5:19:26", "remaining_time": "9:36:57"}
|
197 |
-
{"current_steps": 197, "total_steps": 550, "loss": 0.3878, "lr": 6.482601089045696e-05, "epoch": 1.7850678733031673, "percentage": 35.82, "elapsed_time": "5:21:03", "remaining_time": "9:35:18"}
|
198 |
-
{"current_steps": 198, "total_steps": 550, "loss": 0.3827, "lr": 6.462645901302633e-05, "epoch": 1.7941176470588234, "percentage": 36.0, "elapsed_time": "5:22:40", "remaining_time": "9:33:38"}
|
199 |
-
{"current_steps": 199, "total_steps": 550, "loss": 0.383, "lr": 6.442591518541753e-05, "epoch": 1.8031674208144797, "percentage": 36.18, "elapsed_time": "5:24:17", "remaining_time": "9:31:59"}
|
200 |
-
{"current_steps": 200, "total_steps": 550, "loss": 0.3867, "lr": 6.422438748550667e-05, "epoch": 1.8122171945701357, "percentage": 36.36, "elapsed_time": "5:25:54", "remaining_time": "9:30:20"}
|
201 |
-
{"current_steps": 201, "total_steps": 550, "loss": 0.3906, "lr": 6.402188403080013e-05, "epoch": 1.8212669683257918, "percentage": 36.55, "elapsed_time": "5:27:31", "remaining_time": "9:28:41"}
|
202 |
-
{"current_steps": 202, "total_steps": 550, "loss": 0.3856, "lr": 6.381841297810753e-05, "epoch": 1.8303167420814481, "percentage": 36.73, "elapsed_time": "5:29:08", "remaining_time": "9:27:02"}
|
203 |
-
{"current_steps": 203, "total_steps": 550, "loss": 0.3893, "lr": 6.361398252321321e-05, "epoch": 1.8393665158371042, "percentage": 36.91, "elapsed_time": "5:30:45", "remaining_time": "9:25:23"}
|
204 |
-
{"current_steps": 204, "total_steps": 550, "loss": 0.3851, "lr": 6.340860090054608e-05, "epoch": 1.8484162895927603, "percentage": 37.09, "elapsed_time": "5:32:22", "remaining_time": "9:23:44"}
|
205 |
-
{"current_steps": 205, "total_steps": 550, "loss": 0.3868, "lr": 6.320227638284793e-05, "epoch": 1.8574660633484164, "percentage": 37.27, "elapsed_time": "5:33:59", "remaining_time": "9:22:05"}
|
206 |
-
{"current_steps": 206, "total_steps": 550, "loss": 0.3921, "lr": 6.29950172808403e-05, "epoch": 1.8665158371040724, "percentage": 37.45, "elapsed_time": "5:35:36", "remaining_time": "9:20:25"}
|
207 |
-
{"current_steps": 207, "total_steps": 550, "loss": 0.3849, "lr": 6.278683194288956e-05, "epoch": 1.8755656108597285, "percentage": 37.64, "elapsed_time": "5:37:13", "remaining_time": "9:18:46"}
|
208 |
-
{"current_steps": 208, "total_steps": 550, "loss": 0.3904, "lr": 6.257772875467078e-05, "epoch": 1.8846153846153846, "percentage": 37.82, "elapsed_time": "5:38:51", "remaining_time": "9:17:09"}
|
209 |
-
{"current_steps": 209, "total_steps": 550, "loss": 0.3918, "lr": 6.236771613882987e-05, "epoch": 1.8936651583710407, "percentage": 38.0, "elapsed_time": "5:40:28", "remaining_time": "9:15:30"}
|
210 |
-
{"current_steps": 210, "total_steps": 550, "loss": 0.3871, "lr": 6.215680255464442e-05, "epoch": 1.9027149321266967, "percentage": 38.18, "elapsed_time": "5:42:05", "remaining_time": "9:13:51"}
|
211 |
-
{"current_steps": 211, "total_steps": 550, "loss": 0.3898, "lr": 6.194499649768281e-05, "epoch": 1.9117647058823528, "percentage": 38.36, "elapsed_time": "5:43:42", "remaining_time": "9:12:12"}
|
212 |
-
{"current_steps": 212, "total_steps": 550, "loss": 0.3843, "lr": 6.173230649946213e-05, "epoch": 1.9208144796380089, "percentage": 38.55, "elapsed_time": "5:45:19", "remaining_time": "9:10:33"}
|
213 |
-
{"current_steps": 213, "total_steps": 550, "loss": 0.3831, "lr": 6.15187411271045e-05, "epoch": 1.9298642533936652, "percentage": 38.73, "elapsed_time": "5:46:56", "remaining_time": "9:08:55"}
|
214 |
-
{"current_steps": 214, "total_steps": 550, "loss": 0.3857, "lr": 6.130430898299199e-05, "epoch": 1.9389140271493213, "percentage": 38.91, "elapsed_time": "5:48:33", "remaining_time": "9:07:16"}
|
215 |
-
{"current_steps": 215, "total_steps": 550, "loss": 0.3873, "lr": 6.10890187044201e-05, "epoch": 1.9479638009049773, "percentage": 39.09, "elapsed_time": "5:50:10", "remaining_time": "9:05:37"}
|
216 |
-
{"current_steps": 216, "total_steps": 550, "loss": 0.3859, "lr": 6.087287896324984e-05, "epoch": 1.9570135746606336, "percentage": 39.27, "elapsed_time": "5:51:47", "remaining_time": "9:03:58"}
|
217 |
-
{"current_steps": 217, "total_steps": 550, "loss": 0.3913, "lr": 6.0655898465558484e-05, "epoch": 1.9660633484162897, "percentage": 39.45, "elapsed_time": "5:53:24", "remaining_time": "9:02:19"}
|
218 |
-
{"current_steps": 218, "total_steps": 550, "loss": 0.3829, "lr": 6.043808595128883e-05, "epoch": 1.9751131221719458, "percentage": 39.64, "elapsed_time": "5:55:02", "remaining_time": "9:00:41"}
|
219 |
-
{"current_steps": 219, "total_steps": 550, "loss": 0.3918, "lr": 6.021945019389719e-05, "epoch": 1.9841628959276019, "percentage": 39.82, "elapsed_time": "5:56:39", "remaining_time": "8:59:03"}
|
220 |
-
{"current_steps": 220, "total_steps": 550, "loss": 0.385, "lr": 6.000000000000001e-05, "epoch": 1.993212669683258, "percentage": 40.0, "elapsed_time": "5:58:16", "remaining_time": "8:57:24"}
|
221 |
-
{"current_steps": 221, "total_steps": 550, "loss": 0.6705, "lr": 5.977974420901908e-05, "epoch": 2.004524886877828, "percentage": 40.18, "elapsed_time": "6:01:27", "remaining_time": "8:58:05"}
|
222 |
-
{"current_steps": 222, "total_steps": 550, "loss": 0.364, "lr": 5.955869169282556e-05, "epoch": 2.013574660633484, "percentage": 40.36, "elapsed_time": "6:03:03", "remaining_time": "8:56:25"}
|
223 |
-
{"current_steps": 223, "total_steps": 550, "loss": 0.3695, "lr": 5.9336851355382557e-05, "epoch": 2.02262443438914, "percentage": 40.55, "elapsed_time": "6:04:41", "remaining_time": "8:54:46"}
|
224 |
-
{"current_steps": 224, "total_steps": 550, "loss": 0.3643, "lr": 5.911423213238653e-05, "epoch": 2.0316742081447963, "percentage": 40.73, "elapsed_time": "6:06:18", "remaining_time": "8:53:06"}
|
225 |
-
{"current_steps": 225, "total_steps": 550, "loss": 0.3601, "lr": 5.889084299090732e-05, "epoch": 2.0407239819004523, "percentage": 40.91, "elapsed_time": "6:07:55", "remaining_time": "8:51:27"}
|
226 |
-
{"current_steps": 226, "total_steps": 550, "loss": 0.3645, "lr": 5.866669292902695e-05, "epoch": 2.0497737556561084, "percentage": 41.09, "elapsed_time": "6:09:32", "remaining_time": "8:49:47"}
|
227 |
-
{"current_steps": 227, "total_steps": 550, "loss": 0.363, "lr": 5.844179097547725e-05, "epoch": 2.0588235294117645, "percentage": 41.27, "elapsed_time": "6:11:09", "remaining_time": "8:48:07"}
|
228 |
-
{"current_steps": 228, "total_steps": 550, "loss": 0.3593, "lr": 5.821614618927613e-05, "epoch": 2.067873303167421, "percentage": 41.45, "elapsed_time": "6:12:46", "remaining_time": "8:46:28"}
|
229 |
-
{"current_steps": 229, "total_steps": 550, "loss": 0.3647, "lr": 5.798976765936264e-05, "epoch": 2.076923076923077, "percentage": 41.64, "elapsed_time": "6:14:23", "remaining_time": "8:44:48"}
|
230 |
-
{"current_steps": 230, "total_steps": 550, "loss": 0.3587, "lr": 5.776266450423097e-05, "epoch": 2.085972850678733, "percentage": 41.82, "elapsed_time": "6:16:01", "remaining_time": "8:43:09"}
|
231 |
-
{"current_steps": 231, "total_steps": 550, "loss": 0.3627, "lr": 5.75348458715631e-05, "epoch": 2.0950226244343892, "percentage": 42.0, "elapsed_time": "6:17:38", "remaining_time": "8:41:29"}
|
232 |
-
{"current_steps": 232, "total_steps": 550, "loss": 0.3541, "lr": 5.7306320937860336e-05, "epoch": 2.1040723981900453, "percentage": 42.18, "elapsed_time": "6:19:15", "remaining_time": "8:39:50"}
|
233 |
-
{"current_steps": 233, "total_steps": 550, "loss": 0.3651, "lr": 5.7077098908073676e-05, "epoch": 2.1131221719457014, "percentage": 42.36, "elapsed_time": "6:20:52", "remaining_time": "8:38:11"}
|
234 |
-
{"current_steps": 234, "total_steps": 550, "loss": 0.3556, "lr": 5.684718901523307e-05, "epoch": 2.1221719457013575, "percentage": 42.55, "elapsed_time": "6:22:30", "remaining_time": "8:36:32"}
|
235 |
-
{"current_steps": 235, "total_steps": 550, "loss": 0.3596, "lr": 5.661660052007547e-05, "epoch": 2.1312217194570136, "percentage": 42.73, "elapsed_time": "6:24:07", "remaining_time": "8:34:53"}
|
236 |
-
{"current_steps": 236, "total_steps": 550, "loss": 0.3549, "lr": 5.6385342710671815e-05, "epoch": 2.1402714932126696, "percentage": 42.91, "elapsed_time": "6:25:44", "remaining_time": "8:33:13"}
|
237 |
-
{"current_steps": 237, "total_steps": 550, "loss": 0.3576, "lr": 5.6153424902053e-05, "epoch": 2.1493212669683257, "percentage": 43.09, "elapsed_time": "6:27:20", "remaining_time": "8:31:33"}
|
238 |
-
{"current_steps": 238, "total_steps": 550, "loss": 0.3577, "lr": 5.59208564358345e-05, "epoch": 2.158371040723982, "percentage": 43.27, "elapsed_time": "6:28:57", "remaining_time": "8:29:54"}
|
239 |
-
{"current_steps": 239, "total_steps": 550, "loss": 0.3656, "lr": 5.568764667984022e-05, "epoch": 2.167420814479638, "percentage": 43.45, "elapsed_time": "6:30:34", "remaining_time": "8:28:14"}
|
240 |
-
{"current_steps": 240, "total_steps": 550, "loss": 0.3534, "lr": 5.5453805027725145e-05, "epoch": 2.176470588235294, "percentage": 43.64, "elapsed_time": "6:32:11", "remaining_time": "8:26:35"}
|
241 |
-
{"current_steps": 241, "total_steps": 550, "loss": 0.3534, "lr": 5.521934089859692e-05, "epoch": 2.1855203619909505, "percentage": 43.82, "elapsed_time": "6:33:48", "remaining_time": "8:24:55"}
|
242 |
-
{"current_steps": 242, "total_steps": 550, "loss": 0.3579, "lr": 5.4984263736636494e-05, "epoch": 2.1945701357466065, "percentage": 44.0, "elapsed_time": "6:35:25", "remaining_time": "8:23:16"}
|
243 |
-
{"current_steps": 243, "total_steps": 550, "loss": 0.359, "lr": 5.4748583010717636e-05, "epoch": 2.2036199095022626, "percentage": 44.18, "elapsed_time": "6:37:02", "remaining_time": "8:21:36"}
|
244 |
-
{"current_steps": 244, "total_steps": 550, "loss": 0.3627, "lr": 5.451230821402564e-05, "epoch": 2.2126696832579187, "percentage": 44.36, "elapsed_time": "6:38:39", "remaining_time": "8:19:57"}
|
245 |
-
{"current_steps": 245, "total_steps": 550, "loss": 0.3558, "lr": 5.427544886367488e-05, "epoch": 2.2217194570135748, "percentage": 44.55, "elapsed_time": "6:40:16", "remaining_time": "8:18:18"}
|
246 |
-
{"current_steps": 246, "total_steps": 550, "loss": 0.3577, "lr": 5.403801450032544e-05, "epoch": 2.230769230769231, "percentage": 44.73, "elapsed_time": "6:41:54", "remaining_time": "8:16:39"}
|
247 |
-
{"current_steps": 247, "total_steps": 550, "loss": 0.3627, "lr": 5.380001468779883e-05, "epoch": 2.239819004524887, "percentage": 44.91, "elapsed_time": "6:43:31", "remaining_time": "8:15:00"}
|
248 |
-
{"current_steps": 248, "total_steps": 550, "loss": 0.3583, "lr": 5.356145901269282e-05, "epoch": 2.248868778280543, "percentage": 45.09, "elapsed_time": "6:45:08", "remaining_time": "8:13:21"}
|
249 |
-
{"current_steps": 249, "total_steps": 550, "loss": 0.3612, "lr": 5.3322357083995235e-05, "epoch": 2.257918552036199, "percentage": 45.27, "elapsed_time": "6:46:45", "remaining_time": "8:11:42"}
|
250 |
-
{"current_steps": 250, "total_steps": 550, "loss": 0.354, "lr": 5.3082718532696874e-05, "epoch": 2.266968325791855, "percentage": 45.45, "elapsed_time": "6:48:23", "remaining_time": "8:10:03"}
|
251 |
-
{"current_steps": 251, "total_steps": 550, "loss": 0.3528, "lr": 5.284255301140364e-05, "epoch": 2.276018099547511, "percentage": 45.64, "elapsed_time": "6:50:00", "remaining_time": "8:08:24"}
|
252 |
-
{"current_steps": 252, "total_steps": 550, "loss": 0.3504, "lr": 5.2601870193947716e-05, "epoch": 2.2850678733031673, "percentage": 45.82, "elapsed_time": "6:51:37", "remaining_time": "8:06:46"}
|
253 |
-
{"current_steps": 253, "total_steps": 550, "loss": 0.3527, "lr": 5.23606797749979e-05, "epoch": 2.2941176470588234, "percentage": 46.0, "elapsed_time": "6:53:14", "remaining_time": "8:05:07"}
|
254 |
-
{"current_steps": 254, "total_steps": 550, "loss": 0.3545, "lr": 5.21189914696691e-05, "epoch": 2.3031674208144794, "percentage": 46.18, "elapsed_time": "6:54:52", "remaining_time": "8:03:28"}
|
255 |
-
{"current_steps": 255, "total_steps": 550, "loss": 0.3525, "lr": 5.1876815013131e-05, "epoch": 2.3122171945701355, "percentage": 46.36, "elapsed_time": "6:56:29", "remaining_time": "8:01:49"}
|
256 |
-
{"current_steps": 256, "total_steps": 550, "loss": 0.3561, "lr": 5.163416016021597e-05, "epoch": 2.321266968325792, "percentage": 46.55, "elapsed_time": "6:58:06", "remaining_time": "8:00:10"}
|
257 |
-
{"current_steps": 257, "total_steps": 550, "loss": 0.3515, "lr": 5.1391036685026093e-05, "epoch": 2.330316742081448, "percentage": 46.73, "elapsed_time": "6:59:44", "remaining_time": "7:58:31"}
|
258 |
-
{"current_steps": 258, "total_steps": 550, "loss": 0.3513, "lr": 5.114745438053952e-05, "epoch": 2.339366515837104, "percentage": 46.91, "elapsed_time": "7:01:21", "remaining_time": "7:56:52"}
|
259 |
-
{"current_steps": 259, "total_steps": 550, "loss": 0.3557, "lr": 5.0903423058215925e-05, "epoch": 2.3484162895927603, "percentage": 47.09, "elapsed_time": "7:02:58", "remaining_time": "7:55:13"}
|
260 |
-
{"current_steps": 260, "total_steps": 550, "loss": 0.3503, "lr": 5.06589525476014e-05, "epoch": 2.3574660633484164, "percentage": 47.27, "elapsed_time": "7:04:35", "remaining_time": "7:53:34"}
|
261 |
-
{"current_steps": 261, "total_steps": 550, "loss": 0.3568, "lr": 5.0414052695932486e-05, "epoch": 2.3665158371040724, "percentage": 47.45, "elapsed_time": "7:06:12", "remaining_time": "7:51:55"}
|
262 |
-
{"current_steps": 262, "total_steps": 550, "loss": 0.3537, "lr": 5.016873336773949e-05, "epoch": 2.3755656108597285, "percentage": 47.64, "elapsed_time": "7:07:50", "remaining_time": "7:50:17"}
|
263 |
-
{"current_steps": 263, "total_steps": 550, "loss": 0.3587, "lr": 4.992300444444916e-05, "epoch": 2.3846153846153846, "percentage": 47.82, "elapsed_time": "7:09:27", "remaining_time": "7:48:39"}
|
264 |
-
{"current_steps": 264, "total_steps": 550, "loss": 0.3544, "lr": 4.967687582398671e-05, "epoch": 2.3936651583710407, "percentage": 48.0, "elapsed_time": "7:11:05", "remaining_time": "7:47:00"}
|
265 |
-
{"current_steps": 265, "total_steps": 550, "loss": 0.3553, "lr": 4.94303574203771e-05, "epoch": 2.4027149321266967, "percentage": 48.18, "elapsed_time": "7:12:42", "remaining_time": "7:45:21"}
|
266 |
-
{"current_steps": 266, "total_steps": 550, "loss": 0.3516, "lr": 4.9183459163345644e-05, "epoch": 2.411764705882353, "percentage": 48.36, "elapsed_time": "7:14:19", "remaining_time": "7:43:42"}
|
267 |
-
{"current_steps": 267, "total_steps": 550, "loss": 0.3539, "lr": 4.893619099791817e-05, "epoch": 2.420814479638009, "percentage": 48.55, "elapsed_time": "7:15:56", "remaining_time": "7:42:03"}
|
268 |
-
{"current_steps": 268, "total_steps": 550, "loss": 0.3588, "lr": 4.868856288402032e-05, "epoch": 2.4298642533936654, "percentage": 48.73, "elapsed_time": "7:17:33", "remaining_time": "7:40:24"}
|
269 |
-
{"current_steps": 269, "total_steps": 550, "loss": 0.3543, "lr": 4.8440584796076395e-05, "epoch": 2.4389140271493215, "percentage": 48.91, "elapsed_time": "7:19:10", "remaining_time": "7:38:46"}
|
270 |
-
{"current_steps": 270, "total_steps": 550, "loss": 0.3601, "lr": 4.819226672260763e-05, "epoch": 2.4479638009049776, "percentage": 49.09, "elapsed_time": "7:20:48", "remaining_time": "7:37:07"}
|
271 |
-
{"current_steps": 271, "total_steps": 550, "loss": 0.3587, "lr": 4.794361866582982e-05, "epoch": 2.4570135746606336, "percentage": 49.27, "elapsed_time": "7:22:25", "remaining_time": "7:35:28"}
|
272 |
-
{"current_steps": 272, "total_steps": 550, "loss": 0.3558, "lr": 4.7694650641250446e-05, "epoch": 2.4660633484162897, "percentage": 49.45, "elapsed_time": "7:24:02", "remaining_time": "7:33:50"}
|
273 |
-
{"current_steps": 273, "total_steps": 550, "loss": 0.3535, "lr": 4.7445372677265205e-05, "epoch": 2.475113122171946, "percentage": 49.64, "elapsed_time": "7:25:39", "remaining_time": "7:32:11"}
|
274 |
-
{"current_steps": 274, "total_steps": 550, "loss": 0.3584, "lr": 4.719579481475416e-05, "epoch": 2.484162895927602, "percentage": 49.82, "elapsed_time": "7:27:16", "remaining_time": "7:30:32"}
|
275 |
-
{"current_steps": 275, "total_steps": 550, "loss": 0.3555, "lr": 4.694592710667723e-05, "epoch": 2.493212669683258, "percentage": 50.0, "elapsed_time": "7:28:53", "remaining_time": "7:28:53"}
|
276 |
-
{"current_steps": 276, "total_steps": 550, "loss": 0.3563, "lr": 4.6695779617669236e-05, "epoch": 2.502262443438914, "percentage": 50.18, "elapsed_time": "7:30:30", "remaining_time": "7:27:14"}
|
277 |
-
{"current_steps": 277, "total_steps": 550, "loss": 0.359, "lr": 4.6445362423634574e-05, "epoch": 2.51131221719457, "percentage": 50.36, "elapsed_time": "7:32:07", "remaining_time": "7:25:36"}
|
278 |
-
{"current_steps": 278, "total_steps": 550, "loss": 0.3524, "lr": 4.61946856113413e-05, "epoch": 2.520361990950226, "percentage": 50.55, "elapsed_time": "7:33:44", "remaining_time": "7:23:57"}
|
279 |
-
{"current_steps": 279, "total_steps": 550, "loss": 0.3517, "lr": 4.594375927801487e-05, "epoch": 2.5294117647058822, "percentage": 50.73, "elapsed_time": "7:35:21", "remaining_time": "7:22:18"}
|
280 |
-
{"current_steps": 280, "total_steps": 550, "loss": 0.3599, "lr": 4.5692593530931416e-05, "epoch": 2.5384615384615383, "percentage": 50.91, "elapsed_time": "7:36:58", "remaining_time": "7:20:39"}
|
281 |
-
{"current_steps": 281, "total_steps": 550, "loss": 0.3557, "lr": 4.5441198487010574e-05, "epoch": 2.5475113122171944, "percentage": 51.09, "elapsed_time": "7:38:35", "remaining_time": "7:19:00"}
|
282 |
-
{"current_steps": 282, "total_steps": 550, "loss": 0.351, "lr": 4.5189584272408074e-05, "epoch": 2.5565610859728505, "percentage": 51.27, "elapsed_time": "7:40:12", "remaining_time": "7:17:21"}
|
283 |
-
{"current_steps": 283, "total_steps": 550, "loss": 0.3559, "lr": 4.493776102210779e-05, "epoch": 2.5656108597285066, "percentage": 51.45, "elapsed_time": "7:41:49", "remaining_time": "7:15:42"}
|
284 |
-
{"current_steps": 284, "total_steps": 550, "loss": 0.3565, "lr": 4.468573887951354e-05, "epoch": 2.5746606334841626, "percentage": 51.64, "elapsed_time": "7:43:26", "remaining_time": "7:14:03"}
|
285 |
-
{"current_steps": 285, "total_steps": 550, "loss": 0.3532, "lr": 4.4433527996040443e-05, "epoch": 2.583710407239819, "percentage": 51.82, "elapsed_time": "7:45:03", "remaining_time": "7:12:25"}
|
286 |
-
{"current_steps": 286, "total_steps": 550, "loss": 0.3559, "lr": 4.418113853070614e-05, "epoch": 2.5927601809954752, "percentage": 52.0, "elapsed_time": "7:46:40", "remaining_time": "7:10:46"}
|
287 |
-
{"current_steps": 287, "total_steps": 550, "loss": 0.3595, "lr": 4.392858064972149e-05, "epoch": 2.6018099547511313, "percentage": 52.18, "elapsed_time": "7:48:17", "remaining_time": "7:09:07"}
|
288 |
-
{"current_steps": 288, "total_steps": 550, "loss": 0.354, "lr": 4.3675864526081106e-05, "epoch": 2.6108597285067874, "percentage": 52.36, "elapsed_time": "7:49:54", "remaining_time": "7:07:28"}
|
289 |
-
{"current_steps": 289, "total_steps": 550, "loss": 0.3517, "lr": 4.34230003391536e-05, "epoch": 2.6199095022624435, "percentage": 52.55, "elapsed_time": "7:51:31", "remaining_time": "7:05:50"}
|
290 |
-
{"current_steps": 290, "total_steps": 550, "loss": 0.3532, "lr": 4.316999827427154e-05, "epoch": 2.6289592760180995, "percentage": 52.73, "elapsed_time": "7:53:08", "remaining_time": "7:04:11"}
|
291 |
-
{"current_steps": 291, "total_steps": 550, "loss": 0.3576, "lr": 4.2916868522321235e-05, "epoch": 2.6380090497737556, "percentage": 52.91, "elapsed_time": "7:54:45", "remaining_time": "7:02:32"}
|
292 |
-
{"current_steps": 292, "total_steps": 550, "loss": 0.3591, "lr": 4.266362127933216e-05, "epoch": 2.6470588235294117, "percentage": 53.09, "elapsed_time": "7:56:22", "remaining_time": "7:00:54"}
|
293 |
-
{"current_steps": 293, "total_steps": 550, "loss": 0.3528, "lr": 4.2410266746066345e-05, "epoch": 2.6561085972850678, "percentage": 53.27, "elapsed_time": "7:57:59", "remaining_time": "6:59:15"}
|
294 |
-
{"current_steps": 294, "total_steps": 550, "loss": 0.359, "lr": 4.215681512760744e-05, "epoch": 2.665158371040724, "percentage": 53.45, "elapsed_time": "7:59:36", "remaining_time": "6:57:36"}
|
295 |
-
{"current_steps": 295, "total_steps": 550, "loss": 0.3541, "lr": 4.19032766329497e-05, "epoch": 2.6742081447963804, "percentage": 53.64, "elapsed_time": "8:01:13", "remaining_time": "6:55:58"}
|
296 |
-
{"current_steps": 296, "total_steps": 550, "loss": 0.3533, "lr": 4.1649661474586694e-05, "epoch": 2.6832579185520364, "percentage": 53.82, "elapsed_time": "8:02:50", "remaining_time": "6:54:19"}
|
297 |
-
{"current_steps": 297, "total_steps": 550, "loss": 0.3597, "lr": 4.139597986810005e-05, "epoch": 2.6923076923076925, "percentage": 54.0, "elapsed_time": "8:04:27", "remaining_time": "6:52:40"}
|
298 |
-
{"current_steps": 298, "total_steps": 550, "loss": 0.3506, "lr": 4.114224203174785e-05, "epoch": 2.7013574660633486, "percentage": 54.18, "elapsed_time": "8:06:04", "remaining_time": "6:51:02"}
|
299 |
-
{"current_steps": 299, "total_steps": 550, "loss": 0.3556, "lr": 4.0888458186053184e-05, "epoch": 2.7104072398190047, "percentage": 54.36, "elapsed_time": "8:07:41", "remaining_time": "6:49:23"}
|
300 |
-
{"current_steps": 300, "total_steps": 550, "loss": 0.3529, "lr": 4.063463855339232e-05, "epoch": 2.7194570135746607, "percentage": 54.55, "elapsed_time": "8:09:17", "remaining_time": "6:47:44"}
|
301 |
-
{"current_steps": 301, "total_steps": 550, "loss": 0.3482, "lr": 4.0380793357583076e-05, "epoch": 2.728506787330317, "percentage": 54.73, "elapsed_time": "8:10:54", "remaining_time": "6:46:06"}
|
302 |
-
{"current_steps": 302, "total_steps": 550, "loss": 0.3581, "lr": 4.012693282347289e-05, "epoch": 2.737556561085973, "percentage": 54.91, "elapsed_time": "8:12:31", "remaining_time": "6:44:27"}
|
303 |
-
{"current_steps": 303, "total_steps": 550, "loss": 0.3568, "lr": 3.9873067176527114e-05, "epoch": 2.746606334841629, "percentage": 55.09, "elapsed_time": "8:14:09", "remaining_time": "6:42:49"}
|
304 |
-
{"current_steps": 304, "total_steps": 550, "loss": 0.3548, "lr": 3.961920664241694e-05, "epoch": 2.755656108597285, "percentage": 55.27, "elapsed_time": "8:15:46", "remaining_time": "6:41:10"}
|
305 |
-
{"current_steps": 305, "total_steps": 550, "loss": 0.3547, "lr": 3.9365361446607684e-05, "epoch": 2.764705882352941, "percentage": 55.45, "elapsed_time": "8:17:23", "remaining_time": "6:39:32"}
|
306 |
-
{"current_steps": 306, "total_steps": 550, "loss": 0.3602, "lr": 3.911154181394682e-05, "epoch": 2.773755656108597, "percentage": 55.64, "elapsed_time": "8:19:00", "remaining_time": "6:37:53"}
|
307 |
-
{"current_steps": 307, "total_steps": 550, "loss": 0.3562, "lr": 3.885775796825216e-05, "epoch": 2.7828054298642533, "percentage": 55.82, "elapsed_time": "8:20:37", "remaining_time": "6:36:15"}
|
308 |
-
{"current_steps": 308, "total_steps": 550, "loss": 0.3479, "lr": 3.860402013189998e-05, "epoch": 2.7918552036199094, "percentage": 56.0, "elapsed_time": "8:22:14", "remaining_time": "6:34:36"}
|
309 |
-
{"current_steps": 309, "total_steps": 550, "loss": 0.3572, "lr": 3.835033852541332e-05, "epoch": 2.8009049773755654, "percentage": 56.18, "elapsed_time": "8:23:51", "remaining_time": "6:32:58"}
|
310 |
-
{"current_steps": 310, "total_steps": 550, "loss": 0.3519, "lr": 3.809672336705031e-05, "epoch": 2.8099547511312215, "percentage": 56.36, "elapsed_time": "8:25:28", "remaining_time": "6:31:19"}
|
311 |
-
{"current_steps": 311, "total_steps": 550, "loss": 0.3559, "lr": 3.784318487239257e-05, "epoch": 2.8190045248868776, "percentage": 56.55, "elapsed_time": "8:27:05", "remaining_time": "6:29:41"}
|
312 |
-
{"current_steps": 312, "total_steps": 550, "loss": 0.3504, "lr": 3.758973325393367e-05, "epoch": 2.8280542986425337, "percentage": 56.73, "elapsed_time": "8:28:42", "remaining_time": "6:28:02"}
|
313 |
-
{"current_steps": 313, "total_steps": 550, "loss": 0.3569, "lr": 3.7336378720667846e-05, "epoch": 2.83710407239819, "percentage": 56.91, "elapsed_time": "8:30:18", "remaining_time": "6:26:24"}
|
314 |
-
{"current_steps": 314, "total_steps": 550, "loss": 0.3559, "lr": 3.708313147767878e-05, "epoch": 2.8461538461538463, "percentage": 57.09, "elapsed_time": "8:31:55", "remaining_time": "6:24:45"}
|
315 |
-
{"current_steps": 315, "total_steps": 550, "loss": 0.3516, "lr": 3.683000172572846e-05, "epoch": 2.8552036199095023, "percentage": 57.27, "elapsed_time": "8:33:32", "remaining_time": "6:23:07"}
|
316 |
-
{"current_steps": 316, "total_steps": 550, "loss": 0.3575, "lr": 3.657699966084642e-05, "epoch": 2.8642533936651584, "percentage": 57.45, "elapsed_time": "8:35:09", "remaining_time": "6:21:28"}
|
317 |
-
{"current_steps": 317, "total_steps": 550, "loss": 0.3579, "lr": 3.632413547391891e-05, "epoch": 2.8733031674208145, "percentage": 57.64, "elapsed_time": "8:36:46", "remaining_time": "6:19:50"}
|
318 |
-
{"current_steps": 318, "total_steps": 550, "loss": 0.3486, "lr": 3.6071419350278515e-05, "epoch": 2.8823529411764706, "percentage": 57.82, "elapsed_time": "8:38:23", "remaining_time": "6:18:12"}
|
319 |
-
{"current_steps": 319, "total_steps": 550, "loss": 0.3468, "lr": 3.581886146929387e-05, "epoch": 2.8914027149321266, "percentage": 58.0, "elapsed_time": "8:40:00", "remaining_time": "6:16:33"}
|
320 |
-
{"current_steps": 320, "total_steps": 550, "loss": 0.3526, "lr": 3.556647200395956e-05, "epoch": 2.9004524886877827, "percentage": 58.18, "elapsed_time": "8:41:37", "remaining_time": "6:14:55"}
|
321 |
-
{"current_steps": 321, "total_steps": 550, "loss": 0.3498, "lr": 3.5314261120486474e-05, "epoch": 2.909502262443439, "percentage": 58.36, "elapsed_time": "8:43:14", "remaining_time": "6:13:16"}
|
322 |
-
{"current_steps": 322, "total_steps": 550, "loss": 0.353, "lr": 3.5062238977892214e-05, "epoch": 2.918552036199095, "percentage": 58.55, "elapsed_time": "8:44:51", "remaining_time": "6:11:38"}
|
323 |
-
{"current_steps": 323, "total_steps": 550, "loss": 0.3551, "lr": 3.481041572759193e-05, "epoch": 2.9276018099547514, "percentage": 58.73, "elapsed_time": "8:46:29", "remaining_time": "6:10:00"}
|
324 |
-
{"current_steps": 324, "total_steps": 550, "loss": 0.3555, "lr": 3.4558801512989446e-05, "epoch": 2.9366515837104075, "percentage": 58.91, "elapsed_time": "8:48:06", "remaining_time": "6:08:22"}
|
325 |
-
{"current_steps": 325, "total_steps": 550, "loss": 0.3553, "lr": 3.4307406469068604e-05, "epoch": 2.9457013574660635, "percentage": 59.09, "elapsed_time": "8:49:43", "remaining_time": "6:06:43"}
|
326 |
-
{"current_steps": 326, "total_steps": 550, "loss": 0.3574, "lr": 3.405624072198514e-05, "epoch": 2.9547511312217196, "percentage": 59.27, "elapsed_time": "8:51:20", "remaining_time": "6:05:05"}
|
327 |
-
{"current_steps": 327, "total_steps": 550, "loss": 0.3517, "lr": 3.3805314388658714e-05, "epoch": 2.9638009049773757, "percentage": 59.45, "elapsed_time": "8:52:57", "remaining_time": "6:03:27"}
|
328 |
-
{"current_steps": 328, "total_steps": 550, "loss": 0.3449, "lr": 3.3554637576365446e-05, "epoch": 2.9728506787330318, "percentage": 59.64, "elapsed_time": "8:54:34", "remaining_time": "6:01:49"}
|
329 |
-
{"current_steps": 329, "total_steps": 550, "loss": 0.3514, "lr": 3.330422038233078e-05, "epoch": 2.981900452488688, "percentage": 59.82, "elapsed_time": "8:56:11", "remaining_time": "6:00:10"}
|
330 |
-
{"current_steps": 330, "total_steps": 550, "loss": 0.3508, "lr": 3.305407289332279e-05, "epoch": 2.990950226244344, "percentage": 60.0, "elapsed_time": "8:57:48", "remaining_time": "5:58:32"}
|
331 |
-
{"current_steps": 331, "total_steps": 550, "loss": 0.6016, "lr": 3.280420518524585e-05, "epoch": 3.002262443438914, "percentage": 60.18, "elapsed_time": "9:01:00", "remaining_time": "5:57:56"}
|
332 |
-
{"current_steps": 332, "total_steps": 550, "loss": 0.3304, "lr": 3.25546273227348e-05, "epoch": 3.01131221719457, "percentage": 60.36, "elapsed_time": "9:02:36", "remaining_time": "5:56:17"}
|
|
|
1 |
+
{"current_steps": 1, "total_steps": 550, "loss": 0.8197, "lr": 1.4545454545454546e-06, "epoch": 0.00904977375565611, "percentage": 0.18, "elapsed_time": "0:01:05", "remaining_time": "10:02:17"}
|
2 |
+
{"current_steps": 2, "total_steps": 550, "loss": 0.8224, "lr": 2.9090909090909093e-06, "epoch": 0.01809954751131222, "percentage": 0.36, "elapsed_time": "0:01:57", "remaining_time": "8:57:27"}
|
3 |
+
{"current_steps": 3, "total_steps": 550, "loss": 0.8034, "lr": 4.363636363636364e-06, "epoch": 0.027149321266968326, "percentage": 0.55, "elapsed_time": "0:02:48", "remaining_time": "8:31:57"}
|
4 |
+
{"current_steps": 4, "total_steps": 550, "loss": 0.7741, "lr": 5.8181818181818185e-06, "epoch": 0.03619909502262444, "percentage": 0.73, "elapsed_time": "0:03:39", "remaining_time": "8:19:57"}
|
5 |
+
{"current_steps": 5, "total_steps": 550, "loss": 0.7292, "lr": 7.272727272727273e-06, "epoch": 0.04524886877828054, "percentage": 0.91, "elapsed_time": "0:04:31", "remaining_time": "8:12:41"}
|
6 |
+
{"current_steps": 6, "total_steps": 550, "loss": 0.7138, "lr": 8.727272727272728e-06, "epoch": 0.05429864253393665, "percentage": 1.09, "elapsed_time": "0:05:22", "remaining_time": "8:07:31"}
|
7 |
+
{"current_steps": 7, "total_steps": 550, "loss": 0.732, "lr": 1.0181818181818182e-05, "epoch": 0.06334841628959276, "percentage": 1.27, "elapsed_time": "0:06:14", "remaining_time": "8:03:46"}
|
8 |
+
{"current_steps": 8, "total_steps": 550, "loss": 0.723, "lr": 1.1636363636363637e-05, "epoch": 0.07239819004524888, "percentage": 1.45, "elapsed_time": "0:07:05", "remaining_time": "8:00:35"}
|
9 |
+
{"current_steps": 9, "total_steps": 550, "loss": 0.7228, "lr": 1.3090909090909092e-05, "epoch": 0.08144796380090498, "percentage": 1.64, "elapsed_time": "0:07:57", "remaining_time": "7:58:14"}
|
10 |
+
{"current_steps": 10, "total_steps": 550, "loss": 0.7034, "lr": 1.4545454545454546e-05, "epoch": 0.09049773755656108, "percentage": 1.82, "elapsed_time": "0:08:48", "remaining_time": "7:55:51"}
|
11 |
+
{"current_steps": 11, "total_steps": 550, "loss": 0.6666, "lr": 1.6000000000000003e-05, "epoch": 0.09954751131221719, "percentage": 2.0, "elapsed_time": "0:09:39", "remaining_time": "7:53:35"}
|
12 |
+
{"current_steps": 12, "total_steps": 550, "loss": 0.6361, "lr": 1.7454545454545456e-05, "epoch": 0.1085972850678733, "percentage": 2.18, "elapsed_time": "0:10:31", "remaining_time": "7:52:05"}
|
13 |
+
{"current_steps": 13, "total_steps": 550, "loss": 0.633, "lr": 1.8909090909090912e-05, "epoch": 0.11764705882352941, "percentage": 2.36, "elapsed_time": "0:11:23", "remaining_time": "7:50:32"}
|
14 |
+
{"current_steps": 14, "total_steps": 550, "loss": 0.6039, "lr": 2.0363636363636365e-05, "epoch": 0.12669683257918551, "percentage": 2.55, "elapsed_time": "0:12:14", "remaining_time": "7:48:59"}
|
15 |
+
{"current_steps": 15, "total_steps": 550, "loss": 0.5948, "lr": 2.1818181818181818e-05, "epoch": 0.13574660633484162, "percentage": 2.73, "elapsed_time": "0:13:06", "remaining_time": "7:47:22"}
|
16 |
+
{"current_steps": 16, "total_steps": 550, "loss": 0.581, "lr": 2.3272727272727274e-05, "epoch": 0.14479638009049775, "percentage": 2.91, "elapsed_time": "0:13:57", "remaining_time": "7:46:01"}
|
17 |
+
{"current_steps": 17, "total_steps": 550, "loss": 0.5777, "lr": 2.4727272727272727e-05, "epoch": 0.15384615384615385, "percentage": 3.09, "elapsed_time": "0:14:49", "remaining_time": "7:44:57"}
|
18 |
+
{"current_steps": 18, "total_steps": 550, "loss": 0.567, "lr": 2.6181818181818183e-05, "epoch": 0.16289592760180996, "percentage": 3.27, "elapsed_time": "0:15:41", "remaining_time": "7:43:48"}
|
19 |
+
{"current_steps": 19, "total_steps": 550, "loss": 0.5617, "lr": 2.763636363636364e-05, "epoch": 0.17194570135746606, "percentage": 3.45, "elapsed_time": "0:16:33", "remaining_time": "7:42:44"}
|
20 |
+
{"current_steps": 20, "total_steps": 550, "loss": 0.5546, "lr": 2.9090909090909093e-05, "epoch": 0.18099547511312217, "percentage": 3.64, "elapsed_time": "0:17:24", "remaining_time": "7:41:29"}
|
21 |
+
{"current_steps": 21, "total_steps": 550, "loss": 0.5388, "lr": 3.054545454545455e-05, "epoch": 0.19004524886877827, "percentage": 3.82, "elapsed_time": "0:18:18", "remaining_time": "7:41:05"}
|
22 |
+
{"current_steps": 22, "total_steps": 550, "loss": 0.5357, "lr": 3.2000000000000005e-05, "epoch": 0.19909502262443438, "percentage": 4.0, "elapsed_time": "0:19:10", "remaining_time": "7:40:12"}
|
23 |
+
{"current_steps": 23, "total_steps": 550, "loss": 0.537, "lr": 3.345454545454546e-05, "epoch": 0.2081447963800905, "percentage": 4.18, "elapsed_time": "0:20:02", "remaining_time": "7:39:09"}
|
24 |
+
{"current_steps": 24, "total_steps": 550, "loss": 0.5304, "lr": 3.490909090909091e-05, "epoch": 0.2171945701357466, "percentage": 4.36, "elapsed_time": "0:20:53", "remaining_time": "7:37:59"}
|
25 |
+
{"current_steps": 25, "total_steps": 550, "loss": 0.5316, "lr": 3.6363636363636364e-05, "epoch": 0.22624434389140272, "percentage": 4.55, "elapsed_time": "0:21:46", "remaining_time": "7:37:12"}
|
26 |
+
{"current_steps": 1, "total_steps": 550, "loss": 0.8197, "lr": 1.4545454545454546e-06, "epoch": 0.00904977375565611, "percentage": 0.18, "elapsed_time": "0:01:04", "remaining_time": "9:46:21"}
|
27 |
+
{"current_steps": 2, "total_steps": 550, "loss": 0.8224, "lr": 2.9090909090909093e-06, "epoch": 0.01809954751131222, "percentage": 0.36, "elapsed_time": "0:01:54", "remaining_time": "8:42:21"}
|
28 |
+
{"current_steps": 3, "total_steps": 550, "loss": 0.8034, "lr": 4.363636363636364e-06, "epoch": 0.027149321266968326, "percentage": 0.55, "elapsed_time": "0:02:43", "remaining_time": "8:17:36"}
|
29 |
+
{"current_steps": 4, "total_steps": 550, "loss": 0.774, "lr": 5.8181818181818185e-06, "epoch": 0.03619909502262444, "percentage": 0.73, "elapsed_time": "0:03:32", "remaining_time": "8:04:32"}
|
30 |
+
{"current_steps": 5, "total_steps": 550, "loss": 0.7292, "lr": 7.272727272727273e-06, "epoch": 0.04524886877828054, "percentage": 0.91, "elapsed_time": "0:04:22", "remaining_time": "7:56:51"}
|
31 |
+
{"current_steps": 6, "total_steps": 550, "loss": 0.7138, "lr": 8.727272727272728e-06, "epoch": 0.05429864253393665, "percentage": 1.09, "elapsed_time": "0:05:12", "remaining_time": "7:51:34"}
|
32 |
+
{"current_steps": 7, "total_steps": 550, "loss": 0.7317, "lr": 1.0181818181818182e-05, "epoch": 0.06334841628959276, "percentage": 1.27, "elapsed_time": "0:06:01", "remaining_time": "7:46:57"}
|
33 |
+
{"current_steps": 8, "total_steps": 550, "loss": 0.7227, "lr": 1.1636363636363637e-05, "epoch": 0.07239819004524888, "percentage": 1.45, "elapsed_time": "0:06:50", "remaining_time": "7:43:10"}
|
34 |
+
{"current_steps": 9, "total_steps": 550, "loss": 0.7225, "lr": 1.3090909090909092e-05, "epoch": 0.08144796380090498, "percentage": 1.64, "elapsed_time": "0:07:39", "remaining_time": "7:40:26"}
|
35 |
+
{"current_steps": 10, "total_steps": 550, "loss": 0.7032, "lr": 1.4545454545454546e-05, "epoch": 0.09049773755656108, "percentage": 1.82, "elapsed_time": "0:08:28", "remaining_time": "7:37:52"}
|
36 |
+
{"current_steps": 11, "total_steps": 550, "loss": 0.6662, "lr": 1.6000000000000003e-05, "epoch": 0.09954751131221719, "percentage": 2.0, "elapsed_time": "0:09:17", "remaining_time": "7:35:32"}
|
37 |
+
{"current_steps": 12, "total_steps": 550, "loss": 0.6361, "lr": 1.7454545454545456e-05, "epoch": 0.1085972850678733, "percentage": 2.18, "elapsed_time": "0:10:07", "remaining_time": "7:34:04"}
|
38 |
+
{"current_steps": 13, "total_steps": 550, "loss": 0.6328, "lr": 1.8909090909090912e-05, "epoch": 0.11764705882352941, "percentage": 2.36, "elapsed_time": "0:10:56", "remaining_time": "7:32:06"}
|
39 |
+
{"current_steps": 14, "total_steps": 550, "loss": 0.6038, "lr": 2.0363636363636365e-05, "epoch": 0.12669683257918551, "percentage": 2.55, "elapsed_time": "0:11:45", "remaining_time": "7:30:13"}
|
40 |
+
{"current_steps": 15, "total_steps": 550, "loss": 0.5949, "lr": 2.1818181818181818e-05, "epoch": 0.13574660633484162, "percentage": 2.73, "elapsed_time": "0:12:34", "remaining_time": "7:28:25"}
|
41 |
+
{"current_steps": 16, "total_steps": 550, "loss": 0.5812, "lr": 2.3272727272727274e-05, "epoch": 0.14479638009049775, "percentage": 2.91, "elapsed_time": "0:13:23", "remaining_time": "7:26:56"}
|
42 |
+
{"current_steps": 17, "total_steps": 550, "loss": 0.5777, "lr": 2.4727272727272727e-05, "epoch": 0.15384615384615385, "percentage": 3.09, "elapsed_time": "0:14:12", "remaining_time": "7:25:32"}
|
43 |
+
{"current_steps": 18, "total_steps": 550, "loss": 0.5671, "lr": 2.6181818181818183e-05, "epoch": 0.16289592760180996, "percentage": 3.27, "elapsed_time": "0:15:02", "remaining_time": "7:24:23"}
|
44 |
+
{"current_steps": 19, "total_steps": 550, "loss": 0.5617, "lr": 2.763636363636364e-05, "epoch": 0.17194570135746606, "percentage": 3.45, "elapsed_time": "0:15:51", "remaining_time": "7:23:20"}
|
45 |
+
{"current_steps": 20, "total_steps": 550, "loss": 0.5547, "lr": 2.9090909090909093e-05, "epoch": 0.18099547511312217, "percentage": 3.64, "elapsed_time": "0:16:41", "remaining_time": "7:22:08"}
|
46 |
+
{"current_steps": 21, "total_steps": 550, "loss": 0.5392, "lr": 3.054545454545455e-05, "epoch": 0.19004524886877827, "percentage": 3.82, "elapsed_time": "0:17:31", "remaining_time": "7:21:31"}
|
47 |
+
{"current_steps": 22, "total_steps": 550, "loss": 0.5373, "lr": 3.2000000000000005e-05, "epoch": 0.19909502262443438, "percentage": 4.0, "elapsed_time": "0:18:20", "remaining_time": "7:20:10"}
|
48 |
+
{"current_steps": 23, "total_steps": 550, "loss": 0.534, "lr": 3.345454545454546e-05, "epoch": 0.2081447963800905, "percentage": 4.18, "elapsed_time": "0:19:09", "remaining_time": "7:18:57"}
|
49 |
+
{"current_steps": 24, "total_steps": 550, "loss": 0.5286, "lr": 3.490909090909091e-05, "epoch": 0.2171945701357466, "percentage": 4.36, "elapsed_time": "0:19:58", "remaining_time": "7:17:52"}
|
50 |
+
{"current_steps": 25, "total_steps": 550, "loss": 0.5301, "lr": 3.6363636363636364e-05, "epoch": 0.22624434389140272, "percentage": 4.55, "elapsed_time": "0:20:47", "remaining_time": "7:16:38"}
|
51 |
+
{"current_steps": 26, "total_steps": 550, "loss": 0.5214, "lr": 3.7818181818181824e-05, "epoch": 0.23529411764705882, "percentage": 4.73, "elapsed_time": "0:21:37", "remaining_time": "7:15:42"}
|
52 |
+
{"current_steps": 27, "total_steps": 550, "loss": 0.5115, "lr": 3.927272727272728e-05, "epoch": 0.24434389140271492, "percentage": 4.91, "elapsed_time": "0:22:26", "remaining_time": "7:14:36"}
|
53 |
+
{"current_steps": 28, "total_steps": 550, "loss": 0.5095, "lr": 4.072727272727273e-05, "epoch": 0.25339366515837103, "percentage": 5.09, "elapsed_time": "0:23:15", "remaining_time": "7:13:36"}
|
54 |
+
{"current_steps": 29, "total_steps": 550, "loss": 0.5087, "lr": 4.218181818181818e-05, "epoch": 0.26244343891402716, "percentage": 5.27, "elapsed_time": "0:24:04", "remaining_time": "7:12:31"}
|
55 |
+
{"current_steps": 30, "total_steps": 550, "loss": 0.5111, "lr": 4.3636363636363636e-05, "epoch": 0.27149321266968324, "percentage": 5.45, "elapsed_time": "0:24:54", "remaining_time": "7:11:38"}
|
56 |
+
{"current_steps": 31, "total_steps": 550, "loss": 0.5072, "lr": 4.509090909090909e-05, "epoch": 0.28054298642533937, "percentage": 5.64, "elapsed_time": "0:25:43", "remaining_time": "7:10:33"}
|
57 |
+
{"current_steps": 32, "total_steps": 550, "loss": 0.5046, "lr": 4.654545454545455e-05, "epoch": 0.2895927601809955, "percentage": 5.82, "elapsed_time": "0:26:32", "remaining_time": "7:09:34"}
|
58 |
+
{"current_steps": 33, "total_steps": 550, "loss": 0.503, "lr": 4.8e-05, "epoch": 0.2986425339366516, "percentage": 6.0, "elapsed_time": "0:27:21", "remaining_time": "7:08:35"}
|
59 |
+
{"current_steps": 34, "total_steps": 550, "loss": 0.5011, "lr": 4.9454545454545454e-05, "epoch": 0.3076923076923077, "percentage": 6.18, "elapsed_time": "0:28:10", "remaining_time": "7:07:35"}
|
60 |
+
{"current_steps": 35, "total_steps": 550, "loss": 0.4895, "lr": 5.0909090909090914e-05, "epoch": 0.3167420814479638, "percentage": 6.36, "elapsed_time": "0:28:59", "remaining_time": "7:06:36"}
|
61 |
+
{"current_steps": 36, "total_steps": 550, "loss": 0.4956, "lr": 5.236363636363637e-05, "epoch": 0.3257918552036199, "percentage": 6.55, "elapsed_time": "0:29:48", "remaining_time": "7:05:34"}
|
62 |
+
{"current_steps": 37, "total_steps": 550, "loss": 0.4887, "lr": 5.381818181818182e-05, "epoch": 0.334841628959276, "percentage": 6.73, "elapsed_time": "0:30:37", "remaining_time": "7:04:43"}
|
63 |
+
{"current_steps": 38, "total_steps": 550, "loss": 0.487, "lr": 5.527272727272728e-05, "epoch": 0.3438914027149321, "percentage": 6.91, "elapsed_time": "0:31:26", "remaining_time": "7:03:39"}
|
64 |
+
{"current_steps": 39, "total_steps": 550, "loss": 0.4854, "lr": 5.672727272727273e-05, "epoch": 0.35294117647058826, "percentage": 7.09, "elapsed_time": "0:32:15", "remaining_time": "7:02:43"}
|
65 |
+
{"current_steps": 40, "total_steps": 550, "loss": 0.4943, "lr": 5.8181818181818185e-05, "epoch": 0.36199095022624433, "percentage": 7.27, "elapsed_time": "0:33:05", "remaining_time": "7:01:49"}
|
66 |
+
{"current_steps": 41, "total_steps": 550, "loss": 0.4846, "lr": 5.9636363636363645e-05, "epoch": 0.37104072398190047, "percentage": 7.45, "elapsed_time": "0:33:54", "remaining_time": "7:00:57"}
|
67 |
+
{"current_steps": 42, "total_steps": 550, "loss": 0.4765, "lr": 6.10909090909091e-05, "epoch": 0.38009049773755654, "percentage": 7.64, "elapsed_time": "0:34:43", "remaining_time": "7:00:06"}
|
68 |
+
{"current_steps": 43, "total_steps": 550, "loss": 0.4865, "lr": 6.254545454545456e-05, "epoch": 0.3891402714932127, "percentage": 7.82, "elapsed_time": "0:35:32", "remaining_time": "6:59:09"}
|
69 |
+
{"current_steps": 44, "total_steps": 550, "loss": 0.4858, "lr": 6.400000000000001e-05, "epoch": 0.39819004524886875, "percentage": 8.0, "elapsed_time": "0:36:21", "remaining_time": "6:58:12"}
|
70 |
+
{"current_steps": 45, "total_steps": 550, "loss": 0.4949, "lr": 6.545454545454546e-05, "epoch": 0.4072398190045249, "percentage": 8.18, "elapsed_time": "0:37:10", "remaining_time": "6:57:14"}
|
71 |
+
{"current_steps": 46, "total_steps": 550, "loss": 0.4799, "lr": 6.690909090909092e-05, "epoch": 0.416289592760181, "percentage": 8.36, "elapsed_time": "0:37:59", "remaining_time": "6:56:17"}
|
72 |
+
{"current_steps": 47, "total_steps": 550, "loss": 0.4779, "lr": 6.836363636363637e-05, "epoch": 0.4253393665158371, "percentage": 8.55, "elapsed_time": "0:38:48", "remaining_time": "6:55:19"}
|
73 |
+
{"current_steps": 48, "total_steps": 550, "loss": 0.4776, "lr": 6.981818181818182e-05, "epoch": 0.4343891402714932, "percentage": 8.73, "elapsed_time": "0:39:37", "remaining_time": "6:54:20"}
|
74 |
+
{"current_steps": 49, "total_steps": 550, "loss": 0.4731, "lr": 7.127272727272728e-05, "epoch": 0.4434389140271493, "percentage": 8.91, "elapsed_time": "0:40:25", "remaining_time": "6:53:23"}
|
75 |
+
{"current_steps": 50, "total_steps": 550, "loss": 0.4702, "lr": 7.272727272727273e-05, "epoch": 0.45248868778280543, "percentage": 9.09, "elapsed_time": "0:41:14", "remaining_time": "6:52:28"}
|
76 |
+
{"current_steps": 51, "total_steps": 550, "loss": 0.4853, "lr": 7.418181818181818e-05, "epoch": 0.46153846153846156, "percentage": 9.27, "elapsed_time": "0:42:03", "remaining_time": "6:51:34"}
|
77 |
+
{"current_steps": 52, "total_steps": 550, "loss": 0.4663, "lr": 7.563636363636365e-05, "epoch": 0.47058823529411764, "percentage": 9.45, "elapsed_time": "0:42:52", "remaining_time": "6:50:38"}
|
78 |
+
{"current_steps": 53, "total_steps": 550, "loss": 0.4819, "lr": 7.70909090909091e-05, "epoch": 0.4796380090497738, "percentage": 9.64, "elapsed_time": "0:43:41", "remaining_time": "6:49:41"}
|
79 |
+
{"current_steps": 54, "total_steps": 550, "loss": 0.4765, "lr": 7.854545454545455e-05, "epoch": 0.48868778280542985, "percentage": 9.82, "elapsed_time": "0:44:30", "remaining_time": "6:48:49"}
|
80 |
+
{"current_steps": 55, "total_steps": 550, "loss": 0.4764, "lr": 8e-05, "epoch": 0.497737556561086, "percentage": 10.0, "elapsed_time": "0:45:19", "remaining_time": "6:47:52"}
|
81 |
+
{"current_steps": 56, "total_steps": 550, "loss": 0.4853, "lr": 7.999919440291627e-05, "epoch": 0.5067873303167421, "percentage": 10.18, "elapsed_time": "0:46:08", "remaining_time": "6:46:58"}
|
82 |
+
{"current_steps": 57, "total_steps": 550, "loss": 0.4766, "lr": 7.999677764411438e-05, "epoch": 0.5158371040723982, "percentage": 10.36, "elapsed_time": "0:46:57", "remaining_time": "6:46:05"}
|
83 |
+
{"current_steps": 58, "total_steps": 550, "loss": 0.4697, "lr": 7.999274982094104e-05, "epoch": 0.5248868778280543, "percentage": 10.55, "elapsed_time": "0:47:46", "remaining_time": "6:45:14"}
|
84 |
+
{"current_steps": 59, "total_steps": 550, "loss": 0.4753, "lr": 7.998711109563637e-05, "epoch": 0.5339366515837104, "percentage": 10.73, "elapsed_time": "0:48:35", "remaining_time": "6:44:20"}
|
85 |
+
{"current_steps": 60, "total_steps": 550, "loss": 0.4646, "lr": 7.997986169532741e-05, "epoch": 0.5429864253393665, "percentage": 10.91, "elapsed_time": "0:49:24", "remaining_time": "6:43:26"}
|
86 |
+
{"current_steps": 61, "total_steps": 550, "loss": 0.4719, "lr": 7.997100191201896e-05, "epoch": 0.5520361990950227, "percentage": 11.09, "elapsed_time": "0:50:13", "remaining_time": "6:42:34"}
|
87 |
+
{"current_steps": 62, "total_steps": 550, "loss": 0.4597, "lr": 7.996053210258176e-05, "epoch": 0.5610859728506787, "percentage": 11.27, "elapsed_time": "0:51:01", "remaining_time": "6:41:39"}
|
88 |
+
{"current_steps": 63, "total_steps": 550, "loss": 0.4631, "lr": 7.994845268873825e-05, "epoch": 0.5701357466063348, "percentage": 11.45, "elapsed_time": "0:51:50", "remaining_time": "6:40:46"}
|
89 |
+
{"current_steps": 64, "total_steps": 550, "loss": 0.4557, "lr": 7.993476415704543e-05, "epoch": 0.579185520361991, "percentage": 11.64, "elapsed_time": "0:52:39", "remaining_time": "6:39:50"}
|
90 |
+
{"current_steps": 65, "total_steps": 550, "loss": 0.4601, "lr": 7.991946705887539e-05, "epoch": 0.5882352941176471, "percentage": 11.82, "elapsed_time": "0:53:28", "remaining_time": "6:39:00"}
|
91 |
+
{"current_steps": 66, "total_steps": 550, "loss": 0.4616, "lr": 7.990256201039297e-05, "epoch": 0.5972850678733032, "percentage": 12.0, "elapsed_time": "0:54:17", "remaining_time": "6:38:10"}
|
92 |
+
{"current_steps": 67, "total_steps": 550, "loss": 0.4536, "lr": 7.98840496925311e-05, "epoch": 0.6063348416289592, "percentage": 12.18, "elapsed_time": "0:55:07", "remaining_time": "6:37:24"}
|
93 |
+
{"current_steps": 68, "total_steps": 550, "loss": 0.4483, "lr": 7.986393085096324e-05, "epoch": 0.6153846153846154, "percentage": 12.36, "elapsed_time": "0:55:56", "remaining_time": "6:36:33"}
|
94 |
+
{"current_steps": 69, "total_steps": 550, "loss": 0.4508, "lr": 7.984220629607336e-05, "epoch": 0.6244343891402715, "percentage": 12.55, "elapsed_time": "0:56:45", "remaining_time": "6:35:40"}
|
95 |
+
{"current_steps": 70, "total_steps": 550, "loss": 0.4494, "lr": 7.981887690292339e-05, "epoch": 0.6334841628959276, "percentage": 12.73, "elapsed_time": "0:57:34", "remaining_time": "6:34:50"}
|
96 |
+
{"current_steps": 71, "total_steps": 550, "loss": 0.4519, "lr": 7.979394361121789e-05, "epoch": 0.6425339366515838, "percentage": 12.91, "elapsed_time": "0:58:23", "remaining_time": "6:33:59"}
|
97 |
+
{"current_steps": 72, "total_steps": 550, "loss": 0.4555, "lr": 7.97674074252662e-05, "epoch": 0.6515837104072398, "percentage": 13.09, "elapsed_time": "0:59:12", "remaining_time": "6:33:06"}
|
98 |
+
{"current_steps": 73, "total_steps": 550, "loss": 0.4521, "lr": 7.9739269413942e-05, "epoch": 0.6606334841628959, "percentage": 13.27, "elapsed_time": "1:00:01", "remaining_time": "6:32:12"}
|
99 |
+
{"current_steps": 74, "total_steps": 550, "loss": 0.4531, "lr": 7.970953071064036e-05, "epoch": 0.669683257918552, "percentage": 13.45, "elapsed_time": "1:00:50", "remaining_time": "6:31:19"}
|
100 |
+
{"current_steps": 75, "total_steps": 550, "loss": 0.4705, "lr": 7.967819251323182e-05, "epoch": 0.6787330316742082, "percentage": 13.64, "elapsed_time": "1:01:39", "remaining_time": "6:30:29"}
|
101 |
+
{"current_steps": 76, "total_steps": 550, "loss": 0.4488, "lr": 7.964525608401445e-05, "epoch": 0.6877828054298643, "percentage": 13.82, "elapsed_time": "1:02:28", "remaining_time": "6:29:38"}
|
102 |
+
{"current_steps": 77, "total_steps": 550, "loss": 0.4551, "lr": 7.961072274966282e-05, "epoch": 0.6968325791855203, "percentage": 14.0, "elapsed_time": "1:03:17", "remaining_time": "6:28:44"}
|
103 |
+
{"current_steps": 78, "total_steps": 550, "loss": 0.4457, "lr": 7.957459390117458e-05, "epoch": 0.7058823529411765, "percentage": 14.18, "elapsed_time": "1:04:05", "remaining_time": "6:27:52"}
|
104 |
+
{"current_steps": 79, "total_steps": 550, "loss": 0.454, "lr": 7.95368709938145e-05, "epoch": 0.7149321266968326, "percentage": 14.36, "elapsed_time": "1:04:55", "remaining_time": "6:27:02"}
|
105 |
+
{"current_steps": 80, "total_steps": 550, "loss": 0.441, "lr": 7.949755554705577e-05, "epoch": 0.7239819004524887, "percentage": 14.55, "elapsed_time": "1:05:44", "remaining_time": "6:26:11"}
|
106 |
+
{"current_steps": 81, "total_steps": 550, "loss": 0.4442, "lr": 7.945664914451888e-05, "epoch": 0.7330316742081447, "percentage": 14.73, "elapsed_time": "1:06:33", "remaining_time": "6:25:23"}
|
107 |
+
{"current_steps": 82, "total_steps": 550, "loss": 0.4406, "lr": 7.941415343390773e-05, "epoch": 0.7420814479638009, "percentage": 14.91, "elapsed_time": "1:07:22", "remaining_time": "6:24:31"}
|
108 |
+
{"current_steps": 83, "total_steps": 550, "loss": 0.4507, "lr": 7.937007012694335e-05, "epoch": 0.751131221719457, "percentage": 15.09, "elapsed_time": "1:08:10", "remaining_time": "6:23:37"}
|
109 |
+
{"current_steps": 84, "total_steps": 550, "loss": 0.4532, "lr": 7.932440099929493e-05, "epoch": 0.7601809954751131, "percentage": 15.27, "elapsed_time": "1:08:59", "remaining_time": "6:22:44"}
|
110 |
+
{"current_steps": 85, "total_steps": 550, "loss": 0.4454, "lr": 7.927714789050826e-05, "epoch": 0.7692307692307693, "percentage": 15.45, "elapsed_time": "1:09:48", "remaining_time": "6:21:53"}
|
111 |
+
{"current_steps": 86, "total_steps": 550, "loss": 0.4367, "lr": 7.92283127039317e-05, "epoch": 0.7782805429864253, "percentage": 15.64, "elapsed_time": "1:10:37", "remaining_time": "6:21:02"}
|
112 |
+
{"current_steps": 87, "total_steps": 550, "loss": 0.4332, "lr": 7.917789740663941e-05, "epoch": 0.7873303167420814, "percentage": 15.82, "elapsed_time": "1:11:26", "remaining_time": "6:20:10"}
|
113 |
+
{"current_steps": 88, "total_steps": 550, "loss": 0.4345, "lr": 7.912590402935223e-05, "epoch": 0.7963800904977375, "percentage": 16.0, "elapsed_time": "1:12:14", "remaining_time": "6:19:18"}
|
114 |
+
{"current_steps": 89, "total_steps": 550, "loss": 0.4419, "lr": 7.907233466635582e-05, "epoch": 0.8054298642533937, "percentage": 16.18, "elapsed_time": "1:13:03", "remaining_time": "6:18:25"}
|
115 |
+
{"current_steps": 90, "total_steps": 550, "loss": 0.4383, "lr": 7.90171914754163e-05, "epoch": 0.8144796380090498, "percentage": 16.36, "elapsed_time": "1:13:51", "remaining_time": "6:17:32"}
|
116 |
+
{"current_steps": 91, "total_steps": 550, "loss": 0.4348, "lr": 7.896047667769335e-05, "epoch": 0.8235294117647058, "percentage": 16.55, "elapsed_time": "1:14:40", "remaining_time": "6:16:40"}
|
117 |
+
{"current_steps": 92, "total_steps": 550, "loss": 0.4293, "lr": 7.890219255765077e-05, "epoch": 0.832579185520362, "percentage": 16.73, "elapsed_time": "1:15:30", "remaining_time": "6:15:54"}
|
118 |
+
{"current_steps": 93, "total_steps": 550, "loss": 0.4375, "lr": 7.884234146296442e-05, "epoch": 0.8416289592760181, "percentage": 16.91, "elapsed_time": "1:16:19", "remaining_time": "6:15:01"}
|
119 |
+
{"current_steps": 94, "total_steps": 550, "loss": 0.4301, "lr": 7.878092580442766e-05, "epoch": 0.8506787330316742, "percentage": 17.09, "elapsed_time": "1:17:08", "remaining_time": "6:14:12"}
|
120 |
+
{"current_steps": 95, "total_steps": 550, "loss": 0.4377, "lr": 7.871794805585427e-05, "epoch": 0.8597285067873304, "percentage": 17.27, "elapsed_time": "1:17:57", "remaining_time": "6:13:20"}
|
121 |
+
{"current_steps": 96, "total_steps": 550, "loss": 0.4303, "lr": 7.865341075397874e-05, "epoch": 0.8687782805429864, "percentage": 17.45, "elapsed_time": "1:18:45", "remaining_time": "6:12:28"}
|
122 |
+
{"current_steps": 97, "total_steps": 550, "loss": 0.4321, "lr": 7.858731649835424e-05, "epoch": 0.8778280542986425, "percentage": 17.64, "elapsed_time": "1:19:34", "remaining_time": "6:11:37"}
|
123 |
+
{"current_steps": 98, "total_steps": 550, "loss": 0.4369, "lr": 7.85196679512477e-05, "epoch": 0.8868778280542986, "percentage": 17.82, "elapsed_time": "1:20:23", "remaining_time": "6:10:48"}
|
124 |
+
{"current_steps": 99, "total_steps": 550, "loss": 0.4229, "lr": 7.845046783753276e-05, "epoch": 0.8959276018099548, "percentage": 18.0, "elapsed_time": "1:21:12", "remaining_time": "6:09:56"}
|
125 |
+
{"current_steps": 100, "total_steps": 550, "loss": 0.4294, "lr": 7.837971894457991e-05, "epoch": 0.9049773755656109, "percentage": 18.18, "elapsed_time": "1:22:01", "remaining_time": "6:09:07"}
|
126 |
+
{"current_steps": 101, "total_steps": 550, "loss": 0.4276, "lr": 7.830742412214422e-05, "epoch": 0.9140271493212669, "percentage": 18.36, "elapsed_time": "1:22:50", "remaining_time": "6:08:16"}
|
127 |
+
{"current_steps": 102, "total_steps": 550, "loss": 0.4284, "lr": 7.82335862822506e-05, "epoch": 0.9230769230769231, "percentage": 18.55, "elapsed_time": "1:23:39", "remaining_time": "6:07:25"}
|
128 |
+
{"current_steps": 103, "total_steps": 550, "loss": 0.4237, "lr": 7.815820839907651e-05, "epoch": 0.9321266968325792, "percentage": 18.73, "elapsed_time": "1:24:28", "remaining_time": "6:06:34"}
|
129 |
+
{"current_steps": 104, "total_steps": 550, "loss": 0.4325, "lr": 7.808129350883207e-05, "epoch": 0.9411764705882353, "percentage": 18.91, "elapsed_time": "1:25:16", "remaining_time": "6:05:42"}
|
130 |
+
{"current_steps": 105, "total_steps": 550, "loss": 0.4282, "lr": 7.800284470963783e-05, "epoch": 0.9502262443438914, "percentage": 19.09, "elapsed_time": "1:26:05", "remaining_time": "6:04:50"}
|
131 |
+
{"current_steps": 106, "total_steps": 550, "loss": 0.426, "lr": 7.792286516139999e-05, "epoch": 0.9592760180995475, "percentage": 19.27, "elapsed_time": "1:26:53", "remaining_time": "6:03:58"}
|
132 |
+
{"current_steps": 107, "total_steps": 550, "loss": 0.4241, "lr": 7.784135808568308e-05, "epoch": 0.9683257918552036, "percentage": 19.45, "elapsed_time": "1:27:42", "remaining_time": "6:03:08"}
|
133 |
+
{"current_steps": 108, "total_steps": 550, "loss": 0.4356, "lr": 7.775832676558028e-05, "epoch": 0.9773755656108597, "percentage": 19.64, "elapsed_time": "1:28:31", "remaining_time": "6:02:17"}
|
134 |
+
{"current_steps": 109, "total_steps": 550, "loss": 0.4366, "lr": 7.7673774545581e-05, "epoch": 0.9864253393665159, "percentage": 19.82, "elapsed_time": "1:29:19", "remaining_time": "6:01:24"}
|
135 |
+
{"current_steps": 110, "total_steps": 550, "loss": 0.4329, "lr": 7.758770483143634e-05, "epoch": 0.995475113122172, "percentage": 20.0, "elapsed_time": "1:30:08", "remaining_time": "6:00:33"}
|
136 |
+
{"current_steps": 111, "total_steps": 550, "loss": 0.4137, "lr": 7.750012109002185e-05, "epoch": 1.006787330316742, "percentage": 20.18, "elapsed_time": "1:32:46", "remaining_time": "6:06:54"}
|
137 |
+
{"current_steps": 112, "total_steps": 550, "loss": 0.414, "lr": 7.741102684919787e-05, "epoch": 1.0158371040723981, "percentage": 20.36, "elapsed_time": "1:33:35", "remaining_time": "6:05:59"}
|
138 |
+
{"current_steps": 113, "total_steps": 550, "loss": 0.4059, "lr": 7.732042569766741e-05, "epoch": 1.0248868778280542, "percentage": 20.55, "elapsed_time": "1:34:24", "remaining_time": "6:05:04"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cc1409cdfa320cecaf01b23c7cc425d4df9cf6a45c18f326509576976f8812c9
|
3 |
+
size 7288
|