Run 5. Outer Step 50. Inner Step 19.
Browse files- config.json +16 -17
config.json
CHANGED
@@ -1,5 +1,5 @@
|
|
1 |
{
|
2 |
-
"_name_or_path": "
|
3 |
"all_reduce_scores": {
|
4 |
"0": "NON_PARTICIPATING",
|
5 |
"1": "SUCCESS",
|
@@ -34,7 +34,7 @@
|
|
34 |
"125": "NON_PARTICIPATING",
|
35 |
"126": "NON_PARTICIPATING",
|
36 |
"127": "NON_PARTICIPATING",
|
37 |
-
"128": "
|
38 |
"129": "NON_PARTICIPATING",
|
39 |
"13": "SUCCESS",
|
40 |
"130": "NON_PARTICIPATING",
|
@@ -55,7 +55,7 @@
|
|
55 |
"144": "NON_PARTICIPATING",
|
56 |
"145": "NON_PARTICIPATING",
|
57 |
"146": "NON_PARTICIPATING",
|
58 |
-
"147": "
|
59 |
"148": "NON_PARTICIPATING",
|
60 |
"149": "NON_PARTICIPATING",
|
61 |
"15": "SUCCESS",
|
@@ -99,7 +99,7 @@
|
|
99 |
"184": "NON_PARTICIPATING",
|
100 |
"185": "NON_PARTICIPATING",
|
101 |
"186": "NON_PARTICIPATING",
|
102 |
-
"187": "
|
103 |
"188": "NON_PARTICIPATING",
|
104 |
"189": "NON_PARTICIPATING",
|
105 |
"19": "SUCCESS",
|
@@ -112,21 +112,21 @@
|
|
112 |
"196": "NON_PARTICIPATING",
|
113 |
"197": "NON_PARTICIPATING",
|
114 |
"198": "NON_PARTICIPATING",
|
115 |
-
"199": "
|
116 |
"2": "SUCCESS",
|
117 |
"20": "SUCCESS",
|
118 |
-
"200": "
|
119 |
"201": "NON_PARTICIPATING",
|
120 |
"202": "NON_PARTICIPATING",
|
121 |
"203": "NON_PARTICIPATING",
|
122 |
"204": "NON_PARTICIPATING",
|
123 |
-
"205": "
|
124 |
"206": "NON_PARTICIPATING",
|
125 |
"207": "NON_PARTICIPATING",
|
126 |
"208": "NON_PARTICIPATING",
|
127 |
"209": "NON_PARTICIPATING",
|
128 |
"21": "SUCCESS",
|
129 |
-
"210": "
|
130 |
"211": "NON_PARTICIPATING",
|
131 |
"212": "NON_PARTICIPATING",
|
132 |
"213": "NON_PARTICIPATING",
|
@@ -137,7 +137,7 @@
|
|
137 |
"218": "NON_PARTICIPATING",
|
138 |
"219": "NON_PARTICIPATING",
|
139 |
"22": "SUCCESS",
|
140 |
-
"220": "
|
141 |
"221": "NON_PARTICIPATING",
|
142 |
"222": "NON_PARTICIPATING",
|
143 |
"223": "NON_PARTICIPATING",
|
@@ -153,7 +153,7 @@
|
|
153 |
"232": "NON_PARTICIPATING",
|
154 |
"233": "NON_PARTICIPATING",
|
155 |
"234": "NON_PARTICIPATING",
|
156 |
-
"235": "
|
157 |
"236": "NON_PARTICIPATING",
|
158 |
"237": "NON_PARTICIPATING",
|
159 |
"238": "NON_PARTICIPATING",
|
@@ -227,12 +227,12 @@
|
|
227 |
"7": "SUCCESS",
|
228 |
"70": "SUCCESS",
|
229 |
"71": "SUCCESS",
|
230 |
-
"72": "
|
231 |
"73": "SUCCESS",
|
232 |
"74": "SUCCESS",
|
233 |
"75": "SUCCESS",
|
234 |
"76": "SUCCESS",
|
235 |
-
"77": "
|
236 |
"78": "SUCCESS",
|
237 |
"79": "SUCCESS",
|
238 |
"8": "SUCCESS",
|
@@ -253,7 +253,7 @@
|
|
253 |
"93": "SUCCESS",
|
254 |
"94": "SUCCESS",
|
255 |
"95": "SUCCESS",
|
256 |
-
"96": "
|
257 |
"97": "SUCCESS",
|
258 |
"98": "SUCCESS",
|
259 |
"99": "SUCCESS"
|
@@ -264,17 +264,16 @@
|
|
264 |
"attention_bias": false,
|
265 |
"attention_dropout": 0.0,
|
266 |
"block_list": [
|
267 |
-
|
268 |
-
5771929
|
269 |
],
|
270 |
"bos_token_id": 1,
|
271 |
"eos_token_id": 2,
|
272 |
"hidden_act": "silu",
|
273 |
"hidden_size": 2048,
|
274 |
"initializer_range": 0.02,
|
275 |
-
"inner_step":
|
276 |
"intermediate_size": 5632,
|
277 |
-
"last_allreduce_block":
|
278 |
"max_position_embeddings": 2048,
|
279 |
"mlp_bias": false,
|
280 |
"model_type": "llama",
|
|
|
1 |
{
|
2 |
+
"_name_or_path": "unrented5443/sn38-v2-5",
|
3 |
"all_reduce_scores": {
|
4 |
"0": "NON_PARTICIPATING",
|
5 |
"1": "SUCCESS",
|
|
|
34 |
"125": "NON_PARTICIPATING",
|
35 |
"126": "NON_PARTICIPATING",
|
36 |
"127": "NON_PARTICIPATING",
|
37 |
+
"128": "NON_PARTICIPATING",
|
38 |
"129": "NON_PARTICIPATING",
|
39 |
"13": "SUCCESS",
|
40 |
"130": "NON_PARTICIPATING",
|
|
|
55 |
"144": "NON_PARTICIPATING",
|
56 |
"145": "NON_PARTICIPATING",
|
57 |
"146": "NON_PARTICIPATING",
|
58 |
+
"147": "SUCCESS",
|
59 |
"148": "NON_PARTICIPATING",
|
60 |
"149": "NON_PARTICIPATING",
|
61 |
"15": "SUCCESS",
|
|
|
99 |
"184": "NON_PARTICIPATING",
|
100 |
"185": "NON_PARTICIPATING",
|
101 |
"186": "NON_PARTICIPATING",
|
102 |
+
"187": "SUCCESS",
|
103 |
"188": "NON_PARTICIPATING",
|
104 |
"189": "NON_PARTICIPATING",
|
105 |
"19": "SUCCESS",
|
|
|
112 |
"196": "NON_PARTICIPATING",
|
113 |
"197": "NON_PARTICIPATING",
|
114 |
"198": "NON_PARTICIPATING",
|
115 |
+
"199": "SUCCESS",
|
116 |
"2": "SUCCESS",
|
117 |
"20": "SUCCESS",
|
118 |
+
"200": "SUCCESS",
|
119 |
"201": "NON_PARTICIPATING",
|
120 |
"202": "NON_PARTICIPATING",
|
121 |
"203": "NON_PARTICIPATING",
|
122 |
"204": "NON_PARTICIPATING",
|
123 |
+
"205": "NON_PARTICIPATING",
|
124 |
"206": "NON_PARTICIPATING",
|
125 |
"207": "NON_PARTICIPATING",
|
126 |
"208": "NON_PARTICIPATING",
|
127 |
"209": "NON_PARTICIPATING",
|
128 |
"21": "SUCCESS",
|
129 |
+
"210": "SUCCESS",
|
130 |
"211": "NON_PARTICIPATING",
|
131 |
"212": "NON_PARTICIPATING",
|
132 |
"213": "NON_PARTICIPATING",
|
|
|
137 |
"218": "NON_PARTICIPATING",
|
138 |
"219": "NON_PARTICIPATING",
|
139 |
"22": "SUCCESS",
|
140 |
+
"220": "NON_PARTICIPATING",
|
141 |
"221": "NON_PARTICIPATING",
|
142 |
"222": "NON_PARTICIPATING",
|
143 |
"223": "NON_PARTICIPATING",
|
|
|
153 |
"232": "NON_PARTICIPATING",
|
154 |
"233": "NON_PARTICIPATING",
|
155 |
"234": "NON_PARTICIPATING",
|
156 |
+
"235": "NON_PARTICIPATING",
|
157 |
"236": "NON_PARTICIPATING",
|
158 |
"237": "NON_PARTICIPATING",
|
159 |
"238": "NON_PARTICIPATING",
|
|
|
227 |
"7": "SUCCESS",
|
228 |
"70": "SUCCESS",
|
229 |
"71": "SUCCESS",
|
230 |
+
"72": "NON_PARTICIPATING",
|
231 |
"73": "SUCCESS",
|
232 |
"74": "SUCCESS",
|
233 |
"75": "SUCCESS",
|
234 |
"76": "SUCCESS",
|
235 |
+
"77": "NON_PARTICIPATING",
|
236 |
"78": "SUCCESS",
|
237 |
"79": "SUCCESS",
|
238 |
"8": "SUCCESS",
|
|
|
253 |
"93": "SUCCESS",
|
254 |
"94": "SUCCESS",
|
255 |
"95": "SUCCESS",
|
256 |
+
"96": "SUCCESS",
|
257 |
"97": "SUCCESS",
|
258 |
"98": "SUCCESS",
|
259 |
"99": "SUCCESS"
|
|
|
264 |
"attention_bias": false,
|
265 |
"attention_dropout": 0.0,
|
266 |
"block_list": [
|
267 |
+
5774545
|
|
|
268 |
],
|
269 |
"bos_token_id": 1,
|
270 |
"eos_token_id": 2,
|
271 |
"hidden_act": "silu",
|
272 |
"hidden_size": 2048,
|
273 |
"initializer_range": 0.02,
|
274 |
+
"inner_step": 19,
|
275 |
"intermediate_size": 5632,
|
276 |
+
"last_allreduce_block": 5770468,
|
277 |
"max_position_embeddings": 2048,
|
278 |
"mlp_bias": false,
|
279 |
"model_type": "llama",
|