rooftopcoder committed on
Commit
eae9df7
1 Parent(s): b2a8b6e

End of training

Browse files
Files changed (3) hide show
  1. all_results.json +4 -4
  2. train_results.json +4 -4
  3. trainer_state.json +9 -21
all_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 2.97,
3
  "train_loss": 0.0,
4
- "train_runtime": 32.9708,
5
  "train_samples": 156240,
6
- "train_samples_per_second": 14216.232,
7
- "train_steps_per_second": 111.098
8
  }
 
1
  {
2
+ "epoch": 2.76,
3
  "train_loss": 0.0,
4
+ "train_runtime": 33.2317,
5
  "train_samples": 156240,
6
+ "train_samples_per_second": 14104.587,
7
+ "train_steps_per_second": 110.226
8
  }
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 2.97,
3
  "train_loss": 0.0,
4
- "train_runtime": 32.9708,
5
  "train_samples": 156240,
6
- "train_samples_per_second": 14216.232,
7
- "train_steps_per_second": 111.098
8
  }
 
1
  {
2
+ "epoch": 2.76,
3
  "train_loss": 0.0,
4
+ "train_runtime": 33.2317,
5
  "train_samples": 156240,
6
+ "train_samples_per_second": 14104.587,
7
+ "train_steps_per_second": 110.226
8
  }
trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 2.9694859717386852,
5
- "global_step": 14500,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -170,30 +170,18 @@
170
  "step": 13500
171
  },
172
  {
173
- "epoch": 2.87,
174
- "learning_rate": 0.0,
175
- "loss": 5.9514,
176
- "step": 14000
177
- },
178
- {
179
- "epoch": 2.97,
180
- "learning_rate": 0.0,
181
- "loss": 5.9511,
182
- "step": 14500
183
- },
184
- {
185
- "epoch": 2.97,
186
- "step": 14500,
187
- "total_flos": 9.092500022196634e+16,
188
  "train_loss": 0.0,
189
- "train_runtime": 32.9708,
190
- "train_samples_per_second": 14216.232,
191
- "train_steps_per_second": 111.098
192
  }
193
  ],
194
  "max_steps": 3663,
195
  "num_train_epochs": 3,
196
- "total_flos": 9.092500022196634e+16,
197
  "trial_name": null,
198
  "trial_params": null
199
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 2.764693835756707,
5
+ "global_step": 13500,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
170
  "step": 13500
171
  },
172
  {
173
+ "epoch": 2.76,
174
+ "step": 13500,
175
+ "total_flos": 8.465387806030234e+16,
 
 
 
 
 
 
 
 
 
 
 
 
176
  "train_loss": 0.0,
177
+ "train_runtime": 33.2317,
178
+ "train_samples_per_second": 14104.587,
179
+ "train_steps_per_second": 110.226
180
  }
181
  ],
182
  "max_steps": 3663,
183
  "num_train_epochs": 3,
184
+ "total_flos": 8.465387806030234e+16,
185
  "trial_name": null,
186
  "trial_params": null
187
  }