Training in progress, step 52200, checkpoint
Browse files
last-checkpoint/README.md
CHANGED
@@ -1197,6 +1197,10 @@ You can finetune this model on your own dataset.
|
|
1197 |
| 0.9171 | 51900 | 0.3976 |
|
1198 |
| 0.9180 | 51950 | 0.2939 |
|
1199 |
| 0.9189 | 52000 | 0.3193 |
|
|
|
|
|
|
|
|
|
1200 |
|
1201 |
|
1202 |
### Framework Versions
|
|
|
1197 |
| 0.9171 | 51900 | 0.3976 |
|
1198 |
| 0.9180 | 51950 | 0.2939 |
|
1199 |
| 0.9189 | 52000 | 0.3193 |
|
1200 |
+
| 0.9198 | 52050 | 0.2988 |
|
1201 |
+
| 0.9206 | 52100 | 0.2286 |
|
1202 |
+
| 0.9215 | 52150 | 0.371 |
|
1203 |
+
| 0.9224 | 52200 | 0.2825 |
|
1204 |
|
1205 |
|
1206 |
### Framework Versions
|
last-checkpoint/model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 90864192
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dcce17b7b84aa84d9a62e4ecacf9221e386cc1f4a8fd8f1ff065fb84d8b66600
|
3 |
size 90864192
|
last-checkpoint/optimizer.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 180609210
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3b1907993a4836b8d7f68772a56e92f265d1d0b880c0f389e3d9a3261d2c18d6
|
3 |
size 180609210
|
last-checkpoint/rng_state.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 14244
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7eb456525d851480624b8b851b2b4e427ee862f93eba28a337891329169059e3
|
3 |
size 14244
|
last-checkpoint/scaler.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 988
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8f8d439a57eb96c40411a5c7daa3d2c6f4bcb1ca85fe20f7f71f85e34ad3c1e4
|
3 |
size 988
|
last-checkpoint/scheduler.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1064
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8195c12f983d26de39eb9400cc5a62a3f600dcf25125907830ba8d58cfd3e0c0
|
3 |
size 1064
|
last-checkpoint/trainer_state.json
CHANGED
@@ -2,9 +2,9 @@
|
|
2 |
"best_global_step": null,
|
3 |
"best_metric": null,
|
4 |
"best_model_checkpoint": null,
|
5 |
-
"epoch": 0.
|
6 |
"eval_steps": 500,
|
7 |
-
"global_step":
|
8 |
"is_hyper_param_search": false,
|
9 |
"is_local_process_zero": true,
|
10 |
"is_world_process_zero": true,
|
@@ -7288,6 +7288,34 @@
|
|
7288 |
"learning_rate": 4.527694331546602e-06,
|
7289 |
"loss": 0.3193,
|
7290 |
"step": 52000
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
7291 |
}
|
7292 |
],
|
7293 |
"logging_steps": 50,
|
|
|
2 |
"best_global_step": null,
|
3 |
"best_metric": null,
|
4 |
"best_model_checkpoint": null,
|
5 |
+
"epoch": 0.9224081567740453,
|
6 |
"eval_steps": 500,
|
7 |
+
"global_step": 52200,
|
8 |
"is_hyper_param_search": false,
|
9 |
"is_local_process_zero": true,
|
10 |
"is_world_process_zero": true,
|
|
|
7288 |
"learning_rate": 4.527694331546602e-06,
|
7289 |
"loss": 0.3193,
|
7290 |
"step": 52000
|
7291 |
+
},
|
7292 |
+
{
|
7293 |
+
"epoch": 0.9197575586223958,
|
7294 |
+
"grad_norm": 1.4950217008590698,
|
7295 |
+
"learning_rate": 4.478608313208066e-06,
|
7296 |
+
"loss": 0.2988,
|
7297 |
+
"step": 52050
|
7298 |
+
},
|
7299 |
+
{
|
7300 |
+
"epoch": 0.9206410913396124,
|
7301 |
+
"grad_norm": 1.5405720472335815,
|
7302 |
+
"learning_rate": 4.42952229486953e-06,
|
7303 |
+
"loss": 0.2286,
|
7304 |
+
"step": 52100
|
7305 |
+
},
|
7306 |
+
{
|
7307 |
+
"epoch": 0.9215246240568288,
|
7308 |
+
"grad_norm": 1.5918203592300415,
|
7309 |
+
"learning_rate": 4.3804362765309926e-06,
|
7310 |
+
"loss": 0.371,
|
7311 |
+
"step": 52150
|
7312 |
+
},
|
7313 |
+
{
|
7314 |
+
"epoch": 0.9224081567740453,
|
7315 |
+
"grad_norm": 1.2329323291778564,
|
7316 |
+
"learning_rate": 4.331350258192457e-06,
|
7317 |
+
"loss": 0.2825,
|
7318 |
+
"step": 52200
|
7319 |
}
|
7320 |
],
|
7321 |
"logging_steps": 50,
|