Training in progress, step 54000, checkpoint
Browse files
last-checkpoint/README.md
CHANGED
@@ -1233,6 +1233,10 @@ You can finetune this model on your own dataset.
|
|
1233 |
| 0.9489 | 53700 | 0.303 |
|
1234 |
| 0.9498 | 53750 | 0.2651 |
|
1235 |
| 0.9507 | 53800 | 0.3384 |
|
|
|
|
|
|
|
|
|
1236 |
|
1237 |
|
1238 |
### Framework Versions
|
|
|
1233 |
| 0.9489 | 53700 | 0.303 |
|
1234 |
| 0.9498 | 53750 | 0.2651 |
|
1235 |
| 0.9507 | 53800 | 0.3384 |
|
1236 |
+
| 0.9516 | 53850 | 0.3324 |
|
1237 |
+
| 0.9524 | 53900 | 0.2253 |
|
1238 |
+
| 0.9533 | 53950 | 0.2942 |
|
1239 |
+
| 0.9542 | 54000 | 0.2997 |
|
1240 |
|
1241 |
|
1242 |
### Framework Versions
|
last-checkpoint/model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 90864192
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d367b7e3094b9509638dc3aab8cd20aa7d72d8a2079791ccc62c560157ab98a0
|
3 |
size 90864192
|
last-checkpoint/optimizer.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 180609210
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ebfbc0071777229c33761182ed33d399969ad60e886668928a56deda972d74c1
|
3 |
size 180609210
|
last-checkpoint/rng_state.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 14244
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4b32f599e36a2e355058567f81a1cf5fcee6ab44b38d16fa4944caffd04dfbb3
|
3 |
size 14244
|
last-checkpoint/scaler.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 988
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8db4dd2df84f2b4b00fc6674bde1c97fccefdb7d0ae1f644ab8647d522122a7c
|
3 |
size 988
|
last-checkpoint/scheduler.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1064
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f315466204b131c92fd6cdb19db01462071017aa8244ad37245b5ffab5418efa
|
3 |
size 1064
|
last-checkpoint/trainer_state.json
CHANGED
@@ -2,9 +2,9 @@
|
|
2 |
"best_global_step": null,
|
3 |
"best_metric": null,
|
4 |
"best_model_checkpoint": null,
|
5 |
-
"epoch": 0.
|
6 |
"eval_steps": 500,
|
7 |
-
"global_step":
|
8 |
"is_hyper_param_search": false,
|
9 |
"is_local_process_zero": true,
|
10 |
"is_world_process_zero": true,
|
@@ -7540,6 +7540,34 @@
|
|
7540 |
"learning_rate": 2.761579391726061e-06,
|
7541 |
"loss": 0.3384,
|
7542 |
"step": 53800
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
7543 |
}
|
7544 |
],
|
7545 |
"logging_steps": 50,
|
|
|
2 |
"best_global_step": null,
|
3 |
"best_metric": null,
|
4 |
"best_model_checkpoint": null,
|
5 |
+
"epoch": 0.95421533459384,
|
6 |
"eval_steps": 500,
|
7 |
+
"global_step": 54000,
|
8 |
"is_hyper_param_search": false,
|
9 |
"is_local_process_zero": true,
|
10 |
"is_world_process_zero": true,
|
|
|
7540 |
"learning_rate": 2.761579391726061e-06,
|
7541 |
"loss": 0.3384,
|
7542 |
"step": 53800
|
7543 |
+
},
|
7544 |
+
{
|
7545 |
+
"epoch": 0.9515647364421904,
|
7546 |
+
"grad_norm": 3.1194252967834473,
|
7547 |
+
"learning_rate": 2.712493373387524e-06,
|
7548 |
+
"loss": 0.3324,
|
7549 |
+
"step": 53850
|
7550 |
+
},
|
7551 |
+
{
|
7552 |
+
"epoch": 0.952448269159407,
|
7553 |
+
"grad_norm": 1.082737684249878,
|
7554 |
+
"learning_rate": 2.663407355048988e-06,
|
7555 |
+
"loss": 0.2253,
|
7556 |
+
"step": 53900
|
7557 |
+
},
|
7558 |
+
{
|
7559 |
+
"epoch": 0.9533318018766235,
|
7560 |
+
"grad_norm": 1.0127415657043457,
|
7561 |
+
"learning_rate": 2.614321336710452e-06,
|
7562 |
+
"loss": 0.2942,
|
7563 |
+
"step": 53950
|
7564 |
+
},
|
7565 |
+
{
|
7566 |
+
"epoch": 0.95421533459384,
|
7567 |
+
"grad_norm": 4.512701988220215,
|
7568 |
+
"learning_rate": 2.5652353183719152e-06,
|
7569 |
+
"loss": 0.2997,
|
7570 |
+
"step": 54000
|
7571 |
}
|
7572 |
],
|
7573 |
"logging_steps": 50,
|