Training in progress, step 52000, checkpoint
Browse files
last-checkpoint/README.md
CHANGED
@@ -1193,6 +1193,10 @@ You can finetune this model on your own dataset.
|
|
1193 |
| 0.9136 | 51700 | 0.3088 |
|
1194 |
| 0.9145 | 51750 | 0.2287 |
|
1195 |
| 0.9153 | 51800 | 0.2067 |
|
|
|
|
|
|
|
|
|
1196 |
|
1197 |
|
1198 |
### Framework Versions
|
|
|
1193 |
| 0.9136 | 51700 | 0.3088 |
|
1194 |
| 0.9145 | 51750 | 0.2287 |
|
1195 |
| 0.9153 | 51800 | 0.2067 |
|
1196 |
+
| 0.9162 | 51850 | 0.2735 |
|
1197 |
+
| 0.9171 | 51900 | 0.3976 |
|
1198 |
+
| 0.9180 | 51950 | 0.2939 |
|
1199 |
+
| 0.9189 | 52000 | 0.3193 |
|
1200 |
|
1201 |
|
1202 |
### Framework Versions
|
last-checkpoint/model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 90864192
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:64df739ab78548e5d75f993ab6041c207785adcb30fa9a57cf9234173976387d
|
3 |
size 90864192
|
last-checkpoint/optimizer.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 180609210
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ab3798d7d967dd27d94d9da8c3b443a2ae8d98157d0a447c72ba241256385ef3
|
3 |
size 180609210
|
last-checkpoint/rng_state.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 14244
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1bf77e2ef33f60ef48f8a5fc09cb1943760ae6ba4d88634c23d14cfcf6cad117
|
3 |
size 14244
|
last-checkpoint/scaler.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 988
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:12597bbc3e3311f727af17ce6725c67e2c62ce8d20a5da4fcf3ead6fc2b4cd3a
|
3 |
size 988
|
last-checkpoint/scheduler.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1064
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:69967b924386ed794e36fcb2fe2f94715b55410c1d3076df0af1214b0c14df7b
|
3 |
size 1064
|
last-checkpoint/trainer_state.json
CHANGED
@@ -2,9 +2,9 @@
|
|
2 |
"best_global_step": null,
|
3 |
"best_metric": null,
|
4 |
"best_model_checkpoint": null,
|
5 |
-
"epoch": 0.
|
6 |
"eval_steps": 500,
|
7 |
-
"global_step":
|
8 |
"is_hyper_param_search": false,
|
9 |
"is_local_process_zero": true,
|
10 |
"is_world_process_zero": true,
|
@@ -7260,6 +7260,34 @@
|
|
7260 |
"learning_rate": 4.724038404900748e-06,
|
7261 |
"loss": 0.2067,
|
7262 |
"step": 51800
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
7263 |
}
|
7264 |
],
|
7265 |
"logging_steps": 50,
|
|
|
2 |
"best_global_step": null,
|
3 |
"best_metric": null,
|
4 |
"best_model_checkpoint": null,
|
5 |
+
"epoch": 0.9188740259051793,
|
6 |
"eval_steps": 500,
|
7 |
+
"global_step": 52000,
|
8 |
"is_hyper_param_search": false,
|
9 |
"is_local_process_zero": true,
|
10 |
"is_world_process_zero": true,
|
|
|
7260 |
"learning_rate": 4.724038404900748e-06,
|
7261 |
"loss": 0.2067,
|
7262 |
"step": 51800
|
7263 |
+
},
|
7264 |
+
{
|
7265 |
+
"epoch": 0.9162234277535297,
|
7266 |
+
"grad_norm": 1.1146478652954102,
|
7267 |
+
"learning_rate": 4.674952386562212e-06,
|
7268 |
+
"loss": 0.2735,
|
7269 |
+
"step": 51850
|
7270 |
+
},
|
7271 |
+
{
|
7272 |
+
"epoch": 0.9171069604707462,
|
7273 |
+
"grad_norm": 2.2454397678375244,
|
7274 |
+
"learning_rate": 4.625866368223675e-06,
|
7275 |
+
"loss": 0.3976,
|
7276 |
+
"step": 51900
|
7277 |
+
},
|
7278 |
+
{
|
7279 |
+
"epoch": 0.9179904931879628,
|
7280 |
+
"grad_norm": 1.902377724647522,
|
7281 |
+
"learning_rate": 4.576780349885139e-06,
|
7282 |
+
"loss": 0.2939,
|
7283 |
+
"step": 51950
|
7284 |
+
},
|
7285 |
+
{
|
7286 |
+
"epoch": 0.9188740259051793,
|
7287 |
+
"grad_norm": 4.320808410644531,
|
7288 |
+
"learning_rate": 4.527694331546602e-06,
|
7289 |
+
"loss": 0.3193,
|
7290 |
+
"step": 52000
|
7291 |
}
|
7292 |
],
|
7293 |
"logging_steps": 50,
|