Training in progress, step 40, checkpoint
Browse files
last-checkpoint/model-00001-of-00003.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4943178720
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:720105d2b88abf15d23994fec61854b0a1497a10d1d208715bd59904ab5936ff
|
3 |
size 4943178720
|
last-checkpoint/model-00002-of-00003.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4999819336
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:22f56733ac237ee5fada526e2a06e89d311e7ce1cb761f9b8f6986910b678378
|
3 |
size 4999819336
|
last-checkpoint/model-00003-of-00003.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4540532728
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:31711beccc0b973ef7bf69d348d844233b185f6888f0520ae136ada35d74f983
|
3 |
size 4540532728
|
last-checkpoint/optimizer.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 14710155092
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5dcb4aaff4751c7031e867ff29e6e2b9b4b0674cc9dd1b3848e0ceb758301a28
|
3 |
size 14710155092
|
last-checkpoint/trainer_state.json
CHANGED
@@ -11,37 +11,37 @@
|
|
11 |
{
|
12 |
"epoch": 0.019230769230769232,
|
13 |
"eval_loss": 1.8673125505447388,
|
14 |
-
"eval_runtime": 14.
|
15 |
-
"eval_samples_per_second": 101.
|
16 |
-
"eval_steps_per_second": 6.
|
17 |
"step": 1
|
18 |
},
|
19 |
{
|
20 |
"epoch": 0.19230769230769232,
|
21 |
-
"grad_norm":
|
22 |
"learning_rate": 6.666666666666667e-05,
|
23 |
-
"loss": 2.
|
24 |
"step": 10
|
25 |
},
|
26 |
{
|
27 |
"epoch": 0.38461538461538464,
|
28 |
-
"grad_norm":
|
29 |
"learning_rate": 0.00013333333333333334,
|
30 |
-
"loss":
|
31 |
"step": 20
|
32 |
},
|
33 |
{
|
34 |
"epoch": 0.5769230769230769,
|
35 |
-
"grad_norm":
|
36 |
"learning_rate": 0.0002,
|
37 |
-
"loss":
|
38 |
"step": 30
|
39 |
},
|
40 |
{
|
41 |
"epoch": 0.7692307692307693,
|
42 |
-
"grad_norm":
|
43 |
"learning_rate": 0.00019984815164333163,
|
44 |
-
"loss":
|
45 |
"step": 40
|
46 |
}
|
47 |
],
|
|
|
11 |
{
|
12 |
"epoch": 0.019230769230769232,
|
13 |
"eval_loss": 1.8673125505447388,
|
14 |
+
"eval_runtime": 14.7715,
|
15 |
+
"eval_samples_per_second": 101.615,
|
16 |
+
"eval_steps_per_second": 6.364,
|
17 |
"step": 1
|
18 |
},
|
19 |
{
|
20 |
"epoch": 0.19230769230769232,
|
21 |
+
"grad_norm": 18.375,
|
22 |
"learning_rate": 6.666666666666667e-05,
|
23 |
+
"loss": 2.4377,
|
24 |
"step": 10
|
25 |
},
|
26 |
{
|
27 |
"epoch": 0.38461538461538464,
|
28 |
+
"grad_norm": 80.5,
|
29 |
"learning_rate": 0.00013333333333333334,
|
30 |
+
"loss": 2.8471,
|
31 |
"step": 20
|
32 |
},
|
33 |
{
|
34 |
"epoch": 0.5769230769230769,
|
35 |
+
"grad_norm": 1200.0,
|
36 |
"learning_rate": 0.0002,
|
37 |
+
"loss": 7.8725,
|
38 |
"step": 30
|
39 |
},
|
40 |
{
|
41 |
"epoch": 0.7692307692307693,
|
42 |
+
"grad_norm": 37.25,
|
43 |
"learning_rate": 0.00019984815164333163,
|
44 |
+
"loss": 13.1972,
|
45 |
"step": 40
|
46 |
}
|
47 |
],
|
last-checkpoint/training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 6776
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:53ebcd35271d188c087a5f00ee35959f144cc8fbcdfc0d1744678c3f065510bd
|
3 |
size 6776
|