Training in progress, epoch 10
Browse files
model-00001-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4877660776
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:80bfb9bfadf311c23337d56daf925e6ada11ac6ea69174a7ebb5b34885b81b76
|
3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4932751008
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5268576b765f17ae774e539b6aecb8b1cad52a168a80aec4d4207b372b258d6f
|
3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4330865200
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:398a0d1c23eec2055ffa74e0a07a71857ba404e9b1e4e09f08b00e9f86630c0a
|
3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1089994880
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9242d2ffe140cfba72f7e05d90f7a540804409b106c55fdbf8a7dcae5821d5e0
|
3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
@@ -98,3 +98,11 @@
|
|
98 |
{"current_steps": 98, "total_steps": 117, "loss": 0.2609, "lr": 7.863952067298042e-07, "epoch": 10.30379746835443, "percentage": 83.76, "elapsed_time": "1:18:11", "remaining_time": "0:15:09"}
|
99 |
{"current_steps": 99, "total_steps": 117, "loss": 0.2403, "lr": 7.077560319906696e-07, "epoch": 10.405063291139241, "percentage": 84.62, "elapsed_time": "1:18:56", "remaining_time": "0:14:21"}
|
100 |
{"current_steps": 100, "total_steps": 117, "loss": 0.2876, "lr": 6.329589969143518e-07, "epoch": 10.50632911392405, "percentage": 85.47, "elapsed_time": "1:19:38", "remaining_time": "0:13:32"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
98 |
{"current_steps": 98, "total_steps": 117, "loss": 0.2609, "lr": 7.863952067298042e-07, "epoch": 10.30379746835443, "percentage": 83.76, "elapsed_time": "1:18:11", "remaining_time": "0:15:09"}
|
99 |
{"current_steps": 99, "total_steps": 117, "loss": 0.2403, "lr": 7.077560319906696e-07, "epoch": 10.405063291139241, "percentage": 84.62, "elapsed_time": "1:18:56", "remaining_time": "0:14:21"}
|
100 |
{"current_steps": 100, "total_steps": 117, "loss": 0.2876, "lr": 6.329589969143518e-07, "epoch": 10.50632911392405, "percentage": 85.47, "elapsed_time": "1:19:38", "remaining_time": "0:13:32"}
|
101 |
+
{"current_steps": 101, "total_steps": 117, "loss": 0.277, "lr": 5.620710549772295e-07, "epoch": 10.60759493670886, "percentage": 86.32, "elapsed_time": "1:20:23", "remaining_time": "0:12:44"}
|
102 |
+
{"current_steps": 102, "total_steps": 117, "loss": 0.2838, "lr": 4.951556604879049e-07, "epoch": 10.708860759493671, "percentage": 87.18, "elapsed_time": "1:21:01", "remaining_time": "0:11:54"}
|
103 |
+
{"current_steps": 103, "total_steps": 117, "loss": 0.256, "lr": 4.322727117869951e-07, "epoch": 10.810126582278482, "percentage": 88.03, "elapsed_time": "1:21:43", "remaining_time": "0:11:06"}
|
104 |
+
{"current_steps": 104, "total_steps": 117, "loss": 0.2958, "lr": 3.734784976300165e-07, "epoch": 10.91139240506329, "percentage": 88.89, "elapsed_time": "1:22:28", "remaining_time": "0:10:18"}
|
105 |
+
{"current_steps": 105, "total_steps": 117, "loss": 0.2405, "lr": 3.18825646801314e-07, "epoch": 11.050632911392405, "percentage": 89.74, "elapsed_time": "1:24:14", "remaining_time": "0:09:37"}
|
106 |
+
{"current_steps": 106, "total_steps": 117, "loss": 0.2295, "lr": 2.6836308100417874e-07, "epoch": 11.151898734177216, "percentage": 90.6, "elapsed_time": "1:24:57", "remaining_time": "0:08:49"}
|
107 |
+
{"current_steps": 107, "total_steps": 117, "loss": 0.2759, "lr": 2.2213597106929608e-07, "epoch": 11.253164556962025, "percentage": 91.45, "elapsed_time": "1:25:42", "remaining_time": "0:08:00"}
|
108 |
+
{"current_steps": 108, "total_steps": 117, "loss": 0.2662, "lr": 1.801856965207338e-07, "epoch": 11.354430379746836, "percentage": 92.31, "elapsed_time": "1:26:26", "remaining_time": "0:07:12"}
|