Training in progress, epoch 8
Browse files
model-00001-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4877660776
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:51a86cbb334d6d92a991c89d9f33c1fcd70bfe0214407c633d9895efb132e4a4
|
3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4932751008
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:547d5b7c7e6e27ac9d692ce0a2f5c1bd6206ccc28c6389fbee3eec8b30e1ed6d
|
3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4330865200
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f8415a69f086436620b224ea4bd8b8badd7a21a3ac8da12a8457d9805a462227
|
3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1089994880
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:76d2425fe3e44094f95307631ba34ce0f2ec3018988af9fc610966e2ca7f6e1d
|
3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
@@ -78,3 +78,14 @@
|
|
78 |
{"current_steps": 78, "total_steps": 117, "loss": 0.3053, "lr": 3.0348748417303826e-06, "epoch": 8.20253164556962, "percentage": 66.67, "elapsed_time": "1:00:13", "remaining_time": "0:30:06"}
|
79 |
{"current_steps": 79, "total_steps": 117, "loss": 0.2778, "lr": 2.8982138584521734e-06, "epoch": 8.30379746835443, "percentage": 67.52, "elapsed_time": "1:00:52", "remaining_time": "0:29:17"}
|
80 |
{"current_steps": 80, "total_steps": 117, "loss": 0.2992, "lr": 2.7634342584218364e-06, "epoch": 8.405063291139241, "percentage": 68.38, "elapsed_time": "1:01:28", "remaining_time": "0:28:26"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
78 |
{"current_steps": 78, "total_steps": 117, "loss": 0.3053, "lr": 3.0348748417303826e-06, "epoch": 8.20253164556962, "percentage": 66.67, "elapsed_time": "1:00:13", "remaining_time": "0:30:06"}
|
79 |
{"current_steps": 79, "total_steps": 117, "loss": 0.2778, "lr": 2.8982138584521734e-06, "epoch": 8.30379746835443, "percentage": 67.52, "elapsed_time": "1:00:52", "remaining_time": "0:29:17"}
|
80 |
{"current_steps": 80, "total_steps": 117, "loss": 0.2992, "lr": 2.7634342584218364e-06, "epoch": 8.405063291139241, "percentage": 68.38, "elapsed_time": "1:01:28", "remaining_time": "0:28:26"}
|
81 |
+
{"current_steps": 81, "total_steps": 117, "loss": 0.297, "lr": 2.6306566876350072e-06, "epoch": 8.50632911392405, "percentage": 69.23, "elapsed_time": "1:02:07", "remaining_time": "0:27:36"}
|
82 |
+
{"current_steps": 82, "total_steps": 117, "loss": 0.3169, "lr": 2.5000000000000015e-06, "epoch": 8.60759493670886, "percentage": 70.09, "elapsed_time": "1:02:46", "remaining_time": "0:26:47"}
|
83 |
+
{"current_steps": 83, "total_steps": 117, "loss": 0.2725, "lr": 2.371581150947476e-06, "epoch": 8.708860759493671, "percentage": 70.94, "elapsed_time": "1:03:25", "remaining_time": "0:25:58"}
|
84 |
+
{"current_steps": 84, "total_steps": 117, "loss": 0.2936, "lr": 2.245515092739488e-06, "epoch": 8.810126582278482, "percentage": 71.79, "elapsed_time": "1:04:06", "remaining_time": "0:25:11"}
|
85 |
+
{"current_steps": 85, "total_steps": 117, "loss": 0.2858, "lr": 2.1219146715716332e-06, "epoch": 8.91139240506329, "percentage": 72.65, "elapsed_time": "1:04:47", "remaining_time": "0:24:23"}
|
86 |
+
{"current_steps": 86, "total_steps": 117, "loss": 0.245, "lr": 2.0008905265604316e-06, "epoch": 9.050632911392405, "percentage": 73.5, "elapsed_time": "1:06:23", "remaining_time": "0:23:56"}
|
87 |
+
{"current_steps": 87, "total_steps": 117, "loss": 0.263, "lr": 1.8825509907063328e-06, "epoch": 9.151898734177216, "percentage": 74.36, "elapsed_time": "1:06:57", "remaining_time": "0:23:05"}
|
88 |
+
{"current_steps": 88, "total_steps": 117, "loss": 0.2263, "lr": 1.7670019939210025e-06, "epoch": 9.253164556962025, "percentage": 75.21, "elapsed_time": "1:07:36", "remaining_time": "0:22:16"}
|
89 |
+
{"current_steps": 89, "total_steps": 117, "loss": 0.2687, "lr": 1.6543469682057105e-06, "epoch": 9.354430379746836, "percentage": 76.07, "elapsed_time": "1:08:21", "remaining_time": "0:21:30"}
|
90 |
+
{"current_steps": 90, "total_steps": 117, "loss": 0.2365, "lr": 1.544686755065677e-06, "epoch": 9.455696202531646, "percentage": 76.92, "elapsed_time": "1:09:02", "remaining_time": "0:20:42"}
|
91 |
+
{"current_steps": 91, "total_steps": 117, "loss": 0.2839, "lr": 1.438119515243277e-06, "epoch": 9.556962025316455, "percentage": 77.78, "elapsed_time": "1:09:47", "remaining_time": "0:19:56"}
|