Training in progress, epoch 8
Browse files
model-00001-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4877660776
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0f57c3eff2884d1df440b3b62bf4862922e9377d962ab01c968396011eaa47ee
|
3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4932751008
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5eb7593156970237fdc6a467de7aa56654560db06c8971c9e9ecf88e309974b6
|
3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4330865200
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:93ce5340eef25311094ded3aac1de6a4eb9ee6fb9737d0d89beae15bcefdd0b6
|
3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1089994880
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e247c1b7daaa90f379253889424426afb77e81cb375e7e984911c7f9edeb9b85
|
3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
@@ -78,3 +78,18 @@
|
|
78 |
{"current_steps": 78, "total_steps": 117, "loss": 0.2946, "lr": 3.0348748417303826e-06, "epoch": 8.20253164556962, "percentage": 66.67, "elapsed_time": "1:01:24", "remaining_time": "0:30:42"}
|
79 |
{"current_steps": 79, "total_steps": 117, "loss": 0.2876, "lr": 2.8982138584521734e-06, "epoch": 8.30379746835443, "percentage": 67.52, "elapsed_time": "1:02:09", "remaining_time": "0:29:53"}
|
80 |
{"current_steps": 80, "total_steps": 117, "loss": 0.3127, "lr": 2.7634342584218364e-06, "epoch": 8.405063291139241, "percentage": 68.38, "elapsed_time": "1:02:48", "remaining_time": "0:29:02"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
78 |
{"current_steps": 78, "total_steps": 117, "loss": 0.2946, "lr": 3.0348748417303826e-06, "epoch": 8.20253164556962, "percentage": 66.67, "elapsed_time": "1:01:24", "remaining_time": "0:30:42"}
|
79 |
{"current_steps": 79, "total_steps": 117, "loss": 0.2876, "lr": 2.8982138584521734e-06, "epoch": 8.30379746835443, "percentage": 67.52, "elapsed_time": "1:02:09", "remaining_time": "0:29:53"}
|
80 |
{"current_steps": 80, "total_steps": 117, "loss": 0.3127, "lr": 2.7634342584218364e-06, "epoch": 8.405063291139241, "percentage": 68.38, "elapsed_time": "1:02:48", "remaining_time": "0:29:02"}
|
81 |
+
{"current_steps": 81, "total_steps": 117, "loss": 0.304, "lr": 2.6306566876350072e-06, "epoch": 8.50632911392405, "percentage": 69.23, "elapsed_time": "1:03:33", "remaining_time": "0:28:14"}
|
82 |
+
{"current_steps": 82, "total_steps": 117, "loss": 0.3259, "lr": 2.5000000000000015e-06, "epoch": 8.60759493670886, "percentage": 70.09, "elapsed_time": "1:04:10", "remaining_time": "0:27:23"}
|
83 |
+
{"current_steps": 83, "total_steps": 117, "loss": 0.31, "lr": 2.371581150947476e-06, "epoch": 8.708860759493671, "percentage": 70.94, "elapsed_time": "1:04:51", "remaining_time": "0:26:34"}
|
84 |
+
{"current_steps": 84, "total_steps": 117, "loss": 0.3248, "lr": 2.245515092739488e-06, "epoch": 8.810126582278482, "percentage": 71.79, "elapsed_time": "1:05:34", "remaining_time": "0:25:45"}
|
85 |
+
{"current_steps": 85, "total_steps": 117, "loss": 0.3359, "lr": 2.1219146715716332e-06, "epoch": 8.91139240506329, "percentage": 72.65, "elapsed_time": "1:06:15", "remaining_time": "0:24:56"}
|
86 |
+
{"current_steps": 86, "total_steps": 117, "loss": 0.3083, "lr": 2.0008905265604316e-06, "epoch": 9.050632911392405, "percentage": 73.5, "elapsed_time": "1:08:05", "remaining_time": "0:24:32"}
|
87 |
+
{"current_steps": 87, "total_steps": 117, "loss": 0.2697, "lr": 1.8825509907063328e-06, "epoch": 9.151898734177216, "percentage": 74.36, "elapsed_time": "1:08:44", "remaining_time": "0:23:42"}
|
88 |
+
{"current_steps": 88, "total_steps": 117, "loss": 0.294, "lr": 1.7670019939210025e-06, "epoch": 9.253164556962025, "percentage": 75.21, "elapsed_time": "1:09:25", "remaining_time": "0:22:52"}
|
89 |
+
{"current_steps": 89, "total_steps": 117, "loss": 0.2649, "lr": 1.6543469682057105e-06, "epoch": 9.354430379746836, "percentage": 76.07, "elapsed_time": "1:10:09", "remaining_time": "0:22:04"}
|
90 |
+
{"current_steps": 90, "total_steps": 117, "loss": 0.2425, "lr": 1.544686755065677e-06, "epoch": 9.455696202531646, "percentage": 76.92, "elapsed_time": "1:10:49", "remaining_time": "0:21:14"}
|
91 |
+
{"current_steps": 91, "total_steps": 117, "loss": 0.2892, "lr": 1.438119515243277e-06, "epoch": 9.556962025316455, "percentage": 77.78, "elapsed_time": "1:11:26", "remaining_time": "0:20:24"}
|
92 |
+
{"current_steps": 92, "total_steps": 117, "loss": 0.3171, "lr": 1.3347406408508695e-06, "epoch": 9.658227848101266, "percentage": 78.63, "elapsed_time": "1:12:08", "remaining_time": "0:19:36"}
|
93 |
+
{"current_steps": 93, "total_steps": 117, "loss": 0.2762, "lr": 1.234642669981946e-06, "epoch": 9.759493670886076, "percentage": 79.49, "elapsed_time": "1:12:51", "remaining_time": "0:18:48"}
|
94 |
+
{"current_steps": 94, "total_steps": 117, "loss": 0.3063, "lr": 1.137915203877003e-06, "epoch": 9.860759493670885, "percentage": 80.34, "elapsed_time": "1:13:38", "remaining_time": "0:18:01"}
|
95 |
+
{"current_steps": 95, "total_steps": 117, "loss": 0.2458, "lr": 1.044644826718295e-06, "epoch": 9.962025316455696, "percentage": 81.2, "elapsed_time": "1:14:19", "remaining_time": "0:17:12"}
|