Training in progress, epoch 9
Browse files
model-00001-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4877660776
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c0aa8dc106145cfcbe0627f9aefe30d07a925693c8eb2cc27c1c82a73403ca25
|
3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4932751008
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:185836b0c081caeb7d47427b2fe705067b8beccd4e9e1cb0f8acdb1c272f8e36
|
3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4330865200
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:151b7498ee63d492c70bfca9583c45c6af20661d3c3bb68e6bf0e4a8476a8453
|
3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1089994880
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:147077ecd4b7a712f80101af0524f00293005f51dd00c9fa6a9883ce32f88c8c
|
3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
@@ -78,3 +78,25 @@
|
|
78 |
{"current_steps": 78, "total_steps": 130, "loss": 0.1806, "lr": 4.131759111665349e-06, "epoch": 7.8, "percentage": 60.0, "elapsed_time": "0:24:08", "remaining_time": "0:16:05"}
|
79 |
{"current_steps": 79, "total_steps": 130, "loss": 0.0962, "lr": 3.999871531119779e-06, "epoch": 7.9, "percentage": 60.77, "elapsed_time": "0:24:13", "remaining_time": "0:15:38"}
|
80 |
{"current_steps": 80, "total_steps": 130, "loss": 0.2206, "lr": 3.86870498785139e-06, "epoch": 8.0, "percentage": 61.54, "elapsed_time": "0:24:25", "remaining_time": "0:15:15"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
78 |
{"current_steps": 78, "total_steps": 130, "loss": 0.1806, "lr": 4.131759111665349e-06, "epoch": 7.8, "percentage": 60.0, "elapsed_time": "0:24:08", "remaining_time": "0:16:05"}
|
79 |
{"current_steps": 79, "total_steps": 130, "loss": 0.0962, "lr": 3.999871531119779e-06, "epoch": 7.9, "percentage": 60.77, "elapsed_time": "0:24:13", "remaining_time": "0:15:38"}
|
80 |
{"current_steps": 80, "total_steps": 130, "loss": 0.2206, "lr": 3.86870498785139e-06, "epoch": 8.0, "percentage": 61.54, "elapsed_time": "0:24:25", "remaining_time": "0:15:15"}
|
81 |
+
{"current_steps": 81, "total_steps": 130, "loss": 0.1653, "lr": 3.7383540456788915e-06, "epoch": 8.1, "percentage": 62.31, "elapsed_time": "0:26:34", "remaining_time": "0:16:04"}
|
82 |
+
{"current_steps": 82, "total_steps": 130, "loss": 0.0885, "lr": 3.6089126804177373e-06, "epoch": 8.2, "percentage": 63.08, "elapsed_time": "0:26:40", "remaining_time": "0:15:37"}
|
83 |
+
{"current_steps": 83, "total_steps": 130, "loss": 0.1024, "lr": 3.480474212128766e-06, "epoch": 8.3, "percentage": 63.85, "elapsed_time": "0:26:48", "remaining_time": "0:15:10"}
|
84 |
+
{"current_steps": 84, "total_steps": 130, "loss": 0.1749, "lr": 3.3531312378396026e-06, "epoch": 8.4, "percentage": 64.62, "elapsed_time": "0:26:57", "remaining_time": "0:14:45"}
|
85 |
+
{"current_steps": 85, "total_steps": 130, "loss": 0.1421, "lr": 3.226975564787322e-06, "epoch": 8.5, "percentage": 65.38, "elapsed_time": "0:27:05", "remaining_time": "0:14:20"}
|
86 |
+
{"current_steps": 86, "total_steps": 130, "loss": 0.1319, "lr": 3.1020981442305187e-06, "epoch": 8.6, "percentage": 66.15, "elapsed_time": "0:27:13", "remaining_time": "0:13:55"}
|
87 |
+
{"current_steps": 87, "total_steps": 130, "loss": 0.1755, "lr": 2.978589005878476e-06, "epoch": 8.7, "percentage": 66.92, "elapsed_time": "0:27:23", "remaining_time": "0:13:32"}
|
88 |
+
{"current_steps": 88, "total_steps": 130, "loss": 0.1519, "lr": 2.8565371929847286e-06, "epoch": 8.8, "percentage": 67.69, "elapsed_time": "0:27:34", "remaining_time": "0:13:09"}
|
89 |
+
{"current_steps": 89, "total_steps": 130, "loss": 0.1402, "lr": 2.736030698151815e-06, "epoch": 8.9, "percentage": 68.46, "elapsed_time": "0:27:43", "remaining_time": "0:12:46"}
|
90 |
+
{"current_steps": 90, "total_steps": 130, "loss": 0.091, "lr": 2.6171563998934605e-06, "epoch": 9.0, "percentage": 69.23, "elapsed_time": "0:27:51", "remaining_time": "0:12:22"}
|
91 |
+
{"current_steps": 91, "total_steps": 130, "loss": 0.0827, "lr": 2.5000000000000015e-06, "epoch": 9.1, "percentage": 70.0, "elapsed_time": "0:30:30", "remaining_time": "0:13:04"}
|
92 |
+
{"current_steps": 92, "total_steps": 130, "loss": 0.1305, "lr": 2.384645961752113e-06, "epoch": 9.2, "percentage": 70.77, "elapsed_time": "0:30:40", "remaining_time": "0:12:40"}
|
93 |
+
{"current_steps": 93, "total_steps": 130, "loss": 0.072, "lr": 2.2711774490274767e-06, "epoch": 9.3, "percentage": 71.54, "elapsed_time": "0:30:45", "remaining_time": "0:12:14"}
|
94 |
+
{"current_steps": 94, "total_steps": 130, "loss": 0.1218, "lr": 2.159676266344222e-06, "epoch": 9.4, "percentage": 72.31, "elapsed_time": "0:30:54", "remaining_time": "0:11:50"}
|
95 |
+
{"current_steps": 95, "total_steps": 130, "loss": 0.1264, "lr": 2.050222799884387e-06, "epoch": 9.5, "percentage": 73.08, "elapsed_time": "0:31:02", "remaining_time": "0:11:26"}
|
96 |
+
{"current_steps": 96, "total_steps": 130, "loss": 0.15, "lr": 1.942895959539939e-06, "epoch": 9.6, "percentage": 73.85, "elapsed_time": "0:31:10", "remaining_time": "0:11:02"}
|
97 |
+
{"current_steps": 97, "total_steps": 130, "loss": 0.098, "lr": 1.8377731220231144e-06, "epoch": 9.7, "percentage": 74.62, "elapsed_time": "0:31:17", "remaining_time": "0:10:38"}
|
98 |
+
{"current_steps": 98, "total_steps": 130, "loss": 0.1517, "lr": 1.7349300750820758e-06, "epoch": 9.8, "percentage": 75.38, "elapsed_time": "0:31:25", "remaining_time": "0:10:15"}
|
99 |
+
{"current_steps": 99, "total_steps": 130, "loss": 0.0969, "lr": 1.6344409628621482e-06, "epoch": 9.9, "percentage": 76.15, "elapsed_time": "0:31:33", "remaining_time": "0:09:52"}
|
100 |
+
{"current_steps": 100, "total_steps": 130, "loss": 0.1355, "lr": 1.5363782324520033e-06, "epoch": 10.0, "percentage": 76.92, "elapsed_time": "0:31:43", "remaining_time": "0:09:31"}
|
101 |
+
{"current_steps": 101, "total_steps": 130, "loss": 0.0391, "lr": 1.4408125816532981e-06, "epoch": 10.1, "percentage": 77.69, "elapsed_time": "0:33:48", "remaining_time": "0:09:42"}
|
102 |
+
{"current_steps": 102, "total_steps": 130, "loss": 0.1106, "lr": 1.347812908011485e-06, "epoch": 10.2, "percentage": 78.46, "elapsed_time": "0:33:59", "remaining_time": "0:09:19"}
|