Training in progress, epoch 5
Browse files
model-00001-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4877660776
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:101202fd2623dccecabf0eac53603f73fa7fba94b4ab4709eafb42825f039d77
|
3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4932751008
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:82e2db3b121ce681f010dd9c244dffff81b202f4f3bf4d6431c42bd3fd3633a6
|
3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4330865200
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4ebd48b340b336fe9b332ea2e8ce13cf64bfc4cfb686e6483ba38f2d732aef49
|
3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1089994880
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e45839859321d1c0143cf94255368effcdc83b18daafecea437a6daf17078987
|
3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
@@ -60,3 +60,11 @@
|
|
60 |
{"current_steps": 60, "total_steps": 70, "loss": 0.2433, "lr": 1.2177842662977136e-06, "epoch": 5.78125, "percentage": 85.71, "elapsed_time": "0:21:24", "remaining_time": "0:03:34"}
|
61 |
{"current_steps": 61, "total_steps": 70, "loss": 0.2232, "lr": 9.903113209758098e-07, "epoch": 5.875, "percentage": 87.14, "elapsed_time": "0:21:38", "remaining_time": "0:03:11"}
|
62 |
{"current_steps": 62, "total_steps": 70, "loss": 0.1921, "lr": 7.852378812959227e-07, "epoch": 5.96875, "percentage": 88.57, "elapsed_time": "0:21:51", "remaining_time": "0:02:49"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
60 |
{"current_steps": 60, "total_steps": 70, "loss": 0.2433, "lr": 1.2177842662977136e-06, "epoch": 5.78125, "percentage": 85.71, "elapsed_time": "0:21:24", "remaining_time": "0:03:34"}
|
61 |
{"current_steps": 61, "total_steps": 70, "loss": 0.2232, "lr": 9.903113209758098e-07, "epoch": 5.875, "percentage": 87.14, "elapsed_time": "0:21:38", "remaining_time": "0:03:11"}
|
62 |
{"current_steps": 62, "total_steps": 70, "loss": 0.1921, "lr": 7.852378812959227e-07, "epoch": 5.96875, "percentage": 88.57, "elapsed_time": "0:21:51", "remaining_time": "0:02:49"}
|
63 |
+
{"current_steps": 63, "total_steps": 70, "loss": 0.2026, "lr": 6.030737921409169e-07, "epoch": 6.09375, "percentage": 90.0, "elapsed_time": "0:23:47", "remaining_time": "0:02:38"}
|
64 |
+
{"current_steps": 64, "total_steps": 70, "loss": 0.1918, "lr": 4.4427194213859216e-07, "epoch": 6.1875, "percentage": 91.43, "elapsed_time": "0:23:57", "remaining_time": "0:02:14"}
|
65 |
+
{"current_steps": 65, "total_steps": 70, "loss": 0.2292, "lr": 3.0922713770922155e-07, "epoch": 6.28125, "percentage": 92.86, "elapsed_time": "0:24:09", "remaining_time": "0:01:51"}
|
66 |
+
{"current_steps": 66, "total_steps": 70, "loss": 0.2002, "lr": 1.9827512151456175e-07, "epoch": 6.375, "percentage": 94.29, "elapsed_time": "0:24:23", "remaining_time": "0:01:28"}
|
67 |
+
{"current_steps": 67, "total_steps": 70, "loss": 0.2056, "lr": 1.1169173774871478e-07, "epoch": 6.46875, "percentage": 95.71, "elapsed_time": "0:24:37", "remaining_time": "0:01:06"}
|
68 |
+
{"current_steps": 68, "total_steps": 70, "loss": 0.2116, "lr": 4.9692246345985905e-08, "epoch": 6.5625, "percentage": 97.14, "elapsed_time": "0:24:51", "remaining_time": "0:00:43"}
|
69 |
+
{"current_steps": 69, "total_steps": 70, "loss": 0.2591, "lr": 1.2430787810776556e-08, "epoch": 6.65625, "percentage": 98.57, "elapsed_time": "0:25:07", "remaining_time": "0:00:21"}
|
70 |
+
{"current_steps": 70, "total_steps": 70, "loss": 0.2233, "lr": 0.0, "epoch": 6.75, "percentage": 100.0, "elapsed_time": "0:25:19", "remaining_time": "0:00:00"}
|