Training in progress, epoch 5
Browse files
model-00001-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4877660776
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:188189b2039c1fdadd95494fd6b160d1b99ff049e1c8aaedb80cdc22bb0d14e1
|
3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4932751008
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:71e4c837c479906e5319e9da1cba8528c9b95b6e7fb58491832f66649e78432c
|
3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4330865200
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cf26346e257d235fb761150db580c9bc434bfded46cb7b67063bc9adb4119b14
|
3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1089994880
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d00576041ba1ff80d2b45e09261e1a06c0c1f6be48567d91e638b7b291bc65c8
|
3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
@@ -61,3 +61,16 @@
|
|
61 |
{"current_steps": 53, "total_steps": 70, "loss": 0.1889, "lr": 3.3831416240314085e-06, "epoch": 5.088, "percentage": 75.71, "elapsed_time": "0:54:31", "remaining_time": "0:17:29"}
|
62 |
{"current_steps": 54, "total_steps": 70, "loss": 0.1604, "lr": 3.017631819139273e-06, "epoch": 5.184, "percentage": 77.14, "elapsed_time": "0:55:27", "remaining_time": "0:16:25"}
|
63 |
{"current_steps": 55, "total_steps": 70, "loss": 0.1715, "lr": 2.669481281701739e-06, "epoch": 5.28, "percentage": 78.57, "elapsed_time": "0:56:17", "remaining_time": "0:15:21"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
61 |
{"current_steps": 53, "total_steps": 70, "loss": 0.1889, "lr": 3.3831416240314085e-06, "epoch": 5.088, "percentage": 75.71, "elapsed_time": "0:54:31", "remaining_time": "0:17:29"}
|
62 |
{"current_steps": 54, "total_steps": 70, "loss": 0.1604, "lr": 3.017631819139273e-06, "epoch": 5.184, "percentage": 77.14, "elapsed_time": "0:55:27", "remaining_time": "0:16:25"}
|
63 |
{"current_steps": 55, "total_steps": 70, "loss": 0.1715, "lr": 2.669481281701739e-06, "epoch": 5.28, "percentage": 78.57, "elapsed_time": "0:56:17", "remaining_time": "0:15:21"}
|
64 |
+
{"current_steps": 56, "total_steps": 70, "loss": 0.1748, "lr": 2.339555568810221e-06, "epoch": 5.376, "percentage": 80.0, "elapsed_time": "0:57:14", "remaining_time": "0:14:18"}
|
65 |
+
{"current_steps": 57, "total_steps": 70, "loss": 0.1669, "lr": 2.0286749277707783e-06, "epoch": 5.4719999999999995, "percentage": 81.43, "elapsed_time": "0:58:11", "remaining_time": "0:13:16"}
|
66 |
+
{"current_steps": 58, "total_steps": 70, "loss": 0.2036, "lr": 1.7376122568400533e-06, "epoch": 5.568, "percentage": 82.86, "elapsed_time": "0:59:12", "remaining_time": "0:12:14"}
|
67 |
+
{"current_steps": 59, "total_steps": 70, "loss": 0.2097, "lr": 1.467091183678444e-06, "epoch": 5.664, "percentage": 84.29, "elapsed_time": "1:00:17", "remaining_time": "0:11:14"}
|
68 |
+
{"current_steps": 60, "total_steps": 70, "loss": 0.1764, "lr": 1.2177842662977136e-06, "epoch": 5.76, "percentage": 85.71, "elapsed_time": "1:01:14", "remaining_time": "0:10:12"}
|
69 |
+
{"current_steps": 61, "total_steps": 70, "loss": 0.204, "lr": 9.903113209758098e-07, "epoch": 5.856, "percentage": 87.14, "elapsed_time": "1:02:10", "remaining_time": "0:09:10"}
|
70 |
+
{"current_steps": 62, "total_steps": 70, "loss": 0.2055, "lr": 7.852378812959227e-07, "epoch": 5.952, "percentage": 88.57, "elapsed_time": "1:03:13", "remaining_time": "0:08:09"}
|
71 |
+
{"current_steps": 63, "total_steps": 70, "loss": 0.1803, "lr": 6.030737921409169e-07, "epoch": 6.048, "percentage": 90.0, "elapsed_time": "1:05:24", "remaining_time": "0:07:16"}
|
72 |
+
{"current_steps": 64, "total_steps": 70, "loss": 0.1836, "lr": 4.4427194213859216e-07, "epoch": 6.144, "percentage": 91.43, "elapsed_time": "1:06:26", "remaining_time": "0:06:13"}
|
73 |
+
{"current_steps": 65, "total_steps": 70, "loss": 0.1562, "lr": 3.0922713770922155e-07, "epoch": 6.24, "percentage": 92.86, "elapsed_time": "1:07:17", "remaining_time": "0:05:10"}
|
74 |
+
{"current_steps": 66, "total_steps": 70, "loss": 0.1752, "lr": 1.9827512151456175e-07, "epoch": 6.336, "percentage": 94.29, "elapsed_time": "1:08:11", "remaining_time": "0:04:07"}
|
75 |
+
{"current_steps": 67, "total_steps": 70, "loss": 0.1824, "lr": 1.1169173774871478e-07, "epoch": 6.432, "percentage": 95.71, "elapsed_time": "1:09:05", "remaining_time": "0:03:05"}
|
76 |
+
{"current_steps": 68, "total_steps": 70, "loss": 0.1875, "lr": 4.9692246345985905e-08, "epoch": 6.5280000000000005, "percentage": 97.14, "elapsed_time": "1:10:12", "remaining_time": "0:02:03"}
|