Training in progress, epoch 4
Browse files
model-00001-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4877660776
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7698daf6d251549784ea1649d6032c997947645cc5aa4cc7f80c0c46c80273eb
|
3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4932751008
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a3b35502fecfd0511a75320a2a9d87ed1b4e2e0a6621d36d21846e7ef0d83467
|
3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4330865200
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1dfe13ec26799dbf87126f342e4e0c0ec5afdfaca6449fa785e9933ffea21ef4
|
3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1089994880
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:caf37ac2341388ea29beacf3f7d9191390a4784d598485cd1b7c1604a3be2466
|
3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
@@ -48,3 +48,14 @@
|
|
48 |
{"current_steps": 48, "total_steps": 70, "loss": 0.1904, "lr": 5.43789342646837e-06, "epoch": 4.571428571428571, "percentage": 68.57, "elapsed_time": "0:23:39", "remaining_time": "0:10:50"}
|
49 |
{"current_steps": 49, "total_steps": 70, "loss": 0.1865, "lr": 5.000000000000003e-06, "epoch": 4.666666666666667, "percentage": 70.0, "elapsed_time": "0:24:01", "remaining_time": "0:10:17"}
|
50 |
{"current_steps": 50, "total_steps": 70, "loss": 0.1748, "lr": 4.5745373613424075e-06, "epoch": 4.761904761904762, "percentage": 71.43, "elapsed_time": "0:24:17", "remaining_time": "0:09:42"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
48 |
{"current_steps": 48, "total_steps": 70, "loss": 0.1904, "lr": 5.43789342646837e-06, "epoch": 4.571428571428571, "percentage": 68.57, "elapsed_time": "0:23:39", "remaining_time": "0:10:50"}
|
49 |
{"current_steps": 49, "total_steps": 70, "loss": 0.1865, "lr": 5.000000000000003e-06, "epoch": 4.666666666666667, "percentage": 70.0, "elapsed_time": "0:24:01", "remaining_time": "0:10:17"}
|
50 |
{"current_steps": 50, "total_steps": 70, "loss": 0.1748, "lr": 4.5745373613424075e-06, "epoch": 4.761904761904762, "percentage": 71.43, "elapsed_time": "0:24:17", "remaining_time": "0:09:42"}
|
51 |
+
{"current_steps": 51, "total_steps": 70, "loss": 0.1672, "lr": 4.162563277652104e-06, "epoch": 4.857142857142857, "percentage": 72.86, "elapsed_time": "0:24:34", "remaining_time": "0:09:09"}
|
52 |
+
{"current_steps": 52, "total_steps": 70, "loss": 0.1941, "lr": 3.7651019814126656e-06, "epoch": 4.9523809523809526, "percentage": 74.29, "elapsed_time": "0:24:55", "remaining_time": "0:08:37"}
|
53 |
+
{"current_steps": 53, "total_steps": 70, "loss": 0.1631, "lr": 3.3831416240314085e-06, "epoch": 5.0476190476190474, "percentage": 75.71, "elapsed_time": "0:27:01", "remaining_time": "0:08:40"}
|
54 |
+
{"current_steps": 54, "total_steps": 70, "loss": 0.1847, "lr": 3.017631819139273e-06, "epoch": 5.142857142857143, "percentage": 77.14, "elapsed_time": "0:27:19", "remaining_time": "0:08:05"}
|
55 |
+
{"current_steps": 55, "total_steps": 70, "loss": 0.1626, "lr": 2.669481281701739e-06, "epoch": 5.238095238095238, "percentage": 78.57, "elapsed_time": "0:27:38", "remaining_time": "0:07:32"}
|
56 |
+
{"current_steps": 56, "total_steps": 70, "loss": 0.1512, "lr": 2.339555568810221e-06, "epoch": 5.333333333333333, "percentage": 80.0, "elapsed_time": "0:27:57", "remaining_time": "0:06:59"}
|
57 |
+
{"current_steps": 57, "total_steps": 70, "loss": 0.1708, "lr": 2.0286749277707783e-06, "epoch": 5.428571428571429, "percentage": 81.43, "elapsed_time": "0:28:15", "remaining_time": "0:06:26"}
|
58 |
+
{"current_steps": 58, "total_steps": 70, "loss": 0.1864, "lr": 1.7376122568400533e-06, "epoch": 5.523809523809524, "percentage": 82.86, "elapsed_time": "0:28:37", "remaining_time": "0:05:55"}
|
59 |
+
{"current_steps": 59, "total_steps": 70, "loss": 0.1478, "lr": 1.467091183678444e-06, "epoch": 5.619047619047619, "percentage": 84.29, "elapsed_time": "0:28:53", "remaining_time": "0:05:23"}
|
60 |
+
{"current_steps": 60, "total_steps": 70, "loss": 0.1831, "lr": 1.2177842662977136e-06, "epoch": 5.714285714285714, "percentage": 85.71, "elapsed_time": "0:29:16", "remaining_time": "0:04:52"}
|
61 |
+
{"current_steps": 61, "total_steps": 70, "loss": 0.1748, "lr": 9.903113209758098e-07, "epoch": 5.809523809523809, "percentage": 87.14, "elapsed_time": "0:29:37", "remaining_time": "0:04:22"}
|