Training in progress, epoch 3
Browse files
model-00001-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4877660776
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ca91e1448eb55f1df3b048d75992583112c995a703114d8cdc5abbfaff1feca9
|
3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4932751008
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bf2a6ca5f68e14c5edb94d8e4420b5518955aa98e66ee92213f389c6064d4811
|
3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4330865200
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:58a97b7bd5286b823b8d14f20b5e7d5d518c1534b5b8a55f395e460196b48d2f
|
3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1089994880
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:486d6da917b586afd369f3cbf34c8e7c8c0b4731ff1f0748a6a202020e49c3bd
|
3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
@@ -97,3 +97,37 @@
|
|
97 |
{"current_steps": 97, "total_steps": 224, "loss": 0.5393, "lr": 1.402448623755254e-05, "epoch": 2.962025316455696, "percentage": 43.3, "elapsed_time": "2:40:50", "remaining_time": "3:30:35"}
|
98 |
{"current_steps": 98, "total_steps": 224, "loss": 0.5532, "lr": 1.3880918526722497e-05, "epoch": 2.992405063291139, "percentage": 43.75, "elapsed_time": "2:42:40", "remaining_time": "3:29:08"}
|
99 |
{"current_steps": 99, "total_steps": 224, "loss": 0.5193, "lr": 1.3736402761368597e-05, "epoch": 3.030379746835443, "percentage": 44.2, "elapsed_time": "2:45:08", "remaining_time": "3:28:31"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
97 |
{"current_steps": 97, "total_steps": 224, "loss": 0.5393, "lr": 1.402448623755254e-05, "epoch": 2.962025316455696, "percentage": 43.3, "elapsed_time": "2:40:50", "remaining_time": "3:30:35"}
|
98 |
{"current_steps": 98, "total_steps": 224, "loss": 0.5532, "lr": 1.3880918526722497e-05, "epoch": 2.992405063291139, "percentage": 43.75, "elapsed_time": "2:42:40", "remaining_time": "3:29:08"}
|
99 |
{"current_steps": 99, "total_steps": 224, "loss": 0.5193, "lr": 1.3736402761368597e-05, "epoch": 3.030379746835443, "percentage": 44.2, "elapsed_time": "2:45:08", "remaining_time": "3:28:31"}
|
100 |
+
{"current_steps": 100, "total_steps": 224, "loss": 0.4932, "lr": 1.3590974244686248e-05, "epoch": 3.060759493670886, "percentage": 44.64, "elapsed_time": "2:46:42", "remaining_time": "3:26:42"}
|
101 |
+
{"current_steps": 101, "total_steps": 224, "loss": 0.5025, "lr": 1.344466850284333e-05, "epoch": 3.091139240506329, "percentage": 45.09, "elapsed_time": "2:48:12", "remaining_time": "3:24:51"}
|
102 |
+
{"current_steps": 102, "total_steps": 224, "loss": 0.5014, "lr": 1.3297521276301666e-05, "epoch": 3.1215189873417724, "percentage": 45.54, "elapsed_time": "2:49:54", "remaining_time": "3:23:13"}
|
103 |
+
{"current_steps": 103, "total_steps": 224, "loss": 0.502, "lr": 1.3149568511086104e-05, "epoch": 3.151898734177215, "percentage": 45.98, "elapsed_time": "2:51:47", "remaining_time": "3:21:48"}
|
104 |
+
{"current_steps": 104, "total_steps": 224, "loss": 0.5195, "lr": 1.300084635000341e-05, "epoch": 3.1822784810126583, "percentage": 46.43, "elapsed_time": "2:53:32", "remaining_time": "3:20:14"}
|
105 |
+
{"current_steps": 105, "total_steps": 224, "loss": 0.505, "lr": 1.2851391123813075e-05, "epoch": 3.212658227848101, "percentage": 46.88, "elapsed_time": "2:55:27", "remaining_time": "3:18:51"}
|
106 |
+
{"current_steps": 106, "total_steps": 224, "loss": 0.5103, "lr": 1.2701239342352223e-05, "epoch": 3.2430379746835443, "percentage": 47.32, "elapsed_time": "2:57:13", "remaining_time": "3:17:17"}
|
107 |
+
{"current_steps": 107, "total_steps": 224, "loss": 0.5124, "lr": 1.2550427685616767e-05, "epoch": 3.2734177215189875, "percentage": 47.77, "elapsed_time": "2:58:40", "remaining_time": "3:15:22"}
|
108 |
+
{"current_steps": 108, "total_steps": 224, "loss": 0.5106, "lr": 1.239899299480098e-05, "epoch": 3.3037974683544302, "percentage": 48.21, "elapsed_time": "3:00:16", "remaining_time": "3:13:38"}
|
109 |
+
{"current_steps": 109, "total_steps": 224, "loss": 0.5037, "lr": 1.2246972263297718e-05, "epoch": 3.3341772151898734, "percentage": 48.66, "elapsed_time": "3:02:01", "remaining_time": "3:12:02"}
|
110 |
+
{"current_steps": 110, "total_steps": 224, "loss": 0.5228, "lr": 1.2094402627661447e-05, "epoch": 3.3645569620253166, "percentage": 49.11, "elapsed_time": "3:03:40", "remaining_time": "3:10:20"}
|
111 |
+
{"current_steps": 111, "total_steps": 224, "loss": 0.5273, "lr": 1.1941321358536278e-05, "epoch": 3.3949367088607594, "percentage": 49.55, "elapsed_time": "3:05:30", "remaining_time": "3:08:51"}
|
112 |
+
{"current_steps": 112, "total_steps": 224, "loss": 0.4798, "lr": 1.1787765851551296e-05, "epoch": 3.4253164556962026, "percentage": 50.0, "elapsed_time": "3:07:09", "remaining_time": "3:07:09"}
|
113 |
+
{"current_steps": 113, "total_steps": 224, "loss": 0.507, "lr": 1.1633773618185302e-05, "epoch": 3.4556962025316453, "percentage": 50.45, "elapsed_time": "3:09:01", "remaining_time": "3:05:41"}
|
114 |
+
{"current_steps": 114, "total_steps": 224, "loss": 0.478, "lr": 1.14793822766033e-05, "epoch": 3.4860759493670885, "percentage": 50.89, "elapsed_time": "3:10:38", "remaining_time": "3:03:56"}
|
115 |
+
{"current_steps": 115, "total_steps": 224, "loss": 0.5019, "lr": 1.132462954246688e-05, "epoch": 3.5164556962025317, "percentage": 51.34, "elapsed_time": "3:12:18", "remaining_time": "3:02:16"}
|
116 |
+
{"current_steps": 116, "total_steps": 224, "loss": 0.4937, "lr": 1.1169553219720828e-05, "epoch": 3.546835443037975, "percentage": 51.79, "elapsed_time": "3:14:04", "remaining_time": "3:00:41"}
|
117 |
+
{"current_steps": 117, "total_steps": 224, "loss": 0.5107, "lr": 1.1014191191358118e-05, "epoch": 3.5772151898734177, "percentage": 52.23, "elapsed_time": "3:15:44", "remaining_time": "2:59:00"}
|
118 |
+
{"current_steps": 118, "total_steps": 224, "loss": 0.4958, "lr": 1.085858141016566e-05, "epoch": 3.607594936708861, "percentage": 52.68, "elapsed_time": "3:17:25", "remaining_time": "2:57:20"}
|
119 |
+
{"current_steps": 119, "total_steps": 224, "loss": 0.5018, "lr": 1.070276188945293e-05, "epoch": 3.6379746835443036, "percentage": 53.12, "elapsed_time": "3:19:11", "remaining_time": "2:55:45"}
|
120 |
+
{"current_steps": 120, "total_steps": 224, "loss": 0.5047, "lr": 1.0546770693765859e-05, "epoch": 3.668354430379747, "percentage": 53.57, "elapsed_time": "3:20:41", "remaining_time": "2:53:55"}
|
121 |
+
{"current_steps": 121, "total_steps": 224, "loss": 0.4935, "lr": 1.0390645929588197e-05, "epoch": 3.69873417721519, "percentage": 54.02, "elapsed_time": "3:22:14", "remaining_time": "2:52:09"}
|
122 |
+
{"current_steps": 122, "total_steps": 224, "loss": 0.4941, "lr": 1.0234425736032607e-05, "epoch": 3.729113924050633, "percentage": 54.46, "elapsed_time": "3:24:01", "remaining_time": "2:50:34"}
|
123 |
+
{"current_steps": 123, "total_steps": 224, "loss": 0.5013, "lr": 1.007814827552384e-05, "epoch": 3.759493670886076, "percentage": 54.91, "elapsed_time": "3:25:39", "remaining_time": "2:48:52"}
|
124 |
+
{"current_steps": 124, "total_steps": 224, "loss": 0.5118, "lr": 9.92185172447616e-06, "epoch": 3.7898734177215188, "percentage": 55.36, "elapsed_time": "3:27:25", "remaining_time": "2:47:16"}
|
125 |
+
{"current_steps": 125, "total_steps": 224, "loss": 0.4981, "lr": 9.765574263967397e-06, "epoch": 3.820253164556962, "percentage": 55.8, "elapsed_time": "3:28:56", "remaining_time": "2:45:28"}
|
126 |
+
{"current_steps": 126, "total_steps": 224, "loss": 0.4737, "lr": 9.609354070411807e-06, "epoch": 3.850632911392405, "percentage": 56.25, "elapsed_time": "3:30:25", "remaining_time": "2:43:39"}
|
127 |
+
{"current_steps": 127, "total_steps": 224, "loss": 0.4813, "lr": 9.453229306234143e-06, "epoch": 3.8810126582278484, "percentage": 56.7, "elapsed_time": "3:32:07", "remaining_time": "2:42:01"}
|
128 |
+
{"current_steps": 128, "total_steps": 224, "loss": 0.5146, "lr": 9.297238110547075e-06, "epoch": 3.911392405063291, "percentage": 57.14, "elapsed_time": "3:33:42", "remaining_time": "2:40:17"}
|
129 |
+
{"current_steps": 129, "total_steps": 224, "loss": 0.4689, "lr": 9.14141858983434e-06, "epoch": 3.9417721518987343, "percentage": 57.59, "elapsed_time": "3:35:15", "remaining_time": "2:38:31"}
|
130 |
+
{"current_steps": 130, "total_steps": 224, "loss": 0.5002, "lr": 8.985808808641883e-06, "epoch": 3.972151898734177, "percentage": 58.04, "elapsed_time": "3:36:42", "remaining_time": "2:36:41"}
|
131 |
+
{"current_steps": 131, "total_steps": 224, "loss": 0.5119, "lr": 8.830446780279175e-06, "epoch": 4.010126582278481, "percentage": 58.48, "elapsed_time": "3:39:07", "remaining_time": "2:35:33"}
|
132 |
+
{"current_steps": 132, "total_steps": 224, "loss": 0.4309, "lr": 8.675370457533122e-06, "epoch": 4.040506329113924, "percentage": 58.93, "elapsed_time": "3:40:34", "remaining_time": "2:33:44"}
|
133 |
+
{"current_steps": 133, "total_steps": 224, "loss": 0.4589, "lr": 8.520617723396702e-06, "epoch": 4.0708860759493675, "percentage": 59.38, "elapsed_time": "3:42:11", "remaining_time": "2:32:01"}
|