Training in progress, epoch 2
Browse files
model-00001-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4877660776
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b1cf0d73a4944c76886e467ccd71da98f24a912867e5e9abaec18060b4494a79
|
3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4932751008
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c30f08ffcacdc0461992ef8ef343531df084f80592cd8a29f36d948eaf7ccebd
|
3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4330865200
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:471721731aede15e95ac5a1a3fcf2562385b737f0387e025076adface8669a05
|
3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1089994880
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c5e9a3ec7c3b93ce0e4574165b68e30a954f9a0ee4f5eda55d0c2e53af121f53
|
3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
@@ -68,3 +68,36 @@
|
|
68 |
{"current_steps": 68, "total_steps": 224, "loss": 0.4652, "lr": 1.762685178110382e-05, "epoch": 2.081012658227848, "percentage": 30.36, "elapsed_time": "0:50:03", "remaining_time": "1:54:50"}
|
69 |
{"current_steps": 69, "total_steps": 224, "loss": 0.451, "lr": 1.752483539436807e-05, "epoch": 2.1113924050632913, "percentage": 30.8, "elapsed_time": "0:50:41", "remaining_time": "1:53:52"}
|
70 |
{"current_steps": 70, "total_steps": 224, "loss": 0.4843, "lr": 1.7420980794800013e-05, "epoch": 2.141772151898734, "percentage": 31.25, "elapsed_time": "0:51:44", "remaining_time": "1:53:49"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
68 |
{"current_steps": 68, "total_steps": 224, "loss": 0.4652, "lr": 1.762685178110382e-05, "epoch": 2.081012658227848, "percentage": 30.36, "elapsed_time": "0:50:03", "remaining_time": "1:54:50"}
|
69 |
{"current_steps": 69, "total_steps": 224, "loss": 0.451, "lr": 1.752483539436807e-05, "epoch": 2.1113924050632913, "percentage": 30.8, "elapsed_time": "0:50:41", "remaining_time": "1:53:52"}
|
70 |
{"current_steps": 70, "total_steps": 224, "loss": 0.4843, "lr": 1.7420980794800013e-05, "epoch": 2.141772151898734, "percentage": 31.25, "elapsed_time": "0:51:44", "remaining_time": "1:53:49"}
|
71 |
+
{"current_steps": 71, "total_steps": 224, "loss": 0.4779, "lr": 1.731531335263669e-05, "epoch": 2.1721518987341772, "percentage": 31.7, "elapsed_time": "0:52:26", "remaining_time": "1:53:00"}
|
72 |
+
{"current_steps": 72, "total_steps": 224, "loss": 0.4812, "lr": 1.720785888096743e-05, "epoch": 2.2025316455696204, "percentage": 32.14, "elapsed_time": "0:53:08", "remaining_time": "1:52:12"}
|
73 |
+
{"current_steps": 73, "total_steps": 224, "loss": 0.4881, "lr": 1.7098643629428035e-05, "epoch": 2.232911392405063, "percentage": 32.59, "elapsed_time": "0:53:56", "remaining_time": "1:51:34"}
|
74 |
+
{"current_steps": 74, "total_steps": 224, "loss": 0.4389, "lr": 1.698769427778842e-05, "epoch": 2.2632911392405064, "percentage": 33.04, "elapsed_time": "0:54:46", "remaining_time": "1:51:00"}
|
75 |
+
{"current_steps": 75, "total_steps": 224, "loss": 0.4898, "lr": 1.687503792943506e-05, "epoch": 2.293670886075949, "percentage": 33.48, "elapsed_time": "0:55:31", "remaining_time": "1:50:19"}
|
76 |
+
{"current_steps": 76, "total_steps": 224, "loss": 0.4513, "lr": 1.6760702104750046e-05, "epoch": 2.3240506329113924, "percentage": 33.93, "elapsed_time": "0:56:02", "remaining_time": "1:49:08"}
|
77 |
+
{"current_steps": 77, "total_steps": 224, "loss": 0.4544, "lr": 1.664471473438822e-05, "epoch": 2.3544303797468356, "percentage": 34.38, "elapsed_time": "0:56:48", "remaining_time": "1:48:26"}
|
78 |
+
{"current_steps": 78, "total_steps": 224, "loss": 0.4695, "lr": 1.6527104152454096e-05, "epoch": 2.3848101265822783, "percentage": 34.82, "elapsed_time": "0:57:47", "remaining_time": "1:48:10"}
|
79 |
+
{"current_steps": 79, "total_steps": 224, "loss": 0.5128, "lr": 1.6407899089580263e-05, "epoch": 2.4151898734177215, "percentage": 35.27, "elapsed_time": "0:58:28", "remaining_time": "1:47:18"}
|
80 |
+
{"current_steps": 80, "total_steps": 224, "loss": 0.4573, "lr": 1.628712866590885e-05, "epoch": 2.4455696202531647, "percentage": 35.71, "elapsed_time": "0:59:02", "remaining_time": "1:46:16"}
|
81 |
+
{"current_steps": 81, "total_steps": 224, "loss": 0.4605, "lr": 1.6164822383977912e-05, "epoch": 2.4759493670886075, "percentage": 36.16, "elapsed_time": "0:59:44", "remaining_time": "1:45:27"}
|
82 |
+
{"current_steps": 82, "total_steps": 224, "loss": 0.4683, "lr": 1.604101012151436e-05, "epoch": 2.5063291139240507, "percentage": 36.61, "elapsed_time": "1:00:22", "remaining_time": "1:44:32"}
|
83 |
+
{"current_steps": 83, "total_steps": 224, "loss": 0.4751, "lr": 1.5915722124135227e-05, "epoch": 2.536708860759494, "percentage": 37.05, "elapsed_time": "1:01:16", "remaining_time": "1:44:06"}
|
84 |
+
{"current_steps": 84, "total_steps": 224, "loss": 0.4879, "lr": 1.5788988997959115e-05, "epoch": 2.5670886075949366, "percentage": 37.5, "elapsed_time": "1:02:05", "remaining_time": "1:43:29"}
|
85 |
+
{"current_steps": 85, "total_steps": 224, "loss": 0.4601, "lr": 1.5660841702129533e-05, "epoch": 2.59746835443038, "percentage": 37.95, "elapsed_time": "1:02:53", "remaining_time": "1:42:50"}
|
86 |
+
{"current_steps": 86, "total_steps": 224, "loss": 0.4797, "lr": 1.5531311541251995e-05, "epoch": 2.6278481012658226, "percentage": 38.39, "elapsed_time": "1:03:31", "remaining_time": "1:41:56"}
|
87 |
+
{"current_steps": 87, "total_steps": 224, "loss": 0.4646, "lr": 1.540043015774676e-05, "epoch": 2.6582278481012658, "percentage": 38.84, "elapsed_time": "1:04:15", "remaining_time": "1:41:11"}
|
88 |
+
{"current_steps": 88, "total_steps": 224, "loss": 0.4658, "lr": 1.5268229524119007e-05, "epoch": 2.688607594936709, "percentage": 39.29, "elapsed_time": "1:04:57", "remaining_time": "1:40:23"}
|
89 |
+
{"current_steps": 89, "total_steps": 224, "loss": 0.4632, "lr": 1.513474193514842e-05, "epoch": 2.7189873417721517, "percentage": 39.73, "elapsed_time": "1:05:36", "remaining_time": "1:39:31"}
|
90 |
+
{"current_steps": 90, "total_steps": 224, "loss": 0.4835, "lr": 1.5000000000000002e-05, "epoch": 2.749367088607595, "percentage": 40.18, "elapsed_time": "1:06:12", "remaining_time": "1:38:35"}
|
91 |
+
{"current_steps": 91, "total_steps": 224, "loss": 0.4503, "lr": 1.4864036634258112e-05, "epoch": 2.779746835443038, "percentage": 40.62, "elapsed_time": "1:07:07", "remaining_time": "1:38:05"}
|
92 |
+
{"current_steps": 92, "total_steps": 224, "loss": 0.4418, "lr": 1.4726885051885654e-05, "epoch": 2.810126582278481, "percentage": 41.07, "elapsed_time": "1:07:48", "remaining_time": "1:37:17"}
|
93 |
+
{"current_steps": 93, "total_steps": 224, "loss": 0.4674, "lr": 1.4588578757110359e-05, "epoch": 2.840506329113924, "percentage": 41.52, "elapsed_time": "1:08:23", "remaining_time": "1:36:20"}
|
94 |
+
{"current_steps": 94, "total_steps": 224, "loss": 0.4354, "lr": 1.4449151536240167e-05, "epoch": 2.8708860759493673, "percentage": 41.96, "elapsed_time": "1:09:01", "remaining_time": "1:35:27"}
|
95 |
+
{"current_steps": 95, "total_steps": 224, "loss": 0.4402, "lr": 1.4308637449409705e-05, "epoch": 2.90126582278481, "percentage": 42.41, "elapsed_time": "1:09:43", "remaining_time": "1:34:40"}
|
96 |
+
{"current_steps": 96, "total_steps": 224, "loss": 0.4654, "lr": 1.4167070822259868e-05, "epoch": 2.9316455696202532, "percentage": 42.86, "elapsed_time": "1:10:18", "remaining_time": "1:33:45"}
|
97 |
+
{"current_steps": 97, "total_steps": 224, "loss": 0.4391, "lr": 1.402448623755254e-05, "epoch": 2.962025316455696, "percentage": 43.3, "elapsed_time": "1:10:49", "remaining_time": "1:32:43"}
|
98 |
+
{"current_steps": 98, "total_steps": 224, "loss": 0.4737, "lr": 1.3880918526722497e-05, "epoch": 2.992405063291139, "percentage": 43.75, "elapsed_time": "1:11:29", "remaining_time": "1:31:55"}
|
99 |
+
{"current_steps": 99, "total_steps": 224, "loss": 0.3205, "lr": 1.3736402761368597e-05, "epoch": 3.030379746835443, "percentage": 44.2, "elapsed_time": "1:13:10", "remaining_time": "1:32:23"}
|
100 |
+
{"current_steps": 100, "total_steps": 224, "loss": 0.3245, "lr": 1.3590974244686248e-05, "epoch": 3.060759493670886, "percentage": 44.64, "elapsed_time": "1:13:53", "remaining_time": "1:31:37"}
|
101 |
+
{"current_steps": 101, "total_steps": 224, "loss": 0.3338, "lr": 1.344466850284333e-05, "epoch": 3.091139240506329, "percentage": 45.09, "elapsed_time": "1:14:37", "remaining_time": "1:30:52"}
|
102 |
+
{"current_steps": 102, "total_steps": 224, "loss": 0.3402, "lr": 1.3297521276301666e-05, "epoch": 3.1215189873417724, "percentage": 45.54, "elapsed_time": "1:15:24", "remaining_time": "1:30:11"}
|
103 |
+
{"current_steps": 103, "total_steps": 224, "loss": 0.3152, "lr": 1.3149568511086104e-05, "epoch": 3.151898734177215, "percentage": 45.98, "elapsed_time": "1:16:01", "remaining_time": "1:29:18"}
|