Training in progress, epoch 9
Browse files
model-00001-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4877660776
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a868337d45b4abb301473052af7d0c1542a032069ef9a2962c519275f59b36aa
|
3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4932751008
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:343b5d964d363cc6908b73bbc431925bc67d7dc440f1a307c237e5d06679bfa4
|
3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4330865200
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5e0db662d69104108d03a3aafa2b346c78fbe09626a5a387d106208ed04a53bc
|
3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1089994880
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d034920501ce5fb2fda70ab2e66b4c333fdb6220e534efab7febea9a7b638731
|
3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
@@ -90,3 +90,27 @@
|
|
90 |
{"current_steps": 90, "total_steps": 117, "loss": 0.1054, "lr": 1.544686755065677e-06, "epoch": 9.455696202531646, "percentage": 76.92, "elapsed_time": "0:39:36", "remaining_time": "0:11:52"}
|
91 |
{"current_steps": 91, "total_steps": 117, "loss": 0.0803, "lr": 1.438119515243277e-06, "epoch": 9.556962025316455, "percentage": 77.78, "elapsed_time": "0:39:49", "remaining_time": "0:11:22"}
|
92 |
{"current_steps": 92, "total_steps": 117, "loss": 0.0831, "lr": 1.3347406408508695e-06, "epoch": 9.658227848101266, "percentage": 78.63, "elapsed_time": "0:40:10", "remaining_time": "0:10:55"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
90 |
{"current_steps": 90, "total_steps": 117, "loss": 0.1054, "lr": 1.544686755065677e-06, "epoch": 9.455696202531646, "percentage": 76.92, "elapsed_time": "0:39:36", "remaining_time": "0:11:52"}
|
91 |
{"current_steps": 91, "total_steps": 117, "loss": 0.0803, "lr": 1.438119515243277e-06, "epoch": 9.556962025316455, "percentage": 77.78, "elapsed_time": "0:39:49", "remaining_time": "0:11:22"}
|
92 |
{"current_steps": 92, "total_steps": 117, "loss": 0.0831, "lr": 1.3347406408508695e-06, "epoch": 9.658227848101266, "percentage": 78.63, "elapsed_time": "0:40:10", "remaining_time": "0:10:55"}
|
93 |
+
{"current_steps": 93, "total_steps": 117, "loss": 0.0867, "lr": 1.234642669981946e-06, "epoch": 9.759493670886076, "percentage": 79.49, "elapsed_time": "0:40:37", "remaining_time": "0:10:29"}
|
94 |
+
{"current_steps": 94, "total_steps": 117, "loss": 0.0788, "lr": 1.137915203877003e-06, "epoch": 9.860759493670885, "percentage": 80.34, "elapsed_time": "0:40:55", "remaining_time": "0:10:00"}
|
95 |
+
{"current_steps": 95, "total_steps": 117, "loss": 0.0804, "lr": 1.044644826718295e-06, "epoch": 9.962025316455696, "percentage": 81.2, "elapsed_time": "0:41:17", "remaining_time": "0:09:33"}
|
96 |
+
{"current_steps": 96, "total_steps": 117, "loss": 0.0793, "lr": 9.549150281252633e-07, "epoch": 10.10126582278481, "percentage": 82.05, "elapsed_time": "0:42:38", "remaining_time": "0:09:19"}
|
97 |
+
{"current_steps": 97, "total_steps": 117, "loss": 0.0954, "lr": 8.688061284200266e-07, "epoch": 10.20253164556962, "percentage": 82.91, "elapsed_time": "0:43:04", "remaining_time": "0:08:52"}
|
98 |
+
{"current_steps": 98, "total_steps": 117, "loss": 0.0753, "lr": 7.863952067298042e-07, "epoch": 10.30379746835443, "percentage": 83.76, "elapsed_time": "0:43:25", "remaining_time": "0:08:25"}
|
99 |
+
{"current_steps": 99, "total_steps": 117, "loss": 0.0874, "lr": 7.077560319906696e-07, "epoch": 10.405063291139241, "percentage": 84.62, "elapsed_time": "0:43:48", "remaining_time": "0:07:57"}
|
100 |
+
{"current_steps": 100, "total_steps": 117, "loss": 0.0861, "lr": 6.329589969143518e-07, "epoch": 10.50632911392405, "percentage": 85.47, "elapsed_time": "0:44:10", "remaining_time": "0:07:30"}
|
101 |
+
{"current_steps": 101, "total_steps": 117, "loss": 0.0848, "lr": 5.620710549772295e-07, "epoch": 10.60759493670886, "percentage": 86.32, "elapsed_time": "0:44:31", "remaining_time": "0:07:03"}
|
102 |
+
{"current_steps": 102, "total_steps": 117, "loss": 0.0829, "lr": 4.951556604879049e-07, "epoch": 10.708860759493671, "percentage": 87.18, "elapsed_time": "0:44:56", "remaining_time": "0:06:36"}
|
103 |
+
{"current_steps": 103, "total_steps": 117, "loss": 0.0529, "lr": 4.322727117869951e-07, "epoch": 10.810126582278482, "percentage": 88.03, "elapsed_time": "0:45:10", "remaining_time": "0:06:08"}
|
104 |
+
{"current_steps": 104, "total_steps": 117, "loss": 0.0677, "lr": 3.734784976300165e-07, "epoch": 10.91139240506329, "percentage": 88.89, "elapsed_time": "0:45:33", "remaining_time": "0:05:41"}
|
105 |
+
{"current_steps": 105, "total_steps": 117, "loss": 0.0674, "lr": 3.18825646801314e-07, "epoch": 11.050632911392405, "percentage": 89.74, "elapsed_time": "0:46:44", "remaining_time": "0:05:20"}
|
106 |
+
{"current_steps": 106, "total_steps": 117, "loss": 0.0845, "lr": 2.6836308100417874e-07, "epoch": 11.151898734177216, "percentage": 90.6, "elapsed_time": "0:47:08", "remaining_time": "0:04:53"}
|
107 |
+
{"current_steps": 107, "total_steps": 117, "loss": 0.0505, "lr": 2.2213597106929608e-07, "epoch": 11.253164556962025, "percentage": 91.45, "elapsed_time": "0:47:27", "remaining_time": "0:04:26"}
|
108 |
+
{"current_steps": 108, "total_steps": 117, "loss": 0.0694, "lr": 1.801856965207338e-07, "epoch": 11.354430379746836, "percentage": 92.31, "elapsed_time": "0:47:46", "remaining_time": "0:03:58"}
|
109 |
+
{"current_steps": 109, "total_steps": 117, "loss": 0.0537, "lr": 1.4254980853566248e-07, "epoch": 11.455696202531646, "percentage": 93.16, "elapsed_time": "0:48:06", "remaining_time": "0:03:31"}
|
110 |
+
{"current_steps": 110, "total_steps": 117, "loss": 0.1016, "lr": 1.0926199633097156e-07, "epoch": 11.556962025316455, "percentage": 94.02, "elapsed_time": "0:48:29", "remaining_time": "0:03:05"}
|
111 |
+
{"current_steps": 111, "total_steps": 117, "loss": 0.0463, "lr": 8.035205700685167e-08, "epoch": 11.658227848101266, "percentage": 94.87, "elapsed_time": "0:48:45", "remaining_time": "0:02:38"}
|
112 |
+
{"current_steps": 112, "total_steps": 117, "loss": 0.1114, "lr": 5.584586887435739e-08, "epoch": 11.759493670886076, "percentage": 95.73, "elapsed_time": "0:49:11", "remaining_time": "0:02:11"}
|
113 |
+
{"current_steps": 113, "total_steps": 117, "loss": 0.0997, "lr": 3.576536829081323e-08, "epoch": 11.860759493670885, "percentage": 96.58, "elapsed_time": "0:49:41", "remaining_time": "0:01:45"}
|
114 |
+
{"current_steps": 114, "total_steps": 117, "loss": 0.0705, "lr": 2.012853002380466e-08, "epoch": 11.962025316455696, "percentage": 97.44, "elapsed_time": "0:49:59", "remaining_time": "0:01:18"}
|
115 |
+
{"current_steps": 115, "total_steps": 117, "loss": 0.072, "lr": 8.949351161324227e-09, "epoch": 12.10126582278481, "percentage": 98.29, "elapsed_time": "0:51:14", "remaining_time": "0:00:53"}
|
116 |
+
{"current_steps": 116, "total_steps": 117, "loss": 0.0706, "lr": 2.237838582483387e-09, "epoch": 12.20253164556962, "percentage": 99.15, "elapsed_time": "0:51:34", "remaining_time": "0:00:26"}
|