ryanmarten commited on
Commit
c5f7f52
·
verified ·
1 Parent(s): a9fa85d

Training in progress, epoch 9

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b28d43a31d102ed2f75b5f86254f1143f0f24d971a33ad76ec79ff82dc93082a
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a868337d45b4abb301473052af7d0c1542a032069ef9a2962c519275f59b36aa
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:029a0332e5294855113eccdc3a0d379907616d4be3e9bade21ec6e3b39954932
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:343b5d964d363cc6908b73bbc431925bc67d7dc440f1a307c237e5d06679bfa4
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:355d8c2e006ec9adb124e0fff5f31b7a6a7365eecf73b50091c445e58916945e
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5e0db662d69104108d03a3aafa2b346c78fbe09626a5a387d106208ed04a53bc
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:28885be57a5e09b629a5fd74dd751589e3cb2240d2f71a4e6a92b5c78bc5c80a
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d034920501ce5fb2fda70ab2e66b4c333fdb6220e534efab7febea9a7b638731
3
  size 1089994880
trainer_log.jsonl CHANGED
@@ -90,3 +90,27 @@
90
  {"current_steps": 90, "total_steps": 117, "loss": 0.1054, "lr": 1.544686755065677e-06, "epoch": 9.455696202531646, "percentage": 76.92, "elapsed_time": "0:39:36", "remaining_time": "0:11:52"}
91
  {"current_steps": 91, "total_steps": 117, "loss": 0.0803, "lr": 1.438119515243277e-06, "epoch": 9.556962025316455, "percentage": 77.78, "elapsed_time": "0:39:49", "remaining_time": "0:11:22"}
92
  {"current_steps": 92, "total_steps": 117, "loss": 0.0831, "lr": 1.3347406408508695e-06, "epoch": 9.658227848101266, "percentage": 78.63, "elapsed_time": "0:40:10", "remaining_time": "0:10:55"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
90
  {"current_steps": 90, "total_steps": 117, "loss": 0.1054, "lr": 1.544686755065677e-06, "epoch": 9.455696202531646, "percentage": 76.92, "elapsed_time": "0:39:36", "remaining_time": "0:11:52"}
91
  {"current_steps": 91, "total_steps": 117, "loss": 0.0803, "lr": 1.438119515243277e-06, "epoch": 9.556962025316455, "percentage": 77.78, "elapsed_time": "0:39:49", "remaining_time": "0:11:22"}
92
  {"current_steps": 92, "total_steps": 117, "loss": 0.0831, "lr": 1.3347406408508695e-06, "epoch": 9.658227848101266, "percentage": 78.63, "elapsed_time": "0:40:10", "remaining_time": "0:10:55"}
93
+ {"current_steps": 93, "total_steps": 117, "loss": 0.0867, "lr": 1.234642669981946e-06, "epoch": 9.759493670886076, "percentage": 79.49, "elapsed_time": "0:40:37", "remaining_time": "0:10:29"}
94
+ {"current_steps": 94, "total_steps": 117, "loss": 0.0788, "lr": 1.137915203877003e-06, "epoch": 9.860759493670885, "percentage": 80.34, "elapsed_time": "0:40:55", "remaining_time": "0:10:00"}
95
+ {"current_steps": 95, "total_steps": 117, "loss": 0.0804, "lr": 1.044644826718295e-06, "epoch": 9.962025316455696, "percentage": 81.2, "elapsed_time": "0:41:17", "remaining_time": "0:09:33"}
96
+ {"current_steps": 96, "total_steps": 117, "loss": 0.0793, "lr": 9.549150281252633e-07, "epoch": 10.10126582278481, "percentage": 82.05, "elapsed_time": "0:42:38", "remaining_time": "0:09:19"}
97
+ {"current_steps": 97, "total_steps": 117, "loss": 0.0954, "lr": 8.688061284200266e-07, "epoch": 10.20253164556962, "percentage": 82.91, "elapsed_time": "0:43:04", "remaining_time": "0:08:52"}
98
+ {"current_steps": 98, "total_steps": 117, "loss": 0.0753, "lr": 7.863952067298042e-07, "epoch": 10.30379746835443, "percentage": 83.76, "elapsed_time": "0:43:25", "remaining_time": "0:08:25"}
99
+ {"current_steps": 99, "total_steps": 117, "loss": 0.0874, "lr": 7.077560319906696e-07, "epoch": 10.405063291139241, "percentage": 84.62, "elapsed_time": "0:43:48", "remaining_time": "0:07:57"}
100
+ {"current_steps": 100, "total_steps": 117, "loss": 0.0861, "lr": 6.329589969143518e-07, "epoch": 10.50632911392405, "percentage": 85.47, "elapsed_time": "0:44:10", "remaining_time": "0:07:30"}
101
+ {"current_steps": 101, "total_steps": 117, "loss": 0.0848, "lr": 5.620710549772295e-07, "epoch": 10.60759493670886, "percentage": 86.32, "elapsed_time": "0:44:31", "remaining_time": "0:07:03"}
102
+ {"current_steps": 102, "total_steps": 117, "loss": 0.0829, "lr": 4.951556604879049e-07, "epoch": 10.708860759493671, "percentage": 87.18, "elapsed_time": "0:44:56", "remaining_time": "0:06:36"}
103
+ {"current_steps": 103, "total_steps": 117, "loss": 0.0529, "lr": 4.322727117869951e-07, "epoch": 10.810126582278482, "percentage": 88.03, "elapsed_time": "0:45:10", "remaining_time": "0:06:08"}
104
+ {"current_steps": 104, "total_steps": 117, "loss": 0.0677, "lr": 3.734784976300165e-07, "epoch": 10.91139240506329, "percentage": 88.89, "elapsed_time": "0:45:33", "remaining_time": "0:05:41"}
105
+ {"current_steps": 105, "total_steps": 117, "loss": 0.0674, "lr": 3.18825646801314e-07, "epoch": 11.050632911392405, "percentage": 89.74, "elapsed_time": "0:46:44", "remaining_time": "0:05:20"}
106
+ {"current_steps": 106, "total_steps": 117, "loss": 0.0845, "lr": 2.6836308100417874e-07, "epoch": 11.151898734177216, "percentage": 90.6, "elapsed_time": "0:47:08", "remaining_time": "0:04:53"}
107
+ {"current_steps": 107, "total_steps": 117, "loss": 0.0505, "lr": 2.2213597106929608e-07, "epoch": 11.253164556962025, "percentage": 91.45, "elapsed_time": "0:47:27", "remaining_time": "0:04:26"}
108
+ {"current_steps": 108, "total_steps": 117, "loss": 0.0694, "lr": 1.801856965207338e-07, "epoch": 11.354430379746836, "percentage": 92.31, "elapsed_time": "0:47:46", "remaining_time": "0:03:58"}
109
+ {"current_steps": 109, "total_steps": 117, "loss": 0.0537, "lr": 1.4254980853566248e-07, "epoch": 11.455696202531646, "percentage": 93.16, "elapsed_time": "0:48:06", "remaining_time": "0:03:31"}
110
+ {"current_steps": 110, "total_steps": 117, "loss": 0.1016, "lr": 1.0926199633097156e-07, "epoch": 11.556962025316455, "percentage": 94.02, "elapsed_time": "0:48:29", "remaining_time": "0:03:05"}
111
+ {"current_steps": 111, "total_steps": 117, "loss": 0.0463, "lr": 8.035205700685167e-08, "epoch": 11.658227848101266, "percentage": 94.87, "elapsed_time": "0:48:45", "remaining_time": "0:02:38"}
112
+ {"current_steps": 112, "total_steps": 117, "loss": 0.1114, "lr": 5.584586887435739e-08, "epoch": 11.759493670886076, "percentage": 95.73, "elapsed_time": "0:49:11", "remaining_time": "0:02:11"}
113
+ {"current_steps": 113, "total_steps": 117, "loss": 0.0997, "lr": 3.576536829081323e-08, "epoch": 11.860759493670885, "percentage": 96.58, "elapsed_time": "0:49:41", "remaining_time": "0:01:45"}
114
+ {"current_steps": 114, "total_steps": 117, "loss": 0.0705, "lr": 2.012853002380466e-08, "epoch": 11.962025316455696, "percentage": 97.44, "elapsed_time": "0:49:59", "remaining_time": "0:01:18"}
115
+ {"current_steps": 115, "total_steps": 117, "loss": 0.072, "lr": 8.949351161324227e-09, "epoch": 12.10126582278481, "percentage": 98.29, "elapsed_time": "0:51:14", "remaining_time": "0:00:53"}
116
+ {"current_steps": 116, "total_steps": 117, "loss": 0.0706, "lr": 2.237838582483387e-09, "epoch": 12.20253164556962, "percentage": 99.15, "elapsed_time": "0:51:34", "remaining_time": "0:00:26"}