ryanmarten commited on
Commit
1f18535
·
verified ·
1 Parent(s): 9ef345d

Training in progress, epoch 11

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0ec6168ffca50fc29c50b1ae402eba7e658a6288299b00a6bc510d668a82f434
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b91ddfebeafcdb902d522a1c411c581331e6cb5346c0f1422cecf5d7634858cc
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:592d959e0096f5576e49dd5c9ef8e0aaa6091ff0be71e6ef82bbed5fec69e790
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0b24ba5135f696fcb907fc78b36a914b84a0a08fd8ac713dbb80bd2633dde0a4
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7e3b2ff527268c71dedb4acfd1216bf71f613476ef98f058710e031b43fd3167
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9a20470e0481f9604bf6b2e1205b873fe514055ffc178be5b08dac801a5aef43
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5c3b25b2c094ab50349d41fdc70138e1cdb67f40e592184b65940a473ef4b433
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8acc1cecaef70819c951314d83023df3a04020db97b57e282805fa6779ee62d7
3
  size 1089994880
trainer_log.jsonl CHANGED
@@ -100,3 +100,19 @@
100
  {"current_steps": 100, "total_steps": 117, "loss": 0.873, "lr": 6.329589969143518e-07, "epoch": 10.50632911392405, "percentage": 85.47, "elapsed_time": "1:12:44", "remaining_time": "0:12:21"}
101
  {"current_steps": 101, "total_steps": 117, "loss": 0.808, "lr": 5.620710549772295e-07, "epoch": 10.60759493670886, "percentage": 86.32, "elapsed_time": "1:13:29", "remaining_time": "0:11:38"}
102
  {"current_steps": 102, "total_steps": 117, "loss": 0.8738, "lr": 4.951556604879049e-07, "epoch": 10.708860759493671, "percentage": 87.18, "elapsed_time": "1:14:02", "remaining_time": "0:10:53"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
100
  {"current_steps": 100, "total_steps": 117, "loss": 0.873, "lr": 6.329589969143518e-07, "epoch": 10.50632911392405, "percentage": 85.47, "elapsed_time": "1:12:44", "remaining_time": "0:12:21"}
101
  {"current_steps": 101, "total_steps": 117, "loss": 0.808, "lr": 5.620710549772295e-07, "epoch": 10.60759493670886, "percentage": 86.32, "elapsed_time": "1:13:29", "remaining_time": "0:11:38"}
102
  {"current_steps": 102, "total_steps": 117, "loss": 0.8738, "lr": 4.951556604879049e-07, "epoch": 10.708860759493671, "percentage": 87.18, "elapsed_time": "1:14:02", "remaining_time": "0:10:53"}
103
+ {"current_steps": 103, "total_steps": 117, "loss": 0.9147, "lr": 4.322727117869951e-07, "epoch": 10.810126582278482, "percentage": 88.03, "elapsed_time": "1:14:41", "remaining_time": "0:10:09"}
104
+ {"current_steps": 104, "total_steps": 117, "loss": 0.9001, "lr": 3.734784976300165e-07, "epoch": 10.91139240506329, "percentage": 88.89, "elapsed_time": "1:15:21", "remaining_time": "0:09:25"}
105
+ {"current_steps": 105, "total_steps": 117, "loss": 0.8632, "lr": 3.18825646801314e-07, "epoch": 11.050632911392405, "percentage": 89.74, "elapsed_time": "1:17:04", "remaining_time": "0:08:48"}
106
+ {"current_steps": 106, "total_steps": 117, "loss": 0.9821, "lr": 2.6836308100417874e-07, "epoch": 11.151898734177216, "percentage": 90.6, "elapsed_time": "1:17:48", "remaining_time": "0:08:04"}
107
+ {"current_steps": 107, "total_steps": 117, "loss": 0.8456, "lr": 2.2213597106929608e-07, "epoch": 11.253164556962025, "percentage": 91.45, "elapsed_time": "1:18:27", "remaining_time": "0:07:19"}
108
+ {"current_steps": 108, "total_steps": 117, "loss": 0.9029, "lr": 1.801856965207338e-07, "epoch": 11.354430379746836, "percentage": 92.31, "elapsed_time": "1:19:03", "remaining_time": "0:06:35"}
109
+ {"current_steps": 109, "total_steps": 117, "loss": 0.8791, "lr": 1.4254980853566248e-07, "epoch": 11.455696202531646, "percentage": 93.16, "elapsed_time": "1:19:37", "remaining_time": "0:05:50"}
110
+ {"current_steps": 110, "total_steps": 117, "loss": 0.9583, "lr": 1.0926199633097156e-07, "epoch": 11.556962025316455, "percentage": 94.02, "elapsed_time": "1:20:18", "remaining_time": "0:05:06"}
111
+ {"current_steps": 111, "total_steps": 117, "loss": 0.939, "lr": 8.035205700685167e-08, "epoch": 11.658227848101266, "percentage": 94.87, "elapsed_time": "1:20:50", "remaining_time": "0:04:22"}
112
+ {"current_steps": 112, "total_steps": 117, "loss": 0.9014, "lr": 5.584586887435739e-08, "epoch": 11.759493670886076, "percentage": 95.73, "elapsed_time": "1:21:31", "remaining_time": "0:03:38"}
113
+ {"current_steps": 113, "total_steps": 117, "loss": 0.892, "lr": 3.576536829081323e-08, "epoch": 11.860759493670885, "percentage": 96.58, "elapsed_time": "1:22:15", "remaining_time": "0:02:54"}
114
+ {"current_steps": 114, "total_steps": 117, "loss": 0.8862, "lr": 2.012853002380466e-08, "epoch": 11.962025316455696, "percentage": 97.44, "elapsed_time": "1:22:56", "remaining_time": "0:02:10"}
115
+ {"current_steps": 115, "total_steps": 117, "loss": 0.8917, "lr": 8.949351161324227e-09, "epoch": 12.10126582278481, "percentage": 98.29, "elapsed_time": "1:24:40", "remaining_time": "0:01:28"}
116
+ {"current_steps": 116, "total_steps": 117, "loss": 0.9134, "lr": 2.237838582483387e-09, "epoch": 12.20253164556962, "percentage": 99.15, "elapsed_time": "1:25:24", "remaining_time": "0:00:44"}
117
+ {"current_steps": 117, "total_steps": 117, "loss": 0.9271, "lr": 0.0, "epoch": 12.30379746835443, "percentage": 100.0, "elapsed_time": "1:26:03", "remaining_time": "0:00:00"}
118
+ {"current_steps": 117, "total_steps": 117, "epoch": 12.30379746835443, "percentage": 100.0, "elapsed_time": "1:27:50", "remaining_time": "0:00:00"}