ryanmarten commited on
Commit
c85060f
·
verified ·
1 Parent(s): 7824c1f

Training in progress, epoch 10

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:35ed5b595dcff85456c65105eafa841211494589bebbb9eaf0262a9e4fc1a8fe
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:895fef0f980f8d450e94439613082c87db2b4b8904f0b86b6563b5537e9ecb51
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:10f329b42426f8516875fa6345cdc2a9a22d3636497b28c5a880db55f490883b
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:10001cb060ef6d163b61eaa4dd2b9f6173fca9105916e255dead31d4211343e1
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9799dfaafe275121fec5cecabc11f39cc43577ebc782e7d917cb36af0b3b44c5
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:05519a91455b7bbeab132197ae1797428084f5a5d62ca7a10a640d6e7f8f276b
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a769d6caa6f6ab6e1df9d123dce1fc0d7a892967c9da59226ba5826b9a3ea4eb
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:578f81978ff22c092693e55840fbf635251135a24f347ed1dc37af5d5eb7c0ca
3
  size 1089994880
trainer_log.jsonl CHANGED
@@ -99,3 +99,13 @@
99
  {"current_steps": 99, "total_steps": 117, "loss": 0.3116, "lr": 7.077560319906696e-07, "epoch": 10.405063291139241, "percentage": 84.62, "elapsed_time": "1:01:57", "remaining_time": "0:11:15"}
100
  {"current_steps": 100, "total_steps": 117, "loss": 0.2836, "lr": 6.329589969143518e-07, "epoch": 10.50632911392405, "percentage": 85.47, "elapsed_time": "1:02:28", "remaining_time": "0:10:37"}
101
  {"current_steps": 101, "total_steps": 117, "loss": 0.2645, "lr": 5.620710549772295e-07, "epoch": 10.60759493670886, "percentage": 86.32, "elapsed_time": "1:03:02", "remaining_time": "0:09:59"}
 
 
 
 
 
 
 
 
 
 
 
99
  {"current_steps": 99, "total_steps": 117, "loss": 0.3116, "lr": 7.077560319906696e-07, "epoch": 10.405063291139241, "percentage": 84.62, "elapsed_time": "1:01:57", "remaining_time": "0:11:15"}
100
  {"current_steps": 100, "total_steps": 117, "loss": 0.2836, "lr": 6.329589969143518e-07, "epoch": 10.50632911392405, "percentage": 85.47, "elapsed_time": "1:02:28", "remaining_time": "0:10:37"}
101
  {"current_steps": 101, "total_steps": 117, "loss": 0.2645, "lr": 5.620710549772295e-07, "epoch": 10.60759493670886, "percentage": 86.32, "elapsed_time": "1:03:02", "remaining_time": "0:09:59"}
102
+ {"current_steps": 102, "total_steps": 117, "loss": 0.3388, "lr": 4.951556604879049e-07, "epoch": 10.708860759493671, "percentage": 87.18, "elapsed_time": "1:03:39", "remaining_time": "0:09:21"}
103
+ {"current_steps": 103, "total_steps": 117, "loss": 0.3216, "lr": 4.322727117869951e-07, "epoch": 10.810126582278482, "percentage": 88.03, "elapsed_time": "1:04:04", "remaining_time": "0:08:42"}
104
+ {"current_steps": 104, "total_steps": 117, "loss": 0.2864, "lr": 3.734784976300165e-07, "epoch": 10.91139240506329, "percentage": 88.89, "elapsed_time": "1:04:37", "remaining_time": "0:08:04"}
105
+ {"current_steps": 105, "total_steps": 117, "loss": 0.2778, "lr": 3.18825646801314e-07, "epoch": 11.050632911392405, "percentage": 89.74, "elapsed_time": "1:06:05", "remaining_time": "0:07:33"}
106
+ {"current_steps": 106, "total_steps": 117, "loss": 0.2832, "lr": 2.6836308100417874e-07, "epoch": 11.151898734177216, "percentage": 90.6, "elapsed_time": "1:06:30", "remaining_time": "0:06:54"}
107
+ {"current_steps": 107, "total_steps": 117, "loss": 0.3289, "lr": 2.2213597106929608e-07, "epoch": 11.253164556962025, "percentage": 91.45, "elapsed_time": "1:06:56", "remaining_time": "0:06:15"}
108
+ {"current_steps": 108, "total_steps": 117, "loss": 0.3073, "lr": 1.801856965207338e-07, "epoch": 11.354430379746836, "percentage": 92.31, "elapsed_time": "1:07:28", "remaining_time": "0:05:37"}
109
+ {"current_steps": 109, "total_steps": 117, "loss": 0.3237, "lr": 1.4254980853566248e-07, "epoch": 11.455696202531646, "percentage": 93.16, "elapsed_time": "1:07:59", "remaining_time": "0:04:59"}
110
+ {"current_steps": 110, "total_steps": 117, "loss": 0.3008, "lr": 1.0926199633097156e-07, "epoch": 11.556962025316455, "percentage": 94.02, "elapsed_time": "1:08:33", "remaining_time": "0:04:21"}
111
+ {"current_steps": 111, "total_steps": 117, "loss": 0.2535, "lr": 8.035205700685167e-08, "epoch": 11.658227848101266, "percentage": 94.87, "elapsed_time": "1:09:02", "remaining_time": "0:03:43"}