ryanmarten commited on
Commit
d889c0d
·
verified ·
1 Parent(s): bd2647f

Training in progress, epoch 5

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d519ed078e21be11b6154cff71869dde053483fcccb9869e216277714684feb6
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:260ac56e0838e8061c9bda4b5eca3878fa4c30d5f3592d92da8f3e2e53ae31c4
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:70d1f0eee3a722902f84cfeaf96d2b31b3259e5968dc6f3b599b7bf5ac0c3dfa
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:58ef366818dead635213e3e1f64fe948a865aa51601526136a08e9365709492a
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:082ba1c7b2d4e3bdec99601610d4796ab2c6e78c35b1cbc408fbc4074489d541
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2f652996fdf326d77c23bd01c409a1b4395c53208a3ec595288130cc001e92a6
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3125abd99b9124f6bf6f310c7320df6e9b95f21fdcab7b7589f1a50aa80b2ed7
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:45bc5c597fbc7fb538bb6dbe922c49120aa229e020c145953aa8f6d17697ae21
3
  size 1089994880
trainer_log.jsonl CHANGED
@@ -51,3 +51,15 @@
51
  {"current_steps": 51, "total_steps": 70, "loss": 0.5232, "lr": 4.162563277652104e-06, "epoch": 4.896, "percentage": 72.86, "elapsed_time": "1:50:01", "remaining_time": "0:40:59"}
52
  {"current_steps": 52, "total_steps": 70, "loss": 0.5234, "lr": 3.7651019814126656e-06, "epoch": 4.992, "percentage": 74.29, "elapsed_time": "1:52:15", "remaining_time": "0:38:51"}
53
  {"current_steps": 53, "total_steps": 70, "loss": 0.506, "lr": 3.3831416240314085e-06, "epoch": 5.088, "percentage": 75.71, "elapsed_time": "1:55:03", "remaining_time": "0:36:54"}
 
 
 
 
 
 
 
 
 
 
 
 
 
51
  {"current_steps": 51, "total_steps": 70, "loss": 0.5232, "lr": 4.162563277652104e-06, "epoch": 4.896, "percentage": 72.86, "elapsed_time": "1:50:01", "remaining_time": "0:40:59"}
52
  {"current_steps": 52, "total_steps": 70, "loss": 0.5234, "lr": 3.7651019814126656e-06, "epoch": 4.992, "percentage": 74.29, "elapsed_time": "1:52:15", "remaining_time": "0:38:51"}
53
  {"current_steps": 53, "total_steps": 70, "loss": 0.506, "lr": 3.3831416240314085e-06, "epoch": 5.088, "percentage": 75.71, "elapsed_time": "1:55:03", "remaining_time": "0:36:54"}
54
+ {"current_steps": 54, "total_steps": 70, "loss": 0.505, "lr": 3.017631819139273e-06, "epoch": 5.184, "percentage": 77.14, "elapsed_time": "1:57:10", "remaining_time": "0:34:43"}
55
+ {"current_steps": 55, "total_steps": 70, "loss": 0.4782, "lr": 2.669481281701739e-06, "epoch": 5.28, "percentage": 78.57, "elapsed_time": "1:59:29", "remaining_time": "0:32:35"}
56
+ {"current_steps": 56, "total_steps": 70, "loss": 0.4828, "lr": 2.339555568810221e-06, "epoch": 5.376, "percentage": 80.0, "elapsed_time": "2:01:37", "remaining_time": "0:30:24"}
57
+ {"current_steps": 57, "total_steps": 70, "loss": 0.4821, "lr": 2.0286749277707783e-06, "epoch": 5.4719999999999995, "percentage": 81.43, "elapsed_time": "2:03:38", "remaining_time": "0:28:11"}
58
+ {"current_steps": 58, "total_steps": 70, "loss": 0.5088, "lr": 1.7376122568400533e-06, "epoch": 5.568, "percentage": 82.86, "elapsed_time": "2:05:40", "remaining_time": "0:26:00"}
59
+ {"current_steps": 59, "total_steps": 70, "loss": 0.4867, "lr": 1.467091183678444e-06, "epoch": 5.664, "percentage": 84.29, "elapsed_time": "2:07:55", "remaining_time": "0:23:50"}
60
+ {"current_steps": 60, "total_steps": 70, "loss": 0.4952, "lr": 1.2177842662977136e-06, "epoch": 5.76, "percentage": 85.71, "elapsed_time": "2:10:01", "remaining_time": "0:21:40"}
61
+ {"current_steps": 61, "total_steps": 70, "loss": 0.4903, "lr": 9.903113209758098e-07, "epoch": 5.856, "percentage": 87.14, "elapsed_time": "2:11:56", "remaining_time": "0:19:28"}
62
+ {"current_steps": 62, "total_steps": 70, "loss": 0.4913, "lr": 7.852378812959227e-07, "epoch": 5.952, "percentage": 88.57, "elapsed_time": "2:14:09", "remaining_time": "0:17:18"}
63
+ {"current_steps": 63, "total_steps": 70, "loss": 0.4707, "lr": 6.030737921409169e-07, "epoch": 6.048, "percentage": 90.0, "elapsed_time": "2:17:11", "remaining_time": "0:15:14"}
64
+ {"current_steps": 64, "total_steps": 70, "loss": 0.4783, "lr": 4.4427194213859216e-07, "epoch": 6.144, "percentage": 91.43, "elapsed_time": "2:19:14", "remaining_time": "0:13:03"}
65
+ {"current_steps": 65, "total_steps": 70, "loss": 0.4672, "lr": 3.0922713770922155e-07, "epoch": 6.24, "percentage": 92.86, "elapsed_time": "2:21:17", "remaining_time": "0:10:52"}