ryanmarten commited on
Commit
13280d6
·
verified ·
1 Parent(s): 70b79b0

Training in progress, epoch 5

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:26a10ae4e2198c593b61106177c037f35c67d12468c5ff16a16a36bcc05d520a
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b8badccf226308fdac307f938cbb0580d0fa7f7ee9c9bbc58f42d7741ffbf611
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fd768c0780a537c3ee1465f9c7d481e97c22a897f614edaf45af681af5b05dd5
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f89fe330114bf176ba3f739ff241be18f3db062d40e1274cf29b3e1b66e81d3e
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f4fba68d47464a1ec6f554836e7e25739b7bfe5c9b7ee894ca0f05b00689773f
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4fe0fbd08a4c506a46eec2e957e939aa3c0aae4f75606a71f45a41aacadb340d
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:34bb4c4a76f63d206df5878f9a7dbc84ef03c7f620ab142eac1feee73c0ffe21
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e07b05c0cb2697d202e6098ac9efa0a2075bfbb4a0e9ca0fd9de330a4e3b3e66
3
  size 1089994880
trainer_log.jsonl CHANGED
@@ -52,3 +52,14 @@
52
  {"current_steps": 52, "total_steps": 70, "loss": 0.3495, "lr": 3.7651019814126656e-06, "epoch": 4.992, "percentage": 74.29, "elapsed_time": "1:07:55", "remaining_time": "0:23:30"}
53
  {"current_steps": 53, "total_steps": 70, "loss": 0.3695, "lr": 3.3831416240314085e-06, "epoch": 5.088, "percentage": 75.71, "elapsed_time": "1:10:03", "remaining_time": "0:22:28"}
54
  {"current_steps": 54, "total_steps": 70, "loss": 0.3982, "lr": 3.017631819139273e-06, "epoch": 5.184, "percentage": 77.14, "elapsed_time": "1:11:17", "remaining_time": "0:21:07"}
 
 
 
 
 
 
 
 
 
 
 
 
52
  {"current_steps": 52, "total_steps": 70, "loss": 0.3495, "lr": 3.7651019814126656e-06, "epoch": 4.992, "percentage": 74.29, "elapsed_time": "1:07:55", "remaining_time": "0:23:30"}
53
  {"current_steps": 53, "total_steps": 70, "loss": 0.3695, "lr": 3.3831416240314085e-06, "epoch": 5.088, "percentage": 75.71, "elapsed_time": "1:10:03", "remaining_time": "0:22:28"}
54
  {"current_steps": 54, "total_steps": 70, "loss": 0.3982, "lr": 3.017631819139273e-06, "epoch": 5.184, "percentage": 77.14, "elapsed_time": "1:11:17", "remaining_time": "0:21:07"}
55
+ {"current_steps": 55, "total_steps": 70, "loss": 0.3929, "lr": 2.669481281701739e-06, "epoch": 5.28, "percentage": 78.57, "elapsed_time": "1:12:33", "remaining_time": "0:19:47"}
56
+ {"current_steps": 56, "total_steps": 70, "loss": 0.3905, "lr": 2.339555568810221e-06, "epoch": 5.376, "percentage": 80.0, "elapsed_time": "1:13:51", "remaining_time": "0:18:27"}
57
+ {"current_steps": 57, "total_steps": 70, "loss": 0.3392, "lr": 2.0286749277707783e-06, "epoch": 5.4719999999999995, "percentage": 81.43, "elapsed_time": "1:15:06", "remaining_time": "0:17:07"}
58
+ {"current_steps": 58, "total_steps": 70, "loss": 0.3676, "lr": 1.7376122568400533e-06, "epoch": 5.568, "percentage": 82.86, "elapsed_time": "1:16:20", "remaining_time": "0:15:47"}
59
+ {"current_steps": 59, "total_steps": 70, "loss": 0.3683, "lr": 1.467091183678444e-06, "epoch": 5.664, "percentage": 84.29, "elapsed_time": "1:17:36", "remaining_time": "0:14:28"}
60
+ {"current_steps": 60, "total_steps": 70, "loss": 0.3499, "lr": 1.2177842662977136e-06, "epoch": 5.76, "percentage": 85.71, "elapsed_time": "1:18:41", "remaining_time": "0:13:06"}
61
+ {"current_steps": 61, "total_steps": 70, "loss": 0.3651, "lr": 9.903113209758098e-07, "epoch": 5.856, "percentage": 87.14, "elapsed_time": "1:19:56", "remaining_time": "0:11:47"}
62
+ {"current_steps": 62, "total_steps": 70, "loss": 0.3403, "lr": 7.852378812959227e-07, "epoch": 5.952, "percentage": 88.57, "elapsed_time": "1:21:10", "remaining_time": "0:10:28"}
63
+ {"current_steps": 63, "total_steps": 70, "loss": 0.3845, "lr": 6.030737921409169e-07, "epoch": 6.048, "percentage": 90.0, "elapsed_time": "1:23:38", "remaining_time": "0:09:17"}
64
+ {"current_steps": 64, "total_steps": 70, "loss": 0.3422, "lr": 4.4427194213859216e-07, "epoch": 6.144, "percentage": 91.43, "elapsed_time": "1:24:52", "remaining_time": "0:07:57"}
65
+ {"current_steps": 65, "total_steps": 70, "loss": 0.4087, "lr": 3.0922713770922155e-07, "epoch": 6.24, "percentage": 92.86, "elapsed_time": "1:26:14", "remaining_time": "0:06:38"}