neginr commited on
Commit
88f589c
·
verified ·
1 Parent(s): 3ed4a0e

Training in progress, epoch 11

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c0aa8dc106145cfcbe0627f9aefe30d07a925693c8eb2cc27c1c82a73403ca25
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ecce232892ac44c65c0daba70b88d6db50cd6eb695a9ca15e485f37bb55d6692
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:185836b0c081caeb7d47427b2fe705067b8beccd4e9e1cb0f8acdb1c272f8e36
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a036c8484d5d33911c894f7dbc4ea44a3539765a79221fdf48f430b9f5b66fbd
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:151b7498ee63d492c70bfca9583c45c6af20661d3c3bb68e6bf0e4a8476a8453
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ec6d40cd9fb3a43f3db5b9be63c6efbefab90af8f2dc5d907004cd8d7d84dc63
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:147077ecd4b7a712f80101af0524f00293005f51dd00c9fa6a9883ce32f88c8c
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:84224f4194b8c3ed6b6b81258330dd6916e3cd5f4fdb4f46b881141393242700
3
  size 1089994880
trainer_log.jsonl CHANGED
@@ -100,3 +100,22 @@
100
  {"current_steps": 100, "total_steps": 130, "loss": 0.1355, "lr": 1.5363782324520033e-06, "epoch": 10.0, "percentage": 76.92, "elapsed_time": "0:31:43", "remaining_time": "0:09:31"}
101
  {"current_steps": 101, "total_steps": 130, "loss": 0.0391, "lr": 1.4408125816532981e-06, "epoch": 10.1, "percentage": 77.69, "elapsed_time": "0:33:48", "remaining_time": "0:09:42"}
102
  {"current_steps": 102, "total_steps": 130, "loss": 0.1106, "lr": 1.347812908011485e-06, "epoch": 10.2, "percentage": 78.46, "elapsed_time": "0:33:59", "remaining_time": "0:09:19"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
100
  {"current_steps": 100, "total_steps": 130, "loss": 0.1355, "lr": 1.5363782324520033e-06, "epoch": 10.0, "percentage": 76.92, "elapsed_time": "0:31:43", "remaining_time": "0:09:31"}
101
  {"current_steps": 101, "total_steps": 130, "loss": 0.0391, "lr": 1.4408125816532981e-06, "epoch": 10.1, "percentage": 77.69, "elapsed_time": "0:33:48", "remaining_time": "0:09:42"}
102
  {"current_steps": 102, "total_steps": 130, "loss": 0.1106, "lr": 1.347812908011485e-06, "epoch": 10.2, "percentage": 78.46, "elapsed_time": "0:33:59", "remaining_time": "0:09:19"}
103
+ {"current_steps": 103, "total_steps": 130, "loss": 0.1052, "lr": 1.257446259144494e-06, "epoch": 10.3, "percentage": 79.23, "elapsed_time": "0:34:08", "remaining_time": "0:08:56"}
104
+ {"current_steps": 104, "total_steps": 130, "loss": 0.1319, "lr": 1.1697777844051105e-06, "epoch": 10.4, "percentage": 80.0, "elapsed_time": "0:34:16", "remaining_time": "0:08:34"}
105
+ {"current_steps": 105, "total_steps": 130, "loss": 0.1034, "lr": 1.0848706879118893e-06, "epoch": 10.5, "percentage": 80.77, "elapsed_time": "0:34:26", "remaining_time": "0:08:12"}
106
+ {"current_steps": 106, "total_steps": 130, "loss": 0.0851, "lr": 1.0027861829824953e-06, "epoch": 10.6, "percentage": 81.54, "elapsed_time": "0:34:34", "remaining_time": "0:07:49"}
107
+ {"current_steps": 107, "total_steps": 130, "loss": 0.0931, "lr": 9.235834480022788e-07, "epoch": 10.7, "percentage": 82.31, "elapsed_time": "0:34:41", "remaining_time": "0:07:27"}
108
+ {"current_steps": 108, "total_steps": 130, "loss": 0.1037, "lr": 8.473195837599419e-07, "epoch": 10.8, "percentage": 83.08, "elapsed_time": "0:34:50", "remaining_time": "0:07:05"}
109
+ {"current_steps": 109, "total_steps": 130, "loss": 0.1289, "lr": 7.740495722810271e-07, "epoch": 10.9, "percentage": 83.85, "elapsed_time": "0:35:00", "remaining_time": "0:06:44"}
110
+ {"current_steps": 110, "total_steps": 130, "loss": 0.1238, "lr": 7.03826237188916e-07, "epoch": 11.0, "percentage": 84.62, "elapsed_time": "0:35:09", "remaining_time": "0:06:23"}
111
+ {"current_steps": 111, "total_steps": 130, "loss": 0.1133, "lr": 6.367002056219285e-07, "epoch": 11.1, "percentage": 85.38, "elapsed_time": "0:37:51", "remaining_time": "0:06:28"}
112
+ {"current_steps": 112, "total_steps": 130, "loss": 0.1142, "lr": 5.727198717339511e-07, "epoch": 11.2, "percentage": 86.15, "elapsed_time": "0:37:59", "remaining_time": "0:06:06"}
113
+ {"current_steps": 113, "total_steps": 130, "loss": 0.0774, "lr": 5.119313618049309e-07, "epoch": 11.3, "percentage": 86.92, "elapsed_time": "0:38:06", "remaining_time": "0:05:43"}
114
+ {"current_steps": 114, "total_steps": 130, "loss": 0.0911, "lr": 4.54378500986381e-07, "epoch": 11.4, "percentage": 87.69, "elapsed_time": "0:38:16", "remaining_time": "0:05:22"}
115
+ {"current_steps": 115, "total_steps": 130, "loss": 0.0846, "lr": 4.001027817058789e-07, "epoch": 11.5, "percentage": 88.46, "elapsed_time": "0:38:24", "remaining_time": "0:05:00"}
116
+ {"current_steps": 116, "total_steps": 130, "loss": 0.0847, "lr": 3.49143333753309e-07, "epoch": 11.6, "percentage": 89.23, "elapsed_time": "0:38:32", "remaining_time": "0:04:39"}
117
+ {"current_steps": 117, "total_steps": 130, "loss": 0.1033, "lr": 3.015368960704584e-07, "epoch": 11.7, "percentage": 90.0, "elapsed_time": "0:38:40", "remaining_time": "0:04:17"}
118
+ {"current_steps": 118, "total_steps": 130, "loss": 0.0809, "lr": 2.573177902642726e-07, "epoch": 11.8, "percentage": 90.77, "elapsed_time": "0:38:46", "remaining_time": "0:03:56"}
119
+ {"current_steps": 119, "total_steps": 130, "loss": 0.1438, "lr": 2.1651789586287442e-07, "epoch": 11.9, "percentage": 91.54, "elapsed_time": "0:38:55", "remaining_time": "0:03:35"}
120
+ {"current_steps": 120, "total_steps": 130, "loss": 0.0711, "lr": 1.7916662733218848e-07, "epoch": 12.0, "percentage": 92.31, "elapsed_time": "0:39:02", "remaining_time": "0:03:15"}
121
+ {"current_steps": 121, "total_steps": 130, "loss": 0.1147, "lr": 1.4529091286973994e-07, "epoch": 12.1, "percentage": 93.08, "elapsed_time": "0:41:14", "remaining_time": "0:03:04"}