neginr commited on
Commit
3ed4a0e
·
verified ·
1 Parent(s): 2ff95a2

Training in progress, epoch 9

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7db1d536c29aa9a430cbd1c402fff4bdc773916299d56a1dfb3c2c0a8857211b
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c0aa8dc106145cfcbe0627f9aefe30d07a925693c8eb2cc27c1c82a73403ca25
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:393fab4cad92f0649f4fc5354651987441276008ab46e8f596be5c4b1114944d
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:185836b0c081caeb7d47427b2fe705067b8beccd4e9e1cb0f8acdb1c272f8e36
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:75d2259351b69758fd8692354e3adf9c3b4eb787fb943f5055a3cbd2f8854742
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:151b7498ee63d492c70bfca9583c45c6af20661d3c3bb68e6bf0e4a8476a8453
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:109ca82f49344452cf981157b2e05eb70a993e73a48819e587dc671b17d053c5
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:147077ecd4b7a712f80101af0524f00293005f51dd00c9fa6a9883ce32f88c8c
3
  size 1089994880
trainer_log.jsonl CHANGED
@@ -78,3 +78,25 @@
78
  {"current_steps": 78, "total_steps": 130, "loss": 0.1806, "lr": 4.131759111665349e-06, "epoch": 7.8, "percentage": 60.0, "elapsed_time": "0:24:08", "remaining_time": "0:16:05"}
79
  {"current_steps": 79, "total_steps": 130, "loss": 0.0962, "lr": 3.999871531119779e-06, "epoch": 7.9, "percentage": 60.77, "elapsed_time": "0:24:13", "remaining_time": "0:15:38"}
80
  {"current_steps": 80, "total_steps": 130, "loss": 0.2206, "lr": 3.86870498785139e-06, "epoch": 8.0, "percentage": 61.54, "elapsed_time": "0:24:25", "remaining_time": "0:15:15"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
78
  {"current_steps": 78, "total_steps": 130, "loss": 0.1806, "lr": 4.131759111665349e-06, "epoch": 7.8, "percentage": 60.0, "elapsed_time": "0:24:08", "remaining_time": "0:16:05"}
79
  {"current_steps": 79, "total_steps": 130, "loss": 0.0962, "lr": 3.999871531119779e-06, "epoch": 7.9, "percentage": 60.77, "elapsed_time": "0:24:13", "remaining_time": "0:15:38"}
80
  {"current_steps": 80, "total_steps": 130, "loss": 0.2206, "lr": 3.86870498785139e-06, "epoch": 8.0, "percentage": 61.54, "elapsed_time": "0:24:25", "remaining_time": "0:15:15"}
81
+ {"current_steps": 81, "total_steps": 130, "loss": 0.1653, "lr": 3.7383540456788915e-06, "epoch": 8.1, "percentage": 62.31, "elapsed_time": "0:26:34", "remaining_time": "0:16:04"}
82
+ {"current_steps": 82, "total_steps": 130, "loss": 0.0885, "lr": 3.6089126804177373e-06, "epoch": 8.2, "percentage": 63.08, "elapsed_time": "0:26:40", "remaining_time": "0:15:37"}
83
+ {"current_steps": 83, "total_steps": 130, "loss": 0.1024, "lr": 3.480474212128766e-06, "epoch": 8.3, "percentage": 63.85, "elapsed_time": "0:26:48", "remaining_time": "0:15:10"}
84
+ {"current_steps": 84, "total_steps": 130, "loss": 0.1749, "lr": 3.3531312378396026e-06, "epoch": 8.4, "percentage": 64.62, "elapsed_time": "0:26:57", "remaining_time": "0:14:45"}
85
+ {"current_steps": 85, "total_steps": 130, "loss": 0.1421, "lr": 3.226975564787322e-06, "epoch": 8.5, "percentage": 65.38, "elapsed_time": "0:27:05", "remaining_time": "0:14:20"}
86
+ {"current_steps": 86, "total_steps": 130, "loss": 0.1319, "lr": 3.1020981442305187e-06, "epoch": 8.6, "percentage": 66.15, "elapsed_time": "0:27:13", "remaining_time": "0:13:55"}
87
+ {"current_steps": 87, "total_steps": 130, "loss": 0.1755, "lr": 2.978589005878476e-06, "epoch": 8.7, "percentage": 66.92, "elapsed_time": "0:27:23", "remaining_time": "0:13:32"}
88
+ {"current_steps": 88, "total_steps": 130, "loss": 0.1519, "lr": 2.8565371929847286e-06, "epoch": 8.8, "percentage": 67.69, "elapsed_time": "0:27:34", "remaining_time": "0:13:09"}
89
+ {"current_steps": 89, "total_steps": 130, "loss": 0.1402, "lr": 2.736030698151815e-06, "epoch": 8.9, "percentage": 68.46, "elapsed_time": "0:27:43", "remaining_time": "0:12:46"}
90
+ {"current_steps": 90, "total_steps": 130, "loss": 0.091, "lr": 2.6171563998934605e-06, "epoch": 9.0, "percentage": 69.23, "elapsed_time": "0:27:51", "remaining_time": "0:12:22"}
91
+ {"current_steps": 91, "total_steps": 130, "loss": 0.0827, "lr": 2.5000000000000015e-06, "epoch": 9.1, "percentage": 70.0, "elapsed_time": "0:30:30", "remaining_time": "0:13:04"}
92
+ {"current_steps": 92, "total_steps": 130, "loss": 0.1305, "lr": 2.384645961752113e-06, "epoch": 9.2, "percentage": 70.77, "elapsed_time": "0:30:40", "remaining_time": "0:12:40"}
93
+ {"current_steps": 93, "total_steps": 130, "loss": 0.072, "lr": 2.2711774490274767e-06, "epoch": 9.3, "percentage": 71.54, "elapsed_time": "0:30:45", "remaining_time": "0:12:14"}
94
+ {"current_steps": 94, "total_steps": 130, "loss": 0.1218, "lr": 2.159676266344222e-06, "epoch": 9.4, "percentage": 72.31, "elapsed_time": "0:30:54", "remaining_time": "0:11:50"}
95
+ {"current_steps": 95, "total_steps": 130, "loss": 0.1264, "lr": 2.050222799884387e-06, "epoch": 9.5, "percentage": 73.08, "elapsed_time": "0:31:02", "remaining_time": "0:11:26"}
96
+ {"current_steps": 96, "total_steps": 130, "loss": 0.15, "lr": 1.942895959539939e-06, "epoch": 9.6, "percentage": 73.85, "elapsed_time": "0:31:10", "remaining_time": "0:11:02"}
97
+ {"current_steps": 97, "total_steps": 130, "loss": 0.098, "lr": 1.8377731220231144e-06, "epoch": 9.7, "percentage": 74.62, "elapsed_time": "0:31:17", "remaining_time": "0:10:38"}
98
+ {"current_steps": 98, "total_steps": 130, "loss": 0.1517, "lr": 1.7349300750820758e-06, "epoch": 9.8, "percentage": 75.38, "elapsed_time": "0:31:25", "remaining_time": "0:10:15"}
99
+ {"current_steps": 99, "total_steps": 130, "loss": 0.0969, "lr": 1.6344409628621482e-06, "epoch": 9.9, "percentage": 76.15, "elapsed_time": "0:31:33", "remaining_time": "0:09:52"}
100
+ {"current_steps": 100, "total_steps": 130, "loss": 0.1355, "lr": 1.5363782324520033e-06, "epoch": 10.0, "percentage": 76.92, "elapsed_time": "0:31:43", "remaining_time": "0:09:31"}
101
+ {"current_steps": 101, "total_steps": 130, "loss": 0.0391, "lr": 1.4408125816532981e-06, "epoch": 10.1, "percentage": 77.69, "elapsed_time": "0:33:48", "remaining_time": "0:09:42"}
102
+ {"current_steps": 102, "total_steps": 130, "loss": 0.1106, "lr": 1.347812908011485e-06, "epoch": 10.2, "percentage": 78.46, "elapsed_time": "0:33:59", "remaining_time": "0:09:19"}