ryanmarten commited on
Commit
1ecba6c
·
verified ·
1 Parent(s): 35e50a6

Training in progress, epoch 8

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9262da9886ebf1663081967593e5549415847952558ee1d648c23fd8d7863c28
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9fa0e365f18e93793b0a880903b2a76e74451034c5f75512e69e038e6ffebc5f
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f7845f47659305da081eb8e598fe30d2546ceaf4c06b23ad08b717c30892ca57
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d2ec6ccdded93523b413511481dfb42cf7cc2a0e3aeb36b2fd97d92ece781347
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1b25d79aa43cac7d1a9dc628267457a149d7cd21e14fde8afd001099bbb18fdb
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c8143c6cfe75bd5d8d341bfacdb15436653e1e4d5afb71291eee72b00120fc25
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:681e745bcaf4aef5ad23ec4ef0fef065112c52764d78983f7e0169cf4eb6f831
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5959a25860f1725d15f7aa7626f28cb82d415b8761455aae7ac374684d5bcaa9
3
  size 1089994880
trainer_log.jsonl CHANGED
@@ -79,3 +79,13 @@
79
  {"current_steps": 79, "total_steps": 117, "loss": 0.2925, "lr": 2.8982138584521734e-06, "epoch": 8.30379746835443, "percentage": 67.52, "elapsed_time": "0:49:15", "remaining_time": "0:23:41"}
80
  {"current_steps": 80, "total_steps": 117, "loss": 0.3337, "lr": 2.7634342584218364e-06, "epoch": 8.405063291139241, "percentage": 68.38, "elapsed_time": "0:49:51", "remaining_time": "0:23:03"}
81
  {"current_steps": 81, "total_steps": 117, "loss": 0.3679, "lr": 2.6306566876350072e-06, "epoch": 8.50632911392405, "percentage": 69.23, "elapsed_time": "0:50:19", "remaining_time": "0:22:22"}
 
 
 
 
 
 
 
 
 
 
 
79
  {"current_steps": 79, "total_steps": 117, "loss": 0.2925, "lr": 2.8982138584521734e-06, "epoch": 8.30379746835443, "percentage": 67.52, "elapsed_time": "0:49:15", "remaining_time": "0:23:41"}
80
  {"current_steps": 80, "total_steps": 117, "loss": 0.3337, "lr": 2.7634342584218364e-06, "epoch": 8.405063291139241, "percentage": 68.38, "elapsed_time": "0:49:51", "remaining_time": "0:23:03"}
81
  {"current_steps": 81, "total_steps": 117, "loss": 0.3679, "lr": 2.6306566876350072e-06, "epoch": 8.50632911392405, "percentage": 69.23, "elapsed_time": "0:50:19", "remaining_time": "0:22:22"}
82
+ {"current_steps": 82, "total_steps": 117, "loss": 0.3498, "lr": 2.5000000000000015e-06, "epoch": 8.60759493670886, "percentage": 70.09, "elapsed_time": "0:50:55", "remaining_time": "0:21:44"}
83
+ {"current_steps": 83, "total_steps": 117, "loss": 0.35, "lr": 2.371581150947476e-06, "epoch": 8.708860759493671, "percentage": 70.94, "elapsed_time": "0:51:31", "remaining_time": "0:21:06"}
84
+ {"current_steps": 84, "total_steps": 117, "loss": 0.3702, "lr": 2.245515092739488e-06, "epoch": 8.810126582278482, "percentage": 71.79, "elapsed_time": "0:51:57", "remaining_time": "0:20:24"}
85
+ {"current_steps": 85, "total_steps": 117, "loss": 0.3309, "lr": 2.1219146715716332e-06, "epoch": 8.91139240506329, "percentage": 72.65, "elapsed_time": "0:52:24", "remaining_time": "0:19:43"}
86
+ {"current_steps": 86, "total_steps": 117, "loss": 0.3211, "lr": 2.0008905265604316e-06, "epoch": 9.050632911392405, "percentage": 73.5, "elapsed_time": "0:54:05", "remaining_time": "0:19:29"}
87
+ {"current_steps": 87, "total_steps": 117, "loss": 0.3193, "lr": 1.8825509907063328e-06, "epoch": 9.151898734177216, "percentage": 74.36, "elapsed_time": "0:54:36", "remaining_time": "0:18:49"}
88
+ {"current_steps": 88, "total_steps": 117, "loss": 0.27, "lr": 1.7670019939210025e-06, "epoch": 9.253164556962025, "percentage": 75.21, "elapsed_time": "0:55:10", "remaining_time": "0:18:11"}
89
+ {"current_steps": 89, "total_steps": 117, "loss": 0.3201, "lr": 1.6543469682057105e-06, "epoch": 9.354430379746836, "percentage": 76.07, "elapsed_time": "0:55:45", "remaining_time": "0:17:32"}
90
+ {"current_steps": 90, "total_steps": 117, "loss": 0.3328, "lr": 1.544686755065677e-06, "epoch": 9.455696202531646, "percentage": 76.92, "elapsed_time": "0:56:16", "remaining_time": "0:16:52"}
91
+ {"current_steps": 91, "total_steps": 117, "loss": 0.3224, "lr": 1.438119515243277e-06, "epoch": 9.556962025316455, "percentage": 77.78, "elapsed_time": "0:56:47", "remaining_time": "0:16:13"}