ryanmarten commited on
Commit
835a7b1
·
verified ·
1 Parent(s): ac1cd01

Training in progress, epoch 2

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:635163bcb7a7d1d963ff50b7c0dcd8a0776dae208395df6140a9524a8faef878
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6ae6632db935fe8767eb8f15a698cd68df7cbf076b23b1b7dea60b01b45d8d8d
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6ad75a633044b8702576ee6127b12e4b40d60593c099bf33784f09efe7bbab9b
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b31bc0fbdc7d6944483a7d48a6055e56bf60209382effd724e988e142fc10ee6
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a40b16a0702a4acdc8fd02aa8e11e91edd4faac79c5a8c3a395358ce2b985283
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0d437bf016abeba62caeecc4dbb489eaf6eb0b5351401c57c98ba4f66725a191
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:36d85f05f0906df5f631e9742da0b5d97026a6e62691de0522a431cbd6dc6af6
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e43341690e9b9182f71892bbcd674ed499fcb7012f1328fae7c5abf1a231f30c
3
  size 1089994880
trainer_log.jsonl CHANGED
@@ -20,3 +20,14 @@
20
  {"current_steps": 20, "total_steps": 70, "loss": 0.6891, "lr": 1.7971325072229227e-05, "epoch": 1.92, "percentage": 28.57, "elapsed_time": "0:40:54", "remaining_time": "1:42:15"}
21
  {"current_steps": 21, "total_steps": 70, "loss": 0.6961, "lr": 1.766044443118978e-05, "epoch": 2.016, "percentage": 30.0, "elapsed_time": "0:43:34", "remaining_time": "1:41:39"}
22
  {"current_steps": 22, "total_steps": 70, "loss": 0.649, "lr": 1.7330518718298263e-05, "epoch": 2.112, "percentage": 31.43, "elapsed_time": "0:45:11", "remaining_time": "1:38:36"}
 
 
 
 
 
 
 
 
 
 
 
 
20
  {"current_steps": 20, "total_steps": 70, "loss": 0.6891, "lr": 1.7971325072229227e-05, "epoch": 1.92, "percentage": 28.57, "elapsed_time": "0:40:54", "remaining_time": "1:42:15"}
21
  {"current_steps": 21, "total_steps": 70, "loss": 0.6961, "lr": 1.766044443118978e-05, "epoch": 2.016, "percentage": 30.0, "elapsed_time": "0:43:34", "remaining_time": "1:41:39"}
22
  {"current_steps": 22, "total_steps": 70, "loss": 0.649, "lr": 1.7330518718298263e-05, "epoch": 2.112, "percentage": 31.43, "elapsed_time": "0:45:11", "remaining_time": "1:38:36"}
23
+ {"current_steps": 23, "total_steps": 70, "loss": 0.6771, "lr": 1.698236818086073e-05, "epoch": 2.208, "percentage": 32.86, "elapsed_time": "0:47:07", "remaining_time": "1:36:18"}
24
+ {"current_steps": 24, "total_steps": 70, "loss": 0.6587, "lr": 1.6616858375968596e-05, "epoch": 2.304, "percentage": 34.29, "elapsed_time": "0:49:12", "remaining_time": "1:34:18"}
25
+ {"current_steps": 25, "total_steps": 70, "loss": 0.6357, "lr": 1.6234898018587336e-05, "epoch": 2.4, "percentage": 35.71, "elapsed_time": "0:51:11", "remaining_time": "1:32:09"}
26
+ {"current_steps": 26, "total_steps": 70, "loss": 0.6431, "lr": 1.5837436722347902e-05, "epoch": 2.496, "percentage": 37.14, "elapsed_time": "0:53:16", "remaining_time": "1:30:09"}
27
+ {"current_steps": 27, "total_steps": 70, "loss": 0.6341, "lr": 1.5425462638657597e-05, "epoch": 2.592, "percentage": 38.57, "elapsed_time": "0:55:18", "remaining_time": "1:28:04"}
28
+ {"current_steps": 28, "total_steps": 70, "loss": 0.6476, "lr": 1.5000000000000002e-05, "epoch": 2.6879999999999997, "percentage": 40.0, "elapsed_time": "0:57:12", "remaining_time": "1:25:49"}
29
+ {"current_steps": 29, "total_steps": 70, "loss": 0.624, "lr": 1.4562106573531632e-05, "epoch": 2.784, "percentage": 41.43, "elapsed_time": "0:59:08", "remaining_time": "1:23:36"}
30
+ {"current_steps": 30, "total_steps": 70, "loss": 0.6233, "lr": 1.4112871031306118e-05, "epoch": 2.88, "percentage": 42.86, "elapsed_time": "1:01:11", "remaining_time": "1:21:35"}
31
+ {"current_steps": 31, "total_steps": 70, "loss": 0.6252, "lr": 1.3653410243663953e-05, "epoch": 2.976, "percentage": 44.29, "elapsed_time": "1:03:16", "remaining_time": "1:19:36"}
32
+ {"current_steps": 32, "total_steps": 70, "loss": 0.5995, "lr": 1.3184866502516846e-05, "epoch": 3.072, "percentage": 45.71, "elapsed_time": "1:05:58", "remaining_time": "1:18:20"}
33
+ {"current_steps": 33, "total_steps": 70, "loss": 0.5774, "lr": 1.2708404681430054e-05, "epoch": 3.168, "percentage": 47.14, "elapsed_time": "1:08:05", "remaining_time": "1:16:20"}