ryanmarten committed on
Commit
c88aff6
·
verified ·
1 Parent(s): acd039a

Training in progress, epoch 4

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:812b091a86c552b9e4d8012b096f19ed3f2ae7cce006904657bae356995abc59
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2d44f09662157e5960f3dff45b5f860fc7e9a9ef64caf13ddb41a12d6b793302
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3beb3962aead30369444bd090562ab43145f909efe107da23faf6e737987eb78
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7be9c4f7e1b71da200beabf3814be15a0e57f92a17716fd3753bcfe2240ae7f8
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c19ab23918f855c73c1300a554c31d68ca10d947c536c1b304da868fb66103da
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7614690f51473e70495ddc23f412ca351eab4fa613aed839c75f508c9182e516
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2b3748b76712c13be4a3a3461f2de0f25c342af59b2e7b1d465fa6f1f84a51bb
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9a30c54d4547aad32c6ba38e52718f5b2660b96a445096ce715c658ccf6a39cd
3
  size 1089994880
trainer_log.jsonl CHANGED
@@ -41,3 +41,13 @@
41
  {"current_steps": 41, "total_steps": 70, "loss": 0.5795, "lr": 8.756562953525151e-06, "epoch": 3.936, "percentage": 58.57, "elapsed_time": "1:24:18", "remaining_time": "0:59:38"}
42
  {"current_steps": 42, "total_steps": 70, "loss": 0.5616, "lr": 8.263518223330698e-06, "epoch": 4.032, "percentage": 60.0, "elapsed_time": "1:27:05", "remaining_time": "0:58:03"}
43
  {"current_steps": 43, "total_steps": 70, "loss": 0.5312, "lr": 7.774790660436857e-06, "epoch": 4.128, "percentage": 61.43, "elapsed_time": "1:29:11", "remaining_time": "0:56:00"}
 
 
 
 
 
 
 
 
 
 
 
41
  {"current_steps": 41, "total_steps": 70, "loss": 0.5795, "lr": 8.756562953525151e-06, "epoch": 3.936, "percentage": 58.57, "elapsed_time": "1:24:18", "remaining_time": "0:59:38"}
42
  {"current_steps": 42, "total_steps": 70, "loss": 0.5616, "lr": 8.263518223330698e-06, "epoch": 4.032, "percentage": 60.0, "elapsed_time": "1:27:05", "remaining_time": "0:58:03"}
43
  {"current_steps": 43, "total_steps": 70, "loss": 0.5312, "lr": 7.774790660436857e-06, "epoch": 4.128, "percentage": 61.43, "elapsed_time": "1:29:11", "remaining_time": "0:56:00"}
44
+ {"current_steps": 44, "total_steps": 70, "loss": 0.5379, "lr": 7.291595318569951e-06, "epoch": 4.224, "percentage": 62.86, "elapsed_time": "1:31:07", "remaining_time": "0:53:50"}
45
+ {"current_steps": 45, "total_steps": 70, "loss": 0.5334, "lr": 6.815133497483157e-06, "epoch": 4.32, "percentage": 64.29, "elapsed_time": "1:33:00", "remaining_time": "0:51:40"}
46
+ {"current_steps": 46, "total_steps": 70, "loss": 0.528, "lr": 6.34658975633605e-06, "epoch": 4.416, "percentage": 65.71, "elapsed_time": "1:35:01", "remaining_time": "0:49:34"}
47
+ {"current_steps": 47, "total_steps": 70, "loss": 0.5297, "lr": 5.887128968693887e-06, "epoch": 4.5120000000000005, "percentage": 67.14, "elapsed_time": "1:37:02", "remaining_time": "0:47:29"}
48
+ {"current_steps": 48, "total_steps": 70, "loss": 0.5571, "lr": 5.43789342646837e-06, "epoch": 4.608, "percentage": 68.57, "elapsed_time": "1:39:13", "remaining_time": "0:45:28"}
49
+ {"current_steps": 49, "total_steps": 70, "loss": 0.5411, "lr": 5.000000000000003e-06, "epoch": 4.704, "percentage": 70.0, "elapsed_time": "1:41:17", "remaining_time": "0:43:24"}
50
+ {"current_steps": 50, "total_steps": 70, "loss": 0.5274, "lr": 4.5745373613424075e-06, "epoch": 4.8, "percentage": 71.43, "elapsed_time": "1:43:15", "remaining_time": "0:41:18"}
51
+ {"current_steps": 51, "total_steps": 70, "loss": 0.5161, "lr": 4.162563277652104e-06, "epoch": 4.896, "percentage": 72.86, "elapsed_time": "1:45:13", "remaining_time": "0:39:11"}
52
+ {"current_steps": 52, "total_steps": 70, "loss": 0.5304, "lr": 3.7651019814126656e-06, "epoch": 4.992, "percentage": 74.29, "elapsed_time": "1:46:57", "remaining_time": "0:37:01"}
53
+ {"current_steps": 53, "total_steps": 70, "loss": 0.5299, "lr": 3.3831416240314085e-06, "epoch": 5.088, "percentage": 75.71, "elapsed_time": "1:49:45", "remaining_time": "0:35:12"}