ryanmarten commited on
Commit
ff3ff5f
·
verified ·
1 Parent(s): c88aff6

Training in progress, epoch 5

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2d44f09662157e5960f3dff45b5f860fc7e9a9ef64caf13ddb41a12d6b793302
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:42c7493a33ba4ec6e48b06b6db132a06df177db8d00972433b7a58023d618140
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7be9c4f7e1b71da200beabf3814be15a0e57f92a17716fd3753bcfe2240ae7f8
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:77af113ae38d1f5152c452bc84888f32fa81b110f54a6b465c3e1d04e2278015
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7614690f51473e70495ddc23f412ca351eab4fa613aed839c75f508c9182e516
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:632c9cc1003fa58bbbab4c0b7d06e17b820b5d7def2ee2df506a277f6ec3f731
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9a30c54d4547aad32c6ba38e52718f5b2660b96a445096ce715c658ccf6a39cd
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d9e653ab2d8d7a1590bda3f5e7b5313a2b5322d5c0ddbecbd235a8cc9cf426a3
3
  size 1089994880
trainer_log.jsonl CHANGED
@@ -51,3 +51,14 @@
51
  {"current_steps": 51, "total_steps": 70, "loss": 0.5161, "lr": 4.162563277652104e-06, "epoch": 4.896, "percentage": 72.86, "elapsed_time": "1:45:13", "remaining_time": "0:39:11"}
52
  {"current_steps": 52, "total_steps": 70, "loss": 0.5304, "lr": 3.7651019814126656e-06, "epoch": 4.992, "percentage": 74.29, "elapsed_time": "1:46:57", "remaining_time": "0:37:01"}
53
  {"current_steps": 53, "total_steps": 70, "loss": 0.5299, "lr": 3.3831416240314085e-06, "epoch": 5.088, "percentage": 75.71, "elapsed_time": "1:49:45", "remaining_time": "0:35:12"}
 
 
 
 
 
 
 
 
 
 
 
 
51
  {"current_steps": 51, "total_steps": 70, "loss": 0.5161, "lr": 4.162563277652104e-06, "epoch": 4.896, "percentage": 72.86, "elapsed_time": "1:45:13", "remaining_time": "0:39:11"}
52
  {"current_steps": 52, "total_steps": 70, "loss": 0.5304, "lr": 3.7651019814126656e-06, "epoch": 4.992, "percentage": 74.29, "elapsed_time": "1:46:57", "remaining_time": "0:37:01"}
53
  {"current_steps": 53, "total_steps": 70, "loss": 0.5299, "lr": 3.3831416240314085e-06, "epoch": 5.088, "percentage": 75.71, "elapsed_time": "1:49:45", "remaining_time": "0:35:12"}
54
+ {"current_steps": 54, "total_steps": 70, "loss": 0.511, "lr": 3.017631819139273e-06, "epoch": 5.184, "percentage": 77.14, "elapsed_time": "1:51:47", "remaining_time": "0:33:07"}
55
+ {"current_steps": 55, "total_steps": 70, "loss": 0.5149, "lr": 2.669481281701739e-06, "epoch": 5.28, "percentage": 78.57, "elapsed_time": "1:53:45", "remaining_time": "0:31:01"}
56
+ {"current_steps": 56, "total_steps": 70, "loss": 0.4947, "lr": 2.339555568810221e-06, "epoch": 5.376, "percentage": 80.0, "elapsed_time": "1:55:42", "remaining_time": "0:28:55"}
57
+ {"current_steps": 57, "total_steps": 70, "loss": 0.4909, "lr": 2.0286749277707783e-06, "epoch": 5.4719999999999995, "percentage": 81.43, "elapsed_time": "1:57:34", "remaining_time": "0:26:49"}
58
+ {"current_steps": 58, "total_steps": 70, "loss": 0.508, "lr": 1.7376122568400533e-06, "epoch": 5.568, "percentage": 82.86, "elapsed_time": "1:59:31", "remaining_time": "0:24:43"}
59
+ {"current_steps": 59, "total_steps": 70, "loss": 0.506, "lr": 1.467091183678444e-06, "epoch": 5.664, "percentage": 84.29, "elapsed_time": "2:01:27", "remaining_time": "0:22:38"}
60
+ {"current_steps": 60, "total_steps": 70, "loss": 0.5173, "lr": 1.2177842662977136e-06, "epoch": 5.76, "percentage": 85.71, "elapsed_time": "2:03:24", "remaining_time": "0:20:34"}
61
+ {"current_steps": 61, "total_steps": 70, "loss": 0.4913, "lr": 9.903113209758098e-07, "epoch": 5.856, "percentage": 87.14, "elapsed_time": "2:05:19", "remaining_time": "0:18:29"}
62
+ {"current_steps": 62, "total_steps": 70, "loss": 0.5044, "lr": 7.852378812959227e-07, "epoch": 5.952, "percentage": 88.57, "elapsed_time": "2:07:21", "remaining_time": "0:16:25"}
63
+ {"current_steps": 63, "total_steps": 70, "loss": 0.4999, "lr": 6.030737921409169e-07, "epoch": 6.048, "percentage": 90.0, "elapsed_time": "2:10:35", "remaining_time": "0:14:30"}
64
+ {"current_steps": 64, "total_steps": 70, "loss": 0.5107, "lr": 4.4427194213859216e-07, "epoch": 6.144, "percentage": 91.43, "elapsed_time": "2:12:37", "remaining_time": "0:12:26"}