ryanmarten commited on
Commit
3457200
·
verified ·
1 Parent(s): 2922dba

Training in progress, epoch 4

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9cdd30bf1b8715641dd55f940e79fc162b3523f4444db1f95223a33f900774e9
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1350fde116c6e6542edab91b188797dc5a9ee91a4da6db2195400dc6ec56f3b0
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:672733c75b97bbc3e0687a340b8e8fb69f8ef4f6fe16b87df0552e5440d29745
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3d5263f79024786cd7417c43f0ac20ef8d36fafc02a98d806b317776c20e2fe5
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bf848945b14caacbc8188d349b9d9ac43e201e6fc77c37fe7f8590698ef07bb7
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:66d322ec357c06709cd8e22aed7d9864d5a8e82d7d37501ea6d326f6e7fa5497
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c22144c5047ae5e1b0eeb64a3290567022478c52240cb1481e5998635dd3ed93
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d091913f400fbc0ddb7fb19abbd368909e24fad7e057b66bf61133d0f1ab2c2d
3
  size 1089994880
trainer_log.jsonl CHANGED
@@ -41,3 +41,13 @@
41
  {"current_steps": 41, "total_steps": 70, "loss": 0.5673, "lr": 8.756562953525151e-06, "epoch": 3.936, "percentage": 58.57, "elapsed_time": "1:24:42", "remaining_time": "0:59:55"}
42
  {"current_steps": 42, "total_steps": 70, "loss": 0.5655, "lr": 8.263518223330698e-06, "epoch": 4.032, "percentage": 60.0, "elapsed_time": "1:27:38", "remaining_time": "0:58:25"}
43
  {"current_steps": 43, "total_steps": 70, "loss": 0.5387, "lr": 7.774790660436857e-06, "epoch": 4.128, "percentage": 61.43, "elapsed_time": "1:29:33", "remaining_time": "0:56:13"}
 
 
 
 
 
 
 
 
 
 
 
41
  {"current_steps": 41, "total_steps": 70, "loss": 0.5673, "lr": 8.756562953525151e-06, "epoch": 3.936, "percentage": 58.57, "elapsed_time": "1:24:42", "remaining_time": "0:59:55"}
42
  {"current_steps": 42, "total_steps": 70, "loss": 0.5655, "lr": 8.263518223330698e-06, "epoch": 4.032, "percentage": 60.0, "elapsed_time": "1:27:38", "remaining_time": "0:58:25"}
43
  {"current_steps": 43, "total_steps": 70, "loss": 0.5387, "lr": 7.774790660436857e-06, "epoch": 4.128, "percentage": 61.43, "elapsed_time": "1:29:33", "remaining_time": "0:56:13"}
44
+ {"current_steps": 44, "total_steps": 70, "loss": 0.5444, "lr": 7.291595318569951e-06, "epoch": 4.224, "percentage": 62.86, "elapsed_time": "1:31:34", "remaining_time": "0:54:06"}
45
+ {"current_steps": 45, "total_steps": 70, "loss": 0.5435, "lr": 6.815133497483157e-06, "epoch": 4.32, "percentage": 64.29, "elapsed_time": "1:33:38", "remaining_time": "0:52:01"}
46
+ {"current_steps": 46, "total_steps": 70, "loss": 0.5304, "lr": 6.34658975633605e-06, "epoch": 4.416, "percentage": 65.71, "elapsed_time": "1:35:39", "remaining_time": "0:49:54"}
47
+ {"current_steps": 47, "total_steps": 70, "loss": 0.5202, "lr": 5.887128968693887e-06, "epoch": 4.5120000000000005, "percentage": 67.14, "elapsed_time": "1:37:42", "remaining_time": "0:47:48"}
48
+ {"current_steps": 48, "total_steps": 70, "loss": 0.5011, "lr": 5.43789342646837e-06, "epoch": 4.608, "percentage": 68.57, "elapsed_time": "1:39:36", "remaining_time": "0:45:39"}
49
+ {"current_steps": 49, "total_steps": 70, "loss": 0.547, "lr": 5.000000000000003e-06, "epoch": 4.704, "percentage": 70.0, "elapsed_time": "1:41:29", "remaining_time": "0:43:29"}
50
+ {"current_steps": 50, "total_steps": 70, "loss": 0.5212, "lr": 4.5745373613424075e-06, "epoch": 4.8, "percentage": 71.43, "elapsed_time": "1:43:35", "remaining_time": "0:41:26"}
51
+ {"current_steps": 51, "total_steps": 70, "loss": 0.5275, "lr": 4.162563277652104e-06, "epoch": 4.896, "percentage": 72.86, "elapsed_time": "1:45:37", "remaining_time": "0:39:20"}
52
+ {"current_steps": 52, "total_steps": 70, "loss": 0.5189, "lr": 3.7651019814126656e-06, "epoch": 4.992, "percentage": 74.29, "elapsed_time": "1:47:45", "remaining_time": "0:37:18"}
53
+ {"current_steps": 53, "total_steps": 70, "loss": 0.5069, "lr": 3.3831416240314085e-06, "epoch": 5.088, "percentage": 75.71, "elapsed_time": "1:50:40", "remaining_time": "0:35:30"}