ryanmarten committed on
Commit
6dbf2fd
·
verified ·
1 Parent(s): a309f54

Training in progress, epoch 4

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bfabf51a239eee52ce41b20fa5cfdee053e9a7c6a801030e9f254dd48fb9741d
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f06a720863f4ca713417da724c11294611de92f9d2f6e4b942c6e317cbe4eb3a
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:dbcc28d0a2607ea22c9fc14df617a156f1f522f35d1f02d056bc0e491ba96923
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:58998596806d58c56a33d126d5d66ef89c01bb4c52676922e0cb01b2d3ec34b8
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f29d3efacb771ffd70ca339dc9c426315e2a963272df34d428ce18ace11f0e17
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:67b320e018a50596ec6a11c47ab21068a70a567e737da3d184c030910661a52b
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d5c5118e96f1ba9711d2287cacdef9ec4727f740ee3e1cbba1f4c24f40db07ea
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:76394e8a4635bbf2309739dc3f034ce678afd6785059d988b4a8ab60e4c70360
3
  size 1089994880
trainer_log.jsonl CHANGED
@@ -51,3 +51,13 @@
51
  {"current_steps": 43, "total_steps": 70, "loss": 0.2231, "lr": 7.774790660436857e-06, "epoch": 4.128, "percentage": 61.43, "elapsed_time": "0:43:56", "remaining_time": "0:27:35"}
52
  {"current_steps": 44, "total_steps": 70, "loss": 0.2397, "lr": 7.291595318569951e-06, "epoch": 4.224, "percentage": 62.86, "elapsed_time": "0:44:59", "remaining_time": "0:26:35"}
53
  {"current_steps": 45, "total_steps": 70, "loss": 0.238, "lr": 6.815133497483157e-06, "epoch": 4.32, "percentage": 64.29, "elapsed_time": "0:45:57", "remaining_time": "0:25:32"}
 
 
 
 
 
 
 
 
 
 
 
51
  {"current_steps": 43, "total_steps": 70, "loss": 0.2231, "lr": 7.774790660436857e-06, "epoch": 4.128, "percentage": 61.43, "elapsed_time": "0:43:56", "remaining_time": "0:27:35"}
52
  {"current_steps": 44, "total_steps": 70, "loss": 0.2397, "lr": 7.291595318569951e-06, "epoch": 4.224, "percentage": 62.86, "elapsed_time": "0:44:59", "remaining_time": "0:26:35"}
53
  {"current_steps": 45, "total_steps": 70, "loss": 0.238, "lr": 6.815133497483157e-06, "epoch": 4.32, "percentage": 64.29, "elapsed_time": "0:45:57", "remaining_time": "0:25:32"}
54
+ {"current_steps": 46, "total_steps": 70, "loss": 0.223, "lr": 6.34658975633605e-06, "epoch": 4.416, "percentage": 65.71, "elapsed_time": "0:47:03", "remaining_time": "0:24:33"}
55
+ {"current_steps": 47, "total_steps": 70, "loss": 0.1976, "lr": 5.887128968693887e-06, "epoch": 4.5120000000000005, "percentage": 67.14, "elapsed_time": "0:47:57", "remaining_time": "0:23:28"}
56
+ {"current_steps": 48, "total_steps": 70, "loss": 0.2047, "lr": 5.43789342646837e-06, "epoch": 4.608, "percentage": 68.57, "elapsed_time": "0:48:50", "remaining_time": "0:22:22"}
57
+ {"current_steps": 49, "total_steps": 70, "loss": 0.2146, "lr": 5.000000000000003e-06, "epoch": 4.704, "percentage": 70.0, "elapsed_time": "0:49:44", "remaining_time": "0:21:18"}
58
+ {"current_steps": 50, "total_steps": 70, "loss": 0.1875, "lr": 4.5745373613424075e-06, "epoch": 4.8, "percentage": 71.43, "elapsed_time": "0:50:35", "remaining_time": "0:20:14"}
59
+ {"current_steps": 51, "total_steps": 70, "loss": 0.2125, "lr": 4.162563277652104e-06, "epoch": 4.896, "percentage": 72.86, "elapsed_time": "0:51:33", "remaining_time": "0:19:12"}
60
+ {"current_steps": 52, "total_steps": 70, "loss": 0.1935, "lr": 3.7651019814126656e-06, "epoch": 4.992, "percentage": 74.29, "elapsed_time": "0:52:26", "remaining_time": "0:18:09"}
61
+ {"current_steps": 53, "total_steps": 70, "loss": 0.1889, "lr": 3.3831416240314085e-06, "epoch": 5.088, "percentage": 75.71, "elapsed_time": "0:54:31", "remaining_time": "0:17:29"}
62
+ {"current_steps": 54, "total_steps": 70, "loss": 0.1604, "lr": 3.017631819139273e-06, "epoch": 5.184, "percentage": 77.14, "elapsed_time": "0:55:27", "remaining_time": "0:16:25"}
63
+ {"current_steps": 55, "total_steps": 70, "loss": 0.1715, "lr": 2.669481281701739e-06, "epoch": 5.28, "percentage": 78.57, "elapsed_time": "0:56:17", "remaining_time": "0:15:21"}