ryanmarten commited on
Commit
bb9e1a0
·
verified ·
1 Parent(s): 28784b6

Training in progress, epoch 4

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1ee828c8a7fefd40f2d899c3ade025279777c28d7f74b7ffe93ae09352b62c3c
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b64a2e060c02e5998029a1062b231061fde8e3b07e988005609bab42a73c836e
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:35c94e51c379f320c9d1ef9d86eef5cb75a72ecb77b9b81d4718b36a08d2a449
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dd675075364758ae35437300b79d53cdeee1a1f0e2bcc67b25457cbb0c6c7eea
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c3f53920ee60b5ac9aab09cdf60f53e0476a89977d708c60ff1f2440665d158a
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:00fc671eb1fc2417a28dcf97a4a0bbb07484a609dc5a30dfa0a977f2668e30bb
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:856e02aee48e8e9daa7a39e07dcedfea50c9b66a93d93d593bbd251b9dc1d490
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c1ead2a965db3c156e3c9c553ea2d326cf12f7aea2c19b1fa540ed5a28e3288e
3
  size 1089994880
trainer_log.jsonl CHANGED
@@ -42,3 +42,14 @@
42
  {"current_steps": 42, "total_steps": 70, "loss": 0.2663, "lr": 8.263518223330698e-06, "epoch": 4.032, "percentage": 60.0, "elapsed_time": "0:50:55", "remaining_time": "0:33:57"}
43
  {"current_steps": 43, "total_steps": 70, "loss": 0.2544, "lr": 7.774790660436857e-06, "epoch": 4.128, "percentage": 61.43, "elapsed_time": "0:52:02", "remaining_time": "0:32:40"}
44
  {"current_steps": 44, "total_steps": 70, "loss": 0.2319, "lr": 7.291595318569951e-06, "epoch": 4.224, "percentage": 62.86, "elapsed_time": "0:53:00", "remaining_time": "0:31:19"}
 
 
 
 
 
 
 
 
 
 
 
 
42
  {"current_steps": 42, "total_steps": 70, "loss": 0.2663, "lr": 8.263518223330698e-06, "epoch": 4.032, "percentage": 60.0, "elapsed_time": "0:50:55", "remaining_time": "0:33:57"}
43
  {"current_steps": 43, "total_steps": 70, "loss": 0.2544, "lr": 7.774790660436857e-06, "epoch": 4.128, "percentage": 61.43, "elapsed_time": "0:52:02", "remaining_time": "0:32:40"}
44
  {"current_steps": 44, "total_steps": 70, "loss": 0.2319, "lr": 7.291595318569951e-06, "epoch": 4.224, "percentage": 62.86, "elapsed_time": "0:53:00", "remaining_time": "0:31:19"}
45
+ {"current_steps": 45, "total_steps": 70, "loss": 0.2402, "lr": 6.815133497483157e-06, "epoch": 4.32, "percentage": 64.29, "elapsed_time": "0:54:01", "remaining_time": "0:30:01"}
46
+ {"current_steps": 46, "total_steps": 70, "loss": 0.2477, "lr": 6.34658975633605e-06, "epoch": 4.416, "percentage": 65.71, "elapsed_time": "0:55:28", "remaining_time": "0:28:56"}
47
+ {"current_steps": 47, "total_steps": 70, "loss": 0.2338, "lr": 5.887128968693887e-06, "epoch": 4.5120000000000005, "percentage": 67.14, "elapsed_time": "0:56:28", "remaining_time": "0:27:38"}
48
+ {"current_steps": 48, "total_steps": 70, "loss": 0.2279, "lr": 5.43789342646837e-06, "epoch": 4.608, "percentage": 68.57, "elapsed_time": "0:57:34", "remaining_time": "0:26:23"}
49
+ {"current_steps": 49, "total_steps": 70, "loss": 0.2252, "lr": 5.000000000000003e-06, "epoch": 4.704, "percentage": 70.0, "elapsed_time": "0:58:42", "remaining_time": "0:25:09"}
50
+ {"current_steps": 50, "total_steps": 70, "loss": 0.2521, "lr": 4.5745373613424075e-06, "epoch": 4.8, "percentage": 71.43, "elapsed_time": "0:59:52", "remaining_time": "0:23:56"}
51
+ {"current_steps": 51, "total_steps": 70, "loss": 0.2464, "lr": 4.162563277652104e-06, "epoch": 4.896, "percentage": 72.86, "elapsed_time": "1:01:05", "remaining_time": "0:22:45"}
52
+ {"current_steps": 52, "total_steps": 70, "loss": 0.2124, "lr": 3.7651019814126656e-06, "epoch": 4.992, "percentage": 74.29, "elapsed_time": "1:02:09", "remaining_time": "0:21:30"}
53
+ {"current_steps": 53, "total_steps": 70, "loss": 0.2163, "lr": 3.3831416240314085e-06, "epoch": 5.088, "percentage": 75.71, "elapsed_time": "1:04:18", "remaining_time": "0:20:37"}
54
+ {"current_steps": 54, "total_steps": 70, "loss": 0.2113, "lr": 3.017631819139273e-06, "epoch": 5.184, "percentage": 77.14, "elapsed_time": "1:05:18", "remaining_time": "0:19:20"}
55
+ {"current_steps": 55, "total_steps": 70, "loss": 0.1909, "lr": 2.669481281701739e-06, "epoch": 5.28, "percentage": 78.57, "elapsed_time": "1:06:18", "remaining_time": "0:18:05"}