ryanmarten committed on
Commit
cb02fcd
·
verified ·
1 Parent(s): c00361c

Training in progress, epoch 4

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c44d12cc1185635f05157a7f6718cdce412027b542cb9b6de06753577ef99458
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:949d9cf7e79996d90f5b52e9f5a8ff9e89d7b5ddbb7500d35609d5aa1ef7df07
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:83b289a95cd82c3c12dc54d54730101ba8edee36330961b05e3a78e03acb241e
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:24bb98f203c12aa28300a8a65902c605db4fe59274a950b22e3388812b42be30
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:078c63c69677a04af59b7ccb1d1a1285b9cd469f246aa8ba3984e075270cc835
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d75fcf09d456fcc9f8305c70863a51ce9ef048f8894bd6b0c53a5b93b6359653
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d5bad2cabf29bc0122d71bbbde3afae4b56336b20c4515551a0ebf8ff70fdf04
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fd6be055368e57db28b37cd8524045cdc8edd1a378bb76d7c9fca55c82788579
3
  size 1089994880
trainer_log.jsonl CHANGED
@@ -41,3 +41,13 @@
41
  {"current_steps": 41, "total_steps": 70, "loss": 0.5491, "lr": 8.756562953525151e-06, "epoch": 3.936, "percentage": 58.57, "elapsed_time": "1:26:25", "remaining_time": "1:01:07"}
42
  {"current_steps": 42, "total_steps": 70, "loss": 0.5528, "lr": 8.263518223330698e-06, "epoch": 4.032, "percentage": 60.0, "elapsed_time": "1:29:20", "remaining_time": "0:59:33"}
43
  {"current_steps": 43, "total_steps": 70, "loss": 0.5261, "lr": 7.774790660436857e-06, "epoch": 4.128, "percentage": 61.43, "elapsed_time": "1:31:11", "remaining_time": "0:57:15"}
 
 
 
 
 
 
 
 
 
 
 
41
  {"current_steps": 41, "total_steps": 70, "loss": 0.5491, "lr": 8.756562953525151e-06, "epoch": 3.936, "percentage": 58.57, "elapsed_time": "1:26:25", "remaining_time": "1:01:07"}
42
  {"current_steps": 42, "total_steps": 70, "loss": 0.5528, "lr": 8.263518223330698e-06, "epoch": 4.032, "percentage": 60.0, "elapsed_time": "1:29:20", "remaining_time": "0:59:33"}
43
  {"current_steps": 43, "total_steps": 70, "loss": 0.5261, "lr": 7.774790660436857e-06, "epoch": 4.128, "percentage": 61.43, "elapsed_time": "1:31:11", "remaining_time": "0:57:15"}
44
+ {"current_steps": 44, "total_steps": 70, "loss": 0.5201, "lr": 7.291595318569951e-06, "epoch": 4.224, "percentage": 62.86, "elapsed_time": "1:33:17", "remaining_time": "0:55:07"}
45
+ {"current_steps": 45, "total_steps": 70, "loss": 0.5307, "lr": 6.815133497483157e-06, "epoch": 4.32, "percentage": 64.29, "elapsed_time": "1:35:14", "remaining_time": "0:52:54"}
46
+ {"current_steps": 46, "total_steps": 70, "loss": 0.5452, "lr": 6.34658975633605e-06, "epoch": 4.416, "percentage": 65.71, "elapsed_time": "1:37:17", "remaining_time": "0:50:45"}
47
+ {"current_steps": 47, "total_steps": 70, "loss": 0.5552, "lr": 5.887128968693887e-06, "epoch": 4.5120000000000005, "percentage": 67.14, "elapsed_time": "1:39:08", "remaining_time": "0:48:31"}
48
+ {"current_steps": 48, "total_steps": 70, "loss": 0.527, "lr": 5.43789342646837e-06, "epoch": 4.608, "percentage": 68.57, "elapsed_time": "1:41:17", "remaining_time": "0:46:25"}
49
+ {"current_steps": 49, "total_steps": 70, "loss": 0.5367, "lr": 5.000000000000003e-06, "epoch": 4.704, "percentage": 70.0, "elapsed_time": "1:43:27", "remaining_time": "0:44:20"}
50
+ {"current_steps": 50, "total_steps": 70, "loss": 0.5246, "lr": 4.5745373613424075e-06, "epoch": 4.8, "percentage": 71.43, "elapsed_time": "1:45:18", "remaining_time": "0:42:07"}
51
+ {"current_steps": 51, "total_steps": 70, "loss": 0.5119, "lr": 4.162563277652104e-06, "epoch": 4.896, "percentage": 72.86, "elapsed_time": "1:47:16", "remaining_time": "0:39:57"}
52
+ {"current_steps": 52, "total_steps": 70, "loss": 0.5245, "lr": 3.7651019814126656e-06, "epoch": 4.992, "percentage": 74.29, "elapsed_time": "1:49:32", "remaining_time": "0:37:55"}
53
+ {"current_steps": 53, "total_steps": 70, "loss": 0.5077, "lr": 3.3831416240314085e-06, "epoch": 5.088, "percentage": 75.71, "elapsed_time": "1:52:28", "remaining_time": "0:36:04"}