ryanmarten commited on
Commit
d2834d3
·
verified ·
1 Parent(s): a001b1f

Training in progress, epoch 4

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ceaf2645bc4e1fbca3d3d3c8d074f20fb3186a81c043d4625624e98f2ff9d604
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f127dceba02fc9b07c228a91118a42004b54d375b110ea448c150d1f3ca0416e
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cc29c6f40f8da2961156b270a31207d60f2a64d5add39851adc8e4cdbdfb6865
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:720d8c4a339d1737a21e3c8d57c61ae88eff5ae34cb0926e95a862c09de588ae
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:11a0b09494af29131f04487f140bc9caae36d8f65b70237533a019202ce020ee
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:020fec583f7c330abeadff303ca5200f9718391437a0fd8b0e9fa1a51603aceb
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:dd387959a36fb3b1fbf7d49eaae41aa46d564d2f8980956e75d41158a37cae98
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3aa5c19366fdfd307bf68db9140a0dcc9c39674ee81fe7b9d42444c8306f5bd0
3
  size 1089994880
trainer_log.jsonl CHANGED
@@ -41,3 +41,13 @@
41
  {"current_steps": 41, "total_steps": 70, "loss": 0.5829, "lr": 8.756562953525151e-06, "epoch": 3.936, "percentage": 58.57, "elapsed_time": "1:22:13", "remaining_time": "0:58:09"}
42
  {"current_steps": 42, "total_steps": 70, "loss": 0.5896, "lr": 8.263518223330698e-06, "epoch": 4.032, "percentage": 60.0, "elapsed_time": "1:24:49", "remaining_time": "0:56:32"}
43
  {"current_steps": 43, "total_steps": 70, "loss": 0.566, "lr": 7.774790660436857e-06, "epoch": 4.128, "percentage": 61.43, "elapsed_time": "1:26:50", "remaining_time": "0:54:31"}
 
 
 
 
 
 
 
 
 
 
 
41
  {"current_steps": 41, "total_steps": 70, "loss": 0.5829, "lr": 8.756562953525151e-06, "epoch": 3.936, "percentage": 58.57, "elapsed_time": "1:22:13", "remaining_time": "0:58:09"}
42
  {"current_steps": 42, "total_steps": 70, "loss": 0.5896, "lr": 8.263518223330698e-06, "epoch": 4.032, "percentage": 60.0, "elapsed_time": "1:24:49", "remaining_time": "0:56:32"}
43
  {"current_steps": 43, "total_steps": 70, "loss": 0.566, "lr": 7.774790660436857e-06, "epoch": 4.128, "percentage": 61.43, "elapsed_time": "1:26:50", "remaining_time": "0:54:31"}
44
+ {"current_steps": 44, "total_steps": 70, "loss": 0.5505, "lr": 7.291595318569951e-06, "epoch": 4.224, "percentage": 62.86, "elapsed_time": "1:28:55", "remaining_time": "0:52:33"}
45
+ {"current_steps": 45, "total_steps": 70, "loss": 0.5462, "lr": 6.815133497483157e-06, "epoch": 4.32, "percentage": 64.29, "elapsed_time": "1:30:46", "remaining_time": "0:50:25"}
46
+ {"current_steps": 46, "total_steps": 70, "loss": 0.5732, "lr": 6.34658975633605e-06, "epoch": 4.416, "percentage": 65.71, "elapsed_time": "1:32:49", "remaining_time": "0:48:25"}
47
+ {"current_steps": 47, "total_steps": 70, "loss": 0.5436, "lr": 5.887128968693887e-06, "epoch": 4.5120000000000005, "percentage": 67.14, "elapsed_time": "1:34:38", "remaining_time": "0:46:18"}
48
+ {"current_steps": 48, "total_steps": 70, "loss": 0.5416, "lr": 5.43789342646837e-06, "epoch": 4.608, "percentage": 68.57, "elapsed_time": "1:36:29", "remaining_time": "0:44:13"}
49
+ {"current_steps": 49, "total_steps": 70, "loss": 0.5561, "lr": 5.000000000000003e-06, "epoch": 4.704, "percentage": 70.0, "elapsed_time": "1:38:29", "remaining_time": "0:42:12"}
50
+ {"current_steps": 50, "total_steps": 70, "loss": 0.5626, "lr": 4.5745373613424075e-06, "epoch": 4.8, "percentage": 71.43, "elapsed_time": "1:40:25", "remaining_time": "0:40:10"}
51
+ {"current_steps": 51, "total_steps": 70, "loss": 0.5426, "lr": 4.162563277652104e-06, "epoch": 4.896, "percentage": 72.86, "elapsed_time": "1:42:27", "remaining_time": "0:38:10"}
52
+ {"current_steps": 52, "total_steps": 70, "loss": 0.5493, "lr": 3.7651019814126656e-06, "epoch": 4.992, "percentage": 74.29, "elapsed_time": "1:44:18", "remaining_time": "0:36:06"}
53
+ {"current_steps": 53, "total_steps": 70, "loss": 0.5429, "lr": 3.3831416240314085e-06, "epoch": 5.088, "percentage": 75.71, "elapsed_time": "1:47:12", "remaining_time": "0:34:23"}