ryanmarten commited on
Commit
5837291
·
verified ·
1 Parent(s): d2834d3

Training in progress, epoch 5

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f127dceba02fc9b07c228a91118a42004b54d375b110ea448c150d1f3ca0416e
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:25503382cea45f620a71361f641d0b6221bce359e7ef529e9522ab22cdf76bed
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:720d8c4a339d1737a21e3c8d57c61ae88eff5ae34cb0926e95a862c09de588ae
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6c5f363b885171c8f6abf919b402ee610d67a13dd62f9a5631ee8b7362a20220
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:020fec583f7c330abeadff303ca5200f9718391437a0fd8b0e9fa1a51603aceb
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:91d019c95c378c334aafa59771b0bc80378361ab06928e93cb67d42916c033e3
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3aa5c19366fdfd307bf68db9140a0dcc9c39674ee81fe7b9d42444c8306f5bd0
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0015960da2c8715c2f48fc31200e73cad7933f9668c73628ce9fbf2ad05d3856
3
  size 1089994880
trainer_log.jsonl CHANGED
@@ -51,3 +51,14 @@
51
  {"current_steps": 51, "total_steps": 70, "loss": 0.5426, "lr": 4.162563277652104e-06, "epoch": 4.896, "percentage": 72.86, "elapsed_time": "1:42:27", "remaining_time": "0:38:10"}
52
  {"current_steps": 52, "total_steps": 70, "loss": 0.5493, "lr": 3.7651019814126656e-06, "epoch": 4.992, "percentage": 74.29, "elapsed_time": "1:44:18", "remaining_time": "0:36:06"}
53
  {"current_steps": 53, "total_steps": 70, "loss": 0.5429, "lr": 3.3831416240314085e-06, "epoch": 5.088, "percentage": 75.71, "elapsed_time": "1:47:12", "remaining_time": "0:34:23"}
 
 
 
 
 
 
 
 
 
 
 
 
51
  {"current_steps": 51, "total_steps": 70, "loss": 0.5426, "lr": 4.162563277652104e-06, "epoch": 4.896, "percentage": 72.86, "elapsed_time": "1:42:27", "remaining_time": "0:38:10"}
52
  {"current_steps": 52, "total_steps": 70, "loss": 0.5493, "lr": 3.7651019814126656e-06, "epoch": 4.992, "percentage": 74.29, "elapsed_time": "1:44:18", "remaining_time": "0:36:06"}
53
  {"current_steps": 53, "total_steps": 70, "loss": 0.5429, "lr": 3.3831416240314085e-06, "epoch": 5.088, "percentage": 75.71, "elapsed_time": "1:47:12", "remaining_time": "0:34:23"}
54
+ {"current_steps": 54, "total_steps": 70, "loss": 0.5462, "lr": 3.017631819139273e-06, "epoch": 5.184, "percentage": 77.14, "elapsed_time": "1:49:16", "remaining_time": "0:32:22"}
55
+ {"current_steps": 55, "total_steps": 70, "loss": 0.5179, "lr": 2.669481281701739e-06, "epoch": 5.28, "percentage": 78.57, "elapsed_time": "1:50:57", "remaining_time": "0:30:15"}
56
+ {"current_steps": 56, "total_steps": 70, "loss": 0.5296, "lr": 2.339555568810221e-06, "epoch": 5.376, "percentage": 80.0, "elapsed_time": "1:52:50", "remaining_time": "0:28:12"}
57
+ {"current_steps": 57, "total_steps": 70, "loss": 0.5381, "lr": 2.0286749277707783e-06, "epoch": 5.4719999999999995, "percentage": 81.43, "elapsed_time": "1:54:48", "remaining_time": "0:26:11"}
58
+ {"current_steps": 58, "total_steps": 70, "loss": 0.5507, "lr": 1.7376122568400533e-06, "epoch": 5.568, "percentage": 82.86, "elapsed_time": "1:56:58", "remaining_time": "0:24:12"}
59
+ {"current_steps": 59, "total_steps": 70, "loss": 0.539, "lr": 1.467091183678444e-06, "epoch": 5.664, "percentage": 84.29, "elapsed_time": "1:58:50", "remaining_time": "0:22:09"}
60
+ {"current_steps": 60, "total_steps": 70, "loss": 0.5313, "lr": 1.2177842662977136e-06, "epoch": 5.76, "percentage": 85.71, "elapsed_time": "2:00:43", "remaining_time": "0:20:07"}
61
+ {"current_steps": 61, "total_steps": 70, "loss": 0.5175, "lr": 9.903113209758098e-07, "epoch": 5.856, "percentage": 87.14, "elapsed_time": "2:02:31", "remaining_time": "0:18:04"}
62
+ {"current_steps": 62, "total_steps": 70, "loss": 0.5251, "lr": 7.852378812959227e-07, "epoch": 5.952, "percentage": 88.57, "elapsed_time": "2:04:31", "remaining_time": "0:16:04"}
63
+ {"current_steps": 63, "total_steps": 70, "loss": 0.5123, "lr": 6.030737921409169e-07, "epoch": 6.048, "percentage": 90.0, "elapsed_time": "2:07:11", "remaining_time": "0:14:07"}
64
+ {"current_steps": 64, "total_steps": 70, "loss": 0.5244, "lr": 4.4427194213859216e-07, "epoch": 6.144, "percentage": 91.43, "elapsed_time": "2:09:07", "remaining_time": "0:12:06"}