ryanmarten commited on
Commit
6eda536
·
verified ·
1 Parent(s): 7f96945

Training in progress, epoch 5

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:86395ccac12d91be1217fc92e4bbeafe489e02b1c8d56f1df7f3ffd6274e9446
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8904e0773149459095052996bb3f6c0023f12d46eddda9210b8404a71cdd1fab
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:30d3a62d305c7359a21fe8a3cd443f99e7c490e7fe6822c7f0e25e3a630bc0b1
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2b08969f0b904d4389f993a0f29f2f68e358fb0b867c910a00cf12ecc54e840c
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:46d2aed2fc6eac172904620e2b96cb866e3fd1035763f599ad46ca386c889838
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d951bcb437acfdff8612c6746f4d2983f9d5ffed2c9bc1a65f4a51834163a3b1
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7a20cf702199306ceec6fa02cc80014f3fb460b24bc38e607b7549b7f14f12d6
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ce3963831a52b408ed73f84f6a98811d9a4f2e6c5d80489b5fad5b9ba72febdc
3
  size 1089994880
trainer_log.jsonl CHANGED
@@ -51,3 +51,14 @@
51
  {"current_steps": 51, "total_steps": 70, "loss": 0.5474, "lr": 4.162563277652104e-06, "epoch": 4.896, "percentage": 72.86, "elapsed_time": "1:27:01", "remaining_time": "0:32:25"}
52
  {"current_steps": 52, "total_steps": 70, "loss": 0.5191, "lr": 3.7651019814126656e-06, "epoch": 4.992, "percentage": 74.29, "elapsed_time": "1:28:33", "remaining_time": "0:30:39"}
53
  {"current_steps": 53, "total_steps": 70, "loss": 0.4818, "lr": 3.3831416240314085e-06, "epoch": 5.088, "percentage": 75.71, "elapsed_time": "1:31:14", "remaining_time": "0:29:15"}
 
 
 
 
 
 
 
 
 
 
 
 
51
  {"current_steps": 51, "total_steps": 70, "loss": 0.5474, "lr": 4.162563277652104e-06, "epoch": 4.896, "percentage": 72.86, "elapsed_time": "1:27:01", "remaining_time": "0:32:25"}
52
  {"current_steps": 52, "total_steps": 70, "loss": 0.5191, "lr": 3.7651019814126656e-06, "epoch": 4.992, "percentage": 74.29, "elapsed_time": "1:28:33", "remaining_time": "0:30:39"}
53
  {"current_steps": 53, "total_steps": 70, "loss": 0.4818, "lr": 3.3831416240314085e-06, "epoch": 5.088, "percentage": 75.71, "elapsed_time": "1:31:14", "remaining_time": "0:29:15"}
54
+ {"current_steps": 54, "total_steps": 70, "loss": 0.474, "lr": 3.017631819139273e-06, "epoch": 5.184, "percentage": 77.14, "elapsed_time": "1:33:06", "remaining_time": "0:27:35"}
55
+ {"current_steps": 55, "total_steps": 70, "loss": 0.4917, "lr": 2.669481281701739e-06, "epoch": 5.28, "percentage": 78.57, "elapsed_time": "1:34:43", "remaining_time": "0:25:49"}
56
+ {"current_steps": 56, "total_steps": 70, "loss": 0.4908, "lr": 2.339555568810221e-06, "epoch": 5.376, "percentage": 80.0, "elapsed_time": "1:36:16", "remaining_time": "0:24:04"}
57
+ {"current_steps": 57, "total_steps": 70, "loss": 0.4724, "lr": 2.0286749277707783e-06, "epoch": 5.4719999999999995, "percentage": 81.43, "elapsed_time": "1:37:49", "remaining_time": "0:22:18"}
58
+ {"current_steps": 58, "total_steps": 70, "loss": 0.4812, "lr": 1.7376122568400533e-06, "epoch": 5.568, "percentage": 82.86, "elapsed_time": "1:39:28", "remaining_time": "0:20:34"}
59
+ {"current_steps": 59, "total_steps": 70, "loss": 0.4915, "lr": 1.467091183678444e-06, "epoch": 5.664, "percentage": 84.29, "elapsed_time": "1:41:00", "remaining_time": "0:18:50"}
60
+ {"current_steps": 60, "total_steps": 70, "loss": 0.4941, "lr": 1.2177842662977136e-06, "epoch": 5.76, "percentage": 85.71, "elapsed_time": "1:42:32", "remaining_time": "0:17:05"}
61
+ {"current_steps": 61, "total_steps": 70, "loss": 0.4871, "lr": 9.903113209758098e-07, "epoch": 5.856, "percentage": 87.14, "elapsed_time": "1:44:14", "remaining_time": "0:15:22"}
62
+ {"current_steps": 62, "total_steps": 70, "loss": 0.5032, "lr": 7.852378812959227e-07, "epoch": 5.952, "percentage": 88.57, "elapsed_time": "1:45:57", "remaining_time": "0:13:40"}
63
+ {"current_steps": 63, "total_steps": 70, "loss": 0.4605, "lr": 6.030737921409169e-07, "epoch": 6.048, "percentage": 90.0, "elapsed_time": "1:48:43", "remaining_time": "0:12:04"}
64
+ {"current_steps": 64, "total_steps": 70, "loss": 0.4592, "lr": 4.4427194213859216e-07, "epoch": 6.144, "percentage": 91.43, "elapsed_time": "1:50:22", "remaining_time": "0:10:20"}