ryanmarten commited on
Commit
f79e86a
·
verified ·
1 Parent(s): cb02fcd

Training in progress, epoch 5

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:949d9cf7e79996d90f5b52e9f5a8ff9e89d7b5ddbb7500d35609d5aa1ef7df07
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:25a7d0c2077225adb5cc057046845dd38f7a0dd0215cca57aa2d9fdc1f5d596f
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:24bb98f203c12aa28300a8a65902c605db4fe59274a950b22e3388812b42be30
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fb7da0c816de21254323d6808f75751bce29dc81136a487d16ee8382d9c2fc3f
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d75fcf09d456fcc9f8305c70863a51ce9ef048f8894bd6b0c53a5b93b6359653
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6f4e3389cd3547ed0c64ee2ec58cbd9c443d3af3470584d67eb2090eea9c0dbf
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fd6be055368e57db28b37cd8524045cdc8edd1a378bb76d7c9fca55c82788579
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:073e5f4b6c7acb9a0454f30c9f043a28ffb076e328ce131419384554f6c4d844
3
  size 1089994880
trainer_log.jsonl CHANGED
@@ -51,3 +51,14 @@
51
  {"current_steps": 51, "total_steps": 70, "loss": 0.5119, "lr": 4.162563277652104e-06, "epoch": 4.896, "percentage": 72.86, "elapsed_time": "1:47:16", "remaining_time": "0:39:57"}
52
  {"current_steps": 52, "total_steps": 70, "loss": 0.5245, "lr": 3.7651019814126656e-06, "epoch": 4.992, "percentage": 74.29, "elapsed_time": "1:49:32", "remaining_time": "0:37:55"}
53
  {"current_steps": 53, "total_steps": 70, "loss": 0.5077, "lr": 3.3831416240314085e-06, "epoch": 5.088, "percentage": 75.71, "elapsed_time": "1:52:28", "remaining_time": "0:36:04"}
 
 
 
 
 
 
 
 
 
 
 
 
51
  {"current_steps": 51, "total_steps": 70, "loss": 0.5119, "lr": 4.162563277652104e-06, "epoch": 4.896, "percentage": 72.86, "elapsed_time": "1:47:16", "remaining_time": "0:39:57"}
52
  {"current_steps": 52, "total_steps": 70, "loss": 0.5245, "lr": 3.7651019814126656e-06, "epoch": 4.992, "percentage": 74.29, "elapsed_time": "1:49:32", "remaining_time": "0:37:55"}
53
  {"current_steps": 53, "total_steps": 70, "loss": 0.5077, "lr": 3.3831416240314085e-06, "epoch": 5.088, "percentage": 75.71, "elapsed_time": "1:52:28", "remaining_time": "0:36:04"}
54
+ {"current_steps": 54, "total_steps": 70, "loss": 0.5158, "lr": 3.017631819139273e-06, "epoch": 5.184, "percentage": 77.14, "elapsed_time": "1:54:33", "remaining_time": "0:33:56"}
55
+ {"current_steps": 55, "total_steps": 70, "loss": 0.4989, "lr": 2.669481281701739e-06, "epoch": 5.28, "percentage": 78.57, "elapsed_time": "1:56:35", "remaining_time": "0:31:47"}
56
+ {"current_steps": 56, "total_steps": 70, "loss": 0.4991, "lr": 2.339555568810221e-06, "epoch": 5.376, "percentage": 80.0, "elapsed_time": "1:58:42", "remaining_time": "0:29:40"}
57
+ {"current_steps": 57, "total_steps": 70, "loss": 0.483, "lr": 2.0286749277707783e-06, "epoch": 5.4719999999999995, "percentage": 81.43, "elapsed_time": "2:00:46", "remaining_time": "0:27:32"}
58
+ {"current_steps": 58, "total_steps": 70, "loss": 0.4838, "lr": 1.7376122568400533e-06, "epoch": 5.568, "percentage": 82.86, "elapsed_time": "2:02:51", "remaining_time": "0:25:25"}
59
+ {"current_steps": 59, "total_steps": 70, "loss": 0.506, "lr": 1.467091183678444e-06, "epoch": 5.664, "percentage": 84.29, "elapsed_time": "2:05:01", "remaining_time": "0:23:18"}
60
+ {"current_steps": 60, "total_steps": 70, "loss": 0.5098, "lr": 1.2177842662977136e-06, "epoch": 5.76, "percentage": 85.71, "elapsed_time": "2:07:00", "remaining_time": "0:21:10"}
61
+ {"current_steps": 61, "total_steps": 70, "loss": 0.5013, "lr": 9.903113209758098e-07, "epoch": 5.856, "percentage": 87.14, "elapsed_time": "2:09:04", "remaining_time": "0:19:02"}
62
+ {"current_steps": 62, "total_steps": 70, "loss": 0.5112, "lr": 7.852378812959227e-07, "epoch": 5.952, "percentage": 88.57, "elapsed_time": "2:11:09", "remaining_time": "0:16:55"}
63
+ {"current_steps": 63, "total_steps": 70, "loss": 0.5145, "lr": 6.030737921409169e-07, "epoch": 6.048, "percentage": 90.0, "elapsed_time": "2:14:18", "remaining_time": "0:14:55"}
64
+ {"current_steps": 64, "total_steps": 70, "loss": 0.4969, "lr": 4.4427194213859216e-07, "epoch": 6.144, "percentage": 91.43, "elapsed_time": "2:16:26", "remaining_time": "0:12:47"}