sedrickkeh commited on
Commit
4bfa968
·
verified ·
1 Parent(s): 21c2a8f

Training in progress, epoch 5

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1bdd15f99c20bc14223ed7a4a6bfee8b874fd7c7a9875181df65c36bfe07aa59
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a7db0cac043442389744da06e52d70fc630b687e1a390a93f5f754e82a3890d6
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:361a46af8fd1ecffd9a394d819193a95bdf72611d80f07a81a928c371af0f6c0
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fff090bbff3efe80ffca5c94f698605ed9cfadc2342c58a091adadbaa7709762
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b667f897c30d9218cb943558233071f7e495b967e09e9982869ed5cdc718477f
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:26a29a7d367cb3498645db206d38deae04cf2870e2a2a52e657c0e45d4a5033e
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b7353e2b52fcc29959444c93e2908a9dd7a8a7b9c7cbf6898ec52e072f0fe7c5
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1a15e2979298cecddd1ac2c286fdfd3edef589a566d25e6a43bca4b91af7966d
3
  size 1089994880
trainer_log.jsonl CHANGED
@@ -54,3 +54,18 @@
54
  {"current_steps": 54, "total_steps": 70, "loss": 0.2236, "lr": 3.017631819139273e-06, "epoch": 5.184, "percentage": 77.14, "elapsed_time": "0:40:29", "remaining_time": "0:11:59"}
55
  {"current_steps": 55, "total_steps": 70, "loss": 0.2247, "lr": 2.669481281701739e-06, "epoch": 5.28, "percentage": 78.57, "elapsed_time": "0:41:07", "remaining_time": "0:11:12"}
56
  {"current_steps": 56, "total_steps": 70, "loss": 0.252, "lr": 2.339555568810221e-06, "epoch": 5.376, "percentage": 80.0, "elapsed_time": "0:41:49", "remaining_time": "0:10:27"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
54
  {"current_steps": 54, "total_steps": 70, "loss": 0.2236, "lr": 3.017631819139273e-06, "epoch": 5.184, "percentage": 77.14, "elapsed_time": "0:40:29", "remaining_time": "0:11:59"}
55
  {"current_steps": 55, "total_steps": 70, "loss": 0.2247, "lr": 2.669481281701739e-06, "epoch": 5.28, "percentage": 78.57, "elapsed_time": "0:41:07", "remaining_time": "0:11:12"}
56
  {"current_steps": 56, "total_steps": 70, "loss": 0.252, "lr": 2.339555568810221e-06, "epoch": 5.376, "percentage": 80.0, "elapsed_time": "0:41:49", "remaining_time": "0:10:27"}
57
+ {"current_steps": 57, "total_steps": 70, "loss": 0.19, "lr": 2.0286749277707783e-06, "epoch": 5.4719999999999995, "percentage": 81.43, "elapsed_time": "0:42:24", "remaining_time": "0:09:40"}
58
+ {"current_steps": 58, "total_steps": 70, "loss": 0.2247, "lr": 1.7376122568400533e-06, "epoch": 5.568, "percentage": 82.86, "elapsed_time": "0:43:05", "remaining_time": "0:08:55"}
59
+ {"current_steps": 59, "total_steps": 70, "loss": 0.2364, "lr": 1.467091183678444e-06, "epoch": 5.664, "percentage": 84.29, "elapsed_time": "0:43:51", "remaining_time": "0:08:10"}
60
+ {"current_steps": 60, "total_steps": 70, "loss": 0.2307, "lr": 1.2177842662977136e-06, "epoch": 5.76, "percentage": 85.71, "elapsed_time": "0:44:34", "remaining_time": "0:07:25"}
61
+ {"current_steps": 61, "total_steps": 70, "loss": 0.2486, "lr": 9.903113209758098e-07, "epoch": 5.856, "percentage": 87.14, "elapsed_time": "0:45:10", "remaining_time": "0:06:39"}
62
+ {"current_steps": 62, "total_steps": 70, "loss": 0.2418, "lr": 7.852378812959227e-07, "epoch": 5.952, "percentage": 88.57, "elapsed_time": "0:45:47", "remaining_time": "0:05:54"}
63
+ {"current_steps": 63, "total_steps": 70, "loss": 0.1956, "lr": 6.030737921409169e-07, "epoch": 6.048, "percentage": 90.0, "elapsed_time": "0:47:25", "remaining_time": "0:05:16"}
64
+ {"current_steps": 64, "total_steps": 70, "loss": 0.221, "lr": 4.4427194213859216e-07, "epoch": 6.144, "percentage": 91.43, "elapsed_time": "0:48:21", "remaining_time": "0:04:31"}
65
+ {"current_steps": 65, "total_steps": 70, "loss": 0.189, "lr": 3.0922713770922155e-07, "epoch": 6.24, "percentage": 92.86, "elapsed_time": "0:49:01", "remaining_time": "0:03:46"}
66
+ {"current_steps": 66, "total_steps": 70, "loss": 0.2004, "lr": 1.9827512151456175e-07, "epoch": 6.336, "percentage": 94.29, "elapsed_time": "0:49:33", "remaining_time": "0:03:00"}
67
+ {"current_steps": 67, "total_steps": 70, "loss": 0.2495, "lr": 1.1169173774871478e-07, "epoch": 6.432, "percentage": 95.71, "elapsed_time": "0:50:12", "remaining_time": "0:02:14"}
68
+ {"current_steps": 68, "total_steps": 70, "loss": 0.2204, "lr": 4.9692246345985905e-08, "epoch": 6.5280000000000005, "percentage": 97.14, "elapsed_time": "0:50:50", "remaining_time": "0:01:29"}
69
+ {"current_steps": 69, "total_steps": 70, "loss": 0.2364, "lr": 1.2430787810776556e-08, "epoch": 6.624, "percentage": 98.57, "elapsed_time": "0:51:29", "remaining_time": "0:00:44"}
70
+ {"current_steps": 70, "total_steps": 70, "loss": 0.2309, "lr": 0.0, "epoch": 6.72, "percentage": 100.0, "elapsed_time": "0:52:17", "remaining_time": "0:00:00"}
71
+ {"current_steps": 70, "total_steps": 70, "epoch": 6.72, "percentage": 100.0, "elapsed_time": "0:54:14", "remaining_time": "0:00:00"}