neginr commited on
Commit
9f77091
·
verified ·
1 Parent(s): 976a5cb

Training in progress, epoch 5

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:748fb8e18c9eb3466ac8e2a215cfa9b8c75363f0a655432f13d4db405fe48226
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:101202fd2623dccecabf0eac53603f73fa7fba94b4ab4709eafb42825f039d77
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ba22200b9025cda6c429c9d2b0fd48af8af32c243dd912761119496420827c9d
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:82e2db3b121ce681f010dd9c244dffff81b202f4f3bf4d6431c42bd3fd3633a6
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1ba71828ef53dfdcb232de03f24e4ca9f0c2472bdc03c0a3c8168ecb6f4319e4
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4ebd48b340b336fe9b332ea2e8ce13cf64bfc4cfb686e6483ba38f2d732aef49
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:55a74cb2eb5890f100725ed2fb35e323909818e0de9355f9fe6208c969951fbe
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e45839859321d1c0143cf94255368effcdc83b18daafecea437a6daf17078987
3
  size 1089994880
trainer_log.jsonl CHANGED
@@ -60,3 +60,11 @@
60
  {"current_steps": 60, "total_steps": 70, "loss": 0.2433, "lr": 1.2177842662977136e-06, "epoch": 5.78125, "percentage": 85.71, "elapsed_time": "0:21:24", "remaining_time": "0:03:34"}
61
  {"current_steps": 61, "total_steps": 70, "loss": 0.2232, "lr": 9.903113209758098e-07, "epoch": 5.875, "percentage": 87.14, "elapsed_time": "0:21:38", "remaining_time": "0:03:11"}
62
  {"current_steps": 62, "total_steps": 70, "loss": 0.1921, "lr": 7.852378812959227e-07, "epoch": 5.96875, "percentage": 88.57, "elapsed_time": "0:21:51", "remaining_time": "0:02:49"}
 
 
 
 
 
 
 
 
 
60
  {"current_steps": 60, "total_steps": 70, "loss": 0.2433, "lr": 1.2177842662977136e-06, "epoch": 5.78125, "percentage": 85.71, "elapsed_time": "0:21:24", "remaining_time": "0:03:34"}
61
  {"current_steps": 61, "total_steps": 70, "loss": 0.2232, "lr": 9.903113209758098e-07, "epoch": 5.875, "percentage": 87.14, "elapsed_time": "0:21:38", "remaining_time": "0:03:11"}
62
  {"current_steps": 62, "total_steps": 70, "loss": 0.1921, "lr": 7.852378812959227e-07, "epoch": 5.96875, "percentage": 88.57, "elapsed_time": "0:21:51", "remaining_time": "0:02:49"}
63
+ {"current_steps": 63, "total_steps": 70, "loss": 0.2026, "lr": 6.030737921409169e-07, "epoch": 6.09375, "percentage": 90.0, "elapsed_time": "0:23:47", "remaining_time": "0:02:38"}
64
+ {"current_steps": 64, "total_steps": 70, "loss": 0.1918, "lr": 4.4427194213859216e-07, "epoch": 6.1875, "percentage": 91.43, "elapsed_time": "0:23:57", "remaining_time": "0:02:14"}
65
+ {"current_steps": 65, "total_steps": 70, "loss": 0.2292, "lr": 3.0922713770922155e-07, "epoch": 6.28125, "percentage": 92.86, "elapsed_time": "0:24:09", "remaining_time": "0:01:51"}
66
+ {"current_steps": 66, "total_steps": 70, "loss": 0.2002, "lr": 1.9827512151456175e-07, "epoch": 6.375, "percentage": 94.29, "elapsed_time": "0:24:23", "remaining_time": "0:01:28"}
67
+ {"current_steps": 67, "total_steps": 70, "loss": 0.2056, "lr": 1.1169173774871478e-07, "epoch": 6.46875, "percentage": 95.71, "elapsed_time": "0:24:37", "remaining_time": "0:01:06"}
68
+ {"current_steps": 68, "total_steps": 70, "loss": 0.2116, "lr": 4.9692246345985905e-08, "epoch": 6.5625, "percentage": 97.14, "elapsed_time": "0:24:51", "remaining_time": "0:00:43"}
69
+ {"current_steps": 69, "total_steps": 70, "loss": 0.2591, "lr": 1.2430787810776556e-08, "epoch": 6.65625, "percentage": 98.57, "elapsed_time": "0:25:07", "remaining_time": "0:00:21"}
70
+ {"current_steps": 70, "total_steps": 70, "loss": 0.2233, "lr": 0.0, "epoch": 6.75, "percentage": 100.0, "elapsed_time": "0:25:19", "remaining_time": "0:00:00"}