neginr committed on
Commit
976a5cb
·
verified ·
1 Parent(s): 9002bc8

Training in progress, epoch 4

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0eac6bfb604f6172853f0207a3b5962b95e1f26276091ace82293083ae54346c
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:748fb8e18c9eb3466ac8e2a215cfa9b8c75363f0a655432f13d4db405fe48226
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2d653c697314c16f6969a10433252def909160dbcd5fbe63b42aa5d675f695e7
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ba22200b9025cda6c429c9d2b0fd48af8af32c243dd912761119496420827c9d
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5931281c9bdc2ca6c9ec5d4d748a27ab94f74be464f16971d05e0330a9c1e21b
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1ba71828ef53dfdcb232de03f24e4ca9f0c2472bdc03c0a3c8168ecb6f4319e4
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:37c270bcdc52d332fe69a8ce911dbe808043c7e05dd0dc9e21ed7dbfbacb5fb5
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:55a74cb2eb5890f100725ed2fb35e323909818e0de9355f9fe6208c969951fbe
3
  size 1089994880
trainer_log.jsonl CHANGED
@@ -49,3 +49,14 @@
49
  {"current_steps": 49, "total_steps": 70, "loss": 0.2338, "lr": 5.000000000000003e-06, "epoch": 4.71875, "percentage": 70.0, "elapsed_time": "0:17:33", "remaining_time": "0:07:31"}
50
  {"current_steps": 50, "total_steps": 70, "loss": 0.2713, "lr": 4.5745373613424075e-06, "epoch": 4.8125, "percentage": 71.43, "elapsed_time": "0:17:47", "remaining_time": "0:07:07"}
51
  {"current_steps": 51, "total_steps": 70, "loss": 0.2671, "lr": 4.162563277652104e-06, "epoch": 4.90625, "percentage": 72.86, "elapsed_time": "0:18:00", "remaining_time": "0:06:42"}
 
 
 
 
 
 
 
 
 
 
 
 
49
  {"current_steps": 49, "total_steps": 70, "loss": 0.2338, "lr": 5.000000000000003e-06, "epoch": 4.71875, "percentage": 70.0, "elapsed_time": "0:17:33", "remaining_time": "0:07:31"}
50
  {"current_steps": 50, "total_steps": 70, "loss": 0.2713, "lr": 4.5745373613424075e-06, "epoch": 4.8125, "percentage": 71.43, "elapsed_time": "0:17:47", "remaining_time": "0:07:07"}
51
  {"current_steps": 51, "total_steps": 70, "loss": 0.2671, "lr": 4.162563277652104e-06, "epoch": 4.90625, "percentage": 72.86, "elapsed_time": "0:18:00", "remaining_time": "0:06:42"}
52
+ {"current_steps": 52, "total_steps": 70, "loss": 0.2578, "lr": 3.7651019814126656e-06, "epoch": 5.03125, "percentage": 74.29, "elapsed_time": "0:19:49", "remaining_time": "0:06:51"}
53
+ {"current_steps": 53, "total_steps": 70, "loss": 0.2494, "lr": 3.3831416240314085e-06, "epoch": 5.125, "percentage": 75.71, "elapsed_time": "0:20:02", "remaining_time": "0:06:25"}
54
+ {"current_steps": 54, "total_steps": 70, "loss": 0.201, "lr": 3.017631819139273e-06, "epoch": 5.21875, "percentage": 77.14, "elapsed_time": "0:20:13", "remaining_time": "0:05:59"}
55
+ {"current_steps": 55, "total_steps": 70, "loss": 0.2311, "lr": 2.669481281701739e-06, "epoch": 5.3125, "percentage": 78.57, "elapsed_time": "0:20:27", "remaining_time": "0:05:34"}
56
+ {"current_steps": 56, "total_steps": 70, "loss": 0.2233, "lr": 2.339555568810221e-06, "epoch": 5.40625, "percentage": 80.0, "elapsed_time": "0:20:37", "remaining_time": "0:05:09"}
57
+ {"current_steps": 57, "total_steps": 70, "loss": 0.2184, "lr": 2.0286749277707783e-06, "epoch": 5.5, "percentage": 81.43, "elapsed_time": "0:20:48", "remaining_time": "0:04:44"}
58
+ {"current_steps": 58, "total_steps": 70, "loss": 0.2361, "lr": 1.7376122568400533e-06, "epoch": 5.59375, "percentage": 82.86, "elapsed_time": "0:21:04", "remaining_time": "0:04:21"}
59
+ {"current_steps": 59, "total_steps": 70, "loss": 0.195, "lr": 1.467091183678444e-06, "epoch": 5.6875, "percentage": 84.29, "elapsed_time": "0:21:12", "remaining_time": "0:03:57"}
60
+ {"current_steps": 60, "total_steps": 70, "loss": 0.2433, "lr": 1.2177842662977136e-06, "epoch": 5.78125, "percentage": 85.71, "elapsed_time": "0:21:24", "remaining_time": "0:03:34"}
61
+ {"current_steps": 61, "total_steps": 70, "loss": 0.2232, "lr": 9.903113209758098e-07, "epoch": 5.875, "percentage": 87.14, "elapsed_time": "0:21:38", "remaining_time": "0:03:11"}
62
+ {"current_steps": 62, "total_steps": 70, "loss": 0.1921, "lr": 7.852378812959227e-07, "epoch": 5.96875, "percentage": 88.57, "elapsed_time": "0:21:51", "remaining_time": "0:02:49"}