ryanmarten commited on
Commit
91e0a84
·
verified ·
1 Parent(s): 4bcf450

Training in progress, epoch 3

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:20972f7916d323f519debdcd18a13a25cbaab9dbfdc0e8a1275609e00f8db81d
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d70b121a0eb937170cfc964111f43adee543091b4a2d43e1c576fe450e1fb259
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2f14e559598ecaa66f2b7c3adeb3a07e3e2f2dba6394f5cbd8a4bba166a1c19e
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bd125d97c3549d694e66df1f70e982235ccf5c55b52a5bc7337704a694b731f9
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f9f47d16e3b683e9aefa00d3226451d847d5dfc4d75410be9c8da9987fae48c5
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7e55d06b03c16463554e9da8105e8b1879610c9c2afc1a87e64dd0776304b821
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:36b64bbadbdabeb2fb5750d1370a6e8e813fac90fe56c29f3feeff897238f1d4
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:33943d6f0805a238107807bd1e86fac95061afb8e5bf5eec1db7f94dcc0916c4
3
  size 1089994880
trainer_log.jsonl CHANGED
@@ -31,3 +31,13 @@
31
  {"current_steps": 31, "total_steps": 70, "loss": 0.6135, "lr": 1.3653410243663953e-05, "epoch": 2.976, "percentage": 44.29, "elapsed_time": "1:04:33", "remaining_time": "1:21:13"}
32
  {"current_steps": 32, "total_steps": 70, "loss": 0.5747, "lr": 1.3184866502516846e-05, "epoch": 3.072, "percentage": 45.71, "elapsed_time": "1:07:25", "remaining_time": "1:20:03"}
33
  {"current_steps": 33, "total_steps": 70, "loss": 0.5785, "lr": 1.2708404681430054e-05, "epoch": 3.168, "percentage": 47.14, "elapsed_time": "1:09:13", "remaining_time": "1:17:36"}
 
 
 
 
 
 
 
 
 
 
 
31
  {"current_steps": 31, "total_steps": 70, "loss": 0.6135, "lr": 1.3653410243663953e-05, "epoch": 2.976, "percentage": 44.29, "elapsed_time": "1:04:33", "remaining_time": "1:21:13"}
32
  {"current_steps": 32, "total_steps": 70, "loss": 0.5747, "lr": 1.3184866502516846e-05, "epoch": 3.072, "percentage": 45.71, "elapsed_time": "1:07:25", "remaining_time": "1:20:03"}
33
  {"current_steps": 33, "total_steps": 70, "loss": 0.5785, "lr": 1.2708404681430054e-05, "epoch": 3.168, "percentage": 47.14, "elapsed_time": "1:09:13", "remaining_time": "1:17:36"}
34
+ {"current_steps": 34, "total_steps": 70, "loss": 0.565, "lr": 1.2225209339563144e-05, "epoch": 3.2640000000000002, "percentage": 48.57, "elapsed_time": "1:11:17", "remaining_time": "1:15:29"}
35
+ {"current_steps": 35, "total_steps": 70, "loss": 0.5754, "lr": 1.1736481776669307e-05, "epoch": 3.36, "percentage": 50.0, "elapsed_time": "1:13:23", "remaining_time": "1:13:23"}
36
+ {"current_steps": 36, "total_steps": 70, "loss": 0.5689, "lr": 1.1243437046474854e-05, "epoch": 3.456, "percentage": 51.43, "elapsed_time": "1:15:25", "remaining_time": "1:11:13"}
37
+ {"current_steps": 37, "total_steps": 70, "loss": 0.5739, "lr": 1.0747300935864245e-05, "epoch": 3.552, "percentage": 52.86, "elapsed_time": "1:17:32", "remaining_time": "1:09:09"}
38
+ {"current_steps": 38, "total_steps": 70, "loss": 0.5675, "lr": 1.0249306917380731e-05, "epoch": 3.648, "percentage": 54.29, "elapsed_time": "1:19:33", "remaining_time": "1:06:59"}
39
+ {"current_steps": 39, "total_steps": 70, "loss": 0.5609, "lr": 9.750693082619274e-06, "epoch": 3.7439999999999998, "percentage": 55.71, "elapsed_time": "1:21:39", "remaining_time": "1:04:54"}
40
+ {"current_steps": 40, "total_steps": 70, "loss": 0.5667, "lr": 9.252699064135759e-06, "epoch": 3.84, "percentage": 57.14, "elapsed_time": "1:23:40", "remaining_time": "1:02:45"}
41
+ {"current_steps": 41, "total_steps": 70, "loss": 0.5535, "lr": 8.756562953525151e-06, "epoch": 3.936, "percentage": 58.57, "elapsed_time": "1:25:30", "remaining_time": "1:00:29"}
42
+ {"current_steps": 42, "total_steps": 70, "loss": 0.5497, "lr": 8.263518223330698e-06, "epoch": 4.032, "percentage": 60.0, "elapsed_time": "1:28:27", "remaining_time": "0:58:58"}
43
+ {"current_steps": 43, "total_steps": 70, "loss": 0.5144, "lr": 7.774790660436857e-06, "epoch": 4.128, "percentage": 61.43, "elapsed_time": "1:30:31", "remaining_time": "0:56:50"}