ryanmarten committed on
Commit
c627eb2
·
verified ·
1 Parent(s): 835a7b1

Training in progress, epoch 3

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6ae6632db935fe8767eb8f15a698cd68df7cbf076b23b1b7dea60b01b45d8d8d
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cadbfcc0fa7ef1669fc81c6a9f2334fccbcaae215dc91f4ae84ccf2016df6c30
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b31bc0fbdc7d6944483a7d48a6055e56bf60209382effd724e988e142fc10ee6
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:38342227bb61f2bca355e82543408867cf528b5c7f7d6d4288a6e35cee6e949a
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0d437bf016abeba62caeecc4dbb489eaf6eb0b5351401c57c98ba4f66725a191
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2eecc93b68a91434c719320c596d9faf17735d17c5d0481196190769ff40c579
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e43341690e9b9182f71892bbcd674ed499fcb7012f1328fae7c5abf1a231f30c
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:181c8ab17d508f2707592ad077b8a3f2f2feaeb72b78288fa7fd08bae4525c9c
3
  size 1089994880
trainer_log.jsonl CHANGED
@@ -31,3 +31,13 @@
31
  {"current_steps": 31, "total_steps": 70, "loss": 0.6252, "lr": 1.3653410243663953e-05, "epoch": 2.976, "percentage": 44.29, "elapsed_time": "1:03:16", "remaining_time": "1:19:36"}
32
  {"current_steps": 32, "total_steps": 70, "loss": 0.5995, "lr": 1.3184866502516846e-05, "epoch": 3.072, "percentage": 45.71, "elapsed_time": "1:05:58", "remaining_time": "1:18:20"}
33
  {"current_steps": 33, "total_steps": 70, "loss": 0.5774, "lr": 1.2708404681430054e-05, "epoch": 3.168, "percentage": 47.14, "elapsed_time": "1:08:05", "remaining_time": "1:16:20"}
 
 
 
 
 
 
 
 
 
 
 
31
  {"current_steps": 31, "total_steps": 70, "loss": 0.6252, "lr": 1.3653410243663953e-05, "epoch": 2.976, "percentage": 44.29, "elapsed_time": "1:03:16", "remaining_time": "1:19:36"}
32
  {"current_steps": 32, "total_steps": 70, "loss": 0.5995, "lr": 1.3184866502516846e-05, "epoch": 3.072, "percentage": 45.71, "elapsed_time": "1:05:58", "remaining_time": "1:18:20"}
33
  {"current_steps": 33, "total_steps": 70, "loss": 0.5774, "lr": 1.2708404681430054e-05, "epoch": 3.168, "percentage": 47.14, "elapsed_time": "1:08:05", "remaining_time": "1:16:20"}
34
+ {"current_steps": 34, "total_steps": 70, "loss": 0.5783, "lr": 1.2225209339563144e-05, "epoch": 3.2640000000000002, "percentage": 48.57, "elapsed_time": "1:09:51", "remaining_time": "1:13:58"}
35
+ {"current_steps": 35, "total_steps": 70, "loss": 0.5801, "lr": 1.1736481776669307e-05, "epoch": 3.36, "percentage": 50.0, "elapsed_time": "1:11:43", "remaining_time": "1:11:43"}
36
+ {"current_steps": 36, "total_steps": 70, "loss": 0.585, "lr": 1.1243437046474854e-05, "epoch": 3.456, "percentage": 51.43, "elapsed_time": "1:13:52", "remaining_time": "1:09:46"}
37
+ {"current_steps": 37, "total_steps": 70, "loss": 0.5745, "lr": 1.0747300935864245e-05, "epoch": 3.552, "percentage": 52.86, "elapsed_time": "1:16:00", "remaining_time": "1:07:47"}
38
+ {"current_steps": 38, "total_steps": 70, "loss": 0.5644, "lr": 1.0249306917380731e-05, "epoch": 3.648, "percentage": 54.29, "elapsed_time": "1:17:53", "remaining_time": "1:05:35"}
39
+ {"current_steps": 39, "total_steps": 70, "loss": 0.5688, "lr": 9.750693082619274e-06, "epoch": 3.7439999999999998, "percentage": 55.71, "elapsed_time": "1:19:53", "remaining_time": "1:03:29"}
40
+ {"current_steps": 40, "total_steps": 70, "loss": 0.5636, "lr": 9.252699064135759e-06, "epoch": 3.84, "percentage": 57.14, "elapsed_time": "1:21:55", "remaining_time": "1:01:26"}
41
+ {"current_steps": 41, "total_steps": 70, "loss": 0.567, "lr": 8.756562953525151e-06, "epoch": 3.936, "percentage": 58.57, "elapsed_time": "1:23:47", "remaining_time": "0:59:16"}
42
+ {"current_steps": 42, "total_steps": 70, "loss": 0.5496, "lr": 8.263518223330698e-06, "epoch": 4.032, "percentage": 60.0, "elapsed_time": "1:26:33", "remaining_time": "0:57:42"}
43
+ {"current_steps": 43, "total_steps": 70, "loss": 0.533, "lr": 7.774790660436857e-06, "epoch": 4.128, "percentage": 61.43, "elapsed_time": "1:28:25", "remaining_time": "0:55:31"}