ryanmarten commited on
Commit
5b736f2
·
verified ·
1 Parent(s): 04139b8

Training in progress, epoch 4

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:954196a2a0a50afc118624a587018516a3e4f0895c6a41624955620be132dde9
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fe5cfff7d6140bb9ec412965f039a2eea97e54188705fbc5406d00a3d86ecaeb
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e7a189b8dc6b755acdaa17e6163a90b8102b2d6aa02d8ce782e4f469cf23edf2
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c2da981f4e4fef122748875f0a245cd1b0b620e3298f0434475fd4ef21ceaf38
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b0e7a44d4dd0117524af0bc86f2f3b07a12f4bb2eefa7f7e9099c7aa500f5067
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d0076e3712fef0ae54a12996f004227c678e0b7320ad6b39b970b1f627255910
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f106f5e1e7662b6b22c334e9b0e5dac731ebe816fce6dd5f4fc1179ce63dde7d
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ac382c76378925faee748660e984f946b6d56e1af320f4a8254d368715494df2
3
  size 1089994880
trainer_log.jsonl CHANGED
@@ -41,3 +41,13 @@
41
  {"current_steps": 41, "total_steps": 70, "loss": 0.5422, "lr": 8.756562953525151e-06, "epoch": 3.936, "percentage": 58.57, "elapsed_time": "1:23:37", "remaining_time": "0:59:08"}
42
  {"current_steps": 42, "total_steps": 70, "loss": 0.5152, "lr": 8.263518223330698e-06, "epoch": 4.032, "percentage": 60.0, "elapsed_time": "1:26:20", "remaining_time": "0:57:33"}
43
  {"current_steps": 43, "total_steps": 70, "loss": 0.4965, "lr": 7.774790660436857e-06, "epoch": 4.128, "percentage": 61.43, "elapsed_time": "1:28:14", "remaining_time": "0:55:24"}
 
 
 
 
 
 
 
 
 
 
 
41
  {"current_steps": 41, "total_steps": 70, "loss": 0.5422, "lr": 8.756562953525151e-06, "epoch": 3.936, "percentage": 58.57, "elapsed_time": "1:23:37", "remaining_time": "0:59:08"}
42
  {"current_steps": 42, "total_steps": 70, "loss": 0.5152, "lr": 8.263518223330698e-06, "epoch": 4.032, "percentage": 60.0, "elapsed_time": "1:26:20", "remaining_time": "0:57:33"}
43
  {"current_steps": 43, "total_steps": 70, "loss": 0.4965, "lr": 7.774790660436857e-06, "epoch": 4.128, "percentage": 61.43, "elapsed_time": "1:28:14", "remaining_time": "0:55:24"}
44
+ {"current_steps": 44, "total_steps": 70, "loss": 0.518, "lr": 7.291595318569951e-06, "epoch": 4.224, "percentage": 62.86, "elapsed_time": "1:30:09", "remaining_time": "0:53:16"}
45
+ {"current_steps": 45, "total_steps": 70, "loss": 0.5208, "lr": 6.815133497483157e-06, "epoch": 4.32, "percentage": 64.29, "elapsed_time": "1:32:07", "remaining_time": "0:51:10"}
46
+ {"current_steps": 46, "total_steps": 70, "loss": 0.5122, "lr": 6.34658975633605e-06, "epoch": 4.416, "percentage": 65.71, "elapsed_time": "1:34:04", "remaining_time": "0:49:04"}
47
+ {"current_steps": 47, "total_steps": 70, "loss": 0.501, "lr": 5.887128968693887e-06, "epoch": 4.5120000000000005, "percentage": 67.14, "elapsed_time": "1:36:04", "remaining_time": "0:47:00"}
48
+ {"current_steps": 48, "total_steps": 70, "loss": 0.5113, "lr": 5.43789342646837e-06, "epoch": 4.608, "percentage": 68.57, "elapsed_time": "1:38:08", "remaining_time": "0:44:58"}
49
+ {"current_steps": 49, "total_steps": 70, "loss": 0.4793, "lr": 5.000000000000003e-06, "epoch": 4.704, "percentage": 70.0, "elapsed_time": "1:39:55", "remaining_time": "0:42:49"}
50
+ {"current_steps": 50, "total_steps": 70, "loss": 0.5072, "lr": 4.5745373613424075e-06, "epoch": 4.8, "percentage": 71.43, "elapsed_time": "1:41:55", "remaining_time": "0:40:46"}
51
+ {"current_steps": 51, "total_steps": 70, "loss": 0.5148, "lr": 4.162563277652104e-06, "epoch": 4.896, "percentage": 72.86, "elapsed_time": "1:43:54", "remaining_time": "0:38:42"}
52
+ {"current_steps": 52, "total_steps": 70, "loss": 0.4826, "lr": 3.7651019814126656e-06, "epoch": 4.992, "percentage": 74.29, "elapsed_time": "1:45:53", "remaining_time": "0:36:39"}
53
+ {"current_steps": 53, "total_steps": 70, "loss": 0.4708, "lr": 3.3831416240314085e-06, "epoch": 5.088, "percentage": 75.71, "elapsed_time": "1:48:35", "remaining_time": "0:34:49"}