ryanmarten commited on
Commit
9b80097
·
verified ·
1 Parent(s): d08590a

Training in progress, epoch 4

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:74192fc22fb46722ab7f8796184e3c5896a9afd255a58520d1dc1db7f131a9e8
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0463ac2b7163a01784fb49770384a6bdd1900c52ecedc6b79f6d2606004de1d5
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:73a2472295dd4e354a73b4c854ec89653815dd622dbb7091390344b2b8a85f1e
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:02e76c0e838b95cb043cb0dbf106c4ed895ccbe6ab24ec33bf497d2b8a3cc168
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:691bd5fc6471ad7872f22d2e27d797d8a2a548e8d12a21f0b6d90feba6aed88c
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f95c9ea06320a6c7f01032580819b89b9df888b5cdeb89fa10952350c6f7d565
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6b2e63815655c7fea442cbddc62f4b271713633ab95750c06dbe976789b19061
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0e6381847e761967d2db633b619266073da5c097010c0e9aed8762d9f01e04da
3
  size 1089994880
trainer_log.jsonl CHANGED
@@ -41,3 +41,15 @@
41
  {"current_steps": 41, "total_steps": 70, "loss": 0.3905, "lr": 8.756562953525151e-06, "epoch": 3.936, "percentage": 58.57, "elapsed_time": "1:18:45", "remaining_time": "0:55:42"}
42
  {"current_steps": 42, "total_steps": 70, "loss": 0.39, "lr": 8.263518223330698e-06, "epoch": 4.032, "percentage": 60.0, "elapsed_time": "1:21:25", "remaining_time": "0:54:17"}
43
  {"current_steps": 43, "total_steps": 70, "loss": 0.3847, "lr": 7.774790660436857e-06, "epoch": 4.128, "percentage": 61.43, "elapsed_time": "1:23:16", "remaining_time": "0:52:17"}
 
 
 
 
 
 
 
 
 
 
 
 
 
41
  {"current_steps": 41, "total_steps": 70, "loss": 0.3905, "lr": 8.756562953525151e-06, "epoch": 3.936, "percentage": 58.57, "elapsed_time": "1:18:45", "remaining_time": "0:55:42"}
42
  {"current_steps": 42, "total_steps": 70, "loss": 0.39, "lr": 8.263518223330698e-06, "epoch": 4.032, "percentage": 60.0, "elapsed_time": "1:21:25", "remaining_time": "0:54:17"}
43
  {"current_steps": 43, "total_steps": 70, "loss": 0.3847, "lr": 7.774790660436857e-06, "epoch": 4.128, "percentage": 61.43, "elapsed_time": "1:23:16", "remaining_time": "0:52:17"}
44
+ {"current_steps": 44, "total_steps": 70, "loss": 0.3637, "lr": 7.291595318569951e-06, "epoch": 4.224, "percentage": 62.86, "elapsed_time": "1:25:12", "remaining_time": "0:50:21"}
45
+ {"current_steps": 45, "total_steps": 70, "loss": 0.3563, "lr": 6.815133497483157e-06, "epoch": 4.32, "percentage": 64.29, "elapsed_time": "1:27:01", "remaining_time": "0:48:20"}
46
+ {"current_steps": 46, "total_steps": 70, "loss": 0.3567, "lr": 6.34658975633605e-06, "epoch": 4.416, "percentage": 65.71, "elapsed_time": "1:29:04", "remaining_time": "0:46:28"}
47
+ {"current_steps": 47, "total_steps": 70, "loss": 0.3567, "lr": 5.887128968693887e-06, "epoch": 4.5120000000000005, "percentage": 67.14, "elapsed_time": "1:30:55", "remaining_time": "0:44:29"}
48
+ {"current_steps": 48, "total_steps": 70, "loss": 0.3563, "lr": 5.43789342646837e-06, "epoch": 4.608, "percentage": 68.57, "elapsed_time": "1:32:45", "remaining_time": "0:42:30"}
49
+ {"current_steps": 49, "total_steps": 70, "loss": 0.3541, "lr": 5.000000000000003e-06, "epoch": 4.704, "percentage": 70.0, "elapsed_time": "1:34:30", "remaining_time": "0:40:30"}
50
+ {"current_steps": 50, "total_steps": 70, "loss": 0.3649, "lr": 4.5745373613424075e-06, "epoch": 4.8, "percentage": 71.43, "elapsed_time": "1:36:18", "remaining_time": "0:38:31"}
51
+ {"current_steps": 51, "total_steps": 70, "loss": 0.3468, "lr": 4.162563277652104e-06, "epoch": 4.896, "percentage": 72.86, "elapsed_time": "1:38:09", "remaining_time": "0:36:33"}
52
+ {"current_steps": 52, "total_steps": 70, "loss": 0.3513, "lr": 3.7651019814126656e-06, "epoch": 4.992, "percentage": 74.29, "elapsed_time": "1:40:07", "remaining_time": "0:34:39"}
53
+ {"current_steps": 53, "total_steps": 70, "loss": 0.3322, "lr": 3.3831416240314085e-06, "epoch": 5.088, "percentage": 75.71, "elapsed_time": "1:42:54", "remaining_time": "0:33:00"}
54
+ {"current_steps": 54, "total_steps": 70, "loss": 0.3432, "lr": 3.017631819139273e-06, "epoch": 5.184, "percentage": 77.14, "elapsed_time": "1:44:45", "remaining_time": "0:31:02"}
55
+ {"current_steps": 55, "total_steps": 70, "loss": 0.3398, "lr": 2.669481281701739e-06, "epoch": 5.28, "percentage": 78.57, "elapsed_time": "1:46:28", "remaining_time": "0:29:02"}