ryanmarten commited on
Commit
4bcf450
·
verified ·
1 Parent(s): 8319b56

Training in progress, epoch 2

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bd57a86c8f864e53a3d1a1279ed189f5900cbaac734220e341148a3edbca90d5
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:20972f7916d323f519debdcd18a13a25cbaab9dbfdc0e8a1275609e00f8db81d
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:66084ae46963a7ae0603459d87e32b77f939aa58e17f474b00a98fbcb1f3fbb7
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2f14e559598ecaa66f2b7c3adeb3a07e3e2f2dba6394f5cbd8a4bba166a1c19e
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:09caf74e1b593c4a44ca99e44ac2a1447838658eb74fc508472a9902be37fbe6
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f9f47d16e3b683e9aefa00d3226451d847d5dfc4d75410be9c8da9987fae48c5
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:eadf66baa5f33c090b4b813ec5d2ef31f54aad9efdb70f9b5efee9a5882f692e
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:36b64bbadbdabeb2fb5750d1370a6e8e813fac90fe56c29f3feeff897238f1d4
3
  size 1089994880
trainer_log.jsonl CHANGED
@@ -20,3 +20,14 @@
20
  {"current_steps": 20, "total_steps": 70, "loss": 0.709, "lr": 1.7971325072229227e-05, "epoch": 1.92, "percentage": 28.57, "elapsed_time": "0:41:26", "remaining_time": "1:43:36"}
21
  {"current_steps": 21, "total_steps": 70, "loss": 0.6841, "lr": 1.766044443118978e-05, "epoch": 2.016, "percentage": 30.0, "elapsed_time": "0:44:17", "remaining_time": "1:43:19"}
22
  {"current_steps": 22, "total_steps": 70, "loss": 0.65, "lr": 1.7330518718298263e-05, "epoch": 2.112, "percentage": 31.43, "elapsed_time": "0:46:19", "remaining_time": "1:41:04"}
 
 
 
 
 
 
 
 
 
 
 
 
20
  {"current_steps": 20, "total_steps": 70, "loss": 0.709, "lr": 1.7971325072229227e-05, "epoch": 1.92, "percentage": 28.57, "elapsed_time": "0:41:26", "remaining_time": "1:43:36"}
21
  {"current_steps": 21, "total_steps": 70, "loss": 0.6841, "lr": 1.766044443118978e-05, "epoch": 2.016, "percentage": 30.0, "elapsed_time": "0:44:17", "remaining_time": "1:43:19"}
22
  {"current_steps": 22, "total_steps": 70, "loss": 0.65, "lr": 1.7330518718298263e-05, "epoch": 2.112, "percentage": 31.43, "elapsed_time": "0:46:19", "remaining_time": "1:41:04"}
23
+ {"current_steps": 23, "total_steps": 70, "loss": 0.658, "lr": 1.698236818086073e-05, "epoch": 2.208, "percentage": 32.86, "elapsed_time": "0:48:23", "remaining_time": "1:38:53"}
24
+ {"current_steps": 24, "total_steps": 70, "loss": 0.6298, "lr": 1.6616858375968596e-05, "epoch": 2.304, "percentage": 34.29, "elapsed_time": "0:50:21", "remaining_time": "1:36:32"}
25
+ {"current_steps": 25, "total_steps": 70, "loss": 0.6483, "lr": 1.6234898018587336e-05, "epoch": 2.4, "percentage": 35.71, "elapsed_time": "0:52:22", "remaining_time": "1:34:16"}
26
+ {"current_steps": 26, "total_steps": 70, "loss": 0.6309, "lr": 1.5837436722347902e-05, "epoch": 2.496, "percentage": 37.14, "elapsed_time": "0:54:26", "remaining_time": "1:32:07"}
27
+ {"current_steps": 27, "total_steps": 70, "loss": 0.6434, "lr": 1.5425462638657597e-05, "epoch": 2.592, "percentage": 38.57, "elapsed_time": "0:56:24", "remaining_time": "1:29:49"}
28
+ {"current_steps": 28, "total_steps": 70, "loss": 0.6293, "lr": 1.5000000000000002e-05, "epoch": 2.6879999999999997, "percentage": 40.0, "elapsed_time": "0:58:12", "remaining_time": "1:27:18"}
29
+ {"current_steps": 29, "total_steps": 70, "loss": 0.6267, "lr": 1.4562106573531632e-05, "epoch": 2.784, "percentage": 41.43, "elapsed_time": "1:00:23", "remaining_time": "1:25:22"}
30
+ {"current_steps": 30, "total_steps": 70, "loss": 0.6336, "lr": 1.4112871031306118e-05, "epoch": 2.88, "percentage": 42.86, "elapsed_time": "1:02:27", "remaining_time": "1:23:16"}
31
+ {"current_steps": 31, "total_steps": 70, "loss": 0.6135, "lr": 1.3653410243663953e-05, "epoch": 2.976, "percentage": 44.29, "elapsed_time": "1:04:33", "remaining_time": "1:21:13"}
32
+ {"current_steps": 32, "total_steps": 70, "loss": 0.5747, "lr": 1.3184866502516846e-05, "epoch": 3.072, "percentage": 45.71, "elapsed_time": "1:07:25", "remaining_time": "1:20:03"}
33
+ {"current_steps": 33, "total_steps": 70, "loss": 0.5785, "lr": 1.2708404681430054e-05, "epoch": 3.168, "percentage": 47.14, "elapsed_time": "1:09:13", "remaining_time": "1:17:36"}