ryanmarten commited on
Commit
ef165bc
·
verified ·
1 Parent(s): cf2656f

Training in progress, epoch 2

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:326b28d46f3c64e035a97482e9dc560d41968dfc297912b269831871c442cdd1
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c74ddbbbeffb5ab03871abcc50c7d8614a41d67572f2693fd7bfee4c47564aa5
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4d716f0cf40c6347acdfa4e9caffb02e0ce4c2205882aa5ef502b901ed3c941b
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:23872eb187e6705dbeaaf7f8d1de7e0b0830110b74fca89e6c2a9faa0e96681b
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d8017553227023906df74bdb40880ae52f12445a2181c2cc6d51ece61f27a76f
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:823ba356a8a1d0e4c0759c3eeeb9f90c7b0ac1083beb9877e4a292696fa273c2
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:497efa80e8bf25c1dcdb7a9f34a5cea5b9c40c88239fa1e06e46f9296fa003da
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:67f22247c3e3eaa44ee57008b21dd31b75905330d324c58088325a4082569528
3
  size 1089994880
trainer_log.jsonl CHANGED
@@ -20,3 +20,14 @@
20
  {"current_steps": 20, "total_steps": 70, "loss": 0.713, "lr": 1.7971325072229227e-05, "epoch": 1.92, "percentage": 28.57, "elapsed_time": "0:39:53", "remaining_time": "1:39:43"}
21
  {"current_steps": 21, "total_steps": 70, "loss": 0.6956, "lr": 1.766044443118978e-05, "epoch": 2.016, "percentage": 30.0, "elapsed_time": "0:42:32", "remaining_time": "1:39:16"}
22
  {"current_steps": 22, "total_steps": 70, "loss": 0.6748, "lr": 1.7330518718298263e-05, "epoch": 2.112, "percentage": 31.43, "elapsed_time": "0:44:39", "remaining_time": "1:37:26"}
 
 
 
 
 
 
 
 
 
 
 
 
20
  {"current_steps": 20, "total_steps": 70, "loss": 0.713, "lr": 1.7971325072229227e-05, "epoch": 1.92, "percentage": 28.57, "elapsed_time": "0:39:53", "remaining_time": "1:39:43"}
21
  {"current_steps": 21, "total_steps": 70, "loss": 0.6956, "lr": 1.766044443118978e-05, "epoch": 2.016, "percentage": 30.0, "elapsed_time": "0:42:32", "remaining_time": "1:39:16"}
22
  {"current_steps": 22, "total_steps": 70, "loss": 0.6748, "lr": 1.7330518718298263e-05, "epoch": 2.112, "percentage": 31.43, "elapsed_time": "0:44:39", "remaining_time": "1:37:26"}
23
+ {"current_steps": 23, "total_steps": 70, "loss": 0.6648, "lr": 1.698236818086073e-05, "epoch": 2.208, "percentage": 32.86, "elapsed_time": "0:46:37", "remaining_time": "1:35:17"}
24
+ {"current_steps": 24, "total_steps": 70, "loss": 0.6548, "lr": 1.6616858375968596e-05, "epoch": 2.304, "percentage": 34.29, "elapsed_time": "0:48:28", "remaining_time": "1:32:54"}
25
+ {"current_steps": 25, "total_steps": 70, "loss": 0.6792, "lr": 1.6234898018587336e-05, "epoch": 2.4, "percentage": 35.71, "elapsed_time": "0:50:22", "remaining_time": "1:30:40"}
26
+ {"current_steps": 26, "total_steps": 70, "loss": 0.6968, "lr": 1.5837436722347902e-05, "epoch": 2.496, "percentage": 37.14, "elapsed_time": "0:52:15", "remaining_time": "1:28:25"}
27
+ {"current_steps": 27, "total_steps": 70, "loss": 0.6503, "lr": 1.5425462638657597e-05, "epoch": 2.592, "percentage": 38.57, "elapsed_time": "0:54:13", "remaining_time": "1:26:21"}
28
+ {"current_steps": 28, "total_steps": 70, "loss": 0.6455, "lr": 1.5000000000000002e-05, "epoch": 2.6879999999999997, "percentage": 40.0, "elapsed_time": "0:56:06", "remaining_time": "1:24:09"}
29
+ {"current_steps": 29, "total_steps": 70, "loss": 0.6506, "lr": 1.4562106573531632e-05, "epoch": 2.784, "percentage": 41.43, "elapsed_time": "0:58:06", "remaining_time": "1:22:09"}
30
+ {"current_steps": 30, "total_steps": 70, "loss": 0.637, "lr": 1.4112871031306118e-05, "epoch": 2.88, "percentage": 42.86, "elapsed_time": "0:59:56", "remaining_time": "1:19:55"}
31
+ {"current_steps": 31, "total_steps": 70, "loss": 0.6301, "lr": 1.3653410243663953e-05, "epoch": 2.976, "percentage": 44.29, "elapsed_time": "1:01:47", "remaining_time": "1:17:44"}
32
+ {"current_steps": 32, "total_steps": 70, "loss": 0.6197, "lr": 1.3184866502516846e-05, "epoch": 3.072, "percentage": 45.71, "elapsed_time": "1:04:27", "remaining_time": "1:16:32"}
33
+ {"current_steps": 33, "total_steps": 70, "loss": 0.6053, "lr": 1.2708404681430054e-05, "epoch": 3.168, "percentage": 47.14, "elapsed_time": "1:06:21", "remaining_time": "1:14:24"}