ryanmarten commited on
Commit
b32f952
·
verified ·
1 Parent(s): d4cafe2

Training in progress, epoch 6

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3a18f931132dac894b1f12a5361757ab2d0c64870947595d1269a65b70fa55dd
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7a3f5019af82be28dde53be0ba2d08c74be9190b68c9b8f22a4deb178292a99d
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:dafef32e8aa8e7c24e3d66f820e0f8b26e73c690933ae4b7c07fab4dccb47a9a
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e7014f3987bf632c74e02e787beedf104a24bbf2b09b0c313588cd6f2079070d
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fc5fb08728cbb7b117559a7c89f358793db7855e7eb820ee8c4940730cdb53da
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8a571e01e280adf41edd7934f78327982273b64de93c450cfa30c7f614757aea
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cf99eac9eaed3cdb2d2753d2e276f4fb35fef36f8773fb00e02cf3265786b0ea
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1b27b294bd35c34ad7ec2ef99f78fe37d027fcf56afb9f710566655b97887db4
3
  size 1089994880
trainer_log.jsonl CHANGED
@@ -62,3 +62,10 @@
62
  {"current_steps": 62, "total_steps": 70, "loss": 0.5036, "lr": 7.852378812959227e-07, "epoch": 5.952, "percentage": 88.57, "elapsed_time": "2:10:43", "remaining_time": "0:16:52"}
63
  {"current_steps": 63, "total_steps": 70, "loss": 0.5197, "lr": 6.030737921409169e-07, "epoch": 6.048, "percentage": 90.0, "elapsed_time": "2:14:00", "remaining_time": "0:14:53"}
64
  {"current_steps": 64, "total_steps": 70, "loss": 0.4934, "lr": 4.4427194213859216e-07, "epoch": 6.144, "percentage": 91.43, "elapsed_time": "2:16:00", "remaining_time": "0:12:45"}
 
 
 
 
 
 
 
 
62
  {"current_steps": 62, "total_steps": 70, "loss": 0.5036, "lr": 7.852378812959227e-07, "epoch": 5.952, "percentage": 88.57, "elapsed_time": "2:10:43", "remaining_time": "0:16:52"}
63
  {"current_steps": 63, "total_steps": 70, "loss": 0.5197, "lr": 6.030737921409169e-07, "epoch": 6.048, "percentage": 90.0, "elapsed_time": "2:14:00", "remaining_time": "0:14:53"}
64
  {"current_steps": 64, "total_steps": 70, "loss": 0.4934, "lr": 4.4427194213859216e-07, "epoch": 6.144, "percentage": 91.43, "elapsed_time": "2:16:00", "remaining_time": "0:12:45"}
65
+ {"current_steps": 65, "total_steps": 70, "loss": 0.4938, "lr": 3.0922713770922155e-07, "epoch": 6.24, "percentage": 92.86, "elapsed_time": "2:18:06", "remaining_time": "0:10:37"}
66
+ {"current_steps": 66, "total_steps": 70, "loss": 0.504, "lr": 1.9827512151456175e-07, "epoch": 6.336, "percentage": 94.29, "elapsed_time": "2:20:11", "remaining_time": "0:08:29"}
67
+ {"current_steps": 67, "total_steps": 70, "loss": 0.49, "lr": 1.1169173774871478e-07, "epoch": 6.432, "percentage": 95.71, "elapsed_time": "2:22:18", "remaining_time": "0:06:22"}
68
+ {"current_steps": 68, "total_steps": 70, "loss": 0.4977, "lr": 4.9692246345985905e-08, "epoch": 6.5280000000000005, "percentage": 97.14, "elapsed_time": "2:24:26", "remaining_time": "0:04:14"}
69
+ {"current_steps": 69, "total_steps": 70, "loss": 0.5099, "lr": 1.2430787810776556e-08, "epoch": 6.624, "percentage": 98.57, "elapsed_time": "2:26:20", "remaining_time": "0:02:07"}
70
+ {"current_steps": 70, "total_steps": 70, "loss": 0.4839, "lr": 0.0, "epoch": 6.72, "percentage": 100.0, "elapsed_time": "2:28:13", "remaining_time": "0:00:00"}
71
+ {"current_steps": 70, "total_steps": 70, "epoch": 6.72, "percentage": 100.0, "elapsed_time": "2:30:13", "remaining_time": "0:00:00"}