sedrickkeh commited on
Commit
c52829d
·
verified ·
1 Parent(s): f369e0e

Training in progress, epoch 2

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1fd9ea0dd86821ec3ae355b18848adec36811c7ce14baf0b3aa1c827a52e7822
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b1cf0d73a4944c76886e467ccd71da98f24a912867e5e9abaec18060b4494a79
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:da26e8336d8d7ba2dc36d49e7ea9ef7880002c96cce1a29ed041880213b8f029
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c30f08ffcacdc0461992ef8ef343531df084f80592cd8a29f36d948eaf7ccebd
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4b9edecb6c17accd73764c7f32e75dcf596e01be0065b6d3cddfb5fa926999ed
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:471721731aede15e95ac5a1a3fcf2562385b737f0387e025076adface8669a05
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d38ecc0f7bbf253d4bc6002f200a25296cbaa6baefc9857c127a3f692e93425c
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c5e9a3ec7c3b93ce0e4574165b68e30a954f9a0ee4f5eda55d0c2e53af121f53
3
  size 1089994880
trainer_log.jsonl CHANGED
@@ -68,3 +68,36 @@
68
  {"current_steps": 68, "total_steps": 224, "loss": 0.4652, "lr": 1.762685178110382e-05, "epoch": 2.081012658227848, "percentage": 30.36, "elapsed_time": "0:50:03", "remaining_time": "1:54:50"}
69
  {"current_steps": 69, "total_steps": 224, "loss": 0.451, "lr": 1.752483539436807e-05, "epoch": 2.1113924050632913, "percentage": 30.8, "elapsed_time": "0:50:41", "remaining_time": "1:53:52"}
70
  {"current_steps": 70, "total_steps": 224, "loss": 0.4843, "lr": 1.7420980794800013e-05, "epoch": 2.141772151898734, "percentage": 31.25, "elapsed_time": "0:51:44", "remaining_time": "1:53:49"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
68
  {"current_steps": 68, "total_steps": 224, "loss": 0.4652, "lr": 1.762685178110382e-05, "epoch": 2.081012658227848, "percentage": 30.36, "elapsed_time": "0:50:03", "remaining_time": "1:54:50"}
69
  {"current_steps": 69, "total_steps": 224, "loss": 0.451, "lr": 1.752483539436807e-05, "epoch": 2.1113924050632913, "percentage": 30.8, "elapsed_time": "0:50:41", "remaining_time": "1:53:52"}
70
  {"current_steps": 70, "total_steps": 224, "loss": 0.4843, "lr": 1.7420980794800013e-05, "epoch": 2.141772151898734, "percentage": 31.25, "elapsed_time": "0:51:44", "remaining_time": "1:53:49"}
71
+ {"current_steps": 71, "total_steps": 224, "loss": 0.4779, "lr": 1.731531335263669e-05, "epoch": 2.1721518987341772, "percentage": 31.7, "elapsed_time": "0:52:26", "remaining_time": "1:53:00"}
72
+ {"current_steps": 72, "total_steps": 224, "loss": 0.4812, "lr": 1.720785888096743e-05, "epoch": 2.2025316455696204, "percentage": 32.14, "elapsed_time": "0:53:08", "remaining_time": "1:52:12"}
73
+ {"current_steps": 73, "total_steps": 224, "loss": 0.4881, "lr": 1.7098643629428035e-05, "epoch": 2.232911392405063, "percentage": 32.59, "elapsed_time": "0:53:56", "remaining_time": "1:51:34"}
74
+ {"current_steps": 74, "total_steps": 224, "loss": 0.4389, "lr": 1.698769427778842e-05, "epoch": 2.2632911392405064, "percentage": 33.04, "elapsed_time": "0:54:46", "remaining_time": "1:51:00"}
75
+ {"current_steps": 75, "total_steps": 224, "loss": 0.4898, "lr": 1.687503792943506e-05, "epoch": 2.293670886075949, "percentage": 33.48, "elapsed_time": "0:55:31", "remaining_time": "1:50:19"}
76
+ {"current_steps": 76, "total_steps": 224, "loss": 0.4513, "lr": 1.6760702104750046e-05, "epoch": 2.3240506329113924, "percentage": 33.93, "elapsed_time": "0:56:02", "remaining_time": "1:49:08"}
77
+ {"current_steps": 77, "total_steps": 224, "loss": 0.4544, "lr": 1.664471473438822e-05, "epoch": 2.3544303797468356, "percentage": 34.38, "elapsed_time": "0:56:48", "remaining_time": "1:48:26"}
78
+ {"current_steps": 78, "total_steps": 224, "loss": 0.4695, "lr": 1.6527104152454096e-05, "epoch": 2.3848101265822783, "percentage": 34.82, "elapsed_time": "0:57:47", "remaining_time": "1:48:10"}
79
+ {"current_steps": 79, "total_steps": 224, "loss": 0.5128, "lr": 1.6407899089580263e-05, "epoch": 2.4151898734177215, "percentage": 35.27, "elapsed_time": "0:58:28", "remaining_time": "1:47:18"}
80
+ {"current_steps": 80, "total_steps": 224, "loss": 0.4573, "lr": 1.628712866590885e-05, "epoch": 2.4455696202531647, "percentage": 35.71, "elapsed_time": "0:59:02", "remaining_time": "1:46:16"}
81
+ {"current_steps": 81, "total_steps": 224, "loss": 0.4605, "lr": 1.6164822383977912e-05, "epoch": 2.4759493670886075, "percentage": 36.16, "elapsed_time": "0:59:44", "remaining_time": "1:45:27"}
82
+ {"current_steps": 82, "total_steps": 224, "loss": 0.4683, "lr": 1.604101012151436e-05, "epoch": 2.5063291139240507, "percentage": 36.61, "elapsed_time": "1:00:22", "remaining_time": "1:44:32"}
83
+ {"current_steps": 83, "total_steps": 224, "loss": 0.4751, "lr": 1.5915722124135227e-05, "epoch": 2.536708860759494, "percentage": 37.05, "elapsed_time": "1:01:16", "remaining_time": "1:44:06"}
84
+ {"current_steps": 84, "total_steps": 224, "loss": 0.4879, "lr": 1.5788988997959115e-05, "epoch": 2.5670886075949366, "percentage": 37.5, "elapsed_time": "1:02:05", "remaining_time": "1:43:29"}
85
+ {"current_steps": 85, "total_steps": 224, "loss": 0.4601, "lr": 1.5660841702129533e-05, "epoch": 2.59746835443038, "percentage": 37.95, "elapsed_time": "1:02:53", "remaining_time": "1:42:50"}
86
+ {"current_steps": 86, "total_steps": 224, "loss": 0.4797, "lr": 1.5531311541251995e-05, "epoch": 2.6278481012658226, "percentage": 38.39, "elapsed_time": "1:03:31", "remaining_time": "1:41:56"}
87
+ {"current_steps": 87, "total_steps": 224, "loss": 0.4646, "lr": 1.540043015774676e-05, "epoch": 2.6582278481012658, "percentage": 38.84, "elapsed_time": "1:04:15", "remaining_time": "1:41:11"}
88
+ {"current_steps": 88, "total_steps": 224, "loss": 0.4658, "lr": 1.5268229524119007e-05, "epoch": 2.688607594936709, "percentage": 39.29, "elapsed_time": "1:04:57", "remaining_time": "1:40:23"}
89
+ {"current_steps": 89, "total_steps": 224, "loss": 0.4632, "lr": 1.513474193514842e-05, "epoch": 2.7189873417721517, "percentage": 39.73, "elapsed_time": "1:05:36", "remaining_time": "1:39:31"}
90
+ {"current_steps": 90, "total_steps": 224, "loss": 0.4835, "lr": 1.5000000000000002e-05, "epoch": 2.749367088607595, "percentage": 40.18, "elapsed_time": "1:06:12", "remaining_time": "1:38:35"}
91
+ {"current_steps": 91, "total_steps": 224, "loss": 0.4503, "lr": 1.4864036634258112e-05, "epoch": 2.779746835443038, "percentage": 40.62, "elapsed_time": "1:07:07", "remaining_time": "1:38:05"}
92
+ {"current_steps": 92, "total_steps": 224, "loss": 0.4418, "lr": 1.4726885051885654e-05, "epoch": 2.810126582278481, "percentage": 41.07, "elapsed_time": "1:07:48", "remaining_time": "1:37:17"}
93
+ {"current_steps": 93, "total_steps": 224, "loss": 0.4674, "lr": 1.4588578757110359e-05, "epoch": 2.840506329113924, "percentage": 41.52, "elapsed_time": "1:08:23", "remaining_time": "1:36:20"}
94
+ {"current_steps": 94, "total_steps": 224, "loss": 0.4354, "lr": 1.4449151536240167e-05, "epoch": 2.8708860759493673, "percentage": 41.96, "elapsed_time": "1:09:01", "remaining_time": "1:35:27"}
95
+ {"current_steps": 95, "total_steps": 224, "loss": 0.4402, "lr": 1.4308637449409705e-05, "epoch": 2.90126582278481, "percentage": 42.41, "elapsed_time": "1:09:43", "remaining_time": "1:34:40"}
96
+ {"current_steps": 96, "total_steps": 224, "loss": 0.4654, "lr": 1.4167070822259868e-05, "epoch": 2.9316455696202532, "percentage": 42.86, "elapsed_time": "1:10:18", "remaining_time": "1:33:45"}
97
+ {"current_steps": 97, "total_steps": 224, "loss": 0.4391, "lr": 1.402448623755254e-05, "epoch": 2.962025316455696, "percentage": 43.3, "elapsed_time": "1:10:49", "remaining_time": "1:32:43"}
98
+ {"current_steps": 98, "total_steps": 224, "loss": 0.4737, "lr": 1.3880918526722497e-05, "epoch": 2.992405063291139, "percentage": 43.75, "elapsed_time": "1:11:29", "remaining_time": "1:31:55"}
99
+ {"current_steps": 99, "total_steps": 224, "loss": 0.3205, "lr": 1.3736402761368597e-05, "epoch": 3.030379746835443, "percentage": 44.2, "elapsed_time": "1:13:10", "remaining_time": "1:32:23"}
100
+ {"current_steps": 100, "total_steps": 224, "loss": 0.3245, "lr": 1.3590974244686248e-05, "epoch": 3.060759493670886, "percentage": 44.64, "elapsed_time": "1:13:53", "remaining_time": "1:31:37"}
101
+ {"current_steps": 101, "total_steps": 224, "loss": 0.3338, "lr": 1.344466850284333e-05, "epoch": 3.091139240506329, "percentage": 45.09, "elapsed_time": "1:14:37", "remaining_time": "1:30:52"}
102
+ {"current_steps": 102, "total_steps": 224, "loss": 0.3402, "lr": 1.3297521276301666e-05, "epoch": 3.1215189873417724, "percentage": 45.54, "elapsed_time": "1:15:24", "remaining_time": "1:30:11"}
103
+ {"current_steps": 103, "total_steps": 224, "loss": 0.3152, "lr": 1.3149568511086104e-05, "epoch": 3.151898734177215, "percentage": 45.98, "elapsed_time": "1:16:01", "remaining_time": "1:29:18"}