ryanmarten committed on
Commit
0df6073
·
verified ·
1 Parent(s): c45e6e2

Training in progress, epoch 1

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:72c7116e320b1557c2942ada11f6e937c9f77c7cae77c0cc8d3475c128c62c55
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cdf6e8da8e2dd3cd8ca276ae975b5e5bbc414b5dfd9517de17f4e59b90c57d80
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0e45921c5ce8fbc592f3f2bde5f2bfd7e8306c56493ab34f1fcf883d1dfbb92a
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:02ac8f2091604ec108baa80e087cc15a23b93848081dac70035ea431952d4123
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4741fe8f7d07cea199afdb8926476a965bd7878acf29fab0541065be752282c6
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fb8dadfbfa981d10b9ed6a7135e3acc9c4977cf31073079330f3a24a368d94c4
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e8583c28ae9bcc36d07516ee2d4c4dd2489f0f90bae8c10daa3b26914b0e5468
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8b4324c3bfde0c12bcbf6cc8159e4237e82546abc396efe16c7ff461cc80b2f8
3
  size 1089994880
trainer_log.jsonl CHANGED
@@ -32,3 +32,36 @@
32
  {"current_steps": 32, "total_steps": 224, "loss": 0.709, "lr": 1.990122514534651e-05, "epoch": 0.9721518987341772, "percentage": 14.29, "elapsed_time": "0:52:37", "remaining_time": "5:15:44"}
33
  {"current_steps": 33, "total_steps": 224, "loss": 0.6872, "lr": 1.9878102910595097e-05, "epoch": 1.010126582278481, "percentage": 14.73, "elapsed_time": "0:55:08", "remaining_time": "5:19:12"}
34
  {"current_steps": 34, "total_steps": 224, "loss": 0.6668, "lr": 1.985256759242359e-05, "epoch": 1.040506329113924, "percentage": 15.18, "elapsed_time": "0:56:55", "remaining_time": "5:18:07"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
32
  {"current_steps": 32, "total_steps": 224, "loss": 0.709, "lr": 1.990122514534651e-05, "epoch": 0.9721518987341772, "percentage": 14.29, "elapsed_time": "0:52:37", "remaining_time": "5:15:44"}
33
  {"current_steps": 33, "total_steps": 224, "loss": 0.6872, "lr": 1.9878102910595097e-05, "epoch": 1.010126582278481, "percentage": 14.73, "elapsed_time": "0:55:08", "remaining_time": "5:19:12"}
34
  {"current_steps": 34, "total_steps": 224, "loss": 0.6668, "lr": 1.985256759242359e-05, "epoch": 1.040506329113924, "percentage": 15.18, "elapsed_time": "0:56:55", "remaining_time": "5:18:07"}
35
+ {"current_steps": 35, "total_steps": 224, "loss": 0.6862, "lr": 1.982462542875576e-05, "epoch": 1.070886075949367, "percentage": 15.62, "elapsed_time": "0:58:24", "remaining_time": "5:15:26"}
36
+ {"current_steps": 36, "total_steps": 224, "loss": 0.6604, "lr": 1.979428324547432e-05, "epoch": 1.1012658227848102, "percentage": 16.07, "elapsed_time": "1:00:12", "remaining_time": "5:14:26"}
37
+ {"current_steps": 37, "total_steps": 224, "loss": 0.6688, "lr": 1.9761548454753455e-05, "epoch": 1.1316455696202532, "percentage": 16.52, "elapsed_time": "1:01:45", "remaining_time": "5:12:06"}
38
+ {"current_steps": 38, "total_steps": 224, "loss": 0.6582, "lr": 1.972642905324813e-05, "epoch": 1.1620253164556962, "percentage": 16.96, "elapsed_time": "1:03:30", "remaining_time": "5:10:51"}
39
+ {"current_steps": 39, "total_steps": 224, "loss": 0.6718, "lr": 1.9688933620140638e-05, "epoch": 1.1924050632911392, "percentage": 17.41, "elapsed_time": "1:05:09", "remaining_time": "5:09:04"}
40
+ {"current_steps": 40, "total_steps": 224, "loss": 0.6488, "lr": 1.96490713150448e-05, "epoch": 1.2227848101265824, "percentage": 17.86, "elapsed_time": "1:06:37", "remaining_time": "5:06:27"}
41
+ {"current_steps": 41, "total_steps": 224, "loss": 0.6432, "lr": 1.9606851875768404e-05, "epoch": 1.2531645569620253, "percentage": 18.3, "elapsed_time": "1:08:22", "remaining_time": "5:05:09"}
42
+ {"current_steps": 42, "total_steps": 224, "loss": 0.6481, "lr": 1.956228561593441e-05, "epoch": 1.2835443037974683, "percentage": 18.75, "elapsed_time": "1:10:04", "remaining_time": "5:03:38"}
43
+ {"current_steps": 43, "total_steps": 224, "loss": 0.651, "lr": 1.9515383422461457e-05, "epoch": 1.3139240506329113, "percentage": 19.2, "elapsed_time": "1:11:44", "remaining_time": "5:01:57"}
44
+ {"current_steps": 44, "total_steps": 224, "loss": 0.648, "lr": 1.9466156752904344e-05, "epoch": 1.3443037974683545, "percentage": 19.64, "elapsed_time": "1:13:23", "remaining_time": "5:00:14"}
45
+ {"current_steps": 45, "total_steps": 224, "loss": 0.641, "lr": 1.9414617632655114e-05, "epoch": 1.3746835443037975, "percentage": 20.09, "elapsed_time": "1:15:02", "remaining_time": "4:58:29"}
46
+ {"current_steps": 46, "total_steps": 224, "loss": 0.6506, "lr": 1.9360778652005416e-05, "epoch": 1.4050632911392404, "percentage": 20.54, "elapsed_time": "1:16:51", "remaining_time": "4:57:24"}
47
+ {"current_steps": 47, "total_steps": 224, "loss": 0.6356, "lr": 1.9304652963070868e-05, "epoch": 1.4354430379746836, "percentage": 20.98, "elapsed_time": "1:18:21", "remaining_time": "4:55:06"}
48
+ {"current_steps": 48, "total_steps": 224, "loss": 0.6266, "lr": 1.9246254276578175e-05, "epoch": 1.4658227848101266, "percentage": 21.43, "elapsed_time": "1:20:06", "remaining_time": "4:53:43"}
49
+ {"current_steps": 49, "total_steps": 224, "loss": 0.6413, "lr": 1.9185596858515797e-05, "epoch": 1.4962025316455696, "percentage": 21.88, "elapsed_time": "1:21:46", "remaining_time": "4:52:04"}
50
+ {"current_steps": 50, "total_steps": 224, "loss": 0.6602, "lr": 1.9122695526648968e-05, "epoch": 1.5265822784810128, "percentage": 22.32, "elapsed_time": "1:23:25", "remaining_time": "4:50:20"}
51
+ {"current_steps": 51, "total_steps": 224, "loss": 0.6456, "lr": 1.905756564689991e-05, "epoch": 1.5569620253164556, "percentage": 22.77, "elapsed_time": "1:25:16", "remaining_time": "4:49:16"}
52
+ {"current_steps": 52, "total_steps": 224, "loss": 0.6278, "lr": 1.8990223129594146e-05, "epoch": 1.5873417721518988, "percentage": 23.21, "elapsed_time": "1:26:49", "remaining_time": "4:47:10"}
53
+ {"current_steps": 53, "total_steps": 224, "loss": 0.645, "lr": 1.8920684425573865e-05, "epoch": 1.6177215189873417, "percentage": 23.66, "elapsed_time": "1:28:32", "remaining_time": "4:45:40"}
54
+ {"current_steps": 54, "total_steps": 224, "loss": 0.6369, "lr": 1.884896652217917e-05, "epoch": 1.6481012658227847, "percentage": 24.11, "elapsed_time": "1:30:16", "remaining_time": "4:44:10"}
55
+ {"current_steps": 55, "total_steps": 224, "loss": 0.6216, "lr": 1.877508693909831e-05, "epoch": 1.678481012658228, "percentage": 24.55, "elapsed_time": "1:31:51", "remaining_time": "4:42:14"}
56
+ {"current_steps": 56, "total_steps": 224, "loss": 0.629, "lr": 1.8699063724087905e-05, "epoch": 1.7088607594936709, "percentage": 25.0, "elapsed_time": "1:33:24", "remaining_time": "4:40:14"}
57
+ {"current_steps": 57, "total_steps": 224, "loss": 0.6251, "lr": 1.862091544856407e-05, "epoch": 1.7392405063291139, "percentage": 25.45, "elapsed_time": "1:35:00", "remaining_time": "4:38:21"}
58
+ {"current_steps": 58, "total_steps": 224, "loss": 0.6191, "lr": 1.854066120306571e-05, "epoch": 1.769620253164557, "percentage": 25.89, "elapsed_time": "1:36:49", "remaining_time": "4:37:07"}
59
+ {"current_steps": 59, "total_steps": 224, "loss": 0.6276, "lr": 1.8458320592590976e-05, "epoch": 1.8, "percentage": 26.34, "elapsed_time": "1:38:17", "remaining_time": "4:34:53"}
60
+ {"current_steps": 60, "total_steps": 224, "loss": 0.62, "lr": 1.837391373180801e-05, "epoch": 1.830379746835443, "percentage": 26.79, "elapsed_time": "1:39:51", "remaining_time": "4:32:57"}
61
+ {"current_steps": 61, "total_steps": 224, "loss": 0.6287, "lr": 1.8287461240141217e-05, "epoch": 1.8607594936708862, "percentage": 27.23, "elapsed_time": "1:41:37", "remaining_time": "4:31:34"}
62
+ {"current_steps": 62, "total_steps": 224, "loss": 0.6397, "lr": 1.8198984236734246e-05, "epoch": 1.891139240506329, "percentage": 27.68, "elapsed_time": "1:43:14", "remaining_time": "4:29:44"}
63
+ {"current_steps": 63, "total_steps": 224, "loss": 0.6151, "lr": 1.8108504335290852e-05, "epoch": 1.9215189873417722, "percentage": 28.12, "elapsed_time": "1:44:37", "remaining_time": "4:27:23"}
64
+ {"current_steps": 64, "total_steps": 224, "loss": 0.6275, "lr": 1.8016043638794975e-05, "epoch": 1.9518987341772152, "percentage": 28.57, "elapsed_time": "1:46:12", "remaining_time": "4:25:30"}
65
+ {"current_steps": 65, "total_steps": 224, "loss": 0.629, "lr": 1.7921624734111292e-05, "epoch": 1.9822784810126581, "percentage": 29.02, "elapsed_time": "1:47:43", "remaining_time": "4:23:30"}
66
+ {"current_steps": 66, "total_steps": 224, "loss": 0.5857, "lr": 1.7825270686467567e-05, "epoch": 2.020253164556962, "percentage": 29.46, "elapsed_time": "1:50:07", "remaining_time": "4:23:38"}
67
+ {"current_steps": 67, "total_steps": 224, "loss": 0.5681, "lr": 1.7727005033820117e-05, "epoch": 2.050632911392405, "percentage": 29.91, "elapsed_time": "1:51:47", "remaining_time": "4:21:57"}