neginr commited on
Commit
ad00dac
·
verified ·
1 Parent(s): 882ff5e

Training in progress, epoch 6

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:529f36cc6c1a606599df7a9dee164693920856eaa316c55656a78339b5856c05
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4eedfb12ffa7651640247566ab5272941030f6bdd26fdf92f99787ea6fefdf37
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f298f99cacb499a8c46273b192904cf1394e3a0af2aa61720b5d6ed8ab786d91
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6c172ec0813f77dccd77f50521fa2406f437a155200ff2947c397e71fb6d7cba
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f4af57787cb004f70beeaf8e37f003b579dea21cd04bab7e2eb3c5b345c0dde1
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0988742bd1c68a4a8aab5d23248729cb9b8c293407d3c099d0d66ba7632c51ff
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d04545968814e02e057dba307678eb50c1a7953abfdac86f70b80117701ddabc
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0d1ce4caf6f4ce40fcc68f3dd7d4f5f458ecf3a5d86de1043c5bc7afc91646da
3
  size 1089994880
trainer_log.jsonl CHANGED
@@ -343,3 +343,23 @@
343
  {"current_steps": 343, "total_steps": 364, "loss": 0.077, "lr": 2.028332677849254e-07, "epoch": 6.554140127388535, "percentage": 94.23, "elapsed_time": "0:40:11", "remaining_time": "0:02:27"}
344
  {"current_steps": 344, "total_steps": 364, "loss": 0.0824, "lr": 1.840338184455881e-07, "epoch": 6.573248407643312, "percentage": 94.51, "elapsed_time": "0:40:18", "remaining_time": "0:02:20"}
345
  {"current_steps": 345, "total_steps": 364, "loss": 0.0461, "lr": 1.6614038111289034e-07, "epoch": 6.592356687898089, "percentage": 94.78, "elapsed_time": "0:40:21", "remaining_time": "0:02:13"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
343
  {"current_steps": 343, "total_steps": 364, "loss": 0.077, "lr": 2.028332677849254e-07, "epoch": 6.554140127388535, "percentage": 94.23, "elapsed_time": "0:40:11", "remaining_time": "0:02:27"}
344
  {"current_steps": 344, "total_steps": 364, "loss": 0.0824, "lr": 1.840338184455881e-07, "epoch": 6.573248407643312, "percentage": 94.51, "elapsed_time": "0:40:18", "remaining_time": "0:02:20"}
345
  {"current_steps": 345, "total_steps": 364, "loss": 0.0461, "lr": 1.6614038111289034e-07, "epoch": 6.592356687898089, "percentage": 94.78, "elapsed_time": "0:40:21", "remaining_time": "0:02:13"}
346
+ {"current_steps": 346, "total_steps": 364, "loss": 0.0749, "lr": 1.49154607348051e-07, "epoch": 6.611464968152866, "percentage": 95.05, "elapsed_time": "0:40:27", "remaining_time": "0:02:06"}
347
+ {"current_steps": 347, "total_steps": 364, "loss": 0.0743, "lr": 1.330780649350938e-07, "epoch": 6.630573248407643, "percentage": 95.33, "elapsed_time": "0:40:33", "remaining_time": "0:01:59"}
348
+ {"current_steps": 348, "total_steps": 364, "loss": 0.0809, "lr": 1.1791223773614635e-07, "epoch": 6.649681528662421, "percentage": 95.6, "elapsed_time": "0:40:38", "remaining_time": "0:01:52"}
349
+ {"current_steps": 349, "total_steps": 364, "loss": 0.0413, "lr": 1.0365852555447642e-07, "epoch": 6.6687898089171975, "percentage": 95.88, "elapsed_time": "0:40:42", "remaining_time": "0:01:44"}
350
+ {"current_steps": 350, "total_steps": 364, "loss": 0.0552, "lr": 9.031824400528854e-08, "epoch": 6.687898089171974, "percentage": 96.15, "elapsed_time": "0:40:45", "remaining_time": "0:01:37"}
351
+ {"current_steps": 351, "total_steps": 364, "loss": 0.0827, "lr": 7.789262439430012e-08, "epoch": 6.707006369426751, "percentage": 96.43, "elapsed_time": "0:40:53", "remaining_time": "0:01:30"}
352
+ {"current_steps": 352, "total_steps": 364, "loss": 0.0367, "lr": 6.638281360408339e-08, "epoch": 6.726114649681529, "percentage": 96.7, "elapsed_time": "0:40:57", "remaining_time": "0:01:23"}
353
+ {"current_steps": 353, "total_steps": 364, "loss": 0.0711, "lr": 5.578987398821345e-08, "epoch": 6.745222929936306, "percentage": 96.98, "elapsed_time": "0:41:01", "remaining_time": "0:01:16"}
354
+ {"current_steps": 354, "total_steps": 364, "loss": 0.0581, "lr": 4.6114783273213395e-08, "epoch": 6.764331210191083, "percentage": 97.25, "elapsed_time": "0:41:04", "remaining_time": "0:01:09"}
355
+ {"current_steps": 355, "total_steps": 364, "loss": 0.0836, "lr": 3.735843446830867e-08, "epoch": 6.7834394904458595, "percentage": 97.53, "elapsed_time": "0:41:09", "remaining_time": "0:01:02"}
356
+ {"current_steps": 356, "total_steps": 364, "loss": 0.0706, "lr": 2.9521635783001932e-08, "epoch": 6.802547770700637, "percentage": 97.8, "elapsed_time": "0:41:17", "remaining_time": "0:00:55"}
357
+ {"current_steps": 357, "total_steps": 364, "loss": 0.073, "lr": 2.2605110552477162e-08, "epoch": 6.821656050955414, "percentage": 98.08, "elapsed_time": "0:41:25", "remaining_time": "0:00:48"}
358
+ {"current_steps": 358, "total_steps": 364, "loss": 0.0539, "lr": 1.6609497170834154e-08, "epoch": 6.840764331210191, "percentage": 98.35, "elapsed_time": "0:41:29", "remaining_time": "0:00:41"}
359
+ {"current_steps": 359, "total_steps": 364, "loss": 0.0621, "lr": 1.1535349032167908e-08, "epoch": 6.859872611464969, "percentage": 98.63, "elapsed_time": "0:41:34", "remaining_time": "0:00:34"}
360
+ {"current_steps": 360, "total_steps": 364, "loss": 0.0518, "lr": 7.3831344794872415e-09, "epoch": 6.8789808917197455, "percentage": 98.9, "elapsed_time": "0:41:38", "remaining_time": "0:00:27"}
361
+ {"current_steps": 361, "total_steps": 364, "loss": 0.0576, "lr": 4.153236761488266e-09, "epoch": 6.898089171974522, "percentage": 99.18, "elapsed_time": "0:41:42", "remaining_time": "0:00:20"}
362
+ {"current_steps": 362, "total_steps": 364, "loss": 0.0688, "lr": 1.8459539971804608e-09, "epoch": 6.917197452229299, "percentage": 99.45, "elapsed_time": "0:41:46", "remaining_time": "0:00:13"}
363
+ {"current_steps": 363, "total_steps": 364, "loss": 0.0633, "lr": 4.614991483686826e-10, "epoch": 6.936305732484076, "percentage": 99.73, "elapsed_time": "0:41:51", "remaining_time": "0:00:06"}
364
+ {"current_steps": 364, "total_steps": 364, "loss": 0.0559, "lr": 0.0, "epoch": 6.955414012738854, "percentage": 100.0, "elapsed_time": "0:41:56", "remaining_time": "0:00:00"}
365
+ {"current_steps": 364, "total_steps": 364, "epoch": 6.955414012738854, "percentage": 100.0, "elapsed_time": "0:44:48", "remaining_time": "0:00:00"}