ryanmarten commited on
Commit
d4cafe2
·
verified ·
1 Parent(s): 7f1ac4b

Training in progress, epoch 5

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1e9d264a5e3bca944513a6fae94a4e9aceeab0991ea20443f831faab1dcf0db4
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3a18f931132dac894b1f12a5361757ab2d0c64870947595d1269a65b70fa55dd
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:78e09ab025ee3fd2e4822f7594f158bd2507399aadc824fc014db8552efc554a
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dafef32e8aa8e7c24e3d66f820e0f8b26e73c690933ae4b7c07fab4dccb47a9a
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a1674f6fac98629f1b0edb76e225452e4668c1f487f840d8ddafb06dd6a1c91e
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fc5fb08728cbb7b117559a7c89f358793db7855e7eb820ee8c4940730cdb53da
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7020674f9e95009474b1b08ec0830007037295c718118fc349a6a4a142506175
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cf99eac9eaed3cdb2d2753d2e276f4fb35fef36f8773fb00e02cf3265786b0ea
3
  size 1089994880
trainer_log.jsonl CHANGED
@@ -51,3 +51,14 @@
51
  {"current_steps": 51, "total_steps": 70, "loss": 0.5229, "lr": 4.162563277652104e-06, "epoch": 4.896, "percentage": 72.86, "elapsed_time": "1:47:34", "remaining_time": "0:40:04"}
52
  {"current_steps": 52, "total_steps": 70, "loss": 0.524, "lr": 3.7651019814126656e-06, "epoch": 4.992, "percentage": 74.29, "elapsed_time": "1:49:25", "remaining_time": "0:37:52"}
53
  {"current_steps": 53, "total_steps": 70, "loss": 0.5191, "lr": 3.3831416240314085e-06, "epoch": 5.088, "percentage": 75.71, "elapsed_time": "1:52:22", "remaining_time": "0:36:02"}
 
 
 
 
 
 
 
 
 
 
 
 
51
  {"current_steps": 51, "total_steps": 70, "loss": 0.5229, "lr": 4.162563277652104e-06, "epoch": 4.896, "percentage": 72.86, "elapsed_time": "1:47:34", "remaining_time": "0:40:04"}
52
  {"current_steps": 52, "total_steps": 70, "loss": 0.524, "lr": 3.7651019814126656e-06, "epoch": 4.992, "percentage": 74.29, "elapsed_time": "1:49:25", "remaining_time": "0:37:52"}
53
  {"current_steps": 53, "total_steps": 70, "loss": 0.5191, "lr": 3.3831416240314085e-06, "epoch": 5.088, "percentage": 75.71, "elapsed_time": "1:52:22", "remaining_time": "0:36:02"}
54
+ {"current_steps": 54, "total_steps": 70, "loss": 0.5063, "lr": 3.017631819139273e-06, "epoch": 5.184, "percentage": 77.14, "elapsed_time": "1:54:18", "remaining_time": "0:33:52"}
55
+ {"current_steps": 55, "total_steps": 70, "loss": 0.5174, "lr": 2.669481281701739e-06, "epoch": 5.28, "percentage": 78.57, "elapsed_time": "1:56:23", "remaining_time": "0:31:44"}
56
+ {"current_steps": 56, "total_steps": 70, "loss": 0.509, "lr": 2.339555568810221e-06, "epoch": 5.376, "percentage": 80.0, "elapsed_time": "1:58:28", "remaining_time": "0:29:37"}
57
+ {"current_steps": 57, "total_steps": 70, "loss": 0.515, "lr": 2.0286749277707783e-06, "epoch": 5.4719999999999995, "percentage": 81.43, "elapsed_time": "2:00:36", "remaining_time": "0:27:30"}
58
+ {"current_steps": 58, "total_steps": 70, "loss": 0.5265, "lr": 1.7376122568400533e-06, "epoch": 5.568, "percentage": 82.86, "elapsed_time": "2:02:37", "remaining_time": "0:25:22"}
59
+ {"current_steps": 59, "total_steps": 70, "loss": 0.4999, "lr": 1.467091183678444e-06, "epoch": 5.664, "percentage": 84.29, "elapsed_time": "2:04:41", "remaining_time": "0:23:14"}
60
+ {"current_steps": 60, "total_steps": 70, "loss": 0.4959, "lr": 1.2177842662977136e-06, "epoch": 5.76, "percentage": 85.71, "elapsed_time": "2:06:43", "remaining_time": "0:21:07"}
61
+ {"current_steps": 61, "total_steps": 70, "loss": 0.4973, "lr": 9.903113209758098e-07, "epoch": 5.856, "percentage": 87.14, "elapsed_time": "2:08:45", "remaining_time": "0:18:59"}
62
+ {"current_steps": 62, "total_steps": 70, "loss": 0.5036, "lr": 7.852378812959227e-07, "epoch": 5.952, "percentage": 88.57, "elapsed_time": "2:10:43", "remaining_time": "0:16:52"}
63
+ {"current_steps": 63, "total_steps": 70, "loss": 0.5197, "lr": 6.030737921409169e-07, "epoch": 6.048, "percentage": 90.0, "elapsed_time": "2:14:00", "remaining_time": "0:14:53"}
64
+ {"current_steps": 64, "total_steps": 70, "loss": 0.4934, "lr": 4.4427194213859216e-07, "epoch": 6.144, "percentage": 91.43, "elapsed_time": "2:16:00", "remaining_time": "0:12:45"}