guyhadad01 commited on
Commit
623d693
·
verified ·
1 Parent(s): 25d6679

Training in progress, step 51200, checkpoint

Browse files
last-checkpoint/README.md CHANGED
@@ -1315,6 +1315,10 @@ You can finetune this model on your own dataset.
1315
  | 0.8994 | 50900 | 0.3639 |
1316
  | 0.9003 | 50950 | 0.2332 |
1317
  | 0.9012 | 51000 | 0.3363 |
 
 
 
 
1318
 
1319
  </details>
1320
 
 
1315
  | 0.8994 | 50900 | 0.3639 |
1316
  | 0.9003 | 50950 | 0.2332 |
1317
  | 0.9012 | 51000 | 0.3363 |
1318
+ | 0.9021 | 51050 | 0.2674 |
1319
+ | 0.9030 | 51100 | 0.331 |
1320
+ | 0.9039 | 51150 | 0.2881 |
1321
+ | 0.9047 | 51200 | 0.3553 |
1322
 
1323
  </details>
1324
 
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8e5b296e1f58fde06ca25a671f7290066af40d31d74f593dd71beb56e81f618e
3
  size 90864192
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:17ad1d70cc9a9203e1932e7a5399b2ea38220c472d491a93ade1e1841ba94da7
3
  size 90864192
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:64cec233f06e1ea5350dc36447e7fd4afa810289f7a83dc18968cd19ae207a12
3
  size 180609210
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e0c9ea94de1bc6171fc560eb6edc6e3bb30de3a6197d7f6bdc43b28fa6e8b63a
3
  size 180609210
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c2b900393780cdd3cbb99d501f19a790b00c5891d77d31ffa5ebe767f48b02bb
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:697766d9762a48456880b2166b1f5fb91392394ad67b7232020fe661b72f67bd
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:30c99faa590c236be1e60450ac31ef6bbc0d8a5408817f47526e33c981695098
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4f620a353823eb6b71c8ccf047459bfd67f2ce79246e53f2aa937b07f9d71d34
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2640c4dcf9a6fa010a98a2ceb775abaf0e70fd53baf808dd65285ab30eadea3f
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2fadf44129acc4700f11541025d2dded44dc62ab2fdbe50e09f45fc382b24055
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.901203371560849,
6
  "eval_steps": 500,
7
- "global_step": 51000,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -7148,6 +7148,34 @@
7148
  "learning_rate": 5.508432977950561e-06,
7149
  "loss": 0.3363,
7150
  "step": 51000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
7151
  }
7152
  ],
7153
  "logging_steps": 50,
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.904737502429715,
6
  "eval_steps": 500,
7
+ "global_step": 51200,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
7148
  "learning_rate": 5.508432977950561e-06,
7149
  "loss": 0.3363,
7150
  "step": 51000
7151
+ },
7152
+ {
7153
+ "epoch": 0.9020869042780654,
7154
+ "grad_norm": 1.782301664352417,
7155
+ "learning_rate": 5.459346959612025e-06,
7156
+ "loss": 0.2674,
7157
+ "step": 51050
7158
+ },
7159
+ {
7160
+ "epoch": 0.9029704369952819,
7161
+ "grad_norm": 1.5983684062957764,
7162
+ "learning_rate": 5.411242661640259e-06,
7163
+ "loss": 0.331,
7164
+ "step": 51100
7165
+ },
7166
+ {
7167
+ "epoch": 0.9038539697124984,
7168
+ "grad_norm": 1.749089002609253,
7169
+ "learning_rate": 5.362156643301722e-06,
7170
+ "loss": 0.2881,
7171
+ "step": 51150
7172
+ },
7173
+ {
7174
+ "epoch": 0.904737502429715,
7175
+ "grad_norm": 1.2461782693862915,
7176
+ "learning_rate": 5.313070624963186e-06,
7177
+ "loss": 0.3553,
7178
+ "step": 51200
7179
  }
7180
  ],
7181
  "logging_steps": 50,