guyhadad01 commited on
Commit
53aa37c
·
verified ·
1 Parent(s): d8d34b0

Training in progress, step 56000, checkpoint

Browse files
last-checkpoint/README.md CHANGED
@@ -1273,6 +1273,10 @@ You can finetune this model on your own dataset.
1273
  | 0.9843 | 55700 | 0.2922 |
1274
  | 0.9851 | 55750 | 0.2409 |
1275
  | 0.9860 | 55800 | 0.2704 |
 
 
 
 
1276
 
1277
 
1278
  ### Framework Versions
 
1273
  | 0.9843 | 55700 | 0.2922 |
1274
  | 0.9851 | 55750 | 0.2409 |
1275
  | 0.9860 | 55800 | 0.2704 |
1276
+ | 0.9869 | 55850 | 0.2855 |
1277
+ | 0.9878 | 55900 | 0.241 |
1278
+ | 0.9887 | 55950 | 0.2616 |
1279
+ | 0.9896 | 56000 | 0.2572 |
1280
 
1281
 
1282
  ### Framework Versions
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:90fcb416e3f1fd9c1877f4daf0be2fc8df1e1250a64fe3f07aae6546f23d2ab0
3
  size 90864192
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:77ce30d7aacd666933a14d83cc737c586dcae579850f877da7309f9895799d43
3
  size 90864192
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5e61e9433fbd41b3556eca2c0125db34a8ece386095ac01a954bcccc5ae50de3
3
  size 180609210
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8d280d8e79c740dc707e7398c5e14c4f2ad422cb187845da01e50e47c090ae44
3
  size 180609210
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:404572bee52c0f6fd3f51338bcd9d76b45287337ee0a6f0be420d6125dc37b05
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c072afea83c70b7165bf32b5c5585de459f967b6f4f050240893f3e9f57351d0
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:87465185b3464123ac777bc7dfe2dec56250d184ec4a7d3aafc9cf39b60be6dc
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4674ba66a393298737c507490cd48fcb412b9b21de3a1d3996a7109c47aaae95
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:55ccf2bc2593182b06063b40af4f602a3ba516c801f8e0f593c69740ab2da6ec
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9c1d493f6ec6785592b7a247d7ab39afb368b0e235cf1f0840677960dedafdad
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.9860225124136347,
6
  "eval_steps": 500,
7
- "global_step": 55800,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -7820,6 +7820,34 @@
7820
  "learning_rate": 7.991203785513735e-07,
7821
  "loss": 0.2704,
7822
  "step": 55800
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
7823
  }
7824
  ],
7825
  "logging_steps": 50,
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.9895566432825007,
6
  "eval_steps": 500,
7
+ "global_step": 56000,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
7820
  "learning_rate": 7.991203785513735e-07,
7821
  "loss": 0.2704,
7822
  "step": 55800
7823
+ },
7824
+ {
7825
+ "epoch": 0.9869060451308512,
7826
+ "grad_norm": 1.3643758296966553,
7827
+ "learning_rate": 7.50034360212837e-07,
7828
+ "loss": 0.2855,
7829
+ "step": 55850
7830
+ },
7831
+ {
7832
+ "epoch": 0.9877895778480678,
7833
+ "grad_norm": 1.2211904525756836,
7834
+ "learning_rate": 7.009483418743006e-07,
7835
+ "loss": 0.241,
7836
+ "step": 55900
7837
+ },
7838
+ {
7839
+ "epoch": 0.9886731105652843,
7840
+ "grad_norm": 3.049858570098877,
7841
+ "learning_rate": 6.518623235357641e-07,
7842
+ "loss": 0.2616,
7843
+ "step": 55950
7844
+ },
7845
+ {
7846
+ "epoch": 0.9895566432825007,
7847
+ "grad_norm": 1.8196197748184204,
7848
+ "learning_rate": 6.027763051972277e-07,
7849
+ "loss": 0.2572,
7850
+ "step": 56000
7851
  }
7852
  ],
7853
  "logging_steps": 50,