guyhadad01 commited on
Commit
efd19b3
·
verified ·
1 Parent(s): 0eb9553

Training in progress, step 55200, checkpoint

Browse files
last-checkpoint/README.md CHANGED
@@ -1257,6 +1257,10 @@ You can finetune this model on your own dataset.
1257
  | 0.9701 | 54900 | 0.3112 |
1258
  | 0.9710 | 54950 | 0.2889 |
1259
  | 0.9719 | 55000 | 0.2746 |
 
 
 
 
1260
 
1261
 
1262
  ### Framework Versions
 
1257
  | 0.9701 | 54900 | 0.3112 |
1258
  | 0.9710 | 54950 | 0.2889 |
1259
  | 0.9719 | 55000 | 0.2746 |
1260
+ | 0.9728 | 55050 | 0.2772 |
1261
+ | 0.9737 | 55100 | 0.2965 |
1262
+ | 0.9745 | 55150 | 0.2382 |
1263
+ | 0.9754 | 55200 | 0.3863 |
1264
 
1265
 
1266
  ### Framework Versions
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b7de782f93f57348bf850bc04f35cc7f6059cfdc1487661cd5cf4f11ce0e636f
3
  size 90864192
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:84dfa838d5d08ff2f7ba730d306c0960dd6da737376547d2bfca93e1966bc1dd
3
  size 90864192
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8dc1a5e4533471281ab4208b72f4dd16330451bdcbc3512cd1466d1a94c0279b
3
  size 180609210
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:014ea2c017260d23539bf2018a3aeecb9f09815bf6c03db5f9a232664f2814fd
3
  size 180609210
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:035838ab30ab4d07fb2aaaa81eb5cd5230f5b5f92e211ace87a3143ca1c3c17c
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:74c101267c3a81601197ccbb38d2e72ad72f0ccd27fd0e0454beeffecf5ebfa6
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0d88e34fed71326e402519391fc702de0ba4ca1011f3b15e76161c4e72df1f1c
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9d0369b7df9f4f6057f54d12203a572c70823bfca8ac268e71fe1a019e47a330
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:73e5c254a90680845431aa779809105481c9b9fb095d05b8d7eb9127bf1f4c4d
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f7a98fbd51768bffd64a896f3250670354d9f2cc8cf54c04f0d410e34f028552
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.9718859889381704,
6
  "eval_steps": 500,
7
- "global_step": 55000,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -7708,6 +7708,34 @@
7708
  "learning_rate": 1.583514951601186e-06,
7709
  "loss": 0.2746,
7710
  "step": 55000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
7711
  }
7712
  ],
7713
  "logging_steps": 50,
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.9754201198070365,
6
  "eval_steps": 500,
7
+ "global_step": 55200,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
7708
  "learning_rate": 1.583514951601186e-06,
7709
  "loss": 0.2746,
7710
  "step": 55000
7711
+ },
7712
+ {
7713
+ "epoch": 0.9727695216553869,
7714
+ "grad_norm": 1.8150931596755981,
7715
+ "learning_rate": 1.5344289332626496e-06,
7716
+ "loss": 0.2772,
7717
+ "step": 55050
7718
+ },
7719
+ {
7720
+ "epoch": 0.9736530543726034,
7721
+ "grad_norm": 1.4807177782058716,
7722
+ "learning_rate": 1.485342914924113e-06,
7723
+ "loss": 0.2965,
7724
+ "step": 55100
7725
+ },
7726
+ {
7727
+ "epoch": 0.9745365870898199,
7728
+ "grad_norm": 1.4012283086776733,
7729
+ "learning_rate": 1.4362568965855766e-06,
7730
+ "loss": 0.2382,
7731
+ "step": 55150
7732
+ },
7733
+ {
7734
+ "epoch": 0.9754201198070365,
7735
+ "grad_norm": 1.435829520225525,
7736
+ "learning_rate": 1.388152598613811e-06,
7737
+ "loss": 0.3863,
7738
+ "step": 55200
7739
  }
7740
  ],
7741
  "logging_steps": 50,